Skip to content

Commit 48a0030

Browse files
authored
fix rl overlap (#7744)
1 parent cb7a171 commit 48a0030

2 files changed

Lines changed: 13 additions & 1 deletion

File tree

fastdeploy/worker/gpu_model_runner.py

Lines changed: 7 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -3043,6 +3043,13 @@ def clear_parameters(self, pid):
30433043
self.clear_cache()
30443044
paddle.device.cuda.empty_cache()
30453045

3046+
# clear overlap status
3047+
self._cached_model_output_data = None
3048+
self._cached_sampler_output = None
3049+
self._cached_post_process_event = None
3050+
self._cached_launch_token_num = -1
3051+
self._cached_real_bsz = -1
3052+
30463053
self.dynamic_weight_manager._log_memory("dynamic weight manager clear all memory")
30473054

30483055
def clear_requests(self):

fastdeploy/worker/input_batch.py

Lines changed: 6 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -588,7 +588,6 @@ def reset_share_inputs(self):
588588
fill_paddle_tensor(self, "step_idx", 0)
589589
# fill_paddle_tensor(self, "not_need_stop", False)
590590
fill_paddle_tensor(self, "not_need_stop_device", False)
591-
fill_paddle_tensor(self, "sampled_token_ids", -1)
592591
fill_paddle_tensor(self, "stop_flags", True)
593592

594593
fill_paddle_tensor(self, "bad_tokens", -1)
@@ -726,6 +725,12 @@ def reset_share_inputs(self):
726725
# Reset other miscellaneous tensors
727726
fill_paddle_tensor(self, "mask_rollback", 0)
728727
fill_paddle_tensor(self, "preempted_idx", 0)
728+
fill_paddle_tensor(self, "last_preempted_idx", 0)
729+
730+
# Reset tensors for overlap
731+
self.sampled_token_ids = paddle.full([max_num_seqs, 1], -1, dtype="int64").pin_memory()
732+
self.seq_lens_this_time_cpu = paddle.full([max_num_seqs, 1], 0, dtype="int32").pin_memory()
733+
self.is_block_step_cpu = paddle.full([max_num_seqs], False, dtype="bool").pin_memory()
729734

730735
logger.info("share_inputs reset completed")
731736
except Exception as e:

0 commit comments

Comments
 (0)