Skip to content

Commit e42dc8c

Browse files
ltd0924 and ltd0924 authored
[BUGFIX] clear request (#4320)
Co-authored-by: ltd0924 <[email protected]>
1 parent 63a03ee commit e42dc8c

File tree

4 files changed

6 additions and 1 deletion (+6 -1 lines changed)

4 files changed

+6
-1
lines changed

fastdeploy/engine/common_engine.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -806,7 +806,8 @@ def clear_data(self):
806806
llm_logger.info("Clear Data: Start")
807807
self.token_processor.clear_data()
808808
self.engine_worker_queue.clear_data()
809-
self.zmq_server.req_dict.clear()
809+
self.send_response_server.req_dict.clear()
810+
self.recv_request_server.req_dict.clear()
810811
llm_logger.info("Clear Data: Successfully")
811812
return True
812813
except Exception as e:

fastdeploy/entrypoints/openai/api_server.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -499,6 +499,7 @@ def control_scheduler(request: ControlSchedulerRequest):
499499
return JSONResponse(content=content.model_dump(), status_code=500)
500500

501501
if request.reset:
502+
llm_engine.engine.clear_data()
502503
llm_engine.engine.scheduler.reset()
503504

504505
if request.load_shards_num or request.reallocate_shard:

fastdeploy/rl/dynamic_weight_manager.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -223,6 +223,7 @@ def check_model_weights_status(model_weights_status, model_runner, pid):
223223
while model_weights_status.value[0] != ModelWeightsStatus.NORMAL:
224224
if model_weights_status.value[0] == ModelWeightsStatus.UPDATING:
225225
logger.info("infer engine stopped! start to load new checkpoint...")
226+
model_runner.clear_requests()
226227
model_runner.update_parameters(pid)
227228
while model_weights_status.value[0] != ModelWeightsStatus.NORMAL:
228229
time.sleep(0.01)

fastdeploy/worker/worker_process.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -337,6 +337,8 @@ def event_loop_normal(self) -> None:
337337
self.worker.model_runner,
338338
self.parallel_config.engine_worker_queue_port,
339339
)
340+
logger.info(f"current task queue data: {self.task_queue.num_tasks()}")
341+
self.task_queue.clear_data()
340342
self.model_weights_signal[0] = ModelWeightsStatus.NORMAL
341343
logger.info(f"Rank: {self.local_rank} has updated or cleared parameters.")
342344

0 commit comments

Comments
 (0)