diff --git a/fastdeploy/engine/common_engine.py b/fastdeploy/engine/common_engine.py index 545c291b1..ec9d4fcbd 100644 --- a/fastdeploy/engine/common_engine.py +++ b/fastdeploy/engine/common_engine.py @@ -769,7 +769,8 @@ class EngineSevice: llm_logger.info("Clear Data: Start") self.token_processor.clear_data() self.engine_worker_queue.clear_data() - self.zmq_server.req_dict.clear() + self.send_response_server.req_dict.clear() + self.recv_request_server.req_dict.clear() llm_logger.info("Clear Data: Successfully") return True except Exception as e: diff --git a/fastdeploy/entrypoints/openai/api_server.py b/fastdeploy/entrypoints/openai/api_server.py index e135202ad..71e6f8045 100644 --- a/fastdeploy/entrypoints/openai/api_server.py +++ b/fastdeploy/entrypoints/openai/api_server.py @@ -478,8 +478,8 @@ def reset_scheduler(): if llm_engine is None: return Response("Engine not loaded", status_code=500) - llm_engine.engine.clear_data() llm_engine.engine.scheduler.reset() + llm_engine.engine.clear_data() return Response("Scheduler Reset Successfully", status_code=200)