diff --git a/fastdeploy/entrypoints/openai/api_server.py b/fastdeploy/entrypoints/openai/api_server.py index 476b77f9f..5dce373e6 100644 --- a/fastdeploy/entrypoints/openai/api_server.py +++ b/fastdeploy/entrypoints/openai/api_server.py @@ -506,11 +506,13 @@ def control_scheduler(request: ControlSchedulerRequest): return JSONResponse(content=content.model_dump(), status_code=500) if request.reset: - llm_engine.scheduler.reset() + llm_engine.engine.scheduler.reset() if request.load_shards_num or request.reallocate_shard: - if hasattr(llm_engine.scheduler, "update_config") and callable(llm_engine.scheduler.update_config): - llm_engine.scheduler.update_config( + if hasattr(llm_engine.engine.scheduler, "update_config") and callable( + llm_engine.engine.scheduler.update_config + ): + llm_engine.engine.scheduler.update_config( load_shards_num=request.load_shards_num, reallocate=request.reallocate_shard, )