diff --git a/fastdeploy/entrypoints/openai/api_server.py b/fastdeploy/entrypoints/openai/api_server.py index 2a4c0e7ab..3f92ced34 100644 --- a/fastdeploy/entrypoints/openai/api_server.py +++ b/fastdeploy/entrypoints/openai/api_server.py @@ -50,6 +50,8 @@ from fastdeploy.metrics.metrics import ( ) from fastdeploy.metrics.trace_util import fd_start_span, inject_to_metadata, instrument from fastdeploy.plugins.model_register import load_model_register_plugins + +load_model_register_plugins() from fastdeploy.utils import ( FlexibleArgumentParser, StatefulSemaphore, @@ -460,8 +462,6 @@ def launch_controller_server(): def main(): """main函数""" - - load_model_register_plugins() if load_engine() is None: return diff --git a/fastdeploy/rl/dynamic_weight_manager.py b/fastdeploy/rl/dynamic_weight_manager.py index 80f970b35..ad39accdb 100644 --- a/fastdeploy/rl/dynamic_weight_manager.py +++ b/fastdeploy/rl/dynamic_weight_manager.py @@ -82,7 +82,7 @@ class DynamicWeightManager: def _update_ipc_snapshot(self): """Update using IPC snapshot strategy for elastic recovery.""" model_path = os.path.join( - self.model_config.model, + self.fd_config.model_config.model, f"model_state.tp0{self.meta_src_id}.pdparams", )