diff --git a/fastdeploy/worker/worker_process.py b/fastdeploy/worker/worker_process.py index a94b2b4de..199d6c139 100644 --- a/fastdeploy/worker/worker_process.py +++ b/fastdeploy/worker/worker_process.py @@ -707,7 +707,8 @@ def initialize_fd_config(config) -> FDConfig: # Handle vocabulary size model_config.ori_vocab_size = model_config_dict.get("vocab_size", -1) - if "Ernie4_5_ForCausalLM" in model_config_dict.get("architectures", []): + archs = model_config_dict.get("architectures", []) + if "Ernie4_5_ForCausalLM" in archs or "Ernie4_5_MoeForCausalLM" in archs: model_config.ori_vocab_size = getattr(config, 'ori_vocab_size', model_config.ori_vocab_size) # Handle DeepseekV3 specific config