diff --git a/fastdeploy/worker/worker_process.py b/fastdeploy/worker/worker_process.py index 8d5beada1..e1ed72bc3 100644 --- a/fastdeploy/worker/worker_process.py +++ b/fastdeploy/worker/worker_process.py @@ -735,7 +735,8 @@ def initialize_fd_config(config_or_args) -> FDConfig: # Handle vocabulary size model_config.ori_vocab_size = model_config_dict.get("vocab_size", -1) - if "Ernie4_5_ForCausalLM" in model_config_dict.get("architectures", []): + archs = model_config_dict.get("architectures", []) + if "Ernie4_5_ForCausalLM" in archs or "Ernie4_5_MoeForCausalLM" in archs: model_config.ori_vocab_size = getattr(config_or_args, 'ori_vocab_size', model_config.ori_vocab_size) # Handle DeepseekV3 specific config