diff --git a/fastdeploy/model_executor/layers/moe/fused_moe_backend_base.py b/fastdeploy/model_executor/layers/moe/fused_moe_backend_base.py index 0f6b38586..e2c8b6b55 100644 --- a/fastdeploy/model_executor/layers/moe/fused_moe_backend_base.py +++ b/fastdeploy/model_executor/layers/moe/fused_moe_backend_base.py @@ -85,8 +85,8 @@ class MoEMethodBase(QuantMethodBase): layer.top_k, layer.hidden_size, layer.num_experts, - layer.moe_config.num_max_dispatch_tokens_per_rank, layer.fd_config.parallel_config.splitwise_role, + layer.fd_config.model_config.num_max_dispatch_tokens_per_rank, layer.ep_size, layer.ep_rank, layer.fd_config.model_config.redundant_experts_num,