mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-12-24 13:28:13 +08:00
[BugFix] BF16 MoE Cutlass Backend Support EP (#5242)
This commit is contained in:
@@ -304,6 +304,8 @@ class ModelConfig:
|
||||
|
||||
if hasattr(self, "num_experts") and getattr(self, "moe_num_experts") is None:
|
||||
self.moe_num_experts = self.num_experts
|
||||
if hasattr(self, "n_routed_experts") and getattr(self, "moe_num_experts") is None:
|
||||
self.moe_num_experts = self.n_routed_experts
|
||||
|
||||
def read_from_env(self):
|
||||
"""
|
||||
|
||||
Reference in New Issue
Block a user