Fix down projection weight shape in fused MOE layer (#4041)

This commit is contained in:
Yuanle Liu
2025-09-10 12:49:03 +08:00
committed by GitHub
parent dfc94371ee
commit 7272afe3dc

View File

@@ -695,7 +695,7 @@ class BlockWiseFP8MoEMethod(QuantMethodBase):
layer,
down_proj_weight_name,
layer.create_parameter(
-shape=self.up_gate_proj_weight_shape,
+shape=self.down_proj_weight_shape,
dtype=self.weight_dtype,
default_initializer=paddle.nn.initializer.Constant(0),
),