Mirror of https://github.com/PaddlePaddle/FastDeploy.git (synced 2025-10-20 07:24:42 +08:00)
Fix down projection weight shape in fused MOE layer (#4041)
This commit is contained in:
@@ -695,7 +695,7 @@ class BlockWiseFP8MoEMethod(QuantMethodBase):
 layer,
 down_proj_weight_name,
 layer.create_parameter(
-    shape=self.up_gate_proj_weight_shape,
+    shape=self.down_proj_weight_shape,
     dtype=self.weight_dtype,
     default_initializer=paddle.nn.initializer.Constant(0),
 ),
Reference in New Issue
Block a user