diff --git a/fastdeploy/model_executor/layers/quantization/w8a8.py b/fastdeploy/model_executor/layers/quantization/w8a8.py index 16cae1de6..cee8d2dc0 100644 --- a/fastdeploy/model_executor/layers/quantization/w8a8.py +++ b/fastdeploy/model_executor/layers/quantization/w8a8.py @@ -85,7 +85,7 @@ class W8A8LinearMethod(QuantMethodBase): if weight_scale is None or in_scale is None: self.skip_quant = True return - layer.wieght = layer.create_parameter( + layer.weight = layer.create_parameter( shape=layer.weight_shape, dtype=layer.weight_dtype, is_bias=False,