[NewFeatures] support eplb (#3547)

* [NewFeatures] support eplb * fix eplb
2025-10-05 16:48:03 +08:00 · 2025-08-26 16:19:30 +08:00
parent 56e2d7e668
commit 9afa236e39
17 changed files with 174 additions and 67 deletions
--- a/fastdeploy/model_executor/layers/backends/gcu/quantization/weight_only.py
+++ b/fastdeploy/model_executor/layers/backends/gcu/quantization/weight_only.py
@@ -59,7 +59,7 @@ class GCUWeightOnlyLinearMethod(WeightOnlyLinearMethod):
            is_bias=False,
        )

-    def process_prequanted_weights(self, layer, state_dict) -> None:
+    def process_prequanted_weights(self, layer, state_dict, is_rearrange: bool = False) -> None:
        """
        Process pre-quantized weights before applying them to the model
        Args: