mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-12-24 13:28:13 +08:00
support moe offline quant (#5142)
This commit is contained in:
@@ -180,6 +180,7 @@ class ModelConfig:
|
||||
):
|
||||
self.model = ""
|
||||
self.is_quantized = False
|
||||
self.is_moe_quantized = False
|
||||
self.max_model_len = 0
|
||||
self.dtype = "bfloat16"
|
||||
self.enable_logprob = False
|
||||
|
||||
Reference in New Issue
Block a user