Support MoE offline quantization (#5142)

This commit is contained in:
xiaoxiaohehe001
2025-11-24 18:59:18 +08:00
committed by GitHub
parent 5ff93d4998
commit e150a418d4
5 changed files with 12 additions and 3 deletions

View File

@@ -180,6 +180,7 @@ class ModelConfig:
):
self.model = ""
self.is_quantized = False
self.is_moe_quantized = False
self.max_model_len = 0
self.dtype = "bfloat16"
self.enable_logprob = False