* fix

* update
This commit is contained in:
bukejiyu
2025-08-28 17:06:32 +08:00
committed by GitHub
parent 98c217b428
commit 73cf6096da
2 changed files with 3 additions and 1 deletion

View File

@@ -166,7 +166,7 @@ model_param_map = {
],
},
"Qwen2-7B-Instruct": {
"quantizations": ["None", "wint8"],
"quantizations": ["wint4"],
},
"Qwen3-30B-A3B": {
"tensor_parallel_size": 2,