Add wint8 quantization to the ERNIE X1 A3B config (#4397)

This commit is contained in:
tianlef
2025-10-14 15:04:06 +08:00
committed by GitHub
parent 73c8e0849f
commit 14eb8b4f8b

View File

@@ -4,3 +4,4 @@ max_num_seqs: 32
reasoning_parser: ernie_x1
tool_call_parser: ernie_x1
load_choices: "default_v1"
quantization: wint8