mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-11-01 12:22:53 +08:00
add x1 a3b quantization (#4397)
This commit is contained in:
@@ -4,3 +4,4 @@ max_num_seqs: 32
|
||||
reasoning_parser: ernie_x1
|
||||
tool_call_parser: ernie_x1
|
||||
load_choices: "default_v1"
|
||||
quantization: wint8
|
||||
|
||||
Reference in New Issue
Block a user