# Adds two new configuration files under benchmarks/yaml/ (both created from
# /dev/null with mode 100644, eight lines each):
#   - eb45-vl-28b-thinking-128k-wint8.yaml -> max_model_len: 131072 (128 * 1024)
#   - eb45-vl-28b-thinking-32k-wint8.yaml  -> max_model_len: 32768  (32 * 1024)
# The two files differ only in max_model_len; the other seven keys are identical.
#
# mm-processor-kwargs is a single-quoted YAML scalar, so a YAML parser yields the
# JSON text as one string rather than a nested mapping; presumably the consumer
# decodes that string itself -- TODO confirm.
#
# NOTE(review): mm-processor-kwargs is hyphenated while every other key uses
# underscores -- confirm the config loader accepts this spelling and does not
# silently drop the key.
# NOTE(review): reasoning_parser and tool_call_parser are set to the same name
# (ernie-45-vl-thinking) -- presumably intentional; confirm it is registered for
# both roles.
diff --git a/benchmarks/yaml/eb45-vl-28b-thinking-128k-wint8.yaml b/benchmarks/yaml/eb45-vl-28b-thinking-128k-wint8.yaml
new file mode 100644
index 000000000..de436dc32
--- /dev/null
+++ b/benchmarks/yaml/eb45-vl-28b-thinking-128k-wint8.yaml
@@ -0,0 +1,8 @@
+max_model_len: 131072
+tensor_parallel_size: 1
+quantization: wint8
+max_num_seqs: 32
+reasoning_parser: ernie-45-vl-thinking
+tool_call_parser: ernie-45-vl-thinking
+load_choices: "default_v1"
+mm-processor-kwargs: '{"image_max_pixels": 12845056 }'
diff --git a/benchmarks/yaml/eb45-vl-28b-thinking-32k-wint8.yaml b/benchmarks/yaml/eb45-vl-28b-thinking-32k-wint8.yaml
new file mode 100644
index 000000000..2be1e0e86
--- /dev/null
+++ b/benchmarks/yaml/eb45-vl-28b-thinking-32k-wint8.yaml
@@ -0,0 +1,8 @@
+max_model_len: 32768
+tensor_parallel_size: 1
+quantization: wint8
+max_num_seqs: 32
+reasoning_parser: ernie-45-vl-thinking
+tool_call_parser: ernie-45-vl-thinking
+load_choices: "default_v1"
+mm-processor-kwargs: '{"image_max_pixels": 12845056 }'