[XPU][CI] Change CI VL model to 28B (#4764)

* Update XPU_VISIBLE_DEVICES and model parameters
* Update base response and adjust max tokens
* Implement process cleanup in CI workflow: add process cleanup commands to prevent port conflicts
* Remove process cleanup commands from CI workflow: removed old process cleanup commands to prevent port conflicts.
2025-12-24 13:28:13 +08:00 · 2025-11-06 14:12:23 +08:00
parent 354ddc8bc5
commit fc8bef2c95
3 changed files with 5 additions and 6 deletions
--- a/scripts/run_ci_xpu.sh
+++ b/scripts/run_ci_xpu.sh
@@ -187,11 +187,11 @@ rm -f core*
 #清空消息队列
 ipcrm --all=msg
 echo "============================开始vl模型测试!============================"
-export XPU_VISIBLE_DEVICES="0,1,2,3,4,5,6,7"
+export XPU_VISIBLE_DEVICES="0,1,2,3"
 python -m fastdeploy.entrypoints.openai.api_server \
-    --model ${MODEL_PATH}/ERNIE-4.5-VL-424B-A47B-Paddle \
+    --model ${MODEL_PATH}/ERNIE-4.5-VL-28B-A3B-Paddle \
    --port 8188 \
-    --tensor-parallel-size 8 \
+    --tensor-parallel-size 4 \
    --max-model-len 32768 \
    --max-num-seqs 10 \
    --quantization wint8 \