From bcde7980985e2baf801b92314db928da284dc654 Mon Sep 17 00:00:00 2001 From: zccjjj <62829461+zccjjj@users.noreply.github.com> Date: Wed, 10 Dec 2025 19:40:38 +0800 Subject: [PATCH] [CI][XPU] ep+prefix cache+chunk prefill (#5490) --- tests/xpu_ci/test_ep4tp1_online.py | 1 + tests/xpu_ci/test_ep4tp4_all2all.py | 1 + tests/xpu_ci/test_ep4tp4_online.py | 1 + 3 files changed, 3 insertions(+) diff --git a/tests/xpu_ci/test_ep4tp1_online.py b/tests/xpu_ci/test_ep4tp1_online.py index 8acb5da3a..c248b24e2 100644 --- a/tests/xpu_ci/test_ep4tp1_online.py +++ b/tests/xpu_ci/test_ep4tp1_online.py @@ -63,6 +63,7 @@ def test_ep4tp1_online(xpu_env): "--tensor-parallel-size", "1", "--enable-expert-parallel", + "--enable-prefix-caching", "--data-parallel-size", "4", "--max-model-len", diff --git a/tests/xpu_ci/test_ep4tp4_all2all.py b/tests/xpu_ci/test_ep4tp4_all2all.py index e2fbbf227..8c5a81e0b 100644 --- a/tests/xpu_ci/test_ep4tp4_all2all.py +++ b/tests/xpu_ci/test_ep4tp4_all2all.py @@ -65,6 +65,7 @@ def test_ep4tp4_all2all(xpu_env): "--tensor-parallel-size", "4", "--enable-expert-parallel", + "--enable-prefix-caching", "--data-parallel-size", "1", "--max-model-len", diff --git a/tests/xpu_ci/test_ep4tp4_online.py b/tests/xpu_ci/test_ep4tp4_online.py index 3850b4efb..6f64016be 100644 --- a/tests/xpu_ci/test_ep4tp4_online.py +++ b/tests/xpu_ci/test_ep4tp4_online.py @@ -64,6 +64,7 @@ def test_ep4tp4_online(xpu_env): "--tensor-parallel-size", "4", "--enable-expert-parallel", + "--enable-prefix-caching", "--data-parallel-size", "1", "--max-model-len",