[XPU] Fix performance degradation caused by enabling ENABLE_V1_KVCACHE_SCHEDULER (#3897)

* fix bug
* fix bug
* update
* update
* update
2025-10-05 08:37:06 +08:00 · 2025-09-08 10:34:46 +08:00
parent b649494655
commit 7833f2f6cb
4 changed files with 20 additions and 4 deletions
--- a/fastdeploy/engine/sched/resource_manager_v1.py
+++ b/fastdeploy/engine/sched/resource_manager_v1.py
@@ -363,7 +363,9 @@ class ResourceManagerV1(ResourceManager):
                while self.waiting and token_budget > 0:
                    if len(self.running) == self.max_num_seqs:
                        break
-                    if self.config.model_config.enable_mm and self.exist_prefill(scheduled_reqs):
+                    if (self.config.model_config.enable_mm or paddle.is_compiled_with_xpu()) and self.exist_prefill(
+                        scheduled_reqs
+                    ):
                        break
                    request = self.waiting[0]
                    if request.status == RequestStatus.WAITING: