[XPU] Fixed the performance degradation caused by enabling ENABLE_V1_KVCACHE_SCHEDULER (#3900)

* fix bug

* fix bug

* update

* update

* update
This commit is contained in:
yinwei
2025-09-05 19:17:25 +08:00
committed by GitHub
parent 473cde779f
commit 77c1bd0813
4 changed files with 20 additions and 4 deletions

View File

@@ -345,7 +345,9 @@ class ResourceManagerV1(ResourceManager):
while self.waiting and token_budget > 0:
if len(self.running) == self.max_num_seqs:
break
if self.config.model_config.enable_mm and self.exist_prefill(scheduled_reqs):
if (self.config.model_config.enable_mm or paddle.is_compiled_with_xpu()) and self.exist_prefill(
scheduled_reqs
):
break
request = self.waiting[0]
if request.status == RequestStatus.WAITING: