mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-12-24 13:28:13 +08:00
[BugFix] fix token_processor zmq (#4827)
* fix_token_processor_zmq
* check pooling_model's token_ids is None
* revert
This commit is contained in:
@@ -241,6 +241,11 @@ class TokenProcessor:
|
||||
|
||||
task_id = task.request_id
|
||||
token_ids = stream_data.tokens # numpy.array
|
||||
if token_ids is not None and token_ids[-1] <= 0:
|
||||
if envs.ENABLE_V1_KVCACHE_SCHEDULER:
|
||||
if task_id in self.resource_manager.to_be_rescheduled_request_id_set:
|
||||
self.resource_manager.reschedule_preempt_task(task_id)
|
||||
continue
|
||||
|
||||
current_time = time.time()
|
||||
if self.tokens_counter[task_id] == 0:
|
||||
|
||||
Reference in New Issue
Block a user