mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-06 17:17:14 +08:00
[Feature] Support batched tokens for EP (#3415)
* Support batched tokens for EP
* Support batched tokens for EP
* Support batched tokens for EP
* Support batched tokens for EP
* Support batched tokens for EP and fix bug
* Support batched tokens for EP and fix bug
* Support batched tokens for EP and fix bug
* Support batched tokens for EP and fix bug
This commit is contained in:
@@ -270,7 +270,7 @@ class TokenProcessor:
|
||||
self.resource_manager._recycle_block_tables(task)
|
||||
if self.prefill_result_status[task_id] != "finished":
|
||||
result.error_code = 400
|
||||
- result.error_message = f"{task_id} failed to {self.prefill_result_status[task_id]}"
|
||||
+ result.error_msg = f"{task_id} failed to {self.prefill_result_status[task_id]}"
|
||||
self.split_connector.send_first_token(task.disaggregate_info, [result])
|
||||
del self.resource_manager.req_dict[task_id]
|
||||
break
|
||||
|
Reference in New Issue
Block a user