mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-12-24 13:28:13 +08:00
[Feature] support eb5 video chunk (#4671)
Some checks failed
CE Compile Job / ce_job_pre_check (push) Has been cancelled
CE Compile Job / print_ce_job_pre_check_outputs (push) Has been cancelled
CE Compile Job / FD-Clone-Linux (push) Has been cancelled
CE Compile Job / Show Code Archive Output (push) Has been cancelled
CE Compile Job / BUILD_SM8090 (push) Has been cancelled
CE Compile Job / BUILD_SM8689 (push) Has been cancelled
CE Compile Job / CE_UPLOAD (push) Has been cancelled
Some checks failed
CE Compile Job / ce_job_pre_check (push) Has been cancelled
CE Compile Job / print_ce_job_pre_check_outputs (push) Has been cancelled
CE Compile Job / FD-Clone-Linux (push) Has been cancelled
CE Compile Job / Show Code Archive Output (push) Has been cancelled
CE Compile Job / BUILD_SM8090 (push) Has been cancelled
CE Compile Job / BUILD_SM8689 (push) Has been cancelled
CE Compile Job / CE_UPLOAD (push) Has been cancelled
This commit is contained in:
@@ -28,6 +28,7 @@ import paddle
|
||||
|
||||
from fastdeploy.engine.request import Request, RequestStatus, RequestType
|
||||
from fastdeploy.engine.resource_manager import ResourceManager
|
||||
from fastdeploy.input.utils import IDS_TYPE_FLAG
|
||||
from fastdeploy.metrics.metrics import main_process_metrics
|
||||
from fastdeploy.utils import llm_logger
|
||||
|
||||
@@ -151,6 +152,24 @@ class ResourceManagerV1(ResourceManager):
|
||||
new_end_idx = pre_end_idx + num_new_tokens
|
||||
|
||||
prompt_token_ids_len = len(request.prompt_token_ids)
|
||||
|
||||
if new_end_idx >= prompt_token_ids_len:
|
||||
return num_new_tokens
|
||||
|
||||
if inputs.get("can_split_idx_list") is not None:
|
||||
if new_end_idx >= prompt_token_ids_len:
|
||||
return num_new_tokens
|
||||
patch_idx = inputs["patch_idx"][new_end_idx]
|
||||
patch_map = inputs["patch_map"][patch_idx]
|
||||
modal_id = patch_map["modal_id"]
|
||||
if modal_id == IDS_TYPE_FLAG["text"]:
|
||||
return num_new_tokens
|
||||
elif modal_id == IDS_TYPE_FLAG["video"]:
|
||||
can_split_idx_list = inputs["can_split_idx_list"]
|
||||
for i in range(len(can_split_idx_list)):
|
||||
if can_split_idx_list[i] >= new_end_idx:
|
||||
return can_split_idx_list[i] - pre_end_idx
|
||||
|
||||
assert prompt_token_ids_len == len(inputs["patch_idx"]), (prompt_token_ids_len, len(inputs["patch_idx"]))
|
||||
|
||||
# start
|
||||
|
||||
Reference in New Issue
Block a user