mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-06 09:07:10 +08:00
[fix] fix completion stream api output_tokens not in usage (#3588)
This commit is contained in:
@@ -413,6 +413,7 @@ class OpenAIServingCompletion:
         usage=UsageInfo(
             prompt_tokens=len(prompt_batched_token_ids[idx]),
             completion_tokens=output_tokens[idx],
+            total_tokens=len(prompt_batched_token_ids[idx]) + output_tokens[idx],
         ),
     )
     yield f"data: {usage_chunk.model_dump_json(exclude_unset=True)}\n\n"
|
Reference in New Issue
Block a user