Mirror of https://github.com/PaddlePaddle/FastDeploy.git (synced 2025-10-06 00:57:33 +08:00)
[fix] Fix completion stream API: output_tokens missing from usage (#3588)
This commit is contained in:
@@ -413,6 +413,7 @@ class OpenAIServingCompletion:
        usage=UsageInfo(
            prompt_tokens=len(prompt_batched_token_ids[idx]),
            completion_tokens=output_tokens[idx],
            total_tokens=len(prompt_batched_token_ids[idx]) + output_tokens[idx],
        ),
    )
    yield f"data: {usage_chunk.model_dump_json(exclude_unset=True)}\n\n"
|
Reference in New Issue
Block a user