mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-15 05:01:00 +08:00
[fix] fix output tokens count in streaming completion api (#3507)
This commit is contained in:
@@ -407,7 +407,6 @@ class OpenAIServingCompletion:
|
||||
delta_message.tool_calls = delta_message_output.tool_calls
|
||||
|
||||
choices.append(delta_message)
|
||||
output_tokens[idx] += 1
|
||||
|
||||
if res["finished"]:
|
||||
choices[-1].finish_reason = self.calc_finish_reason(
|
||||
|
Reference in New Issue
Block a user