mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-12-24 13:28:13 +08:00
[Feature] support stop_token_ids (#5399)
* support stop_token_ids * fix * delete Chinese * support both * delete print
This commit is contained in:
@@ -355,6 +355,7 @@ def post_process_normal(
|
||||
model_output.step_idx,
|
||||
model_output.stop_token_ids,
|
||||
model_output.stop_seqs_len,
|
||||
model_output.min_tokens,
|
||||
False,
|
||||
) # multi ends
|
||||
elif current_platform.is_maca():
|
||||
@@ -368,6 +369,7 @@ def post_process_normal(
|
||||
model_output.step_idx,
|
||||
model_output.stop_token_ids,
|
||||
model_output.stop_seqs_len,
|
||||
model_output.min_tokens,
|
||||
False,
|
||||
) # multi ends
|
||||
else:
|
||||
@@ -472,6 +474,7 @@ def post_process_specualate(
|
||||
model_output.stop_token_ids,
|
||||
model_output.stop_seqs_len,
|
||||
model_output.eos_token_id,
|
||||
model_output.min_tokens,
|
||||
)
|
||||
speculate_update(
|
||||
model_output.seq_lens_encoder,
|
||||
|
||||
Reference in New Issue
Block a user