mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-12-24 13:28:13 +08:00
[BugFix] fix mtp logprob bugs in chunk prefill (#5244)
* fix mtp logprob bugs in chunk prefill * fix * fix
This commit is contained in:
@@ -514,8 +514,11 @@ def post_process_specualate(
|
||||
sampler_output.token_num_per_batch,
|
||||
sampler_output.cu_batch_token_offset,
|
||||
model_output.not_need_stop,
|
||||
model_output.seq_lens_decoder,
|
||||
model_output.prompt_lens,
|
||||
3, # mtype
|
||||
model_output.mp_rank,
|
||||
save_each_rank,
|
||||
)
|
||||
|
||||
# Update pre_ids through accept tokens
|
||||
|
||||
Reference in New Issue
Block a user