diff --git a/fastdeploy/model_executor/layers/sample/sampler.py b/fastdeploy/model_executor/layers/sample/sampler.py index f064cf9d1..dd314a60b 100644 --- a/fastdeploy/model_executor/layers/sample/sampler.py +++ b/fastdeploy/model_executor/layers/sample/sampler.py @@ -429,8 +429,8 @@ class MTPSampler(nn.Layer): sampling_metadata.min_dec_lens, sampling_metadata.eos_token_ids, share_inputs["seq_lens_this_time"], - share_inputs["seq_lens_encoder"], - share_inputs["seq_lens_decoder"], + share_inputs["output_padding_offset"], + share_inputs["output_cum_offsets"], max_model_len, ) probs = F.softmax(logits)