delete max-len (#2959)

2025-10-04 16:22:57 +08:00 · 2025-07-23 15:11:39 +08:00
parent 5b59a97030
commit 9b22b8d2c3
5 changed files with 3 additions and 7 deletions
--- a/fastdeploy/worker/gpu_model_runner.py
+++ b/fastdeploy/worker/gpu_model_runner.py
@@ -601,7 +601,6 @@ class GPUModelRunner(ModelRunnerBase):
            output_cum_offsets,
            output_padding_offset,
        ) = pre_process(
-            self.parallel_config.max_model_len,
            self.share_inputs["input_ids"],
            self.share_inputs["seq_lens_this_time"],
            self.speculative_decoding,