[Bug Fix] Fix prompt penalty bug: store the full prompt in prompt_ids instead of only the first token (#2888)

2025-10-05 08:37:06 +08:00 · 2025-07-17 17:21:37 +08:00
parent 273efba76f
commit 67180c1ff9
1 changed file with 1 addition and 1 deletion
--- a/fastdeploy/worker/gpu_model_runner.py
+++ b/fastdeploy/worker/gpu_model_runner.py
@@ -217,7 +217,7 @@ class GPUModelRunner(ModelRunnerBase):
                self.share_inputs["input_ids"][idx:idx + 1,
                                               0] = request.prompt_token_ids[0]
                self.share_inputs["prompt_ids"][idx:idx + 1,
-                                               0] = request.prompt_token_ids[0]
+                                               :length] = np.array(request.prompt_token_ids)
                self.share_inputs['seq_lens_encoder'][idx:idx + 1] = 0
                self.share_inputs['seq_lens_decoder'][idx:idx + 1] = length
                self.share_inputs['seq_lens_this_time'][idx:idx + 1] = 1