mirror of
				https://github.com/PaddlePaddle/FastDeploy.git
				synced 2025-10-25 09:31:38 +08:00 
			
		
		
		
	[Bug Fix] fix bug of prompt penalty (#2888)
This commit is contained in:
		| @@ -217,7 +217,7 @@ class GPUModelRunner(ModelRunnerBase): | ||||
|                 self.share_inputs["input_ids"][idx:idx + 1, | ||||
|                                                0] = request.prompt_token_ids[0] | ||||
|                 self.share_inputs["prompt_ids"][idx:idx + 1, | ||||
|                                                0] = request.prompt_token_ids[0] | ||||
|                                                :length] = np.array(request.prompt_token_ids) | ||||
|                 self.share_inputs['seq_lens_encoder'][idx:idx + 1] = 0 | ||||
|                 self.share_inputs['seq_lens_decoder'][idx:idx + 1] = length | ||||
|                 self.share_inputs['seq_lens_this_time'][idx:idx + 1] = 1 | ||||
|   | ||||
		Reference in New Issue
	
	Block a user
	 ming1753
					ming1753