From 99d09210498b5aaeb7e4486cae1cbd54afd7624c Mon Sep 17 00:00:00 2001 From: Wanglongzhi2001 <583087864@qq.com> Date: Thu, 9 Jan 2025 07:16:13 +0000 Subject: [PATCH] update --- llm/server/server/engine/infer.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/llm/server/server/engine/infer.py b/llm/server/server/engine/infer.py index 04c85d497..2641e8899 100644 --- a/llm/server/server/engine/infer.py +++ b/llm/server/server/engine/infer.py @@ -500,8 +500,8 @@ class ModelRunner: if self.proposer is not None: self.proposer.run( self.share_inputs, - real_batch_size=self.args.max_batch_size, - seq_lens_this_time=self.share_inputs["seq_lens_this_time"], + real_batch_size=seq_lens_this_time.shape[0], + seq_lens_this_time=seq_lens_this_time, ) self.infer_engine.predictor.run()