[FDConfig] Remove max_model_len from FDConfig (#4350)

* modify max_model_len

* fix unittest

* fix unittest

---------

Co-authored-by: root <root@yqlcc01-sys-rpm12rzmwjd.yqlcc01.baidu.com>
This commit is contained in:
YuanRisheng
2025-10-11 14:04:17 +08:00
committed by GitHub
parent 365601ea5a
commit a2ec2c4152
36 changed files with 127 additions and 121 deletions

View File

@@ -630,7 +630,7 @@ class EngineService:
available_blocks=available_blocks,
block_size=self.cfg.cache_config.block_size,
reserved_output_blocks=self.cfg.cache_config.enc_dec_block_num,
-max_num_batched_tokens=self.cfg.max_model_len,
+max_num_batched_tokens=self.cfg.model_config.max_model_len,
batch=num_prefill_batch,
)
if self.cfg.scheduler_config.splitwise_role != "mixed":