mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-12-24 13:28:13 +08:00
[FDConfig]Remove max_model_len in FDConfig (#4350)
* modify max_model_len
* fix unittest
* fix unittest

---------

Co-authored-by: root <root@yqlcc01-sys-rpm12rzmwjd.yqlcc01.baidu.com>
This commit is contained in:
@@ -106,6 +106,7 @@ class TestCUDAGrpahSpecDecode(unittest.TestCase):
|
||||
cache_config = CacheConfig({})
|
||||
parallel_config = ParallelConfig(args={})
|
||||
model_config = Mock()
|
||||
model_config.max_model_len = 512
|
||||
# Initialize cuda graph capture list
|
||||
graph_opt_config._set_cudagraph_sizes(max_num_seqs=scheduler_config.max_num_seqs)
|
||||
graph_opt_config.init_with_cudagrpah_size(max_capture_size=scheduler_config.max_num_seqs)
|
||||
|
||||
Reference in New Issue
Block a user