mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-12-24 13:28:13 +08:00
[FDConfig]Remove max_num_batched_tokens/max_num_seqs in parallel config (#4116)
* remove max_num_batched_tokens in parallel config
* remove max_num_seqs
* update test case
* fix test
* fix

---------

Co-authored-by: Jiang-Jia-Jun <163579578+Jiang-Jia-Jun@users.noreply.github.com>
This commit is contained in:
@@ -50,8 +50,9 @@ class Proposer(ABC):
|
||||
self.speculative_config = self.cfg.speculative_config
|
||||
self.cache_config = self.cfg.cache_config
|
||||
self.quant_config = self.cfg.quant_config
|
||||
+self.scheduler_config = self.cfg.scheduler_config
|
||||
|
||||
-self.max_num_seqs = self.parallel_config.max_num_seqs
|
||||
+self.max_num_seqs = self.scheduler_config.max_num_seqs
|
||||
self.max_model_len = self.parallel_config.max_model_len
|
||||
self.speculative_method = self.speculative_config.method
|
||||
self.max_draft_token_num = self.speculative_config.num_speculative_tokens
|
||||
|
||||
Reference in New Issue
Block a user