mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-05 08:37:06 +08:00
Unify server-side and model-side Config (Part1) (#3018)
* move cache config
* fix mtp
This commit is contained in:
@@ -95,7 +95,7 @@ class AppendAttentionBackend(AttentionBackend):
         """
         super().__init__()
         self.attention_metadata: AppendAttentionMetadata = None
-        self.block_size: int = fd_config.parallel_config.block_size
+        self.block_size: int = fd_config.cache_config.block_size
         self.max_seq_len: int = fd_config.parallel_config.max_model_len
         self.rope_theta: float = (
             10000.0 if fd_config.model_config.rope_theta is None else fd_config.model_config.rope_theta
Reference in New Issue
Block a user