mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-05 16:48:03 +08:00
Unify server-side and model-side Config (Part1) (#3018)
* move cache config
* fix mtp
This commit is contained in:
@@ -113,7 +113,7 @@ class MLAAttentionBackend(AttentionBackend):
|
||||
self.attention_metadata: MLAAttentionMetadata = None
|
||||
|
||||
# 基础配置
|
||||
- self.block_size: int = fd_config.parallel_config.block_size
|
||||
+ self.block_size: int = fd_config.cache_config.block_size
|
||||
self.max_seq_len: int = fd_config.parallel_config.max_model_len
|
||||
self.rope_theta: float = (
|
||||
10000.0 if fd_config.model_config.rope_theta is None else fd_config.model_config.rope_theta
|
||||
|
Reference in New Issue
Block a user