mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-05 08:37:06 +08:00
Unify server-side and model-side Config (Part1) (#3018)
* move cache config
* fix mtp
This commit is contained in:
@@ -92,7 +92,7 @@ class XPUAttentionBackend(AttentionBackend):
|
||||
super().__init__()
|
||||
self.attention_metadata: XPUAttentionMetadata = None
|
||||
# TODO(gongshaotian): Use fd_config parameters in the correct location
|
||||
- self.block_size: int = fd_config.parallel_config.block_size
|
||||
+ self.block_size: int = fd_config.cache_config.block_size
|
||||
self.max_seq_len: int = fd_config.parallel_config.max_model_len
|
||||
self.rope_theta: float = (
|
||||
10000.0 if fd_config.model_config.rope_theta is None else fd_config.model_config.rope_theta
|
||||
|
Reference in New Issue
Block a user