mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-05 08:37:06 +08:00
Add custom op declaration for all_reduce (#3473)
* add custom op declaration
* roll back try except
This commit is contained in:
@@ -89,6 +89,9 @@ class MLAAttentionMetadata(AttentionMetadata):
|
||||
kv_signal_metadata: Optional[paddle.Tensor] = None
|
||||
kv_signal_data_list: List[Optional[paddle.Tensor]] = field(default_factory=list)
|
||||
|
||||
max_enc_len_this_time: Optional[paddle.Tensor] = None
|
||||
max_dec_len_this_time: Optional[paddle.Tensor] = None
|
||||
|
||||
|
||||
class MLAAttentionBackend(AttentionBackend):
|
||||
"""
|
||||
|
Reference in New Issue
Block a user