mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-12-24 13:28:13 +08:00
dcu adapter ernie45t (#2756)
Co-authored-by: lifu <lifu@sugon.com> Co-authored-by: yongqiangma <xing.wo@163.com>
This commit is contained in:
@@ -20,9 +20,11 @@ from .mla_attention_backend import MLAAttentionBackend
|
||||
from .native_paddle_backend import PaddleNativeAttnBackend
|
||||
from .xpu_attn_backend import XPUAttentionBackend
|
||||
from .iluvatar_attn_backend import IluvatarAttnBackend
|
||||
+from .block_multihead_attn_backend import BlockAttentionBackend
|
||||
|
||||
__all__ = [
|
||||
"AttentionBackend", "PaddleNativeAttnBackend",
|
||||
"get_attention_backend", "AppendAttentionBackend", "XPUAttentionBackend",
|
||||
-"MLAAttentionBackend", "FlashAttentionBackend", "IluvatarAttnBackend"
|
||||
+"MLAAttentionBackend", "FlashAttentionBackend", "IluvatarAttnBackend",
|
||||
+"BlockAttentionBackend"
|
||||
]
|
||||
|
||||
Reference in New Issue
Block a user