mirror of
				https://github.com/PaddlePaddle/FastDeploy.git
				synced 2025-10-31 03:46:40 +08:00 
			
		
		
		
	Adapt for Iluvatar GPU (#2684)
This commit is contained in:
		| @@ -19,9 +19,10 @@ from .flash_attn_backend import FlashAttentionBackend | ||||
| from .mla_attention_backend import MLAAttentionBackend | ||||
| from .native_paddle_backend import PaddleNativeAttnBackend | ||||
| from .xpu_attn_backend import XPUAttentionBackend | ||||
| from .iluvatar_attn_backend import IluvatarAttnBackend | ||||
|  | ||||
| __all__ = [ | ||||
|     "AttentionBackend", "PaddleNativeAttnBackend", | ||||
|     "get_attention_backend", "AppendAttentionBackend", "XPUAttentionBackend", | ||||
|     "MLAAttentionBackend", "FlashAttentionBackend" | ||||
|     "MLAAttentionBackend", "FlashAttentionBackend", "IluvatarAttnBackend" | ||||
| ] | ||||
|   | ||||
		Reference in New Issue
	
	Block a user
	 liddk1121
					liddk1121