mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-12-24 13:28:13 +08:00
[XPU] refactor of block_attn param 'pos_emb_type' (#5511)
This commit is contained in:
@@ -253,8 +253,6 @@ class XPUForwardMeta(ForwardMeta):
|
||||
dec_batch: Optional[paddle.Tensor] = None
|
||||
#
|
||||
total_enc_len: Optional[paddle.Tensor] = None
|
||||
# position embedding type in rope, supports 'NORMAL' or 'HALF_HEAD_DIM'
|
||||
pos_emb_type: Optional[str] = "NORMAL"
|
||||
# for pd_disaggregation
|
||||
kv_signal_sender: Optional[paddle.Tensor] = None
|
||||
|
||||
|
||||
@@ -213,7 +213,7 @@ class XPUAttentionBackend(AttentionBackend):
|
||||
None, # smooth
|
||||
metadata.kv_signal_data_list[layer.layer_id], # kv_signal_data
|
||||
forward_meta.kv_signal_sender, # kv_signal_sender
|
||||
forward_meta.pos_emb_type,
|
||||
layer.use_neox_rotary_style,
|
||||
self.rope_3d,
|
||||
)
|
||||
|
||||
|
||||
Reference in New Issue
Block a user