Mirror of https://github.com/PaddlePaddle/FastDeploy.git (synced 2025-12-24 13:28:13 +08:00)
[XPU] refactor of block_attn param 'pos_emb_type' (#5511)
This commit is contained in:
@@ -253,8 +253,6 @@ class XPUForwardMeta(ForwardMeta):
|
||||
dec_batch: Optional[paddle.Tensor] = None
|
||||
#
|
||||
total_enc_len: Optional[paddle.Tensor] = None
|
||||
# position embedding type in rope, supports 'NORMAL' or 'HALF_HEAD_DIM'
|
||||
pos_emb_type: Optional[str] = "NORMAL"
|
||||
# for pd_disaggregation
|
||||
kv_signal_sender: Optional[paddle.Tensor] = None
|
||||
|
||||
|
||||
Reference in New Issue
Block a user