mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-12-24 13:28:13 +08:00
[XPU] ep+tp all2all (#4836)
This commit is contained in:
@@ -577,6 +577,15 @@ class ParallelConfig:
|
||||
else:
|
||||
self.pd_disaggregation_mode = "None"
|
||||
|
||||
# ep+tp strategy: "all_reduce" or "all_to_all"
|
||||
# all_reduce: qkv_linear + attn + out_linear + allreduce
|
||||
# all_to_all: allgather + qkv_linear + attn + all2all + out_linear
|
||||
self.ep_tp_strategy = envs.FD_EP_TP_STRATEGY
|
||||
assert self.ep_tp_strategy in [
|
||||
"all_reduce",
|
||||
"all_to_all",
|
||||
], f"FD_EP_TP_STRATEGY: '{self.ep_tp_strategy}' is not supported, only supports 'all_reduce' or 'all_to_all'."
|
||||
|
||||
def set_communicate_group(self):
|
||||
# different tp group id
|
||||
# prevent different tp_groups using the same group_id
|
||||
|
||||
Reference in New Issue
Block a user