[BugFix] fix TPDP mix parallel infer (#4583)

Co-authored-by: Yuanle Liu <yuanlehome@163.com>
This commit is contained in:
lizhenyun01
2025-10-28 16:58:20 +08:00
committed by GitHub
parent c63361fd1d
commit 4d2f478d53
3 changed files with 13 additions and 13 deletions

View File

@@ -720,7 +720,9 @@ def initialize_fd_config(args, ranks: int = 1, local_rank: int = 0) -> FDConfig:
num_experts_per_rank = num_experts // parallel_config.expert_parallel_size
num_experts_start_offset = expert_parallel_rank * num_experts_per_rank
max_chips_per_node = 16 if current_platform.is_iluvatar() else 8
- parallel_config.local_data_parallel_id = expert_parallel_rank % max_chips_per_node
+ parallel_config.local_data_parallel_id = parallel_config.data_parallel_rank % (
+ max_chips_per_node // parallel_config.tensor_parallel_size
+ )
parallel_config.expert_parallel_rank = expert_parallel_rank
parallel_config.num_experts_per_rank = num_experts_per_rank