ep support logprob (#4089) (#4151)

This commit is contained in:
chen
2025-09-19 14:07:31 +08:00
committed by GitHub
parent a685e5ad35
commit 66a98b44ed
3 changed files with 11 additions and 17 deletions

View File

@@ -303,24 +303,23 @@ class TokenProcessor:
         continue
 else:
-    if (
+    if self.use_logprobs:
+        get_output_topk(
+            self.output_tokens,
+            self.output_scores,
+            self.output_ranks,
+            K,
+            rank_id,
+            is_blocking,
+        )
+    elif (
         self.cfg.parallel_config.enable_expert_parallel
         and self.cfg.parallel_config.data_parallel_size > 1
     ):
         get_output_ep(self.output_tokens, rank_id, is_blocking)
     else:
-        if self.use_logprobs:
-            get_output_topk(
-                self.output_tokens,
-                self.output_scores,
-                self.output_ranks,
-                K,
-                rank_id,
-                is_blocking,
-            )
-        else:
-            get_output(self.output_tokens, rank_id, is_blocking)
+        get_output(self.output_tokens, rank_id, is_blocking)
     if self.output_tokens[0, 0] == -2:
         continue