[Optimization] compute real max_logprobs in batch (#5430) (#5448)

This commit is contained in:
chen
2025-12-09 16:48:06 +08:00
committed by GitHub
parent 2c55bbc3f8
commit b491dcd23c
4 changed files with 48 additions and 7 deletions

View File

@@ -187,7 +187,12 @@ class Request:
pooling_params = PoolingParams.from_dict(d["pooling_params"])
else:
sampling_params = SamplingParams.from_dict(d)
logprobs = d.get("logprobs", None)
if logprobs is not None:
if logprobs is True:
sampling_params.logprobs = d.get("top_logprobs", None)
elif logprobs is False:
sampling_params.logprobs = None
if (
isinstance(d.get("multimodal_inputs"), dict)
and isinstance(d["multimodal_inputs"].get("mm_positions"), list)