Fix num_blocks_local for small-size models running in TP2 mode (#2793)

This commit is contained in:
gaoziyuan
2025-07-10 13:44:56 +08:00
committed by GitHub
parent 1107e08cd9
commit 39d2a1de46

View File

@@ -346,11 +346,11 @@ class PaddleDisWorkerProc():
model_block_memory_used)
# NOTE(liuzichang): Too many blocks will lead to illegal memory access.
# We will develop dynamic limits in the future.
if num_blocks_local > 20000:
if num_blocks_local > 40000:
logger.info(
f"------- Reset num_blocks_local {num_blocks_local} to 20000"
f"------- Reset num_blocks_local {num_blocks_local} to 40000"
)
num_blocks_local = min(20000, num_blocks_local)
num_blocks_local = min(40000, num_blocks_local)
logger.info(
f"------- model_block_memory_used:{model_block_memory_used} --------"
)