Fix num_blocks_local for small-size models in TP2 running mode (#2792)

This commit is contained in:
gaoziyuan
2025-07-12 12:50:48 +08:00
committed by GitHub
parent 749b2e9c89
commit e9e8443ea8

View File

@@ -360,11 +360,11 @@ class PaddleDisWorkerProc():
model_block_memory_used) model_block_memory_used)
# NOTE(liuzichang): Too many blocks will lead to illegal memory access # NOTE(liuzichang): Too many blocks will lead to illegal memory access
# We will develop dynamic limits in the future. # We will develop dynamic limits in the future.
if num_blocks_local > 20000: if num_blocks_local > 40000:
logger.info( logger.info(
f"------- Reset num_blocks_local {num_blocks_local} to 20000" f"------- Reset num_blocks_local {num_blocks_local} to 40000"
) )
num_blocks_local = min(20000, num_blocks_local) num_blocks_local = min(40000, num_blocks_local)
logger.info( logger.info(
f"------- model_block_memory_used:{model_block_memory_used} --------" f"------- model_block_memory_used:{model_block_memory_used} --------"
) )