[BugFix] Set default OMP_NUM_THREADS=3 and fix extra GPU memory usage in DeepSeek (#5219)

* fix bug

* update

* update

* update

* fix copy

* update
This commit is contained in:
bukejiyu
2025-11-28 14:22:04 +08:00
committed by GitHub
parent 7dc06cac6e
commit 1539fd6056
6 changed files with 29 additions and 16 deletions

View File

@@ -453,7 +453,7 @@ class LLMEngine:
"PROTOCOL_BUFFERS_PYTHON_IMPLEMENTATION": "python",
"NCCL_ALGO": "Ring",
"FLAGS_max_partition_size": int(os.getenv("FLAGS_max_partition_size", 1024)),
-"OMP_NUM_THREADS": int(os.getenv("OMP_NUM_THREADS", 3)),
+"OMP_NUM_THREADS": 3,
"FD_ENABLE_PDL": envs.FD_ENABLE_PDL,
}
# environment variables needed by Dy2St