Revert "Revert "[Optim] Remove limitation of number of kvcache blocks (#5612)…"

This reverts commit c1aa66df02.
This commit is contained in:
Jiang-Jia-Jun
2025-12-23 15:42:10 +08:00
committed by GitHub
parent c1aa66df02
commit 6250c686cc
7 changed files with 20 additions and 12 deletions

View File

@@ -88,5 +88,9 @@ environment_variables: dict[str, Callable[[], Any]] = {
# Count for cache_transfer_manager process error
"FD_CACHE_PROC_ERROR_COUNT": lambda: int(os.getenv("FD_CACHE_PROC_ERROR_COUNT", "10")),
# Maximum number of KV cache blocks the engine is allowed to allocate.
# Set to -1 (default) for no limit, or to a positive integer to cap the number of blocks that can be allocated.
"FD_MAX_KVCACHE_BLOCKS": lambda: int(os.getenv("FD_MAX_KVCACHE_BLOCKS", "-1")),
}
```