From fb2eb403abfa4a8db7c8d8ac4231d50d6561a4c9 Mon Sep 17 00:00:00 2001 From: chenjian <1435317881@qq.com> Date: Mon, 10 Nov 2025 21:38:02 +0800 Subject: [PATCH] [Opti] Unlimit zmq message lens limit (#4465) Co-authored-by: Jiang-Jia-Jun <163579578+Jiang-Jia-Jun@users.noreply.github.com> --- fastdeploy/envs.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/fastdeploy/envs.py b/fastdeploy/envs.py index 901f677cd..9311948c4 100644 --- a/fastdeploy/envs.py +++ b/fastdeploy/envs.py @@ -44,7 +44,7 @@ environment_variables: dict[str, Callable[[], Any]] = { # Whether to use HuggingFace tokenizer. "FD_USE_HF_TOKENIZER": lambda: bool(int(os.getenv("FD_USE_HF_TOKENIZER", "0"))), # Set the high watermark (HWM) for receiving data during ZMQ initialization - "FD_ZMQ_SNDHWM": lambda: os.getenv("FD_ZMQ_SNDHWM", 64000), + "FD_ZMQ_SNDHWM": lambda: os.getenv("FD_ZMQ_SNDHWM", 0), # cache kv quant params directory "FD_CACHE_PARAMS": lambda: os.getenv("FD_CACHE_PARAMS", "none"), # Set attention backend. "NATIVE_ATTN", "APPEND_ATTN"