Fix chunked prefill (#3778)

* update enable chunked_prefill * update code * update code * update code
2025-10-05 00:33:03 +08:00 · 2025-09-02 13:41:55 +08:00
parent 0cdbc950b5
commit a86b35ab49
4 changed files with 29 additions and 25 deletions
--- a/fastdeploy/envs.py
+++ b/fastdeploy/envs.py
@@ -93,8 +93,8 @@ environment_variables: dict[str, Callable[[], Any]] = {
    # enable multi api server
    "FD_ENABLE_MULTI_API_SERVER": lambda: bool(int(os.getenv("FD_ENABLE_MULTI_API_SERVER", "0"))),
    "FD_FOR_TORCH_MODEL_FORMAT": lambda: bool(int(os.getenv("FD_FOR_TORCH_MODEL_FORMAT", "0"))),
-    # force enable chunked prefill
-    "FD_FORCE_CHUNKED_PREFILL": lambda: bool(int(os.getenv("FD_FORCE_CHUNKED_PREFILL", "0"))),
+    # set to 1 to force-disable chunked prefill, which is otherwise enabled by default
+    "FD_DISABLE_CHUNKED_PREFILL": lambda: bool(int(os.getenv("FD_DISABLE_CHUNKED_PREFILL", "0"))),
 }