diff --git a/fastdeploy/engine/engine.py b/fastdeploy/engine/engine.py index cf7d31fe0..b28593697 100644 --- a/fastdeploy/engine/engine.py +++ b/fastdeploy/engine/engine.py @@ -235,9 +235,6 @@ class LLMEngine: request.get("max_tokens"), ), ) - if request.get("reasoning_max_tokens") is None: - default_reasoning_max_tokens = max(int(request.get("max_tokens") * 0.8), 1) - request.set("reasoning_max_tokens", default_reasoning_max_tokens) min_tokens = request.get("min_tokens") if input_ids_len + min_tokens >= self.cfg.max_model_len: error_msg = (