diff --git a/fastdeploy/entrypoints/engine_client.py b/fastdeploy/entrypoints/engine_client.py index 9babe8fec..5b2684529 100644 --- a/fastdeploy/entrypoints/engine_client.py +++ b/fastdeploy/entrypoints/engine_client.py @@ -438,12 +438,12 @@ class EngineClient: raise ParameterError("prompt_logprobs", err_msg) if not envs.FD_USE_GET_SAVE_OUTPUT_V1: - err_msg = "prompt_logprobs is not support when FD_USE_GET_SAVE_OUTPUT_V1 is disabled." + err_msg = "prompt_logprobs is not supported when FD_USE_GET_SAVE_OUTPUT_V1 is disabled." api_server_logger.error(err_msg) raise ParameterError("prompt_logprobs", err_msg) if self.enable_prefix_caching: - err_msg = "prompt_logprobs is not support when prefix caching is enabled." + err_msg = "prompt_logprobs is not supported when prefix caching is enabled." api_server_logger.error(err_msg) raise ParameterError("prompt_logprobs", err_msg) diff --git a/fastdeploy/model_executor/layers/activation.py b/fastdeploy/model_executor/layers/activation.py index 35aa40b77..d0e6400e2 100644 --- a/fastdeploy/model_executor/layers/activation.py +++ b/fastdeploy/model_executor/layers/activation.py @@ -104,7 +104,7 @@ class SiluAndMul(nn.Layer): bfloat16 as default dtype, but received {self._dtype}" ) - # fp8 is not support smooth quantization + # fp8 does not support smooth quantization if fd_config.quant_config and "fp8" in fd_config.quant_config.name(): self.dequant_scales = None self.shift = None diff --git a/fastdeploy/spec_decode/__init__.py b/fastdeploy/spec_decode/__init__.py index 086b5003a..6340691f4 100644 --- a/fastdeploy/spec_decode/__init__.py +++ b/fastdeploy/spec_decode/__init__.py @@ -19,7 +19,7 @@ from fastdeploy.platforms import current_platform from .base import Proposer from .mtp import MTPProposer -# XPU is not support ngram proposer now +# XPU does not support ngram proposer now if not current_platform.is_xpu(): from .ngram import NgramProposer __all__ = ["Proposer", "MTPProposer", "NgramProposer"]