[Feature] Online Chat API: support returning logprobs (#2777)

* online chat support logprobs
* check xpu
* check vl_gpu_model_runner and xpu_model_runner
* get_worker() check platform
2025-10-05 08:37:06 +08:00 · 2025-07-10 16:33:40 +08:00
parent 24f934f1f9
commit d33105baeb
22 changed files with 608 additions and 114 deletions
--- a/fastdeploy/engine/config.py
+++ b/fastdeploy/engine/config.py
@@ -590,6 +590,7 @@ class Config:
        guided_decoding_backend: Optional[str] = None,
        disable_any_whitespace: bool = False,
        enable_custom_all_reduce: bool = False,
+        enable_logprob: bool = False,
    ):
        """
        Initialize the Config class.
@@ -686,6 +687,8 @@ class Config:
        self.device_ids = ",".join([str(i) for i in range(self.worker_num_per_node)])
        self.device_ids = os.getenv("CUDA_VISIBLE_DEVICES", self.device_ids)

+        self.enable_logprob = enable_logprob
+
        self.read_from_config()
        self.postprocess()
        self.check()