[Feature] support custom all-reduce (#2758)

* [Feature] support custom all-reduce
* add vllm adapted
2025-10-05 08:37:06 +08:00 · 2025-07-09 16:00:27 +08:00
parent be21ef5047
commit b89180f1cd
16 changed files with 1194 additions and 2 deletions
--- a/fastdeploy/engine/config.py
+++ b/fastdeploy/engine/config.py
@@ -447,6 +447,7 @@ class ParallelConfig:
        tensor_parallel_size: int = 1,
        data_parallel_size: int = 1,
        enable_expert_parallel: bool = False,
+        enable_custom_all_reduce: bool = False,
    ):
        """
        Initialize the ParallelConfig class.
@@ -462,6 +463,7 @@ class ParallelConfig:
        self.enable_expert_parallel = enable_expert_parallel
        self.expert_parallel_size = data_parallel_size
        self.local_data_parallel_id = 0
+        self.enable_custom_all_reduce = enable_custom_all_reduce

    def print(self):
        """
@@ -587,6 +589,7 @@ class Config:
        max_capture_batch_size: int = 64,
        guided_decoding_backend: Optional[str] = None,
        disable_any_whitespace: bool = False,
+        enable_custom_all_reduce: bool = False,
    ):
        """
        Initialize the Config class.