mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-03 15:56:49 +08:00
[Feature] support custom all-reduce (#2758)
* [Feature] support custom all-reduce * add vllm adapted
This commit is contained in:
@@ -207,6 +207,8 @@ class ParallelConfig:
|
||||
guided_decoding_backend: str = None
|
||||
# disable any whitespace for guided decoding
|
||||
disable_any_whitespace: bool = True
|
||||
# enable the custom all-reduce kernel; otherwise fall back to NCCL (dist.all_reduce).
|
||||
enable_custom_all_reduce: str = "store_true"
|
||||
|
||||
|
||||
@dataclass
|
||||
|
Reference in New Issue
Block a user