mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-06 17:17:14 +08:00
This reverts commit b0f1e0eef4
.
This commit is contained in:
@@ -124,9 +124,19 @@ class EngineArgs:
|
||||
Ratio of tokens to process in a block.
|
||||
"""
|
||||
|
||||
ips: Optional[List[str]] = None
|
||||
dist_init_ip: Optional[str] = None
|
||||
"""
|
||||
The ips of multinode deployment
|
||||
The master node ip of multinode deployment
|
||||
"""
|
||||
|
||||
nnodes: int = 1
|
||||
"""
|
||||
The number of nodes in multinode deployment
|
||||
"""
|
||||
|
||||
node_rank: int = 0
|
||||
"""
|
||||
The rank of the current node in multinode deployment
|
||||
"""
|
||||
|
||||
swap_space: float = None
|
||||
@@ -485,11 +495,25 @@ class EngineArgs:
|
||||
# Cluster system parameters group
|
||||
system_group = parser.add_argument_group("System Configuration")
|
||||
system_group.add_argument(
|
||||
"--ips",
|
||||
type=lambda s: s.split(",") if s else None,
|
||||
default=EngineArgs.ips,
|
||||
"--dist-init-ip",
|
||||
default=EngineArgs.dist_init_ip,
|
||||
help=
|
||||
"IP addresses of all nodes participating in distributed inference.")
|
||||
"IP addresses of master node.")
|
||||
|
||||
system_group.add_argument(
|
||||
"--nnodes",
|
||||
type=int,
|
||||
default=EngineArgs.nnodes,
|
||||
help=
|
||||
"The number of all nodes.")
|
||||
|
||||
system_group.add_argument(
|
||||
"--node-rank",
|
||||
type=int,
|
||||
default=EngineArgs.node_rank,
|
||||
help=
|
||||
"node rank id (range [0, nnodes)).")
|
||||
|
||||
|
||||
|
||||
# Performance tuning parameters group
|
||||
@@ -789,7 +813,9 @@ class EngineArgs:
|
||||
max_num_seqs=self.max_num_seqs,
|
||||
speculative_config=speculative_cfg,
|
||||
max_num_batched_tokens=self.max_num_batched_tokens,
|
||||
ips=self.ips,
|
||||
dist_init_ip=self.dist_init_ip,
|
||||
nnodes=self.nnodes,
|
||||
node_rank=self.node_rank,
|
||||
use_warmup=self.use_warmup,
|
||||
engine_worker_queue_port=self.engine_worker_queue_port,
|
||||
limit_mm_per_prompt=self.limit_mm_per_prompt,
|
||||
|
Reference in New Issue
Block a user