Mirror of https://github.com/PaddlePaddle/FastDeploy.git (synced 2025-12-24 13:28:13 +08:00)
[PD Disaggregation] support different tp_size for prefill and decode (#5296)
* up
* up
* up
* fix
This commit is contained in:
@@ -1888,6 +1888,7 @@ class FDConfig:
|
||||
logger.info(f"disaggregate_info: {self.disaggregate_info}")
|
||||
|
||||
if self.router_config:
|
||||
# the information for registering this server to router
|
||||
self.register_info = {
|
||||
"role": self.scheduler_config.splitwise_role,
|
||||
"host_ip": self.host_ip,
|
||||
@@ -1897,6 +1898,7 @@ class FDConfig:
|
||||
"engine_worker_queue_port": engine_worker_queue_port,
|
||||
"device_ids": self.local_device_ids,
|
||||
"transfer_protocol": self.cache_config.cache_transfer_protocol.split(","),
|
||||
"tp_size": self.parallel_config.tensor_parallel_size,
|
||||
}
|
||||
logger.info(f"register_info: {self.register_info}")
|
||||
|
||||
|
||||
Reference in New Issue
Block a user