mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-12-24 13:28:13 +08:00
[Feature] support eplb in api_server (#4782)
* support eplb in api_server * update code * add eplb test case * update eplb * support tp+dp eplb * update test case * update code * update code * fix bug * update copilot review * update test case name
This commit is contained in:
@@ -22,6 +22,7 @@ from .ipc_signal_const import (
|
||||
KVCacheStatus,
|
||||
ModelWeightsStatus,
|
||||
PrefixTreeStatus,
|
||||
RearrangeExpertStatus,
|
||||
)
|
||||
from .zmq_client import ZmqIpcClient
|
||||
from .zmq_server import ZmqIpcServer, ZmqTcpServer
|
||||
@@ -38,4 +39,5 @@ __all__ = [
|
||||
"PrefixTreeStatus",
|
||||
"ModelWeightsStatus",
|
||||
"KVCacheStatus",
|
||||
"RearrangeExpertStatus",
|
||||
]
|
||||
|
||||
Reference in New Issue
Block a user