mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-12-24 13:28:13 +08:00
[Feature] support chunked moe (#4575)
* [Feature] support chunked moe * update * update * fix and add test * update * fix conflict and modify test * fix fused_moe * fix fused_moe * fix docstring * fix * fix typo * fix test * fix * fix * fix test * fix test
This commit is contained in:
@@ -540,6 +540,11 @@ class ParallelConfig:
|
||||
self.expert_parallel_size = 1 # EP degree
|
||||
self.data_parallel_size = 1 # DP degree
|
||||
self.enable_expert_parallel = False
|
||||
self.enable_chunked_moe = False
|
||||
self.chunked_moe_size = 256
|
||||
self.max_moe_num_chunk = 1
|
||||
self.moe_num_chunk = 1
|
||||
|
||||
self.local_data_parallel_id = 0
|
||||
# Engine worker queue port
|
||||
self.engine_worker_queue_port: str = "9923"
|
||||
|
||||
Reference in New Issue
Block a user