mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-12-24 13:28:13 +08:00
[Feature] Support_eplb (#2997)
Some checks failed
Deploy GitHub Pages / deploy (push) Has been cancelled
Some checks failed
Deploy GitHub Pages / deploy (push) Has been cancelled
* [Feature] support_eplb
* [Feature] support_eplb
* [Fix] fix mm ep
This commit is contained in:
@@ -254,7 +254,7 @@ std::vector<paddle::DataType> MoERedundantTopKSelectKernelInferDtype(
 }
 
 
-PD_BUILD_OP(moe_redundant_topk_select)
+PD_BUILD_STATIC_OP(moe_redundant_topk_select)
 .Inputs({"gating_logits", "expert_id_to_ep_rank_array", "expert_in_rank_num_list", "tokens_per_expert_stats_list", paddle::Optional("bias")})
 .Outputs({"topk_ids",
 "topk_weights",
Reference in New Issue
Block a user