diff --git a/fastdeploy/model_executor/layers/moe/ep.py b/fastdeploy/model_executor/layers/moe/ep.py index b1ab322a1..c2d076d0d 100644 --- a/fastdeploy/model_executor/layers/moe/ep.py +++ b/fastdeploy/model_executor/layers/moe/ep.py @@ -193,20 +193,22 @@ class DeepEPEngine: Return: combined_hidden_states: [num_tokens, hidden] """ - # TODO(@wufeisheng): Delete them when deepep in PaddlePaddle is fixed - ( - src_info, - layout_range, - num_max_dispatch_tokens_per_rank, - num_experts, - ) = handle - handle = ( - src_info, - layout_range, - num_max_dispatch_tokens_per_rank, - None, - num_experts, - ) + if paddle.__version__ != "0.0.0" and paddle.__version__ <= "3.1.0": # not develop version of PaddlePaddle + # TODO(@wanglongzhi): Delete them when deepep in PaddlePaddle is fixed + # and when the default recommended version of PaddlePaddle is greater than 3.1.0 + ( + src_info, + layout_range, + num_max_dispatch_tokens_per_rank, + num_experts, + ) = handle + handle = ( + src_info, + layout_range, + num_max_dispatch_tokens_per_rank, + None, + num_experts, + ) combined_hidden_states, _, combine_hook = self.decode_deepep_engine.low_latency_combine( hidden_states,