fix w4afp8_gemm_scale_permute import error on A100 (#3611)

This commit is contained in:
Yuan Xiaolan
2025-08-28 11:42:23 +08:00
committed by GitHub
parent ad9b95e6dd
commit d37331fc71

View File

@@ -31,8 +31,12 @@ if current_platform.is_cuda():
         moe_expert_dispatch,
         moe_expert_reduce,
         noaux_tc,
-        w4afp8_gemm_scale_permute,
     )
+
+    try:
+        from fastdeploy.model_executor.ops.gpu import w4afp8_gemm_scale_permute
+    except:
+        logger.warning("import w4afp8_gemm_scale_permute Failed!")
 elif current_platform.is_iluvatar():
     from fastdeploy.model_executor.ops.iluvatar import (
         moe_expert_dispatch,