mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-05 16:48:03 +08:00
dcu adapter ernie45t (#2756)
Co-authored-by: lifu <lifu@sugon.com> Co-authored-by: yongqiangma <xing.wo@163.com>
This commit is contained in:
@@ -29,7 +29,7 @@ from fastdeploy.model_executor.layers.attention.ops import (
|
||||
open_shm_and_get_meta_signal)
|
||||
from fastdeploy.platforms import current_platform
|
||||
|
||||
if current_platform.is_cuda():
|
||||
if current_platform.is_cuda() and not current_platform.is_dcu():
|
||||
from fastdeploy.model_executor.ops.gpu import (decode_mla_write_cache,
|
||||
multi_head_latent_attention,
|
||||
prefill_mla_write_cache)
|
||||
|
Reference in New Issue
Block a user