mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-30 11:26:39 +08:00
Support 45t fp8 8 GPU (#3659)
This commit is contained in:
@@ -14,14 +14,11 @@
|
||||
# limitations under the License.
|
||||
"""
|
||||
|
||||
import triton
|
||||
import triton.language as tl
|
||||
|
||||
from fastdeploy.model_executor.ops.triton_ops.triton_utils_v2 import (
|
||||
paddle_use_triton_v2,
|
||||
)
|
||||
|
||||
|
||||
@paddle_use_triton_v2()
|
||||
@triton.jit()
|
||||
def fused_moe_kernel_paddle(
|
||||
a_ptr,
|
||||
b_ptr,
|
||||
|
||||
Reference in New Issue
Block a user