mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-12-24 13:28:13 +08:00
@@ -83,14 +83,9 @@ void w4afp8_gemm_M{M}_N{N}_TAILN{TAILN}_K{K}_B{BATCH}_P{PADDING}_{TYPE}(
|
||||
}}
|
||||
"""
|
||||
|
||||
gemm_case = [
|
||||
[8192, 3584, 8, 0], # eb45T ffn1
|
||||
[8192, 3584, 8, 2048], # eb45T ffn1
|
||||
[7168, 8192, 8, 0], # eb45T ffn2
|
||||
[7168, 8192, 8, 2048], # eb45T ffn2
|
||||
]
|
||||
gemm_case = [[256, 256, 1, 0]]
|
||||
|
||||
dtype = ["BF16", "FP16"]
|
||||
dtype = ["BF16"]
|
||||
|
||||
|
||||
def get_cutlass_type(type):
|
||||
|
||||
Reference in New Issue
Block a user