FastDeploy

mirror of https://github.com/PaddlePaddle/FastDeploy.git synced 2025-12-24 13:28:13 +08:00

Files

YuBaoku 819b2dbbae Revert "【New Feature】W4afp8 supports per group quantization (#4272 )" (#4854 )

This reverts commit 93fcf7e4ec.

2025-11-06 17:48:28 +08:00

__init__.py

2025-08-25 11:27:45 +08:00

ep.py

2025-11-04 16:35:40 +08:00

fused_moe_backend_base.py

2025-11-06 10:32:15 +08:00

fused_moe_cutlass_backend.py

2025-11-06 17:48:28 +08:00

fused_moe_deepgemm_backend.py

2025-11-06 10:32:15 +08:00

fused_moe_marlin_backend.py

2025-10-30 18:59:04 +08:00

fused_moe_triton_backend.py

2025-10-17 11:47:16 +08:00

fused_moe_wint2_backend.py

2025-11-06 17:48:28 +08:00

moe.py

2025-11-06 17:26:14 +08:00

triton_moe_kernels.py

2025-09-24 16:39:51 +08:00