This commit is contained in:
co63oc
2025-09-01 17:50:17 +08:00
committed by GitHub
parent 0513a78ecc
commit d6369b4d51
67 changed files with 85 additions and 85 deletions

View File

@@ -176,7 +176,7 @@ class FlashAttentionBackend(AttentionBackend):
kv_cache_quant_type: str = None,
):
"""
- Caculate kv cache shape
+ Calculate kv cache shape
"""
if kv_cache_quant_type is not None and kv_cache_quant_type == "int4_zp":
return (