[Graph Optimization][BugFix][CI] Fix zero-size bug and add unit test (#5495)

This commit is contained in:
Ryan
2025-12-11 16:25:26 +08:00
committed by GitHub
parent e1347be4d9
commit e58fed3665
7 changed files with 25 additions and 4 deletions

View File

@@ -1541,6 +1541,9 @@ class GPUModelRunner(ModelRunnerBase):
for attn_backend in self.attn_backends:
attn_backend.init_attention_metadata(self.forward_meta)
# Mark the forward pass as zero-size when ids_remove_padding has no rows (shape[0] == 0)
self.forward_meta.is_zero_size = self.forward_meta.ids_remove_padding.shape[0] == 0
def initialize_kv_cache(self, profile: bool = False) -> None:
"""
Initialize kv cache