[Graph Optimization][BugFix][CI] Fix zero-size bug and add unit test (#5495)

2025-12-24 13:28:13 +08:00 · 2025-12-11 16:25:26 +08:00
parent e1347be4d9
commit e58fed3665
7 changed files with 25 additions and 4 deletions
--- a/fastdeploy/worker/gpu_model_runner.py
+++ b/fastdeploy/worker/gpu_model_runner.py
@@ -1541,6 +1541,9 @@ class GPUModelRunner(ModelRunnerBase):
        for attn_backend in self.attn_backends:
            attn_backend.init_attention_metadata(self.forward_meta)

+        # Mark forward_meta as zero-size when ids_remove_padding is empty along dim 0
+        self.forward_meta.is_zero_size = self.forward_meta.ids_remove_padding.shape[0] == 0
+
    def initialize_kv_cache(self, profile: bool = False) -> None:
        """
        Initialize kv cache