This commit is contained in:
RAM
2025-08-01 22:34:59 +08:00
committed by GitHub
parent c8dd5976ae
commit d4059cabf0

View File

@@ -208,7 +208,7 @@ class FlashAttentionBackend(AttentionBackend):
) = pre_cache_len_concat( ) = pre_cache_len_concat(
forward_meta.seq_lens_decoder, forward_meta.seq_lens_decoder,
forward_meta.seq_lens_this_time, forward_meta.seq_lens_this_time,
metadata.set_max_lengths[2], forward_meta.max_len_tensor_cpu[2],
self.block_size, self.block_size,
) )