[Bugfix] Free cross attention block table for preempted-for-recompute sequence group. (#10013)

Signed-off-by: Kathy Yu <feiyangyu@google.com>
This commit is contained in:
Kathy Yu 2025-01-02 10:28:09 -08:00 committed by GitHub
parent 84c35c374a
commit 2f385183f3
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -1579,6 +1579,7 @@ class Scheduler:
seq.status = SequenceStatus.WAITING seq.status = SequenceStatus.WAITING
self.free_seq(seq) self.free_seq(seq)
seq.reset_state_for_recompute() seq.reset_state_for_recompute()
self._free_seq_group_cross_attn_blocks(seq_group)
def _preempt_by_swap( def _preempt_by_swap(
self, self,