From 2f3461ad23cc5db8c04550b95404630453a03746 Mon Sep 17 00:00:00 2001 From: Sage Moore Date: Thu, 3 Jul 2025 13:45:52 +0000 Subject: [PATCH] cleanup flashmla.py Signed-off-by: Sage Moore --- vllm/v1/attention/backends/mla/flashmla.py | 1 - 1 file changed, 1 deletion(-) diff --git a/vllm/v1/attention/backends/mla/flashmla.py b/vllm/v1/attention/backends/mla/flashmla.py index f67278b6693db..be26e0060db5e 100644 --- a/vllm/v1/attention/backends/mla/flashmla.py +++ b/vllm/v1/attention/backends/mla/flashmla.py @@ -76,7 +76,6 @@ class FlashMLAMetadataBuilder(MLACommonMetadataBuilder[FlashMLAMetadata]): ) if self.runner.full_cuda_graph: - n = num_splits.size(0) # First time around (CUDAGraph capture), allocate the static buffer if self.cg_buf_tile_scheduler_metadata is None: self.cg_buf_tile_scheduler_metadata = tile_scheduler_metadata