From 86ed77022db254cab1386c211f150d3840af156c Mon Sep 17 00:00:00 2001 From: Wentao Ye <44945378+yewentao256@users.noreply.github.com> Date: Tue, 21 Oct 2025 13:25:55 -0400 Subject: [PATCH] [Feature] Batch Invariant for R1 TP 8 on Blackwell (#27229) Signed-off-by: yewentao256 --- vllm/model_executor/layers/batch_invariant.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/vllm/model_executor/layers/batch_invariant.py b/vllm/model_executor/layers/batch_invariant.py index f3ec6b5035889..7368bfd35fec9 100644 --- a/vllm/model_executor/layers/batch_invariant.py +++ b/vllm/model_executor/layers/batch_invariant.py @@ -756,10 +756,10 @@ def override_envs_for_invariance(): "FLEX_ATTENTION", "FLASHINFER", "FLASH_ATTN_MLA", + "FLASHINFER_MLA", "TRITON_MLA", # Not yet supported MLA backends # "FLASHMLA", - # "FLASHINFER_MLA", ] if curr_attn_backend not in supported_backends: warning = (