From e2fbfc955e1bc9f67c349c5a2bde63a3edd86b84 Mon Sep 17 00:00:00 2001 From: Divakar Verma <137818590+divakar-amd@users.noreply.github.com> Date: Mon, 1 Dec 2025 23:27:46 -0600 Subject: [PATCH] [CI][AMD] spec_decode:eagle skip FLASH_ATTN for deepseek on ROCm (#29827) Signed-off-by: Divakar Verma --- tests/v1/e2e/test_spec_decode.py | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/tests/v1/e2e/test_spec_decode.py b/tests/v1/e2e/test_spec_decode.py index f711715dec0e6..5246ea6517f6c 100644 --- a/tests/v1/e2e/test_spec_decode.py +++ b/tests/v1/e2e/test_spec_decode.py @@ -414,7 +414,10 @@ def test_eagle_correctness( ) if attn_backend == "FLASH_ATTN" and current_platform.is_rocm(): - m.setenv("VLLM_ROCM_USE_AITER", "1") + if "deepseek" in model_setup[1].lower(): + pytest.skip("FLASH_ATTN for deepseek not supported on ROCm platform") + else: + m.setenv("VLLM_ROCM_USE_AITER", "1") method, model_name, spec_model_name, tp_size = model_setup max_model_len = 2048