diff --git a/tests/v1/e2e/test_spec_decode.py b/tests/v1/e2e/test_spec_decode.py index f711715dec0e6..5246ea6517f6c 100644 --- a/tests/v1/e2e/test_spec_decode.py +++ b/tests/v1/e2e/test_spec_decode.py @@ -414,7 +414,10 @@ def test_eagle_correctness( ) if attn_backend == "FLASH_ATTN" and current_platform.is_rocm(): - m.setenv("VLLM_ROCM_USE_AITER", "1") + if "deepseek" in model_setup[1].lower(): + pytest.skip("FLASH_ATTN for deepseek not supported on ROCm platform") + else: + m.setenv("VLLM_ROCM_USE_AITER", "1") method, model_name, spec_model_name, tp_size = model_setup max_model_len = 2048