From 28566d73b3c76aa80548a4fb91b4b97cc02b22bc Mon Sep 17 00:00:00 2001
From: Hongxia Yang <62075498+hongxiayang@users.noreply.github.com>
Date: Thu, 1 May 2025 10:54:25 -0400
Subject: [PATCH] [ROCm] remove unsupported archs from rocm triton flash-attention supported list (#17536)

Signed-off-by: Hongxia Yang
---
 vllm/attention/ops/triton_flash_attention.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/vllm/attention/ops/triton_flash_attention.py b/vllm/attention/ops/triton_flash_attention.py
index e98b5254541b6..23ac7d7dc84ca 100644
--- a/vllm/attention/ops/triton_flash_attention.py
+++ b/vllm/attention/ops/triton_flash_attention.py
@@ -650,7 +650,7 @@ def get_general_autotune_configs():
 
 
 def has_cdna_target():
-    ROCM_CDNA_TARGETS = ["gfx940", "gfx941", "gfx942", "gfx90a", "gfx908"]
+    ROCM_CDNA_TARGETS = ["gfx942", "gfx90a", "gfx908"]
     return triton.runtime.driver.active.get_current_target(
     ).arch in ROCM_CDNA_TARGETS
 