From 07334959d81076d49ea78b9ab3bfcafa4227f0ee Mon Sep 17 00:00:00 2001 From: Lucas Wilkinson Date: Mon, 16 Jun 2025 23:32:49 -0400 Subject: [PATCH] [Wheel Size] Only build FA2 8.0+PTX (#19336) --- cmake/external_projects/vllm_flash_attn.cmake | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/cmake/external_projects/vllm_flash_attn.cmake b/cmake/external_projects/vllm_flash_attn.cmake index a4edd5b96fe2..dba5baa362b8 100644 --- a/cmake/external_projects/vllm_flash_attn.cmake +++ b/cmake/external_projects/vllm_flash_attn.cmake @@ -38,7 +38,7 @@ else() FetchContent_Declare( vllm-flash-attn GIT_REPOSITORY https://github.com/vllm-project/flash-attention.git - GIT_TAG 8798f27777fb57f447070301bf33a9f9c607f491 + GIT_TAG 763ad155a1c826f71ff318f41edb1e4e5e376ddb GIT_PROGRESS TRUE # Don't share the vllm-flash-attn build between build types BINARY_DIR ${CMAKE_BINARY_DIR}/vllm-flash-attn