[misc] Add FlashMLA as a new option of VLLM_ATTENTION_BACKEND env (#14267)

Author: Serena
Date: 2025-03-06 05:28:50 +08:00 (committed by GitHub)
Parent: ac60dc7fe1
Commit: 1b7624bf5c


@@ -321,6 +321,7 @@ environment_variables: dict[str, Callable[[], Any]] = {
     # - "XFORMERS": use XFormers
     # - "ROCM_FLASH": use ROCmFlashAttention
     # - "FLASHINFER": use flashinfer
+    # - "FLASHMLA": use FlashMLA
     "VLLM_ATTENTION_BACKEND":
     lambda: os.getenv("VLLM_ATTENTION_BACKEND", None),
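
For context, a minimal usage sketch (not part of this diff; assumes the standard pattern of setting the variable before vLLM initializes, since the lambda above reads it lazily):

    import os

    # Select the new FlashMLA attention backend; equivalent to running
    # `VLLM_ATTENTION_BACKEND=FLASHMLA python ...` from the shell.
    # Must be set before the vLLM engine is constructed.
    os.environ["VLLM_ATTENTION_BACKEND"] = "FLASHMLA"

    from vllm import LLM  # backend choice takes effect at engine construction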