[misc] Add FlashMLA as a new option of VLLM_ATTENTION_BACKEND env (#14267)
commit 1b7624bf5c
parent ac60dc7fe1
@@ -321,6 +321,7 @@ environment_variables: dict[str, Callable[[], Any]] = {
     # - "XFORMERS": use XFormers
     # - "ROCM_FLASH": use ROCmFlashAttention
     # - "FLASHINFER": use flashinfer
+    # - "FLASHMLA": use FlashMLA
     "VLLM_ATTENTION_BACKEND":
     lambda: os.getenv("VLLM_ATTENTION_BACKEND", None),
 
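For reference, a minimal sketch of how the new value is consumed. It mirrors the lazy-lambda pattern shown in the hunk above rather than importing vLLM itself, so the dict here is a standalone illustration, not the library's actual module:

import os
from typing import Any, Callable

# Same pattern as the entry in the hunk: the env var is read lazily via a lambda.
environment_variables: dict[str, Callable[[], Any]] = {
    "VLLM_ATTENTION_BACKEND":
    lambda: os.getenv("VLLM_ATTENTION_BACKEND", None),
}

# Selecting the newly added FlashMLA backend by setting the env var
# before it is read:
os.environ["VLLM_ATTENTION_BACKEND"] = "FLASHMLA"
print(environment_variables["VLLM_ATTENTION_BACKEND"]())  # -> FLASHMLA

In practice the variable would be exported in the shell (VLLM_ATTENTION_BACKEND=FLASHMLA) before launching vLLM, so the backend selection picks it up at startup.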