mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-01-05 06:57:27 +08:00
[Feature] Batch Invariant for R1 TP 8 on Blackwell (#27229)
Signed-off-by: yewentao256 <zhyanwentao@126.com>
This commit is contained in:
parent
aa1356ec53
commit
86ed77022d
@ -756,10 +756,10 @@ def override_envs_for_invariance():
|
||||
"FLEX_ATTENTION",
|
||||
"FLASHINFER",
|
||||
"FLASH_ATTN_MLA",
|
||||
"FLASHINFER_MLA",
|
||||
"TRITON_MLA",
|
||||
# Not yet supported MLA backends
|
||||
# "FLASHMLA",
|
||||
# "FLASHINFER_MLA",
|
||||
]
|
||||
if curr_attn_backend not in supported_backends:
|
||||
warning = (
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user