mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-26 06:49:38 +08:00
fix amd triton mla path (#17871)
This commit is contained in:
parent
9112155283
commit
eea22a56ab
@ -1063,7 +1063,7 @@ class MLACommonImpl(MLAAttentionImpl[T], Generic[T]):
|
||||
softmax_scale,
|
||||
None, # bias
|
||||
)
|
||||
if is_vllm_fa:
|
||||
elif is_vllm_fa:
|
||||
attn_out = self.flash_attn_varlen_func(
|
||||
q=q,
|
||||
k=k,
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user