Mirror of https://git.datalinker.icu/vllm-project/vllm.git (synced 2026-01-23 16:14:37 +08:00)
[Bugfix] Add missing VIT backend dispatch on CPU (#24623)
Signed-off-by: jiang1.li <jiang1.li@intel.com>
This commit is contained in:
parent f17a6aa4ec
commit 29799ddacc
@@ -399,7 +399,8 @@ class MultiHeadAttention(nn.Module):
|
||||
key,
|
||||
value,
|
||||
scale=self.scale)
|
||||
- elif self.attn_backend == _Backend.TORCH_SDPA:
|
||||
+ elif (self.attn_backend == _Backend.TORCH_SDPA
|
||||
+ or self.attn_backend == _Backend.TORCH_SDPA_VLLM_V1):
|
||||
query, key, value = (x.transpose(1, 2)
|
||||
for x in (query, key, value))
|
||||
out = F.scaled_dot_product_attention(query,
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user