mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-03-26 11:35:53 +08:00
Minor
This commit is contained in:
parent
e4377dd698
commit
0fb07c08d0
@ -24,5 +24,5 @@ def flash_attn(
|
||||
min(_DEFAULT_BLOCK_SIZES["block_q"], q.shape[1]),
|
||||
min(_DEFAULT_BLOCK_SIZES["block_k_major"], k.shape[1]),
|
||||
min(_DEFAULT_BLOCK_SIZES["block_k"], k.shape[1]),
|
||||
min(_DEFAULT_BLOCK_SIZES["block_b"], q.shape[0]))
|
||||
min(_DEFAULT_BLOCK_SIZES["block_b"], q.shape[0])),
|
||||
).transpose(0, 2, 1, 3)
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user