mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-10 06:35:00 +08:00
[ROCm][AMD][Bugfix] adding a missing triton autotune config (#4845)
This commit is contained in:
parent
f09edd8a25
commit
b5853f9963
@ -239,6 +239,16 @@ def _attn_fwd_inner(
|
||||
num_stages=1,
|
||||
num_warps=8,
|
||||
),
|
||||
triton.Config(
|
||||
{
|
||||
"BLOCK_M": 128,
|
||||
"BLOCK_N": 64,
|
||||
"waves_per_eu": 1,
|
||||
"PRE_LOAD_V": False,
|
||||
},
|
||||
num_stages=1,
|
||||
num_warps=4,
|
||||
),
|
||||
triton.Config(
|
||||
{
|
||||
"BLOCK_M": 128,
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user