mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-03-16 15:57:15 +08:00
[XPU][Triton]add xpu config in triton_reshape_and_cache_flash (#25643)
Signed-off-by: Kunshang Ji <kunshang.ji@intel.com>
This commit is contained in:
parent
0bcc3a160d
commit
d2af67441d
@@ -137,7 +137,7 @@ def triton_reshape_and_cache_flash(
|
||||
|
||||
# heuristics instead of autotuning
|
||||
TILE_SIZE = min(2048, triton.next_power_of_2(n))
|
||||
- if torch.version.hip:
+ if torch.version.hip or torch.version.xpu:
|
||||
num_stages = 4
|
||||
num_warps = 8
|
||||
else: # cuda
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user