mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-20 19:57:02 +08:00
[XPU][Triton]add xpu config in triton_reshape_and_cache_flash (#25643)
Signed-off-by: Kunshang Ji <kunshang.ji@intel.com>
This commit is contained in:
parent
0bcc3a160d
commit
d2af67441d
@ -137,7 +137,7 @@ def triton_reshape_and_cache_flash(
|
|||||||
|
|
||||||
# heuristics instead of autotuning
|
# heuristics instead of autotuning
|
||||||
TILE_SIZE = min(2048, triton.next_power_of_2(n))
|
TILE_SIZE = min(2048, triton.next_power_of_2(n))
|
||||||
if torch.version.hip:
|
if torch.version.hip or torch.version.xpu:
|
||||||
num_stages = 4
|
num_stages = 4
|
||||||
num_warps = 8
|
num_warps = 8
|
||||||
else: # cuda
|
else: # cuda
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user