[XPU][Triton] Add XPU config in triton_reshape_and_cache_flash (#25643)

Signed-off-by: Kunshang Ji <kunshang.ji@intel.com>
2026-06-22 16:57:16 +08:00 · 2025-09-25 20:38:11 +08:00 · 2025-09-25 20:38:11 +08:00 · d2af67441d
commit d2af67441d
parent 0bcc3a160d
1 changed files with 1 additions and 1 deletions
--- a/vllm/attention/ops/triton_reshape_and_cache_flash.py
+++ b/vllm/attention/ops/triton_reshape_and_cache_flash.py
@@ -137,7 +137,7 @@ def triton_reshape_and_cache_flash(

    # heuristics instead of autotuning
    TILE_SIZE = min(2048, triton.next_power_of_2(n))
-    if torch.version.hip:
+    if torch.version.hip or torch.version.xpu:
        num_stages = 4
        num_warps = 8
    else:  # cuda