[XPU] Fix xpu model runner call torch.cuda APIs (#25011)
Signed-off-by: Kunshang Ji <kunshang.ji@intel.com>
This commit is contained in:
parent 43a62c51be
commit dd39baf717
@@ -45,8 +45,12 @@ def _torch_cuda_wrapper():
             self.synchronize = lambda: None
 
     try:
-        # replace cuda Event with xpu Event, this should work by default
+        # replace cuda APIs with xpu APIs, this should work by default
         torch.cuda.Event = torch.xpu.Event
+        torch.cuda.Stream = torch.xpu.Stream
+        torch.cuda.default_stream = torch.xpu.current_stream
+        torch.cuda.current_stream = torch.xpu.current_stream
+        torch.cuda.stream = torch.xpu.stream
         yield
     finally:
         # if anything goes wrong, just patch it with a placeholder
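For context, below is a minimal sketch of what the patched context manager could look like after this change. The names `_EventPlaceholder` and the exact body of the `finally` block are assumptions inferred from the context lines of the hunk (only `self.synchronize = lambda: None` and the placeholder comment are visible in the diff); the patched `torch.cuda.*` assignments themselves are taken directly from the change.

from contextlib import contextmanager

import torch


class _EventPlaceholder:
    # Hypothetical no-op stand-in, suggested by the context lines:
    # used if patching in the xpu APIs fails for any reason.

    def __init__(self, *args, **kwargs) -> None:
        self.record = lambda: None
        self.synchronize = lambda: None


@contextmanager
def _torch_cuda_wrapper():
    try:
        # Replace cuda APIs with xpu APIs so code written against
        # torch.cuda (events, streams) runs unmodified on XPU devices.
        torch.cuda.Event = torch.xpu.Event
        torch.cuda.Stream = torch.xpu.Stream
        torch.cuda.default_stream = torch.xpu.current_stream
        torch.cuda.current_stream = torch.xpu.current_stream
        torch.cuda.stream = torch.xpu.stream
        yield
    finally:
        # If anything goes wrong, fall back to a placeholder so callers
        # that only need Event.record()/synchronize() keep working.
        torch.cuda.Event = _EventPlaceholder

With the wrapper active (e.g. `with _torch_cuda_wrapper(): ...` around the model-runner code), calls into `torch.cuda.Event`, `torch.cuda.Stream`, and the stream query/selection helpers are transparently served by their `torch.xpu` equivalents, which is the point of this fix for the XPU model runner.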