From d9f9a3fd96b8461680495dee8f004037eef61d04 Mon Sep 17 00:00:00 2001
From: Chaojun Zhang
Date: Thu, 24 Jul 2025 23:23:36 +0800
Subject: [PATCH] [XPU] Conditionally import CUDA-specific passes to avoid import errors on xpu platform (#21036)

Signed-off-by: chzhang
---
 vllm/compilation/pass_manager.py | 9 ++++++---
 1 file changed, 6 insertions(+), 3 deletions(-)

diff --git a/vllm/compilation/pass_manager.py b/vllm/compilation/pass_manager.py
index 58216a1f0ed3..11e03daced16 100644
--- a/vllm/compilation/pass_manager.py
+++ b/vllm/compilation/pass_manager.py
@@ -5,12 +5,15 @@ from torch import fx as fx
 
 from vllm.config import VllmConfig
 from vllm.logger import init_logger
+from vllm.platforms import current_platform
+
+if current_platform.is_cuda_alike():
+    from .fusion import FusionPass
+    from .collective_fusion import AllReduceFusionPass, AsyncTPPass
+    from .fusion_attn import AttnFusionPass
 
 from .activation_quant_fusion import ActivationQuantFusionPass
-from .collective_fusion import AllReduceFusionPass, AsyncTPPass
 from .fix_functionalization import FixFunctionalizationPass
-from .fusion import FusionPass
-from .fusion_attn import AttnFusionPass
 from .inductor_pass import CustomGraphPass, InductorPass, get_pass_context
 from .noop_elimination import NoOpEliminationPass
 from .sequence_parallelism import SequenceParallelismPass