diff --git a/vllm/compilation/pass_manager.py b/vllm/compilation/pass_manager.py index 58216a1f0ed3..11e03daced16 100644 --- a/vllm/compilation/pass_manager.py +++ b/vllm/compilation/pass_manager.py @@ -5,12 +5,15 @@ from torch import fx as fx from vllm.config import VllmConfig from vllm.logger import init_logger +from vllm.platforms import current_platform + +if current_platform.is_cuda_alike(): + from .fusion import FusionPass + from .collective_fusion import AllReduceFusionPass, AsyncTPPass + from .fusion_attn import AttnFusionPass from .activation_quant_fusion import ActivationQuantFusionPass -from .collective_fusion import AllReduceFusionPass, AsyncTPPass from .fix_functionalization import FixFunctionalizationPass -from .fusion import FusionPass -from .fusion_attn import AttnFusionPass from .inductor_pass import CustomGraphPass, InductorPass, get_pass_context from .noop_elimination import NoOpEliminationPass from .sequence_parallelism import SequenceParallelismPass