From 6597d7a4566d344835f5a90621397d8fee490b10 Mon Sep 17 00:00:00 2001
From: wangxiyuan
Date: Fri, 29 Aug 2025 13:54:16 +0800
Subject: [PATCH] [Platform] import activation_quant_fusion for CUDA only (#23882)

Signed-off-by: wangxiyuan
---
 vllm/compilation/pass_manager.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/vllm/compilation/pass_manager.py b/vllm/compilation/pass_manager.py
index e07e52be9fdf6..1b1cbe4fa12c2 100644
--- a/vllm/compilation/pass_manager.py
+++ b/vllm/compilation/pass_manager.py
@@ -8,13 +8,13 @@ from vllm.logger import init_logger
 from vllm.platforms import current_platform
 
 if current_platform.is_cuda_alike():
+    from .activation_quant_fusion import ActivationQuantFusionPass
     from .fusion import FusionPass
     from .fusion_attn import AttnFusionPass
 
 if current_platform.is_cuda():
     from .collective_fusion import AllReduceFusionPass, AsyncTPPass
 
-from .activation_quant_fusion import ActivationQuantFusionPass
 from .fix_functionalization import FixFunctionalizationPass
 from .inductor_pass import CustomGraphPass, InductorPass, get_pass_context
 from .noop_elimination import NoOpEliminationPass