diff --git a/vllm/model_executor/layers/quantization/qutlass_utils.py b/vllm/model_executor/layers/quantization/qutlass_utils.py index 395bde76d02ae..555bb50da199e 100644 --- a/vllm/model_executor/layers/quantization/qutlass_utils.py +++ b/vllm/model_executor/layers/quantization/qutlass_utils.py @@ -14,10 +14,10 @@ from typing import Literal import torch -import triton -import triton.language as tl from torch.library import wrap_triton +from vllm.triton_utils import tl, triton + @triton.jit def triton_scale_swizzle(