From d3fc0729f78dc982ab7006ceabd2e36c935cb193 Mon Sep 17 00:00:00 2001 From: vllmellm Date: Wed, 24 Dec 2025 21:54:58 +0000 Subject: [PATCH] format Signed-off-by: vllmellm --- tests/compile/test_fusion.py | 4 +--- .../layers/quantization/kernels/scaled_mm/__init__.py | 2 +- .../layers/quantization/kernels/scaled_mm/aiter.py | 2 +- 3 files changed, 3 insertions(+), 5 deletions(-) diff --git a/tests/compile/test_fusion.py b/tests/compile/test_fusion.py index b8ef7822208e8..ac92fb13fdc09 100644 --- a/tests/compile/test_fusion.py +++ b/tests/compile/test_fusion.py @@ -46,13 +46,11 @@ from vllm.model_executor.layers.quantization.utils.quant_utils import ( from vllm.model_executor.layers.quantization.utils.w8a8_utils import ( cutlass_block_fp8_supported, ) - +from vllm.platforms import current_platform from vllm.utils.deep_gemm import ( is_deep_gemm_supported, ) -from vllm.platforms import current_platform - from ..utils import TestBlockFP8Layer, TestFP8Layer from .backend import TestBackend diff --git a/vllm/model_executor/layers/quantization/kernels/scaled_mm/__init__.py b/vllm/model_executor/layers/quantization/kernels/scaled_mm/__init__.py index 1ce422c63a7a6..24d85b93db2b1 100644 --- a/vllm/model_executor/layers/quantization/kernels/scaled_mm/__init__.py +++ b/vllm/model_executor/layers/quantization/kernels/scaled_mm/__init__.py @@ -96,7 +96,7 @@ def is_supported_and_can_implement_kernel( _cc = current_platform.get_device_capability() if _cc is not None: compute_capability = _cc[0] * 10 + _cc[1] - + # If the current platform uses compute_capability, # make sure the kernel supports the compute cability. if compute_capability is not None: diff --git a/vllm/model_executor/layers/quantization/kernels/scaled_mm/aiter.py b/vllm/model_executor/layers/quantization/kernels/scaled_mm/aiter.py index 5cd6f9f820b66..e3f94eaa7e847 100644 --- a/vllm/model_executor/layers/quantization/kernels/scaled_mm/aiter.py +++ b/vllm/model_executor/layers/quantization/kernels/scaled_mm/aiter.py @@ -42,7 +42,7 @@ class AiterScaledMMLinearKernel(CutlassScaledMMLinearKernel): + "and `VLLM_ROCM_USE_AITER_LINEAR=1`. " + "`VLLM_ROCM_USE_AITER_LINEAR` default is True.", ) - + if not c.input_symmetric: return ( False,