diff --git a/vllm/model_executor/layers/quantization/gptq_bitblas.py b/vllm/model_executor/layers/quantization/gptq_bitblas.py index 6ee3a2f1bbbb0..b06c9579d63db 100644 --- a/vllm/model_executor/layers/quantization/gptq_bitblas.py +++ b/vllm/model_executor/layers/quantization/gptq_bitblas.py @@ -134,7 +134,7 @@ class GPTQBitBLASConfig(QuantizationConfig): @classmethod def get_min_capability(cls) -> int: - return 70 + return 80 @classmethod def get_config_filenames(cls) -> List[str]: