diff --git a/vllm/model_executor/layers/quantization/bitsandbytes.py b/vllm/model_executor/layers/quantization/bitsandbytes.py index a96f3ee5c3015..5359189caa2a8 100644 --- a/vllm/model_executor/layers/quantization/bitsandbytes.py +++ b/vllm/model_executor/layers/quantization/bitsandbytes.py @@ -412,12 +412,12 @@ class BitsAndBytesMoEMethod(FusedMoEMethodBase): def __init__(self, quant_config: BitsAndBytesConfig): try: import bitsandbytes - if bitsandbytes.__version__ < "0.45.3": + if bitsandbytes.__version__ < "0.46.1": raise ImportError("bitsandbytes version is wrong. Please " - "install bitsandbytes>=0.45.3.") + "install bitsandbytes>=0.46.1.") except ImportError as err: - raise ImportError("Please install bitsandbytes>=0.45.3 via " - "`pip install bitsandbytes>=0.45.3` to use " + raise ImportError("Please install bitsandbytes>=0.46.1 via " + "`pip install bitsandbytes>=0.46.1` to use " "bitsandbytes quantizer.") from err self.topk_indices_dtype = None self.quant_config = quant_config