mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-10 00:06:06 +08:00
[Misc] Upgrade bitsandbytes to the latest version 0.45.0 (#11201)
This commit is contained in:
parent
886936837c
commit
15859f2357
@ -218,7 +218,7 @@ FROM vllm-base AS vllm-openai
|
|||||||
|
|
||||||
# install additional dependencies for openai api server
|
# install additional dependencies for openai api server
|
||||||
RUN --mount=type=cache,target=/root/.cache/pip \
|
RUN --mount=type=cache,target=/root/.cache/pip \
|
||||||
pip install accelerate hf_transfer 'modelscope!=1.15.0' 'bitsandbytes>=0.44.0' timm==0.9.10
|
pip install accelerate hf_transfer 'modelscope!=1.15.0' 'bitsandbytes>=0.45.0' timm==0.9.10
|
||||||
|
|
||||||
ENV VLLM_USAGE_SOURCE production-docker-image
|
ENV VLLM_USAGE_SOURCE production-docker-image
|
||||||
|
|
||||||
|
|||||||
@ -11,7 +11,7 @@ Below are the steps to utilize BitsAndBytes with vLLM.
|
|||||||
|
|
||||||
.. code-block:: console
|
.. code-block:: console
|
||||||
|
|
||||||
$ pip install bitsandbytes>=0.44.0
|
$ pip install "bitsandbytes>=0.45.0"
|
||||||
|
|
||||||
vLLM reads the model's config file and supports both in-flight quantization and pre-quantized checkpoint.
|
vLLM reads the model's config file and supports both in-flight quantization and pre-quantized checkpoint.
|
||||||
|
|
||||||
|
|||||||
@ -25,7 +25,7 @@ datamodel_code_generator # required for minicpm3 test
|
|||||||
lm-eval[api]==0.4.4 # required for model evaluation test
|
lm-eval[api]==0.4.4 # required for model evaluation test
|
||||||
|
|
||||||
# quantization
|
# quantization
|
||||||
bitsandbytes>=0.44.0
|
bitsandbytes>=0.45.0
|
||||||
buildkite-test-collector==0.1.9
|
buildkite-test-collector==0.1.9
|
||||||
|
|
||||||
numpy < 2.0.0
|
numpy < 2.0.0
|
||||||
|
|||||||
@ -37,7 +37,7 @@ audioread==3.0.1
|
|||||||
# via librosa
|
# via librosa
|
||||||
awscli==1.35.23
|
awscli==1.35.23
|
||||||
# via -r requirements-test.in
|
# via -r requirements-test.in
|
||||||
bitsandbytes==0.44.1
|
bitsandbytes>=0.45.0
|
||||||
# via -r requirements-test.in
|
# via -r requirements-test.in
|
||||||
black==24.10.0
|
black==24.10.0
|
||||||
# via datamodel-code-generator
|
# via datamodel-code-generator
|
||||||
|
|||||||
@ -145,12 +145,12 @@ class BitsAndBytesLinearMethod(LinearMethodBase):
|
|||||||
def __init__(self, quant_config: BitsAndBytesConfig):
|
def __init__(self, quant_config: BitsAndBytesConfig):
|
||||||
try:
|
try:
|
||||||
import bitsandbytes
|
import bitsandbytes
|
||||||
if bitsandbytes.__version__ < "0.44.0":
|
if bitsandbytes.__version__ < "0.45.0":
|
||||||
raise ImportError("bitsandbytes version is wrong. Please "
|
raise ImportError("bitsandbytes version is wrong. Please "
|
||||||
"install bitsandbytes>=0.44.0.")
|
"install bitsandbytes>=0.45.0.")
|
||||||
except ImportError as err:
|
except ImportError as err:
|
||||||
raise ImportError("Please install bitsandbytes>=0.44.0 via "
|
raise ImportError("Please install bitsandbytes>=0.45.0 via "
|
||||||
"`pip install bitsandbytes>=0.44.0` to use "
|
"`pip install bitsandbytes>=0.45.0` to use "
|
||||||
"bitsandbytes quantizer.") from err
|
"bitsandbytes quantizer.") from err
|
||||||
|
|
||||||
self.quant_config = quant_config
|
self.quant_config = quant_config
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user