mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-10 14:15:55 +08:00
Build some nightly wheels by default (#6380)
This commit is contained in:
parent
aa48e502fb
commit
d719ba24c5
@ -1,5 +1,24 @@
|
|||||||
steps:
|
steps:
|
||||||
- block: "Build wheels"
|
- label: "Build wheel default - Python {{matrix.python_version}}, CUDA {{matrix.cuda_version}}"
|
||||||
|
agents:
|
||||||
|
queue: cpu_queue
|
||||||
|
commands:
|
||||||
|
- "DOCKER_BUILDKIT=1 docker build --build-arg max_jobs=16 --build-arg USE_SCCACHE=1 --build-arg CUDA_VERSION={{matrix.cuda_version}} --build-arg PYTHON_VERSION={{matrix.python_version}} --build-arg CMAKE_BUILD_TYPE=Release --tag vllm-ci:build-image --target build --progress plain ."
|
||||||
|
- "mkdir artifacts"
|
||||||
|
- "docker run --rm -v $(pwd)/artifacts:/artifacts_host vllm-ci:build-image cp -r dist /artifacts_host"
|
||||||
|
# rename the files to change linux -> manylinux1
|
||||||
|
- "for f in artifacts/dist/*.whl; do mv -- \"$f\" \"${f/linux/manylinux1}\"; done"
|
||||||
|
- "aws s3 cp --recursive --acl public-read artifacts/dist s3://vllm-wheels/$BUILDKITE_COMMIT/"
|
||||||
|
- "aws s3 cp --recursive --acl public-read artifacts/dist s3://vllm-wheels/nightly/"
|
||||||
|
matrix:
|
||||||
|
setup:
|
||||||
|
cuda_version:
|
||||||
|
- "12.1.0"
|
||||||
|
python_version:
|
||||||
|
- "3.10"
|
||||||
|
- "3.11"
|
||||||
|
|
||||||
|
- block: "Build wheels full"
|
||||||
|
|
||||||
- label: "Build wheel - Python {{matrix.python_version}}, CUDA {{matrix.cuda_version}}"
|
- label: "Build wheel - Python {{matrix.python_version}}, CUDA {{matrix.cuda_version}}"
|
||||||
agents:
|
agents:
|
||||||
@ -8,7 +27,9 @@ steps:
|
|||||||
- "DOCKER_BUILDKIT=1 docker build --build-arg max_jobs=16 --build-arg USE_SCCACHE=1 --build-arg CUDA_VERSION={{matrix.cuda_version}} --build-arg PYTHON_VERSION={{matrix.python_version}} --tag vllm-ci:build-image --target build --progress plain ."
|
- "DOCKER_BUILDKIT=1 docker build --build-arg max_jobs=16 --build-arg USE_SCCACHE=1 --build-arg CUDA_VERSION={{matrix.cuda_version}} --build-arg PYTHON_VERSION={{matrix.python_version}} --tag vllm-ci:build-image --target build --progress plain ."
|
||||||
- "mkdir artifacts"
|
- "mkdir artifacts"
|
||||||
- "docker run --rm -v $(pwd)/artifacts:/artifacts_host vllm-ci:build-image cp -r dist /artifacts_host"
|
- "docker run --rm -v $(pwd)/artifacts:/artifacts_host vllm-ci:build-image cp -r dist /artifacts_host"
|
||||||
- "aws s3 cp --recursive artifacts/dist s3://vllm-wheels/$BUILDKITE_COMMIT/"
|
- "for f in artifacts/dist/*.whl; do mv -- \"$f\" \"${f/linux/manylinux1}\"; done"
|
||||||
|
- "aws s3 cp --recursive --acl public-read artifacts/dist s3://vllm-wheels/$BUILDKITE_COMMIT/"
|
||||||
|
- "aws s3 cp --recursive --acl public-read artifacts/dist s3://vllm-wheels/nightly/"
|
||||||
matrix:
|
matrix:
|
||||||
setup:
|
setup:
|
||||||
cuda_version:
|
cuda_version:
|
||||||
@ -19,3 +40,12 @@ steps:
|
|||||||
- "3.9"
|
- "3.9"
|
||||||
- "3.10"
|
- "3.10"
|
||||||
- "3.11"
|
- "3.11"
|
||||||
|
adjustments:
|
||||||
|
- with:
|
||||||
|
cuda_version: "12.1.0"
|
||||||
|
python_version: "3.10"
|
||||||
|
skip: true
|
||||||
|
- with:
|
||||||
|
cuda_version: "12.1.0"
|
||||||
|
python_version: "3.11"
|
||||||
|
skip: true
|
||||||
|
|||||||
@ -42,6 +42,20 @@ You can install vLLM using pip:
|
|||||||
|
|
||||||
Therefore, it is recommended to install vLLM with a **fresh new** conda environment. If either you have a different CUDA version or you want to use an existing PyTorch installation, you need to build vLLM from source. See below for instructions.
|
Therefore, it is recommended to install vLLM with a **fresh new** conda environment. If either you have a different CUDA version or you want to use an existing PyTorch installation, you need to build vLLM from source. See below for instructions.
|
||||||
|
|
||||||
|
.. note::
|
||||||
|
|
||||||
|
vLLM also publishes a subset of wheels (Python 3.10, 3.11 with CUDA 12) for every commit since v0.5.3. You can download them with the following command:
|
||||||
|
|
||||||
|
.. code-block:: console
|
||||||
|
|
||||||
|
$ export VLLM_VERSION=0.5.2 # vLLM's main branch version is currently set to latest released tag
|
||||||
|
$ export PYTHON_VERSION=310
|
||||||
|
$ pip install https://vllm-wheels.s3.us-west-2.amazonaws.com/nightly/vllm-${VLLM_VERSION}-cp${PYTHON_VERSION}-cp${PYTHON_VERSION}-manylinux1_x86_64.whl
|
||||||
|
$ # You can also access a specific commit
|
||||||
|
$ # export VLLM_COMMIT=...
|
||||||
|
$ # pip install https://vllm-wheels.s3.us-west-2.amazonaws.com/${VLLM_COMMIT}/vllm-${VLLM_VERSION}-cp${PYTHON_VERSION}-cp${PYTHON_VERSION}-manylinux1_x86_64.whl
|
||||||
|
|
||||||
|
|
||||||
.. _build_from_source:
|
.. _build_from_source:
|
||||||
|
|
||||||
Build from source
|
Build from source
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user