# Patch summary: bump FlashInfer to 0.6.0rc1 across three files.
#
#   docker/Dockerfile
#     - ARG FLASHINFER_VERSION: 0.5.3 -> 0.6.0rc1.
#     - The flashinfer-cubin install gains
#       `--extra-index-url https://flashinfer.ai/whl`; the flashinfer-jit-cache
#       install keeps its existing CUDA-specific `/whl/cu<major><minor>` index.
#   docker/Dockerfile.nightly_torch
#     - The source build moves from "full clone + `git checkout v0.5.2`" to a
#       shallow clone of the tag:
#       `git clone --depth 1 --branch v0.6.0rc1 --recursive ...`.
#     - The "release version" comment is updated to v0.6.0rc1.
#   requirements/cuda.txt
#     - flashinfer-python pin: 0.5.3 -> 0.6.0rc1.
#
# NOTE(review): the patch text below has its line breaks collapsed, so the hunk
#   line counts in the `@@` headers cannot be checked against the body from
#   here. Regenerate the patch from the commit before applying it.
# NOTE(review): in Dockerfile.nightly_torch the tag v0.6.0rc1 is hard-coded in
#   both the comment and the clone command, while docker/Dockerfile uses
#   ARG FLASHINFER_VERSION. Keep the two in sync on the next bump.
# NOTE(review): `git submodule update --init --recursive` is kept after a
#   `--recursive` clone; presumably redundant now that the checkout step is
#   gone. Confirm before removing.
diff --git a/docker/Dockerfile b/docker/Dockerfile index e61021b6eeb85..b76c51cadce85 100644 --- a/docker/Dockerfile +++ b/docker/Dockerfile @@ -466,9 +466,10 @@ RUN --mount=type=cache,target=/root/.cache/uv \ # Install FlashInfer pre-compiled kernel cache and binaries # This is ~1.1GB and only changes when FlashInfer version bumps # https://docs.flashinfer.ai/installation.html -ARG FLASHINFER_VERSION=0.5.3 +ARG FLASHINFER_VERSION=0.6.0rc1 RUN --mount=type=cache,target=/root/.cache/uv \ uv pip install --system flashinfer-cubin==${FLASHINFER_VERSION} \ + --extra-index-url https://flashinfer.ai/whl \ && uv pip install --system flashinfer-jit-cache==${FLASHINFER_VERSION} \ --extra-index-url https://flashinfer.ai/whl/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') \ && flashinfer show-config diff --git a/docker/Dockerfile.nightly_torch b/docker/Dockerfile.nightly_torch index d663c82c3885e..c5a0b8fd365ac 100644 --- a/docker/Dockerfile.nightly_torch +++ b/docker/Dockerfile.nightly_torch @@ -213,15 +213,14 @@ RUN pip install setuptools==75.6.0 packaging==23.2 ninja==1.11.1.3 build==1.2.2. # build flashinfer for torch nightly from source around 10 mins -# release version: v0.5.2 +# release version: v0.6.0rc1 # todo(elainewy): cache flashinfer build result for faster build ENV CCACHE_DIR=/root/.cache/ccache RUN --mount=type=cache,target=/root/.cache/ccache \ --mount=type=cache,target=/root/.cache/uv \ echo "git clone flashinfer..." \ - && git clone --recursive https://github.com/flashinfer-ai/flashinfer.git \ + && git clone --depth 1 --branch v0.6.0rc1 --recursive https://github.com/flashinfer-ai/flashinfer.git \ && cd flashinfer \ - && git checkout v0.5.2 \ && git submodule update --init --recursive \ && echo "finish git clone flashinfer..." 
\ && rm -rf build \ diff --git a/requirements/cuda.txt b/requirements/cuda.txt index 1417fb99120bc..11a34df677fd5 100644 --- a/requirements/cuda.txt +++ b/requirements/cuda.txt @@ -10,4 +10,4 @@ torchaudio==2.9.1 # These must be updated alongside torch torchvision==0.24.1 # Required for phi3v processor. See https://github.com/pytorch/vision?tab=readme-ov-file#installation for corresponding version # FlashInfer should be updated together with the Dockerfile -flashinfer-python==0.5.3 +flashinfer-python==0.6.0rc1