mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-15 09:15:55 +08:00
[ROCm] Dockerfile fix for flash-attention build (#2885)
This commit is contained in:
parent
4f2ad11135
commit
5255d99dc5
@ -56,10 +56,10 @@ ENV LD_LIBRARY_PATH=$LD_LIBRARY_PATH:/opt/rocm/lib/:/libtorch/lib:
|
|||||||
ENV CPLUS_INCLUDE_PATH=$CPLUS_INCLUDE_PATH:/libtorch/include:/libtorch/include/torch/csrc/api/include/:/opt/rocm/include/:
|
ENV CPLUS_INCLUDE_PATH=$CPLUS_INCLUDE_PATH:/libtorch/include:/libtorch/include/torch/csrc/api/include/:/opt/rocm/include/:
|
||||||
|
|
||||||
# Install ROCm flash-attention
|
# Install ROCm flash-attention
|
||||||
RUN if [ "$BUILD_FA" == "1" ]; then \
|
RUN if [ "$BUILD_FA" = "1" ]; then \
|
||||||
mkdir libs \
|
mkdir libs \
|
||||||
&& cd libs \
|
&& cd libs \
|
||||||
&& git clone https://github.com/ROCmSoftwarePlatform/flash-attention.git \
|
&& git clone https://github.com/ROCm/flash-attention.git \
|
||||||
&& cd flash-attention \
|
&& cd flash-attention \
|
||||||
&& git checkout ${FA_BRANCH} \
|
&& git checkout ${FA_BRANCH} \
|
||||||
&& git submodule update --init \
|
&& git submodule update --init \
|
||||||
@ -83,7 +83,7 @@ RUN if [ "$BASE_IMAGE" = "rocm/pytorch:rocm6.0_ubuntu20.04_py3.9_pytorch_2.1.1"
|
|||||||
RUN cd /app \
|
RUN cd /app \
|
||||||
&& cd vllm \
|
&& cd vllm \
|
||||||
&& pip install -U -r requirements-rocm.txt \
|
&& pip install -U -r requirements-rocm.txt \
|
||||||
&& if [ "$BUILD_FA" == "1" ]; then \
|
&& if [ "$BUILD_FA" = "1" ]; then \
|
||||||
bash patch_xformers.rocm.sh; fi \
|
bash patch_xformers.rocm.sh; fi \
|
||||||
&& patch /opt/rocm/include/hip/amd_detail/amd_hip_bf16.h /app/vllm/rocm_patch/rocm_bf16.patch \
|
&& patch /opt/rocm/include/hip/amd_detail/amd_hip_bf16.h /app/vllm/rocm_patch/rocm_bf16.patch \
|
||||||
&& python3 setup.py install \
|
&& python3 setup.py install \
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user