From 9f376e4c986fa30d37f8b50ec1f8c84350bcea3f Mon Sep 17 00:00:00 2001 From: dhuangnm Date: Mon, 1 Jul 2024 13:45:34 -0400 Subject: [PATCH] remove flash-attn related --- Dockerfile | 20 ++++++++++---------- 1 file changed, 10 insertions(+), 10 deletions(-) diff --git a/Dockerfile b/Dockerfile index 60fe17c4f08d9..4eb26239f2f97 100644 --- a/Dockerfile +++ b/Dockerfile @@ -63,16 +63,16 @@ RUN apt-get update -y && apt-get install -y ccache #################### EXTENSION Build IMAGE #################### #################### FLASH_ATTENTION Build IMAGE #################### -FROM dev as flash-attn-builder -# flash attention version -ARG flash_attn_version=v2.5.8 -ENV FLASH_ATTN_VERSION=${flash_attn_version} +#FROM dev as flash-attn-builder +## flash attention version +#ARG flash_attn_version=v2.5.8 +#ENV FLASH_ATTN_VERSION=${flash_attn_version} -WORKDIR /usr/src/flash-attention-v2 +#WORKDIR /usr/src/flash-attention-v2 # Download the wheel or build it if a pre-compiled release doesn't exist -RUN pip --verbose wheel flash-attn==${FLASH_ATTN_VERSION} \ - --no-build-isolation --no-deps --no-cache-dir +#RUN pip --verbose wheel flash-attn==${FLASH_ATTN_VERSION} \ +# --no-build-isolation --no-deps --no-cache-dir #################### FLASH_ATTENTION Build IMAGE #################### @@ -114,9 +114,9 @@ RUN --mount=type=bind,from=build \ fi; \ fi -RUN --mount=type=bind,from=flash-attn-builder,src=/usr/src/flash-attention-v2,target=/usr/src/flash-attention-v2 \ - --mount=type=cache,target=/root/.cache/pip \ - pip install /usr/src/flash-attention-v2/*.whl --no-cache-dir +#RUN --mount=type=bind,from=flash-attn-builder,src=/usr/src/flash-attention-v2,target=/usr/src/flash-attention-v2 \ +# --mount=type=cache,target=/root/.cache/pip \ +# pip install /usr/src/flash-attention-v2/*.whl --no-cache-dir #################### vLLM installation IMAGE #################### #################### TEST IMAGE ####################