From 3be261cf3e4bfe3eee1650ca6d59e50d52d3d169 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Daniele=20Trifir=C3=B2?= Date: Tue, 21 May 2024 12:16:19 +0200 Subject: [PATCH] Dockerfile.ubi: remove leftover flash-attn references --- Dockerfile.ubi | 4 ---- 1 file changed, 4 deletions(-) diff --git a/Dockerfile.ubi b/Dockerfile.ubi index d4fbd52d1c8ce..16ad4e6018f39 100644 --- a/Dockerfile.ubi +++ b/Dockerfile.ubi @@ -240,10 +240,6 @@ RUN pip install \ mv /root/.config/vllm/nccl/cu12/libnccl.so.2.18.1 /opt/vllm/lib/ && \ chmod 0755 /opt/vllm/lib/libnccl.so.2.18.1 -# Install flash attention (from pre-built wheel) -RUN --mount=type=bind,from=flash-attn-builder,src=/usr/src/flash-attention-v2,target=/usr/src/flash-attention-v2 \ - pip install /usr/src/flash-attention-v2/*.whl --no-cache-dir - RUN --mount=type=cache,target=/root/.cache/pip \ pip install \ # additional dependencies for the TGIS gRPC server