Skip to content

Commit

Permalink
install numactl to enable fastsafetensors and adapter for 0.6.5
Browse files Browse the repository at this point in the history
Signed-off-by: Jefferson Fialho <[email protected]>
  • Loading branch information
fialhocoelho committed Dec 18, 2024
1 parent 24c996d commit 6db125b
Showing 1 changed file with 20 additions and 1 deletion.
21 changes: 20 additions & 1 deletion Dockerfile.ubi
Original file line number Diff line number Diff line change
Expand Up @@ -50,6 +50,20 @@ ENV CUDA_HOME="/usr/local/cuda" \
PATH="${CUDA_HOME}/bin:${PATH}" \
LD_LIBRARY_PATH="${CUDA_HOME}/lib64:${CUDA_HOME}/extras/CUPTI/lib64:${LD_LIBRARY_PATH}"

# Install the toolchain needed to rebuild numactl from its source RPM.
# The package-manager cache is removed in the same layer so it is not baked
# into the image.
RUN microdnf install -y \
        autoconf \
        automake \
        libtool \
        make \
        rpm-build \
    && microdnf clean all

# Download the numactl source RPM into /root (microdnf writes to the current
# working directory, hence the WORKDIR switch).
WORKDIR /root
RUN microdnf download --enablerepo=ubi-9-baseos-source --source numactl.src \
    && microdnf clean all

# Rebuild numactl from the source RPM and install the resulting binary RPMs.
#
# NUMACTL_V is the "<version>-<release>" part of the downloaded file name
# (numactl-<NUMACTL_V>.el9.src.rpm). `sed -n ... p` prints only when the name
# matches that pattern, so an unexpected file name yields an empty value and
# the build stops with an explicit error instead of a confusing rpm failure.
#
# NOTE: the output directory is hard-coded to x86_64; the vllm-grpc-adapter
# stage bind-mounts /root/rpmbuild/RPMS/x86_64 from this stage, so the path
# must stay in sync with that mount.
RUN set -eu; \
    NUMACTL_V=$(ls /root/numactl-* | sed -rn 's|^/root/numactl-(.+)\.el9\.src\.rpm$|\1|p'); \
    if [ -z "${NUMACTL_V}" ]; then \
        echo "ERROR: could not derive the numactl version from /root/numactl-*.el9.src.rpm" >&2; \
        exit 1; \
    fi; \
    echo "########################################### NUMACTL_V is set to $NUMACTL_V"; \
    rpm -i "/root/numactl-${NUMACTL_V}.el9.src.rpm"; \
    rpmbuild -ba /root/rpmbuild/SPECS/numactl.spec; \
    rpm -i \
        "/root/rpmbuild/RPMS/x86_64/numactl-libs-${NUMACTL_V}.el9.x86_64.rpm" \
        "/root/rpmbuild/RPMS/x86_64/numactl-${NUMACTL_V}.el9.x86_64.rpm" \
        "/root/rpmbuild/RPMS/x86_64/numactl-devel-${NUMACTL_V}.el9.x86_64.rpm"

## Python cuda base #################################################################
FROM cuda-base AS python-cuda-base

Expand Down Expand Up @@ -206,10 +220,15 @@ FROM vllm-openai as vllm-grpc-adapter

USER root

# Install the numactl-libs RPM taken from the cuda-base stage's rpmbuild
# output directory. The directory is bind-mounted at /tmp/rpm/ for this step
# only; --nodeps tells rpm to skip its dependency check.
RUN --mount=type=bind,from=cuda-base,source=/root/rpmbuild/RPMS/x86_64,target=/tmp/rpm/ \
    rpm --install --nodeps /tmp/rpm/numactl-libs-*.el9.x86_64.rpm

# Install the wheel found in /workspace/dist (bind-mounted from the `build`
# stage) together with its `tensorizer` extra, using `uv pip install` with
# HOME set to /root. The pip and uv cache directories are cache mounts.
# NOTE(review): the two `uv pip install` lines below look like the removed and
# added sides of a diff hunk (the first also pins vllm-tgis-adapter==0.5.3);
# presumably only the second one exists in the real Dockerfile — confirm.
RUN --mount=type=cache,target=/root/.cache/pip \
--mount=type=cache,target=/root/.cache/uv \
--mount=type=bind,from=build,src=/workspace/dist,target=/workspace/dist \
HOME=/root uv pip install "$(echo /workspace/dist/*.whl)[tensorizer]" vllm-tgis-adapter==0.5.3
HOME=/root uv pip install "$(echo /workspace/dist/*.whl)[tensorizer]"

# Install vllm-tgis-adapter straight from the `vllm0p6p5` ref of the
# opendatahub-io repository.
# --no-cache-dir: this step has no cache mount, so without the flag pip's
# download/build cache would be stored in the image layer.
# NOTE(review): `vllm0p6p5` looks like a branch name, which can move between
# builds — consider pinning to a tag or commit SHA for reproducibility.
RUN pip install --no-cache-dir "git+https://github.com/opendatahub-io/vllm-tgis-adapter.git@vllm0p6p5"

ENV GRPC_PORT=8033 \
PORT=8000 \
Expand Down

0 comments on commit 6db125b

Please sign in to comment.