-
Notifications
You must be signed in to change notification settings - Fork 191
/
Dockerfile
39 lines (31 loc) · 1.39 KB
/
Dockerfile
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
# The data-juicer image includes all open-source contents of data-juicer,
# and it will be installed in editable mode.
# Base image: NVIDIA CUDA 12.4.1 with cuDNN, "devel" variant, on Ubuntu 22.04.
FROM nvidia/cuda:12.4.1-cudnn-devel-ubuntu22.04
# Install Python 3.10 together with basic tooling (git, curl, vim, wget, pip)
# and the libGL / GLib shared libraries, then make python3.10 the interpreter
# behind both `python3` and `python`.
# - DEBIAN_FRONTEND is set inline so package configuration never waits for
#   input during the build, without leaking the variable into the runtime env.
# - The apt lists are removed in this same layer so they do not bloat the image.
# - pip is upgraded with --no-cache-dir so its download cache is not stored in
#   the layer.
RUN apt-get update \
    && DEBIAN_FRONTEND=noninteractive apt-get install -y \
        git curl vim wget python3.10 libpython3.10-dev python3-pip \
        libgl1-mesa-glx libglib2.0-0 \
    && ln -sf /usr/bin/python3.10 /usr/bin/python3 \
    && ln -sf /usr/bin/python3.10 /usr/bin/python \
    && apt-get autoclean \
    && rm -rf /var/lib/apt/lists/* \
    && pip install --no-cache-dir --upgrade pip
# Install 3rd-party system dependencies: ffmpeg, the X11 client libraries
# libsm6/libxext6, a native build toolchain (build-essential, cmake, gfortran)
# and the OpenBLAS/LAPACK development packages.
# `apt-get update` and `install` stay in one layer so the package index is
# never stale, and the index is deleted again in the same layer so it does not
# end up in the image. DEBIAN_FRONTEND is set inline to keep the install from
# waiting on configuration prompts.
RUN apt-get update \
    && DEBIAN_FRONTEND=noninteractive apt-get install -y \
        build-essential \
        cmake \
        ffmpeg \
        gfortran \
        liblapack-dev \
        libopenblas-dev \
        libsm6 \
        libxext6 \
        software-properties-common \
    && rm -rf /var/lib/apt/lists/*
# Java environment: everything below is unpacked under /opt.
WORKDIR /opt
# Fetch the Microsoft JDK 17.0.9 (linux-x64) tarball, extract it, drop the
# archive in the same layer, and rename the extracted directory to /opt/jdk.
RUN wget --output-document=jdk.tar.gz \
        https://aka.ms/download-jdk/microsoft-jdk-17.0.9-linux-x64.tar.gz \
    && tar --extract --gzip --file=jdk.tar.gz \
    && rm -rf jdk.tar.gz \
    && mv jdk-17.0.9+8 jdk
# Point JAVA_HOME at the renamed JDK directory.
ENV JAVA_HOME=/opt/jdk
# All remaining steps run from the project directory.
WORKDIR /data-juicer
# Install the requirements that have to be installed from source.
# setuptools is pinned to 69.5.1 (setuptools_scm is left unpinned) before
# recognize-anything is installed straight from its git repository.
# --no-cache-dir keeps pip's download cache out of the image layer; the long
# timeout tolerates slow network connections.
# NOTE(review): the git dependency is not pinned to a commit or tag, so
# rebuilds may pick up a different revision -- consider pinning.
RUN pip install --no-cache-dir --upgrade setuptools==69.5.1 setuptools_scm \
    && pip install --no-cache-dir --default-timeout 1000 \
        git+https://github.com/xinyu1205/recognize-anything.git
# Install data-juicer itself: copy the build context into the working
# directory and install it in editable mode, first with the `all` extra and
# then with the `sandbox` extra.
# The requirement specifiers are quoted because an unquoted `.[all]` is a
# shell bracket glob: a file such as `.a` in the copied context would make the
# shell replace the argument before pip ever sees it.
# --no-cache-dir keeps pip's download cache out of the image layers.
COPY . .
RUN pip install --no-cache-dir -v -e ".[all]" --default-timeout 1000
RUN pip install --no-cache-dir -v -e ".[sandbox]" --default-timeout 1000