Skip to content

Commit c361e00

Browse files
committed
NGC pytorch 22.12
1 parent 4b53164 commit c361e00

File tree

1 file changed

+267
-0
lines changed

1 file changed

+267
-0
lines changed
Lines changed: 267 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,267 @@
1+
FROM nvcr.io/nvidia/pytorch:22.12-py3
2+
# NVIDIA NGC PyTorch with Python 3.8
3+
4+
ENV DEBIAN_FRONTEND=noninteractive \
5+
MPLBACKEND=Svg \
6+
PIP_IGNORE_INSTALLED=0 \
7+
PYTHONUNBUFFERED=1 \
8+
LD_LIBRARY_PATH="/usr/local/lib/python3.8/dist-packages/torch/lib:/usr/local/lib/python3.8/dist-packages/torch_tensorrt/lib:/usr/local/cuda/compat/lib:/usr/local/nvidia/lib:/usr/local/nvidia/lib64:/usr/local/cuda/extras/CUPTI/lib64:/usr/local/cuda-11.8/include:/usr/include/x86_64-linux-gnu" \
9+
PATH="/usr/local/nvm/versions/node/v16.15.1/bin:/usr/local/lib/python3.8/dist-packages/torch_tensorrt/bin:/usr/local/mpi/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/local/ucx/bin:/opt/tensorrt/bin:/usr/local/src/lightgbm/LightGBM:/usr/local/bin/mecab" \
10+
mecab_dicdir=/usr/local/lib/mecab/dic/mecab-ko-dic \
11+
CPLUS_INCLUDE_PATH=/usr/include/gdal \
12+
C_INCLUDE_PATH=/usr/include/gdal \
13+
LANG=C.UTF-8
14+
15+
RUN apt-get update && \
16+
apt-get install -y --no-install-recommends \
17+
automake \
18+
bzip2 \
19+
cabextract \
20+
ffmpeg \
21+
fonts-nanum \
22+
fonts-nanum-coding \
23+
fonts-nanum-extra \
24+
gfortran \
25+
htop \
26+
libasound2-dev \
27+
libatlas-base-dev \
28+
libavresample-dev \
29+
libdc1394-22-dev \
30+
libeigen3-dev \
31+
libfaac-dev \
32+
libgdal-dev \
33+
libgflags-dev \
34+
libgoogle-glog-dev \
35+
libgphoto2-dev \
36+
libgstreamer-plugins-base1.0-dev \
37+
libgstreamer1.0-dev \
38+
libgtk-3-dev \
39+
libhdf5-dev \
40+
libjemalloc-dev \
41+
libmp3lame-dev \
42+
libncurses-dev \
43+
libopenblas-dev \
44+
libopencore-amrnb-dev \
45+
libopencore-amrwb-dev \
46+
libprotobuf-dev \
47+
libtheora-dev \
48+
libvorbis-dev \
49+
libx264-dev \
50+
libxext6 \
51+
libxrender-dev \
52+
libxvidcore-dev \
53+
libsm6 \
54+
libtbb-dev \
55+
mercurial \
56+
ncurses-term \
57+
openjdk-8-jdk \
58+
pbzip2 \
59+
pv \
60+
pdsh \
61+
protobuf-compiler \
62+
v4l-utils \
63+
x264
64+
65+
# Install CUDA + cuDNN
66+
RUN ln -s /usr/lib/x86_64-linux-gnu/libcudnn.so.8.3.2 /usr/local/cuda/lib64/libcudnn.so && \
67+
rm -rf /var/lib/apt/lists/* && \
68+
ldconfig
69+
70+
# Install cmake
71+
RUN wget https://github.com/Kitware/CMake/releases/download/v3.25.1/cmake-3.25.1-Linux-x86_64.sh \
72+
-q -O /tmp/cmake-install.sh && \
73+
chmod u+x /tmp/cmake-install.sh && \
74+
mkdir /usr/bin/cmake && \
75+
/tmp/cmake-install.sh --skip-license --prefix=/usr/bin/cmake && \
76+
rm /tmp/cmake-install.sh
77+
78+
RUN update-alternatives --install /usr/bin/python python /usr/bin/python3 2
79+
80+
# install NLP packages *mecab-ko & khai*
81+
WORKDIR /tmp
82+
RUN curl -LO https://bitbucket.org/eunjeon/mecab-ko/downloads/mecab-0.996-ko-0.9.2.tar.gz && \
83+
tar zxfv mecab-0.996-ko-0.9.2.tar.gz && \
84+
cd mecab-0.996-ko-0.9.2 && \
85+
./configure && \
86+
make -j$(nproc) && \
87+
make check && \
88+
make install
89+
90+
RUN echo "Install mecab-ko-dic" && \
91+
cd /tmp && \
92+
ldconfig && \
93+
curl -LO https://bitbucket.org/eunjeon/mecab-ko-dic/downloads/mecab-ko-dic-2.1.1-20180720.tar.gz && \
94+
tar -zxvf mecab-ko-dic-2.1.1-20180720.tar.gz && \
95+
cd mecab-ko-dic-2.1.1-20180720 && \
96+
./autogen.sh && \
97+
./configure && \
98+
make -j$(nproc) && \
99+
sh -c 'echo "dicdir=/usr/local/lib/mecab/dic/mecab-ko-dic" > /usr/local/etc/mecabrc' && \
100+
make install && \
101+
cd /tmp && \
102+
git clone https://bitbucket.org/eunjeon/mecab-python-0.996.git && \
103+
python3 -m pip install /tmp/mecab-python-0.996
104+
105+
# OpenCV
106+
ENV OPENCV_VERSION="4.5.5"
107+
WORKDIR /tmp
108+
RUN wget https://github.com/opencv/opencv/archive/${OPENCV_VERSION}.zip && \
109+
wget -O opencv-contrib.zip https://github.com/opencv/opencv_contrib/archive/${OPENCV_VERSION}.zip && \
110+
unzip ${OPENCV_VERSION}.zip && \
111+
unzip opencv-contrib.zip && \
112+
mkdir opencv-${OPENCV_VERSION}/cmake_binary && \
113+
cd opencv-${OPENCV_VERSION}/cmake_binary && \
114+
cmake \
115+
-DCMAKE_BUILD_TYPE=RELEASE \
116+
-D BUILD_TIFF=ON \
117+
-D BUILD_opencv_java=OFF \
118+
-D WITH_CUDA=ON \
119+
-D CUDA_NVCC_FLAGS=--expt-relaxed-constexpr \
120+
-D CUDA_TOOLKIT_ROOT_DIR=/usr/local/cuda-11.8 \
121+
-D ENABLE_FAST_MATH=1 \
122+
-D CUDA_FAST_MATH=1 \
123+
-D WITH_CUBLAS=1 \
124+
-D WITH_OPENGL=ON \
125+
-D WITH_OPENCL=ON \
126+
-D WITH_IPP=ON \
127+
-D WITH_TBB=ON \
128+
-D WITH_EIGEN=ON \
129+
-D WITH_V4L=ON \
130+
-D BUILD_TESTS=OFF \
131+
-D BUILD_PERF_TESTS=OFF \
132+
-D OPENCV_EXTRA_MODULES_PATH="../../opencv_contrib-4.5.5/modules" \
133+
-D CMAKE_BUILD_TYPE=RELEASE \
134+
-D CMAKE_INSTALL_PREFIX=$(python3 -c "import sys; print(sys.prefix)") \
135+
-D PYTHON_EXECUTABLE=$(which python3) \
136+
-D PYTHON_INCLUDE_DIR=$(python3 -c "from distutils.sysconfig import get_python_inc; print(get_python_inc())") \
137+
-D PYTHON_PACKAGES_PATH=$(python3 -c "from distutils.sysconfig import get_python_lib; print(get_python_lib())") \
138+
.. 2>&1 | tee cmake_messages.txt && \
139+
make -j$(nproc) && \
140+
make install && \
141+
cd /tmp && \
142+
python3 -m pip install --no-cache-dir opencv-python && \
143+
rm -fr opencv*
144+
145+
WORKDIR /tmp
146+
RUN git clone -q --branch=v0.3.21 https://github.com/xianyi/OpenBLAS.git && \
147+
cd OpenBLAS && \
148+
make DYNAMIC_ARCH=1 NO_AFFINITY=1 NUM_THREADS=48 FC=gfortran && \
149+
make install && \
150+
cd /tmp && \
151+
git clone --recursive https://github.com/bodono/scs-python.git && \
152+
cd /tmp/scs-python && \
153+
python setup.py install --scs --gpu
154+
155+
# install git-lfs
156+
WORKDIR /tmp
157+
RUN curl -sLO https://github.com/git-lfs/git-lfs/releases/download/v3.3.0/git-lfs-linux-amd64-v3.3.0.tar.gz && \
158+
tar -zxf git-lfs-linux-amd64-v3.3.0.tar.gz && \
159+
cd git-lfs-3.3.0 && \
160+
bash install.sh && \
161+
rm -rf /tmp/*
162+
163+
WORKDIR /tmp
164+
RUN git clone https://github.com/aristocratos/bashtop.git && \
165+
cd bashtop && \
166+
make install
167+
168+
RUN curl -fL https://github.com/cdr/code-server/releases/download/v4.9.1/code-server-4.9.1-linux-amd64.tar.gz \
169+
| tar -C /usr/local/lib -xz && \
170+
mv /usr/local/lib/code-server-4.9.1-linux-amd64 /usr/local/lib/code-server-4.9.1 && \
171+
ln -s /usr/local/lib/code-server-4.9.1/bin/code-server /usr/local/bin/code-server
172+
173+
WORKDIR /tmp
174+
COPY ./requirements.22.09.1.txt /tmp/requirements.txt
175+
RUN /opt/conda/bin/python3 -m pip install --no-cache-dir -r requirements.txt
176+
COPY ./requirements.22.09.2.txt /tmp/requirements.txt
177+
RUN /opt/conda/bin/python3 -m pip install --no-cache-dir -r requirements.txt
178+
COPY ./requirements.22.09.3.txt /tmp/requirements.txt
179+
RUN /opt/conda/bin/python3 -m pip install --no-cache-dir -r requirements.txt
180+
COPY ./requirements.22.09.4.txt /tmp/requirements.txt
181+
RUN /opt/conda/bin/python3 -m pip install --no-cache-dir -r requirements.txt
182+
COPY ./requirements.22.09.5.txt /tmp/requirements.txt
183+
RUN /opt/conda/bin/python3 -m pip install --no-cache-dir -r requirements.txt && \
184+
rm -f /tmp/*.whl /tmp/requirem*
185+
186+
# Install Open MPI
187+
RUN mkdir /tmp/openmpi && \
188+
cd /tmp/openmpi && \
189+
wget https://download.open-mpi.org/release/open-mpi/v4.1/openmpi-4.1.4.tar.gz && \
190+
tar zxf openmpi-4.1.4.tar.gz && \
191+
cd openmpi-4.1.4 && \
192+
./configure --enable-orterun-prefix-by-default && \
193+
make -j $(nproc) all && \
194+
make install && \
195+
ldconfig && \
196+
rm -rf /tmp/openmpi* && \
197+
# Create a wrapper for OpenMPI to allow running as root by default
198+
mv /usr/local/bin/mpirun /usr/local/bin/mpirun.real && \
199+
echo '#!/bin/bash' > /usr/local/bin/mpirun && \
200+
echo 'mpirun.real --allow-run-as-root "$@"' >> /usr/local/bin/mpirun && \
201+
chmod a+x /usr/local/bin/mpirun && \
202+
# Configure OpenMPI to run good defaults:
203+
echo "btl_tcp_if_exclude = lo,docker0" >> /usr/local/etc/openmpi-mca-params.conf
204+
205+
# Install Horovod, temporarily using CUDA stubs
206+
RUN ldconfig /usr/local/cuda/targets/x86_64-linux/lib/stubs && \
207+
LD_LIBRARY_PATH="/usr/local/cuda/compat/lib:/usr/local/cuda/extras/CUPTI/lib64:/usr/local/cuda/lib:/usr/local/cuda/lib64:/usr/local/nvidia/lib64:/usr/local/cuda-11.8/include:/usr/include/x86_64-linux-gnu:/usr/include:$LD_LIBRARY_PATH" \
208+
HOROVOD_NCCL_LINK=SHARED \
209+
HOROVOD_WITH_MPI=1 \
210+
HOROVOD_GPU_ALLREDUCE=NCCL \
211+
NCCL_LIBRARY=/usr/include \
212+
HOROVOD_NCCL_INCLUDE=/usr/include \
213+
HOROVOD_NCCL_LIB=/lib/x86_64-linux-gnu \
214+
HOROVOD_GPU_BROADCAST=NCCL \
215+
HOROVOD_WITHOUT_TENSORFLOW=1 HOROVOD_WITH_PYTORCH=1 HOROVOD_WITHOUT_MXNET=1 \
216+
pip install --no-cache-dir horovod==0.24.2 && \
217+
ldconfig
218+
219+
RUN python3 -m pip install --no-cache-dir \
220+
mpi4py==3.1.3 \
221+
nni==2.9 \
222+
mlflow==1.29.0 \
223+
scikit-nni==0.2.1
224+
225+
RUN jupyter nbextensions_configurator enable && \
226+
jupyter contrib nbextension install && \
227+
jupyter nbextension enable --py --sys-prefix widgetsnbextension && \
228+
jupyter serverextension enable --py jupyterlab --sys-prefix && \
229+
jupyter labextension install --no-build @jupyter-widgets/jupyterlab-manager && \
230+
jupyter labextension install --no-build @krassowski/jupyterlab-lsp && \
231+
jupyter serverextension enable --py jupyter_lsp && \
232+
jupyter nbextension enable execute_time/ExecuteTime && \
233+
jupyter nbextension enable toc2/main && \
234+
jupyter lab build
235+
236+
RUN apt autoclean && \
237+
sed -i 's/source \/usr\/local\/nvm\/nvm.sh//' /etc/bash.bashrc && \
238+
ln -sf /usr/share/terminfo/x/xterm-color /usr/share/terminfo/x/xterm-256color && \
239+
rm -rf /var/lib/apt/lists/* && \
240+
rm -rf /root/.cache && \
241+
rm -rf /tmp/*
242+
243+
RUN /opt/conda/bin/python3 -m ipykernel install \
244+
--prefix=/opt/conda/ \
245+
--display-name "PyTorch 1.13 (NGC 22.09/Python 3.8 Conda) on Backend.AI" && \
246+
cat /opt/conda/share/jupyter/kernels/python3/kernel.json
247+
ENV JUPYTER_PATH="/opt/conda/share/jupyter"
248+
249+
# Backend.AI specifics
250+
COPY ./service-defs /etc/backend.ai/service-defs
251+
COPY ./runner-scripts/bootstrap.sh runner-scripts/setup_multinode.py /opt/container/
252+
253+
LABEL ai.backend.kernelspec="1" \
254+
ai.backend.envs.corecount="OPENBLAS_NUM_THREADS,OMP_NUM_THREADS,NPROC" \
255+
ai.backend.features="batch query uid-match user-input" \
256+
ai.backend.base-distro="ubuntu16.04" \
257+
ai.backend.accelerators="cuda" \
258+
ai.backend.resource.min.cpu="1" \
259+
ai.backend.resource.min.mem="1g" \
260+
ai.backend.resource.min.cuda.device=1 \
261+
ai.backend.resource.min.cuda.shares=0 \
262+
ai.backend.base-distro="ubuntu22.04" \
263+
ai.backend.runtime-type="python" \
264+
ai.backend.runtime-path="/opt/conda/bin/python3" \
265+
ai.backend.service-ports="ipython:pty:3000,jupyter:http:8091,jupyterlab:http:8090,vscode:http:8180,tensorboard:http:6006,mlflow-ui:preopen:5000,nniboard:preopen:8080"
266+
267+
WORKDIR /home/work

0 commit comments

Comments
 (0)