forked from thoth-station/tensorflow-build-s2i
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathDockerfile.ubi7gpu
306 lines (265 loc) · 13.2 KB
/
Dockerfile.ubi7gpu
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
FROM submod/s2i-core-ubi7:latest
MAINTAINER Subin Modeel <smodeel@redhat.com>
USER root
ENV BUILDER_VERSION 1.0
LABEL io.k8s.description="S2I builder for Tensorflow binaries." \
io.k8s.display-name="Tensorflow BUILD" \
io.openshift.expose-services="8080:http" \
io.openshift.tags="builder,python,tf-build" \
io.openshift.s2i.scripts-url="image:///usr/libexec/s2i"
ARG CUDA_VERSION=10.1.105
ENV CUDA_VERSION=$CUDA_VERSION
ARG CUDNN_VERSION=7.5.0.56
ENV CUDNN_VERSION=$CUDNN_VERSION
############################################
## taken from base
## https://hub.docker.com/r/nvidia/cuda/
############################################
RUN NVIDIA_GPGKEY_SUM=d1be581509378368edeec8c1eb2958702feedf3bc3d17011adbf24efacce4ab5 && \
curl -fsSL https://developer.download.nvidia.com/compute/cuda/repos/rhel7/x86_64/7fa2af80.pub | sed '/^Version/d' > /etc/pki/rpm-gpg/RPM-GPG-KEY-NVIDIA && \
echo "$NVIDIA_GPGKEY_SUM /etc/pki/rpm-gpg/RPM-GPG-KEY-NVIDIA" | sha256sum -c --strict -
COPY cuda.repo /etc/yum.repos.d/cuda.repo
ENV CUDA_PKG_VERSION 10-1-$CUDA_VERSION-1
# For libraries in the cuda-compat-* package: https://docs.nvidia.com/cuda/eula/index.html#attachment-a
RUN yum install -y \
cuda-cudart-$CUDA_PKG_VERSION \
cuda-compat-10-1-418.39 && \
ln -s cuda-10.1 /usr/local/cuda && \
rm -rf /var/cache/yum/*
# nvidia-docker 1.0
RUN echo "/usr/local/nvidia/lib" >> /etc/ld.so.conf.d/nvidia.conf && \
echo "/usr/local/nvidia/lib64" >> /etc/ld.so.conf.d/nvidia.conf
ENV PATH /usr/local/nvidia/bin:/usr/local/cuda/bin:${PATH}
ENV LD_LIBRARY_PATH /usr/local/nvidia/lib:/usr/local/nvidia/lib64
# nvidia-container-runtime
ENV NVIDIA_VISIBLE_DEVICES all
ENV NVIDIA_DRIVER_CAPABILITIES compute,utility
ENV NVIDIA_REQUIRE_CUDA "cuda>=10.1 brand=tesla,driver>=418,driver<419"
############################################
## taken from devel
## https://hub.docker.com/r/nvidia/cuda/
############################################
ENV LIBRARY_PATH /usr/local/cuda/lib64/stubs
RUN yum install -y \
cuda-libraries-dev-$CUDA_PKG_VERSION \
cuda-nvml-dev-$CUDA_PKG_VERSION \
cuda-minimal-build-$CUDA_PKG_VERSION \
cuda-command-line-tools-$CUDA_PKG_VERSION && \
rm -rf /var/cache/yum/*
############################################
## taken from runtime
## https://hub.docker.com/r/nvidia/cuda/
############################################
LABEL com.nvidia.cudnn.version="${CUDNN_VERSION}"
# cuDNN license: https://developer.nvidia.com/cudnn/license_agreement
RUN CUDNN_DOWNLOAD_SUM=c31697d6b71afe62838ad2e57da3c3c9419c4e9f5635d14b683ebe63f904fbc8 && \
curl -fsSL http://developer.download.nvidia.com/compute/redist/cudnn/v7.5.0/cudnn-10.1-linux-x64-v7.5.0.56.tgz -O && \
echo "$CUDNN_DOWNLOAD_SUM cudnn-10.1-linux-x64-v7.5.0.56.tgz" | sha256sum -c - && \
tar --no-same-owner -xzf cudnn-10.1-linux-x64-v7.5.0.56.tgz -C /usr/local --wildcards 'cuda/lib64/libcudnn.so.*' && \
rm cudnn-10.1-linux-x64-v7.5.0.56.tgz && \
ldconfig
RUN yum install -y \
cuda-libraries-$CUDA_PKG_VERSION \
cuda-nvtx-$CUDA_PKG_VERSION && \
rm -rf /var/cache/yum/*
############################################
## taken from tensorflow
############################################
ENV LD_LIBRARY_PATH /usr/local/cuda/extras/CUPTI/lib64:$LD_LIBRARY_PATH
ENV TF_NEED_CUDA 1
ENV TF_NEED_TENSORRT 1
ENV TF_CUDA_COMPUTE_CAPABILITIES=3.5,5.2,6.0,6.1,7.0
ENV TF_CUDA_VERSION=9.0
ENV TF_CUDNN_VERSION=7
############################################
# DONOT uncomment. uncomment for dev.
ARG BAZEL_VERSION=0.21.0
ARG PYTHON_VERSION=3.6
ENV BAZEL_VERSION=$BAZEL_VERSION
ENV PYTHON_VERSION=$PYTHON_VERSION
# fix fatal: unable to look up current user in the passwd file: no such user
ENV GIT_COMMITTER_NAME=sub-mod
ENV GIT_COMMITTER_NAME=subin@apache.org
# Not essential, but wise to set the lang
# Note: Users with other languages should set this in their derivative image
ENV LANGUAGE en_US.UTF-8
ENV LANG en_US.UTF-8
ENV LC_ALL=""
ENV PYTHONIOENCODING UTF-8
ENV NB_USER=default
ENV NB_UID=1001
ENV PYTHON_BIN_PATH=/usr/bin/python
ENV TINI_VERSION=v0.18.0
## Bazel
ENV PYTHON_LIB_PATH=/usr/lib64/python$PYTHON_VERSION/site-packages
ENV LD_LIBRARY_PATH="/usr/local/lib${LD_LIBRARY_PATH:+:${LD_LIBRARY_PATH}}";
ENV BAZELRC /root/.bazelrc
###ENV BAZEL_VERSION 0.15.0
################################################
## Tensorflow ./configure options for Bazel
################################################
ENV PYTHON_BIN_PATH=/usr/bin/python
ENV CC_OPT_FLAGS -march=native
ENV TF_NEED_JEMALLOC 1
ENV TF_NEED_GCP 0
ENV TF_NEED_VERBS 0
ENV TF_NEED_HDFS 0
ENV TF_ENABLE_XLA 0
ENV TF_NEED_OPENCL 0
ENV TF_NEED_CUDA 0
ENV TF_NEED_MPI 0
ENV TF_NEED_GDR 0
ENV TF_NEED_S3 0
ENV TF_NEED_KAFKA 0
ENV TF_NEED_OPENCL_SYCL 0
ENV TF_DOWNLOAD_CLANG 0
ENV TF_SET_ANDROID_WORKSPACE 0
ENV PATH /usr/local/bin:$PATH:/home/default/.local/bin
ENV JAVA_HOME /usr/lib/jvm/java-1.8.0-openjdk-1.8.0*
RUN echo 'PS1="\u@\h:\w\\$ \[$(tput sgr0)\]"' >> /root/.bashrc \
&& yum install -y yum-utils \
&& prepare-yum-repositories rhel-server-rhscl-7-rpms \
&& if [ "$PYTHON_VERSION" = "2.7" ] ; then yum install -y tkinter scl-utils python27 python-devel python27-python-devel && scl enable python27 bash ; fi \
&& if [[ $PYTHON_VERSION == 3.* ]] ; then yum install -y scl-utils rh-python${PYTHON_VERSION//.} rh-python${PYTHON_VERSION//.}-python-pip rh-python${PYTHON_VERSION//.}-scldevel && scl enable rh-python${PYTHON_VERSION//.} bash ; fi \
&& echo "-----IMAGE_TEST--------" \
&& if [[ $PYTHON_VERSION == 3.* ]] ; then ls -l /opt/rh/rh-python${PYTHON_VERSION//.}/root/usr/bin ; fi \
&& echo "which_python="`which python` \
&& echo "link_which_python=`ls -l $(which python) | awk '{print $9 $10 $11}'`" \
&& echo "link_bin_python=`ls -l /usr/bin/python |awk '{print $9 $10 $11}'`" \
&& echo "which_pip="`which pip` \
&& echo "which_pip_site="`pip --version |awk '{print $4}'` \
&& echo "link_which_pip=`ls -l $(which pip) | awk '{print $9 $10 $11}'`" \
&& echo "PATH=$PATH" \
&& echo "PYTHON_VERSION=$PYTHON_VERSION" \
&& echo "LD_LIBRARY_PATH=$LD_LIBRARY_PATH" \
&& echo "PYTHON_LIB_PATH=$PYTHON_LIB_PATH" \
&& echo "-----IMAGE_TEST--------" \
&& chgrp -R root /opt \
&& chmod -R a+rwx /opt \
&& chmod a+rw /etc/passwd \
&& yum install -y vim gcc gcc-c++ glibc-devel openssl-devel gpg perf \
&& yum install -y which findutils x86info cpuid dmidecode procps \
&& yum install -y kernel-devel make automake autoconf swig zip unzip libtool binutils \
&& yum install -y freetype-devel libpng12-devel zlib-devel giflib-devel zeromq-devel zeromq3-devel \
&& yum install -y libxml2 libxml2-devel libxslt libxslt-devel gzip \
&& yum install -y java-1.8.0-openjdk java-1.8.0-openjdk-devel patch gdb file pciutils cmake \
&& yum install -y tar tree which git curl wget java-headless bzip2 gnupg2 sqlite protobuf-compiler \
&& echo "-----IMAGE_TEST--------" \
&& echo "which_python="`which python` \
&& echo "link_which_python=`ls -l $(which python) | awk '{print $9 $10 $11}'`" \
&& echo "link_bin_python=`ls -l /usr/bin/python |awk '{print $9 $10 $11}'`" \
&& echo "which_pip="`which pip` \
&& echo "which_pip_site="`pip --version |awk '{print $4}'` \
&& echo "link_which_pip=`ls -l $(which pip) | awk '{print $9 $10 $11}'`" \
&& echo "PATH=$PATH" \
&& echo "PYTHON_VERSION=$PYTHON_VERSION" \
&& echo "LD_LIBRARY_PATH=$LD_LIBRARY_PATH" \
&& echo "PYTHON_LIB_PATH=$PYTHON_LIB_PATH" \
&& echo "-----IMAGE_TEST--------" \
&& ln -s /usr/local/cuda/lib64/stubs/libcuda.so /usr/local/cuda/lib64/stubs/libcuda.so.1 \
&& LD_LIBRARY_PATH=/usr/local/cuda/lib64/stubs:${LD_LIBRARY_PATH} \
&& rpm -qf /bin/scl \
&& scl -l \
&& ls -l /usr/bin/python* \
&& chgrp -R root /opt \
&& curl "https://bootstrap.pypa.io/get-pip.py" -o "get-pip.py" \
&& echo "PATH=$PATH" \
&& echo "LD_LIBRARY_PATH=$LD_LIBRARY_PATH" \
&& echo $PYTHON_VERSION \
&& if [ "$PYTHON_VERSION" = "2.7" ] ; then python$PYTHON_VERSION get-pip.py ; fi \
&& if [[ $PYTHON_VERSION == 3.* ]] ; then ls -l /opt/rh/rh-python${PYTHON_VERSION//.}/root/usr/lib64/ && export LD_LIBRARY_PATH="/opt/rh/rh-python${PYTHON_VERSION//.}/root/usr/lib64/:/usr/local/lib${LD_LIBRARY_PATH:+:${LD_LIBRARY_PATH}}" && echo $LD_LIBRARY_PATH && export PYTHON_LIB_PATH=/opt/rh/rh-python${PYTHON_VERSION//.}/root/usr/lib/python${PYTHON_VERSION}/site-packages && echo $PYTHON_LIB_PATH && rm -fr /usr/bin/python && ln -s /opt/rh/rh-python${PYTHON_VERSION//.}/root/usr/bin/python${PYTHON_VERSION} /usr/bin/python && ls -l /usr/bin/python* && python get-pip.py && rm -fr /usr/bin/pip && ln -s /opt/rh/rh-python${PYTHON_VERSION//.}/root/usr/bin/pip /usr/bin/pip; fi \
&& echo "-----IMAGE_TEST--------" \
&& if [[ $PYTHON_VERSION == 3.* ]] ; then echo "PYTHON_H="`rpm -ql rh-python${PYTHON_VERSION//.}-python-devel | grep Python.h` ; fi \
&& if [[ $PYTHON_VERSION == 3.* ]] ; then ls -l /opt/rh/rh-python${PYTHON_VERSION//.}/root/usr/include/ && ls -l /opt/rh/rh-python${PYTHON_VERSION//.}/root/usr/lib64/ ; fi \
&& echo "which_python="`which python` \
&& echo "link_which_python=`ls -l $(which python) | awk '{print $9 $10 $11}'`" \
&& echo "link_bin_python=`ls -l /usr/bin/python |awk '{print $9 $10 $11}'`" \
&& echo "which_pip="`which pip` \
&& echo "link_which_pip=`ls -l $(which pip) | awk '{print $9 $10 $11}'`" \
&& echo "which_pip_ver="`pip --version` \
&& echo "which_pip_site="`pip --version |awk '{print $4}'` \
&& echo "PATH=$PATH" \
&& echo "LD_LIBRARY_PATH=$LD_LIBRARY_PATH" \
&& echo "PYTHON_LIB_PATH=$PYTHON_LIB_PATH" \
&& echo "PYTHON_VERSION=$PYTHON_VERSION" \
&& ls -l /usr/bin/python* \
&& echo "-----IMAGE_TEST--------"
RUN wget https://github.com/krallin/tini/releases/download/${TINI_VERSION}/tini -P /tmp \
&& wget https://github.com/krallin/tini/releases/download/${TINI_VERSION}/tini.asc -P /tmp \
&& cd /tmp \
&& \
TINI_GPGKEY=595E85A6B1B4779EA4DAAEC70B588DFF0527A9B7; \
found=''; \
for server in \
ha.pool.sks-keyservers.net \
hkp://keyserver.ubuntu.com:80 \
hkp://p80.pool.sks-keyservers.net:80 \
pgp.mit.edu \
; do \
echo "Fetching GPG key $TINI_GPGKEY from $server"; \
gpg --batch --keyserver "$server" --recv-keys "$TINI_GPGKEY" && found=yes && break; \
done; \
test -z "$found" && echo >&2 "ERROR: failed to fetch GPG key $TINI_GPGKEY" && exit 1; \
gpg --batch --verify /tmp/tini.asc /tmp/tini \
&& mv /tmp/tini /usr/local/bin/tini \
&& chmod +x /usr/local/bin/tini \
&& chown -R 1001:1001 /opt/app-root \
&& chgrp -R root /opt/app-root \
&& chmod -R ug+rwx /opt/app-root \
&& echo "startup --batch" >>/etc/.bazelrc \
&& echo "startup --batch" >>/root/.bazelrc \
&& echo "build --spawn_strategy=standalone --genrule_strategy=standalone" >>/etc/.bazelrc \
&& echo "build --spawn_strategy=standalone --genrule_strategy=standalone" >>/root/.bazelrc
#https://github.com/tensorflow/tensorflow/blob/master/tensorflow/tools/ci_build/install/.bazelrc
# Running bazel inside a `docker build` command causes trouble, cf:
# https://github.com/bazelbuild/bazel/issues/134
# The easiest solution is to set up a bazelrc file forcing --batch.
# Similarly, we need to workaround sandboxing issues:
# https://github.com/bazelbuild/bazel/issues/418
#
# A cloned repo is found under serving folder
#Size of bazel-$BAZEL_VERSION-installer-linux-x86_64.sh is 200MB+
# downloaded file is available under bazel folder
# No yum commands here
# removed python to fix numpy issue
RUN mkdir -p /tf \
&& if [[ $PYTHON_VERSION == 3.* ]] ; then export LD_LIBRARY_PATH="/opt/rh/rh-python${PYTHON_VERSION//.}/root/usr/lib64/:/usr/local/lib${LD_LIBRARY_PATH:+:${LD_LIBRARY_PATH}}" ; fi \
&& echo $LD_LIBRARY_PATH \
&& pip install --no-cache-dir --upgrade pip \
&& pip install --no-cache-dir -U setuptools \
&& pip install --no-cache-dir enum34 futures mock numpy six pixiedust pillow pyaml keras \
&& mkdir -p /tf/tools \
&& cd /tf/tools \
&& wget -q https://github.com/bazelbuild/bazel/releases/download/$BAZEL_VERSION/bazel-$BAZEL_VERSION-installer-linux-x86_64.sh \
&& ls -l /tf/tools \
&& chmod +x bazel-$BAZEL_VERSION-installer-linux-x86_64.sh \
&& ./bazel-$BAZEL_VERSION-installer-linux-x86_64.sh \
&& bazel \
&& usermod -g root $NB_USER \
&& mkdir -p /workspace \
&& chown $NB_UID:root /workspace \
&& chmod 1777 /workspace \
&& mkdir -p /home/$NB_USER \
&& chown -R $NB_UID:root /home/$NB_USER \
&& chmod g+rwX,o+rX -R /home/$NB_USER
COPY ./s2i/bin/ /usr/libexec/s2i
# ADD test/ /tmp/test/
ADD entrypoint /entrypoint
RUN chmod +x /entrypoint
ADD build_tools /build_tools
# NO CLEANUP
# Donot add below commands
# && yum erase -y gcc gcc-c++ glibc-devel \
# && yum clean all -y \
EXPOSE 8080
ENV HOME /home/$NB_USER
# This default user is created in the openshift/base-centos7 image
USER 1001
# Make the default PWD somewhere that the user can write. This is
# useful when connecting with 'oc run' and starting a 'spark-shell',
# which will likely try to create files and directories in PWD and
# error out if it cannot.
WORKDIR /workspace
ENTRYPOINT ["/entrypoint"]
# TODO: Set the default CMD for the image
CMD ["/usr/libexec/s2i/usage"]