131 lines
4.7 KiB
Docker
131 lines
4.7 KiB
Docker
# Copyright The PyTorch Lightning team.
|
|
#
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
# you may not use this file except in compliance with the License.
|
|
# You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
# See the License for the specific language governing permissions and
|
|
# limitations under the License.
|
|
|
|
# Existing images:
|
|
# --build-arg PYTHON_VERSION=3.7 --build-arg PYTORCH_VERSION=1.7 --build-arg CUDA_VERSION=10.2
|
|
# --build-arg PYTHON_VERSION=3.7 --build-arg PYTORCH_VERSION=1.6 --build-arg CUDA_VERSION=10.2
|
|
# --build-arg PYTHON_VERSION=3.7 --build-arg PYTORCH_VERSION=1.5 --build-arg CUDA_VERSION=10.2
|
|
# --build-arg PYTHON_VERSION=3.7 --build-arg PYTORCH_VERSION=1.4 --build-arg CUDA_VERSION=10.1
|
|
|
|
ARG CUDNN_VERSION=8
|
|
ARG CUDA_VERSION=10.2
|
|
|
|
# FROM nvidia/cuda:${CUDA_VERSION}-devel-ubuntu20.04
|
|
FROM nvidia/cuda:${CUDA_VERSION}-cudnn${CUDNN_VERSION}-devel-ubuntu18.04
|
|
# FROM nvidia/cuda:${CUDA_VERSION}-devel-ubuntu18.04
|
|
|
|
ARG PYTHON_VERSION=3.7
|
|
ARG PYTORCH_VERSION=1.6
|
|
ARG CMAKE_VERSION=3.18.4
|
|
|
|
SHELL ["/bin/bash", "-c"]
|
|
# https://techoverflow.net/2019/05/18/how-to-fix-configuring-tzdata-interactive-input-when-building-docker-images/
|
|
ENV \
|
|
DEBIAN_FRONTEND=noninteractive \
|
|
TZ=Europe/Prague \
|
|
PATH="$PATH:/root/.local/bin" \
|
|
CUDA_TOOLKIT_ROOT_DIR="/usr/local/cuda" \
|
|
MKL_THREADING_LAYER=GNU
|
|
|
|
RUN apt-get update -qq && \
|
|
apt-get install -y --no-install-recommends \
|
|
build-essential \
|
|
pkg-config \
|
|
cmake \
|
|
git \
|
|
wget \
|
|
curl \
|
|
unzip \
|
|
ca-certificates \
|
|
software-properties-common \
|
|
libopenmpi-dev \
|
|
&& \
|
|
|
|
# Install python
|
|
add-apt-repository ppa:deadsnakes/ppa && \
|
|
apt-get install -y \
|
|
python${PYTHON_VERSION} \
|
|
python${PYTHON_VERSION}-distutils \
|
|
python${PYTHON_VERSION}-dev \
|
|
&& \
|
|
|
|
update-alternatives --install /usr/bin/python${PYTHON_VERSION%%.*} python${PYTHON_VERSION%%.*} /usr/bin/python${PYTHON_VERSION} 1 && \
|
|
update-alternatives --install /usr/bin/python python /usr/bin/python${PYTHON_VERSION} 1 && \
|
|
|
|
# Cleaning
|
|
apt-get autoremove -y && \
|
|
apt-get clean && \
|
|
rm -rf /root/.cache && \
|
|
rm -rf /var/lib/apt/lists/*
|
|
|
|
ENV \
|
|
HOROVOD_GPU_OPERATIONS=NCCL \
|
|
HOROVOD_WITH_PYTORCH=1 \
|
|
HOROVOD_WITHOUT_TENSORFLOW=1 \
|
|
HOROVOD_WITHOUT_MXNET=1 \
|
|
HOROVOD_WITH_GLOO=1 \
|
|
HOROVOD_WITHOUT_MPI=1 \
|
|
# MAKEFLAGS="-j$(nproc)" \
|
|
MAKEFLAGS="-j1" \
|
|
TORCH_CUDA_ARCH_LIST="3.7;5.0;6.0;7.0;7.5"
|
|
|
|
COPY ./requirements.txt requirements.txt
|
|
COPY ./requirements/ ./requirements/
|
|
|
|
# conda init
|
|
RUN \
|
|
wget https://bootstrap.pypa.io/get-pip.py --progress=bar:force:noscroll --no-check-certificate && \
|
|
python${PYTHON_VERSION} get-pip.py && \
|
|
rm get-pip.py && \
|
|
|
|
# Disable cache
|
|
pip config set global.cache-dir false && \
|
|
# eventualy use pre-release
|
|
#pip install "torch==${PYTORCH_VERSION}.*" --pre && \
|
|
# set particular PyTorch version
|
|
python ./requirements/adjust_versions.py requirements.txt ${PYTORCH_VERSION} && \
|
|
python ./requirements/adjust_versions.py requirements/extra.txt ${PYTORCH_VERSION} && \
|
|
python ./requirements/adjust_versions.py requirements/examples.txt ${PYTORCH_VERSION} && \
|
|
# Install all requirements
|
|
# todo: find a way how to install nightly PT version
|
|
# --pre --extra-index-url https://download.pytorch.org/whl/nightly/cu${cuda_ver[0]}${cuda_ver[1]}/torch_nightly.html
|
|
pip install -r requirements/devel.txt --no-cache-dir && \
|
|
rm -rf requirements.* requirements/
|
|
|
|
RUN \
|
|
# install DALI, needed for examples
|
|
pip install --extra-index-url https://developer.download.nvidia.com/compute/redist nvidia-dali-cuda${CUDA_VERSION%%.*}0
|
|
|
|
RUN \
|
|
# install NVIDIA apex
|
|
# TODO: later commits break CI when cpp extensions are compiling. Unset when fixed
|
|
pip install --no-cache-dir --global-option="--cpp_ext" --global-option="--cuda_ext" git+https://github.com/NVIDIA/apex@705cba9
|
|
|
|
RUN \
|
|
# install FairScale
|
|
pip install fairscale>=0.3.4
|
|
|
|
RUN \
|
|
# install DeepSpeed
|
|
# TODO(@SeanNaren): 0.3.15 is broken - skipping to unblock
|
|
pip install 'deepspeed>=0.3.14,!=0.3.15'
|
|
|
|
RUN \
|
|
# Show what we have
|
|
pip --version && \
|
|
pip list && \
|
|
python -c 'from nvidia.dali.pipeline import Pipeline' && \
|
|
python -c "import sys; assert sys.version[:3] == '$PYTHON_VERSION', sys.version" && \
|
|
python -c "import torch; assert torch.__version__[:3] == '$PYTORCH_VERSION', torch.__version__"
|