From 90bd3401411f2bfed1e9bf83fa5d91aea807117b Mon Sep 17 00:00:00 2001 From: Martin Milenkoski Date: Fri, 9 Jul 2021 23:51:02 +0200 Subject: [PATCH] Upgrade images to PyTorch 1.9.0 --- pytorch/backend_benchmark/Dockerfile | 2 +- pytorch/backend_benchmark/requirements.txt | 2 +- pytorch/base/Dockerfile | 4 ++-- .../imagerecognition/cifar10-resnet20-all-reduce/Dockerfile | 2 +- .../cifar10-resnet20-all-reduce/requirements.txt | 2 +- pytorch/imagerecognition/cifar10-resnet20-ddp/Dockerfile | 2 +- .../imagerecognition/cifar10-resnet20-ddp/requirements.txt | 2 +- .../epsilon-logistic-regression-all-reduce/Dockerfile | 2 +- .../epsilon-logistic-regression-all-reduce/requirements.txt | 2 +- .../language-modeling/wikitext2-lstm-all-reduce/Dockerfile | 2 +- .../wikitext2-lstm-all-reduce/requirements.txt | 2 +- pytorch/nlp/translation/wmt16-gnmt-all-reduce/Dockerfile | 2 +- .../nlp/translation/wmt16-gnmt-all-reduce/requirements.txt | 2 +- .../nlp/translation/wmt17-transformer-all-reduce/Dockerfile | 2 +- .../translation/wmt17-transformer-all-reduce/requirements.txt | 2 +- 15 files changed, 16 insertions(+), 16 deletions(-) diff --git a/pytorch/backend_benchmark/Dockerfile b/pytorch/backend_benchmark/Dockerfile index 053e6d3..c7b8b0d 100644 --- a/pytorch/backend_benchmark/Dockerfile +++ b/pytorch/backend_benchmark/Dockerfile @@ -1,4 +1,4 @@ -FROM mlbench/mlbench-pytorch-base:pytorch-v1.8.1 +FROM mlbench/mlbench-pytorch-base:pytorch-v1.9.0 #RUN HOROVOD_GPU_ALLREDUCE=MPI HOROVOD_GPU_BROADCAST=MPI \ # HOROVOD_WITH_PYTORCH=1\ diff --git a/pytorch/backend_benchmark/requirements.txt b/pytorch/backend_benchmark/requirements.txt index 3aa018f..45a48f6 100644 --- a/pytorch/backend_benchmark/requirements.txt +++ b/pytorch/backend_benchmark/requirements.txt @@ -1 +1 @@ -mlbench-core[torch]==3.0.0.dev23 +mlbench-core[torch]==3.0.0.dev24 diff --git a/pytorch/base/Dockerfile b/pytorch/base/Dockerfile index 16ce435..55001f3 100644 --- a/pytorch/base/Dockerfile +++ b/pytorch/base/Dockerfile @@ -95,12 +95,12 @@ RUN conda install -y python=$PYTHON_VERSION numpy pyyaml scipy mkl mkl-include n # Build pytorch from source 1.7.0a0 RUN git clone --recursive https://github.com/pytorch/pytorch && \ cd pytorch && \ - git checkout v1.8.1 && \ + git checkout v1.9.0 && \ git submodule sync && \ git submodule update --init --recursive && \ TORCH_CUDA_ARCH_LIST="3.5 5.2 6.0 6.1 7.0+PTX" TORCH_NVCC_FLAGS="-Xfatbin -compress-all" \ NCCL_INCLUDE_DIR="/usr/include/" USE_NCCL=1 USE_SYSTEM_NCCL=1 USE_MKLDNN=1 \ - CMAKE_PREFIX_PATH="$(dirname $(which conda))/../" PYTORCH_BUILD_VERSION=1.8.1 PYTORCH_BUILD_NUMBER=1 \ + CMAKE_PREFIX_PATH="$(dirname $(which conda))/../" PYTORCH_BUILD_VERSION=1.9.0 PYTORCH_BUILD_NUMBER=1 \ pip install -v . #RUN git clone https://github.com/pytorch/vision.git && cd vision && git checkout tags/v0.5.0 && pip install -v . diff --git a/pytorch/imagerecognition/cifar10-resnet20-all-reduce/Dockerfile b/pytorch/imagerecognition/cifar10-resnet20-all-reduce/Dockerfile index f41556c..0c107b8 100644 --- a/pytorch/imagerecognition/cifar10-resnet20-all-reduce/Dockerfile +++ b/pytorch/imagerecognition/cifar10-resnet20-all-reduce/Dockerfile @@ -1,4 +1,4 @@ -FROM mlbench/mlbench-pytorch-base:pytorch-v1.8.1 +FROM mlbench/mlbench-pytorch-base:pytorch-v1.9.0 # The reference implementation and user defined implementations are placed here. ADD ./requirements.txt /requirements.txt diff --git a/pytorch/imagerecognition/cifar10-resnet20-all-reduce/requirements.txt b/pytorch/imagerecognition/cifar10-resnet20-all-reduce/requirements.txt index 3aa018f..45a48f6 100644 --- a/pytorch/imagerecognition/cifar10-resnet20-all-reduce/requirements.txt +++ b/pytorch/imagerecognition/cifar10-resnet20-all-reduce/requirements.txt @@ -1 +1 @@ -mlbench-core[torch]==3.0.0.dev23 +mlbench-core[torch]==3.0.0.dev24 diff --git a/pytorch/imagerecognition/cifar10-resnet20-ddp/Dockerfile b/pytorch/imagerecognition/cifar10-resnet20-ddp/Dockerfile index f41556c..0c107b8 100644 --- a/pytorch/imagerecognition/cifar10-resnet20-ddp/Dockerfile +++ b/pytorch/imagerecognition/cifar10-resnet20-ddp/Dockerfile @@ -1,4 +1,4 @@ -FROM mlbench/mlbench-pytorch-base:pytorch-v1.8.1 +FROM mlbench/mlbench-pytorch-base:pytorch-v1.9.0 # The reference implementation and user defined implementations are placed here. ADD ./requirements.txt /requirements.txt diff --git a/pytorch/imagerecognition/cifar10-resnet20-ddp/requirements.txt b/pytorch/imagerecognition/cifar10-resnet20-ddp/requirements.txt index 3aa018f..45a48f6 100644 --- a/pytorch/imagerecognition/cifar10-resnet20-ddp/requirements.txt +++ b/pytorch/imagerecognition/cifar10-resnet20-ddp/requirements.txt @@ -1 +1 @@ -mlbench-core[torch]==3.0.0.dev23 +mlbench-core[torch]==3.0.0.dev24 diff --git a/pytorch/linearmodels/epsilon-logistic-regression-all-reduce/Dockerfile b/pytorch/linearmodels/epsilon-logistic-regression-all-reduce/Dockerfile index 58b423e..34f8cdc 100644 --- a/pytorch/linearmodels/epsilon-logistic-regression-all-reduce/Dockerfile +++ b/pytorch/linearmodels/epsilon-logistic-regression-all-reduce/Dockerfile @@ -1,4 +1,4 @@ -FROM mlbench/mlbench-pytorch-base:pytorch-v1.8.1 +FROM mlbench/mlbench-pytorch-base:pytorch-v1.9.0 # Add and install requirements ADD ./requirements.txt /requirements.txt diff --git a/pytorch/linearmodels/epsilon-logistic-regression-all-reduce/requirements.txt b/pytorch/linearmodels/epsilon-logistic-regression-all-reduce/requirements.txt index 3aa018f..45a48f6 100644 --- a/pytorch/linearmodels/epsilon-logistic-regression-all-reduce/requirements.txt +++ b/pytorch/linearmodels/epsilon-logistic-regression-all-reduce/requirements.txt @@ -1 +1 @@ -mlbench-core[torch]==3.0.0.dev23 +mlbench-core[torch]==3.0.0.dev24 diff --git a/pytorch/nlp/language-modeling/wikitext2-lstm-all-reduce/Dockerfile b/pytorch/nlp/language-modeling/wikitext2-lstm-all-reduce/Dockerfile index 0d6a9ee..24202ad 100644 --- a/pytorch/nlp/language-modeling/wikitext2-lstm-all-reduce/Dockerfile +++ b/pytorch/nlp/language-modeling/wikitext2-lstm-all-reduce/Dockerfile @@ -1,4 +1,4 @@ -FROM mlbench/mlbench-pytorch-base:pytorch-v1.8.1 +FROM mlbench/mlbench-pytorch-base:pytorch-v1.9.0 # -------------------- Debug -------------------- # RUN apt-get update && apt-get install -y vim net-tools diff --git a/pytorch/nlp/language-modeling/wikitext2-lstm-all-reduce/requirements.txt b/pytorch/nlp/language-modeling/wikitext2-lstm-all-reduce/requirements.txt index 6f95c5b..5a98442 100644 --- a/pytorch/nlp/language-modeling/wikitext2-lstm-all-reduce/requirements.txt +++ b/pytorch/nlp/language-modeling/wikitext2-lstm-all-reduce/requirements.txt @@ -1 +1 @@ -mlbench-core[torch]==3.0.0.dev23 \ No newline at end of file +mlbench-core[torch]==3.0.0.dev24 \ No newline at end of file diff --git a/pytorch/nlp/translation/wmt16-gnmt-all-reduce/Dockerfile b/pytorch/nlp/translation/wmt16-gnmt-all-reduce/Dockerfile index 3629350..47de7e0 100644 --- a/pytorch/nlp/translation/wmt16-gnmt-all-reduce/Dockerfile +++ b/pytorch/nlp/translation/wmt16-gnmt-all-reduce/Dockerfile @@ -1,4 +1,4 @@ -FROM mlbench/mlbench-pytorch-base:pytorch-v1.8.1 +FROM mlbench/mlbench-pytorch-base:pytorch-v1.9.0 # -------------------- Debug -------------------- # RUN apt-get update && apt-get install -y vim net-tools diff --git a/pytorch/nlp/translation/wmt16-gnmt-all-reduce/requirements.txt b/pytorch/nlp/translation/wmt16-gnmt-all-reduce/requirements.txt index 9be4451..2a680c7 100644 --- a/pytorch/nlp/translation/wmt16-gnmt-all-reduce/requirements.txt +++ b/pytorch/nlp/translation/wmt16-gnmt-all-reduce/requirements.txt @@ -1,2 +1,2 @@ -mlbench-core[torch]==3.0.0.dev23 +mlbench-core[torch]==3.0.0.dev24 mosestokenizer==1.1.0 diff --git a/pytorch/nlp/translation/wmt17-transformer-all-reduce/Dockerfile b/pytorch/nlp/translation/wmt17-transformer-all-reduce/Dockerfile index 38e3e5a..5a50393 100644 --- a/pytorch/nlp/translation/wmt17-transformer-all-reduce/Dockerfile +++ b/pytorch/nlp/translation/wmt17-transformer-all-reduce/Dockerfile @@ -1,4 +1,4 @@ -FROM mlbench/mlbench-pytorch-base:pytorch-v1.8.1 +FROM mlbench/mlbench-pytorch-base:pytorch-v1.9.0 # -------------------- Debug -------------------- RUN git clone https://github.com/NVIDIA/apex && cd apex && git checkout f3a960f && \ diff --git a/pytorch/nlp/translation/wmt17-transformer-all-reduce/requirements.txt b/pytorch/nlp/translation/wmt17-transformer-all-reduce/requirements.txt index 3aa018f..45a48f6 100644 --- a/pytorch/nlp/translation/wmt17-transformer-all-reduce/requirements.txt +++ b/pytorch/nlp/translation/wmt17-transformer-all-reduce/requirements.txt @@ -1 +1 @@ -mlbench-core[torch]==3.0.0.dev23 +mlbench-core[torch]==3.0.0.dev24