Commit c664061
Final results.
Victor Bittorf committed Jul 29, 2020
1 parent f7918f2 commit c664061
Showing 15,666 changed files with 10,873,062 additions and 0 deletions.
Only the first 3,000 changed files are shown below; the full diff is too large to display.
1 change: 1 addition & 0 deletions Alibaba/README.md
@@ -0,0 +1 @@
Alibaba submission
47 changes: 47 additions & 0 deletions Alibaba/benchmark/source_mxnet_resnet_a100/Dockerfile
@@ -0,0 +1,47 @@
# Copyright (c) 2018-2020, NVIDIA CORPORATION. All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

ARG FROM_IMAGE_NAME=nvcr.io/nvidian/mxnet:20.06-py3
FROM ${FROM_IMAGE_NAME}
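# The base image can be overridden at build time, e.g. (illustrative; the
# internal default above corresponds to the public NGC MXNet 20.06-py3 release):
#   docker build --build-arg FROM_IMAGE_NAME=nvcr.io/nvidia/mxnet:20.06-py3 .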

# Install dependencies for system configuration logger
RUN apt-get update \
&& apt-get install -y --no-install-recommends \
infiniband-diags \
pciutils \
&& rm -rf /var/lib/apt/lists/*

# Install Python dependencies
WORKDIR /workspace/image_classification

COPY requirements.txt .
RUN pip install --no-cache-dir https://github.com/mlperf/logging/archive/9ea0afa.zip \
&& pip install --no-cache-dir -r requirements.txt

# Copy ResNet-50 code
COPY . .

# Configure environment variables
ENV MXNET_UPDATE_ON_KVSTORE=0 \
MXNET_EXEC_ENABLE_ADDTO=1 \
MXNET_USE_TENSORRT=0 \
MXNET_GPU_WORKER_NTHREADS=1 \
MXNET_GPU_COPY_NTHREADS=1 \
MXNET_CUDNN_AUTOTUNE_DEFAULT=0 \
HOROVOD_BATCH_D2D_MEMCOPIES=1 \
HOROVOD_GROUPED_ALLREDUCES=1 \
NCCL_SOCKET_IFNAME=ib0 \
OMPI_MCA_btl=^openib \
OMP_NUM_THREADS=1 \
OPENCV_FOR_THREADS_NUM=1
85 changes: 85 additions & 0 deletions Alibaba/benchmark/source_mxnet_resnet_a100/README.md
@@ -0,0 +1,85 @@
# 1. Problem

This benchmark performs image classification using the ResNet-50 CNN.

## Requirements
* [MXNet 20.06-py3 NGC container](https://ngc.nvidia.com/catalog/containers/nvidia:mxnet)
* [nvidia-docker](https://github.com/NVIDIA/nvidia-docker) (single-node)
* Slurm with [Pyxis](https://github.com/NVIDIA/pyxis) (multi-node)

# 2. Directions

## Steps to download and verify data
Download the dataset manually, following the instructions on the [ImageNet website](http://image-net.org/download). We use the ImageNet dataset packed into an MXNet RecordIO database, without resizing or normalization; no preprocessing is performed on the raw ImageNet JPEGs.

For further instructions, see https://github.com/NVIDIA/DeepLearningExamples/blob/master/MxNet/Classification/RN50v1.5/README.md#prepare-dataset.
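
As a rough illustration, the raw training images can be packed into RecordIO without resizing using MXNet's `im2rec.py` tool (shipped under `tools/` in the MXNet repository). This is a minimal sketch with placeholder paths; the guide linked above remains the authoritative procedure:

```
# Build an image list from the class-per-directory layout, then pack the
# images as-is (--pass-through skips any resizing or re-encoding).
python tools/im2rec.py --list --recursive train /path/to/imagenet/train
python tools/im2rec.py --pass-through --num-thread 8 train /path/to/imagenet/train
```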

## Steps to launch training on a single node

For single-node training, we use Docker to run our container.

### NVIDIA DGX-1 (single node)
Launch configuration and system-specific hyperparameters for the NVIDIA DGX-1
single-node submission are in the `config_DGX1.sh` script.

Steps required to launch single-node training on NVIDIA DGX-1:

```
docker build --pull -t mlperf-nvidia:image_classification .
source config_DGX1.sh
CONT=mlperf-nvidia:image_classification DATADIR=<path/to/data/dir> LOGDIR=<path/to/output/dir> ./run_with_docker.sh
```

### NVIDIA DGX-2 (single node)
Launch configuration and system-specific hyperparameters for the NVIDIA DGX-2
single-node submission are in the `config_DGX2.sh` script.

Steps required to launch single-node training on NVIDIA DGX-2:

```
docker build --pull -t mlperf-nvidia:image_classification .
source config_DGX2.sh
CONT=mlperf-nvidia:image_classification DATADIR=<path/to/data/dir> LOGDIR=<path/to/output/dir> ./run_with_docker.sh
```

## Steps to launch training on multiple nodes

For multi-node training, we use Slurm for scheduling and Pyxis to run our container.

### NVIDIA DGX-1 (multi node)
Launch configuration and system-specific hyperparameters for the NVIDIA DGX-1
multi-node submission are in the `config_DGX1_multi.sh` script.

Steps required to launch multi-node training on NVIDIA DGX-1:

1. Build the docker container and push to a docker registry
```
docker build --pull -t <docker/registry>/mlperf-nvidia:image_classification .
docker push <docker/registry>/mlperf-nvidia:image_classification
```

2. Launch the training
```
source config_DGX1_multi.sh
CONT="<docker/registry>/mlperf-nvidia:image_classification" DATADIR=<path/to/data/dir> LOGDIR=<path/to/output/dir> sbatch -N $DGXNNODES -t $WALLTIME --ntasks-per-node $DGXNGPU run.sub
```

### NVIDIA DGX-2 (multi node)
Launch configuration and system-specific hyperparameters for the NVIDIA DGX-2
multi-node submission are in the `config_DGX2_multi.sh` script.

Steps required to launch multi-node training on NVIDIA DGX-2:

1. Build the docker container and push to a docker registry
```
docker build --pull -t <docker/registry>/mlperf-nvidia:image_classification .
docker push <docker/registry>/mlperf-nvidia:image_classification
```

2. Launch the training
```
source config_DGX2_multi.sh
CONT="<docker/registry>/mlperf-nvidia:image_classification" DATADIR=<path/to/data/dir> LOGDIR=<path/to/output/dir> sbatch -N $DGXNNODES -t $WALLTIME --ntasks-per-node $DGXNGPU run.sub
```
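
The `DGXNNODES`, `WALLTIME`, and `DGXNGPU` variables used above are expected to be set by the sourced config script. For reference, a Pyxis launch inside `run.sub` typically reduces to an `srun` line like the following (an illustrative sketch only; the mount points and the `run_and_time.sh` entrypoint are assumptions, not the actual contents of `run.sub`):

```
srun --ntasks="$(( DGXNNODES * DGXNGPU ))" --ntasks-per-node="${DGXNGPU}" \
     --container-image="${CONT}" \
     --container-mounts="${DATADIR}:/data,${LOGDIR}:/results" \
     ./run_and_time.sh
```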
212 changes: 212 additions & 0 deletions Alibaba/benchmark/source_mxnet_resnet_a100/bind.sh
@@ -0,0 +1,212 @@
#!/bin/bash
set -euo pipefail

print_usage() {
cat << EOF
${0} [options] [--] COMMAND [ARG...]
Control binding policy for each task. Assumes one rank will be launched for each GPU.
Options:
--cpu=MODE
* exclusive -- bind each rank to an exclusive set of cores near its GPU
* exclusive,nosmt -- bind each rank to an exclusive set of cores near its GPU, without hyperthreading
* node -- bind each rank to all cores in the NUMA node nearest its GPU [default]
* *.sh -- bind each rank using the bash associative array bind_cpu_cores or bind_cpu_nodes from a file
* off -- don't bind
--mem=MODE
* node -- bind each rank to the nearest NUMA node [default]
* *.sh -- bind each rank using the bash associative array bind_mem from a file
* off -- don't bind
--ib=MODE
* single -- bind each rank to a single IB device near its GPU
* off -- don't bind [default]
--cluster=CLUSTER
Select which cluster is being used. May be required if system params cannot be detected.
EOF
}
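
# Example invocation (illustrative; the launcher and training script are placeholders):
#   mpirun -np 8 ./bind.sh --cpu=exclusive --ib=single -- python train.py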

################################################################################
# Argument parsing
################################################################################

cpu_mode='node'
mem_mode='node'
ib_mode='off'
cluster=''
while [ $# -gt 0 ]; do
case "$1" in
-h|--help) print_usage ; exit 0 ;;
--cpu=*) cpu_mode="${1/*=/}"; shift ;;
--cpu) cpu_mode="$2"; shift 2 ;;
--mem=*) mem_mode="${1/*=/}"; shift ;;
--mem) mem_mode="$2"; shift 2 ;;
--ib=*) ib_mode="${1/*=/}"; shift ;;
--ib) ib_mode="$2"; shift 2 ;;
--cluster=*) cluster="${1/*=/}"; shift ;;
--cluster) cluster="$2"; shift 2 ;;
--) shift; break ;;
*) break ;;
esac
done
if [ $# -lt 1 ]; then
echo 'ERROR: no command given' >&2
print_usage
exit 1
fi

################################################################################
# Get system params
################################################################################

# LOCAL_RANK is set by an enroot hook for PyTorch containers
# SLURM_LOCALID is set by Slurm
# OMPI_COMM_WORLD_LOCAL_RANK is set by mpirun
readonly local_rank="${LOCAL_RANK:=${SLURM_LOCALID:=${OMPI_COMM_WORLD_LOCAL_RANK:-}}}"
if [ -z "${local_rank}" ]; then
echo 'ERROR: cannot read LOCAL_RANK from env' >&2
exit 1
fi

num_gpus=$(nvidia-smi -i 0 --query-gpu=count --format=csv,noheader,nounits)
if [ "${local_rank}" -ge "${num_gpus}" ]; then
echo "ERROR: local rank is ${local_rank}, but there are only ${num_gpus} gpus available" >&2
exit 1
fi

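# Extract a single field's value from `lscpu` output; exits nonzero if the field is missing.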
get_lscpu_value() {
awk -F: "(\$1 == \"${1}\"){gsub(/ /, \"\", \$2); print \$2; found=1} END{exit found!=1}"
}
lscpu_out=$(lscpu)
num_sockets=$(get_lscpu_value 'Socket(s)' <<< "${lscpu_out}")
num_nodes=$(get_lscpu_value 'NUMA node(s)' <<< "${lscpu_out}")
cores_per_socket=$(get_lscpu_value 'Core(s) per socket' <<< "${lscpu_out}")

echo "num_sockets = ${num_sockets} num_nodes=${num_nodes} cores_per_socket=${cores_per_socket}"

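# Derive per-GPU core counts and this rank's NUMA node, assuming ranks map to
# GPUs in order and GPUs are spread evenly across NUMA nodes.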
readonly cores_per_node=$(( (num_sockets * cores_per_socket) / num_nodes ))
if [ ${num_gpus} -gt 1 ]; then
readonly gpus_per_node=$(( num_gpus / num_nodes ))
else
readonly gpus_per_node=1
fi
readonly cores_per_gpu=$(( cores_per_node / gpus_per_node ))
readonly local_node=$(( local_rank / gpus_per_node ))


declare -a ibdevs=()
case "${cluster}" in
circe)
# Need to specialize for circe because IB detection is hard
ibdevs=(mlx5_1 mlx5_2 mlx5_3 mlx5_4 mlx5_7 mlx5_8 mlx5_9 mlx5_10)
;;
selene)
# Need to specialize for selene because IB detection is hard
ibdevs=(mlx5_0 mlx5_1 mlx5_2 mlx5_3 mlx5_6 mlx5_7 mlx5_8 mlx5_9)
;;
'')
if ibstat_out="$(ibstat -l 2>/dev/null | sort -V)" ; then
mapfile -t ibdevs <<< "${ibstat_out}"
fi
;;
*)
echo "ERROR: Unknown cluster '${cluster}'" >&2
exit 1
;;
esac
readonly num_ibdevs="${#ibdevs[@]}"

################################################################################
# Setup for exec
################################################################################

declare -a numactl_args=()

case "${cpu_mode}" in
exclusive)
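# Bind this rank to an exclusive slice of physical cores plus the matching
# SMT (hyperthread) sibling range, offset by the machine's total physical core count.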
numactl_args+=( "$(printf -- "--physcpubind=%u-%u,%u-%u" \
$(( local_rank * cores_per_gpu )) \
$(( (local_rank + 1) * cores_per_gpu - 1 )) \
$(( local_rank * cores_per_gpu + (cores_per_gpu * gpus_per_node * num_nodes) )) \
$(( (local_rank + 1) * cores_per_gpu + (cores_per_gpu * gpus_per_node * num_nodes) - 1 )) \
)" )
;;
exclusive,nosmt)
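# Same as 'exclusive', but restricted to physical cores (no SMT siblings).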
numactl_args+=( "$(printf -- "--physcpubind=%u-%u" \
$(( local_rank * cores_per_gpu )) \
$(( (local_rank + 1) * cores_per_gpu - 1 )) \
)" )
;;
node)
numactl_args+=( "--cpunodebind=${local_node}" )
;;
*.sh)
source "${cpu_mode}"
if [ -n "${bind_cpu_cores:-}" ]; then
numactl_args+=( "--physcpubind=${bind_cpu_cores[${local_rank}]}" )
elif [ -n "${bind_cpu_nodes:-}" ]; then
numactl_args+=( "--cpunodebind=${bind_cpu_nodes[${local_rank}]}" )
else
echo "ERROR: invalid CPU affinity file ${cpu_mode}." >&2
exit 1
fi
;;
off|'')
;;
*)
echo "ERROR: invalid cpu mode '${cpu_mode}'" 2>&1
print_usage
exit 1
;;
esac

case "${mem_mode}" in
node)
numactl_args+=( "--membind=${local_node}" )
;;
*.sh)
source "${mem_mode}"
if [ -z "${bind_mem:-}" ]; then
echo "ERROR: invalid memory affinity file ${mem_mode}." >&2
exit 1
fi
numactl_args+=( "--membind=${bind_mem[${local_rank}]}" )
;;
off|'')
;;
*)
echo "ERROR: invalid mem mode '${mem_mode}'" 2>&1
print_usage
exit 1
;;
esac

case "${ib_mode}" in
single)
if [ "${num_ibdevs}" -eq 0 ]; then
echo "WARNING: used '$0 --ib=single', but there are 0 IB devices available; skipping IB binding." 2>&1
else
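# Pick the IB device nearest this rank (ranks are spread evenly across devices);
# the ${VAR-default} expansions preserve any values already set in the environment.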
readonly ibdev="${ibdevs[$(( local_rank * num_ibdevs / num_gpus ))]}"
export OMPI_MCA_btl_openib_if_include="${OMPI_MCA_btl_openib_if_include-$ibdev}"
export UCX_NET_DEVICES="${UCX_NET_DEVICES-$ibdev:1}"
fi
;;
off|'')
;;
*)
echo "ERROR: invalid ib mode '${ib_mode}'" 2>&1
print_usage
exit 1
;;
esac

################################################################################
# Exec
################################################################################

if [ "${#numactl_args[@]}" -gt 0 ] ; then
set -x
exec numactl "${numactl_args[@]}" -- "${@}"
else
exec "${@}"
fi
12 changes: 12 additions & 0 deletions Alibaba/benchmark/source_mxnet_resnet_a100/check.sh
@@ -0,0 +1,12 @@
#!/bin/bash
# Run the MLPerf compliance checker over every result log under LOGDEST.
export LOGDEST="/data1/weiwei/scripts-v2/logA100" && echo "LOGDEST=${LOGDEST}"
export COMPLIANCESCRIPTS="/data1/weiwei/scripts-v2/logA100/mlperf_logging" && echo "COMPLIANCESCRIPTS=${COMPLIANCESCRIPTS}"
git clone --depth=1 "https://github.com/mlperf/logging" "${COMPLIANCESCRIPTS}" || true
cd "${COMPLIANCESCRIPTS}"
git fetch origin || true
# COMPLIANCE_VERSION (a tag or commit in mlperf/logging) must be set in the environment.
git reset --hard "${COMPLIANCE_VERSION}"
git clean -f
find "${LOGDEST}" -name "20*_*.log" > "${COMPLIANCESCRIPTS}/file.list"
wc -l < file.list
while read -r l; do
    python3.6 -m mlperf_logging.compliance_checker "$l"
done < file.list