|
28 | 28 | TZ=Europe/Prague \
|
29 | 29 | PATH="$PATH:/root/.local/bin" \
|
30 | 30 | CUDA_TOOLKIT_ROOT_DIR="/usr/local/cuda" \
|
31 |
| - TORCH_CUDA_ARCH_LIST="3.7;5.0;6.0;7.0;7.5;8.0" \ |
32 | 31 | MKL_THREADING_LAYER=GNU \
|
33 | 32 | # MAKEFLAGS="-j$(nproc)"
|
34 | 33 | MAKEFLAGS="-j2"
|
@@ -100,24 +99,6 @@ RUN \
|
100 | 99 | pip install -r requirements/pytorch/base.txt --no-cache-dir --find-links https://download.pytorch.org/whl/cu${CUDA_VERSION_MM}/torch_stable.html && \
|
101 | 100 | rm assistant.py
|
102 | 101 |
|
103 |
| -ENV \ |
104 |
| - HOROVOD_CUDA_HOME=$CUDA_TOOLKIT_ROOT_DIR \ |
105 |
| - HOROVOD_GPU_OPERATIONS=NCCL \ |
106 |
| - HOROVOD_WITH_PYTORCH=1 \ |
107 |
| - HOROVOD_WITHOUT_TENSORFLOW=1 \ |
108 |
| - HOROVOD_WITHOUT_MXNET=1 \ |
109 |
| - HOROVOD_WITH_GLOO=1 \ |
110 |
| - HOROVOD_WITH_MPI=1 |
111 |
| - |
112 |
| -RUN \ |
113 |
| - # CUDA 10.2 doesn't support ampere architecture (8.0). |
114 |
| - if [[ "$CUDA_VERSION" < "11.0" ]]; then export TORCH_CUDA_ARCH_LIST=${TORCH_CUDA_ARCH_LIST//";8.0"/}; echo $TORCH_CUDA_ARCH_LIST; fi && \ |
115 |
| - HOROVOD_BUILD_CUDA_CC_LIST=${TORCH_CUDA_ARCH_LIST//";"/","} && \ |
116 |
| - export HOROVOD_BUILD_CUDA_CC_LIST=${HOROVOD_BUILD_CUDA_CC_LIST//"."/""} && \ |
117 |
| - echo $HOROVOD_BUILD_CUDA_CC_LIST && \ |
118 |
| - cmake --version && \ |
119 |
| - pip install --no-cache-dir horovod && \ |
120 |
| - horovodrun --check-build |
121 | 102 |
|
122 | 103 | RUN \
|
123 | 104 | CUDA_VERSION_MAJOR=$(python -c "import torch; print(torch.version.cuda.split('.')[0])") && \
|
@@ -156,7 +137,6 @@ RUN \
|
156 | 137 | # install rest of strategies
|
157 | 138 | # remove colossalai from requirements since they are installed separately
|
158 | 139 | python -c "fname = 'requirements/pytorch/strategies.txt' ; lines = [line for line in open(fname).readlines() if 'colossalai' not in line] ; open(fname, 'w').writelines(lines)" ; \
|
159 |
| - python -c "fname = 'requirements/pytorch/strategies.txt' ; lines = [line for line in open(fname).readlines() if 'horovod' not in line] ; open(fname, 'w').writelines(lines)" ; \ |
160 | 140 | cat requirements/pytorch/strategies.txt && \
|
161 | 141 | pip install -r requirements/pytorch/devel.txt -r requirements/pytorch/strategies.txt --no-cache-dir --find-links https://download.pytorch.org/whl/cu${CUDA_VERSION_MM}/torch_stable.html
|
162 | 142 |
|
|
0 commit comments