Skip to content

Commit 3627db3

Browse files
authored
Move ppc64le CI to TF 2.6.0 and PyTorch 1.9.1 (horovod#3208)
Signed-off-by: Nicolas Castet <[email protected]>
1 parent df18797 commit 3627db3

File tree

1 file changed

+7
-8
lines changed

1 file changed

+7
-8
lines changed

Jenkinsfile.ppc64le

+7-8
Original file line number | Diff line number | Diff line change
@@ -6,8 +6,8 @@ pipeline {
66
agent {
77
docker {
88
alwaysPull true
9-
// WMLCE 1.7.0 has CUDA 10.2, NCCL 2.5.6, TensorFlow 2.1.0, and PyTorch 1.8.0
10-
image 'tensorflowppc64le/tensorflow-ppc64le:osuosl-ubuntu-horovod-wlmce1.7.0-py3.7-ppc64le'
9+
// Open-CE 1.4.1 has CUDA 10.2, NCCL 2.8.3, TensorFlow 2.6.0, and PyTorch 1.9.1
10+
image 'tensorflowppc64le/tensorflow-ppc64le:osuosl-ubi7-horovod-opence1.4.1-py3.9-ppc64le'
1111
args '--cap-add=SYS_PTRACE --shm-size=256g'
1212
label 'power8-gpu'
1313
registryCredentialsId 'TensorFlow'
@@ -25,10 +25,9 @@ pipeline {
2525
git submodule update --init --recursive
2626
. ${CONDA_INIT}
2727
conda activate ${CONDA_ENV}
28-
conda install -y cmake make
2928
set -xe
30-
HOROVOD_WITHOUT_MXNET=1 HOROVOD_WITHOUT_GLOO=1 HOROVOD_WITHOUT_PYTORCH=1 HOROVOD_WITH_TENSORFLOW=1 \
31-
HOROVOD_CUDA_HOME=$CONDA_PREFIX HOROVOD_GPU_OPERATIONS=NCCL MAKEFLAGS="-j1" \
29+
HOROVOD_WITHOUT_MXNET=1 HOROVOD_WITHOUT_GLOO=1 HOROVOD_WITH_PYTORCH=1 HOROVOD_WITH_TENSORFLOW=1 \
30+
HOROVOD_CUDA_HOME="/usr/local/cuda" HOROVOD_GPU_OPERATIONS=NCCL \
3231
pip install -v . --no-cache-dir --no-deps
3332
'''
3433
}
@@ -42,12 +41,12 @@ pipeline {
4241
set -xe
4342

4443
# TensorFlow unit tests
45-
horovodrun -n 2 -H localhost:2 --mpi-args="-pami_noib" pytest -k 'not multi_gpu' -v -s test/parallel/test_tensorflow.py
44+
horovodrun -n 2 -H localhost:2 pytest -k 'not multi_gpu' -v -s test/parallel/test_tensorflow.py
4645
# Container has only 2 GPUs, so run the 'multi_gpu' test separately on one process
47-
horovodrun -n 1 -H localhost:1 --mpi-args="-pami_noib" pytest -k 'multi_gpu' -v -s test/parallel/test_tensorflow.py
46+
horovodrun -n 1 -H localhost:1 pytest -k 'multi_gpu' -v -s test/parallel/test_tensorflow.py
4847

4948
# PyTorch unit tests
50-
# horovodrun -n 2 -H localhost:2 --mpi-args="-pami_noib" pytest -v -s test/parallel/test_torch.py
49+
horovodrun -n 2 -H localhost:2 pytest -v -s test/parallel/test_torch.py
5150
'''
5251
}
5352
}

0 commit comments

Comments
 (0)