From 7f9aa447cc17addeaefa09f2a67b7bb89e3fcfe1 Mon Sep 17 00:00:00 2001 From: mhuguesaws <71357145+mhuguesaws@users.noreply.github.com> Date: Thu, 21 Mar 2024 14:06:53 -0500 Subject: [PATCH] Change NCCL version to 2.20.3 NCCL 2.19.4 has a performance regression. Also bump the EFA installer from 1.30.0 to 1.31.0. --- .../0.nccl-tests/0.nccl-tests.Dockerfile | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/4.validation_and_observability/0.nccl-tests/0.nccl-tests.Dockerfile b/4.validation_and_observability/0.nccl-tests/0.nccl-tests.Dockerfile index f0b24830..0d8faf7f 100644 --- a/4.validation_and_observability/0.nccl-tests/0.nccl-tests.Dockerfile +++ b/4.validation_and_observability/0.nccl-tests/0.nccl-tests.Dockerfile @@ -2,10 +2,10 @@ # SPDX-License-Identifier: MIT-0 FROM nvidia/cuda:12.2.0-devel-ubuntu22.04 -ARG EFA_INSTALLER_VERSION=1.30.0 +ARG EFA_INSTALLER_VERSION=1.31.0 ARG AWS_OFI_NCCL_VERSION=v1.8.1-aws ARG NCCL_TESTS_VERSION=2.13.9 -ARG NCCL_VERSION=2.19.4 +ARG NCCL_VERSION=2.20.3 RUN apt-get update -y RUN apt-get remove -y --allow-change-held-packages \ @@ -102,4 +102,4 @@ RUN git clone -b v${NCCL_TESTS_VERSION} https://github.com/NVIDIA/nccl-tests.git NVCC_GENCODE="-gencode=arch=compute_80,code=sm_80 -gencode=arch=compute_86,code=sm_86 -gencode=arch=compute_90,code=sm_90" RUN rm -rf /var/lib/apt/lists/* -ENV LD_PRELOAD /opt/nccl/build/lib/libnccl.so \ No newline at end of file +ENV LD_PRELOAD /opt/nccl/build/lib/libnccl.so