diff --git a/iso/builder/Dockerfile b/iso/builder/Dockerfile index 4a225ba..e485ad4 100644 --- a/iso/builder/Dockerfile +++ b/iso/builder/Dockerfile @@ -36,7 +36,7 @@ RUN wget -qO /tmp/cuda-keyring.gpg \ https://developer.download.nvidia.com/compute/cuda/repos/debian12/x86_64/ /" \ > /etc/apt/sources.list.d/cuda.list \ && apt-get update -qq \ - && apt-get install -y cuda-nvcc-13-0 \ + && apt-get install -y cuda-nvcc-12-6 \ && rm -rf /var/lib/apt/lists/* RUN arch="$(dpkg --print-architecture)" \ diff --git a/iso/builder/VERSIONS b/iso/builder/VERSIONS index cfe40ee..a1e5b50 100644 --- a/iso/builder/VERSIONS +++ b/iso/builder/VERSIONS @@ -5,6 +5,7 @@ NCCL_VERSION=2.28.9-1 NCCL_CUDA_VERSION=13.0 NCCL_SHA256=2e6faafd2c19cffc7738d9283976a3200ea9db9895907f337f0c7e5a25563186 NCCL_TESTS_VERSION=2.13.10 +NVCC_VERSION=12.6 CUBLAS_VERSION=13.0.2.14-1 CUDA_USERSPACE_VERSION=13.0.96-1 GO_VERSION=1.24.0 diff --git a/iso/builder/build-nccl-tests.sh b/iso/builder/build-nccl-tests.sh index 2e26060..7ffe3f3 100755 --- a/iso/builder/build-nccl-tests.sh +++ b/iso/builder/build-nccl-tests.sh @@ -34,9 +34,9 @@ if [ -f "${CACHE_DIR}/bin/all_reduce_perf" ]; then exit 0 fi -# Resolve nvcc path (cuda-nvcc-13-0 installs to /usr/local/cuda-13.0/bin/nvcc) +# Resolve nvcc path (cuda-nvcc-12-6 installs to /usr/local/cuda-12.6/bin/nvcc) NVCC="" -for candidate in nvcc /usr/local/cuda-13.0/bin/nvcc /usr/local/cuda/bin/nvcc; do +for candidate in nvcc /usr/local/cuda-12.6/bin/nvcc /usr/local/cuda-12/bin/nvcc /usr/local/cuda/bin/nvcc; do if command -v "$candidate" >/dev/null 2>&1 || [ -x "$candidate" ]; then NVCC="$candidate" break @@ -96,8 +96,11 @@ SRC_DIR=$(ls -d nccl-tests-* 2>/dev/null | head -1) cd "$SRC_DIR" echo "=== building all_reduce_perf ===" -# CUDA 13.0 supports only Hopper (sm_90) and newer. -GENCODE="-gencode=arch=compute_90,code=sm_90" +# CUDA 12.6 nvcc can still target pre-Hopper GPUs; build for Volta through Hopper (sm_70, sm_80, sm_86, sm_90). 
+GENCODE="-gencode=arch=compute_70,code=sm_70 \ + -gencode=arch=compute_80,code=sm_80 \ + -gencode=arch=compute_86,code=sm_86 \ + -gencode=arch=compute_90,code=sm_90" make MPI=0 \ NVCC="$NVCC" \ CUDA_HOME="$CUDA_HOME" \