fix(nccl-tests): use cuda-nvcc-12-6 to support Ampere/Volta (sm_70..sm_90)

This commit is contained in:
2026-03-26 23:50:36 +03:00
parent 5407c26e25
commit 896bdb6ee8
3 changed files with 9 additions and 5 deletions

View File

@@ -34,9 +34,9 @@ if [ -f "${CACHE_DIR}/bin/all_reduce_perf" ]; then
exit 0
fi
# Resolve nvcc path (cuda-nvcc-13-0 installs to /usr/local/cuda-13.0/bin/nvcc)
# Resolve nvcc path (cuda-nvcc-12-6 installs to /usr/local/cuda-12.6/bin/nvcc)
NVCC=""
for candidate in nvcc /usr/local/cuda-13.0/bin/nvcc /usr/local/cuda/bin/nvcc; do
for candidate in nvcc /usr/local/cuda-12.6/bin/nvcc /usr/local/cuda-12/bin/nvcc /usr/local/cuda/bin/nvcc; do
if command -v "$candidate" >/dev/null 2>&1 || [ -x "$candidate" ]; then
NVCC="$candidate"
break
@@ -96,8 +96,11 @@ SRC_DIR=$(ls -d nccl-tests-* 2>/dev/null | head -1)
# Switch into the directory named by SRC_DIR; the make invocation that follows
# runs from there.
# NOTE(review): no failure check on this cd is visible in this hunk; confirm the
# script guards against an empty or missing SRC_DIR elsewhere (e.g. set -e).
cd "$SRC_DIR"
# Print a banner marking the start of the all_reduce_perf build step.
echo "=== building all_reduce_perf ==="
# CUDA 13.0 supports only Hopper (sm_90) and newer.
GENCODE="-gencode=arch=compute_90,code=sm_90"
# CUDA 12.6 can compile for Volta through Hopper, so emit one -gencode flag per
# target compute capability (sm_70, sm_80, sm_86, sm_90), joined by single spaces.
GENCODE=""
for sm_ver in 70 80 86 90; do
  # ${GENCODE:+...} adds the separating space only once GENCODE is non-empty.
  GENCODE="${GENCODE:+${GENCODE} }-gencode=arch=compute_${sm_ver},code=sm_${sm_ver}"
done
make MPI=0 \
NVCC="$NVCC" \
CUDA_HOME="$CUDA_HOME" \