Skip to content

Commit d1f6551

Browse files
authored
Switch nvidia nightly testing to use CUDA 12.8 (#27822)
Switches nightly testing to use CUDA 12.8 [Reviewed by @e-kayrakli]
2 parents 4436c9f + b24eef3 commit d1f6551

8 files changed

+13
-18
lines changed
Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,6 @@
1+
# common settings for running GPU nightly testing on the HPE Cray EX system with CUDA 12
2+
3+
# We need 12.8 for the stream test because the CUDA driver on pinoak
4+
# only supports PTX for 12.8. Until the driver is updated, we need to
5+
# stick with 12.8 instead of 12.9.
6+
module load cuda/12.8 # default is CUDA 12.9

util/cron/test-gpu-ex-cuda-12.bash

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -6,8 +6,7 @@ UTIL_CRON_DIR=$(cd $(dirname ${BASH_SOURCE[0]}) ; pwd)
66
source $UTIL_CRON_DIR/common-native-gpu.bash
77
source $UTIL_CRON_DIR/common-hpe-cray-ex.bash
88
source $UTIL_CRON_DIR/common-gpu-nvidia-hpe-cray-ex.bash
9-
10-
module load cuda/12.4
9+
source $UTIL_CRON_DIR/common-gpu-nvidia-hpe-cray-ex-cuda-12.bash
1110

1211
export CHPL_COMM=none
1312
export CHPL_GPU=nvidia # amd is also detected automatically

util/cron/test-gpu-ex-cuda-12.colocales.bash

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -7,12 +7,11 @@ source $UTIL_CRON_DIR/common-native-gpu.bash
77
source $UTIL_CRON_DIR/common-hpe-cray-ex.bash
88
source $UTIL_CRON_DIR/common-ofi.bash
99
source $UTIL_CRON_DIR/common-gpu-nvidia-hpe-cray-ex.bash
10+
source $UTIL_CRON_DIR/common-gpu-nvidia-hpe-cray-ex-cuda-12.bash
1011

1112
export SLURM_NETWORK=single_node_vni
1213
export CHPL_RT_LOCALES_PER_NODE=2
13-
module load cuda/12.4
1414

15-
export CHPL_GPU=nvidia
1615
export CHPL_NIGHTLY_TEST_DIRS="gpu/native/multiLocale"
1716

1817
export CHPL_NIGHTLY_TEST_CONFIG_NAME="gpu-ex-cuda-12.colocales"

util/cron/test-gpu-ex-cuda-12.interop.bash

Lines changed: 1 addition & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -6,12 +6,7 @@ UTIL_CRON_DIR=$(cd $(dirname ${BASH_SOURCE[0]}) ; pwd)
66
source $UTIL_CRON_DIR/common.bash
77
source $UTIL_CRON_DIR/common-hpe-cray-ex.bash
88
source $UTIL_CRON_DIR/common-gpu-nvidia-hpe-cray-ex.bash
9-
10-
11-
# We need 12.4 for the stream test because the CUDA driver on pinoak
12-
# only supports PTX for 12.4, until the driver is updated, we need to
13-
# stick with 12.4 instead of 12.5
14-
module load cuda/12.4 # default is CUDA 12.5
9+
source $UTIL_CRON_DIR/common-gpu-nvidia-hpe-cray-ex-cuda-12.bash
1510

1611
# We need cublas for the cublas interop test, but since we are using 12.4 above
1712
# pinoak doesn't have the cublas library for 12.4, so we need to use the cublas

util/cron/test-gpu-ex-cuda-12.ofi.bash

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -6,8 +6,7 @@ UTIL_CRON_DIR=$(cd $(dirname ${BASH_SOURCE[0]}) ; pwd)
66
source $UTIL_CRON_DIR/common-native-gpu.bash
77
source $UTIL_CRON_DIR/common-hpe-cray-ex.bash
88
source $UTIL_CRON_DIR/common-gpu-nvidia-hpe-cray-ex.bash
9-
10-
module load cuda/12.4
9+
source $UTIL_CRON_DIR/common-gpu-nvidia-hpe-cray-ex-cuda-12.bash
1110

1211
export CHPL_COMM=ofi
1312
export CHPL_GPU=nvidia # amd is also detected automatically

util/cron/test-gpu-ex-cuda-12.specialization.bash

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -7,8 +7,7 @@ source $UTIL_CRON_DIR/common-native-gpu.bash
77
source $UTIL_CRON_DIR/common-hpe-cray-ex.bash
88
source $UTIL_CRON_DIR/common-gpu-hpe-cray-ex.bash
99
source $UTIL_CRON_DIR/common-gpu-nvidia-hpe-cray-ex.bash
10-
11-
module load cuda/12.4
10+
source $UTIL_CRON_DIR/common-gpu-nvidia-hpe-cray-ex-cuda-12.bash
1211

1312
export CHPL_COMM=none
1413
export CHPL_GPU=nvidia # amd is also detected automatically

util/cron/test-perf.gpu-ex-cuda-12.bash

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -6,8 +6,7 @@ UTIL_CRON_DIR=$(cd $(dirname ${BASH_SOURCE[0]}) ; pwd)
66
source $UTIL_CRON_DIR/common-native-gpu.bash
77
source $UTIL_CRON_DIR/common-hpe-cray-ex.bash
88
source $UTIL_CRON_DIR/common-gpu-nvidia-hpe-cray-ex.bash
9-
10-
module load cuda/12.4
9+
source $UTIL_CRON_DIR/common-gpu-nvidia-hpe-cray-ex-cuda-12.bash
1110

1211
export CHPL_COMM=none
1312
export CHPL_GPU=nvidia # amd is detected automatically

util/cron/test-perf.gpu-ex-cuda-12.um.bash

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -6,8 +6,7 @@ UTIL_CRON_DIR=$(cd $(dirname ${BASH_SOURCE[0]}) ; pwd)
66
source $UTIL_CRON_DIR/common-native-gpu.bash
77
source $UTIL_CRON_DIR/common-hpe-cray-ex.bash
88
source $UTIL_CRON_DIR/common-gpu-nvidia-hpe-cray-ex.bash
9-
10-
module load cuda/12.4
9+
source $UTIL_CRON_DIR/common-gpu-nvidia-hpe-cray-ex-cuda-12.bash
1110

1211
export CHPL_COMM=none
1312
export CHPL_GPU=nvidia # amd is detected automatically

0 commit comments

Comments
 (0)