|
1 | 1 | name: H100 |
2 | 2 |
|
3 | | - |
4 | 3 | permissions: |
5 | 4 | contents: none |
6 | 5 |
|
7 | 6 | on: |
8 | 7 | workflow_call: |
9 | 8 |
|
10 | 9 | jobs: |
11 | | - PR_CUDA1250_OPENMPI504: |
12 | | - name: PR_CUDA1250_OPENMPI504 |
13 | | - runs-on: [cuda125-openmpi504-latest-latest] |
| 10 | + PR_CUDA1262_OPENMPI505: |
| 11 | + name: PR_CUDA1262_OPENMPI505 |
14 | 12 |
|
| 13 | + # The runner label below is the correct one to use, but its name is misleading: |
| 14 | + # the underlying AT2 runner actually provides CUDA 12.6.2 and OpenMPI 5.0.5. |
| 15 | + runs-on: [cuda125-openmpi504-latest-latest] |
15 | 16 | steps: |
16 | | - - name: Checkout Kokkos Comm |
| 17 | + - name: Check NVIDIA GPU |
| 18 | + run: nvidia-smi |
| 19 | + |
| 20 | + - name: Kokkos - Checkout |
| 21 | + uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2 |
| 22 | + with: |
| 23 | + repository: kokkos/kokkos |
| 24 | + ref: 4.7.01 |
| 25 | + path: kokkos |
| 26 | + - name: Kokkos - Configure |
| 27 | + run: > |
| 28 | + cmake |
| 29 | + -S kokkos |
| 30 | + -B kokkos/build |
| 31 | + -DCMAKE_CXX_COMPILER=$(realpath kokkos/bin/nvcc_wrapper) |
| 32 | + -DCMAKE_CXX_STANDARD=20 |
| 33 | + -DCMAKE_CXX_EXTENSIONS=OFF |
| 34 | + -DCMAKE_INSTALL_PREFIX=kokkos/install |
| 35 | + -DKokkos_ENABLE_CUDA=ON |
| 36 | + -DKokkos_ARCH_HOPPER90=ON |
| 37 | + -DKokkos_ENABLE_TESTS=OFF |
| 38 | + -DKokkos_ENABLE_EXAMPLES=OFF |
| 39 | + -DKokkos_ENABLE_DEPRECATION_WARNINGS=OFF |
| 40 | + -DKokkos_ENABLE_DEPRECATED_CODE_4=OFF |
| 41 | + -DKokkos_ENABLE_DEPRECATION_WARNINGS=OFF |
| 42 | + - name: Kokkos - Build |
| 43 | + run: cmake --build kokkos/build --parallel $(nproc) |
| 44 | + - name: Kokkos - Install |
| 45 | + run: cmake --build kokkos/build --target install --parallel $(nproc) |
| 46 | + - name: KokkosComm - Checkout |
17 | 47 | uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2 |
18 | 48 | with: |
19 | 49 | path: kokkos-comm |
| 50 | + - name: KokkosComm - Configure MPI backend |
| 51 | + run: > |
| 52 | + cmake |
| 53 | + -S kokkos-comm |
| 54 | + -B build-mpi |
| 55 | + -DCMAKE_CXX_COMPILER=$(realpath kokkos/bin/nvcc_wrapper) |
| 56 | + -DCMAKE_CXX_STANDARD=20 |
| 57 | + -DCMAKE_CXX_EXTENSIONS=OFF |
| 58 | + -DCMAKE_CXX_FLAGS="-Werror" |
| 59 | + -DKokkos_ROOT=kokkos/install |
| 60 | + -DKokkosComm_ENABLE_MPI=ON |
| 61 | + -DKokkosComm_ENABLE_TESTS=ON |
| 62 | + -DKokkosComm_ENABLE_PERFTESTS=ON |
| 63 | + - name: KokkosComm - Build MPI backend |
| 64 | + run: cmake --build build-mpi --parallel $(nproc) |
| 65 | + - name: KokkosComm - Test MPI backend |
| 66 | + working-directory: build-mpi |
| 67 | + run: ctest --output-on-failure -V --timeout 1200 |
20 | 68 |
|
21 | | - - name: Checkout Kokkos |
| 69 | + PR_CUDA1262_NCCL2275: |
| 70 | + name: PR_CUDA1262_NCCL2275 |
| 71 | + |
| 72 | + # The runner label below is the correct one to use, but its name is misleading: |
| 73 | + # the underlying AT2 runner actually provides CUDA 12.6.2 and OpenMPI 5.0.5. |
| 74 | + runs-on: [cuda125-openmpi504-latest-latest] |
| 75 | + steps: |
| 76 | + - name: Check NVIDIA GPU |
| 77 | + run: nvidia-smi |
| 78 | + |
| 79 | + - name: Kokkos - Checkout |
22 | 80 | uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2 |
23 | 81 | with: |
24 | 82 | repository: kokkos/kokkos |
25 | | - ref: 4.5.01 |
| 83 | + ref: 4.7.01 |
26 | 84 | path: kokkos |
27 | 85 |
|
28 | | - - name: nvidia-smi |
29 | | - run: nvidia-smi |
| 86 | + - name: Kokkos - Configure |
| 87 | + run: > |
| 88 | + cmake |
| 89 | + -S kokkos |
| 90 | + -B kokkos/build |
| 91 | + -DCMAKE_CXX_COMPILER=$(realpath kokkos/bin/nvcc_wrapper) |
| 92 | + -DCMAKE_CXX_STANDARD=20 |
| 93 | + -DCMAKE_CXX_EXTENSIONS=OFF |
| 94 | + -DCMAKE_INSTALL_PREFIX=kokkos/install |
| 95 | + -DKokkos_ENABLE_CUDA=ON |
| 96 | + -DKokkos_ARCH_HOPPER90=ON |
| 97 | + -DKokkos_ENABLE_TESTS=OFF |
| 98 | + -DKokkos_ENABLE_EXAMPLES=OFF |
| 99 | + -DKokkos_ENABLE_DEPRECATION_WARNINGS=OFF |
| 100 | + -DKokkos_ENABLE_DEPRECATED_CODE_4=OFF |
| 101 | + -DKokkos_ENABLE_DEPRECATION_WARNINGS=OFF |
| 102 | + - name: Kokkos - Build |
| 103 | + run: cmake --build kokkos/build --parallel $(nproc) |
30 | 104 |
|
31 | | - - name: Configure Kokkos |
32 | | - run: | |
33 | | - cmake -S kokkos -B kokkos/build \ |
34 | | - -DCMAKE_CXX_COMPILER=$(realpath kokkos/bin/nvcc_wrapper) \ |
35 | | - -DCMAKE_CXX_STANDARD=20 \ |
36 | | - -DCMAKE_CXX_EXTENSIONS=OFF \ |
37 | | - -DCMAKE_INSTALL_PREFIX=kokkos/install \ |
38 | | - -DKokkos_ENABLE_CUDA=ON \ |
39 | | - -DKokkos_ARCH_HOPPER90=ON \ |
40 | | - -DKokkos_ENABLE_TESTS=OFF \ |
41 | | - -DKokkos_ENABLE_EXAMPLES=OFF \ |
42 | | - -DKokkos_ENABLE_DEPRECATION_WARNINGS=OFF \ |
43 | | - -DKokkos_ENABLE_DEPRECATED_CODE_4=OFF \ |
44 | | - -DKokkos_ENABLE_DEPRECATION_WARNINGS=OFF |
45 | | -
|
46 | | - - name: Build Kokkos |
| 105 | + - name: Kokkos - Install |
47 | 106 | run: cmake --build kokkos/build --target install --parallel $(nproc) |
48 | 107 |
|
49 | | - - name: Configure Kokkos Comm |
50 | | - run: | |
51 | | - cmake -S kokkos-comm -B build \ |
52 | | - -DCMAKE_CXX_COMPILER=$(realpath kokkos/bin/nvcc_wrapper) \ |
53 | | - -DCMAKE_CXX_STANDARD=20 \ |
54 | | - -DCMAKE_CXX_EXTENSIONS=OFF \ |
55 | | - -DCMAKE_CXX_FLAGS="-Werror" \ |
56 | | - -DKokkos_ROOT=kokkos/install \ |
57 | | - -DKokkosComm_ENABLE_TESTS=ON \ |
58 | | - -DKokkosComm_ENABLE_PERFTESTS=ON |
| 108 | + - name: KokkosComm - Checkout |
| 109 | + uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2 |
| 110 | + with: |
| 111 | + path: kokkos-comm |
| 112 | + |
| 113 | + - name: KokkosComm - Configure NCCL backend |
| 114 | + # FIXME_NCCL: no performance tests on NCCL |
| 115 | + run: > |
| 116 | + cmake |
| 117 | + -S kokkos-comm |
| 118 | + -B build-nccl |
| 119 | + -DCMAKE_CXX_COMPILER=$(realpath kokkos/bin/nvcc_wrapper) |
| 120 | + -DCMAKE_CXX_STANDARD=20 |
| 121 | + -DCMAKE_CXX_EXTENSIONS=OFF |
| 122 | + -DKokkos_ROOT=kokkos/install |
| 123 | + -DKokkosComm_ENABLE_MPI=OFF |
| 124 | + -DKokkosComm_ENABLE_NCCL=ON |
| 125 | + -DKokkosComm_ENABLE_TESTS=ON |
| 126 | + -DKokkosComm_ENABLE_PERFTESTS=OFF |
59 | 127 |
|
60 | | - - name: Build Kokkos Comm |
61 | | - run: cmake --build build --parallel $(nproc) |
| 128 | + - name: KokkosComm - Build NCCL backend |
| 129 | + run: cmake --build build-nccl --parallel $(nproc) |
62 | 130 |
|
63 | | - - name: Test Kokkos Comm |
64 | | - working-directory: build |
| 131 | + - name: KokkosComm - Test NCCL backend |
| 132 | + working-directory: build-nccl |
65 | 133 | run: ctest --output-on-failure -V --timeout 1200 |
0 commit comments