Skip to content

Commit cc7270b

Browse files
committed
add spack job
Side notes:
- Add CUDA 12.2; bfloat16 is not compiled with CUDA versions below 12.2.
- CUDA 11.8.0 is the first release to support compute capabilities 8.9 and 9.0.
- The current Docker image does not support the A770; set up a separate environment without Docker for the A770.
- The TUM environment does not provide HWLOC yet.
1 parent 13eb133 commit cc7270b

3 files changed

Lines changed: 322 additions & 12 deletions

File tree

.gitlab-ci.yml

Lines changed: 183 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -110,7 +110,6 @@ build/cuda110/nompi/gcc/cuda/release/shared:
110110
# this is seemingly broken with CUDA 11
111111
# EXTRA_CMAKE_FLAGS: "-DCMAKE_CUDA_FLAGS=-diag-suppress=177"
112112

113-
114113
# nvhpc and friends
115114
build/nvhpc233/cuda120/nompi/nvcpp/release/static:
116115
extends:
@@ -149,6 +148,63 @@ build/nvhpc227/cuda117/nompi/nvcpp/debug/shared:
149148
# disable spurious unused argument warning
150149
EXTRA_CMAKE_FLAGS: "-DCMAKE_CUDA_FLAGS=-diag-suppress=177"
151150

151+
build/cuda118/nompi/gcc/cuda/debug/shared:
152+
extends:
153+
- .build_and_test_tum_template
154+
- .default_variables
155+
- .quick_test_condition
156+
- .use_tum-nvidia
157+
variables:
158+
BUILD_CUDA: "ON"
159+
BUILD_HWLOC: "OFF"
160+
ENABLE_HALF: "ON"
161+
BUILD_TYPE: "Debug"
162+
MODULE_LOAD: "cmake/3.18.6 cuda/11.8.0 gcc/7.5.0"
163+
164+
build/cuda120/openmpi/gcc/cuda/release/static:
165+
extends:
166+
- .build_and_test_tum_template
167+
- .default_variables
168+
- .quick_test_condition
169+
- .use_tum-nvidia
170+
variables:
171+
BUILD_CUDA: "ON"
172+
BUILD_HWLOC: "OFF"
173+
ENABLE_HALF: "ON"
174+
BUILD_MPI: "ON"
175+
BUILD_SHARED_LIBS: "OFF"
176+
BUILD_TYPE: "Release"
177+
MODULE_LOAD: "cmake/3.18.6 cuda/12.0.1 gcc/12.4.0 openmpi/4.1.6"
178+
179+
build/cuda122/openmpi/gcc/cuda/release/static:
180+
extends:
181+
- .build_and_test_tum_template
182+
- .default_variables
183+
- .quick_test_condition
184+
- .use_tum-nvidia
185+
variables:
186+
BUILD_CUDA: "ON"
187+
BUILD_HWLOC: "OFF"
188+
ENABLE_HALF: "ON"
189+
ENABLE_BFLOAT16: "ON"
190+
BUILD_SHARED_LIBS: "OFF"
191+
BUILD_TYPE: "Release"
192+
MODULE_LOAD: "cmake/3.20.6 cuda/12.2.2 gcc/12.4.0 openmpi/4.1.6"
193+
194+
build/cuda126/nompi/gcc/cuda/release/shared:
195+
extends:
196+
- .build_and_test_tum_template
197+
- .default_variables
198+
- .quick_test_condition
199+
- .use_tum-nvidia
200+
variables:
201+
BUILD_CUDA: "ON"
202+
BUILD_HWLOC: "OFF"
203+
ENABLE_HALF: "ON"
204+
ENABLE_BFLOAT16: "ON"
205+
BUILD_TYPE: "Release"
206+
MODULE_LOAD: "cmake/3.30.5 cuda/12.6.2 gcc/13.3.0"
207+
152208
# ROCm 4.5 and friends
153209
build/amd/nompi/gcc/rocm45/release/shared:
154210
extends:
@@ -230,6 +286,48 @@ build/amd/nompi/gcc/rocm514_wo_omp/release/shared:
230286
BUILD_HIP: "ON"
231287
BUILD_TYPE: "Release"
232288

289+
build/amd/openmpi/gcc/rocm600/release/static:
290+
extends:
291+
- .build_and_test_tum_template
292+
- .default_variables
293+
- .quick_test_condition
294+
- .use_tum-amd
295+
variables:
296+
BUILD_HIP: "ON"
297+
BUILD_HWLOC: "OFF"
298+
BUILD_MPI: "ON"
299+
BUILD_TYPE: "Release"
300+
BUILD_SHARED_LIBS: "OFF"
301+
MODULE_LOAD: "cmake/3.24.4 rocm/6.0.0 gcc/13.3.0 openmpi/5.0.5"
302+
303+
build/amd/nompi/gcc/rocm573/debug/shared:
304+
extends:
305+
- .build_and_test_tum_template
306+
- .default_variables
307+
- .quick_test_condition
308+
- .use_tum-amd
309+
variables:
310+
BUILD_HIP: "ON"
311+
BUILD_OMP: "OFF"
312+
BUILD_HWLOC: "OFF"
313+
BUILD_TYPE: "Debug"
314+
ENABLE_BFLOAT16: "ON"
315+
ENABLE_HALF: "OFF"
316+
MODULE_LOAD: "cmake/3.25.3 rocm/5.7.3 gcc/12.4.0"
317+
318+
build/amd/openmpi/gcc/rocm634_wo_omp/release/shared:
319+
extends:
320+
- .build_and_test_tum_template
321+
- .default_variables
322+
- .quick_test_condition
323+
- .use_tum-amd
324+
variables:
325+
BUILD_HIP: "ON"
326+
BUILD_HWLOC: "OFF"
327+
BUILD_MPI: "ON"
328+
BUILD_TYPE: "Release"
329+
MODULE_LOAD: "cmake/3.29.6 rocm/6.3.4 gcc/13.3.0 openmpi/5.0.5"
330+
233331
# no cuda but latest gcc and clang
234332
build/nocuda/nompi/gcc/core/debug/static:
235333
extends:
@@ -350,13 +448,42 @@ build/nocuda-nomixed/nompi/clang/omp/debug/static:
350448
BUILD_SHARED_LIBS: "OFF"
351449
MIXED_PRECISION: "OFF"
352450

451+
build/nogpu/nompi/gcc/omp/debug/static:
452+
extends:
453+
- .build_and_test_tum_template
454+
- .default_variables
455+
- .quick_test_condition
456+
- .use_tum-cpu
457+
variables:
458+
BUILD_OMP: "ON"
459+
BUILD_TYPE: "Debug"
460+
BUILD_SHARED_LIBS: "OFF"
461+
MIXED_PRECISION: "OFF"
462+
BUILD_HWLOC: "OFF"
463+
MODULE_LOAD: "cmake/3.16.9 gcc/7.5.0"
464+
465+
build/nogpu/nompi/gcc/omp/release/static:
466+
extends:
467+
- .build_and_test_tum_template
468+
- .default_variables
469+
- .quick_test_condition
470+
- .use_tum-cpu
471+
variables:
472+
BUILD_OMP: "ON"
473+
BUILD_TYPE: "Release"
474+
BUILD_SHARED_LIBS: "OFF"
475+
ENABLE_HALF: "ON"
476+
ENABLE_BFLOAT16: "ON"
477+
BUILD_HWLOC: "OFF"
478+
MODULE_LOAD: "cmake/3.16.9 gcc/9.5.0"
479+
353480
# spack oneapi 2023.1
354481
build/icpx20231/gpu/release/shared:
355482
extends:
356483
- .build_and_test_template
357484
- .default_variables
358485
- .quick_test_condition
359-
- .use_gko-oneapi20231-igpu
486+
- .use_gko-oneapi20231-gpu
360487
variables:
361488
CXX_COMPILER: "icpx"
362489
CXX_FLAGS: "-Wpedantic -ffp-model=precise"
@@ -367,13 +494,65 @@ build/icpx20231/gpu/release/shared:
367494
ONEAPI_DEVICE_SELECTOR: "opencl:gpu"
368495
BUILD_HWLOC: "OFF"
369496

497+
build/dpcpp20231/gpu/release/shared:
498+
extends:
499+
- .build_and_test_tum_template
500+
- .default_variables
501+
- .quick_test_condition
502+
- .use_tum-intel-fp32
503+
variables:
504+
CXX_COMPILER: "dpcpp"
505+
CXX_FLAGS: "-Wpedantic -ffp-model=precise"
506+
BUILD_SYCL: "ON"
507+
BUILD_TYPE: "Release"
508+
BUILD_SHARED_LIBS: "ON"
509+
DPCPP_SINGLE_MODE: "ON"
510+
MODULE_LOAD: "cmake/3.21.7 intel-oneapi-compilers/2023.1.0 intel-oneapi-dpl/2022.1.0 intel-oneapi-tbb/2021.9.0 intel-oneapi-mkl/2023.1.0"
511+
ONEAPI_DEVICE_SELECTOR: "opencl:gpu"
512+
BUILD_HWLOC: "OFF"
513+
514+
build/icpx202402/gpu/release/shared:
515+
extends:
516+
- .build_and_test_tum_template
517+
- .default_variables
518+
- .quick_test_condition
519+
- .use_tum-intel
520+
variables:
521+
CXX_COMPILER: "icpx"
522+
CXX_FLAGS: "-Wpedantic -ffp-model=precise -Wno-deprecated-declarations"
523+
BUILD_SYCL: "ON"
524+
BUILD_HWLOC: "OFF"
525+
BUILD_TYPE: "Release"
526+
ENABLE_HALF: "OFF"
527+
ENABLE_BFLOAT16: "OFF"
528+
ONEAPI_DEVICE_SELECTOR: "opencl:gpu"
529+
MODULE_LOAD: "cmake/3.21.7 intel-oneapi-compilers/2024.0.2 intel-oneapi-dpl/2022.3.0 intel-oneapi-tbb/2021.11.0 intel-oneapi-mkl/2024.0.0"
530+
531+
build/icpx202421/gpu/release/shared:
532+
extends:
533+
- .build_and_test_tum_template
534+
- .default_variables
535+
- .quick_test_condition
536+
- .use_tum-intel
537+
variables:
538+
CXX_COMPILER: "icpx"
539+
CXX_FLAGS: "-Wpedantic -ffp-model=precise -Wno-deprecated-declarations"
540+
BUILD_SYCL: "ON"
541+
BUILD_OMP: "ON"
542+
BUILD_HWLOC: "OFF"
543+
BUILD_TYPE: "Release"
544+
ENABLE_HALF: "ON"
545+
ENABLE_BFLOAT16: "ON"
546+
ONEAPI_DEVICE_SELECTOR: "level_zero:gpu"
547+
MODULE_LOAD: "cmake/3.28.6 intel-oneapi-compilers/2024.2.1 intel-oneapi-dpl/2022.6.1 intel-oneapi-tbb/2021.13.1 intel-oneapi-mkl/2024.2.1"
548+
370549
# TODO: Enable when debug shared library size issues are fixed
371550
# build/dpcpp/level_zero_igpu/debug/shared:
372551
# extends:
373552
# - .build_and_test_template
374553
# - .default_variables
375554
# - .full_test_condition
376-
# - .use_gko-oneapi-igpu
555+
# - .use_gko-oneapi-gpu
377556
# variables:
378557
# CXX_COMPILER: "dpcpp"
379558
# CXX_FLAGS: "-Wpedantic -ffp-model=precise"
@@ -389,7 +568,7 @@ build/dpcpp/gpu/release/shared:
389568
- .build_and_test_template
390569
- .default_variables
391570
- .full_test_condition
392-
- .use_gko-oneapi-igpu
571+
- .use_gko-oneapi-gpu
393572
variables:
394573
CXX_COMPILER: "dpcpp"
395574
CXX_FLAGS: "-Wpedantic -ffp-model=precise"

.gitlab/image.yml

Lines changed: 40 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -18,26 +18,26 @@
1818
.use_gko_cuda110-mvapich-gnu9-llvm9:
1919
image: ginkgohub/cuda:110-mvapich2-gnu9-llvm9-intel2020
2020
tags:
21-
- tum
2221
- nvidia-gpus-p100
22+
- tum
2323

2424
.use_gko_cuda114-openmpi-gnu10-llvm12:
2525
image: ginkgohub/cuda:114-openmpi-gnu10-llvm12
2626
tags:
27-
- tum
2827
- nvidia-gpus-p100
28+
- tum
2929

3030
.use_gko_nvhpc233-cuda120-openmpi-gnu12-llvm16:
3131
image: ginkgohub/nvhpc:233-cuda120-openmpi-gnu12-llvm16
3232
tags:
33-
- tum
3433
- nvidia-gpus
34+
- tum
3535

3636
.use_gko_nvhpc227-cuda117-openmpi-gnu11-llvm14:
3737
image: ginkgohub/nvhpc:227-cuda117-openmpi-gnu11-llvm14
3838
tags:
39-
- tum
4039
- nvidia-gpus-p100
40+
- tum
4141

4242
.use_gko-rocm45-nompi-gnu8-llvm8:
4343
image: ginkgohub/rocm:45-mvapich2-gnu8-llvm8
@@ -51,17 +51,49 @@
5151
- private_ci
5252
- amd-gpu
5353

54-
.use_gko-oneapi-igpu:
54+
# This image is based on Ubuntu focal, which does not seem to support the A770.
55+
.use_gko-oneapi-gpu:
5556
image: ginkgohub/oneapi:latest
5657
tags:
5758
- intel-gpus
59+
- tum
5860

59-
.use_gko-oneapi20231-igpu:
61+
# This image is based on Ubuntu focal, which does not seem to support the A770.
62+
.use_gko-oneapi20231-gpu:
6063
image: ginkgohub/spack-oneapi:20231-openmpi
6164
tags:
6265
- intel-gpus
66+
- tum
6367

64-
.use_gko-oneapi-dgpu:
65-
image: ginkgohub/oneapi:latest
68+
69+
# contains "s" so it uses tum now
70+
.use_tum-nvidia:
71+
image: rocky_tum
72+
tags:
73+
- nvidia-gpus
74+
- tum
75+
76+
.use_tum-amd:
77+
image: rocky_tum
78+
tags:
79+
- amd-gpus
80+
- tum
81+
82+
.use_tum-intel:
83+
image: rocky_tum_intel
6684
tags:
6785
- intel-gpus
86+
- tum
87+
88+
# This selects a GPU without native fp64 support.
89+
.use_tum-intel-fp32:
90+
image: rocky_tum_intel
91+
tags:
92+
- intel-fp32-gpus
93+
- tum
94+
95+
.use_tum-cpu:
96+
image: rocky_tum
97+
tags:
98+
- cpu
99+
- tum

0 commit comments

Comments
 (0)