@@ -110,7 +110,6 @@ build/cuda110/nompi/gcc/cuda/release/shared:
110110 # this is seemingly broken with CUDA 11
111111 # EXTRA_CMAKE_FLAGS: "-DCMAKE_CUDA_FLAGS=-diag-suppress=177"
112112
113-
114113# nvhpc and friends
115114build/nvhpc233/cuda120/nompi/nvcpp/release/static :
116115 extends :
@@ -149,6 +148,63 @@ build/nvhpc227/cuda117/nompi/nvcpp/debug/shared:
149148 # disable spurious unused argument warning
150149 EXTRA_CMAKE_FLAGS : " -DCMAKE_CUDA_FLAGS=-diag-suppress=177"
151150
# CUDA debug job: loads cmake 3.18.6, CUDA 11.8.0 and GCC 7.5.0 (no MPI module).
# BUILD_SHARED_LIBS is not set here, so the library type comes from the
# inherited defaults.
build/cuda118/nompi/gcc/cuda/debug/shared:
  extends:
    - .build_and_test_tum_template
    - .default_variables
    - .quick_test_condition
    - .use_tum-nvidia
  variables:
    BUILD_CUDA: "ON"
    BUILD_HWLOC: "OFF"
    ENABLE_HALF: "ON"
    BUILD_TYPE: "Debug"
    MODULE_LOAD: "cmake/3.18.6 cuda/11.8.0 gcc/7.5.0"
163+
# CUDA + MPI static release job: loads cmake 3.18.6, CUDA 12.0.1, GCC 12.4.0
# and OpenMPI 4.1.6.
build/cuda120/openmpi/gcc/cuda/release/static:
  extends:
    - .build_and_test_tum_template
    - .default_variables
    - .quick_test_condition
    - .use_tum-nvidia
  variables:
    BUILD_CUDA: "ON"
    BUILD_HWLOC: "OFF"
    ENABLE_HALF: "ON"
    BUILD_MPI: "ON"
    BUILD_SHARED_LIBS: "OFF"
    BUILD_TYPE: "Release"
    MODULE_LOAD: "cmake/3.18.6 cuda/12.0.1 gcc/12.4.0 openmpi/4.1.6"
178+
# CUDA + MPI static release job: loads cmake 3.20.6, CUDA 12.2.2, GCC 12.4.0
# and OpenMPI 4.1.6, with both half and bfloat16 switched on.
build/cuda122/openmpi/gcc/cuda/release/static:
  extends:
    - .build_and_test_tum_template
    - .default_variables
    - .quick_test_condition
    - .use_tum-nvidia
  variables:
    BUILD_CUDA: "ON"
    BUILD_HWLOC: "OFF"
    ENABLE_HALF: "ON"
    ENABLE_BFLOAT16: "ON"
    # The job is named "openmpi" and loads the openmpi module, so request the
    # MPI build explicitly instead of relying on the inherited default.
    BUILD_MPI: "ON"
    BUILD_SHARED_LIBS: "OFF"
    BUILD_TYPE: "Release"
    MODULE_LOAD: "cmake/3.20.6 cuda/12.2.2 gcc/12.4.0 openmpi/4.1.6"
193+
# CUDA release job: loads cmake 3.30.5, CUDA 12.6.2 and GCC 13.3.0 (no MPI
# module), with both half and bfloat16 switched on.
# BUILD_SHARED_LIBS is not set here, so the library type comes from the
# inherited defaults.
build/cuda126/nompi/gcc/cuda/release/shared:
  extends:
    - .build_and_test_tum_template
    - .default_variables
    - .quick_test_condition
    - .use_tum-nvidia
  variables:
    BUILD_CUDA: "ON"
    BUILD_HWLOC: "OFF"
    ENABLE_HALF: "ON"
    ENABLE_BFLOAT16: "ON"
    BUILD_TYPE: "Release"
    MODULE_LOAD: "cmake/3.30.5 cuda/12.6.2 gcc/13.3.0"
207+
152208# ROCm 4.5 and friends
153209build/amd/nompi/gcc/rocm45/release/shared :
154210 extends :
@@ -230,6 +286,48 @@ build/amd/nompi/gcc/rocm514_wo_omp/release/shared:
230286 BUILD_HIP : " ON"
231287 BUILD_TYPE : " Release"
232288
# HIP + MPI static release job: loads cmake 3.24.4, ROCm 6.0.0, GCC 13.3.0
# and OpenMPI 5.0.5.
build/amd/openmpi/gcc/rocm600/release/static:
  extends:
    - .build_and_test_tum_template
    - .default_variables
    - .quick_test_condition
    - .use_tum-amd
  variables:
    BUILD_HIP: "ON"
    BUILD_HWLOC: "OFF"
    BUILD_MPI: "ON"
    BUILD_TYPE: "Release"
    BUILD_SHARED_LIBS: "OFF"
    MODULE_LOAD: "cmake/3.24.4 rocm/6.0.0 gcc/13.3.0 openmpi/5.0.5"
302+
# HIP debug job: loads cmake 3.25.3, ROCm 5.7.3 and GCC 12.4.0 (no MPI module).
# OpenMP and half are switched off explicitly; bfloat16 is switched on.
build/amd/nompi/gcc/rocm573/debug/shared:
  extends:
    - .build_and_test_tum_template
    - .default_variables
    - .quick_test_condition
    - .use_tum-amd
  variables:
    BUILD_HIP: "ON"
    BUILD_OMP: "OFF"
    BUILD_HWLOC: "OFF"
    BUILD_TYPE: "Debug"
    ENABLE_BFLOAT16: "ON"
    ENABLE_HALF: "OFF"
    MODULE_LOAD: "cmake/3.25.3 rocm/5.7.3 gcc/12.4.0"
317+
# HIP + MPI release job: loads cmake 3.29.6, ROCm 6.3.4, GCC 13.3.0 and
# OpenMPI 5.0.5.
# NOTE(review): the job name says "wo_omp" but BUILD_OMP is not set here, so
# the OpenMP setting comes from the inherited defaults - confirm that default
# is "OFF".
build/amd/openmpi/gcc/rocm634_wo_omp/release/shared:
  extends:
    - .build_and_test_tum_template
    - .default_variables
    - .quick_test_condition
    - .use_tum-amd
  variables:
    BUILD_HIP: "ON"
    BUILD_HWLOC: "OFF"
    BUILD_MPI: "ON"
    BUILD_TYPE: "Release"
    MODULE_LOAD: "cmake/3.29.6 rocm/6.3.4 gcc/13.3.0 openmpi/5.0.5"
330+
233331# no cuda but latest gcc and clang
234332build/nocuda/nompi/gcc/core/debug/static :
235333 extends :
@@ -350,13 +448,42 @@ build/nocuda-nomixed/nompi/clang/omp/debug/static:
350448 BUILD_SHARED_LIBS : " OFF"
351449 MIXED_PRECISION : " OFF"
352450
# CPU-only OpenMP static debug job: loads cmake 3.16.9 and GCC 7.5.0, with
# mixed precision switched off.
build/nogpu/nompi/gcc/omp/debug/static:
  extends:
    - .build_and_test_tum_template
    - .default_variables
    - .quick_test_condition
    - .use_tum-cpu
  variables:
    BUILD_OMP: "ON"
    BUILD_TYPE: "Debug"
    BUILD_SHARED_LIBS: "OFF"
    MIXED_PRECISION: "OFF"
    BUILD_HWLOC: "OFF"
    MODULE_LOAD: "cmake/3.16.9 gcc/7.5.0"
464+
# CPU-only OpenMP static release job: loads cmake 3.16.9 and GCC 9.5.0, with
# both half and bfloat16 switched on.
build/nogpu/nompi/gcc/omp/release/static:
  extends:
    - .build_and_test_tum_template
    - .default_variables
    - .quick_test_condition
    - .use_tum-cpu
  variables:
    BUILD_OMP: "ON"
    BUILD_TYPE: "Release"
    BUILD_SHARED_LIBS: "OFF"
    ENABLE_HALF: "ON"
    ENABLE_BFLOAT16: "ON"
    BUILD_HWLOC: "OFF"
    MODULE_LOAD: "cmake/3.16.9 gcc/9.5.0"
479+
353480# spack oneapi 2023.1
354481build/icpx20231/gpu/release/shared :
355482 extends :
356483 - .build_and_test_template
357484 - .default_variables
358485 - .quick_test_condition
359- - .use_gko-oneapi20231-igpu
486+ - .use_gko-oneapi20231-gpu
360487 variables :
361488 CXX_COMPILER : " icpx"
362489 CXX_FLAGS : " -Wpedantic -ffp-model=precise"
@@ -367,13 +494,65 @@ build/icpx20231/gpu/release/shared:
367494 ONEAPI_DEVICE_SELECTOR : " opencl:gpu"
368495 BUILD_HWLOC : " OFF"
369496
# SYCL shared release job compiled with dpcpp from the oneAPI 2023.1.0
# compiler module, using the .use_tum-intel-fp32 runner template with
# DPCPP_SINGLE_MODE switched on. The device selector is pinned to OpenCL GPUs.
build/dpcpp20231/gpu/release/shared:
  extends:
    - .build_and_test_tum_template
    - .default_variables
    - .quick_test_condition
    - .use_tum-intel-fp32
  variables:
    CXX_COMPILER: "dpcpp"
    CXX_FLAGS: "-Wpedantic -ffp-model=precise"
    BUILD_SYCL: "ON"
    BUILD_TYPE: "Release"
    BUILD_SHARED_LIBS: "ON"
    DPCPP_SINGLE_MODE: "ON"
    MODULE_LOAD: "cmake/3.21.7 intel-oneapi-compilers/2023.1.0 intel-oneapi-dpl/2022.1.0 intel-oneapi-tbb/2021.9.0 intel-oneapi-mkl/2023.1.0"
    ONEAPI_DEVICE_SELECTOR: "opencl:gpu"
    BUILD_HWLOC: "OFF"
513+
# SYCL release job compiled with icpx from the oneAPI 2024.0.2 compiler
# module. Half and bfloat16 are both switched off; the device selector is
# pinned to OpenCL GPUs.
# BUILD_SHARED_LIBS is not set here, so the library type comes from the
# inherited defaults.
build/icpx202402/gpu/release/shared:
  extends:
    - .build_and_test_tum_template
    - .default_variables
    - .quick_test_condition
    - .use_tum-intel
  variables:
    CXX_COMPILER: "icpx"
    CXX_FLAGS: "-Wpedantic -ffp-model=precise -Wno-deprecated-declarations"
    BUILD_SYCL: "ON"
    BUILD_HWLOC: "OFF"
    BUILD_TYPE: "Release"
    ENABLE_HALF: "OFF"
    ENABLE_BFLOAT16: "OFF"
    ONEAPI_DEVICE_SELECTOR: "opencl:gpu"
    MODULE_LOAD: "cmake/3.21.7 intel-oneapi-compilers/2024.0.2 intel-oneapi-dpl/2022.3.0 intel-oneapi-tbb/2021.11.0 intel-oneapi-mkl/2024.0.0"
530+
# SYCL + OpenMP release job compiled with icpx from the oneAPI 2024.2.1
# compiler module. Half and bfloat16 are both switched on; the device
# selector is pinned to Level Zero GPUs.
# BUILD_SHARED_LIBS is not set here, so the library type comes from the
# inherited defaults.
build/icpx202421/gpu/release/shared:
  extends:
    - .build_and_test_tum_template
    - .default_variables
    - .quick_test_condition
    - .use_tum-intel
  variables:
    CXX_COMPILER: "icpx"
    CXX_FLAGS: "-Wpedantic -ffp-model=precise -Wno-deprecated-declarations"
    BUILD_SYCL: "ON"
    BUILD_OMP: "ON"
    BUILD_HWLOC: "OFF"
    BUILD_TYPE: "Release"
    ENABLE_HALF: "ON"
    ENABLE_BFLOAT16: "ON"
    ONEAPI_DEVICE_SELECTOR: "level_zero:gpu"
    MODULE_LOAD: "cmake/3.28.6 intel-oneapi-compilers/2024.2.1 intel-oneapi-dpl/2022.6.1 intel-oneapi-tbb/2021.13.1 intel-oneapi-mkl/2024.2.1"
548+
370549# TODO: Enable when debug shared library size issues are fixed
371550# build/dpcpp/level_zero_igpu/debug/shared:
372551# extends:
373552# - .build_and_test_template
374553# - .default_variables
375554# - .full_test_condition
376- # - .use_gko-oneapi-igpu
555+ # - .use_gko-oneapi-gpu
377556# variables:
378557# CXX_COMPILER: "dpcpp"
379558# CXX_FLAGS: "-Wpedantic -ffp-model=precise"
@@ -389,7 +568,7 @@ build/dpcpp/gpu/release/shared:
389568 - .build_and_test_template
390569 - .default_variables
391570 - .full_test_condition
392- - .use_gko-oneapi-igpu
571+ - .use_gko-oneapi-gpu
393572 variables :
394573 CXX_COMPILER : " dpcpp"
395574 CXX_FLAGS : " -Wpedantic -ffp-model=precise"
0 commit comments