revert load_store changes

jcosborn · jcosborn · commit 456a3a036fc3 · 2026-05-28T17:07:49.000-05:00
change STRICT build optimization level
make run CI use STRICT build
diff --git a/.github/workflows/oneapi_githubactions_run.yml b/.github/workflows/oneapi_githubactions_run.yml
@@ -9,7 +9,7 @@ defaults:
     shell: bash
 
 env:
-  BUILD_TYPE: RELEASE
+  BUILD_TYPE: STRICT
 
 jobs:
   buildrun:
diff --git a/include/targets/generic/load_store.h b/include/targets/generic/load_store.h
@@ -11,21 +11,14 @@ namespace quda
     static constexpr int size = prefetch;
   };
 
-  /**
-     @brief Element type used for coalesced storage.
-   */
-  template <typename T>
-  using atom_t = std::conditional_t<sizeof(T) % 16 == 0, int4, std::conditional_t<sizeof(T) % 8 == 0, int2, int>>;
-
   /**
      @brief Non-specialized load operation
   */
   template <bool is_device> struct vector_load_impl {
     template <typename T, size_t prefetch_size>
     __device__ __host__ inline void operator()(T &value, const void *ptr, int idx, const prefetch_t<prefetch_size> &)
     {
-      // value = reinterpret_cast<const T *>(ptr)[idx];
-      memcpy(&value, static_cast<const T *>(ptr) + idx, sizeof(value));
+      value = reinterpret_cast<const T *>(ptr)[idx];
     }
   };
 
@@ -60,12 +53,11 @@ namespace quda
   template <bool is_device> struct vector_store_impl {
     template <typename T> __device__ __host__ inline void operator()(void *ptr, int idx, const T &value)
     {
-      // reinterpret_cast<T *>(ptr)[idx] = value;
-      memcpy(static_cast<T *>(ptr) + idx, &value, sizeof(value));
+      reinterpret_cast<T *>(ptr)[idx] = value;
     }
   };
 
-  template <typename vector_t> __device__ __host__ inline void vector_storeV(void *ptr, int idx, const vector_t &value)
+  template <typename vector_t> __device__ __host__ inline void vector_store(void *ptr, int idx, const vector_t &value)
   {
     target::dispatch<vector_store_impl>(ptr, idx, value);
   }
@@ -77,9 +69,7 @@ namespace quda
     vector_t value_v;
     static_assert(sizeof(value_a) == sizeof(value_v), "array type and vector type are different sizes");
     memcpy(&value_v, &value_a, sizeof(vector_t));
-    // vector_storeV<vector_t>(ptr, idx, value_v);
-    scalar_t *a = static_cast<scalar_t *>(ptr) + N * idx;
-    memcpy(a, &value_v, sizeof(value_v));
+    vector_store<vector_t>(ptr, idx, value_v);
   }
 
   template <typename scalar_t, int N>
diff --git a/include/targets/sycl/load_store.h b/include/targets/sycl/load_store.h
@@ -0,0 +1,14 @@
+#pragma once
+
+namespace quda
+{
+
+  /**
+     @brief Element type used for coalesced storage: int4 if sizeof(T) is a multiple of 16, int2 if a multiple of 8, otherwise int.
+   */
+  template <typename T>
+  using atom_t = std::conditional_t<sizeof(T) % 16 == 0, int4, std::conditional_t<sizeof(T) % 8 == 0, int2, int>>;
+
+} // namespace quda
+
+#include "../generic/load_store.h"
diff --git a/lib/targets/sycl/target_sycl.cmake b/lib/targets/sycl/target_sycl.cmake
@@ -63,7 +63,7 @@ set(CMAKE_SYCL_FLAGS_DEVEL
     "-O3 -gline-directives-only -Wall -Wextra"
     CACHE STRING "Flags used by the C++ compiler during regular development builds.")
 set(CMAKE_SYCL_FLAGS_STRICT
-    "-O3 -Wall -Wextra -Werror"
+    "-Os -Wall -Wextra -Werror"
     CACHE STRING "Flags used by the C++ compiler during strict jenkins builds.")
 set(CMAKE_SYCL_FLAGS_RELEASE
     "-O3 -w ${CXX_OPT}"