man-group
diff --git a/‎cpp/arcticdb/util/mean.hpp
+63-37 b/‎cpp/arcticdb/util/mean.hpp
+63-37
diff --git a/‎cpp/arcticdb/util/min_max_float.hpp
+42-72 b/‎cpp/arcticdb/util/min_max_float.hpp
+42-72
@@ -8,72 +8,98 @@
 
 namespace arcticdb {
 
-#ifndef _WIN32
+#if HAS_VECTOR_EXTENSIONS
+
+template<typename Vec, typename U>  // Vec: object to fill; U: element type used to address its storage
+inline void fill_vector(Vec &vec, U value) {  // Writes `value` into every U-sized slot of `vec`.
+    U* p = reinterpret_cast<U*>(&vec);  // view vec's storage as an array of U
+    constexpr size_t count = sizeof(Vec) / sizeof(U);  // number of whole U slots that fit in Vec
+    for (size_t i = 0; i < count; i++) {
+        p[i] = value;
+    }
+}
 
 template<typename T>
 class MeanFinder {
     static_assert(is_supported_int<T>::value || is_supported_float<T>::value, "Unsupported type");
-
 public:
     static double find(const T* __restrict data, size_t n) {
+        util::check(n > 0, "Empty array provided");  // n == 0 is reported via util::check (its failure behaviour is defined elsewhere)
         using VectorType = vector_type<T>;
         using AccumVectorType = vector_type<double>;
-
-        AccumVectorType vsum = {0.0};
         constexpr size_t elements_per_vector = sizeof(VectorType) / sizeof(T);
         constexpr size_t doubles_per_vector = sizeof(AccumVectorType) / sizeof(double);
         constexpr size_t vectors_per_acc = elements_per_vector / doubles_per_vector;
-
+        AccumVectorType vsum;  // per-lane double accumulators; zeroed two lines below
+        double* vsum_ptr = reinterpret_cast<double*>(&vsum);  // scalar view of vsum used for the lane-wise +=
+        fill_vector<AccumVectorType, double>(vsum, 0.0);  // explicit zero of every lane
         size_t valid_count = 0;
-
-        const auto* vdata = reinterpret_cast<const VectorType*>(data);
+        const VectorType* vdata = reinterpret_cast<const VectorType*>(data);  // NOTE(review): assumes data may be read as VectorType (alignment) — confirm against vector_type's definition
         const size_t vector_len = n / elements_per_vector;
-
-        for(size_t i = 0; i < vector_len; i++) {
+        for (size_t i = 0; i < vector_len; i++) {  // whole vectors only; leftover elements are handled after the loop
             VectorType v = vdata[i];
-
-            if constexpr(std::is_floating_point_v<T>) {
-                VectorType mask = v == v;
-                v = v & mask;
-
-                const T* mask_arr = reinterpret_cast<const T*>(&mask);
-
-                for(size_t j = 0; j < elements_per_vector; j++) {
-                    if(mask_arr[j] != 0)
-                        ++valid_count;
+            const T* v_arr = reinterpret_cast<const T*>(&v);  // element-wise view of the loaded vector
+            if constexpr (std::is_floating_point_v<T>) {  // floating-point T: NaN elements must not contribute
+                bool has_nan = false;
+                for (size_t j = 0; j < elements_per_vector; j++) {
+                    if (std::isnan(v_arr[j])) { has_nan = true; break; }  // stop scanning at the first NaN
+                }
+                if (!has_nan) {  // no NaN in this vector: add every element without per-element tests
+                    for (size_t chunk = 0; chunk < vectors_per_acc; chunk++) {  // each chunk of doubles_per_vector elements lands on the same accumulator lanes
+                        size_t base = chunk * doubles_per_vector;
+                        for (size_t j = 0; j < doubles_per_vector; j++) {
+                            if constexpr (std::is_same_v<T, double>)  // double needs no conversion
+                                vsum_ptr[j] += v_arr[base + j];
+                            else
+                                vsum_ptr[j] += static_cast<double>(v_arr[base + j]);
+                        }
+                    }
+                    valid_count += elements_per_vector;  // every element of this vector was summed
+                } else {  // at least one NaN: test each element individually
+                    for (size_t chunk = 0; chunk < vectors_per_acc; chunk++) {
+                        size_t base = chunk * doubles_per_vector;
+                        for (size_t j = 0; j < doubles_per_vector; j++) {
+                            size_t idx = base + j;
+                            if (!std::isnan(v_arr[idx])) {  // NaN elements are neither summed nor counted
+                                if constexpr (std::is_same_v<T, double>)
+                                    vsum_ptr[j] += v_arr[idx];
+                                else
+                                    vsum_ptr[j] += static_cast<double>(v_arr[idx]);
+                                valid_count++;  // count only the elements actually added
+                            }
+                        }
+                    }
                 }
             } else {
-                valid_count += elements_per_vector;
-            }
-
-            const T* v_arr = reinterpret_cast<const T*>(&v);
-            for(size_t chunk = 0; chunk < vectors_per_acc; chunk++) {
-                for(size_t j = 0; j < doubles_per_vector; j++) {
-                    size_t idx = chunk * doubles_per_vector + j;
-                    reinterpret_cast<double*>(&vsum)[j] += static_cast<double>(v_arr[idx]);
+                for (size_t chunk = 0; chunk < vectors_per_acc; chunk++) {  // non-floating T: no NaN test, add everything
+                    size_t base = chunk * doubles_per_vector;
+                    for (size_t j = 0; j < doubles_per_vector; j++) {
+                        vsum_ptr[j] += static_cast<double>(v_arr[base + j]);
+                    }
                 }
+                valid_count += elements_per_vector;  // all elements of the vector are counted
             }
         }
-
         double total = 0.0;
-        const auto* sum_arr = reinterpret_cast<const double*>(&vsum);
-        for(size_t i = 0; i < doubles_per_vector; i++) {
-            total += sum_arr[i];
+        for (size_t j = 0; j < doubles_per_vector; j++) {  // collapse the accumulator lanes into one scalar sum
+            total += vsum_ptr[j];
         }
-
         const T* remain = data + (vector_len * elements_per_vector);
-        for(size_t i = 0; i < n % elements_per_vector; i++) {
-            if constexpr(std::is_floating_point_v<T>) {
-                if (remain[i] == remain[i]) {  // Not NaN
-                    total += static_cast<double>(remain[i]);
+        size_t rem = n % elements_per_vector;  // number of elements that did not fill a whole vector
+        for (size_t i = 0; i < rem; i++) {  // scalar pass over the leftover elements
+            if constexpr (std::is_floating_point_v<T>) {
+                if (!std::isnan(remain[i])) {  // same NaN rule as in the vector loop
+                    if constexpr (std::is_same_v<T, double>)
+                        total += remain[i];
+                    else
+                        total += static_cast<double>(remain[i]);
                     valid_count++;
                 }
             } else {
                 total += static_cast<double>(remain[i]);
                 valid_count++;
             }
         }
-
         return valid_count > 0 ? total / static_cast<double>(valid_count) : 0.0;
     }
 };
 
@@ -7,106 +7,76 @@
 #include <arcticdb/util/vector_common.hpp>
 
 namespace arcticdb {
-#ifndef _WIN32
 
-template<typename T>
-class FloatMinFinder {
+#if HAS_VECTOR_EXTENSIONS
+
+template<typename T, typename Comparator>  // Comparator supplies identity(), compare(a, b) and the is_min flag
+class FloatExtremumFinder {  // Single scan implementation shared by the min and max searches; Comparator picks the direction.
     static_assert(is_supported_float<T>::value, "Type must be float or double");
     static_assert(std::is_floating_point_v<T>, "Type must be floating point");
-
 public:
     static T find(const T* data, size_t n) {
+        if (n == 0)  // empty input: nothing to scan
+            return Comparator::identity();  // the identity value is the result for an empty range
         using vec_t = vector_type<T>;
-
-        vec_t vmin;
-        for(size_t i = 0; i < sizeof(vec_t)/sizeof(T); i++) {
-            reinterpret_cast<T*>(&vmin)[i] = std::numeric_limits<T>::infinity();
-        }
+        constexpr size_t lane_count = sizeof(vec_t) / sizeof(T);  // number of T elements held by one vec_t
+        vec_t vext;  // running per-lane extremum
+        for (size_t i = 0; i < lane_count; i++)  // seed every lane with the identity value
+            reinterpret_cast<T*>(&vext)[i] = Comparator::identity();
 
         const vec_t* vdata = reinterpret_cast<const vec_t*>(data);
-        const size_t elements_per_vector = sizeof(vec_t) / sizeof(T);
-        const size_t vlen = n / elements_per_vector;
-
-        for(size_t i = 0; i < vlen; i++) {
+        size_t vlen = n / lane_count;  // number of whole vectors in the input
+        for (size_t i = 0; i < vlen; i++) {
             vec_t v = vdata[i];
-            vmin = (v < vmin) ? v : vmin;
+            if constexpr (Comparator::is_min)  // direction is resolved at compile time
+                vext = (v < vext) ? v : vext;  // presumably a lane-wise select on vector_type (defined elsewhere): keep the smaller value
+            else
+                vext = (v > vext) ? v : vext;  // same shape, keeping the larger value
         }
-
-        T min_val = std::numeric_limits<T>::infinity();
-        const T* min_arr = reinterpret_cast<const T*>(&vmin);
-        for(size_t i = 0; i < elements_per_vector; i++) {
-            if (min_arr[i] == min_arr[i]) {  // Not NaN
-                min_val = std::min(min_val, min_arr[i]);
-            }
+        T result = Comparator::identity();  // scalar result, also started at the identity
+        const T* lanes = reinterpret_cast<const T*>(&vext);  // element-wise view of the per-lane extrema
+        for (size_t i = 0; i < lane_count; i++) {  // reduce the lanes to one scalar
+            if (lanes[i] == lanes[i])  // x == x is false only for NaN, so NaN lanes are skipped
+                result = Comparator::compare(lanes[i], result);
         }
-
-        const T* remain = data + (vlen * elements_per_vector);
-        for(size_t i = 0; i < n % elements_per_vector; i++) {
-            if (remain[i] == remain[i]) {  // Not NaN
-                min_val = std::min(min_val, remain[i]);
-            }
+        const T* remain = data + (vlen * lane_count);  // first element past the last whole vector
+        size_t remain_count = n % lane_count;  // how many leftover elements there are
+        for (size_t i = 0; i < remain_count; i++) {  // scalar pass over the leftover elements
+            if (remain[i] == remain[i])  // skip NaN, as above
+                result = Comparator::compare(remain[i], result);
         }
-
-        return min_val;
+        return result;  // stays at the identity if no non-NaN element was seen
     }
 };
 
 template<typename T>
-class FloatMaxFinder {
-    static_assert(is_supported_float<T>::value, "Type must be float or double");
-    static_assert(std::is_floating_point_v<T>, "Type must be floating point");
-
-public:
-    static T find(const T* data, size_t n) {
-        using vec_t = vector_type<T>;
-
-        vec_t vmax;
-        for(size_t i = 0; i < sizeof(vec_t)/sizeof(T); i++) {
-            reinterpret_cast<T*>(&vmax)[i] = -std::numeric_limits<T>::infinity();
-        }
-
-        const vec_t* vdata = reinterpret_cast<const vec_t*>(data);
-        const size_t elements_per_vector = sizeof(vec_t) / sizeof(T);
-        const size_t vlen = n / elements_per_vector;
-
-        for(size_t i = 0; i < vlen; i++) {
-            vec_t v = vdata[i];
-            vmax = (v > vmax) ? v : vmax;
-        }
-
-        T max_val = -std::numeric_limits<T>::infinity();
-        const T* max_arr = reinterpret_cast<const T*>(&vmax);
-        for(size_t i = 0; i < elements_per_vector; i++) {
-            if (max_arr[i] == max_arr[i]) {  // Not NaN
-                max_val = std::max(max_val, max_arr[i]);
-            }
-        }
-
-        const T* remain = data + (vlen * elements_per_vector);
-        for(size_t i = 0; i < n % elements_per_vector; i++) {
-            if (remain[i] == remain[i]) {  // Not NaN
-                max_val = std::max(max_val, remain[i]);
-            }
-        }
+struct FloatMinComparator {  // Policy passed to FloatExtremumFinder for a minimum search.
+    static constexpr bool is_min = true;  // selects the `v < vext` branch in FloatExtremumFinder::find
+    static T identity() { return std::numeric_limits<T>::infinity(); }  // +infinity: std::min with any non-NaN value returns that value
+    static T compare(T a, T b) { return std::min(a, b); }  // smaller of the two arguments
+};
 
-        return max_val;
-    }
+template<typename T>
+struct FloatMaxComparator {  // Policy passed to FloatExtremumFinder for a maximum search.
+    static constexpr bool is_min = false;  // selects the `v > vext` branch in FloatExtremumFinder::find
+    static T identity() { return -std::numeric_limits<T>::infinity(); }  // -infinity: std::max with any non-NaN value returns that value
+    static T compare(T a, T b) { return std::max(a, b); }  // larger of the two arguments
 };
 
 template<typename T>
-T find_float_min(const T *data, size_t n) {
-    return FloatMinFinder<T>::find(data, n);
+T find_float_min(const T* data, size_t n) {  // Minimum of data[0..n), delegated to the shared finder with the min policy.
+    return FloatExtremumFinder<T, FloatMinComparator<T>>::find(data, n);  // for n == 0 the finder returns FloatMinComparator<T>::identity()
 }
 
 template<typename T>
-T find_float_max(const T *data, size_t n) {
-    return FloatMaxFinder<T>::find(data, n);
+T find_float_max(const T* data, size_t n) {  // Maximum of data[0..n), delegated to the shared finder with the max policy.
+    return FloatExtremumFinder<T, FloatMaxComparator<T>>::find(data, n);  // for n == 0 the finder returns FloatMaxComparator<T>::identity()
 }
 
 #else
 
 template<typename T>
-typename std::enable_if<std::is_integral<T>::value, T>::type
+typename std::enable_if<std::is_floating_point<T>::value, T>::type  // overload exists only for floating-point T. NOTE(review): the body dereferences std::min_element's result, which is the end iterator when n == 0, and it does not skip NaN the way the vector path does — confirm callers or align the two paths
 find_float_min(const T *data, size_t n) {
     return *std::min_element(data, data + n);
 }