Stabilize DWA LUT test half-distance compare on i686

cary-ilm · cary-ilm · commit e0102a66d9c3 · 2026-04-21T18:57:52.000-07:00
Add `ieeeFloatAbsDiffHalf()` using volatile float steps so each
half→float conversion and subtraction rounds to IEEE binary32 before
fabs. Without this, i686 387 FPU extended precision can pick a
different closest candidate than `dwaQuantTables.h` (built with typical
SSE float math), breaking `testLutHeader`.

Made with Cursor
Signed-off-by: Cary Phillips <cary@ilm.com>
diff --git a/src/test/OpenEXRCoreTest/compressionTables.cpp b/src/test/OpenEXRCoreTest/compressionTables.cpp
@@ -32,6 +32,7 @@
 #include "IlmThreadSemaphore.h"
 
 #include <cstddef>
+#include <cmath>
 #include <math.h>
 #include <stdio.h>
 #include <stdlib.h>
@@ -68,6 +69,19 @@ using namespace OPENEXR_IMF_NAMESPACE;
 namespace
 {
 
+// Returns |float(a)-float(b)| for half values. Volatile intermediates force each
+// step to round to IEEE binary32; otherwise the i686 default (387 stack) can keep
+// extra precision and pick a different "winner" than tables built with SSE float
+// math. Done in code so that running the tests needs no special compile flags.
+static inline float
+ieeeFloatAbsDiffHalf (const half& a, const half& b)
+{
+    volatile float af = static_cast<float> (a); // half -> float, held as binary32
+    volatile float bf = static_cast<float> (b);
+    volatile float d  = af - bf; // difference is rounded to binary32 as well
+    return std::fabs (static_cast<float> (d));
+}
+
 class LutHeaderWorker
 {
 public:
@@ -160,8 +174,8 @@ class LutHeaderWorker
 
                         tmpHalf.setBits (i);
 
-                        if (fabs ((float) inputHalf - (float) tmpHalf) <
-                            fabs ((float) inputHalf - (float) closestHalf))
+                        if (ieeeFloatAbsDiffHalf (inputHalf, tmpHalf) <
+                            ieeeFloatAbsDiffHalf (inputHalf, closestHalf))
                         {
                             closestHalf = tmpHalf;
                         }