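Apply Copilot-suggested changes: use std::max for the sink clamp and hoist the duplicated exp/sum reduction out of the dst_precision branches in attn_softmax_kernel<ov::float16>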

ashwins990 · ashwins990 · commit c084a1d376f5 · 2026-01-20T09:25:58.000+05:30
diff --git a/src/plugins/intel_cpu/src/nodes/kernels/scaled_attn/softmax_kernel.hpp b/src/plugins/intel_cpu/src/nodes/kernels/scaled_attn/softmax_kernel.hpp
@@ -1444,23 +1444,19 @@ inline void attn_softmax_kernel<ov::float16>(ov::float16* a,
 
     ov::float16 sum = 0.0f;
     if (sink != nullptr) {
-        max = max > static_cast<const ov::float16>(*sink) ? max : static_cast<const ov::float16>(*sink);
+        max = std::max(max, static_cast<const ov::float16>(*sink));
+    }
+    exp_reduce_sum_f32(a, max, len, sum);
+    if (sink != nullptr) {
+        sum += std::exp(*sink - max);
     }
     if (dst_precision == ov::element::f32) {
-        exp_reduce_sum_f32(a, max, len, sum);
-        if (sink != nullptr) {
-            sum += std::exp(*sink - max);
-        }
         ov::float16 scalar = 1.0f / sum;
         multiply_scalar(a, static_cast<float*>(a_dst), scalar, len);
         // apply causual mask to final result instead of attn_score
         if (total_size > len)
             memset(static_cast<float*>(a_dst) + len, 0, sizeof(float) * (total_size - len));
     } else {
-        exp_reduce_sum_f32(a, max, len, sum);
-        if (sink != nullptr) {
-            sum += std::exp(*sink - max);
-        }
         ov::float16 scalar = 1.0f / sum;
         multiply_scalar_f32(a, static_cast<ov::float16*>(a_dst), scalar, len);
         // apply causual mask to final result instead of attn_score