fix(gemma4): implement float32-safe RMSNorm wrapper, resolving NaN-producing float16 overflow on Apple Silicon without compromising base magnitudes

Aegis AI Assistant · Aegis AI Assistant · commit d16b6c0b8afd · 2026-04-13T13:52:22.000-07:00
diff --git a/Libraries/MLXLLM/Models/Gemma4.swift b/Libraries/MLXLLM/Models/Gemma4.swift
@@ -21,9 +21,16 @@ public class Gemma4RMSNorm: Module, UnaryLayer {
     }
 
     public func callAsFunction(_ x: MLXArray) -> MLXArray {
-        // vLLM: standard RMSNorm — weight * x / sqrt(E[x^2] + eps)
-        // Gemma 4 norm weights are trained scale factors (~8-10), NOT zero-init offsets.
-        return MLXFast.rmsNorm(x, weight: self.weight, eps: self.eps)
+        // Evaluate in Float32 to prevent Float16 infinity overflow on M1/M2 architectures.
+        // Vision models like SigLIP/Qwen inject imageFeatures at magnitude ~300.
+        // 300^2 = 90,000, which overflows MLX .float16 max of 65504 causing NaNs if not isolated.
+        let originalType = x.dtype
+        let xF32 = x.asType(.float32)
+        let variance = MLX.mean(MLX.square(xF32), axis: -1, keepDims: true)
+        let rsqrtVar = MLX.rsqrt(variance + eps)
+        
+        // Weight is applied after casting back to the original type to avoid a type mismatch
+        return (self.weight * (xF32 * rsqrtVar).asType(originalType))
     }
 }
 

Original file line number	Diff line number	Diff line change
`@@ -21,9 +21,16 @@ public class Gemma4RMSNorm: Module, UnaryLayer {`
`21`	`21`	`}`
`22`	`22`
`23`	`23`	`public func callAsFunction(_ x: MLXArray) -> MLXArray {`
`24`		`- // vLLM: standard RMSNorm — weight * x / sqrt(E[x^2] + eps)`
`25`		`- // Gemma 4 norm weights are trained scale factors (~8-10), NOT zero-init offsets.`
`26`		`- return MLXFast.rmsNorm(x, weight: self.weight, eps: self.eps)`
	`24`	`+ // Evaluate in Float32 to prevent Float16 infinity overflow on M1/M2 architectures.`
	`25`	`+ // Vision models like SigLIP/Qwen inject imageFeatures at magnitude ~300.`
	`26`	`+ // 300^2 = 90,000, which overflows MLX .float16 max of 65504 causing NaNs if not isolated.`
	`27`	`+ let originalType = x.dtype`
	`28`	`+ let xF32 = x.asType(.float32)`
	`29`	`+ let variance = MLX.mean(MLX.square(xF32), axis: -1, keepDims: true)`
	`30`	`+ let rsqrtVar = MLX.rsqrt(variance + eps)`
	`31`	`+`
	`32`	`+ // Weight is applied after casting back to the original type to avoid a type mismatch`
	`33`	`+ return (self.weight * (xF32 * rsqrtVar).asType(originalType))`
`27`	`34`	`}`
`28`	`35`	`}`
`29`	`36`