
Commit e38be45

docs: add 3rd order AD example using Reactant
[skip ci]
1 parent a2167f2

3 files changed: 80 additions, 1 deletion

docs/src/.vitepress/config.mts

Lines changed: 4 additions & 0 deletions

@@ -356,6 +356,10 @@ export default defineConfig({
             {
                 text: "Profiling Lux Training Loops",
                 link: "/manual/profiling_training_loop",
+            },
+            {
+                text: "Nested AutoDiff",
+                link: "/manual/nested_autodiff_reactant",
             }
         ],
     },

docs/src/manual/nested_autodiff.md

Lines changed: 7 additions & 1 deletion

@@ -9,7 +9,13 @@ In this manual, we will explore how to use automatic differentiation (AD) inside
 or loss functions and have Lux automatically switch the AD backend with a faster one when
 needed.
 
-!!! tip
+!!! tip "Reactant Support"
+
+    Reactant + Lux natively supports Nested AD (even higher dimensions). If you are using
+    Reactant, please see the [Nested AD with Reactant](@ref nested_autodiff_reactant)
+    manual.
+
+!!! tip "Disabling Nested AD Switching"
 
     Don't want Lux to do this switching for you? You can disable it by setting the
     `automatic_nested_ad_switching` Preference to `false`.
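
For context on the `automatic_nested_ad_switching` preference referenced in the hunk above, here is a minimal sketch (not part of this commit) of how such a preference could be set with the standard Preferences.jl workflow; the exact call is an assumption, and a Julia restart is needed before the preference takes effect:

```julia
# Sketch: disable Lux's automatic nested-AD backend switching via Preferences.jl.
# Assumes the standard `set_preferences!` API; restart Julia afterwards so the
# preference is picked up.
using Preferences, Lux

set_preferences!(Lux, "automatic_nested_ad_switching" => false; force=true)
```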
docs/src/manual/nested_autodiff_reactant.md (new file)

Lines changed: 69 additions & 0 deletions

# [Nested AutoDiff with Reactant](@id nested_autodiff_reactant)

We will be using the example from [issue 614](https://github.com/LuxDL/Lux.jl/issues/614).

```@example nested_ad_reactant
using Reactant, Enzyme, Lux, Random, LinearAlgebra

const xdev = reactant_device(; force=true)
const cdev = cpu_device()

function ∇potential(potential, x)
    dxs = stack(onehot(x))
    ∇p = similar(x)
    colons = [Colon() for _ in 1:ndims(x)]
    @trace for i in 1:length(x)
        dxᵢ = dxs[colons..., i]
        res = only(Enzyme.autodiff(
            Enzyme.set_abi(Forward, Reactant.ReactantABI), potential, Duplicated(x, dxᵢ)
        ))
        @allowscalar ∇p[i] = res[i]
    end
    return ∇p
end

function ∇²potential(potential, x)
    dxs = stack(onehot(x))
    ∇²p = similar(x)
    colons = [Colon() for _ in 1:ndims(x)]
    @trace for i in 1:length(x)
        dxᵢ = dxs[colons..., i]
        res = only(Enzyme.autodiff(
            Enzyme.set_abi(Forward, Reactant.ReactantABI),
            ∇potential, Const(potential), Duplicated(x, dxᵢ)
        ))
        @allowscalar ∇²p[i] = res[i]
    end
    return ∇²p
end

struct PotentialNet{P} <: AbstractLuxWrapperLayer{:potential}
    potential::P
end

function (potential::PotentialNet)(x, ps, st)
    pnet = StatefulLuxLayer{true}(potential.potential, ps, st)
    return ∇²potential(pnet, x), pnet.st
end

model = PotentialNet(Dense(5 => 5, gelu))
ps, st = Lux.setup(Random.default_rng(), model) |> xdev

x_ra = randn(Float32, 5, 3) |> xdev

@code_hlo model(x_ra, ps, st)

@jit model(x_ra, ps, st)
```
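
As a usage note (not part of the committed file): the `cdev = cpu_device()` defined above can be used to move the compiled output back to the host. A small sketch, assuming the result of `@jit` can be destructured and transferred like a regular Lux output:

```julia
# Sketch: run the compiled model once and transfer the result to the host with `cdev`.
# Each output entry is a second derivative with respect to the matching input entry,
# so the output shape should equal the input shape.
∇²p_ra, _ = @jit model(x_ra, ps, st)
∇²p = ∇²p_ra |> cdev
size(∇²p) == size(x_ra)  # expected: true
```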
```@example nested_ad_reactant
sumabs2first(model, x, ps, st) = sum(abs2, first(model(x, ps, st)))

function enzyme_gradient(model, x, ps, st)
    return Enzyme.gradient(
        Enzyme.Reverse, Const(sumabs2first), Const(model), Const(x), ps, Const(st)
    )
end

@jit enzyme_gradient(model, x_ra, ps, st)
```
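
A follow-up sketch (again not part of the committed file) for pulling the parameter gradients out of the result, assuming `Enzyme.gradient` returns one entry per argument of `sumabs2first`, with `nothing` for the `Const`-annotated ones:

```julia
# Sketch: the arguments passed after the function are (model, x, ps, st), so the
# third entry is assumed to hold the gradient with respect to `ps`.
grads = @jit enzyme_gradient(model, x_ra, ps, st)
∇ps = grads[3] |> cdev  # parameter gradients, transferred back to the host
```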
