Commit fe53b23

yebai and Copilot committed
Fix Enzyme: type-stable _unflatten, @inline v&g, DimensionMismatch checks

Replace the Any[]-based _unflatten with a recursive peel approach that avoids Union types Enzyme cannot differentiate through. Add @inline to all value_and_gradient methods to prevent boxing of the (value, grad) sret tuple. Add DimensionMismatch length checks to all vector adapters.

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
1 parent 011c123 · commit fe53b23

11 files changed

Lines changed: 61 additions & 48 deletions

docs/src/interface.md

Lines changed: 1 addition & 1 deletion
@@ -316,7 +316,7 @@ There are two things that make them more special, though:
 vi[@varname(x[1])] = 1
 vi[@varname(x[2])] = 2
 keys(vi) == [x[1], x[2]]
-
+
 vi[@varname(x)] = [1, 2]
 keys(vi) == [x]
 ```

ext/AbstractPPLDifferentiationInterfaceExt.jl

Lines changed: 3 additions & 1 deletion
@@ -21,6 +21,8 @@ function (p::DIPrepared)(values::NamedTuple)
 end
 
 function (p::DIPrepared)(x::AbstractVector)
+    length(x) == p.dim ||
+        throw(DimensionMismatch("expected vector of length $(p.dim), got $(length(x))"))
     return p.f_vec(x)
 end
 
@@ -34,7 +36,7 @@ function AbstractPPL.prepare(adtype::AbstractADType, problem, prototype::NamedTu
     return DIPrepared(evaluator, f_vec, adtype, prep, prototype, length(x0))
 end
 
-function AbstractPPL.value_and_gradient(p::DIPrepared, values::NamedTuple)
+@inline function AbstractPPL.value_and_gradient(p::DIPrepared, values::NamedTuple)
     x = AbstractPPL.flatten_to_vec(values)
     val, dx = DI.value_and_gradient(p.f_vec, p.prep, p.backend, x)
     grad_nt = AbstractPPL.unflatten_from_vec(p.prototype, dx)
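
For context, the guard added above is the usual callable-wrapper pattern: validate the flattened length before the vector reaches the AD backend. A minimal standalone sketch, assuming a hypothetical `Guarded` type (not this package's code) and any DifferentiationInterface-compatible backend:

```julia
using DifferentiationInterface
import ForwardDiff  # any DI-supported backend package would do

# Hypothetical minimal analogue of the adapter above: store the expected
# dimension and reject wrong-length inputs before AD ever runs.
struct Guarded{F}
    f::F
    dim::Int
end

function (g::Guarded)(x::AbstractVector)
    length(x) == g.dim ||
        throw(DimensionMismatch("expected vector of length $(g.dim), got $(length(x))"))
    return g.f(x)
end

g = Guarded(x -> sum(abs2, x), 3)
backend = AutoForwardDiff()
prep = prepare_gradient(g, backend, zeros(3))
value_and_gradient(g, prep, backend, [1.0, 2.0, 3.0])  # (14.0, [2.0, 4.0, 6.0])
```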

ext/AbstractPPLEnzymeExt.jl

Lines changed: 3 additions & 1 deletion
@@ -20,6 +20,8 @@ function (p::EnzymePrepared)(values::NamedTuple)
 end
 
 function (p::EnzymePrepared)(x::AbstractVector)
+    length(x) == p.dim ||
+        throw(DimensionMismatch("expected vector of length $(p.dim), got $(length(x))"))
     return p.f_vec(x)
 end
 
@@ -33,7 +35,7 @@ function AbstractPPL.prepare(::AutoEnzyme, problem, prototype::NamedTuple)
     return EnzymePrepared(evaluator, f_vec, grad_buf, prototype, length(x0))
 end
 
-function AbstractPPL.value_and_gradient(p::EnzymePrepared, values::NamedTuple)
+@inline function AbstractPPL.value_and_gradient(p::EnzymePrepared, values::NamedTuple)
     x = AbstractPPL.flatten_to_vec(values)
     fill!(p.gradient_buffer, 0.0)
     result = Enzyme.autodiff(
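
The diff is cut off mid-call, so the exact `autodiff` invocation is not visible here. A sketch of the typical reverse-mode pattern it suggests, with a preallocated gradient buffer that must be zeroed before each call because Enzyme accumulates into the shadow:

```julia
using Enzyme

# Sketch only: the actual call in this file is truncated above.
f(x) = sum(abs2, x)
x = [1.0, 2.0, 3.0]
grad_buf = zero(x)

fill!(grad_buf, 0.0)  # Enzyme *accumulates* into the shadow, so reset first
result = Enzyme.autodiff(
    Enzyme.ReverseWithPrimal, Const(f), Active, Duplicated(x, grad_buf)
)
val = result[2]  # primal: 14.0; grad_buf now holds [2.0, 4.0, 6.0]
```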

ext/AbstractPPLForwardDiffExt.jl

Lines changed: 3 additions & 1 deletion
@@ -21,6 +21,8 @@ function (p::ForwardDiffPrepared)(values::NamedTuple)
 end
 
 function (p::ForwardDiffPrepared)(x::AbstractVector)
+    length(x) == p.dim ||
+        throw(DimensionMismatch("expected vector of length $(p.dim), got $(length(x))"))
     return p.f_vec(x)
 end
 
@@ -36,7 +38,7 @@ function AbstractPPL.prepare(::AutoForwardDiff, problem, prototype::NamedTuple)
     return ForwardDiffPrepared(evaluator, f_vec, cfg, result, prototype, length(x0))
 end
 
-function AbstractPPL.value_and_gradient(p::ForwardDiffPrepared, values::NamedTuple)
+@inline function AbstractPPL.value_and_gradient(p::ForwardDiffPrepared, values::NamedTuple)
     x = AbstractPPL.flatten_to_vec(values)
     ForwardDiff.gradient!(p.result, p.f_vec, x, p.config)
     val = ForwardDiff.DiffResults.value(p.result)
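
For reference, the preallocated `GradientConfig` + `DiffResults` pattern used above looks like this in isolation (a sketch with a stand-in function `f`, not this package's code):

```julia
using ForwardDiff
using ForwardDiff: DiffResults

# One GradientConfig and one DiffResults buffer, built once and reused on
# every evaluation, so the hot path avoids reallocating work buffers.
f(x) = sum(abs2, x)
x0 = zeros(3)
cfg = ForwardDiff.GradientConfig(f, x0)
result = DiffResults.GradientResult(x0)

ForwardDiff.gradient!(result, f, [1.0, 2.0, 3.0], cfg)
DiffResults.value(result)     # 14.0
DiffResults.gradient(result)  # [2.0, 4.0, 6.0]
```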

ext/AbstractPPLMooncakeExt.jl

Lines changed: 3 additions & 1 deletion
@@ -20,6 +20,8 @@ function (p::MooncakePrepared)(values::NamedTuple)
 end
 
 function (p::MooncakePrepared)(x::AbstractVector)
+    length(x) == p.dim ||
+        throw(DimensionMismatch("expected vector of length $(p.dim), got $(length(x))"))
     return p.f_vec(x)
 end
 
@@ -33,7 +35,7 @@ function AbstractPPL.prepare(adtype::AutoMooncake, problem, prototype::NamedTupl
     return MooncakePrepared(evaluator, f_vec, cache, prototype, length(x0))
 end
 
-function AbstractPPL.value_and_gradient(p::MooncakePrepared, values::NamedTuple)
+@inline function AbstractPPL.value_and_gradient(p::MooncakePrepared, values::NamedTuple)
     x = AbstractPPL.flatten_to_vec(values)
     val, (_, dx) = Mooncake.value_and_gradient!!(p.cache, p.f_vec, x)
     grad_nt = AbstractPPL.unflatten_from_vec(p.prototype, dx)
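
A sketch of the Mooncake cache-reuse pattern at this call site; building the cache via `Mooncake.prepare_gradient_cache` is an assumption, since the diff only shows the call:

```julia
using Mooncake

# Assumption: `p.cache` is built once, along these lines, and reused.
f(x) = sum(abs2, x)
x = [1.0, 2.0, 3.0]
cache = Mooncake.prepare_gradient_cache(f, x)

# Returns the primal plus one gradient per argument; the first entry is
# the gradient w.r.t. `f` itself, which the call site discards with `_`.
val, (_, dx) = Mooncake.value_and_gradient!!(cache, f, x)
# val == 14.0, dx == [2.0, 4.0, 6.0]
```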

src/evaluator.jl

Lines changed: 9 additions & 7 deletions
@@ -99,13 +99,15 @@ function _unflatten(proto::AbstractArray{<:Real}, vec::AbstractVector, offset::I
     result = reshape(@view(vec[offset:(offset + n - 1)]), size(proto))
     return result, offset + n
 end
-function _unflatten(proto::NamedTuple, vec::AbstractVector, offset::Int)
-    rebuilt = Any[]
-    for v in values(proto)
-        val, offset = _unflatten(v, vec, offset)
-        push!(rebuilt, val)
-    end
-    return NamedTuple{keys(proto)}(Tuple(rebuilt)), offset
+# Recursive peel keeps this type-stable (Enzyme needs it).
+function _unflatten(::NamedTuple{(),Tuple{}}, ::AbstractVector, offset::Int)
+    return NamedTuple(), offset
+end
+function _unflatten(proto::NamedTuple{K}, vec::AbstractVector, offset::Int) where {K}
+    first_val, offset = _unflatten(first(values(proto)), vec, offset)
+    rest_proto = NamedTuple{Base.tail(K)}(Base.tail(values(proto)))
+    rest_nt, offset = _unflatten(rest_proto, vec, offset)
+    return merge(NamedTuple{(first(K),)}((first_val,)), rest_nt), offset
 end
 
 function unflatten_from_vec(prototype::NamedTuple, vec::AbstractVector)
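
Why the peel helps: the old method pushed into an `Any[]`, so the element type of `rebuilt` (and hence of the returned `NamedTuple`) could not be inferred, leaving `Union`-typed code for Enzyme to differentiate through. With the recursive peel, each method's return type is determined by the prototype's type alone. A hypothetical scalar-only miniature (`peel` is not this package's function) whose inference can be checked with `@inferred`:

```julia
using Test: @inferred

# The empty NamedTuple terminates the recursion; every return type follows
# from the prototype's type, so no Any[] accumulator is ever needed.
peel(::NamedTuple{(),Tuple{}}, vec, offset) = (NamedTuple(), offset)
function peel(proto::NamedTuple{K}, vec, offset) where {K}
    first_val = vec[offset]  # the real code recurses into arrays here
    rest = NamedTuple{Base.tail(K)}(Base.tail(values(proto)))
    rest_nt, offset = peel(rest, vec, offset + 1)
    return merge(NamedTuple{(first(K),)}((first_val,)), rest_nt), offset
end

nt, _ = @inferred peel((a=0.0, b=0.0, c=0.0), [1.0, 2.0, 3.0], 1)
nt  # (a = 1.0, b = 2.0, c = 3.0); inference succeeds end-to-end
```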

test/varname/hasvalue.jl

Lines changed: 11 additions & 11 deletions
@@ -34,11 +34,11 @@ using Test
     @test canview(@opticof(_[1:2]), x)
     @test canview(@opticof(_[:]), x)
     @test !canview(@opticof(_[4]), x)
-    @test canview(@opticof(_[i=1]), x)
+    @test canview(@opticof(_[i = 1]), x)
     # For some weird reason DimData does not error on these two but just warns that
     # there's no index j!
-    @test canview(@opticof(_[j=2]), x)
-    @test canview(@opticof(_[i=1, j=2]), x)
+    @test canview(@opticof(_[j = 2]), x)
+    @test canview(@opticof(_[i = 1, j = 2]), x)
 end
 
 @testset "Dict" begin
@@ -246,14 +246,14 @@ end
     @test getvalue(x, @varname(a[1, 2])) == x.a[1, 2]
     @test hasvalue(x, @varname(a[:]))
     @test getvalue(x, @varname(a[:])) == x.a[:]
-    @test canview(@opticof(_[i=1]), x.a)
-    @test hasvalue(x, @varname(a[i=1]))
-    @test getvalue(x, @varname(a[i=1])) == x.a[i=1]
-    @test canview(@opticof(_[i=1, j=2]), x.a)
-    @test hasvalue(x, @varname(a[i=1, j=2]))
-    @test getvalue(x, @varname(a[i=1, j=2])) == x.a[i=1, j=2]
-    @test hasvalue(x, @varname(a[i=DD.Not(1)]))
-    @test getvalue(x, @varname(a[i=DD.Not(1)])) == x.a[i=DD.Not(1)]
+    @test canview(@opticof(_[i = 1]), x.a)
+    @test hasvalue(x, @varname(a[i = 1]))
+    @test getvalue(x, @varname(a[i = 1])) == x.a[i = 1]
+    @test canview(@opticof(_[i = 1, j = 2]), x.a)
+    @test hasvalue(x, @varname(a[i = 1, j = 2]))
+    @test getvalue(x, @varname(a[i = 1, j = 2])) == x.a[i = 1, j = 2]
+    @test hasvalue(x, @varname(a[i = DD.Not(1)]))
+    @test getvalue(x, @varname(a[i = DD.Not(1)])) == x.a[i = DD.Not(1)]
 
     y = (; b=DD.DimArray(randn(2, 3), (DD.X, DD.Y)))
     @test hasvalue(y, @varname(b))

test/varname/optic.jl

Lines changed: 7 additions & 7 deletions
@@ -31,7 +31,7 @@ using AbstractPPL
     @opticof(_.a[2]),
     @opticof(_.a[1, :]),
     @opticof(_[1].a),
-    @opticof(_[1, x=1].a),
+    @opticof(_[1, x = 1].a),
 )
 for (i, optic1) in enumerate(optics)
     for (j, optic2) in enumerate(optics)
@@ -103,7 +103,7 @@ using AbstractPPL
     @opticof(_.a),
     @opticof(_.a.b),
     @opticof(_[1].a),
-    @opticof(_[1, x=1].a),
+    @opticof(_[1, x = 1].a),
     @opticof(_[].a[:]),
 )
 for optic in optics
@@ -196,8 +196,8 @@ using AbstractPPL
 
 @testset "keyword arguments to getindex" begin
     dimarray = DD.DimArray([0.0 1.0; 2.0 3.0], (:x, :y))
-    @test @opticof(_[x=1])(dimarray) == dimarray[x=1]
-    @test set(dimarray, @opticof(_[y=2]), [9.0; 8.0]) ==
+    @test @opticof(_[x = 1])(dimarray) == dimarray[x = 1]
+    @test set(dimarray, @opticof(_[y = 2]), [9.0; 8.0]) ==
         DD.DimArray([0.0 9.0; 2.0 8.0], (:x, :y))
 end
 
@@ -288,10 +288,10 @@ using AbstractPPL
 @testset "keyword index" begin
     x = DD.DimArray(zeros(2, 2), (:x, :y))
     old_objid = objectid(x)
-    optic = with_mutation(@opticof(_[x=1, y=2]))
-    @test optic(x) === x[x=1, y=2]
+    optic = with_mutation(@opticof(_[x = 1, y = 2]))
+    @test optic(x) === x[x = 1, y = 2]
     set(x, optic, 2.0)
-    @test x[x=1, y=2] == 2.0
+    @test x[x = 1, y = 2] == 2.0
     @test collect(x) == [0.0 2.0; 0.0 0.0]
     @test objectid(x) == old_objid
 end

test/varname/serialize.jl

Lines changed: 7 additions & 6 deletions
@@ -37,10 +37,10 @@ using Test
     @varname(z[:, :], true),
     @varname(z[2:5, :], false),
     @varname(z[2:5, :], true),
-    @varname(x[i=1]),
-    @varname(x[j=2, i=1]),
-    @varname(x[i=1, j=2]),
-    @varname(x[].a[j=2].b[3, 4, 5, [6]]),
+    @varname(x[i = 1]),
+    @varname(x[j = 2, i = 1]),
+    @varname(x[i = 1, j = 2]),
+    @varname(x[].a[j = 2].b[3, 4, 5, [6]]),
     @varname(x[[1, 2, 5, 6]]),
 ]
 for vn in vns
@@ -65,8 +65,9 @@ using Test
     "type" => "InvertedIndices.InvertedIndex",
     "skip" => AbstractPPL.index_to_dict(o.skip),
 )
-AbstractPPL.dict_to_index(::Val{Symbol("InvertedIndices.InvertedIndex")}, d) =
-    InvertedIndex(AbstractPPL.dict_to_index(d["skip"]))
+AbstractPPL.dict_to_index(::Val{Symbol("InvertedIndices.InvertedIndex")}, d) = InvertedIndex(
+    AbstractPPL.dict_to_index(d["skip"])
+)
 
 # Serialisation should now work
 @test string_to_varname(varname_to_string(vn)) == vn

test/varname/subsumes.jl

Lines changed: 8 additions & 6 deletions
@@ -65,12 +65,14 @@ using Test
 end
 
 @testset "keyword indices" begin
-    @test strictly_subsumes(@varname(x), @varname(x[a=1]))
-    @test strictly_subsumes(@varname(x[a=1:10, b=1:10]), @varname(x[a=1:10]))
-    @test strictly_subsumes(@varname(x[a=1:10, b=1:10]), @varname(x[a=1:5, b=1:5]))
-    @test strictly_subsumes(@varname(x[a=:]), @varname(x[a=1]))
-    @test uncomparable(@varname(x[a=1:10, b=5]), @varname(x[a=5, b=1:10]))
-    @test uncomparable(@varname(x[a=1]), @varname(x[b=1]))
+    @test strictly_subsumes(@varname(x), @varname(x[a = 1]))
+    @test strictly_subsumes(@varname(x[a = 1:10, b = 1:10]), @varname(x[a = 1:10]))
+    @test strictly_subsumes(
+        @varname(x[a = 1:10, b = 1:10]), @varname(x[a = 1:5, b = 1:5])
+    )
+    @test strictly_subsumes(@varname(x[a=:]), @varname(x[a = 1]))
+    @test uncomparable(@varname(x[a = 1:10, b = 5]), @varname(x[a = 5, b = 1:10]))
+    @test uncomparable(@varname(x[a = 1]), @varname(x[b = 1]))
 end
 end
 end
