From 7346dca36e4624cdf4e99e828cace76531c8fe9b Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Beno=C3=AEt=20Legat?= <benoit.legat@gmail.com>
Date: Fri, 5 Jun 2026 10:10:43 +0100
Subject: [PATCH 1/2] Refactor neural

---
 perf/neural.jl | 62 ++++++++++++++++++++++++++++----------------------
 1 file changed, 35 insertions(+), 27 deletions(-)

diff --git a/perf/neural.jl b/perf/neural.jl
index f32aef8..bdcf972 100644
--- a/perf/neural.jl
+++ b/perf/neural.jl
@@ -6,34 +6,42 @@
 
 using JuMP
 using ArrayDiff
+import Random
 import NLopt
-
-n = 2
-X = rand(n, n)
-target = rand(n, n)
-
-model = direct_model(NLopt.Optimizer())
-set_attribute(model, "algorithm", :LD_LBFGS)
-
-@variable(model, W1[1:n, 1:n], container = ArrayDiff.ArrayOfVariables)
-@variable(model, W2[1:n, 1:n], container = ArrayDiff.ArrayOfVariables)
-
-# Set non-zero starting values to avoid saddle point at zero
-for i in 1:n, j in 1:n
-    set_start_value(W1[i, j], 0.1 * randn())
-    set_start_value(W2[i, j], 0.1 * randn())
+import NLPModelsJuMP
+
+function bench(solver, ::Type{T} = Float64; h::Int = 4096, d::Int = 13, n::Int = 178, out_dim = 2, gpu::Bool = false) where {T<:Real}
+    Random.seed!(0)
+    X = randn(T, d, n)
+    Y = randn(T, out_dim, n)
+
+    model = GenericModel{T}(solver)
+    V = gpu ? CUDA.CuVector{T} : Vector{T}
+    set_attribute(model, MOI.AutomaticDifferentiationBackend(), ArrayDiff.Mode{V}())
+
+    @variable(model, W1[1:h, 1:d], container = ArrayDiff.ArrayOfVariables)
+    @variable(model, W2[1:out_dim, 1:h], container = ArrayDiff.ArrayOfVariables)
+
+    Y_hat = W2 * tanh.(W1 * X)
+    loss = sum((Y_hat .- Y) .^ 2)
+    @objective(model, Min, loss)
+
+    for i in 1:n, j in 1:n
+        set_start_value(W1[i, j], 0.1 * randn())
+        set_start_value(W2[i, j], 0.1 * randn())
+    end
+    optimize!(model)
+
+    if !is_solved_and_feasible(model)
+        @warn(solution_summary(model))
+    end
+    return solve_time(model)
 end
 
-# Forward pass: Y = W2 * tanh.(W1 * X)
-Y = W2 * tanh.(W1 * X)
-
-# Loss: sum of squared errors
-loss = sum((Y .- target) .^ 2)
-@objective(model, Min, loss)
-
-optimize!(model)
+nlopt = optimizer_with_attributes(
+    NLopt.Optimizer,
+    "algorithm" => :LD_LBFGS,
+    MOI.AutomaticDifferentiationBackend() => ArrayDiff.Mode(),
+)
 
-println("Termination status: ", termination_status(model))
-println("Objective value:    ", objective_value(model))
-println("W1 = ", [value(W1[i, j]) for i in 1:n, j in 1:n])
-println("W2 = ", [value(W2[i, j]) for i in 1:n, j in 1:n])
+bench(nlopt)

From 4e47d5df237f0db351a2329754147e81cff007dd Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Beno=C3=AEt=20Legat?= <benoit.legat@gmail.com>
Date: Fri, 5 Jun 2026 14:22:44 +0100
Subject: [PATCH 2/2] Add benchmark for SIAM'OP 26 talk

---
 perf/Project.toml | 15 +++++++++++++-
 perf/neural.jl    | 51 ++++++++++++++++++++++++++++++++++++-----------
 2 files changed, 53 insertions(+), 13 deletions(-)

diff --git a/perf/Project.toml b/perf/Project.toml
index 4aa5df2..daaa5d5 100644
--- a/perf/Project.toml
+++ b/perf/Project.toml
@@ -1,21 +1,34 @@
 name = "ArrayDiffPerf"
 uuid = "00000000-0000-0000-0000-000000000001"
-authors = ["Benoît Legat <benoit.legat@gmail.com>"]
 version = "0.0.0"
+authors = ["Benoît Legat <benoit.legat@gmail.com>"]
 
 [deps]
 ArrayDiff = "c45fa1ca-6901-44ac-ae5b-5513a4852d50"
 BenchmarkTools = "6e4b80f9-dd63-53aa-95a3-0cdb28fa8baf"
 CUDA = "052768ef-5323-5732-b1bb-66c8b64840ba"
 CondaPkg = "992eb4ea-22a4-4c89-a5bb-47a3300528ab"
+JSOSolvers = "10dff2fc-5484-5881-a0e0-c90441020f8a"
 JuMP = "4076af6c-e467-56ae-b986-b466b2749572"
 LinearAlgebra = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e"
 Lux = "b2108857-7c20-44ae-9111-449ecde12c47"
 MathOptInterface = "b8f27783-ece8-5eb3-8dc8-9495eed66fee"
 Mooncake = "da2b9cff-9c12-43a0-ae48-6db2b0edb7d6"
+NLPModels = "a4795742-8479-5a88-8948-cc11e1c8c1a6"
+NLPModelsJuMP = "792afdf1-32c1-5681-94e0-d7bf7a5df49e"
+NLopt = "76087f3c-5699-56af-9a33-bf431cd00edd"
+Optimisers = "3bd65402-5787-11e9-1adc-39752487f4e2"
 Printf = "de0858da-6303-5e67-8744-51eddeeeb8d7"
 PythonCall = "6099a3de-0909-46bc-b1f4-468b9a2dfc0d"
 Random = "9a3f8284-a2c9-5f02-9a11-845980a1fd5c"
+SolverCore = "ff4d7338-4cf1-434d-91df-b86cb86fb843"
 
 [sources]
 ArrayDiff = {path = ".."}
+
+[compat]
+JSOSolvers = "0.14.8"
+NLPModels = "0.21.12"
+NLPModelsJuMP = "0.13.5"
+Optimisers = "0.4.7"
+SolverCore = "0.3.10"
diff --git a/perf/neural.jl b/perf/neural.jl
index bdcf972..3cc9ebf 100644
--- a/perf/neural.jl
+++ b/perf/neural.jl
@@ -1,5 +1,4 @@
-# Neural network optimization using ArrayDiff + NLopt
-#
+# Neural network optimization using ArrayDiff + NLopt
 # This demonstrates end-to-end optimization of a simple two-layer neural
 # network with array-valued decision variables, array-aware AD, and a
 # first-order NLP solver.
@@ -7,41 +6,87 @@
 using JuMP
 using ArrayDiff
 import Random
-import NLopt
-import NLPModelsJuMP
 
+"""
+    bench(solver, ::Type{T} = Float64;
+          h = 4096, d = 13, n = 178, out_dim = 2, gpu = false)
+
+Benchmark used for SIAM'OP 26 talk.
+
+Minimize the squared error `sum((W2 * tanh.(W1 * X) .- Y) .^ 2)` of a two-layer
+network over the `h × d` matrix `W1` and the `out_dim × h` matrix `W2` with
+`solver`. `X` (`d × n`) and `Y` (`out_dim × n`) are drawn with `randn` after
+seeding the default RNG with `0`. Derivatives use `ArrayDiff.Mode{V}` where `V`
+is `CUDA.CuVector{T}` if `gpu` is `true` (`CUDA` must then be imported by the
+caller) and `Vector{T}` otherwise.
+
+The solution summary is displayed and a warning is logged if the model is not
+solved and feasible. Return the JuMP model.
+"""
 function bench(solver, ::Type{T} = Float64; h::Int = 4096, d::Int = 13, n::Int = 178, out_dim = 2, gpu::Bool = false) where {T<:Real}
     Random.seed!(0)
     X = randn(T, d, n)
     Y = randn(T, out_dim, n)
 
     model = GenericModel{T}(solver)
-    V = gpu ? CUDA.CuVector{T} : Vector{T}
-    set_attribute(model, MOI.AutomaticDifferentiationBackend(), ArrayDiff.Mode{V}())
-
-    @variable(model, W1[1:h, 1:d], container = ArrayDiff.ArrayOfVariables)
-    @variable(model, W2[1:out_dim, 1:h], container = ArrayDiff.ArrayOfVariables)
-
+    @variable(model, W1[1:h, 1:d],
+        container = ArrayDiff.ArrayOfVariables)
+    @variable(model, W2[1:out_dim, 1:h],
+        container = ArrayDiff.ArrayOfVariables)
     Y_hat = W2 * tanh.(W1 * X)
+    # We need `.-` and not `-` as a workaround for
+    # https://github.com/blegat/ArrayDiff.jl/issues/83
     loss = sum((Y_hat .- Y) .^ 2)
     @objective(model, Min, loss)
 
-    for i in 1:n, j in 1:n
+    # Set non-zero starting values to avoid the saddle point at zero. Each loop
+    # runs over the index ranges its matrix was declared with.
+    for i in 1:h, j in 1:d
         set_start_value(W1[i, j], 0.1 * randn())
+    end
+    for i in 1:out_dim, j in 1:h
         set_start_value(W2[i, j], 0.1 * randn())
     end
+    V = gpu ? CUDA.CuVector{T} : Vector{T}
+    set_attribute(model,
+        MOI.AutomaticDifferentiationBackend(),
+        ArrayDiff.Mode{V}())
     optimize!(model)
 
+    display(solution_summary(model))
     if !is_solved_and_feasible(model)
         @warn(solution_summary(model))
     end
-    return solve_time(model)
+    return model
 end
 
+import NLopt
 nlopt = optimizer_with_attributes(
     NLopt.Optimizer,
     "algorithm" => :LD_LBFGS,
-    MOI.AutomaticDifferentiationBackend() => ArrayDiff.Mode(),
+    "ftol_rel" => 1e-14,
+    "ftol_abs" => 1e-14,
+    "xtol_rel" => 1e-14,
+    "maxeval"  => 100_000,
+)
+m = bench(nlopt)
+
+import NLPModelsJuMP
+include(joinpath(dirname(dirname(pathof(ArrayDiff))), "test", "OptimisersSolver.jl"))
+
+import JSOSolvers
+lbfgs = optimizer_with_attributes(
+    NLPModelsJuMP.Optimizer,
+    "solver" => JSOSolvers.lbfgs,
+)
+bench(lbfgs)
+
+adam = optimizer_with_attributes(
+    NLPModelsJuMP.Optimizer,
+    "tol" => 1e-4,
+    "solver" => OptimisersSolver,
 )
+bench(adam)
 
-bench(nlopt)
+import CUDA
+bench(adam, Float32, gpu = true)