@@ -20,11 +20,9 @@ function Optimization.instantiate_function(f, x, adtype::AutoReverseDiff,
     end
 
     if f.hess === nothing
+
         hess = function (res, θ, args...)
-
-            res .= SparseDiffTools.forwarddiff_color_jacobian(θ, colorvec = hess_colors, sparsity = hess_sparsity) do θ
-                ReverseDiff.gradient(x -> _f(x, args...), θ)
-            end
+            ReverseDiff.hessian!(res, x -> _f(x, args...), θ)
         end
     else
         hess = (H, θ, args...) -> f.hess(H, θ, p, args...)
@@ -61,9 +59,7 @@ function Optimization.instantiate_function(f, x, adtype::AutoReverseDiff,
 
         cons_h = function (res, θ)
             for i in 1:num_cons
-                res[i] .= SparseDiffTools.forwarddiff_color_jacobian(θ, colorvec = conshess_colors[i], sparsity = conshess_sparsity[i]) do θ
-                    ReverseDiff.gradient(fncs[i], θ)
-                end
+                ReverseDiff.hessian!(res[i], fncs[i], θ)
             end
         end
     else
@@ -83,82 +79,82 @@ function Optimization.instantiate_function(f, x, adtype::AutoReverseDiff,
                                       lag_h, f.lag_hess_prototype)
 end
 
-# function Optimization.instantiate_function(f, cache::Optimization.ReInitCache,
-#                                            adtype::AutoReverseDiff, num_cons = 0)
-#     _f = (θ, args...) -> first(f.f(θ, cache.p, args...))
-
-#     if f.grad === nothing
-#         grad = (res, θ, args...) -> ReverseDiff.gradient!(res, x -> _f(x, args...), θ)
-#     else
-#         grad = (G, θ, args...) -> f.grad(G, θ, cache.p, args...)
-#     end
-
-#     if f.hess === nothing
-#         hess_sparsity = Symbolics.hessian_sparsity(_f, cache.u0)
-#         hess_colors = SparseDiffTools.matrix_colors(tril(hess_sparsity))
-#         hess = function (res, θ, args...)
-#             res .= SparseDiffTools.forwarddiff_color_jacobian(θ, colorvec = hess_colors, sparsity = hess_sparsity) do θ
-#                 ReverseDiff.gradient(x -> _f(x, args...), θ)
-#             end
-#         end
-#     else
-#         hess = (H, θ, args...) -> f.hess(H, θ, cache.p, args...)
-#     end
-
-#     if f.hv === nothing
-#         hv = function (H, θ, v, args...)
-#             _θ = ForwardDiff.Dual.(θ, v)
-#             res = similar(_θ)
-#             grad(res, _θ, args...)
-#             H .= getindex.(ForwardDiff.partials.(res), 1)
-#         end
-#     else
-#         hv = f.hv
-#     end
-
-#     if f.cons === nothing
-#         cons = nothing
-#     else
-#         cons = (res, θ) -> f.cons(res, θ, cache.p)
-#         cons_oop = (x) -> (_res = zeros(eltype(x), num_cons); cons(_res, x); _res)
-#     end
-
-#     if cons !== nothing && f.cons_j === nothing
-#         cjconfig = ReverseDiff.JacobianConfig(cache.u0)
-#         cons_j = function (J, θ)
-#             ReverseDiff.jacobian!(J, cons_oop, θ, cjconfig)
-#         end
-#     else
-#         cons_j = (J, θ) -> f.cons_j(J, θ, cache.p)
-#     end
-
-#     if cons !== nothing && f.cons_h === nothing
-#         fncs = [(x) -> cons_oop(x)[i] for i in 1:num_cons]
-#         conshess_sparsity = Symbolics.hessian_sparsity.(fncs, Ref(cache.u0))
-#         conshess_colors = SparseDiffTools.matrix_colors.(conshess_sparsity)
-#         cons_h = function (res, θ)
-#             for i in 1:num_cons
-#                 res[i] .= SparseDiffTools.forwarddiff_color_jacobian(θ, colorvec = conshess_colors[i], sparsity = conshess_sparsity[i]) do θ
-#                     ReverseDiff.gradient(fncs[i], θ)
-#                 end
-#             end
-#         end
-#     else
-#         cons_h = (res, θ) -> f.cons_h(res, θ, cache.p)
-#     end
-
-#     if f.lag_h === nothing
-#         lag_h = nothing # Consider implementing this
-#     else
-#         lag_h = (res, θ, σ, μ) -> f.lag_h(res, θ, σ, μ, cache.p)
-#     end
-
-#     return OptimizationFunction{true}(f.f, adtype; grad = grad, hess = hess, hv = hv,
-#                                       cons = cons, cons_j = cons_j, cons_h = cons_h,
-#                                       hess_prototype = f.hess_prototype,
-#                                       cons_jac_prototype = f.cons_jac_prototype,
-#                                       cons_hess_prototype = f.cons_hess_prototype,
-#                                       lag_h, f.lag_hess_prototype)
-# end
+function Optimization.instantiate_function(f, cache::Optimization.ReInitCache,
+                                           adtype::AutoReverseDiff, num_cons = 0)
+    _f = (θ, args...) -> first(f.f(θ, cache.p, args...))
+
+    if f.grad === nothing
+        grad = (res, θ, args...) -> ReverseDiff.gradient!(res, x -> _f(x, args...), θ)
+    else
+        grad = (G, θ, args...) -> f.grad(G, θ, cache.p, args...)
+    end
+
+    if f.hess === nothing
+        hess_sparsity = Symbolics.hessian_sparsity(_f, cache.u0)
+        hess_colors = SparseDiffTools.matrix_colors(tril(hess_sparsity))
+        hess = function (res, θ, args...)
+            res .= SparseDiffTools.forwarddiff_color_jacobian(θ, colorvec = hess_colors, sparsity = hess_sparsity) do θ
+                ReverseDiff.gradient(x -> _f(x, args...), θ)
+            end
+        end
+    else
+        hess = (H, θ, args...) -> f.hess(H, θ, cache.p, args...)
+    end
+
+    if f.hv === nothing
+        hv = function (H, θ, v, args...)
+            _θ = ForwardDiff.Dual.(θ, v)
+            res = similar(_θ)
+            grad(res, _θ, args...)
+            H .= getindex.(ForwardDiff.partials.(res), 1)
+        end
+    else
+        hv = f.hv
+    end
+
+    if f.cons === nothing
+        cons = nothing
+    else
+        cons = (res, θ) -> f.cons(res, θ, cache.p)
+        cons_oop = (x) -> (_res = zeros(eltype(x), num_cons); cons(_res, x); _res)
+    end
+
+    if cons !== nothing && f.cons_j === nothing
+        cjconfig = ReverseDiff.JacobianConfig(cache.u0)
+        cons_j = function (J, θ)
+            ReverseDiff.jacobian!(J, cons_oop, θ, cjconfig)
+        end
+    else
+        cons_j = (J, θ) -> f.cons_j(J, θ, cache.p)
+    end
+
+    if cons !== nothing && f.cons_h === nothing
+        fncs = [(x) -> cons_oop(x)[i] for i in 1:num_cons]
+        conshess_sparsity = Symbolics.hessian_sparsity.(fncs, Ref(cache.u0))
+        conshess_colors = SparseDiffTools.matrix_colors.(conshess_sparsity)
+        cons_h = function (res, θ)
+            for i in 1:num_cons
+                res[i] .= SparseDiffTools.forwarddiff_color_jacobian(θ, colorvec = conshess_colors[i], sparsity = conshess_sparsity[i]) do θ
+                    ReverseDiff.gradient(fncs[i], θ)
+                end
+            end
+        end
+    else
+        cons_h = (res, θ) -> f.cons_h(res, θ, cache.p)
+    end
+
+    if f.lag_h === nothing
+        lag_h = nothing # Consider implementing this
+    else
+        lag_h = (res, θ, σ, μ) -> f.lag_h(res, θ, σ, μ, cache.p)
+    end
+
+    return OptimizationFunction{true}(f.f, adtype; grad = grad, hess = hess, hv = hv,
+                                      cons = cons, cons_j = cons_j, cons_h = cons_h,
+                                      hess_prototype = f.hess_prototype,
+                                      cons_jac_prototype = f.cons_jac_prototype,
+                                      cons_hess_prototype = f.cons_hess_prototype,
+                                      lag_h, f.lag_hess_prototype)
+end
 
 end
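
Note: the core change in the first two hunks replaces the forward-over-reverse sparse Hessian path with ReverseDiff's dense in-place Hessian. A minimal standalone sketch of that call, outside Optimization.jl; the objective `rosenbrock`, the point `θ`, and the buffer `H` are illustrative names, not part of the PR:

```julia
using ReverseDiff

# Toy scalar objective; any scalar-valued function of a vector works here.
rosenbrock(x) = (1.0 - x[1])^2 + 100.0 * (x[2] - x[1]^2)^2

θ = [0.5, 0.5]
H = zeros(length(θ), length(θ))

# Dense in-place Hessian, the same call the new `hess` and `cons_h` closures use.
ReverseDiff.hessian!(H, rosenbrock, θ)
```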
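The uncommented `ReInitCache` method keeps the Dual-seeding Hessian-vector product as its `hv` fallback. A rough standalone sketch of that trick under the same assumption the extension makes (that ReverseDiff can differentiate through `ForwardDiff.Dual`-valued inputs); `f`, `θ`, and `v` below are illustrative names, not from the PR:

```julia
using ForwardDiff, ReverseDiff

f(x) = sum(abs2, x) + x[1] * x[2]

θ = [1.0, 2.0]
v = [0.0, 1.0]

# Seed the input with the direction v as a single dual partial, take the gradient,
# then read the partials back out: this yields H(θ) * v without forming H.
θdual = ForwardDiff.Dual.(θ, v)
g = similar(θdual)
ReverseDiff.gradient!(g, f, θdual)
Hv = getindex.(ForwardDiff.partials.(g), 1)
```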