From 3ec0acc1e2c3d68248727b9097e11c85d56599b8 Mon Sep 17 00:00:00 2001
From: Yash Raj Singh <yash.raj270998@gmail.com>
Date: Mon, 20 Feb 2023 23:47:57 +0100
Subject: [PATCH 1/3] multivariate halley and some tests

---
 lib/SimpleNonlinearSolve/src/halley.jl      | 77 ++++++++++++++++-----
 lib/SimpleNonlinearSolve/test/basictests.jl | 21 +++---
 2 files changed, 71 insertions(+), 27 deletions(-)

diff --git a/lib/SimpleNonlinearSolve/src/halley.jl b/lib/SimpleNonlinearSolve/src/halley.jl
index 77ea3a4a1..557f43473 100644
--- a/lib/SimpleNonlinearSolve/src/halley.jl
+++ b/lib/SimpleNonlinearSolve/src/halley.jl
@@ -42,10 +42,28 @@ function SciMLBase.__solve(prob::NonlinearProblem,
                            maxiters = 1000, kwargs...)
     f = Base.Fix2(prob.f, prob.p)
     x = float(prob.u0)
-    fx = f(x)
-    # fx = float(prob.u0)
-    if !isa(fx, Number) || !isa(x, Number)
-        error("Halley currently only supports scalar-valued single-variable functions")
+    # Defining all derivative expressions in one place before the iterations
+    if isa(x, AbstractArray)
+        if alg_autodiff(alg)
+            n = length(x)
+            a_dfdx(x) = ForwardDiff.jacobian(f, x)
+            a_d2fdx(x) = ForwardDiff.jacobian(a_dfdx, x)
+            A = Array{Union{Nothing, Number}}(nothing, n, n)
+            #fx = f(x)
+        else
+            n = length(x)
+            f_dfdx(x) = FiniteDiff.finite_difference_jacobian(f, x, diff_type(alg), eltype(x))
+            f_d2fdx(x) = FiniteDiff.finite_difference_jacobian(f_dfdx, x, diff_type(alg), eltype(x))
+            A = Array{Union{Nothing, Number}}(nothing, n, n)
+        end
+    elseif isa(x, Number)
+        if alg_autodiff(alg)
+            sa_dfdx(x) = ForwardDiff.derivative(f, x)
+            sa_d2fdx(x) = ForwardDiff.derivative(sa_dfdx, x)
+        else
+            sf_dfdx(x) = FiniteDiff.finite_difference_derivative(f, x, diff_type(alg), eltype(x))
+            sf_d2fdx(x) = FiniteDiff.finite_difference_derivative(sf_dfdx, x, diff_type(alg), eltype(x))
+        end
     end
     T = typeof(x)
 
@@ -65,22 +83,49 @@ function SciMLBase.__solve(prob::NonlinearProblem,
 
     for i in 1:maxiters
         if alg_autodiff(alg)
-            fx = f(x)
-            dfdx(x) = ForwardDiff.derivative(f, x)
-            dfx = dfdx(x)
-            d2fx = ForwardDiff.derivative(dfdx, x)
+            if isa(x, Number)
+                fx = f(x)
+                dfx = sa_dfdx(x)
+                d2fx = sa_d2fdx(x)
+            else
+                fx = f(x)
+                dfx = a_dfdx(x)
+                d2fx = reshape(a_d2fdx(x), (n,n,n)) # A 3-dim Hessian Tensor
+                ai = -(dfx \ fx)
+                for j in 1:n
+                    tmp = transpose(d2fx[:, :, j] * ai)
+                    A[j, :] = tmp
+                end
+                bi = (dfx) \ (A * ai)
+                ci = (ai .* ai) ./ (ai .+ (0.5 .* bi))
+            end
         else
-            fx = f(x)
-            dfx = FiniteDiff.finite_difference_derivative(f, x, diff_type(alg), eltype(x),
-                                                          fx)
-            d2fx = FiniteDiff.finite_difference_derivative(x -> FiniteDiff.finite_difference_derivative(f,
-                                                                                                        x),
-                                                           x, diff_type(alg), eltype(x), fx)
+            if isa(x, Number)
+                fx = f(x)
+                dfx = sf_dfdx(x)
+                d2fx = sf_d2fdx(x)
+            else
+                fx = f(x)
+                dfx = f_dfdx(x)
+                d2fx = reshape(f_d2fdx(x), (n,n,n)) # A 3-dim Hessian Tensor
+                ai = -(dfx \ fx)
+                for j in 1:n
+                    tmp = transpose(d2fx[:, :, j] * ai)
+                    A[j, :] = tmp
+                end
+                bi = (dfx) \ (A * ai)
+                ci = (ai .* ai) ./ (ai .+ (0.5 .* bi))
+            end
         end
         iszero(fx) &&
             return SciMLBase.build_solution(prob, alg, x, fx; retcode = ReturnCode.Success)
-        Δx = (2 * dfx^2 - fx * d2fx) \ (2fx * dfx)
-        x -= Δx
+        if isa(x, Number)
+            Δx = (2 * dfx^2 - fx * d2fx) \ (2fx * dfx)
+            x -= Δx
+        else
+            Δx = ci
+            x += Δx
+        end
         if isapprox(x, xo, atol = atol, rtol = rtol)
             return SciMLBase.build_solution(prob, alg, x, fx; retcode = ReturnCode.Success)
         end
diff --git a/lib/SimpleNonlinearSolve/test/basictests.jl b/lib/SimpleNonlinearSolve/test/basictests.jl
index 26e92dfe8..8fbdfffaf 100644
--- a/lib/SimpleNonlinearSolve/test/basictests.jl
+++ b/lib/SimpleNonlinearSolve/test/basictests.jl
@@ -49,10 +49,10 @@ function benchmark_scalar(f, u0)
     sol = (solve(probN, Halley()))
 end
 
-# function ff(u, p)
-#     u .* u .- 2
-# end
-# const cu0 = @SVector[1.0, 1.0]
+function ff(u, p)
+    u .* u .- 2
+end
+const cu0 = @SVector[1.0, 1.0]
 function sf(u, p)
     u * u - 2
 end
@@ -62,6 +62,10 @@ sol = benchmark_scalar(sf, csu0)
 @test sol.retcode === ReturnCode.Success
 @test sol.u * sol.u - 2 < 1e-9
 
+sol = benchmark_scalar(ff, cu0)
+@test sol.retcode === ReturnCode.Success
+@test sol.u .* sol.u .- 2 < [1e-9, 1e-9]
+
 if VERSION >= v"1.7"
     @test (@ballocated benchmark_scalar(sf, csu0)) == 0
 end
@@ -122,7 +126,7 @@ using ForwardDiff
 f, u0 = (u, p) -> u .* u .- p, @SVector[1.0, 1.0]
 
 for alg in (SimpleNewtonRaphson(), LBroyden(), Klement(), SimpleTrustRegion(),
-            SimpleDFSane(), BROYDEN_SOLVERS...)
+            SimpleDFSane(), Halley(), BROYDEN_SOLVERS...)
     g = function (p)
         probN = NonlinearProblem{false}(f, csu0, p)
         sol = solve(probN, alg, abstol = 1e-9)
@@ -221,7 +225,7 @@ probN = NonlinearProblem(f, u0)
 
 for alg in (SimpleNewtonRaphson(), SimpleNewtonRaphson(; autodiff = false),
             SimpleTrustRegion(),
-            SimpleTrustRegion(; autodiff = false), LBroyden(), Klement(), SimpleDFSane(),
+            SimpleTrustRegion(; autodiff = false), Halley(), Halley(; autodiff = false), LBroyden(), Klement(), SimpleDFSane(),
             BROYDEN_SOLVERS...)
     sol = solve(probN, alg)
 
@@ -229,11 +233,6 @@ for alg in (SimpleNewtonRaphson(), SimpleNewtonRaphson(; autodiff = false),
     @test sol.u[end] ≈ sqrt(2.0)
 end
 
-# Separate Error check for Halley; will be included in above error checks for the improved Halley
-f, u0 = (u, p) -> u * u - 2.0, 1.0
-probN = NonlinearProblem(f, u0)
-
-@test solve(probN, Halley()).u ≈ sqrt(2.0)
 
 for u0 in [1.0, [1, 1.0]]
     local f, probN, sol

From 5f531f7f1e923dd68dbd009142d89116f0c7bb67 Mon Sep 17 00:00:00 2001
From: Yash Raj Singh <yash.raj270998@gmail.com>
Date: Tue, 21 Feb 2023 22:42:23 +0100
Subject: [PATCH 2/3] modified allocations

---
 lib/SimpleNonlinearSolve/src/halley.jl | 50 +++++++-------------------
 1 file changed, 13 insertions(+), 37 deletions(-)

diff --git a/lib/SimpleNonlinearSolve/src/halley.jl b/lib/SimpleNonlinearSolve/src/halley.jl
index 557f43473..70b8a7f8c 100644
--- a/lib/SimpleNonlinearSolve/src/halley.jl
+++ b/lib/SimpleNonlinearSolve/src/halley.jl
@@ -42,28 +42,8 @@ function SciMLBase.__solve(prob::NonlinearProblem,
                            maxiters = 1000, kwargs...)
     f = Base.Fix2(prob.f, prob.p)
     x = float(prob.u0)
-    # Defining all derivative expressions in one place before the iterations
     if isa(x, AbstractArray)
-        if alg_autodiff(alg)
-            n = length(x)
-            a_dfdx(x) = ForwardDiff.jacobian(f, x)
-            a_d2fdx(x) = ForwardDiff.jacobian(a_dfdx, x)
-            A = Array{Union{Nothing, Number}}(nothing, n, n)
-            #fx = f(x)
-        else
-            n = length(x)
-            f_dfdx(x) = FiniteDiff.finite_difference_jacobian(f, x, diff_type(alg), eltype(x))
-            f_d2fdx(x) = FiniteDiff.finite_difference_jacobian(f_dfdx, x, diff_type(alg), eltype(x))
-            A = Array{Union{Nothing, Number}}(nothing, n, n)
-        end
-    elseif isa(x, Number)
-        if alg_autodiff(alg)
-            sa_dfdx(x) = ForwardDiff.derivative(f, x)
-            sa_d2fdx(x) = ForwardDiff.derivative(sa_dfdx, x)
-        else
-            sf_dfdx(x) = FiniteDiff.finite_difference_derivative(f, x, diff_type(alg), eltype(x))
-            sf_d2fdx(x) = FiniteDiff.finite_difference_derivative(sf_dfdx, x, diff_type(alg), eltype(x))
-        end
+        n = length(x)
     end
     T = typeof(x)
 
@@ -85,34 +65,30 @@ function SciMLBase.__solve(prob::NonlinearProblem,
         if alg_autodiff(alg)
             if isa(x, Number)
                 fx = f(x)
-                dfx = sa_dfdx(x)
-                d2fx = sa_d2fdx(x)
+                dfx = ForwardDiff.derivative(f, x)
+                d2fx = ForwardDiff.derivative(x -> ForwardDiff.derivative(f, x), x)
             else
                 fx = f(x)
-                dfx = a_dfdx(x)
-                d2fx = reshape(a_d2fdx(x), (n,n,n)) # A 3-dim Hessian Tensor
+                dfx = ForwardDiff.jacobian(f, x)
+                d2fx = ForwardDiff.jacobian(x -> ForwardDiff.jacobian(f, x), x) #  n^2 by n matrix
                 ai = -(dfx \ fx)
-                for j in 1:n
-                    tmp = transpose(d2fx[:, :, j] * ai)
-                    A[j, :] = tmp
-                end
+                A = reshape(d2fx * ai, (n, n))
                 bi = (dfx) \ (A * ai)
                 ci = (ai .* ai) ./ (ai .+ (0.5 .* bi))
             end
         else
             if isa(x, Number)
                 fx = f(x)
-                dfx = sf_dfdx(x)
-                d2fx = sf_d2fdx(x)
+                dfx = FiniteDiff.finite_difference_derivative(f, x, diff_type(alg), eltype(x))
+                d2fx = FiniteDiff.finite_difference_derivative(x -> FiniteDiff.finite_difference_derivative(f, x), x,
+                                                                                            diff_type(alg), eltype(x))
             else
                 fx = f(x)
-                dfx = f_dfdx(x)
-                d2fx = reshape(f_d2fdx(x), (n,n,n)) # A 3-dim Hessian Tensor
+                dfx = FiniteDiff.finite_difference_jacobian(f, x, diff_type(alg), eltype(x))
+                d2fx = FiniteDiff.finite_difference_jacobian(x -> FiniteDiff.finite_difference_jacobian(f, x), x, 
+                                                                        diff_type(alg), eltype(x))
                 ai = -(dfx \ fx)
-                for j in 1:n
-                    tmp = transpose(d2fx[:, :, j] * ai)
-                    A[j, :] = tmp
-                end
+                A = reshape(d2fx * ai, (n, n))
                 bi = (dfx) \ (A * ai)
                 ci = (ai .* ai) ./ (ai .+ (0.5 .* bi))
             end

From 7f542660bbeeb2db088f70db93a90c6f970d8a64 Mon Sep 17 00:00:00 2001
From: Yash Raj Singh <yash.raj270998@gmail.com>
Date: Thu, 23 Feb 2023 01:29:26 +0100
Subject: [PATCH 3/3] fixed allocations and tests pass

---
 lib/SimpleNonlinearSolve/src/halley.jl | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/lib/SimpleNonlinearSolve/src/halley.jl b/lib/SimpleNonlinearSolve/src/halley.jl
index 70b8a7f8c..0e5417642 100644
--- a/lib/SimpleNonlinearSolve/src/halley.jl
+++ b/lib/SimpleNonlinearSolve/src/halley.jl
@@ -42,6 +42,7 @@ function SciMLBase.__solve(prob::NonlinearProblem,
                            maxiters = 1000, kwargs...)
     f = Base.Fix2(prob.f, prob.p)
     x = float(prob.u0)
+    fx = f(x)
     if isa(x, AbstractArray)
         n = length(x)
     end
@@ -70,7 +71,7 @@ function SciMLBase.__solve(prob::NonlinearProblem,
             else
                 fx = f(x)
                 dfx = ForwardDiff.jacobian(f, x)
-                d2fx = ForwardDiff.jacobian(x -> ForwardDiff.jacobian(f, x), x) #  n^2 by n matrix
+                d2fx = ForwardDiff.jacobian(x -> ForwardDiff.jacobian(f, x), x)
                 ai = -(dfx \ fx)
                 A = reshape(d2fx * ai, (n, n))
                 bi = (dfx) \ (A * ai)