From a9d884f85c4e9ff4c37e54724ef373389d913c70 Mon Sep 17 00:00:00 2001 From: Avik Pal Date: Sat, 14 Oct 2023 19:05:07 -0400 Subject: [PATCH 1/5] Add a wrapper over LeastSquaresOptim --- Project.toml | 9 +++- ext/NonlinearSolveLeastSquaresOptimExt.jl | 65 +++++++++++++++++++++++ src/NonlinearSolve.jl | 5 +- src/algorithms.jl | 28 ++++++++++ src/gaussnewton.jl | 4 +- src/jacobian.jl | 8 +-- src/levenberg.jl | 5 +- src/utils.jl | 8 +++ 8 files changed, 123 insertions(+), 9 deletions(-) create mode 100644 ext/NonlinearSolveLeastSquaresOptimExt.jl create mode 100644 src/algorithms.jl diff --git a/Project.toml b/Project.toml index fd8cc2fce..bd2fca7ae 100644 --- a/Project.toml +++ b/Project.toml @@ -1,7 +1,7 @@ name = "NonlinearSolve" uuid = "8913a72c-1f9b-4ce2-8d82-65094dcecaec" authors = ["SciML"] -version = "2.2.1" +version = "2.3.0" [deps] ADTypes = "47edcb42-4c32-4615-8424-f2b9edc5f35b" @@ -24,6 +24,12 @@ SparseDiffTools = "47a9eef4-7e08-11e9-0b38-333d64bd3804" StaticArraysCore = "1e83bf80-4336-4d27-bf5d-d5a4f845583c" UnPack = "3a884ed6-31ef-47d7-9d2a-63182c4928ed" +[weakdeps] +LeastSquaresOptim = "0fc2ff8b-aaa3-5acd-a817-1944a5e08891" + +[extensions] +NonlinearSolveLeastSquaresOptimExt = "LeastSquaresOptim" + [compat] ADTypes = "0.2" ArrayInterface = "6.0.24, 7" @@ -33,6 +39,7 @@ EnumX = "1" Enzyme = "0.11" FiniteDiff = "2" ForwardDiff = "0.10.3" +LeastSquaresOptim = "0.8" LineSearches = "7" LinearSolve = "2" NonlinearProblemLibrary = "0.1" diff --git a/ext/NonlinearSolveLeastSquaresOptimExt.jl b/ext/NonlinearSolveLeastSquaresOptimExt.jl new file mode 100644 index 000000000..b0e562a3b --- /dev/null +++ b/ext/NonlinearSolveLeastSquaresOptimExt.jl @@ -0,0 +1,65 @@ +module NonlinearSolveLeastSquaresOptimExt + +using NonlinearSolve, SciMLBase +import ConcreteStructs: @concrete +import LeastSquaresOptim as LSO + +extension_loaded(::Val{:LeastSquaresOptim}) = true + +function _lso_solver(::LSOptimSolver{alg, linsolve}) where {alg, linsolve} + ls = linsolve == :qr ? LSO.QR() : + (linsolve == :cholesky ? LSO.Cholesky() : + (linsolve == :lsmr ? LSO.LSMR() : nothing)) + if alg == :lm + return LSO.LevenbergMarquardt(ls) + elseif alg == :dogleg + return LSO.Dogleg(ls) + else + throw(ArgumentError("Unknown LeastSquaresOptim Algorithm: $alg")) + end +end + +@concrete struct LeastSquaresOptimCache + prob + alg + allocated_prob + kwargs +end + +@concrete struct FunctionWrapper{iip} + f + p +end + +(f::FunctionWrapper{true})(du, u) = f.f(du, u, f.p) +(f::FunctionWrapper{false})(du, u) = (du .= f.f(u, f.p)) + +function SciMLBase.__init(prob::NonlinearLeastSquaresProblem, alg::LSOptimSolver, args...; + abstol = 1e-8, reltol = 1e-8, verbose = false, maxiters = 1000, kwargs...) + iip = SciMLBase.isinplace(prob) + + f! = FunctionWrapper{iip}(prob.f, prob.p) + g! = prob.f.jac === nothing ? nothing : FunctionWrapper{iip}(prob.f.jac, prob.p) + + lsoprob = LSO.LeastSquaresProblem(; x = prob.u0, f!, y = prob.f.resid_prototype, g!, + J = prob.f.jac_prototype, alg.autodiff, + output_length = length(prob.f.resid_prototype)) + allocated_prob = LSO.LeastSquaresProblemAllocated(lsoprob, _lso_solver(alg)) + + return LeastSquaresOptimCache(prob, alg, allocated_prob, + (; x_tol = abstol, f_tol = reltol, iterations = maxiters, show_trace = verbose, + kwargs...)) +end + +function SciMLBase.solve!(cache::LeastSquaresOptimCache) + res = LSO.optimize!(cache.allocated_prob; cache.kwargs...) + maxiters = cache.kwargs[:iterations] + retcode = res.x_converged || res.f_converged || res.g_converged ? ReturnCode.Success : + (res.iterations ≥ maxiters ? ReturnCode.MaxIters : + ReturnCode.ConvergenceFailure) + stats = SciMLBase.NLStats(res.f_calls, res.g_calls, -1, -1, res.iterations) + return SciMLBase.build_solution(cache.prob, cache.alg, res.minimizer, res.ssr / 2; + retcode, original = res, stats) +end + +end diff --git a/src/NonlinearSolve.jl b/src/NonlinearSolve.jl index f8ae69939..d9dcbba39 100644 --- a/src/NonlinearSolve.jl +++ b/src/NonlinearSolve.jl @@ -30,6 +30,8 @@ abstract type AbstractNewtonAlgorithm{CJ, AD} <: AbstractNonlinearSolveAlgorithm abstract type AbstractNonlinearSolveCache{iip} end +extension_loaded(::Val) = false + isinplace(::AbstractNonlinearSolveCache{iip}) where {iip} = iip function SciMLBase.__solve(prob::Union{NonlinearProblem, NonlinearLeastSquaresProblem}, @@ -60,6 +62,7 @@ function SciMLBase.solve!(cache::AbstractNonlinearSolveCache) end include("utils.jl") +include("algorithms.jl") include("linesearch.jl") include("raphson.jl") include("trustRegion.jl") @@ -92,7 +95,7 @@ end export RadiusUpdateSchemes -export NewtonRaphson, TrustRegion, LevenbergMarquardt, GaussNewton +export NewtonRaphson, TrustRegion, LevenbergMarquardt, GaussNewton, LSOptimSolver export LineSearch diff --git a/src/algorithms.jl b/src/algorithms.jl new file mode 100644 index 000000000..b9a694866 --- /dev/null +++ b/src/algorithms.jl @@ -0,0 +1,28 @@ +# Define Algorithms extended via extensions +""" + LSOptimSolver(alg = :lm; linsolve = nothing, autodiff::Symbol = :central) + +Wrapper over [LeastSquaresOptim.jl](https://github.com/matthieugomez/LeastSquaresOptim.jl) for solving +`NonlinearLeastSquaresProblem`. + +## Arguments: + +- `alg`: Algorithm to use. Can be `:lm` or `:dogleg`. +- `linsolve`: Linear solver to use. Can be `:qr`, `:cholesky` or `:lsmr`. If + `nothing`, then `LeastSquaresOptim.jl` will choose the best linear solver based + on the Jacobian structure. + +!!! note + This algorithm is only available if `LeastSquaresOptim.jl` is installed. +""" +struct LSOptimSolver{alg, linsolve} <: AbstractNonlinearSolveAlgorithm + autodiff::Symbol + + function LSOptimSolver(alg = :lm; linsolve = nothing, autodiff::Symbol = :central) + @assert alg in (:lm, :dogleg) + @assert linsolve === nothing || linsolve in (:qr, :cholesky, :lsmr) + @assert autodiff in (:central, :forward) + + return new{alg, linsolve}(autodiff) + end +end diff --git a/src/gaussnewton.jl b/src/gaussnewton.jl index 7c94ec4f3..6c03b6c2e 100644 --- a/src/gaussnewton.jl +++ b/src/gaussnewton.jl @@ -93,8 +93,8 @@ end function perform_step!(cache::GaussNewtonCache{true}) @unpack u, fu1, f, p, alg, J, JᵀJ, Jᵀf, linsolve, du = cache jacobian!!(J, cache) - mul!(JᵀJ, J', J) - mul!(Jᵀf, J', fu1) + __matmul!(JᵀJ, J', J) + __matmul!(Jᵀf, J', fu1) # u = u - J \ fu linres = dolinsolve(alg.precs, linsolve; A = JᵀJ, b = _vec(Jᵀf), linu = _vec(du), diff --git a/src/jacobian.jl b/src/jacobian.jl index a069598bb..10ac69ec6 100644 --- a/src/jacobian.jl +++ b/src/jacobian.jl @@ -65,7 +65,7 @@ function jacobian_caches(alg::AbstractNonlinearSolveAlgorithm, f, u, p, ::Val{ii # NOTE: The deepcopy is needed here since we are using the resid_prototype elsewhere fu = f.resid_prototype === nothing ? (iip ? _mutable_zero(u) : _mutable(f(u, p))) : (iip ? deepcopy(f.resid_prototype) : f.resid_prototype) - if !has_analytic_jac && (linsolve_needs_jac || alg_wants_jac) + if !has_analytic_jac && (linsolve_needs_jac || alg_wants_jac || needsJᵀJ) sd = sparsity_detection_alg(f, alg.ad) ad = alg.ad jac_cache = iip ? sparse_jacobian_cache(ad, sd, uf, fu, _maybe_mutable(u, ad)) : @@ -74,7 +74,9 @@ function jacobian_caches(alg::AbstractNonlinearSolveAlgorithm, f, u, p, ::Val{ii jac_cache = nothing end - J = if !(linsolve_needs_jac || alg_wants_jac) + # FIXME: To properly support needsJᵀJ without Jacobian, we need to implement + # a reverse diff operation with the seed being `Jx`, this is not yet implemented + J = if !(linsolve_needs_jac || alg_wants_jac || needsJᵀJ) # We don't need to construct the Jacobian JacVec(uf, u; autodiff = __get_nonsparse_ad(alg.ad)) else @@ -114,7 +116,7 @@ __get_nonsparse_ad(::AutoSparseZygote) = AutoZygote() __get_nonsparse_ad(ad) = ad __init_JᵀJ(J::Number) = zero(J) -__init_JᵀJ(J::AbstractArray) = zeros(eltype(J), size(J, 2), size(J, 2)) +__init_JᵀJ(J::AbstractArray) = J' * J __init_JᵀJ(J::StaticArray) = MArray{Tuple{size(J, 2), size(J, 2)}, eltype(J)}(undef) ## Special Handling for Scalars diff --git a/src/levenberg.jl b/src/levenberg.jl index 1a0343010..8b0e5728e 100644 --- a/src/levenberg.jl +++ b/src/levenberg.jl @@ -192,7 +192,7 @@ function perform_step!(cache::LevenbergMarquardtCache{true}) if make_new_J jacobian!!(cache.J, cache) - mul!(cache.JᵀJ, cache.J', cache.J) + __matmul!(cache.JᵀJ, cache.J', cache.J) cache.DᵀD .= max.(cache.DᵀD, Diagonal(cache.JᵀJ)) cache.make_new_J = false cache.stats.njacs += 1 @@ -216,7 +216,8 @@ function perform_step!(cache::LevenbergMarquardtCache{true}) mul!(cache.Jv, J, v) @. cache.fu_tmp = (2 / h) * ((cache.fu_tmp - fu1) / h - cache.Jv) mul!(cache.u_tmp, J', cache.fu_tmp) - linres = dolinsolve(alg.precs, linsolve; A = cache.mat_tmp, b = _vec(cache.u_tmp), + # NOTE: Don't pass `A` in again, since we want to reuse the previous solve + linres = dolinsolve(alg.precs, linsolve; b = _vec(cache.u_tmp), linu = _vec(cache.du), p = p, reltol = cache.abstol) cache.linsolve = linres.cache @. cache.a = -cache.du diff --git a/src/utils.jl b/src/utils.jl index bd6a5a036..6dd1eeb75 100644 --- a/src/utils.jl +++ b/src/utils.jl @@ -163,3 +163,11 @@ function evaluate_f(f, u, p, ::Val{iip}; fu = nothing) where {iip} return f(u, p) end end + +""" + __matmul!(C, A, B) + +Defaults to `mul!(C, A, B)`. However, for sparse matrices uses `C .= A * B`. +""" +__matmul!(C, A, B) = mul!(C, A, B) +__matmul!(C::AbstractSparseMatrix, A, B) = C .= A * B From 890ae75efab759a55b4e54e6684a3633405aee03 Mon Sep 17 00:00:00 2001 From: Avik Pal Date: Sat, 14 Oct 2023 20:17:15 -0400 Subject: [PATCH 2/5] Add tests --- Project.toml | 3 ++- ext/NonlinearSolveLeastSquaresOptimExt.jl | 9 +++++--- test/nonlinear_least_squares.jl | 28 ++++++++--------------- 3 files changed, 17 insertions(+), 23 deletions(-) diff --git a/Project.toml b/Project.toml index bd2fca7ae..b4f7c2553 100644 --- a/Project.toml +++ b/Project.toml @@ -58,6 +58,7 @@ julia = "1.9" BenchmarkTools = "6e4b80f9-dd63-53aa-95a3-0cdb28fa8baf" Enzyme = "7da242da-08ed-463a-9acd-ee780be4f1d9" ForwardDiff = "f6369f11-7733-5829-9624-2563aa707210" +LeastSquaresOptim = "0fc2ff8b-aaa3-5acd-a817-1944a5e08891" LinearAlgebra = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e" LinearSolve = "7ed4a6bd-45f5-4d41-b270-4a48e9bafcae" NonlinearProblemLibrary = "b7050fa9-e91f-4b37-bcee-a89a063da141" @@ -71,4 +72,4 @@ Test = "8dfed614-e22c-5e08-85e1-65c5234f0b40" Zygote = "e88e6eb3-aa80-5325-afca-941959d7151f" [targets] -test = ["Enzyme", "BenchmarkTools", "SafeTestsets", "Pkg", "Test", "ForwardDiff", "StaticArrays", "Symbolics", "LinearSolve", "Random", "LinearAlgebra", "Zygote", "SparseDiffTools", "NonlinearProblemLibrary"] +test = ["Enzyme", "BenchmarkTools", "SafeTestsets", "Pkg", "Test", "ForwardDiff", "StaticArrays", "Symbolics", "LinearSolve", "Random", "LinearAlgebra", "Zygote", "SparseDiffTools", "NonlinearProblemLibrary", "LeastSquaresOptim"] diff --git a/ext/NonlinearSolveLeastSquaresOptimExt.jl b/ext/NonlinearSolveLeastSquaresOptimExt.jl index b0e562a3b..7514931d5 100644 --- a/ext/NonlinearSolveLeastSquaresOptimExt.jl +++ b/ext/NonlinearSolveLeastSquaresOptimExt.jl @@ -41,9 +41,12 @@ function SciMLBase.__init(prob::NonlinearLeastSquaresProblem, alg::LSOptimSolver f! = FunctionWrapper{iip}(prob.f, prob.p) g! = prob.f.jac === nothing ? nothing : FunctionWrapper{iip}(prob.f.jac, prob.p) - lsoprob = LSO.LeastSquaresProblem(; x = prob.u0, f!, y = prob.f.resid_prototype, g!, - J = prob.f.jac_prototype, alg.autodiff, - output_length = length(prob.f.resid_prototype)) + resid_prototype = prob.f.resid_prototype === nothing ? + (!iip ? prob.f(prob.u0, prob.p) : zeros(prob.u0)) : + prob.f.resid_prototype + + lsoprob = LSO.LeastSquaresProblem(; x = prob.u0, f!, y = resid_prototype, g!, + J = prob.f.jac_prototype, alg.autodiff, output_length = length(resid_prototype)) allocated_prob = LSO.LeastSquaresProblemAllocated(lsoprob, _lso_solver(alg)) return LeastSquaresOptimCache(prob, alg, allocated_prob, diff --git a/test/nonlinear_least_squares.jl b/test/nonlinear_least_squares.jl index 27775bc40..c9fda61ba 100644 --- a/test/nonlinear_least_squares.jl +++ b/test/nonlinear_least_squares.jl @@ -1,4 +1,5 @@ using NonlinearSolve, LinearSolve, LinearAlgebra, Test, Random +import LeastSquaresOptim true_function(x, θ) = @. θ[1] * exp(θ[2] * x) * cos(θ[3] * x + θ[4]) true_function(y, x, θ) = (@. y = θ[1] * exp(θ[2] * x) * cos(θ[3] * x + θ[4])) @@ -25,22 +26,11 @@ prob_oop = NonlinearLeastSquaresProblem{false}(loss_function, θ_init, x) prob_iip = NonlinearLeastSquaresProblem(NonlinearFunction(loss_function; resid_prototype = zero(y_target)), θ_init, x) -sol = solve(prob_oop, GaussNewton(; linsolve = NormalCholeskyFactorization()); - maxiters = 1000, abstol = 1e-8) -@test SciMLBase.successful_retcode(sol) -@test norm(sol.resid) < 1e-6 - -sol = solve(prob_iip, GaussNewton(; linsolve = NormalCholeskyFactorization()); - maxiters = 1000, abstol = 1e-8) -@test SciMLBase.successful_retcode(sol) -@test norm(sol.resid) < 1e-6 - -sol = solve(prob_oop, LevenbergMarquardt(; linsolve = NormalCholeskyFactorization()); - maxiters = 1000, abstol = 1e-8) -@test SciMLBase.successful_retcode(sol) -@test norm(sol.resid) < 1e-6 - -sol = solve(prob_iip, LevenbergMarquardt(; linsolve = NormalCholeskyFactorization()); - maxiters = 1000, abstol = 1e-8) -@test SciMLBase.successful_retcode(sol) -@test norm(sol.resid) < 1e-6 +nlls_problems = [prob_oop, prob_iip] +solvers = [GaussNewton(), LevenbergMarquardt(), LSOptimSolver(:lm), LSOptimSolver(:dogleg)] + +for prob in nlls_problems, solver in solvers + @time sol = solve(prob, solver; maxiters = 1000, abstol = 1e-8) + @test SciMLBase.successful_retcode(sol) + @test norm(sol.resid) < 1e-6 +end From 8f68ef1324ab56d950b80eea5b2e39ef06b5db12 Mon Sep 17 00:00:00 2001 From: Avik Pal Date: Sun, 15 Oct 2023 14:22:15 -0400 Subject: [PATCH 3/5] Run autoselect --- src/gaussnewton.jl | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/gaussnewton.jl b/src/gaussnewton.jl index 6c03b6c2e..f8c0c7fbe 100644 --- a/src/gaussnewton.jl +++ b/src/gaussnewton.jl @@ -41,8 +41,8 @@ for large-scale and numerically-difficult nonlinear least squares problems. precs end -function GaussNewton(; concrete_jac = nothing, linsolve = NormalCholeskyFactorization(), - precs = DEFAULT_PRECS, adkwargs...) +function GaussNewton(; concrete_jac = nothing, linsolve = nothing, precs = DEFAULT_PRECS, + adkwargs...) ad = default_adargs_to_adtype(; adkwargs...) return GaussNewton{_unwrap_val(concrete_jac)}(ad, linsolve, precs) end From f151a0aa270ade6845fbd51c92a5cf9ec1db095f Mon Sep 17 00:00:00 2001 From: Avik Pal Date: Sun, 15 Oct 2023 18:40:46 -0400 Subject: [PATCH 4/5] Use symmetric linear solve if possible --- src/gaussnewton.jl | 16 ++++++++-------- src/jacobian.jl | 14 ++++++++++---- src/levenberg.jl | 14 +++++++------- test/nonlinear_least_squares.jl | 9 +++++++-- 4 files changed, 32 insertions(+), 21 deletions(-) diff --git a/src/gaussnewton.jl b/src/gaussnewton.jl index f8c0c7fbe..42521189e 100644 --- a/src/gaussnewton.jl +++ b/src/gaussnewton.jl @@ -1,6 +1,6 @@ """ - GaussNewton(; concrete_jac = nothing, linsolve = nothing, precs = DEFAULT_PRECS, - adkwargs...) + GaussNewton(; concrete_jac = nothing, linsolve = nothing, + precs = DEFAULT_PRECS, adkwargs...) An advanced GaussNewton implementation with support for efficient handling of sparse matrices via colored automatic differentiation and preconditioned linear solvers. Designed @@ -41,8 +41,8 @@ for large-scale and numerically-difficult nonlinear least squares problems. precs end -function GaussNewton(; concrete_jac = nothing, linsolve = nothing, precs = DEFAULT_PRECS, - adkwargs...) +function GaussNewton(; concrete_jac = nothing, linsolve = CholeskyFactorization(), + precs = DEFAULT_PRECS, adkwargs...) ad = default_adargs_to_adtype(; adkwargs...) return GaussNewton{_unwrap_val(concrete_jac)}(ad, linsolve, precs) end @@ -97,8 +97,8 @@ function perform_step!(cache::GaussNewtonCache{true}) __matmul!(Jᵀf, J', fu1) # u = u - J \ fu - linres = dolinsolve(alg.precs, linsolve; A = JᵀJ, b = _vec(Jᵀf), linu = _vec(du), - p, reltol = cache.abstol) + linres = dolinsolve(alg.precs, linsolve; A = __maybe_symmetric(JᵀJ), b = _vec(Jᵀf), + linu = _vec(du), p, reltol = cache.abstol) cache.linsolve = linres.cache @. u = u - du f(cache.fu_new, u, p) @@ -125,8 +125,8 @@ function perform_step!(cache::GaussNewtonCache{false}) if linsolve === nothing cache.du = fu1 / cache.J else - linres = dolinsolve(alg.precs, linsolve; A = cache.JᵀJ, b = _vec(cache.Jᵀf), - linu = _vec(cache.du), p, reltol = cache.abstol) + linres = dolinsolve(alg.precs, linsolve; A = __maybe_symmetric(cache.JᵀJ), + b = _vec(cache.Jᵀf), linu = _vec(cache.du), p, reltol = cache.abstol) cache.linsolve = linres.cache end cache.u = @. u - cache.du # `u` might not support mutation diff --git a/src/jacobian.jl b/src/jacobian.jl index 10ac69ec6..eddfdaef4 100644 --- a/src/jacobian.jl +++ b/src/jacobian.jl @@ -95,14 +95,14 @@ function jacobian_caches(alg::AbstractNonlinearSolveAlgorithm, f, u, p, ::Val{ii Jᵀfu = J' * fu end - linprob = LinearProblem(needsJᵀJ ? JᵀJ : J, needsJᵀJ ? _vec(Jᵀfu) : _vec(fu); - u0 = _vec(du)) + linprob = LinearProblem(needsJᵀJ ? __maybe_symmetric(JᵀJ) : J, + needsJᵀJ ? _vec(Jᵀfu) : _vec(fu); u0 = _vec(du)) weight = similar(u) recursivefill!(weight, true) - Pl, Pr = wrapprecs(alg.precs(J, nothing, u, p, nothing, nothing, nothing, nothing, - nothing)..., weight) + Pl, Pr = wrapprecs(alg.precs(needsJᵀJ ? __maybe_symmetric(JᵀJ) : J, nothing, u, p, + nothing, nothing, nothing, nothing, nothing)..., weight) linsolve = init(linprob, alg.linsolve; alias_A = true, alias_b = true, Pl, Pr, linsolve_kwargs...) @@ -119,6 +119,12 @@ __init_JᵀJ(J::Number) = zero(J) __init_JᵀJ(J::AbstractArray) = J' * J __init_JᵀJ(J::StaticArray) = MArray{Tuple{size(J, 2), size(J, 2)}, eltype(J)}(undef) +__maybe_symmetric(x) = Symmetric(x) +__maybe_symmetric(x::Number) = x +# LinearSolve with `nothing` doesn't dispatch correctly here +__maybe_symmetric(x::StaticArray) = x +__maybe_symmetric(x::SparseArrays.AbstractSparseMatrix) = x + ## Special Handling for Scalars function jacobian_caches(alg::AbstractNonlinearSolveAlgorithm, f, u::Number, p, ::Val{false}; linsolve_with_JᵀJ::Val{needsJᵀJ} = Val(false), diff --git a/src/levenberg.jl b/src/levenberg.jl index 8b0e5728e..07a8b8251 100644 --- a/src/levenberg.jl +++ b/src/levenberg.jl @@ -13,8 +13,8 @@ numerically-difficult nonlinear systems. ### Keyword Arguments - `autodiff`: determines the backend used for the Jacobian. Note that this argument is - ignored if an analytical Jacobian is passed, as that will be used instead. Defaults to - `AutoForwardDiff()`. Valid choices are types from ADTypes.jl. + ignored if an analytical Jacobian is passed, as that will be used instead. Defaults to + `AutoForwardDiff()`. Valid choices are types from ADTypes.jl. - `concrete_jac`: whether to build a concrete Jacobian. If a Krylov-subspace method is used, then the Jacobian will not be constructed and instead direct Jacobian-vector products `J*v` are computed using forward-mode automatic differentiation or finite differencing @@ -203,8 +203,8 @@ function perform_step!(cache::LevenbergMarquardtCache{true}) # The following lines do: cache.v = -cache.mat_tmp \ cache.u_tmp mul!(cache.u_tmp, J', fu1) @. cache.mat_tmp = JᵀJ + λ * DᵀD - linres = dolinsolve(alg.precs, linsolve; A = cache.mat_tmp, b = _vec(cache.u_tmp), - linu = _vec(cache.du), p = p, reltol = cache.abstol) + linres = dolinsolve(alg.precs, linsolve; A = __maybe_symmetric(cache.mat_tmp), + b = _vec(cache.u_tmp), linu = _vec(cache.du), p = p, reltol = cache.abstol) cache.linsolve = linres.cache @. cache.v = -cache.du @@ -280,8 +280,8 @@ function perform_step!(cache::LevenbergMarquardtCache{false}) if linsolve === nothing cache.v = -cache.mat_tmp \ (J' * fu1) else - linres = dolinsolve(alg.precs, linsolve; A = -cache.mat_tmp, b = _vec(J' * fu1), - linu = _vec(cache.v), p, reltol = cache.abstol) + linres = dolinsolve(alg.precs, linsolve; A = -__maybe_symmetric(cache.mat_tmp), + b = _vec(J' * fu1), linu = _vec(cache.v), p, reltol = cache.abstol) cache.linsolve = linres.cache end @@ -291,7 +291,7 @@ function perform_step!(cache::LevenbergMarquardtCache{false}) cache.a = -cache.mat_tmp \ _vec(J' * ((2 / h) .* ((f(u .+ h .* v, p) .- fu1) ./ h .- J * v))) else - linres = dolinsolve(alg.precs, linsolve; A = -cache.mat_tmp, + linres = dolinsolve(alg.precs, linsolve; b = _mutable(_vec(J' * ((2 / h) .* ((f(u .+ h .* v, p) .- fu1) ./ h .- J * v)))), linu = _vec(cache.a), p, reltol = cache.abstol) diff --git a/test/nonlinear_least_squares.jl b/test/nonlinear_least_squares.jl index c9fda61ba..9ea4b0eca 100644 --- a/test/nonlinear_least_squares.jl +++ b/test/nonlinear_least_squares.jl @@ -27,10 +27,15 @@ prob_iip = NonlinearLeastSquaresProblem(NonlinearFunction(loss_function; resid_prototype = zero(y_target)), θ_init, x) nlls_problems = [prob_oop, prob_iip] -solvers = [GaussNewton(), LevenbergMarquardt(), LSOptimSolver(:lm), LSOptimSolver(:dogleg)] +solvers = [ + GaussNewton(), + LevenbergMarquardt(), + LSOptimSolver(:lm), + LSOptimSolver(:dogleg), +] for prob in nlls_problems, solver in solvers - @time sol = solve(prob, solver; maxiters = 1000, abstol = 1e-8) + @time sol = solve(prob, solver; maxiters = 10000, abstol = 1e-8) @test SciMLBase.successful_retcode(sol) @test norm(sol.resid) < 1e-6 end From 1c19fa7f15538df0eaf922ca80b0648e3f044d8c Mon Sep 17 00:00:00 2001 From: Avik Pal Date: Sun, 15 Oct 2023 21:39:03 -0400 Subject: [PATCH 5/5] Wrap FastLM.jl --- Project.toml | 6 +- ...NonlinearSolveFastLevenbergMarquardtExt.jl | 71 +++++++++++++++++++ ext/NonlinearSolveLeastSquaresOptimExt.jl | 2 +- src/NonlinearSolve.jl | 3 +- src/algorithms.jl | 62 ++++++++++++++-- test/nonlinear_least_squares.jl | 27 ++++--- 6 files changed, 155 insertions(+), 16 deletions(-) create mode 100644 ext/NonlinearSolveFastLevenbergMarquardtExt.jl diff --git a/Project.toml b/Project.toml index b4f7c2553..ad8c24075 100644 --- a/Project.toml +++ b/Project.toml @@ -25,9 +25,11 @@ StaticArraysCore = "1e83bf80-4336-4d27-bf5d-d5a4f845583c" UnPack = "3a884ed6-31ef-47d7-9d2a-63182c4928ed" [weakdeps] +FastLevenbergMarquardt = "7a0df574-e128-4d35-8cbd-3d84502bf7ce" LeastSquaresOptim = "0fc2ff8b-aaa3-5acd-a817-1944a5e08891" [extensions] +NonlinearSolveFastLevenbergMarquardtExt = "FastLevenbergMarquardt" NonlinearSolveLeastSquaresOptimExt = "LeastSquaresOptim" [compat] @@ -37,6 +39,7 @@ ConcreteStructs = "0.2" DiffEqBase = "6.130" EnumX = "1" Enzyme = "0.11" +FastLevenbergMarquardt = "0.1" FiniteDiff = "2" ForwardDiff = "0.10.3" LeastSquaresOptim = "0.8" @@ -57,6 +60,7 @@ julia = "1.9" [extras] BenchmarkTools = "6e4b80f9-dd63-53aa-95a3-0cdb28fa8baf" Enzyme = "7da242da-08ed-463a-9acd-ee780be4f1d9" +FastLevenbergMarquardt = "7a0df574-e128-4d35-8cbd-3d84502bf7ce" ForwardDiff = "f6369f11-7733-5829-9624-2563aa707210" LeastSquaresOptim = "0fc2ff8b-aaa3-5acd-a817-1944a5e08891" LinearAlgebra = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e" @@ -72,4 +76,4 @@ Test = "8dfed614-e22c-5e08-85e1-65c5234f0b40" Zygote = "e88e6eb3-aa80-5325-afca-941959d7151f" [targets] -test = ["Enzyme", "BenchmarkTools", "SafeTestsets", "Pkg", "Test", "ForwardDiff", "StaticArrays", "Symbolics", "LinearSolve", "Random", "LinearAlgebra", "Zygote", "SparseDiffTools", "NonlinearProblemLibrary", "LeastSquaresOptim"] +test = ["Enzyme", "BenchmarkTools", "SafeTestsets", "Pkg", "Test", "ForwardDiff", "StaticArrays", "Symbolics", "LinearSolve", "Random", "LinearAlgebra", "Zygote", "SparseDiffTools", "NonlinearProblemLibrary", "LeastSquaresOptim", "FastLevenbergMarquardt"] diff --git a/ext/NonlinearSolveFastLevenbergMarquardtExt.jl b/ext/NonlinearSolveFastLevenbergMarquardtExt.jl new file mode 100644 index 000000000..7a853c327 --- /dev/null +++ b/ext/NonlinearSolveFastLevenbergMarquardtExt.jl @@ -0,0 +1,71 @@ +module NonlinearSolveFastLevenbergMarquardtExt + +using ArrayInterface, NonlinearSolve, SciMLBase +import ConcreteStructs: @concrete +import FastLevenbergMarquardt as FastLM + +NonlinearSolve.extension_loaded(::Val{:FastLevenbergMarquardt}) = true + +function _fast_lm_solver(::FastLevenbergMarquardtSolver{linsolve}, x) where {linsolve} + if linsolve == :cholesky + return FastLM.CholeskySolver(ArrayInterface.undefmatrix(x)) + elseif linsolve == :qr + return FastLM.QRSolver(eltype(x), length(x)) + else + throw(ArgumentError("Unknown FastLevenbergMarquardt Linear Solver: $linsolve")) + end +end + +@concrete struct FastLMCache + f! + J! + prob + alg + lmworkspace + solver + kwargs +end + +@concrete struct InplaceFunction{iip} <: Function + f +end + +(f::InplaceFunction{true})(fx, x, p) = f.f(fx, x, p) +(f::InplaceFunction{false})(fx, x, p) = (fx .= f.f(x, p)) + +function SciMLBase.__init(prob::NonlinearLeastSquaresProblem, + alg::FastLevenbergMarquardtSolver, args...; abstol = 1e-8, reltol = 1e-8, + verbose = false, maxiters = 1000, kwargs...) + iip = SciMLBase.isinplace(prob) + + @assert prob.f.jac!==nothing "FastLevenbergMarquardt requires a Jacobian!" + + f! = InplaceFunction{iip}(prob.f) + J! = InplaceFunction{iip}(prob.f.jac) + + resid_prototype = prob.f.resid_prototype === nothing ? + (!iip ? prob.f(prob.u0, prob.p) : zeros(prob.u0)) : + prob.f.resid_prototype + + J = similar(prob.u0, length(resid_prototype), length(prob.u0)) + + solver = _fast_lm_solver(alg, prob.u0) + LM = FastLM.LMWorkspace(prob.u0, resid_prototype, J) + + return FastLMCache(f!, J!, prob, alg, LM, solver, + (; xtol = abstol, ftol = reltol, maxit = maxiters, alg.factor, alg.factoraccept, + alg.factorreject, alg.minscale, alg.maxscale, alg.factorupdate, alg.minfactor, + alg.maxfactor, kwargs...)) +end + +function SciMLBase.solve!(cache::FastLMCache) + res, fx, info, iter, nfev, njev, LM, solver = FastLM.lmsolve!(cache.f!, cache.J!, + cache.lmworkspace, cache.prob.p; cache.solver, cache.kwargs...) + stats = SciMLBase.NLStats(nfev, njev, -1, -1, iter) + retcode = info == 1 ? ReturnCode.Success : + (info == -1 ? ReturnCode.MaxIters : ReturnCode.Default) + return SciMLBase.build_solution(cache.prob, cache.alg, res, fx; + retcode, original = (res, fx, info, iter, nfev, njev, LM, solver), stats) +end + +end diff --git a/ext/NonlinearSolveLeastSquaresOptimExt.jl b/ext/NonlinearSolveLeastSquaresOptimExt.jl index 7514931d5..40299f5b3 100644 --- a/ext/NonlinearSolveLeastSquaresOptimExt.jl +++ b/ext/NonlinearSolveLeastSquaresOptimExt.jl @@ -4,7 +4,7 @@ using NonlinearSolve, SciMLBase import ConcreteStructs: @concrete import LeastSquaresOptim as LSO -extension_loaded(::Val{:LeastSquaresOptim}) = true +NonlinearSolve.extension_loaded(::Val{:LeastSquaresOptim}) = true function _lso_solver(::LSOptimSolver{alg, linsolve}) where {alg, linsolve} ls = linsolve == :qr ? LSO.QR() : diff --git a/src/NonlinearSolve.jl b/src/NonlinearSolve.jl index d9dcbba39..efcce13f5 100644 --- a/src/NonlinearSolve.jl +++ b/src/NonlinearSolve.jl @@ -95,7 +95,8 @@ end export RadiusUpdateSchemes -export NewtonRaphson, TrustRegion, LevenbergMarquardt, GaussNewton, LSOptimSolver +export NewtonRaphson, TrustRegion, LevenbergMarquardt, GaussNewton +export LSOptimSolver, FastLevenbergMarquardtSolver export LineSearch diff --git a/src/algorithms.jl b/src/algorithms.jl index b9a694866..3f288433e 100644 --- a/src/algorithms.jl +++ b/src/algorithms.jl @@ -11,18 +11,70 @@ Wrapper over [LeastSquaresOptim.jl](https://github.com/matthieugomez/LeastSquare - `linsolve`: Linear solver to use. Can be `:qr`, `:cholesky` or `:lsmr`. If `nothing`, then `LeastSquaresOptim.jl` will choose the best linear solver based on the Jacobian structure. +- `autodiff`: Automatic differentiation / Finite Differences. Can be `:central` or `:forward`. !!! note This algorithm is only available if `LeastSquaresOptim.jl` is installed. """ struct LSOptimSolver{alg, linsolve} <: AbstractNonlinearSolveAlgorithm autodiff::Symbol +end + +function LSOptimSolver(alg = :lm; linsolve = nothing, autodiff::Symbol = :central) + @assert alg in (:lm, :dogleg) + @assert linsolve === nothing || linsolve in (:qr, :cholesky, :lsmr) + @assert autodiff in (:central, :forward) + + if !extension_loaded(Val(:LeastSquaresOptim)) + @warn "LeastSquaresOptim.jl is not loaded! It needs to be explicitly loaded \ + before `solve(prob, LSOptimSolver())` is called." + end + + return LSOptimSolver{alg, linsolve}(autodiff) +end + +""" + FastLevenbergMarquardtSolver(linsolve = :cholesky) + +Wrapper over [FastLevenbergMarquardt.jl](https://github.com/kamesy/FastLevenbergMarquardt.jl) for solving +`NonlinearLeastSquaresProblem`. - function LSOptimSolver(alg = :lm; linsolve = nothing, autodiff::Symbol = :central) - @assert alg in (:lm, :dogleg) - @assert linsolve === nothing || linsolve in (:qr, :cholesky, :lsmr) - @assert autodiff in (:central, :forward) +!!! warning + This is not really the fastest solver. It is called that since the original package + is called "Fast". `LevenbergMarquardt()` is almost always a better choice. - return new{alg, linsolve}(autodiff) +!!! warning + This algorithm requires the jacobian function to be provided! + +## Arguments: + +- `linsolve`: Linear solver to use. Can be `:qr` or `:cholesky`. + +!!! note + This algorithm is only available if `FastLevenbergMarquardt.jl` is installed. +""" +@concrete struct FastLevenbergMarquardtSolver{linsolve} <: AbstractNonlinearSolveAlgorithm + factor + factoraccept + factorreject + factorupdate::Symbol + minscale + maxscale + minfactor + maxfactor +end + +function FastLevenbergMarquardtSolver(linsolve::Symbol = :cholesky; factor = 1e-6, + factoraccept = 13.0, factorreject = 3.0, factorupdate = :marquardt, + minscale = 1e-12, maxscale = 1e16, minfactor = 1e-28, maxfactor = 1e32) + @assert linsolve in (:qr, :cholesky) + @assert factorupdate in (:marquardt, :nielson) + + if !extension_loaded(Val(:FastLevenbergMarquardt)) + @warn "FastLevenbergMarquardt.jl is not loaded! It needs to be explicitly loaded \ + before `solve(prob, FastLevenbergMarquardtSolver())` is called." end + + return FastLevenbergMarquardtSolver{linsolve}(factor, factoraccept, factorreject, + factorupdate, minscale, maxscale, minfactor, maxfactor) end diff --git a/test/nonlinear_least_squares.jl b/test/nonlinear_least_squares.jl index 9ea4b0eca..4f67ef28e 100644 --- a/test/nonlinear_least_squares.jl +++ b/test/nonlinear_least_squares.jl @@ -1,5 +1,5 @@ -using NonlinearSolve, LinearSolve, LinearAlgebra, Test, Random -import LeastSquaresOptim +using NonlinearSolve, LinearSolve, LinearAlgebra, Test, Random, ForwardDiff +import FastLevenbergMarquardt, LeastSquaresOptim true_function(x, θ) = @. θ[1] * exp(θ[2] * x) * cos(θ[3] * x + θ[4]) true_function(y, x, θ) = (@. y = θ[1] * exp(θ[2] * x) * cos(θ[3] * x + θ[4])) @@ -27,15 +27,26 @@ prob_iip = NonlinearLeastSquaresProblem(NonlinearFunction(loss_function; resid_prototype = zero(y_target)), θ_init, x) nlls_problems = [prob_oop, prob_iip] -solvers = [ - GaussNewton(), - LevenbergMarquardt(), - LSOptimSolver(:lm), - LSOptimSolver(:dogleg), -] +solvers = [GaussNewton(), LevenbergMarquardt(), LSOptimSolver(:lm), LSOptimSolver(:dogleg)] for prob in nlls_problems, solver in solvers @time sol = solve(prob, solver; maxiters = 10000, abstol = 1e-8) @test SciMLBase.successful_retcode(sol) @test norm(sol.resid) < 1e-6 end + +function jac!(J, θ, p) + ForwardDiff.jacobian!(J, resid -> loss_function(resid, θ, p), θ) + return J +end + +prob = NonlinearLeastSquaresProblem(NonlinearFunction(loss_function; + resid_prototype = zero(y_target), jac = jac!), θ_init, x) + +solvers = [FastLevenbergMarquardtSolver(:cholesky), FastLevenbergMarquardtSolver(:qr)] + +for solver in solvers + @time sol = solve(prob, solver; maxiters = 10000, abstol = 1e-8) + @test SciMLBase.successful_retcode(sol) + @test norm(sol.resid) < 1e-6 +end