Merge pull request #60 from JuliaNLSolvers/pkm/nonlineardocs

Update nleq-solving docs and adjust code to support the written text.
JuliaNLSolvers · Jul 28, 2023 · 3de9973 · 3de9973
2 parents b72dc96 + caf28dc
commit 3de9973
Show file tree

Hide file tree

Showing 8 changed files with 179 additions and 86 deletions.
diff --git a/docs/src/mkdocs.yml b/docs/src/mkdocs.yml
diff --git a/docs/src/nonlineareq.md b/docs/src/nonlineareq.md
@@ -1 +1,117 @@
-# Solving non-linear systems of equations
+# Solving non-linear systems of equations
+Non-linear systems of equations arise in many different applications. As for optimization, different situations will call for different inputs and optimizations: scalar, static, mutating, iterative solvers, etc. Below, we will cover some important algorithms and special cases.
+
+## Scalar solving with 1st order derivatives
+Assume that you have a residual system that you want to solve. This means that if your original system to solve is is `F(x) = K` for some real number `K`, you have made sure to provide a residual function `G(x) = F(x) - K` that we can solve for `G(x) = 0` instead. Then, you can use Newton's method for root finding as follows:
+
+
+```
+function F(x)
+    x^2
+    end
+    
+    function FJ(Jx, x)
+        x^2, 2x
+    end
+    
+    prob_obj = NLSolvers.ScalarObjective(
+        f=F,
+        fg=FJ,
+    )
+    
+prob = NEqProblem(prob_obj; inplace = false)
+
+x0 = 0.3
+res = solve(prob, x0, LineSearch(Newton(), Backtracking()))
+```
+
+with output
+
+```
+julia> res = solve(prob, x0, LineSearch(Newton(), Backtracking()))
+Results of solving non-linear equations
+
+* Algorithm:
+  Newton's method with default linsolve with backtracking (no interp)
+
+* Candidate solution:
+  Final residual 2-norm:      5.36e-09
+  Final residual Inf-norm:    5.36e-09
+
+  Initial residual 2-norm:    9.00e-02
+  Initial residual Inf-norm:  9.00e-02
+
+* Stopping criteria
+  |F(x')|               = 5.36e-09 <= 1.00e-08 (true)
+
+* Work counters
+  Seconds run:   1.41e-05
+  Iterations:    12
+```
+The output reports initial and final residual norms. The convergence check is also reported, and some work counters report the time spent and the number of iterations. 
+
+## Multivariate non-linear equation solving
+Multivariate non-linear equation solving requires writing a `VectorObjective` instead of a `ScalarObjective` as above. The `VectorObjective` is 
+
+```
+using NLSolvers, ForwardDiff
+function theta(x)
+    if x[1] > 0
+        return atan(x[2] / x[1]) / (2.0 * pi)
+    else
+        return (pi + atan(x[2] / x[1])) / (2.0 * pi)
+    end
+end
+
+function F_powell!(Fx, x)
+    if (x[1]^2 + x[2]^2 == 0)
+        dtdx1 = 0
+        dtdx2 = 0
+    else
+        dtdx1 = -x[2] / (2 * pi * (x[1]^2 + x[2]^2))
+        dtdx2 = x[1] / (2 * pi * (x[1]^2 + x[2]^2))
+    end
+    Fx[1] =
+        -2000.0 * (x[3] - 10.0 * theta(x)) * dtdx1 +
+        200.0 * (sqrt(x[1]^2 + x[2]^2) - 1) * x[1] / sqrt(x[1]^2 + x[2]^2)
+    Fx[2] =
+        -2000.0 * (x[3] - 10.0 * theta(x)) * dtdx2 +
+        200.0 * (sqrt(x[1]^2 + x[2]^2) - 1) * x[2] / sqrt(x[1]^2 + x[2]^2)
+    Fx[3] = 200.0 * (x[3] - 10.0 * theta(x)) + 2.0 * x[3]
+    Fx
+end
+
+function F_jacobian_powell!(Fx, Jx, x)
+    ForwardDiff.jacobian!(Jx, F_powell!, Fx, x)
+    Fx, Jx
+end
+
+prob_obj = VectorObjective(F=F_powell!, J=F_jacobian_powell!)
+prob = NEqProblem(prob_obj)
+
+x0 = [-1.0, 0.0, 0.0]
+res = solve(prob, copy(x0), LineSearch(Newton(), Backtracking()))
+```
+with result
+```
+julia> res = solve(prob, copy(x0), LineSearch(Newton(), Backtracking()))
+Results of solving non-linear equations
+
+* Algorithm:
+  Newton's method with default linsolve with backtracking (no interp)
+
+* Candidate solution:
+  Final residual 2-norm:      8.57e-16
+  Final residual Inf-norm:    6.24e-16
+
+  Initial residual 2-norm:    1.88e+03
+  Initial residual Inf-norm:  1.59e+03
+
+* Stopping criteria
+  |F(x')|               = 6.24e-16 <= 1.00e-08 (true)
+
+* Work counters
+  Seconds run:   2.10e-04
+  Iterations:    33
+```
+We again see initial and final residual norms. This time the 2- and Inf-norm are different because there is more than one element in the state to be optimized over. The final 2-norm also satisfies the required threshold, and the run-time and number of iterations are reported.
diff --git a/src/NLSolvers.jl b/src/NLSolvers.jl
@@ -109,7 +109,7 @@ include("Manifolds.jl")
 include("objectives.jl")
 export LeastSquaresObjective
 include("linearalgebra.jl")
-export NonDiffed, OnceDiffed, TwiceDiffed, ScalarObjective
+export NonDiffed, OnceDiffed, TwiceDiffed, ScalarObjective, VectorObjective
 
 # make this struct that has scheme and approx
 abstract type QuasiNewton{T1} end

diff --git a/src/nlsolve/linesearch/newton.jl b/src/nlsolve/linesearch/newton.jl
@@ -12,23 +12,25 @@ function solve(
 
     # Unpack
     scheme, linesearch = modelscheme(method), algorithm(method)
-    # Unpack important objectives
-    F = problem.R.F
-    FJ = problem.R.FJ
+
     # Unpack state
     z, d, Fx, Jx = state
-    z .= x
+    if mstyle(problem) isa InPlace
+        z .= x
+    else
+        z = copy(x)
+    end
     T = eltype(Fx)
 
 
     # Set up MeritObjective. This defines the least squares
     # objective for the line search.
-    merit = MeritObjective(problem, F, FJ, Fx, Jx, d)
+    merit = MeritObjective(problem, Fx, d)
     meritproblem =
         OptimizationProblem(merit, nothing, Euclidean(0), nothing, mstyle(problem), nothing)
 
     # Evaluate the residual and Jacobian
-    Fx, Jx = FJ(Fx, Jx, x)
+    Fx, Jx = value_jacobian(problem, Fx, Jx, x)
     if !(scheme.reset_age === nothing)
         JFx = factorize(Jx)
     else
@@ -160,7 +162,7 @@ function update_model(
 )
     # Update F, J, JF, and age as necessary
     if scheme.reset_age === nothing
-        F, J = problem.R.FJ(F, J, z)
+        F, J = value_jacobian(problem, F, J, z)
         if scheme.factorizer === nothing
             JF = nothing
         else

diff --git a/src/nlsolve/problem_types.jl b/src/nlsolve/problem_types.jl
@@ -30,20 +30,21 @@ is_inplace(problem::NEqProblem) = mstyle(problem) === InPlace()
 #function value(nleq::NEqProblem, x)
 #    nleq.R(x)
 #end
-function value(nleq::NEqProblem, x, F)
-    value(nleq.R, x, F)
+function value(nleq::NEqProblem, F, x)
+    value(nleq.R, F, x)
 end
-struct VectorObjective{TF,TJ,TFJ,TJv}
-    F::TF
-    J::TJ
-    FJ::TFJ
-    Jv::TJv
+function jacobian(nleq::NEqProblem{<:ScalarObjective}, J, x)
+    gradient(nleq.R, J, x)
 end
+function value_jacobian(nleq::NEqProblem{<:ScalarObjective, <:Any, <:Any, OutOfPlace}, F, J, x)
+    nleq.R.fg(J, x)
+end
+
 function value(nleq::VectorObjective, F, x)
     nleq.F(F, x)
 end
-function value_jacobian!(nleq::NEqProblem{<:VectorObjective,<:Any,<:Any}, F, J, x)
-    nleq.FJ(F, J, x)
+function value_jacobian(nleq::NEqProblem{<:VectorObjective,<:Any,<:Any,<:Any}, F, J, x)
+    nleq.R.FJ(F, J, x)
 end
 
 """
@@ -100,7 +101,7 @@ function Base.show(io::IO, ci::ConvergenceInfo{<:Any,<:Any,<:NEqOptions})
             ρF = norm(info.best_residual, Inf)
             println(
                 io,
-                "  |F(x')|               = $(@sprintf("%.2e", ρF)) <= $(@sprintf("%.2e", opt.f_limit)) ($(ρF<=opt.f_limit))",
+                "  |F(x')|               = $(@sprintf("%.2e", ρF)) <= $(@sprintf("%.2e", opt.f_abstol)) ($(ρF<=opt.f_abstol))",
             )
         end
         if haskey(info, :fx)

diff --git a/src/nlsolve/spectral/dfsane.jl b/src/nlsolve/spectral/dfsane.jl
@@ -75,7 +75,7 @@ function solve(
     prob::NEqProblem,
     x0,
     method::DFSANE,
-    options::NEqOptions,
+    options::NEqOptions = NEqOptions(),
     state = init(prob, method; x = copy(x0)),
 )
     if !(mstyle(prob) === InPlace())

diff --git a/src/objectives.jl b/src/objectives.jl
@@ -103,6 +103,15 @@ function batched_value(so::ScalarObjective, F, X)
     end
 end
 
+
+struct VectorObjective{TF,TJ,TFJ,TJv}
+    F::TF
+    J::TJ
+    FJ::TFJ
+    Jv::TJv
+end
+VectorObjective(; F=nothing, J=nothing, FJ=nothing, Jv=nothing) = VectorObjective(F, J, FJ, Jv)
+
 ## If prob is a NEqProblem, then we can just dispatch to least squares MeritObjective
 # if fast JacVec exists then maybe even line searches that updates the gradient can be used??? 
 struct LineObjective!{TP,T1,T2,T3}
@@ -151,16 +160,20 @@ _lineobjective(mstyle::InPlace, prob::AbstractProblem, ∇fz, z, x, d, φ0, dφ0
 _lineobjective(mstyle::OutOfPlace, prob::AbstractProblem, ∇fz, z, x, d, φ0, dφ0) =
     LineObjective(prob, ∇fz, z, x, d, φ0, real(dφ0))
 
-struct MeritObjective{TP,T1,T2,T3,T4,T5}
+struct MeritObjective{TP,T1,T2}
     prob::TP
-    F::T1
-    FJ::T2
-    Fx::T3
-    Jx::T4
-    d::T5
+    Fx::T1
+    d::T2
 end
 function value(mo::MeritObjective, x)
-    Fx = mo.F(mo.Fx, x)
+    _value(mo, mo.prob.R, mo.Fx, x)
+end
+function _value(mo, R::ScalarObjective, Fx, x)
+    Fx = R.f(x)
+    (ϕ = (norm(Fx)^2) / 2, Fx = Fx)
+end
+function _value(mo, R::VectorObjective, Fx, x)
+    Fx = mo.prob.R.F(mo.Fx, x)
     (ϕ = (norm(Fx)^2) / 2, Fx = Fx)
 end
 

diff --git a/test/nlsolve/interface.jl b/test/nlsolve/interface.jl
@@ -448,3 +448,23 @@ end
     @test norm(res.info.best_residual) < 1e-10
 
 end
+
+@testset "scalar nlsolves" begin
+    function ff(x)
+        x^2
+     end
+
+     function fgg(Jx, x)
+         x^2, 2x
+     end
+
+     prob_obj = NLSolvers.ScalarObjective(
+         f=ff,
+         fg=fgg,
+     )
+
+    prob = NEqProblem(prob_obj; inplace = false)
+
+    x0 = 0.3
+    res = solve(prob, x0, LineSearch(Newton(), Backtracking()))
+end