Merge pull request #69 from yash2798/ys/itp

Itp method
SciML · Jul 18, 2023 · 491a632 · 491a632
2 parents f20f5e4 + 1e4eb4b
commit 491a632
Show file tree

Hide file tree

Showing 3 changed files with 166 additions and 3 deletions.
diff --git a/src/SimpleNonlinearSolve.jl b/src/SimpleNonlinearSolve.jl
@@ -38,6 +38,7 @@ include("dfsane.jl")
 include("ad.jl")
 include("halley.jl")
 include("alefeld.jl")
+include("itp.jl")
 
 # Batched Solver Support
 include("batched/utils.jl")
@@ -68,15 +69,15 @@ PrecompileTools.@compile_workload begin
         prob_brack = IntervalNonlinearProblem{false}((u, p) -> u * u - p,
             T.((0.0, 2.0)),
             T(2))
-        for alg in (Bisection, Falsi, Ridder, Brent, Alefeld)
+        for alg in (Bisection, Falsi, Ridder, Brent, Alefeld, Itp)
             solve(prob_brack, alg(), abstol = T(1e-2))
         end
     end
 end
 
 # DiffEq styled algorithms
 export Bisection, Brent, Broyden, LBroyden, SimpleDFSane, Falsi, Halley, Klement,
-    Ridder, SimpleNewtonRaphson, SimpleTrustRegion, Alefeld
+    Ridder, SimpleNewtonRaphson, SimpleTrustRegion, Alefeld, Itp
 export BatchedBroyden, BatchedSimpleNewtonRaphson, BatchedSimpleDFSane
 
 end # module
diff --git a/src/itp.jl b/src/itp.jl
@@ -0,0 +1,138 @@
+"""
+```julia
+Itp(; k1::Real = 0.007, k2::Real = 1.5, n0::Int = 10)
+```
+
+ITP (Interpolate Truncate & Project)
+
+Use the [ITP method](https://en.wikipedia.org/wiki/ITP_method) to find
+a root of a bracketed function, with a convergence rate between 1 and 1.62.
+
+This method was introduced in the paper "An Enhancement of the Bisection Method
+Average Performance Preserving Minmax Optimality"
+(https://doi.org/10.1145/3423597) by I. F. D. Oliveira and R. H. C. Takahashi.
+
+# Tuning Parameters
+
+The following keyword parameters are accepted.
+
+- `n0::Int = 10`, the 'slack' (n₀ in the paper). Must not be negative.\n
+  When `n0 = 0` the worst-case is identical to that of bisection,
+  but increasing `n0` provides greater opportunity for superlinearity.
+- `k1::Real = 0.007` (κ₁ in the paper). Must not be negative.\n
+  The recommended value is `0.2/(x₂ - x₁)`.
+  Lower values produce tighter asymptotic behaviour, while higher values
+  improve the steady-state behaviour when truncation is not helpful.
+- `k2::Real = 1.5` (κ₂ in the paper). Must lie between 1 and 1 + ϕ ≈ 2.62.\n
+  Higher values allow for a greater convergence rate,
+  but also make the method more susceptible to worst-case performance.
+  In practice, `k2` = 1 or 2 seems to work well due to the computational simplicity,
+  as `k2` is used as an exponent in the method.
+
+`k1` and `k2` are stored with their promoted common type.
+
+# Throws
+
+- `ErrorException` if `k1` or `n0` is negative.
+- `ArgumentError` if `k2` lies outside the range given above.
+
+### Worst Case Performance
+
+n½ + `n0` iterations, where n½ is the number of iterations using bisection
+(n½ = ⌈log2(Δx / (2 `tol`))⌉).
+
+### Asymptotic Performance
+
+If `f` is twice differentiable and the root is simple,
+then with `n0` > 0 the convergence rate is √`k2`.
+"""
+struct Itp{T} <: AbstractBracketingAlgorithm
+    k1::T
+    k2::T
+    n0::Int
+    function Itp(; k1::Real = 0.007, k2::Real = 1.5, n0::Int = 10)
+        if k1 < 0
+            error("Hyper-parameter κ₁ should not be negative")
+        end
+        if n0 < 0
+            error("Hyper-parameter n₀ should not be negative")
+        end
+        # 1.5 + sqrt(5) / 2 == 1 + ϕ with ϕ = (1 + sqrt(5)) / 2.
+        if k2 < 1 || k2 > (1.5 + sqrt(5) / 2)
+            # The exception must be thrown; merely constructing it validates nothing.
+            throw(ArgumentError("Hyper-parameter κ₂ should be between 1 and 1 + ϕ where ϕ ≈ 1.618... is the golden ratio"))
+        end
+        T = promote_type(eltype(k1), eltype(k2))
+        return new{T}(k1, k2, n0)
+    end
+end
+
+# Solve a bracketed scalar root-finding problem with the ITP method.
+#
+# `prob.tspan` supplies the two bracket endpoints and `prob.f(u, prob.p)` the residual.
+# The function values at the endpoints are expected to have opposite signs; either
+# orientation (increasing or decreasing through the root) and either endpoint order
+# is handled.
+#
+# Keywords:
+# - `abstol`: iteration stops once the bracket is narrower than `2 * abstol`.
+# - `maxiters`: maximum number of ITP iterations; when exhausted the current left
+#   endpoint is returned with `ReturnCode.MaxIters`.
+# Extra positional and keyword arguments are accepted and ignored.
+function SciMLBase.solve(prob::IntervalNonlinearProblem, alg::Itp,
+    args...; abstol = 1.0e-15,
+    maxiters = 1000, kwargs...)
+    f = Base.Fix2(prob.f, prob.p)
+    left, right = prob.tspan # a and b
+    fl, fr = f(left), f(right)
+    ϵ = abstol
+    if iszero(fl)
+        return SciMLBase.build_solution(prob, alg, left, fl;
+            retcode = ReturnCode.ExactSolutionLeft, left = left,
+            right = right)
+    elseif iszero(fr)
+        return SciMLBase.build_solution(prob, alg, right, fr;
+            retcode = ReturnCode.ExactSolutionRight, left = left,
+            right = right)
+    end
+    k1 = alg.k1
+    k2 = alg.k2
+    n0 = alg.n0
+    # Number of bisection steps needed to shrink the bracket below 2ϵ.
+    n_h = ceil(log2(abs(right - left) / (2 * ϵ)))
+    mid = (left + right) / 2
+    # Radius budget of the minmax (bisection-like) guarantee; halved every iteration.
+    ϵ_s = ϵ * 2^(n_h + n0)
+    # The sign of `fr` never changes: `fr` is only replaced by values on the same side
+    # of zero. It fixes which endpoint a new evaluation must replace.
+    fr_positive = fr > zero(fr)
+    i = 0 #iteration
+    while i < maxiters
+        span = abs(right - left)
+        r = ϵ_s - (span / 2) # minmax radius
+        δ = k1 * (span^k2) # truncation error
+
+        ## Interpolation step ##
+        x_f = (fr * left - fl * right) / (fr - fl)
+
+        ## Truncation step ##
+        # Nudge the regula-falsi estimate towards the midpoint by δ.
+        σ = sign(mid - x_f)
+        if δ <= abs(mid - x_f)
+            xt = x_f + (σ * δ)
+        else
+            xt = mid
+        end
+
+        ## Projection step ##
+        # Keep the candidate within radius r of the midpoint.
+        if abs(xt - mid) <= r
+            xp = xt
+        else
+            xp = mid - (σ * r)
+        end
+
+        ## Update ##
+        yp = f(xp)
+        # Orient the new value so that "positive" always means "same side as fr".
+        yps = fr_positive ? yp : -yp
+        if yps > 0
+            right = xp
+            fr = yp
+        elseif yps < 0
+            left = xp
+            fl = yp
+        else
+            # Neither side of zero: report `xp` directly without re-evaluating `f`.
+            return SciMLBase.build_solution(prob, alg, xp, yp;
+                retcode = ReturnCode.Success, left = xp,
+                right = xp)
+        end
+        i += 1
+        mid = (left + right) / 2
+        ϵ_s /= 2
+
+        if abs(right - left) < 2 * ϵ
+            return SciMLBase.build_solution(prob, alg, mid, f(mid);
+                retcode = ReturnCode.Success, left = left,
+                right = right)
+        end
+    end
+    return SciMLBase.build_solution(prob, alg, left, fl; retcode = ReturnCode.MaxIters,
+        left = left, right = right)
+end
diff --git a/test/basictests.jl b/test/basictests.jl
@@ -219,6 +219,18 @@ for p in 1.1:0.1:100.0
     @test ForwardDiff.derivative(g, p) ≈ 1 / (2 * sqrt(p))
 end
 
+# ITP: solve for the root as a function of the parameter `p`, then compare the root
+# and its ForwardDiff derivative with sqrt(p) and 1 / (2 * sqrt(p)).
+g = function (p)
+    bracket = typeof(p).(tspan)
+    itp_prob = IntervalNonlinearProblem{false}(f, bracket, p)
+    return solve(itp_prob, Itp()).u
+end
+
+for p in 1.1:0.1:100.0
+    expected_root = sqrt(p)
+    @test g(p) ≈ expected_root
+    @test ForwardDiff.derivative(g, p) ≈ 1 / (2 * expected_root)
+end
+
 # Alefeld
 g = function (p)
     probN = IntervalNonlinearProblem{false}(f, typeof(p).(tspan), p)
@@ -246,7 +258,7 @@ end
 f, tspan = (u, p) -> p[1] * u * u - p[2], (1.0, 100.0)
 t = (p) -> [sqrt(p[2] / p[1])]
 p = [0.9, 50.0]
-for alg in [Bisection(), Falsi(), Ridder(), Brent()]
+for alg in [Bisection(), Falsi(), Ridder(), Brent(), Itp()]
     global g, p
     g = function (p)
         probN = IntervalNonlinearProblem{false}(f, tspan, p)
@@ -349,6 +361,18 @@ probB = IntervalNonlinearProblem(f, tspan)
 sol = solve(probB, Alefeld())
 @test sol.u ≈ sqrt(2.0)
 
+# Itp
+# First solve reuses `probB` as left in place by the preceding tests.
+sol = solve(probB, Itp())
+@test sol.u ≈ sqrt(2.0)
+# Bracket whose left endpoint is sqrt(2.0), the value the solution is compared against.
+tspan = (sqrt(2.0), 10.0)
+probB = IntervalNonlinearProblem(f, tspan)
+sol = solve(probB, Itp())
+@test sol.u ≈ sqrt(2.0)
+# Bracket whose right endpoint is sqrt(2.0).
+tspan = (0.0, sqrt(2.0))
+probB = IntervalNonlinearProblem(f, tspan)
+sol = solve(probB, Itp())
+@test sol.u ≈ sqrt(2.0)
+
 # Garuntee Tests for Bisection
 f = function (u, p)
     if u < 2.0