From 60b408cb1c0669902e3bf3bdf88a3e629ad0a609 Mon Sep 17 00:00:00 2001
From: Avik Pal <avikpal@mit.edu>
Date: Wed, 6 Dec 2023 14:31:16 -0500
Subject: [PATCH] More improvements to Klement

---
 src/NonlinearSolve.jl    |  2 +-
 src/broyden.jl           | 60 ++++++++++++++++---------
 src/default.jl           |  5 ++-
 src/klement.jl           | 96 +++++++++++++++++++++++++++-------------
 src/utils.jl             | 57 ++++++++++++++++++++++--
 test/23_test_problems.jl | 19 ++++++--
 test/basictests.jl       | 19 ++++----
 7 files changed, 187 insertions(+), 71 deletions(-)

diff --git a/src/NonlinearSolve.jl b/src/NonlinearSolve.jl
index 424166ca2..3cdfa6c43 100644
--- a/src/NonlinearSolve.jl
+++ b/src/NonlinearSolve.jl
@@ -81,7 +81,7 @@ function SciMLBase.reinit!(cache::AbstractNonlinearSolveCache{iip}, u0 = get_u(c
             get_u(cache), p, get_fu(cache), Val(iip))
     end
 
-    hasfield(typeof(cache), :uf) && (cache.uf.p = p)
+    hasfield(typeof(cache), :uf) && cache.uf !== nothing && (cache.uf.p = p)
 
     cache.abstol = abstol
     cache.reltol = reltol
diff --git a/src/broyden.jl b/src/broyden.jl
index 0884e07a8..ffacfcb9a 100644
--- a/src/broyden.jl
+++ b/src/broyden.jl
@@ -1,13 +1,13 @@
 # Sadly `Broyden` is taken up by SimpleNonlinearSolve.jl
 """
-    GeneralBroyden(; max_resets = 3, linesearch = nothing, reset_tolerance = nothing,
-        init_jacobian::Val = Val(:identity), autodiff = nothing, alpha = 1.0)
+    GeneralBroyden(; max_resets = 100, linesearch = nothing, reset_tolerance = nothing,
+        init_jacobian::Val = Val(:identity), autodiff = nothing, alpha = nothing)
 
 An implementation of `Broyden` with resetting and line search.
 
 ## Arguments
 
-  - `max_resets`: the maximum number of resets to perform. Defaults to `3`.
+  - `max_resets`: the maximum number of resets to perform. Defaults to `100`.
 
   - `reset_tolerance`: the tolerance for the reset check. Defaults to
     `sqrt(eps(real(eltype(u))))`.
@@ -16,11 +16,15 @@ An implementation of `Broyden` with resetting and line search.
     used here directly, and they will be converted to the correct `LineSearch`. It is
     recommended to use [LiFukushimaLineSearch](@ref) -- a derivative free linesearch
     specifically designed for Broyden's method.
-  - `alpha_initial`: If `init_jacobian` is set to `Val(:identity)`, then the initial
-    Jacobian inverse is set to be `(αI)⁻¹`. Defaults to `1.0`.
-  - `init_jacobian`: the method to use for initializing the jacobian. Defaults to using the
-    identity matrix (`Val(:identitiy)`). Alternatively, can be set to `Val(:true_jacobian)`
-    to use the true jacobian as initialization.
+  - `alpha`: If `init_jacobian` is set to `Val(:identity)`, then the initial Jacobian
+    inverse is set to be `(αI)⁻¹`. Defaults to `nothing` which implies
+    `α = max(norm(u), 1) / (2 * norm(fu))`.
+  - `init_jacobian`: the method to use for initializing the jacobian. Defaults to
+    `Val(:identity)`. Choices include:
+
+      + `Val(:identity)`: Identity Matrix.
+      + `Val(:true_jacobian)`: True Jacobian. This is a good choice for differentiable
+        problems.
   - `autodiff`: determines the backend used for the Jacobian. Note that this argument is
     ignored if an analytical Jacobian is passed, as that will be used instead. Defaults to
     `nothing` which means that a default is selected according to the problem specification!
@@ -29,39 +33,45 @@ An implementation of `Broyden` with resetting and line search.
 
       + `Val(:good_broyden)`: Good Broyden's Update Rule
       + `Val(:bad_broyden)`: Bad Broyden's Update Rule
+      + `Val(:diagonal)`: Only update the diagonal of the Jacobian. This algorithm may be
+        useful for specific problems, but whether it will work may depend strongly on the
+        problem.
+      + `Val(:exciting_mixing)`: Update the diagonal of the Jacobian. This is based off
+        SciPy's implementation of Broyden's method. This algorithm may be useful for
+        specific problems, but whether it will work may depend strongly on the problem.
 """
 @concrete struct GeneralBroyden{IJ, UR, CJ, AD} <: AbstractNewtonAlgorithm{CJ, AD}
     ad::AD
     max_resets::Int
     reset_tolerance
     linesearch
-    inv_alpha
+    alpha
 end
 
 function __alg_print_modifiers(alg::GeneralBroyden{IJ, UR}) where {IJ, UR}
     modifiers = String[]
     IJ !== :identity && push!(modifiers, "init_jacobian = :$(IJ)")
     UR !== :good_broyden && push!(modifiers, "update_rule = :$(UR)")
-    alg.inv_alpha != 1 && push!(modifiers, "alpha = $(1 / alg.inv_alpha)")
+    alg.alpha !== nothing && push!(modifiers, "alpha = $(alg.alpha)")
     return modifiers
 end
 
 function set_ad(alg::GeneralBroyden{IJ, UR, CJ}, ad) where {IJ, UR, CJ}
     return GeneralBroyden{IJ, UR, CJ}(ad, alg.max_resets, alg.reset_tolerance,
-        alg.linesearch, alg.inv_alpha)
+        alg.linesearch, alg.alpha)
 end
 
-function GeneralBroyden(; max_resets = 3, linesearch = nothing, reset_tolerance = nothing,
-        init_jacobian::Val = Val(:identity), autodiff = nothing, alpha = 1.0,
+function GeneralBroyden(; max_resets = 100, linesearch = nothing, reset_tolerance = nothing,
+        init_jacobian::Val = Val(:identity), autodiff = nothing, alpha = nothing,
         update_rule = Val(:good_broyden))
     UR = _unwrap_val(update_rule)
-    @assert UR ∈ (:good_broyden, :bad_broyden)
+    @assert UR ∈ (:good_broyden, :bad_broyden, :diagonal, :exciting_mixing)
     IJ = _unwrap_val(init_jacobian)
     @assert IJ ∈ (:identity, :true_jacobian)
     linesearch = linesearch isa LineSearch ? linesearch : LineSearch(; method = linesearch)
     CJ = IJ === :true_jacobian
     return GeneralBroyden{IJ, UR, CJ}(autodiff, max_resets, reset_tolerance, linesearch,
-        1 / alpha)
+        alpha)
 end
 
 @concrete mutable struct GeneralBroydenCache{iip, IJ, UR} <:
@@ -78,6 +88,8 @@ end
     uf
     J⁻¹
     J⁻¹dfu
+    inv_alpha
+    alpha_initial
     force_stop::Bool
     resets::Int
     max_resets::Int
@@ -105,6 +117,8 @@ function SciMLBase.__init(prob::NonlinearProblem{uType, iip}, alg_::GeneralBroyd
     fu = evaluate_f(prob, u)
     @bb du = copy(u)
 
+    inv_alpha = __initial_inv_alpha(alg_.alpha, u, fu, internalnorm)
+
     if IJ === :true_jacobian
         alg = get_concrete_algorithm(alg_, prob)
         uf, _, J, fu_cache, jac_cache, du = jacobian_caches(alg, f, u, p, Val(iip);
@@ -114,7 +128,7 @@ function SciMLBase.__init(prob::NonlinearProblem{uType, iip}, alg_::GeneralBroyd
         alg = alg_
         @bb du = similar(u)
         uf, fu_cache, jac_cache = nothing, nothing, nothing
-        J⁻¹ = __init_identity_jacobian(u, fu, alg.inv_alpha)
+        J⁻¹ = __init_identity_jacobian(u, fu, inv_alpha)
     end
 
     reset_tolerance = alg.reset_tolerance === nothing ? sqrt(eps(real(eltype(u)))) :
@@ -131,9 +145,9 @@ function SciMLBase.__init(prob::NonlinearProblem{uType, iip}, alg_::GeneralBroyd
         kwargs...)
 
     return GeneralBroydenCache{iip, IJ, UR}(f, alg, u, u_cache, du, fu, fu_cache, dfu, p,
-        uf, J⁻¹, J⁻¹dfu, false, 0, alg.max_resets, maxiters, internalnorm,
-        ReturnCode.Default, abstol, reltol, reset_tolerance, reset_check, jac_cache, prob,
-        NLStats(1, 0, 0, 0, 0),
+        uf, J⁻¹, J⁻¹dfu, inv_alpha, alg.alpha, false, 0, alg.max_resets, maxiters,
+        internalnorm, ReturnCode.Default, abstol, reltol, reset_tolerance, reset_check,
+        jac_cache, prob, NLStats(1, 0, 0, 0, 0),
         init_linesearch_cache(alg.linesearch, f, u, p, fu, Val(iip)), tc_cache, trace)
 end
 
@@ -167,7 +181,9 @@ function perform_step!(cache::GeneralBroydenCache{iip, IJ, UR}) where {iip, IJ,
         if IJ === :true_jacobian
             cache.J⁻¹ = inv(jacobian!!(cache.J⁻¹, cache))
         else
-            cache.J⁻¹ = __reinit_identity_jacobian!!(cache.J⁻¹, cache.alg.inv_alpha)
+            cache.inv_alpha = __initial_inv_alpha(cache.inv_alpha, cache.alpha_initial,
+                cache.u, cache.fu, cache.internalnorm)
+            cache.J⁻¹ = __reinit_identity_jacobian!!(cache.J⁻¹, cache.inv_alpha)
         end
         cache.resets += 1
     else
@@ -194,7 +210,9 @@ function perform_step!(cache::GeneralBroydenCache{iip, IJ, UR}) where {iip, IJ,
 end
 
 function __reinit_internal!(cache::GeneralBroydenCache; kwargs...)
-    cache.J⁻¹ = __reinit_identity_jacobian!!(cache.J⁻¹, cache.alg.inv_alpha)
+    cache.inv_alpha = __initial_inv_alpha(cache.inv_alpha, cache.alpha_initial, cache.u,
+        cache.fu, cache.internalnorm)
+    cache.J⁻¹ = __reinit_identity_jacobian!!(cache.J⁻¹, cache.inv_alpha)
     cache.resets = 0
     return nothing
 end
diff --git a/src/default.jl b/src/default.jl
index 04198a1e0..459cf4083 100644
--- a/src/default.jl
+++ b/src/default.jl
@@ -248,8 +248,9 @@ function FastShortcutNonlinearPolyalg(; concrete_jac = nothing, linsolve = nothi
             TrustRegion(; concrete_jac, linsolve, precs,
                 radius_update_scheme = RadiusUpdateSchemes.Bastin, adkwargs...))
     else
-        algs = (GeneralKlement(; linsolve, precs),
-            GeneralBroyden(),
+        algs = (GeneralBroyden(),
+            GeneralBroyden(; init_jacobian = Val(:true_jacobian)),
+            GeneralKlement(; linsolve, precs),
             NewtonRaphson(; concrete_jac, linsolve, precs, adkwargs...),
             NewtonRaphson(; concrete_jac, linsolve, precs, linesearch = BackTracking(),
                 adkwargs...),
diff --git a/src/klement.jl b/src/klement.jl
index dc47149a5..e98e01f7d 100644
--- a/src/klement.jl
+++ b/src/klement.jl
@@ -1,13 +1,15 @@
 """
-    GeneralKlement(; max_resets = 5, linsolve = nothing, linesearch = nothing,
-        precs = DEFAULT_PRECS)
+    GeneralKlement(; max_resets = 100, linsolve = nothing, linesearch = nothing,
+        precs = DEFAULT_PRECS, alpha = true, init_jacobian::Val = Val(:identity),
+        autodiff = nothing)
 
 An implementation of `Klement` with line search, preconditioning and customizable linear
-solves.
+solves. It is recommended to use `Broyden` for most problems over this.
 
 ## Keyword Arguments
 
-  - `max_resets`: the maximum number of resets to perform. Defaults to `5`.
+  - `max_resets`: the maximum number of resets to perform. Defaults to `100`.
+
   - `linsolve`: the [LinearSolve.jl](https://github.com/SciML/LinearSolve.jl) used for the
     linear solves within the Newton method. Defaults to `nothing`, which means it uses the
     LinearSolve.jl default algorithm choice. For more information on available algorithm
@@ -19,10 +21,18 @@ solves.
   - `linesearch`: the line search algorithm to use. Defaults to [`LineSearch()`](@ref),
     which means that no line search is performed. Algorithms from `LineSearches.jl` can be
     used here directly, and they will be converted to the correct `LineSearch`.
-  - `init_jacobian`: the method to use for initializing the jacobian. Defaults to using the
-    identity matrix (`Val(:identitiy)`). Alternatively, can be set to `Val(:true_jacobian)`
-    to use the true jacobian as initialization. (Our tests suggest it is a good idea to
-    to initialize with an identity matrix)
+  - `alpha`: If `init_jacobian` is set to `Val(:identity)`, then the initial Jacobian
+    inverse is set to be `αI`. Defaults to `1`. Can be set to `nothing` which implies
+    `α = max(norm(u), 1) / (2 * norm(fu))`.
+  - `init_jacobian`: the method to use for initializing the jacobian. Defaults to
+    `Val(:identity)`. Choices include:
+
+      + `Val(:identity)`: Identity Matrix.
+      + `Val(:true_jacobian)`: True Jacobian. Our tests suggest that this is not very
+        stable. Instead using `Broyden` with `Val(:true_jacobian)` gives faster and more
+        reliable convergence.
+      + `Val(:true_jacobian_diagonal)`: Diagonal of True Jacobian. This is a good choice for
+        differentiable problems.
   - `autodiff`: determines the backend used for the Jacobian. Note that this argument is
     ignored if an analytical Jacobian is passed, as that will be used instead. Defaults to
     `nothing` which means that a default is selected according to the problem specification!
@@ -34,32 +44,30 @@ solves.
     linsolve
     precs
     linesearch
+    alpha
 end
 
-function __alg_print_modifiers(::GeneralKlement{IJ}) where {IJ}
+function __alg_print_modifiers(alg::GeneralKlement{IJ}) where {IJ}
     modifiers = String[]
     IJ !== :identity && push!(modifiers, "init_jacobian = :$(IJ)")
+    alg.alpha !== nothing && push!(modifiers, "alpha = $(alg.alpha)")
     return modifiers
 end
 
-function set_linsolve(alg::GeneralKlement{IJ, CS}, linsolve) where {IJ, CS}
-    return GeneralKlement{IJ, CS}(alg.ad, alg.max_resets, linsolve, alg.precs,
-        alg.linesearch)
-end
-
-function set_ad(alg::GeneralKlement{IJ, CS}, ad) where {IJ, CS}
-    return GeneralKlement{IJ, CS}(ad, alg.max_resets, alg.linsolve, alg.precs,
-        alg.linesearch)
+function set_ad(alg::GeneralKlement{IJ, CJ}, ad) where {IJ, CJ}
+    return GeneralKlement{IJ, CJ}(ad, alg.max_resets, alg.linsolve, alg.precs,
+        alg.linesearch, alg.alpha)
 end
 
-function GeneralKlement(; max_resets::Int = 5, linsolve = nothing,
+function GeneralKlement(; max_resets::Int = 100, linsolve = nothing, alpha = true,
         linesearch = nothing, precs = DEFAULT_PRECS, init_jacobian::Val = Val(:identity),
         autodiff = nothing)
     IJ = _unwrap_val(init_jacobian)
-    @assert IJ ∈ (:identity, :true_jacobian)
+    @assert IJ ∈ (:identity, :true_jacobian, :true_jacobian_diagonal)
     linesearch = linesearch isa LineSearch ? linesearch : LineSearch(; method = linesearch)
-    CJ = IJ === :true_jacobian
-    return GeneralKlement{IJ, CJ}(autodiff, max_resets, linsolve, precs, linesearch)
+    CJ = IJ !== :identity
+    return GeneralKlement{IJ, CJ}(autodiff, max_resets, linsolve, precs, linesearch,
+        alpha)
 end
 
 @concrete mutable struct GeneralKlementCache{iip, IJ} <: AbstractNonlinearSolveCache{iip}
@@ -79,6 +87,8 @@ end
     J_cache_2
     Jdu
     Jdu_cache
+    alpha
+    alpha_initial
     resets
     force_stop
     maxiters::Int
@@ -102,15 +112,23 @@ function SciMLBase.__init(prob::NonlinearProblem{uType, iip}, alg_::GeneralKleme
     u = __maybe_unaliased(u0, alias_u0)
     fu = evaluate_f(prob, u)
 
+    alpha = __initial_alpha(alg_.alpha, u, fu, internalnorm)
+
     if IJ === :true_jacobian
         alg = get_concrete_algorithm(alg_, prob)
         uf, _, J, fu_cache, jac_cache, du = jacobian_caches(alg, f, u, p, Val(iip);
             lininit = Val(false))
+    elseif IJ === :true_jacobian_diagonal
+        alg = get_concrete_algorithm(alg_, prob)
+        uf, _, J_cache, fu_cache, jac_cache, du = jacobian_caches(alg, f, u, p, Val(iip);
+            lininit = Val(false))
+        J = __diag(J_cache)
     elseif IJ === :identity
         alg = alg_
         @bb du = similar(u)
         uf, fu_cache, jac_cache = nothing, nothing, nothing
         J = one.(u) # Identity Init Jacobian for Klement maintains a Diagonal Structure
+        @bb J .*= alpha
     else
         error("Invalid `init_jacobian` value")
     end
@@ -133,13 +151,14 @@ function SciMLBase.__init(prob::NonlinearProblem{uType, iip}, alg_::GeneralKleme
         @bb J_cache_2 = similar(J)
         @bb Jdu_cache = similar(fu)
     else
-        J_cache, J_cache_2, Jdu_cache = nothing, nothing, nothing
+        IJ === :identity && (J_cache = nothing)
+        J_cache_2, Jdu_cache = nothing, nothing
     end
 
     return GeneralKlementCache{iip, IJ}(f, alg, u, u_cache, fu, fu_cache, fu_cache_2, du, p,
-        uf, linsolve, J, J_cache, J_cache_2, Jdu, Jdu_cache, 0, false, maxiters,
-        internalnorm,
-        ReturnCode.Default, abstol, reltol, prob, jac_cache, NLStats(1, 0, 0, 0, 0),
+        uf, linsolve, J, J_cache, J_cache_2, Jdu, Jdu_cache, alpha, alg.alpha, 0, false,
+        maxiters, internalnorm, ReturnCode.Default, abstol, reltol, prob, jac_cache,
+        NLStats(1, 0, 0, 0, 0),
         init_linesearch_cache(alg.linesearch, f, u, p, fu, Val(iip)), tc_cache, trace)
 end
 
@@ -150,6 +169,12 @@ function perform_step!(cache::GeneralKlementCache{iip, IJ}) where {iip, IJ}
     if IJ === :true_jacobian
         cache.stats.nsteps == 0 && (cache.J = jacobian!!(cache.J, cache))
         ill_conditioned = __is_ill_conditioned(cache.J)
+    elseif IJ === :true_jacobian_diagonal
+        if cache.stats.nsteps == 0
+            cache.J_cache = jacobian!!(cache.J_cache, cache)
+            cache.J = __get_diagonal!!(cache.J, cache.J_cache)
+        end
+        ill_conditioned = __is_ill_conditioned(cache.J)
     elseif IJ === :identity
         ill_conditioned = __is_ill_conditioned(cache.J)
     end
@@ -162,13 +187,18 @@ function perform_step!(cache::GeneralKlementCache{iip, IJ}) where {iip, IJ}
         end
         if IJ === :true_jacobian && cache.stats.nsteps != 0
             cache.J = jacobian!!(cache.J, cache)
-        else
-            cache.J = __reinit_identity_jacobian!!(cache.J)
+        elseif IJ === :true_jacobian_diagonal && cache.stats.nsteps != 0
+            cache.J_cache = jacobian!!(cache.J_cache, cache)
+            cache.J = __get_diagonal!!(cache.J, cache.J_cache)
+        elseif IJ === :identity
+            cache.alpha = __initial_alpha(cache.alpha, cache.alpha_initial, cache.u,
+                cache.fu, cache.internalnorm)
+            cache.J = __reinit_identity_jacobian!!(cache.J, cache.alpha)
         end
         cache.resets += 1
     end
 
-    if IJ === :identity
+    if cache.J isa AbstractVector || cache.J isa Number
         @bb @. cache.du = cache.fu / cache.J
     else
         # u = u - J \ fu
@@ -193,13 +223,15 @@ function perform_step!(cache::GeneralKlementCache{iip, IJ}) where {iip, IJ}
 
     # Update the Jacobian
     @bb cache.du .*= -1
-    if IJ === :identity
+    if cache.J isa AbstractVector || cache.J isa Number
         @bb @. cache.Jdu = (cache.J^2) * (cache.du^2)
         @bb @. cache.J += ((cache.fu - cache.fu_cache_2 - cache.J * cache.du) /
                            ifelse(iszero(cache.Jdu), T(1e-5), cache.Jdu)) * cache.du *
                           (cache.J^2)
     else
-        @bb cache.J_cache .= cache.J' .^ 2
+        # Klement Updates to the Full Jacobian don't work for most problems, we should
+        # probably be using the Broyden Update Rule here
+        @bb @. cache.J_cache = cache.J' ^ 2
         @bb @. cache.Jdu = cache.du^2
         @bb cache.Jdu_cache = cache.J_cache × vec(cache.Jdu)
         @bb cache.Jdu = cache.J × vec(cache.du)
@@ -217,7 +249,9 @@ function perform_step!(cache::GeneralKlementCache{iip, IJ}) where {iip, IJ}
 end
 
 function __reinit_internal!(cache::GeneralKlementCache; kwargs...)
-    cache.J = __reinit_identity_jacobian!!(cache.J)
+    cache.alpha = __initial_alpha(cache.alpha, cache.alpha_initial, cache.u, cache.fu,
+        cache.internalnorm)
+    cache.J = __reinit_identity_jacobian!!(cache.J, cache.alpha)
     cache.resets = 0
     return nothing
 end
diff --git a/src/utils.jl b/src/utils.jl
index 59535aea1..1b341fd69 100644
--- a/src/utils.jl
+++ b/src/utils.jl
@@ -111,10 +111,10 @@ function dolinsolve(cache, precs::P, linsolve; A = nothing, linu = nothing, b =
     # Some Algorithms would reuse factorization but it causes the cache to not reset in
     # certain cases
     if A !== nothing
-        alg = linsolve.alg
-        if (alg isa LinearSolve.AbstractFactorization) ||
-           (alg isa LinearSolve.DefaultLinearSolver && !(alg ==
-              LinearSolve.DefaultLinearSolver(LinearSolve.DefaultAlgorithmChoice.KrylovJL_GMRES)))
+        alg = __getproperty(linsolve, Val(:alg))
+        if alg !== nothing && ((alg isa LinearSolve.AbstractFactorization) ||
+            (alg isa LinearSolve.DefaultLinearSolver && !(alg ==
+               LinearSolve.DefaultLinearSolver(LinearSolve.DefaultAlgorithmChoice.KrylovJL_GMRES))))
             # Factorization Algorithm
             if reuse_A_if_factorization
                 cache.stats.nfactors -= 1
@@ -477,3 +477,52 @@ end
         return Diagonal(@.. broadcast=false max(y.diag, @view(x[idxs])))
     end
 end
+
+# Alpha for Initial Jacobian Guess
+# The values are somewhat different from SciPy, these were tuned to the 23 test problems
+@inline function __initial_inv_alpha(α::Number, u, fu, norm::F) where {F}
+    return convert(promote_type(eltype(u), eltype(fu)), inv(α))
+end
+@inline function __initial_inv_alpha(::Nothing, u, fu, norm::F) where {F}
+    norm_fu = norm(fu)
+    return ifelse(norm_fu ≥ 1e-5, max(norm(u), true) / (2 * norm_fu),
+        convert(promote_type(eltype(u), eltype(fu)), true))
+end
+@inline __initial_inv_alpha(inv_α, α::Number, u, fu, norm::F) where {F} = inv_α
+@inline function __initial_inv_alpha(inv_α, α::Nothing, u, fu, norm::F) where {F}
+    return __initial_inv_alpha(α, u, fu, norm)
+end
+
+@inline function __initial_alpha(α::Number, u, fu, norm::F) where {F}
+    return convert(promote_type(eltype(u), eltype(fu)), α)
+end
+@inline function __initial_alpha(::Nothing, u, fu, norm::F) where {F}
+    norm_fu = norm(fu)
+    return ifelse(1e-5 ≤ norm_fu ≤ 1e5, max(norm(u), true) / (2 * norm_fu),
+        convert(promote_type(eltype(u), eltype(fu)), true))
+end
+@inline __initial_alpha(α_initial, α::Number, u, fu, norm::F) where {F} = α_initial
+@inline function __initial_alpha(α_initial, α::Nothing, u, fu, norm::F) where {F}
+    return __initial_alpha(α, u, fu, norm)
+end
+
+# Diagonal
+@inline function __get_diagonal!!(J::AbstractVector, J_full::AbstractMatrix)
+    if can_setindex(J)
+        if fast_scalar_indexing(J)
+            @inbounds for i in eachindex(J)
+                J[i] = J_full[i, i]
+            end
+        else
+            J .= view(J_full, diagind(J_full))
+        end
+    else
+        J = __diag(J_full)
+    end
+    return J
+end
+@inline __get_diagonal!!(J::Number, J_full::Number) = J_full
+
+@inline __diag(x::AbstractMatrix) = diag(x)
+@inline __diag(x::AbstractVector) = x
+@inline __diag(x::Number) = x
diff --git a/test/23_test_problems.jl b/test/23_test_problems.jl
index 21879b816..689b6266c 100644
--- a/test/23_test_problems.jl
+++ b/test/23_test_problems.jl
@@ -90,25 +90,36 @@ end
 end
 
 @testset "GeneralBroyden 23 Test Problems" begin
-    alg_ops = (GeneralBroyden(; max_resets = 1000),
-        GeneralBroyden(; max_resets = 1000, init_jacobian = Val(:true_jacobian)))
+    alg_ops = (GeneralBroyden(),
+        GeneralBroyden(; init_jacobian = Val(:true_jacobian)),
+        GeneralBroyden(; update_rule = Val(:bad_broyden)),
+        GeneralBroyden(; init_jacobian = Val(:true_jacobian),
+            update_rule = Val(:bad_broyden)))
 
     broken_tests = Dict(alg => Int[] for alg in alg_ops)
-    broken_tests[alg_ops[1]] = [1, 4, 5, 6, 11, 12, 13, 14]
+    broken_tests[alg_ops[1]] = [1, 5, 6, 11]
     broken_tests[alg_ops[2]] = [1, 5, 6, 8, 11, 18]
+    broken_tests[alg_ops[3]] = [1, 4, 5, 6, 9, 11]
+    broken_tests[alg_ops[4]] = [1, 5, 6, 8, 11]
 
     skip_tests = Dict(alg => Int[] for alg in alg_ops)
     skip_tests[alg_ops[1]] = [2, 22]
     skip_tests[alg_ops[2]] = [2, 22]
+    skip_tests[alg_ops[3]] = [2, 22]
+    skip_tests[alg_ops[4]] = [2, 22]
 
     test_on_library(problems, dicts, alg_ops, broken_tests; skip_tests)
 end
 
 @testset "GeneralKlement 23 Test Problems" begin
-    alg_ops = (GeneralKlement(; max_resets = 1000),)
+    alg_ops = (GeneralKlement(),
+        GeneralKlement(; init_jacobian = Val(:true_jacobian)),
+        GeneralKlement(; init_jacobian = Val(:true_jacobian_diagonal)))
 
     broken_tests = Dict(alg => Int[] for alg in alg_ops)
     broken_tests[alg_ops[1]] = [1, 2, 4, 5, 6, 11, 22]
+    broken_tests[alg_ops[2]] = [1, 2, 4, 5, 6, 8, 9, 10, 11, 13, 17, 21, 22, 23]
+    broken_tests[alg_ops[3]] = [2, 4, 5, 6, 7, 18, 22]
 
     test_on_library(problems, dicts, alg_ops, broken_tests)
 end
diff --git a/test/basictests.jl b/test/basictests.jl
index 3963571da..869690298 100644
--- a/test/basictests.jl
+++ b/test/basictests.jl
@@ -789,25 +789,28 @@ end
 # --- GeneralKlement tests ---
 
 @testset "GeneralKlement" begin
-    function benchmark_nlsolve_oop(f, u0, p = 2.0; linesearch = nothing)
+    function benchmark_nlsolve_oop(f, u0, p = 2.0; linesearch = nothing,
+            init_jacobian = Val(:identity))
         prob = NonlinearProblem{false}(f, u0, p)
-        return solve(prob, GeneralKlement(; linesearch), abstol = 1e-9)
+        return solve(prob, GeneralKlement(; linesearch, init_jacobian), abstol = 1e-9)
     end
 
-    function benchmark_nlsolve_iip(f, u0, p = 2.0; linesearch = nothing)
+    function benchmark_nlsolve_iip(f, u0, p = 2.0; linesearch = nothing,
+            init_jacobian = Val(:identity))
         prob = NonlinearProblem{true}(f, u0, p)
-        return solve(prob, GeneralKlement(; linesearch), abstol = 1e-9)
+        return solve(prob, GeneralKlement(; linesearch, init_jacobian), abstol = 1e-9)
     end
 
-    @testset "LineSearch: $(_nameof(lsmethod)) LineSearch AD: $(_nameof(ad))" for lsmethod in (Static(),
+    @testset "LineSearch: $(_nameof(lsmethod)) LineSearch AD: $(_nameof(ad)) Init Jacobian: $(init_jacobian)" for lsmethod in (Static(),
             StrongWolfe(), BackTracking(), HagerZhang(), MoreThuente()),
-        ad in (AutoFiniteDiff(), AutoZygote())
+        ad in (AutoFiniteDiff(), AutoZygote()),
+        init_jacobian in (Val(:identity), Val(:true_jacobian), Val(:true_jacobian_diagonal))
 
         linesearch = LineSearch(; method = lsmethod, autodiff = ad)
         u0s = ([1.0, 1.0], @SVector[1.0, 1.0], 1.0)
 
         @testset "[OOP] u0: $(typeof(u0))" for u0 in u0s
-            sol = benchmark_nlsolve_oop(quadratic_f, u0; linesearch)
+            sol = benchmark_nlsolve_oop(quadratic_f, u0; linesearch, init_jacobian)
             # Some are failing by a margin
             # @test SciMLBase.successful_retcode(sol)
             @test all(abs.(sol.u .* sol.u .- 2) .< 3e-9)
@@ -819,7 +822,7 @@ end
 
         @testset "[IIP] u0: $(typeof(u0))" for u0 in ([1.0, 1.0],)
             ad isa AutoZygote && continue
-            sol = benchmark_nlsolve_iip(quadratic_f!, u0; linesearch)
+            sol = benchmark_nlsolve_iip(quadratic_f!, u0; linesearch, init_jacobian)
             @test SciMLBase.successful_retcode(sol)
             @test all(abs.(sol.u .* sol.u .- 2) .< 1e-9)