Commit: General tweaks
ojwoodford authored Oct 26, 2023
1 parent d4e3d98 commit bfa26ce
Showing 9 changed files with 51 additions and 31 deletions.
2 changes: 1 addition & 1 deletion examples/rosenbrock.jl
@@ -17,7 +17,7 @@ NLLSsolver.ndeps(::Rosenbrock) = static(1) # Residual depends on 1 variable
NLLSsolver.nres(::Rosenbrock) = static(2) # Residual has length 2
NLLSsolver.varindices(::Rosenbrock) = SVector(1) # There's only one variable
NLLSsolver.getvars(::Rosenbrock, vars::Vector) = (vars[1]::NLLSsolver.EuclideanVector{2, Float64},)
-NLLSsolver.computeresidual(res::Rosenbrock, x) = SVector(res.a - x[1], res.b * (x[1] ^ 2 - x[2]))
+NLLSsolver.computeresidual(res::Rosenbrock, x) = SVector(res.a * (1 - x[1]), res.b * (x[1] ^ 2 - x[2]))

function constructrosenbrockprob()
# Create the problem
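Note on this change: scaling the first residual by `a` matches the standard Rosenbrock form, whose minimum sits at (1, 1) for any `a`; the old `res.a - x[1]` term moved the optimum to (a, a²) instead. A self-contained sanity check of the corrected residual (the struct is redeclared here for illustration; the real definition is in examples/rosenbrock.jl):

```julia
using StaticArrays

# Redeclared locally so the snippet runs standalone; mirrors examples/rosenbrock.jl
struct Rosenbrock
    a::Float64
    b::Float64
end
computeresidual(res::Rosenbrock, x) = SVector(res.a * (1 - x[1]), res.b * (x[1]^2 - x[2]))

res = Rosenbrock(1.0, 10.0)
@assert all(iszero, computeresidual(res, SVector(1.0, 1.0)))  # zero residual at the optimum (1, 1)
```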
12 changes: 8 additions & 4 deletions src/callbacks.jl
@@ -5,21 +5,25 @@ nullcallback(cost, unusedargs...) = (cost, 0)

# Print out per-iteration results
function printoutcallback(cost, problem, data, trailingargs...)
+    prevcost = data.bestcost
    if data.iternum == 1
+        prevcost = data.startcost
        # First iteration, so print out column headers and the zeroth iteration (i.e. start) values
        println("iter cost cost_change |step|")
-        @printf("% 4d % 8e % 4.3e % 3.2e\n", 0, data.bestcost, 0, 0)
+        @printf("% 4d % 8e % 4.3e % 3.2e\n", 0, prevcost, 0, 0)
    end
-    @printf("% 4d % 8e % 4.3e % 3.2e\n", data.iternum, cost, data.bestcost-cost, norm(data.linsystem.x))
+    @printf("% 4d % 8e % 4.3e % 3.2e\n", data.iternum, cost, prevcost-cost, norm(data.linsystem.x))
    return cost, 0
end
function printoutcallback(cost, data, trradius::Float64)
+    prevcost = data.bestcost
    if data.iternum == 1
+        prevcost = data.startcost
        # First iteration, so print out column headers and the zeroth iteration (i.e. start) values
        println("iter cost cost_change |step| tr_radius")
-        @printf("% 4d % 8e % 4.3e % 3.2e % 2.1e\n", 0, data.bestcost, 0, 0, trradius)
+        @printf("% 4d % 8e % 4.3e % 3.2e % 2.1e\n", 0, prevcost, 0, 0, trradius)
    end
-    @printf("% 4d % 8e % 4.3e % 3.2e % 2.1e\n", data.iternum, cost, data.bestcost-cost, norm(data.linsystem.x), trradius)
+    @printf("% 4d % 8e % 4.3e % 3.2e % 2.1e\n", data.iternum, cost, prevcost-cost, norm(data.linsystem.x), trradius)
    return cost, 0
end

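Note on `prevcost`: previously the zeroth row and the first `cost_change` were printed against `data.bestcost`; with the preoptimization hook added in this commit, the recorded start cost can differ from the best cost by iteration 1, so the callback now falls back to `data.startcost` there. A toy sketch of the baseline selection (`MockData` is hypothetical, standing in for the solver's internal data struct):

```julia
# Hypothetical stand-in for the fields the callback reads
mutable struct MockData
    iternum::Int
    bestcost::Float64
    startcost::Float64
end

baseline(data::MockData) = data.iternum == 1 ? data.startcost : data.bestcost

data = MockData(1, 8.0, 24.2)   # start cost recorded before any optimization
@assert baseline(data) == 24.2  # iteration 1 reports change from the true start
data.iternum = 2
@assert baseline(data) == 8.0   # later iterations report change from the best so far
```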
28 changes: 20 additions & 8 deletions src/iterators.jl
@@ -2,6 +2,9 @@ using SparseArrays

negate!(x) = @.(x = -x)

+# Default preoptimization - do nothing, return lowest cost possible
+preoptimization(::Any, unusedargs...) = -Inf

# Iterators assume that the linear problem has been constructed

# Newton optimization (undamped-Hessian form)
@@ -32,15 +35,14 @@ mutable struct DoglegData{T}
        return new{typeof(data.linsystem.x)}(0.0, similar(data.linsystem.x))
    end
end
+gettr(dd::DoglegData) = dd.trustradius
+settr!(dd::DoglegData, tr) = dd.trustradius = tr
function reset!(dd::DoglegData{T}, ::NLLSProblem, data::NLLSInternal) where T<:Vector
-    dd.trustradius = 0.0
+    settr!(dd, 0.0)
    resize!(dd.cauchy, length(data.linsystem.x))
    return
end
-function reset!(dd::DoglegData{T}, ::NLLSProblem, data::NLLSInternal) where T<:StaticVector
-    dd.trustradius = 0.0
-    return
-end
+reset!(dd::DoglegData{T}, ::NLLSProblem, data::NLLSInternal) where T<:StaticVector = settr!(dd, 0.0)

function iterate!(doglegdata::DoglegData, data, problem::NLLSProblem, options::NLLSOptions)::Float64
hessian, gradient = gethessgrad(data.linsystem)
@@ -122,13 +124,23 @@ mutable struct LevMarData
        return new(0.0)
    end
end
-reset!(lmd::LevMarData, ::NLLSProblem, ::NLLSInternal) = lmd.lambda = 0.0
+gettr(lmd::LevMarData) = lmd.lambda
+settr!(lmd::LevMarData, tr) = lmd.lambda = tr
+reset!(lmd::LevMarData, ::NLLSProblem, ::NLLSInternal) = settr!(lmd, 0.0)

+function initlambda(hessian)
+    m = zero(eltype(hessian))
+    for i in indices(hessian, 1)
+        @inbounds m = max(m, abs(hessian[i,i]))
+    end
+    return m * 1e-6
+end
+
function iterate!(levmardata::LevMarData, data, problem::NLLSProblem, options::NLLSOptions)::Float64
    @assert levmardata.lambda >= 0.
    hessian, gradient = gethessgrad(data.linsystem)
    if levmardata.lambda == 0
-        levmardata.lambda = tr(hessian) ./ (size(hessian, 1) * 1e6)
+        levmardata.lambda = initlambda(hessian)
    end
    lastlambda = 0.
    mu = 2.
@@ -145,7 +157,7 @@ function iterate!(levmardata::LevMarData, data, problem::NLLSProblem, options::N
    data.timecost += @elapsed_ns cost_ = cost(problem.varnext, problem.costs)
    data.costcomputations += 1
    # Check for exit
-    if !(cost_ > data.bestcost) || (maximum(abs, data.linsystem.x) < options.dstep)
+    if !(cost_ > data.bestcost) || maximum(abs, data.linsystem.x) < options.dstep
        # Success (or convergence) - update lambda
        uniformscaling!(hessian, -lastlambda)
        stepquality = (cost_ - data.bestcost) / (0.5 * fast_bAb(hessian, data.linsystem.x) + dot(gradient, data.linsystem.x))
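Two things to note in this file: `gettr`/`settr!` give DoglegData and LevMarData a shared accessor interface for their damping/trust-region state, and the initial Levenberg-Marquardt damping changes from `tr(H) / (n * 1e6)` (the mean diagonal scaled by 1e-6) to 1e-6 times the largest absolute diagonal entry, which is less sensitive to a few small diagonal values. A standalone sketch of the new rule, with Base's `axes` standing in for the package's `indices`:

```julia
# Standalone version of initlambda; axes() replaces the package's indices()
function initlambda(hessian)
    m = zero(eltype(hessian))
    for i in axes(hessian, 1)
        m = max(m, abs(hessian[i, i]))
    end
    return m * 1e-6
end

H = [4.0 1.0; 1.0 9.0]
@assert initlambda(H) ≈ 9.0e-6  # driven by the largest diagonal entry
# The old rule would give tr(H) / (2 * 1e6) = 6.5e-6 here
```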
4 changes: 2 additions & 2 deletions src/linearsystem.jl
@@ -61,9 +61,9 @@ struct MultiVariateLSsparse
        hessian = SparseMatrixCSC{Float64, Int}(sparseindices.m, sparseindices.n, sparseindices.colptr, sparseindices.rowval, Vector{Float64}(undef, length(sparseindices.nzval)))
        sparseindices = sparseindices.nzval
    else
-        x = Vector{Float64}()
+        x = Vector{Float64}(undef, 1)
        sparseindices = Vector{Int}()
-        hessian = spzeros(0, 0)
+        hessian = spzeros(1, 1)
    end
    ldlfac = ldl_analyze(hessian)
    return new(A, zeros(Float64, blen), x, blockindices, boffsets, hessian, sparseindices, ldlfac)
7 changes: 5 additions & 2 deletions src/marginalize.jl
@@ -91,6 +91,7 @@ function marginalize!(to::MultiVariateLS, from::MultiVariateLSsparse, fromblock
            marginalize!(to, from, range, blocksz)
        end
    end
+    return to
end

function initcrop!(to::MultiVariateLSsparse, from::MultiVariateLSsparse, fromblock=length(to.A.rowblocksizes)+1)
@@ -100,6 +101,7 @@ function initcrop!(to::MultiVariateLSsparse, from::MultiVariateLSsparse, fromblo
    to.b .= view(from.b, 1:lastindex(to.b))
    endind = from.A.indicestransposed.nzval[from.A.indicestransposed.colptr[fromblock]] - 1
    view(to.A.data, 1:endind) .= view(from.A.data, 1:endind)
+    return to
end

function initcrop!(to::MultiVariateLSdense, from::MultiVariateLSsparse, fromblock=length(to.A.rowblockoffsets))
@@ -115,6 +117,7 @@ function initcrop!(to::MultiVariateLSdense, from::MultiVariateLSsparse, frombloc
            block(to.A, row, col, lenr, lenc) .= reshape(view(from.A.data, (0:lenr*lenc-1) .+ from.A.indicestransposed.nzval[colind]), lenr, lenc)
        end
    end
+    return to
end

function constructcrop(from::MultiVariateLSsparse, fromblock, forcesparse=false)
@@ -150,10 +153,10 @@ function constructcrop(from::MultiVariateLSsparse, fromblock, forcesparse=false)
            A = BlockSparseMatrix{Float64}(start-1, cropsparsity, blocksizes, blocksizes)

            # Construct the sparse linear system
-            return MultiVariateLSsparse(A, from.blockindices[1:findfirst(isequal(fromblock), from.blockindices)])
+            return MultiVariateLSsparse(A, from.blockindices[1:findfirst(isequal(fromblock), from.blockindices)-1])
        end
    end

    # Construct a dense linear system
-    return MultiVariateLSdense(toblocksizes, from.blockindices)
+    return MultiVariateLSdense(toblocksizes, from.blockindices[1:findfirst(isequal(fromblock), from.blockindices)-1])
end
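The two `-1`s fix an off-by-one when cropping: `findfirst(isequal(fromblock), from.blockindices)` locates the first block being marginalized out, so the cropped system should carry only the indices before it; the dense branch previously passed `from.blockindices` unsliced. The added `return to` lines above also make the mutating helpers return the system they filled in. A worked illustration of the slicing, with hypothetical values:

```julia
# Hypothetical block indices; fromblock is the first block to marginalize out
blockindices = [1, 2, 3, 4, 5]
fromblock = 4
pos = findfirst(isequal(fromblock), blockindices)  # position of the first marginalized block

kept_old = blockindices[1:pos]       # before: [1, 2, 3, 4] - includes the marginalized block
kept_new = blockindices[1:pos - 1]   # after:  [1, 2, 3]    - retained blocks only
@assert kept_new == [1, 2, 3]
```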
21 changes: 11 additions & 10 deletions src/optimize.jl
@@ -78,18 +78,19 @@ end

# The meat of an optimization
function optimizeinternal!(problem::NLLSProblem, options::NLLSOptions, data, iteratedata, callback)
-    # Timing initializations
+    # Do any preoptimization for the iterator
+    data.startcost = preoptimization(iteratedata, problem, options, data)::Float64
+    # Other initializations
+    fails = 0
+    data.iternum = 0
    stoptime = data.starttime + options.maxtime
    data.timeinit += Base.time_ns() - data.starttime
    # Initialize the linear problem
-    data.timegradient += @elapsed_ns data.bestcost = costgradhess!(data.linsystem, problem.variables, problem.costs)
+    data.timegradient += @elapsed_ns cost = costgradhess!(data.linsystem, problem.variables, problem.costs)
    data.gradientcomputations += 1
-    data.startcost = data.bestcost
+    data.bestcost = cost
+    data.startcost = max(cost, data.startcost)
    # Do the iterations
-    fails = 0
-    cost = data.bestcost
    converged = 0
-    data.iternum = 0
    while true
        data.iternum += 1
        # Call the per iteration solver
@@ -158,11 +159,11 @@ end
end

# Optimizing variables one at a time (e.g. in alternation)
-function optimizesinglesinternal!(problem::NLLSProblem, options::NLLSOptions, data::NLLSInternal{LST}, iteratedata, allcosts::CostStruct, costindices, indices, first) where {LST<:UniVariateLS}
+function optimizesinglesinternal!(problem::NLLSProblem, options::NLLSOptions, data::NLLSInternal{LST}, iteratedata, allcosts::CostStruct, costindices, varindices, first) where {LST<:UniVariateLS}
    iternum = data.iternum
-    while first <= length(indices)
+    while first <= length(varindices)
        # Bail out if the variable size changes
-        ind = indices[first]
+        ind = varindices[first]
        if nvars(problem.variables[ind]) != length(data.linsystem.b)
            break
        end
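How the pieces fit: `preoptimization` (default defined in src/iterators.jl) lets an iterator do work before the main loop and report the cost it started from; since the default returns `-Inf`, the `max(cost, data.startcost)` line leaves the start cost equal to the first full cost evaluation whenever no preoptimization ran. A sketch of that interaction (the concrete values are hypothetical):

```julia
# Default from src/iterators.jl: do nothing, return the lowest cost possible
preoptimization(::Any, unusedargs...) = -Inf

startcost = preoptimization(nothing)  # -Inf with the default
cost = 3.7                            # first full cost evaluation (hypothetical value)
startcost = max(cost, startcost)
@assert startcost == 3.7              # falls back to the initial cost
```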
2 changes: 1 addition & 1 deletion src/utils.jl
@@ -105,7 +105,7 @@ function fast_bAb(A::SparseMatrixCSC, b::Vector)
    return total
end

-sparse_dense_decision(d, nnz) = (nnz * 32) < (25 * d * (d - 40)) # Threshold nnz = 25/32 * (d^2 - 40d)
+sparse_dense_decision(d, nnz) = (nnz * 64) < (25 * d * (d - 40)) # Threshold nnz (for lower triangle) = 25/64 * (d^2 - 40d)

function block_sparse_nnz(sparsity, blocksizes)
# Compute the number of non-zeros in a block sparse matrix
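The factor doubles from 32 to 64 because `nnz` is now the count for the lower triangle only (roughly half the full matrix), so the effective sparse/dense crossover stays about the same: use sparse storage when the lower-triangle non-zeros fall below 25/64 * (d^2 - 40d). A worked check at d = 1000, where that threshold is 375,000:

```julia
sparse_dense_decision(d, nnz) = (nnz * 64) < (25 * d * (d - 40))

# d = 1000: 25/64 * (1_000_000 - 40_000) = 375_000 lower-triangle non-zeros
@assert sparse_dense_decision(1000, 300_000)    # below threshold -> sparse
@assert !sparse_dense_decision(1000, 400_000)   # above threshold -> dense
```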
2 changes: 1 addition & 1 deletion test/functional.jl
@@ -9,7 +9,7 @@ NLLSsolver.ndeps(::RosenbrockA) = static(1)
NLLSsolver.nres(::RosenbrockA) = 1
NLLSsolver.varindices(::RosenbrockA) = SVector(1)
NLLSsolver.getvars(::RosenbrockA, vars::Vector) = (vars[1]::Float64,)
-NLLSsolver.computeresidual(res::RosenbrockA, x) = res.a - x
+NLLSsolver.computeresidual(res::RosenbrockA, x) = res.a * (1 - x)
Base.eltype(::RosenbrockA) = Float64
const rosenbrockrobustifier = NLLSsolver.Scaled(NLLSsolver.Huber2oKernel(1.6), 1.0)
NLLSsolver.robustkernel(::RosenbrockA) = rosenbrockrobustifier
4 changes: 2 additions & 2 deletions test/marginalize.jl
@@ -60,7 +60,7 @@ using NLLSsolver, SparseArrays, StaticArrays, Test, Random
@test hess_d ≈ hess_s
@test to_d.b == to_s.b

-# Check that the reduced systems gives the correct variable update
+# Check that the reduced systems give the correct variable update
@test hessian \ gradient ≈ gtupdate
@test hess_d \ to_d.b ≈ gtupdate
@test hess_s \ to_s.b ≈ gtupdate
@@ -79,7 +79,7 @@ using NLLSsolver, SparseArrays, StaticArrays, Test, Random
@test hess_d ≈ hess_s
@test to_d.b == to_s.b

-# Check that the reduced systems gives the correct variable update
+# Check that the reduced systems give the correct variable update
@test hess_d \ to_d.b ≈ gtupdate
@test hess_s \ to_s.b ≈ gtupdate
end

2 comments on commit bfa26ce

@ojwoodford
Owner Author

@JuliaRegistrator

Registration pull request created: JuliaRegistries/General/94136

After the above pull request is merged, it is recommended that a tag is created on this repository for the registered package version.

This will be done automatically if the Julia TagBot GitHub Action is installed, or can be done manually through the github interface, or via:

git tag -a v3.3.2 -m "<description of version>" bfa26ce56ca887e2cc94aa714e77ee6601d0d7c0
git push origin v3.3.2
