Sleipnir C++ API
Loading...
Searching...
No Matches
newton.hpp
1// Copyright (c) Sleipnir contributors
2
3#pragma once
4
5#include <chrono>
6#include <cmath>
7#include <functional>
8#include <span>
9
10#include <Eigen/Core>
11#include <Eigen/SparseCore>
12#include <gch/small_vector.hpp>
13
14#include "sleipnir/optimization/solver/exit_status.hpp"
15#include "sleipnir/optimization/solver/iteration_info.hpp"
16#include "sleipnir/optimization/solver/newton_matrix_callbacks.hpp"
17#include "sleipnir/optimization/solver/options.hpp"
18#include "sleipnir/optimization/solver/util/all_finite.hpp"
19#include "sleipnir/optimization/solver/util/filter.hpp"
20#include "sleipnir/optimization/solver/util/kkt_error.hpp"
21#include "sleipnir/optimization/solver/util/regularized_ldlt.hpp"
22#include "sleipnir/util/assert.hpp"
23#include "sleipnir/util/print_diagnostics.hpp"
24#include "sleipnir/util/profiler.hpp"
25#include "sleipnir/util/scope_exit.hpp"
26#include "sleipnir/util/symbol_exports.hpp"
27
28// See docs/algorithms.md#Works_cited for citation definitions.
29
30namespace slp {
31
50template <typename Scalar>
51ExitStatus newton(
52 const NewtonMatrixCallbacks<Scalar>& matrix_callbacks,
53 std::span<std::function<bool(const IterationInfo<Scalar>& info)>>
54 iteration_callbacks,
55 const Options& options, Eigen::Vector<Scalar, Eigen::Dynamic>& x) {
56 using DenseVector = Eigen::Vector<Scalar, Eigen::Dynamic>;
57 using SparseMatrix = Eigen::SparseMatrix<Scalar>;
58 using SparseVector = Eigen::SparseVector<Scalar>;
59
60 using std::isfinite;
61
62 const auto solve_start_time = std::chrono::steady_clock::now();
63
64 gch::small_vector<SolveProfiler> solve_profilers;
65 solve_profilers.emplace_back("solver");
66 solve_profilers.emplace_back("↳ setup");
67 solve_profilers.emplace_back("↳ iteration");
68 solve_profilers.emplace_back(" ↳ feasibility check");
69 solve_profilers.emplace_back(" ↳ callbacks");
70 solve_profilers.emplace_back(" ↳ KKT matrix decomp");
71 solve_profilers.emplace_back(" ↳ KKT system solve");
72 solve_profilers.emplace_back(" ↳ line search");
73 solve_profilers.emplace_back(" ↳ f(x)");
74 solve_profilers.emplace_back(" ↳ ∇f(x)");
75 solve_profilers.emplace_back(" ↳ ∇²ₓₓL");
76
77 auto& solver_prof = solve_profilers[0];
78 auto& setup_prof = solve_profilers[1];
79 auto& inner_iter_prof = solve_profilers[2];
80 auto& feasibility_check_prof = solve_profilers[3];
81 auto& iter_callbacks_prof = solve_profilers[4];
82 auto& kkt_matrix_decomp_prof = solve_profilers[5];
83 auto& kkt_system_solve_prof = solve_profilers[6];
84 auto& line_search_prof = solve_profilers[7];
85
86 // Set up profiled matrix callbacks
87#ifndef SLEIPNIR_DISABLE_DIAGNOSTICS
88 auto& f_prof = solve_profilers[8];
89 auto& g_prof = solve_profilers[9];
90 auto& H_prof = solve_profilers[10];
91
92 NewtonMatrixCallbacks<Scalar> matrices{
93 matrix_callbacks.num_decision_variables,
94 [&](const DenseVector& x) -> Scalar {
95 ScopedProfiler prof{f_prof};
96 return matrix_callbacks.f(x);
97 },
98 [&](const DenseVector& x) -> SparseVector {
99 ScopedProfiler prof{g_prof};
100 return matrix_callbacks.g(x);
101 },
102 [&](const DenseVector& x) -> SparseMatrix {
103 ScopedProfiler prof{H_prof};
104 return matrix_callbacks.H(x);
105 }};
106#else
107 const auto& matrices = matrix_callbacks;
108#endif
109
110 solver_prof.start();
111 setup_prof.start();
112
113 Scalar f = matrices.f(x);
114 SparseVector g = matrices.g(x);
115 SparseMatrix H = matrices.H(x);
116
117 // Ensure matrix callback dimensions are consistent
118 slp_assert(g.rows() == matrices.num_decision_variables);
119 slp_assert(H.rows() == matrices.num_decision_variables);
120 slp_assert(H.cols() == matrices.num_decision_variables);
121
122 DenseVector trial_x;
123
124 Scalar trial_f;
125
126 // Check whether initial guess has finite cost and derivatives
127 if (!isfinite(f) || !all_finite(g) || !all_finite(H)) {
128 return ExitStatus::NONFINITE_INITIAL_GUESS;
129 }
130
131 int iterations = 0;
132
133 Filter<Scalar> filter;
134
135 RegularizedLDLT<Scalar> solver{matrices.num_decision_variables, 0};
136
137 // Variables for determining when a step is acceptable
138 constexpr Scalar α_reduction_factor(0.5);
139 constexpr Scalar α_min(1e-20);
140
141 // Error
142 Scalar E_0 = kkt_error<Scalar, KKTErrorType::INF_NORM_SCALED>(g);
143
144 setup_prof.stop();
145
146 // Prints final solver diagnostics when the solver exits
147 scope_exit exit{[&] {
148 if (options.diagnostics) {
149 solver_prof.stop();
150 if (iterations > 0) {
151 print_bottom_iteration_diagnostics();
152 }
153 print_solver_diagnostics(solve_profilers);
154 }
155 }};
156
157 while (E_0 > Scalar(options.tolerance)) {
158 ScopedProfiler inner_iter_profiler{inner_iter_prof};
159 ScopedProfiler feasibility_check_profiler{feasibility_check_prof};
160
161 // Check for diverging iterates
162 if (x.template lpNorm<Eigen::Infinity>() > Scalar(1e10) || !x.allFinite()) {
163 return ExitStatus::DIVERGING_ITERATES;
164 }
165
166 feasibility_check_profiler.stop();
167 ScopedProfiler iter_callbacks_profiler{iter_callbacks_prof};
168
169 // Call iteration callbacks
170 for (const auto& callback : iteration_callbacks) {
171 if (callback({iterations, x, {}, {}, {}, g, H, {}, {}})) {
172 return ExitStatus::CALLBACK_REQUESTED_STOP;
173 }
174 }
175
176 iter_callbacks_profiler.stop();
177 ScopedProfiler kkt_matrix_decomp_profiler{kkt_matrix_decomp_prof};
178
179 // Solve the Newton-KKT system
180 //
181 // Hpˣ = −∇f
182 solver.compute(H);
183
184 kkt_matrix_decomp_profiler.stop();
185 ScopedProfiler kkt_system_solve_profiler{kkt_system_solve_prof};
186
187 DenseVector p_x = solver.solve(-g);
188
189 kkt_system_solve_profiler.stop();
190 ScopedProfiler line_search_profiler{line_search_prof};
191
192 constexpr Scalar α_max(1);
193 Scalar α = α_max;
194
195 // Loop until a step is accepted. If a step becomes acceptable, the loop
196 // will exit early.
197 while (1) {
198 trial_x = x + α * p_x;
199
200 trial_f = matrices.f(trial_x);
201
202 // If f(xₖ + αpₖˣ) isn't finite, reduce step size immediately
203 if (!isfinite(trial_f)) {
204 // Reduce step size
205 α *= α_reduction_factor;
206
207 if (α < α_min) {
208 return ExitStatus::LINE_SEARCH_FAILED;
209 }
210 continue;
211 }
212
213 // Check whether filter accepts trial iterate
214 if (filter.try_add(FilterEntry{f}, FilterEntry{trial_f}, p_x, g, α)) {
215 // Accept step
216 break;
217 }
218
219 // Reduce step size
220 α *= α_reduction_factor;
221
222 // If step size hit a minimum, check if the KKT error was reduced. If it
223 // wasn't, report bad line search.
224 if (α < α_min) {
225 Scalar current_kkt_error = kkt_error<Scalar, KKTErrorType::ONE_NORM>(g);
226
227 trial_x = x + α_max * p_x;
228
229 Scalar next_kkt_error =
230 kkt_error<Scalar, KKTErrorType::ONE_NORM>(matrices.g(trial_x));
231
232 // If the step using αᵐᵃˣ reduced the KKT error, accept it anyway
233 if (next_kkt_error <= Scalar(0.999) * current_kkt_error) {
234 trial_f = matrices.f(trial_x);
235
236 // Accept step
237 break;
238 }
239
240 return ExitStatus::LINE_SEARCH_FAILED;
241 }
242 }
243
244 line_search_profiler.stop();
245
246 // Update iterates
247 x = trial_x;
248
249 f = trial_f;
250
251 // Update autodiff for Hessian
252 g = matrices.g(x);
253 H = matrices.H(x);
254
255 // Update the error
256 E_0 = kkt_error<Scalar, KKTErrorType::INF_NORM_SCALED>(g);
257
258 inner_iter_profiler.stop();
259
260 if (options.diagnostics) {
261 print_iteration_diagnostics(iterations, IterationType::NORMAL,
262 inner_iter_profiler.current_duration(), E_0,
263 f, Scalar(0), Scalar(0), Scalar(0),
264 solver.hessian_regularization(), α, α_max,
265 α_reduction_factor, Scalar(1));
266 }
267
268 ++iterations;
269
270 // Check for max iterations
271 if (iterations >= options.max_iterations) {
272 return ExitStatus::MAX_ITERATIONS_EXCEEDED;
273 }
274
275 // Check for max wall clock time
276 if (std::chrono::steady_clock::now() - solve_start_time > options.timeout) {
277 return ExitStatus::TIMEOUT;
278 }
279 }
280
281 return ExitStatus::SUCCESS;
282}
283
284extern template SLEIPNIR_DLLEXPORT ExitStatus
285newton(const NewtonMatrixCallbacks<double>& matrix_callbacks,
286 std::span<std::function<bool(const IterationInfo<double>& info)>>
287 iteration_callbacks,
288 const Options& options, Eigen::Vector<double, Eigen::Dynamic>& x);
289
290} // namespace slp