| // Ceres Solver - A fast non-linear least squares minimizer |
| // Copyright 2023 Google Inc. All rights reserved. |
| // http://ceres-solver.org/ |
| // |
| // Redistribution and use in source and binary forms, with or without |
| // modification, are permitted provided that the following conditions are met: |
| // |
| // * Redistributions of source code must retain the above copyright notice, |
| // this list of conditions and the following disclaimer. |
| // * Redistributions in binary form must reproduce the above copyright notice, |
| // this list of conditions and the following disclaimer in the documentation |
| // and/or other materials provided with the distribution. |
| // * Neither the name of Google Inc. nor the names of its contributors may be |
| // used to endorse or promote products derived from this software without |
| // specific prior written permission. |
| // |
| // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" |
| // AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE |
| // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE |
| // ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE |
| // LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR |
| // CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF |
| // SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS |
| // INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN |
| // CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) |
| // ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE |
| // POSSIBILITY OF SUCH DAMAGE. |
| // |
| // Author: sameeragarwal@google.com (Sameer Agarwal) |
| // |
| // Interface for and implementation of various Line search algorithms. |
| |
| #ifndef CERES_INTERNAL_LINE_SEARCH_H_ |
| #define CERES_INTERNAL_LINE_SEARCH_H_ |
| |
| #include <memory> |
| #include <string> |
| #include <vector> |
| |
| #include "absl/time/time.h" |
| #include "ceres/function_sample.h" |
| #include "ceres/internal/eigen.h" |
| #include "ceres/internal/export.h" |
| #include "ceres/types.h" |
| |
| namespace ceres::internal { |
| |
| class Evaluator; |
| class LineSearchFunction; |
| |
| // Line search is another name for a one dimensional optimization |
| // algorithm. The name "line search" comes from the fact one |
| // dimensional optimization problems that arise as subproblems of |
| // general multidimensional optimization problems. |
| // |
| // While finding the exact minimum of a one dimensional function is |
| // hard, instances of LineSearch find a point that satisfies a |
| // sufficient decrease condition. Depending on the particular |
| // condition used, we get a variety of different line search |
| // algorithms, e.g., Armijo, Wolfe etc. |
| class CERES_NO_EXPORT LineSearch { |
| public: |
| struct Summary; |
| |
| struct CERES_NO_EXPORT Options { |
| // Degree of the polynomial used to approximate the objective |
| // function. |
| LineSearchInterpolationType interpolation_type = CUBIC; |
| |
| // Armijo and Wolfe line search parameters. |
| |
| // Solving the line search problem exactly is computationally |
| // prohibitive. Fortunately, line search based optimization |
| // algorithms can still guarantee convergence if instead of an |
| // exact solution, the line search algorithm returns a solution |
| // which decreases the value of the objective function |
| // sufficiently. More precisely, we are looking for a step_size |
| // s.t. |
| // |
| // f(step_size) <= f(0) + sufficient_decrease * f'(0) * step_size |
| double sufficient_decrease = 1e-4; |
| |
| // In each iteration of the Armijo / Wolfe line search, |
| // |
| // new_step_size >= max_step_contraction * step_size |
| // |
| // Note that by definition, for contraction: |
| // |
| // 0 < max_step_contraction < min_step_contraction < 1 |
| // |
| double max_step_contraction = 1e-3; |
| |
| // In each iteration of the Armijo / Wolfe line search, |
| // |
| // new_step_size <= min_step_contraction * step_size |
| // Note that by definition, for contraction: |
| // |
| // 0 < max_step_contraction < min_step_contraction < 1 |
| // |
| double min_step_contraction = 0.9; |
| |
| // If during the line search, the step_size falls below this |
| // value, it is truncated to zero. |
| double min_step_size = 1e-9; |
| |
| // Maximum number of trial step size iterations during each line search, |
| // if a step size satisfying the search conditions cannot be found within |
| // this number of trials, the line search will terminate. |
| int max_num_iterations = 20; |
| |
| // Wolfe-specific line search parameters. |
| |
| // The strong Wolfe conditions consist of the Armijo sufficient |
| // decrease condition, and an additional requirement that the |
| // step-size be chosen s.t. the _magnitude_ ('strong' Wolfe |
| // conditions) of the gradient along the search direction |
| // decreases sufficiently. Precisely, this second condition |
| // is that we seek a step_size s.t. |
| // |
| // |f'(step_size)| <= sufficient_curvature_decrease * |f'(0)| |
| // |
| // Where f() is the line search objective and f'() is the derivative |
| // of f w.r.t step_size (d f / d step_size). |
| double sufficient_curvature_decrease = 0.9; |
| |
| // During the bracketing phase of the Wolfe search, the step size is |
| // increased until either a point satisfying the Wolfe conditions is |
| // found, or an upper bound for a bracket containing a point satisfying |
| // the conditions is found. Precisely, at each iteration of the |
| // expansion: |
| // |
| // new_step_size <= max_step_expansion * step_size. |
| // |
| // By definition for expansion, max_step_expansion > 1.0. |
| double max_step_expansion = 10; |
| |
| bool is_silent = false; |
| |
| // The one dimensional function that the line search algorithm |
| // minimizes. |
| LineSearchFunction* function = nullptr; |
| }; |
| |
| // Result of the line search. |
| struct Summary { |
| bool success = false; |
| FunctionSample optimal_point; |
| int num_function_evaluations = 0; |
| int num_gradient_evaluations = 0; |
| int num_iterations = 0; |
| // Cumulative time spent evaluating the value of the cost function across |
| // all iterations. |
| absl::Duration cost_evaluation_time = absl::ZeroDuration(); |
| // Cumulative time spent evaluating the gradient of the cost function across |
| // all iterations. |
| absl::Duration gradient_evaluation_time = absl::ZeroDuration(); |
| // Cumulative time spent minimizing the interpolating polynomial to compute |
| // the next candidate step size across all iterations. |
| absl::Duration polynomial_minimization_time = absl::ZeroDuration(); |
| absl::Duration total_time = absl::ZeroDuration(); |
| std::string error; |
| }; |
| |
| explicit LineSearch(const LineSearch::Options& options); |
| virtual ~LineSearch(); |
| |
| static std::unique_ptr<LineSearch> Create( |
| const LineSearchType line_search_type, |
| const LineSearch::Options& options, |
| std::string* error); |
| |
| // Perform the line search. |
| // |
| // step_size_estimate must be a positive number. |
| // |
| // initial_cost and initial_gradient are the values and gradient of |
| // the function at zero. |
| // summary must not be null and will contain the result of the line |
| // search. |
| // |
| // Summary::success is true if a non-zero step size is found. |
| void Search(double step_size_estimate, |
| double initial_cost, |
| double initial_gradient, |
| Summary* summary) const; |
| double InterpolatingPolynomialMinimizingStepSize( |
| const LineSearchInterpolationType& interpolation_type, |
| const FunctionSample& lowerbound_sample, |
| const FunctionSample& previous_sample, |
| const FunctionSample& current_sample, |
| const double min_step_size, |
| const double max_step_size) const; |
| |
| protected: |
| const LineSearch::Options& options() const { return options_; } |
| |
| private: |
| virtual void DoSearch(double step_size_estimate, |
| double initial_cost, |
| double initial_gradient, |
| Summary* summary) const = 0; |
| |
| private: |
| LineSearch::Options options_; |
| }; |
| |
| // An object used by the line search to access the function values |
| // and gradient of the one dimensional function being optimized. |
| // |
| // In practice, this object provides access to the objective |
| // function value and the directional derivative of the underlying |
| // optimization problem along a specific search direction. |
| class CERES_NO_EXPORT LineSearchFunction { |
| public: |
| explicit LineSearchFunction(Evaluator* evaluator); |
| void Init(const Vector& position, const Vector& direction); |
| |
| // Evaluate the line search objective |
| // |
| // f(x) = p(position + x * direction) |
| // |
| // Where, p is the objective function of the general optimization |
| // problem. |
| // |
| // evaluate_gradient controls whether the gradient will be evaluated |
| // or not. |
| // |
| // On return output->*_is_valid indicate indicate whether the |
| // corresponding fields have numerically valid values or not. |
| void Evaluate(double x, bool evaluate_gradient, FunctionSample* output); |
| |
| double DirectionInfinityNorm() const; |
| |
| // Resets to now, the start point for the results from TimeStatistics(). |
| void ResetTimeStatistics(); |
| void TimeStatistics(absl::Duration* cost_evaluation_time, |
| absl::Duration* gradient_evaluation_time) const; |
| const Vector& position() const { return position_; } |
| const Vector& direction() const { return direction_; } |
| |
| private: |
| Evaluator* evaluator_; |
| Vector position_; |
| Vector direction_; |
| |
| // scaled_direction = x * direction_; |
| Vector scaled_direction_; |
| |
| // We may not exclusively own the evaluator (e.g. in the Trust Region |
| // minimizer), hence we need to save the initial evaluation durations for the |
| // value & gradient to accurately determine the duration of the evaluations |
| // we invoked. These are reset by a call to ResetTimeStatistics(). |
| absl::Duration initial_evaluator_residual_time = absl::ZeroDuration(); |
| absl::Duration initial_evaluator_jacobian_time = absl::ZeroDuration(); |
| }; |
| |
| // Backtracking and interpolation based Armijo line search. This |
| // implementation is based on the Armijo line search that ships in the |
| // minFunc package by Mark Schmidt. |
| // |
| // For more details: http://www.di.ens.fr/~mschmidt/Software/minFunc.html |
| class CERES_NO_EXPORT ArmijoLineSearch final : public LineSearch { |
| public: |
| explicit ArmijoLineSearch(const LineSearch::Options& options); |
| |
| private: |
| void DoSearch(double step_size_estimate, |
| double initial_cost, |
| double initial_gradient, |
| Summary* summary) const final; |
| }; |
| |
| // Bracketing / Zoom Strong Wolfe condition line search. This implementation |
| // is based on the pseudo-code algorithm presented in Nocedal & Wright [1] |
| // (p60-61) with inspiration from the WolfeLineSearch which ships with the |
| // minFunc package by Mark Schmidt [2]. |
| // |
| // [1] Nocedal J., Wright S., Numerical Optimization, 2nd Ed., Springer, 1999. |
| // [2] http://www.di.ens.fr/~mschmidt/Software/minFunc.html. |
| class CERES_NO_EXPORT WolfeLineSearch final : public LineSearch { |
| public: |
| explicit WolfeLineSearch(const LineSearch::Options& options); |
| |
| // Returns true iff either a valid point, or valid bracket are found. |
| bool BracketingPhase(const FunctionSample& initial_position, |
| const double step_size_estimate, |
| FunctionSample* bracket_low, |
| FunctionSample* bracket_high, |
| bool* perform_zoom_search, |
| Summary* summary) const; |
| // Returns true iff final_line_sample satisfies strong Wolfe conditions. |
| bool ZoomPhase(const FunctionSample& initial_position, |
| FunctionSample bracket_low, |
| FunctionSample bracket_high, |
| FunctionSample* solution, |
| Summary* summary) const; |
| |
| private: |
| void DoSearch(double step_size_estimate, |
| double initial_cost, |
| double initial_gradient, |
| Summary* summary) const final; |
| }; |
| |
| } // namespace ceres::internal |
| |
| #endif // CERES_INTERNAL_LINE_SEARCH_H_ |