1#ifndef STAN_MATH_MIX_FUNCTOR_WOLFE_LINE_SEARCH_HPP
2#define STAN_MATH_MIX_FUNCTOR_WOLFE_LINE_SEARCH_HPP
// NOTE(review): extraction-mangled fragment of cubic_spline(...) — many
// interior lines are missing; the leading digits on each line are original
// line numbers fused into the text by the extraction, not code.
// Per the generated docs, this selects a safeguarded trial point for
// maximizing a scalar function on a line segment [x_left, x_right].
158template <
typename Scalar>
160 Scalar df_left, Scalar x_right,
162 Scalar df_right)
noexcept {
// Fallback candidate: bisection midpoint of the bracket.
163 const Scalar midpoint = (x_left + x_right) / Scalar(2);
// Guard: degenerate bracket or any non-finite input — presumably returns
// the midpoint here (body of this branch is missing from the fragment).
166 if (!(x_right > x_left) || !std::isfinite(f_left) || !std::isfinite(f_right)
167 || !std::isfinite(df_left) || !std::isfinite(df_right)) {
171 const Scalar width = x_right - x_left;
172 const Scalar eps = std::numeric_limits<Scalar>::epsilon();
// Relative width check: bail out when the bracket is at rounding scale.
177 = std::max(std::max(std::abs(x_left), std::abs(x_right)), Scalar(1));
178 if (width <= eps * x_scale) {
// Work in normalized coordinate s in [0, 1]; derivatives are rescaled by
// the bracket width so the cubic below is expressed on the unit interval.
184 const Scalar df_left_s = width * df_left;
185 const Scalar df_right_s = width * df_right;
// Hermite cubic p(s) = a0 + a1 s + a2 s^2 + a3 s^3 matching the endpoint
// values and (scaled) slopes.
190 const Scalar a0 = f_left;
191 const Scalar a1 = df_left_s;
193 = Scalar(3) * (f_right - f_left) - Scalar(2) * df_left_s - df_right_s;
194 const Scalar a3 = Scalar(2) * (f_left - f_right) + df_left_s + df_right_s;
// Horner evaluation of the cubic.
196 auto eval = [&](Scalar s) -> Scalar {
198 return ((a3 * s + a2) * s + a1) * s + a0;
// Candidates must stay strictly inside (edge_guard, 1 - edge_guard).
203 constexpr Scalar edge_guard = Scalar(1
e-9);
// Start from the midpoint (s = 0.5) as the incumbent best candidate;
// `consider` keeps the candidate with the largest cubic value (maximize).
206 Scalar best_val =
eval(0.5);
207 auto consider = [&](Scalar s) {
208 if (!std::isfinite(s)) {
211 if (!(s > edge_guard && s < Scalar(1) - edge_guard)) {
214 const Scalar value =
eval(s);
215 if (value > best_val) {
// Secant candidate from the two endpoint slopes, guarded against a
// near-zero denominator at derivative scale.
223 const Scalar denom = df_left_s - df_right_s;
224 const Scalar deriv_scale = std::max(
225 std::max(std::abs(df_left_s), std::abs(df_right_s)), Scalar(1));
226 if (std::abs(denom) > eps * deriv_scale) {
227 const Scalar s_secant
// Stationary points of the cubic: roots of p'(s) = 3 a3 s^2 + 2 a2 s + a1,
// i.e. A s^2 + B s + C with the coefficients below.
236 const Scalar A = Scalar(3) * a3;
237 const Scalar B = Scalar(2) * a2;
241 = std::max(std::max(std::abs(B), std::abs(C)), Scalar(1));
242 const Scalar A_tol = eps * scale;
// Nearly-linear derivative: treat as a single root -C/B (branch body
// partially missing in this fragment).
244 if (std::abs(A) <= A_tol) {
246 const Scalar B_tol = eps * scale;
247 if (std::abs(B) > B_tol) {
// fma gives one rounding for B^2 - 4AC; a tiny negative discriminant
// within disc_tol is presumably clamped to zero (clamp line missing).
252 Scalar disc = std::fma(-Scalar(4) * A, C, B * B);
253 const Scalar disc_scale
254 = std::max(B * B + std::abs(Scalar(4) * A * C), Scalar(1));
255 const Scalar disc_tol = Scalar(10) * eps * disc_scale;
258 if (disc < Scalar(0) && -disc <= disc_tol) {
// Numerically stable quadratic roots: q = -(B + sign(B) sqrt(disc)) / 2,
// then s1 = q / A and s2 = C / q avoid cancellation.
262 if (disc >= Scalar(0)) {
263 const Scalar r = std::sqrt(disc);
264 const Scalar q = -Scalar(0.5) * (B + std::copysign(r, B));
265 const Scalar q_scale = std::max(std::abs(B) + r, Scalar(1));
266 const Scalar q_tol = eps * q_scale;
268 if (std::abs(q) > q_tol) {
269 const Scalar s1 = q / A;
270 const Scalar s2 = C / q;
// Degenerate quadratic (q ~ 0): fall back to the parabola vertex.
275 const Scalar s_vertex = -B / (Scalar(2) * A);
// Map the best normalized candidate back to the original coordinate.
282 return x_left + best_s * width;
// NOTE(review): fragment — the signature line is missing from this
// extraction. Wraps cubic_spline for the (low, high) Eval bracket and
// guards the result away from the bracket edges.
285template <
typename Eval,
typename Options>
// Interpolated trial stepsize from the cubic fit on [low.alpha, high.alpha].
287 auto alpha =
cubic_spline(low.alpha(), low.obj(), low.dir(), high.alpha(),
288 high.obj(), high.dir());
289 const double width = high.alpha() - low.alpha();
// Keep the trial at least 0.1% of the bracket width away from either edge.
290 const double guard = 1
e-3 * width;
291 alpha = std::clamp(alpha, low.alpha() + guard, high.alpha() - guard);
/**
 * Armijo (sufficient-increase) condition for a line search that
 * *maximizes* the objective.
 *
 * Accepts the trial point only if the objective both did not decrease and
 * achieved at least the fraction `opt.c1` of the increase predicted by the
 * initial directional derivative.
 *
 * NOTE(review): reconstructed from a truncated fragment — the original body
 * was cut before its closing brace; the logic below matches the visible
 * return expression exactly.
 *
 * @tparam Option options type exposing the Armijo parameter `c1`
 * @param obj_next objective value at the trial step
 * @param obj_init objective value at the start of the line search
 * @param alpha_next trial stepsize
 * @param dir0 directional derivative at the start of the line search
 * @param opt line-search options (reads `opt.c1`)
 * @return true if the sufficient-increase condition holds
 */
template <typename Option>
inline auto check_armijo(double obj_next, double obj_init, double alpha_next,
                         double dir0, Option&& opt) {
  return (obj_next >= obj_init)
         && (obj_next >= obj_init + alpha_next * dir0 * opt.c1);
}
// NOTE(review): template header for check_wolfe(const Eval&, const WolfeT&,
// const Option&) — the function body is missing from this extraction
// fragment (per the generated docs it returns bool).
302template <
typename Eval,
typename WolfeT,
typename Option>
/**
 * Strong Wolfe curvature condition.
 *
 * Accepts the trial point when the magnitude of the directional derivative
 * has shrunk to at most `opt.c2` times the magnitude of the initial
 * directional derivative.
 *
 * NOTE(review): the signature line was lost in this extraction; it is
 * reconstructed from the generated documentation
 * (`check_wolfe_curve(double dir_deriv_next, double dir_deriv_init,
 * Option&& opt)`). The return expression is byte-identical to the original.
 *
 * @tparam Option options type exposing the curvature parameter `c2`
 * @param dir_deriv_next directional derivative at the trial step
 * @param dir_deriv_init directional derivative at the start of the search
 * @param opt line-search options (reads `opt.c2`)
 * @return true if the strong curvature condition holds
 */
template <typename Option>
inline auto check_wolfe_curve(double dir_deriv_next, double dir_deriv_init,
                              Option&& opt) {
  return std::abs(dir_deriv_next) <= (opt.c2 * std::abs(dir_deriv_init));
}
// NOTE(review): two unrelated fragments fused by the extraction.
// First, a template header (original line 314) whose function body is
// missing from this view.
314template <
typename Eval,
typename WolfeT,
typename Option>
// Second, the return strings of wolfe_status_str(WolfeStatus s) — per the
// generated docs a pretty-printing helper; the switch/if structure that
// selects between these cases is missing from this fragment.
375 return "ConvergedGradient";
377 return "ConvergedObjective";
379 return "ConvergedObjectiveAndGradient";
381 return "IntervalTooSmall";
383 return "StepTooSmall";
385 return "ReachedMaxStep";
387 return "NumericalIssue";
// Const accessors of the Eval struct (evaluation record for the Wolfe line
// search): objective value and directional derivative at a trial stepsize.
// NOTE(review): each accessor is split across several lines by the
// extraction; tokens are preserved verbatim.
410 inline const auto&
obj()
const {
return obj_; }
412 inline const auto&
dir()
const {
return dir_; }
// WolfeData constructors and a() accessors (fragment; bodies of the first
// two constructors are missing from this extraction).
// Ctor 1: explicit initial offset vector `a` plus theta0 and gradient
// functor.
436 template <
typename ObjFun,
typename ThetaGradF,
typename Theta0>
437 WolfeData(ObjFun&& obj_fun,
const Eigen::VectorXd&
a,
const Theta0& theta0,
438 ThetaGradF&& theta_grad_f)
// Ctor 2: size-only variant — presumably default-initializes the offset
// vector of length n (body missing; confirm against the full header).
444 template <
typename ObjFun,
typename ThetaGradF,
typename Theta0>
445 WolfeData(ObjFun&& obj_fun, Eigen::Index n,
const Theta0& theta0,
446 ThetaGradF&& theta_grad_f)
// Ctor 3: log-likelihood variant; delegates with a zero vector of length n
// as the initial `a`.
453 template <
typename LLFun,
typename LLArgs,
typename Msgs>
454 WolfeData(Eigen::Index n,
const LLFun& ll_fun,
const LLArgs& ll_args,
456 :
WolfeData(n,
Eigen::VectorXd::Zero(n), ll_fun, ll_args, msgs) {}
// Ref-qualified accessors for the a_ member: mutable lvalue, const lvalue,
// and rvalue (moves a_ out of an expiring object).
483 inline auto&
a() & {
return a_; }
484 inline const auto&
a() const& {
return a_; }
485 inline auto&&
a() && {
return std::move(
a_); }
// WolfeInfo forwarding constructor (fragment): builds curr_ by perfectly
// forwarding the objective functor, initial offset, theta0, and gradient
// functor. Per the generated docs it establishes a consistent
// (a_init, theta_init) pair.
518 template <
typename ObjFun,
typename Theta0,
typename AInit,
520 WolfeInfo(ObjFun&& obj_fun, AInit&& a_init, Theta0&& theta0,
521 ThetaGradF&& theta_grad_f)
522 :
curr_(
std::forward<ObjFun>(obj_fun),
std::forward<AInit>(a_init),
523 std::forward<Theta0>(theta0),
524 std::forward<ThetaGradF>(theta_grad_f)),
// Reject a non-finite initial objective (the guarding condition line is
// missing from this fragment).
528 throw std::domain_error(
529 "laplace_marginal_density: log likelihood is not finite at initial "
530 "theta and likelihood arguments.");
// Flip the initial directional derivative to be non-negative — presumably
// so the search direction is always an ascent direction; confirm against
// the full header.
547 if (this->init_dir_ < 0) {
549 this->init_dir_ *= -1;
// retry_evaluate (fragment): per the generated docs, retries evaluation of
// a step until it passes a validity check. Runs `update` once, then — if
// `backoff(eval)` reports the evaluation invalid — presumably shrinks the
// step and retries (the loop body is missing from this extraction).
595template <
typename Update,
typename Proposal,
typename Curr,
typename Prev,
596 typename Eval,
typename P,
typename Backoff>
598 Prev&& prev,
Eval&
eval, P&& p, Backoff&& backoff) {
600 auto res = update(proposal, curr, prev,
eval, p);
604 if (!backoff(
eval)) {
// wolfe_line_search (fragment): strong Wolfe line search for maximization,
// per the generated docs. Large portions of the body are missing from this
// extraction; comments below describe only the visible phases and hedge
// where control flow is cut.
716template <
typename Info,
typename UpdateFun,
typename Options,
typename Stream>
718 Options&& opt, Stream* msgs) {
// Aliases into the shared WolfeInfo workspace.
719 auto& curr = wolfe_info.curr_;
720 auto& prev = wolfe_info.prev_;
721 auto& scratch = wolfe_info.scratch_;
722 auto&& p = wolfe_info.p_;
723 auto&& dir_deriv_init = wolfe_info.init_dir_;
// `low` anchors the bracket at alpha = 0 with the starting objective/slope.
724 Eval low{0.0, prev.
obj(), dir_deriv_init};
725 prev.dir() = dir_deriv_init;
726 int total_updates = 0;
// Wrapper around update_fun that counts evaluations and enforces the
// iteration budget (truncated: the over-budget handling is not visible).
728 auto update_with_tick = [&total_updates, &opt, &best, &update_fun](
729 auto&& proposal,
auto&& curr,
auto&& prev,
731 const bool over_budget = total_updates > opt.max_iterations;
735 update_fun(proposal, curr, prev, best, p);
736 curr.update(proposal, best);
745 update_fun(proposal, curr, prev,
e, p);
// Initial trial step: scaled-up previous alpha, clamped to [min, max].
751 = std::clamp(curr.alpha() * opt.scale_up, opt.min_alpha, opt.max_alpha);
752 Eval high{alpha_start, curr.
obj(), dir_deriv_init};
756 wolfe_check = update_with_tick(scratch, curr, prev, high, p);
760 if (high.alpha() < opt.min_alpha) {
// Expansion: grow the trial step until it exceeds max_alpha or a bracket
// is found (interleaving logic partially missing).
770 high.
alpha() *= opt.scale_up;
771 if (high.alpha() > opt.max_alpha) {
774 wolfe_check = update_with_tick(scratch, curr, prev, high, p);
779 wolfe_check = update_with_tick(scratch, curr, prev, best, p);
783 curr.update(scratch, best);
786 if (best.
obj() < high.obj()) {
792 int num_backtracks = 0;
// Forward-tracking loop: keep expanding while alpha < max_alpha and the
// slope at `high` is still positive (objective still rising).
803 while (high.alpha() < opt.max_alpha) {
806 wolfe_check = update_with_tick(scratch, curr, prev, high, p);
812 curr.update(scratch, high);
816 if (best.
obj() < high.obj()) {
819 if (high.dir() > 0) {
821 high.
alpha() *= opt.scale_up;
// Convergence tolerances: absolute floors with relative components scaled
// by the initial slope and the starting objective, respectively.
828 const double grad_tol
829 = std::max(opt.abs_grad_threshold,
830 opt.rel_grad_threshold * std::abs(dir_deriv_init));
832 = std::max(opt.abs_obj_threshold,
833 opt.rel_obj_threshold * (1.0 + std::abs(prev.obj())));
// Classifies an evaluation: gradient-converged, objective-converged, both,
// or step-too-small; step_ok additionally requires progress past `low`
// plus the Armijo condition.
834 auto check_bounds = [&](
auto&& curr_eval) {
836 const bool slope_check = std::abs(curr_eval.dir()) <= grad_tol;
838 const bool obj_check = std::abs(curr_eval.obj() - prev.obj()) <= obj_tol;
840 const bool alpha_check = curr_eval.alpha() < opt.min_alpha;
841 if (slope_check || obj_check || alpha_check) {
843 = curr_eval.obj() != low.obj() &&
check_armijo(curr_eval, prev, opt);
844 if (slope_check && obj_check) {
846 total_updates, num_backtracks, step_ok};
847 }
else if (slope_check) {
849 num_backtracks, step_ok};
850 }
else if (obj_check) {
852 num_backtracks, step_ok};
855 num_backtracks, step_ok};
861 auto check_b = check_bounds(high);
863 if (check_b.accept_) {
864 curr.update(scratch, high);
868 wolfe_check = update_with_tick(scratch, curr, prev, high, p);
// Zoom phase: shrink the [low, high] bracket until it collapses below
// min_alpha, choosing trial points by cubic interpolation when the bracket
// has a derivative sign change and `high` satisfies Armijo, otherwise by
// bisection.
882 while ((high.alpha() - low.alpha() > opt.min_alpha)
883 && high.alpha() > opt.min_alpha) {
885 const bool have_sign_change = (low.dir() * high.dir() < 0);
886 const bool high_armijo_ok =
check_armijo(high, prev, opt);
887 const bool use_cubic = have_sign_change && high_armijo_ok;
893 alpha_mid = 0.5 * (low.alpha() + high.alpha());
895 if (alpha_mid <= opt.min_alpha) {
898 Eval mid{alpha_mid, 0.0, 0.0};
899 auto wolfe_check = update_with_tick(scratch, curr, prev, mid, p);
903 if (mid.alpha() <= opt.min_alpha) {
905 num_backtracks,
false};
909 curr.update(scratch, mid);
// Track the best evaluation seen and narrow the bracket based on how the
// midpoint compares to `low` (bracket-update branches partially missing).
914 if (mid.obj() > best.
obj()) {
917 if (mid.obj() > low.obj()) {
932 auto bounds_check = check_bounds(mid);
934 if (bounds_check.accept_) {
935 curr.update(scratch, mid);
// Fallback on exit: if the best-seen point satisfies Armijo, re-evaluate
// and commit it as the accepted step.
942 const bool armijo_ok_best =
check_armijo(best, prev, opt);
943 if (armijo_ok_best) {
944 wolfe_check = update_with_tick(scratch, curr, prev, best, p);
945 curr.update(scratch, best);
int64_t size(const T &m)
Returns the size (number of elements) of a matrix_cl or var_value<matrix_cl<T>>.
(Expert) Numerical traits for algorithmic differentiation variables.
WolfeStatus wolfe_line_search(Info &wolfe_info, UpdateFun &&update_fun, Options &&opt, Stream *msgs)
Strong Wolfe line search for maximization.
@ ConvergedObjectiveAndGradient
auto check_wolfe_curve(double dir_deriv_next, double dir_deriv_init, Option &&opt)
auto wolfe_status_str(WolfeStatus s)
Helper function for pretty printing.
auto check_armijo(double obj_next, double obj_init, double alpha_next, double dir0, Option &&opt)
Scalar cubic_spline(Scalar x_left, Scalar f_left, Scalar df_left, Scalar x_right, Scalar f_right, Scalar df_right) noexcept
Selects a safeguarded trial point for maximizing a scalar function on a line.
bool check_wolfe(const Eval &eval, const WolfeT &prev, const Option &opt)
auto retry_evaluate(Update &&update, Proposal &&proposal, Curr &&curr, Prev &&prev, Eval &eval, P &&p, Backoff &&backoff)
Retry evaluation of a step until it passes a validity check.
static constexpr double e()
Return the base of the natural logarithm.
T eval(T &&arg)
Inputs which have a plain_type equal to their own type are forwarded unmodified (for Eigen expressions ...
Matrices and templated mathematical functions.
const auto & alpha() const
constexpr Eval(double alpha, double obj, double dir)
evaluation struct for Wolfe line search
void update(WolfeData &other, const Eval &eval)
void update(WolfeData &other)
const auto & dir() const &
const auto & theta() const &
WolfeData(Eigen::Index n)
WolfeData(ObjFun &&obj_fun, Eigen::Index n, const Theta0 &theta0, ThetaGradF &&theta_grad_f)
WolfeData(Eigen::Index n, const LLFun &ll_fun, const LLArgs &ll_args, const Msgs &msgs)
const auto & alpha() const &
WolfeData(ObjFun &&obj_fun, const Eigen::VectorXd &a, const Theta0 &theta0, ThetaGradF &&theta_grad_f)
const auto & obj() const &
void swap(WolfeData &other)
Eigen::VectorXd theta_grad_
const auto & theta_grad() const &
Data used in current evaluation of wolfe line search at a particular stepsize.
const auto & scratch() const &
const auto & prev() const &
WolfeInfo(Eigen::Index n)
const auto & curr() const &
WolfeInfo(WolfeData &&curr, WolfeData &&prev)
WolfeInfo(ObjFun &&obj_fun, AInit &&a_init, Theta0 &&theta0, ThetaGradF &&theta_grad_f)
Construct WolfeInfo with a consistent (a_init, theta_init) pair.
Data object used in wolfe line search.
WolfeStatus(WolfeReturn stop, int evals, int back)
WolfeStatus(WolfeReturn stop, int evals, int back, bool success)
Struct to hold the result status of the Wolfe line search.
double rel_grad_threshold
constexpr laplace_line_search_options(int max_iter)
double tau
Backtracking shrinkage factor.
double min_alpha
Minimum allowable step size.
double abs_grad_threshold
Absolute gradient tolerance.
double scale_up
Step size expansion factor.
double c2
Curvature condition parameter.
constexpr laplace_line_search_options()=default
double c1
Armijo condition parameter (sufficient decrease).
double max_alpha
Maximum allowable step size.
double abs_obj_threshold
Absolute objective tolerance.
Options for Wolfe line search during optimization.