1.0.0a19/Doxygen/accelerators_2lbfgs_8hpp_source.html

#pragma once


#include <alpaqa/config/config.hpp>
#include <alpaqa/export.hpp>

#include <cmath>
#include <limits>
#include <stdexcept>
#include <string>
#include <utility>
#include <vector>


namespace alpaqa {


/// Parameters of the cautious BFGS (CBFGS) update condition
/// @f[ \frac{y^\top s}{s^\top s} \ge \epsilon \| g \|^\alpha. @f]
/// @see @ref LBFGSParams::cbfgs
/// @ingroup grp_Parameters
template <Config Conf = DefaultConfig>
struct CBFGSParams {
    USING_ALPAQA_CONFIG(Conf);

    /// Exponent @f$ \alpha @f$ in the CBFGS condition.
    real_t α = 1;
    /// Factor @f$ \epsilon @f$ in the CBFGS condition.
    /// Set to zero to disable the CBFGS check.
    real_t ϵ = 0;

    /// Evaluates to true if and only if ϵ is strictly positive, i.e. if the
    /// CBFGS check is enabled.
    explicit operator bool() const { return 0 < ϵ; }
};


/// Selects how the L-BFGS step size, i.e. the initial inverse Hessian
/// approximation @f$ H_0 @f$, is determined.
enum class LBFGSStepSize {
    /// Use @f$ H_0 = \gamma I @f$, with @f$ \gamma @f$ the forward-backward
    /// splitting step size.
    BasedOnExternalStepSize = 0,
    /// Use @f$ H_0 = \frac{s^\top y}{y^\top y} I @f$.
    BasedOnCurvature = 1,
    /// Deprecated alias: has the same value as @ref BasedOnExternalStepSize.
    BasedOnGradientStepSize
    [[deprecated("use BasedOnExternalStepSize instead")]] = BasedOnExternalStepSize,
};


/// Tuning parameters of the @ref LBFGS accelerator.
/// @ingroup grp_Parameters
template <Config Conf = DefaultConfig>
struct LBFGSParams {
    USING_ALPAQA_CONFIG(Conf);

    /// Number of (s, y) pairs kept in the history.
    length_t memory = 10;

    /// Threshold factor for the curvature test: the update is rejected if
    /// @f$ y^\top s \le \text{min_div_fac} \cdot s^\top s @f$.
    /// Keeps the inverse Hessian approximation positive definite.
    real_t min_div_fac = std::numeric_limits<real_t>::epsilon();

    /// Threshold for the step length test: the update is rejected if
    /// @f$ s^\top s \le \text{min_abs_s} @f$.
    /// Keeps the Hessian approximation nonsingular.
    /// Defaults to the square of the machine epsilon of `real_t`.
    real_t min_abs_s =
        std::pow(std::numeric_limits<real_t>::epsilon(), real_t(2));

    /// Parameters of the cautious BFGS update condition
    /// @f[ \frac{y^\top s}{s^\top s} \ge \epsilon \| g \|^\alpha. @f]
    /// Disabled by default (the default-constructed parameters have ϵ = 0).
    /// @see https://epubs.siam.org/doi/10.1137/S1052623499354242
    CBFGSParams<config_t> cbfgs{};

    /// When true, the inverse Hessian estimate should remain definite: the
    /// update is rejected if
    /// @f$ y^\top s \le \text{min_div_fac} \cdot s^\top s @f$.
    /// When false, only try to prevent a singular Hessian, by rejecting the
    /// update if
    /// @f$ \left| y^\top s \right| \le \text{min_div_fac} \cdot s^\top s @f$.
    bool force_pos_def = true;

    /// Scale of the initial inverse Hessian approximation @f$ H_0 @f$ that
    /// the rank-one L-BFGS updates are applied to.
    /// You probably want to keep this as the default.
    /// @see LBFGSStepSize
    LBFGSStepSize stepsize = LBFGSStepSize::BasedOnCurvature;
};


/// Column-major buffer holding the L-BFGS history. Each history entry `i`
/// occupies two adjacent columns: column `2 i` stores the vector s with the
/// scalar ρ in the extra last row, column `2 i + 1` stores the vector y with
/// the scalar α in the extra last row.
///
/// Layout:
/// ~~~
///       ┌───── 2 m ─────┐
///     ┌ ┌───┬───┬───┬───┐
///     │ │   │   │   │   │
///     │ │ s │ y │ s │ y │
/// n+1 │ │   │   │   │   │
///     │ ├───┼───┼───┼───┤
///     │ │ ρ │ α │ ρ │ α │
///     └ └───┴───┴───┴───┘
/// ~~~
template <Config Conf = DefaultConfig>
struct LBFGSStorage {
    USING_ALPAQA_CONFIG(Conf);

    using storage_t = mat;
    static_assert(!storage_t::IsRowMajor);
    /// The underlying matrix. Declared mutable so that the const overloads of
    /// ρ and α can hand out writable references.
    mutable storage_t sto;

    /// Re-allocate storage for a problem with a different size.
    void resize(length_t n, length_t history);

    /// Get the size of the s and y vectors in the buffer (one less than the
    /// number of rows, since the last row holds ρ and α).
    length_t n() const { return sto.rows() - 1; }
    /// Get the number of previous vectors s and y stored in the buffer (half
    /// the number of columns).
    length_t history() const { return sto.cols() / 2; }

    /// Mutable view of the i-th s vector (top n rows of column 2 i).
    auto s(index_t i) {
        const auto column = 2 * i;
        return sto.col(column).topRows(n());
    }
    /// Read-only view of the i-th s vector.
    auto s(index_t i) const {
        const storage_t &ro = sto;
        return ro.col(2 * i).topRows(n());
    }

    /// Mutable view of the i-th y vector (top n rows of column 2 i + 1).
    auto y(index_t i) {
        const auto column = 2 * i + 1;
        return sto.col(column).topRows(n());
    }
    /// Read-only view of the i-th y vector.
    auto y(index_t i) const {
        const storage_t &ro = sto;
        return ro.col(2 * i + 1).topRows(n());
    }

    /// Reference to the scalar ρ of entry i (last row of column 2 i).
    real_t &ρ(index_t i) {
        const auto last_row = n();
        return sto.coeffRef(last_row, 2 * i);
    }
    /// Same as the non-const overload: returns a writable reference even on
    /// a const object.
    real_t &ρ(index_t i) const {
        const auto last_row = n();
        return sto.coeffRef(last_row, 2 * i);
    }
    /// Reference to the scalar α of entry i (last row of column 2 i + 1).
    real_t &α(index_t i) {
        const auto last_row = n();
        return sto.coeffRef(last_row, 2 * i + 1);
    }
    /// Same as the non-const overload: returns a writable reference even on
    /// a const object.
    real_t &α(index_t i) const {
        const auto last_row = n();
        return sto.coeffRef(last_row, 2 * i + 1);
    }
};


/// Limited memory Broyden–Fletcher–Goldfarb–Shanno (L-BFGS) algorithm
/// @ingroup grp_Accelerators
template <Config Conf = DefaultConfig>
class LBFGS {
  public:
    USING_ALPAQA_CONFIG(Conf);

    using Params = LBFGSParams<config_t>;

    /// The sign of the vectors @f$ p @f$ passed to the @ref update method.
    enum class Sign {
        Positive, ///< @f$ p \sim \nabla \psi(x) @f$
        Negative, ///< @f$ p \sim -\nabla \psi(x) @f$
    };

    /// Default parameters, no storage allocated.
    LBFGS() = default;
    /// Store the given parameters, no storage allocated.
    LBFGS(Params params) : params(params) {}
    /// Store the given parameters and call @ref resize for vectors of size n.
    LBFGS(Params params, length_t n) : params(params) { resize(n); }

    /// Check if the new vectors s and y allow for a valid BFGS update that
    /// preserves the positive definiteness of the Hessian approximation.
    static bool update_valid(const Params &params, real_t yᵀs, real_t sᵀs,
                             real_t pᵀp);

    /// Update the inverse Hessian approximation using the new vectors
    /// sₖ = xₙₑₓₜ - xₖ and yₖ = pₙₑₓₜ - pₖ.
    bool update_sy(crvec s, crvec y, real_t pₙₑₓₜᵀpₙₑₓₜ, bool forced = false);
    /// @see @ref update_sy
    bool update_sy_impl(const auto &s, const auto &y, real_t pₙₑₓₜᵀpₙₑₓₜ,
                        bool forced = false);

    /// Update the inverse Hessian approximation using the new vectors xₙₑₓₜ
    /// and pₙₑₓₜ.
    bool update(crvec xₖ, crvec xₙₑₓₜ, crvec pₖ, crvec pₙₑₓₜ,
                Sign sign = Sign::Positive, bool forced = false);

    /// Apply the inverse Hessian approximation to the given vector q.
    /// Initial inverse Hessian approximation is set to @f$ H_0 = \gamma I @f$.
    /// If @p γ is negative, @f$ H_0 = \frac{s^\top y}{y^\top y} I @f$.
    bool apply(rvec q, real_t γ = -1) const;

    /// Apply the inverse Hessian approximation to the given vector q, applying
    /// only the columns and rows of the Hessian in the index set J.
    bool apply_masked(rvec q, real_t γ, crindexvec J) const;
    /// @copydoc apply_masked(rvec, real_t, crindexvec) const
    bool apply_masked(rvec q, real_t γ, const std::vector<index_t> &J) const;
    /// @copydoc apply_masked(rvec, real_t, crindexvec) const
    bool apply_masked_impl(rvec q, real_t γ, const auto &J) const;

    /// Throw away the approximation and all previous vectors s and y.
    void reset();
    /// Re-allocate storage for a problem with a different size. Causes
    /// a @ref reset.
    void resize(length_t n);

    /// Scale the stored y vectors by the given factor.
    void scale_y(real_t factor);

    /// Get a string identifier for this accelerator, of the form
    /// `LBFGS<config-name>`.
    std::string get_name() const {
        std::string name = "LBFGS<";
        name += std::string(config_t::get_name());
        name += '>';
        return name;
    }

    /// Get the parameters.
    const Params &get_params() const { return params; }

    /// Get the size of the s and y vectors in the buffer.
    length_t n() const { return sto.n(); }
    /// Get the number of previous vectors s and y stored in the buffer.
    length_t history() const { return sto.history(); }
    /// Get the next index in the circular buffer of previous s and y vectors
    /// (wraps around to zero past the last slot).
    index_t succ(index_t i) const {
        const auto next = i + 1;
        if (next < history())
            return next;
        return 0;
    }
    /// Get the previous index in the circular buffer of s and y vectors
    /// (wraps around to the last slot before zero).
    index_t pred(index_t i) const {
        if (i > 0)
            return i - 1;
        return history() - 1;
    }
    /// Get the number of previous s and y vectors currently stored in the
    /// buffer.
    length_t current_history() const {
        if (full)
            return history();
        return idx;
    }

    /// @name Access to the stored vectors and scalars of history entry i
    /// (forwarded to the underlying storage).
    /// @{
    auto s(index_t i) { return sto.s(i); }
    auto s(index_t i) const { return sto.s(i); }
    auto y(index_t i) { return sto.y(i); }
    auto y(index_t i) const { return sto.y(i); }
    real_t &ρ(index_t i) { return sto.ρ(i); }
    real_t &ρ(index_t i) const { return sto.ρ(i); }
    real_t &α(index_t i) { return sto.α(i); }
    real_t &α(index_t i) const { return sto.α(i); }
    /// @}

    /// Iterate over the indices in the history buffer, oldest first:
    /// when the buffer is full, first the slots from `idx` up to the end,
    /// then the slots before `idx`.
    template <class F>
    void foreach_fwd(const F &fun) const {
        if (full) {
            index_t i = idx;
            while (i < history()) {
                fun(i);
                ++i;
            }
        }
        // Runs zero times when idx is zero.
        for (index_t i = 0; i < idx; ++i)
            fun(i);
    }

    /// Iterate over the indices in the history buffer, newest first:
    /// first the slots before `idx` in decreasing order, then, when the
    /// buffer is full, the slots from the end down to `idx`.
    template <class F>
    void foreach_rev(const F &fun) const {
        // Runs zero times when idx is zero.
        index_t i = idx;
        while (i-- > 0)
            fun(i);
        if (full) {
            index_t j = history();
            while (j-- > idx)
                fun(j);
        }
    }

  private:
    /// Buffer holding the s and y vectors and the scalars ρ and α.
    LBFGSStorage<config_t> sto;
    /// Position in the circular buffer: the number of stored entries while
    /// the buffer is not full, and the oldest entry once it is full.
    index_t idx = 0;
    /// Whether every slot of the buffer holds a valid entry.
    bool full = false;
    Params params;
};


/// Get the name of the given @ref LBFGSStepSize value as a string.
/// @param s The enumerator to convert.
/// @return  A string literal equal to the name of the enumerator
///          (`BasedOnExternalStepSize` or `BasedOnCurvature`).
/// @throws std::out_of_range if @p s is not one of the named values.
inline constexpr const char *enum_name(LBFGSStepSize s) {
    // Deliberately no `default` label: this lets the compiler warn about
    // enumerators that are added later but not handled here. Values without
    // a matching case fall through to the throw below.
    switch (s) {
        case LBFGSStepSize::BasedOnExternalStepSize:
            return "BasedOnExternalStepSize";
        case LBFGSStepSize::BasedOnCurvature: return "BasedOnCurvature";
    }
    throw std::out_of_range("invalid value for alpaqa::LBFGSStepSize");
}


// NOTE(review): these presumably declare explicit (extern) template
// instantiations of CBFGSParams, LBFGSParams and LBFGS for each enabled
// configuration (double always; float, long double and quad precision only
// when the corresponding ALPAQA_IF_* macro expands its argument). The macros
// are defined in export.hpp and config.hpp, which are not visible here, so
// confirm there. LBFGSStorage has no such declaration.
// clang-format off

ALPAQA_EXPORT_EXTERN_TEMPLATE(struct, CBFGSParams, EigenConfigd);

ALPAQA_IF_FLOAT(ALPAQA_EXPORT_EXTERN_TEMPLATE(struct, CBFGSParams, EigenConfigf);)

ALPAQA_IF_LONGD(ALPAQA_EXPORT_EXTERN_TEMPLATE(struct, CBFGSParams, EigenConfigl);)

ALPAQA_IF_QUADF(ALPAQA_EXPORT_EXTERN_TEMPLATE(struct, CBFGSParams, EigenConfigq);)


ALPAQA_EXPORT_EXTERN_TEMPLATE(struct, LBFGSParams, EigenConfigd);

ALPAQA_IF_FLOAT(ALPAQA_EXPORT_EXTERN_TEMPLATE(struct, LBFGSParams, EigenConfigf);)

ALPAQA_IF_LONGD(ALPAQA_EXPORT_EXTERN_TEMPLATE(struct, LBFGSParams, EigenConfigl);)

ALPAQA_IF_QUADF(ALPAQA_EXPORT_EXTERN_TEMPLATE(struct, LBFGSParams, EigenConfigq);)


ALPAQA_EXPORT_EXTERN_TEMPLATE(class, LBFGS, EigenConfigd);

ALPAQA_IF_FLOAT(ALPAQA_EXPORT_EXTERN_TEMPLATE(class, LBFGS, EigenConfigf);)

ALPAQA_IF_LONGD(ALPAQA_EXPORT_EXTERN_TEMPLATE(class, LBFGS, EigenConfigl);)

ALPAQA_IF_QUADF(ALPAQA_EXPORT_EXTERN_TEMPLATE(class, LBFGS, EigenConfigq);)

// clang-format on


} // namespace alpaqa

alpaqa::LBFGS
Limited memory Broyden–Fletcher–Goldfarb–Shanno (L-BFGS) algorithm.
Definition lbfgs.hpp:117

alpaqa::LBFGS::params
Params params
Definition lbfgs.hpp:226

alpaqa::LBFGS::get_name
std::string get_name() const
Get a string identifier for this accelerator.
Definition lbfgs.hpp:173

alpaqa::LBFGS::foreach_rev
void foreach_rev(const F &fun) const
Iterate over the indices in the history buffer, newest first.
Definition lbfgs.hpp:213

alpaqa::LBFGS::s
auto s(index_t i)
Definition lbfgs.hpp:191

alpaqa::LBFGS::apply_masked
bool apply_masked(rvec q, real_t γ, crindexvec J) const
Apply the inverse Hessian approximation to the given vector q, applying only the columns and rows of the Hessian in the index set J.
Definition lbfgs.tpp:196

alpaqa::LBFGS::full
bool full
Definition lbfgs.hpp:225

alpaqa::LBFGS::s
auto s(index_t i) const
Definition lbfgs.hpp:192

alpaqa::LBFGS::current_history
length_t current_history() const
Get the number of previous s and y vectors currently stored in the buffer.
Definition lbfgs.hpp:189

alpaqa::LBFGS::LBFGS
LBFGS()=default

alpaqa::LBFGS::Params
LBFGSParams< config_t > Params
Definition lbfgs.hpp:121

alpaqa::LBFGS::succ
index_t succ(index_t i) const
Get the next index in the circular buffer of previous s and y vectors.
Definition lbfgs.hpp:184

alpaqa::LBFGS::pred
index_t pred(index_t i) const
Get the previous index in the circular buffer of s and y vectors.
Definition lbfgs.hpp:186

alpaqa::LBFGS::n
length_t n() const
Get the size of the s and y vectors in the buffer.
Definition lbfgs.hpp:180

alpaqa::LBFGS::LBFGS
LBFGS(Params params, length_t n)
Definition lbfgs.hpp:131

alpaqa::LBFGS::LBFGS
LBFGS(Params params)
Definition lbfgs.hpp:130

alpaqa::LBFGS::sto
LBFGSStorage< config_t > sto
Definition lbfgs.hpp:223

alpaqa::LBFGS::get_params
const Params & get_params() const
Get the parameters.
Definition lbfgs.hpp:177

alpaqa::LBFGS::history
length_t history() const
Get the number of previous vectors s and y stored in the buffer.
Definition lbfgs.hpp:182

alpaqa::LBFGS::foreach_fwd
void foreach_fwd(const F &fun) const
Iterate over the indices in the history buffer, oldest first.
Definition lbfgs.hpp:202

alpaqa::LBFGS::idx
index_t idx
Definition lbfgs.hpp:224

alpaqa::LBFGS::α
real_t & α(index_t i) const
Definition lbfgs.hpp:198

alpaqa::LBFGS::update_sy
bool update_sy(crvec s, crvec y, real_t pₙₑₓₜᵀpₙₑₓₜ, bool forced=false)
Update the inverse Hessian approximation using the new vectors sₖ = xₙₑₓₜ - xₖ and yₖ = pₙₑₓₜ - pₖ.
Definition lbfgs.tpp:60

alpaqa::LBFGS::ρ
real_t & ρ(index_t i) const
Definition lbfgs.hpp:196

alpaqa::LBFGS::update_valid
static bool update_valid(const Params &params, real_t yᵀs, real_t sᵀs, real_t pᵀp)
Check if the new vectors s and y allow for a valid BFGS update that preserves the positive definiteness of the Hessian approximation.
Definition lbfgs.tpp:12

alpaqa::LBFGS::apply_masked_impl
bool apply_masked_impl(rvec q, real_t γ, const auto &J) const
Apply the inverse Hessian approximation to the given vector q, applying only the columns and rows of the Hessian in the index set J.
Definition lbfgs.tpp:103

alpaqa::LBFGS::resize
void resize(length_t n)
Re-allocate storage for a problem with a different size.
Definition lbfgs.tpp:213

alpaqa::LBFGS::α
real_t & α(index_t i)
Definition lbfgs.hpp:197

alpaqa::LBFGS::ρ
real_t & ρ(index_t i)
Definition lbfgs.hpp:195

alpaqa::LBFGS::reset
void reset()
Throw away the approximation and all previous vectors s and y.
Definition lbfgs.tpp:207

alpaqa::LBFGS::update_sy_impl
bool update_sy_impl(const auto &s, const auto &y, real_t pₙₑₓₜᵀpₙₑₓₜ, bool forced=false)
Definition lbfgs.tpp:37

alpaqa::LBFGS::y
auto y(index_t i) const
Definition lbfgs.hpp:194

alpaqa::LBFGS::Sign
Sign
The sign of the vectors $p$ passed to the update method.
Definition lbfgs.hpp:124

alpaqa::LBFGS::Sign::Positive
@ Positive

alpaqa::LBFGS::Sign::Negative
@ Negative

alpaqa::LBFGS::apply
bool apply(rvec q, real_t γ=-1) const
Apply the inverse Hessian approximation to the given vector q.
Definition lbfgs.tpp:74

alpaqa::LBFGS::scale_y
void scale_y(real_t factor)
Scale the stored y vectors by the given factor.
Definition lbfgs.tpp:226

alpaqa::LBFGS::update
bool update(crvec xₖ, crvec xₙₑₓₜ, crvec pₖ, crvec pₙₑₓₜ, Sign sign=Sign::Positive, bool forced=false)
Update the inverse Hessian approximation using the new vectors xₙₑₓₜ and pₙₑₓₜ.
Definition lbfgs.tpp:65

alpaqa::LBFGS::y
auto y(index_t i)
Definition lbfgs.hpp:193

config.hpp

USING_ALPAQA_CONFIG
#define USING_ALPAQA_CONFIG(Conf)
Definition config.hpp:77

ALPAQA_IF_QUADF
#define ALPAQA_IF_QUADF(...)
Definition config.hpp:221

ALPAQA_IF_LONGD
#define ALPAQA_IF_LONGD(...)
Definition config.hpp:233

ALPAQA_IF_FLOAT
#define ALPAQA_IF_FLOAT(...)
Definition config.hpp:227

export.hpp

ALPAQA_EXPORT_EXTERN_TEMPLATE
#define ALPAQA_EXPORT_EXTERN_TEMPLATE(...)
Definition export.hpp:21

alpaqa::LBFGSParams::min_abs_s
real_t min_abs_s
Reject update if $s^\top s \le \text{min\_abs\_s}$.
Definition lbfgs.hpp:52

alpaqa::LBFGSParams::memory
length_t memory
Length of the history to keep.
Definition lbfgs.hpp:46

alpaqa::LBFGSParams::stepsize
LBFGSStepSize stepsize
Scale of the initial inverse Hessian approximation that the rank-one L-BFGS updates are applied to, $H_0$.
Definition lbfgs.hpp:70

alpaqa::LBFGSParams::cbfgs
CBFGSParams< config_t > cbfgs
Parameters in the cautious BFGS update condition.
Definition lbfgs.hpp:58

alpaqa::LBFGSParams::force_pos_def
bool force_pos_def
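If set to true, the inverse Hessian estimate should remain definite, i.e. a check is performed that rejects the update if $y^\top s \le \text{min\_div\_fac} \cdot s^\top s$.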
Definition lbfgs.hpp:65

alpaqa::LBFGSParams::min_div_fac
real_t min_div_fac
Reject update if $y^\top s \le \text{min\_div\_fac} \cdot s^\top s$.
Definition lbfgs.hpp:49

alpaqa::LBFGSParams
Parameters for the LBFGS class.
Definition lbfgs.hpp:42

alpaqa
Definition anderson.hpp:10

alpaqa::mat
typename Conf::mat mat
Definition config.hpp:93

alpaqa::real_t
typename Conf::real_t real_t
Definition config.hpp:86

alpaqa::index_t
typename Conf::index_t index_t
Definition config.hpp:104

alpaqa::length_t
typename Conf::length_t length_t
Definition config.hpp:103

alpaqa::inf
constexpr const auto inf
Definition config.hpp:112

alpaqa::rvec
typename Conf::rvec rvec
Definition config.hpp:91

alpaqa::crvec
typename Conf::crvec crvec
Definition config.hpp:92

alpaqa::enum_name
constexpr const char * enum_name(LBFGSStepSize s)
Definition lbfgs.hpp:229

alpaqa::LBFGSStepSize
LBFGSStepSize
Which method to use to select the L-BFGS step size.
Definition lbfgs.hpp:26

alpaqa::LBFGSStepSize::BasedOnGradientStepSize
@ BasedOnGradientStepSize

alpaqa::LBFGSStepSize::BasedOnCurvature
@ BasedOnCurvature
Initial inverse Hessian approximation is set to $H_0 = \frac{s^\top y}{y^\top y} I$.

alpaqa::LBFGSStepSize::BasedOnExternalStepSize
@ BasedOnExternalStepSize
Initial inverse Hessian approximation is set to $H_0 = \gamma I$, where $\gamma$ is the forward-backward splitting step size.

alpaqa::crindexvec
typename Conf::crindexvec crindexvec
Definition config.hpp:107

alpaqa::LBFGSParams< config_t >

alpaqa::CBFGSParams
Cautious BFGS update.
Definition lbfgs.hpp:18

alpaqa::CBFGSParams::α
real_t α
Definition lbfgs.hpp:20

alpaqa::CBFGSParams::ϵ
real_t ϵ
Set to zero to disable CBFGS check.
Definition lbfgs.hpp:21

alpaqa::LBFGSStorage
Layout:
Definition lbfgs.hpp:85

alpaqa::LBFGSStorage::storage_t
mat storage_t
Definition lbfgs.hpp:109

alpaqa::LBFGSStorage::s
auto s(index_t i)
Definition lbfgs.hpp:96

alpaqa::LBFGSStorage::s
auto s(index_t i) const
Definition lbfgs.hpp:97

alpaqa::LBFGSStorage::resize
void resize(length_t n, length_t history)
Re-allocate storage for a problem with a different size.
Definition lbfgs.tpp:221

alpaqa::LBFGSStorage::n
length_t n() const
Get the size of the s and y vectors in the buffer.
Definition lbfgs.hpp:92

alpaqa::LBFGSStorage::history
length_t history() const
Get the number of previous vectors s and y stored in the buffer.
Definition lbfgs.hpp:94

alpaqa::LBFGSStorage::α
real_t & α(index_t i) const
Definition lbfgs.hpp:107

alpaqa::LBFGSStorage::ρ
real_t & ρ(index_t i) const
Definition lbfgs.hpp:105

alpaqa::LBFGSStorage::α
real_t & α(index_t i)
Definition lbfgs.hpp:106

alpaqa::LBFGSStorage::ρ
real_t & ρ(index_t i)
Definition lbfgs.hpp:104

alpaqa::LBFGSStorage::y
auto y(index_t i) const
Definition lbfgs.hpp:101

alpaqa::LBFGSStorage::sto
storage_t sto
Definition lbfgs.hpp:111

alpaqa::LBFGSStorage::y
auto y(index_t i)
Definition lbfgs.hpp:100