0.0.1/Doxygen/decl_2lbfgs_8hpp_source.html

#pragma once


#include <alpaqa/util/box.hpp>

#include <alpaqa/util/vec.hpp>


#include <alpaqa/inner/directions/decl/lbfgs-fwd.hpp>

#include <alpaqa/inner/directions/decl/panoc-direction-update.hpp>


namespace alpaqa {


/// Parameters for the @ref LBFGS and @ref SpecializedLBFGS classes.

struct LBFGSParams {

    /// Length of the history to keep.

    unsigned memory = 10;

    // Anonymous struct grouping the two scalars of the cautious BFGS condition;
    // its Doxygen documentation is attached to the `cbfgs` declarator below.
    struct {

        /// Exponent @f$ \alpha @f$ applied to @f$ \| g \| @f$ in the cautious
        /// BFGS condition documented on `cbfgs`.

        real_t α = 1;

        /// Factor @f$ \epsilon @f$ multiplying @f$ \| g \|^\alpha @f$ in the
        /// cautious BFGS condition documented on `cbfgs`. With the default
        /// value 0 the right-hand side of that inequality is zero.

        real_t ϵ = 0;

    }

    /// Parameters in the cautious BFGS update condition

    /// @f[ \frac{y^\top s}{s^\top s} \ge \epsilon \| g \|^\alpha @f]

    /// @see https://epubs.siam.org/doi/10.1137/S1052623499354242

    cbfgs;


    // NOTE(review): presumably selects whether the stored L-BFGS vectors are
    // rescaled when the step size γ changes (cf. LBFGS::scale_y and
    // PANOCDirection<LBFGS>::changed_γ); the code that reads this flag is not
    // part of this header — confirm against the implementation.
    bool rescale_when_γ_changes = false;

};


/// Limited memory Broyden–Fletcher–Goldfarb–Shanno (L-BFGS) algorithm

/// @ingroup  grp_PANOCDirectionProviders

class LBFGS {
  public:
    using Params = LBFGSParams;

    /// Tells @ref LBFGS::update whether the vectors @f$ p @f$ it receives
    /// point along the gradient or against it.
    enum class Sign {
        Positive, ///< @f$ p \sim \nabla \psi(x) @f$
        Negative, ///< @f$ p \sim -\nabla \psi(x) @f$
    };

    /// Construct from parameters only. @ref resize is not called here, so it
    /// has to be called before the buffer is used.
    LBFGS(Params params) : params(params) {}

    /// Construct from parameters and immediately call @ref resize with the
    /// problem dimension @p n.
    LBFGS(Params params, size_t n) : params(params) {
        resize(n);
    }

    /// Decide whether a candidate pair (s, y) gives a valid BFGS update, i.e.
    /// one that keeps the Hessian approximation positive definite.
    /// @param params Parameters, including the cautious BFGS settings.
    /// @param yᵀs    Inner product of y and s.
    /// @param sᵀs    Squared norm of s.
    /// @param pᵀp    Squared norm of p.
    static bool update_valid(LBFGSParams params, real_t yᵀs, real_t sᵀs,
                             real_t pᵀp);

    /// Feed the new iterate xₖ₊₁ and vector pₖ₊₁ (together with the previous
    /// xₖ and pₖ) into the inverse Hessian approximation.
    /// @param sign   Sign convention of the vectors p, see @ref Sign.
    /// @param forced NOTE(review): presumably bypasses the validity check;
    ///               the definition is not in this header — confirm.
    bool update(crvec xₖ, crvec xₖ₊₁, crvec pₖ, crvec pₖ₊₁,
                Sign sign, bool forced = false);

    /// Multiply the vector q by the inverse Hessian approximation.
    template <class Vec>
    bool apply(Vec &&q, real_t γ);

    /// Multiply the vector q by the inverse Hessian approximation, restricted
    /// to the rows and columns of the Hessian listed in the index set J.
    template <class Vec, class IndexVec>
    bool apply(Vec &&q, real_t γ, const IndexVec &J);

    /// Discard the approximation together with all stored vectors s and y.
    void reset();

    /// Re-allocate the storage for a problem of a different size. Causes
    /// a @ref reset.
    void resize(size_t n);

    /// Multiply every stored y vector by the given factor.
    void scale_y(real_t factor);

    /// Name of this direction provider: always the string "LBFGS".
    std::string get_name() const {
        return "LBFGS";
    }

    /// Read-only access to the parameters this object was constructed with.
    const Params &get_params() const {
        return params;
    }

    /// Length of the s and y vectors in the buffer: the storage has one row
    /// more than that (the extra row holds the scalars ρ and α).
    size_t n() const {
        return sto.rows() - 1;
    }

    /// Number of (s, y) pairs the buffer has room for: each pair takes up two
    /// columns of the storage.
    size_t history() const {
        return sto.cols() / 2;
    }

    /// Index following @p i in the circular buffer of s and y vectors,
    /// wrapping around to 0 at the end of the history.
    size_t succ(size_t i) const {
        const size_t next = i + 1;
        return next < history() ? next : 0;
    }

    /// Vector s of pair @p i: the top n() entries of storage column 2i.
    auto s(size_t i) {
        return sto.col(2 * i).topRows(n());
    }
    /// Read-only counterpart of @ref s.
    auto s(size_t i) const {
        return sto.col(2 * i).topRows(n());
    }

    /// Vector y of pair @p i: the top n() entries of storage column 2i + 1.
    auto y(size_t i) {
        return sto.col(2 * i + 1).topRows(n());
    }
    /// Read-only counterpart of @ref y.
    auto y(size_t i) const {
        return sto.col(2 * i + 1).topRows(n());
    }

    /// Scalar ρ of pair @p i, kept in the last storage row below s(i).
    // NOTE(review): presumably 1/(yᵀs) as in the usual two-loop recursion;
    // the code that writes it is not in this header — confirm.
    real_t &ρ(size_t i) {
        const size_t last_row = n();
        const size_t s_column = 2 * i;
        return sto.coeffRef(last_row, s_column);
    }
    /// Read-only counterpart of @ref ρ.
    const real_t &ρ(size_t i) const {
        const size_t last_row = n();
        const size_t s_column = 2 * i;
        return sto.coeff(last_row, s_column);
    }

    /// Scalar α of pair @p i, kept in the last storage row below y(i).
    real_t &α(size_t i) {
        const size_t last_row = n();
        const size_t y_column = 2 * i + 1;
        return sto.coeffRef(last_row, y_column);
    }
    /// Read-only counterpart of @ref α.
    const real_t &α(size_t i) const {
        const size_t last_row = n();
        const size_t y_column = 2 * i + 1;
        return sto.coeff(last_row, y_column);
    }

  private:
    using storage_t = Eigen::Matrix<real_t, Eigen::Dynamic, Eigen::Dynamic>;

    /// Backing matrix with n() + 1 rows and 2 · history() columns. Column 2i
    /// holds s(i) with ρ(i) underneath, column 2i + 1 holds y(i) with α(i)
    /// underneath.
    storage_t sto;
    // NOTE(review): presumably the current position in the circular buffer;
    // it is only declared here — confirm in the implementation.
    size_t idx = 0;
    // NOTE(review): presumably set once the buffer has wrapped around;
    // it is only declared here — confirm in the implementation.
    bool full = false;
    /// Parameters supplied at construction.
    Params params;
};


/// Specialization of @ref PANOCDirection for the @ref LBFGS direction provider.
/// It owns an LBFGS instance and declares the direction-provider operations
/// as non-static members; their definitions are not part of this header.
template <>

struct PANOCDirection<LBFGS> {

    /// The wrapped L-BFGS object.

    LBFGS lbfgs;

    /// Build the wrapped LBFGS from parameters only (LBFGS::resize is not
    /// called by that constructor).

    PANOCDirection(const LBFGSParams &params) : lbfgs(params) {}

    /// Copy an existing LBFGS object into this direction provider.

    PANOCDirection(const LBFGS &lbfgs) : lbfgs(lbfgs) {}

    /// Move an existing LBFGS object into this direction provider.

    PANOCDirection(LBFGS &&lbfgs) : lbfgs(std::move(lbfgs)) {}


    /// Set up the direction provider from the initial point x₀, the point x̂₀,
    /// the vector p₀ and the gradient grad₀.
    // NOTE(review): presumably sizes/resets the wrapped LBFGS for the
    // dimension of x₀ — definition not visible here, confirm.

    void initialize(crvec x₀, crvec x̂₀, crvec p₀,

                    crvec grad₀);

    /// Update the direction provider with the previous and new iterates and
    /// p vectors, the new gradient, the box C and the new step size.
    // NOTE(review): presumably forwards to LBFGS::update and returns its
    // result — definition not visible here, confirm.

    bool update(crvec xₖ, crvec xₖ₊₁, crvec pₖ, crvec pₖ₊₁,

                crvec grad_new, const Box &C, real_t γ_new);

    /// Apply the direction estimation in the current point; qₖ is the only
    /// mutable vector argument (rvec), the others are immutable (crvec).

    bool apply(crvec xₖ, crvec x̂ₖ, crvec pₖ, real_t γ, rvec qₖ);

    /// Notify the direction provider that the step size changed from
    /// old_γₖ to γₖ.
    // NOTE(review): presumably either rescales the stored y vectors or
    // resets the buffer depending on LBFGSParams::rescale_when_γ_changes —
    // definition not visible here, confirm.

    void changed_γ(real_t γₖ, real_t old_γₖ);

    /// Reset the direction provider.
    // NOTE(review): presumably forwards to LBFGS::reset — confirm.

    void reset();

    /// Name of the direction provider.
    // NOTE(review): presumably forwards to LBFGS::get_name — confirm.

    std::string get_name() const;

    /// Parameters of the direction provider, returned by value.

    LBFGSParams get_params() const;

};


} // namespace alpaqa

box.hpp

alpaqa::LBFGS
Limited memory Broyden–Fletcher–Goldfarb–Shanno (L-BFGS) algorithm.
Definition: decl/lbfgs.hpp:29

alpaqa::LBFGS::s
auto s(size_t i) const
Definition: decl/lbfgs.hpp:83

alpaqa::LBFGS::params
Params params
Definition: decl/lbfgs.hpp:97

alpaqa::LBFGS::get_name
std::string get_name() const
Definition: decl/lbfgs.hpp:71

alpaqa::LBFGS::succ
size_t succ(size_t i) const
Get the next index in the circular buffer of previous s and y vectors.
Definition: decl/lbfgs.hpp:80

alpaqa::LBFGS::idx
size_t idx
Definition: decl/lbfgs.hpp:95

alpaqa::LBFGS::full
bool full
Definition: decl/lbfgs.hpp:96

alpaqa::LBFGS::y
auto y(size_t i) const
Definition: decl/lbfgs.hpp:85

alpaqa::LBFGS::apply
bool apply(Vec &&q, real_t γ)
Apply the inverse Hessian approximation to the given vector q.
Definition: lbfgs.hpp:59

alpaqa::LBFGS::update
bool update(crvec xₖ, crvec xₖ₊₁, crvec pₖ, crvec pₖ₊₁, Sign sign, bool forced=false)
Update the inverse Hessian approximation using the new vectors xₖ₊₁ and pₖ₊₁.
Definition: lbfgs.hpp:33

alpaqa::LBFGS::resize
void resize(size_t n)
Re-allocate storage for a problem with a different size.
Definition: lbfgs.hpp:188

alpaqa::LBFGS::history
size_t history() const
Get the number of previous vectors s and y stored in the buffer.
Definition: decl/lbfgs.hpp:78

alpaqa::LBFGS::s
auto s(size_t i)
Definition: decl/lbfgs.hpp:82

alpaqa::LBFGS::storage_t
Eigen::Matrix< real_t, Eigen::Dynamic, Eigen::Dynamic > storage_t
Definition: decl/lbfgs.hpp:92

alpaqa::LBFGS::α
real_t & α(size_t i)
Definition: decl/lbfgs.hpp:88

alpaqa::LBFGS::LBFGS
LBFGS(Params params)
Definition: decl/lbfgs.hpp:40

alpaqa::LBFGS::get_params
const Params & get_params() const
Definition: decl/lbfgs.hpp:73

alpaqa::LBFGS::update_valid
static bool update_valid(LBFGSParams params, real_t yᵀs, real_t sᵀs, real_t pᵀp)
Check if the new vectors s and y allow for a valid BFGS update that preserves the positive definiteness of the Hessian approximation.
Definition: lbfgs.hpp:9

alpaqa::LBFGS::y
auto y(size_t i)
Definition: decl/lbfgs.hpp:84

alpaqa::LBFGS::n
size_t n() const
Get the size of the s and y vectors in the buffer.
Definition: decl/lbfgs.hpp:76

alpaqa::LBFGS::α
const real_t & α(size_t i) const
Definition: decl/lbfgs.hpp:89

alpaqa::LBFGS::reset
void reset()
Throw away the approximation and all previous vectors s and y.
Definition: lbfgs.hpp:183

alpaqa::LBFGS::sto
storage_t sto
Definition: decl/lbfgs.hpp:94

alpaqa::LBFGS::Sign
Sign
The sign of the vectors p passed to the LBFGS::update method.
Definition: decl/lbfgs.hpp:35

alpaqa::LBFGS::Sign::Positive
@ Positive

alpaqa::LBFGS::Sign::Negative
@ Negative

alpaqa::LBFGS::scale_y
void scale_y(real_t factor)
Scale the stored y vectors by the given factor.
Definition: lbfgs.hpp:195

alpaqa::LBFGS::ρ
real_t & ρ(size_t i)
Definition: decl/lbfgs.hpp:86

alpaqa::LBFGS::ρ
const real_t & ρ(size_t i) const
Definition: decl/lbfgs.hpp:87

alpaqa::LBFGS::LBFGS
LBFGS(Params params, size_t n)
Definition: decl/lbfgs.hpp:41

lbfgs-fwd.hpp

alpaqa.test.params
params
Definition: test.py:275

alpaqa.test.C
C
Definition: test.py:262

alpaqa.test.α
α
Definition: test.py:33

alpaqa
Definition: __init__.py:1

alpaqa::crvec
Eigen::Ref< const vec > crvec
Default type for immutable references to vectors.
Definition: vec.hpp:18

alpaqa::LBFGSParams::rescale_when_γ_changes
bool rescale_when_γ_changes
Definition: decl/lbfgs.hpp:24

alpaqa::LBFGSParams::memory
unsigned memory
Length of the history to keep.
Definition: decl/lbfgs.hpp:14

alpaqa::LBFGSParams::cbfgs
struct alpaqa::LBFGSParams::@0 cbfgs
Parameters in the cautious BFGS update condition.

alpaqa::real_t
double real_t
Default floating point type.
Definition: vec.hpp:8

alpaqa::rvec
Eigen::Ref< vec > rvec
Default type for mutable references to vectors.
Definition: vec.hpp:16

alpaqa::Box
Definition: box.hpp:7

alpaqa::LBFGSParams
Parameters for the LBFGS and SpecializedLBFGS classes.
Definition: decl/lbfgs.hpp:12

panoc-direction-update.hpp

alpaqa::PANOCDirection< LBFGS >::PANOCDirection
PANOCDirection(LBFGS &&lbfgs)
Definition: decl/lbfgs.hpp:105

alpaqa::PANOCDirection< LBFGS >::lbfgs
LBFGS lbfgs
Definition: decl/lbfgs.hpp:102

alpaqa::PANOCDirection< LBFGS >::PANOCDirection
PANOCDirection(const LBFGSParams &params)
Definition: decl/lbfgs.hpp:103

alpaqa::PANOCDirection< LBFGS >::PANOCDirection
PANOCDirection(const LBFGS &lbfgs)
Definition: decl/lbfgs.hpp:104

alpaqa::PANOCDirection
Definition: panoc-direction-update.hpp:8

alpaqa::PANOCDirection::update
static bool update(DirectionProviderT &dp, crvec xₖ, crvec xₖ₊₁, crvec pₖ, crvec pₖ₊₁, crvec gradₖ₊₁, const Box &C, real_t γₖ₊₁)=delete

alpaqa::PANOCDirection::apply
static bool apply(DirectionProviderT &dp, crvec xₖ, crvec x̂ₖ, crvec pₖ, real_t γ, rvec qₖ)=delete
Apply the direction estimation in the current point.

alpaqa::PANOCDirection::changed_γ
static void changed_γ(DirectionProviderT &dp, real_t γₖ, real_t old_γₖ)=delete

alpaqa::PANOCDirection::initialize
static void initialize(DirectionProviderT &dp, crvec x₀, crvec x̂₀, crvec p₀, crvec grad₀)=delete

vec.hpp