0.0.1/Doxygen/specialized-lbfgs_8hpp_source.html

#pragma once


#include <alpaqa/inner/detail/panoc-helpers.hpp>
#include <alpaqa/inner/directions/decl/specialized-lbfgs.hpp>
#include <alpaqa/inner/directions/lbfgs.hpp>

#include <cassert>
#include <cmath>
#include <limits>


namespace alpaqa {


/// Initialize with the starting point x₀ and the gradient in that point.
///
/// Marks the circular buffer as empty and stores x₀ and grad₀ in slot 0 of the
/// x and g storage.
inline void SpecializedLBFGS::initialize(crvec x₀, crvec grad₀) {
    // Rewind the circular buffer: no (s, y) pairs are available yet
    this->idx  = 0;
    this->full = false;
    // Slot 0 holds the initial iterate and its gradient
    this->x(0) = x₀;
    this->g(0) = grad₀;
}


/// Standard L-BFGS update without changing the step size γ.
///
/// Forms sₖ = xₖ₊₁ - xₖ and yₖ = pₖ - pₖ₊₁. If LBFGS::update_valid accepts
/// them, the pair (together with ρₖ = 1 / yₖᵀsₖ) is written at the current
/// buffer position, xₖ₊₁ and gradₖ₊₁ are written to the next slot, and the
/// buffer position advances.
///
/// @return false if the update was rejected (no member is modified in that
///         case), true if it was stored.
inline bool SpecializedLBFGS::standard_update(crvec xₖ, crvec xₖ₊₁,
                                              crvec pₖ, crvec pₖ₊₁,
                                              crvec gradₖ₊₁) {
    // Lazy difference expressions; named so they do not shadow s() and y()
    const auto sₖ = xₖ₊₁ - xₖ;
    const auto yₖ = pₖ - pₖ₊₁;

    const real_t yᵀs = yₖ.dot(sₖ);
    const real_t sᵀs = sₖ.squaredNorm();
    const real_t pᵀp = pₖ₊₁.squaredNorm();
    const real_t ρₖ  = 1 / yᵀs;

    const bool accepted = LBFGS::update_valid(params, yᵀs, sᵀs, pᵀp);
    if (!accepted)
        return false;

    // Slot that will hold the new iterate and gradient
    const size_t next = succ(idx);

    // Store the new (s, y, ρ) triple at the current position
    s(idx) = sₖ;
    y(idx) = yₖ;
    ρ(idx) = ρₖ;

    // Store the new iterate and its gradient one slot further
    x(next) = xₖ₊₁;
    g(next) = gradₖ₊₁;

    // Advance; wrapping around to 0 means every slot has been written
    idx = next;
    if (idx == 0)
        full = true;

    return true;
}


/// L-BFGS update when changing the step size γ, recomputing everything.
///
/// The projected gradient step at the current stored point (x(idx), g(idx)) is
/// recomputed with the new γ, the new pair (sₖ, yₖ) is validated with
/// LBFGS::update_valid, and on success every stored y(i) is rebuilt from the
/// stored x(i) and g(i) using the new γ before the new pair is appended.
///
/// @param pₖ_old_γ  Unused: it was computed with the previous γ.
/// @return false if the update was rejected, true if it was stored.
///
/// NOTE(review): on the rejected path the p() and w() workspaces have already
/// been overwritten, while the stored s, y, ρ, x and g are left untouched.

inline bool SpecializedLBFGS::full_update(crvec xₖ, crvec xₖ₊₁,

                                          crvec pₖ_old_γ, crvec pₖ₊₁,

                                          crvec gradₖ₊₁, const Box &C,

                                          real_t γ) {

    // Lazy expression, evaluated each time it is used below
    auto &&sₖ = xₖ₊₁ - xₖ;

    auto &&yₖ = this->w(); // temporary workspace

    // Old pₖ is no longer valid, recompute with new γ

    (void)pₖ_old_γ;

    auto &&pₖ = this->p();

    // Uses the stored x(idx) and g(idx), not the xₖ argument (see assert below)
    pₖ        = detail::projected_gradient_step(C, γ, x(idx), g(idx));

    yₖ        = pₖ - pₖ₊₁;


    // The stored current point is expected to match the caller's xₖ
    assert(x(idx) == xₖ);


    real_t yᵀs = yₖ.dot(sₖ);

    real_t sᵀs = sₖ.squaredNorm();

    real_t pᵀp = pₖ₊₁.squaredNorm();

    real_t ρₖ  = 1 / yᵀs;


    if (not LBFGS::update_valid(params, yᵀs, sᵀs, pᵀp))

        return false;


    // Recompute all residuals with new γ

    // yₖ = pₖ - pₖ₊₁

    // pₖ = Π(-γ∇ψ(xₖ), C - xₖ)

    // Walk backwards from the most recent stored pair. On entry to each
    // iteration, pₖ holds the step recomputed for the point that follows
    // index i, so each projected step is evaluated once and reused.
    // NOTE(review): ρ(i) is not refreshed here although y(i) changes —
    // confirm whether ρ(i) = 1 / (y(i)ᵀs(i)) should be recomputed as well.
    size_t endidx = full ? idx : pred(0);

    for (size_t i = pred(idx); i != endidx; i = pred(i)) {

        this->y(i) = -pₖ /* i+1 */;

        pₖ = detail::projected_gradient_step(C, γ, this->x(i), this->g(i));

        this->y(i) += pₖ /* i */;

    }

    // Store the new s and y vectors

    this->s(idx) = sₖ;

    this->y(idx) = yₖ;

    this->ρ(idx) = ρₖ;


    // Store x and the gradient

    this->x(succ(idx)) = xₖ₊₁;

    this->g(succ(idx)) = gradₖ₊₁;


    // Increment the index in the circular buffer

    idx = succ(idx);

    // Wrapping around to 0 means every slot has been written at least once
    full |= idx == 0;


    return true;

}


/// Update the inverse Hessian approximation using the new vectors xₖ₊₁ and
/// pₖ₊₁.
///
/// Dispatches to standard_update when γ equals the previously seen step size
/// (or when the stored old_γ is 0), and to full_update otherwise. The step
/// size is remembered in old_γ regardless of whether the update was accepted.
///
/// @return the result of the selected update function.
inline bool SpecializedLBFGS::update(crvec xₖ, crvec xₖ₊₁,
                                     crvec pₖ, crvec pₖ₊₁,
                                     crvec gradₖ₊₁, const Box &C,
                                     real_t γ) {
    // old_γ == 0 is handled like an unchanged step size
    // (presumably "no previous γ recorded" — confirm against the declaration)
    const bool γ_unchanged = γ == old_γ || old_γ == 0;

    bool accepted;
    if (γ_unchanged)
        accepted = standard_update(xₖ, xₖ₊₁, pₖ, pₖ₊₁, gradₖ₊₁);
    else
        accepted = full_update(xₖ, xₖ₊₁, pₖ, pₖ₊₁, gradₖ₊₁, C, γ);

    old_γ = γ;
    return accepted;
}


template <class Vec>

void SpecializedLBFGS::apply(Vec &&q) {

    // TODO: dry, reuse standard LBFGS::apply

    auto update1 = [&](size_t i) {

        α(i) = ρ(i) * (s(i).dot(q));

        q -= α(i) * y(i);

    };

    if (idx)

        for (size_t i = idx; i-- > 0;)

            update1(i);

    if (full)

        for (size_t i = history(); i-- > idx;)

            update1(i);


    // q = H₀ * q; // TODO: diagonal matrix H₀?


    auto update2 = [&](size_t i) {

        real_t β = ρ(i) * (y(i).dot(q));

        q += (α(i) - β) * s(i);

    };

    if (full)

        for (size_t i = idx; i < history(); ++i)

            update2(i);

    for (size_t i = 0; i < idx; ++i)

        update2(i);

}


inline void SpecializedLBFGS::resize(size_t n, size_t history) {

    sto.resize(n + 1, history * 4 + 2);

    sto.fill(std::numeric_limits<real_t>::quiet_NaN());

    idx  = 0;

    full = false;

}


/// Throw away the approximation and all previous vectors s and y.
///
/// The current point and its gradient (stored at position idx) are moved to
/// slot 0, and the circular buffer is marked empty, so the next update starts
/// a fresh history from the current iterate.
inline void SpecializedLBFGS::reset() {
    // Carry the current iterate and its gradient over to slot 0.
    x(0) = x(idx);
    // Fix: this previously copied x(idx) into g(0), which left the iterate in
    // the gradient slot; a later full_update would then recompute projected
    // gradient steps from a wrong gradient.
    g(0) = g(idx);
    idx  = 0;
    full = false;
}


} // namespace alpaqa


#include <alpaqa/inner/directions/decl/panoc-direction-update.hpp>


namespace alpaqa {


/// PANOCDirection specialization that forwards to SpecializedLBFGS.
///
/// Arguments of the PANOCDirection interface that SpecializedLBFGS does not
/// use are left unnamed.
template <>
struct PANOCDirection<SpecializedLBFGS> {

    /// Forward the starting point and its gradient; x̂₀ and p₀ are ignored.
    static void initialize(SpecializedLBFGS &lbfgs, crvec x₀,
                           crvec /* x̂₀ */, crvec /* p₀ */, crvec grad₀) {
        lbfgs.initialize(x₀, grad₀);
    }

    /// Forward all arguments to SpecializedLBFGS::update and return its
    /// result.
    static bool update(SpecializedLBFGS &lbfgs, crvec xₖ, crvec xₖ₊₁,
                       crvec pₖ, crvec pₖ₊₁, crvec gradₖ₊₁,
                       const Box &C, real_t γ) {
        const bool accepted =
            lbfgs.update(xₖ, xₖ₊₁, pₖ, pₖ₊₁, gradₖ₊₁, C, γ);
        return accepted;
    }

    /// Copy pₖ into qₖ and apply the inverse Hessian approximation to it in
    /// place. Always returns true; xₖ, x̂ₖ and γ are ignored.
    static bool apply(SpecializedLBFGS &lbfgs, crvec /* xₖ */,
                      crvec /* x̂ₖ */, crvec pₖ, real_t /* γ */, rvec qₖ) {
        // TODO: add this parameter to SLBFGS (γ is currently unused)
        qₖ = pₖ;
        lbfgs.apply(qₖ);
        return true;
    }

    /// No-op: nothing is done here when the step size changes
    /// (SpecializedLBFGS::update compares γ against its own stored value).
    static void changed_γ(SpecializedLBFGS & /* lbfgs */, real_t /* γₖ */,
                          real_t /* old_γₖ */) {}
};


} // namespace alpaqa

alpaqa::LBFGS::update_valid
static bool update_valid(LBFGSParams params, real_t yᵀs, real_t sᵀs, real_t pᵀp)
Check if the new vectors s and y allow for a valid BFGS update that preserves the positive definiteness of the Hessian approximation.
Definition: lbfgs.hpp:9

alpaqa::SpecializedLBFGS
Limited memory Broyden–Fletcher–Goldfarb–Shanno (L-BFGS) algorithm that can handle updates of the γ parameter.
Definition: decl/specialized-lbfgs.hpp:10

alpaqa::SpecializedLBFGS::params
Params params
Definition: decl/specialized-lbfgs.hpp:84

alpaqa::SpecializedLBFGS::full_update
bool full_update(crvec xₖ, crvec xₖ₊₁, crvec pₖ_old_γ, crvec pₖ₊₁, crvec gradₖ₊₁, const Box &C, real_t γ)
L-BFGS update when changing the step size γ, recomputing everything.
Definition: specialized-lbfgs.hpp:50

alpaqa::SpecializedLBFGS::succ
size_t succ(size_t i) const
Get the next index in the circular buffer of previous s, y, x and g vectors.
Definition: decl/specialized-lbfgs.hpp:51

alpaqa::SpecializedLBFGS::idx
size_t idx
Definition: decl/specialized-lbfgs.hpp:81

alpaqa::SpecializedLBFGS::full
bool full
Definition: decl/specialized-lbfgs.hpp:82

alpaqa::SpecializedLBFGS::initialize
void initialize(crvec x₀, crvec grad₀)
Initialize with the starting point x₀ and the gradient in that point.
Definition: specialized-lbfgs.hpp:11

alpaqa::SpecializedLBFGS::pred
size_t pred(size_t i) const
Get the previous index in the circular buffer of previous s, y, x and g vectors.
Definition: decl/specialized-lbfgs.hpp:54

alpaqa::SpecializedLBFGS::apply
void apply(Vec &&q)
Apply the inverse Hessian approximation to the given vector q.
Definition: specialized-lbfgs.hpp:109

alpaqa::SpecializedLBFGS::w
auto w()
Definition: decl/specialized-lbfgs.hpp:70

alpaqa::SpecializedLBFGS::old_γ
real_t old_γ
Definition: decl/specialized-lbfgs.hpp:83

alpaqa::SpecializedLBFGS::standard_update
bool standard_update(crvec xₖ, crvec xₖ₊₁, crvec pₖ, crvec pₖ₊₁, crvec gradₖ₊₁)
Standard L-BFGS update without changing the step size γ.
Definition: specialized-lbfgs.hpp:19

alpaqa::SpecializedLBFGS::history
size_t history() const
Get the number of previous vectors s, y, x and g stored in the buffer.
Definition: decl/specialized-lbfgs.hpp:48

alpaqa::SpecializedLBFGS::s
auto s(size_t i)
Definition: decl/specialized-lbfgs.hpp:56

alpaqa::SpecializedLBFGS::update
bool update(crvec xₖ, crvec xₖ₊₁, crvec pₖ, crvec pₖ₊₁, crvec gradₖ₊₁, const Box &C, real_t γ)
Update the inverse Hessian approximation using the new vectors xₖ₊₁ and pₖ₊₁.
Definition: specialized-lbfgs.hpp:97

alpaqa::SpecializedLBFGS::α
real_t & α(size_t i)
Definition: decl/specialized-lbfgs.hpp:74

alpaqa::SpecializedLBFGS::g
auto g(size_t i)
Definition: decl/specialized-lbfgs.hpp:64

alpaqa::SpecializedLBFGS::p
auto p()
Definition: decl/specialized-lbfgs.hpp:68

alpaqa::SpecializedLBFGS::resize
void resize(size_t n, size_t history)
Re-allocate storage for a problem with a different size.
Definition: specialized-lbfgs.hpp:135

alpaqa::SpecializedLBFGS::y
auto y(size_t i)
Definition: decl/specialized-lbfgs.hpp:58

alpaqa::SpecializedLBFGS::n
size_t n() const
Get the size of the s, y, x and g vectors in the buffer.
Definition: decl/specialized-lbfgs.hpp:46

alpaqa::SpecializedLBFGS::x
auto x(size_t i)
Definition: decl/specialized-lbfgs.hpp:60

alpaqa::SpecializedLBFGS::reset
void reset()
Throw away the approximation and all previous vectors s and y.
Definition: specialized-lbfgs.hpp:142

alpaqa::SpecializedLBFGS::sto
storage_t sto
Definition: decl/specialized-lbfgs.hpp:80

alpaqa::SpecializedLBFGS::ρ
real_t & ρ(size_t i)
Definition: decl/specialized-lbfgs.hpp:72

specialized-lbfgs.hpp

lbfgs.hpp

alpaqa::detail::projected_gradient_step
auto projected_gradient_step(const Box &C, real_t γ, crvec x, crvec grad_ψ)
Projected gradient step.
Definition: panoc-helpers.hpp:131

alpaqa.test.n
int n
Definition: test.py:40

alpaqa.test.C
C
Definition: test.py:262

alpaqa
Definition: __init__.py:1

alpaqa::crvec
Eigen::Ref< const vec > crvec
Default type for immutable references to vectors.
Definition: vec.hpp:18

alpaqa::real_t
double real_t
Default floating point type.
Definition: vec.hpp:8

alpaqa::rvec
Eigen::Ref< vec > rvec
Default type for mutable references to vectors.
Definition: vec.hpp:16

alpaqa::Box
Definition: box.hpp:7

panoc-direction-update.hpp

panoc-helpers.hpp

alpaqa::PANOCDirection< SpecializedLBFGS >::update
static bool update(SpecializedLBFGS &lbfgs, crvec xₖ, crvec xₖ₊₁, crvec pₖ, crvec pₖ₊₁, crvec gradₖ₊₁, const Box &C, real_t γ)
Definition: specialized-lbfgs.hpp:165

alpaqa::PANOCDirection< SpecializedLBFGS >::initialize
static void initialize(SpecializedLBFGS &lbfgs, crvec x₀, crvec x̂₀, crvec p₀, crvec grad₀)
Definition: specialized-lbfgs.hpp:158

alpaqa::PANOCDirection< SpecializedLBFGS >::apply
static bool apply(SpecializedLBFGS &lbfgs, crvec xₖ, crvec x̂ₖ, crvec pₖ, real_t γ, rvec qₖ)
Definition: specialized-lbfgs.hpp:171

alpaqa::PANOCDirection< SpecializedLBFGS >::changed_γ
static void changed_γ(SpecializedLBFGS &lbfgs, real_t γₖ, real_t old_γₖ)
Definition: specialized-lbfgs.hpp:181

alpaqa::PANOCDirection
Definition: panoc-direction-update.hpp:8