0.0.1/Doxygen/inner_2panoc_8hpp_source.html

#pragma once


#include <alpaqa/inner/decl/panoc.hpp>

#include <alpaqa/inner/detail/panoc-helpers.hpp>

#include <alpaqa/inner/directions/decl/panoc-direction-update.hpp>


#include <cassert>

#include <cmath>

#include <iomanip>

#include <iostream>

#include <stdexcept>


namespace alpaqa {


using std::chrono::duration_cast;

using std::chrono::microseconds;


/// Name of this solver: the text "PANOCSolver<", followed by the name reported
/// by the direction provider, followed by ">".
template <class DirectionProviderT>
std::string PANOCSolver<DirectionProviderT>::get_name() const {
    std::string solver_name = "PANOCSolver<";
    solver_name += direction_provider.get_name();
    solver_name += ">";
    return solver_name;
}


/// Run the PANOC iteration starting from @p x, for the given multipliers @p y
/// and constraint weights @p Σ.
///
/// The loop alternates projected gradient steps with quasi-Newton steps
/// obtained from the direction provider, combined through a backtracking line
/// search on the forward-backward envelope φ. It ends as soon as
/// detail::check_all_stop_conditions reports a status other than
/// SolverStatus::Unknown.
///
/// @return Statistics of the run (status, iteration count, final εₖ, elapsed
///         time and the L-BFGS / line search counters).
/// @throws std::logic_error if the main loop ends without any stop condition
///         having been triggered.
template <class DirectionProviderT>
typename PANOCSolver<DirectionProviderT>::Stats
PANOCSolver<DirectionProviderT>::operator()(
    /// [in]    Problem description
    const Problem &problem,
    /// [in]    Constraint weights @f$ \Sigma @f$
    crvec Σ,
    /// [in]    Tolerance @f$ \varepsilon @f$
    real_t ε,
    /// [in]    Overwrite @p x, @p y and @p err_z even if not converged
    bool always_overwrite_results,
    /// [inout] Decision variable @f$ x @f$
    rvec x,
    /// [inout] Lagrange multipliers @f$ y @f$
    rvec y,
    /// [out]   Slack variable error @f$ g(x) - z @f$
    rvec err_z) {

    auto start_time = std::chrono::steady_clock::now();
    Stats s;

    const auto n = problem.n;
    const auto m = problem.m;

    // Allocate vectors, init L-BFGS -------------------------------------------

    // TODO: the L-BFGS objects and vectors allocate on each iteration of ALM,
    //       and there are more vectors than strictly necessary.

    // ∇ψ(x̂ₖ) is only computed (and only allocated) if the selected stopping
    // criterion needs it.
    bool need_grad_̂ψₖ = detail::stop_crit_requires_grad_̂ψₖ(params.stop_crit);

    vec xₖ = x,   // Value of x at the beginning of the iteration
        x̂ₖ(n),    // Value of x after a projected gradient step
        xₖ₊₁(n),  // xₖ for next iteration
        x̂ₖ₊₁(n),  // x̂ₖ for next iteration
        ŷx̂ₖ(m),   // ŷ(x̂ₖ) = Σ (g(x̂ₖ) - ẑₖ)
        ŷx̂ₖ₊₁(m), // ŷ(x̂ₖ) for next iteration
        pₖ(n),    // Projected gradient step pₖ = x̂ₖ - xₖ
        pₖ₊₁(n), // Projected gradient step pₖ₊₁ = x̂ₖ₊₁ - xₖ₊₁
        qₖ(n),   // Newton step Hₖ pₖ
        grad_ψₖ(n),                    // ∇ψ(xₖ)
        grad_̂ψₖ(need_grad_̂ψₖ ? n : 0), // ∇ψ(x̂ₖ)
        grad_ψₖ₊₁(n);                  // ∇ψ(xₖ₊₁)

    // Scratch storage handed to the helper functions
    vec work_n(n), work_m(m);

    // Keep track of how many successive iterations didn't update the iterate
    unsigned no_progress = 0;

    // Helper functions --------------------------------------------------------

    // Wrappers for helper functions that automatically pass along any arguments
    // that are constant within PANOC (for readability in the main algorithm)
    auto calc_ψ_ŷ = [&problem, &y, &Σ](crvec x, rvec ŷ) {
        return detail::calc_ψ_ŷ(problem, x, y, Σ, ŷ);
    };
    auto calc_ψ_grad_ψ = [&problem, &y, &Σ, &work_n, &work_m](crvec x,
                                                              rvec grad_ψ) {
        return detail::calc_ψ_grad_ψ(problem, x, y, Σ, grad_ψ, work_n, work_m);
    };
    auto calc_grad_ψ_from_ŷ = [&problem, &work_n](crvec x, crvec ŷ,
                                                  rvec grad_ψ) {
        detail::calc_grad_ψ_from_ŷ(problem, x, ŷ, grad_ψ, work_n);
    };
    auto calc_x̂ = [&problem](real_t γ, crvec x, crvec grad_ψ, rvec x̂, rvec p) {
        detail::calc_x̂(problem, γ, x, grad_ψ, x̂, p);
    };
    auto calc_err_z = [&problem, &y, &Σ](crvec x̂, rvec err_z) {
        detail::calc_err_z(problem, x̂, y, Σ, err_z);
    };
    auto descent_lemma = [this, &problem, &y,
                          &Σ](crvec xₖ, real_t ψₖ, crvec grad_ψₖ, rvec x̂ₖ,
                              rvec pₖ, rvec ŷx̂ₖ, real_t &ψx̂ₖ, real_t &pₖᵀpₖ,
                              real_t &grad_ψₖᵀpₖ, real_t &Lₖ, real_t &γₖ) {
        return detail::descent_lemma(
            problem, params.quadratic_upperbound_tolerance_factor, params.L_max,
            xₖ, ψₖ, grad_ψₖ, y, Σ, x̂ₖ, pₖ, ŷx̂ₖ, ψx̂ₖ, pₖᵀpₖ, grad_ψₖᵀpₖ, Lₖ, γₖ);
    };
    auto print_progress = [&](unsigned k, real_t ψₖ, crvec grad_ψₖ,
                              real_t pₖᵀpₖ, real_t γₖ, real_t εₖ) {
        std::cout << "[PANOC] " << std::setw(6) << k
                  << ": ψ = " << std::setw(13) << ψₖ
                  << ", ‖∇ψ‖ = " << std::setw(13) << grad_ψₖ.norm()
                  << ", ‖p‖ = " << std::setw(13) << std::sqrt(pₖᵀpₖ)
                  << ", γ = " << std::setw(13) << γₖ
                  << ", εₖ = " << std::setw(13) << εₖ << "\r\n";
    };

    // Estimate Lipschitz constant ---------------------------------------------

    real_t ψₖ, Lₖ;
    // Finite difference approximation of ∇²ψ in starting point
    if (params.Lipschitz.L₀ <= 0) {
        Lₖ = detail::initial_lipschitz_estimate(
            problem, xₖ, y, Σ, params.Lipschitz.ε, params.Lipschitz.δ,
            params.L_min, params.L_max,
            /* in ⟹ out */ ψₖ, grad_ψₖ, x̂ₖ, grad_ψₖ₊₁, work_n, work_m);
    }
    // Initial Lipschitz constant provided by the user
    else {
        Lₖ = params.Lipschitz.L₀;
        // Calculate ψ(xₖ), ∇ψ(x₀)
        ψₖ = calc_ψ_grad_ψ(xₖ, /* in ⟹ out */ grad_ψₖ);
    }
    if (not std::isfinite(Lₖ)) {
        // Report the time spent so far, like the regular exit path does
        s.elapsed_time = duration_cast<microseconds>(
            std::chrono::steady_clock::now() - start_time);
        s.status = SolverStatus::NotFinite;
        return s;
    }
    real_t γₖ = params.Lipschitz.Lγ_factor / Lₖ;
    real_t τ  = NaN; // No line search has been performed yet

    // First projected gradient step -------------------------------------------

    // Calculate x̂₀, p₀ (projected gradient step)
    calc_x̂(γₖ, xₖ, grad_ψₖ, /* in ⟹ out */ x̂ₖ, pₖ);
    // Calculate ψ(x̂ₖ) and ŷ(x̂ₖ)
    real_t ψx̂ₖ        = calc_ψ_ŷ(x̂ₖ, /* in ⟹ out */ ŷx̂ₖ);
    real_t grad_ψₖᵀpₖ = grad_ψₖ.dot(pₖ);
    real_t pₖᵀpₖ      = pₖ.squaredNorm();
    // Compute forward-backward envelope
    real_t φₖ = ψₖ + 1 / (2 * γₖ) * pₖᵀpₖ + grad_ψₖᵀpₖ;

    // Main PANOC loop
    // =========================================================================
    for (unsigned k = 0; k <= params.max_iter; ++k) {

        // Quadratic upper bound -----------------------------------------------
        if (k == 0 || params.update_lipschitz_in_linesearch == false) {
            // Decrease step size until quadratic upper bound is satisfied
            real_t old_γₖ =
                descent_lemma(xₖ, ψₖ, grad_ψₖ,
                              /* in ⟹ out */ x̂ₖ, pₖ, ŷx̂ₖ,
                              /* inout */ ψx̂ₖ, pₖᵀpₖ, grad_ψₖᵀpₖ, Lₖ, γₖ);
            if (k > 0 && γₖ != old_γₖ) // Flush L-BFGS if γ changed
                direction_provider.changed_γ(γₖ, old_γₖ);
            else if (k == 0) // Initialize L-BFGS
                direction_provider.initialize(xₖ, x̂ₖ, pₖ, grad_ψₖ);
            // φₖ depends on γₖ, so it has to be recomputed if γₖ changed
            if (γₖ != old_γₖ)
                φₖ = ψₖ + 1 / (2 * γₖ) * pₖᵀpₖ + grad_ψₖᵀpₖ;
        }
        // Calculate ∇ψ(x̂ₖ)
        if (need_grad_̂ψₖ)
            calc_grad_ψ_from_ŷ(x̂ₖ, ŷx̂ₖ, /* in ⟹ out */ grad_̂ψₖ);

        // Check stop condition ------------------------------------------------
        real_t εₖ = detail::calc_error_stop_crit(
            problem.C, params.stop_crit, pₖ, γₖ, xₖ, x̂ₖ, ŷx̂ₖ, grad_ψₖ, grad_̂ψₖ);

        // Print progress
        if (params.print_interval != 0 && k % params.print_interval == 0)
            print_progress(k, ψₖ, grad_ψₖ, pₖᵀpₖ, γₖ, εₖ);
        if (progress_cb)
            progress_cb({k, xₖ, pₖ, pₖᵀpₖ, x̂ₖ, φₖ, ψₖ, grad_ψₖ, ψx̂ₖ, grad_̂ψₖ,
                         Lₖ, γₖ, τ, εₖ, Σ, y, problem, params});

        auto time_elapsed = std::chrono::steady_clock::now() - start_time;
        auto stop_status  = detail::check_all_stop_conditions(
            params, time_elapsed, k, stop_signal, ε, εₖ, no_progress);
        if (stop_status != SolverStatus::Unknown) {
            // TODO: We could cache g(x) and ẑ, but would that be faster?
            //       It saves 1 evaluation of g per ALM iteration, but requires
            //       many extra stores in the inner loops of PANOC.
            // TODO: move the computation of ẑ and g(x) to ALM?
            if (stop_status == SolverStatus::Converged ||
                stop_status == SolverStatus::Interrupted ||
                always_overwrite_results) {
                // err_z must be computed before y is overwritten below,
                // because calc_err_z reads y
                calc_err_z(x̂ₖ, /* in ⟹ out */ err_z);
                x = std::move(x̂ₖ);
                y = std::move(ŷx̂ₖ);
            }
            s.iterations   = k;
            s.ε            = εₖ;
            s.elapsed_time = duration_cast<microseconds>(time_elapsed);
            s.status       = stop_status;
            return s;
        }

        // Calculate quasi-Newton step -----------------------------------------
        real_t step_size =
            params.lbfgs_stepsize == LBFGSStepSize::BasedOnGradientStepSize
                ? 1
                : -1;
        if (k > 0)
            direction_provider.apply(xₖ, x̂ₖ, pₖ, step_size,
                                     /* in ⟹ out */ qₖ);

        // Line search initialization ------------------------------------------
        τ                  = 1;
        real_t σₖγₖ⁻¹pₖᵀpₖ = (1 - γₖ * Lₖ) * pₖᵀpₖ / (2 * γₖ);
        real_t φₖ₊₁, ψₖ₊₁, ψx̂ₖ₊₁, grad_ψₖ₊₁ᵀpₖ₊₁, pₖ₊₁ᵀpₖ₊₁;
        real_t Lₖ₊₁, γₖ₊₁;
        real_t ls_cond;
        // TODO: make separate parameter
        real_t margin =
            (1 + std::abs(φₖ)) * params.quadratic_upperbound_tolerance_factor;

        // Make sure quasi-Newton step is valid
        if (k == 0) {
            τ = 0; // Always use prox step on first iteration
        } else if (not qₖ.allFinite()) {
            τ = 0;
            ++s.lbfgs_failures;
            direction_provider.reset(); // Is there anything else we can do?
        }

        // Line search loop ----------------------------------------------------
        do {
            // Every trial starts from the Lipschitz estimate and step size of
            // the current iterate
            Lₖ₊₁ = Lₖ;
            γₖ₊₁ = γₖ;

            // Calculate xₖ₊₁
            if (τ / 2 < params.τ_min) { // line search failed
                xₖ₊₁.swap(x̂ₖ);          // → safe prox step
                ψₖ₊₁ = ψx̂ₖ;
                if (need_grad_̂ψₖ)
                    grad_ψₖ₊₁.swap(grad_̂ψₖ);
                else
                    calc_grad_ψ_from_ŷ(xₖ₊₁, ŷx̂ₖ, /* in ⟹ out */ grad_ψₖ₊₁);
            } else {        // line search didn't fail (yet)
                if (τ == 1) // → faster quasi-Newton step
                    xₖ₊₁ = xₖ + qₖ;
                else
                    xₖ₊₁ = xₖ + (1 - τ) * pₖ + τ * qₖ;
                // Calculate ψ(xₖ₊₁), ∇ψ(xₖ₊₁)
                ψₖ₊₁ = calc_ψ_grad_ψ(xₖ₊₁, /* in ⟹ out */ grad_ψₖ₊₁);
            }

            // Calculate x̂ₖ₊₁, pₖ₊₁ (projected gradient step in xₖ₊₁)
            calc_x̂(γₖ₊₁, xₖ₊₁, grad_ψₖ₊₁, /* in ⟹ out */ x̂ₖ₊₁, pₖ₊₁);
            // Calculate ψ(x̂ₖ₊₁) and ŷ(x̂ₖ₊₁)
            ψx̂ₖ₊₁ = calc_ψ_ŷ(x̂ₖ₊₁, /* in ⟹ out */ ŷx̂ₖ₊₁);

            // Quadratic upper bound -------------------------------------------
            grad_ψₖ₊₁ᵀpₖ₊₁ = grad_ψₖ₊₁.dot(pₖ₊₁);
            pₖ₊₁ᵀpₖ₊₁      = pₖ₊₁.squaredNorm();
            real_t pₖ₊₁ᵀpₖ₊₁_ₖ = pₖ₊₁ᵀpₖ₊₁; // prox step with step size γₖ

            if (params.update_lipschitz_in_linesearch == true) {
                // Decrease step size until quadratic upper bound is satisfied
                (void)descent_lemma(xₖ₊₁, ψₖ₊₁, grad_ψₖ₊₁,
                                    /* in ⟹ out */ x̂ₖ₊₁, pₖ₊₁, ŷx̂ₖ₊₁,
                                    /* inout */ ψx̂ₖ₊₁, pₖ₊₁ᵀpₖ₊₁,
                                    grad_ψₖ₊₁ᵀpₖ₊₁, Lₖ₊₁, γₖ₊₁);
            }

            // Compute forward-backward envelope
            φₖ₊₁ = ψₖ₊₁ + 1 / (2 * γₖ₊₁) * pₖ₊₁ᵀpₖ₊₁ + grad_ψₖ₊₁ᵀpₖ₊₁;
            // Compute line search condition
            ls_cond = φₖ₊₁ - (φₖ - σₖγₖ⁻¹pₖᵀpₖ);
            if (params.alternative_linesearch_cond)
                ls_cond -= (0.5 / γₖ₊₁ - 0.5 / γₖ) * pₖ₊₁ᵀpₖ₊₁_ₖ;

            // Note: from here on, τ holds half of the value that was just tried
            τ /= 2;
        } while (ls_cond > margin && τ >= params.τ_min);

        // If τ < τ_min the line search failed and we accepted the prox step
        if (τ < params.τ_min && k != 0) {
            ++s.linesearch_failures;
            τ = 0;
        }
        if (k != 0) {
            // τ was halved once more after the accepted trial, hence the
            // factor 2 to recover the accepted value
            s.count_τ += 1;
            s.sum_τ += τ * 2;
            s.τ_1_accepted += τ * 2 == 1;
        }

        // Update L-BFGS -------------------------------------------------------
        if (γₖ != γₖ₊₁) // Flush L-BFGS if γ changed
            direction_provider.changed_γ(γₖ₊₁, γₖ);

        s.lbfgs_rejected += not direction_provider.update(
            xₖ, xₖ₊₁, pₖ, pₖ₊₁, grad_ψₖ₊₁, problem.C, γₖ₊₁);

        // Check if we made any progress. A new comparison is started every
        // max_no_progress iterations and continued for as long as the iterate
        // does not change. A value of zero is treated as "compare on every
        // iteration", which also avoids an (undefined) modulo by zero.
        const bool start_progress_check =
            params.max_no_progress == 0 || k % params.max_no_progress == 0;
        if (no_progress > 0 || start_progress_check)
            no_progress = xₖ == xₖ₊₁ ? no_progress + 1 : 0;

        // Advance step --------------------------------------------------------
        Lₖ = Lₖ₊₁;
        γₖ = γₖ₊₁;

        ψₖ  = ψₖ₊₁;
        ψx̂ₖ = ψx̂ₖ₊₁;
        φₖ  = φₖ₊₁;

        // Swap instead of copy: the "next" vectors become the current ones and
        // the old current vectors are reused as storage in the next iteration
        xₖ.swap(xₖ₊₁);
        x̂ₖ.swap(x̂ₖ₊₁);
        ŷx̂ₖ.swap(ŷx̂ₖ₊₁);
        pₖ.swap(pₖ₊₁);
        grad_ψₖ.swap(grad_ψₖ₊₁);
        grad_ψₖᵀpₖ = grad_ψₖ₊₁ᵀpₖ₊₁;
        pₖᵀpₖ      = pₖ₊₁ᵀpₖ₊₁;
    }
    // Only reached if no stop condition was triggered within the loop
    throw std::logic_error("[PANOC] loop error");
}


} // namespace alpaqa

alpaqa::PANOCSolver::get_name
std::string get_name() const
Definition: inner/panoc.hpp:19

alpaqa::PANOCSolver::operator()
Stats operator()(const Problem &problem, crvec Σ, real_t ε, bool always_overwrite_results, rvec x, rvec y, rvec err_z)
Definition: inner/panoc.hpp:25

panoc.hpp

alpaqa::detail::calc_error_stop_crit
real_t calc_error_stop_crit(const Box &C, PANOCStopCrit crit, crvec pₖ, real_t γ, crvec xₖ, crvec x̂ₖ, crvec ŷₖ, crvec grad_ψₖ, crvec grad_̂ψₖ)
Compute the ε from the stopping criterion, see PANOCStopCrit.
Definition: panoc-helpers.hpp:169

alpaqa::detail::check_all_stop_conditions
SolverStatus check_all_stop_conditions(const ParamsT &params, DurationT time_elapsed, unsigned iteration, const AtomicStopSignal &stop_signal, real_t ε, real_t εₖ, unsigned no_progress)
Check all stop conditions (required tolerance reached, out of time, maximum number of iterations exceeded, interrupted by user, infinite iterate, no progress made).
Definition: panoc-helpers.hpp:307

alpaqa::detail::calc_ψ_ŷ
real_t calc_ψ_ŷ(const Problem &p, crvec x, crvec y, crvec Σ, rvec ŷ)
Calculate both ψ(x) and the vector ŷ that can later be used to compute ∇ψ.
Definition: panoc-helpers.hpp:16

alpaqa::detail::descent_lemma
real_t descent_lemma(const Problem &problem, real_t rounding_tolerance, real_t L_max, crvec xₖ, real_t ψₖ, crvec grad_ψₖ, crvec y, crvec Σ, rvec x̂ₖ, rvec pₖ, rvec ŷx̂ₖ, real_t &ψx̂ₖ, real_t &norm_sq_pₖ, real_t &grad_ψₖᵀpₖ, real_t &Lₖ, real_t &γₖ)
Increase the estimate of the Lipschitz constant of the objective gradient and decrease the step size until the quadratic upper bound (descent lemma) is satisfied.
Definition: panoc-helpers.hpp:242

alpaqa::detail::stop_crit_requires_grad_̂ψₖ
bool stop_crit_requires_grad_̂ψₖ(PANOCStopCrit crit)
Definition: panoc-helpers.hpp:153

alpaqa::detail::calc_ψ_grad_ψ
real_t calc_ψ_grad_ψ(const Problem &p, crvec x, crvec y, crvec Σ, rvec grad_ψ, rvec work_n, rvec work_m)
Calculate both ψ(x) and its gradient ∇ψ(x).
Definition: panoc-helpers.hpp:62

alpaqa::detail::calc_err_z
void calc_err_z(const Problem &p, crvec x̂, crvec y, crvec Σ, rvec err_z)
Calculate the error between ẑ and g(x).
Definition: panoc-helpers.hpp:107

alpaqa::detail::initial_lipschitz_estimate
real_t initial_lipschitz_estimate(const Problem &problem, crvec xₖ, crvec y, crvec Σ, real_t ε, real_t δ, real_t L_min, real_t L_max, real_t &ψ, rvec grad_ψ, rvec work_n1, rvec work_n2, rvec work_n3, rvec work_m)
Estimate the Lipschitz constant of the gradient ∇ψ using finite differences.
Definition: panoc-helpers.hpp:412

alpaqa::detail::calc_grad_ψ_from_ŷ
void calc_grad_ψ_from_ŷ(const Problem &p, crvec x, crvec ŷ, rvec grad_ψ, rvec work_n)
Calculate ∇ψ(x) using ŷ.
Definition: panoc-helpers.hpp:44

alpaqa::detail::calc_x̂
void calc_x̂(const Problem &prob, real_t γ, crvec x, crvec grad_ψ, rvec x̂, rvec p)
Definition: panoc-helpers.hpp:142

alpaqa::detail::print_progress
void print_progress(unsigned k, real_t ψₖ, crvec grad_ψₖ, real_t pₖᵀpₖ, real_t γₖ, real_t εₖ)
Definition: standalone/panoc.hpp:139

alpaqa.test.params
params
Definition: test.py:275

alpaqa.test.Σ
int Σ
Definition: test.py:72

alpaqa.test.err_z
err_z
Definition: test.py:78

alpaqa.test.m
int m
Definition: test.py:41

alpaqa.test.n
int n
Definition: test.py:40

alpaqa.test.ε
int ε
Definition: test.py:73

alpaqa
Definition: __init__.py:1

alpaqa::PANOCStats::lbfgs_rejected
unsigned lbfgs_rejected
Definition: inner/decl/panoc.hpp:58

alpaqa::PANOCStats::τ_1_accepted
unsigned τ_1_accepted
Definition: inner/decl/panoc.hpp:59

alpaqa::PANOCStats::lbfgs_failures
unsigned lbfgs_failures
Definition: inner/decl/panoc.hpp:57

alpaqa::crvec
Eigen::Ref< const vec > crvec
Default type for immutable references to vectors.
Definition: vec.hpp:18

alpaqa::NaN
constexpr real_t NaN
Not a number.
Definition: vec.hpp:28

alpaqa::PANOCStats::sum_τ
real_t sum_τ
Definition: inner/decl/panoc.hpp:61

alpaqa::SolverStatus::Interrupted
@ Interrupted
Solver was interrupted by the user.

alpaqa::SolverStatus::Unknown
@ Unknown
Initial value.

alpaqa::SolverStatus::Converged
@ Converged
Converged and reached given tolerance.

alpaqa::SolverStatus::NotFinite
@ NotFinite
Intermediate results were infinite or not-a-number.

alpaqa::vec
realvec vec
Default type for vectors.
Definition: vec.hpp:14

alpaqa::PANOCStats::ε
real_t ε
Definition: inner/decl/panoc.hpp:53

alpaqa::PANOCStats::elapsed_time
std::chrono::microseconds elapsed_time
Definition: inner/decl/panoc.hpp:54

alpaqa::real_t
double real_t
Default floating point type.
Definition: vec.hpp:8

alpaqa::PANOCStats::linesearch_failures
unsigned linesearch_failures
Definition: inner/decl/panoc.hpp:56

alpaqa::LBFGSStepSize::BasedOnGradientStepSize
@ BasedOnGradientStepSize

alpaqa::PANOCStats::iterations
unsigned iterations
Definition: inner/decl/panoc.hpp:55

alpaqa::PANOCStats::status
SolverStatus status
Definition: inner/decl/panoc.hpp:52

alpaqa::PANOCStats::count_τ
unsigned count_τ
Definition: inner/decl/panoc.hpp:60

alpaqa::rvec
Eigen::Ref< vec > rvec
Default type for mutable references to vectors.
Definition: vec.hpp:16

alpaqa::PANOCStats
Definition: inner/decl/panoc.hpp:51

codegen-rosenbrock.y
y
Definition: codegen-rosenbrock.py:9

codegen-rosenbrock.x
x
Definition: codegen-rosenbrock.py:8

getting-started.p
p
Definition: getting-started.py:11

main.problem
problem
Definition: main.py:16

panoc-direction-update.hpp

panoc-helpers.hpp

alpaqa::Problem
Problem description for minimization problems.
Definition: include/alpaqa/util/problem.hpp:26