pantr/Doxygen/structured-newton_8hpp_source.html

#pragma once


#include <alpaqa/config/config.hpp>

#include <alpaqa/export.hpp>

#include <alpaqa/inner/directions/panoc-direction-update.hpp>

#include <alpaqa/inner/internal/panoc-helpers.hpp>

#include <alpaqa/problem/type-erased-problem.hpp>

#include <alpaqa/util/alloc-check.hpp>

#include <alpaqa/util/index-set.hpp>

#include <alpaqa/util/print.hpp>

#include <iostream>

#include <limits>

#include <optional>

#include <stdexcept>


#include <Eigen/Cholesky>

#include <Eigen/Eigenvalues>


namespace alpaqa {


/// Regularization settings used by @ref StructuredNewtonDirection when it
/// solves the Newton system through an eigenvalue decomposition.
template <Config Conf>
struct StructuredNewtonRegularizationParams {
    USING_ALPAQA_CONFIG(Conf);

    /// Relative lower bound on the eigenvalues of the Hessian: the bound that
    /// is actually enforced is this value multiplied by
    /// @f$ 1 + |\lambda_\mathrm{max}| @f$. Enforcing it corresponds to
    /// regularization using a multiple of identity.
    /// Defaults to the cube root of the machine epsilon of @c real_t.
    real_t min_eig{std::cbrt(std::numeric_limits<real_t>::epsilon())};

    /// If true, the smallest and largest eigenvalue of the Hessian are
    /// printed each time a direction is computed.
    bool print_eig{false};
};


/// Settings that control how @ref StructuredNewtonDirection builds the
/// right-hand side of its Newton system.
template <Config Conf>
struct StructuredNewtonDirectionParams {
    USING_ALPAQA_CONFIG(Conf);

    /// Whether the Hessian-vector product
    /// @f$ \nabla^2_{x_\mathcal{J}x_\mathcal{K}}\psi(x) q_\mathcal{K} @f$ from
    /// equation 12b in @cite pas2022alpaqa is included (true) or left out
    /// (false).
    bool hessian_vec{true};
};


/// @ingroup grp_DirectionProviders

template <Config Conf = DefaultConfig>

struct StructuredNewtonDirection {

    USING_ALPAQA_CONFIG(Conf);

    using Problem           = TypeErasedProblem<config_t>;

    using DirectionParams   = StructuredNewtonDirectionParams<config_t>;

    using AcceleratorParams = StructuredNewtonRegularizationParams<config_t>;


    struct Params {

        AcceleratorParams accelerator = {};

        DirectionParams direction     = {};

    };


    StructuredNewtonDirection() = default;

    StructuredNewtonDirection(const Params &params)

        : reg_params(params.accelerator), direction_params(params.direction) {}

    StructuredNewtonDirection(const AcceleratorParams &params,

                              const DirectionParams &directionparams = {})

        : reg_params(params), direction_params(directionparams) {}


    /// @see @ref PANOCDirection::initialize

    void initialize(const Problem &problem, crvec y, crvec Σ,

                    [[maybe_unused]] real_t γ_0, [[maybe_unused]] crvec x_0,

                    [[maybe_unused]] crvec x̂_0, [[maybe_unused]] crvec p_0,

                    [[maybe_unused]] crvec grad_ψx_0) {

        if (!(problem.provides_get_box_C() && problem.provides_get_box_D()))

            throw std::invalid_argument(

                "Structured Newton only supports box-constrained problems");

        // TODO: support eval_inactive_indices_res_lna

        if (!problem.provides_eval_hess_ψ())

            throw std::invalid_argument("Structured Newton requires hess_ψ");

        // Store references to problem and ALM variables

        this->problem = &problem;

        this->y.emplace(y);

        this->Σ.emplace(Σ);

        // Allocate workspaces

        const auto n = problem.get_n();

        JK.resize(n);

        H_storage.resize(n * n);

        HJ_storage.resize(n * n);

        // Store sparsity of H

        length_t nnz_H = problem.get_hess_ψ_num_nonzeros();

        if (nnz_H > 0) {

            inner_idx_H.resize(nnz_H);

            outer_ptr_H.resize(n + 1);

            mvec null{nullptr, 0};

            problem.eval_hess_ψ(x_0, y, Σ, 1, inner_idx_H, outer_ptr_H, null);

            throw std::logic_error("Sparse hessians not yet implemented");

        }

    }


    /// @see @ref PANOCDirection::has_initial_direction

    bool has_initial_direction() const { return true; }


    /// @see @ref PANOCDirection::update

    bool update([[maybe_unused]] real_t γₖ, [[maybe_unused]] real_t γₙₑₓₜ,

                [[maybe_unused]] crvec xₖ, [[maybe_unused]] crvec xₙₑₓₜ,

                [[maybe_unused]] crvec pₖ, [[maybe_unused]] crvec pₙₑₓₜ,

                [[maybe_unused]] crvec grad_ψxₖ,

                [[maybe_unused]] crvec grad_ψxₙₑₓₜ) {

        return true;

    }


    /// @see @ref PANOCDirection::apply

    bool apply(real_t γₖ, crvec xₖ, [[maybe_unused]] crvec x̂ₖ, crvec pₖ,

               crvec grad_ψxₖ, rvec qₖ) const {


        const auto n  = problem->get_n();

        const auto &C = problem->get_box_C();


        // Find inactive indices J

        auto nJ = 0;

        for (index_t i = 0; i < n; ++i) {

            real_t gd = xₖ(i) - γₖ * grad_ψxₖ(i);

            if (gd <= C.lowerbound(i)) {        // i ∊ J̲ ⊆ K

                qₖ(i) = pₖ(i);                  //

            } else if (C.upperbound(i) <= gd) { // i ∊ J̅ ⊆ K

                qₖ(i) = pₖ(i);                  //

            } else {                            // i ∊ J

                JK(nJ++) = i;

                qₖ(i)    = -grad_ψxₖ(i);

            }

        }


        // There are no inactive indices J

        if (nJ == 0) {

            // No free variables, no Newton step possible

            return false; // Simply use the projection step

        }


        // Compute the Hessian

        mmat H{H_storage.data(), n, n};

        problem->eval_hess_ψ(xₖ, *y, *Σ, 1, inner_idx_H, outer_ptr_H,

                             H_storage);


        // There are no active indices K

        if (nJ == n) {

            // If all indices are free, we can factor the entire matrix.

            // Find the minimum eigenvalue to regularize the Hessian matrix and

            // make it positive definite.

            ScopedMallocAllower ma;

            // Find the minimum eigenvalue to regularize the Hessian matrix and

            // make it positive definite.

            Eigen::SelfAdjointEigenSolver<mat> eig{H,

                                                   Eigen::ComputeEigenvectors};


            auto λ_min = eig.eigenvalues().minCoeff(),

                 λ_max = eig.eigenvalues().maxCoeff();


            if (reg_params.print_eig)

                std::cout << "λ(H):    " << float_to_str(λ_min, 3) << ", "

                          << float_to_str(λ_max, 3) << std::endl;

            // Regularization

            real_t ε = reg_params.min_eig * (1 + std::abs(λ_max)); // TODO

            // Solve the system

            qₖ = eig.eigenvectors().transpose() * qₖ;

            qₖ = eig.eigenvalues().cwiseMax(ε).asDiagonal().inverse() * qₖ;

            qₖ = eig.eigenvectors() * qₖ;

            return true;

        }


        // There are active indices K

        crindexvec J = JK.topRows(nJ);

        rindexvec K  = JK.bottomRows(n - nJ);

        detail::IndexSet<config_t>::compute_complement(J, K, n);


        // Compute right-hand side of 6.1c

        if (direction_params.hessian_vec)

            qₖ(J).noalias() -= H(J, K) * qₖ(K);


        // If there are active indices, we need to solve the Newton system with

        // just the inactive indices.

        mmat HJ{HJ_storage.data(), nJ, nJ};

        // We copy the inactive block of the Hessian to a temporary dense matrix.

        // Since it's symmetric, only the lower part is copied.

        HJ.template triangularView<Eigen::Lower>() =

            H(J, J).template triangularView<Eigen::Lower>();


        ScopedMallocAllower ma;

        // Find the minimum eigenvalue to regularize the Hessian matrix and

        // make it positive definite.

        Eigen::SelfAdjointEigenSolver<mat> eig{HJ, Eigen::ComputeEigenvectors};


        auto λ_min = eig.eigenvalues().minCoeff(),

             λ_max = eig.eigenvalues().maxCoeff();


        if (reg_params.print_eig)

            std::cout << "λ(H_JJ): " << float_to_str(λ_min, 3) << ", "

                      << float_to_str(λ_max, 3) << std::endl;

        // Regularization

        real_t ε = reg_params.min_eig * (1 + std::abs(λ_max)); // TODO

        // Solve the system

        auto qJ = H.col(0).topRows(nJ);

        qJ      = qₖ(J);

        qJ      = eig.eigenvectors().transpose() * qJ;

        qJ      = eig.eigenvalues().cwiseMax(ε).asDiagonal().inverse() * qJ;

        qₖ(J)   = eig.eigenvectors() * qJ;

        return true;

    }


    /// @see @ref PANOCDirection::changed_γ

    void changed_γ([[maybe_unused]] real_t γₖ, [[maybe_unused]] real_t old_γₖ) {

    }


    /// @see @ref PANOCDirection::reset

    void reset() {}


    /// @see @ref PANOCDirection::get_name

    std::string get_name() const {

        return "StructuredNewtonDirection<" +

               std::string(config_t::get_name()) + '>';

    }


    const auto &get_params() const { return direction_params; }


  private:

    const Problem *problem = nullptr;

#ifndef _WIN32

    std::optional<crvec> y = std::nullopt;

    std::optional<crvec> Σ = std::nullopt;

#else

    std::optional<vec> y = std::nullopt;

    std::optional<vec> Σ = std::nullopt;

#endif


    mutable indexvec JK;

    mutable vec H_storage;

    mutable vec HJ_storage;

    mutable indexvec inner_idx_H, outer_ptr_H;


  public:

    AcceleratorParams reg_params;

    DirectionParams direction_params;

};


// Declarations for StructuredNewtonDirection with each supported
// configuration (the quad-precision one only if ALPAQA_WITH_QUAD_PRECISION is
// defined).
// NOTE(review): judging by the macro name, these are exported
// `extern template` declarations whose definitions live in a compiled source
// file — confirm against export.hpp.
ALPAQA_EXPORT_EXTERN_TEMPLATE(struct, StructuredNewtonDirection, DefaultConfig);

ALPAQA_EXPORT_EXTERN_TEMPLATE(struct, StructuredNewtonDirection, EigenConfigf);

ALPAQA_EXPORT_EXTERN_TEMPLATE(struct, StructuredNewtonDirection, EigenConfigd);

ALPAQA_EXPORT_EXTERN_TEMPLATE(struct, StructuredNewtonDirection, EigenConfigl);

#ifdef ALPAQA_WITH_QUAD_PRECISION

ALPAQA_EXPORT_EXTERN_TEMPLATE(struct, StructuredNewtonDirection, EigenConfigq);

#endif


} // namespace alpaqa


#include <alpaqa/inner/panoc.hpp>


namespace alpaqa {


// Declarations for PANOCSolver combined with StructuredNewtonDirection, one
// per supported configuration (the quad-precision one only if
// ALPAQA_WITH_QUAD_PRECISION is defined). Formatting is disabled because the
// lines exceed the usual width.
// NOTE(review): presumably exported `extern template` declarations, as the
// macro name suggests — confirm against export.hpp.
// clang-format off

ALPAQA_EXPORT_EXTERN_TEMPLATE(class, PANOCSolver, StructuredNewtonDirection<DefaultConfig>);

ALPAQA_EXPORT_EXTERN_TEMPLATE(class, PANOCSolver, StructuredNewtonDirection<EigenConfigf>);

ALPAQA_EXPORT_EXTERN_TEMPLATE(class, PANOCSolver, StructuredNewtonDirection<EigenConfigd>);

ALPAQA_EXPORT_EXTERN_TEMPLATE(class, PANOCSolver, StructuredNewtonDirection<EigenConfigl>);

#ifdef ALPAQA_WITH_QUAD_PRECISION

ALPAQA_EXPORT_EXTERN_TEMPLATE(class, PANOCSolver, StructuredNewtonDirection<EigenConfigq>);

#endif

// clang-format on


} // namespace alpaqa

alloc-check.hpp

alpaqa::TypeErasedProblem< config_t >

alpaqa::TypeErasedProblem::eval_hess_ψ
void eval_hess_ψ(crvec x, crvec y, crvec Σ, real_t scale, rindexvec inner_idx, rindexvec outer_ptr, rvec H_values) const
[Optional] Function that evaluates the Hessian of the augmented Lagrangian,
Definition: type-erased-problem.hpp:775

alpaqa::TypeErasedProblem::provides_get_box_C
bool provides_get_box_C() const
Returns true if the problem provides an implementation of get_box_C.
Definition: type-erased-problem.hpp:648

alpaqa::TypeErasedProblem::get_n
length_t get_n() const
[Required] Number of decision variables.
Definition: type-erased-problem.hpp:697

alpaqa::TypeErasedProblem::provides_eval_hess_ψ
bool provides_eval_hess_ψ() const
Returns true if the problem provides an implementation of eval_hess_ψ.
Definition: type-erased-problem.hpp:613

alpaqa::TypeErasedProblem::provides_get_box_D
bool provides_get_box_D() const
Returns true if the problem provides an implementation of get_box_D.
Definition: type-erased-problem.hpp:651

alpaqa::TypeErasedProblem::get_box_C
const Box & get_box_C() const
[Optional] Get the rectangular constraint set of the decision variables, $x \in C$.
Definition: type-erased-problem.hpp:821

alpaqa::TypeErasedProblem::get_hess_ψ_num_nonzeros
length_t get_hess_ψ_num_nonzeros() const
[Optional] Function that gets the number of nonzeros of the Hessian of the augmented Lagrangian.
Definition: type-erased-problem.hpp:781

config.hpp

USING_ALPAQA_CONFIG
#define USING_ALPAQA_CONFIG(Conf)
Definition: config.hpp:42

export.hpp

ALPAQA_EXPORT_EXTERN_TEMPLATE
#define ALPAQA_EXPORT_EXTERN_TEMPLATE(...)
Definition: export.hpp:21

index-set.hpp

alpaqa
Definition: accelerators/anderson.hpp:10

alpaqa::mvec
typename Conf::mvec mvec
Definition: config.hpp:53

alpaqa::StructuredNewtonDirectionParams::hessian_vec
bool hessian_vec
Set this option to true to include the Hessian-vector product $\nabla^2_{x_\mathcal{J}x_\mathcal{K}}\psi(x)\, q_\mathcal{K}$ from equation 12b in [pas2022alpaqa],...
Definition: structured-newton.hpp:40

alpaqa::indexvec
typename Conf::indexvec indexvec
Definition: config.hpp:64

alpaqa::StructuredNewtonRegularizationParams::min_eig
real_t min_eig
Minimum eigenvalue of the Hessian, scaled by $1 + |\lambda_\mathrm{max}|$, enforced by regularization using a multiple of identit...
Definition: structured-newton.hpp:28

alpaqa::real_t
typename Conf::real_t real_t
Definition: config.hpp:51

alpaqa::rindexvec
typename Conf::rindexvec rindexvec
Definition: config.hpp:65

alpaqa::index_t
typename Conf::index_t index_t
Definition: config.hpp:63

alpaqa::mmat
typename Conf::mmat mmat
Definition: config.hpp:58

alpaqa::length_t
typename Conf::length_t length_t
Definition: config.hpp:62

alpaqa::rvec
typename Conf::rvec rvec
Definition: config.hpp:55

alpaqa::crvec
typename Conf::crvec crvec
Definition: config.hpp:56

alpaqa::vec
typename Conf::vec vec
Definition: config.hpp:52

alpaqa::StructuredNewtonRegularizationParams::print_eig
bool print_eig
Print the minimum and maximum eigenvalue of the Hessian.
Definition: structured-newton.hpp:30

alpaqa::float_to_str
std::string float_to_str(F value, int precision)
Definition: print.tpp:66

alpaqa::crindexvec
typename Conf::crindexvec crindexvec
Definition: config.hpp:66

alpaqa::StructuredNewtonDirectionParams< config_t >

alpaqa::StructuredNewtonDirectionParams
Parameters for the StructuredNewtonDirection class.
Definition: structured-newton.hpp:35

alpaqa::StructuredNewtonRegularizationParams
Parameters for the StructuredNewtonDirection class.
Definition: structured-newton.hpp:23

panoc-direction-update.hpp

panoc-helpers.hpp

panoc.hpp

print.hpp

alpaqa::DefaultConfig
Definition: config.hpp:132

alpaqa::EigenConfigd
Double-precision double configuration.
Definition: config.hpp:115

alpaqa::EigenConfigf
Single-precision float configuration.
Definition: config.hpp:111

alpaqa::EigenConfigl
long double configuration.
Definition: config.hpp:120

alpaqa::ScopedMallocAllower
Definition: alloc-check.hpp:21

alpaqa::StructuredNewtonDirection
Definition: structured-newton.hpp:45

alpaqa::StructuredNewtonDirection::get_name
std::string get_name() const
Definition: structured-newton.hpp:211

alpaqa::StructuredNewtonDirection::changed_γ
void changed_γ(real_t γₖ, real_t old_γₖ)
Definition: structured-newton.hpp:204

alpaqa::StructuredNewtonDirection::StructuredNewtonDirection
StructuredNewtonDirection()=default

alpaqa::StructuredNewtonDirection::get_params
const auto & get_params() const
Definition: structured-newton.hpp:216

alpaqa::StructuredNewtonDirection::direction_params
DirectionParams direction_params
Definition: structured-newton.hpp:235

alpaqa::StructuredNewtonDirection::Params::direction
DirectionParams direction
Definition: structured-newton.hpp:53

alpaqa::StructuredNewtonDirection::StructuredNewtonDirection
StructuredNewtonDirection(const AcceleratorParams &params, const DirectionParams &directionparams={})
Definition: structured-newton.hpp:59

alpaqa::StructuredNewtonDirection::update
bool update(real_t γₖ, real_t γₙₑₓₜ, crvec xₖ, crvec xₙₑₓₜ, crvec pₖ, crvec pₙₑₓₜ, crvec grad_ψxₖ, crvec grad_ψxₙₑₓₜ)
Definition: structured-newton.hpp:98

alpaqa::StructuredNewtonDirection::JK
indexvec JK
Definition: structured-newton.hpp:228

alpaqa::StructuredNewtonDirection::StructuredNewtonDirection
StructuredNewtonDirection(const Params &params)
Definition: structured-newton.hpp:57

alpaqa::StructuredNewtonDirection::inner_idx_H
indexvec inner_idx_H
Definition: structured-newton.hpp:231

alpaqa::StructuredNewtonDirection::reg_params
AcceleratorParams reg_params
Definition: structured-newton.hpp:234

alpaqa::StructuredNewtonDirection::HJ_storage
vec HJ_storage
Definition: structured-newton.hpp:230

alpaqa::StructuredNewtonDirection::y
std::optional< crvec > y
Definition: structured-newton.hpp:221

alpaqa::StructuredNewtonDirection::outer_ptr_H
indexvec outer_ptr_H
Definition: structured-newton.hpp:231

alpaqa::StructuredNewtonDirection::H_storage
vec H_storage
Definition: structured-newton.hpp:229

alpaqa::StructuredNewtonDirection::initialize
void initialize(const Problem &problem, crvec y, crvec Σ, real_t γ_0, crvec x_0, crvec x̂_0, crvec p_0, crvec grad_ψx_0)
Definition: structured-newton.hpp:64

alpaqa::StructuredNewtonDirection::problem
const Problem * problem
Definition: structured-newton.hpp:219

alpaqa::StructuredNewtonDirection::apply
bool apply(real_t γₖ, crvec xₖ, crvec x̂ₖ, crvec pₖ, crvec grad_ψxₖ, rvec qₖ) const
Definition: structured-newton.hpp:107

alpaqa::StructuredNewtonDirection::reset
void reset()
Definition: structured-newton.hpp:208

alpaqa::StructuredNewtonDirection::has_initial_direction
bool has_initial_direction() const
Definition: structured-newton.hpp:95

alpaqa::StructuredNewtonDirection::Params::accelerator
AcceleratorParams accelerator
Definition: structured-newton.hpp:52

alpaqa::StructuredNewtonDirection::Σ
std::optional< crvec > Σ
Definition: structured-newton.hpp:222

alpaqa::StructuredNewtonDirection::Params
Definition: structured-newton.hpp:51

alpaqa::detail::IndexSet::compute_complement
static void compute_complement(std::span< const index_t > in, std::span< index_t > out)
Definition: index-set.hpp:36

type-erased-problem.hpp