conan-profiles/Doxygen/newton-tr_8hpp_source.html

#pragma once


#include <alpaqa/accelerators/steihaugcg.hpp>

#include <alpaqa/problem/type-erased-problem.hpp>

#include <alpaqa/util/alloc-check.hpp>

#include <alpaqa/util/index-set.hpp>

#include <cmath>

#include <limits>

#include <optional>

#include <stdexcept>


namespace alpaqa {


/// Tuning options for the @ref NewtonTRDirection direction provider.
/// @ingroup grp_Parameters
template <Config Conf>
struct NewtonTRDirectionParams {
    USING_ALPAQA_CONFIG(Conf);

    /// Weight applied to the cross term
    /// @f$ \langle H_{\mathcal{JK}} d_{\mathcal {K}}, d_{\mathcal{J}} \rangle @f$
    /// of equation (9) in @cite bodard2023pantr.
    ///
    /// A value of zero drops the term entirely. Doing so usually costs only a
    /// few extra iterations, while saving one Hessian-vector product per
    /// iteration, which tends to reduce the overall runtime.
    real_t hessian_vec_factor = static_cast<real_t>(1);

    /// When true, Hessian-vector products are approximated by finite
    /// differences of the gradient instead of being requested from the
    /// problem.
    bool finite_diff{false};

    /// Base perturbation size used by the finite-difference approximation.
    /// @ref NewtonTRDirection::apply scales it by
    /// @f$ 1+\|x_{\mathcal{J}}\| @f$, where @f$ \mathcal{J} @f$ is the index
    /// set returned by the problem's `eval_inactive_indices_res_lna`.
    /// Defaults to the square root of the machine epsilon of `real_t`.
    real_t finite_diff_stepsize =
        std::sqrt(std::numeric_limits<real_t>::epsilon());
};


/// Direction provider that computes a step by running Steihaug conjugate
/// gradients (@ref SteihaugCG) on the variables in the index set
/// @f$ \mathcal{J} @f$ reported by the problem's
/// `eval_inactive_indices_res_lna`, inside a trust region of a given radius.
/// Hessian-vector products are either requested from the problem or
/// approximated by finite differences of the augmented Lagrangian gradient
/// (see @ref NewtonTRDirectionParams).
///
/// @ref initialize must be called before @ref apply.
/// @ingroup grp_DirectionProviders
template <Config Conf>
struct NewtonTRDirection {
    USING_ALPAQA_CONFIG(Conf);

    using Problem           = TypeErasedProblem<config_t>;
    using AcceleratorParams = SteihaugCGParams<config_t>;
    using DirectionParams   = NewtonTRDirectionParams<config_t>;

    /// Bundle of the Steihaug CG parameters and the direction parameters.
    struct Params {
        AcceleratorParams accelerator = {};
        DirectionParams direction     = {};
    };

    NewtonTRDirection() = default;
    /// Construct from a combined parameter bundle.
    NewtonTRDirection(const Params &params)
        : steihaug(params.accelerator), direction_params(params.direction) {}
    /// Construct from separate accelerator and direction parameters.
    NewtonTRDirection(const AcceleratorParams &params,
                      const DirectionParams &directionparams = {})
        : steihaug(params), direction_params(directionparams) {}

    /// Check that the problem offers the required functions, remember the
    /// problem and the vectors @p y and @p Σ, and size all workspaces.
    ///
    /// @throws std::invalid_argument
    ///         if finite differences are disabled and the problem provides
    ///         neither an augmented Lagrangian Hessian product nor (for
    ///         problems without constraints) a Lagrangian Hessian product,
    ///         or if the problem does not provide
    ///         `eval_inactive_indices_res_lna`.
    /// @see @ref PANTRDirection::initialize
    void initialize(const Problem &problem, crvec y, crvec Σ,
                    [[maybe_unused]] real_t γ_0, [[maybe_unused]] crvec x_0,
                    [[maybe_unused]] crvec x̂_0, [[maybe_unused]] crvec p_0,
                    [[maybe_unused]] crvec grad_ψx_0) {
        if (!direction_params.finite_diff &&
            !problem.provides_eval_augmented_lagrangian_hessian_product() &&
            !(problem.provides_eval_lagrangian_hessian_product() &&
              problem.get_num_constraints() == 0))
            throw std::invalid_argument(
                "NewtonTR without finite differences requires "
                "Problem::eval_augmented_lagrangian_hessian_product()");
        if (!problem.provides_eval_inactive_indices_res_lna())
            throw std::invalid_argument(
                "NewtonTR requires "
                "Problem::eval_inactive_indices_res_lna()");
        // Store references to problem and ALM variables
        this->problem = &problem;
        this->y.emplace(y);
        this->Σ.emplace(Σ);
        // Resize workspaces
        const auto n = problem.get_num_variables(),
                   m = problem.get_num_constraints();
        JK_sto.resize(n);
        rJ_sto.resize(n);
        qJ_sto.resize(n);
        work.resize(n);
        work_2.resize(n);
        steihaug.resize(n);
        // The extra gradient workspaces are only used by the
        // finite-difference code paths in apply().
        if (direction_params.finite_diff) {
            work_n_fd.resize(n);
            work_m_fd.resize(m);
        }
    }

    /// Always true: @ref apply does not depend on any prior @ref update.
    /// @see @ref PANTRDirection::has_initial_direction
    bool has_initial_direction() const { return true; }

    /// No state is carried between iterations, so this is a no-op that
    /// always reports success.
    /// @see @ref PANTRDirection::update
    bool update([[maybe_unused]] real_t γₖ, [[maybe_unused]] real_t γₙₑₓₜ,
                [[maybe_unused]] crvec xₖ, [[maybe_unused]] crvec xₙₑₓₜ,
                [[maybe_unused]] crvec pₖ, [[maybe_unused]] crvec pₙₑₓₜ,
                [[maybe_unused]] crvec grad_ψxₖ,
                [[maybe_unused]] crvec grad_ψxₙₑₓₜ) {
        return true;
    }

    /// Compute the step @p qₖ for the current iterate.
    ///
    /// On the complement @f$ \mathcal{K} @f$ of the index set
    /// @f$ \mathcal{J} @f$, @p qₖ is set to @p pₖ. On @f$ \mathcal{J} @f$,
    /// it is the result of the Steihaug CG solve with the given @p radius.
    ///
    /// @return The value returned by the Steihaug solver minus
    ///         @f$ \|p_{\mathcal{K}}\|^2 / (2\gamma_k) @f$.
    /// @throws std::logic_error
    ///         if @ref initialize has not been called, if @p radius is not
    ///         finite, or if @p radius is smaller than the machine epsilon.
    /// @see @ref PANTRDirection::apply
    real_t apply(real_t γₖ, crvec xₖ, [[maybe_unused]] crvec x̂ₖ, crvec pₖ,
                 crvec grad_ψxₖ, real_t radius, rvec qₖ) const {

        // Guard against use before initialize(): dereferencing the null
        // problem pointer or the empty optionals below would be undefined
        // behavior.
        if (!problem || !y || !Σ)
            throw std::logic_error(
                "NewtonTRDirection::apply called before initialize");
        if (!std::isfinite(radius))
            throw std::logic_error("Invalid trust radius");
        if (radius < std::numeric_limits<real_t>::epsilon())
            throw std::logic_error("Trust radius too small");

        // Newton with exact Hessian

        // Find inactive and active constraints: the first nJ entries of
        // JK_sto hold J, the remaining n - nJ entries receive its
        // complement K.
        const auto n = problem->get_num_variables();
        index_t nJ =
            problem->eval_inactive_indices_res_lna(γₖ, xₖ, grad_ψxₖ, JK_sto);
        crindexvec J = JK_sto.topRows(nJ);
        rindexvec K  = JK_sto.bottomRows(n - nJ);
        detail::IndexSet<config_t>::compute_complement(J, K, n);
        auto rJ = rJ_sto.topRows(nJ);
        auto qJ = qJ_sto.topRows(nJ);
        rJ      = (-real_t(1) / γₖ) * pₖ(J);
        qₖ(K)   = pₖ(K);
        qₖ(J).setZero();
        real_t norm_qK_sq = pₖ(K).squaredNorm();

        // Finite-difference step size. It only depends on xₖ and J, which do
        // not change during this call, so it is computed once here instead
        // of on every Hessian-vector product requested by the CG solver.
        /// TODO: use a better rule to determine the step size
        const bool use_fd = direction_params.finite_diff;
        const real_t ε =
            use_fd ? (1 + xₖ(J).norm()) * direction_params.finite_diff_stepsize
                   : real_t(0);

        // Hessian-vector term: at this point qₖ is zero on J and equal to pₖ
        // on K, so the J-rows of H qₖ couple the two index sets.
        if (direction_params.hessian_vec_factor != 0) {
            if (use_fd) {
                work = xₖ + ε * qₖ;
                problem->eval_augmented_lagrangian_gradient(
                    work, *y, *Σ, work_2, work_n_fd, work_m_fd);
                rJ.noalias() += (work_2 - grad_ψxₖ)(J) *
                                (direction_params.hessian_vec_factor / ε);
            } else {
                problem->eval_augmented_lagrangian_hessian_product(xₖ, *y, *Σ,
                                                                   1, qₖ, work);
                rJ.noalias() += work(J) * direction_params.hessian_vec_factor;
            }
        }

        // Hessian-vector product on subset J: p is scattered into a
        // full-size vector, multiplied (or differenced), and the J-rows of
        // the result are gathered into the leading nJ rows of Bp.
        auto hess_vec_mult = [&](crvec p, rvec Bp) {
            if (use_fd) {
                work = xₖ;
                work(J) += ε * p;
                problem->eval_augmented_lagrangian_gradient(
                    work, *y, *Σ, work_2, work_n_fd, work_m_fd);
                Bp.topRows(nJ) = (work_2 - grad_ψxₖ)(J) / ε;
            } else {
                work.setZero();
                work(J) = p;
                problem->eval_augmented_lagrangian_hessian_product(
                    xₖ, *y, *Σ, 1, work, work_2);
                Bp.topRows(nJ) = work_2(J);
            }
        };

        // Steihaug conjugate gradients
        real_t qJ_model = steihaug.solve(rJ, hess_vec_mult, radius, qJ);
        qₖ(J)           = qJ;
        return qJ_model - norm_qK_sq / (2 * γₖ);
    }

    /// Nothing depends on the step size between calls, so this is a no-op.
    /// @see @ref PANTRDirection::changed_γ
    void changed_γ([[maybe_unused]] real_t γₖ, [[maybe_unused]] real_t old_γₖ) {
    }

    /// No internal state to reset.
    /// @see @ref PANTRDirection::reset
    void reset() {}

    /// Name of this direction, including the configuration name.
    /// @see @ref PANTRDirection::get_name
    std::string get_name() const {
        return "NewtonTRDirection<" + std::string(config_t::get_name()) + '>';
    }

    /// Tuple of references to the Steihaug CG and direction parameters.
    auto get_params() const {
        return std::tie(steihaug.params, direction_params);
    }

    /// Conjugate gradients solver used for the trust-region subproblem.
    SteihaugCG<config_t> steihaug;
    /// Options specific to this direction.
    DirectionParams direction_params;
    /// Problem set by initialize(); null until then.
    const Problem *problem = nullptr;
    // The vectors y and Σ passed to initialize(). Outside Windows they are
    // kept as crvec (presumably non-owning views, so the caller's vectors
    // must outlive this object -- confirm); on Windows copies are stored.
    // NOTE(review): the reason for the platform difference is not visible
    // in this file.
#ifndef _WIN32
    std::optional<crvec> y = std::nullopt;
    std::optional<crvec> Σ = std::nullopt;
#else
    std::optional<vec> y = std::nullopt;
    std::optional<vec> Σ = std::nullopt;
#endif
    /// Storage for the index set J (leading entries) and its complement K.
    mutable indexvec JK_sto;
    /// Storage for the right-hand side handed to the CG solver.
    mutable vec rJ_sto;
    /// Storage for the CG solution on J.
    mutable vec qJ_sto;
    /// Scratch vectors; the *_fd ones are only sized when finite
    /// differences are enabled.
    mutable vec work, work_2, work_n_fd, work_m_fd;
};


} // namespace alpaqa

alloc-check.hpp

alpaqa::TypeErasedProblem
The main polymorphic minimization problem interface.
Definition type-erased-problem.hpp:243

USING_ALPAQA_CONFIG
#define USING_ALPAQA_CONFIG(Conf)
Definition config.hpp:77

alpaqa::NewtonTRDirectionParams< config_t >::hessian_vec_factor
real_t hessian_vec_factor
Definition newton-tr.hpp:25

alpaqa::NewtonTRDirectionParams< config_t >::finite_diff
bool finite_diff
Definition newton-tr.hpp:27

alpaqa::NewtonTRDirectionParams< config_t >::finite_diff_stepsize
real_t finite_diff_stepsize
Definition newton-tr.hpp:30

alpaqa::NewtonTRDirectionParams
Parameters for the NewtonTRDirection class.
Definition newton-tr.hpp:17

alpaqa::SteihaugCGParams
Parameters for SteihaugCG.
Definition steihaugcg.hpp:12

index-set.hpp

alpaqa::params
Definition json.tpp:12

alpaqa
Definition anderson.hpp:10

alpaqa::indexvec
typename Conf::indexvec indexvec
Definition config.hpp:105

alpaqa::real_t
typename Conf::real_t real_t
Definition config.hpp:86

alpaqa::rindexvec
typename Conf::rindexvec rindexvec
Definition config.hpp:106

alpaqa::index_t
typename Conf::index_t index_t
Definition config.hpp:104

alpaqa::rvec
typename Conf::rvec rvec
Definition config.hpp:91

alpaqa::crvec
typename Conf::crvec crvec
Definition config.hpp:92

alpaqa::vec
typename Conf::vec vec
Definition config.hpp:88

alpaqa::crindexvec
typename Conf::crindexvec crindexvec
Definition config.hpp:107

steihaugcg.hpp

alpaqa::NewtonTRDirection::get_name
std::string get_name() const
Definition newton-tr.hpp:182

alpaqa::NewtonTRDirection::changed_γ
void changed_γ(real_t γₖ, real_t old_γₖ)
Definition newton-tr.hpp:175

alpaqa::NewtonTRDirection::steihaug
SteihaugCG< config_t > steihaug
Definition newton-tr.hpp:190

alpaqa::NewtonTRDirection::apply
real_t apply(real_t γₖ, crvec xₖ, crvec x̂ₖ, crvec pₖ, crvec grad_ψxₖ, real_t radius, rvec qₖ) const
Definition newton-tr.hpp:104

alpaqa::NewtonTRDirection::NewtonTRDirection
NewtonTRDirection(const Params &params)
Definition newton-tr.hpp:49

alpaqa::NewtonTRDirection::NewtonTRDirection
NewtonTRDirection(const AcceleratorParams &params, const DirectionParams &directionparams={})
Definition newton-tr.hpp:51

alpaqa::NewtonTRDirection::direction_params
DirectionParams direction_params
Definition newton-tr.hpp:191

alpaqa::NewtonTRDirection::Params::direction
DirectionParams direction
Definition newton-tr.hpp:45

alpaqa::NewtonTRDirection::update
bool update(real_t γₖ, real_t γₙₑₓₜ, crvec xₖ, crvec xₙₑₓₜ, crvec pₖ, crvec pₙₑₓₜ, crvec grad_ψxₖ, crvec grad_ψxₙₑₓₜ)
Definition newton-tr.hpp:95

alpaqa::NewtonTRDirection::work_m_fd
vec work_m_fd
Definition newton-tr.hpp:203

alpaqa::NewtonTRDirection::get_params
auto get_params() const
Definition newton-tr.hpp:186

alpaqa::NewtonTRDirection::work_n_fd
vec work_n_fd
Definition newton-tr.hpp:203

alpaqa::NewtonTRDirection::NewtonTRDirection
NewtonTRDirection()=default

alpaqa::NewtonTRDirection::work_2
vec work_2
Definition newton-tr.hpp:203

alpaqa::NewtonTRDirection::rJ_sto
vec rJ_sto
Definition newton-tr.hpp:201

alpaqa::NewtonTRDirection::qJ_sto
vec qJ_sto
Definition newton-tr.hpp:202

alpaqa::NewtonTRDirection::y
std::optional< crvec > y
Definition newton-tr.hpp:194

alpaqa::NewtonTRDirection::initialize
void initialize(const Problem &problem, crvec y, crvec Σ, real_t γ_0, crvec x_0, crvec x̂_0, crvec p_0, crvec grad_ψx_0)
Definition newton-tr.hpp:56

alpaqa::NewtonTRDirection::problem
const Problem * problem
Definition newton-tr.hpp:192

alpaqa::NewtonTRDirection::AcceleratorParams
SteihaugCGParams< config_t > AcceleratorParams
Definition newton-tr.hpp:40

alpaqa::NewtonTRDirection::work
vec work
Definition newton-tr.hpp:203

alpaqa::NewtonTRDirection::reset
void reset()
Definition newton-tr.hpp:179

alpaqa::NewtonTRDirection::has_initial_direction
bool has_initial_direction() const
Definition newton-tr.hpp:92

alpaqa::NewtonTRDirection::Params::accelerator
AcceleratorParams accelerator
Definition newton-tr.hpp:44

alpaqa::NewtonTRDirection::DirectionParams
NewtonTRDirectionParams< config_t > DirectionParams
Definition newton-tr.hpp:41

alpaqa::NewtonTRDirection::Problem
TypeErasedProblem< config_t > Problem
Definition newton-tr.hpp:39

alpaqa::NewtonTRDirection::Σ
std::optional< crvec > Σ
Definition newton-tr.hpp:195

alpaqa::NewtonTRDirection::JK_sto
indexvec JK_sto
Definition newton-tr.hpp:200

alpaqa::NewtonTRDirection::Params
Definition newton-tr.hpp:43

alpaqa::SteihaugCG
Steihaug conjugate gradients procedure based on https://github.com/scipy/scipy/blob/583e70a50573169fc...
Definition steihaugcg.hpp:39

alpaqa::detail::IndexSet::compute_complement
static void compute_complement(std::span< const index_t > in, std::span< index_t > out)
Definition index-set.hpp:37

type-erased-problem.hpp