develop/Doxygen/data_8tpp_source.html

#include <cyqlone/cyqlone.hpp>


#include <batmat/assume.hpp>

#include <batmat/linalg/simdify.hpp>

#include <guanaqo/blas/hl-blas-interface.hpp>

#include <limits>

#if !BATMAT_WITH_OPENMP

#include <batmat/thread-pool.hpp>

#endif


namespace CYQLONE_NS(cyqlone) {


using batmat::linalg::simdify;


namespace detail {

/// Element-wise matrix copy `dst = src` between views with independent element types, strides and
/// storage orders.
///
/// Deliberately simple (and inefficient): it only uses element access, so it also supports
/// slices with non-unit strides.
///
/// @param src  View that is read.
/// @param dst  View that is written; must have the same number of rows and columns as @p src.
template <class T1, class I1, class S1, guanaqo::StorageOrder O1, class T2, class I2, class S2,
          guanaqo::StorageOrder O2>
void copy(guanaqo::MatrixView<T1, I1, S1, O1> src, guanaqo::MatrixView<T2, I2, S2, O2> dst) {
    assert(src.rows == dst.rows);
    assert(src.cols == dst.cols);
    const auto num_rows = src.rows;
    const auto num_cols = src.cols;
    // TODO: optimize
    for (index_t row = 0; row < num_rows; ++row) {
        for (index_t col = 0; col < num_cols; ++col) {
            dst(row, col) = src(row, col);
        }
    }
}


template <class T0, class T1, class I1, class S1, guanaqo::StorageOrder O1, class T2, class I2,

          class S2, guanaqo::StorageOrder O2>

/// Simple (inefficient) scaled matrix copy that supports slices with non-unit strides.


void scale(T0 scalar, guanaqo::MatrixView<T1, I1, S1, O1> src,

           guanaqo::MatrixView<T2, I2, S2, O2> dst) {

    assert(src.rows == dst.rows);

    assert(src.cols == dst.cols);

    for (index_t r = 0; r < src.rows; ++r) // TODO: optimize

        for (index_t c = 0; c < src.cols; ++c)

            dst(r, c) = scalar * src(r, c);

}


} // namespace detail


// Create a solver with the dimensions of the given OCP and `p` processors/threads, and load the
// OCP data into it through update_data().
//
// Preconditions (checked with BATMAT_ASSERT): p > 0, and p is a power of two unless the vector
// length v is 1.
template <index_t VL, class T, StorageOrder DefaultOrder, class Ctx>
CyqloneSolver<VL, T, DefaultOrder, Ctx>
CyqloneSolver<VL, T, DefaultOrder, Ctx>::build(const CyqloneStorage<value_type> &ocp, index_t p) {
    BATMAT_ASSERT(p > 0);
    BATMAT_ASSERT(v == 1 || is_pow_2(p));
    // Use the injected class name: spelling out CyqloneSolver<VL, T, DefaultOrder> would drop Ctx
    // and name a different specialization than the return type whenever Ctx is not the default.
    CyqloneSolver res{
        .N_horiz = ocp.N_horiz,
        .nx      = ocp.nx,
        .nu      = ocp.nu,
        .ny      = ocp.ny,
        .ny_0    = ocp.ny_0,
        .ny_N    = ocp.ny_N,
        .p       = p,
    };
    res.update_data(ocp);
    return res;
}


// For lgp = 5, lgv = 2, N = 3 << lgp

//

// | Stage j | Thread c | Index i | Data di | λ(A) | λ(I) | bλ(A) | bλ(I) |

// |:-------:|:--------:|:-------:|:-------:|-----:|-----:|------:|------:|

// | 0/96    | 0        | 0       | 0       | 0    | 93   | 0     | 7*    |

// | 95      | 0        | 1       | 1       |      |      |       |       |

// | 94      | 0        | 2       | 2       |      |      |       |       |

// |         |          |         |         |      |      |       |       |

// | 3       | 1        | 0       | 3       | 3    | 0    | 1     | 0     |

// | 2       | 1        | 1       | 4       |      |      |       |       |

// | 1       | 1        | 2       | 5       |      |      |       |       |

// |         |          |         |         |      |      |       |       |

// | 6       | 2        | 0       | 6       | 6    | 3    | 2     | 1     |

// | 5       | 2        | 1       | 7       |      |      |       |       |

// | 4       | 2        | 2       | 8       |      |      |       |       |

// |         |          |         |         |      |      |       |       |

// | 9       | 3        | 0       | 9       | 9    | 6    | 3     | 2     |

// | 8       | 3        | 1       | 10      |      |      |       |       |

// | 7       | 3        | 2       | 11      |      |      |       |       |

// |         |          |         |         |      |      |       |       |

// | 12      | 4        | 0       | 12      | 12   | 9    | 4     | 3     |

// | 11      | 4        | 1       | 13      |      |      |       |       |

// | 10      | 4        | 2       | 14      |      |      |       |       |

// |         |          |         |         |      |      |       |       |

// | 15      | 5        | 0       | 15      | 15   | 12   | 5     | 4     |

// | 14      | 5        | 1       | 16      |      |      |       |       |

// | 13      | 5        | 2       | 17      |      |      |       |       |

// |         |          |         |         |      |      |       |       |

// | 18      | 6        | 0       | 18      | 18   | 15   | 6     | 5     |

// | 17      | 6        | 1       | 19      |      |      |       |       |

// | 16      | 6        | 2       | 20      |      |      |       |       |

// |         |          |         |         |      |      |       |       |

// | 21      | 7        | 0       | 21      | 21   | 18   | 7     | 6     |

// | 20      | 7        | 1       | 22      |      |      |       |       |

// | 19      | 7        | 2       | 23      |      |      |       |       |


// Load the OCP matrices from the Cyqlone storage into the batched solver storage.
//
// For every thread ti, index i within the thread and vector lane vi, the stage index k is
// computed by sub_wrap_ceil_N, and lane vi of batch di = ti * n + i of data_F, data_H and data_Gᵀ
// is filled as follows (with α = 1 / (ceil_N() - N_horiz + 1)):
//   - k == 0:          without padding (ceil_N() == N_horiz), F(0) and H(0) are copied verbatim;
//                      with padding, only B and R are copied, A and S are zeroed, and Q = α Q(N).
//                      In both cases the first ny_0 + ny_N columns of Gᵀ come from data_G0N(0).
//   - 0 < k < N_horiz: F(k) and H(k) are copied, and the first ny columns of Gᵀ come from
//                      data_G(k - 1).
//   - otherwise:       padding stage with B = 0, A = I, S = 0, R = I, Q = α Q(N) and the first ny
//                      columns of Gᵀ zeroed.
// The dimensions of `ocp` must match the ones this solver was built with.
template <index_t VL, class T, StorageOrder DefaultOrder, class Ctx>
void CyqloneSolver<VL, T, DefaultOrder, Ctx>::update_data(const CyqloneStorage<value_type> &ocp) {
    using cyqlone::detail::copy;
    using cyqlone::detail::scale;
    BATMAT_ASSERT(ocp.N_horiz == N_horiz);
    BATMAT_ASSERT(ocp.nx == nx);
    BATMAT_ASSERT(ocp.nu == nu);
    BATMAT_ASSERT(ocp.ny == ny);
    BATMAT_ASSERT(ocp.ny_0 == ny_0);
    BATMAT_ASSERT(ocp.ny_N == ny_N);
    const bool no_padding = ceil_N() == N_horiz;
    const auto alpha      = 1 / static_cast<value_type>(ceil_N() - N_horiz + 1);
    for (index_t ti = 0; ti < p; ++ti) {
        for (index_t i = 0; i < n; ++i) {
            const index_t di = ti * n + i;
            for (index_t vi = 0; vi < v; ++vi) {
                const index_t k = sub_wrap_ceil_N(ti * n + vi * p * n, i);
                // Destination views for this batch and lane
                auto F_dst  = data_F.batch(di)(vi);
                auto H_dst  = data_H.batch(di)(vi);
                auto Gt_dst = data_Gᵀ.batch(di)(vi);
                if (k == 0) {
                    if (no_padding) {
                        copy(ocp.data_F(0), F_dst); // A, B
                        copy(ocp.data_H(0), H_dst); // R, S, Q
                    } else {
                        copy(ocp.data_F(0).left_cols(nu), F_dst.left_cols(nu));   // B
                        F_dst.right_cols(nx).set_constant(0);                     // A = 0
                        copy(ocp.data_H(0).top_left(nu, nu), H_dst.top_left(nu, nu)); // R
                        H_dst.bottom_left(nx, nu).set_constant(0);                // S = 0
                        scale(alpha, ocp.data_H(0).bottom_right(nx, nx),
                              H_dst.bottom_right(nx, nx));                        // Q = α Q(N)
                    }
                    copy(ocp.data_G0N(0).transposed(), Gt_dst.left_cols(ny_0 + ny_N)); // D, C
                } else if (k < N_horiz) {
                    copy(ocp.data_F(k), F_dst);                               // A, B
                    copy(ocp.data_H(k), H_dst);                               // R, S, Q
                    copy(ocp.data_G(k - 1).transposed(), Gt_dst.left_cols(ny)); // D, C
                } else {
                    F_dst.set_constant(0);                   // B = 0
                    F_dst.right_cols(nx).set_diagonal(1);    // A = I
                    H_dst.left_cols(nu).set_constant(0);     // S = 0
                    H_dst.top_left(nu, nu).set_diagonal(1);  // R = I
                    scale(alpha, ocp.data_H(0).bottom_right(nx, nx),
                          H_dst.bottom_right(nx, nx));       // Q = α Q(N)
                    Gt_dst.left_cols(ny).set_constant(0);    // D, C
                }
            }
        }
    }
}


// Fill the batched right-hand side `rhs` (depth ceil_N(), nx rows, one column) from ocp.data_c.
// Lanes that map to a stage k < N_horiz receive data_c(k); all other (padding) lanes are zeroed.
template <index_t VL, class T, StorageOrder DefaultOrder, class Ctx>
void CyqloneSolver<VL, T, DefaultOrder, Ctx>::initialize_rhs(const CyqloneStorage<value_type> &ocp,
                                                             mut_view<> rhs) const {
    BATMAT_ASSERT(rhs.depth() == ceil_N());
    BATMAT_ASSERT(rhs.rows() == nx);
    BATMAT_ASSERT(rhs.cols() == 1);
    for (index_t thread = 0; thread < p; ++thread) {
        for (index_t offset = 0; offset < n; ++offset) {
            const index_t batch_idx = thread * n + offset;
            for (index_t lane = 0; lane < v; ++lane) {
                const index_t stage = sub_wrap_ceil_N(thread * n + lane * p * n, offset);
                if (stage >= N_horiz) {
                    // Padding stage: no right-hand side data available
                    rhs.batch(batch_idx)(lane).set_constant(0);
                    continue;
                }
                rhs.batch(batch_idx)(lane) = ocp.data_c(stage);
            }
        }
    }
}


// Fill the batched gradient `grad` (depth ceil_N(), nu + nx rows, one column) from ocp.data_rq.
//
// With α = 1 / (ceil_N() - N_horiz + 1):
//   - 0 < k < N_horiz:              data_rq(k) is copied.
//   - k == 0 without padding:       data_rq(0) is copied.
//   - k == 0 with padding:          the top nu rows of data_rq(0) are copied, and the bottom nx
//                                   rows are α times the bottom nx rows of data_rq(0).
//   - otherwise (padding stage):    the top nu rows are zeroed, and the bottom nx rows are α times
//                                   the bottom nx rows of data_rq(0).
template <index_t VL, class T, StorageOrder DefaultOrder, class Ctx>
void CyqloneSolver<VL, T, DefaultOrder, Ctx>::initialize_gradient(
    const CyqloneStorage<value_type> &ocp, mut_view<> grad) const {
    BATMAT_ASSERT(grad.depth() == ceil_N());
    BATMAT_ASSERT(grad.rows() == nu + nx);
    BATMAT_ASSERT(grad.cols() == 1);
    const bool no_padding = ceil_N() == N_horiz;
    const auto alpha      = 1 / static_cast<value_type>(ceil_N() - N_horiz + 1);
    for (index_t thread = 0; thread < p; ++thread) {
        for (index_t offset = 0; offset < n; ++offset) {
            const index_t batch_idx = thread * n + offset;
            for (index_t lane = 0; lane < v; ++lane) {
                const index_t stage = sub_wrap_ceil_N(thread * n + lane * p * n, offset);
                // Regular intermediate stage
                if (stage != 0 && stage < N_horiz) {
                    grad.batch(batch_idx)(lane) = ocp.data_rq(stage);
                    continue;
                }
                // Stage 0 of a problem without padding
                if (stage == 0 && no_padding) {
                    grad.batch(batch_idx)(lane) = ocp.data_rq(0);
                    continue;
                }
                // Stage 0 with padding, or a padding stage: only the top rows differ
                if (stage == 0)
                    grad.batch(batch_idx)(lane).top_rows(nu) = ocp.data_rq(0).top_rows(nu);
                else
                    grad.batch(batch_idx)(lane).top_rows(nu).set_constant(0);
                cyqlone::detail::scale(alpha, ocp.data_rq(0).bottom_rows(nx),
                                       grad.batch(batch_idx)(lane).bottom_rows(nx));
            }
        }
    }
}


// Fill the batched lower and upper bounds `b_min` and `b_max` (each with depth ceil_N(),
// max(ny, ny_0 + ny_N) rows and one column) from the OCP storage.
//
//   - k == 0:          the top ny_0 + ny_N rows come from data_lb0N(0) / data_ub0N(0).
//   - 0 < k < N_horiz: the top ny rows come from data_lb(k - 1) / data_ub(k - 1).
//   - otherwise:       padding stage without any bounds.
// All rows that are not covered by OCP data are set to -inf (lower) and +inf (upper).
template <index_t VL, class T, StorageOrder DefaultOrder, class Ctx>
void CyqloneSolver<VL, T, DefaultOrder, Ctx>::initialize_bounds(
    const CyqloneStorage<value_type> &ocp, mut_view<> b_min, mut_view<> b_max) const {
    const index_t ny_0N = ny_0 + ny_N;
    const index_t nyM   = std::max(ny, ny_0N);
    BATMAT_ASSERT(b_min.depth() == ceil_N());
    BATMAT_ASSERT(b_min.rows() == nyM);
    BATMAT_ASSERT(b_min.cols() == 1);
    BATMAT_ASSERT(b_max.depth() == ceil_N());
    BATMAT_ASSERT(b_max.rows() == nyM);
    BATMAT_ASSERT(b_max.cols() == 1);
    const auto inf = std::numeric_limits<value_type>::infinity();
    for (index_t thread = 0; thread < p; ++thread) {
        for (index_t offset = 0; offset < n; ++offset) {
            const index_t batch_idx = thread * n + offset;
            for (index_t lane = 0; lane < v; ++lane) {
                const index_t stage = sub_wrap_ceil_N(thread * n + lane * p * n, offset);
                auto lower = b_min.batch(batch_idx)(lane);
                auto upper = b_max.batch(batch_idx)(lane);
                if (stage == 0) {
                    lower.top_rows(ny_0N) = ocp.data_lb0N(0);
                    upper.top_rows(ny_0N) = ocp.data_ub0N(0);
                    lower.bottom_rows(nyM - ny_0N).set_constant(-inf);
                    upper.bottom_rows(nyM - ny_0N).set_constant(+inf);
                    continue;
                }
                if (stage < N_horiz) {
                    lower.top_rows(ny) = ocp.data_lb(stage - 1);
                    upper.top_rows(ny) = ocp.data_ub(stage - 1);
                    lower.bottom_rows(nyM - ny).set_constant(-inf);
                    upper.bottom_rows(nyM - ny).set_constant(+inf);
                    continue;
                }
                // Padding stage: unbounded
                lower.set_constant(-inf);
                upper.set_constant(+inf);
            }
        }
    }
}


// Pack the linear vector of primal variables `ux_lin` into the batched storage `ux`
// (depth ceil_N(), nu + nx rows, one column).
//
// `ux_lin` consists of N_horiz consecutive blocks of nu + nx values: block j holds the nu controls
// of stage j followed by the nx states of stage j + 1. In `ux`, each lane stores the controls of
// its stage k in the top nu rows and the states of stage k in the bottom nx rows:
//   - k == 0:          controls of stage 0; the states are the final states (last block) if there
//                      is no padding (ceil_N() == N_horiz), and zero otherwise.
//   - 0 < k < N_horiz: controls and states of stage k.
//   - k == N_horiz:    (only reachable with padding) the final states; the controls are zeroed.
//   - k > N_horiz:     padding stage, all zero.
template <index_t VL, class T, StorageOrder DefaultOrder, class Ctx>
void CyqloneSolver<VL, T, DefaultOrder, Ctx>::pack_variables(std::span<const value_type> ux_lin,
                                                             mut_view<> ux) const {
    const index_t nux = nu + nx;
    BATMAT_ASSERT(static_cast<index_t>(ux_lin.size()) == nux * N_horiz);
    BATMAT_ASSERT(ux.depth() == ceil_N());
    BATMAT_ASSERT(ux.rows() == nux);
    BATMAT_ASSERT(ux.cols() == 1);
    using crview = guanaqo::MatrixView<const value_type, index_t>;
    for (index_t ti = 0; ti < p; ++ti) {
        const index_t k0  = ti * n;
        const index_t di0 = ti * n;
        for (index_t i = 0; i < n; ++i) {
            const index_t di = di0 + i;
            for (index_t vi = 0; vi < v; ++vi) {
                const index_t k = sub_wrap_ceil_N(k0 + vi * p * n, i);
                auto ux_k       = ux.batch(di)(vi);
                if (k == 0) {
                    ux_k.top_rows(nu) = crview::as_column(ux_lin.first(nu));
                    if (ceil_N() == N_horiz)
                        ux_k.bottom_rows(nx) =
                            crview::as_column(ux_lin.subspan(nu + (N_horiz - 1) * nux, nx));
                    else
                        ux_k.bottom_rows(nx).set_constant(0);
                } else if (k < N_horiz) {
                    ux_k.top_rows(nu) = crview::as_column(ux_lin.subspan(k * nux, nu));
                    ux_k.bottom_rows(nx) =
                        crview::as_column(ux_lin.subspan(nu + (k - 1) * nux, nx));
                } else if (k == N_horiz) {
                    // only pack the last state if we have padding stages
                    // There are no controls at this stage: zero them explicitly, so that a reused
                    // buffer does not keep stale values (every other branch writes all rows).
                    ux_k.top_rows(nu).set_constant(0);
                    ux_k.bottom_rows(nx) =
                        crview::as_column(ux_lin.subspan(nu + (N_horiz - 1) * nux, nx));
                } else {
                    ux_k.set_constant(0);
                }
            }
        }
    }
}


// Unpack the batched primal variables `ux` (depth ceil_N(), nu + nx rows, one column) into the
// linear vector `ux_lin` of N_horiz blocks of nu + nx values (controls of stage j followed by the
// states of stage j + 1).
//
//   - k == 0:          the top nu rows are the controls of stage 0; without padding
//                      (ceil_N() == N_horiz), the bottom nx rows are written as the final states.
//   - 0 < k < N_horiz: the top nu rows are the controls and the bottom nx rows the states of
//                      stage k.
//   - k == N_horiz:    (only reachable with padding) the bottom nx rows are the final states.
// Other padding stages are not read.
template <index_t VL, class T, StorageOrder DefaultOrder, class Ctx>
void CyqloneSolver<VL, T, DefaultOrder, Ctx>::unpack_variables(view<> ux,
                                                               std::span<value_type> ux_lin) const {
    const index_t nux = nu + nx;
    BATMAT_ASSERT(static_cast<index_t>(ux_lin.size()) == nux * N_horiz);
    BATMAT_ASSERT(ux.depth() == ceil_N());
    BATMAT_ASSERT(ux.rows() == nux);
    BATMAT_ASSERT(ux.cols() == 1);
    using rview = guanaqo::MatrixView<value_type, index_t>;
    for (index_t thread = 0; thread < p; ++thread) {
        for (index_t offset = 0; offset < n; ++offset) {
            const index_t batch_idx = thread * n + offset;
            for (index_t lane = 0; lane < v; ++lane) {
                const index_t stage = sub_wrap_ceil_N(thread * n + lane * p * n, offset);
                auto packed         = ux.batch(batch_idx)(lane);
                if (stage == 0) {
                    rview::as_column(ux_lin.first(nu)) = packed.top_rows(nu);
                    if (ceil_N() == N_horiz) {
                        rview::as_column(ux_lin.subspan(nu + (N_horiz - 1) * nux, nx)) =
                            packed.bottom_rows(nx);
                    }
                    continue;
                }
                if (stage < N_horiz) {
                    rview::as_column(ux_lin.subspan(stage * nux, nu)) = packed.top_rows(nu);
                    rview::as_column(ux_lin.subspan(nu + (stage - 1) * nux, nx)) =
                        packed.bottom_rows(nx);
                    continue;
                }
                if (stage == N_horiz) {
                    // only unpack the last state if we have padding stages
                    rview::as_column(ux_lin.subspan(nu + (N_horiz - 1) * nux, nx)) =
                        packed.bottom_rows(nx);
                }
            }
        }
    }
}


// Pack the linear vector `λ_lin` (N_horiz blocks of nx values) into the batched storage `λ`
// (depth ceil_N(), nx rows, one column). Lanes that map to a stage k < N_horiz receive block k;
// all other (padding) lanes are zeroed.
template <index_t VL, class T, StorageOrder DefaultOrder, class Ctx>
void CyqloneSolver<VL, T, DefaultOrder, Ctx>::pack_dynamics(std::span<const value_type> λ_lin,
                                                            mut_view<> λ) const {
    const index_t block_size = nx;
    BATMAT_ASSERT(static_cast<index_t>(λ_lin.size()) == block_size * N_horiz);
    BATMAT_ASSERT(λ.depth() == ceil_N());
    BATMAT_ASSERT(λ.rows() == block_size);
    BATMAT_ASSERT(λ.cols() == 1);
    using crview = guanaqo::MatrixView<const value_type, index_t>;
    for (index_t thread = 0; thread < p; ++thread) {
        for (index_t offset = 0; offset < n; ++offset) {
            const index_t batch_idx = thread * n + offset;
            for (index_t lane = 0; lane < v; ++lane) {
                const index_t stage = sub_wrap_ceil_N(thread * n + lane * p * n, offset);
                if (stage >= N_horiz) {
                    // Padding stage: no multipliers in the linear vector
                    λ.batch(batch_idx)(lane).set_constant(0);
                    continue;
                }
                λ.batch(batch_idx)(lane) =
                    crview::as_column(λ_lin.subspan(stage * block_size, block_size));
            }
        }
    }
}


// Unpack the batched storage `λ` (depth ceil_N(), nx rows, one column) into the linear vector
// `λ_lin` (N_horiz blocks of nx values). Block k is written from the lane that maps to stage k;
// padding lanes (k >= N_horiz) are not read.
template <index_t VL, class T, StorageOrder DefaultOrder, class Ctx>
void CyqloneSolver<VL, T, DefaultOrder, Ctx>::unpack_dynamics(view<> λ,
                                                              std::span<value_type> λ_lin) const {
    const index_t block_size = nx;
    BATMAT_ASSERT(static_cast<index_t>(λ_lin.size()) == block_size * N_horiz);
    BATMAT_ASSERT(λ.depth() == ceil_N());
    BATMAT_ASSERT(λ.rows() == block_size);
    BATMAT_ASSERT(λ.cols() == 1);
    using rview = guanaqo::MatrixView<value_type, index_t>;
    for (index_t thread = 0; thread < p; ++thread) {
        for (index_t offset = 0; offset < n; ++offset) {
            const index_t batch_idx = thread * n + offset;
            for (index_t lane = 0; lane < v; ++lane) {
                const index_t stage = sub_wrap_ceil_N(thread * n + lane * p * n, offset);
                if (stage >= N_horiz)
                    continue; // padding stage: nothing to write back
                rview::as_column(λ_lin.subspan(stage * block_size, block_size)) =
                    λ.batch(batch_idx)(lane);
            }
        }
    }
}


// Pack the linear vector of general constraints (or multipliers) `y_lin` into the batched storage
// `y` (depth ceil_N(), max(ny, ny_0 + ny_N) rows, one column).
//
// `y_lin` consists of ny_0 values for stage 0, followed by N_horiz - 1 blocks of ny values for the
// stages 1 to N_horiz - 1, followed by ny_N values for the final stage.
//   - k == 0:          rows [0, ny_0) hold the stage-0 block and rows [ny_0, ny_0 + ny_N) hold the
//                      final-stage block; remaining rows are set to `fill`.
//   - 0 < k < N_horiz: the top ny rows hold block k - 1; remaining rows are set to `fill`.
//   - otherwise:       padding stage, all zero.
template <index_t VL, class T, StorageOrder DefaultOrder, class Ctx>
void CyqloneSolver<VL, T, DefaultOrder, Ctx>::pack_constraints(std::span<const value_type> y_lin,
                                                               mut_view<> y,
                                                               value_type fill) const {
    const index_t ny_0N = ny_0 + ny_N;
    const index_t nyM   = std::max(ny, ny_0N);
    BATMAT_ASSERT(static_cast<index_t>(y_lin.size()) == ny * (N_horiz - 1) + ny_0 + ny_N);
    BATMAT_ASSERT(y.depth() == ceil_N());
    BATMAT_ASSERT(y.rows() == nyM);
    BATMAT_ASSERT(y.cols() == 1);
    using crview = guanaqo::MatrixView<const value_type, index_t>;
    for (index_t ti = 0; ti < p; ++ti) {
        const index_t k0  = ti * n;
        const index_t di0 = ti * n;
        for (index_t i = 0; i < n; ++i) {
            const index_t di = di0 + i;
            for (index_t vi = 0; vi < v; ++vi) {
                const index_t k = sub_wrap_ceil_N(k0 + vi * p * n, i);
                auto y_k        = y.batch(di)(vi);
                if (k == 0) {
                    // The stage-0 and final-stage blocks are stored contiguously in the top
                    // ny_0 + ny_N rows, matching the layout used for the constraint Jacobian and
                    // the bounds. Writing the final-stage block to the bottom rows of the full
                    // column instead would let the padding fill below overwrite it whenever
                    // ny > ny_0 + ny_N.
                    auto y_0N              = y_k.top_rows(ny_0N);
                    y_0N.top_rows(ny_0)    = crview::as_column(y_lin.first(ny_0));
                    y_0N.bottom_rows(ny_N) =
                        crview::as_column(y_lin.subspan(ny_0 + (N_horiz - 1) * ny, ny_N));
                    y_k.bottom_rows(nyM - ny_0N).set_constant(fill);
                } else if (k < N_horiz) {
                    y_k.top_rows(ny) = crview::as_column(y_lin.subspan(ny_0 + (k - 1) * ny, ny));
                    y_k.bottom_rows(nyM - ny).set_constant(fill);
                } else {
                    // NOTE(review): padding stages are zeroed regardless of `fill` — confirm that
                    // this is intended.
                    y_k.set_constant(0);
                }
            }
        }
    }
}


// Unpack the batched general constraints (or multipliers) `y` (depth ceil_N(),
// max(ny, ny_0 + ny_N) rows, one column) into the linear vector `y_lin`.
//
// `y_lin` consists of ny_0 values for stage 0, followed by N_horiz - 1 blocks of ny values for the
// stages 1 to N_horiz - 1, followed by ny_N values for the final stage.
//   - k == 0:          rows [0, ny_0) are the stage-0 block and rows [ny_0, ny_0 + ny_N) are the
//                      final-stage block.
//   - 0 < k < N_horiz: the top ny rows are block k - 1.
// Padding rows and padding stages are not read.
template <index_t VL, class T, StorageOrder DefaultOrder, class Ctx>
void CyqloneSolver<VL, T, DefaultOrder, Ctx>::unpack_constraints(
    view<> y, std::span<value_type> y_lin) const {
    BATMAT_ASSERT(static_cast<index_t>(y_lin.size()) == ny * (N_horiz - 1) + ny_0 + ny_N);
    BATMAT_ASSERT(y.depth() == ceil_N());
    BATMAT_ASSERT(y.rows() == std::max(ny, ny_0 + ny_N));
    BATMAT_ASSERT(y.cols() == 1);
    using rview = guanaqo::MatrixView<value_type, index_t>;
    for (index_t ti = 0; ti < p; ++ti) {
        const index_t k0  = ti * n;
        const index_t di0 = ti * n;
        for (index_t i = 0; i < n; ++i) {
            const index_t di = di0 + i;
            for (index_t vi = 0; vi < v; ++vi) {
                const index_t k = sub_wrap_ceil_N(k0 + vi * p * n, i);
                auto y_k        = y.batch(di)(vi);
                if (k == 0) {
                    // The stage-0 and final-stage blocks are stored contiguously in the top
                    // ny_0 + ny_N rows, matching the layout used for the constraint Jacobian and
                    // the bounds. Reading the final-stage block from the bottom rows of the full
                    // column would pick up padding rows whenever ny > ny_0 + ny_N.
                    auto y_0N                           = y_k.top_rows(ny_0 + ny_N);
                    rview::as_column(y_lin.first(ny_0)) = y_0N.top_rows(ny_0);
                    rview::as_column(y_lin.subspan(ny_0 + (N_horiz - 1) * ny, ny_N)) =
                        y_0N.bottom_rows(ny_N);
                } else if (k < N_horiz) {
                    rview::as_column(y_lin.subspan(ny_0 + (k - 1) * ny, ny)) = y_k.top_rows(ny);
                }
            }
        }
    }
}


// Allocating overload: creates the storage with initialize_dynamics_constraints(), fills it with
// the in-place initialize_rhs() overload and returns it.
template <index_t VL, class T, StorageOrder DefaultOrder, class Ctx>
auto CyqloneSolver<VL, T, DefaultOrder, Ctx>::initialize_rhs(
    const CyqloneStorage<value_type> &ocp) const -> matrix<> {
    auto result = initialize_dynamics_constraints();
    initialize_rhs(ocp, result);
    return result;
}


// Allocating overload: creates the storage with initialize_variables(), fills it with the
// in-place initialize_gradient() overload and returns it.
template <index_t VL, class T, StorageOrder DefaultOrder, class Ctx>
auto CyqloneSolver<VL, T, DefaultOrder, Ctx>::initialize_gradient(
    const CyqloneStorage<value_type> &ocp) const -> matrix<> {
    auto result = initialize_variables();
    initialize_gradient(ocp, result);
    return result;
}


// Allocating overload: creates two storages with initialize_general_constraints(), fills them
// with the in-place initialize_bounds() overload and returns them as (lower, upper).
template <index_t VL, class T, StorageOrder DefaultOrder, class Ctx>
auto CyqloneSolver<VL, T, DefaultOrder, Ctx>::initialize_bounds(
    const CyqloneStorage<value_type> &ocp) const -> std::pair<matrix<>, matrix<>> {
    std::pair<matrix<>, matrix<>> bounds{initialize_general_constraints(),
                                         initialize_general_constraints()};
    auto &[lower, upper] = bounds;
    initialize_bounds(ocp, lower, upper);
    return bounds;
}


// Allocating overload: creates the storage with initialize_variables(), fills it with the
// in-place pack_variables() overload and returns it.
template <index_t VL, class T, StorageOrder DefaultOrder, class Ctx>
auto CyqloneSolver<VL, T, DefaultOrder, Ctx>::pack_variables(
    std::span<const value_type> ux_lin) const -> matrix<> {
    auto packed = initialize_variables();
    pack_variables(ux_lin, packed);
    return packed;
}


// Allocating overload: creates a vector of num_variables() elements, fills it with the in-place
// unpack_variables() overload and returns it.
template <index_t VL, class T, StorageOrder DefaultOrder, class Ctx>
auto CyqloneSolver<VL, T, DefaultOrder, Ctx>::unpack_variables(view<> ux) const
    -> std::vector<value_type> {
    std::vector<value_type> flat(num_variables());
    unpack_variables(ux, flat);
    return flat;
}


// Allocating overload: creates the storage with initialize_dynamics_constraints(), fills it with
// the in-place pack_dynamics() overload and returns it.
template <index_t VL, class T, StorageOrder DefaultOrder, class Ctx>
auto CyqloneSolver<VL, T, DefaultOrder, Ctx>::pack_dynamics(std::span<const value_type> λ_lin) const
    -> matrix<> {
    auto packed = initialize_dynamics_constraints();
    pack_dynamics(λ_lin, packed);
    return packed;
}


// Allocating overload: creates a vector of num_dynamics_constraints() elements, fills it with the
// in-place unpack_dynamics() overload and returns it.
template <index_t VL, class T, StorageOrder DefaultOrder, class Ctx>
auto CyqloneSolver<VL, T, DefaultOrder, Ctx>::unpack_dynamics(view<> λ) const
    -> std::vector<value_type> {
    std::vector<value_type> flat(num_dynamics_constraints());
    unpack_dynamics(λ, flat);
    return flat;
}


// Allocating overload: creates the storage with initialize_general_constraints(), fills it with
// the in-place pack_constraints() overload (forwarding `fill`) and returns it.
template <index_t VL, class T, StorageOrder DefaultOrder, class Ctx>
auto CyqloneSolver<VL, T, DefaultOrder, Ctx>::pack_constraints(std::span<const value_type> y_lin,
                                                               value_type fill) const -> matrix<> {
    auto packed = initialize_general_constraints();
    pack_constraints(y_lin, packed, fill);
    return packed;
}


// Allocating overload: creates a vector of num_general_constraints() elements, fills it with the
// in-place unpack_constraints() overload and returns it.
template <index_t VL, class T, StorageOrder DefaultOrder, class Ctx>
auto CyqloneSolver<VL, T, DefaultOrder, Ctx>::unpack_constraints(view<> y) const
    -> std::vector<value_type> {
    std::vector<value_type> flat(num_general_constraints());
    unpack_constraints(y, flat);
    return flat;
}


// Create batched storage for the primal variables: depth ceil_N(), nu + nx rows, one column.
template <index_t VL, class T, StorageOrder DefaultOrder, class Ctx>
auto CyqloneSolver<VL, T, DefaultOrder, Ctx>::initialize_variables() const -> matrix<> {
    const index_t num_stages = ceil_N();
    const index_t num_rows   = nu + nx;
    return matrix<>{{.depth = num_stages, .rows = num_rows, .cols = 1}};
}


// Create batched storage for the dynamics constraints (or their multipliers): depth ceil_N(),
// nx rows, one column.
template <index_t VL, class T, StorageOrder DefaultOrder, class Ctx>
auto CyqloneSolver<VL, T, DefaultOrder, Ctx>::initialize_dynamics_constraints() const -> matrix<> {
    const index_t num_stages = ceil_N();
    return matrix<>{{.depth = num_stages, .rows = nx, .cols = 1}};
}


// Create batched storage for the general constraints (or their multipliers): depth ceil_N(),
// max(ny, ny_0 + ny_N) rows, one column.
template <index_t VL, class T, StorageOrder DefaultOrder, class Ctx>
auto CyqloneSolver<VL, T, DefaultOrder, Ctx>::initialize_general_constraints() const -> matrix<> {
    const index_t num_stages = ceil_N();
    const index_t num_rows   = std::max(ny, ny_0 + ny_N);
    return matrix<>{{.depth = num_stages, .rows = num_rows, .cols = 1}};
}


} // namespace CYQLONE_NS(cyqlone)

BATMAT_ASSERT
#define BATMAT_ASSERT(x)

cyqlone.hpp
The main header for the Cyqlone and Tricyqle linear solvers.

guanaqo::StorageOrder
StorageOrder

batmat::linalg::copy
void copy(VA &&A, VB &&B, Opts... opts)

cyqlone::linalg::scale
void scale(T alpha, Vx &&x, Vz &&z)
Multiply a vector by a scalar z = αx.
Definition linalg.hpp:294

batmat::linalg::fill
void fill(simdified_value_t< VB > a, VB &&B)

batmat::linalg::detail

batmat::linalg::simdify
constexpr auto simdify(simdifiable auto &&a) -> simdified_view_t< decltype(a)>

cyqlone::detail::copy
void copy(guanaqo::MatrixView< T1, I1, S1, O1 > src, guanaqo::MatrixView< T2, I2, S2, O2 > dst)
Simple (inefficient) matrix copy that supports slices with non-unit strides.
Definition data.tpp:19

cyqlone::detail::scale
void scale(T0 scalar, guanaqo::MatrixView< T1, I1, S1, O1 > src, guanaqo::MatrixView< T2, I2, S2, O2 > dst)
Simple (inefficient) scaled matrix copy that supports slices with non-unit strides.
Definition data.tpp:29

cyqlone::is_pow_2
constexpr bool is_pow_2(index_t n)
Definition cyqlone.hpp:32

batmat::matrix::Matrix::bottom_rows
auto bottom_rows(index_type n)

batmat::matrix::Matrix::left_cols
auto left_cols(index_type n)

batmat::matrix::Matrix::top_rows
auto top_rows(index_type n)

batmat::matrix::Matrix::top_left
auto top_left(index_type nr, index_type nc)

batmat::matrix::Matrix::bottom_right
auto bottom_right(index_type nr, index_type nc)

batmat::matrix::Matrix::transposed
auto transposed()

cyqlone::CyqloneSolver
Linear solver for systems with optimal control structure.
Definition cyqlone.hpp:561

cyqlone::CyqloneSolver::n
const index_t n
Number of stages per thread per vector lane (rounded up).
Definition cyqlone.hpp:605

cyqlone::CyqloneSolver::num_variables
index_t num_variables() const
Get the total number of primal variables in the OCP.
Definition cyqlone.hpp:577

cyqlone::CyqloneSolver::data_H
matrix< default_order > data_H
Stage-wise Hessian blocks H(j) = [ R(j) S(j); S(j)ᵀ Q(j) ] of the OCP cost function.
Definition cyqlone.hpp:762

cyqlone::CyqloneSolver::initialize_variables
matrix initialize_variables() const
Get a zero-initialized matrix for the primal variables u and x.
Definition data.tpp:501

cyqlone::CyqloneSolver::ceil_N
index_t ceil_N() const
Horizon length, rounded up to a multiple of the number of parallel execution units.
Definition cyqlone.hpp:653

cyqlone::CyqloneSolver::view
typename tricyqle_t::template view< O > view
Non-owning immutable view type for matrix.
Definition cyqlone.hpp:693

cyqlone::CyqloneSolver::update_data
void update_data(const CyqloneStorage< value_type > &ocp)
Update the internal data structures to reflect changes in the OCP data (without changing the problem ...
Definition data.tpp:94

cyqlone::CyqloneSolver::data_F
matrix< default_order > data_F
Stage-wise dynamics matrices F(j) = [ B(j) A(j) ] of the OCP.
Definition cyqlone.hpp:766

cyqlone::CyqloneSolver::data_Gᵀ
matrix< default_order > data_Gᵀ
Stage-wise constraint Jacobians G(j)ᵀ = [ D(j) C(j) ]ᵀ of the OCP.
Definition cyqlone.hpp:770

cyqlone::CyqloneSolver::pack_variables
void pack_variables(std::span< const value_type > ux_lin, mut_view<> ux) const
Definition data.tpp:242

cyqlone::CyqloneSolver::pack_constraints
void pack_constraints(std::span< const value_type > y_lin, mut_view<> y, value_type fill=0) const
Definition data.tpp:366

cyqlone::CyqloneSolver::initialize_gradient
void initialize_gradient(const CyqloneStorage< value_type > &ocp, mut_view<> grad) const
Initialize the gradient vector for the OCP cost function, using the custom Cyqlone storage format.
Definition data.tpp:170

cyqlone::CyqloneSolver::unpack_variables
void unpack_variables(view<> ux, std::span< value_type > ux_lin) const
Definition data.tpp:281

cyqlone::CyqloneSolver::sub_wrap_ceil_N
index_t sub_wrap_ceil_N(index_t a, index_t b) const
Subtract b from a modulo ceil_N() (the horizon length rounded up, so the result may refer to a padding stage ≥ N_horiz).
Definition indexing.tpp:53

cyqlone::CyqloneSolver::unpack_constraints
void unpack_constraints(view<> y, std::span< value_type > y_lin) const
Definition data.tpp:401

cyqlone::CyqloneSolver::matrix
typename tricyqle_t::template matrix< O > matrix
Owning type for a batch of matrices (with batch size v).
Definition cyqlone.hpp:690

cyqlone::CyqloneSolver::N_horiz
const index_t N_horiz
Horizon length of the optimal control problem.
Definition cyqlone.hpp:567

cyqlone::CyqloneSolver::num_dynamics_constraints
index_t num_dynamics_constraints() const
Get the total number of dynamics constraints in the OCP.
Definition cyqlone.hpp:581

cyqlone::CyqloneSolver::build
static CyqloneSolver build(const CyqloneStorage< value_type > &ocp, index_t p)
Initialize a Cyqlone solver for the given OCP.
Definition data.tpp:41

cyqlone::CyqloneSolver::ny
const index_t ny
Number of general constraints of the OCP per stage.
Definition cyqlone.hpp:570

cyqlone::CyqloneSolver::initialize_dynamics_constraints
matrix initialize_dynamics_constraints() const
Get a zero-initialized matrix for the dynamics constraints (or their multipliers).
Definition data.tpp:506

cyqlone::CyqloneSolver::initialize_rhs
void initialize_rhs(const CyqloneStorage< value_type > &ocp, mut_view<> rhs) const
Initialize the right-hand side vector for the dynamics constraints of the OCP, using the custom Cyqlo...
Definition data.tpp:147

cyqlone::CyqloneSolver::initialize_general_constraints
matrix initialize_general_constraints() const
Get a zero-initialized matrix for the general constraints (or their multipliers).
Definition data.tpp:511

cyqlone::CyqloneSolver::initialize_bounds
void initialize_bounds(const CyqloneStorage< value_type > &ocp, mut_view<> b_min, mut_view<> b_max) const
Initialize the lower and upper bounds for the general constraints of the OCP, using the custom Cyqlon...
Definition data.tpp:204

cyqlone::CyqloneSolver::mut_view
typename tricyqle_t::template mut_view< O > mut_view
Non-owning mutable view type for matrix.
Definition cyqlone.hpp:696

cyqlone::CyqloneSolver::pack_dynamics
void pack_dynamics(std::span< const value_type > λ_lin, mut_view<> λ) const
Definition data.tpp:316

cyqlone::CyqloneSolver::ny_0
const index_t ny_0
Number of general constraints at stage 0, D(0) u(0).
Definition cyqlone.hpp:571

cyqlone::CyqloneSolver::nu
const index_t nu
Number of controls of the OCP.
Definition cyqlone.hpp:569

cyqlone::CyqloneSolver::value_type
T value_type
Definition cyqlone.hpp:562

cyqlone::CyqloneSolver::p
const index_t p
Number of processors/threads.
Definition cyqlone.hpp:601

cyqlone::CyqloneSolver::num_general_constraints
index_t num_general_constraints() const
Get the total number of general constraints in the OCP.
Definition cyqlone.hpp:585

cyqlone::CyqloneSolver::ny_N
const index_t ny_N
Number of general constraints at the final stage, C(N) x(N).
Definition cyqlone.hpp:572

cyqlone::CyqloneSolver::unpack_dynamics
void unpack_dynamics(view<> λ, std::span< value_type > λ_lin) const
Definition data.tpp:342

cyqlone::CyqloneSolver::v
static constexpr index_t v
Vector length.
Definition cyqlone.hpp:603

cyqlone::CyqloneSolver::nx
const index_t nx
Number of states of the OCP.
Definition cyqlone.hpp:568

cyqlone::CyqloneStorage
Storage for a linear-quadratic OCP with the initial states x₀ eliminated.
Definition cyqlone-storage.hpp:39

cyqlone::CyqloneStorage::data_ub
matrix data_ub
Definition cyqlone-storage.hpp:59

cyqlone::CyqloneStorage::data_c
matrix data_c
Definition cyqlone-storage.hpp:56

cyqlone::CyqloneStorage::data_rq
matrix data_rq
Definition cyqlone-storage.hpp:55

cyqlone::CyqloneStorage::nx
index_t nx
Definition cyqlone-storage.hpp:42

cyqlone::CyqloneStorage::data_lb
matrix data_lb
Definition cyqlone-storage.hpp:57

cyqlone::CyqloneStorage::N_horiz
index_t N_horiz
Definition cyqlone-storage.hpp:41

cyqlone::CyqloneStorage::nu
index_t nu
Definition cyqlone-storage.hpp:42

cyqlone::CyqloneStorage::data_F
matrix data_F
Definition cyqlone-storage.hpp:48

cyqlone::CyqloneStorage::data_ub0N
matrix data_ub0N
Definition cyqlone-storage.hpp:60

cyqlone::CyqloneStorage::data_G0N
matrix data_G0N
Definition cyqlone-storage.hpp:52

cyqlone::CyqloneStorage::ny
index_t ny
Definition cyqlone-storage.hpp:42

cyqlone::CyqloneStorage::data_G
matrix data_G
Definition cyqlone-storage.hpp:49

cyqlone::CyqloneStorage::ny_N
index_t ny_N
Definition cyqlone-storage.hpp:42

cyqlone::CyqloneStorage::ny_0
index_t ny_0
Definition cyqlone-storage.hpp:42

cyqlone::CyqloneStorage::data_H
matrix data_H
Definition cyqlone-storage.hpp:45

cyqlone::CyqloneStorage::data_lb0N
matrix data_lb0N
Definition cyqlone-storage.hpp:58

guanaqo::MatrixView

guanaqo::MatrixView::rows
index_type rows

guanaqo::MatrixView::cols
index_type cols