main/Doxygen/limited-memory-qr_8hpp_source.html

#include <Eigen/Jacobi>

#include <cstddef>

#include <quala/util/ringbuffer.hpp>

#include <quala/util/vec.hpp>

#include <type_traits>


namespace quala {


/// Incremental QR factorization using modified Gram-Schmidt with
/// reorthogonalization.
///
/// Computes A = QR while allowing efficient removal of the first
/// column of A or adding new columns at the end of A.
///
/// The first @ref num_columns() columns of the Q storage hold the current
/// orthonormal basis. The columns of R are kept in a circular buffer
/// (see @ref ring_head, @ref ring_tail), so the storage index of a column of R
/// generally differs from its mathematical column index.
class LimitedMemoryQR {
  public:
    /// Create an empty factorization without any storage. Use @ref resize to
    /// allocate storage before adding columns.
    LimitedMemoryQR() = default;

    /// @param  n
    ///         The size of the vectors, the number of rows of A.
    /// @param  m
    ///         The maximum number of columns of A.
    ///
    /// The maximum dimensions of Q are n×m and the maximum dimensions of R are
    /// m×m.
    LimitedMemoryQR(length_t n, length_t m) : Q(n, m), R(m, m) {}

    /// Number of rows of A (rows of the Q storage).
    length_t n() const { return Q.rows(); }
    /// Maximum number of columns of A (columns of the Q storage).
    length_t m() const { return Q.cols(); }
    /// Alias for @ref n.
    length_t size() const { return n(); }
    /// Alias for @ref m.
    length_t history() const { return m(); }

    /// Add the given column to the right.
    ///
    /// @param  v
    ///         The new column of A to append.
    ///
    /// @pre    `num_columns() < m()` (checked by an assertion only).
    /// @note   The orthogonalized vector is divided by its norm without any
    ///         check, so a column whose orthogonalized norm is zero produces
    ///         non-finite entries in Q.
    template <class VecV>
    void add_column(const VecV &v) {
        assert(num_columns() < m());

        auto q = Q.col(q_idx);
        auto r = R.col(r_idx_end);

        // Modified Gram-Schmidt to make q orthogonal to Q
        q = v;
        for (index_t i = 0; i < q_idx; ++i) {
            real_t s = Q.col(i).dot(q);
            r(i)     = s;
            q -= s * Q.col(i);
        }

        // Compute the norms of orthogonalized q and original v
        real_t norm_q = q.norm();
        real_t norm_v = v.norm();

        // If ‖q‖ is significantly smaller than ‖v‖, perform
        // reorthogonalization: repeat the projection until one pass no longer
        // shrinks the norm by more than the factor eta.
        const real_t eta = 0.7;
        while (norm_q < eta * norm_v) {
            ++reorth_count;
            for (index_t i = 0; i < q_idx; ++i) {
                real_t s = Q.col(i).dot(q);
                // Accumulate the correction into the coefficients of R
                r(i) += s;
                q -= s * Q.col(i);
            }
            norm_v = norm_q;
            norm_q = q.norm();
        }

        // Normalize q such that new matrix (Q q) remains orthogonal (i.e. has
        // orthonormal columns)
        r(q_idx) = norm_q;
        q /= norm_q;
        // Keep track of the minimum/maximum diagonal element of R
        min_eig = std::min(min_eig, norm_q);
        max_eig = std::max(max_eig, norm_q);

        // Increment indices, add a column to Q and R.
        ++q_idx;
        r_idx_end = r_succ(r_idx_end);
    }

    /// Remove the leftmost column.
    ///
    /// @pre    `num_columns() > 0` (checked by an assertion only).
    void remove_column() {
        assert(num_columns() > 0);

        // After removing the first column of the upper triangular matrix R,
        // it becomes upper Hessenberg. Givens rotations are used to make it
        // triangular again.
        Eigen::JacobiRotation<real_t> G;
        index_t r = 0;                   // row index of R
        index_t c = r_succ(r_idx_start); // column index of R in storage
        while (r < q_idx - 1) {
            // Compute the Givens rotation that makes the subdiagonal element
            // of column c of R zero.
            G.makeGivens(R(r, c), R(r + 1, c), &R(r, c));
            // Apply it to the remaining columns of R.
            // Not the current column, because the diagonal element was updated
            // by the makeGivens function, and the subdiagonal element doesn't
            // have to be set to zero explicitly, it's implicit.
            // Also not the previous columns, because they are already
            // implicitly zero below the diagonal and this rotation wouldn't
            // have any effect there.
            // TODO: can this be sped up by applying it in two blocks instead
            //       of column by column?
            for (index_t cc = r_succ(c); cc != r_idx_end; cc = r_succ(cc))
                R.col(cc).applyOnTheLeft(r, r + 1, G.adjoint());
            // Apply the inverse of the Givens rotation to Q.
            Q.block(0, 0, Q.rows(), q_idx).applyOnTheRight(r, r + 1, G);
            // Keep track of the minimum/maximum diagonal element of R
            min_eig = std::min(min_eig, R(r, c));
            max_eig = std::max(max_eig, R(r, c));
            // Advance indices to next diagonal element of R.
            ++r;
            c = r_succ(c);
        }
        // Remove rightmost column of Q, since it corresponds to the bottom row
        // of R, which was set to zero by the Givens rotations
        --q_idx;
        // Remove the first column of R.
        r_idx_start = r_succ(r_idx_start);
    }

    /// Solve the least squares problem Ax = b.
    /// Do not divide by elements that are smaller in absolute value than @p tol.
    ///
    /// @param  b
    ///         Right-hand side vector.
    /// @param  x
    ///         Output: the first @ref num_columns() elements are overwritten
    ///         with the solution, other elements are not touched.
    /// @param  tol
    ///         Diagonal elements of R with an absolute value below this
    ///         threshold are skipped, and the corresponding element of @p x is
    ///         set to zero.
    template <class VecB, class VecX>
    void solve_col(const VecB &b, VecX &x, real_t tol = 0) const {
        // Iterate over the diagonal of R, starting at the bottom right,
        // this is standard back substitution
        // (recall that R is stored in a circular buffer, so R.col(i) is
        // not the mathematical i-th column)
        auto rev_bgn = ring_reverse_iter().begin();
        auto rev_end = ring_reverse_iter().end();
        auto fwd_end = ring_iter().end();
        for (auto it_d = rev_bgn; it_d != rev_end; ++it_d) {
            // Row/column index of diagonal element of R
            // (rR is the zero-based mathematical index, cR is the index in
            // the circular buffer)
            auto [rR, cR] = *it_d;
            // Don't divide by very small diagonal elements
            if (std::abs(R(rR, cR)) < tol) {
                x(rR) = real_t{0};
                continue;
            }
            x(rR) = Q.col(rR).transpose() * b; // Compute rhs Qᵀb
            // In the current row of R, iterate over the elements to the
            // right of the diagonal
            // Iterating from left to right seems to give better results
            for (auto it_c = it_d.forwardit; it_c != fwd_end; ++it_c) {
                auto [rX2, cR2] = *it_c;
                x(rR) -= R(rR, cR2) * x(rX2);
            }
            x(rR) /= R(rR, cR); // Divide by diagonal element
        }
    }

    /// Solve the least squares problem AX = B.
    /// Do not divide by elements that are smaller in absolute value than @p tol.
    ///
    /// @param  B
    ///         Right-hand sides, one per column.
    /// @param  X
    ///         Output: column i receives the solution for column i of @p B.
    ///         Needs at least as many columns as @p B and at least
    ///         @ref num_columns() rows (checked by assertions only).
    /// @param  tol
    ///         Threshold forwarded to @ref solve_col.
    template <class MatB, class MatX>
    void solve(const MatB &B, MatX &X, real_t tol = 0) const {
        assert(B.cols() <= X.cols());
        assert(B.rows() >= Q.rows());
        assert(X.rows() >= Eigen::Index(num_columns()));
        // Each column of the right hand side is solved as an individual system
        for (Eigen::Index cB = 0; cB < B.cols(); ++cB) {
            auto b = B.col(cB);
            auto x = X.col(cB);
            solve_col(b, x, tol);
        }
    }

    /// Return type of the single-argument @ref solve overload: a vector if the
    /// right-hand side has a single column at compile time, a matrix otherwise.
    template <class Derived>
    using solve_ret_t = std::conditional_t<
        Eigen::internal::traits<Derived>::ColsAtCompileTime == 1, vec, mat>;

    /// Solve the least squares problem AX = B.
    ///
    /// @param  B
    ///         Right-hand sides, one per column.
    /// @return A newly allocated solution with @ref m() rows and as many
    ///         columns as @p B. Only the first @ref num_columns() rows carry
    ///         the solution; the remaining rows are zero.
    template <class Derived>
    solve_ret_t<Derived> solve(const Eigen::DenseBase<Derived> &B) const {
        solve_ret_t<Derived> X(m(), B.cols());
        // solve_col only writes the first num_columns() rows, so clear the
        // storage to avoid returning uninitialized values in the other rows.
        X.setZero();
        solve(B, X);
        return X;
    }

    /// Get the full, raw storage for the orthogonal matrix Q.
    const mat &get_raw_Q() const { return Q; }
    /// Get the full, raw storage for the upper triangular matrix R.
    /// The columns of this matrix are permuted because it's stored as a
    /// circular buffer for efficiently appending columns to the end and
    /// popping columns from the front.
    const mat &get_raw_R() const { return R; }

    /// Get the full storage for the upper triangular matrix R but with the
    /// columns in the correct order.
    /// @note   Meant for tests only, creates a permuted copy.
    mat get_full_R() const {
        // Nothing to permute if the oldest column sits at storage index 0
        if (r_idx_start == 0)
            return R;
        // Using a permutation matrix here isn't as efficient as rotating the
        // matrix manually, but this function is only used in tests, so it
        // shouldn't matter.
        Eigen::PermutationMatrix<Eigen::Dynamic> P(R.cols());
        P.setIdentity();
        std::rotate(P.indices().data(), P.indices().data() + r_idx_start,
                    P.indices().data() + P.size());
        return R * P;
    }
    /// Get the matrix R such that Q times R is the original matrix.
    /// @note   Meant for tests only, creates a permuted copy.
    mat get_R() const {
        return get_full_R()
            .block(0, 0, q_idx, q_idx)
            .triangularView<Eigen::Upper>();
    }
    /// Get the matrix Q such that Q times R is the original matrix.
    /// @note   Meant for tests only, creates a copy.
    mat get_Q() const { return Q.block(0, 0, n(), q_idx); }

    /// Multiply the matrix R by a scalar.
    ///
    /// @note   The tracked minimum and maximum diagonal elements are
    ///         multiplied by @p scal as well, without being reordered: a
    ///         negative @p scal therefore inverts their ordering.
    void scale_R(real_t scal) {
        // Only the upper triangular part of each stored column is scaled
        for (auto [i, r_idx] : ring_iter())
            R.col(r_idx).topRows(i + 1) *= scal;
        min_eig *= scal;
        max_eig *= scal;
    }

    /// Get the number of MGS reorthogonalizations.
    unsigned long get_reorth_count() const { return reorth_count; }
    /// Reset the number of MGS reorthogonalizations.
    void clear_reorth_count() { reorth_count = 0; }

    /// Get the smallest diagonal element of R recorded since the last
    /// @ref reset. This is a running minimum: it is updated when columns are
    /// added or removed and scaled by @ref scale_R, but never recomputed from
    /// the current R.
    real_t get_min_eig() const { return min_eig; }
    /// Get the largest diagonal element of R recorded since the last
    /// @ref reset. This is a running maximum: it is updated when columns are
    /// added or removed and scaled by @ref scale_R, but never recomputed from
    /// the current R.
    real_t get_max_eig() const { return max_eig; }

    /// Reset all indices, clearing the Q and R matrices.
    /// The storage itself is kept and not overwritten; the reorthogonalization
    /// counter and the tracked diagonal extrema are reset as well.
    void reset() {
        q_idx        = 0;
        r_idx_start  = 0;
        r_idx_end    = 0;
        reorth_count = 0;
        min_eig      = +inf;
        max_eig      = -inf;
    }

    /// Re-allocate storage for a problem with a different size. Causes
    /// a @ref reset.
    ///
    /// @param  n
    ///         The size of the vectors, the number of rows of A.
    /// @param  m
    ///         The maximum number of columns of A.
    void resize(length_t n, length_t m) {
        Q.resize(n, m);
        R.resize(m, m);
        reset();
    }

    /// Get the number of columns that are currently stored.
    length_t num_columns() const { return q_idx; }
    /// Get the head index of the circular buffer (points to the oldest
    /// element).
    index_t ring_head() const { return r_idx_start; }
    /// Get the tail index of the circular buffer (points to one past the most
    /// recent element).
    index_t ring_tail() const { return r_idx_end; }
    /// Get the next index in the circular buffer.
    index_t ring_next(index_t i) const { return r_succ(i); }
    /// Get the previous index in the circular buffer.
    index_t ring_prev(index_t i) const { return r_pred(i); }
    /// Get the number of columns currently stored in the buffer.
    length_t current_history() const { return q_idx; }

    /// Get iterators in the circular buffer.
    CircularRange<index_t> ring_iter() const {
        return {q_idx, r_idx_start, r_idx_end, m()};
    }
    /// Get reverse iterators in the circular buffer.
    ReverseCircularRange<index_t> ring_reverse_iter() const {
        return ring_iter();
    }

  private:
    mat Q; ///< Storage for orthogonal factor Q.
    mat R; ///< Storage for upper triangular factor R.

    index_t q_idx       = 0; ///< Number of columns of Q being stored.
    index_t r_idx_start = 0; ///< Index of the first column of R.
    index_t r_idx_end   = 0; ///< Index of the one-past-last column of R.

    unsigned long reorth_count = 0; ///< Number of MGS reorthogonalizations.

    real_t min_eig = +inf; ///< Running minimum of the diagonal elements of R.
    real_t max_eig = -inf; ///< Running maximum of the diagonal elements of R.

    /// Get the next index in the circular storage for R (wraps around to zero
    /// after the last column).
    index_t r_succ(index_t i) const { return i + 1 < m() ? i + 1 : 0; }
    /// Get the previous index in the circular storage for R (wraps around to
    /// the last column before zero).
    index_t r_pred(index_t i) const { return i == 0 ? m() - 1 : i - 1; }
};


} // namespace quala

quala::CircularRange
Definition: ringbuffer.hpp:185

quala::LimitedMemoryQR
Incremental QR factorization using modified Gram-Schmidt with reorthogonalization.
Definition: limited-memory-qr.hpp:14

quala::LimitedMemoryQR::size
length_t size() const
Definition: limited-memory-qr.hpp:29

quala::LimitedMemoryQR::R
mat R
Storage for upper triangular factor R.
Definition: limited-memory-qr.hpp:276

quala::LimitedMemoryQR::r_idx_start
index_t r_idx_start
Index of the first column of R.
Definition: limited-memory-qr.hpp:279

quala::LimitedMemoryQR::max_eig
real_t max_eig
Maximum eigenvalue of R.
Definition: limited-memory-qr.hpp:285

quala::LimitedMemoryQR::ring_iter
CircularRange< index_t > ring_iter() const
Get iterators in the circular buffer.
Definition: limited-memory-qr.hpp:266

quala::LimitedMemoryQR::Q
mat Q
Storage for orthogonal factor Q.
Definition: limited-memory-qr.hpp:275

quala::LimitedMemoryQR::LimitedMemoryQR
LimitedMemoryQR(length_t n, length_t m)
Definition: limited-memory-qr.hpp:25

quala::LimitedMemoryQR::num_columns
length_t num_columns() const
Get the number of columns that are currently stored.
Definition: limited-memory-qr.hpp:251

quala::LimitedMemoryQR::get_Q
mat get_Q() const
Get the matrix Q such that Q times R is the original matrix.
Definition: limited-memory-qr.hpp:212

quala::LimitedMemoryQR::solve
void solve(const MatB &B, MatX &X, real_t tol=0) const
Solve the least squares problem AX = B.
Definition: limited-memory-qr.hpp:156

quala::LimitedMemoryQR::current_history
length_t current_history() const
Get the number of columns currently stored in the buffer.
Definition: limited-memory-qr.hpp:263

quala::LimitedMemoryQR::reorth_count
unsigned long reorth_count
Number of MGS reorthogonalizations.
Definition: limited-memory-qr.hpp:282

quala::LimitedMemoryQR::remove_column
void remove_column()
Remove the leftmost column.
Definition: limited-memory-qr.hpp:80

quala::LimitedMemoryQR::get_R
mat get_R() const
Get the matrix R such that Q times R is the original matrix.
Definition: limited-memory-qr.hpp:205

quala::LimitedMemoryQR::q_idx
index_t q_idx
Number of columns of Q being stored.
Definition: limited-memory-qr.hpp:278

quala::LimitedMemoryQR::r_pred
index_t r_pred(index_t i) const
Get the previous index in the circular storage for R.
Definition: limited-memory-qr.hpp:290

quala::LimitedMemoryQR::add_column
void add_column(const VecV &v)
Add the given column to the right.
Definition: limited-memory-qr.hpp:34

quala::LimitedMemoryQR::solve_col
void solve_col(const VecB &b, VecX &x, real_t tol=0) const
Solve the least squares problem Ax = b.
Definition: limited-memory-qr.hpp:123

quala::LimitedMemoryQR::solve
solve_ret_t< Derived > solve(const Eigen::DenseBase< Derived > &B)
Solve the least squares problem AX = B.
Definition: limited-memory-qr.hpp:174

quala::LimitedMemoryQR::min_eig
real_t min_eig
Minimum eigenvalue of R.
Definition: limited-memory-qr.hpp:284

quala::LimitedMemoryQR::n
length_t n() const
Definition: limited-memory-qr.hpp:27

quala::LimitedMemoryQR::clear_reorth_count
void clear_reorth_count()
Reset the number of MGS reorthogonalizations.
Definition: limited-memory-qr.hpp:225

quala::LimitedMemoryQR::ring_tail
index_t ring_tail() const
Get the tail index of the circular buffer (points to one past the most recent element).
Definition: limited-memory-qr.hpp:257

quala::LimitedMemoryQR::history
length_t history() const
Definition: limited-memory-qr.hpp:30

quala::LimitedMemoryQR::get_max_eig
real_t get_max_eig() const
Get the maximum eigenvalue of R.
Definition: limited-memory-qr.hpp:230

quala::LimitedMemoryQR::r_succ
index_t r_succ(index_t i) const
Get the next index in the circular storage for R.
Definition: limited-memory-qr.hpp:288

quala::LimitedMemoryQR::LimitedMemoryQR
LimitedMemoryQR()=default

quala::LimitedMemoryQR::solve_ret_t
std::conditional_t< Eigen::internal::traits< Derived >::ColsAtCompileTime==1, vec, mat > solve_ret_t
Definition: limited-memory-qr.hpp:170

quala::LimitedMemoryQR::ring_prev
index_t ring_prev(index_t i) const
Get the previous index in the circular buffer.
Definition: limited-memory-qr.hpp:261

quala::LimitedMemoryQR::m
length_t m() const
Definition: limited-memory-qr.hpp:28

quala::LimitedMemoryQR::ring_head
index_t ring_head() const
Get the head index of the circular buffer (points to the oldest element).
Definition: limited-memory-qr.hpp:254

quala::LimitedMemoryQR::get_raw_Q
const mat & get_raw_Q() const
Get the full, raw storage for the orthogonal matrix Q.
Definition: limited-memory-qr.hpp:181

quala::LimitedMemoryQR::get_raw_R
const mat & get_raw_R() const
Get the full, raw storage for the upper triangular matrix R.
Definition: limited-memory-qr.hpp:186

quala::LimitedMemoryQR::resize
void resize(length_t n, length_t m)
Re-allocate storage for a problem with a different size.
Definition: limited-memory-qr.hpp:244

quala::LimitedMemoryQR::reset
void reset()
Reset all indices, clearing the Q and R matrices.
Definition: limited-memory-qr.hpp:233

quala::LimitedMemoryQR::ring_next
index_t ring_next(index_t i) const
Get the next index in the circular buffer.
Definition: limited-memory-qr.hpp:259

quala::LimitedMemoryQR::get_reorth_count
unsigned long get_reorth_count() const
Get the number of MGS reorthogonalizations.
Definition: limited-memory-qr.hpp:223

quala::LimitedMemoryQR::get_min_eig
real_t get_min_eig() const
Get the minimum eigenvalue of R.
Definition: limited-memory-qr.hpp:228

quala::LimitedMemoryQR::scale_R
void scale_R(real_t scal)
Multiply the matrix R by a scalar.
Definition: limited-memory-qr.hpp:215

quala::LimitedMemoryQR::ring_reverse_iter
ReverseCircularRange< index_t > ring_reverse_iter() const
Get reverse iterators in the circular buffer.
Definition: limited-memory-qr.hpp:270

quala::LimitedMemoryQR::get_full_R
mat get_full_R() const
Get the full storage for the upper triangular matrix R but with the columns in the correct order.
Definition: limited-memory-qr.hpp:191

quala::LimitedMemoryQR::r_idx_end
index_t r_idx_end
Index of the one-past-last column of R.
Definition: limited-memory-qr.hpp:280

quala::ReverseCircularRange
Definition: ringbuffer.hpp:220

quala
Definition: anderson-acceleration.hpp:8

quala::inf
constexpr real_t inf
Definition: vec.hpp:43

quala::mat
realmat mat
Default type for matrices.
Definition: vec.hpp:20

quala::length_t
index_t length_t
Default type for vector sizes.
Definition: vec.hpp:29

quala::vec
realvec vec
Default type for vectors.
Definition: vec.hpp:14

quala::index_t
Eigen::Index index_t
Default type for vector indices.
Definition: vec.hpp:27

quala::real_t
double real_t
Default floating point type.
Definition: vec.hpp:8

ringbuffer.hpp

vec.hpp