numerics/api/krylov_8cpp_source.html

#include "linalg/solvers/krylov.hpp"

#include "kernel/subspace.hpp"

#include "core/vector.hpp"

#include <algorithm>

#include <cmath>

#include <stdexcept>

#include <vector>


namespace num {


// Core restarted GMRES implementation (matrix-free).
//
// Solves A x = b where A is only available through matvec_fn (out = A * in).
// Each restart cycle builds a Krylov basis with kernel::subspace::arnoldi_step,
// reduces the Hessenberg columns to upper-triangular form with Givens
// rotations, and updates x from the resulting triangular solve.
//
// Parameters:
//   matvec_fn  callable computing out = A * in
//   n          system dimension; b and x must both have exactly this size
//   b          right-hand side
//   x          initial guess on entry; overwritten with the current iterate
//   tol        absolute tolerance on the residual 2-norm
//   max_iter   cap on the total number of Arnoldi steps across all cycles
//   restart    Krylov dimension per cycle; clamped to the range [1, n]
//
// Returns a SolverResult {iterations, residual, converged}. `residual` is the
// true residual norm when a cycle starts converged, otherwise the estimate
// |g[j+1]| taken from the rotated right-hand side.
//
// Throws std::invalid_argument if x.size() or b.size() differs from n.
SolverResult gmres(MatVecFn matvec_fn, idx n, const Vector &b, Vector &x,
                   real tol, idx max_iter, idx restart) {
  if (x.size() != n || b.size() != n)
    throw std::invalid_argument("Dimension mismatch in GMRES");

  SolverResult result{0, 0.0, false};
  if (n == 0) {
    // Empty system: nothing to solve, and a zero-length cycle could never
    // advance the iteration counter used by the loop below.
    result.converged = true;
    return result;
  }

  // A cycle must take at least one Arnoldi step (restart == 0 would never
  // advance total_iters) and cannot usefully take more than n.
  restart = std::max<idx>(1, std::min(restart, n));

  // Threshold shared by the Arnoldi breakdown test and the pivot test.
  const real breakdown_tol = real(1e-15);

  std::vector<Vector> V;
  V.reserve(restart + 1);
  // H[j] holds column j of the Hessenberg matrix (entries 0 .. j+1).
  std::vector<std::vector<real>> H(restart,
                                   std::vector<real>(restart + 1, 0.0));
  std::vector<real> cs(restart, 0.0);
  std::vector<real> sn(restart, 0.0);
  std::vector<real> g(restart + 1, 0.0);

  // Wrap matvec_fn once; scratch buffer reused across all Arnoldi steps
  auto A_op = kernel::subspace::make_op(
      [&](const Vector &in, Vector &out) { matvec_fn(in, out); }, n);
  Vector scratch(n);

  idx total_iters = 0;

  while (total_iters < max_iter) {
    // True residual r = b - A x and its 2-norm at the start of the cycle.
    Vector r(n);
    matvec_fn(x, r);
    real beta = 0.0;
    for (idx i = 0; i < n; ++i) {
      r[i] = b[i] - r[i];
      beta += r[i] * r[i];
    }
    beta = std::sqrt(beta);

    result.residual = beta;
    if (beta < tol) {
      result.converged = true;
      break;
    }

    // First basis vector is the normalised residual.
    V.clear();
    V.emplace_back(n);
    for (idx i = 0; i < n; ++i)
      V[0][i] = r[i] / beta;

    for (auto &col : H)
      std::fill(col.begin(), col.end(), 0.0);
    std::fill(cs.begin(), cs.end(), 0.0);
    std::fill(sn.begin(), sn.end(), 0.0);
    std::fill(g.begin(), g.end(), 0.0);
    g[0] = beta;

    // m counts the columns accepted into the triangular system this cycle.
    idx m = 0;
    for (idx j = 0; j < restart && total_iters < max_iter; ++j) {
      // Count the step up front so that every early exit below still
      // consumes iteration budget and the outer loop is guaranteed to end.
      ++total_iters;
      result.iterations = total_iters;

      std::vector<real> &col = H[j];
      const real h_next = kernel::subspace::arnoldi_step(
          A_op, V, col, j, scratch, breakdown_tol);
      const bool breakdown = h_next < breakdown_tol;

      // Bring the new column into the rotated frame. This must also happen
      // on breakdown: the column still takes part in the triangular solve.
      for (idx i = 0; i < j; ++i) {
        const real rotated = cs[i] * col[i] + sn[i] * col[i + 1];
        col[i + 1] = -sn[i] * col[i] + cs[i] * col[i + 1];
        col[i] = rotated;
      }

      const real h0 = col[j];
      const real h1 = col[j + 1];
      const real denom = std::sqrt(h0 * h0 + h1 * h1);
      if (denom < breakdown_tol) {
        // The pivot would be numerically zero: drop this column rather than
        // divide by it, and finish the cycle with the columns accepted so far.
        break;
      }

      cs[j] = h0 / denom;
      sn[j] = h1 / denom;
      col[j] = cs[j] * h0 + sn[j] * h1;
      col[j + 1] = 0.0;

      g[j + 1] = -sn[j] * g[j];
      g[j] = cs[j] * g[j];
      m = j + 1;

      result.residual = std::abs(g[j + 1]);
      if (result.residual < tol) {
        result.converged = true;
        break;
      }
      if (breakdown)
        break; // basis cannot be extended further in this cycle
    }

    // Back-substitution on the leading m x m upper-triangular block.
    std::vector<real> y(m, 0.0);
    for (idx i = m; i-- > 0;) {
      y[i] = g[i];
      for (idx k = i + 1; k < m; ++k)
        y[i] -= H[k][i] * y[k];
      y[i] /= H[i][i];
    }

    // x += V(:, 0..m-1) * y
    for (idx i = 0; i < m; ++i)
      for (idx k = 0; k < n; ++k)
        x[k] += y[i] * V[i][k];

    if (result.converged)
      break;
    if (m == 0)
      break; // no usable direction: x is unchanged, so a retry would repeat
  }

  return result;
}


// Sparse (CSR) front end for GMRES.
//
// Checks that A is square, wraps sparse_matvec in a MatVecFn and forwards to
// the matrix-free core with n = A.n_rows().
//
// Throws std::invalid_argument if A is not square.
SolverResult gmres(const SparseMatrix &A, const Vector &b, Vector &x, real tol,
                   idx max_iter, idx restart) {
  const idx dim = A.n_rows();
  if (dim != A.n_cols())
    throw std::invalid_argument("GMRES requires a square matrix");

  // The output vector is replaced by a fresh one of length dim before each
  // product.
  MatVecFn apply_A = [&A, dim](const Vector &src, Vector &dst) {
    dst = Vector(dim);
    sparse_matvec(A, src, dst);
  };

  return gmres(apply_A, dim, b, x, tol, max_iter, restart);
}


// Dense front end for GMRES.
//
// Checks that A is square, wraps matvec (dispatched on `backend`) in a
// MatVecFn and forwards to the matrix-free core with n = A.rows().
//
// Throws std::invalid_argument if A is not square.
SolverResult gmres(const Matrix &A, const Vector &b, Vector &x, real tol,
                   idx max_iter, idx restart, Backend backend) {
  const idx dim = A.rows();
  if (dim != A.cols())
    throw std::invalid_argument("GMRES requires a square matrix");

  // The output vector is replaced by a fresh one of length dim before each
  // product.
  MatVecFn apply_A = [&A, dim, backend](const Vector &src, Vector &dst) {
    dst = Vector(dim);
    matvec(A, src, dst, backend);
  };

  return gmres(apply_A, dim, b, x, tol, max_iter, restart);
}


} // namespace num

num::BasicVector< real >

num::BasicVector::size
constexpr idx size() const noexcept
Definition vector.hpp:80

num::Matrix
Dense row-major matrix with optional GPU storage.
Definition matrix.hpp:12

num::Matrix::rows
constexpr idx rows() const noexcept
Definition matrix.hpp:24

num::Matrix::cols
constexpr idx cols() const noexcept
Definition matrix.hpp:25

num::SparseMatrix
Sparse matrix in Compressed Sparse Row (CSR) format.
Definition sparse.hpp:15

num::SparseMatrix::n_cols
idx n_cols() const
Definition sparse.hpp:36

num::SparseMatrix::n_rows
idx n_rows() const
Definition sparse.hpp:33

krylov.hpp
Restarted GMRES – a Krylov subspace solver for general Ax = b.

num::kernel::subspace::make_op
CallableOp< F > make_op(F f, idx n)
Factory: wrap a callable as a stack-allocated CallableOp<F>.
Definition subspace.hpp:128

num::kernel::subspace::arnoldi_step
real arnoldi_step(const LinearOp &A, std::vector< Vector > &basis, std::vector< real > &h, idx k, Vector &scratch, real breakdown_tol=real(1e-14))
One Arnoldi step: expand the orthonormal basis by one vector.
Definition subspace.cpp:73

num
Definition quadrature.hpp:8

num::real
double real
Definition types.hpp:10

num::Backend
Backend
Selects which backend handles a linalg operation.
Definition policy.hpp:19

num::beta
real beta(real a, real b)
B(a, b) – beta function.
Definition math.hpp:248

num::MatVecFn
std::function< void(const Vector &, Vector &)> MatVecFn
Callable type for matrix-free matvec: computes y = A*x.
Definition cg.hpp:13

num::idx
std::size_t idx
Definition types.hpp:11

num::matvec
void matvec(const Matrix &A, const Vector &x, Vector &y, Backend b=default_backend)
y = A * x
Definition matrix.cpp:120

num::sparse_matvec
void sparse_matvec(const SparseMatrix &A, const Vector &x, Vector &y)
y = A * x
Definition sparse.cpp:124

num::gmres
SolverResult gmres(MatVecFn matvec, idx n, const Vector &b, Vector &x, real tol=1e-6, idx max_iter=1000, idx restart=30)
Restarted GMRES(restart) – matrix-free interface.
Definition krylov.cpp:12

num::e
constexpr real e
Definition math.hpp:43

num::Vector
BasicVector< real > Vector
Real-valued dense vector with full backend dispatch (CPU + GPU)
Definition vector.hpp:130

num::SolverResult
Definition solver_result.hpp:8

subspace.hpp
Subspace construction and orthogonalization kernels. (namespace num::kernel::subspace)

vector.hpp
Vector operations.