numerics/api/dense_8cpp_source.html

/// @file kernel/dense.cpp

/// @brief Implementations for num::kernel::dense (seq_t, par_t, and no-policy

/// ops).


#include "kernel/dense.hpp"

#include "kernel/raw.hpp"

#include <stdexcept>


namespace num::kernel::dense {


/// @brief Sequential rank-1 update: A[i*n + j] += alpha * x[i] * y[j].
///
/// Thin wrapper that hands the underlying buffers to raw::ger, using
/// m = x.size() and n = y.size() as the row and column counts.
///
/// @param alpha Scalar multiplier applied to the outer product.
/// @param x     Left vector; its size is passed as the row count m.
/// @param y     Right vector; its size is passed as the column count n.
/// @param A     Matrix updated in place through A.data().
///
/// No dimension checks are performed in this overload.
/// NOTE(review): A presumably must hold at least x.size() * y.size()
/// elements in row-major order -- confirm that callers guarantee this.
void ger(real alpha, const Vector& x, const Vector& y, Matrix& A, seq_t) noexcept {
    const idx row_count = x.size();
    const idx col_count = y.size();
    raw::ger(A.data(), x.data(), y.data(), alpha, row_count, col_count);
}


/// @brief Rank-1 update A[i*n + j] += alpha * x[i] * y[j] under the parallel policy.
///
/// When NUMERICS_HAS_OMP is defined, the outer loop over the x.size() rows
/// is distributed with an OpenMP `parallel for` (static schedule); each
/// iteration writes only to its own row of A. Otherwise the call is
/// forwarded unchanged to the seq_t overload.
///
/// @param alpha Scalar multiplier applied to the outer product.
/// @param x     Left vector; x.size() is the number of rows processed.
/// @param y     Right vector; y.size() is the row stride / column count.
/// @param A     Matrix updated in place through A.data().
///
/// No dimension checks are performed here.
/// NOTE(review): A presumably must hold at least x.size() * y.size()
/// elements -- confirm that callers guarantee this.
void ger(real alpha, const Vector& x, const Vector& y, Matrix& A, par_t) {
#ifndef NUMERICS_HAS_OMP
    // No OpenMP available: delegate to the sequential implementation.
    ger(alpha, x, y, A, seq_t{});
#else
    const idx row_count = x.size();
    const idx col_count = y.size();
    const real* const x_ptr = x.data();
    const real* const y_ptr = y.data();
    real* const a_ptr = A.data();

    // Rows are independent, so they can be split across threads without
    // any synchronisation.
    #pragma omp parallel for schedule(static)
    for (idx r = 0; r < row_count; ++r) {
        // Hoist the per-row factor out of the inner loop.
        const real scaled_xr = alpha * x_ptr[r];
        real* const out_row = a_ptr + (r * col_count);
        for (idx c = 0; c < col_count; ++c) {
            out_row[c] += scaled_xr * y_ptr[c];
        }
    }
#endif
}


void trsv_lower(const Matrix& L, const Vector& b, Vector& x) {

    const idx n = L.rows();

    if (L.cols() != n || b.size() != n) {

        throw std::invalid_argument("kernel::dense::trsv_lower: dimension mismatch");

    }

    if (x.size() != n) {

        x = Vector(n);

    }

    raw::trsv_lower(x.data(), L.data(), b.data(), n);

}


void trsv_upper(const Matrix& U, const Vector& b, Vector& x) {

    const idx n = U.rows();

    if (U.cols() != n || b.size() != n) {

        throw std::invalid_argument("kernel::dense::trsv_upper: dimension mismatch");

    }

    if (x.size() != n) {

        x = Vector(n);

    }

    raw::trsv_upper(x.data(), U.data(), b.data(), n);

}


} // namespace num::kernel::dense

num::BasicMatrix< real >

num::BasicMatrix::rows
constexpr idx rows() const noexcept
Definition matrix.hpp:87

num::BasicMatrix::data
T * data()
Definition matrix.hpp:91

num::BasicMatrix::cols
constexpr idx cols() const noexcept
Definition matrix.hpp:88

num::BasicVector< real >

num::BasicVector::data
T * data()
Definition vector.hpp:88

num::BasicVector::size
constexpr idx size() const noexcept
Definition vector.hpp:83

dense.hpp
Dense matrix inner kernels (namespace num::kernel::dense)

num::kernel::dense
Definition dense.hpp:10

num::kernel::dense::trsv_upper
void trsv_upper(const Matrix &U, const Vector &b, Vector &x)
Back substitution: solve Ux = b.
Definition dense.cpp:46

num::kernel::dense::trsv_lower
void trsv_lower(const Matrix &L, const Vector &b, Vector &x)
Forward substitution: solve Lx = b.
Definition dense.cpp:35

num::kernel::dense::ger
void ger(real alpha, const Vector &x, const Vector &y, Matrix &A, seq_t) noexcept
Sequential rank-1 update.
Definition dense.cpp:11

num::kernel::raw::trsv_upper
NUM_K_AINLINE void trsv_upper(T *NUM_K_RESTRICT x, const T *NUM_K_RESTRICT U, const T *NUM_K_RESTRICT b, idx n) noexcept
Back substitution: solve Ux = b, U upper triangular (n x n, row-major).
Definition raw.hpp:200

num::kernel::raw::ger
NUM_K_AINLINE void ger(T *NUM_K_RESTRICT A, const T *NUM_K_RESTRICT x, const T *NUM_K_RESTRICT y, T alpha, idx m, idx n) noexcept
Rank-1 update: A[i*n + j] += alpha * x[i] * y[j] (m x n row-major)
Definition raw.hpp:160

num::kernel::raw::trsv_lower
NUM_K_AINLINE void trsv_lower(T *NUM_K_RESTRICT x, const T *NUM_K_RESTRICT L, const T *NUM_K_RESTRICT b, idx n) noexcept
Forward substitution: solve Lx = b, L lower triangular (n x n, row-major).
Definition raw.hpp:181

num::real
double real
Definition types.hpp:10

num::idx
std::size_t idx
Definition types.hpp:11

num::Vector
BasicVector< real > Vector
Real-valued dense vector with full backend dispatch (CPU + GPU)
Definition vector.hpp:129

raw.hpp
Tier-1 kernel: raw-pointer, inline, zero-overhead inner loops.

num::kernel::par_t
Parallel execution policy tag.
Definition policy.hpp:13

num::kernel::seq_t
Sequential execution policy tag.
Definition policy.hpp:10