numerics/api/array_8cpp_source.html

/// @file kernel/array.cpp

/// @brief Implementations for num::kernel::array (seq_t and par_t overloads).


#include "kernel/array.hpp"

#include "kernel/raw.hpp"


namespace num::kernel::array {


// Sequential overload: hands the raw buffers of x and y to raw::axpby,
// with y as the destination and x as the source. The element count is
// taken from x only; y's size is not checked here.
void axpby(real a, const Vector& x, real b, Vector& y, seq_t) noexcept {
    const auto count = x.size();
    const real* const src = x.data();
    real* const dst = y.data();
    raw::axpby(dst, src, a, b, count);
}


// Parallel overload: y[i] = a*x[i] + b*y[i] for i in [0, x.size()).
// When NUMERICS_HAS_OMP is defined the loop is shared across threads with a
// static schedule; otherwise the call is forwarded to the seq_t overload.
// The element count comes from x only; y's size is not checked here.
void axpby(real a, const Vector& x, real b, Vector& y, par_t) {
#ifndef NUMERICS_HAS_OMP
    // No OpenMP in this build: defer to the sequential implementation.
    axpby(a, x, b, y, seq_t{});
#else
    // Pull the raw buffers out once so the loop body only touches pointers.
    const real* src = x.data();
    real* dst = y.data();
    const idx count = x.size();
    #pragma omp parallel for schedule(static)
    for (idx k = 0; k < count; ++k) {
        dst[k] = (a * src[k]) + (b * dst[k]);
    }
#endif
}


// Sequential overload: hands the raw buffers of x, y and z to raw::axpbyz,
// with z as the destination and x, y as the two sources. The element count
// is taken from x only; the sizes of y and z are not checked here.
void axpbyz(real a, const Vector& x, real b, const Vector& y, Vector& z, seq_t) noexcept {
    const auto count = x.size();
    const real* const lhs = x.data();
    const real* const rhs = y.data();
    real* const out = z.data();
    raw::axpbyz(out, lhs, rhs, a, b, count);
}


// Parallel overload: z[i] = a*x[i] + b*y[i] for i in [0, x.size()).
// When NUMERICS_HAS_OMP is defined the loop is shared across threads with a
// static schedule; otherwise the call is forwarded to the seq_t overload.
// The element count comes from x only; the sizes of y and z are not checked
// here.
void axpbyz(real a, const Vector& x, real b, const Vector& y, Vector& z, par_t) {
#ifndef NUMERICS_HAS_OMP
    // No OpenMP in this build: defer to the sequential implementation.
    axpbyz(a, x, b, y, z, seq_t{});
#else
    // Pull the raw buffers out once so the loop body only touches pointers.
    real* out = z.data();
    const real* lhs = x.data();
    const real* rhs = y.data();
    const idx count = x.size();
    #pragma omp parallel for schedule(static)
    for (idx k = 0; k < count; ++k) {
        out[k] = (a * lhs[k]) + (b * rhs[k]);
    }
#endif
}


} // namespace num::kernel::array

array.hpp
Elementwise vector kernels (namespace num::kernel::array)

num::BasicVector< real >

num::BasicVector::data
T * data()
Definition vector.hpp:88

num::BasicVector::size
constexpr idx size() const noexcept
Definition vector.hpp:83

num::kernel::array
Definition array.hpp:9

num::kernel::array::axpby
void axpby(real a, const Vector &x, real b, Vector &y, seq_t) noexcept
Sequential: y[i] = a*x[i] + b*y[i] (single-pass; calls raw::axpby)
Definition array.cpp:9

num::kernel::array::axpbyz
void axpbyz(real a, const Vector &x, real b, const Vector &y, Vector &z, seq_t) noexcept
Sequential: z[i] = a*x[i] + b*y[i].
Definition array.cpp:27

num::kernel::raw::axpby
NUM_K_AINLINE void axpby(T *NUM_K_RESTRICT y, const T *NUM_K_RESTRICT x, T a, T b, idx n) noexcept
y[i] = a*x[i] + b*y[i].
Definition raw.hpp:46

num::kernel::raw::axpbyz
NUM_K_AINLINE void axpbyz(T *NUM_K_RESTRICT z, const T *NUM_K_RESTRICT x, const T *NUM_K_RESTRICT y, T a, T b, idx n) noexcept
z[i] = a*x[i] + b*y[i].
Definition raw.hpp:59

num::real
double real
Definition types.hpp:10

num::idx
std::size_t idx
Definition types.hpp:11

raw.hpp
Tier-1 kernel: raw-pointer, inline, zero-overhead inner loops.

num::kernel::par_t
Parallel execution policy tag.
Definition policy.hpp:13

num::kernel::seq_t
Sequential execution policy tag.
Definition policy.hpp:10