numerics/api/backends_2gpu_2matrix_8cpp_source.html

/// @file core/backends/gpu/matrix.cpp

/// @brief GPU (CUDA) backend -- matrix operations

///

/// Thin shims that forward to the cuda:: kernel wrappers (cuda_ops.hpp).

/// Falls back to the sequential backend (num::backends::seq) when NUMERICS_HAS_CUDA is not defined.


#include "core/matrix.hpp"

#include "../seq/impl.hpp"

#include "core/parallel/cuda_ops.hpp"


namespace num::backends::gpu {


/// @brief Matrix-matrix product C = A * B for the GPU backend.
///
/// When NUMERICS_HAS_CUDA is defined, the device pointers returned by
/// gpu_data() and the dimensions (A.rows(), A.cols(), B.cols()) are handed to
/// cuda::matmul. Otherwise the call is delegated unchanged to the sequential
/// backend.
///
/// @param A Left operand.
/// @param B Right operand.
/// @param C Output matrix.
/// @note This shim performs no shape validation of its own.
void matmul(const Matrix& A, const Matrix& B, Matrix& C) {
#if !defined(NUMERICS_HAS_CUDA)
    // CPU-only build: delegate to the sequential implementation.
    num::backends::seq::matmul(A, B, C);
#else
    // cuda::matmul expects the dimensions in (m, k, n) order.
    const auto m = A.rows();
    const auto k = A.cols();
    const auto n = B.cols();
    cuda::matmul(A.gpu_data(), B.gpu_data(), C.gpu_data(), m, k, n);
#endif
}


/// @brief Matrix-vector product y = A * x for the GPU backend.
///
/// When NUMERICS_HAS_CUDA is defined, the device pointers returned by
/// gpu_data() and the dimensions of A are handed to cuda::matvec. Otherwise the
/// call is delegated unchanged to the sequential backend.
///
/// @param A Matrix operand.
/// @param x Input vector.
/// @param y Output vector.
/// @note This shim performs no shape validation of its own.
void matvec(const Matrix& A, const Vector& x, Vector& y) {
#if !defined(NUMERICS_HAS_CUDA)
    // CPU-only build: delegate to the sequential implementation.
    num::backends::seq::matvec(A, x, y);
#else
    // cuda::matvec expects the dimensions in (rows, cols) order.
    const auto n_rows = A.rows();
    const auto n_cols = A.cols();
    cuda::matvec(A.gpu_data(), x.gpu_data(), y.gpu_data(), n_rows, n_cols);
#endif
}


} // namespace num::backends::gpu

num::BasicMatrix< real >

num::BasicMatrix::rows
constexpr idx rows() const noexcept
Definition matrix.hpp:87

num::BasicMatrix::cols
constexpr idx cols() const noexcept
Definition matrix.hpp:88

num::BasicMatrix::gpu_data
T * gpu_data()
Definition matrix.hpp:116

num::BasicVector< real >

num::BasicVector::gpu_data
real * gpu_data()
Definition vector.hpp:118

cuda_ops.hpp
CUDA kernel wrappers.

matrix.hpp
Dense row-major matrix templated over scalar type T.

num::backends::gpu
Definition impl.hpp:8

num::backends::gpu::matmul
void matmul(const Matrix &A, const Matrix &B, Matrix &C)
Definition matrix.cpp:13

num::backends::gpu::matvec
void matvec(const Matrix &A, const Vector &x, Vector &y)
Definition matrix.cpp:21

num::backends::seq::matmul
void matmul(const Matrix &A, const Matrix &B, Matrix &C)
Definition matrix.cpp:10

num::backends::seq::matvec
void matvec(const Matrix &A, const Vector &x, Vector &y)
Definition matrix.cpp:20

num::cuda::matmul
void matmul(const real *A, const real *B, real *C, idx m, idx k, idx n)
C = A * B.
Definition cuda_stubs.cpp:37

num::cuda::matvec
void matvec(const real *A, const real *x, real *y, idx rows, idx cols)
y = A * x (row-major A)
Definition cuda_stubs.cpp:34