21#ifndef NDA_HAVE_DEVICE
47 template <Matrix A, Matrix B, MemoryMatrix C>
48 void gemm_generic(
typename A::value_type alpha, A
const &a, B
const &b,
typename A::value_type beta,
50 EXPECTS(a.extent(1) == b.extent(0));
51 EXPECTS(a.extent(0) == c.extent(0));
52 EXPECTS(b.extent(1) == c.extent(1));
53 for (
int i = 0; i < a.extent(0); ++i) {
54 for (
int j = 0; j < b.extent(1); ++j) {
55 c(i, j) = beta * c(i, j);
56 for (
int k = 0; k < a.extent(1); ++k) c(i, j) += alpha * a(i, k) * b(k, j);
87 template <Matrix A, Matrix B, MemoryMatrix C>
92 auto to_mat = []<
typename Z>(Z
const &z) ->
auto & {
94 return std::get<0>(z.a);
98 auto &mat_a = to_mat(a);
99 auto &mat_b = to_mat(b);
102 using mat_a_type =
decltype(mat_a);
103 using mat_b_type =
decltype(mat_b);
107 EXPECTS(mat_a.extent(1) == mat_b.extent(0));
108 EXPECTS(mat_a.extent(0) == c.extent(0));
109 EXPECTS(mat_b.extent(1) == c.extent(1));
110 EXPECTS(mat_a.indexmap().min_stride() == 1);
111 EXPECTS(mat_b.indexmap().min_stride() == 1);
112 EXPECTS(c.indexmap().min_stride() == 1);
122 auto [m, k] = mat_a.shape();
123 auto n = mat_b.extent(1);
126#if defined(NDA_HAVE_DEVICE)
127 device::gemm(op_a, op_b, m, n, k, alpha, mat_a.data(),
get_ld(mat_a), mat_b.data(),
get_ld(mat_b), beta, c.data(),
get_ld(c));
132 f77::gemm(op_a, op_b, m, n, k, alpha, mat_a.data(),
get_ld(mat_a), mat_b.data(),
get_ld(mat_b), beta, c.data(),
get_ld(c));
Provides definitions and type traits involving the different memory address spaces supported by nda.
Provides a C++ interface for various BLAS routines.
Check if a given type is a memory matrix, i.e. an nda::MemoryArrayOfRank<2>.
Provides concepts for the nda library.
Provides GPU and non-GPU specific functionality.
auto transpose(A &&a)
Transpose the memory layout of an nda::MemoryArray or an nda::expr_call.
constexpr bool have_same_value_type_v
Constexpr variable that is true if all types in As have the same value type as A0.
std::decay_t< decltype(get_first_element(std::declval< A const >()))> get_value_t
Get the value type of an array/view or a scalar type.
int get_ld(A const &a)
Get the leading dimension in LAPACK jargon of an nda::MemoryMatrix.
static constexpr bool has_C_layout
Constexpr variable that is true if the given nda::Array type has a C memory layout.
void gemm_generic(typename A::value_type alpha, A const &a, B const &b, typename A::value_type beta, C &&c)
Generic nda::blas::gemm implementation for types not supported by BLAS/LAPACK.
static constexpr bool is_conj_array_expr
Constexpr variable that is true if the given type is a conjugate lazy expression.
void gemm(get_value_t< A > alpha, A const &a, B const &b, get_value_t< A > beta, C &&c)
Interface to the BLAS gemm routine.
const char get_op
Variable template that determines the BLAS matrix operation tag ('N','T','C') based on the given boolean flags for conjugation and transposition.
static constexpr bool have_compatible_addr_space
Constexpr variable that is true if all given types have compatible address spaces.
static constexpr bool have_device_compatible_addr_space
Constexpr variable that is true if all given types have an address space compatible with Device.
void compile_error_no_gpu()
Trigger a compilation error in case GPU specific functionality is used without configuring the project with GPU support.
constexpr bool is_blas_lapack_v
Alias for nda::is_double_or_complex_v.
Macros used in the nda library.
Provides type traits for the nda library.