nda/latest/gemv_8hpp_source.html

// Copyright (c) 2019-2023 Simons Foundation

//

// Licensed under the Apache License, Version 2.0 (the "License");

// you may not use this file except in compliance with the License.

// You may obtain a copy of the License at

//

//     http://www.apache.org/licenses/LICENSE-2.0.txt

//

// Unless required by applicable law or agreed to in writing, software

// distributed under the License is distributed on an "AS IS" BASIS,

// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

// See the License for the specific language governing permissions and

// limitations under the License.

//

// Authors: Miguel Morales, Olivier Parcollet, Nils Wentzell


#pragma once


#include "./interface/cxx_interface.hpp"

#include "./tools.hpp"

#include "../concepts.hpp"

#include "../macros.hpp"

#include "../mem/address_space.hpp"

#include "../traits.hpp"


#ifndef NDA_HAVE_DEVICE

#include "../device.hpp"

#endif


#include <tuple>


namespace nda::blas {


  /**
   * @brief Loop-based matrix-vector product, usable with types that cannot be passed to BLAS.
   *
   * @details Updates `y` in place to `alpha * a * x + beta * y`. For every row `i`, the entry
   * `y(i)` is first replaced by `beta * y(i)` and then receives the terms
   * `alpha * a(i, k) * x(k)` one after the other, in increasing `k`.
   *
   * Note that `y(i)` is always read and multiplied by `beta`, i.e. there is no special
   * treatment of `beta == 0`.
   *
   * @tparam A Matrix-like type providing `extent(int)` and a two-index call operator.
   * @tparam X Vector-like type providing `extent(int)` and a one-index call operator.
   * @tparam Y Vector-like type providing `extent(int)` and a one-index call operator whose
   * result can be assigned to.
   * @param alpha Scalar factor applied to every product `a(i, k) * x(k)`.
   * @param a Input matrix.
   * @param x Input vector; its extent has to match the second extent of `a`.
   * @param beta Scalar factor applied to the incoming values of `y`.
   * @param y Input/output vector; its extent has to match the first extent of `a`.
   */
  template <typename A, typename X, typename Y>
  void gemv_generic(get_value_t<A> alpha, A const &a, X const &x, get_value_t<A> beta, Y &&y) { // NOLINT (temporary views are allowed here)
    // the shapes of the three operands have to be consistent with a matrix-vector product
    EXPECTS(a.extent(1) == x.extent(0));
    EXPECTS(a.extent(0) == y.extent(0));

    // the extents do not change while we iterate, so query them only once
    auto const n_rows = a.extent(0);
    auto const n_cols = a.extent(1);

    for (int row = 0; row < n_rows; ++row) {
      // rescale the old entry first ...
      y(row) = beta * y(row);

      // ... then accumulate the dot product of the current matrix row with x
      for (int col = 0; col < n_cols; ++col) {
        y(row) += alpha * a(row, col) * x(col);
      }
    }
  }


  /**
   * @brief Interface to the BLAS gemv routine.
   *
   * @details The matrix argument is either a memory matrix or a conjugate lazy expression.
   * In the latter case, the wrapped matrix is extracted and the conjugation is encoded in
   * the operation tag handed to the backend.
   *
   * The function
   * - checks at compile time that the address spaces of the matrix and both vectors are
   *   compatible,
   * - checks at runtime (via `EXPECTS`) that the shapes match and that the matrix and both
   *   vectors have a minimal stride of 1,
   * - selects the operation tag with `get_op`, requesting a transposition whenever the matrix
   *   does not have Fortran layout, and swaps the two dimensions for C layout matrices
   *   (presumably because the backend expects column-major storage),
   * - calls `device::gemv` if the address spaces are device compatible and `f77::gemv`
   *   otherwise. If the device path is selected but `NDA_HAVE_DEVICE` is not defined,
   *   `compile_error_no_gpu()` is called instead.
   *
   * @tparam A Matrix type: an nda::MemoryMatrix or a conjugate array expression.
   * @tparam X Memory vector type of the input vector.
   * @tparam Y Memory vector type of the input/output vector.
   * @param alpha Scalar forwarded as `alpha` to the gemv backend.
   * @param a Input matrix (or conjugate expression thereof).
   * @param x Input vector; its extent has to match the second extent of the matrix.
   * @param beta Scalar forwarded as `beta` to the gemv backend.
   * @param y Input/output vector; its extent has to match the first extent of the matrix.
   */
  template <Matrix A, MemoryVector X, MemoryVector Y>
    requires((MemoryMatrix<A> or is_conj_array_expr<A>) and have_same_value_type_v<A, X, Y> and is_blas_lapack_v<get_value_t<A>>)
  void gemv(get_value_t<A> alpha, A const &a, X const &x, get_value_t<A> beta, Y &&y) { // NOLINT (temporary views are allowed here)
    // a conjugate lazy expression only wraps the actual matrix: unwrap it, otherwise take the argument as is
    auto unwrap = []<Matrix M>(M const &arg) -> decltype(auto) {
      if constexpr (is_conj_array_expr<M>) {
        return std::get<0>(arg.a);
      } else {
        return arg;
      }
    };
    auto &mat = unwrap(a);

    // all operands have to live in compatible address spaces (checked at compile time)
    using mat_type = decltype(mat);
    static_assert(mem::have_compatible_addr_space<mat_type, X, Y>);

    // shapes have to be consistent and the minimal stride of every operand has to be 1 (checked at runtime)
    EXPECTS(mat.extent(1) == x.extent(0));
    EXPECTS(mat.extent(0) == y.extent(0));
    EXPECTS(mat.indexmap().min_stride() == 1);
    EXPECTS(x.indexmap().min_stride() == 1);
    EXPECTS(y.indexmap().min_stride() == 1);

    // operation tag: conjugation is taken from the argument type, transposition from the memory layout
    static constexpr bool conj_A = is_conj_array_expr<A>;
    char const trans             = get_op<conj_A, /* transpose = */ !has_F_layout<mat_type>>;

    // matrix dimensions as passed to the backend; they are exchanged for C layout matrices
    auto [blas_m, blas_n] = mat.shape();
    if constexpr (has_C_layout<mat_type>) { std::swap(blas_m, blas_n); }

    // leading dimension of the matrix and the increments of the two vectors
    auto const lda  = get_ld(mat);
    auto const incx = x.indexmap().strides()[0];
    auto const incy = y.indexmap().strides()[0];

    // dispatch to the device or the host implementation depending on the address spaces
    if constexpr (mem::have_device_compatible_addr_space<mat_type, X, Y>) {
#if defined(NDA_HAVE_DEVICE)
      device::gemv(trans, blas_m, blas_n, alpha, mat.data(), lda, x.data(), incx, beta, y.data(), incy);
#else
      compile_error_no_gpu();
#endif
    } else {
      f77::gemv(trans, blas_m, blas_n, alpha, mat.data(), lda, x.data(), incx, beta, y.data(), incy);
    }
  }


} // namespace nda::blas

address_space.hpp
Provides definitions and type traits involving the different memory address spaces supported by nda.

std::swap
void swap(nda::basic_array_view< V1, R1, LP1, A1, AP1, OP1 > &a, nda::basic_array_view< V2, R2, LP2, A2, AP2, OP2 > &b)=delete
std::swap is deleted for nda::basic_array_view.

cxx_interface.hpp
Provides a C++ interface for various BLAS routines.

nda::Matrix
Check if a given type is a matrix, i.e. an nda::ArrayOfRank<2>.
Definition concepts.hpp:290

nda::MemoryMatrix
Check if a given type is a memory matrix, i.e. an nda::MemoryArrayOfRank<2>.
Definition concepts.hpp:306

concepts.hpp
Provides concepts for the nda library.

device.hpp
Provides GPU and non-GPU specific functionality.

nda::have_same_value_type_v
constexpr bool have_same_value_type_v
Constexpr variable that is true if all types in As have the same value type as A0.
Definition traits.hpp:196

nda::get_value_t
std::decay_t< decltype(get_first_element(std::declval< A const  >()))> get_value_t
Get the value type of an array/view or a scalar type.
Definition traits.hpp:192

nda::blas::get_ld
int get_ld(A const &a)
Get the leading dimension in LAPACK jargon of an nda::MemoryMatrix.
Definition tools.hpp:109

nda::blas::has_C_layout
static constexpr bool has_C_layout
Constexpr variable that is true if the given nda::Array type has a C memory layout.
Definition tools.hpp:76

nda::blas::gemv_generic
void gemv_generic(get_value_t< A > alpha, A const &a, X const &x, get_value_t< A > beta, Y &&y)
Generic nda::blas::gemv implementation for types not supported by BLAS/LAPACK.
Definition gemv.hpp:57

nda::blas::is_conj_array_expr
static constexpr bool is_conj_array_expr
Constexpr variable that is true if the given type is a conjugate lazy expression.
Definition tools.hpp:52

nda::blas::gemv
void gemv(get_value_t< A > alpha, A const &a, X const &x, get_value_t< A > beta, Y &&y)
Interface to the BLAS gemv routine.
Definition gemv.hpp:89

nda::blas::has_F_layout
static constexpr bool has_F_layout
Constexpr variable that is true if the given nda::Array type has a Fortran memory layout.
Definition tools.hpp:66

nda::blas::get_op
const char get_op
Variable template that determines the BLAS matrix operation tag ('N','T','C') based on the given boolean flags for conjugation and transposition.
Definition tools.hpp:91

nda::mem::have_compatible_addr_space
static constexpr bool have_compatible_addr_space
Constexpr variable that is true if all given types have compatible address spaces.
Definition address_space.hpp:186

nda::mem::have_device_compatible_addr_space
static constexpr bool have_device_compatible_addr_space
Constexpr variable that is true if all given types have an address space compatible with Device.
Definition address_space.hpp:182

nda::compile_error_no_gpu
void compile_error_no_gpu()
Trigger a compilation error in case GPU specific functionality is used without configuring the project with GPU support.
Definition device.hpp:47

nda::is_blas_lapack_v
constexpr bool is_blas_lapack_v
Alias for nda::is_double_or_complex_v.
Definition traits.hpp:102

macros.hpp
Macros used in the nda library.

tools.hpp
Provides various traits and utilities for the BLAS interface.

traits.hpp
Provides type traits for the nda library.