nda/unstable/matmul_8hpp_source.html

// Copyright (c) 2019--present, The Simons Foundation

// This file is part of TRIQS/nda and is licensed under the Apache License, Version 2.0.

// SPDX-License-Identifier: Apache-2.0

// See LICENSE in the root of this distribution for details.


#pragma once


#include "../basic_functions.hpp"

#include "../blas/gemm.hpp"

#include "../blas/gemv.hpp"

#include "../blas/tools.hpp"

#include "../concepts.hpp"

#include "../declarations.hpp"

#include "../layout/policies.hpp"

#include "../mem/address_space.hpp"

#include "../mem/policies.hpp"

#include "../traits.hpp"


#include <type_traits>

#include <utility>


namespace nda {


  namespace detail {


    // Compile-time check whether the operand types A and B together with the result type C can be handed
    // to gemm as they are.
    //
    // gemm can only be called with the op tags 'N', 'T' or 'C', i.e. a conj expression is only acceptable
    // if its memory layout is the opposite of the layout of C:
    // - C in Fortran layout: a conj expression A/B must have C layout
    // - C in C layout: a conj expression A/B must have Fortran layout
    // Operands that are not conj expressions are accepted in either layout.
    //
    // A and B have to be memory matrices or conj expressions (enforced by the requires clause).
    template <Matrix A, Matrix B, MemoryMatrix C, bool conj_A = blas::is_conj_array_expr<A>, bool conj_B = blas::is_conj_array_expr<B>>
      requires((MemoryMatrix<A> or conj_A) and (MemoryMatrix<B> or conj_B))
    static constexpr bool is_valid_gemm_triple = []() {
      // layout of the result matrix decides which conj operands are acceptable
      constexpr bool result_is_F = blas::has_F_layout<C>;

      // an operand is fine if it is no conj expression or if its layout differs from the layout of C
      constexpr bool lhs_ok = !conj_A or (blas::has_F_layout<A> != result_is_F);
      constexpr bool rhs_ok = !conj_B or (blas::has_F_layout<B> != result_is_F);
      return lhs_ok and rhs_ok;
    }();


    // Get the layout policy for a given array type A, i.e. the `layout_policy_t` member type of the
    // (reference-stripped) type returned by calling make_regular on an object of type A.

    template <Array A>

    using get_layout_policy = typename std::remove_reference_t<decltype(make_regular(std::declval<A>()))>::layout_policy_t;


  } // namespace detail


  // Perform a matrix-matrix multiplication.
  //
  // The result is a newly allocated 'M' algebra basic_array of rank 2 with shape
  // (a.shape()[0], b.shape()[1]). Its value type is the type of the product of the value types of
  // A and B. Its layout policy is the layout policy of A if both operands have the same stride order
  // and C_layout otherwise. Its memory lives in the combined address space of both operands.
  //
  // a: left hand side matrix (a.shape()[1] has to be equal to b.shape()[0]).
  // b: right hand side matrix.
  template <Matrix A, Matrix B>
  auto matmul(A &&a, B &&b) { // NOLINT (temporary views are allowed here)
    // the inner dimensions of the operands have to agree
    EXPECTS_WITH_MESSAGE(a.shape()[1] == b.shape()[0], "Error in nda::matmul: Dimension mismatch in matrix-matrix product");

    // the address spaces of the operands have to be compatible
    static constexpr auto lhs_adr_spc = mem::get_addr_space<A>;
    static constexpr auto rhs_adr_spc = mem::get_addr_space<B>;
    mem::check_adr_sp_valid<lhs_adr_spc, rhs_adr_spc>();

    // value type, layout policy and type of the resulting matrix
    using value_t         = decltype(get_value_t<A>{} * get_value_t<B>{});
    using result_layout_t = std::conditional_t<get_layout_info<A>.stride_order == get_layout_info<B>.stride_order, // same stride order?
                                               detail::get_layout_policy<A>, C_layout>;
    using result_t        = basic_array<value_t, 2, result_layout_t, 'M', nda::heap<mem::combine<lhs_adr_spc, rhs_adr_spc>>>;

    // allocate the result and fill it with the product
    result_t result(a.shape()[0], b.shape()[1]);
    if constexpr (!is_blas_lapack_v<value_t>) {
      // value types not supported by BLAS are handled by the generic implementation
      blas::gemm_generic(1, a, b, 0, result);
    } else {
      // double or complex value types are handled by blas::gemm

      // Pass an operand through unchanged if it already has the result value type and is either a memory
      // matrix or a conj expression. Otherwise, build a new matrix of the result type from it.
      auto to_gemm_operand = []<Matrix M>(M &&m) -> decltype(auto) {
        constexpr bool has_result_value_t = std::is_same_v<get_value_t<M>, value_t>;
        constexpr bool is_gemm_compatible = MemoryMatrix<M> or blas::is_conj_array_expr<M>;
        if constexpr (has_result_value_t and is_gemm_compatible) {
          return std::forward<M>(m);
        } else {
          return result_t{std::forward<M>(m)};
        }
      };

      // The memory sanitizer has no way to know that gemm is called with beta = 0, so for MSAN builds only
      // we initialize the result explicitly. Production builds do not spend time on this.
#if defined(__has_feature)
#if __has_feature(memory_sanitizer)
      result = 0;
#endif
#endif

      using lhs_operand_t = decltype(to_gemm_operand(a));
      using rhs_operand_t = decltype(to_gemm_operand(b));
      if constexpr (!detail::is_valid_gemm_triple<lhs_operand_t, rhs_operand_t, result_t>) {
        // gemm cannot handle this combination directly: make both operands regular matrices first
        blas::gemm(1, make_regular(to_gemm_operand(a)), make_regular(to_gemm_operand(b)), 0, result);
      } else {
        // the operands can be passed to gemm as they are
        blas::gemm(1, to_gemm_operand(a), to_gemm_operand(b), 0, result);
      }
    }
    return result;
  }


  // Perform a matrix-vector multiplication.
  //
  // The result is a newly allocated nda::vector of size a.shape()[0] living in the (common) address
  // space of the operands. Its value type is the type of the product of the value types of A and X.
  //
  // a: matrix (a.shape()[1] has to be equal to x.shape()[0]).
  // x: vector.
  //
  // Both arguments must live in the same address space, which must not be mem::None (checked at
  // compile time).
  template <Matrix A, Vector X>
  auto matvecmul(A &&a, X &&x) { // NOLINT (temporary views are allowed here)
    // check dimensions
    EXPECTS_WITH_MESSAGE(a.shape()[1] == x.shape()[0], "Error in nda::matvecmul: Dimension mismatch in matrix-vector product");

    // check address space compatibility
    static constexpr auto L_adr_spc = mem::get_addr_space<A>;
    static constexpr auto R_adr_spc = mem::get_addr_space<X>;
    static_assert(L_adr_spc == R_adr_spc, "Error in nda::matvecmul: Matrix-vector product requires arguments with same address spaces");
    static_assert(L_adr_spc != mem::None);

    // get resulting value type and vector type
    using value_t  = decltype(get_value_t<A>{} * get_value_t<X>{});
    using vector_t = vector<value_t, heap<L_adr_spc>>;

    // perform matrix-vector multiplication
    auto result = vector_t(a.shape()[0]);
    if constexpr (is_blas_lapack_v<value_t>) {
      // for double or complex value types we use blas::gemv

      // Lambda to form a new array with the correct value type if necessary. It is applied to the matrix
      // as well as to the vector argument, so the pass-through test must accept memory arrays of any rank
      // (MemoryArray). Testing for MemoryMatrix here would never match the rank-1 vector and force a copy
      // of x on every call. Conj expressions are only passed through for matrices.
      auto as_container = []<Array B>(B &&b) -> decltype(auto) {
        if constexpr (std::is_same_v<get_value_t<B>, value_t> and (MemoryArray<B> or (Matrix<B> and blas::is_conj_array_expr<B>)))
          return std::forward<B>(b);
        else
          return basic_array<value_t, get_rank<B>, C_layout, 'A', heap<L_adr_spc>>{std::forward<B>(b)};
      };

      // The memory sanitizer has no way to know that gemv is called with beta = 0, so for MSAN builds only
      // we initialize the result explicitly. Production builds do not spend time on this.
#if defined(__has_feature)
#if __has_feature(memory_sanitizer)
      result = 0;
#endif
#endif

      // for expressions of the kind 'conj(M) * V' with a Matrix in Fortran Layout, we have to explicitly
      // form the conj operation in memory as gemv only provides op tags 'N', 'T' and 'C' (hermitian conjugate)
      if constexpr (blas::is_conj_array_expr<decltype(as_container(a))> and blas::has_F_layout<decltype(as_container(a))>) {
        blas::gemv(1, make_regular(as_container(a)), as_container(x), 0, result);
      } else {
        blas::gemv(1, as_container(a), as_container(x), 0, result);
      }
    } else {
      // for other value types we use a generic implementation
      blas::gemv_generic(1, a, x, 0, result);
    }
    return result;
  }


} // namespace nda

address_space.hpp
Provides definitions and type traits involving the different memory address spaces supported by nda.

basic_functions.hpp
Provides basic functions to create and manipulate arrays and views.

nda::basic_array
A generic multi-dimensional array.
Definition basic_array.hpp:100

nda::Array
Check if a given type satisfies the array concept.
Definition concepts.hpp:230

nda::Matrix
Check if a given type is a matrix, i.e. an nda::ArrayOfRank<2>.
Definition concepts.hpp:290

nda::MemoryMatrix
Check if a given type is a memory matrix, i.e. an nda::MemoryArrayOfRank<2>.
Definition concepts.hpp:306

concepts.hpp
Provides concepts for the nda library.

declarations.hpp
Provides various convenient aliases and helper functions for nda::basic_array and nda::basic_array_view.

gemm.hpp
Provides a generic interface to the BLAS gemm routine.

gemv.hpp
Provides a generic interface to the BLAS gemv routine.

nda::make_regular
decltype(auto) make_regular(A &&a)
Make a given object regular.
Definition basic_functions.hpp:225

nda::vector
basic_array< ValueType, 1, C_layout, 'V', ContainerPolicy > vector
Alias template of an nda::basic_array with rank 1 and a 'V' algebra.
Definition declarations.hpp:145

nda::get_value_t
std::decay_t< decltype(get_first_element(std::declval< A const  >()))> get_value_t
Get the value type of an array/view or a scalar type.
Definition traits.hpp:182

nda::get_layout_info
constexpr layout_info_t get_layout_info
Constexpr variable that specifies the nda::layout_info_t of type A.
Definition traits.hpp:311

nda::blas::gemm_generic
void gemm_generic(typename A::value_type alpha, A const &a, B const &b, typename A::value_type beta, C &&c)
Generic nda::blas::gemm implementation for types not supported by BLAS/LAPACK.
Definition gemm.hpp:48

nda::blas::gemv_generic
void gemv_generic(get_value_t< A > alpha, A const &a, X const &x, get_value_t< A > beta, Y &&y)
Generic nda::blas::gemv implementation for types not supported by BLAS/LAPACK.
Definition gemv.hpp:46

nda::blas::is_conj_array_expr
static constexpr bool is_conj_array_expr
Constexpr variable that is true if the given type is a conjugate lazy expression.
Definition tools.hpp:41

nda::blas::gemv
void gemv(get_value_t< A > alpha, A const &a, X const &x, get_value_t< A > beta, Y &&y)
Interface to the BLAS gemv routine.
Definition gemv.hpp:84

nda::blas::has_F_layout
static constexpr bool has_F_layout
Constexpr variable that is true if the given nda::Array type has a Fortran memory layout.
Definition tools.hpp:55

nda::blas::gemm
void gemm(get_value_t< A > alpha, A const &a, B const &b, get_value_t< A > beta, C &&c)
Interface to the BLAS gemm routine.
Definition gemm.hpp:96

nda::matvecmul
auto matvecmul(A &&a, X &&x)
Perform a matrix-vector multiplication.
Definition matmul.hpp:141

nda::matmul
auto matmul(A &&a, B &&b)
Perform a matrix-matrix multiplication.
Definition matmul.hpp:76

nda::mem::get_addr_space
static constexpr AddressSpace get_addr_space
Variable template providing the address space for different types.
Definition address_space.hpp:69

nda::mem::check_adr_sp_valid
static const auto check_adr_sp_valid
Check validity of a set of nda::mem::AddressSpace values.
Definition address_space.hpp:140

nda::heap
heap_basic< mem::mallocator< AdrSp > > heap
Alias template of the nda::heap_basic policy using an nda::mem::mallocator.
Definition policies.hpp:52

nda::is_blas_lapack_v
constexpr bool is_blas_lapack_v
Alias for nda::is_double_or_complex_v.
Definition traits.hpp:92

policies.hpp
Provides definitions of various layout policies.

policies.hpp
Defines various memory handling policies.

nda::C_layout
Contiguous layout policy with C-order (row-major order).
Definition policies.hpp:36

tools.hpp
Provides various traits and utilities for the BLAS interface.

traits.hpp
Provides type traits for the nda library.