nda/latest/ger_8hpp_source.html

// Copyright (c) 2019-2023 Simons Foundation

//

// Licensed under the Apache License, Version 2.0 (the "License");

// you may not use this file except in compliance with the License.

// You may obtain a copy of the License at

//

//     http://www.apache.org/licenses/LICENSE-2.0.txt

//

// Unless required by applicable law or agreed to in writing, software

// distributed under the License is distributed on an "AS IS" BASIS,

// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

// See the License for the specific language governing permissions and

// limitations under the License.

//

// Authors: Miguel Morales, Olivier Parcollet, Nils Wentzell


#pragma once


#include "./interface/cxx_interface.hpp"

#include "./tools.hpp"

#include "../basic_functions.hpp"

#include "../concepts.hpp"

#include "../exceptions.hpp"

#include "../layout_transforms.hpp"

#include "../macros.hpp"

#include "../mem/address_space.hpp"

#include "../stdutil/array.hpp"

#include "../traits.hpp"


#ifndef NDA_HAVE_DEVICE

#include "../device.hpp"

#endif


#include <array>


namespace nda::blas {


  /**
   * @brief Interface to the BLAS `ger` routine (rank-1 update of a matrix).
   *
   * @details Forwards the dimensions of `m`, the scalar `alpha`, the data pointers and strides of `x` and `y`, and
   * the data pointer and leading dimension of `m` to `f77::ger` or, if all three arguments have a device compatible
   * address space, to `device::ger`. In standard BLAS terms `ger` performs the update
   * \f$ \mathbf{M} \leftarrow \mathbf{M} + \alpha \mathbf{x} \mathbf{y}^T \f$.
   * NOTE(review): which `ger` flavour the backends select for complex value types is not visible here -- confirm
   * in `f77::ger` / `device::ger`.
   *
   * A matrix in C layout is handled by calling `ger` again on the transposed matrix with `x` and `y` swapped.
   *
   * The following preconditions are checked with `EXPECTS`:
   * - `m.extent(0) == x.extent(0)`
   * - `m.extent(1) == y.extent(0)`
   * - the smallest stride of `m` is 1
   *
   * @tparam X Type satisfying `MemoryVector`.
   * @tparam Y Type satisfying `MemoryVector`.
   * @tparam M Type satisfying `MemoryMatrix`.
   * @param alpha Scalar factor passed on to the BLAS routine.
   * @param x First input vector.
   * @param y Second input vector.
   * @param m Matrix that is passed to the BLAS routine and updated by it.
   */
  template <MemoryVector X, MemoryVector Y, MemoryMatrix M>
    requires(have_same_value_type_v<X, Y, M> and mem::have_compatible_addr_space<X, Y, M> and is_blas_lapack_v<get_value_t<X>>)
  void ger(get_value_t<X> alpha, X const &x, Y const &y, M &&m) { // NOLINT (temporary views are allowed here)
    // the shape of the matrix has to match the sizes of the two vectors
    EXPECTS(m.extent(0) == x.extent(0));
    EXPECTS(m.extent(1) == y.extent(0));

    // must be lapack compatible
    EXPECTS(m.indexmap().min_stride() == 1);

    // The layout is a property of the type M, so the dispatch is done at compile time: only the branch that is
    // actually taken gets instantiated.
    if constexpr (has_C_layout<M>) {
      // in C layout, call the routine on the transposed matrix with the roles of x and y exchanged
      ger(alpha, y, x, transpose(m));
    } else if constexpr (mem::have_device_compatible_addr_space<X, Y, M>) {
#if defined(NDA_HAVE_DEVICE)
      device::ger(m.extent(0), m.extent(1), alpha, x.data(), x.indexmap().strides()[0], y.data(), y.indexmap().strides()[0], m.data(), get_ld(m));
#else
      compile_error_no_gpu();
#endif
    } else {
      f77::ger(m.extent(0), m.extent(1), alpha, x.data(), x.indexmap().strides()[0], y.data(), y.indexmap().strides()[0], m.data(), get_ld(m));
    }
  }


  /**
   * @brief Calculate the outer product of two contiguous arrays/views/scalars.
   *
   * @details If at least one of the arguments is a scalar, the result is simply `a * b`.
   *
   * Otherwise both arguments are viewed as 1-dimensional vectors of length `a.size()` and `b.size()`, a
   * zero-initialized result with shape `join(a.shape(), b.shape())` is created and viewed as an
   * `a.size()`-by-`b.size()` matrix, and nda::blas::ger with a factor of 1 is used to fill it.
   *
   * An error is raised via `NDA_RUNTIME_ERROR` if one of the array arguments is not contiguous.
   *
   * @tparam A Type satisfying `ArrayOrScalar`.
   * @tparam B Type satisfying `ArrayOrScalar`.
   * @param a First array/view/scalar.
   * @param b Second array/view/scalar.
   * @return `a * b` in the scalar case, otherwise the newly created array holding the outer product.
   */
  template <ArrayOrScalar A, ArrayOrScalar B>
  auto outer_product(A const &a, B const &b) {
    if constexpr (not Scalar<A> and not Scalar<B>) {
      // both arguments are arrays: they have to be contiguous to be viewed as plain vectors
      if (not a.is_contiguous()) { NDA_RUNTIME_ERROR << "Error in nda::blas::outer_product: First argument has non-contiguous layout"; }
      if (not b.is_contiguous()) { NDA_RUNTIME_ERROR << "Error in nda::blas::outer_product: Second argument has non-contiguous layout"; }

      auto const n_a = a.size();
      auto const n_b = b.size();

      // zero-initialized result and a matrix view onto it
      auto result     = zeros<get_value_t<A>, mem::common_addr_space<A, B>>(stdutil::join(a.shape(), b.shape()));
      auto result_mat = reshape(result, std::array{n_a, n_b});

      // let BLAS ger do the actual work on the flattened arguments
      ger(1.0, reshape(a, std::array{n_a}), reshape(b, std::array{n_b}), result_mat);

      return result;
    } else {
      // at least one argument is a scalar
      return a * b;
    }
  }


} // namespace nda::blas

address_space.hpp
Provides definitions and type traits involving the different memory address spaces supported by nda.

array.hpp
Provides utility functions for std::array.

basic_functions.hpp
Provides basic functions to create and manipulate arrays and views.

cxx_interface.hpp
Provides a C++ interface for various BLAS routines.

nda::Scalar
Check if a given type is either an arithmetic or complex type.
Definition concepts.hpp:119

concepts.hpp
Provides concepts for the nda library.

device.hpp
Provides GPU and non-GPU specific functionality.

exceptions.hpp
Provides a custom runtime error class and macros to assert conditions and throw exceptions.

nda::zeros
auto zeros(std::array< Int, Rank > const &shape)
Make an array of the given shape on the given address space and zero-initialize it.
Definition basic_functions.hpp:61

nda::transpose
auto transpose(A &&a)
Transpose the memory layout of an nda::MemoryArray or an nda::expr_call.
Definition layout_transforms.hpp:188

nda::reshape
auto reshape(A &&a, std::array< Int, R > const &new_shape)
Reshape an nda::basic_array or nda::basic_array_view.
Definition layout_transforms.hpp:108

nda::have_same_value_type_v
constexpr bool have_same_value_type_v
Constexpr variable that is true if all types in As have the same value type as A0.
Definition traits.hpp:196

nda::get_value_t
std::decay_t< decltype(get_first_element(std::declval< A const  >()))> get_value_t
Get the value type of an array/view or a scalar type.
Definition traits.hpp:192

nda::blas::outer_product
auto outer_product(A const &a, B const &b)
Calculate the outer product of two contiguous arrays/views/scalars.
Definition ger.hpp:111

nda::blas::ger
void ger(get_value_t< X > alpha, X const &x, Y const &y, M &&m)
Interface to the BLAS ger routine.
Definition ger.hpp:68

nda::mem::have_compatible_addr_space
static constexpr bool have_compatible_addr_space
Constexpr variable that is true if all given types have compatible address spaces.
Definition address_space.hpp:186

nda::mem::have_device_compatible_addr_space
static constexpr bool have_device_compatible_addr_space
Constexpr variable that is true if all given types have an address space compatible with Device.
Definition address_space.hpp:182

nda::mem::common_addr_space
constexpr AddressSpace common_addr_space
Get common address space for a number of given nda::MemoryArray types.
Definition address_space.hpp:120

nda::compile_error_no_gpu
void compile_error_no_gpu()
Trigger a compilation error in case GPU specific functionality is used without configuring the project with GPU support.
Definition device.hpp:47

nda::stdutil::join
constexpr std::array< T, R1+R2 > join(std::array< T, R1 > const &a1, std::array< T, R2 > const &a2)
Make a new std::array by joining two existing std::array objects.
Definition array.hpp:309

nda::is_blas_lapack_v
constexpr bool is_blas_lapack_v
Alias for nda::is_double_or_complex_v.
Definition traits.hpp:102

layout_transforms.hpp
Provides functions to transform the memory layout of an nda::basic_array or nda::basic_array_view.

macros.hpp
Macros used in the nda library.

tools.hpp
Provides various traits and utilities for the BLAS interface.

traits.hpp
Provides type traits for the nda library.