nda/latest/cublas__interface_8hpp_source.html

// Copyright (c) 2022-2023 Simons Foundation

//

// Licensed under the Apache License, Version 2.0 (the "License");

// you may not use this file except in compliance with the License.

// You may obtain a copy of the License at

//

//     http://www.apache.org/licenses/LICENSE-2.0.txt

//

// Unless required by applicable law or agreed to in writing, software

// distributed under the License is distributed on an "AS IS" BASIS,

// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

// See the License for the specific language governing permissions and

// limitations under the License.

//

// Authors: Miguel Morales, Nils Wentzell


#pragma once


#include "../tools.hpp"


#ifndef NDA_HAVE_MAGMA

#include "../../exceptions.hpp"

#endif // NDA_HAVE_MAGMA


// Device-side BLAS entry points.
//
// This header only declares the functions (plus the fallback gemm_vbatch stubs used when Magma is
// not available); their definitions are not visible here. Parameter names follow the usual BLAS
// conventions (sizes M/N/K, leading dimensions LDA/LDB/LDC, vector increments incx/incy). The
// semantics sketched in the comments below are presumed to match the corresponding standard BLAS
// routines -- TODO confirm against the implementation file.
//
// Every routine comes in two overloads: one for double and one for dcomplex.
namespace nda::blas::device {

  // axpy: presumably Y <- alpha * x + Y for N elements with strides incx / incy.
  void axpy(int N, double alpha, const double *x, int incx, double *Y, int incy);
  void axpy(int N, dcomplex alpha, const dcomplex *x, int incx, dcomplex *Y, int incy);

  // copy: presumably Y <- x for N elements with strides incx / incy.
  void copy(int N, const double *x, int incx, double *Y, int incy);
  void copy(int N, const dcomplex *x, int incx, dcomplex *Y, int incy);

  // dot / dotc: scalar products of two strided vectors of length M. By BLAS naming, dotc is
  // presumably the variant that conjugates its first argument -- TODO confirm.
  double dot(int M, const double *x, int incx, const double *Y, int incy);
  dcomplex dot(int M, const dcomplex *x, int incx, const dcomplex *Y, int incy);
  dcomplex dotc(int M, const dcomplex *x, int incx, const dcomplex *Y, int incy);

  // gemm: matrix-matrix product, presumably C <- alpha * op_a(A) * op_b(B) + beta * C.
  // op_a / op_b are single-character operation selectors.
  void gemm(char op_a, char op_b, int M, int N, int K, double alpha, const double *A, int LDA, const double *B, int LDB, double beta, double *C,
            int LDC);
  void gemm(char op_a, char op_b, int M, int N, int K, dcomplex alpha, const dcomplex *A, int LDA, const dcomplex *B, int LDB, dcomplex beta,
            dcomplex *C, int LDC);

  // gemm_batch: gemm over batch_count matrices given as arrays of pointers (A, B, C). All
  // matrices in the batch share the same sizes and leading dimensions.
  void gemm_batch(char op_a, char op_b, int M, int N, int K, double alpha, const double **A, int LDA, const double **B, int LDB, double beta,
                  double **C, int LDC, int batch_count);
  void gemm_batch(char op_a, char op_b, int M, int N, int K, dcomplex alpha, const dcomplex **A, int LDA, const dcomplex **B, int LDB, dcomplex beta,
                  dcomplex **C, int LDC, int batch_count);

  // gemm_vbatch: batched gemm where sizes and leading dimensions are passed as arrays
  // (M, N, K, LDA, LDB, LDC are int pointers), i.e. they may vary per batch entry.
  //
  // Only declared when nda is built with Magma. Otherwise the inline stubs below are used; they
  // keep the exact same parameter lists so that callers compile in both configurations and the
  // missing backend is reported through NDA_RUNTIME_ERROR when the function is actually called.
#ifdef NDA_HAVE_MAGMA
  void gemm_vbatch(char op_a, char op_b, int *M, int *N, int *K, double alpha, const double **A, int *LDA, const double **B, int *LDB, double beta,
                   double **C, int *LDC, int batch_count);
  void gemm_vbatch(char op_a, char op_b, int *M, int *N, int *K, dcomplex alpha, const dcomplex **A, int *LDA, const dcomplex **B, int *LDB,
                   dcomplex beta, dcomplex **C, int *LDC, int batch_count);
#else
  // Parameters are intentionally left unnamed (names given in comments) to avoid unused-parameter
  // warnings. M, N and K must be int* here to mirror the Magma-enabled declaration above.
  inline void gemm_vbatch(char /*op_a*/, char /*op_b*/, int * /*M*/, int * /*N*/, int * /*K*/, double /*alpha*/, const double ** /*A*/,
                          int * /*LDA*/, const double ** /*B*/, int * /*LDB*/, double /*beta*/, double ** /*C*/, int * /*LDC*/,
                          int /*batch_count*/) {
    NDA_RUNTIME_ERROR << "nda::blas::device::gemm_vbatch requires Magma [https://icl.cs.utk.edu/magma/]. Configure nda with -DUse_Magma=ON";
  }
  inline void gemm_vbatch(char /*op_a*/, char /*op_b*/, int * /*M*/, int * /*N*/, int * /*K*/, dcomplex /*alpha*/, const dcomplex ** /*A*/,
                          int * /*LDA*/, const dcomplex ** /*B*/, int * /*LDB*/, dcomplex /*beta*/, dcomplex ** /*C*/, int * /*LDC*/,
                          int /*batch_count*/) {
    NDA_RUNTIME_ERROR << "nda::blas::device::gemm_vbatch requires Magma [https://icl.cs.utk.edu/magma/]. Configure nda with -DUse_Magma=ON";
  }
#endif

  // gemm_batch_strided: batched gemm where each operand is a single pointer plus a stride
  // (strideA / strideB / strideC), presumably the element offset between consecutive matrices
  // of the batch -- TODO confirm units against the implementation.
  void gemm_batch_strided(char op_a, char op_b, int M, int N, int K, double alpha, const double *A, int LDA, int strideA, const double *B, int LDB,
                          int strideB, double beta, double *C, int LDC, int strideC, int batch_count);
  void gemm_batch_strided(char op_a, char op_b, int M, int N, int K, dcomplex alpha, const dcomplex *A, int LDA, int strideA, const dcomplex *B,
                          int LDB, int strideB, dcomplex beta, dcomplex *C, int LDC, int strideC, int batch_count);

  // gemv: matrix-vector product, presumably Y <- alpha * op(A) * x + beta * Y.
  void gemv(char op, int M, int N, double alpha, const double *A, int LDA, const double *x, int incx, double beta, double *Y, int incy);
  void gemv(char op, int M, int N, dcomplex alpha, const dcomplex *A, int LDA, const dcomplex *x, int incx, dcomplex beta, dcomplex *Y, int incy);

  // ger: rank-1 update, presumably A <- alpha * x * Y^T + A (whether the complex overload
  // conjugates Y is not visible here -- TODO confirm).
  void ger(int M, int N, double alpha, const double *x, int incx, const double *Y, int incy, double *A, int LDA);
  void ger(int M, int N, dcomplex alpha, const dcomplex *x, int incx, const dcomplex *Y, int incy, dcomplex *A, int LDA);

  // scal: presumably x <- alpha * x for M elements with stride incx.
  void scal(int M, double alpha, double *x, int incx);
  void scal(int M, dcomplex alpha, dcomplex *x, int incx);

  // swap: exchanges the contents of two strided vectors of length N.
  void swap(int N, double *x, int incx, double *Y, int incy);     // NOLINT (this is a BLAS swap)
  void swap(int N, dcomplex *x, int incx, dcomplex *Y, int incy); // NOLINT (this is a BLAS swap)

} // namespace nda::blas::device

std::swap
void swap(nda::basic_array_view< V1, R1, LP1, A1, AP1, OP1 > &a, nda::basic_array_view< V2, R2, LP2, A2, AP2, OP2 > &b)=delete
std::swap is deleted for nda::basic_array_view.

exceptions.hpp
Provides a custom runtime error class and macros to assert conditions and throw exceptions.

nda::blas::gemm_batch_strided
void gemm_batch_strided(get_value_t< A > alpha, A const &a, B const &b, get_value_t< A > beta, C &&c)
Implements a strided batched version of nda::blas::gemm taking 3-dimensional arrays as arguments.
Definition gemm_batch.hpp:221

nda::dcomplex
std::complex< double > dcomplex
Alias for std::complex<double> type.
Definition tools.hpp:39

nda::blas::gemm_vbatch
void gemm_vbatch(get_value_t< A > alpha, std::vector< A > const &va, std::vector< B > const &vb, get_value_t< A > beta, std::vector< C > &vc)
Wrapper of nda::blas::gemm_batch that allows variable sized matrices.
Definition gemm_batch.hpp:199

nda::blas::dotc
auto dotc(X const &x, Y const &y)
Interface to the BLAS dotc routine.
Definition dot.hpp:103

nda::blas::gemv
void gemv(get_value_t< A > alpha, A const &a, X const &x, get_value_t< A > beta, Y &&y)
Interface to the BLAS gemv routine.
Definition gemv.hpp:89

nda::blas::dot
auto dot(X const &x, Y const &y)
Interface to the BLAS dot routine.
Definition dot.hpp:61

nda::blas::gemm
void gemm(get_value_t< A > alpha, A const &a, B const &b, get_value_t< A > beta, C &&c)
Interface to the BLAS gemm routine.
Definition gemm.hpp:101

nda::blas::ger
void ger(get_value_t< X > alpha, X const &x, Y const &y, M &&m)
Interface to the BLAS ger routine.
Definition ger.hpp:68

nda::blas::gemm_batch
void gemm_batch(get_value_t< A > alpha, std::vector< A > const &va, std::vector< B > const &vb, get_value_t< A > beta, std::vector< C > &vc)
Implements a batched version of nda::blas::gemm taking vectors of matrices as arguments.
Definition gemm_batch.hpp:69

tools.hpp
Provides various traits and utilities for the BLAS interface.