16#error "CUDA support is not enabled in this build of nda. Please configure and install nda with -DCUDASupport=ON"
23namespace nda::blas::device {
/// Prototype of the double-precision `axpy` routine (declaration only; no body is visible here).
///
/// NOTE(review): the semantics are inferred from standard BLAS naming, presumably
/// `Y <- alpha * x + Y` over `N` strided elements — confirm against the implementation.
///
/// @param N     presumably the number of elements processed
/// @param alpha scalar factor
/// @param x     read-only input buffer
/// @param incx  presumably the stride between consecutive elements of `x`
/// @param Y     writable buffer
/// @param incy  presumably the stride between consecutive elements of `Y`
void axpy(int N, double alpha, const double *x, int incx, double *Y, int incy);
/// Prototype of the double-precision `copy` routine (declaration only; no body is visible here).
///
/// NOTE(review): by BLAS naming this presumably copies `N` strided elements from `x`
/// into `Y` — confirm against the implementation.
///
/// @param N    presumably the number of elements processed
/// @param x    read-only input buffer
/// @param incx presumably the stride between consecutive elements of `x`
/// @param Y    writable buffer
/// @param incy presumably the stride between consecutive elements of `Y`
void copy(int N, const double *x, int incx, double *Y, int incy);
/// Prototype of the double-precision `dot` routine (declaration only; no body is visible here).
///
/// Both buffers are read-only and the result is returned by value.
/// NOTE(review): by BLAS naming this presumably returns the dot product of `M`
/// strided elements of `x` and `Y` — confirm against the implementation.
///
/// @param M    presumably the number of elements processed
/// @param x    first read-only input buffer
/// @param incx presumably the stride between consecutive elements of `x`
/// @param Y    second read-only input buffer
/// @param incy presumably the stride between consecutive elements of `Y`
/// @return a `double` result
double dot(int M, const double *x, int incx, const double *Y, int incy);
// Prototype of the double-precision `gemm` overload (declaration only).
// NOTE(review): this listing cuts the parameter list off after `double *C,`; the
// remaining parameter(s) and the closing `);` are not visible here, so the full
// signature must be confirmed against the original header.
// NOTE(review): by BLAS naming this presumably computes
// C <- alpha * op(A) * op(B) + beta * C, with `op_a`/`op_b` selecting the
// operation applied to A and B — confirm against the implementation.
35 void gemm(
char op_a,
char op_b,
int M,
int N,
int K,
double alpha,
const double *A,
int LDA,
const double *B,
int LDB,
double beta,
double *C,
// Prototype of the `dcomplex` `gemm` overload (declaration only).
// NOTE(review): this listing cuts the parameter list off after `dcomplex beta,`;
// the output argument(s) and the closing `);` are not visible here, so the full
// signature must be confirmed against the original header.
// NOTE(review): presumably the complex counterpart of the double-precision
// overload, following the same BLAS conventions — confirm.
37 void gemm(
char op_a,
char op_b,
int M,
int N,
int K,
dcomplex alpha,
const dcomplex *A,
int LDA,
const dcomplex *B,
int LDB,
dcomplex beta,
/// Prototype of the double-precision `gemm_batch` overload (declaration only; no body is visible here).
///
/// `A`, `B` and `C` are passed as pointer-to-pointer arguments together with a
/// `batch_count`; the dimensions and leading dimensions are plain `int`s.
/// NOTE(review): presumably one matrix pointer per batch entry, with every entry i
/// computing `C[i] <- alpha * op(A[i]) * op(B[i]) + beta * C[i]` — confirm against
/// the implementation.
///
/// @param op_a,op_b   operation selectors for `A` and `B` (BLAS-style characters, presumed)
/// @param M,N,K       matrix dimensions (presumed shared by all batch entries)
/// @param alpha,beta  scalar factors
/// @param A,B         read-only pointer arrays
/// @param LDA,LDB,LDC presumably the leading dimensions of the matrices
/// @param C           writable pointer array
/// @param batch_count presumably the number of batch entries
void gemm_batch(char op_a, char op_b, int M, int N, int K, double alpha, const double **A, int LDA,
                const double **B, int LDB, double beta, double **C, int LDC, int batch_count);
42 void gemm_batch(
char op_a,
char op_b,
int M,
int N,
int K,
dcomplex alpha,
const dcomplex **A,
int LDA,
const dcomplex **B,
int LDB,
dcomplex beta,
43 dcomplex **C,
int LDC,
int batch_count);
/// Prototype of the double-precision `gemm_vbatch` overload (declaration only; no body is visible here).
///
/// Unlike `gemm_batch`, the dimensions (`M`, `N`, `K`) and leading dimensions
/// (`LDA`, `LDB`, `LDC`) are passed as `int *` rather than `int`.
/// NOTE(review): presumably these are per-batch-entry arrays, i.e. a variable-size
/// batched matrix product — confirm against the implementation.
///
/// @param op_a,op_b   operation selectors for `A` and `B` (BLAS-style characters, presumed)
/// @param M,N,K       pointers to the matrix dimensions
/// @param alpha,beta  scalar factors
/// @param A,B         read-only pointer arrays
/// @param LDA,LDB,LDC pointers to the (presumed) leading dimensions
/// @param C           writable pointer array
/// @param batch_count presumably the number of batch entries
void gemm_vbatch(char op_a, char op_b, int *M, int *N, int *K, double alpha, const double **A, int *LDA,
                 const double **B, int *LDB, double beta, double **C, int *LDC, int batch_count);
48 void gemm_vbatch(
char op_a,
char op_b,
int *M,
int *N,
int *K,
dcomplex alpha,
const dcomplex **A,
int *LDA,
const dcomplex **B,
int *LDB,
51 inline void gemm_vbatch(
char,
char,
int *,
int *,
int *,
double,
const double **,
int *,
const double **,
int *,
double,
double **,
int *,
int) {
52 NDA_RUNTIME_ERROR <<
"nda::blas::device::gemmv_batch requires Magma [https://icl.cs.utk.edu/magma/]. Configure nda with -DUse_Magma=ON";
54 inline void gemm_vbatch(
char,
char,
int *,
int *,
int *,
dcomplex,
const dcomplex **,
int *,
const dcomplex **,
int *,
dcomplex,
dcomplex **,
int *,
56 NDA_RUNTIME_ERROR <<
"nda::blas::device::gemmv_batch requires Magma [https://icl.cs.utk.edu/magma/]. Configure nda with -DUse_Magma=ON";
/// Prototype of the double-precision `gemm_batch_strided` overload (declaration only; no body is visible here).
///
/// Each matrix argument is a single pointer accompanied by a leading dimension
/// and an `int` stride (`strideA`, `strideB`, `strideC`).
/// NOTE(review): presumably batch entry i lives at `ptr + i * stride` and every
/// entry computes `C_i <- alpha * op(A_i) * op(B_i) + beta * C_i` — confirm against
/// the implementation.
///
/// @param op_a,op_b               operation selectors for `A` and `B` (BLAS-style characters, presumed)
/// @param M,N,K                   matrix dimensions (presumed shared by all batch entries)
/// @param alpha,beta              scalar factors
/// @param A,B                     read-only matrix buffers
/// @param LDA,LDB,LDC             presumably the leading dimensions of the matrices
/// @param strideA,strideB,strideC presumably the element offsets between consecutive batch entries
/// @param C                       writable matrix buffer
/// @param batch_count             presumably the number of batch entries
void gemm_batch_strided(char op_a, char op_b, int M, int N, int K, double alpha, const double *A, int LDA,
                        int strideA, const double *B, int LDB, int strideB, double beta, double *C, int LDC,
                        int strideC, int batch_count);
62 void gemm_batch_strided(
char op_a,
char op_b,
int M,
int N,
int K,
dcomplex alpha,
const dcomplex *A,
int LDA,
int strideA,
const dcomplex *B,
63 int LDB,
int srideB,
dcomplex beta,
dcomplex *C,
int LDC,
int strideC,
int batch_count);
/// Prototype of the double-precision `gemv` overload (declaration only; no body is visible here).
///
/// NOTE(review): by BLAS naming this presumably computes
/// `Y <- alpha * op(A) * x + beta * Y` — confirm against the implementation.
///
/// @param op         operation selector for `A` (BLAS-style character, presumed)
/// @param M,N        presumably the dimensions of `A`
/// @param alpha,beta scalar factors
/// @param A          read-only matrix buffer
/// @param LDA        presumably the leading dimension of `A`
/// @param x          read-only vector buffer
/// @param incx       presumably the stride between consecutive elements of `x`
/// @param Y          writable vector buffer
/// @param incy       presumably the stride between consecutive elements of `Y`
void gemv(char op, int M, int N, double alpha, const double *A, int LDA, const double *x, int incx, double beta,
          double *Y, int incy);
66 void gemv(
char op,
int M,
int N,
dcomplex alpha,
const dcomplex *A,
int LDA,
const dcomplex *x,
int incx,
dcomplex beta,
dcomplex *Y,
int incy);
/// Prototype of the double-precision `ger` routine (declaration only; no body is visible here).
///
/// NOTE(review): by BLAS naming this presumably performs the rank-1 update
/// `A <- alpha * x * Y^T + A` — confirm against the implementation.
///
/// @param M,N   presumably the dimensions of `A`
/// @param alpha scalar factor
/// @param x     first read-only vector buffer
/// @param incx  presumably the stride between consecutive elements of `x`
/// @param Y     second read-only vector buffer
/// @param incy  presumably the stride between consecutive elements of `Y`
/// @param A     writable matrix buffer
/// @param LDA   presumably the leading dimension of `A`
void ger(int M, int N, double alpha, const double *x, int incx, const double *Y, int incy, double *A, int LDA);
/// Prototype of the double-precision `scal` routine (declaration only; no body is visible here).
///
/// NOTE(review): by BLAS naming this presumably scales `M` strided elements of `x`
/// by `alpha` in place — confirm against the implementation.
///
/// @param M     presumably the number of elements processed
/// @param alpha scalar factor
/// @param x     writable buffer
/// @param incx  presumably the stride between consecutive elements of `x`
void scal(int M, double alpha, double *x, int incx);
/// Prototype of the double-precision `swap` routine (declaration only; no body is visible here).
///
/// Both buffers are writable.
/// NOTE(review): by BLAS naming this presumably exchanges `N` strided elements
/// between `x` and `Y` — confirm against the implementation.
///
/// @param N    presumably the number of elements processed
/// @param x    first writable buffer
/// @param incx presumably the stride between consecutive elements of `x`
/// @param Y    second writable buffer
/// @param incy presumably the stride between consecutive elements of `Y`
void swap(int N, double *x, int incx, double *Y, int incy);
Provides a custom runtime error class and macros to assert conditions and throw exceptions.
std::complex< double > dcomplex
Alias for std::complex<double> type.