#include <cuda_runtime.h>
10 int max_m,
int max_n,
int max_k,
11 const int* m_d,
const int* n_d,
const int* k_d,
12 const T*
const* A_array_d,
const int* lda_d,
13 const T*
const* B_array_d,
const int* ldb_d,
14 double** C_array_d,
const int* ldc_d,
15 int batchCount, cudaStream_t stream,
16 const T* alpha =
nullptr);
25 int max_m,
int max_n,
int max_k,
26 const int* m_d,
const int* n_d,
const int* k_d,
27 const T*
const* A_array_d,
const int* lda_d,
28 const T*
const* B_array_d,
const int* ldb_d,
29 double** C_array_d,
const int* ldc_d,
30 int batchCount, cudaStream_t stream,
31 const T* alpha =
nullptr);
35 int max_m,
int max_n,
int max_k,
36 const int* m_d,
const int* n_d,
const int* k_d,
37 const double*
const* A_array_d,
const int* lda_d,
38 const double*
const* B_array_d,
const int* ldb_d,
39 double** C_array_d,
const int* ldc_d,
40 int batchCount, cudaStream_t stream,
41 const double* alpha =
nullptr)
43 gemm_nn_vbatch<double>(max_m, max_n, max_k,
44 m_d, n_d, k_d, A_array_d, lda_d, B_array_d, ldb_d,
45 C_array_d, ldc_d, batchCount, stream, alpha);
49 int max_m,
int max_n,
int max_k,
50 const int* m_d,
const int* n_d,
const int* k_d,
51 const double*
const* A_array_d,
const int* lda_d,
52 const double*
const* B_array_d,
const int* ldb_d,
53 double** C_array_d,
const int* ldc_d,
54 int batchCount, cudaStream_t stream,
55 const double* alpha =
nullptr)
59 gemm_tn_vbatch<double>(max_m, max_n, max_k,
60 m_d, n_d, k_d, A_array_d, lda_d, B_array_d, ldb_d,
61 C_array_d, ldc_d, batchCount, stream, alpha);
// Cross-reference index (documentation-generator residue, kept for reference; not code):
//
//   void dgemm_tn_vbatch(int max_m, int max_n, int max_k, const int *m_d, const int *n_d, const int *k_d, const double *const *A_array_d, const int *lda_d, const double *const *B_array_d, const int *ldb_d, double **C_array_d, const int *ldc_d, int batchCount, cudaStream_t stream, const double *alpha=nullptr)
//     Definition: dgemm_vbatch.h:48
//
//   void gemm_tn_vbatch(int max_m, int max_n, int max_k, const int *m_d, const int *n_d, const int *k_d, const T *const *A_array_d, const int *lda_d, const T *const *B_array_d, const int *ldb_d, double **C_array_d, const int *ldc_d, int batchCount, cudaStream_t stream, const T *alpha=nullptr)
//
//   void dgemm_nn_vbatch(int max_m, int max_n, int max_k, const int *m_d, const int *n_d, const int *k_d, const double *const *A_array_d, const int *lda_d, const double *const *B_array_d, const int *ldb_d, double **C_array_d, const int *ldc_d, int batchCount, cudaStream_t stream, const double *alpha=nullptr)
//     Definition: dgemm_vbatch.h:34
//
//   void gemm_nn_vbatch(int max_m, int max_n, int max_k, const int *m_d, const int *n_d, const int *k_d, const T *const *A_array_d, const int *lda_d, const T *const *B_array_d, const int *ldb_d, double **C_array_d, const int *ldc_d, int batchCount, cudaStream_t stream, const T *alpha=nullptr)
//
//   #define T
//     Definition: exp.cpp:237
//     (presumably a mis-resolved link: in the signatures above, T reads as the
//      template type parameter, not this macro; confirm)