forked from project-asgard/kronmult
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathkgemm_nn_batched.cpp
39 lines (34 loc) · 1.28 KB
/
kgemm_nn_batched.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
#include "kroncommon.hpp"
#include "kgemm_nn_batched.hpp"
/// Double-precision entry point for the batched kgemm "nn" routine.
///
/// Forwards every argument unchanged to the kgemm_nn_batched<double>
/// template, which is declared outside this file. When USE_GPU is defined the
/// template is launched as a kernel on a grid of `batchCount` blocks with
/// 8 warps * 32 threads = 256 threads per block; otherwise it is called as an
/// ordinary host function.
///
/// NOTE(review): going by the name, each batch entry presumably computes
/// C = alpha * A * B + beta * C with neither operand transposed -- confirm
/// against the template definition.
///
/// @param mm,nn,kk     Matrix dimensions, passed through to the template.
/// @param alpha        Scalar passed through to the template.
/// @param Aarray_      Per-batch pointers for the A operands.
/// @param ldAarray_    Per-batch leading dimensions for A.
/// @param Barray_      Per-batch pointers for the B operands.
/// @param ldBarray_    Per-batch leading dimensions for B.
/// @param beta         Scalar passed through to the template.
/// @param Carray_      Per-batch pointers for the C operands.
/// @param ldCarray_    Per-batch leading dimensions for C.
/// @param batchCount   Number of batch entries; also used as the GPU grid size.
///
/// NOTE(review): in the GPU build the array arguments are handed straight to
/// the kernel, so they presumably must be device-accessible -- confirm with
/// callers.
void kgemm_nn_batched( int const mm, int const nn, int const kk,
                       double const alpha,
                       double* const Aarray_[],
                       int const ldAarray_[],
                       double* const Barray_[],
                       int const ldBarray_[],
                       double const beta,
                       double* const Carray_[],
                       int const ldCarray_[],
                       int const batchCount)
{
#ifdef USE_GPU
        // A kernel launch with a grid dimension of zero (or a negative value
        // converted to unsigned) is an invalid configuration and leaves a
        // launch error behind. An empty batch has no work, so skip the launch.
        if (batchCount <= 0) {
                return;
        }

        int constexpr warpsize = 32;
        int constexpr nwarps = 8;
        int constexpr nthreads = nwarps * warpsize;

        // One thread block per batch entry.
        kgemm_nn_batched<double><<< batchCount, nthreads >>>( mm, nn, kk,
                        alpha,
                        Aarray_, ldAarray_,
                        Barray_, ldBarray_,
                        beta,
                        Carray_, ldCarray_,
                        batchCount );
#else
        // Host build: plain function call into the template implementation.
        kgemm_nn_batched<double>( mm, nn, kk,
                        alpha,
                        Aarray_, ldAarray_,
                        Barray_, ldBarray_,
                        beta,
                        Carray_, ldCarray_,
                        batchCount );
#endif
}