@@ -116,11 +116,6 @@ void gpu_ddot(cublasHandle_t handle, const int64_t n, const double* x, const int
116
116
assert ( (int64_t ) incy_ == incy );
117
117
118
118
cublasStatus_t rc = cublasDdot (handle , n_ , x , incx_ , y , incy_ , result );
119
- /*
120
- double alpha = 1.0;
121
- double beta = 0.0;
122
- cublasStatus_t rc = cublasDgemm(handle, CUBLAS_OP_N, CUBLAS_OP_N, 1, 1, n_, &alpha, x, 1, y, n_, &beta, &result_, 1);
123
- */
124
119
assert (rc == CUBLAS_STATUS_SUCCESS );
125
120
}
126
121
@@ -149,8 +144,8 @@ void gpu_sdot(cublasHandle_t handle, const int64_t n, const float* x, const int6
149
144
150
145
151
146
152
- void gpu_dgemv (cublasHandle_t handle , const char * transa , const int64_t m , const int64_t n , const double alpha ,
153
- const double * a , const int64_t lda , const double * x , const int64_t incx , const double beta , double * y , const int64_t incy ) {
147
+ void gpu_dgemv (cublasHandle_t handle , const char * transa , const int64_t m , const int64_t n , const double * alpha ,
148
+ const double * a , const int64_t lda , const double * x , const int64_t incx , const double * beta , double * y , const int64_t incy ) {
154
149
155
150
assert (handle != NULL );
156
151
@@ -173,13 +168,13 @@ void gpu_dgemv(cublasHandle_t handle, const char* transa, const int64_t m, const
173
168
cublasOperation_t transa_ = CUBLAS_OP_N ;
174
169
if (* transa == 'T' || * transa == 't' ) transa_ = CUBLAS_OP_T ;
175
170
176
- cublasDgemv (handle , transa_ , m_ , n_ , & alpha , a , lda_ , x , incx_ , & beta , y , incy_ );
171
+ cublasDgemv (handle , transa_ , m_ , n_ , alpha , a , lda_ , x , incx_ , beta , y , incy_ );
177
172
}
178
173
179
174
180
175
181
- void gpu_sgemv (cublasHandle_t handle , const char * transa , const int64_t m , const int64_t n , const float alpha ,
182
- const float * a , const int64_t lda , const float * x , const int64_t incx , const float beta , float * y , const int64_t incy ) {
176
+ void gpu_sgemv (cublasHandle_t handle , const char * transa , const int64_t m , const int64_t n , const float * alpha ,
177
+ const float * a , const int64_t lda , const float * x , const int64_t incx , const float * beta , float * y , const int64_t incy ) {
183
178
184
179
assert (handle != NULL );
185
180
@@ -202,12 +197,12 @@ void gpu_sgemv(cublasHandle_t handle, const char* transa, const int64_t m, const
202
197
cublasOperation_t transa_ = CUBLAS_OP_N ;
203
198
if (* transa == 'T' || * transa == 't' ) transa_ = CUBLAS_OP_T ;
204
199
205
- cublasSgemv (handle , transa_ , m_ , n_ , & alpha , a , lda_ , x , incx_ , & beta , y , incy_ );
200
+ cublasSgemv (handle , transa_ , m_ , n_ , alpha , a , lda_ , x , incx_ , beta , y , incy_ );
206
201
}
207
202
208
203
209
- void gpu_dgemm (cublasHandle_t handle , const char * transa , const char * transb , const int64_t m , const int64_t n , const int64_t k , const double alpha ,
210
- const double * a , const int64_t lda , const double * b , const int64_t ldb , const double beta , double * c , const int64_t ldc ) {
204
+ void gpu_dgemm (cublasHandle_t handle , const char * transa , const char * transb , const int64_t m , const int64_t n , const int64_t k , const double * alpha ,
205
+ const double * a , const int64_t lda , const double * b , const int64_t ldb , const double * beta , double * c , const int64_t ldc ) {
211
206
212
207
assert (handle != NULL );
213
208
@@ -234,13 +229,13 @@ void gpu_dgemm(cublasHandle_t handle, const char* transa, const char* transb, co
234
229
if (* transa == 'T' || * transa == 't' ) transa_ = CUBLAS_OP_T ;
235
230
if (* transb == 'T' || * transb == 't' ) transb_ = CUBLAS_OP_T ;
236
231
237
- cublasDgemm (handle , transa_ , transb_ , m_ , n_ , k_ , & alpha , a , lda_ , b , ldb_ , & beta , c , ldc_ );
232
+ cublasDgemm (handle , transa_ , transb_ , m_ , n_ , k_ , alpha , a , lda_ , b , ldb_ , beta , c , ldc_ );
238
233
}
239
234
240
235
241
236
242
- void gpu_sgemm (cublasHandle_t handle , const char * transa , const char * transb , const int64_t m , const int64_t n , const int64_t k , const float alpha ,
243
- const float * a , const int64_t lda , const float * b , const int64_t ldb , const float beta , float * c , const int64_t ldc ) {
237
+ void gpu_sgemm (cublasHandle_t handle , const char * transa , const char * transb , const int64_t m , const int64_t n , const int64_t k , const float * alpha ,
238
+ const float * a , const int64_t lda , const float * b , const int64_t ldb , const float * beta , float * c , const int64_t ldc ) {
244
239
245
240
assert (handle != NULL );
246
241
@@ -267,12 +262,12 @@ void gpu_sgemm(cublasHandle_t handle, const char* transa, const char* transb, co
267
262
if (* transa == 'T' || * transa == 't' ) transa_ = CUBLAS_OP_T ;
268
263
if (* transb == 'T' || * transb == 't' ) transb_ = CUBLAS_OP_T ;
269
264
270
- cublasSgemm (handle , transa_ , transb_ , m_ , n_ , k_ , & alpha , a , lda_ , b , ldb_ , & beta , c , ldc_ );
265
+ cublasSgemm (handle , transa_ , transb_ , m_ , n_ , k_ , alpha , a , lda_ , b , ldb_ , beta , c , ldc_ );
271
266
}
272
267
273
268
274
- void gpu_dgeam (cublasHandle_t handle , const char * transa , const char * transb , const int64_t m , const int64_t n , const double alpha ,
275
- const double * a , const int64_t lda , const double beta , const double * b , const int64_t ldb , double * c , const int64_t ldc ) {
269
+ void gpu_dgeam (cublasHandle_t handle , const char * transa , const char * transb , const int64_t m , const int64_t n , const double * alpha ,
270
+ const double * a , const int64_t lda , const double * beta , const double * b , const int64_t ldb , double * c , const int64_t ldc ) {
276
271
assert (handle != NULL );
277
272
278
273
/* Convert to int */
@@ -296,13 +291,13 @@ void gpu_dgeam(cublasHandle_t handle, const char* transa, const char* transb, co
296
291
if (* transa == 'T' || * transa == 't' ) transa_ = CUBLAS_OP_T ;
297
292
if (* transb == 'T' || * transb == 't' ) transb_ = CUBLAS_OP_T ;
298
293
299
- cublasDgeam (handle , transa_ , transb_ , m_ , n_ , & alpha , a , lda_ , & beta , b , ldb_ , c , ldc_ );
294
+ cublasDgeam (handle , transa_ , transb_ , m_ , n_ , alpha , a , lda_ , beta , b , ldb_ , c , ldc_ );
300
295
301
296
}
302
297
303
298
304
- void gpu_sgeam (cublasHandle_t handle , const char * transa , const char * transb , const int64_t m , const int64_t n , const float alpha ,
305
- const float * a , const int64_t lda , const float beta , const float * b , const int64_t ldb , float * c , const int64_t ldc ) {
299
+ void gpu_sgeam (cublasHandle_t handle , const char * transa , const char * transb , const int64_t m , const int64_t n , const float * alpha ,
300
+ const float * a , const int64_t lda , const float * beta , const float * b , const int64_t ldb , float * c , const int64_t ldc ) {
306
301
assert (handle != NULL );
307
302
308
303
/* Convert to int */
@@ -326,6 +321,6 @@ void gpu_sgeam(cublasHandle_t handle, const char* transa, const char* transb, co
326
321
if (* transa == 'T' || * transa == 't' ) transa_ = CUBLAS_OP_T ;
327
322
if (* transb == 'T' || * transb == 't' ) transb_ = CUBLAS_OP_T ;
328
323
329
- cublasSgeam (handle , transa_ , transb_ , m_ , n_ , & alpha , a , lda_ , & beta , b , ldb_ , c , ldc_ );
324
+ cublasSgeam (handle , transa_ , transb_ , m_ , n_ , alpha , a , lda_ , beta , b , ldb_ , c , ldc_ );
330
325
331
326
}
0 commit comments