Skip to content

Commit 7ceb8fd

Browse files
committed
Finished r1
1 parent d686972 commit 7ceb8fd

File tree

5 files changed

+160
-202
lines changed

5 files changed

+160
-202
lines changed

plugins/local/gpu_nvidia/gpu.c

Lines changed: 18 additions & 23 deletions
Original file line number | Diff line number | Diff line change
@@ -116,11 +116,6 @@ void gpu_ddot(cublasHandle_t handle, const int64_t n, const double* x, const int
116116
assert ( (int64_t) incy_ == incy);
117117

118118
cublasStatus_t rc = cublasDdot(handle, n_, x, incx_, y, incy_, result);
119-
/*
120-
double alpha = 1.0;
121-
double beta = 0.0;
122-
cublasStatus_t rc = cublasDgemm(handle, CUBLAS_OP_N, CUBLAS_OP_N, 1, 1, n_, &alpha, x, 1, y, n_, &beta, &result_, 1);
123-
*/
124119
assert (rc == CUBLAS_STATUS_SUCCESS);
125120
}
126121

@@ -149,8 +144,8 @@ void gpu_sdot(cublasHandle_t handle, const int64_t n, const float* x, const int6
149144

150145

151146

152-
void gpu_dgemv(cublasHandle_t handle, const char* transa, const int64_t m, const int64_t n, const double alpha,
153-
const double* a, const int64_t lda, const double* x, const int64_t incx, const double beta, double* y, const int64_t incy) {
147+
void gpu_dgemv(cublasHandle_t handle, const char* transa, const int64_t m, const int64_t n, const double* alpha,
148+
const double* a, const int64_t lda, const double* x, const int64_t incx, const double* beta, double* y, const int64_t incy) {
154149

155150
assert (handle != NULL);
156151

@@ -173,13 +168,13 @@ void gpu_dgemv(cublasHandle_t handle, const char* transa, const int64_t m, const
173168
cublasOperation_t transa_ = CUBLAS_OP_N;
174169
if (*transa == 'T' || *transa == 't') transa_ = CUBLAS_OP_T;
175170

176-
cublasDgemv(handle, transa_, m_, n_, &alpha, a, lda_, x, incx_, &beta, y, incy_);
171+
cublasDgemv(handle, transa_, m_, n_, alpha, a, lda_, x, incx_, beta, y, incy_);
177172
}
178173

179174

180175

181-
void gpu_sgemv(cublasHandle_t handle, const char* transa, const int64_t m, const int64_t n, const float alpha,
182-
const float* a, const int64_t lda, const float* x, const int64_t incx, const float beta, float* y, const int64_t incy) {
176+
void gpu_sgemv(cublasHandle_t handle, const char* transa, const int64_t m, const int64_t n, const float* alpha,
177+
const float* a, const int64_t lda, const float* x, const int64_t incx, const float* beta, float* y, const int64_t incy) {
183178

184179
assert (handle != NULL);
185180

@@ -202,12 +197,12 @@ void gpu_sgemv(cublasHandle_t handle, const char* transa, const int64_t m, const
202197
cublasOperation_t transa_ = CUBLAS_OP_N;
203198
if (*transa == 'T' || *transa == 't') transa_ = CUBLAS_OP_T;
204199

205-
cublasSgemv(handle, transa_, m_, n_, &alpha, a, lda_, x, incx_, &beta, y, incy_);
200+
cublasSgemv(handle, transa_, m_, n_, alpha, a, lda_, x, incx_, beta, y, incy_);
206201
}
207202

208203

209-
void gpu_dgemm(cublasHandle_t handle, const char* transa, const char* transb, const int64_t m, const int64_t n, const int64_t k, const double alpha,
210-
const double* a, const int64_t lda, const double* b, const int64_t ldb, const double beta, double* c, const int64_t ldc) {
204+
void gpu_dgemm(cublasHandle_t handle, const char* transa, const char* transb, const int64_t m, const int64_t n, const int64_t k, const double* alpha,
205+
const double* a, const int64_t lda, const double* b, const int64_t ldb, const double* beta, double* c, const int64_t ldc) {
211206

212207
assert (handle != NULL);
213208

@@ -234,13 +229,13 @@ void gpu_dgemm(cublasHandle_t handle, const char* transa, const char* transb, co
234229
if (*transa == 'T' || *transa == 't') transa_ = CUBLAS_OP_T;
235230
if (*transb == 'T' || *transb == 't') transb_ = CUBLAS_OP_T;
236231

237-
cublasDgemm(handle, transa_, transb_, m_, n_, k_, &alpha, a, lda_, b, ldb_, &beta, c, ldc_);
232+
cublasDgemm(handle, transa_, transb_, m_, n_, k_, alpha, a, lda_, b, ldb_, beta, c, ldc_);
238233
}
239234

240235

241236

242-
void gpu_sgemm(cublasHandle_t handle, const char* transa, const char* transb, const int64_t m, const int64_t n, const int64_t k, const float alpha,
243-
const float* a, const int64_t lda, const float* b, const int64_t ldb, const float beta, float* c, const int64_t ldc) {
237+
void gpu_sgemm(cublasHandle_t handle, const char* transa, const char* transb, const int64_t m, const int64_t n, const int64_t k, const float* alpha,
238+
const float* a, const int64_t lda, const float* b, const int64_t ldb, const float* beta, float* c, const int64_t ldc) {
244239

245240
assert (handle != NULL);
246241

@@ -267,12 +262,12 @@ void gpu_sgemm(cublasHandle_t handle, const char* transa, const char* transb, co
267262
if (*transa == 'T' || *transa == 't') transa_ = CUBLAS_OP_T;
268263
if (*transb == 'T' || *transb == 't') transb_ = CUBLAS_OP_T;
269264

270-
cublasSgemm(handle, transa_, transb_, m_, n_, k_, &alpha, a, lda_, b, ldb_, &beta, c, ldc_);
265+
cublasSgemm(handle, transa_, transb_, m_, n_, k_, alpha, a, lda_, b, ldb_, beta, c, ldc_);
271266
}
272267

273268

274-
void gpu_dgeam(cublasHandle_t handle, const char* transa, const char* transb, const int64_t m, const int64_t n, const double alpha,
275-
const double* a, const int64_t lda, const double beta, const double* b, const int64_t ldb, double* c, const int64_t ldc) {
269+
void gpu_dgeam(cublasHandle_t handle, const char* transa, const char* transb, const int64_t m, const int64_t n, const double* alpha,
270+
const double* a, const int64_t lda, const double* beta, const double* b, const int64_t ldb, double* c, const int64_t ldc) {
276271
assert (handle != NULL);
277272

278273
/* Convert to int */
@@ -296,13 +291,13 @@ void gpu_dgeam(cublasHandle_t handle, const char* transa, const char* transb, co
296291
if (*transa == 'T' || *transa == 't') transa_ = CUBLAS_OP_T;
297292
if (*transb == 'T' || *transb == 't') transb_ = CUBLAS_OP_T;
298293

299-
cublasDgeam(handle, transa_, transb_, m_, n_, &alpha, a, lda_, &beta, b, ldb_, c, ldc_);
294+
cublasDgeam(handle, transa_, transb_, m_, n_, alpha, a, lda_, beta, b, ldb_, c, ldc_);
300295

301296
}
302297

303298

304-
void gpu_sgeam(cublasHandle_t handle, const char* transa, const char* transb, const int64_t m, const int64_t n, const float alpha,
305-
const float* a, const int64_t lda, const float beta, const float* b, const int64_t ldb, float* c, const int64_t ldc) {
299+
void gpu_sgeam(cublasHandle_t handle, const char* transa, const char* transb, const int64_t m, const int64_t n, const float* alpha,
300+
const float* a, const int64_t lda, const float* beta, const float* b, const int64_t ldb, float* c, const int64_t ldc) {
306301
assert (handle != NULL);
307302

308303
/* Convert to int */
@@ -326,6 +321,6 @@ void gpu_sgeam(cublasHandle_t handle, const char* transa, const char* transb, co
326321
if (*transa == 'T' || *transa == 't') transa_ = CUBLAS_OP_T;
327322
if (*transb == 'T' || *transb == 't') transb_ = CUBLAS_OP_T;
328323

329-
cublasSgeam(handle, transa_, transb_, m_, n_, &alpha, a, lda_, &beta, b, ldb_, c, ldc_);
324+
cublasSgeam(handle, transa_, transb_, m_, n_, alpha, a, lda_, beta, b, ldb_, c, ldc_);
330325

331326
}

0 commit comments

Comments (0)