/*
 * gpu_upload - transfer entry point taking a read-only cpu_ptr, a writable
 * gpu_ptr and a length n.
 *
 * NOTE(review): presumably copies host memory to device memory; whether n
 * counts bytes or elements is not visible from this declaration - confirm
 * against the implementation.
 */
void gpu_upload(const void* cpu_ptr,
                void* gpu_ptr,
                const int64_t n);
/*
 * gpu_download - transfer entry point taking a read-only gpu_ptr, a writable
 * cpu_ptr and a length n.
 *
 * NOTE(review): presumably copies device memory back to host memory; the
 * unit of n (bytes vs. elements) is not visible from this declaration -
 * confirm against the implementation.
 */
void gpu_download(const void* gpu_ptr,
                  void* cpu_ptr,
                  const int64_t n);
/*
 * gpu_copy - transfer entry point taking a read-only gpu_ptr_src, a writable
 * gpu_ptr_dest and a length n.
 *
 * NOTE(review): presumably a device-to-device copy; the unit of n (bytes vs.
 * elements) is not visible from this declaration - confirm against the
 * implementation.
 */
void gpu_copy(const void* gpu_ptr_src,
              void* gpu_ptr_dest,
              const int64_t n);
/*
 * gpu_ddot - double-precision dot-product entry point.
 *
 * The parameter list mirrors BLAS DDOT (n, x/incx, y/incy) with an opaque
 * handle first and the scalar output written through `result`.
 *
 * NOTE(review): presumably forwards to the GPU BLAS library; whether x, y
 * and result must be device or host pointers is not visible here - confirm.
 */
void gpu_ddot(const void* handle,
              const int64_t n,
              const double* x,
              const int64_t incx,
              const double* y,
              const int64_t incy,
              double* result);
/*
 * gpu_sdot - single-precision dot-product entry point.
 *
 * The parameter list mirrors BLAS SDOT (n, x/incx, y/incy) with an opaque
 * handle first and the scalar output written through `result`.
 *
 * NOTE(review): presumably forwards to the GPU BLAS library; whether x, y
 * and result must be device or host pointers is not visible here - confirm.
 */
void gpu_sdot(const void* handle,
              const int64_t n,
              const float* x,
              const int64_t incx,
              const float* y,
              const int64_t incy,
              float* result);
/*
 * gpu_dgemv - double-precision matrix-vector product entry point.
 *
 * The parameter list mirrors BLAS DGEMV (trans, m, n, alpha, A/lda, x/incx,
 * beta, y/incy) with an opaque handle first. alpha and beta are passed by
 * pointer; y is the only writable operand.
 *
 * NOTE(review): presumably forwards to the GPU BLAS library; the accepted
 * values of transa and the memory space of alpha/beta are not visible here -
 * confirm against the implementation.
 */
void gpu_dgemv(const void* handle,
               const char transa,
               const int64_t m,
               const int64_t n,
               const double* alpha,
               const double* a,
               const int64_t lda,
               const double* x,
               const int64_t incx,
               const double* beta,
               double* y,
               const int64_t incy);
/*
 * gpu_sgemv - single-precision matrix-vector product entry point.
 *
 * The parameter list mirrors BLAS SGEMV (trans, m, n, alpha, A/lda, x/incx,
 * beta, y/incy) with an opaque handle first. alpha and beta are passed by
 * pointer; y is the only writable operand.
 *
 * NOTE(review): presumably forwards to the GPU BLAS library; the accepted
 * values of transa and the memory space of alpha/beta are not visible here -
 * confirm against the implementation.
 */
void gpu_sgemv(const void* handle,
               const char transa,
               const int64_t m,
               const int64_t n,
               const float* alpha,
               const float* a,
               const int64_t lda,
               const float* x,
               const int64_t incx,
               const float* beta,
               float* y,
               const int64_t incy);
/*
 * gpu_dgemm - double-precision matrix-matrix product entry point.
 *
 * The parameter list mirrors BLAS DGEMM (transa, transb, m, n, k, alpha,
 * A/lda, B/ldb, beta, C/ldc) with an opaque handle first. alpha and beta are
 * passed by pointer; c is the only writable operand.
 *
 * NOTE(review): presumably forwards to the GPU BLAS library; the accepted
 * values of transa/transb and the memory space of alpha/beta are not visible
 * here - confirm against the implementation.
 */
void gpu_dgemm(const void* handle,
               const char transa,
               const char transb,
               const int64_t m,
               const int64_t n,
               const int64_t k,
               const double* alpha,
               const double* a,
               const int64_t lda,
               const double* b,
               const int64_t ldb,
               const double* beta,
               double* c,
               const int64_t ldc);
/*
 * gpu_sgemm - single-precision matrix-matrix product entry point.
 *
 * The parameter list mirrors BLAS SGEMM (transa, transb, m, n, k, alpha,
 * A/lda, B/ldb, beta, C/ldc) with an opaque handle first. alpha and beta are
 * passed by pointer; c is the only writable operand.
 *
 * NOTE(review): presumably forwards to the GPU BLAS library; the accepted
 * values of transa/transb and the memory space of alpha/beta are not visible
 * here - confirm against the implementation.
 */
void gpu_sgemm(const void* handle,
               const char transa,
               const char transb,
               const int64_t m,
               const int64_t n,
               const int64_t k,
               const float* alpha,
               const float* a,
               const int64_t lda,
               const float* b,
               const int64_t ldb,
               const float* beta,
               float* c,
               const int64_t ldc);
/*
 * gpu_dgeam - double-precision matrix add/transpose entry point.
 *
 * Takes an opaque handle, two transpose selectors, the m x n extent, and two
 * (scalar pointer, matrix, leading dimension) input groups - alpha/a/lda and
 * beta/b/ldb - followed by the writable output c with ldc.
 *
 * NOTE(review): the parameter order matches the cuBLAS geam extension
 * (C = alpha*op(A) + beta*op(B)); presumably this forwards to it - confirm
 * against the implementation, including whether c may alias a or b.
 */
void gpu_dgeam(const void* handle,
               const char transa,
               const char transb,
               const int64_t m,
               const int64_t n,
               const double* alpha,
               const double* a,
               const int64_t lda,
               const double* beta,
               const double* b,
               const int64_t ldb,
               double* c,
               const int64_t ldc);
/*
 * gpu_sgeam - single-precision matrix add/transpose entry point.
 *
 * Takes an opaque handle, two transpose selectors, the m x n extent, and two
 * (scalar pointer, matrix, leading dimension) input groups - alpha/a/lda and
 * beta/b/ldb - followed by the writable output c with ldc.
 *
 * NOTE(review): the parameter order matches the cuBLAS geam extension
 * (C = alpha*op(A) + beta*op(B)); presumably this forwards to it - confirm
 * against the implementation, including whether c may alias a or b.
 */
void gpu_sgeam(const void* handle,
               const char transa,
               const char transb,
               const int64_t m,
               const int64_t n,
               const float* alpha,
               const float* a,
               const int64_t lda,
               const float* beta,
               const float* b,
               const int64_t ldb,
               float* c,
               const int64_t ldc);
/*
 * Flat list of the gpu_* entry-point declarations, one per line.
 * Only the signatures are given here; the behaviour of each function is
 * defined by the implementation, which is not part of this listing.
 */
void gpu_set_stream(void *handle, void *stream);
void gpu_blas_destroy(void **handle);
void gpu_stream_create(void **ptr);
void gpu_sdot(const void *handle, const int64_t n, const float *x, const int64_t incx, const float *y, const int64_t incy, float *result);
void gpu_allocate(void **ptr, const int64_t n);
void gpu_free(void **ptr);
void gpu_copy(const void *gpu_ptr_src, void *gpu_ptr_dest, const int64_t n);
void gpu_set_device(int32_t i);
void gpu_upload(const void *cpu_ptr, void *gpu_ptr, const int64_t n);
void gpu_get_memory(size_t *free, size_t *total);
void gpu_ddot(const void *handle, const int64_t n, const double *x, const int64_t incx, const double *y, const int64_t incy, double *result);
void gpu_dgeam(const void *handle, const char transa, const char transb, const int64_t m, const int64_t n, const double *alpha, const double *a, const int64_t lda, const double *beta, const double *b, const int64_t ldb, double *c, const int64_t ldc);
void gpu_sgemm(const void *handle, const char transa, const char transb, const int64_t m, const int64_t n, const int64_t k, const float *alpha, const float *a, const int64_t lda, const float *b, const int64_t ldb, const float *beta, float *c, const int64_t ldc);
void gpu_download(const void *gpu_ptr, void *cpu_ptr, const int64_t n);
void gpu_dgemm(const void *handle, const char transa, const char transb, const int64_t m, const int64_t n, const int64_t k, const double *alpha, const double *a, const int64_t lda, const double *b, const int64_t ldb, const double *beta, double *c, const int64_t ldc);
void gpu_blas_create(void **handle);
void gpu_dgemv(const void *handle, const char transa, const int64_t m, const int64_t n, const double *alpha, const double *a, const int64_t lda, const double *x, const int64_t incx, const double *beta, double *y, const int64_t incy);
void gpu_sgeam(const void *handle, const char transa, const char transb, const int64_t m, const int64_t n, const float *alpha, const float *a, const int64_t lda, const float *beta, const float *b, const int64_t ldb, float *c, const int64_t ldc);
void gpu_sgemv(const void *handle, const char transa, const int64_t m, const int64_t n, const float *alpha, const float *a, const int64_t lda, const float *x, const int64_t incx, const float *beta, float *y, const int64_t incy);
void gpu_stream_destroy(void **ptr);