27#ifndef math_templateCublas_hpp
28#define math_templateCublas_hpp
30#include <cuda_runtime.h>
52template <
typename floatT>
74template <
typename floatT>
106template <
typename dataT1,
typename dataT2>
130template <
typename floatT>
133 cublasOperation_t trans,
165template <
typename floatT>
168 cublasOperation_t trans,
182cublasStatus_t cublasTgemv<float>( cublasHandle_t handle,
183 cublasOperation_t trans,
196cublasStatus_t cublasTgemv<double>( cublasHandle_t handle,
197 cublasOperation_t trans,
210cublasStatus_t cublasTgemv<float>( cublasHandle_t handle,
211 cublasOperation_t trans,
221cublasStatus_t cublasTgemv<double>( cublasHandle_t handle,
222 cublasOperation_t trans,
cudaError_t elementwiseXxY(dataT1 *x, dataT2 *y, int size)
Calculates the element-wise product of two vectors, storing the result in the first.
cublasStatus_t cublasTaxpy(cublasHandle_t handle, int n, const floatT *alpha, const floatT *x, int incx, floatT *y, int incy)
Multiplies a vector by a scalar and adds the product to a second vector, which is overwritten by the result.
cublasStatus_t cublasTscal(cublasHandle_t handle, int n, const floatT *alpha, floatT *x, int incx)
Multiplies a vector by a scalar, overwriting the vector with the result.
cublasStatus_t cublasTgemv(cublasHandle_t handle, cublasOperation_t trans, int m, int n, const floatT *alpha, const floatT *A, int lda, const floatT *x, int incx, const floatT *beta, floatT *y, int incy)
Performs a matrix-vector multiplication.