QMCPACK
cuBLAS_missing_functions.hpp File Reference
+ Include dependency graph for cuBLAS_missing_functions.hpp:
+ This graph shows which files directly or indirectly include this file:

Go to the source code of this file.

Namespaces

 qmcplusplus
 helper functions for EinsplineSetBuilder
 
 qmcplusplus::cuBLAS_MFs
 Implements selected batched BLAS level-1/level-2 routines in CUDA for the S/D/C/Z data types (float, double, std::complex<float>, std::complex<double>).
 

Functions

cudaError_t gemv_batched (cudaStream_t handle, const char trans, const int m, const int n, const float *alpha, const float *const A[], const int lda, const float *const x[], const int incx, const float *beta, float *const y[], const int incy, const int batch_count)
 Batched Xgemv (general matrix-vector multiply) API, where X is the S/D/C/Z type prefix. More...
 
cudaError_t gemv_batched (cudaStream_t handle, const char trans, const int m, const int n, const double *alpha, const double *const A[], const int lda, const double *const x[], const int incx, const double *beta, double *const y[], const int incy, const int batch_count)
 
cudaError_t gemv_batched (cudaStream_t handle, const char trans, const int m, const int n, const std::complex< float > *alpha, const std::complex< float > *const A[], const int lda, const std::complex< float > *const x[], const int incx, const std::complex< float > *beta, std::complex< float > *const y[], const int incy, const int batch_count)
 
cudaError_t gemv_batched (cudaStream_t handle, const char trans, const int m, const int n, const std::complex< double > *alpha, const std::complex< double > *const A[], const int lda, const std::complex< double > *const x[], const int incx, const std::complex< double > *beta, std::complex< double > *const y[], const int incy, const int batch_count)
 
cudaError_t ger_batched (cudaStream_t handle, const int m, const int n, const float *alpha, const float *const x[], const int incx, const float *const y[], const int incy, float *const A[], const int lda, const int batch_count)
 Batched Xger (rank-1 update) API, where X is the S/D/C/Z type prefix. More...
 
cudaError_t ger_batched (cudaStream_t handle, const int m, const int n, const double *alpha, const double *const x[], const int incx, const double *const y[], const int incy, double *const A[], const int lda, const int batch_count)
 
cudaError_t ger_batched (cudaStream_t handle, const int m, const int n, const std::complex< float > *alpha, const std::complex< float > *const x[], const int incx, const std::complex< float > *const y[], const int incy, std::complex< float > *const A[], const int lda, const int batch_count)
 
cudaError_t ger_batched (cudaStream_t handle, const int m, const int n, const std::complex< double > *alpha, const std::complex< double > *const x[], const int incx, const std::complex< double > *const y[], const int incy, std::complex< double > *const A[], const int lda, const int batch_count)
 
cudaError_t copy_batched (cudaStream_t hstream, const int n, const float *const in[], const int incx, float *const out[], const int incy, const int batch_count)
 Batched Xcopy (strided vector copy) API, where X is the S/D/C/Z type prefix. More...
 
cudaError_t copy_batched (cudaStream_t hstream, const int n, const double *const in[], const int incx, double *const out[], const int incy, const int batch_count)
 
cudaError_t copy_batched (cudaStream_t hstream, const int n, const std::complex< float > *const in[], const int incx, std::complex< float > *const out[], const int incy, const int batch_count)
 
cudaError_t copy_batched (cudaStream_t hstream, const int n, const std::complex< double > *const in[], const int incx, std::complex< double > *const out[], const int incy, const int batch_count)