# QMCPACK
Functions | |
void | gemm (BLASHandle< PlatformKind::CUDA > &handle, const char transa, const char transb, int m, int n, int k, const float &alpha, const float *A, int lda, const float *B, int ldb, const float &beta, float *C, int ldc) |
void | gemm (BLASHandle< PlatformKind::CUDA > &handle, const char transa, const char transb, int m, int n, int k, const double &alpha, const double *A, int lda, const double *B, int ldb, const double &beta, double *C, int ldc) |
void | gemm (BLASHandle< PlatformKind::CUDA > &handle, const char transa, const char transb, int m, int n, int k, const std::complex< float > &alpha, const std::complex< float > *A, int lda, const std::complex< float > *B, int ldb, const std::complex< float > &beta, std::complex< float > *C, int ldc) |
void | gemm (BLASHandle< PlatformKind::CUDA > &handle, const char transa, const char transb, int m, int n, int k, const std::complex< double > &alpha, const std::complex< double > *A, int lda, const std::complex< double > *B, int ldb, const std::complex< double > &beta, std::complex< double > *C, int ldc) |
void | gemv (BLASHandle< PlatformKind::CUDA > &handle, const char trans, const int m, const int n, const float &alpha, const float *const A, const int lda, const float *const x, const int incx, const float &beta, float *const y, const int incy) |
void | gemv (BLASHandle< PlatformKind::CUDA > &handle, const char trans, const int m, const int n, const double &alpha, const double *const A, const int lda, const double *const x, const int incx, const double &beta, double *const y, const int incy) |
void | gemv (BLASHandle< PlatformKind::CUDA > &handle, const char trans, const int m, const int n, const std::complex< float > &alpha, const std::complex< float > *A, const int lda, const std::complex< float > *x, const int incx, const std::complex< float > &beta, std::complex< float > *y, const int incy) |
void | gemv (BLASHandle< PlatformKind::CUDA > &handle, const char trans, const int m, const int n, const std::complex< double > &alpha, const std::complex< double > *A, const int lda, const std::complex< double > *x, const int incx, const std::complex< double > &beta, std::complex< double > *y, const int incy) |
template<typename T > | |
void | gemv_batched (BLASHandle< PlatformKind::CUDA > &handle, const char trans, const int m, const int n, const T *alpha, const T *const A[], const int lda, const T *const x[], const int incx, const T *beta, T *const y[], const int incy, const int batch_count) |
void | ger (BLASHandle< PlatformKind::CUDA > &handle, const int m, const int n, const float &alpha, const float *const x, const int incx, const float *const y, const int incy, float *const A, const int lda) |
void | ger (BLASHandle< PlatformKind::CUDA > &handle, const int m, const int n, const double &alpha, const double *const x, const int incx, const double *const y, const int incy, double *const A, const int lda) |
void | ger (BLASHandle< PlatformKind::CUDA > &handle, const int m, const int n, const std::complex< float > &alpha, const std::complex< float > *x, const int incx, const std::complex< float > *y, const int incy, std::complex< float > *A, const int lda) |
void | ger (BLASHandle< PlatformKind::CUDA > &handle, const int m, const int n, const std::complex< double > &alpha, const std::complex< double > *x, const int incx, const std::complex< double > *y, const int incy, std::complex< double > *A, const int lda) |
template<typename T > | |
void | ger_batched (BLASHandle< PlatformKind::CUDA > &handle, const int m, const int n, const T *alpha, const T *const x[], const int incx, const T *const y[], const int incy, T *const A[], const int lda, const int batch_count) |
template<typename T > | |
void | copy_batched (BLASHandle< PlatformKind::CUDA > &handle, const int n, const T *const in[], const int incx, T *const out[], const int incy, const int batch_count) |
void | gemm_batched (BLASHandle< PlatformKind::CUDA > &handle, const char transa, const char transb, int m, int n, int k, const float &alpha, const float *const A[], int lda, const float *const B[], int ldb, const float &beta, float *const C[], int ldc, int batchCount) |
void | gemm_batched (BLASHandle< PlatformKind::CUDA > &handle, const char transa, const char transb, int m, int n, int k, const std::complex< float > &alpha, const std::complex< float > *const A[], int lda, const std::complex< float > *const B[], int ldb, const std::complex< float > &beta, std::complex< float > *const C[], int ldc, int batchCount) |
void | gemm_batched (BLASHandle< PlatformKind::CUDA > &handle, const char transa, const char transb, int m, int n, int k, const double &alpha, const double *const A[], int lda, const double *const B[], int ldb, const double &beta, double *const C[], int ldc, int batchCount) |
void | gemm_batched (BLASHandle< PlatformKind::CUDA > &handle, const char transa, const char transb, int m, int n, int k, const std::complex< double > &alpha, const std::complex< double > *const A[], int lda, const std::complex< double > *const B[], int ldb, const std::complex< double > &beta, std::complex< double > *const C[], int ldc, int batchCount) |
template<typename T > | |
void | gemm (BLASHandle< PlatformKind::OMPTARGET > &handle, const char transa, const char transb, int m, int n, int k, const T &alpha, const T *A, int lda, const T *B, int ldb, const T &beta, T *C, int ldc) |
template<typename T > | |
void | gemm_batched (BLASHandle< PlatformKind::OMPTARGET > &handle, const char transa, const char transb, int m, int n, int k, const T &alpha, const T *const A[], int lda, const T *const B[], int ldb, const T &beta, T *const C[], int ldc, int batchCount) |
template<typename T > | |
void | gemv (BLASHandle< PlatformKind::OMPTARGET > &handle, const char trans, const int m, const int n, const T &alpha, const T *const A, const int lda, const T *const x, const int incx, const T &beta, T *const y, const int incy) |
template<typename T > | |
void | gemv_batched (BLASHandle< PlatformKind::OMPTARGET > &handle, const char trans, const int m, const int n, const T *alpha, const T *const A[], const int lda, const T *const x[], const int incx, const T *beta, T *const y[], const int incy, const int batch_count) |
template<typename T > | |
void | ger (BLASHandle< PlatformKind::OMPTARGET > &handle, const int m, const int n, const T &alpha, const T *const x, const int incx, const T *const y, const int incy, T *const A, const int lda) |
template<typename T > | |
void | ger_batched (BLASHandle< PlatformKind::OMPTARGET > &handle, const int m, const int n, const T *alpha, const T *const x[], const int incx, const T *const y[], const int incy, T *const A[], const int lda, const int batch_count) |
template<typename T > | |
void | copy_batched (BLASHandle< PlatformKind::OMPTARGET > &handle, const int n, const T *const x[], const int incx, T *const y[], const int incy, const int batch_count) |
template<typename T > | |
void | gemm (BLASHandle< PlatformKind::SYCL > &handle, const char transa, const char transb, int m, int n, int k, const T &alpha, const T *A, int lda, const T *B, int ldb, const T &beta, T *C, int ldc) |
template<typename T > | |
void | gemv (BLASHandle< PlatformKind::SYCL > &handle, const char trans, const int m, const int n, const T &alpha, const T *const A, const int lda, const T *const x, const int incx, const T &beta, T *const y, const int incy) |
template<typename T > | |
void | gemv_batched (BLASHandle< PlatformKind::SYCL > &handle, const char trans, const int m, const int n, const T *alpha, const T *const A[], const int lda, const T *const x[], const int incx, const T *beta, T *const y[], const int incy, const size_t batch_count) |
template<typename T > | |
void | ger (BLASHandle< PlatformKind::SYCL > &handle, const int m, const int n, const T &alpha, const T *const x, const int incx, const T *const y, const int incy, T *const A, const int lda) |
template<typename T > | |
void | ger_batched (BLASHandle< PlatformKind::SYCL > &handle, const int m, const int n, const T *alpha, const T *const x[], const int incx, const T *const y[], const int incy, T *const A[], const int lda, const size_t batch_count) |
template<typename T > | |
void | copy_batched (BLASHandle< PlatformKind::SYCL > &handle, syclBLAS::syclBLAS_int n, const T *const in[], syclBLAS::syclBLAS_int incx, T *const out[], syclBLAS::syclBLAS_int incy, const size_t batch_count) |
template<typename T > | |
void | gemm_batched (BLASHandle< PlatformKind::SYCL > &handle, const char transa, const char transb, syclBLAS::syclBLAS_int m, syclBLAS::syclBLAS_int n, syclBLAS::syclBLAS_int k, const T &alpha, const T *const A[], syclBLAS::syclBLAS_int lda, const T *const B[], syclBLAS::syclBLAS_int ldb, const T &beta, T *const C[], syclBLAS::syclBLAS_int ldc, const size_t batch_count) |
|
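template<typename T > void copy_batched (BLASHandle< PlatformKind::OMPTARGET > &handle, const int n, const T *const x[], const int incx, T *const y[], const int incy, const int batch_count) | inline |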
Definition at line 147 of file AccelBLAS_OMPTarget.hpp.
References qmcplusplus::ompBLAS::copy_batched(), BLASHandle< PlatformKind::OMPTARGET >::h_ompblas, and qmcplusplus::n.
|
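template<typename T > void copy_batched (BLASHandle< PlatformKind::SYCL > &handle, syclBLAS::syclBLAS_int n, const T *const in[], syclBLAS::syclBLAS_int incx, T *const out[], syclBLAS::syclBLAS_int incy, const size_t batch_count) | inline |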
Definition at line 155 of file AccelBLAS_SYCL.hpp.
References qmcplusplus::Units::charge::e, qmcplusplus::n, and BLASHandle< PlatformKind::SYCL >::queue_.
|
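template<typename T > void copy_batched (BLASHandle< PlatformKind::CUDA > &handle, const int n, const T *const in[], const int incx, T *const out[], const int incy, const int batch_count) | inline |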
Definition at line 303 of file AccelBLAS_CUDA.hpp.
References qmcplusplus::cuBLAS_MFs::copy_batched(), qmcplusplus::cudaErrorCheck(), BLASHandle< PlatformKind::CUDA >::h_stream, and qmcplusplus::n.
Referenced by DelayedUpdateBatched< PL, VALUE >::mw_accept_rejectRow(), and DelayedUpdateBatched< PL, VALUE >::mw_prepareInvRow().
|
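template<typename T > void gemm (BLASHandle< PlatformKind::SYCL > &handle, const char transa, const char transb, int m, int n, int k, const T &alpha, const T *A, int lda, const T *B, int ldb, const T &beta, T *C, int ldc) | inline |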
Definition at line 33 of file AccelBLAS_SYCL.hpp.
References qmcplusplus::Units::distance::A, B(), qmcplusplus::Units::charge::C, qmcplusplus::syclBLAS::convertTransEnum(), qmcplusplus::Units::charge::e, qmcplusplus::lda, qmcplusplus::Units::distance::m, qmcplusplus::n, and BLASHandle< PlatformKind::SYCL >::queue_.
|
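template<typename T > void gemm (BLASHandle< PlatformKind::OMPTARGET > &handle, const char transa, const char transb, int m, int n, int k, const T &alpha, const T *A, int lda, const T *B, int ldb, const T &beta, T *C, int ldc) | inline |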
Definition at line 34 of file AccelBLAS_OMPTarget.hpp.
References qmcplusplus::Units::distance::A, B(), qmcplusplus::Units::charge::C, qmcplusplus::ompBLAS::gemm(), BLASHandle< PlatformKind::OMPTARGET >::h_ompblas, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
|
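void gemm (BLASHandle< PlatformKind::CUDA > &handle, const char transa, const char transb, int m, int n, int k, const float &alpha, const float *A, int lda, const float *B, int ldb, const float &beta, float *C, int ldc) | inline |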
Definition at line 49 of file AccelBLAS_CUDA.hpp.
References qmcplusplus::Units::distance::A, B(), qmcplusplus::Units::charge::C, qmcplusplus::cuBLAS::convertOperation(), cublasErrorCheck, cublasSgemm, BLASHandle< PlatformKind::CUDA >::h_cublas, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
Referenced by LCAOrbitalSet::mw_evaluateValueImplGEMM(), LCAOrbitalSet::mw_evaluateValueVPsImplGEMM(), LCAOrbitalSet::mw_evaluateVGLImplGEMM(), qmcplusplus::test_one_gemm(), and DelayedUpdateCUDA< T, T_FP >::updateInvMat().
|
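void gemm (BLASHandle< PlatformKind::CUDA > &handle, const char transa, const char transb, int m, int n, int k, const double &alpha, const double *A, int lda, const double *B, int ldb, const double &beta, double *C, int ldc) | inline |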
Definition at line 69 of file AccelBLAS_CUDA.hpp.
References qmcplusplus::Units::distance::A, B(), qmcplusplus::Units::charge::C, qmcplusplus::cuBLAS::convertOperation(), cublasDgemm, cublasErrorCheck, BLASHandle< PlatformKind::CUDA >::h_cublas, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
|
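void gemm (BLASHandle< PlatformKind::CUDA > &handle, const char transa, const char transb, int m, int n, int k, const std::complex< float > &alpha, const std::complex< float > *A, int lda, const std::complex< float > *B, int ldb, const std::complex< float > &beta, std::complex< float > *C, int ldc) | inline |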
Definition at line 89 of file AccelBLAS_CUDA.hpp.
References qmcplusplus::Units::distance::A, B(), qmcplusplus::Units::charge::C, castNativeType, qmcplusplus::cuBLAS::convertOperation(), cublasCgemm, cublasErrorCheck, BLASHandle< PlatformKind::CUDA >::h_cublas, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
|
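void gemm (BLASHandle< PlatformKind::CUDA > &handle, const char transa, const char transb, int m, int n, int k, const std::complex< double > &alpha, const std::complex< double > *A, int lda, const std::complex< double > *B, int ldb, const std::complex< double > &beta, std::complex< double > *C, int ldc) | inline |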
Definition at line 110 of file AccelBLAS_CUDA.hpp.
References qmcplusplus::Units::distance::A, B(), qmcplusplus::Units::charge::C, castNativeType, qmcplusplus::cuBLAS::convertOperation(), cublasErrorCheck, cublasZgemm, BLASHandle< PlatformKind::CUDA >::h_cublas, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
|
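template<typename T > void gemm_batched (BLASHandle< PlatformKind::OMPTARGET > &handle, const char transa, const char transb, int m, int n, int k, const T &alpha, const T *const A[], int lda, const T *const B[], int ldb, const T &beta, T *const C[], int ldc, int batchCount) | inline |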
Definition at line 54 of file AccelBLAS_OMPTarget.hpp.
References qmcplusplus::Units::distance::A, B(), qmcplusplus::Units::charge::C, qmcplusplus::ompBLAS::gemm_batched(), BLASHandle< PlatformKind::OMPTARGET >::h_ompblas, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
|
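template<typename T > void gemm_batched (BLASHandle< PlatformKind::SYCL > &handle, const char transa, const char transb, syclBLAS::syclBLAS_int m, syclBLAS::syclBLAS_int n, syclBLAS::syclBLAS_int k, const T &alpha, const T *const A[], syclBLAS::syclBLAS_int lda, const T *const B[], syclBLAS::syclBLAS_int ldb, const T &beta, T *const C[], syclBLAS::syclBLAS_int ldc, const size_t batch_count) | inline |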
Definition at line 176 of file AccelBLAS_SYCL.hpp.
References qmcplusplus::Units::distance::A, B(), qmcplusplus::Units::charge::C, qmcplusplus::syclBLAS::convertTransEnum(), qmcplusplus::Units::charge::e, qmcplusplus::lda, qmcplusplus::Units::distance::m, qmcplusplus::n, and BLASHandle< PlatformKind::SYCL >::queue_.
|
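void gemm_batched (BLASHandle< PlatformKind::CUDA > &handle, const char transa, const char transb, int m, int n, int k, const float &alpha, const float *const A[], int lda, const float *const B[], int ldb, const float &beta, float *const C[], int ldc, int batchCount) | inline |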
Definition at line 315 of file AccelBLAS_CUDA.hpp.
References qmcplusplus::Units::distance::A, B(), qmcplusplus::Units::charge::C, qmcplusplus::cuBLAS::convertOperation(), cublasErrorCheck, cublasSgemmBatched, BLASHandle< PlatformKind::CUDA >::h_cublas, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
Referenced by DelayedUpdateBatched< PL, VALUE >::mw_updateInvMat(), and qmcplusplus::test_one_gemm().
|
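void gemm_batched (BLASHandle< PlatformKind::CUDA > &handle, const char transa, const char transb, int m, int n, int k, const std::complex< float > &alpha, const std::complex< float > *const A[], int lda, const std::complex< float > *const B[], int ldb, const std::complex< float > &beta, std::complex< float > *const C[], int ldc, int batchCount) | inline |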
Definition at line 337 of file AccelBLAS_CUDA.hpp.
References qmcplusplus::Units::distance::A, B(), qmcplusplus::Units::charge::C, castNativeType, qmcplusplus::cuBLAS::convertOperation(), cublasCgemmBatched, cublasErrorCheck, BLASHandle< PlatformKind::CUDA >::h_cublas, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
|
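void gemm_batched (BLASHandle< PlatformKind::CUDA > &handle, const char transa, const char transb, int m, int n, int k, const double &alpha, const double *const A[], int lda, const double *const B[], int ldb, const double &beta, double *const C[], int ldc, int batchCount) | inline |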
Definition at line 368 of file AccelBLAS_CUDA.hpp.
References qmcplusplus::Units::distance::A, B(), qmcplusplus::Units::charge::C, qmcplusplus::cuBLAS::convertOperation(), cublasDgemmBatched, cublasErrorCheck, BLASHandle< PlatformKind::CUDA >::h_cublas, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
|
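void gemm_batched (BLASHandle< PlatformKind::CUDA > &handle, const char transa, const char transb, int m, int n, int k, const std::complex< double > &alpha, const std::complex< double > *const A[], int lda, const std::complex< double > *const B[], int ldb, const std::complex< double > &beta, std::complex< double > *const C[], int ldc, int batchCount) | inline |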
Definition at line 390 of file AccelBLAS_CUDA.hpp.
References qmcplusplus::Units::distance::A, B(), qmcplusplus::Units::charge::C, castNativeType, qmcplusplus::cuBLAS::convertOperation(), cublasErrorCheck, cublasZgemmBatched, BLASHandle< PlatformKind::CUDA >::h_cublas, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
|
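template<typename T > void gemv (BLASHandle< PlatformKind::SYCL > &handle, const char trans, const int m, const int n, const T &alpha, const T *const A, const int lda, const T *const x, const int incx, const T &beta, T *const y, const int incy) | inline |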
Definition at line 60 of file AccelBLAS_SYCL.hpp.
References qmcplusplus::Units::distance::A, qmcplusplus::syclBLAS::convertTransEnum(), qmcplusplus::Units::charge::e, qmcplusplus::lda, qmcplusplus::Units::distance::m, qmcplusplus::n, and BLASHandle< PlatformKind::SYCL >::queue_.
|
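template<typename T > void gemv (BLASHandle< PlatformKind::OMPTARGET > &handle, const char trans, const int m, const int n, const T &alpha, const T *const A, const int lda, const T *const x, const int incx, const T &beta, T *const y, const int incy) | inline |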
Definition at line 77 of file AccelBLAS_OMPTarget.hpp.
References qmcplusplus::Units::distance::A, qmcplusplus::ompBLAS::gemv(), BLASHandle< PlatformKind::OMPTARGET >::h_ompblas, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
|
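void gemv (BLASHandle< PlatformKind::CUDA > &handle, const char trans, const int m, const int n, const float &alpha, const float *const A, const int lda, const float *const x, const int incx, const float &beta, float *const y, const int incy) | inline |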
Definition at line 131 of file AccelBLAS_CUDA.hpp.
References qmcplusplus::Units::distance::A, qmcplusplus::cuBLAS::convertOperation(), cublasErrorCheck, cublasSgemv, BLASHandle< PlatformKind::CUDA >::h_cublas, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
Referenced by qmcplusplus::test_one_gemv().
|
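void gemv (BLASHandle< PlatformKind::CUDA > &handle, const char trans, const int m, const int n, const double &alpha, const double *const A, const int lda, const double *const x, const int incx, const double &beta, double *const y, const int incy) | inline |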
Definition at line 149 of file AccelBLAS_CUDA.hpp.
References qmcplusplus::Units::distance::A, qmcplusplus::cuBLAS::convertOperation(), cublasDgemv, cublasErrorCheck, BLASHandle< PlatformKind::CUDA >::h_cublas, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
|
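void gemv (BLASHandle< PlatformKind::CUDA > &handle, const char trans, const int m, const int n, const std::complex< float > &alpha, const std::complex< float > *A, const int lda, const std::complex< float > *x, const int incx, const std::complex< float > &beta, std::complex< float > *y, const int incy) | inline |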
Definition at line 167 of file AccelBLAS_CUDA.hpp.
References qmcplusplus::Units::distance::A, castNativeType, qmcplusplus::cuBLAS::convertOperation(), cublasCgemv, cublasErrorCheck, BLASHandle< PlatformKind::CUDA >::h_cublas, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
|
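void gemv (BLASHandle< PlatformKind::CUDA > &handle, const char trans, const int m, const int n, const std::complex< double > &alpha, const std::complex< double > *A, const int lda, const std::complex< double > *x, const int incx, const std::complex< double > &beta, std::complex< double > *y, const int incy) | inline |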
Definition at line 186 of file AccelBLAS_CUDA.hpp.
References qmcplusplus::Units::distance::A, castNativeType, qmcplusplus::cuBLAS::convertOperation(), cublasErrorCheck, cublasZgemv, BLASHandle< PlatformKind::CUDA >::h_cublas, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
|
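template<typename T > void gemv_batched (BLASHandle< PlatformKind::SYCL > &handle, const char trans, const int m, const int n, const T *alpha, const T *const A[], const int lda, const T *const x[], const int incx, const T *beta, T *const y[], const int incy, const size_t batch_count) | inline |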
Definition at line 85 of file AccelBLAS_SYCL.hpp.
References qmcplusplus::Units::distance::A, qmcplusplus::Units::charge::e, qmcplusplus::syclBLAS::gemv_batched(), qmcplusplus::lda, qmcplusplus::Units::distance::m, qmcplusplus::n, and BLASHandle< PlatformKind::SYCL >::queue_.
|
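template<typename T > void gemv_batched (BLASHandle< PlatformKind::OMPTARGET > &handle, const char trans, const int m, const int n, const T *alpha, const T *const A[], const int lda, const T *const x[], const int incx, const T *beta, T *const y[], const int incy, const int batch_count) | inline |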
Definition at line 95 of file AccelBLAS_OMPTarget.hpp.
References qmcplusplus::Units::distance::A, qmcplusplus::ompBLAS::gemv_batched(), BLASHandle< PlatformKind::OMPTARGET >::h_ompblas, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
|
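template<typename T > void gemv_batched (BLASHandle< PlatformKind::CUDA > &handle, const char trans, const int m, const int n, const T *alpha, const T *const A[], const int lda, const T *const x[], const int incx, const T *beta, T *const y[], const int incy, const int batch_count) | inline |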
Definition at line 206 of file AccelBLAS_CUDA.hpp.
References qmcplusplus::Units::distance::A, qmcplusplus::cudaErrorCheck(), qmcplusplus::cuBLAS_MFs::gemv_batched(), BLASHandle< PlatformKind::CUDA >::h_stream, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
Referenced by DelayedUpdateBatched< PL, VALUE >::mw_accept_rejectRow(), DelayedUpdateBatched< PL, VALUE >::mw_prepareInvRow(), DelayedUpdateBatched< PL, VALUE >::mw_updateRow(), and qmcplusplus::test_one_gemv().
|
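template<typename T > void ger (BLASHandle< PlatformKind::SYCL > &handle, const int m, const int n, const T &alpha, const T *const x, const int incx, const T *const y, const int incy, T *const A, const int lda) | inline |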
Definition at line 110 of file AccelBLAS_SYCL.hpp.
References qmcplusplus::Units::distance::A, qmcplusplus::Units::charge::e, qmcplusplus::lda, qmcplusplus::Units::distance::m, qmcplusplus::n, and BLASHandle< PlatformKind::SYCL >::queue_.
|
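template<typename T > void ger (BLASHandle< PlatformKind::OMPTARGET > &handle, const int m, const int n, const T &alpha, const T *const x, const int incx, const T *const y, const int incy, T *const A, const int lda) | inline |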
Definition at line 114 of file AccelBLAS_OMPTarget.hpp.
References qmcplusplus::Units::distance::A, qmcplusplus::ompBLAS::ger(), BLASHandle< PlatformKind::OMPTARGET >::h_ompblas, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
|
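void ger (BLASHandle< PlatformKind::CUDA > &handle, const int m, const int n, const float &alpha, const float *const x, const int incx, const float *const y, const int incy, float *const A, const int lda) | inline |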
Definition at line 225 of file AccelBLAS_CUDA.hpp.
References qmcplusplus::Units::distance::A, cublasErrorCheck, cublasSger, BLASHandle< PlatformKind::CUDA >::h_cublas, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
Referenced by qmcplusplus::test_one_ger().
|
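void ger (BLASHandle< PlatformKind::CUDA > &handle, const int m, const int n, const double &alpha, const double *const x, const int incx, const double *const y, const int incy, double *const A, const int lda) | inline |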
Definition at line 239 of file AccelBLAS_CUDA.hpp.
References qmcplusplus::Units::distance::A, cublasDger, cublasErrorCheck, BLASHandle< PlatformKind::CUDA >::h_cublas, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
|
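void ger (BLASHandle< PlatformKind::CUDA > &handle, const int m, const int n, const std::complex< float > &alpha, const std::complex< float > *x, const int incx, const std::complex< float > *y, const int incy, std::complex< float > *A, const int lda) | inline |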
Definition at line 253 of file AccelBLAS_CUDA.hpp.
References qmcplusplus::Units::distance::A, castNativeType, cublasCgeru, cublasErrorCheck, BLASHandle< PlatformKind::CUDA >::h_cublas, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
|
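void ger (BLASHandle< PlatformKind::CUDA > &handle, const int m, const int n, const std::complex< double > &alpha, const std::complex< double > *x, const int incx, const std::complex< double > *y, const int incy, std::complex< double > *A, const int lda) | inline |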
Definition at line 269 of file AccelBLAS_CUDA.hpp.
References qmcplusplus::Units::distance::A, castNativeType, cublasErrorCheck, cublasZgeru, BLASHandle< PlatformKind::CUDA >::h_cublas, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
|
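template<typename T > void ger_batched (BLASHandle< PlatformKind::OMPTARGET > &handle, const int m, const int n, const T *alpha, const T *const x[], const int incx, const T *const y[], const int incy, T *const A[], const int lda, const int batch_count) | inline |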
Definition at line 130 of file AccelBLAS_OMPTarget.hpp.
References qmcplusplus::Units::distance::A, qmcplusplus::ompBLAS::ger_batched(), BLASHandle< PlatformKind::OMPTARGET >::h_ompblas, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
|
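template<typename T > void ger_batched (BLASHandle< PlatformKind::SYCL > &handle, const int m, const int n, const T *alpha, const T *const x[], const int incx, const T *const y[], const int incy, T *const A[], const int lda, const size_t batch_count) | inline |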
Definition at line 132 of file AccelBLAS_SYCL.hpp.
References qmcplusplus::Units::distance::A, qmcplusplus::Units::charge::e, qmcplusplus::syclBLAS::ger_batched(), qmcplusplus::lda, qmcplusplus::Units::distance::m, qmcplusplus::n, and BLASHandle< PlatformKind::SYCL >::queue_.
|
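template<typename T > void ger_batched (BLASHandle< PlatformKind::CUDA > &handle, const int m, const int n, const T *alpha, const T *const x[], const int incx, const T *const y[], const int incy, T *const A[], const int lda, const int batch_count) | inline |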
Definition at line 286 of file AccelBLAS_CUDA.hpp.
References qmcplusplus::Units::distance::A, qmcplusplus::cudaErrorCheck(), qmcplusplus::cuBLAS_MFs::ger_batched(), BLASHandle< PlatformKind::CUDA >::h_stream, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
Referenced by DelayedUpdateBatched< PL, VALUE >::mw_accept_rejectRow(), DelayedUpdateBatched< PL, VALUE >::mw_updateRow(), and qmcplusplus::test_one_ger().