![]() |
QMCPACK
|
Typedefs | |
using | syclBLAS_int = std::int64_t |
using | syclBLAS_status = sycl::event |
using | syclBLAS_handle = sycl::queue |
Functions | |
template<typename T > | |
sycl::event | gemv (sycl::queue &handle, const char trans, const int m, const int n, const T alpha, const T *const A, const int lda, const T *const x, const int incx, const T beta, T *const y, const int incy, const std::vector< sycl::event > &events) |
template sycl::event | gemv (sycl::queue &handle, const char trans, const int m, const int n, const double alpha, const double *const A, const int lda, const double *const x, const int incx, const double beta, double *const y, const int incy, const std::vector< sycl::event > &events) |
template sycl::event | gemv (sycl::queue &handle, const char trans, const int m, const int n, const float alpha, const float *const A, const int lda, const float *const x, const int incx, const float beta, float *const y, const int incy, const std::vector< sycl::event > &events) |
template sycl::event | gemv (sycl::queue &handle, const char trans, const int m, const int n, const std::complex< double > alpha, const std::complex< double > *const A, const int lda, const std::complex< double > *const x, const int incx, const std::complex< double > beta, std::complex< double > *const y, const int incy, const std::vector< sycl::event > &events) |
template sycl::event | gemv (sycl::queue &handle, const char trans, const int m, const int n, const std::complex< float > alpha, const std::complex< float > *const A, const int lda, const std::complex< float > *const x, const int incx, const std::complex< float > beta, std::complex< float > *const y, const int incy, const std::vector< sycl::event > &events) |
template<typename T , unsigned COLBS> | |
sycl::event | gemvT_batched_impl (sycl::queue &handle, const int m, const int n, const T *alpha, const T *const A[], const int lda, const T *const x[], const int incx, const T *beta, T *const y[], const int incy, const size_t batch_count, const std::vector< sycl::event > &events={}) |
gemv trans = 'T' case. More... | |
template<typename T , unsigned ROWBS> | |
sycl::event | gemvN_batched_impl (sycl::queue &handle, const int m, const int n, const T *alpha, const T *const A[], const int lda, const T *const x[], const int incx, const T *beta, T *const y[], const int incy, const size_t batch_count, const std::vector< sycl::event > &events={}) |
gemv trans = 'N' case. More... | |
template<> | |
sycl::event | gemv_batched< float > (sycl::queue &handle, const char trans, const int m, const int n, const float *alpha, const float *const A[], const int lda, const float *const x[], const int incx, const float *beta, float *const y[], const int incy, const size_t batch_count, const std::vector< sycl::event > &events) |
template<> | |
sycl::event | gemv_batched< double > (sycl::queue &handle, const char trans, const int m, const int n, const double *alpha, const double *const A[], const int lda, const double *const x[], const int incx, const double *beta, double *const y[], const int incy, const size_t batch_count, const std::vector< sycl::event > &events) |
template<> | |
sycl::event | gemv_batched< std::complex< float > > (sycl::queue &handle, const char trans, const int m, const int n, const std::complex< float > *alpha, const std::complex< float > *const A[], const int lda, const std::complex< float > *const x[], const int incx, const std::complex< float > *beta, std::complex< float > *const y[], const int incy, const size_t batch_count, const std::vector< sycl::event > &events) |
template<> | |
sycl::event | gemv_batched< std::complex< double > > (sycl::queue &handle, const char trans, const int m, const int n, const std::complex< double > *alpha, const std::complex< double > *const A[], const int lda, const std::complex< double > *const x[], const int incx, const std::complex< double > *beta, std::complex< double > *const y[], const int incy, const size_t batch_count, const std::vector< sycl::event > &events) |
template<typename T > | |
sycl::event | gemm (sycl::queue &handle, const char tA, const char tB, const int m, const int n, const int k, const T alpha, const T *A, const int lda, const T *B, const int ldb, const T beta, T *C, const int ldc, const std::vector< sycl::event > &events) |
template sycl::event | gemm (sycl::queue &handle, const char tA, const char tB, const int m, const int n, const int k, const float alpha, const float *const A, const int lda, const float *const B, const int ldb, const float beta, float *const C, const int ldc, const std::vector< sycl::event > &events) |
template sycl::event | gemm (sycl::queue &handle, const char tA, const char tB, const int m, const int n, const int k, const double alpha, const double *const A, const int lda, const double *const B, const int ldb, const double beta, double *const C, const int ldc, const std::vector< sycl::event > &events) |
template sycl::event | gemm (sycl::queue &handle, const char tA, const char tB, const int m, const int n, const int k, const std::complex< float > alpha, const std::complex< float > *const A, const int lda, const std::complex< float > *const B, const int ldb, const std::complex< float > beta, std::complex< float > *const C, const int ldc, const std::vector< sycl::event > &events) |
template sycl::event | gemm (sycl::queue &handle, const char tA, const char tB, const int m, const int n, const int k, const std::complex< double > alpha, const std::complex< double > *const A, const int lda, const std::complex< double > *const B, const int ldb, const std::complex< double > beta, std::complex< double > *const C, const int ldc, const std::vector< sycl::event > &events) |
template<typename T , int TILE_SIZE, int ROWBS> | |
sycl::event | ger_batched_impl (sycl::queue &handle, const int m, const int n, const T *alpha, const T *const x[], const int incx, const T *const y[], const int incy, T *const A[], const int lda, const size_t batch_count, const std::vector< sycl::event > &events) |
template<> | |
sycl::event | ger_batched< float > (sycl::queue &handle, const int m, const int n, const float *alpha, const float *const x[], const int incx, const float *const y[], const int incy, float *const A[], const int lda, const size_t batch_count, const std::vector< sycl::event > &events) |
template<> | |
sycl::event | ger_batched< double > (sycl::queue &handle, const int m, const int n, const double *alpha, const double *const x[], const int incx, const double *const y[], const int incy, double *const A[], const int lda, const size_t batch_count, const std::vector< sycl::event > &events) |
template<> | |
sycl::event | ger_batched< std::complex< float > > (sycl::queue &handle, const int m, const int n, const std::complex< float > *alpha, const std::complex< float > *const x[], const int incx, const std::complex< float > *const y[], const int incy, std::complex< float > *const A[], const int lda, const size_t batch_count, const std::vector< sycl::event > &events) |
template<> | |
sycl::event | ger_batched< std::complex< double > > (sycl::queue &handle, const int m, const int n, const std::complex< double > *alpha, const std::complex< double > *const x[], const int incx, const std::complex< double > *const y[], const int incy, std::complex< double > *const A[], const int lda, const size_t batch_count, const std::vector< sycl::event > &events) |
template<typename T1 , typename T2 > | |
sycl::event | transpose (sycl::queue &q, const T1 *restrict in, int m, int lda, T2 *restrict out, int n, int ldb, const std::vector< sycl::event > &events) |
template sycl::event | transpose (sycl::queue &q, const float *restrict in, int m, int lda, double *restrict out, int n, int ldb, const std::vector< sycl::event > &events) |
template sycl::event | transpose (sycl::queue &q, const double *restrict in, int m, int lda, double *restrict out, int n, int ldb, const std::vector< sycl::event > &events) |
template sycl::event | transpose (sycl::queue &q, const std::complex< float > *restrict in, int m, int lda, std::complex< double > *restrict out, int n, int ldb, const std::vector< sycl::event > &events) |
template sycl::event | transpose (sycl::queue &q, const std::complex< double > *restrict in, int m, int lda, std::complex< double > *restrict out, int n, int ldb, const std::vector< sycl::event > &events) |
template<typename T1 , typename T2 > | |
sycl::event | copy_n (sycl::queue &aq, const T1 *restrict VA, size_t array_size, T2 *restrict VC, const std::vector< sycl::event > &events) |
template sycl::event | copy_n (sycl::queue &aq, const double *restrict VA, size_t array_size, float *restrict VC, const std::vector< sycl::event > &events) |
template sycl::event | copy_n (sycl::queue &aq, const std::complex< double > *restrict VA, size_t array_size, std::complex< float > *restrict VC, const std::vector< sycl::event > &events) |
oneapi::mkl::transpose | convertTransEnum (char trans) |
template<typename T > | |
sycl::event | gemv_batched (sycl::queue &handle, const char trans, const int m, const int n, const T *alpha, const T *const A[], const int lda, const T *const x[], const int incx, const T *beta, T *const y[], const int incy, const size_t batch_count, const std::vector< sycl::event > &events={}) |
In-house version of gemv_batch implemented in SYCL. Can be dropped once vendor-optimized versions are available. More... | |
template<typename T > | |
sycl::event | ger_batched (sycl::queue &handle, const int m, const int n, const T *alpha, const T *const x[], const int incx, const T *const y[], const int incy, T *const A[], const int lda, const size_t batch_count, const std::vector< sycl::event > &events={}) |
In-house version of ger_batch implemented in SYCL. Can be dropped once vendor-optimized versions are available. More... | |
template<typename T1 , typename T2 > | |
sycl::event | transpose (sycl::queue &q, const T1 *in, int m, int lda, T2 *out, int n, int ldb, const std::vector< sycl::event > &events={}) |
template<typename T1 , typename T2 > | |
sycl::event | copy_n (sycl::queue &aq, const T1 *VA, size_t array_size, T2 *VC, const std::vector< sycl::event > &events={}) |
using syclBLAS_handle = sycl::queue |
Definition at line 26 of file syclBLAS.hpp.
using syclBLAS_int = std::int64_t |
Definition at line 24 of file syclBLAS.hpp.
using syclBLAS_status = sycl::event |
Definition at line 25 of file syclBLAS.hpp.
oneapi::mkl::transpose convertTransEnum | ( | char | trans | ) |
inline |
Definition at line 28 of file syclBLAS.hpp.
Referenced by qmcplusplus::compute::BLAS::gemm(), gemm(), qmcplusplus::compute::BLAS::gemm_batched(), gemv(), and qmcplusplus::compute::BLAS::gemv().
sycl::event qmcplusplus::syclBLAS::copy_n | ( | sycl::queue & | aq, |
const T1 * | VA, | ||
size_t | array_size, | ||
T2 * | VC, | ||
const std::vector< sycl::event > & | events = {} |
||
) |
sycl::event qmcplusplus::syclBLAS::copy_n | ( | sycl::queue & | aq, |
const T1 *restrict | VA, | ||
size_t | array_size, | ||
T2 *restrict | VC, | ||
const std::vector< sycl::event > & | events | ||
) |
Definition at line 548 of file syclBLAS.cpp.
Referenced by DelayedUpdate< T, T_FP >::acceptRow(), DelayedUpdateSYCL< T, T_FP >::acceptRow(), DelayedUpdateCUDA< T, T_FP >::acceptRow(), SplineR2R< ST >::applyRotation(), SplineC2C< ST >::applyRotation(), AtomicOrbitals< ST >::applyRotation(), TraceBuffer< TraceInt >::collect_sample(), Vector< T, std::allocator< T > >::construct_copy_elements(), LCAOrbitalSet::evaluate_vgh_impl(), LCAOrbitalSet::evaluate_vghgh_impl(), LCAOrbitalSet::evaluate_vgl_impl(), DiracDeterminant< DU_TYPE >::evaluateDerivRatios(), DiracDeterminantBatched< PL, VT, FPVT >::evaluateDerivRatios(), LCAOrbitalSet::evaluateDetRatios(), SplineC2COMPTarget< ST >::evaluateDetRatios(), SplineC2ROMPTarget< ST >::evaluateDetRatios(), DiracDeterminant< DU_TYPE >::evaluateRatios(), DiracDeterminantBatched< PL, VT, FPVT >::evaluateRatios(), DiracDeterminant< DU_TYPE >::evaluateSpinorRatios(), DiracDeterminantBatched< PL, VT, FPVT >::evaluateSpinorRatios(), DelayedUpdate< T, T_FP >::getInvRow(), DelayedUpdateSYCL< T, T_FP >::getInvRow(), DelayedUpdateCUDA< T, T_FP >::getInvRow(), qmcplusplus::testing::getParticularListener(), MCCoords< CoordsType::POS >::getSubset(), MCCoords< CoordsType::POS_SPIN >::getSubset(), syclSolverInverter< T_FP >::invert_transpose(), WalkerLogBuffer< WLog::Real >::makeNewRow(), LCAOrbitalSet::mw_evaluateValue(), LCAOrbitalSet::mw_evaluateValueImplGEMM(), LCAOrbitalSet::mw_evaluateValueVPsImplGEMM(), LCAOrbitalSet::mw_evaluateVGL(), LCAOrbitalSet::mw_evaluateVGLImplGEMM(), StructFact::mw_updateAllPart(), VectorSoaContainer< ST, 5 >::operator=(), Vector< T, std::allocator< T > >::operator=(), ParticleAttribXmlNode< PAT >::put(), EstimatorManagerNew::reduceOperatorEstimators(), RotatedSPOs::resetParametersExclusive(), WalkerLogBuffer< WLog::Real >::resetRowSize(), SplineR2R< ST >::storeParamsBeforeRotation(), SplineC2C< ST >::storeParamsBeforeRotation(), AtomicOrbitals< ST >::storeParamsBeforeRotation(), qmcplusplus::TEST_CASE(), qmcplusplus::testDualAllocator(), SoaDistanceTableAB< T, D, SC >::update(), SoaDistanceTableAA< T, D, SC >::update(), SoaDistanceTableABOMPTarget< T, D, SC >::update(), SoaDistanceTableAAOMPTarget< T, D, SC >::update(), SoaDistanceTableAA< T, D, SC >::updatePartial(), SoaDistanceTableAAOMPTarget< T, D, SC >::updatePartial(), VectorSoaContainer< ST, 5 >::VectorSoaContainer(), NESpaceGrid< REAL >::write(), and OperatorEstBase::write().
template sycl::event qmcplusplus::syclBLAS::copy_n | ( | sycl::queue & | aq, |
const double *restrict | VA, | ||
size_t | array_size, | ||
float *restrict | VC, | ||
const std::vector< sycl::event > & | events | ||
) |
template sycl::event qmcplusplus::syclBLAS::copy_n | ( | sycl::queue & | aq, |
const std::complex< double > *restrict | VA, | ||
size_t | array_size, | ||
std::complex< float > *restrict | VC, | ||
const std::vector< sycl::event > & | events | ||
) |
sycl::event gemm | ( | sycl::queue & | handle, |
const char | tA, | ||
const char | tB, | ||
const int | m, | ||
const int | n, | ||
const int | k, | ||
const T | alpha, | ||
const T * | A, | ||
const int | lda, | ||
const T * | B, | ||
const int | ldb, | ||
const T | beta, | ||
T * | C, | ||
const int | ldc, | ||
const std::vector< sycl::event > & | events | ||
) |
Definition at line 275 of file syclBLAS.cpp.
References qmcplusplus::Units::distance::A, B(), qmcplusplus::Units::charge::C, convertTransEnum(), gemm(), qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
Referenced by DelayedUpdateSYCL< T, T_FP >::updateInvMat().
template sycl::event qmcplusplus::syclBLAS::gemm | ( | sycl::queue & | handle, |
const char | tA, | ||
const char | tB, | ||
const int | m, | ||
const int | n, | ||
const int | k, | ||
const float | alpha, | ||
const float *const | A, | ||
const int | lda, | ||
const float *const | B, | ||
const int | ldb, | ||
const float | beta, | ||
float *const | C, | ||
const int | ldc, | ||
const std::vector< sycl::event > & | events | ||
) |
template sycl::event qmcplusplus::syclBLAS::gemm | ( | sycl::queue & | handle, |
const char | tA, | ||
const char | tB, | ||
const int | m, | ||
const int | n, | ||
const int | k, | ||
const double | alpha, | ||
const double *const | A, | ||
const int | lda, | ||
const double *const | B, | ||
const int | ldb, | ||
const double | beta, | ||
double *const | C, | ||
const int | ldc, | ||
const std::vector< sycl::event > & | events | ||
) |
template sycl::event qmcplusplus::syclBLAS::gemm | ( | sycl::queue & | handle, |
const char | tA, | ||
const char | tB, | ||
const int | m, | ||
const int | n, | ||
const int | k, | ||
const std::complex< float > | alpha, | ||
const std::complex< float > *const | A, | ||
const int | lda, | ||
const std::complex< float > *const | B, | ||
const int | ldb, | ||
const std::complex< float > | beta, | ||
std::complex< float > *const | C, | ||
const int | ldc, | ||
const std::vector< sycl::event > & | events | ||
) |
template sycl::event qmcplusplus::syclBLAS::gemm | ( | sycl::queue & | handle, |
const char | tA, | ||
const char | tB, | ||
const int | m, | ||
const int | n, | ||
const int | k, | ||
const std::complex< double > | alpha, | ||
const std::complex< double > *const | A, | ||
const int | lda, | ||
const std::complex< double > *const | B, | ||
const int | ldb, | ||
const std::complex< double > | beta, | ||
std::complex< double > *const | C, | ||
const int | ldc, | ||
const std::vector< sycl::event > & | events | ||
) |
Referenced by gemm().
sycl::event gemv | ( | sycl::queue & | handle, |
const char | trans, | ||
const int | m, | ||
const int | n, | ||
const T | alpha, | ||
const T *const | A, | ||
const int | lda, | ||
const T *const | x, | ||
const int | incx, | ||
const T | beta, | ||
T *const | y, | ||
const int | incy, | ||
const std::vector< sycl::event > & | events | ||
) |
Definition at line 21 of file syclBLAS.cpp.
References qmcplusplus::Units::distance::A, convertTransEnum(), gemv(), qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
template sycl::event qmcplusplus::syclBLAS::gemv | ( | sycl::queue & | handle, |
const char | trans, | ||
const int | m, | ||
const int | n, | ||
const double | alpha, | ||
const double *const | A, | ||
const int | lda, | ||
const double *const | x, | ||
const int | incx, | ||
const double | beta, | ||
double *const | y, | ||
const int | incy, | ||
const std::vector< sycl::event > & | events | ||
) |
template sycl::event qmcplusplus::syclBLAS::gemv | ( | sycl::queue & | handle, |
const char | trans, | ||
const int | m, | ||
const int | n, | ||
const float | alpha, | ||
const float *const | A, | ||
const int | lda, | ||
const float *const | x, | ||
const int | incx, | ||
const float | beta, | ||
float *const | y, | ||
const int | incy, | ||
const std::vector< sycl::event > & | events | ||
) |
template sycl::event qmcplusplus::syclBLAS::gemv | ( | sycl::queue & | handle, |
const char | trans, | ||
const int | m, | ||
const int | n, | ||
const std::complex< double > | alpha, | ||
const std::complex< double > *const | A, | ||
const int | lda, | ||
const std::complex< double > *const | x, | ||
const int | incx, | ||
const std::complex< double > | beta, | ||
std::complex< double > *const | y, | ||
const int | incy, | ||
const std::vector< sycl::event > & | events | ||
) |
template sycl::event qmcplusplus::syclBLAS::gemv | ( | sycl::queue & | handle, |
const char | trans, | ||
const int | m, | ||
const int | n, | ||
const std::complex< float > | alpha, | ||
const std::complex< float > *const | A, | ||
const int | lda, | ||
const std::complex< float > *const | x, | ||
const int | incx, | ||
const std::complex< float > | beta, | ||
std::complex< float > *const | y, | ||
const int | incy, | ||
const std::vector< sycl::event > & | events | ||
) |
Referenced by gemv().
sycl::event qmcplusplus::syclBLAS::gemv_batched | ( | sycl::queue & | handle, |
const char | trans, | ||
const int | m, | ||
const int | n, | ||
const T * | alpha, | ||
const T *const | A[], | ||
const int | lda, | ||
const T *const | x[], | ||
const int | incx, | ||
const T * | beta, | ||
T *const | y[], | ||
const int | incy, | ||
const size_t | batch_count, | ||
const std::vector< sycl::event > & | events = {} |
||
) |
In-house version of gemv_batch implemented in SYCL. Can be dropped once vendor-optimized versions are available.
Referenced by qmcplusplus::compute::BLAS::gemv_batched().
sycl::event qmcplusplus::syclBLAS::gemv_batched< double > | ( | sycl::queue & | handle, |
const char | trans, | ||
const int | m, | ||
const int | n, | ||
const double * | alpha, | ||
const double *const | A[], | ||
const int | lda, | ||
const double *const | x[], | ||
const int | incx, | ||
const double * | beta, | ||
double *const | y[], | ||
const int | incy, | ||
const size_t | batch_count, | ||
const std::vector< sycl::event > & | events | ||
) |
Definition at line 196 of file syclBLAS.cpp.
References qmcplusplus::Units::distance::A, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
sycl::event qmcplusplus::syclBLAS::gemv_batched< float > | ( | sycl::queue & | handle, |
const char | trans, | ||
const int | m, | ||
const int | n, | ||
const float * | alpha, | ||
const float *const | A[], | ||
const int | lda, | ||
const float *const | x[], | ||
const int | incx, | ||
const float * | beta, | ||
float *const | y[], | ||
const int | incy, | ||
const size_t | batch_count, | ||
const std::vector< sycl::event > & | events | ||
) |
Definition at line 171 of file syclBLAS.cpp.
References qmcplusplus::Units::distance::A, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
sycl::event qmcplusplus::syclBLAS::gemv_batched< std::complex< double > > | ( | sycl::queue & | handle, |
const char | trans, | ||
const int | m, | ||
const int | n, | ||
const std::complex< double > * | alpha, | ||
const std::complex< double > *const | A[], | ||
const int | lda, | ||
const std::complex< double > *const | x[], | ||
const int | incx, | ||
const std::complex< double > * | beta, | ||
std::complex< double > *const | y[], | ||
const int | incy, | ||
const size_t | batch_count, | ||
const std::vector< sycl::event > & | events | ||
) |
Definition at line 248 of file syclBLAS.cpp.
References qmcplusplus::Units::distance::A, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
sycl::event qmcplusplus::syclBLAS::gemv_batched< std::complex< float > > | ( | sycl::queue & | handle, |
const char | trans, | ||
const int | m, | ||
const int | n, | ||
const std::complex< float > * | alpha, | ||
const std::complex< float > *const | A[], | ||
const int | lda, | ||
const std::complex< float > *const | x[], | ||
const int | incx, | ||
const std::complex< float > * | beta, | ||
std::complex< float > *const | y[], | ||
const int | incy, | ||
const size_t | batch_count, | ||
const std::vector< sycl::event > & | events | ||
) |
Definition at line 221 of file syclBLAS.cpp.
References qmcplusplus::Units::distance::A, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
sycl::event qmcplusplus::syclBLAS::gemvN_batched_impl | ( | sycl::queue & | handle, |
const int | m, | ||
const int | n, | ||
const T * | alpha, | ||
const T *const | A[], | ||
const int | lda, | ||
const T *const | x[], | ||
const int | incx, | ||
const T * | beta, | ||
T *const | y[], | ||
const int | incy, | ||
const size_t | batch_count, | ||
const std::vector< sycl::event > & | events = {} |
||
) |
gemv trans = 'N' case.
ROW (as in the ROWBS template parameter) refers to rows of the m x n column-major (Fortran-ordered) matrix A.
Definition at line 135 of file syclBLAS.cpp.
sycl::event qmcplusplus::syclBLAS::gemvT_batched_impl | ( | sycl::queue & | handle, |
const int | m, | ||
const int | n, | ||
const T * | alpha, | ||
const T *const | A[], | ||
const int | lda, | ||
const T *const | x[], | ||
const int | incx, | ||
const T * | beta, | ||
T *const | y[], | ||
const int | incy, | ||
const size_t | batch_count, | ||
const std::vector< sycl::event > & | events = {} |
||
) |
gemv trans = 'T' case.
COL (as in the COLBS template parameter) refers to columns of the m x n column-major (Fortran-ordered) matrix A.
Definition at line 97 of file syclBLAS.cpp.
sycl::event qmcplusplus::syclBLAS::ger_batched | ( | sycl::queue & | handle, |
const int | m, | ||
const int | n, | ||
const T * | alpha, | ||
const T *const | x[], | ||
const int | incx, | ||
const T *const | y[], | ||
const int | incy, | ||
T *const | A[], | ||
const int | lda, | ||
const size_t | batch_count, | ||
const std::vector< sycl::event > & | events = {} |
||
) |
In-house version of ger_batch implemented in SYCL. Can be dropped once vendor-optimized versions are available.
Referenced by qmcplusplus::compute::BLAS::ger_batched().
sycl::event qmcplusplus::syclBLAS::ger_batched< double > | ( | sycl::queue & | handle, |
const int | m, | ||
const int | n, | ||
const double * | alpha, | ||
const double *const | x[], | ||
const int | incx, | ||
const double *const | y[], | ||
const int | incy, | ||
double *const | A[], | ||
const int | lda, | ||
const size_t | batch_count, | ||
const std::vector< sycl::event > & | events | ||
) |
Definition at line 421 of file syclBLAS.cpp.
References qmcplusplus::Units::distance::A, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
sycl::event qmcplusplus::syclBLAS::ger_batched< float > | ( | sycl::queue & | handle, |
const int | m, | ||
const int | n, | ||
const float * | alpha, | ||
const float *const | x[], | ||
const int | incx, | ||
const float *const | y[], | ||
const int | incy, | ||
float *const | A[], | ||
const int | lda, | ||
const size_t | batch_count, | ||
const std::vector< sycl::event > & | events | ||
) |
Definition at line 404 of file syclBLAS.cpp.
References qmcplusplus::Units::distance::A, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
sycl::event qmcplusplus::syclBLAS::ger_batched< std::complex< double > > | ( | sycl::queue & | handle, |
const int | m, | ||
const int | n, | ||
const std::complex< double > * | alpha, | ||
const std::complex< double > *const | x[], | ||
const int | incx, | ||
const std::complex< double > *const | y[], | ||
const int | incy, | ||
std::complex< double > *const | A[], | ||
const int | lda, | ||
const size_t | batch_count, | ||
const std::vector< sycl::event > & | events | ||
) |
Definition at line 456 of file syclBLAS.cpp.
References qmcplusplus::Units::distance::A, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
sycl::event qmcplusplus::syclBLAS::ger_batched< std::complex< float > > | ( | sycl::queue & | handle, |
const int | m, | ||
const int | n, | ||
const std::complex< float > * | alpha, | ||
const std::complex< float > *const | x[], | ||
const int | incx, | ||
const std::complex< float > *const | y[], | ||
const int | incy, | ||
std::complex< float > *const | A[], | ||
const int | lda, | ||
const size_t | batch_count, | ||
const std::vector< sycl::event > & | events | ||
) |
Definition at line 438 of file syclBLAS.cpp.
References qmcplusplus::Units::distance::A, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
sycl::event qmcplusplus::syclBLAS::ger_batched_impl | ( | sycl::queue & | handle, |
const int | m, | ||
const int | n, | ||
const T * | alpha, | ||
const T *const | x[], | ||
const int | incx, | ||
const T *const | y[], | ||
const int | incy, | ||
T *const | A[], | ||
const int | lda, | ||
const size_t | batch_count, | ||
const std::vector< sycl::event > & | events | ||
) |
Definition at line 361 of file syclBLAS.cpp.
References qmcplusplus::Units::distance::A, qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
sycl::event qmcplusplus::syclBLAS::transpose | ( | sycl::queue & | q, |
const T1 * | in, | ||
int | m, | ||
int | lda, | ||
T2 * | out, | ||
int | n, | ||
int | ldb, | ||
const std::vector< sycl::event > & | events = {} |
||
) |
sycl::event qmcplusplus::syclBLAS::transpose | ( | sycl::queue & | q, |
const T1 *restrict | in, | ||
int | m, | ||
int | lda, | ||
T2 *restrict | out, | ||
int | n, | ||
int | ldb, | ||
const std::vector< sycl::event > & | events | ||
) |
Definition at line 475 of file syclBLAS.cpp.
References qmcplusplus::lda, qmcplusplus::Units::distance::m, and qmcplusplus::n.
Referenced by syclSolverInverter< T_FP >::invert_transpose().
template sycl::event qmcplusplus::syclBLAS::transpose | ( | sycl::queue & | q, |
const float *restrict | in, | ||
int | m, | ||
int | lda, | ||
double *restrict | out, | ||
int | n, | ||
int | ldb, | ||
const std::vector< sycl::event > & | events | ||
) |
template sycl::event qmcplusplus::syclBLAS::transpose | ( | sycl::queue & | q, |
const double *restrict | in, | ||
int | m, | ||
int | lda, | ||
double *restrict | out, | ||
int | n, | ||
int | ldb, | ||
const std::vector< sycl::event > & | events | ||
) |
template sycl::event qmcplusplus::syclBLAS::transpose | ( | sycl::queue & | q, |
const std::complex< float > *restrict | in, | ||
int | m, | ||
int | lda, | ||
std::complex< double > *restrict | out, | ||
int | n, | ||
int | ldb, | ||
const std::vector< sycl::event > & | events | ||
) |
template sycl::event qmcplusplus::syclBLAS::transpose | ( | sycl::queue & | q, |
const std::complex< double > *restrict | in, | ||
int | m, | ||
int | lda, | ||
std::complex< double > *restrict | out, | ||
int | n, | ||
int | ldb, | ||
const std::vector< sycl::event > & | events | ||
) |