13 #ifndef QMCPLUSPLUS_CUBLAS_MISSING_FUNCTIONS_H 14 #define QMCPLUSPLUS_CUBLAS_MISSING_FUNCTIONS_H 52 const float*
const A[],
54 const float*
const x[],
59 const int batch_count);
66 const double*
const A[],
68 const double*
const x[],
73 const int batch_count);
79 const std::complex<float>* alpha,
80 const std::complex<float>*
const A[],
82 const std::complex<float>*
const x[],
84 const std::complex<float>* beta,
85 std::complex<float>*
const y[],
87 const int batch_count);
93 const std::complex<double>* alpha,
94 const std::complex<double>*
const A[],
96 const std::complex<double>*
const x[],
98 const std::complex<double>* beta,
99 std::complex<double>*
const y[],
101 const int batch_count);
120 const float*
const x[],
122 const float*
const y[],
126 const int batch_count);
132 const double*
const x[],
134 const double*
const y[],
138 const int batch_count);
143 const std::complex<float>* alpha,
144 const std::complex<float>*
const x[],
146 const std::complex<float>*
const y[],
148 std::complex<float>*
const A[],
150 const int batch_count);
155 const std::complex<double>* alpha,
156 const std::complex<double>*
const x[],
158 const std::complex<double>*
const y[],
160 std::complex<double>*
const A[],
162 const int batch_count);
176 const float*
const in[],
180 const int batch_count);
184 const double*
const in[],
188 const int batch_count);
192 const std::complex<float>*
const in[],
194 std::complex<float>*
const out[],
196 const int batch_count);
200 const std::complex<double>*
const in[],
202 std::complex<double>*
const out[],
204 const int batch_count);
209 #endif // QMCPLUSPLUS_CUBLAS_MISSING_FUNCTIONS_H helper functions for EinsplineSetBuilder
handle CUDA/HIP runtime selection.
cudaError_t gemv_batched(cudaStream_t handle, const char trans, const int m, const int n, const float *alpha, const float *const A[], const int lda, const float *const x[], const int incx, const float *beta, float *const y[], const int incy, const int batch_count)
Xgemv batched API.
cudaError_t copy_batched(cudaStream_t hstream, const int n, const float *const in[], const int incx, float *const out[], const int incy, const int batch_count)
Xcopy batched API.
cudaError_t ger_batched(cudaStream_t handle, const int m, const int n, const float *alpha, const float *const x[], const int incx, const float *const y[], const int incy, float *const A[], const int lda, const int batch_count)
Xger batched API.