![]() |
QMCPACK
|
Go to the source code of this file.
Functions | |
void | applyW_stageV_cuda (const int *delay_list_gpu, const int delay_count, float *temp_gpu, const int numorbs, const int ndelay, float *V_gpu, const float *Ainv, cudaStream_t hstream) |
helper function for delayed update algorithm W matrix is applied and copy selected rows of Ainv into V More... | |
void | applyW_stageV_cuda (const int *delay_list_gpu, const int delay_count, std::complex< float > *temp_gpu, const int numorbs, const int ndelay, std::complex< float > *V_gpu, const std::complex< float > *Ainv, cudaStream_t hstream) |
void | applyW_stageV_cuda (const int *delay_list_gpu, const int delay_count, double *temp_gpu, const int numorbs, const int ndelay, double *V_gpu, const double *Ainv, cudaStream_t hstream) |
void | applyW_stageV_cuda (const int *delay_list_gpu, const int delay_count, std::complex< double > *temp_gpu, const int numorbs, const int ndelay, std::complex< double > *V_gpu, const std::complex< double > *Ainv, cudaStream_t hstream) |
void | make_identity_matrix_cuda (const int nrows, double *mat, const int lda, cudaStream_t hstream) |
create identity matrix on the device More... | |
void | make_identity_matrix_cuda (const int nrows, std::complex< double > *mat, const int lda, cudaStream_t hstream) |
void | extract_matrix_diagonal_cuda (const int nrows, const double *mat, const int lda, double *diag, cudaStream_t hstream) |
extract matrix diagonal More... | |
void | extract_matrix_diagonal_cuda (const int nrows, const std::complex< double > *mat, const int lda, std::complex< double > *diag, cudaStream_t hstream) |
void | copy_matrix_cuda (const int nrows, const int ncols, const double *mat_in, const int lda, float *mat_out, const int ldb, cudaStream_t hstream) |
copy matrix with precision difference More... | |
void | copy_matrix_cuda (const int nrows, const int ncols, const float *mat_in, const int lda, double *mat_out, const int ldb, cudaStream_t hstream) |
void | copy_matrix_cuda (const int nrows, const int ncols, const std::complex< double > *mat_in, const int lda, std::complex< float > *mat_out, const int ldb, cudaStream_t hstream) |
void | copy_matrix_cuda (const int nrows, const int ncols, const std::complex< float > *mat_in, const int lda, std::complex< double > *mat_out, const int ldb, cudaStream_t hstream) |
void applyW_stageV_cuda | ( | const int * | delay_list_gpu, |
const int | delay_count, | ||
float * | temp_gpu, | ||
const int | numorbs, | ||
const int | ndelay, | ||
float * | V_gpu, | ||
const float * | Ainv, | ||
cudaStream_t | hstream | ||
) |
helper function for delayed update algorithm W matrix is applied and copy selected rows of Ainv into V
Referenced by DelayedUpdateCUDA< T, T_FP >::updateInvMat().
void applyW_stageV_cuda | ( | const int * | delay_list_gpu, |
const int | delay_count, | ||
std::complex< float > * | temp_gpu, | ||
const int | numorbs, | ||
const int | ndelay, | ||
std::complex< float > * | V_gpu, | ||
const std::complex< float > * | Ainv, | ||
cudaStream_t | hstream | ||
) |
void applyW_stageV_cuda | ( | const int * | delay_list_gpu, |
const int | delay_count, | ||
double * | temp_gpu, | ||
const int | numorbs, | ||
const int | ndelay, | ||
double * | V_gpu, | ||
const double * | Ainv, | ||
cudaStream_t | hstream | ||
) |
void applyW_stageV_cuda | ( | const int * | delay_list_gpu, |
const int | delay_count, | ||
std::complex< double > * | temp_gpu, | ||
const int | numorbs, | ||
const int | ndelay, | ||
std::complex< double > * | V_gpu, | ||
const std::complex< double > * | Ainv, | ||
cudaStream_t | hstream | ||
) |
void copy_matrix_cuda | ( | const int | nrows, |
const int | ncols, | ||
const double * | mat_in, | ||
const int | lda, | ||
float * | mat_out, | ||
const int | ldb, | ||
cudaStream_t | hstream | ||
) |
copy matrix with precision difference
Referenced by cuSolverInverter< T_FP >::invert_transpose(), and rocSolverInverter< T_FP >::invert_transpose().
void copy_matrix_cuda | ( | const int | nrows, |
const int | ncols, | ||
const float * | mat_in, | ||
const int | lda, | ||
double * | mat_out, | ||
const int | ldb, | ||
cudaStream_t | hstream | ||
) |
void copy_matrix_cuda | ( | const int | nrows, |
const int | ncols, | ||
const std::complex< double > * | mat_in, | ||
const int | lda, | ||
std::complex< float > * | mat_out, | ||
const int | ldb, | ||
cudaStream_t | hstream | ||
) |
void copy_matrix_cuda | ( | const int | nrows, |
const int | ncols, | ||
const std::complex< float > * | mat_in, | ||
const int | lda, | ||
std::complex< double > * | mat_out, | ||
const int | ldb, | ||
cudaStream_t | hstream | ||
) |
void extract_matrix_diagonal_cuda | ( | const int | nrows, |
const double * | mat, | ||
const int | lda, | ||
double * | diag, | ||
cudaStream_t | hstream | ||
) |
extract matrix diagonal
Referenced by cuSolverInverter< T_FP >::invert_transpose(), and rocSolverInverter< T_FP >::invert_transpose().
void extract_matrix_diagonal_cuda | ( | const int | nrows, |
const std::complex< double > * | mat, | ||
const int | lda, | ||
std::complex< double > * | diag, | ||
cudaStream_t | hstream | ||
) |
void make_identity_matrix_cuda | ( | const int | nrows, |
double * | mat, | ||
const int | lda, | ||
cudaStream_t | hstream | ||
) |
create identity matrix on the device
Referenced by cuSolverInverter< T_FP >::invert_transpose(), and rocSolverInverter< T_FP >::invert_transpose().
void make_identity_matrix_cuda | ( | const int | nrows, |
std::complex< double > * | mat, | ||
const int | lda, | ||
cudaStream_t | hstream | ||
) |