13 #ifndef CUDA_MATRIX_UPDATE_HELPER_H 14 #define CUDA_MATRIX_UPDATE_HELPER_H 18 #include <cuda_runtime_api.h> 20 #include <hip/hip_runtime.h> 39 const T*
const Ainv[],
43 const T*
const phi_vgl_in[],
44 const size_t phi_vgl_stride,
47 const int batch_count);
54 const T*
const Ainvrow[],
55 const T*
const dpsiMrow[],
57 const int batch_count);
61 int*
const delay_list[],
63 const int delay_count,
66 const T*
const ratio_inv,
67 const T*
const phi_vgl_in[],
68 const size_t phi_vgl_stride,
74 const int batch_count);
78 const int*
const delay_list[],
79 const int delay_count,
82 const int batch_count);
85 int*
const delay_list[],
86 const int delay_count,
87 const int batch_count);
helper functions for EinsplineSetBuilder
cudaError_t print_delay_list_batched(cudaStream_t hstream, int *const delay_list[], const int delay_count, const int batch_count)
cudaError_t add_delay_list_save_sigma_VGL_batched(cudaStream_t hstream, int *const delay_list[], const int rowchanged, const int delay_count, T *const binv[], const int binv_lda, const T *const ratio_inv, const T *const phi_vgl_in[], const size_t phi_vgl_stride, T *const phi_out[], T *const dphi_out[], T *const d2phi_out[], const int norb, const int n_accepted, const int batch_count)
cudaError_t calcGradients_batched(cudaStream_t hstream, const int n, const T *const Ainvrow[], const T *const dpsiMrow[], T *const grads_now, const int batch_count)
calculate gradients
cudaError_t applyW_batched(cudaStream_t hstream, const int *const delay_list[], const int delay_count, T *const tempMat[], const int lda, const int batch_count)
cudaError_t copyAinvRow_saveGL_batched(cudaStream_t hstream, const int rowchanged, const int n, const T *const Ainv[], const int lda, T *const temp[], T *const rcopy[], const T *const phi_vgl_in[], const size_t phi_vgl_stride, T *const dphi_out[], T *const d2phi_out[], const int batch_count)
Helper function for the SM-1 Fahy update: subtract one in temp; copy the changed row of Ainv to rcopy; save phi G a...