interface to cuBLAS_inhouse calls for different data types S/C/D/Z More...

Functions
template<typename T >
cudaError_t	copyAinvRow_saveGL_batched (cudaStream_t hstream, const int rowchanged, const int n, const T *const Ainv[], const int lda, T *const temp[], T *const rcopy[], const T *const phi_vgl_in[], const size_t phi_vgl_stride, T *const dphi_out[], T *const d2phi_out[], const int batch_count)
	helper function for SM-1 Fahy update: subtract one in temp; copy Ainv changed row to rcopy; save phi G and L as accept. More...

template<typename T >
cudaError_t	calcGradients_batched (cudaStream_t hstream, const int n, const T *const Ainvrow[], const T *const dpsiMrow[], T *const grads_now, const int batch_count)
	calculate gradients More...

template<typename T >
cudaError_t	add_delay_list_save_sigma_VGL_batched (cudaStream_t hstream, int *const delay_list[], const int rowchanged, const int delay_count, T *const binv[], const int binv_lda, const T *const ratio_inv, const T *const phi_vgl_in[], const size_t phi_vgl_stride, T *const phi_out[], T *const dphi_out[], T *const d2phi_out[], const int norb, const int n_accepted, const int batch_count)

template<typename T >
cudaError_t	applyW_batched (cudaStream_t hstream, const int *const delay_list[], const int delay_count, T *const tempMat[], const int lda, const int batch_count)

cudaError_t	print_delay_list_batched (cudaStream_t hstream, int *const delay_list[], const int delay_count, const int batch_count)

Detailed Description

interface to cuBLAS_inhouse calls for different data types S/C/D/Z

Function Documentation

cudaError_t qmcplusplus::CUDA::add_delay_list_save_sigma_VGL_batched	(	cudaStream_t	hstream,
		int *const	delay_list[],
		const int	rowchanged,
		const int	delay_count,
		T *const	binv[],
		const int	binv_lda,
		const T *const	ratio_inv,
		const T *const	phi_vgl_in[],
		const size_t	phi_vgl_stride,
		T *const	phi_out[],
		T *const	dphi_out[],
		T *const	d2phi_out[],
		const int	norb,
		const int	n_accepted,
		const int	batch_count
	)

cudaError_t qmcplusplus::CUDA::applyW_batched	(	cudaStream_t	hstream,
		const int *const	delay_list[],
		const int	delay_count,
		T *const	tempMat[],
		const int	lda,
		const int	batch_count
	)

cudaError_t qmcplusplus::CUDA::calcGradients_batched	(	cudaStream_t	hstream,
		const int	n,
		const T *const	Ainvrow[],
		const T *const	dpsiMrow[],
		T *const	grads_now,
		const int	batch_count
	)

calculate gradients

cudaError_t qmcplusplus::CUDA::copyAinvRow_saveGL_batched	(	cudaStream_t	hstream,
		const int	rowchanged,
		const int	n,
		const T *const	Ainv[],
		const int	lda,
		T *const	temp[],
		T *const	rcopy[],
		const T *const	phi_vgl_in[],
		const size_t	phi_vgl_stride,
		T *const	dphi_out[],
		T *const	d2phi_out[],
		const int	batch_count
	)

helper function for SM-1 Fahy update: subtract one in temp; copy Ainv changed row to rcopy; save phi G and L as accept.

cudaError_t qmcplusplus::CUDA::print_delay_list_batched	(	cudaStream_t	hstream,
		int *const	delay_list[],
		const int	delay_count,
		const int	batch_count
	)