d5/dae/a00767_source.html

 //////////////////////////////////////////////////////////////////////////////////////
 // This file is distributed under the University of Illinois/NCSA Open Source License.
 // See LICENSE file in top directory for details.
 //
 // Copyright (c) 2021 QMCPACK developers.
 //
 // File developed by: Ye Luo, yeluo@anl.gov, Argonne National Laboratory
 //
 // File created by: Ye Luo, yeluo@anl.gov, Argonne National Laboratory
 //////////////////////////////////////////////////////////////////////////////////////


 #include "CUDAfill.hpp"
 #include <stdexcept>
 #include "CUDAruntime.hpp"

 namespace qmcplusplus
 {
 /** Fill n elements of device memory starting at ptr with value.
  *
  * Only the value-initialized T() is accepted as the fill value; the fill is
  * carried out as a byte-wise zeroing of n * sizeof(T) bytes.
  *
  * @param ptr   start of the memory region to fill
  * @param n     number of elements of type T to fill
  * @param value fill value, must compare equal to T()
  * @throws std::runtime_error if value differs from T()
  */
 template<typename T>
 void CUDAfill_n(T* ptr, size_t n, const T& value)
 {
   // cudaMemset writes one byte pattern everywhere, so only the T() fill can be honored.
   const bool is_unsupported_value = (value != T());
   if (is_unsupported_value)
   {
     throw std::runtime_error("CUDAfill_n doesn't support fill non T() values!");
   }

   // A region of all-zero bytes is relied upon to represent T() for the element types used here.
   const size_t num_bytes = n * sizeof(T);
   cudaErrorCheck(cudaMemset(ptr, 0, num_bytes), "Memset failed in CUDAfill_n!");
 }

 // Explicit instantiations of CUDAfill_n for every element type provided by this file.
 // Integral element types.
 template void CUDAfill_n<int>(int*, size_t, const int&);
 template void CUDAfill_n<size_t>(size_t*, size_t, const size_t&);

 // Real floating-point element types.
 template void CUDAfill_n<float>(float*, size_t, const float&);
 template void CUDAfill_n<double>(double*, size_t, const double&);

 // Complex floating-point element types.
 template void CUDAfill_n<std::complex<float>>(std::complex<float>*, size_t, const std::complex<float>&);
 template void CUDAfill_n<std::complex<double>>(std::complex<double>*, size_t, const std::complex<double>&);
 } // namespace qmcplusplus
cudaMemset
#define cudaMemset
Definition: cuda2hip.h:144

qmcplusplus
helper functions for EinsplineSetBuilder
Definition: Configuration.h:43

CUDAruntime.hpp
handle CUDA/HIP runtime selection.

qmcplusplus::CUDAfill_n< double >
template void CUDAfill_n< double >(double *ptr, size_t n, const double &value)

CUDAfill.hpp

qmcplusplus::CUDAfill_n< float >
template void CUDAfill_n< float >(float *ptr, size_t n, const float &value)

qmcplusplus::CUDAfill_n< size_t >
template void CUDAfill_n< size_t >(size_t *ptr, size_t n, const size_t &value)

qmcplusplus::cudaErrorCheck
cudaErrorCheck(cudaMemcpyAsync(dev_lu.data(), lu.data(), sizeof(decltype(lu)::value_type) *lu.size(), cudaMemcpyHostToDevice, hstream), "cudaMemcpyAsync failed copying log_values to device")

qmcplusplus::n
int n
Definition: test_cuBLAS_LU.cpp:216

qmcplusplus::CUDAfill_n
void CUDAfill_n(T *ptr, size_t n, const T &value)
fill device memory with a given value.
Definition: CUDAfill.cpp:20

qmcplusplus::CUDAfill_n< int >
template void CUDAfill_n< int >(int *ptr, size_t n, const int &value)