da/db8/a00797_source.html

 //////////////////////////////////////////////////////////////////////////////////////
 // This file is distributed under the University of Illinois/NCSA Open Source License.
 // See LICENSE file in top directory for details.
 //
 // Copyright (c) 2021 QMCPACK developers.
 //
 // File developed by: Peter Doak, doakpw@ornl.gov, Oak Ridge National Lab
 //
 // Refactored from: OMPallocator.hpp
 //////////////////////////////////////////////////////////////////////////////////////
 // -*- C++ -*-
 /** @file
  */
 #ifndef QMCPLUSPLUS_DUAL_ALLOCATOR_H
 #define QMCPLUSPLUS_DUAL_ALLOCATOR_H

 #include <memory>
 #include <type_traits>
 #include <atomic>
 #include <exception>
 #include <stdexcept>
 #include "config.h"
 #include "allocator_traits.hpp"
 #include "PinnedAllocator.h"
 #if defined(ENABLE_CUDA)
 #include "CUDA/CUDAallocator.hpp"
 #elif defined(ENABLE_SYCL)
 #include "SYCL/SYCLallocator.hpp"
 #endif

 namespace qmcplusplus
 {
 /// Byte counter adjusted by DualAllocator::allocate/deallocate (n * sizeof(T) per call).
 /// Only declared here; the definition lives in another translation unit.
 extern std::atomic<size_t> dual_device_mem_allocated;

 /** Read the current value of the DualAllocator device-memory byte counter.
  *  @return snapshot of dual_device_mem_allocated at the time of the call.
  */
 inline size_t getDualDeviceMemAllocated()
 {
   // Explicit load; same default (sequentially consistent) ordering as the implicit conversion.
   return dual_device_mem_allocated.load();
 }

 /** Generalizes the DualMemorySpace allocator.
  *
  *  Every allocation made through this allocator creates a pair of buffers of the same
  *  element count: one from the HostAllocator (returned to the caller) and one from the
  *  DeviceAllocator (kept internally and reachable through get_device_ptr()).
  *
  *  This provides a limited alternative to OMPallocator for testing/benchmarking
  *  without depending on OMPTarget offload.
  *  It does not provide an alternative to OMPTarget transfer semantics, so many production
  *  objects will not be functional if it is used as the allocator for the data objects they
  *  depend on.
  *  If you use DualAllocator at this time you need to handle data transfer yourself.
  *
  *  An instance tracks a single device buffer at a time: calling allocate() again before
  *  deallocate() throws.
  *
  *  \tparam T                element type; must be the same as HostAllocator::value_type
  *  \tparam DeviceAllocator  allocator used for the device side buffer
  *  \tparam HostAllocator    allocator used for the host side buffer
  *
  *  \todo the OMPTarget allocation can be a "device" allocator comparable to CUDAAllocator
  *  Then OMPallocator can be replaced by a DualAllocator<T, OffloadAllocator<T>, PinnedAllocator<T>>
  */
 template<typename T, class DeviceAllocator, class HostAllocator = std::allocator<T>>
 struct DualAllocator : public HostAllocator
 {
   using Value        = typename HostAllocator::value_type;
   using Size         = typename HostAllocator::size_type;
   using Pointer      = typename HostAllocator::pointer;
   using ConstPointer = typename HostAllocator::const_pointer;

   /// A fresh allocator has no device buffer attached.
   DualAllocator() : device_ptr_(nullptr) {}

   /// Copies never share the source's device buffer; the new instance starts detached.
   DualAllocator(const DualAllocator&) : device_ptr_(nullptr) {}

   /** Assignment drops this instance's device pointer instead of taking over the source's.
    *  @return reference to this allocator
    */
   DualAllocator& operator=(const DualAllocator&)
   {
     device_ptr_ = nullptr;
     // The original fell off the end of a non-void function (undefined behaviour).
     return *this;
   }

   /// Converting construction from a DualAllocator of another type; starts detached as well.
   template<class U, class V>
   DualAllocator(const DualAllocator<U, V>&) : device_ptr_(nullptr)
   {}

   /// Rebinds the element type and the device allocator; the host allocator takes the
   /// class template's default (std::allocator<U>).
   template<class U, class V>
   struct rebind
   {
     using other = DualAllocator<U, V>;
   };

   /** Allocate n elements on the host and n elements on the device.
    *
    *  The device pointer is stored internally; dual_device_mem_allocated is increased by
    *  n * sizeof(T) once both allocations have succeeded.
    *
    *  @param n  number of elements
    *  @return   pointer to the host buffer
    *  @throws std::runtime_error if this instance already holds a device pointer
    *  @throws whatever the host or device allocator throws; if the device allocation fails the
    *          host buffer is released again before the exception propagates.
    */
   Value* allocate(std::size_t n)
   {
     static_assert(std::is_same<T, Value>::value, "DualAllocator and HostAllocator data types must agree!");
     if (device_ptr_ != nullptr)
       throw std::runtime_error("DualAllocator does not support device reallocation");
     Value* host_ptr = std::allocator_traits<HostAllocator>::allocate(allocator_, n);
     try
     {
       device_ptr_ = std::allocator_traits<DeviceAllocator>::allocate(device_allocator_, n);
     }
     catch (...)
     {
       // Do not leak the host buffer when the device side cannot be allocated.
       std::allocator_traits<HostAllocator>::deallocate(allocator_, host_ptr, n);
       throw;
     }
     dual_device_mem_allocated += n * sizeof(T);
     return host_ptr;
   }

   /** Release the host buffer pt together with the device buffer currently held.
    *
    *  Decreases dual_device_mem_allocated by n * sizeof(T) and resets the device pointer
    *  so that allocate() may be called again.
    *
    *  @param pt  host pointer to release (expected to come from allocate() on this instance)
    *  @param n   element count passed to both underlying deallocate calls
    */
   void deallocate(Value* pt, std::size_t n)
   {
     dual_device_mem_allocated -= n * sizeof(T);
     std::allocator_traits<DeviceAllocator>::deallocate(device_allocator_, device_ptr_, n);
     std::allocator_traits<HostAllocator>::deallocate(allocator_, pt, n);
     device_ptr_ = nullptr;
   }

   /** Make this allocator's device pointer refer into the device buffer of another allocator.
    *
    *  Nothing is allocated and the memory counter is not touched.
    *
    *  @param from        allocator whose device pointer is used as the base
    *  @param ptr_offset  offset, in elements, added to from's device pointer
    */
   void attachReference(const DualAllocator& from, std::ptrdiff_t ptr_offset)
   {
     // from is const only by interface; the stored pointer is used for writable access.
     device_ptr_ = const_cast<T*>(from.get_device_ptr()) + ptr_offset;
   }

   /// Device pointer currently held (nullptr when nothing is allocated or attached).
   T* get_device_ptr() { return device_ptr_; }
   const T* get_device_ptr() const { return device_ptr_; }

   /// Access to the device allocator instance owned by this object.
   DeviceAllocator& get_device_allocator() { return device_allocator_; }
   const DeviceAllocator& get_device_allocator() const { return device_allocator_; }

 private:
   /// allocator instance used for the host buffers
   HostAllocator allocator_;
   /// allocator instance used for the device buffers
   DeviceAllocator device_allocator_;
   /// device buffer paired with the most recent host allocation, or an attached reference
   T* device_ptr_;
 };

 /** qmc_allocator_traits specialization describing DualAllocator.
  *
  *  Marks the allocator as host accessible and dual space, and forwards the data movement
  *  helpers to the copy functions of the DualAllocator's device allocator.
  */
 template<typename T, class DeviceAllocator, class HostAllocator>
 struct qmc_allocator_traits<DualAllocator<T, DeviceAllocator, HostAllocator>>
 {
   using DualAlloc = DualAllocator<T, DeviceAllocator, HostAllocator>;

   static constexpr bool is_host_accessible = true;
   static constexpr bool is_dual_space      = true;

   /// Fill n elements starting at ptr with value, using the host allocator's traits.
   static void fill_n(T* ptr, size_t n, const T& value)
   {
     using HostTraits = qmc_allocator_traits<HostAllocator>;
     HostTraits::fill_n(ptr, n, value);
   }

   /// Let `to` reference the device memory of `from`, shifted by ptr_offset elements.
   static void attachReference(const DualAlloc& from, DualAlloc& to, std::ptrdiff_t ptr_offset)
   {
     to.attachReference(from, ptr_offset);
   }

   /** Update the device copy from the host copy.
    *
    *  Follows the OpenMP target convention: the caller names only the host side of the
    *  host_ptr/device_ptr pair, and the verb describes what happens on the device.
    *  Copies n elements from host_ptr + offset to the device pointer + offset.
    *
    *  Intended mainly for tests, to cut down on ifdef code and single "flavor" testing.
    *  It is a generic API and unlikely to be the best choice for performance critical
    *  transfers; needing it (or an ifdef) above the level of a xxxCUDA.cu or
    *  xxxOMPTarget.hpp file is a sign of a design issue.
    */
   static void updateTo(DualAlloc& alloc, T* host_ptr, size_t n, size_t offset = 0)
   {
     auto& dev_alloc = alloc.get_device_allocator();
     dev_alloc.copyToDevice(alloc.get_device_ptr() + offset, host_ptr + offset, n);
   }

   /** Update the host copy from the device copy.
    *
    *  Copies n elements from the device pointer + offset to host_ptr + offset.
    */
   static void updateFrom(DualAlloc& alloc, T* host_ptr, size_t n, size_t offset = 0)
   {
     auto& dev_alloc = alloc.get_device_allocator();
     dev_alloc.copyFromDevice(host_ptr + offset, alloc.get_device_ptr() + offset, n);
   }

   /** Copy n elements within the device buffer.
    *
    *  @param to    element index of the destination, relative to the device pointer
    *  @param n     number of elements
    *  @param from  element index of the source, relative to the device pointer
    */
   static void deviceSideCopyN(DualAlloc& alloc, size_t to, size_t n, size_t from)
   {
     T* base        = alloc.get_device_ptr();
     T* destination = base + to;
     T* source      = base + from;
     auto& dev_alloc = alloc.get_device_allocator();
     dev_alloc.copyDeviceToDevice(destination, n, source);
   }
 };

 } // namespace qmcplusplus

 #endif
qmcplusplus::qmc_allocator_traits::is_dual_space
static constexpr bool is_dual_space
Definition: allocator_traits.hpp:31

qmcplusplus::DualAllocator::DualAllocator
DualAllocator(const DualAllocator< U, V > &)
Definition: DualAllocator.hpp:62

qmcplusplus::DualAllocator
Generalizes the DualMemorySpace allocator This provides a limited alternative to OMPallocator for tes...
Definition: DualAllocator.hpp:48

qmcplusplus
helper functions for EinsplineSetBuilder
Definition: Configuration.h:43

qmcplusplus::qmc_allocator_traits< DualAllocator< T, DeviceAllocator, HostAllocator > >::deviceSideCopyN
static void deviceSideCopyN(DualAlloc &alloc, size_t to, size_t n, size_t from)
Definition: DualAllocator.hpp:144

qmcplusplus::DualAllocator::device_allocator_
DeviceAllocator device_allocator_
Definition: DualAllocator.hpp:103

qmcplusplus::qmc_allocator_traits< DualAllocator< T, DeviceAllocator, HostAllocator > >::fill_n
static void fill_n(T *ptr, size_t n, const T &value)
Definition: DualAllocator.hpp:114

qmcplusplus::DualAllocator::DualAllocator
DualAllocator()
Definition: DualAllocator.hpp:55

qmcplusplus::qmc_allocator_traits< DualAllocator< T, DeviceAllocator, HostAllocator > >::updateFrom
static void updateFrom(DualAlloc &alloc, T *host_ptr, size_t n, size_t offset=0)
update from the device, assumes you are copying starting with the device_ptr to the implicit host_ptr...
Definition: DualAllocator.hpp:139

qmcplusplus::Mallocator
Definition: Mallocator.hpp:25

qmcplusplus::qmc_allocator_traits< DualAllocator< T, DeviceAllocator, HostAllocator > >::attachReference
static void attachReference(const DualAlloc &from, DualAlloc &to, std::ptrdiff_t ptr_offset)
Definition: DualAllocator.hpp:116

CUDAallocator.hpp
this file provides three C++ memory allocators using CUDA specific memory allocation functions...

qmcplusplus::DualAllocator::get_device_allocator
const DeviceAllocator & get_device_allocator() const
Definition: DualAllocator.hpp:99

qmcplusplus::DualAllocator::rebind
Definition: DualAllocator.hpp:66

qmcplusplus::DualAllocator::DualAllocator
DualAllocator(const DualAllocator &)
Definition: DualAllocator.hpp:56

qmcplusplus::qmc_allocator_traits< DualAllocator< T, DeviceAllocator, HostAllocator > >::updateTo
static void updateTo(DualAlloc &alloc, T *host_ptr, size_t n, size_t offset=0)
update to the device, assumes you are copying starting with the implicit host_ptr.
Definition: DualAllocator.hpp:132

qmcplusplus::DualAllocator::Pointer
typename HostAllocator::pointer Pointer
Definition: DualAllocator.hpp:52

qmcplusplus::DualAllocator::attachReference
void attachReference(const DualAllocator &from, std::ptrdiff_t ptr_offset)
Definition: DualAllocator.hpp:90

qmcplusplus::qmc_allocator_traits::is_host_accessible
static constexpr bool is_host_accessible
Definition: allocator_traits.hpp:30

qmcplusplus::DualAllocator::device_ptr_
T * device_ptr_
Definition: DualAllocator.hpp:104

qmcplusplus::DualAllocator::get_device_allocator
DeviceAllocator & get_device_allocator()
Definition: DualAllocator.hpp:98

qmcplusplus::qmc_allocator_traits
template class analogous to std::allocator_traits.
Definition: allocator_traits.hpp:26

qmcplusplus::DualAllocator::get_device_ptr
const T * get_device_ptr() const
Definition: DualAllocator.hpp:96

qmcplusplus::getDualDeviceMemAllocated
size_t getDualDeviceMemAllocated()
Definition: DualAllocator.hpp:34

qmcplusplus::DualAllocator::ConstPointer
typename HostAllocator::const_pointer ConstPointer
Definition: DualAllocator.hpp:53

qmcplusplus::n
int n
Definition: test_cuBLAS_LU.cpp:216

qmcplusplus::dual_device_mem_allocated
std::atomic< size_t > dual_device_mem_allocated

SYCLallocator.hpp
this file provides three C++ memory allocators using SYCL specific memory allocation functions...

PinnedAllocator.h

allocator_traits.hpp

qmcplusplus::DualAllocator::Size
typename HostAllocator::size_type Size
Definition: DualAllocator.hpp:51

qmcplusplus::DualAllocator::deallocate
void deallocate(Value *pt, std::size_t n)
Definition: DualAllocator.hpp:82

qmcplusplus::DualAllocator::allocator_
HostAllocator allocator_
Definition: DualAllocator.hpp:102

qmcplusplus::DualAllocator::operator=
DualAllocator & operator=(const DualAllocator &)
Definition: DualAllocator.hpp:57

qmcplusplus::DualAllocator::Value
typename HostAllocator::value_type Value
Definition: DualAllocator.hpp:50

qmcplusplus::DualAllocator::allocate
Value * allocate(std::size_t n)
Definition: DualAllocator.hpp:71

qmcplusplus::DualAllocator::get_device_ptr
T * get_device_ptr()
Definition: DualAllocator.hpp:95

qmcplusplus::qmc_allocator_traits::fill_n
static void fill_n(value_type *ptr, size_t n, const value_type &value)
Definition: allocator_traits.hpp:33

qmcplusplus::value_type
QMCTraits::FullPrecRealType value_type
Definition: ObservableHelper.h:28