d5/d12/a01799_source.html

 //////////////////////////////////////////////////////////////////////////////////////
 // This file is distributed under the University of Illinois/NCSA Open Source License.
 // See LICENSE file in top directory for details.
 //
 // Copyright (c) 2021 QMCPACK developers.
 //
 // File developed by: Jeongnim Kim, jeongnim.kim@intel.com, Intel Corp.
 //                    Amrita Mathuriya, amrita.mathuriya@intel.com, Intel Corp.
 //                    Ye Luo, yeluo@anl.gov, Argonne National Laboratory
 //
 // File created by: Jeongnim Kim, jeongnim.kim@intel.com, Intel Corp.
 //////////////////////////////////////////////////////////////////////////////////////
 // -*- C++ -*-


 #include "TwoBodyJastrow.h"
 #include "CPU/SIMD/algorithm.hpp"
 #include "SoaDistanceTableABOMPTarget.h"
 #include "ResourceCollection.h"
 #include "ParticleBase/ParticleAttribOps.h"

 namespace qmcplusplus
 {

 /** Scratch memory shared by the walkers of one multi-walker batch of TwoBodyJastrow.
  *
  * An instance is registered by TwoBodyJastrow::createResource() and reached through the leader's
  * mw_mem_handle_ between acquireResource() and releaseResource().
  * @tparam T element type of the value/derivative buffers
  */
 template<typename T>
 struct TwoBodyJastrowMultiWalkerMem : public Resource
 {
   // fused buffer for fast transfer in mw_accept
   Vector<char, OffloadPinnedAllocator<char>> mw_update_buffer;
   // fused buffer for fast transfer in mw_ratioGrad
   Vector<char, OffloadPinnedAllocator<char>> mw_ratiograd_buffer;
   // fused buffer for fast transfer (handed to FT::mw_evaluateV by mw_evaluateRatios)
   Vector<char, OffloadPinnedAllocator<char>> transfer_buffer;
   // multi walker result (one value per virtual particle in mw_evaluateRatios)
   Vector<T, OffloadPinnedAllocator<T>> mw_vals;
   // multi walker result for V and G, resized to [Nw][DIM + 2] by mw_calcRatio/mw_ratioGrad
   Matrix<T, OffloadPinnedAllocator<T>> mw_vgl;
   /// memory pool for Uat, dUat, d2Uat [Nw][N_padded] + [Nw][DIM][N_padded] + [Nw][N_padded]
   Vector<T, OffloadPinnedAllocator<T>> mw_allUat;
   /// memory pool for cur_u, cur_du, cur_d2u [3][Nw][N_padded]. 3 is for value, first and second derivatives.
   Vector<T, OffloadPinnedAllocator<T>> mw_cur_allu;

   /// Construct an empty resource registered under the name "TwoBodyJastrowMultiWalkerMem".
   TwoBodyJastrowMultiWalkerMem() : Resource("TwoBodyJastrowMultiWalkerMem") {}

   /// Copying delegates to the default constructor: the copy starts with empty buffers, no contents are duplicated.
   TwoBodyJastrowMultiWalkerMem(const TwoBodyJastrowMultiWalkerMem&) : TwoBodyJastrowMultiWalkerMem() {}

   /// Clone through the copy constructor above, i.e. the clone is an empty resource of the same type.
   std::unique_ptr<Resource> makeClone() const override { return std::make_unique<TwoBodyJastrowMultiWalkerMem>(*this); }
 };

 /// Add a fresh, empty multi-walker scratch resource for this Jastrow to \p collection.
 template<typename FT>
 void TwoBodyJastrow<FT>::createResource(ResourceCollection& collection) const
 {
   auto mw_mem = std::make_unique<TwoBodyJastrowMultiWalkerMem<RealType>>();
   collection.addResource(std::move(mw_mem));
 }

 /** Borrow the shared multi-walker memory and re-home every walker's Uat, dUat and d2Uat in it.
  *
  * The leader takes a TwoBodyJastrowMultiWalkerMem from \p collection. Its mw_allUat pool is sized to
  * N_padded * (DIM + 2) * nw and used as three consecutive sections:
  * Uat [nw][N_padded], dUat [nw][DIM][N_padded], d2Uat [nw][N_padded].
  * For each walker the current values are copied into its slot, the walker-local storage is freed
  * and the walker's container is attached to the slot. mw_cur_allu is sized to N_padded * 3 * nw.
  * @param collection resource collection lending the multi-walker memory
  * @param wfc_list walkers (with leader) whose storage is moved into the shared pool
  */
 template<typename FT>
 void TwoBodyJastrow<FT>::acquireResource(ResourceCollection& collection,
                                          const RefVectorWithLeader<WaveFunctionComponent>& wfc_list) const
 {
   auto& leader             = wfc_list.getCastedLeader<TwoBodyJastrow<FT>>();
   leader.mw_mem_handle_    = collection.lendResource<TwoBodyJastrowMultiWalkerMem<RealType>>();
   const size_t num_walkers = wfc_list.size();
   auto& pool               = leader.mw_mem_handle_.getResource().mw_allUat;
   pool.resize(N_padded * (DIM + 2) * num_walkers);

   // start of each section inside the pool; valid for the whole loop because the pool is not resized again
   auto* const uat_section   = pool.data();
   auto* const duat_section  = pool.data() + num_walkers * N_padded;
   auto* const d2uat_section = pool.data() + num_walkers * N_padded * (DIM + 1);

   for (size_t iw = 0; iw < num_walkers; iw++)
   {
     auto& walker = wfc_list.getCastedElement<TwoBodyJastrow<FT>>(iw);

     // Uat: copy into the slot through a view, drop local storage, then alias the slot
     auto* const uat_slot = uat_section + iw * N_padded;
     Vector<valT, aligned_allocator<valT>> uat_slot_view(uat_slot, N);
     uat_slot_view = walker.Uat;
     walker.Uat.free();
     walker.Uat.attachReference(uat_slot, N);

     // dUat: same procedure, DIM rows of N_padded elements per walker
     auto* const duat_slot = duat_section + iw * N_padded * DIM;
     VectorSoaContainer<valT, DIM, aligned_allocator<valT>> duat_slot_view(duat_slot, N, N_padded);
     duat_slot_view = walker.dUat;
     walker.dUat.free();
     walker.dUat.attachReference(N, N_padded, duat_slot);

     // d2Uat: same procedure
     auto* const d2uat_slot = d2uat_section + iw * N_padded;
     Vector<valT, aligned_allocator<valT>> d2uat_slot_view(d2uat_slot, N);
     d2uat_slot_view = walker.d2Uat;
     walker.d2Uat.free();
     walker.d2Uat.attachReference(d2uat_slot, N);
   }
   leader.mw_mem_handle_.getResource().mw_cur_allu.resize(N_padded * 3 * num_walkers);
 }

 /** Move every walker's Uat, dUat and d2Uat back to walker-owned storage and return the shared memory.
  *
  * For each walker, the walker's container is released from the shared pool, resized to own N
  * elements and filled from the walker's slot in mw_allUat (same layout as in acquireResource()).
  * Finally the leader's resource handle is given back to \p collection.
  * @param collection resource collection taking the multi-walker memory back
  * @param wfc_list walkers (with leader) whose storage currently aliases the shared pool
  */
 template<typename FT>
 void TwoBodyJastrow<FT>::releaseResource(ResourceCollection& collection,
                                          const RefVectorWithLeader<WaveFunctionComponent>& wfc_list) const
 {
   auto& leader             = wfc_list.getCastedLeader<TwoBodyJastrow<FT>>();
   const size_t num_walkers = wfc_list.size();
   auto& pool               = leader.mw_mem_handle_.getResource().mw_allUat;

   // start of each section inside the pool
   auto* const uat_section   = pool.data();
   auto* const duat_section  = pool.data() + num_walkers * N_padded;
   auto* const d2uat_section = pool.data() + num_walkers * N_padded * (DIM + 1);

   for (size_t iw = 0; iw < num_walkers; iw++)
   {
     auto& walker = wfc_list.getCastedElement<TwoBodyJastrow<FT>>(iw);

     // Uat: view the slot, give the walker its own storage, copy the slot content into it
     Vector<valT, aligned_allocator<valT>> uat_slot_view(uat_section + iw * N_padded, N);
     walker.Uat.free();
     walker.Uat.resize(N);
     walker.Uat = uat_slot_view;

     // dUat
     VectorSoaContainer<valT, DIM, aligned_allocator<valT>> duat_slot_view(duat_section + iw * N_padded * DIM, N,
                                                                           N_padded);
     walker.dUat.free();
     walker.dUat.resize(N);
     walker.dUat = duat_slot_view;

     // d2Uat
     Vector<valT, aligned_allocator<valT>> d2uat_slot_view(d2uat_section + iw * N_padded, N);
     walker.d2Uat.free();
     walker.d2Uat.resize(N);
     walker.d2Uat = d2uat_slot_view;
   }
   collection.takebackResource(leader.mw_mem_handle_);
 }

 /// Append a reference to every uniquely owned pair functor (the values of J2Unique) to \p opt_obj_refs.
 template<typename FT>
 void TwoBodyJastrow<FT>::extractOptimizableObjectRefs(UniqueOptObjRefs& opt_obj_refs)
 {
   for (auto& unique_entry : J2Unique)
     opt_obj_refs.push_back(*unique_entry.second);
 }

 /** Rebuild myVars from the unique functors against \p active and compute the per-functor ranges in OffSet.
  *
  * Each unique functor first resolves its own variable indices against \p active; the union is
  * collected in myVars, inactive entries are removed and the indices resolved again.
  * When at least one variable remains, OffSet[i] receives, for every entry of F, the half-open range
  * [first, second) of that functor's variables relative to the first active index found in myVars,
  * or (-1, -1) when the entry is empty or has no variables.
  * @param active the set of active optimizable variables
  */
 template<typename FT>
 void TwoBodyJastrow<FT>::checkOutVariables(const opt_variables_type& active)
 {
   myVars.clear();
   for (auto& unique_entry : J2Unique)
   {
     auto& functor_vars = unique_entry.second->myVars;
     functor_vars.getIndex(active);
     myVars.insertFrom(functor_vars);
   }
   // Drop inactive variables so that the index mapping below is correct
   myVars.removeInactive();
   myVars.getIndex(active);

   const size_t num_vars = myVars.size();
   if (num_vars == 0)
     return;

   OffSet.resize(F.size());

   // The first index different from -1 is the starting offset (stays -1 if there is none)
   int first_active = -1;
   for (int i = 0; i < myVars.size() && first_active == -1; i++)
     first_active = myVars.Index[i];

   for (int i = 0; i < F.size(); ++i)
   {
     auto& range = OffSet[i];
     if (F[i] != nullptr && F[i]->myVars.Index.size() != 0)
     {
       const auto& functor_indices = F[i]->myVars.Index;
       range.first                 = functor_indices.front() - first_active;
       range.second                = functor_indices.size() + range.first;
     }
     else
       range.first = range.second = -1;
   }
 }

 /** Compute the wavefunction ratio for every virtual position of \p VP.
  *
  * ratios[k] = exp(Uat[ref] - U_k), where ref is VP.refPtcl and U_k is computeU() evaluated with
  * row k of the virtual particle set's AB distance table.
  * @param VP virtual particle set built around one reference particle
  * @param ratios output, one entry per virtual position; its size determines how many rows are evaluated
  */
 template<typename FT>
 void TwoBodyJastrow<FT>::evaluateRatios(const VirtualParticleSet& VP, std::vector<ValueType>& ratios)
 {
   const auto& ref_pset = VP.getRefPS();
   const auto& vp_table = VP.getDistTableAB(my_table_ID_);
   for (int k = 0; k < ratios.size(); ++k)
   {
     const auto u_virtual = computeU(ref_pset, VP.refPtcl, vp_table.getDistRow(k));
     ratios[k]            = std::exp(Uat[VP.refPtcl] - u_virtual);
   }
 }

 /** Multi-walker evaluation of virtual-move ratios.
  *
  * Without offload this forwards to WaveFunctionComponent::mw_evaluateRatios. Otherwise the values at
  * all virtual positions of all walkers are computed by a single FT::mw_evaluateV call into mw_vals,
  * and ratios[iw][k] = exp(Uat[ref] - value) is formed per walker on the host.
  * @param wfc_list walkers (with leader) of this component
  * @param vp_list virtual particle sets, one per walker
  * @param ratios output, ratios[iw][k] for virtual position k of walker iw
  */
 template<typename FT>
 void TwoBodyJastrow<FT>::mw_evaluateRatios(const RefVectorWithLeader<WaveFunctionComponent>& wfc_list,
                                            const RefVectorWithLeader<const VirtualParticleSet>& vp_list,
                                            std::vector<std::vector<ValueType>>& ratios) const
 {
   if (!use_offload_)
   {
     WaveFunctionComponent::mw_evaluateRatios(wfc_list, vp_list, ratios);
     return;
   }

   // return early on an empty list so that vp_list[0] below is never accessed
   if (wfc_list.size() == 0)
     return;

   auto& wfc_leader       = wfc_list.getCastedLeader<TwoBodyJastrow<FT>>();
   auto& vp_leader        = vp_list.getLeader();
   const auto& ref_ptcls  = vp_leader.getMultiWalkerRefPctls();
   auto& mw_mem           = wfc_leader.mw_mem_handle_.getResource();
   auto& vp_values        = mw_mem.mw_vals;
   const int num_walkers  = wfc_list.size();
   const size_t total_vps = ref_ptcls.size();
   vp_values.resize(total_vps);

   // The spin group of refPtcl is needed. vp_leader is not necessarily a member of the list,
   // so refPtcl must be read from element [0].
   const int igt = vp_leader.getRefPS().getGroupID(vp_list[0].refPtcl);
   const auto& dt_leader(vp_leader.getDistTableAB(wfc_leader.my_table_ID_));

   FT::mw_evaluateV(NumGroups, F.data() + igt * NumGroups, wfc_leader.N, grp_ids.data(), total_vps, ref_ptcls.data(),
                    dt_leader.getMultiWalkerDataPtr(), dt_leader.getPerTargetPctlStrideSize(), vp_values.data(),
                    mw_mem.transfer_buffer);

   // ivp runs over the virtual particles of all walkers in order
   size_t ivp = 0;
   for (int iw = 0; iw < num_walkers; ++iw)
   {
     const VirtualParticleSet& vp = vp_list[iw];
     const auto& walker           = wfc_list.getCastedElement<TwoBodyJastrow<FT>>(iw);
     auto& walker_ratios          = ratios[iw];
     for (int k = 0; k < vp.getTotalNum(); ++k, ivp++)
       walker_ratios[k] = std::exp(walker.Uat[ref_ptcls[ivp]] - vp_values[ivp]);
   }
   assert(ivp == total_vps);
 }

 /** Reserve space for Uat, dUat and d2Uat in the walker buffer.
  *
  * On the first call (Bytes_in_WFBuffer == 0) the three containers are added to \p buf, the number of
  * bytes they occupy is recorded in Bytes_in_WFBuffer and the local storage is freed.
  * On later calls the buffer cursor is simply advanced by the recorded size.
  * @param P unused
  * @param buf walker buffer
  */
 template<typename FT>
 void TwoBodyJastrow<FT>::registerData(ParticleSet& P, WFBufferType& buf)
 {
   if (Bytes_in_WFBuffer != 0)
   {
     // already registered: only skip over our section
     buf.forward(Bytes_in_WFBuffer);
     return;
   }

   // temporarily holds the start position, replaced by the section size below
   Bytes_in_WFBuffer = buf.current();
   buf.add(Uat.begin(), Uat.end());
   buf.add(dUat.data(), dUat.end());
   buf.add(d2Uat.begin(), d2Uat.end());
   Bytes_in_WFBuffer = buf.current() - Bytes_in_WFBuffer;

   // the data now lives in the buffer; release the local copies
   Uat.free();
   dUat.free();
   d2Uat.free();
 }

 /** Attach Uat, dUat and d2Uat to storage lent by the walker buffer.
  *
  * The three sections are requested in the order Uat (N), dUat (N_padded * DIM), d2Uat (N).
  * @param P unused
  * @param buf walker buffer lending the storage
  */
 template<typename FT>
 void TwoBodyJastrow<FT>::copyFromBuffer(ParticleSet& P, WFBufferType& buf)
 {
   const auto uat_storage = buf.lendReference<valT>(N);
   Uat.attachReference(uat_storage, N);

   const auto duat_storage = buf.lendReference<valT>(N_padded * DIM);
   dUat.attachReference(N, N_padded, duat_storage);

   const auto d2uat_storage = buf.lendReference<valT>(N);
   d2Uat.attachReference(d2uat_storage, N);
 }

 /** Accumulate this component's gradient/Laplacian into P.G / P.L and skip its section of the buffer.
  * @param P particle set whose G and L receive the contribution
  * @param buf walker buffer; its cursor is advanced by Bytes_in_WFBuffer
  * @param fromscratch unused
  * @return the updated log_value_
  */
 template<typename FT>
 typename TwoBodyJastrow<FT>::LogValue TwoBodyJastrow<FT>::updateBuffer(ParticleSet& P,
                                                                        WFBufferType& buf,
                                                                        bool fromscratch)
 {
   auto& gradients  = P.G;
   auto& laplacians = P.L;
   log_value_       = computeGL(gradients, laplacians);
   buf.forward(Bytes_in_WFBuffer);
   return log_value_;
 }

 /** Sum the pair-function values between particle \p iat and all particles, group by group.
  *
  * Group pairs without an assigned functor (nullptr entry in F) are skipped.
  * @param P particle set providing group IDs and group ranges
  * @param iat particle index
  * @param dist distances passed on to the functors
  * @return the accumulated value
  */
 template<typename FT>
 typename TwoBodyJastrow<FT>::valT TwoBodyJastrow<FT>::computeU(const ParticleSet& P, int iat, const DistRow& dist)
 {
   valT u_sum(0);
   const int group_row = P.GroupID[iat] * NumGroups;
   for (int jg = 0; jg < NumGroups; ++jg)
   {
     const FuncType* pair_functor = F[group_row + jg];
     if (pair_functor == nullptr)
       continue;
     const int group_begin = P.first(jg);
     const int group_end   = P.last(jg);
     u_sum += pair_functor->evaluateV(iat, group_begin, group_end, dist.data(), DistCompressed.data());
   }
   return u_sum;
 }

 /** Contract per-particle first derivatives with the displacement components.
  *
  * For each of the ndim dimensions, grad[idim] = sum over jat in [0, N) of du[jat] * displ(idim)[jat].
  * @param du array of at least N first-derivative values; declared aligned to QMC_SIMD_ALIGNMENT
  * @param displ displacement row in SoA layout
  * @return the accumulated vector
  */
 template<typename FT>
 typename TwoBodyJastrow<FT>::posT TwoBodyJastrow<FT>::accumulateG(const valT* restrict du, const DisplRow& displ) const
 {
   posT grad;
   for (int idim = 0; idim < ndim; ++idim)
   {
     const valT* restrict dx_component = displ.data(idim);
     valT component_sum(0);

 #pragma omp simd reduction(+ : component_sum) aligned(du, dx_component : QMC_SIMD_ALIGNMENT)
     for (int jat = 0; jat < N; ++jat)
       component_sum += du[jat] * dx_component[jat];
     grad[idim] = component_sum;
   }
   return grad;
 }

 /** Construct a two-body Jastrow for particle set \p p.
  *
  * Registers (or looks up) the AA distance table via p.addTable(p), allocates an all-null functor
  * table F of NumGroups x NumGroups entries, records the group of every particle in grp_ids and
  * sizes the internal storage.
  * @param obj_name name of this component; must not be empty
  * @param p target particle set
  * @param use_offload whether the multi-walker functions use the offload code path
  * @throws std::runtime_error if the object name is empty
  */
 template<typename FT>
 TwoBodyJastrow<FT>::TwoBodyJastrow(const std::string& obj_name, ParticleSet& p, bool use_offload)
     : WaveFunctionComponent(obj_name),
       N(p.getTotalNum()),
       NumGroups(p.groups()),
       ndim(p.getLattice().ndim),
       lapfac(ndim - RealType(1)),
       use_offload_(use_offload),
       N_padded(getAlignedSize<valT>(N)),
       my_table_ID_(p.addTable(p)),
       j2_ke_corr_helper(p, F)
 {
   if (my_name_.empty())
     throw std::runtime_error("TwoBodyJastrow object name cannot be empty!");

   F.resize(NumGroups * NumGroups, nullptr);

   // grp_ids[i] is the group of the i-th particle when walking the groups in order
   grp_ids.resize(N);
   int filled = 0;
   for (int ig = 0; ig < NumGroups; ig++)
     for (int j = p.first(ig); j < p.last(ig); j++, filled++)
       grp_ids[filled] = ig;
   assert(filled == N);
   grp_ids.updateTo();

   resizeInternalStorage();

   KEcorr = 0.0;
 }

 /// Defaulted destructor, defined out of line in this implementation file.
 template<typename FT>
 TwoBodyJastrow<FT>::~TwoBodyJastrow() = default;

 /// Emit a warning when at least one group pair has no functor assigned (nullptr entry in F).
 template<typename FT>
 void TwoBodyJastrow<FT>::checkSanity() const
 {
   const bool all_pairs_covered =
       std::none_of(F.begin(), F.end(), [](const auto* functor) { return functor == nullptr; });
   if (all_pairs_covered)
     return;

   app_warning() << "Two-body Jastrow \"" << my_name_ << "\" doesn't cover all the particle pairs. "
                 << "Consider fusing multiple entries if they are of the same type for optimal code performance."
                 << std::endl;
 }

 /// Size all per-particle containers (persistent values, scratch for the current/old position, distance scratch) to N.
 template<typename FT>
 void TwoBodyJastrow<FT>::resizeInternalStorage()
 {
   // persistent per-particle value, gradient and Laplacian
   Uat.resize(N);
   dUat.resize(N);
   d2Uat.resize(N);

   // scratch for the proposed (cur_*) and the old (old_*) position: value, first and second derivative
   cur_u.resize(N);
   old_u.resize(N);
   cur_du.resize(N);
   old_du.resize(N);
   cur_d2u.resize(N);
   old_d2u.resize(N);

   // scratch handed to the functors
   DistCompressed.resize(N);
   DistIndice.resize(N);
 }

 /** Register pair functor \p j for the group pair (\p ia, \p ib) and take ownership of it.
  *
  * - ia != ib: the functor is assigned to both (ia, ib) and (ib, ia); when every group holds exactly
  *   one particle (N == NumGroups) it is additionally assigned to all diagonal entries.
  * - ia == ib == 0: the functor fills every entry of F that is still empty.
  * - ia == ib != 0: the functor is assigned to the diagonal entry (ia, ia).
  * Ownership is stored in J2Unique under the key formed by writing ia followed by ib.
  * @param ia first group index, must be < NumGroups
  * @param ib second group index, must be < NumGroups
  * @param j the functor
  */
 template<typename FT>
 void TwoBodyJastrow<FT>::addFunc(int ia, int ib, std::unique_ptr<FT> j)
 {
   assert(ia < NumGroups);
   assert(ib < NumGroups);

   FT* const functor = j.get();
   if (ia != ib)
   {
     // a very special case, 1 particle of each type (e.g. 1 up + 1 down)
     // uu/dd/etc. was prevented by the builder
     if (N == NumGroups)
       for (int ig = 0; ig < NumGroups; ++ig)
         F[ig * NumGroups + ig] = functor;
     // generic case: symmetric assignment
     F[ia * NumGroups + ib] = functor;
     F[ib * NumGroups + ia] = functor;
   }
   else if (ia == 0)
   {
     // first same-group functor: use it for every pair that has nothing assigned yet
     const int num_pairs = NumGroups * NumGroups;
     for (int ij = 0; ij < num_pairs; ++ij)
       if (F[ij] == nullptr)
         F[ij] = functor;
   }
   else
     F[ia * NumGroups + ib] = functor;

   std::stringstream pair_name;
   pair_name << ia << ib;
   J2Unique[pair_name.str()] = std::move(j);
 }

 /** Create a copy of this Jastrow bound to particle set \p tqp.
  *
  * The upper triangle (jg >= ig) of F is scanned; each distinct functor is copied once and registered
  * in the clone through addFunc() at the first group pair where it is encountered.
  * KEcorr, myVars and OffSet are copied to the clone as well.
  * @param tqp particle set the clone operates on
  * @return the clone
  */
 template<typename FT>
 std::unique_ptr<WaveFunctionComponent> TwoBodyJastrow<FT>::makeClone(ParticleSet& tqp) const
 {
   auto clone = std::make_unique<TwoBodyJastrow<FT>>(my_name_, tqp, use_offload_);

   // original functor -> its copy; used to copy every shared functor only once
   std::map<const FT*, FT*> cloned_functors;
   for (int ig = 0; ig < NumGroups; ++ig)
     for (int jg = ig; jg < NumGroups; ++jg)
     {
       FT* const source_functor = F[ig * NumGroups + jg];
       if (source_functor == nullptr)
         continue;
       if (cloned_functors.find(source_functor) != cloned_functors.end())
         continue;

       auto functor_copy               = std::make_unique<FT>(*source_functor);
       cloned_functors[source_functor] = functor_copy.get();
       clone->addFunc(ig, jg, std::move(functor_copy));
     }

   clone->KEcorr = KEcorr;
   clone->myVars.clear();
   clone->myVars.insertFrom(myVars);
   clone->OffSet = OffSet;

   return clone;
 }

 /** internal function to compute, per partner particle j, \f$u(r_j), du/dr, d2u/dr2\f$ for particle iat
  *
  * The first jelmax entries of the three output arrays are zeroed and then filled group by group
  * through the functors' evaluateVGL; group pairs without a functor are skipped.
  * @param P particleset
  * @param iat particle index
  * @param dist distances passed on to the functors
  * @param u output values
  * @param du output first derivatives
  * @param d2u output second derivatives
  * @param triangle if true only partners j < iat are processed (jelmax = iat), otherwise all N
  */
 template<typename FT>
 void TwoBodyJastrow<FT>::computeU3(const ParticleSet& P,
                                    int iat,
                                    const DistRow& dist,
                                    RealType* restrict u,
                                    RealType* restrict du,
                                    RealType* restrict d2u,
                                    bool triangle)
 {
   const int jelmax = triangle ? iat : N;
   const valT zero(0);
   std::fill_n(u, jelmax, zero);
   std::fill_n(du, jelmax, zero);
   std::fill_n(d2u, jelmax, zero);

   const int group_row = P.GroupID[iat] * NumGroups;
   for (int jg = 0; jg < NumGroups; ++jg)
   {
     const FuncType* pair_functor = F[group_row + jg];
     if (pair_functor == nullptr)
       continue;
     const int group_begin = P.first(jg);
     // clip the group range to the processed partners
     const int group_end = std::min(jelmax, P.last(jg));
     pair_functor->evaluateVGL(iat, group_begin, group_end, dist.data(), u, du, d2u, DistCompressed.data(),
                               DistIndice.data());
   }
 }

 /** Ratio for the proposed move of particle \p iat, value only.
  *
  * Stores the new value in cur_Uat and sets UpdateMode to ORB_PBYP_RATIO so that acceptMove()
  * knows the derivatives at the new position have not been computed.
  * @return exp(Uat[iat] - cur_Uat)
  */
 template<typename FT>
 typename TwoBodyJastrow<FT>::PsiValue TwoBodyJastrow<FT>::ratio(ParticleSet& P, int iat)
 {
   UpdateMode             = ORB_PBYP_RATIO;
   const auto& temp_dists = P.getDistTableAA(my_table_ID_).getTempDists();
   cur_Uat                = computeU(P, iat, temp_dists);
   return std::exp(static_cast<PsiValue>(Uat[iat] - cur_Uat));
 }

 /** Multi-walker ratio for the proposed move of particle \p iat.
  *
  * Without offload this forwards to WaveFunctionComponent::mw_calcRatio. Otherwise it reuses
  * FT::mw_evaluateVGL (values and gradients are computed, only the value is consumed here),
  * stores the new value in each walker's cur_Uat and fills \p ratios with exp(Uat[iat] - cur_Uat).
  * Must be called on the leader of \p wfc_list.
  */
 template<typename FT>
 void TwoBodyJastrow<FT>::mw_calcRatio(const RefVectorWithLeader<WaveFunctionComponent>& wfc_list,
                                       const RefVectorWithLeader<ParticleSet>& p_list,
                                       int iat,
                                       std::vector<PsiValue>& ratios) const
 {
   if (!use_offload_)
   {
     WaveFunctionComponent::mw_calcRatio(wfc_list, p_list, iat, ratios);
     return;
   }

   // For now the FT::mw_evaluateVGL implementation is used directly.
   assert(this == &wfc_list.getLeader());
   auto& wfc_leader      = wfc_list.getCastedLeader<TwoBodyJastrow<FT>>();
   auto& p_leader        = p_list.getLeader();
   const auto& dt_leader = p_leader.getDistTableAA(my_table_ID_);
   const int num_walkers = wfc_list.size();
   auto& mw_mem          = wfc_leader.mw_mem_handle_.getResource();

   auto& vgl_results = mw_mem.mw_vgl;
   vgl_results.resize(num_walkers, DIM + 2);

   FT::mw_evaluateVGL(iat, NumGroups, F.data() + p_leader.GroupID[iat] * NumGroups, wfc_leader.N, grp_ids.data(),
                      num_walkers, vgl_results.data(), N_padded, dt_leader.getMultiWalkerTempDataPtr(),
                      mw_mem.mw_cur_allu.data(), mw_mem.mw_ratiograd_buffer);

   for (int iw = 0; iw < num_walkers; iw++)
   {
     auto& walker   = wfc_list.getCastedElement<TwoBodyJastrow<FT>>(iw);
     walker.cur_Uat = vgl_results[iw][0];
     ratios[iw]     = std::exp(static_cast<PsiValue>(walker.Uat[iat] - walker.cur_Uat));
   }
 }


 /** Ratios for moving every particle, one at a time, to the single proposed position held in the
  *  temporary distances of the AA table.
  *
  * For each group ig, sumU accumulates the pair values between the proposed position and all
  * particles (evaluateV is called with iat = -1, so nothing is excluded). The sum therefore contains
  * a spurious term for the moved particle itself, which is added back (Uself) before forming
  * ratios[i] = exp(Uat[i] + Uself - sumU).
  *
  * Group pairs without an assigned functor (nullptr entry in F, see checkSanity()) contribute
  * nothing to sumU; the same holds for the self-interaction term, which is taken as zero instead of
  * dereferencing a null functor.
  * @param P particle set holding the temporary distances
  * @param ratios output, indexed by particle
  */
 template<typename FT>
 void TwoBodyJastrow<FT>::evaluateRatiosAlltoOne(ParticleSet& P, std::vector<ValueType>& ratios)
 {
   const auto& d_table = P.getDistTableAA(my_table_ID_);
   const auto& dist    = d_table.getTempDists();

   for (int ig = 0; ig < NumGroups; ++ig)
   {
     const int igt = ig * NumGroups;
     valT sumU(0);
     for (int jg = 0; jg < NumGroups; ++jg)
       if (F[igt + jg])
       {
         const FuncType& f2(*F[igt + jg]);
         int iStart = P.first(jg);
         int iEnd   = P.last(jg);
         sumU += f2.evaluateV(-1, iStart, iEnd, dist.data(), DistCompressed.data());
       }

     // functor of the same-group pair; may be unassigned, in which case sumU holds no self term
     auto* const self_functor = F[igt + ig];
     for (int i = P.first(ig); i < P.last(ig); ++i)
     {
       // remove self-interaction
       const valT Uself = self_functor ? self_functor->evaluate(dist[i]) : valT(0);
       ratios[i]        = std::exp(Uat[i] + Uself - sumU);
     }
   }
 }

 /// Return the stored gradient contribution dUat of particle \p iat; \p P is unused.
 template<typename FT>
 typename TwoBodyJastrow<FT>::GradType TwoBodyJastrow<FT>::evalGrad(ParticleSet& P, int iat)
 {
   GradType stored_grad(dUat[iat]);
   return stored_grad;
 }

 /** Ratio and gradient for the proposed move of particle \p iat.
  *
  * Fills cur_u/cur_du/cur_d2u from the temporary distances, stores the new value in cur_Uat and the
  * difference in DiffVal, and sets UpdateMode to ORB_PBYP_PARTIAL.
  * @param grad_iat the gradient at the new position is added to this vector
  * @return exp(Uat[iat] - cur_Uat)
  */
 template<typename FT>
 typename TwoBodyJastrow<FT>::PsiValue TwoBodyJastrow<FT>::ratioGrad(ParticleSet& P, int iat, GradType& grad_iat)
 {
   UpdateMode = ORB_PBYP_PARTIAL;

   const auto& d_table = P.getDistTableAA(my_table_ID_);
   computeU3(P, iat, d_table.getTempDists(), cur_u.data(), cur_du.data(), cur_d2u.data());
   cur_Uat = simd::accumulate_n(cur_u.data(), N, valT());
   DiffVal = Uat[iat] - cur_Uat;
   grad_iat += accumulateG(cur_du.data(), d_table.getTempDispls());
   return std::exp(static_cast<PsiValue>(DiffVal));
 }

 /** Multi-walker ratio and gradient for the proposed move of particle \p iat.
  *
  * Without offload this forwards to WaveFunctionComponent::mw_ratioGrad. Otherwise FT::mw_evaluateVGL
  * fills mw_vgl with one row per walker: column 0 is the new value, columns 1..ndim the gradient.
  * Each walker's cur_Uat is updated, ratios[iw] = exp(Uat[iat] - cur_Uat) and the gradient is
  * added to grad_new[iw]. Must be called on the leader of \p wfc_list.
  */
 template<typename FT>
 void TwoBodyJastrow<FT>::mw_ratioGrad(const RefVectorWithLeader<WaveFunctionComponent>& wfc_list,
                                       const RefVectorWithLeader<ParticleSet>& p_list,
                                       int iat,
                                       std::vector<PsiValue>& ratios,
                                       std::vector<GradType>& grad_new) const
 {
   if (!use_offload_)
   {
     WaveFunctionComponent::mw_ratioGrad(wfc_list, p_list, iat, ratios, grad_new);
     return;
   }

   assert(this == &wfc_list.getLeader());
   auto& wfc_leader      = wfc_list.getCastedLeader<TwoBodyJastrow<FT>>();
   auto& p_leader        = p_list.getLeader();
   const auto& dt_leader = p_leader.getDistTableAA(my_table_ID_);
   const int num_walkers = wfc_list.size();
   auto& mw_mem          = wfc_leader.mw_mem_handle_.getResource();

   auto& vgl_results = mw_mem.mw_vgl;
   vgl_results.resize(num_walkers, DIM + 2);

   FT::mw_evaluateVGL(iat, NumGroups, F.data() + p_leader.GroupID[iat] * NumGroups, wfc_leader.N, grp_ids.data(),
                      num_walkers, vgl_results.data(), N_padded, dt_leader.getMultiWalkerTempDataPtr(),
                      mw_mem.mw_cur_allu.data(), mw_mem.mw_ratiograd_buffer);

   for (int iw = 0; iw < num_walkers; iw++)
   {
     auto& walker   = wfc_list.getCastedElement<TwoBodyJastrow<FT>>(iw);
     walker.cur_Uat = vgl_results[iw][0];
     ratios[iw]     = std::exp(static_cast<PsiValue>(walker.Uat[iat] - walker.cur_Uat));

     auto& walker_grad = grad_new[iw];
     for (int idim = 0; idim < ndim; idim++)
       walker_grad[idim] += vgl_results[iw][idim + 1];
   }
 }

 /** Commit the proposed move of particle \p iat: update Uat, dUat, d2Uat of all particles and log_value_.
  *
  * The pair terms at the old position are recomputed from the table's old distances. The terms at
  * the new position are taken from cur_u/cur_du/cur_d2u; they are computed here only when the move
  * was evaluated with ratio() (UpdateMode == ORB_PBYP_RATIO), which does not fill them.
  * cur_Uat is expected to hold the new value of particle iat as set by ratio()/ratioGrad().
  * @param P particle set providing the AA distance table
  * @param iat index of the moved particle
  * @param safe_to_delay unused
  */
 template<typename FT>
 void TwoBodyJastrow<FT>::acceptMove(ParticleSet& P, int iat, bool safe_to_delay)
 {
   // get the old u, du, d2u
   const auto& d_table = P.getDistTableAA(my_table_ID_);
   computeU3(P, iat, d_table.getOldDists(), old_u.data(), old_du.data(), old_d2u.data());
   if (UpdateMode == ORB_PBYP_RATIO)
   { //ratio-only during the move; need to compute derivatives
     const auto& dist = d_table.getTempDists();
     computeU3(P, iat, dist, cur_u.data(), cur_du.data(), cur_d2u.data());
   }

   // Value and Laplacian: apply the (new - old) change to every partner and accumulate the
   // Laplacian of the moved particle in cur_d2Uat.
   valT cur_d2Uat(0);
   const auto& new_dr = d_table.getTempDispls();
   const auto& old_dr = d_table.getOldDispls();
 #pragma omp simd reduction(+ : cur_d2Uat)
   for (int jat = 0; jat < N; jat++)
   {
     const valT du   = cur_u[jat] - old_u[jat];
     const valT newl = cur_d2u[jat] + lapfac * cur_du[jat];
     const valT dl   = old_d2u[jat] + lapfac * old_du[jat] - newl;
     Uat[jat] += du;
     d2Uat[jat] += dl;
     cur_d2Uat -= newl;
   }
   // Gradient, one dimension at a time: update the partners' gradients in place and accumulate
   // the gradient of the moved particle in cur_dUat.
   posT cur_dUat;
   for (int idim = 0; idim < ndim; ++idim)
   {
     const valT* restrict new_dX    = new_dr.data(idim);
     const valT* restrict old_dX    = old_dr.data(idim);
     const valT* restrict cur_du_pt = cur_du.data();
     const valT* restrict old_du_pt = old_du.data();
     valT* restrict save_g          = dUat.data(idim);
     valT cur_g                     = cur_dUat[idim];
 #pragma omp simd reduction(+ : cur_g) aligned(old_dX, new_dX, save_g, cur_du_pt, old_du_pt : QMC_SIMD_ALIGNMENT)
     for (int jat = 0; jat < N; jat++)
     {
       const valT newg = cur_du_pt[jat] * new_dX[jat];
       const valT dg   = newg - old_du_pt[jat] * old_dX[jat];
       save_g[jat] -= dg;
       cur_g += newg;
     }
     cur_dUat[idim] = cur_g;
   }
   // The entries of the moved particle were touched by the loops above; overwrite them with the
   // values accumulated for the new position. log_value_ must be updated before Uat[iat] is replaced.
   log_value_ += Uat[iat] - cur_Uat;
   Uat[iat]   = cur_Uat;
   dUat(iat)  = cur_dUat;
   d2Uat[iat] = cur_d2Uat;
 }

 /** Multi-walker accept/reject of the proposed move of particle \p iat.
  *
  * Without offload this forwards to WaveFunctionComponent::mw_accept_rejectMove. Otherwise
  * log_value_ of every walker is first advanced by Uat[iat] - mw_vgl[iw][0] (note: done for all
  * walkers, independent of \p isAccepted), then FT::mw_updateVGL is invoked with \p isAccepted to
  * update the shared Uat/dUat/d2Uat pool. Must be called on the leader of \p wfc_list.
  */
 template<typename FT>
 void TwoBodyJastrow<FT>::mw_accept_rejectMove(const RefVectorWithLeader<WaveFunctionComponent>& wfc_list,
                                               const RefVectorWithLeader<ParticleSet>& p_list,
                                               int iat,
                                               const std::vector<bool>& isAccepted,
                                               bool safe_to_delay) const
 {
   if (!use_offload_)
   {
     WaveFunctionComponent::mw_accept_rejectMove(wfc_list, p_list, iat, isAccepted, safe_to_delay);
     return;
   }

   assert(this == &wfc_list.getLeader());
   auto& wfc_leader      = wfc_list.getCastedLeader<TwoBodyJastrow<FT>>();
   auto& p_leader        = p_list.getLeader();
   const auto& dt_leader = p_leader.getDistTableAA(my_table_ID_);
   const int num_walkers = wfc_list.size();
   auto& mw_mem          = wfc_leader.mw_mem_handle_.getResource();
   auto& vgl_results     = mw_mem.mw_vgl;

   // must happen before mw_updateVGL below, which updates the pool the walkers' Uat refer to
   for (int iw = 0; iw < num_walkers; iw++)
   {
     auto& walker = wfc_list.getCastedElement<TwoBodyJastrow<FT>>(iw);
     walker.log_value_ += walker.Uat[iat] - vgl_results[iw][0];
   }

   // this call may go asynchronous, then need to wait at mw_calcRatio mw_ratioGrad and mw_completeUpdates
   FT::mw_updateVGL(iat, isAccepted, NumGroups, F.data() + p_leader.GroupID[iat] * NumGroups, wfc_leader.N,
                    grp_ids.data(), num_walkers, vgl_results.data(), N_padded, dt_leader.getMultiWalkerTempDataPtr(),
                    mw_mem.mw_allUat.data(), mw_mem.mw_cur_allu.data(), mw_mem.mw_update_buffer);
 }

 /** Rebuild Uat, dUat and d2Uat of all particles from the current AA distance table.
  *
  * Particles are visited in group order. For particle iat only the partners jat < iat are evaluated
  * (computeU3 with triangle = true); the pair contribution is then applied to iat directly and to
  * each partner jat in a second pass, so every pair is evaluated once.
  * @param P particle set providing the AA distance table
  */
 template<typename FT>
 void TwoBodyJastrow<FT>::recompute(const ParticleSet& P)
 {
   const auto& d_table = P.getDistTableAA(my_table_ID_);
   for (int ig = 0; ig < NumGroups; ++ig)
   {
     for (int iat = P.first(ig), last = P.last(ig); iat < last; ++iat)
     {
       computeU3(P, iat, d_table.getDistRow(iat), cur_u.data(), cur_du.data(), cur_d2u.data(), true);
       // entries of iat are assigned (not accumulated) here: contributions from partners jat < iat
       Uat[iat] = simd::accumulate_n(cur_u.data(), iat, valT());
       posT grad;
       valT lap(0);
       const valT* restrict u   = cur_u.data();
       const valT* restrict du  = cur_du.data();
       const valT* restrict d2u = cur_d2u.data();
       const auto& displ        = d_table.getDisplRow(iat);
 #pragma omp simd reduction(+ : lap) aligned(du, d2u : QMC_SIMD_ALIGNMENT)
       for (int jat = 0; jat < iat; ++jat)
         lap += d2u[jat] + lapfac * du[jat];
       for (int idim = 0; idim < ndim; ++idim)
       {
         const valT* restrict dX = displ.data(idim);
         valT s                  = valT();
 #pragma omp simd reduction(+ : s) aligned(du, dX : QMC_SIMD_ALIGNMENT)
         for (int jat = 0; jat < iat; ++jat)
           s += du[jat] * dX[jat];
         grad[idim] = s;
       }
       dUat(iat)  = grad;
       d2Uat[iat] = -lap;
 // add the contribution from the upper triangle
 // (the same pair terms are accumulated onto the partners jat < iat; the gradient enters with opposite sign)
 #pragma omp simd aligned(u, du, d2u : QMC_SIMD_ALIGNMENT)
       for (int jat = 0; jat < iat; jat++)
       {
         Uat[jat] += u[jat];
         d2Uat[jat] -= d2u[jat] + lapfac * du[jat];
       }
       for (int idim = 0; idim < ndim; ++idim)
       {
         valT* restrict save_g   = dUat.data(idim);
         const valT* restrict dX = displ.data(idim);
 #pragma omp simd aligned(save_g, du, dX : QMC_SIMD_ALIGNMENT)
         for (int jat = 0; jat < iat; jat++)
           save_g[jat] -= du[jat] * dX[jat];
       }
     }
   }
 }

 /** Multi-walker recompute.
  *
  * Without offload this forwards to WaveFunctionComponent::mw_recompute. Otherwise every walker
  * flagged in \p recompute is recomputed individually and mw_allUat.updateTo() is called once
  * afterwards. Must be called on the leader of \p wfc_list.
  */
 template<typename FT>
 void TwoBodyJastrow<FT>::mw_recompute(const RefVectorWithLeader<WaveFunctionComponent>& wfc_list,
                                       const RefVectorWithLeader<ParticleSet>& p_list,
                                       const std::vector<bool>& recompute) const
 {
   if (!use_offload_)
   {
     WaveFunctionComponent::mw_recompute(wfc_list, p_list, recompute);
     return;
   }

   auto& wfc_leader = wfc_list.getCastedLeader<TwoBodyJastrow<FT>>();
   assert(this == &wfc_leader);
   for (int iw = 0; iw < wfc_list.size(); iw++)
   {
     if (!recompute[iw])
       continue;
     wfc_list[iw].recompute(p_list[iw]);
   }
   auto& shared_uat_pool = wfc_leader.mw_mem_handle_.getResource().mw_allUat;
   shared_uat_pool.updateTo();
 }

 /** Recompute everything from scratch and return the log value.
  * @param P particle set
  * @param G gradients; this component's contribution is added
  * @param L Laplacians; this component's contribution is added
  * @return the new log_value_
  */
 template<typename FT>
 typename TwoBodyJastrow<FT>::LogValue TwoBodyJastrow<FT>::evaluateLog(const ParticleSet& P,
                                                                       ParticleSet::ParticleGradient& G,
                                                                       ParticleSet::ParticleLaplacian& L)
 {
   recompute(P);
   log_value_ = computeGL(G, L);
   return log_value_;
 }

 /** Multi-walker evaluateLog.
  *
  * Without offload this forwards to WaveFunctionComponent::mw_evaluateLog. Otherwise all walkers are
  * recomputed through mw_recompute() and each walker's log_value_ is set from computeGL() on its own
  * G/L. Must be called on the leader of \p wfc_list.
  */
 template<typename FT>
 void TwoBodyJastrow<FT>::mw_evaluateLog(const RefVectorWithLeader<WaveFunctionComponent>& wfc_list,
                                         const RefVectorWithLeader<ParticleSet>& p_list,
                                         const RefVector<ParticleSet::ParticleGradient>& G_list,
                                         const RefVector<ParticleSet::ParticleLaplacian>& L_list) const

 {
   if (!use_offload_)
   {
     WaveFunctionComponent::mw_evaluateLog(wfc_list, p_list, G_list, L_list);
     return;
   }

   assert(this == &wfc_list.getLeader());

   // every walker is recomputed
   const std::vector<bool> recompute_flags(wfc_list.size(), true);
   mw_recompute(wfc_list, p_list, recompute_flags);

   for (int iw = 0; iw < wfc_list.size(); iw++)
   {
     auto& walker      = wfc_list.getCastedElement<TwoBodyJastrow<FT>>(iw);
     walker.log_value_ = walker.computeGL(G_list[iw], L_list[iw]);
   }
 }


 /** Add the stored per-particle gradients and Laplacians to \p G and \p L and return the log value.
  * @param G gradients, dUat[iat] is added to G[iat]
  * @param L Laplacians, d2Uat[iat] is added to L[iat]
  * @return -0.5 times the sum of Uat over all N particles
  */
 template<typename FT>
 typename TwoBodyJastrow<FT>::QTFull::RealType TwoBodyJastrow<FT>::computeGL(ParticleSet::ParticleGradient& G,
                                                                             ParticleSet::ParticleLaplacian& L) const
 {
   for (int iat = 0; iat < N; ++iat)
   {
     G[iat] += dUat[iat];
     L[iat] += d2Uat[iat];
   }
   const auto uat_total = simd::accumulate_n(Uat.data(), N, QTFull::RealType());
   return -0.5 * uat_total;
 }

 /** Add this component's stored gradients/Laplacians to \p G / \p L and refresh log_value_.
  *
  * Nothing is recomputed here; \p P and \p fromscratch are unused.
  * @return the new log_value_
  */
 template<typename FT>
 WaveFunctionComponent::LogValue TwoBodyJastrow<FT>::evaluateGL(const ParticleSet& P,
                                                                ParticleSet::ParticleGradient& G,
                                                                ParticleSet::ParticleLaplacian& L,
                                                                bool fromscratch)
 {
   log_value_ = computeGL(G, L);
   return log_value_;
 }

 /** Multi-walker evaluateGL.
  *
  * Without offload this forwards to WaveFunctionComponent::mw_evaluateGL. Otherwise each walker's
  * log_value_ is set from computeGL() on its own G/L; \p p_list and \p fromscratch are not used on
  * this path. Must be called on the leader of \p wfc_list.
  */
 template<typename FT>
 void TwoBodyJastrow<FT>::mw_evaluateGL(const RefVectorWithLeader<WaveFunctionComponent>& wfc_list,
                                        const RefVectorWithLeader<ParticleSet>& p_list,
                                        const RefVector<ParticleSet::ParticleGradient>& G_list,
                                        const RefVector<ParticleSet::ParticleLaplacian>& L_list,
                                        bool fromscratch) const
 {
   if (!use_offload_)
   {
     WaveFunctionComponent::mw_evaluateGL(wfc_list, p_list, G_list, L_list, fromscratch);
     return;
   }

   assert(this == &wfc_list.getLeader());
   for (int iw = 0; iw < wfc_list.size(); iw++)
   {
     auto& walker      = wfc_list.getCastedElement<TwoBodyJastrow<FT>>(iw);
     walker.log_value_ = walker.computeGL(G_list[iw], L_list[iw]);
   }
 }

 /** Compute the Hessian contribution of the two-body Jastrow for every particle and rebuild log_value_.
  *
  * All pairs j < i are visited. For each pair the functor value and its first and second radial
  * derivatives are evaluated; the resulting tensor is subtracted from both grad_grad_psi[i] and
  * grad_grad_psi[j], and the pair value is subtracted from log_value_ (which is reset to zero first).
  *
  * Pairs whose group combination has no functor assigned (nullptr entry in F, see checkSanity())
  * contribute nothing and are skipped instead of dereferencing a null pointer.
  * @param P particle set providing the AA distance table and group IDs
  * @param grad_grad_psi output, set to zero and then accumulated per particle
  * @throws std::runtime_error if ndim < 3
  */
 template<typename FT>
 void TwoBodyJastrow<FT>::evaluateHessian(ParticleSet& P, HessVector& grad_grad_psi)
 {
   if (ndim < 3)
     throw std::runtime_error("double check! See 2d jastrow test.");
   log_value_ = 0.0;
   const auto& d_ee(P.getDistTableAA(my_table_ID_));
   valT dudr, d2udr2;

   Tensor<valT, DIM> ident;
   grad_grad_psi = 0.0;
   ident.diagonal(1.0);

   for (int i = 1; i < N; ++i)
   {
     const auto& dist  = d_ee.getDistRow(i);
     const auto& displ = d_ee.getDisplRow(i);
     auto ig           = P.GroupID[i];
     const int igt     = ig * NumGroups;
     for (int j = 0; j < i; ++j)
     {
       auto jg             = P.GroupID[j];
       auto* const functor = F[igt + jg];
       // no functor for this pair type: zero contribution
       if (functor == nullptr)
         continue;

       auto r    = dist[j];
       auto rinv = 1.0 / r;
       auto dr   = displ[j];
       auto uij  = functor->evaluate(r, dudr, d2udr2);
       log_value_ -= uij;
       auto hess = rinv * rinv * outerProduct(dr, dr) * (d2udr2 - dudr * rinv) + ident * dudr * rinv;
       grad_grad_psi[i] -= hess;
       grad_grad_psi[j] -= hess;
     }
   }
 }

 /** Parameter derivatives of log(psi) and of the local-energy related term.
  *
  * dlogpsi is filled by evaluateDerivativesWF(). dhpsioverpsi is updated only when at least one of
  * this component's variables that maps into \p active (myVars.where(k) >= 0) is flagged by
  * active.recompute(); in that case every mapped variable k gets
  * dhpsioverpsi[kk] = -0.5 * Sum(lapLogPsi[k]) - Dot(P.G, gradLogPsi[k]).
  * Nothing is done when this component has no variables.
  * @param P particle set; P.G is read
  * @param active the active optimizable variables
  * @param dlogpsi output, derivatives of log(psi)
  * @param dhpsioverpsi output, see above
  */
 template<typename FT>
 void TwoBodyJastrow<FT>::evaluateDerivatives(ParticleSet& P,
                                              const opt_variables_type& active,
                                              Vector<ValueType>& dlogpsi,
                                              Vector<ValueType>& dhpsioverpsi)
 {
   if (myVars.size() == 0)
     return;

   evaluateDerivativesWF(P, active, dlogpsi);

   // is any of our mapped variables flagged for recomputation?
   bool needs_recompute = false;
   for (int k = 0; k < myVars.size(); ++k)
   {
     const int kk = myVars.where(k);
     if (kk >= 0 && active.recompute(kk))
       needs_recompute = true;
   }
   if (!needs_recompute)
     return;

   for (int k = 0; k < myVars.size(); ++k)
   {
     const int kk = myVars.where(k);
     if (kk < 0)
       continue;
     dhpsioverpsi[kk] = -RealType(0.5) * ValueType(Sum(lapLogPsi[k])) - ValueType(Dot(P.G, gradLogPsi[k]));
   }
 }

 /** Accumulate the parameter derivatives of the log value and copy them into dlogpsi.
  *
  * Work is done only when at least one mapped variable is flagged by active.recompute().
  * In that case dLogPsi, gradLogPsi and lapLogPsi are rebuilt from the AA distance table and
  * dlogpsi[myVars.where(k)] receives dLogPsi[k] for every mapped variable k.
  */
 template<typename FT>
 void TwoBodyJastrow<FT>::evaluateDerivativesWF(ParticleSet& P,
                                                const opt_variables_type& active,
                                                Vector<ValueType>& dlogpsi)
 {
   if (myVars.size() == 0)
     return;

   resizeWFOptVectors();

   // Record which local variables are mapped into `active` and whether any of them needs recomputation.
   bool need_recompute(false);
   std::vector<bool> is_mapped(myVars.size(), false);
   for (int k = 0; k < myVars.size(); ++k)
   {
     const int loc = myVars.where(k);
     if (loc >= 0)
     {
       if (active.recompute(loc))
         need_recompute = true;
       is_mapped[k] = true;
     }
   }
   if (!need_recompute)
     return;

   /// per-functor switch: on when any variable inside the functor's OffSet range is mapped
   std::vector<bool> functor_on(F.size(), false);
   for (int ifn = 0; ifn < F.size(); ++ifn)
   {
     // a negative first offset means there is nothing to optimize for this functor
     if (OffSet[ifn].first < 0)
       continue;
     for (int v = OffSet[ifn].first; v < OffSet[ifn].second; ++v)
       if (is_mapped[v] == true)
       {
         functor_on[ifn] = true;
         break;
       }
   }

   // Reset all accumulators before summing over pairs.
   dLogPsi               = 0.0;
   const size_t num_vars = myVars.size();
   for (int p = 0; p < num_vars; ++p)
   {
     gradLogPsi[p] = 0.0;
     lapLogPsi[p]  = 0.0;
   }

   // Scratch storage handed to the functor; components [0], [1], [2] are read below.
   std::vector<TinyVector<RealType, 3>> derivs(num_vars);
   const auto& d_table = P.getDistTableAA(my_table_ID_);
   constexpr RealType cone(1);
   const size_t num_src    = d_table.sources();
   const size_t num_groups = P.groups();

   // Strictly lower triangle: each pair (iat, jat) with jat < iat is visited once.
   for (size_t iat = 1; iat < num_src; ++iat)
   {
     const size_t group_base = P.GroupID[iat] * num_groups;
     const auto& dist_row    = d_table.getDistRow(iat);
     const auto& displ_row   = d_table.getDisplRow(iat);
     for (size_t jat = 0; jat < iat; ++jat)
     {
       const size_t ptype = group_base + P.GroupID[jat];
       if (!functor_on[ptype])
         continue;

       std::fill(derivs.begin(), derivs.end(), 0.0);
       // The functor reports false when it has nothing to contribute for this distance.
       if (!F[ptype]->evaluateDerivatives(dist_row[jat], derivs))
         continue;

       RealType rinv(cone / dist_row[jat]);
       PosType dr(displ_row[jat]);
       if (ndim < 3)
         dr[2] = 0;

       // p runs over this functor's slice of the variable list, ip over the functor-local index.
       int ip = 0;
       for (int p = OffSet[ptype].first; p < OffSet[ptype].second; ++p, ++ip)
       {
         RealType dudr(rinv * derivs[ip][1]);
         RealType lap(derivs[ip][2] + lapfac * dudr);
         PosType gr(dudr * dr);
         dLogPsi[p] -= derivs[ip][0];
         gradLogPsi[p][iat] += gr;
         gradLogPsi[p][jat] -= gr;
         lapLogPsi[p][iat] -= lap;
         lapLogPsi[p][jat] -= lap;
       }
     }
   }

   // Publish the accumulated derivatives at the positions the active set assigns to them.
   for (int k = 0; k < myVars.size(); ++k)
   {
     const int loc = myVars.where(k);
     if (loc >= 0 && is_mapped[k])
       dlogpsi[loc] = dLogPsi[k];
   }
 }

 /** Evaluate ratios for the virtual moves in VP and accumulate their parameter derivatives.
  *
  * ratios is always filled through evaluateRatios(). dratios is only touched when at least one
  * mapped variable is flagged by optvars.recompute(); then, for every source particle other than
  * VP.refPtcl whose functor is switched on, the difference between the functor derivatives at the
  * reference distance and at each virtual-particle distance is added to dratios[j][p].
  */
 template<typename FT>
 void TwoBodyJastrow<FT>::evaluateDerivRatios(const VirtualParticleSet& VP,
                                              const opt_variables_type& optvars,
                                              std::vector<ValueType>& ratios,
                                              Matrix<ValueType>& dratios)
 {
   evaluateRatios(VP, ratios);
   if (myVars.size() == 0)
     return;

   // Record which local variables are mapped into `optvars` and whether any needs recomputation.
   bool need_recompute(false);
   std::vector<bool> is_mapped(myVars.size(), false);
   for (int k = 0; k < myVars.size(); ++k)
   {
     const int loc = myVars.where(k);
     if (loc >= 0)
     {
       if (optvars.recompute(loc))
         need_recompute = true;
       is_mapped[k] = true;
     }
   }
   if (!need_recompute)
     return;

   /// per-functor switch: on when any variable inside the functor's OffSet range is mapped
   std::vector<bool> functor_on(F.size(), false);
   for (int ifn = 0; ifn < F.size(); ++ifn)
   {
     // a negative first offset means there is nothing to optimize for this functor
     if (OffSet[ifn].first < 0)
       continue;
     for (int v = OffSet[ifn].first; v < OffSet[ifn].second; ++v)
       if (is_mapped[v] == true)
       {
         functor_on[ifn] = true;
         break;
       }
   }

   const size_t num_vars = myVars.size();
   std::vector<RealType> derivs_ref(num_vars);
   std::vector<RealType> derivs(num_vars);
   const auto& d_table  = VP.getDistTableAB(my_table_ID_);
   const size_t num_src = d_table.sources();
   const size_t num_vp  = VP.getTotalNum();
   const auto& ref_ps   = VP.getRefPS();

   for (size_t iat = 0; iat < num_src; ++iat)
   {
     // The reference particle does not pair with itself.
     if (iat == VP.refPtcl)
       continue;
     const size_t ptype = ref_ps.GroupID[iat] * ref_ps.groups() + ref_ps.GroupID[VP.refPtcl];
     if (!functor_on[ptype])
       continue;

     // The AA table is read with the larger particle index selecting the row.
     const auto& ref_table = ref_ps.getDistTableAA(my_table_ID_);
     const auto dist_ref =
         iat < VP.refPtcl ? ref_table.getDistRow(VP.refPtcl)[iat] : ref_table.getDistRow(iat)[VP.refPtcl];

     // Derivatives at the current (unmoved) position of the reference particle.
     std::fill(derivs_ref.begin(), derivs_ref.end(), 0.0);
     F[ptype]->evaluateDerivatives(dist_ref, derivs_ref);

     const auto& func_index = F[ptype]->myVars.Index;
     for (size_t jvp = 0; jvp < num_vp; ++jvp)
     {
       // Derivatives at the distance between virtual particle jvp and source iat.
       std::fill(derivs.begin(), derivs.end(), 0.0);
       F[ptype]->evaluateDerivatives(d_table.getDistRow(jvp)[iat], derivs);
       // p starts at the functor's first variable index and advances in step with ip.
       for (int ip = 0, p = func_index.front(); ip < func_index.size(); ++ip, ++p)
         dratios[jvp][p] += derivs_ref[ip] - derivs[ip];
     }
   }
 }

 // Explicit instantiations of TwoBodyJastrow for each functor type listed below, all using
 // QMCTraits::RealType; the member templates defined in this file are compiled for these types.
 template class TwoBodyJastrow<BsplineFunctor<QMCTraits::RealType>>;
 template class TwoBodyJastrow<PadeFunctor<QMCTraits::RealType>>;
 template class TwoBodyJastrow<UserFunctor<QMCTraits::RealType>>;
 template class TwoBodyJastrow<FakeFunctor<QMCTraits::RealType>>;
 } // namespace qmcplusplus
qmcplusplus::TwoBodyJastrow::checkSanity
void checkSanity() const override
Validate the internal consistency of the object.
Definition: TwoBodyJastrow.cpp:326

qmcplusplus::simd::accumulate_n
T2 accumulate_n(const T1 *restrict in, size_t n, T2 res)
Definition: algorithm.hpp:26

qmcplusplus::Sum
T Sum(const ParticleAttrib< T > &pa)
Definition: ParticleAttribOps.h:170

qmcplusplus::TinyVector
Fixed-size array.
Definition: OhmmsTinyMeta.h:30

qmcplusplus::Units::time::s
const real s
Definition: unit_conversion.h:47

optimize::VariableSet::recompute
bool recompute(int i) const
Definition: VariableSet.h:206

TwoBodyJastrow.h

qmcplusplus::ResourceCollection::addResource
size_t addResource(std::unique_ptr< Resource > &&res, bool noprint=false)
Definition: ResourceCollection.cpp:36

getAlignedSize
size_t getAlignedSize(size_t n)
return size in T's of allocated aligned memory
Definition: aligned_allocator.hpp:42

qmcplusplus::app_warning
std::ostream & app_warning()
Definition: OutputManager.h:69

qmcplusplus::ResourceCollection::takebackResource
void takebackResource(ResourceHandle< RS > &res_handle)
Definition: ResourceCollection.h:43

qmcplusplus::WaveFunctionComponent::my_name_
const std::string my_name_
Name of the object It is required to be different for objects of the same derived type like multiple ...
Definition: WaveFunctionComponent.h:99

qmcplusplus::VirtualParticleSet::getRefPS
const ParticleSet & getRefPS() const
ParticleSet this object refers to.
Definition: VirtualParticleSet.h:59

qmcplusplus::TwoBodyJastrow::mw_evaluateLog
void mw_evaluateLog(const RefVectorWithLeader< WaveFunctionComponent > &wfc_list, const RefVectorWithLeader< ParticleSet > &p_list, const RefVector< ParticleSet::ParticleGradient > &G_list, const RefVector< ParticleSet::ParticleLaplacian > &L_list) const override
evaluate from scratch the same type WaveFunctionComponent of multiple walkers
Definition: TwoBodyJastrow.cpp:746

qmcplusplus
helper functions for EinsplineSetBuilder
Definition: Configuration.h:43

qmcplusplus::TwoBodyJastrow::registerData
void registerData(ParticleSet &P, WFBufferType &buf) override
For particle-by-particle move.
Definition: TwoBodyJastrow.cpp:220

qmcplusplus::ParticleSet::getDistTableAA
const DistanceTableAA & getDistTableAA(int table_ID) const
get a distance table by table_ID and dynamic_cast to DistanceTableAA
Definition: ParticleSet.cpp:339

qmcplusplus::WaveFunctionComponent::mw_recompute
virtual void mw_recompute(const RefVectorWithLeader< WaveFunctionComponent > &wfc_list, const RefVectorWithLeader< ParticleSet > &p_list, const std::vector< bool > &recompute) const
Definition: WaveFunctionComponent.cpp:49

qmcplusplus::TwoBodyJastrowMultiWalkerMem::makeClone
std::unique_ptr< Resource > makeClone() const override
Definition: TwoBodyJastrow.cpp:47

qmcplusplus::DistanceTableAB::getDistRow
const DistRow & getDistRow(int iel) const
return a row of distances for a given target particle
Definition: DistanceTable.h:343

qmcplusplus::RefVectorWithLeader::getLeader
T & getLeader() const
Definition: RefVectorWithLeader.h:34

qmcplusplus::PooledMemory::forward
void forward(size_type n)
Definition: PooledMemory.h:162

qmcplusplus::TwoBodyJastrow::addFunc
void addFunc(int ia, int ib, std::unique_ptr< FT > j)
add functor for (ia,ib) pair
Definition: TwoBodyJastrow.cpp:352

OMPstd::fill_n
void fill_n(T *x, size_t count, const T &value)
Definition: OMPstd.hpp:21

SoaDistanceTableABOMPTarget.h

BLAS::czero
constexpr std::complex< float > czero
Definition: BLAS.hpp:51

qmcplusplus::TwoBodyJastrowMultiWalkerMem::mw_update_buffer
Vector< char, OffloadPinnedAllocator< char > > mw_update_buffer
Definition: TwoBodyJastrow.cpp:29

BLAS::cone
constexpr std::complex< float > cone
Definition: BLAS.hpp:50

qmcplusplus::VirtualParticleSet
A ParticleSet that handles virtual moves of a selected particle of a given physical ParticleSet Virtu...
Definition: VirtualParticleSet.h:39

qmcplusplus::ewaldref::DIM
Definition: EwaldRef.h:38

qmcplusplus::TwoBodyJastrow::evalGrad
GradType evalGrad(ParticleSet &P, int iat) override
return the current gradient for the iat-th particle
Definition: TwoBodyJastrow.cpp:526

qmcplusplus::VirtualParticleSet::getTotalNum
size_t getTotalNum() const
Definition: VirtualParticleSet.h:98

qmcplusplus::VirtualParticleSet::refPtcl
int refPtcl
Reference particle.
Definition: VirtualParticleSet.h:54

qmcplusplus::GradType
LatticeGaussianProduct::GradType GradType
Definition: LatticeGaussianProduct.cpp:21

qmcplusplus::VectorSoaContainer
SoA adaptor class for Vector<TinyVector<T,D> >
Definition: VectorSoaContainer.h:34

qmcplusplus::TwoBodyJastrow::extractOptimizableObjectRefs
void extractOptimizableObjectRefs(UniqueOptObjRefs &opt_obj_refs) override
extract underlying OptimizableObject references
Definition: TwoBodyJastrow.cpp:123

qmcplusplus::Vector
Definition: OhmmsVector.h:33

qmcplusplus::ParticleSet::first
int first(int igroup) const
return the first index of a group i
Definition: ParticleSet.h:514

qmcplusplus::Vector::free
void free()
free
Definition: OhmmsVector.h:196

qmcplusplus::DistanceTableAA::getTempDispls
const DisplRow & getTempDispls() const
return the temporary displacements when a move is proposed
Definition: DistanceTable.h:280

qmcplusplus::PooledMemory< FullPrecRealType >

qmcplusplus::Resource
Definition: Resource.h:20

qmcplusplus::TwoBodyJastrow::makeClone
std::unique_ptr< WaveFunctionComponent > makeClone(ParticleSet &tqp) const override
make clone
Definition: TwoBodyJastrow.cpp:386

qmcplusplus::ParticleAttrib
Attaches a unit to a Vector for IO.
Definition: ParticleAttrib.h:33

qmcplusplus::ParticleSet::L
ParticleLaplacian L
laplacians of the particles
Definition: ParticleSet.h:85

qmcplusplus::TwoBodyJastrow::ratioGrad
PsiValue ratioGrad(ParticleSet &P, int iat, GradType &grad_iat) override
evaluate the ratio of the new to old WaveFunctionComponent value and the new gradient ...
Definition: TwoBodyJastrow.cpp:532

qmcplusplus::DistanceTableAA::getTempDists
const DistRow & getTempDists() const
return the temporary distances when a move is proposed
Definition: DistanceTable.h:276

qmcplusplus::TwoBodyJastrow::resizeInternalStorage
void resizeInternalStorage()
initialize storage Uat,dUat, d2Uat
Definition: TwoBodyJastrow.cpp:335

qmcplusplus::TwoBodyJastrowMultiWalkerMem
Definition: TwoBodyJastrow.cpp:26

qmcplusplus::Vector::data
pointer data()
Definition: OhmmsVector.h:238

qmcplusplus::Dot
T Dot(const ParticleAttrib< TinyVector< T, D >> &pa, const ParticleAttrib< TinyVector< T, D >> &pb)
Definition: ParticleAttribOps.h:122

omptarget::min
T min(T a, T b)
Definition: OMPTargetMath.hpp:36

qmcplusplus::TwoBodyJastrow::releaseResource
void releaseResource(ResourceCollection &collection, const RefVectorWithLeader< WaveFunctionComponent > &wfc_list) const override
return a shared resource to a collection
Definition: TwoBodyJastrow.cpp:91

qmcplusplus::ParticleSet::GroupID
ParticleIndex GroupID
Species ID.
Definition: ParticleSet.h:77

qmcplusplus::WaveFunctionComponent::mw_evaluateGL
virtual void mw_evaluateGL(const RefVectorWithLeader< WaveFunctionComponent > &wfc_list, const RefVectorWithLeader< ParticleSet > &p_list, const RefVector< ParticleSet::ParticleGradient > &G_list, const RefVector< ParticleSet::ParticleLaplacian > &L_list, bool fromscratch) const
evaluate gradients and laplacian of the same type WaveFunctionComponent of multiple walkers ...
Definition: WaveFunctionComponent.cpp:186

qmcplusplus::TwoBodyJastrow::F
std::vector< FT * > F
Container for $F[ig \cdot NumGroups + jg]$. Treat every pointer as a reference.
Definition: TwoBodyJastrow.h:111

qmcplusplus::WaveFunctionComponent::LogValue
std::complex< QTFull::RealType > LogValue
Definition: WaveFunctionComponent.h:83

qmcplusplus::TwoBodyJastrow::evaluateDerivativesWF
void evaluateDerivativesWF(ParticleSet &P, const opt_variables_type &active, Vector< ValueType > &dlogpsi) override
Definition: TwoBodyJastrow.cpp:883

qmcplusplus::ParticleSet::getDistTableAB
const DistanceTableAB & getDistTableAB(int table_ID) const
get a distance table by table_ID and dynamic_cast to DistanceTableAB
Definition: ParticleSet.cpp:344

qmcplusplus::TwoBodyJastrow::computeGL
QTFull::RealType computeGL(ParticleSet::ParticleGradient &G, ParticleSet::ParticleLaplacian &L) const
compute G and L from internally stored data
Definition: TwoBodyJastrow.cpp:771

qmcplusplus::ParticleSet::groups
int groups() const
return the number of groups
Definition: ParticleSet.h:511

qmcplusplus::WaveFunctionComponent
An abstract class for a component of a many-body trial wave function.
Definition: WaveFunctionComponent.h:59

qmcplusplus::TwoBodyJastrow::accumulateG
posT accumulateG(const valT *restrict du, const DisplRow &displ) const
compute gradient
Definition: TwoBodyJastrow.cpp:275

qmcplusplus::ParticleSet
Specialized particle class for atomistic simulations.
Definition: ParticleSet.h:55

qmcplusplus::TwoBodyJastrow::TwoBodyJastrow
TwoBodyJastrow(const std::string &obj_name, ParticleSet &p, bool use_offload)
Definition: TwoBodyJastrow.cpp:292

qmcplusplus::TwoBodyJastrowMultiWalkerMem::transfer_buffer
Vector< char, OffloadPinnedAllocator< char > > transfer_buffer
Definition: TwoBodyJastrow.cpp:33

qmcplusplus::TwoBodyJastrow::recompute
void recompute(const ParticleSet &P) override
recompute internal data assuming distance table is fully ready
Definition: TwoBodyJastrow.cpp:669

qmcplusplus::TwoBodyJastrow::mw_evaluateRatios
void mw_evaluateRatios(const RefVectorWithLeader< WaveFunctionComponent > &wfc_list, const RefVectorWithLeader< const VirtualParticleSet > &vp_list, std::vector< std::vector< ValueType >> &ratios) const override
Definition: TwoBodyJastrow.cpp:177

qmcplusplus::Tensor
Tensor<T,D> class for D by D tensor.
Definition: OhmmsTinyMeta.h:32

qmcplusplus::TwoBodyJastrowMultiWalkerMem::mw_vgl
Matrix< T, OffloadPinnedAllocator< T > > mw_vgl
Definition: TwoBodyJastrow.cpp:37

qmcplusplus::outerProduct
Tensor< typename BinaryReturn< T1, T2, OpMultiply >::Type_t, D > outerProduct(const TinyVector< T1, D > &lhs, const TinyVector< T2, D > &rhs)
Definition: TinyVector.h:211

qmcplusplus::TwoBodyJastrow::updateBuffer
LogValue updateBuffer(ParticleSet &P, WFBufferType &buf, bool fromscratch=false) override
For particle-by-particle move.
Definition: TwoBodyJastrow.cpp:249

qmcplusplus::TwoBodyJastrow::createResource
void createResource(ResourceCollection &collection) const override
initialize a shared resource and hand it to a collection
Definition: TwoBodyJastrow.cpp:51

qmcplusplus::ParticleSet::G
ParticleGradient G
gradients of the particles
Definition: ParticleSet.h:83

qmcplusplus::RefVectorWithLeader::getCastedElement
CASTTYPE & getCastedElement(size_t i) const
Definition: RefVectorWithLeader.h:47

qmcplusplus::TwoBodyJastrow::mw_mem_handle_
ResourceHandle< TwoBodyJastrowMultiWalkerMem< RealType > > mw_mem_handle_
Definition: TwoBodyJastrow.h:124

qmcplusplus::TwoBodyJastrow::computeU
valT computeU(const ParticleSet &P, int iat, const DistRow &dist)
Definition: TwoBodyJastrow.cpp:259

optimize::VariableSet
class to handle a set of variables that can be modified during optimizations
Definition: VariableSet.h:49

qmcplusplus::TwoBodyJastrow::mw_evaluateGL
void mw_evaluateGL(const RefVectorWithLeader< WaveFunctionComponent > &wfc_list, const RefVectorWithLeader< ParticleSet > &p_list, const RefVector< ParticleSet::ParticleGradient > &G_list, const RefVector< ParticleSet::ParticleLaplacian > &L_list, bool fromscratch) const override
evaluate gradients and laplacian of the same type WaveFunctionComponent of multiple walkers ...
Definition: TwoBodyJastrow.cpp:792

qmcplusplus::TwoBodyJastrowMultiWalkerMem::mw_ratiograd_buffer
Vector< char, OffloadPinnedAllocator< char > > mw_ratiograd_buffer
Definition: TwoBodyJastrow.cpp:31

qmcplusplus::ResourceCollection
Definition: ResourceCollection.h:25

qmcplusplus::RealType
double RealType
Definition: test_min_oned.cpp:22

qmcplusplus::ParticleSet::last
int last(int igroup) const
return the last index of a group i
Definition: ParticleSet.h:517

qmcplusplus::exp
MakeReturn< UnaryNode< FnExp, typename CreateLeaf< Vector< T1, C1 > >::Leaf_t > >::Expression_t exp(const Vector< T1, C1 > &l)
Definition: OhmmsVectorOperators.h:80

qmcplusplus::WaveFunctionComponent::PsiValue
QTFull::ValueType PsiValue
Definition: WaveFunctionComponent.h:85

qmcplusplus::DistanceTableAA::getDistRow
const DistRow & getDistRow(int iel) const
return a row of distances for a given target particle
Definition: DistanceTable.h:268

qmcplusplus::TwoBodyJastrow::valT
typename FT::real_type valT
type of each component U, dU, d2U;
Definition: TwoBodyJastrow.h:62

qmcplusplus::TwoBodyJastrow::ratio
PsiValue ratio(ParticleSet &P, int iat) override
evaluate the ratio of the new to old WaveFunctionComponent value
Definition: TwoBodyJastrow.cpp:451

qmcplusplus::TwoBodyJastrow::evaluateDerivRatios
void evaluateDerivRatios(const VirtualParticleSet &VP, const opt_variables_type &optvars, std::vector< ValueType > &ratios, Matrix< ValueType > &dratios) override
Definition: TwoBodyJastrow.cpp:981

qmcplusplus::TwoBodyJastrow::~TwoBodyJastrow
~TwoBodyJastrow() override

qmcplusplus::VectorSoaContainer::data
T * data()
return the base
Definition: VectorSoaContainer.h:262

qmcplusplus::TwoBodyJastrow
Specialization for two-body Jastrow function using multiple functors.
Definition: TwoBodyJastrow.h:56

qmcplusplus::TwoBodyJastrow::mw_ratioGrad
void mw_ratioGrad(const RefVectorWithLeader< WaveFunctionComponent > &wfc_list, const RefVectorWithLeader< ParticleSet > &p_list, int iat, std::vector< PsiValue > &ratios, std::vector< GradType > &grad_new) const override
Definition: TwoBodyJastrow.cpp:544

qmcplusplus::Tensor::diagonal
void diagonal(const T &rhs)
Definition: Tensor.h:205

qmcplusplus::WaveFunctionComponent::log_value_
LogValue log_value_
Current $\log\phi$.
Definition: WaveFunctionComponent.h:106

qmcplusplus::TwoBodyJastrow::evaluateHessian
void evaluateHessian(ParticleSet &P, HessVector &grad_grad_psi) override
Definition: TwoBodyJastrow.cpp:813

qmcplusplus::TwoBodyJastrow::computeU3
void computeU3(const ParticleSet &P, int iat, const DistRow &dist, RealType *restrict u, RealType *restrict du, RealType *restrict d2u, bool triangle=false)
internal function to compute u, du and d2u
Definition: TwoBodyJastrow.cpp:422

qmcplusplus::PooledMemory::current
size_type current() const
Definition: PooledMemory.h:76

qmcplusplus::WaveFunctionComponent::mw_accept_rejectMove
virtual void mw_accept_rejectMove(const RefVectorWithLeader< WaveFunctionComponent > &wfc_list, const RefVectorWithLeader< ParticleSet > &p_list, int iat, const std::vector< bool > &isAccepted, bool safe_to_delay=false) const
moves of the iat-th particle on some walkers in a batch are accepted.
Definition: WaveFunctionComponent.cpp:157

qmcplusplus::RefVector
std::vector< std::reference_wrapper< T > > RefVector
Definition: template_types.hpp:32

qmcplusplus::WaveFunctionComponent::mw_evaluateLog
virtual void mw_evaluateLog(const RefVectorWithLeader< WaveFunctionComponent > &wfc_list, const RefVectorWithLeader< ParticleSet > &p_list, const RefVector< ParticleSet::ParticleGradient > &G_list, const RefVector< ParticleSet::ParticleLaplacian > &L_list) const
evaluate from scratch the same type WaveFunctionComponent of multiple walkers
Definition: WaveFunctionComponent.cpp:31

qmcplusplus::n
int n
Definition: test_cuBLAS_LU.cpp:216

RealType
QMCTraits::RealType RealType
Definition: qmcfinitesize.cpp:47

qmcplusplus::RefVectorWithLeader::getCastedLeader
CASTTYPE & getCastedLeader() const
Definition: RefVectorWithLeader.h:39

qmcplusplus::TinyVector::data
Type_t * data()
Definition: TinyVector.h:138

qmcplusplus::TwoBodyJastrow::grp_ids
Vector< int, OffloadPinnedAllocator< int > > grp_ids
the group_id of each particle
Definition: TwoBodyJastrow.h:92

qmcplusplus::TwoBodyJastrowMultiWalkerMem::mw_cur_allu
Vector< T, OffloadPinnedAllocator< T > > mw_cur_allu
memory pool for cur_u, cur_du, cur_d2u [3][Nw][N_padded]. 3 is for value, first and second derivative...
Definition: TwoBodyJastrow.cpp:41

qmcplusplus::WaveFunctionComponent::mw_ratioGrad
void mw_ratioGrad(const RefVectorWithLeader< WaveFunctionComponent > &wfc_list, const RefVectorWithLeader< ParticleSet > &p_list, int iat, std::vector< PsiValue > &ratios, TWFGrads< CT > &grad_new) const
Definition: WaveFunctionComponent.cpp:122

qmcplusplus::TwoBodyJastrow::acquireResource
void acquireResource(ResourceCollection &collection, const RefVectorWithLeader< WaveFunctionComponent > &wfc_list) const override
acquire a shared resource from a collection
Definition: TwoBodyJastrow.cpp:57

qmcplusplus::Matrix
Definition: OhmmsMatrix.h:27

qmcplusplus::UniqueOptObjRefs
Definition: OptimizableObject.h:98

qmcplusplus::TwoBodyJastrow::NumGroups
const size_t NumGroups
number of groups of the target particleset
Definition: TwoBodyJastrow.h:76

qmcplusplus::TwoBodyJastrow::evaluateGL
LogValue evaluateGL(const ParticleSet &P, ParticleSet::ParticleGradient &G, ParticleSet::ParticleLaplacian &L, bool fromscratch=false) override
compute G and L after the sweep
Definition: TwoBodyJastrow.cpp:783

qmcplusplus::TwoBodyJastrow::evaluateRatiosAlltoOne
void evaluateRatiosAlltoOne(ParticleSet &P, std::vector< ValueType > &ratios) override
Definition: TwoBodyJastrow.cpp:498

qmcplusplus::QMCTypes::RealType
Precision RealType
Definition: QMCTypes.h:37

ParticleAttribOps.h
Declaration of ParticleAttrib<T>

qmcplusplus::WaveFunctionComponent::mw_evaluateRatios
virtual void mw_evaluateRatios(const RefVectorWithLeader< WaveFunctionComponent > &wfc_list, const RefVectorWithLeader< const VirtualParticleSet > &vp_list, std::vector< std::vector< ValueType >> &ratios) const
evaluate ratios to evaluate the non-local PP multiple walkers
Definition: WaveFunctionComponent.cpp:250

qmcplusplus::TwoBodyJastrow::evaluateDerivatives
void evaluateDerivatives(ParticleSet &P, const opt_variables_type &active, Vector< ValueType > &dlogpsi, Vector< ValueType > &dhpsioverpsi) override
Definition: TwoBodyJastrow.cpp:847

qmcplusplus::TwoBodyJastrow::evaluateRatios
void evaluateRatios(const VirtualParticleSet &VP, std::vector< ValueType > &ratios) override
Definition: TwoBodyJastrow.cpp:169

qmcplusplus::VectorSoaContainer::free
void free()
free allocated memory and clear status variables
Definition: VectorSoaContainer.h:148

qmcplusplus::WaveFunctionComponent::HessVector
OrbitalSetTraits< ValueType >::HessVector HessVector
Definition: WaveFunctionComponent.h:80

qmcplusplus::ValueType
LatticeGaussianProduct::ValueType ValueType
Definition: LatticeGaussianProduct.cpp:20

qmcplusplus::TwoBodyJastrow::checkOutVariables
void checkOutVariables(const opt_variables_type &active) override
check out optimizable variables
Definition: TwoBodyJastrow.cpp:130

ResourceCollection.h

qmcplusplus::TwoBodyJastrow::mw_recompute
void mw_recompute(const RefVectorWithLeader< WaveFunctionComponent > &wfc_list, const RefVectorWithLeader< ParticleSet > &p_list, const std::vector< bool > &recompute) const override
Definition: TwoBodyJastrow.cpp:718

qmcplusplus::RefVectorWithLeader
Definition: RefVectorWithLeader.h:23

qmcplusplus::ResourceCollection::lendResource
ResourceHandle< RS > lendResource()
Definition: ResourceCollection.h:40

qmcplusplus::TwoBodyJastrowMultiWalkerMem::TwoBodyJastrowMultiWalkerMem
TwoBodyJastrowMultiWalkerMem()
Definition: TwoBodyJastrow.cpp:43

qmcplusplus::Units::force::N
const real N
Definition: unit_conversion.h:92

qmcplusplus::TwoBodyJastrowMultiWalkerMem::mw_vals
Vector< T, OffloadPinnedAllocator< T > > mw_vals
Definition: TwoBodyJastrow.cpp:35

qmcplusplus::WaveFunctionComponent::mw_calcRatio
virtual void mw_calcRatio(const RefVectorWithLeader< WaveFunctionComponent > &wfc_list, const RefVectorWithLeader< ParticleSet > &p_list, int iat, std::vector< PsiValue > &ratios) const
compute the ratio of the new to old WaveFunctionComponent value of multiple walkers ...
Definition: WaveFunctionComponent.cpp:104

qmcplusplus::TwoBodyJastrow::cur_Uat
valT cur_Uat
Definition: TwoBodyJastrow.h:103

qmcplusplus::TwoBodyJastrow::mw_accept_rejectMove
void mw_accept_rejectMove(const RefVectorWithLeader< WaveFunctionComponent > &wfc_list, const RefVectorWithLeader< ParticleSet > &p_list, int iat, const std::vector< bool > &isAccepted, bool safe_to_delay=false) const override
moves of the iat-th particle on some walkers in a batch are accepted.
Definition: TwoBodyJastrow.cpp:633

qmcplusplus::TwoBodyJastrow::KEcorr
RealType KEcorr
Correction.
Definition: TwoBodyJastrow.h:96

qmcplusplus::TwoBodyJastrow::FuncType
FT FuncType
alias FuncType
Definition: TwoBodyJastrow.h:60

algorithm.hpp
SIMD version of functions in algorithm.

qmcplusplus::PooledMemory::lendReference
T1 * lendReference(size_type n)
Definition: PooledMemory.h:154

qmcplusplus::UniqueOptObjRefs::push_back
void push_back(OptimizableObject &obj)
Definition: OptimizableObject.h:103

qmcplusplus::TwoBodyJastrow::N
const size_t N
number of particles
Definition: TwoBodyJastrow.h:74

qmcplusplus::TwoBodyJastrow::mw_calcRatio
void mw_calcRatio(const RefVectorWithLeader< WaveFunctionComponent > &wfc_list, const RefVectorWithLeader< ParticleSet > &p_list, int iat, std::vector< PsiValue > &ratios) const override
Definition: TwoBodyJastrow.cpp:460

qmcplusplus::TwoBodyJastrow::copyFromBuffer
void copyFromBuffer(ParticleSet &P, WFBufferType &buf) override
For particle-by-particle move.
Definition: TwoBodyJastrow.cpp:241

qmcplusplus::TwoBodyJastrowMultiWalkerMem::mw_allUat
Vector< T, OffloadPinnedAllocator< T > > mw_allUat
memory pool for Uat, dUat, d2Uat [Nw][N_padded] + [Nw][DIM][N_padded] + [Nw][N_padded] ...
Definition: TwoBodyJastrow.cpp:39

qmcplusplus::TwoBodyJastrowMultiWalkerMem::TwoBodyJastrowMultiWalkerMem
TwoBodyJastrowMultiWalkerMem(const TwoBodyJastrowMultiWalkerMem &)
Definition: TwoBodyJastrow.cpp:45

qmcplusplus::TwoBodyJastrow::acceptMove
void acceptMove(ParticleSet &P, int iat, bool safe_to_delay=false) override
a move for iat-th particle is accepted.
Definition: TwoBodyJastrow.cpp:583

qmcplusplus::PooledMemory::add
void add(std::complex< T1 > &x)
Definition: PooledMemory.h:113

qmcplusplus::TwoBodyJastrow::evaluateLog
LogValue evaluateLog(const ParticleSet &P, ParticleSet::ParticleGradient &G, ParticleSet::ParticleLaplacian &L) override
evaluate the value of the WaveFunctionComponent from scratch
Definition: TwoBodyJastrow.cpp:737