d4/d2a/a00632_source.html

 //////////////////////////////////////////////////////////////////////////////////////
 // This file is distributed under the University of Illinois/NCSA Open Source License.
 // See LICENSE file in top directory for details.
 //
 // Copyright (c) 2016 Jeongnim Kim and QMCPACK developers.
 //
 // File developed by:
 //
 // File created by: Jeongnim Kim, jeongnim.kim@intel.com, Intel Corp.
 //////////////////////////////////////////////////////////////////////////////////////


 #ifndef QMCPLUSPLUS_SOA_SPHERICAL_CARTESIAN_TENSOR_H
 #define QMCPLUSPLUS_SOA_SPHERICAL_CARTESIAN_TENSOR_H

 #include <stdexcept>
 #include <limits>
 #include "OhmmsSoA/VectorSoaContainer.h"
 #include "OhmmsPETE/Tensor.h"
 #include "OhmmsPETE/OhmmsArray.h"
 #include "OMPTarget/OffloadAlignedAllocators.hpp"

 namespace qmcplusplus
 {
 /** SoaSphericalTensor that evaluates the Real Spherical Harmonics
  *
  * The template parameter
  * - T, the value_type, e.g. double
  *
  * Positions are passed to the evaluate functions as separate x, y, z scalars of type T.
  *
  * Real Spherical Harmonics Ylm\f$=r^l S_l^m(x,y,z) \f$ is stored
  * in an array ordered as [0,-1 0 1,-2 -1 0 1 2, -Lmax,-Lmax+1,..., Lmax-1,Lmax]
  * where Lmax is the maximum angular momentum of a center.
  * All the data members, e.g, Ylm and pre-calculated factors,
  * can be accessed by index(l,m) which returns the
  * locator of the combination for l and m.
  */
 template<typename T>
 class SoaSphericalTensor
 {
 private:
   using OffloadVector  = Vector<T, OffloadPinnedAllocator<T>>;
   using OffloadArray2D = Array<T, 2, OffloadPinnedAllocator<T>>;
   using OffloadArray3D = Array<T, 3, OffloadPinnedAllocator<T>>;
   using OffloadArray4D = Array<T, 4, OffloadPinnedAllocator<T>>;
   ///maximum angular momentum for the center
   int Lmax;
   /// Normalization factors
   const std::shared_ptr<OffloadVector> norm_factor_ptr_;
   ///pre-evaluated factor \f$1/\sqrt{(l+m)\times(l+1-m)}\f$
   const std::shared_ptr<OffloadVector> factorLM_ptr_;
   ///pre-evaluated factor \f$\sqrt{(2l+1)/(4\pi)}\f$
   const std::shared_ptr<OffloadVector> factorL_ptr_;
   ///pre-evaluated factor \f$(2l+1)/(2l-1)\f$
   const std::shared_ptr<OffloadVector> factor2L_ptr_;
   /// norm_factor reference
   OffloadVector& norm_factor_;
   /// factorLM reference
   OffloadVector& factorLM_;
   /// factorL reference
   OffloadVector& factorL_;
   /// factor2L reference
   OffloadVector& factor2L_;
   ///composite
   VectorSoaContainer<T, 5> cYlm;

 public:
   explicit SoaSphericalTensor(const int l_max, bool addsign = false);

   SoaSphericalTensor(const SoaSphericalTensor& rhs) = default;

   ///compute Ylm for single position
   static void evaluate_bare(T x, T y, T z, T* Ylm, int lmax, const T* factorL, const T* factorLM);
   ///compute Ylm_vgl for single position
   static void evaluateVGL_impl(const T x,
                                const T y,
                                const T z,
                                T* restrict Ylm_vgl,
                                int lmax,
                                const T* factorL,
                                const T* factorLM,
                                const T* factor2L,
                                const T* normfactor,
                                size_t offset);

   ///compute Ylm
   inline void evaluateV(T x, T y, T z, T* Ylm) const
   {
     evaluate_bare(x, y, z, Ylm, Lmax, factorL_.data(), factorLM_.data());
     for (int i = 0, nl = cYlm.size(); i < nl; i++)
       Ylm[i] *= norm_factor_[i];
   }

   /**
    * @brief evaluate V for multiple electrons and multiple pbc images
    *
    * @param [in] xyz electron positions [Nelec, Npbc, 3(x,y,z)]
    * @param [out] Ylm Spherical tensor elements [Nelec, Npbc, Nlm]
   */
   inline void batched_evaluateV(const OffloadArray3D& xyz, OffloadArray3D& Ylm) const
   {
     const size_t nElec = xyz.size(0);
     const size_t Npbc  = xyz.size(1); // number of PBC images
     assert(xyz.size(2) == 3);

     assert(Ylm.size(0) == nElec);
     assert(Ylm.size(1) == Npbc);
     const size_t Nlm = Ylm.size(2);

     size_t nR = nElec * Npbc; // total number of positions to evaluate

     auto* xyz_ptr          = xyz.data();
     auto* Ylm_ptr          = Ylm.data();
     auto* factorLM__ptr    = factorLM_.data();
     auto* factorL__ptr     = factorL_.data();
     auto* norm_factor__ptr = norm_factor_.data();

     PRAGMA_OFFLOAD("omp target teams distribute parallel for \
                     map(to:factorLM__ptr[:Nlm], factorL__ptr[:Lmax+1], norm_factor__ptr[:Nlm]) \
                     map(to: xyz_ptr[:3*nR], Ylm_ptr[:Nlm*nR])")
     for (uint32_t ir = 0; ir < nR; ir++)
     {
       evaluate_bare(xyz_ptr[0 + 3 * ir], xyz_ptr[1 + 3 * ir], xyz_ptr[2 + 3 * ir], Ylm_ptr + (ir * Nlm), Lmax,
                     factorL__ptr, factorLM__ptr);
       for (int i = 0; i < Nlm; i++)
         Ylm_ptr[ir * Nlm + i] *= norm_factor__ptr[i];
     }
   }

   /**
    * @brief evaluate VGL for multiple electrons and multiple pbc images
    *
    * when offload is enabled, xyz is assumed to be up to date on the device before entering the function
    * Ylm_vgl will be up to date on the device (but not host) when this function exits
    *
    * @param [in] xyz electron positions [Nelec, Npbc, 3(x,y,z)]
    * @param [out] Ylm_vgl Spherical tensor elements [5(v, gx, gy, gz, lapl), Nelec, Npbc, Nlm]
   */
   inline void batched_evaluateVGL(const OffloadArray3D& xyz, OffloadArray4D& Ylm_vgl) const
   {
     const size_t nElec = xyz.size(0);
     const size_t Npbc  = xyz.size(1); // number of PBC images
     assert(xyz.size(2) == 3);

     assert(Ylm_vgl.size(0) == 5);
     assert(Ylm_vgl.size(1) == nElec);
     assert(Ylm_vgl.size(2) == Npbc);
     const size_t Nlm = Ylm_vgl.size(3);
     assert(norm_factor_.size() == Nlm);

     const size_t nR     = nElec * Npbc; // total number of positions to evaluate
     const size_t offset = Nlm * nR;     // stride for v/gx/gy/gz/l

     auto* xyz_ptr          = xyz.data();
     auto* Ylm_vgl_ptr      = Ylm_vgl.data();
     auto* factorLM__ptr    = factorLM_.data();
     auto* factorL__ptr     = factorL_.data();
     auto* factor2L__ptr    = factor2L_.data();
     auto* norm_factor__ptr = norm_factor_.data();

     PRAGMA_OFFLOAD("omp target teams distribute parallel for \
                     map(to:factorLM__ptr[:Nlm], factorL__ptr[:Lmax+1], norm_factor__ptr[:Nlm], factor2L__ptr[:Lmax+1]) \
                     map(to: xyz_ptr[:nR*3], Ylm_vgl_ptr[:5*nR*Nlm])")
     for (uint32_t ir = 0; ir < nR; ir++)
       evaluateVGL_impl(xyz_ptr[0 + 3 * ir], xyz_ptr[1 + 3 * ir], xyz_ptr[2 + 3 * ir], Ylm_vgl_ptr + (ir * Nlm), Lmax,
                        factorL__ptr, factorLM__ptr, factor2L__ptr, norm_factor__ptr, offset);
   }

   ///compute Ylm
   inline void evaluateV(T x, T y, T z)
   {
     T* restrict Ylm = cYlm.data(0);
     evaluate_bare(x, y, z, Ylm, Lmax, factorL_.data(), factorLM_.data());
     for (int i = 0, nl = cYlm.size(); i < nl; i++)
       Ylm[i] *= norm_factor_[i];
   }

   ///makes a table of \f$ r^l S_l^m \f$ and their gradients up to Lmax.
   void evaluateVGL(T x, T y, T z);

   ///makes a table of \f$ r^l S_l^m \f$ and their gradients up to Lmax.
   void evaluateVGH(T x, T y, T z);

   ///makes a table of \f$ r^l S_l^m \f$ and their gradients up to Lmax.
   void evaluateVGHGH(T x, T y, T z);

   ///returns the index/locator for (\f$l,m\f$) combo, \f$ l(l+1)+m \f$
   static inline int index(int l, int m) { return (l * (l + 1)) + m; }

   /** return the starting address of the component
    *
    * component=0(V), 1(dx), 2(dy), 3(dz), 4(Lap)
    */
   inline const T* operator[](size_t component) const { return cYlm.data(component); }

   inline size_t size() const { return cYlm.size(); }

   inline int lmax() const { return Lmax; }
 };

 /** constructor
  * @param l_max maximum angular momentum
  * @param addsign flag to determine what convention to use
  *
  * Evaluate all the constants and prefactors.
  * The spherical harmonics is defined as
  * \f[ Y_l^m (\theta,\phi) = \sqrt{\frac{(2l+1)(l-m)!}{4\pi(l+m)!}} P_l^m(\cos\theta)e^{im\phi}\f]
  * Note that the data member Ylm is a misnomer and should not be confused with "spherical harmonics"
  * \f$Y_l^m\f$.
  - When addsign == true, e.g., Gaussian packages
  \f{eqnarray*}
  S_l^m &=& (-1)^m \sqrt{2}\Re(Y_l^{|m|}), \;\;\;m > 0 \\
  &=& Y_l^0, \;\;\;m = 0 \\
  &=& (-1)^m \sqrt{2}\Im(Y_l^{|m|}),\;\;\;m < 0
  \f}
  - When addsign == false, e.g., SIESTA package,
  \f{eqnarray*}
  S_l^m &=& \sqrt{2}\Re(Y_l^{|m|}), \;\;\;m > 0 \\
  &=& Y_l^0, \;\;\;m = 0 \\
  &=&\sqrt{2}\Im(Y_l^{|m|}),\;\;\;m < 0
  \f}
  */
 template<typename T>
 inline SoaSphericalTensor<T>::SoaSphericalTensor(const int l_max, bool addsign)
     : Lmax(l_max),
       norm_factor_ptr_(std::make_shared<OffloadVector>()),
       factorLM_ptr_(std::make_shared<OffloadVector>()),
       factorL_ptr_(std::make_shared<OffloadVector>()),
       factor2L_ptr_(std::make_shared<OffloadVector>()),
       norm_factor_(*norm_factor_ptr_),
       factorLM_(*factorLM_ptr_),
       factorL_(*factorL_ptr_),
       factor2L_(*factor2L_ptr_)
 {
   constexpr T cone(1);
   // number of (l,m) combinations for l = 0..Lmax
   const int ntot = (Lmax + 1) * (Lmax + 1);
   cYlm.resize(ntot);

   // Normalization factors: 1 for m == 0 and +-sqrt(2) otherwise.
   // With addsign the factor for +-m carries (-1)^m, i.e. it is negative exactly for odd m.
   norm_factor_.resize(ntot, cone);
   const T sqrt2 = std::sqrt(2.0);
   for (int l = 0; l <= Lmax; l++)
   {
     norm_factor_[index(l, 0)] = cone;
     for (int m = 1; m <= l; m++)
     {
       const bool negate          = addsign && (m % 2 != 0);
       const T norm               = negate ? -sqrt2 : sqrt2;
       norm_factor_[index(l, m)]  = norm;
       norm_factor_[index(l, -m)] = norm;
     }
   }

   // Per-l and per-(l,m) factors. Entries for l == 0 (and for m == 0 in factorLM_) are not
   // assigned here; they keep whatever resize() leaves in them.
   factorL_.resize(Lmax + 1);
   factor2L_.resize(Lmax + 1);
   factorLM_.resize(ntot);
   // 16*atan(1) == 4*pi, so omega == 1/sqrt(4*pi)
   const T omega = 1.0 / std::sqrt(16.0 * std::atan(1.0));
   for (int l = 1; l <= Lmax; l++)
   {
     factorL_[l]  = std::sqrt(static_cast<T>(2 * l + 1)) * omega;
     factor2L_[l] = static_cast<T>(2 * l + 1) / static_cast<T>(2 * l - 1);
     for (int m = 1; m <= l; m++)
     {
       const T fac2            = 1.0 / std::sqrt(static_cast<T>((l + m) * (l + 1 - m)));
       factorLM_[index(l, m)]  = fac2;
       factorLM_[index(l, -m)] = fac2;
     }
   }

   // push the freshly built tables through updateTo() so the offload kernels see them
   norm_factor_.updateTo();
   factorLM_.updateTo();
   factorL_.updateTo();
   factor2L_.updateTo();
 }

 /** Un-normalized \f$ r^l S_l^m \f$ for one position.
  *
  * Works in three passes over Ylm, which is used as scratch space in between:
  *  1. seed the associated Legendre functions P_ll and P_l,l-1,
  *  2. fill the remaining P_lm by upward recurrence in l,
  *  3. scale by r^l and the pre-evaluated factors and attach cos(m phi) / sin(m phi).
  * The per-(l,m) normalization factors are NOT applied here; callers do that afterwards.
  *
  * @param x,y,z position
  * @param [out] Ylm receives (lmax+1)^2 values, addressed through index(l,m)
  * @param lmax maximum angular momentum
  * @param factorL per-l factors, read for l = 1..lmax
  * @param factorLM per-(l,m) factors, read at index(l,m) for m = 1..l
  */
 PRAGMA_OFFLOAD("omp declare target")
 template<typename T>
 inline void SoaSphericalTensor<T>::evaluate_bare(T x,
                                                  T y,
                                                  T z,
                                                  T* restrict Ylm,
                                                  int lmax,
                                                  const T* factorL,
                                                  const T* factorLM)
 {
   constexpr T zero(0);
   constexpr T one(1);
   const T pi_value     = 4.0 * std::atan(1.0);
   const T inv_sqrt_4pi = 1.0 / std::sqrt(4.0 * pi_value);
   constexpr T eps_sq   = std::numeric_limits<T>::epsilon() * std::numeric_limits<T>::epsilon();

   // Spherical angles of the input point. On (or numerically on) the z axis phi is undefined,
   // so a fixed direction is used there; the same branch also covers r == 0.
   T cos_phi, sin_phi, cos_theta;
   const T rho_sq = x * x + y * y;
   const T radius = std::sqrt(rho_sq + z * z);
   if (rho_sq < eps_sq)
   {
     cos_phi   = zero;
     sin_phi   = one;
     cos_theta = (z < zero) ? -one : one;
   }
   else
   {
     cos_theta = z / radius;
     // rounding can push the ratio slightly outside [-1, 1]
     if (cos_theta > one)
       cos_theta = one;
     if (cos_theta < -one)
       cos_theta = -one;
     const T inv_rho = one / std::sqrt(rho_sq);
     cos_phi         = x * inv_rho;
     sin_phi         = y * inv_rho;
   }
   const T sin_theta = std::sqrt(one - cos_theta * cos_theta);

   // Pass 1: P_ll and P_l,l-1 (conventions of J.D. Jackson, Classical Electrodynamics).
   Ylm[0]     = one;
   T diagonal = one;
   for (int l = 1; l <= lmax; l++)
   {
     const int odd = 2 * l - 1;
     diagonal *= -odd * sin_theta;
     Ylm[index(l, l)]     = diagonal;
     Ylm[index(l, l - 1)] = odd * cos_theta * Ylm[index(l - 1, l - 1)];
   }

   // Pass 2: remaining P_lm from the two entries below it in l.
   for (int m = 0; m < lmax - 1; m++)
     for (int l = m + 2; l <= lmax; l++)
     {
       const int odd       = 2 * l - 1;
       const int below     = index(l - 1, m);
       const int two_below = index(l - 2, m);
       Ylm[index(l, m)]    = (cos_theta * odd * Ylm[below] - (l + m - 1) * Ylm[two_below]) / (l - m);
     }

   // Pass 3: turn P_lm into r^l Y_lm.
   Ylm[0]   = inv_sqrt_4pi;
   T r_to_l = 1.0;
   for (int l = 1; l <= lmax; l++)
   {
     r_to_l *= radius;
     T scale = r_to_l * factorL[l];
     Ylm[index(l, 0)] *= scale;
     // cos(m phi) and sin(m phi) are advanced by the angle-addition formulas
     T cos_mphi = one;
     T sin_mphi = zero;
     for (int m = 1; m <= l; m++)
     {
       const T next_cos = cos_mphi * cos_phi - sin_mphi * sin_phi;
       sin_mphi         = sin_mphi * cos_phi + cos_mphi * sin_phi;
       cos_mphi         = next_cos;
       const int plus   = index(l, m);
       const int minus  = index(l, -m);
       scale *= factorLM[plus];
       const T radial = scale * Ylm[plus];
       Ylm[plus]      = radial * cos_mphi;
       Ylm[minus]     = radial * sin_mphi;
     }
   }
 }
 PRAGMA_OFFLOAD("omp end declare target")


 /** Value, gradient and laplacian of the normalized tensor for one position.
  *
  * The values are first computed un-normalized by evaluate_bare(); the gradient of each (l,m)
  * entry is then assembled from the un-normalized values of level l-1, and only at the very end
  * are the values themselves multiplied by normfactor. The laplacian component is set to zero.
  *
  * @param x,y,z position
  * @param [out] Ylm_vgl start of the value component; gx, gy, gz and the laplacian start at
  *                      Ylm_vgl + offset * 1, 2, 3 and 4 respectively
  * @param lmax maximum angular momentum; (lmax+1)^2 entries are written per component
  * @param factorL,factorLM factors forwarded to evaluate_bare()
  * @param factor2L per-l factors, read for l = 1..lmax
  * @param normfactor per-(l,m) normalization factors
  * @param offset distance, in elements, between consecutive components
  */
 PRAGMA_OFFLOAD("omp declare target")
 template<typename T>
 inline void SoaSphericalTensor<T>::evaluateVGL_impl(const T x,
                                                     const T y,
                                                     const T z,
                                                     T* restrict Ylm_vgl,
                                                     int lmax,
                                                     const T* factorL,
                                                     const T* factorLM,
                                                     const T* factor2L,
                                                     const T* normfactor,
                                                     size_t offset)
 {
   T* restrict Ylm = Ylm_vgl;
   evaluate_bare(x, y, z, Ylm, lmax, factorL, factorLM);
   const size_t Nlm = (lmax + 1) * (lmax + 1);

   constexpr T czero(0);
   constexpr T ahalf(0.5);
   T* restrict gYlmX = Ylm_vgl + offset * 1;
   T* restrict gYlmY = Ylm_vgl + offset * 2;
   T* restrict gYlmZ = Ylm_vgl + offset * 3;
   T* restrict lYlm  = Ylm_vgl + offset * 4; // just need to set to zero

   // l == 0 has no gradient
   gYlmX[0] = czero;
   gYlmY[0] = czero;
   gYlmZ[0] = czero;

   for (int l = 1; l <= lmax; l++)
   {
     const T fac = factor2L[l];
     // locator of (l-1, 0); every entry of level l-1 is addressed relative to it
     const int lower = index(l - 1, 0);
     for (int m = -l; m <= l; m++)
     {
       const int ma = std::abs(m);
       const T cp   = std::sqrt(fac * (l - ma - 1) * (l - ma));
       const T cm   = std::sqrt(fac * (l + ma - 1) * (l + ma));
       const T c0   = std::sqrt(fac * (l - ma) * (l + ma));

       // z derivative couples to (l-1, m), which only exists for |m| < l
       const T gz = (l > ma) ? c0 * Ylm[lower + m] : czero;

       // contribution from (l-1, |m|+1), which only exists for |m|+1 < l
       T dpr = czero;
       T dpi = czero;
       if (l > ma + 1)
       {
         dpr = cp * Ylm[lower + ma + 1];
         dpi = cp * Ylm[lower - ma - 1];
       }

       // contribution from (l-1, |m|-1)
       T dmr;
       T dmi;
       if (l > 1 && ma == 0)
       {
         dmr = -cm * Ylm[lower + 1];
         dmi = cm * Ylm[lower - 1];
       }
       else if (l > 1 && ma > 1)
       {
         dmr = cm * Ylm[lower + ma - 1];
         dmi = cm * Ylm[lower - ma + 1];
       }
       else
       {
         // l == 1, or |m| == 1: only the m == 0 entry of level l-1 contributes
         dmr = cm * Ylm[lower];
         dmi = czero;
       }

       T gx;
       T gy;
       if (m < 0)
       {
         gx = ahalf * (dpi - dmi);
         gy = -ahalf * (dpr + dmr);
       }
       else
       {
         gx = ahalf * (dpr - dmr);
         gy = ahalf * (dpi + dmi);
       }

       const int lm = index(l, m);
       if (ma)
       {
         gYlmX[lm] = normfactor[lm] * gx;
         gYlmY[lm] = normfactor[lm] * gy;
         gYlmZ[lm] = normfactor[lm] * gz;
       }
       else
       {
         // m == 0 entries are stored without the normalization factor
         gYlmX[lm] = gx;
         gYlmY[lm] = gy;
         gYlmZ[lm] = gz;
       }
     }
   }

   // The gradients above needed the un-normalized values, so the values are normalized last.
   for (size_t i = 0; i < Nlm; i++)
   {
     Ylm[i] *= normfactor[i];
     lYlm[i] = czero;
   }
 }
 PRAGMA_OFFLOAD("omp end declare target")

 /** Fill the internal 5-component storage with value, gradient and laplacian for one position.
  *
  * Delegates to evaluateVGL_impl(), using the container capacity as the distance between components.
  */
 template<typename T>
 inline void SoaSphericalTensor<T>::evaluateVGL(T x, T y, T z)
 {
   T* const vgl_base           = cYlm.data();
   const size_t component_step = cYlm.capacity();
   evaluateVGL_impl(x, y, z, vgl_base, Lmax, factorL_.data(), factorLM_.data(), factor2L_.data(), norm_factor_.data(),
                    component_step);
 }

 /** Placeholder for value/gradient/hessian evaluation.
  * @throws std::runtime_error always; the arguments are not used
  */
 template<typename T>
 inline void SoaSphericalTensor<T>::evaluateVGH(T x, T y, T z)
 {
   const char* const message = "SoaSphericalTensor<T>::evaluateVGH(x,y,z):  Not implemented\n";
   throw std::runtime_error(message);
 }

 /** Placeholder for value/gradient/hessian/gradient-of-hessian evaluation.
  * @throws std::runtime_error always; the arguments are not used
  */
 template<typename T>
 inline void SoaSphericalTensor<T>::evaluateVGHGH(T x, T y, T z)
 {
   const char* const message = "SoaSphericalTensor<T>::evaluateVGHGH(x,y,z):  Not implemented\n";
   throw std::runtime_error(message);
 }

 // Explicit instantiation declarations: translation units including this header do not
 // implicitly instantiate the float and double specializations. The matching explicit
 // instantiation definitions are not in this header and must be provided elsewhere.
 extern template class SoaSphericalTensor<float>;
 extern template class SoaSphericalTensor<double>;
 } // namespace qmcplusplus
 #endif
qmcplusplus::SoaSphericalTensor::norm_factor_
OffloadVector & norm_factor_
norm_factor reference
Definition: SoaSphericalTensor.h:58

qmcplusplus::SoaSphericalTensor::norm_factor_ptr_
const std::shared_ptr< OffloadVector > norm_factor_ptr_
Normalization factors.
Definition: SoaSphericalTensor.h:50

qmcplusplus
helper functions for EinsplineSetBuilder
Definition: Configuration.h:43

qmcplusplus::SoaSphericalTensor::SoaSphericalTensor
SoaSphericalTensor(const int l_max, bool addsign=false)
constructor
Definition: SoaSphericalTensor.h:225

qmcplusplus::SoaSphericalTensor::batched_evaluateVGL
void batched_evaluateVGL(const OffloadArray3D &xyz, OffloadArray4D &Ylm_vgl) const
evaluate VGL for multiple electrons and multiple pbc images
Definition: SoaSphericalTensor.h:140

qmcplusplus::SoaSphericalTensor::factor2L_ptr_
const std::shared_ptr< OffloadVector > factor2L_ptr_
pre-evaluated factor
Definition: SoaSphericalTensor.h:56

qmcplusplus::SoaSphericalTensor::evaluateV
void evaluateV(T x, T y, T z)
compute Ylm
Definition: SoaSphericalTensor.h:171

qmcplusplus::Ylm
std::complex< T > Ylm(int l, int m, const TinyVector< T, 3 > &r)
calculates Ylm param[in] l angular momentum param[in] m magnetic quantum number param[in] r position ...
Definition: Ylm.h:89

qmcplusplus::abs
MakeReturn< UnaryNode< FnFabs, typename CreateLeaf< Vector< T1, C1 > >::Leaf_t > >::Expression_t abs(const Vector< T1, C1 > &l)
Definition: OhmmsVectorOperators.h:88

OhmmsArray.h

qmcplusplus::SoaSphericalTensor::factorL_
OffloadVector & factorL_
factorL reference
Definition: SoaSphericalTensor.h:62

BLAS::czero
constexpr std::complex< float > czero
Definition: BLAS.hpp:51

pi
const double pi
Definition: Standard.h:56

Array::data
Type_t * data()
Definition: OhmmsArray.h:87

BLAS::cone
constexpr std::complex< float > cone
Definition: BLAS.hpp:50

VectorSoaContainer.h
Soa Container for D-dim vectors.

qmcplusplus::SoaSphericalTensor::operator[]
const T * operator[](size_t component) const
return the starting address of the component
Definition: SoaSphericalTensor.h:195

qmcplusplus::VectorSoaContainer< T, 5 >

qmcplusplus::Vector
Definition: OhmmsVector.h:33

qmcplusplus::SoaSphericalTensor::cYlm
VectorSoaContainer< T, 5 > cYlm
composite
Definition: SoaSphericalTensor.h:66

qmcplusplus::SoaSphericalTensor
SoaSphericalTensor that evaluates the Real Spherical Harmonics.
Definition: SoaSphericalTensor.h:40

qmcplusplus::SoaSphericalTensor::evaluateVGL
void evaluateVGL(T x, T y, T z)
makes a table of \f$ r^l S_l^m \f$ and their gradients up to Lmax.
Definition: SoaSphericalTensor.h:503

qmcplusplus::SoaSphericalTensor::evaluate_bare
static void evaluate_bare(T x, T y, T z, T *Ylm, int lmax, const T *factorL, const T *factorLM)
compute Ylm for single position
Definition: SoaSphericalTensor.h:288

qmcplusplus::Vector::data
pointer data()
Definition: OhmmsVector.h:238

qmcplusplus::SoaSphericalTensor::evaluateVGHGH
void evaluateVGHGH(T x, T y, T z)
makes a table of \f$ r^l S_l^m \f$ and their gradients up to Lmax.
Definition: SoaSphericalTensor.h:516

qmcplusplus::pow
MakeReturn< BinaryNode< FnPow, typename CreateLeaf< Vector< T1, C1 > >::Leaf_t, typename CreateLeaf< Vector< T2, C2 > >::Leaf_t > >::Expression_t pow(const Vector< T1, C1 > &l, const Vector< T2, C2 > &r)
Definition: OhmmsVectorOperators.h:316

qmcplusplus::Units::distance::m
const real m
Definition: unit_conversion.h:37

std

qmcplusplus::Vector::size
size_type size() const
return the current size
Definition: OhmmsVector.h:162

qmcplusplus::atan
MakeReturn< UnaryNode< FnArcTan, typename CreateLeaf< Vector< T1, C1 > >::Leaf_t > >::Expression_t atan(const Vector< T1, C1 > &l)
Definition: OhmmsVectorOperators.h:48

Array::size
size_t size() const
Definition: OhmmsArray.h:57

Ylm
std::complex< double > Ylm(int l, int m, const std::vector< double > &sph)
Definition: soecp_eval_reference.cpp:182

qmcplusplus::VectorSoaContainer::data
T * data()
return the base
Definition: VectorSoaContainer.h:262

qmcplusplus::SoaSphericalTensor::batched_evaluateV
void batched_evaluateV(const OffloadArray3D &xyz, OffloadArray3D &Ylm) const
evaluate V for multiple electrons and multiple pbc images
Definition: SoaSphericalTensor.h:101

Tensor.h

qmcplusplus::SoaSphericalTensor::evaluateV
void evaluateV(T x, T y, T z, T *Ylm) const
compute Ylm
Definition: SoaSphericalTensor.h:88

qmcplusplus::sqrt
MakeReturn< UnaryNode< FnSqrt, typename CreateLeaf< Vector< T1, C1 > >::Leaf_t > >::Expression_t sqrt(const Vector< T1, C1 > &l)
Definition: OhmmsVectorOperators.h:136

qmcplusplus::SoaSphericalTensor::size
size_t size() const
Definition: SoaSphericalTensor.h:197

qmcplusplus::SoaSphericalTensor::factorL_ptr_
const std::shared_ptr< OffloadVector > factorL_ptr_
pre-evaluated factor
Definition: SoaSphericalTensor.h:54

qmcplusplus::SoaSphericalTensor::evaluateVGH
void evaluateVGH(T x, T y, T z)
makes a table of \f$ r^l S_l^m \f$ and their gradients up to Lmax.
Definition: SoaSphericalTensor.h:510

OffloadAlignedAllocators.hpp

qmcplusplus::SoaSphericalTensor::Lmax
int Lmax
maximum angular momentum for the center
Definition: SoaSphericalTensor.h:48

qmcplusplus::SoaSphericalTensor::index
static int index(int l, int m)
returns the index/locator for (\f$l,m\f$) combo, \f$ l(l+1)+m \f$
Definition: SoaSphericalTensor.h:189

qmcplusplus::SoaSphericalTensor::lmax
int lmax() const
Definition: SoaSphericalTensor.h:199

Array
A D-dimensional Array class based on PETE.
Definition: OhmmsArray.h:25

qmcplusplus::VectorSoaContainer::size
size_type size() const
return the physical size
Definition: VectorSoaContainer.h:204

qmcplusplus::SoaSphericalTensor::evaluateVGL_impl
static void evaluateVGL_impl(const T x, const T y, const T z, T *restrict Ylm_vgl, int lmax, const T *factorL, const T *factorLM, const T *factor2L, const T *normfactor, size_t offset)
compute Ylm_vgl for single position
Definition: SoaSphericalTensor.h:392

qmcplusplus::SoaSphericalTensor::factor2L_
OffloadVector & factor2L_
factor2L reference
Definition: SoaSphericalTensor.h:64

qmcplusplus::SoaSphericalTensor::factorLM_ptr_
const std::shared_ptr< OffloadVector > factorLM_ptr_
pre-evaluated factor
Definition: SoaSphericalTensor.h:52

qmcplusplus::SoaSphericalTensor::factorLM_
OffloadVector & factorLM_
factorLM reference
Definition: SoaSphericalTensor.h:60