class to match std::complex<ST> spline with BsplineSet::ValueType (real) SPOs More...

Inheritance diagram for SplineC2R< ST >:

Collaboration diagram for SplineC2R< ST >:

Public Types
using	SplineType = typename bspline_traits< ST, 3 >::SplineType

using	BCType = typename bspline_traits< ST, 3 >::BCType

using	DataType = ST

using	PointType = TinyVector< ST, 3 >

using	SingleSplineType = UBspline_3d_d

using	TT = typename BsplineSet::ValueType

using	vContainer_type = Vector< ST, aligned_allocator< ST > >

using	gContainer_type = VectorSoaContainer< ST, 3 >

using	hContainer_type = VectorSoaContainer< ST, 6 >

using	ghContainer_type = VectorSoaContainer< ST, 10 >

Public Types inherited from SPOSet
using	ValueVector = OrbitalSetTraits< ValueType >::ValueVector

using	ValueMatrix = OrbitalSetTraits< ValueType >::ValueMatrix

using	GradVector = OrbitalSetTraits< ValueType >::GradVector

using	GradMatrix = OrbitalSetTraits< ValueType >::GradMatrix

using	HessVector = OrbitalSetTraits< ValueType >::HessVector

using	HessMatrix = OrbitalSetTraits< ValueType >::HessMatrix

using	GGGVector = OrbitalSetTraits< ValueType >::GradHessVector

using	GGGMatrix = OrbitalSetTraits< ValueType >::GradHessMatrix

using	SPOMap = std::map< std::string, const std::unique_ptr< const SPOSet > >

using	OffloadMWVGLArray = Array< ValueType, 3, OffloadPinnedAllocator< ValueType > >

using	OffloadMWVArray = Array< ValueType, 2, OffloadPinnedAllocator< ValueType > >

template<typename DT >
using	OffloadMatrix = Matrix< DT, OffloadPinnedAllocator< DT > >

Public Types inherited from QMCTraits
enum	{ DIM = OHMMS_DIM, DIM_VGL = OHMMS_DIM + 2 }

using	QTBase = QMCTypes< OHMMS_PRECISION, DIM >

using	QTFull = QMCTypes< OHMMS_PRECISION_FULL, DIM >

using	RealType = QTBase::RealType

using	ComplexType = QTBase::ComplexType

using	ValueType = QTBase::ValueType

using	PosType = QTBase::PosType

using	GradType = QTBase::GradType

using	TensorType = QTBase::TensorType

using	IndexType = OHMMS_INDEXTYPE
	define other types More...

using	FullPrecRealType = QTFull::RealType

using	FullPrecValueType = QTFull::ValueType

using	PropertySetType = RecordNamedProperty< FullPrecRealType >
	define PropertyList_t More...

using	PtclGrpIndexes = std::vector< std::pair< int, int > >

Public Member Functions
	SplineC2R (const std::string &my_name)

	SplineC2R (const SplineC2R &in)

virtual std::string	getClassName () const override
	return class name More...

virtual std::string	getKeyword () const override

bool	isComplex () const override

std::unique_ptr< SPOSet >	makeClone () const override
	Make a clone of itself. Every derived class must implement this for threading to work correctly. More...

void	resizeStorage (size_t n, size_t nvals)

void	bcast_tables (Communicate *comm)

void	gather_tables (Communicate *comm)

template<typename GT , typename BCT >
void	create_spline (GT &xyz_g, BCT &xyz_bc)

void	flush_zero ()

void	resize_kpoints ()
	remap kPoints to pack the double copy More...

void	set_spline (SingleSplineType spline_r, SingleSplineType spline_i, int twist, int ispline, int level)

bool	read_splines (hdf_archive &h5f)

bool	write_splines (hdf_archive &h5f)

void	assign_v (const PointType &r, const vContainer_type &myV, ValueVector &psi, int first, int last) const

void	evaluateValue (const ParticleSet &P, const int iat, ValueVector &psi) override
	evaluate the values of this single-particle orbital set More...

void	evaluateDetRatios (const VirtualParticleSet &VP, ValueVector &psi, const ValueVector &psiinv, std::vector< TT > &ratios) override

void	assign_vgl (const PointType &r, ValueVector &psi, GradVector &dpsi, ValueVector &d2psi, int first, int last) const
	assign_vgl More...

void	assign_vgl_from_l (const PointType &r, ValueVector &psi, GradVector &dpsi, ValueVector &d2psi)
	assign_vgl_from_l can be used when myL is precomputed and myV,myG,myL in cartesian More...

void	evaluateVGL (const ParticleSet &P, const int iat, ValueVector &psi, GradVector &dpsi, ValueVector &d2psi) override
	evaluate the values, gradients and laplacians of this single-particle orbital set More...

void	assign_vgh (const PointType &r, ValueVector &psi, GradVector &dpsi, HessVector &grad_grad_psi, int first, int last) const

void	evaluateVGH (const ParticleSet &P, const int iat, ValueVector &psi, GradVector &dpsi, HessVector &grad_grad_psi) override
	evaluate the values, gradients and hessians of this single-particle orbital set More...

void	assign_vghgh (const PointType &r, ValueVector &psi, GradVector &dpsi, HessVector &grad_grad_psi, GGGVector &grad_grad_grad_psi, int first=0, int last=-1) const

void	evaluateVGHGH (const ParticleSet &P, const int iat, ValueVector &psi, GradVector &dpsi, HessVector &grad_grad_psi, GGGVector &grad_grad_grad_psi) override
	evaluate the values, gradients, hessians, and grad hessians of this single-particle orbital set More...

Public Member Functions inherited from BsplineSet
	BsplineSet (const std::string &my_name)

auto &	getHalfG () const

void	init_base (int n)

int	remap_kpoints ()
	remap kpoints to group general kpoints & special kpoints More...

void	setOrbitalSetSize (int norbs) override
	set the OrbitalSetSize More...

void	evaluate_notranspose (const ParticleSet &P, int first, int last, ValueMatrix &logdet, GradMatrix &dlogdet, ValueMatrix &d2logdet) override
	evaluate the values, gradients and laplacians of this single-particle orbital for [first,last) particles More...

void	mw_evaluate_notranspose (const RefVectorWithLeader< SPOSet > &spo_list, const RefVectorWithLeader< ParticleSet > &P_list, int first, int last, const RefVector< ValueMatrix > &logdet_list, const RefVector< GradMatrix > &dlogdet_list, const RefVector< ValueMatrix > &d2logdet_list) const override

void	evaluate_notranspose (const ParticleSet &P, int first, int last, ValueMatrix &logdet, GradMatrix &dlogdet, HessMatrix &grad_grad_logdet) override
	evaluate the values, gradients and hessians of this single-particle orbital for [first,last) particles More...

void	evaluate_notranspose (const ParticleSet &P, int first, int last, ValueMatrix &logdet, GradMatrix &dlogdet, HessMatrix &grad_grad_logdet, GGGMatrix &grad_grad_grad_logdet) override
	evaluate the values, gradients, hessians and third derivatives of this single-particle orbital for [first,last) particles More...

void	evaluateGradSource (const ParticleSet &P, int first, int last, const ParticleSet &source, int iat_src, GradMatrix &gradphi) override
	evaluate the gradients of this single-particle orbital for [first,last) target particles with respect to the given source particle More...

void	evaluateGradSource (const ParticleSet &P, int first, int last, const ParticleSet &source, int iat_src, GradMatrix &grad_phi, HessMatrix &grad_grad_phi, GradMatrix &grad_lapl_phi) override
	evaluate the gradients of values, gradients, laplacians of this single-particle orbital for [first,last) target particles with respect to the given source particle More...

virtual void	evaluateDetRatios (const VirtualParticleSet &VP, ValueVector &psi, const ValueVector &psiinv, std::vector< ValueType > &ratios)
	evaluate determinant ratios for virtual moves, e.g., sphere move for nonlocalPP More...

virtual void	evaluateValue (const ParticleSet &P, int iat, ValueVector &psi)=0
	evaluate the values of this single-particle orbital set More...

virtual void	evaluateVGH (const ParticleSet &P, int iat, ValueVector &psi, GradVector &dpsi, HessVector &grad_grad_psi)
	evaluate the values, gradients and hessians of this single-particle orbital set More...

virtual void	evaluateVGHGH (const ParticleSet &P, int iat, ValueVector &psi, GradVector &dpsi, HessVector &grad_grad_psi, GGGVector &grad_grad_grad_psi)
	evaluate the values, gradients, hessians, and grad hessians of this single-particle orbital set More...

virtual void	evaluateVGL (const ParticleSet &P, int iat, ValueVector &psi, GradVector &dpsi, ValueVector &d2psi)=0
	evaluate the values, gradients and laplacians of this single-particle orbital set More...

virtual void	finalizeConstruction ()
	finalize the construction of SPOSet More...

virtual void	mw_evaluateDetRatios (const RefVectorWithLeader< SPOSet > &spo_list, const RefVectorWithLeader< const VirtualParticleSet > &vp_list, const RefVector< ValueVector > &psi_list, const std::vector< const ValueType * > &invRow_ptr_list, std::vector< std::vector< ValueType >> &ratios_list) const
	evaluate determinant ratios for virtual moves, e.g., sphere move for nonlocalPP, of multiple walkers More...

virtual void	mw_evaluateVGL (const RefVectorWithLeader< SPOSet > &spo_list, const RefVectorWithLeader< ParticleSet > &P_list, int iat, const RefVector< ValueVector > &psi_v_list, const RefVector< GradVector > &dpsi_v_list, const RefVector< ValueVector > &d2psi_v_list) const
	evaluate the values, gradients and laplacians of this single-particle orbital sets of multiple walkers More...

virtual void	mw_evaluateVGLandDetRatioGrads (const RefVectorWithLeader< SPOSet > &spo_list, const RefVectorWithLeader< ParticleSet > &P_list, int iat, const std::vector< const ValueType * > &invRow_ptr_list, OffloadMWVGLArray &phi_vgl_v, std::vector< ValueType > &ratios, std::vector< GradType > &grads) const
	evaluate the values, gradients and laplacians of this single-particle orbital sets and determinant ratio and grads of multiple walkers. More...

virtual void	acquireResource (ResourceCollection &collection, const RefVectorWithLeader< SPOSet > &spo_list) const
	acquire a shared resource from collection More...

virtual void	createResource (ResourceCollection &collection) const
	initialize a shared resource and hand it to collection More...

virtual void	releaseResource (ResourceCollection &collection, const RefVectorWithLeader< SPOSet > &spo_list) const
	return a shared resource to collection More...

Public Member Functions inherited from SPOSet
	SPOSet (const std::string &my_name)
	constructor More...

virtual	~SPOSet ()=default
	destructor More...

int	size () const
	return the size of the orbital set. Note (Ye): this needs to be replaced by getOrbitalSetSize(). More...

void	basic_report (const std::string &pad="") const
	print basic SPOSet information More...

virtual void	report (const std::string &pad="") const
	print SPOSet information More...

int	getOrbitalSetSize () const
	return the size of the orbitals More...

virtual bool	isOptimizable () const
	Query if this SPOSet is optimizable. More...

virtual void	extractOptimizableObjectRefs (UniqueOptObjRefs &opt_obj_refs)
	extract underlying OptimizableObject references More...

virtual void	checkOutVariables (const opt_variables_type &active)
	check out variational optimizable variables More...

virtual bool	isOMPoffload () const
	Query if this SPOSet uses OpenMP offload. More...

virtual bool	hasIonDerivs () const
	Query if this SPOSet has an explicit ion dependence. More...

virtual void	checkObject () const
	check a few key parameters before putting the SPO into a determinant More...

virtual bool	isRotationSupported () const
	return true if this SPOSet can be wrapped by RotatedSPO More...

virtual void	storeParamsBeforeRotation ()
	store parameters before getting destroyed by rotation. More...

virtual void	applyRotation (const ValueMatrix &rot_mat, bool use_stored_copy=false)
	apply rotation to all the orbitals More...

virtual void	evaluateDerivatives (ParticleSet &P, const opt_variables_type &optvars, Vector< ValueType > &dlogpsi, Vector< ValueType > &dhpsioverpsi, const int &FirstIndex, const int &LastIndex)
	Parameter derivatives of the wavefunction and the Laplacian of the wavefunction. More...

virtual void	evaluateDerivativesWF (ParticleSet &P, const opt_variables_type &optvars, Vector< ValueType > &dlogpsi, int FirstIndex, int LastIndex)
	Parameter derivatives of the wavefunction. More...

virtual void	evaluateDerivatives (ParticleSet &P, const opt_variables_type &optvars, Vector< ValueType > &dlogpsi, Vector< ValueType > &dhpsioverpsi, const ValueType &psiCurrent, const std::vector< ValueType > &Coeff, const std::vector< size_t > &C2node_up, const std::vector< size_t > &C2node_dn, const ValueVector &detValues_up, const ValueVector &detValues_dn, const GradMatrix &grads_up, const GradMatrix &grads_dn, const ValueMatrix &lapls_up, const ValueMatrix &lapls_dn, const ValueMatrix &M_up, const ValueMatrix &M_dn, const ValueMatrix &Minv_up, const ValueMatrix &Minv_dn, const GradMatrix &B_grad, const ValueMatrix &B_lapl, const std::vector< int > &detData_up, const size_t N1, const size_t N2, const size_t NP1, const size_t NP2, const std::vector< std::vector< int >> &lookup_tbl)
	Evaluate the derivative of the optimized orbitals with respect to the parameters. This is used only for MSD and is to be refined to better serve both single and multi SD. More...

virtual void	evaluateDerivativesWF (ParticleSet &P, const opt_variables_type &optvars, Vector< ValueType > &dlogpsi, const QTFull::ValueType &psiCurrent, const std::vector< ValueType > &Coeff, const std::vector< size_t > &C2node_up, const std::vector< size_t > &C2node_dn, const ValueVector &detValues_up, const ValueVector &detValues_dn, const ValueMatrix &M_up, const ValueMatrix &M_dn, const ValueMatrix &Minv_up, const ValueMatrix &Minv_dn, const std::vector< int > &detData_up, const std::vector< std::vector< int >> &lookup_tbl)
	Evaluate the derivative of the optimized orbitals with respect to the parameters. This is used only for MSD and is to be refined to better serve both single and multi SD. More...

virtual void	evaluateDetRatios (const VirtualParticleSet &VP, ValueVector &psi, const ValueVector &psiinv, std::vector< ValueType > &ratios)
	evaluate determinant ratios for virtual moves, e.g., sphere move for nonlocalPP More...

virtual void	evaluateDetSpinorRatios (const VirtualParticleSet &VP, ValueVector &psi, const std::pair< ValueVector, ValueVector > &spinor_multiplier, const ValueVector &invrow, std::vector< ValueType > &ratios)
	evaluate determinant ratios for virtual moves, specifically for Spinor SPOSets More...

virtual void	evaluateDerivRatios (const VirtualParticleSet &VP, const opt_variables_type &optvars, ValueVector &psi, const ValueVector &psiinv, std::vector< ValueType > &ratios, Matrix< ValueType > &dratios, int FirstIndex, int LastIndex)
	Determinant ratios and parameter derivatives of the wavefunction for virtual moves. More...

virtual void	mw_evaluateDetRatios (const RefVectorWithLeader< SPOSet > &spo_list, const RefVectorWithLeader< const VirtualParticleSet > &vp_list, const RefVector< ValueVector > &psi_list, const std::vector< const ValueType *> &invRow_ptr_list, std::vector< std::vector< ValueType >> &ratios_list) const
	evaluate determinant ratios for virtual moves, e.g., sphere move for nonlocalPP, of multiple walkers More...

virtual void	evaluateVGL_spin (const ParticleSet &P, int iat, ValueVector &psi, GradVector &dpsi, ValueVector &d2psi, ValueVector &dspin)
	evaluate the values, gradients and laplacians and spin gradient of this single-particle orbital set More...

virtual void	mw_evaluateValue (const RefVectorWithLeader< SPOSet > &spo_list, const RefVectorWithLeader< ParticleSet > &P_list, int iat, const RefVector< ValueVector > &psi_v_list) const
	evaluate the values this single-particle orbital sets of multiple walkers More...

virtual void	mw_evaluateVGL (const RefVectorWithLeader< SPOSet > &spo_list, const RefVectorWithLeader< ParticleSet > &P_list, int iat, const RefVector< ValueVector > &psi_v_list, const RefVector< GradVector > &dpsi_v_list, const RefVector< ValueVector > &d2psi_v_list) const
	evaluate the values, gradients and laplacians of this single-particle orbital sets of multiple walkers More...

virtual void	mw_evaluateVGLWithSpin (const RefVectorWithLeader< SPOSet > &spo_list, const RefVectorWithLeader< ParticleSet > &P_list, int iat, const RefVector< ValueVector > &psi_v_list, const RefVector< GradVector > &dpsi_v_list, const RefVector< ValueVector > &d2psi_v_list, OffloadMatrix< ComplexType > &mw_dspin) const
	evaluate the values, gradients and laplacians and spin gradient of this single-particle orbital sets of multiple walkers More...

virtual void	mw_evaluateVGLandDetRatioGrads (const RefVectorWithLeader< SPOSet > &spo_list, const RefVectorWithLeader< ParticleSet > &P_list, int iat, const std::vector< const ValueType *> &invRow_ptr_list, OffloadMWVGLArray &phi_vgl_v, std::vector< ValueType > &ratios, std::vector< GradType > &grads) const
	evaluate the values, gradients and laplacians of this single-particle orbital sets and determinant ratio and grads of multiple walkers. More...

virtual void	mw_evaluateVGLandDetRatioGradsWithSpin (const RefVectorWithLeader< SPOSet > &spo_list, const RefVectorWithLeader< ParticleSet > &P_list, int iat, const std::vector< const ValueType *> &invRow_ptr_list, OffloadMWVGLArray &phi_vgl_v, std::vector< ValueType > &ratios, std::vector< GradType > &grads, std::vector< ValueType > &spingrads) const
	evaluate the values, gradients and laplacians of this single-particle orbital sets and determinant ratio and grads of multiple walkers. More...

virtual void	evaluate_spin (const ParticleSet &P, int iat, ValueVector &psi, ValueVector &dpsi)
	evaluate the values of this single-particle orbital set More...

virtual void	evaluateThirdDeriv (const ParticleSet &P, int first, int last, GGGMatrix &grad_grad_grad_logdet)
	evaluate the third derivatives of this single-particle orbital set More...

virtual void	evaluate_notranspose_spin (const ParticleSet &P, int first, int last, ValueMatrix &logdet, GradMatrix &dlogdet, ValueMatrix &d2logdet, ValueMatrix &dspinlogdet)
	evaluate the values, gradients and laplacians of this single-particle orbital for [first,last) particles, including the spin gradient More...

virtual void	evaluateGradSourceRow (const ParticleSet &P, int iel, const ParticleSet &source, int iat_src, GradVector &gradphi)
	Returns a row of d/dR_iat phi_j(r) evaluated at position r. More...

virtual PosType	get_k (int orb)
	access the k point related to the given orbital More...

virtual void	createResource (ResourceCollection &collection) const
	initialize a shared resource and hand it to collection More...

virtual void	acquireResource (ResourceCollection &collection, const RefVectorWithLeader< SPOSet > &spo_list) const
	acquire a shared resource from collection More...

virtual void	releaseResource (ResourceCollection &collection, const RefVectorWithLeader< SPOSet > &spo_list) const
	return a shared resource to collection More...

virtual bool	transformSPOSet ()
	Used only by cusp correction in AOS LCAO. More...

virtual void	finalizeConstruction ()
	finalize the construction of SPOSet More...

const std::string &	getName () const
	return object name More...

Protected Attributes
vContainer_type	myV
	intermediate result vectors More...

vContainer_type	myL

gContainer_type	myG

hContainer_type	myH

ghContainer_type	mygH

Protected Attributes inherited from BsplineSet
size_t	MyIndex
	Index of this adoptor, when multiple adoptors are used for NUMA or distributed cases. More...

size_t	first_spo
	first index of the SPOs this Spline handles More...

size_t	last_spo
	last index of the SPOs this Spline handles More...

TinyVector< int, D >	HalfG
	sign bits at the G/2 boundaries More...

std::vector< bool >	MakeTwoCopies
	flags to unpack sin/cos More...

std::vector< SPOSet::PosType >	kPoints
	kpoints for each unique orbitals. More...

aligned_vector< int >	BandIndexMap
	remap splines to orbitals More...

std::vector< int >	offset
	band offsets used for communication More...

Protected Attributes inherited from SPOSet
const std::string	my_name_
	name of the object, unique identifier More...

IndexType	OrbitalSetSize
	number of Single-particle orbitals More...

opt_variables_type	myVars
	Optimizable variables. More...

Private Attributes
CrystalLattice< ST, 3 >	PrimLattice
	primitive cell More...

Tensor< ST, 3 >	GGt
	\f$GGt = G^t G\f$, transformation for tensor in LatticeUnit to CartesianUnit, e.g. Hessian More...

int	nComplexBands
	number of complex bands More...

std::shared_ptr< MultiBspline< ST > >	SplineInst
	multi bspline set More...

vContainer_type	mKK

VectorSoaContainer< ST, 3 >	myKcart

Matrix< TT >	ratios_private
	thread private ratios for reduction when using nested threading, numVP x numThread More...

Friends
template<class BSPLINESPO >
class	SplineSetReader

struct	BsplineReader

Additional Inherited Members
Static Protected Attributes inherited from BsplineSet
static const int	D = DIM

Detailed Description

template<typename ST>
class qmcplusplus::SplineC2R< ST >

class to match std::complex<ST> spline with BsplineSet::ValueType (real) SPOs

Template Parameters

ST	precision of spline

Requires temporary storage and multiplication of phase vectors. The internal storage of complex spline coefficients uses double sized real arrays of ST type, aligned and padded. The first nComplexBands complex splines produce 2 real orbitals. The remaining complex splines produce 1 real orbital each. All the output orbitals are real (C2R). The maximal number of output orbitals is OrbitalSetSize.

Definition at line 42 of file SplineC2R.h.

Member Typedef Documentation

◆ BCType

using BCType = typename bspline_traits<ST, 3>::BCType

Definition at line 46 of file SplineC2R.h.

◆ DataType

using DataType = ST

Definition at line 47 of file SplineC2R.h.

◆ gContainer_type

using gContainer_type = VectorSoaContainer<ST, 3>

Definition at line 58 of file SplineC2R.h.

◆ ghContainer_type

using ghContainer_type = VectorSoaContainer<ST, 10>

Definition at line 60 of file SplineC2R.h.

◆ hContainer_type

using hContainer_type = VectorSoaContainer<ST, 6>

Definition at line 59 of file SplineC2R.h.

◆ PointType

using PointType = TinyVector<ST, 3>

Definition at line 48 of file SplineC2R.h.

◆ SingleSplineType

using SingleSplineType = UBspline_3d_d

Definition at line 49 of file SplineC2R.h.

◆ SplineType

using SplineType = typename bspline_traits<ST, 3>::SplineType

Definition at line 45 of file SplineC2R.h.

◆ TT

using TT = typename BsplineSet::ValueType

Definition at line 51 of file SplineC2R.h.

◆ vContainer_type

using vContainer_type = Vector<ST, aligned_allocator<ST> >

Definition at line 57 of file SplineC2R.h.

Constructor & Destructor Documentation

◆ SplineC2R() [1/2]

SplineC2R ( const std::string & my_name )

inline

Definition at line 87 of file SplineC2R.h.

87 : BsplineSet(my_name), nComplexBands(0) {}

qmcplusplus::BsplineSet::BsplineSet

BsplineSet(const std::string &my_name)

Definition: BsplineSet.h:59

qmcplusplus::SplineC2R::nComplexBands

int nComplexBands

number of complex bands

Definition: SplineC2R.h:68

◆ SplineC2R() [2/2]

SplineC2R ( const SplineC2R< ST > & in )

default

Member Function Documentation

◆ assign_v()

void assign_v	(	const PointType &	r,
		const vContainer_type &	myV,
		ValueVector &	psi,
		int	first,
		int	last
	)		const

inline

Definition at line 59 of file SplineC2R.cpp.

References TinyVector< T, D >::data(), omptarget::min(), qmcplusplus::Units::time::s, and qmcplusplus::sincos().

 {
   // protect last
   last = last > kPoints.size() ? kPoints.size() : last;
 
   const ST x = r[0], y = r[1], z = r[2];
   const ST* restrict kx = myKcart.data(0);
   const ST* restrict ky = myKcart.data(1);
   const ST* restrict kz = myKcart.data(2);
 
   TT* restrict psi_s              = psi.data() + first_spo;
   const size_t requested_orb_size = psi.size();
 #pragma omp simd
   for (size_t j = first; j < std::min(nComplexBands, last); j++)
   {
     ST s, c;
     const size_t jr = j << 1;
     const size_t ji = jr + 1;
     const ST val_r  = myV[jr];
     const ST val_i  = myV[ji];
     qmcplusplus::sincos(-(x * kx[j] + y * ky[j] + z * kz[j]), &s, &c);
     if (jr < requested_orb_size)
       psi_s[jr] = val_r * c - val_i * s;
     if (ji < requested_orb_size)
       psi_s[ji] = val_i * c + val_r * s;
   }
 
   psi_s += nComplexBands;
 #pragma omp simd
   for (size_t j = std::max(nComplexBands, first); j < last; j++)
   {
     ST s, c;
     const ST val_r = myV[2 * j];
     const ST val_i = myV[2 * j + 1];
     qmcplusplus::sincos(-(x * kx[j] + y * ky[j] + z * kz[j]), &s, &c);
     if (j + nComplexBands < requested_orb_size)
       psi_s[j] = val_r * c - val_i * s;
   }
 }

◆ assign_vgh()

void assign_vgh	(	const PointType &	r,
		ValueVector &	psi,
		GradVector &	dpsi,
		HessVector &	grad_grad_psi,
		int	first,
		int	last
	)		const

Definition at line 465 of file SplineC2R.cpp.

References TinyVector< T, D >::data(), omptarget::min(), qmcplusplus::Units::time::s, qmcplusplus::sincos(), and qmcplusplus::v_m_v().

 {
   // Combine the per-spline values (myV), gradients (myG) and Hessians (myH)
   // with the phase of each k-point, and store real-valued orbital values,
   // gradients and Hessians in psi, dpsi and grad_grad_psi for spline indices
   // [first, last). myV/myG/myH are only read here. Writes are skipped for any
   // output index >= psi.size().
 
   // protect last: clamp to the number of k-points (a negative `last` is
   // converted to a large unsigned value by the comparison and clamps as well)
   last = last > kPoints.size() ? kPoints.size() : last;
 
   // the nine entries of PrimLattice.G, named g<row><col>
   const ST g00 = PrimLattice.G(0), g01 = PrimLattice.G(1), g02 = PrimLattice.G(2), g10 = PrimLattice.G(3),
            g11 = PrimLattice.G(4), g12 = PrimLattice.G(5), g20 = PrimLattice.G(6), g21 = PrimLattice.G(7),
            g22 = PrimLattice.G(8);
   const ST x = r[0], y = r[1], z = r[2];
 
   // the three components of myKcart, indexed by spline index j
   const ST* restrict k0 = myKcart.data(0);
   const ST* restrict k1 = myKcart.data(1);
   const ST* restrict k2 = myKcart.data(2);
 
   // gradient (3 components) and Hessian (6 components: 00,01,02,11,12,22)
   // arrays; real part of spline j is at index 2*j, imaginary part at 2*j+1
   const ST* restrict g0  = myG.data(0);
   const ST* restrict g1  = myG.data(1);
   const ST* restrict g2  = myG.data(2);
   const ST* restrict h00 = myH.data(0);
   const ST* restrict h01 = myH.data(1);
   const ST* restrict h02 = myH.data(2);
   const ST* restrict h11 = myH.data(3);
   const ST* restrict h12 = myH.data(4);
   const ST* restrict h22 = myH.data(5);
 
   const size_t requested_orb_size = psi.size();
   // First group: splines j < nComplexBands, each producing two real orbitals
   // at output indices first_spo + 2*j and first_spo + 2*j + 1.
 #pragma omp simd
   for (size_t j = first; j < std::min(nComplexBands, last); j++)
   {
     int jr = j << 1;
     int ji = jr + 1;
 
     const ST kX    = k0[j];
     const ST kY    = k1[j];
     const ST kZ    = k2[j];
     const ST val_r = myV[jr];
     const ST val_i = myV[ji];
 
     //phase: s = sin(-k.r), c = cos(-k.r)
     ST s, c;
     qmcplusplus::sincos(-(x * kX + y * kY + z * kZ), &s, &c);
 
     //dot(PrimLattice.G,myG[j])
     const ST dX_r = g00 * g0[jr] + g01 * g1[jr] + g02 * g2[jr];
     const ST dY_r = g10 * g0[jr] + g11 * g1[jr] + g12 * g2[jr];
     const ST dZ_r = g20 * g0[jr] + g21 * g1[jr] + g22 * g2[jr];
 
     const ST dX_i = g00 * g0[ji] + g01 * g1[ji] + g02 * g2[ji];
     const ST dY_i = g10 * g0[ji] + g11 * g1[ji] + g12 * g2[ji];
     const ST dZ_i = g20 * g0[ji] + g21 * g1[ji] + g22 * g2[ji];
 
     // \f$\nabla \psi_r + {\bf k}\psi_i\f$
     const ST gX_r = dX_r + val_i * kX;
     const ST gY_r = dY_r + val_i * kY;
     const ST gZ_r = dZ_r + val_i * kZ;
     const ST gX_i = dX_i - val_r * kX;
     const ST gY_i = dY_i - val_r * kY;
     const ST gZ_i = dZ_i - val_r * kZ;
 
     // value and gradient outputs; each of the two slots is guarded separately
     const size_t psiIndex = first_spo + jr;
     if (psiIndex < requested_orb_size)
     {
       psi[psiIndex]     = c * val_r - s * val_i;
       dpsi[psiIndex][0] = c * gX_r - s * gX_i;
       dpsi[psiIndex][1] = c * gY_r - s * gY_i;
       dpsi[psiIndex][2] = c * gZ_r - s * gZ_i;
     }
     if (psiIndex + 1 < requested_orb_size)
     {
       psi[psiIndex + 1]     = c * val_i + s * val_r;
       dpsi[psiIndex + 1][0] = c * gX_i + s * gX_r;
       dpsi[psiIndex + 1][1] = c * gY_i + s * gY_r;
       dpsi[psiIndex + 1][2] = c * gZ_i + s * gZ_r;
     }
 
     // Real parts of the nine Hessian entries: a v_m_v term built from the six
     // stored Hessian components and two rows of G, plus a k-dependent term.
     // NOTE(review): v_m_v presumably evaluates (G row a)^T * H * (G row b) for
     // the symmetric H -- confirm against its definition.
     // These are computed unconditionally, before the bounds checks below.
     const ST h_xx_r =
         v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g00, g01, g02, g00, g01, g02) + kX * (gX_i + dX_i);
     const ST h_xy_r =
         v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g00, g01, g02, g10, g11, g12) + kX * (gY_i + dY_i);
     const ST h_xz_r =
         v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g00, g01, g02, g20, g21, g22) + kX * (gZ_i + dZ_i);
     const ST h_yx_r =
         v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g10, g11, g12, g00, g01, g02) + kY * (gX_i + dX_i);
     const ST h_yy_r =
         v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g10, g11, g12, g10, g11, g12) + kY * (gY_i + dY_i);
     const ST h_yz_r =
         v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g10, g11, g12, g20, g21, g22) + kY * (gZ_i + dZ_i);
     const ST h_zx_r =
         v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g20, g21, g22, g00, g01, g02) + kZ * (gX_i + dX_i);
     const ST h_zy_r =
         v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g20, g21, g22, g10, g11, g12) + kZ * (gY_i + dY_i);
     const ST h_zz_r =
         v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g20, g21, g22, g20, g21, g22) + kZ * (gZ_i + dZ_i);
 
     // Imaginary parts: same construction with the imaginary Hessian
     // components and the k-dependent term subtracted.
     const ST h_xx_i =
         v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g00, g01, g02, g00, g01, g02) - kX * (gX_r + dX_r);
     const ST h_xy_i =
         v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g00, g01, g02, g10, g11, g12) - kX * (gY_r + dY_r);
     const ST h_xz_i =
         v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g00, g01, g02, g20, g21, g22) - kX * (gZ_r + dZ_r);
     const ST h_yx_i =
         v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g10, g11, g12, g00, g01, g02) - kY * (gX_r + dX_r);
     const ST h_yy_i =
         v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g10, g11, g12, g10, g11, g12) - kY * (gY_r + dY_r);
     const ST h_yz_i =
         v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g10, g11, g12, g20, g21, g22) - kY * (gZ_r + dZ_r);
     const ST h_zx_i =
         v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g20, g21, g22, g00, g01, g02) - kZ * (gX_r + dX_r);
     const ST h_zy_i =
         v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g20, g21, g22, g10, g11, g12) - kZ * (gY_r + dY_r);
     const ST h_zz_i =
         v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g20, g21, g22, g20, g21, g22) - kZ * (gZ_r + dZ_r);
 
     // Hessian outputs, stored as nine entries in the order
     // xx, xy, xz, yx, yy, yz, zx, zy, zz
     if (psiIndex < requested_orb_size)
     {
       grad_grad_psi[psiIndex][0] = c * h_xx_r - s * h_xx_i;
       grad_grad_psi[psiIndex][1] = c * h_xy_r - s * h_xy_i;
       grad_grad_psi[psiIndex][2] = c * h_xz_r - s * h_xz_i;
       grad_grad_psi[psiIndex][3] = c * h_yx_r - s * h_yx_i;
       grad_grad_psi[psiIndex][4] = c * h_yy_r - s * h_yy_i;
       grad_grad_psi[psiIndex][5] = c * h_yz_r - s * h_yz_i;
       grad_grad_psi[psiIndex][6] = c * h_zx_r - s * h_zx_i;
       grad_grad_psi[psiIndex][7] = c * h_zy_r - s * h_zy_i;
       grad_grad_psi[psiIndex][8] = c * h_zz_r - s * h_zz_i;
     }
     if (psiIndex + 1 < requested_orb_size)
     {
       grad_grad_psi[psiIndex + 1][0] = c * h_xx_i + s * h_xx_r;
       grad_grad_psi[psiIndex + 1][1] = c * h_xy_i + s * h_xy_r;
       grad_grad_psi[psiIndex + 1][2] = c * h_xz_i + s * h_xz_r;
       grad_grad_psi[psiIndex + 1][3] = c * h_yx_i + s * h_yx_r;
       grad_grad_psi[psiIndex + 1][4] = c * h_yy_i + s * h_yy_r;
       grad_grad_psi[psiIndex + 1][5] = c * h_yz_i + s * h_yz_r;
       grad_grad_psi[psiIndex + 1][6] = c * h_zx_i + s * h_zx_r;
       grad_grad_psi[psiIndex + 1][7] = c * h_zy_i + s * h_zy_r;
       grad_grad_psi[psiIndex + 1][8] = c * h_zz_i + s * h_zz_r;
     }
   }
 
   // Second group: splines j >= nComplexBands, each producing a single real
   // orbital at output index first_spo + nComplexBands + j.
 #pragma omp simd
   for (size_t j = std::max(nComplexBands, first); j < last; j++)
   {
     int jr = j << 1;
     int ji = jr + 1;
 
     const ST kX    = k0[j];
     const ST kY    = k1[j];
     const ST kZ    = k2[j];
     const ST val_r = myV[jr];
     const ST val_i = myV[ji];
 
     //phase: s = sin(-k.r), c = cos(-k.r)
     ST s, c;
     qmcplusplus::sincos(-(x * kX + y * kY + z * kZ), &s, &c);
 
     //dot(PrimLattice.G,myG[j])
     const ST dX_r = g00 * g0[jr] + g01 * g1[jr] + g02 * g2[jr];
     const ST dY_r = g10 * g0[jr] + g11 * g1[jr] + g12 * g2[jr];
     const ST dZ_r = g20 * g0[jr] + g21 * g1[jr] + g22 * g2[jr];
 
     const ST dX_i = g00 * g0[ji] + g01 * g1[ji] + g02 * g2[ji];
     const ST dY_i = g10 * g0[ji] + g11 * g1[ji] + g12 * g2[ji];
     const ST dZ_i = g20 * g0[ji] + g21 * g1[ji] + g22 * g2[ji];
 
     // \f$\nabla \psi_r + {\bf k}\psi_i\f$
     const ST gX_r = dX_r + val_i * kX;
     const ST gY_r = dY_r + val_i * kY;
     const ST gZ_r = dZ_r + val_i * kZ;
     const ST gX_i = dX_i - val_r * kX;
     const ST gY_i = dY_i - val_r * kY;
     const ST gZ_i = dZ_i - val_r * kZ;
 
     // Unlike the first loop, the Hessian terms here are only computed when
     // the output slot is within psi.size().
     if (const size_t psiIndex = first_spo + nComplexBands + j; psiIndex < requested_orb_size)
     {
       psi[psiIndex]     = c * val_r - s * val_i;
       dpsi[psiIndex][0] = c * gX_r - s * gX_i;
       dpsi[psiIndex][1] = c * gY_r - s * gY_i;
       dpsi[psiIndex][2] = c * gZ_r - s * gZ_i;
 
       const ST h_xx_r = v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g00, g01, g02, g00, g01, g02) +
           kX * (gX_i + dX_i);
       const ST h_xy_r = v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g00, g01, g02, g10, g11, g12) +
           kX * (gY_i + dY_i);
       const ST h_xz_r = v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g00, g01, g02, g20, g21, g22) +
           kX * (gZ_i + dZ_i);
       const ST h_yx_r = v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g10, g11, g12, g00, g01, g02) +
           kY * (gX_i + dX_i);
       const ST h_yy_r = v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g10, g11, g12, g10, g11, g12) +
           kY * (gY_i + dY_i);
       const ST h_yz_r = v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g10, g11, g12, g20, g21, g22) +
           kY * (gZ_i + dZ_i);
       const ST h_zx_r = v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g20, g21, g22, g00, g01, g02) +
           kZ * (gX_i + dX_i);
       const ST h_zy_r = v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g20, g21, g22, g10, g11, g12) +
           kZ * (gY_i + dY_i);
       const ST h_zz_r = v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g20, g21, g22, g20, g21, g22) +
           kZ * (gZ_i + dZ_i);
 
       const ST h_xx_i = v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g00, g01, g02, g00, g01, g02) -
           kX * (gX_r + dX_r);
       const ST h_xy_i = v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g00, g01, g02, g10, g11, g12) -
           kX * (gY_r + dY_r);
       const ST h_xz_i = v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g00, g01, g02, g20, g21, g22) -
           kX * (gZ_r + dZ_r);
       const ST h_yx_i = v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g10, g11, g12, g00, g01, g02) -
           kY * (gX_r + dX_r);
       const ST h_yy_i = v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g10, g11, g12, g10, g11, g12) -
           kY * (gY_r + dY_r);
       const ST h_yz_i = v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g10, g11, g12, g20, g21, g22) -
           kY * (gZ_r + dZ_r);
       const ST h_zx_i = v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g20, g21, g22, g00, g01, g02) -
           kZ * (gX_r + dX_r);
       const ST h_zy_i = v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g20, g21, g22, g10, g11, g12) -
           kZ * (gY_r + dY_r);
       const ST h_zz_i = v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g20, g21, g22, g20, g21, g22) -
           kZ * (gZ_r + dZ_r);
 
       // only the real combination (c * real - s * imag) is stored per spline
       grad_grad_psi[psiIndex][0] = c * h_xx_r - s * h_xx_i;
       grad_grad_psi[psiIndex][1] = c * h_xy_r - s * h_xy_i;
       grad_grad_psi[psiIndex][2] = c * h_xz_r - s * h_xz_i;
       grad_grad_psi[psiIndex][3] = c * h_yx_r - s * h_yx_i;
       grad_grad_psi[psiIndex][4] = c * h_yy_r - s * h_yy_i;
       grad_grad_psi[psiIndex][5] = c * h_yz_r - s * h_yz_i;
       grad_grad_psi[psiIndex][6] = c * h_zx_r - s * h_zx_i;
       grad_grad_psi[psiIndex][7] = c * h_zy_r - s * h_zy_i;
       grad_grad_psi[psiIndex][8] = c * h_zz_r - s * h_zz_i;
     }
   }
 }

◆ assign_vghgh()

void assign_vghgh	(	const PointType &	r,
		ValueVector &	psi,
		GradVector &	dpsi,
		HessVector &	grad_grad_psi,
		GGGVector &	grad_grad_grad_psi,
		int	first = `0`,
		int	last = `-1`
	)		const

Definition at line 719 of file SplineC2R.cpp.

References TinyVector< T, D >::data(), omptarget::min(), qmcplusplus::Units::time::s, qmcplusplus::sincos(), qmcplusplus::t3_contract(), and qmcplusplus::v_m_v().

 {
   // Fills psi, dpsi, grad_grad_psi and grad_grad_grad_psi at position r for the spline
   // bands j in [first, last), combining the buffered spline data (myV, myG, myH, mygH)
   // with a per-band phase factor built from myKcart.
   //  - Each band owns two consecutive buffer slots: jr = 2j and ji = 2j + 1 (the _r / _i
   //    suffixed quantities below; presumably the real and imaginary parts of a complex spline).
   //  - Bands j < nComplexBands produce two output orbitals (psiIndex and psiIndex + 1);
   //    bands j >= nComplexBands produce a single output orbital.
   //  - Any output index >= psi.size() is skipped without error.
   // NOTE(review): the buffers are only read here; this assumes they were already filled for
   // this r by an earlier evaluation step -- confirm against the caller.

   // protect last: a negative value (the declared default is -1) selects all k-points, and
   // anything beyond kPoints.size() is clamped to it.
   last = last < 0 ? kPoints.size() : (last > kPoints.size() ? kPoints.size() : last);
 
   // The nine entries of PrimLattice.G. The triples (g00,g01,g02), (g10,g11,g12) and
   // (g20,g21,g22) are contracted with the buffered derivatives below to form the
   // x, y and z cartesian components respectively.
   const ST g00 = PrimLattice.G(0), g01 = PrimLattice.G(1), g02 = PrimLattice.G(2), g10 = PrimLattice.G(3),
            g11 = PrimLattice.G(4), g12 = PrimLattice.G(5), g20 = PrimLattice.G(6), g21 = PrimLattice.G(7),
            g22 = PrimLattice.G(8);
   const ST x = r[0], y = r[1], z = r[2];
 
   // Per-band k-vector components (indexed by band j, not by jr/ji).
   const ST* restrict k0 = myKcart.data(0);
   const ST* restrict k1 = myKcart.data(1);
   const ST* restrict k2 = myKcart.data(2);
 
   // Buffered first derivatives (3 components) and second derivatives (6 components,
   // named by index pairs 00,01,02,11,12,22), indexed by jr/ji.
   const ST* restrict g0  = myG.data(0);
   const ST* restrict g1  = myG.data(1);
   const ST* restrict g2  = myG.data(2);
   const ST* restrict h00 = myH.data(0);
   const ST* restrict h01 = myH.data(1);
   const ST* restrict h02 = myH.data(2);
   const ST* restrict h11 = myH.data(3);
   const ST* restrict h12 = myH.data(4);
   const ST* restrict h22 = myH.data(5);
 
   // Buffered third derivatives: 10 components named by sorted index triples 000 ... 222.
   const ST* restrict gh000 = mygH.data(0);
   const ST* restrict gh001 = mygH.data(1);
   const ST* restrict gh002 = mygH.data(2);
   const ST* restrict gh011 = mygH.data(3);
   const ST* restrict gh012 = mygH.data(4);
   const ST* restrict gh022 = mygH.data(5);
   const ST* restrict gh111 = mygH.data(6);
   const ST* restrict gh112 = mygH.data(7);
   const ST* restrict gh122 = mygH.data(8);
   const ST* restrict gh222 = mygH.data(9);
 
   // Upper bound on writable output indices; every store below is guarded against it.
   const size_t requested_orb_size = psi.size();
 //SIMD doesn't work quite right yet.  Comment out until further debugging.
 // NOTE(review): despite the remark above, the pragma below is active (not commented out).
 // Confirm whether SIMD is intended to be enabled for this loop.
 #pragma omp simd
   // First pass: bands below nComplexBands, each producing two output orbitals.
   for (size_t j = first; j < std::min(nComplexBands, last); j++)
   {
     // Buffer slots of this band: jr = 2j, ji = 2j + 1.
     int jr = j << 1;
     int ji = jr + 1;
 
     const ST kX    = k0[j];
     const ST kY    = k1[j];
     const ST kZ    = k2[j];
     const ST val_r = myV[jr];
     const ST val_i = myV[ji];
 
     //phase: s and c are filled by sincos for the angle -(k . r)
     ST s, c;
     qmcplusplus::sincos(-(x * kX + y * kY + z * kZ), &s, &c);
 
     //dot(PrimLattice.G,myG[j])
     const ST dX_r = g00 * g0[jr] + g01 * g1[jr] + g02 * g2[jr];
     const ST dY_r = g10 * g0[jr] + g11 * g1[jr] + g12 * g2[jr];
     const ST dZ_r = g20 * g0[jr] + g21 * g1[jr] + g22 * g2[jr];
 
     const ST dX_i = g00 * g0[ji] + g01 * g1[ji] + g02 * g2[ji];
     const ST dY_i = g10 * g0[ji] + g11 * g1[ji] + g12 * g2[ji];
     const ST dZ_i = g20 * g0[ji] + g21 * g1[ji] + g22 * g2[ji];
 
     // \f$\nabla \psi_r + {\bf k}\psi_i\f$
     // (and, for the _i components, \f$\nabla \psi_i - {\bf k}\psi_r\f$)
     const ST gX_r = dX_r + val_i * kX;
     const ST gY_r = dY_r + val_i * kY;
     const ST gZ_r = dZ_r + val_i * kZ;
     const ST gX_i = dX_i - val_r * kX;
     const ST gY_i = dY_i - val_r * kY;
     const ST gZ_i = dZ_i - val_r * kZ;
 
     // This band's two outputs live at psiIndex (c * re - s * im combination) and
     // psiIndex + 1 (c * im + s * re combination).
     const size_t psiIndex = first_spo + jr;
     if (psiIndex < requested_orb_size)
     {
       psi[psiIndex]     = c * val_r - s * val_i;
       dpsi[psiIndex][0] = c * gX_r - s * gX_i;
       dpsi[psiIndex][1] = c * gY_r - s * gY_i;
       dpsi[psiIndex][2] = c * gZ_r - s * gZ_i;
     }
     if (psiIndex + 1 < requested_orb_size)
     {
       psi[psiIndex + 1]     = c * val_i + s * val_r;
       dpsi[psiIndex + 1][0] = c * gX_i + s * gX_r;
       dpsi[psiIndex + 1][1] = c * gY_i + s * gY_r;
       dpsi[psiIndex + 1][2] = c * gZ_i + s * gZ_r;
     }
 
     //intermediates for computation of hessian. \partial_i \partial_j phi in cartesian coordinates.
     const ST f_xx_r = v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g00, g01, g02, g00, g01, g02);
     const ST f_xy_r = v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g00, g01, g02, g10, g11, g12);
     const ST f_xz_r = v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g00, g01, g02, g20, g21, g22);
     const ST f_yy_r = v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g10, g11, g12, g10, g11, g12);
     const ST f_yz_r = v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g10, g11, g12, g20, g21, g22);
     const ST f_zz_r = v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g20, g21, g22, g20, g21, g22);
 
     const ST f_xx_i = v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g00, g01, g02, g00, g01, g02);
     const ST f_xy_i = v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g00, g01, g02, g10, g11, g12);
     const ST f_xz_i = v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g00, g01, g02, g20, g21, g22);
     const ST f_yy_i = v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g10, g11, g12, g10, g11, g12);
     const ST f_yz_i = v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g10, g11, g12, g20, g21, g22);
     const ST f_zz_i = v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g20, g21, g22, g20, g21, g22);
 
     // Second derivatives including the k-dependent terms: the bare second derivative,
     // plus/minus k times first derivatives of the other part, minus k*k times the value.
     const ST h_xx_r = f_xx_r + 2 * kX * dX_i - kX * kX * val_r;
     const ST h_xy_r = f_xy_r + (kX * dY_i + kY * dX_i) - kX * kY * val_r;
     const ST h_xz_r = f_xz_r + (kX * dZ_i + kZ * dX_i) - kX * kZ * val_r;
     const ST h_yy_r = f_yy_r + 2 * kY * dY_i - kY * kY * val_r;
     const ST h_yz_r = f_yz_r + (kY * dZ_i + kZ * dY_i) - kY * kZ * val_r;
     const ST h_zz_r = f_zz_r + 2 * kZ * dZ_i - kZ * kZ * val_r;
 
     const ST h_xx_i = f_xx_i - 2 * kX * dX_r - kX * kX * val_i;
     const ST h_xy_i = f_xy_i - (kX * dY_r + kY * dX_r) - kX * kY * val_i;
     const ST h_xz_i = f_xz_i - (kX * dZ_r + kZ * dX_r) - kX * kZ * val_i;
     const ST h_yy_i = f_yy_i - 2 * kY * dY_r - kY * kY * val_i;
     const ST h_yz_i = f_yz_i - (kZ * dY_r + kY * dZ_r) - kZ * kY * val_i;
     const ST h_zz_i = f_zz_i - 2 * kZ * dZ_r - kZ * kZ * val_i;
 
     // Hessian output is a full 3x3 in row-major order (xx,xy,xz,yx,yy,yz,zx,zy,zz);
     // the symmetric pairs (1,3), (2,6) and (5,7) are written with the same value.
     if (psiIndex < requested_orb_size)
     {
       grad_grad_psi[psiIndex][0] = c * h_xx_r - s * h_xx_i;
       grad_grad_psi[psiIndex][1] = c * h_xy_r - s * h_xy_i;
       grad_grad_psi[psiIndex][2] = c * h_xz_r - s * h_xz_i;
       grad_grad_psi[psiIndex][3] = c * h_xy_r - s * h_xy_i;
       grad_grad_psi[psiIndex][4] = c * h_yy_r - s * h_yy_i;
       grad_grad_psi[psiIndex][5] = c * h_yz_r - s * h_yz_i;
       grad_grad_psi[psiIndex][6] = c * h_xz_r - s * h_xz_i;
       grad_grad_psi[psiIndex][7] = c * h_yz_r - s * h_yz_i;
       grad_grad_psi[psiIndex][8] = c * h_zz_r - s * h_zz_i;
     }
 
     if (psiIndex + 1 < requested_orb_size)
     {
       grad_grad_psi[psiIndex + 1][0] = c * h_xx_i + s * h_xx_r;
       grad_grad_psi[psiIndex + 1][1] = c * h_xy_i + s * h_xy_r;
       grad_grad_psi[psiIndex + 1][2] = c * h_xz_i + s * h_xz_r;
       grad_grad_psi[psiIndex + 1][3] = c * h_xy_i + s * h_xy_r;
       grad_grad_psi[psiIndex + 1][4] = c * h_yy_i + s * h_yy_r;
       grad_grad_psi[psiIndex + 1][5] = c * h_yz_i + s * h_yz_r;
       grad_grad_psi[psiIndex + 1][6] = c * h_xz_i + s * h_xz_r;
       grad_grad_psi[psiIndex + 1][7] = c * h_yz_i + s * h_yz_r;
       grad_grad_psi[psiIndex + 1][8] = c * h_zz_i + s * h_zz_r;
     }
 
     //These are the real and imaginary components of the third SPO derivative.  _xxx denotes
     // third derivative w.r.t. x, _xyz, a derivative with respect to x,y, and z, and so on.
     // Only the 10 distinct index combinations are computed; the last nine arguments of each
     // t3_contract call are the three G triples selecting the three cartesian directions.
 
     const ST f3_xxx_r = t3_contract(gh000[jr], gh001[jr], gh002[jr], gh011[jr], gh012[jr], gh022[jr], gh111[jr],
                                     gh112[jr], gh122[jr], gh222[jr], g00, g01, g02, g00, g01, g02, g00, g01, g02);
     const ST f3_xxy_r = t3_contract(gh000[jr], gh001[jr], gh002[jr], gh011[jr], gh012[jr], gh022[jr], gh111[jr],
                                     gh112[jr], gh122[jr], gh222[jr], g00, g01, g02, g00, g01, g02, g10, g11, g12);
     const ST f3_xxz_r = t3_contract(gh000[jr], gh001[jr], gh002[jr], gh011[jr], gh012[jr], gh022[jr], gh111[jr],
                                     gh112[jr], gh122[jr], gh222[jr], g00, g01, g02, g00, g01, g02, g20, g21, g22);
     const ST f3_xyy_r = t3_contract(gh000[jr], gh001[jr], gh002[jr], gh011[jr], gh012[jr], gh022[jr], gh111[jr],
                                     gh112[jr], gh122[jr], gh222[jr], g00, g01, g02, g10, g11, g12, g10, g11, g12);
     const ST f3_xyz_r = t3_contract(gh000[jr], gh001[jr], gh002[jr], gh011[jr], gh012[jr], gh022[jr], gh111[jr],
                                     gh112[jr], gh122[jr], gh222[jr], g00, g01, g02, g10, g11, g12, g20, g21, g22);
     const ST f3_xzz_r = t3_contract(gh000[jr], gh001[jr], gh002[jr], gh011[jr], gh012[jr], gh022[jr], gh111[jr],
                                     gh112[jr], gh122[jr], gh222[jr], g00, g01, g02, g20, g21, g22, g20, g21, g22);
     const ST f3_yyy_r = t3_contract(gh000[jr], gh001[jr], gh002[jr], gh011[jr], gh012[jr], gh022[jr], gh111[jr],
                                     gh112[jr], gh122[jr], gh222[jr], g10, g11, g12, g10, g11, g12, g10, g11, g12);
     const ST f3_yyz_r = t3_contract(gh000[jr], gh001[jr], gh002[jr], gh011[jr], gh012[jr], gh022[jr], gh111[jr],
                                     gh112[jr], gh122[jr], gh222[jr], g10, g11, g12, g10, g11, g12, g20, g21, g22);
     const ST f3_yzz_r = t3_contract(gh000[jr], gh001[jr], gh002[jr], gh011[jr], gh012[jr], gh022[jr], gh111[jr],
                                     gh112[jr], gh122[jr], gh222[jr], g10, g11, g12, g20, g21, g22, g20, g21, g22);
     const ST f3_zzz_r = t3_contract(gh000[jr], gh001[jr], gh002[jr], gh011[jr], gh012[jr], gh022[jr], gh111[jr],
                                     gh112[jr], gh122[jr], gh222[jr], g20, g21, g22, g20, g21, g22, g20, g21, g22);
 
     const ST f3_xxx_i = t3_contract(gh000[ji], gh001[ji], gh002[ji], gh011[ji], gh012[ji], gh022[ji], gh111[ji],
                                     gh112[ji], gh122[ji], gh222[ji], g00, g01, g02, g00, g01, g02, g00, g01, g02);
     const ST f3_xxy_i = t3_contract(gh000[ji], gh001[ji], gh002[ji], gh011[ji], gh012[ji], gh022[ji], gh111[ji],
                                     gh112[ji], gh122[ji], gh222[ji], g00, g01, g02, g00, g01, g02, g10, g11, g12);
     const ST f3_xxz_i = t3_contract(gh000[ji], gh001[ji], gh002[ji], gh011[ji], gh012[ji], gh022[ji], gh111[ji],
                                     gh112[ji], gh122[ji], gh222[ji], g00, g01, g02, g00, g01, g02, g20, g21, g22);
     const ST f3_xyy_i = t3_contract(gh000[ji], gh001[ji], gh002[ji], gh011[ji], gh012[ji], gh022[ji], gh111[ji],
                                     gh112[ji], gh122[ji], gh222[ji], g00, g01, g02, g10, g11, g12, g10, g11, g12);
     const ST f3_xyz_i = t3_contract(gh000[ji], gh001[ji], gh002[ji], gh011[ji], gh012[ji], gh022[ji], gh111[ji],
                                     gh112[ji], gh122[ji], gh222[ji], g00, g01, g02, g10, g11, g12, g20, g21, g22);
     const ST f3_xzz_i = t3_contract(gh000[ji], gh001[ji], gh002[ji], gh011[ji], gh012[ji], gh022[ji], gh111[ji],
                                     gh112[ji], gh122[ji], gh222[ji], g00, g01, g02, g20, g21, g22, g20, g21, g22);
     const ST f3_yyy_i = t3_contract(gh000[ji], gh001[ji], gh002[ji], gh011[ji], gh012[ji], gh022[ji], gh111[ji],
                                     gh112[ji], gh122[ji], gh222[ji], g10, g11, g12, g10, g11, g12, g10, g11, g12);
     const ST f3_yyz_i = t3_contract(gh000[ji], gh001[ji], gh002[ji], gh011[ji], gh012[ji], gh022[ji], gh111[ji],
                                     gh112[ji], gh122[ji], gh222[ji], g10, g11, g12, g10, g11, g12, g20, g21, g22);
     const ST f3_yzz_i = t3_contract(gh000[ji], gh001[ji], gh002[ji], gh011[ji], gh012[ji], gh022[ji], gh111[ji],
                                     gh112[ji], gh122[ji], gh222[ji], g10, g11, g12, g20, g21, g22, g20, g21, g22);
     const ST f3_zzz_i = t3_contract(gh000[ji], gh001[ji], gh002[ji], gh011[ji], gh012[ji], gh022[ji], gh111[ji],
                                     gh112[ji], gh122[ji], gh222[ji], g20, g21, g22, g20, g21, g22, g20, g21, g22);
 
     //Here is where we build up the components of the physical hessian gradient, namely, d^3/dx^3(e^{-ik*r}\phi(r))
     // Each term combines: the bare third derivative, k times second derivatives of the other
     // part, k*k times first derivatives of the same part, and k*k*k times the value of the
     // other part (with the signs shown).
     const ST gh_xxx_r = f3_xxx_r + 3 * kX * f_xx_i - 3 * kX * kX * dX_r - kX * kX * kX * val_i;
     const ST gh_xxx_i = f3_xxx_i - 3 * kX * f_xx_r - 3 * kX * kX * dX_i + kX * kX * kX * val_r;
     const ST gh_xxy_r =
         f3_xxy_r + (kY * f_xx_i + 2 * kX * f_xy_i) - (kX * kX * dY_r + 2 * kX * kY * dX_r) - kX * kX * kY * val_i;
     const ST gh_xxy_i =
         f3_xxy_i - (kY * f_xx_r + 2 * kX * f_xy_r) - (kX * kX * dY_i + 2 * kX * kY * dX_i) + kX * kX * kY * val_r;
     const ST gh_xxz_r =
         f3_xxz_r + (kZ * f_xx_i + 2 * kX * f_xz_i) - (kX * kX * dZ_r + 2 * kX * kZ * dX_r) - kX * kX * kZ * val_i;
     const ST gh_xxz_i =
         f3_xxz_i - (kZ * f_xx_r + 2 * kX * f_xz_r) - (kX * kX * dZ_i + 2 * kX * kZ * dX_i) + kX * kX * kZ * val_r;
     const ST gh_xyy_r =
         f3_xyy_r + (2 * kY * f_xy_i + kX * f_yy_i) - (2 * kX * kY * dY_r + kY * kY * dX_r) - kX * kY * kY * val_i;
     const ST gh_xyy_i =
         f3_xyy_i - (2 * kY * f_xy_r + kX * f_yy_r) - (2 * kX * kY * dY_i + kY * kY * dX_i) + kX * kY * kY * val_r;
     const ST gh_xyz_r = f3_xyz_r + (kX * f_yz_i + kY * f_xz_i + kZ * f_xy_i) -
         (kX * kY * dZ_r + kY * kZ * dX_r + kZ * kX * dY_r) - kX * kY * kZ * val_i;
     const ST gh_xyz_i = f3_xyz_i - (kX * f_yz_r + kY * f_xz_r + kZ * f_xy_r) -
         (kX * kY * dZ_i + kY * kZ * dX_i + kZ * kX * dY_i) + kX * kY * kZ * val_r;
     const ST gh_xzz_r =
         f3_xzz_r + (2 * kZ * f_xz_i + kX * f_zz_i) - (2 * kX * kZ * dZ_r + kZ * kZ * dX_r) - kX * kZ * kZ * val_i;
     const ST gh_xzz_i =
         f3_xzz_i - (2 * kZ * f_xz_r + kX * f_zz_r) - (2 * kX * kZ * dZ_i + kZ * kZ * dX_i) + kX * kZ * kZ * val_r;
     const ST gh_yyy_r = f3_yyy_r + 3 * kY * f_yy_i - 3 * kY * kY * dY_r - kY * kY * kY * val_i;
     const ST gh_yyy_i = f3_yyy_i - 3 * kY * f_yy_r - 3 * kY * kY * dY_i + kY * kY * kY * val_r;
     const ST gh_yyz_r =
         f3_yyz_r + (kZ * f_yy_i + 2 * kY * f_yz_i) - (kY * kY * dZ_r + 2 * kY * kZ * dY_r) - kY * kY * kZ * val_i;
     const ST gh_yyz_i =
         f3_yyz_i - (kZ * f_yy_r + 2 * kY * f_yz_r) - (kY * kY * dZ_i + 2 * kY * kZ * dY_i) + kY * kY * kZ * val_r;
     const ST gh_yzz_r =
         f3_yzz_r + (2 * kZ * f_yz_i + kY * f_zz_i) - (2 * kY * kZ * dZ_r + kZ * kZ * dY_r) - kY * kZ * kZ * val_i;
     const ST gh_yzz_i =
         f3_yzz_i - (2 * kZ * f_yz_r + kY * f_zz_r) - (2 * kY * kZ * dZ_i + kZ * kZ * dY_i) + kY * kZ * kZ * val_r;
     const ST gh_zzz_r = f3_zzz_r + 3 * kZ * f_zz_i - 3 * kZ * kZ * dZ_r - kZ * kZ * kZ * val_i;
     const ST gh_zzz_i = f3_zzz_i - 3 * kZ * f_zz_r - 3 * kZ * kZ * dZ_i + kZ * kZ * kZ * val_r;
 
     // Output layout: grad_grad_grad_psi[orb][a][3 * b + c] holds the derivative along
     // directions a, b, c (0 = x, 1 = y, 2 = z). All 27 entries are stored, so each of the
     // 10 distinct values above is written to every permutation of its indices.
     if (psiIndex < requested_orb_size)
     {
       grad_grad_grad_psi[psiIndex][0][0] = c * gh_xxx_r - s * gh_xxx_i;
       grad_grad_grad_psi[psiIndex][0][1] = c * gh_xxy_r - s * gh_xxy_i;
       grad_grad_grad_psi[psiIndex][0][2] = c * gh_xxz_r - s * gh_xxz_i;
       grad_grad_grad_psi[psiIndex][0][3] = c * gh_xxy_r - s * gh_xxy_i;
       grad_grad_grad_psi[psiIndex][0][4] = c * gh_xyy_r - s * gh_xyy_i;
       grad_grad_grad_psi[psiIndex][0][5] = c * gh_xyz_r - s * gh_xyz_i;
       grad_grad_grad_psi[psiIndex][0][6] = c * gh_xxz_r - s * gh_xxz_i;
       grad_grad_grad_psi[psiIndex][0][7] = c * gh_xyz_r - s * gh_xyz_i;
       grad_grad_grad_psi[psiIndex][0][8] = c * gh_xzz_r - s * gh_xzz_i;
 
       grad_grad_grad_psi[psiIndex][1][0] = c * gh_xxy_r - s * gh_xxy_i;
       grad_grad_grad_psi[psiIndex][1][1] = c * gh_xyy_r - s * gh_xyy_i;
       grad_grad_grad_psi[psiIndex][1][2] = c * gh_xyz_r - s * gh_xyz_i;
       grad_grad_grad_psi[psiIndex][1][3] = c * gh_xyy_r - s * gh_xyy_i;
       grad_grad_grad_psi[psiIndex][1][4] = c * gh_yyy_r - s * gh_yyy_i;
       grad_grad_grad_psi[psiIndex][1][5] = c * gh_yyz_r - s * gh_yyz_i;
       grad_grad_grad_psi[psiIndex][1][6] = c * gh_xyz_r - s * gh_xyz_i;
       grad_grad_grad_psi[psiIndex][1][7] = c * gh_yyz_r - s * gh_yyz_i;
       grad_grad_grad_psi[psiIndex][1][8] = c * gh_yzz_r - s * gh_yzz_i;
 
       grad_grad_grad_psi[psiIndex][2][0] = c * gh_xxz_r - s * gh_xxz_i;
       grad_grad_grad_psi[psiIndex][2][1] = c * gh_xyz_r - s * gh_xyz_i;
       grad_grad_grad_psi[psiIndex][2][2] = c * gh_xzz_r - s * gh_xzz_i;
       grad_grad_grad_psi[psiIndex][2][3] = c * gh_xyz_r - s * gh_xyz_i;
       grad_grad_grad_psi[psiIndex][2][4] = c * gh_yyz_r - s * gh_yyz_i;
       grad_grad_grad_psi[psiIndex][2][5] = c * gh_yzz_r - s * gh_yzz_i;
       grad_grad_grad_psi[psiIndex][2][6] = c * gh_xzz_r - s * gh_xzz_i;
       grad_grad_grad_psi[psiIndex][2][7] = c * gh_yzz_r - s * gh_yzz_i;
       grad_grad_grad_psi[psiIndex][2][8] = c * gh_zzz_r - s * gh_zzz_i;
     }
 
     if (psiIndex + 1 < requested_orb_size)
     {
       grad_grad_grad_psi[psiIndex + 1][0][0] = c * gh_xxx_i + s * gh_xxx_r;
       grad_grad_grad_psi[psiIndex + 1][0][1] = c * gh_xxy_i + s * gh_xxy_r;
       grad_grad_grad_psi[psiIndex + 1][0][2] = c * gh_xxz_i + s * gh_xxz_r;
       grad_grad_grad_psi[psiIndex + 1][0][3] = c * gh_xxy_i + s * gh_xxy_r;
       grad_grad_grad_psi[psiIndex + 1][0][4] = c * gh_xyy_i + s * gh_xyy_r;
       grad_grad_grad_psi[psiIndex + 1][0][5] = c * gh_xyz_i + s * gh_xyz_r;
       grad_grad_grad_psi[psiIndex + 1][0][6] = c * gh_xxz_i + s * gh_xxz_r;
       grad_grad_grad_psi[psiIndex + 1][0][7] = c * gh_xyz_i + s * gh_xyz_r;
       grad_grad_grad_psi[psiIndex + 1][0][8] = c * gh_xzz_i + s * gh_xzz_r;
 
       grad_grad_grad_psi[psiIndex + 1][1][0] = c * gh_xxy_i + s * gh_xxy_r;
       grad_grad_grad_psi[psiIndex + 1][1][1] = c * gh_xyy_i + s * gh_xyy_r;
       grad_grad_grad_psi[psiIndex + 1][1][2] = c * gh_xyz_i + s * gh_xyz_r;
       grad_grad_grad_psi[psiIndex + 1][1][3] = c * gh_xyy_i + s * gh_xyy_r;
       grad_grad_grad_psi[psiIndex + 1][1][4] = c * gh_yyy_i + s * gh_yyy_r;
       grad_grad_grad_psi[psiIndex + 1][1][5] = c * gh_yyz_i + s * gh_yyz_r;
       grad_grad_grad_psi[psiIndex + 1][1][6] = c * gh_xyz_i + s * gh_xyz_r;
       grad_grad_grad_psi[psiIndex + 1][1][7] = c * gh_yyz_i + s * gh_yyz_r;
       grad_grad_grad_psi[psiIndex + 1][1][8] = c * gh_yzz_i + s * gh_yzz_r;
 
       grad_grad_grad_psi[psiIndex + 1][2][0] = c * gh_xxz_i + s * gh_xxz_r;
       grad_grad_grad_psi[psiIndex + 1][2][1] = c * gh_xyz_i + s * gh_xyz_r;
       grad_grad_grad_psi[psiIndex + 1][2][2] = c * gh_xzz_i + s * gh_xzz_r;
       grad_grad_grad_psi[psiIndex + 1][2][3] = c * gh_xyz_i + s * gh_xyz_r;
       grad_grad_grad_psi[psiIndex + 1][2][4] = c * gh_yyz_i + s * gh_yyz_r;
       grad_grad_grad_psi[psiIndex + 1][2][5] = c * gh_yzz_i + s * gh_yzz_r;
       grad_grad_grad_psi[psiIndex + 1][2][6] = c * gh_xzz_i + s * gh_xzz_r;
       grad_grad_grad_psi[psiIndex + 1][2][7] = c * gh_yzz_i + s * gh_yzz_r;
       grad_grad_grad_psi[psiIndex + 1][2][8] = c * gh_zzz_i + s * gh_zzz_r;
     }
   }
 #pragma omp simd
   // Second pass: bands at or above nComplexBands, each producing a single output orbital
   // (only the c * re - s * im combination is stored).
   for (size_t j = std::max(nComplexBands, first); j < last; j++)
   {
     // Buffer slots of this band: jr = 2j, ji = 2j + 1.
     int jr = j << 1;
     int ji = jr + 1;
 
     const ST kX    = k0[j];
     const ST kY    = k1[j];
     const ST kZ    = k2[j];
     const ST val_r = myV[jr];
     const ST val_i = myV[ji];
 
     //phase: s and c are filled by sincos for the angle -(k . r)
     ST s, c;
     qmcplusplus::sincos(-(x * kX + y * kY + z * kZ), &s, &c);
 
     //dot(PrimLattice.G,myG[j])
     const ST dX_r = g00 * g0[jr] + g01 * g1[jr] + g02 * g2[jr];
     const ST dY_r = g10 * g0[jr] + g11 * g1[jr] + g12 * g2[jr];
     const ST dZ_r = g20 * g0[jr] + g21 * g1[jr] + g22 * g2[jr];
 
     const ST dX_i = g00 * g0[ji] + g01 * g1[ji] + g02 * g2[ji];
     const ST dY_i = g10 * g0[ji] + g11 * g1[ji] + g12 * g2[ji];
     const ST dZ_i = g20 * g0[ji] + g21 * g1[ji] + g22 * g2[ji];
 
     // \f$\nabla \psi_r + {\bf k}\psi_i\f$
     // (and, for the _i components, \f$\nabla \psi_i - {\bf k}\psi_r\f$)
     const ST gX_r = dX_r + val_i * kX;
     const ST gY_r = dY_r + val_i * kY;
     const ST gZ_r = dZ_r + val_i * kZ;
     const ST gX_i = dX_i - val_r * kX;
     const ST gY_i = dY_i - val_r * kY;
     const ST gZ_i = dZ_i - val_r * kZ;
 
     // The first nComplexBands bands take two output slots each, so band j here maps to
     // slot first_spo + nComplexBands + j. Everything for this band is skipped when that
     // slot is outside the requested range.
     if (const size_t psiIndex = first_spo + nComplexBands + j; psiIndex < requested_orb_size)
     {
       psi[psiIndex]     = c * val_r - s * val_i;
       dpsi[psiIndex][0] = c * gX_r - s * gX_i;
       dpsi[psiIndex][1] = c * gY_r - s * gY_i;
       dpsi[psiIndex][2] = c * gZ_r - s * gZ_i;
 
       //intermediates for computation of hessian. \partial_i \partial_j phi in cartesian coordinates.
       const ST f_xx_r = v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g00, g01, g02, g00, g01, g02);
       const ST f_xy_r = v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g00, g01, g02, g10, g11, g12);
       const ST f_xz_r = v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g00, g01, g02, g20, g21, g22);
       const ST f_yy_r = v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g10, g11, g12, g10, g11, g12);
       const ST f_yz_r = v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g10, g11, g12, g20, g21, g22);
       const ST f_zz_r = v_m_v(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], g20, g21, g22, g20, g21, g22);
 
       const ST f_xx_i = v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g00, g01, g02, g00, g01, g02);
       const ST f_xy_i = v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g00, g01, g02, g10, g11, g12);
       const ST f_xz_i = v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g00, g01, g02, g20, g21, g22);
       const ST f_yy_i = v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g10, g11, g12, g10, g11, g12);
       const ST f_yz_i = v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g10, g11, g12, g20, g21, g22);
       const ST f_zz_i = v_m_v(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], g20, g21, g22, g20, g21, g22);
 
       // Second derivatives including the k-dependent terms (same expressions as the first pass).
       const ST h_xx_r = f_xx_r + 2 * kX * dX_i - kX * kX * val_r;
       const ST h_xy_r = f_xy_r + (kX * dY_i + kY * dX_i) - kX * kY * val_r;
       const ST h_xz_r = f_xz_r + (kX * dZ_i + kZ * dX_i) - kX * kZ * val_r;
       const ST h_yy_r = f_yy_r + 2 * kY * dY_i - kY * kY * val_r;
       const ST h_yz_r = f_yz_r + (kY * dZ_i + kZ * dY_i) - kY * kZ * val_r;
       const ST h_zz_r = f_zz_r + 2 * kZ * dZ_i - kZ * kZ * val_r;
 
       const ST h_xx_i = f_xx_i - 2 * kX * dX_r - kX * kX * val_i;
       const ST h_xy_i = f_xy_i - (kX * dY_r + kY * dX_r) - kX * kY * val_i;
       const ST h_xz_i = f_xz_i - (kX * dZ_r + kZ * dX_r) - kX * kZ * val_i;
       const ST h_yy_i = f_yy_i - 2 * kY * dY_r - kY * kY * val_i;
       const ST h_yz_i = f_yz_i - (kZ * dY_r + kY * dZ_r) - kZ * kY * val_i;
       const ST h_zz_i = f_zz_i - 2 * kZ * dZ_r - kZ * kZ * val_i;
 
       // Row-major 3x3 Hessian; symmetric pairs (1,3), (2,6), (5,7) receive the same value.
       grad_grad_psi[psiIndex][0] = c * h_xx_r - s * h_xx_i;
       grad_grad_psi[psiIndex][1] = c * h_xy_r - s * h_xy_i;
       grad_grad_psi[psiIndex][2] = c * h_xz_r - s * h_xz_i;
       grad_grad_psi[psiIndex][3] = c * h_xy_r - s * h_xy_i;
       grad_grad_psi[psiIndex][4] = c * h_yy_r - s * h_yy_i;
       grad_grad_psi[psiIndex][5] = c * h_yz_r - s * h_yz_i;
       grad_grad_psi[psiIndex][6] = c * h_xz_r - s * h_xz_i;
       grad_grad_psi[psiIndex][7] = c * h_yz_r - s * h_yz_i;
       grad_grad_psi[psiIndex][8] = c * h_zz_r - s * h_zz_i;
 
       //These are the real and imaginary components of the third SPO derivative.  _xxx denotes
       // third derivative w.r.t. x, _xyz, a derivative with respect to x,y, and z, and so on.
 
       const ST f3_xxx_r = t3_contract(gh000[jr], gh001[jr], gh002[jr], gh011[jr], gh012[jr], gh022[jr], gh111[jr],
                                       gh112[jr], gh122[jr], gh222[jr], g00, g01, g02, g00, g01, g02, g00, g01, g02);
       const ST f3_xxy_r = t3_contract(gh000[jr], gh001[jr], gh002[jr], gh011[jr], gh012[jr], gh022[jr], gh111[jr],
                                       gh112[jr], gh122[jr], gh222[jr], g00, g01, g02, g00, g01, g02, g10, g11, g12);
       const ST f3_xxz_r = t3_contract(gh000[jr], gh001[jr], gh002[jr], gh011[jr], gh012[jr], gh022[jr], gh111[jr],
                                       gh112[jr], gh122[jr], gh222[jr], g00, g01, g02, g00, g01, g02, g20, g21, g22);
       const ST f3_xyy_r = t3_contract(gh000[jr], gh001[jr], gh002[jr], gh011[jr], gh012[jr], gh022[jr], gh111[jr],
                                       gh112[jr], gh122[jr], gh222[jr], g00, g01, g02, g10, g11, g12, g10, g11, g12);
       const ST f3_xyz_r = t3_contract(gh000[jr], gh001[jr], gh002[jr], gh011[jr], gh012[jr], gh022[jr], gh111[jr],
                                       gh112[jr], gh122[jr], gh222[jr], g00, g01, g02, g10, g11, g12, g20, g21, g22);
       const ST f3_xzz_r = t3_contract(gh000[jr], gh001[jr], gh002[jr], gh011[jr], gh012[jr], gh022[jr], gh111[jr],
                                       gh112[jr], gh122[jr], gh222[jr], g00, g01, g02, g20, g21, g22, g20, g21, g22);
       const ST f3_yyy_r = t3_contract(gh000[jr], gh001[jr], gh002[jr], gh011[jr], gh012[jr], gh022[jr], gh111[jr],
                                       gh112[jr], gh122[jr], gh222[jr], g10, g11, g12, g10, g11, g12, g10, g11, g12);
       const ST f3_yyz_r = t3_contract(gh000[jr], gh001[jr], gh002[jr], gh011[jr], gh012[jr], gh022[jr], gh111[jr],
                                       gh112[jr], gh122[jr], gh222[jr], g10, g11, g12, g10, g11, g12, g20, g21, g22);
       const ST f3_yzz_r = t3_contract(gh000[jr], gh001[jr], gh002[jr], gh011[jr], gh012[jr], gh022[jr], gh111[jr],
                                       gh112[jr], gh122[jr], gh222[jr], g10, g11, g12, g20, g21, g22, g20, g21, g22);
       const ST f3_zzz_r = t3_contract(gh000[jr], gh001[jr], gh002[jr], gh011[jr], gh012[jr], gh022[jr], gh111[jr],
                                       gh112[jr], gh122[jr], gh222[jr], g20, g21, g22, g20, g21, g22, g20, g21, g22);
 
       const ST f3_xxx_i = t3_contract(gh000[ji], gh001[ji], gh002[ji], gh011[ji], gh012[ji], gh022[ji], gh111[ji],
                                       gh112[ji], gh122[ji], gh222[ji], g00, g01, g02, g00, g01, g02, g00, g01, g02);
       const ST f3_xxy_i = t3_contract(gh000[ji], gh001[ji], gh002[ji], gh011[ji], gh012[ji], gh022[ji], gh111[ji],
                                       gh112[ji], gh122[ji], gh222[ji], g00, g01, g02, g00, g01, g02, g10, g11, g12);
       const ST f3_xxz_i = t3_contract(gh000[ji], gh001[ji], gh002[ji], gh011[ji], gh012[ji], gh022[ji], gh111[ji],
                                       gh112[ji], gh122[ji], gh222[ji], g00, g01, g02, g00, g01, g02, g20, g21, g22);
       const ST f3_xyy_i = t3_contract(gh000[ji], gh001[ji], gh002[ji], gh011[ji], gh012[ji], gh022[ji], gh111[ji],
                                       gh112[ji], gh122[ji], gh222[ji], g00, g01, g02, g10, g11, g12, g10, g11, g12);
       const ST f3_xyz_i = t3_contract(gh000[ji], gh001[ji], gh002[ji], gh011[ji], gh012[ji], gh022[ji], gh111[ji],
                                       gh112[ji], gh122[ji], gh222[ji], g00, g01, g02, g10, g11, g12, g20, g21, g22);
       const ST f3_xzz_i = t3_contract(gh000[ji], gh001[ji], gh002[ji], gh011[ji], gh012[ji], gh022[ji], gh111[ji],
                                       gh112[ji], gh122[ji], gh222[ji], g00, g01, g02, g20, g21, g22, g20, g21, g22);
       const ST f3_yyy_i = t3_contract(gh000[ji], gh001[ji], gh002[ji], gh011[ji], gh012[ji], gh022[ji], gh111[ji],
                                       gh112[ji], gh122[ji], gh222[ji], g10, g11, g12, g10, g11, g12, g10, g11, g12);
       const ST f3_yyz_i = t3_contract(gh000[ji], gh001[ji], gh002[ji], gh011[ji], gh012[ji], gh022[ji], gh111[ji],
                                       gh112[ji], gh122[ji], gh222[ji], g10, g11, g12, g10, g11, g12, g20, g21, g22);
       const ST f3_yzz_i = t3_contract(gh000[ji], gh001[ji], gh002[ji], gh011[ji], gh012[ji], gh022[ji], gh111[ji],
                                       gh112[ji], gh122[ji], gh222[ji], g10, g11, g12, g20, g21, g22, g20, g21, g22);
       const ST f3_zzz_i = t3_contract(gh000[ji], gh001[ji], gh002[ji], gh011[ji], gh012[ji], gh022[ji], gh111[ji],
                                       gh112[ji], gh122[ji], gh222[ji], g20, g21, g22, g20, g21, g22, g20, g21, g22);
 
       //Here is where we build up the components of the physical hessian gradient, namely, d^3/dx^3(e^{-ik*r}\phi(r))
       const ST gh_xxx_r = f3_xxx_r + 3 * kX * f_xx_i - 3 * kX * kX * dX_r - kX * kX * kX * val_i;
       const ST gh_xxx_i = f3_xxx_i - 3 * kX * f_xx_r - 3 * kX * kX * dX_i + kX * kX * kX * val_r;
       const ST gh_xxy_r =
           f3_xxy_r + (kY * f_xx_i + 2 * kX * f_xy_i) - (kX * kX * dY_r + 2 * kX * kY * dX_r) - kX * kX * kY * val_i;
       const ST gh_xxy_i =
           f3_xxy_i - (kY * f_xx_r + 2 * kX * f_xy_r) - (kX * kX * dY_i + 2 * kX * kY * dX_i) + kX * kX * kY * val_r;
       const ST gh_xxz_r =
           f3_xxz_r + (kZ * f_xx_i + 2 * kX * f_xz_i) - (kX * kX * dZ_r + 2 * kX * kZ * dX_r) - kX * kX * kZ * val_i;
       const ST gh_xxz_i =
           f3_xxz_i - (kZ * f_xx_r + 2 * kX * f_xz_r) - (kX * kX * dZ_i + 2 * kX * kZ * dX_i) + kX * kX * kZ * val_r;
       const ST gh_xyy_r =
           f3_xyy_r + (2 * kY * f_xy_i + kX * f_yy_i) - (2 * kX * kY * dY_r + kY * kY * dX_r) - kX * kY * kY * val_i;
       const ST gh_xyy_i =
           f3_xyy_i - (2 * kY * f_xy_r + kX * f_yy_r) - (2 * kX * kY * dY_i + kY * kY * dX_i) + kX * kY * kY * val_r;
       const ST gh_xyz_r = f3_xyz_r + (kX * f_yz_i + kY * f_xz_i + kZ * f_xy_i) -
           (kX * kY * dZ_r + kY * kZ * dX_r + kZ * kX * dY_r) - kX * kY * kZ * val_i;
       const ST gh_xyz_i = f3_xyz_i - (kX * f_yz_r + kY * f_xz_r + kZ * f_xy_r) -
           (kX * kY * dZ_i + kY * kZ * dX_i + kZ * kX * dY_i) + kX * kY * kZ * val_r;
       const ST gh_xzz_r =
           f3_xzz_r + (2 * kZ * f_xz_i + kX * f_zz_i) - (2 * kX * kZ * dZ_r + kZ * kZ * dX_r) - kX * kZ * kZ * val_i;
       const ST gh_xzz_i =
           f3_xzz_i - (2 * kZ * f_xz_r + kX * f_zz_r) - (2 * kX * kZ * dZ_i + kZ * kZ * dX_i) + kX * kZ * kZ * val_r;
       const ST gh_yyy_r = f3_yyy_r + 3 * kY * f_yy_i - 3 * kY * kY * dY_r - kY * kY * kY * val_i;
       const ST gh_yyy_i = f3_yyy_i - 3 * kY * f_yy_r - 3 * kY * kY * dY_i + kY * kY * kY * val_r;
       const ST gh_yyz_r =
           f3_yyz_r + (kZ * f_yy_i + 2 * kY * f_yz_i) - (kY * kY * dZ_r + 2 * kY * kZ * dY_r) - kY * kY * kZ * val_i;
       const ST gh_yyz_i =
           f3_yyz_i - (kZ * f_yy_r + 2 * kY * f_yz_r) - (kY * kY * dZ_i + 2 * kY * kZ * dY_i) + kY * kY * kZ * val_r;
       const ST gh_yzz_r =
           f3_yzz_r + (2 * kZ * f_yz_i + kY * f_zz_i) - (2 * kY * kZ * dZ_r + kZ * kZ * dY_r) - kY * kZ * kZ * val_i;
       const ST gh_yzz_i =
           f3_yzz_i - (2 * kZ * f_yz_r + kY * f_zz_r) - (2 * kY * kZ * dZ_i + kZ * kZ * dY_i) + kY * kZ * kZ * val_r;
       const ST gh_zzz_r = f3_zzz_r + 3 * kZ * f_zz_i - 3 * kZ * kZ * dZ_r - kZ * kZ * kZ * val_i;
       const ST gh_zzz_i = f3_zzz_i - 3 * kZ * f_zz_r - 3 * kZ * kZ * dZ_i + kZ * kZ * kZ * val_r;
       // Layout is [a][3 * b + c] for derivative directions a, b, c (0 = x, 1 = y, 2 = z).
       // All 27 entries are stored, so each of the 10 distinct values computed above is
       // written to every permutation of its indices.
       grad_grad_grad_psi[psiIndex][0][0] = c * gh_xxx_r - s * gh_xxx_i;
       grad_grad_grad_psi[psiIndex][0][1] = c * gh_xxy_r - s * gh_xxy_i;
       grad_grad_grad_psi[psiIndex][0][2] = c * gh_xxz_r - s * gh_xxz_i;
       grad_grad_grad_psi[psiIndex][0][3] = c * gh_xxy_r - s * gh_xxy_i;
       grad_grad_grad_psi[psiIndex][0][4] = c * gh_xyy_r - s * gh_xyy_i;
       grad_grad_grad_psi[psiIndex][0][5] = c * gh_xyz_r - s * gh_xyz_i;
       grad_grad_grad_psi[psiIndex][0][6] = c * gh_xxz_r - s * gh_xxz_i;
       grad_grad_grad_psi[psiIndex][0][7] = c * gh_xyz_r - s * gh_xyz_i;
       grad_grad_grad_psi[psiIndex][0][8] = c * gh_xzz_r - s * gh_xzz_i;
 
       grad_grad_grad_psi[psiIndex][1][0] = c * gh_xxy_r - s * gh_xxy_i;
       grad_grad_grad_psi[psiIndex][1][1] = c * gh_xyy_r - s * gh_xyy_i;
       grad_grad_grad_psi[psiIndex][1][2] = c * gh_xyz_r - s * gh_xyz_i;
       grad_grad_grad_psi[psiIndex][1][3] = c * gh_xyy_r - s * gh_xyy_i;
       grad_grad_grad_psi[psiIndex][1][4] = c * gh_yyy_r - s * gh_yyy_i;
       grad_grad_grad_psi[psiIndex][1][5] = c * gh_yyz_r - s * gh_yyz_i;
       grad_grad_grad_psi[psiIndex][1][6] = c * gh_xyz_r - s * gh_xyz_i;
       grad_grad_grad_psi[psiIndex][1][7] = c * gh_yyz_r - s * gh_yyz_i;
       grad_grad_grad_psi[psiIndex][1][8] = c * gh_yzz_r - s * gh_yzz_i;
 
       grad_grad_grad_psi[psiIndex][2][0] = c * gh_xxz_r - s * gh_xxz_i;
       grad_grad_grad_psi[psiIndex][2][1] = c * gh_xyz_r - s * gh_xyz_i;
       grad_grad_grad_psi[psiIndex][2][2] = c * gh_xzz_r - s * gh_xzz_i;
       grad_grad_grad_psi[psiIndex][2][3] = c * gh_xyz_r - s * gh_xyz_i;
       grad_grad_grad_psi[psiIndex][2][4] = c * gh_yyz_r - s * gh_yyz_i;
       grad_grad_grad_psi[psiIndex][2][5] = c * gh_yzz_r - s * gh_yzz_i;
       grad_grad_grad_psi[psiIndex][2][6] = c * gh_xzz_r - s * gh_xzz_i;
       grad_grad_grad_psi[psiIndex][2][7] = c * gh_yzz_r - s * gh_yzz_i;
       grad_grad_grad_psi[psiIndex][2][8] = c * gh_zzz_r - s * gh_zzz_i;
     }
   }
 }

◆ assign_vgl()

void assign_vgl	(	const PointType &	r,
		ValueVector &	psi,
		GradVector &	dpsi,
		ValueVector &	d2psi,
		int	first,
		int	last
	)		const

inline

assign_vgl

Definition at line 168 of file SplineC2R.cpp.

References ASSUME_ALIGNED, TinyVector< T, D >::data(), omptarget::min(), qmcplusplus::Units::time::s, qmcplusplus::sincos(), and qmcplusplus::SymTrace().

 {
   // Converts the spline results currently held in myV / myG / myH for bands [first, last)
   // into values (psi), gradients (dpsi) and laplacians (d2psi), applying a per-band phase
   // computed from myKcart and the position r.
   // Bands with index below nComplexBands write two consecutive output entries each;
   // the remaining bands write a single entry each.
   // Every write is guarded by psi.size(), so outputs beyond the requested size are dropped.

   // protect last: never iterate past the number of k-points
   last = last > kPoints.size() ? kPoints.size() : last;
 
   constexpr ST two(2);
   // the nine entries of PrimLattice.G (flat indices 0..8), used below to transform myG
   const ST g00 = PrimLattice.G(0), g01 = PrimLattice.G(1), g02 = PrimLattice.G(2), g10 = PrimLattice.G(3),
            g11 = PrimLattice.G(4), g12 = PrimLattice.G(5), g20 = PrimLattice.G(6), g21 = PrimLattice.G(7),
            g22 = PrimLattice.G(8);
   const ST x = r[0], y = r[1], z = r[2];
   // six weights built from GGt (off-diagonal pairs summed); consumed by SymTrace together
   // with the six stored Hessian components
   const ST symGG[6] = {GGt[0], GGt[1] + GGt[3], GGt[2] + GGt[6], GGt[4], GGt[5] + GGt[7], GGt[8]};
 
   // per-component arrays of the k-vectors stored in myKcart
   const ST* restrict k0 = myKcart.data(0);
   ASSUME_ALIGNED(k0);
   const ST* restrict k1 = myKcart.data(1);
   ASSUME_ALIGNED(k1);
   const ST* restrict k2 = myKcart.data(2);
   ASSUME_ALIGNED(k2);
 
   // per-component arrays of the gradient (myG, 3 components) and Hessian (myH, 6 components)
   const ST* restrict g0 = myG.data(0);
   ASSUME_ALIGNED(g0);
   const ST* restrict g1 = myG.data(1);
   ASSUME_ALIGNED(g1);
   const ST* restrict g2 = myG.data(2);
   ASSUME_ALIGNED(g2);
   const ST* restrict h00 = myH.data(0);
   ASSUME_ALIGNED(h00);
   const ST* restrict h01 = myH.data(1);
   ASSUME_ALIGNED(h01);
   const ST* restrict h02 = myH.data(2);
   ASSUME_ALIGNED(h02);
   const ST* restrict h11 = myH.data(3);
   ASSUME_ALIGNED(h11);
   const ST* restrict h12 = myH.data(4);
   ASSUME_ALIGNED(h12);
   const ST* restrict h22 = myH.data(5);
   ASSUME_ALIGNED(h22);
 
   const size_t requested_orb_size = psi.size();
   // First pass: bands below nComplexBands. Each band j produces two outputs,
   // at first_spo + 2*j and first_spo + 2*j + 1.
 #pragma omp simd
   for (size_t j = first; j < std::min(nComplexBands, last); j++)
   {
     // real and imaginary parts of band j are interleaved: index 2*j and 2*j + 1
     const size_t jr = j << 1;
     const size_t ji = jr + 1;
 
     const ST kX    = k0[j];
     const ST kY    = k1[j];
     const ST kZ    = k2[j];
     const ST val_r = myV[jr];
     const ST val_i = myV[ji];
 
     //phase: s and c are filled by sincos for the angle -(k . r)
     ST s, c;
     qmcplusplus::sincos(-(x * kX + y * kY + z * kZ), &s, &c);
 
     //dot(PrimLattice.G,myG[j])
     const ST dX_r = g00 * g0[jr] + g01 * g1[jr] + g02 * g2[jr];
     const ST dY_r = g10 * g0[jr] + g11 * g1[jr] + g12 * g2[jr];
     const ST dZ_r = g20 * g0[jr] + g21 * g1[jr] + g22 * g2[jr];
 
     const ST dX_i = g00 * g0[ji] + g01 * g1[ji] + g02 * g2[ji];
     const ST dY_i = g10 * g0[ji] + g11 * g1[ji] + g12 * g2[ji];
     const ST dZ_i = g20 * g0[ji] + g21 * g1[ji] + g22 * g2[ji];
 
     // \f$\nabla \psi_r + {\bf k}\psi_i\f$ (real part) and \f$\nabla \psi_i - {\bf k}\psi_r\f$ (imaginary part)
     const ST gX_r = dX_r + val_i * kX;
     const ST gY_r = dY_r + val_i * kY;
     const ST gZ_r = dZ_r + val_i * kZ;
     const ST gX_i = dX_i - val_r * kX;
     const ST gY_i = dY_i - val_r * kY;
     const ST gZ_i = dZ_i - val_r * kZ;
 
     // laplacian: SymTrace of the stored Hessian with symGG, plus mKK[j] * value
     // and the cross term 2 * k . gradient
     const ST lcart_r = SymTrace(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], symGG);
     const ST lcart_i = SymTrace(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], symGG);
     const ST lap_r   = lcart_r + mKK[j] * val_r + two * (kX * dX_i + kY * dY_i + kZ * dZ_i);
     const ST lap_i   = lcart_i + mKK[j] * val_i - two * (kX * dX_r + kY * dY_r + kZ * dZ_r);
 
     const size_t psiIndex = first_spo + jr;
     // first output: real part of (a_r + i a_i) * (c + i s) for value, gradient and laplacian
     if (psiIndex < requested_orb_size)
     {
       psi[psiIndex]     = c * val_r - s * val_i;
       dpsi[psiIndex][0] = c * gX_r - s * gX_i;
       dpsi[psiIndex][1] = c * gY_r - s * gY_i;
       dpsi[psiIndex][2] = c * gZ_r - s * gZ_i;
       d2psi[psiIndex]   = c * lap_r - s * lap_i;
     }
     // second output: imaginary part of the same products
     if (psiIndex + 1 < requested_orb_size)
     {
       psi[psiIndex + 1]     = c * val_i + s * val_r;
       dpsi[psiIndex + 1][0] = c * gX_i + s * gX_r;
       dpsi[psiIndex + 1][1] = c * gY_i + s * gY_r;
       dpsi[psiIndex + 1][2] = c * gZ_i + s * gZ_r;
       d2psi[psiIndex + 1]   = c * lap_i + s * lap_r;
     }
   }
 
   // Second pass: bands at or above nComplexBands. Each band j produces one output,
   // at first_spo + nComplexBands + j (only the real-part combination is stored).
 #pragma omp simd
   for (size_t j = std::max(nComplexBands, first); j < last; j++)
   {
     const size_t jr = j << 1;
     const size_t ji = jr + 1;
 
     const ST kX    = k0[j];
     const ST kY    = k1[j];
     const ST kZ    = k2[j];
     const ST val_r = myV[jr];
     const ST val_i = myV[ji];
 
     //phase: s and c are filled by sincos for the angle -(k . r)
     ST s, c;
     qmcplusplus::sincos(-(x * kX + y * kY + z * kZ), &s, &c);
 
     //dot(PrimLattice.G,myG[j])
     const ST dX_r = g00 * g0[jr] + g01 * g1[jr] + g02 * g2[jr];
     const ST dY_r = g10 * g0[jr] + g11 * g1[jr] + g12 * g2[jr];
     const ST dZ_r = g20 * g0[jr] + g21 * g1[jr] + g22 * g2[jr];
 
     const ST dX_i = g00 * g0[ji] + g01 * g1[ji] + g02 * g2[ji];
     const ST dY_i = g10 * g0[ji] + g11 * g1[ji] + g12 * g2[ji];
     const ST dZ_i = g20 * g0[ji] + g21 * g1[ji] + g22 * g2[ji];
 
     // \f$\nabla \psi_r + {\bf k}\psi_i\f$ (real part) and \f$\nabla \psi_i - {\bf k}\psi_r\f$ (imaginary part)
     const ST gX_r = dX_r + val_i * kX;
     const ST gY_r = dY_r + val_i * kY;
     const ST gZ_r = dZ_r + val_i * kZ;
     const ST gX_i = dX_i - val_r * kX;
     const ST gY_i = dY_i - val_r * kY;
     const ST gZ_i = dZ_i - val_r * kZ;
 
     if (const size_t psiIndex = first_spo + nComplexBands + j; psiIndex < requested_orb_size)
     {
       psi[psiIndex]     = c * val_r - s * val_i;
       dpsi[psiIndex][0] = c * gX_r - s * gX_i;
       dpsi[psiIndex][1] = c * gY_r - s * gY_i;
       dpsi[psiIndex][2] = c * gZ_r - s * gZ_i;
 
       // the laplacian is only evaluated when the output slot is actually written
       const ST lcart_r = SymTrace(h00[jr], h01[jr], h02[jr], h11[jr], h12[jr], h22[jr], symGG);
       const ST lcart_i = SymTrace(h00[ji], h01[ji], h02[ji], h11[ji], h12[ji], h22[ji], symGG);
       const ST lap_r   = lcart_r + mKK[j] * val_r + two * (kX * dX_i + kY * dY_i + kZ * dZ_i);
       const ST lap_i   = lcart_i + mKK[j] * val_i - two * (kX * dX_r + kY * dY_r + kZ * dZ_r);
       d2psi[psiIndex]  = c * lap_r - s * lap_i;
     }
   }
 }

◆ assign_vgl_from_l()

void assign_vgl_from_l	(	const PointType &	r,
		ValueVector &	psi,
		GradVector &	dpsi,
		ValueVector &	d2psi
	)

inline

assign_vgl_from_l can be used when myL is precomputed and myV, myG and myL are already in Cartesian coordinates.

Definition at line 321 of file SplineC2R.cpp.

References ASSUME_ALIGNED, TinyVector< T, D >::data(), qmcplusplus::Units::force::N, qmcplusplus::Units::time::s, and qmcplusplus::sincos().

 {
   // Same output layout as assign_vgl, but over all kPoints.size() bands and using the
   // precomputed laplacian myL. myG is read directly, with no PrimLattice.G transform,
   // and no Hessian is needed.
   // Bands below nComplexBands write two consecutive output entries; the rest write one.
   constexpr ST two(2);
   const ST x = r[0], y = r[1], z = r[2];
 
   // per-component arrays of the k-vectors stored in myKcart
   const ST* restrict k0 = myKcart.data(0);
   ASSUME_ALIGNED(k0);
   const ST* restrict k1 = myKcart.data(1);
   ASSUME_ALIGNED(k1);
   const ST* restrict k2 = myKcart.data(2);
   ASSUME_ALIGNED(k2);
 
   // per-component arrays of the gradient stored in myG
   const ST* restrict g0 = myG.data(0);
   ASSUME_ALIGNED(g0);
   const ST* restrict g1 = myG.data(1);
   ASSUME_ALIGNED(g1);
   const ST* restrict g2 = myG.data(2);
   ASSUME_ALIGNED(g2);
 
   const size_t N = kPoints.size();
 
   const size_t requested_orb_size = psi.size();
   // First pass: bands below nComplexBands, two outputs per band
   // at first_spo + 2*j and first_spo + 2*j + 1.
 #pragma omp simd
   for (size_t j = 0; j < nComplexBands; j++)
   {
     // real and imaginary parts of band j are interleaved: index 2*j and 2*j + 1
     const size_t jr = j << 1;
     const size_t ji = jr + 1;
 
     const ST kX    = k0[j];
     const ST kY    = k1[j];
     const ST kZ    = k2[j];
     const ST val_r = myV[jr];
     const ST val_i = myV[ji];
 
     //phase: s and c are filled by sincos for the angle -(k . r)
     ST s, c;
     qmcplusplus::sincos(-(x * kX + y * kY + z * kZ), &s, &c);
 
     // gradient components are taken from myG as stored (no lattice transform here)
     const ST dX_r = g0[jr];
     const ST dY_r = g1[jr];
     const ST dZ_r = g2[jr];
 
     const ST dX_i = g0[ji];
     const ST dY_i = g1[ji];
     const ST dZ_i = g2[ji];
 
     // \f$\nabla \psi_r + {\bf k}\psi_i\f$ (real part) and \f$\nabla \psi_i - {\bf k}\psi_r\f$ (imaginary part)
     const ST gX_r = dX_r + val_i * kX;
     const ST gY_r = dY_r + val_i * kY;
     const ST gZ_r = dZ_r + val_i * kZ;
     const ST gX_i = dX_i - val_r * kX;
     const ST gY_i = dY_i - val_r * kY;
     const ST gZ_i = dZ_i - val_r * kZ;
 
     // laplacian: precomputed myL plus mKK[j] * value and the cross term 2 * k . gradient
     const ST lap_r = myL[jr] + mKK[j] * val_r + two * (kX * dX_i + kY * dY_i + kZ * dZ_i);
     const ST lap_i = myL[ji] + mKK[j] * val_i - two * (kX * dX_r + kY * dY_r + kZ * dZ_r);
 
     const size_t psiIndex = first_spo + jr;
     // first output: real part of (a_r + i a_i) * (c + i s) for value, laplacian and gradient
     if (psiIndex < requested_orb_size)
     {
       psi[psiIndex]     = c * val_r - s * val_i;
       d2psi[psiIndex]   = c * lap_r - s * lap_i;
       dpsi[psiIndex][0] = c * gX_r - s * gX_i;
       dpsi[psiIndex][1] = c * gY_r - s * gY_i;
       dpsi[psiIndex][2] = c * gZ_r - s * gZ_i;
     }
     // second output: imaginary part of the same products
     if (psiIndex + 1 < requested_orb_size)
     {
       psi[psiIndex + 1]     = c * val_i + s * val_r;
       d2psi[psiIndex + 1]   = c * lap_i + s * lap_r;
       dpsi[psiIndex + 1][0] = c * gX_i + s * gX_r;
       dpsi[psiIndex + 1][1] = c * gY_i + s * gY_r;
       dpsi[psiIndex + 1][2] = c * gZ_i + s * gZ_r;
     }
   }
 
   // Second pass: bands at or above nComplexBands, one output per band
   // at first_spo + nComplexBands + j.
 #pragma omp simd
   for (size_t j = nComplexBands; j < N; j++)
   {
     const size_t jr = j << 1;
     const size_t ji = jr + 1;
 
     const ST kX    = k0[j];
     const ST kY    = k1[j];
     const ST kZ    = k2[j];
     const ST val_r = myV[jr];
     const ST val_i = myV[ji];
 
     //phase: s and c are filled by sincos for the angle -(k . r)
     ST s, c;
     qmcplusplus::sincos(-(x * kX + y * kY + z * kZ), &s, &c);
 
     // gradient components are taken from myG as stored (no lattice transform here)
     const ST dX_r = g0[jr];
     const ST dY_r = g1[jr];
     const ST dZ_r = g2[jr];
 
     const ST dX_i = g0[ji];
     const ST dY_i = g1[ji];
     const ST dZ_i = g2[ji];
 
     // \f$\nabla \psi_r + {\bf k}\psi_i\f$ (real part) and \f$\nabla \psi_i - {\bf k}\psi_r\f$ (imaginary part)
     const ST gX_r = dX_r + val_i * kX;
     const ST gY_r = dY_r + val_i * kY;
     const ST gZ_r = dZ_r + val_i * kZ;
     const ST gX_i = dX_i - val_r * kX;
     const ST gY_i = dY_i - val_r * kY;
     const ST gZ_i = dZ_i - val_r * kZ;
     if (const size_t psiIndex = first_spo + nComplexBands + j; psiIndex < requested_orb_size)
     {
       psi[psiIndex]     = c * val_r - s * val_i;
       dpsi[psiIndex][0] = c * gX_r - s * gX_i;
       dpsi[psiIndex][1] = c * gY_r - s * gY_i;
       dpsi[psiIndex][2] = c * gZ_r - s * gZ_i;
 
       // the laplacian is only evaluated when the output slot is actually written
       const ST lap_r  = myL[jr] + mKK[j] * val_r + two * (kX * dX_i + kY * dY_i + kZ * dZ_i);
       const ST lap_i  = myL[ji] + mKK[j] * val_i - two * (kX * dX_r + kY * dY_r + kZ * dZ_r);
       d2psi[psiIndex] = c * lap_r - s * lap_i;
     }
   }
 }

◆ bcast_tables()

void bcast_tables ( Communicate * comm )

inline

Definition at line 107 of file SplineC2R.h.

References qmcplusplus::comm, and SplineC2R< ST >::SplineInst.

107 { chunked_bcast(comm, SplineInst->getSplinePtr()); }

qmcplusplus::comm

Communicate * comm

Definition: test_EstimatorManagerNew.cpp:50

qmcplusplus::SplineC2R::SplineInst

std::shared_ptr< MultiBspline< ST > > SplineInst

multi bspline set

Definition: SplineC2R.h:70

◆ create_spline()

void create_spline	(	GT &	xyz_g,
		BCT &	xyz_bc
	)

inline

Definition at line 124 of file SplineC2R.h.

References qmcplusplus::app_log(), SplineC2R< ST >::myV, SplineC2R< ST >::resize_kpoints(), Vector< T, Alloc >::size(), and SplineC2R< ST >::SplineInst.

   {
     resize_kpoints();
     SplineInst = std::make_shared<MultiBspline<ST>>();
     SplineInst->create(xyz_g, xyz_bc, myV.size());
 
     app_log() << "MEMORY " << SplineInst->sizeInByte() / (1 << 20) << " MB allocated "
               << "for the coefficients in 3D spline orbital representation" << std::endl;
   }

◆ evaluateDetRatios()

void evaluateDetRatios	(	const VirtualParticleSet &	VP,
		ValueVector &	psi,
		const ValueVector &	psiinv,
		std::vector< TT > &	ratios
	)

override

Definition at line 120 of file SplineC2R.cpp.

References ParticleSet::activeR(), qmcplusplus::C2C::assign_v(), qmcplusplus::simd::dot(), FairDivideAligned(), VirtualParticleSet::getTotalNum(), omptarget::min(), omp_get_num_threads(), and omp_get_thread_num().

 {
   const bool need_resize = ratios_private.rows() < VP.getTotalNum();
 
 #pragma omp parallel
   {
     int tid = omp_get_thread_num();
     // initialize thread private ratios
     if (need_resize)
     {
       if (tid == 0) // just like #pragma omp master, but one fewer call to the runtime
         ratios_private.resize(VP.getTotalNum(), omp_get_num_threads());
 #pragma omp barrier
     }
     int first, last;
     FairDivideAligned(myV.size(), getAlignment<ST>(), omp_get_num_threads(), tid, first, last);
     const int first_cplx = first / 2;
     const int last_cplx  = kPoints.size() < last / 2 ? kPoints.size() : last / 2;
 
     for (int iat = 0; iat < VP.getTotalNum(); ++iat)
     {
       const PointType& r = VP.activeR(iat);
       PointType ru(PrimLattice.toUnit_floor(r));
 
       spline2::evaluate3d(SplineInst->getSplinePtr(), ru, myV, first, last);
       assign_v(r, myV, psi, first_cplx, last_cplx);
 
       const int first_real     = first_cplx + std::min(nComplexBands, first_cplx);
       const int last_real      = last_cplx + std::min(nComplexBands, last_cplx);
       ratios_private[iat][tid] = simd::dot(psi.data() + first_real, psiinv.data() + first_real, last_real - first_real);
     }
   }
 
   // do the reduction manually
   for (int iat = 0; iat < VP.getTotalNum(); ++iat)
   {
     ratios[iat] = TT(0);
     for (int tid = 0; tid < ratios_private.cols(); tid++)
       ratios[iat] += ratios_private[iat][tid];
   }
 }

◆ evaluateValue()

void evaluateValue	(	const ParticleSet &	P,
		const int	iat,
		ValueVector &	psi
	)

overridevirtual

evaluate the values of this single-particle orbital set

Parameters

P	current ParticleSet
iat	active particle
psi	values of the SPO

Implements SPOSet.

Definition at line 104 of file SplineC2R.cpp.

References ParticleSet::activeR(), qmcplusplus::C2C::assign_v(), FairDivideAligned(), omp_get_num_threads(), and omp_get_thread_num().

 {
   const PointType& r = P.activeR(iat);
   PointType ru(PrimLattice.toUnit_floor(r));
 
 #pragma omp parallel
   {
     int first, last;
     FairDivideAligned(myV.size(), getAlignment<ST>(), omp_get_num_threads(), omp_get_thread_num(), first, last);
 
     spline2::evaluate3d(SplineInst->getSplinePtr(), ru, myV, first, last);
     assign_v(r, myV, psi, first / 2, last / 2);
   }
 }

◆ evaluateVGH()

void evaluateVGH	(	const ParticleSet &	P,
		const int	iat,
		ValueVector &	psi,
		GradVector &	dpsi,
		HessVector &	grad_grad_psi
	)

overridevirtual

evaluate the values, gradients and hessians of this single-particle orbital set

Parameters

P	current ParticleSet
iat	active particle
psi	values of the SPO
dpsi	gradients of the SPO
grad_grad_psi	hessians of the SPO

Reimplemented from SPOSet.

Definition at line 700 of file SplineC2R.cpp.

References ParticleSet::activeR(), FairDivideAligned(), omp_get_num_threads(), and omp_get_thread_num().

 {
   const PointType& r = P.activeR(iat);
   PointType ru(PrimLattice.toUnit_floor(r));
 #pragma omp parallel
   {
     int first, last;
     FairDivideAligned(myV.size(), getAlignment<ST>(), omp_get_num_threads(), omp_get_thread_num(), first, last);
 
     spline2::evaluate3d_vgh(SplineInst->getSplinePtr(), ru, myV, myG, myH, first, last);
     assign_vgh(r, psi, dpsi, grad_grad_psi, first / 2, last / 2);
   }
 }

◆ evaluateVGHGH()

void evaluateVGHGH	(	const ParticleSet &	P,
		const int	iat,
		ValueVector &	psi,
		GradVector &	dpsi,
		HessVector &	grad_grad_psi,
		GGGVector &	grad_grad_grad_psi
	)

overridevirtual

evaluate the values, gradients, hessians, and grad hessians of this single-particle orbital set

Parameters

P	current ParticleSet
iat	active particle
psi	values of the SPO
dpsi	gradients of the SPO
grad_grad_psi	hessians of the SPO
grad_grad_grad_psi	grad hessians of the SPO

Reimplemented from SPOSet.

Definition at line 1207 of file SplineC2R.cpp.

References ParticleSet::activeR(), FairDivideAligned(), omp_get_num_threads(), and omp_get_thread_num().

 {
   const PointType& r = P.activeR(iat);
   PointType ru(PrimLattice.toUnit_floor(r));
 #pragma omp parallel
   {
     int first, last;
     FairDivideAligned(myV.size(), getAlignment<ST>(), omp_get_num_threads(), omp_get_thread_num(), first, last);
 
     spline2::evaluate3d_vghgh(SplineInst->getSplinePtr(), ru, myV, myG, myH, mygH, first, last);
     assign_vghgh(r, psi, dpsi, grad_grad_psi, grad_grad_grad_psi, first / 2, last / 2);
   }
 }

◆ evaluateVGL()

void evaluateVGL	(	const ParticleSet &	P,
		const int	iat,
		ValueVector &	psi,
		GradVector &	dpsi,
		ValueVector &	d2psi
	)

overridevirtual

evaluate the values, gradients and laplacians of this single-particle orbital set

Parameters

P	current ParticleSet
iat	active particle
psi	values of the SPO
dpsi	gradients of the SPO
d2psi	laplacians of the SPO

Implements SPOSet.

Definition at line 445 of file SplineC2R.cpp.

References ParticleSet::activeR(), qmcplusplus::C2C::assign_vgl(), FairDivideAligned(), omp_get_num_threads(), and omp_get_thread_num().

 {
   const PointType& r = P.activeR(iat);
   PointType ru(PrimLattice.toUnit_floor(r));
 
 #pragma omp parallel
   {
     int first, last;
     FairDivideAligned(myV.size(), getAlignment<ST>(), omp_get_num_threads(), omp_get_thread_num(), first, last);
 
     spline2::evaluate3d_vgh(SplineInst->getSplinePtr(), ru, myV, myG, myH, first, last);
     assign_vgl(r, psi, dpsi, d2psi, first / 2, last / 2);
   }
 }

◆ flush_zero()

void flush_zero ( )

inline

Definition at line 134 of file SplineC2R.h.

References SplineC2R< ST >::SplineInst.

134 { SplineInst->flush_zero(); }

qmcplusplus::SplineC2R::SplineInst

std::shared_ptr< MultiBspline< ST > > SplineInst

multi bspline set

Definition: SplineC2R.h:70

◆ gather_tables()

void gather_tables ( Communicate * comm )

inline

Definition at line 109 of file SplineC2R.h.

References qmcplusplus::comm, FairDivideLow(), gatherv(), BsplineSet::kPoints, BsplineSet::offset, Communicate::size(), and SplineC2R< ST >::SplineInst.

   {
     if (comm->size() == 1)
       return;
     const int Nbands      = kPoints.size();
     const int Nbandgroups = comm->size();
     offset.resize(Nbandgroups + 1, 0);
     FairDivideLow(Nbands, Nbandgroups, offset);
 
     for (size_t ib = 0; ib < offset.size(); ib++)
       offset[ib] = offset[ib] * 2;
     gatherv(comm, SplineInst->getSplinePtr(), SplineInst->getSplinePtr()->z_stride, offset);
   }

◆ getClassName()

virtual std::string getClassName ( ) const

inlineoverridevirtual

return class name

Implements SPOSet.

Definition at line 90 of file SplineC2R.h.

90 { return "SplineC2R"; }

◆ getKeyword()

virtual std::string getKeyword ( ) const

inlineoverridevirtual

Implements BsplineSet.

Definition at line 91 of file SplineC2R.h.

91 { return "SplineC2R"; }

◆ isComplex()

bool isComplex ( ) const

inlineoverridevirtual

Implements BsplineSet.

Definition at line 92 of file SplineC2R.h.

92 { return true; };

◆ makeClone()

std::unique_ptr<SPOSet> makeClone ( ) const

inlineoverridevirtual

Make a clone of itself. Every derived class must implement this for threading to work correctly.

Implements BsplineSet.

Definition at line 94 of file SplineC2R.h.

94 { return std::make_unique<SplineC2R>(*this); }

◆ read_splines()

bool read_splines ( hdf_archive & h5f )

Definition at line 41 of file SplineC2R.cpp.

References hdf_archive::readEntry().

 {
   std::ostringstream o;
   o << "spline_" << MyIndex;
   einspline_engine<SplineType> bigtable(SplineInst->getSplinePtr());
   return h5f.readEntry(bigtable, o.str().c_str()); //"spline_0");
 }

◆ resize_kpoints()

void resize_kpoints ( )

inline

remap kPoints to pack the double copy

Definition at line 137 of file SplineC2R.h.

References qmcplusplus::dot(), BsplineSet::kPoints, SplineC2R< ST >::mKK, SplineC2R< ST >::myKcart, SplineC2R< ST >::nComplexBands, BsplineSet::remap_kpoints(), VectorSoaContainer< T, D, Alloc >::resize(), and Vector< T, Alloc >::resize().

Referenced by SplineC2R< ST >::create_spline().

   {
     nComplexBands = this->remap_kpoints();
     const int nk  = kPoints.size();
     mKK.resize(nk);
     myKcart.resize(nk);
     for (size_t i = 0; i < nk; ++i)
     {
       mKK[i]     = -dot(kPoints[i], kPoints[i]);
       myKcart(i) = kPoints[i];
     }
   }

◆ resizeStorage()

void resizeStorage	(	size_t	n,
		size_t	nvals
	)

inline

Definition at line 96 of file SplineC2R.h.

References BsplineSet::init_base(), SplineC2R< ST >::myG, SplineC2R< ST >::mygH, SplineC2R< ST >::myH, SplineC2R< ST >::myL, SplineC2R< ST >::myV, qmcplusplus::n, VectorSoaContainer< T, D, Alloc >::resize(), and Vector< T, Alloc >::resize().

   {
     init_base(n);
     size_t npad = getAlignedSize<ST>(2 * n);
     myV.resize(npad);
     myG.resize(npad);
     myL.resize(npad);
     myH.resize(npad);
     mygH.resize(npad);
   }

◆ set_spline()

void set_spline	(	SingleSplineType *	spline_r,
		SingleSplineType *	spline_i,
		int	twist,
		int	ispline,
		int	level
	)

inline

Definition at line 30 of file SplineC2R.cpp.

 {
   SplineInst->copy_spline(spline_r, 2 * ispline);
   SplineInst->copy_spline(spline_i, 2 * ispline + 1);
 }

◆ write_splines()

bool write_splines ( hdf_archive & h5f )

Definition at line 50 of file SplineC2R.cpp.

References hdf_archive::writeEntry().

 {
   std::ostringstream o;
   o << "spline_" << MyIndex;
   einspline_engine<SplineType> bigtable(SplineInst->getSplinePtr());
   return h5f.writeEntry(bigtable, o.str().c_str()); //"spline_0");
 }

Friends And Related Function Documentation

◆ BsplineReader

friend struct BsplineReader

friend

Definition at line 210 of file SplineC2R.h.

◆ SplineSetReader

friend class SplineSetReader

friend

Definition at line 209 of file SplineC2R.h.

Member Data Documentation

◆ GGt

Tensor<ST, 3> GGt

private

$GGt = G^t G$, the transformation for tensors from lattice units to Cartesian units, e.g. the Hessian

Definition at line 66 of file SplineC2R.h.

◆ mKK

vContainer_type mKK

private

Definition at line 72 of file SplineC2R.h.

Referenced by SplineC2R< ST >::resize_kpoints().

◆ myG

gContainer_type myG

protected

Definition at line 82 of file SplineC2R.h.

Referenced by SplineC2R< ST >::resizeStorage().

◆ mygH

ghContainer_type mygH

protected

Definition at line 84 of file SplineC2R.h.

Referenced by SplineC2R< ST >::resizeStorage().

◆ myH

hContainer_type myH

protected

Definition at line 83 of file SplineC2R.h.

Referenced by SplineC2R< ST >::resizeStorage().

◆ myKcart

VectorSoaContainer<ST, 3> myKcart

private

Definition at line 73 of file SplineC2R.h.

Referenced by SplineC2R< ST >::resize_kpoints().

◆ myL

vContainer_type myL

protected

Definition at line 81 of file SplineC2R.h.

Referenced by SplineC2R< ST >::resizeStorage().

◆ myV

vContainer_type myV

protected

intermediate result vectors

Definition at line 80 of file SplineC2R.h.

Referenced by SplineC2R< ST >::create_spline(), and SplineC2R< ST >::resizeStorage().

◆ nComplexBands

int nComplexBands

private

number of complex bands

Definition at line 68 of file SplineC2R.h.

Referenced by SplineC2R< ST >::resize_kpoints().

◆ PrimLattice

CrystalLattice<ST, 3> PrimLattice

private

primitive cell

Definition at line 64 of file SplineC2R.h.

◆ ratios_private

Matrix<TT> ratios_private

private

thread private ratios for reduction when using nested threading, numVP x numThread

Definition at line 76 of file SplineC2R.h.

◆ SplineInst

std::shared_ptr<MultiBspline<ST> > SplineInst

private

multi bspline set

Definition at line 70 of file SplineC2R.h.

Referenced by SplineC2R< ST >::bcast_tables(), SplineC2R< ST >::create_spline(), SplineC2R< ST >::flush_zero(), and SplineC2R< ST >::gather_tables().

The documentation for this class was generated from the following files:

/home/pk7/projects/qmc/for_cron_doxygen/qmcpack/src/QMCWaveFunctions/BsplineFactory/SplineC2R.h
/home/pk7/projects/qmc/for_cron_doxygen/qmcpack/src/QMCWaveFunctions/BsplineFactory/SplineC2R.cpp

Public Types

Public Member Functions

Protected Attributes

Private Attributes

Friends

Additional Inherited Members

Detailed Description

template<typename ST> class qmcplusplus::SplineC2R< ST >

Member Typedef Documentation

◆ BCType

◆ DataType

◆ gContainer_type

◆ ghContainer_type

◆ hContainer_type

◆ PointType

◆ SingleSplineType

◆ SplineType

◆ TT

◆ vContainer_type

Constructor & Destructor Documentation

◆ SplineC2R() [1/2]

◆ SplineC2R() [2/2]

Member Function Documentation

◆ assign_v()

◆ assign_vgh()

◆ assign_vghgh()

◆ assign_vgl()

◆ assign_vgl_from_l()

◆ bcast_tables()

◆ create_spline()

◆ evaluateDetRatios()

◆ evaluateValue()

◆ evaluateVGH()

◆ evaluateVGHGH()

◆ evaluateVGL()

◆ flush_zero()

◆ gather_tables()

◆ getClassName()

◆ getKeyword()

◆ isComplex()

◆ makeClone()

◆ read_splines()

◆ resize_kpoints()

◆ resizeStorage()

◆ set_spline()

◆ write_splines()

Friends And Related Function Documentation

◆ BsplineReader

◆ SplineSetReader

Member Data Documentation

◆ GGt

◆ mKK

◆ myG

◆ mygH

◆ myH

◆ myKcart

◆ myL

◆ myV

◆ nComplexBands

◆ PrimLattice

◆ ratios_private

◆ SplineInst

template<typename ST>
class qmcplusplus::SplineC2R< ST >