d7/d98/a00983_source.html

 //////////////////////////////////////////////////////////////////////////////////////
 // This file is distributed under the University of Illinois/NCSA Open Source License.
 // See LICENSE file in top directory for details.
 //
 // Copyright (c) 2016 Jeongnim Kim and QMCPACK developers.
 //
 // File developed by: Ken Esler, kpesler@gmail.com, University of Illinois at Urbana-Champaign
 //                    Jeremy McMinnis, jmcminis@gmail.com, University of Illinois at Urbana-Champaign
 //                    Jeongnim Kim, jeongnim.kim@gmail.com, University of Illinois at Urbana-Champaign
 //                    Mark A. Berrill, berrillma@ornl.gov, Oak Ridge National Laboratory
 //
 // File created by: Jeongnim Kim, jeongnim.kim@gmail.com, University of Illinois at Urbana-Champaign
 //////////////////////////////////////////////////////////////////////////////////////


 #ifndef OHMMS_COMMUNICATION_OPERATORS_MPI_H
 #define OHMMS_COMMUNICATION_OPERATORS_MPI_H
 #include "Pools/PooledData.h"
 #include <algorithm>
 #include <cstdint>
 #include <stdexcept>
 /// Fallback for the free-function global sum. Types without a dedicated
 /// specialization end up here and get a std::runtime_error.
 template<typename T>
 inline void gsum(T&, int)
 {
   const char* const what = "Need specialization for gsum(T&, int)";
   throw std::runtime_error(what);
 }

 /// Fallback allreduce for types without a specialization; always throws std::runtime_error.
 template<typename T>
 inline void Communicate::allreduce(T&)
 {
   const char* const what = "Need specialization for allreduce(T&)";
   throw std::runtime_error(what);
 }

 /// Fallback reduce for types without a specialization; always throws std::runtime_error.
 template<typename T>
 inline void Communicate::reduce(T&)
 {
   const char* const what = "Need specialization for reduce(T&)";
   throw std::runtime_error(what);
 }

 /// Fallback pointer-based reduce for element types without a specialization;
 /// always throws std::runtime_error.
 template<typename T>
 inline void Communicate::reduce(T* restrict, T* restrict, int n)
 {
   const char* const what = "Need specialization for reduce(T* restrict , T* restrict, int n)";
   throw std::runtime_error(what);
 }

 /// Fallback in-place reduce for element types without a specialization;
 /// always throws std::runtime_error.
 template<typename T>
 inline void Communicate::reduce_in_place(T* restrict, int n)
 {
   const char* const what = "Need specialization for reduce_in_place(T* restrict, int n)";
   throw std::runtime_error(what);
 }

 /// Fallback broadcast for types without a specialization; always throws std::runtime_error.
 template<typename T>
 inline void Communicate::bcast(T&)
 {
   const char* const what = "Need specialization for bcast(T&)";
   throw std::runtime_error(what);
 }

 /// Fallback pointer-based broadcast for element types without a specialization;
 /// always throws std::runtime_error.
 template<typename T>
 inline void Communicate::bcast(T* restrict, int n)
 {
   const char* const what = "Need specialization for bcast(T* restrict ,int n)";
   throw std::runtime_error(what);
 }

 /// Fallback blocking send for types without a specialization; always throws std::runtime_error.
 template<typename T>
 inline void Communicate::send(int dest, int tag, T&)
 {
   const char* const what = "Need specialization for send(int, int, T& )";
   throw std::runtime_error(what);
 }

 /// Fallback gather for types without a specialization; always throws std::runtime_error.
 template<typename T>
 inline void Communicate::gather(T& sb, T& rb, int dest)
 {
   const char* const what = "Need specialization for gather(T&, T&, int)";
   throw std::runtime_error(what);
 }

 /// Fallback allgather for types without a specialization; always throws std::runtime_error.
 template<typename T>
 inline void Communicate::allgather(T& sb, T& rb, int count)
 {
   const char* const what = "Need specialization for allgather(T&, T&, int)";
   throw std::runtime_error(what);
 }

 /// Fallback gatherv for types without a specialization; always throws std::runtime_error.
 template<typename T, typename IT>
 inline void Communicate::gatherv(T& sb, T& rb, IT&, IT&, int dest)
 {
   const char* const what = "Need specialization for gatherv(T&, T&, IT&, IT&, int)";
   throw std::runtime_error(what);
 }

 /// Fallback scatter for types without a specialization; always throws std::runtime_error.
 template<typename T>
 inline void Communicate::scatter(T& sb, T& rb, int dest)
 {
   const char* const what = "Need specialization for scatter(T&, T&, int)";
   throw std::runtime_error(what);
 }

 /// Fallback scatterv for types without a specialization; always throws std::runtime_error.
 template<typename T, typename IT>
 inline void Communicate::scatterv(T& sb, T& rb, IT&, IT&, int source)
 {
   const char* const what = "Need specialization for scatterv(T&, T&, IT&, IT&, int)";
   throw std::runtime_error(what);
 }

 /// Fallback non-blocking receive for types without a specialization;
 /// always throws std::runtime_error.
 template<typename T>
 inline Communicate::request Communicate::irecv(int source, int tag, T&)
 {
   const char* const what = "Need specialization for irecv(int source, int tag, T& )";
   throw std::runtime_error(what);
   // Never reached; kept so the function body still ends in a return statement.
   return MPI_REQUEST_NULL;
 }

 /// Fallback non-blocking send for types without a specialization;
 /// always throws std::runtime_error.
 /// The message now names the first parameter `dest`, matching the signature
 /// (it previously said `source`).
 template<typename T>
 inline Communicate::request Communicate::isend(int dest, int tag, T&)
 {
   throw std::runtime_error("Need specialization for isend(int dest, int tag, T& )");
   // Never reached; kept so the function body still ends in a return statement.
   return MPI_REQUEST_NULL;
 }

 /// Fallback pointer-based non-blocking receive for element types without a
 /// specialization; always throws std::runtime_error.
 template<typename T>
 inline Communicate::request Communicate::irecv(int source, int tag, T*, int n)
 {
   const char* const what = "Need specialization for irecv(int source, int tag, T*, int )";
   throw std::runtime_error(what);
   // Never reached; kept so the function body still ends in a return statement.
   return MPI_REQUEST_NULL;
 }

 /// Fallback pointer-based non-blocking send for element types without a
 /// specialization; always throws std::runtime_error.
 /// The message now names the first parameter `dest`, matching the signature
 /// (it previously said `source`).
 template<typename T>
 inline Communicate::request Communicate::isend(int dest, int tag, T*, int n)
 {
   throw std::runtime_error("Need specialization for isend(int dest, int tag, T*, int )");
   // Never reached; kept so the function body still ends in a return statement.
   return MPI_REQUEST_NULL;
 }

 /// Fallback pointer-based allgather for element types without a specialization;
 /// always throws std::runtime_error.
 template<typename T>
 inline void Communicate::allgather(T* sb, T* rb, int count)
 {
   const char* const what = "Need specialization for allgather(T*, T*, int)";
   throw std::runtime_error(what);
 }

 /// Fallback pointer-based gatherv for element types without a specialization;
 /// always throws std::runtime_error.
 template<typename T, typename IT>
 inline void Communicate::gatherv(T* sb, T* rb, int n, IT&, IT&, int dest)
 {
   const char* const what = "Need specialization for gatherv(T*, T*, int, IT&, IT&, int)";
   throw std::runtime_error(what);
 }

 /// Fallback member gsum for types without a specialization; always throws
 /// std::runtime_error. The message previously read "Communicate::::gsum"
 /// (doubled scope operator); it is now spelled correctly.
 template<typename T>
 inline void Communicate::gsum(T&)
 {
   throw std::runtime_error("Need specialization for Communicate::gsum(T&)");
 }

 /// Sum an int over all ranks of MPI_COMM_WORLD; on return g holds the total.
 /// The gid argument is not used.
 template<>
 inline void gsum(int& g, int gid)
 {
   int contribution = g;
   MPI_Allreduce(&contribution, &g, 1, MPI_INT, MPI_SUM, MPI_COMM_WORLD);
 }

 /// Component-wise sum of a TinyVector<double, N> over all ranks of
 /// MPI_COMM_WORLD; on return g holds the totals. The gid argument is not used.
 template<unsigned N>
 inline void gsum(qmcplusplus::TinyVector<double, N>& g, int gid)
 {
   // Reduce into a separate buffer, then copy the totals back into g.
   qmcplusplus::TinyVector<double, N> totals(g);
   MPI_Allreduce(g.begin(), totals.begin(), N, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
   g = totals;
 }

 /// Element-wise sum of a std::vector<int> over all ranks of MPI_COMM_WORLD;
 /// on return g holds the totals. The gid argument is not used.
 /// Buffers are taken with data() so an empty vector is never indexed.
 template<>
 inline void gsum(std::vector<int>& g, int gid)
 {
   std::vector<int> gt(g.size(), 0);
   MPI_Allreduce(g.data(), gt.data(), static_cast<int>(g.size()), MPI_INT, MPI_SUM, MPI_COMM_WORLD);
   g = gt;
 }

 /// Sum a double over all ranks of MPI_COMM_WORLD; on return g holds the total.
 /// The gid argument is not used.
 template<>
 inline void gsum(double& g, int gid)
 {
   double contribution = g;
   MPI_Allreduce(&contribution, &g, 1, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
 }

 /// Component-wise sum of a TinyVector<int, N> over all ranks of
 /// MPI_COMM_WORLD; on return g holds the totals. The gid argument is not used.
 template<unsigned N>
 inline void gsum(qmcplusplus::TinyVector<int, N>& g, int gid)
 {
   // Reduce into a separate buffer, then copy the totals back into g.
   qmcplusplus::TinyVector<int, N> totals(g);
   MPI_Allreduce(g.begin(), totals.begin(), N, MPI_INT, MPI_SUM, MPI_COMM_WORLD);
   g = totals;
 }

 /// Element-wise sum of a std::vector<double> over all ranks of MPI_COMM_WORLD;
 /// on return g holds the totals. The gid argument is not used.
 /// Buffers are taken with data() so an empty vector is never indexed.
 template<>
 inline void gsum(std::vector<double>& g, int gid)
 {
   std::vector<double> gt(g.size(), 0.0);
   MPI_Allreduce(g.data(), gt.data(), static_cast<int>(g.size()), MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
   g = gt;
 }

 /// Element-wise sum of a Matrix<double> over all ranks of MPI_COMM_WORLD;
 /// on return g holds the totals. The gid argument is not used.
 /// std::copy is qualified explicitly instead of relying on argument-dependent
 /// lookup of an unqualified copy().
 template<>
 inline void gsum(qmcplusplus::Matrix<double>& g, int gid)
 {
   std::vector<double> gt(g.size());
   std::copy(g.begin(), g.end(), gt.begin());
   MPI_Allreduce(g.data(), gt.data(), g.size(), MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
   // Write the reduced values back into the matrix storage.
   std::copy(gt.begin(), gt.end(), g.data());
 }

 /// Sum an int over all ranks of myMPI; every rank receives the total in g.
 /// Nothing is done when the communicator has a single rank.
 template<>
 inline void Communicate::allreduce(int& g)
 {
   if (d_ncontexts != 1)
   {
     int contribution = g;
     MPI_Allreduce(&contribution, &g, 1, MPI_INT, MPI_SUM, myMPI);
   }
 }

 /// Sum a long over all ranks of myMPI; every rank receives the total in g.
 /// Nothing is done when the communicator has a single rank.
 template<>
 inline void Communicate::allreduce(long& g)
 {
   if (d_ncontexts != 1)
   {
     long contribution = g;
     MPI_Allreduce(&contribution, &g, 1, MPI_LONG, MPI_SUM, myMPI);
   }
 }

 /// Sum an unsigned long over all ranks of myMPI; every rank receives the total in g.
 /// Nothing is done when the communicator has a single rank.
 template<>
 inline void Communicate::allreduce(unsigned long& g)
 {
   if (d_ncontexts != 1)
   {
     unsigned long contribution = g;
     MPI_Allreduce(&contribution, &g, 1, MPI_UNSIGNED_LONG, MPI_SUM, myMPI);
   }
 }

 /// Sum a float over all ranks of myMPI; every rank receives the total in g.
 /// Nothing is done when the communicator has a single rank.
 template<>
 inline void Communicate::allreduce(float& g)
 {
   if (d_ncontexts != 1)
   {
     float contribution = g;
     MPI_Allreduce(&contribution, &g, 1, MPI_FLOAT, MPI_SUM, myMPI);
   }
 }

 /// Sum a double over all ranks of myMPI; every rank receives the total in g.
 /// Nothing is done when the communicator has a single rank.
 template<>
 inline void Communicate::allreduce(double& g)
 {
   if (d_ncontexts != 1)
   {
     double contribution = g;
     MPI_Allreduce(&contribution, &g, 1, MPI_DOUBLE, MPI_SUM, myMPI);
   }
 }

 /// Component-wise sum of a TinyVector<float, OHMMS_DIM> over all ranks of myMPI.
 /// Nothing is done when the communicator has a single rank.
 template<>
 inline void Communicate::allreduce(qmcplusplus::TinyVector<float, OHMMS_DIM>& g)
 {
   if (d_ncontexts != 1)
   {
     qmcplusplus::TinyVector<float, OHMMS_DIM> totals(g);
     MPI_Allreduce(g.begin(), totals.begin(), OHMMS_DIM, MPI_FLOAT, MPI_SUM, myMPI);
     g = totals;
   }
 }

 /// Component-wise sum of a TinyVector<double, OHMMS_DIM> over all ranks of myMPI.
 /// Nothing is done when the communicator has a single rank.
 template<>
 inline void Communicate::allreduce(qmcplusplus::TinyVector<double, OHMMS_DIM>& g)
 {
   if (d_ncontexts != 1)
   {
     qmcplusplus::TinyVector<double, OHMMS_DIM> totals(g);
     MPI_Allreduce(g.begin(), totals.begin(), OHMMS_DIM, MPI_DOUBLE, MPI_SUM, myMPI);
     g = totals;
   }
 }

 /// Component-wise sum of a TinyVector<int, OHMMS_DIM> over all ranks of myMPI.
 /// Nothing is done when the communicator has a single rank.
 template<>
 inline void Communicate::allreduce(qmcplusplus::TinyVector<int, OHMMS_DIM>& g)
 {
   if (d_ncontexts != 1)
   {
     qmcplusplus::TinyVector<int, OHMMS_DIM> totals(g);
     MPI_Allreduce(g.begin(), totals.begin(), OHMMS_DIM, MPI_INT, MPI_SUM, myMPI);
     g = totals;
   }
 }

 /// Element-wise sum of a std::vector<int> over all ranks of myMPI; every rank
 /// receives the totals in g. Nothing is done when the communicator has a single rank.
 /// Buffers are taken with data() so an empty vector is never indexed.
 template<>
 inline void Communicate::allreduce(std::vector<int>& g)
 {
   if (d_ncontexts == 1)
     return;
   std::vector<int> gt(g.size(), 0);
   MPI_Allreduce(g.data(), gt.data(), static_cast<int>(g.size()), MPI_INT, MPI_SUM, myMPI);
   g = gt;
 }

 /// Element-wise sum of a std::vector<long> over all ranks of myMPI; every rank
 /// receives the totals in g. Nothing is done when the communicator has a single rank.
 /// Buffers are taken with data() so an empty vector is never indexed.
 template<>
 inline void Communicate::allreduce(std::vector<long>& g)
 {
   if (d_ncontexts == 1)
     return;
   std::vector<long> gt(g.size(), 0);
   MPI_Allreduce(g.data(), gt.data(), static_cast<int>(g.size()), MPI_LONG, MPI_SUM, myMPI);
   g = gt;
 }

 /// Element-wise sum of a std::vector<unsigned long> over all ranks of myMPI;
 /// every rank receives the totals in g. Nothing is done when the communicator
 /// has a single rank.
 /// Buffers are taken with data() so an empty vector is never indexed.
 template<>
 inline void Communicate::allreduce(std::vector<unsigned long>& g)
 {
   if (d_ncontexts == 1)
     return;
   std::vector<unsigned long> gt(g.size(), 0);
   MPI_Allreduce(g.data(), gt.data(), static_cast<int>(g.size()), MPI_UNSIGNED_LONG, MPI_SUM, myMPI);
   g = gt;
 }

 /// Element-wise sum of a std::vector<float> over all ranks of myMPI; every rank
 /// receives the totals in g.
 /// Returns early on a single-rank communicator, like the integer vector
 /// overloads (the sum over one rank is the input itself).
 /// Buffers are taken with data() so an empty vector is never indexed.
 template<>
 inline void Communicate::allreduce(std::vector<float>& g)
 {
   if (d_ncontexts == 1)
     return;
   std::vector<float> gt(g.size(), 0.0f);
   MPI_Allreduce(g.data(), gt.data(), static_cast<int>(g.size()), MPI_FLOAT, MPI_SUM, myMPI);
   g = gt;
 }

 /// Element-wise sum of a std::vector<double> over all ranks of myMPI; every rank
 /// receives the totals in g.
 /// Returns early on a single-rank communicator, like the integer vector
 /// overloads (the sum over one rank is the input itself).
 /// Buffers are taken with data() so an empty vector is never indexed.
 template<>
 inline void Communicate::allreduce(std::vector<double>& g)
 {
   if (d_ncontexts == 1)
     return;
   std::vector<double> gt(g.size(), 0.0);
   MPI_Allreduce(g.data(), gt.data(), static_cast<int>(g.size()), MPI_DOUBLE, MPI_SUM, myMPI);
   g = gt;
 }

 /// Element-wise sum of a std::vector<std::complex<float>> over all ranks of
 /// myMPI. Each complex value is reduced as two MPI_FLOAT values, hence the
 /// count of 2 * size.
 /// Returns early on a single-rank communicator, like the integer vector overloads.
 /// Buffers are taken with data() so an empty vector is never indexed.
 template<>
 inline void Communicate::allreduce(std::vector<std::complex<float>>& g)
 {
   if (d_ncontexts == 1)
     return;
   std::vector<std::complex<float>> gt(g.size(), std::complex<float>(0.0));
   MPI_Allreduce(g.data(), gt.data(), static_cast<int>(2 * g.size()), MPI_FLOAT, MPI_SUM, myMPI);
   g = gt;
 }

 /// Element-wise sum of a std::vector<std::complex<double>> over all ranks of
 /// myMPI. Each complex value is reduced as two MPI_DOUBLE values, hence the
 /// count of 2 * size.
 /// Returns early on a single-rank communicator, like the integer vector overloads.
 /// Buffers are taken with data() so an empty vector is never indexed.
 template<>
 inline void Communicate::allreduce(std::vector<std::complex<double>>& g)
 {
   if (d_ncontexts == 1)
     return;
   std::vector<std::complex<double>> gt(g.size(), std::complex<double>(0.0));
   MPI_Allreduce(g.data(), gt.data(), static_cast<int>(2 * g.size()), MPI_DOUBLE, MPI_SUM, myMPI);
   g = gt;
 }

 /// Element-wise sum of a PooledData<float> buffer over all ranks of myMPI;
 /// every rank receives the totals in g.
 template<>
 inline void Communicate::allreduce(PooledData<float>& g)
 {
   PooledData<float> totals(g.size());
   MPI_Allreduce(g.data(), totals.data(), g.size(), MPI_FLOAT, MPI_SUM, myMPI);
   g = totals;
 }

 /// Element-wise sum of a PooledData<double> buffer over all ranks of myMPI;
 /// every rank receives the totals in g.
 /// Uses data() for both buffers, matching the PooledData<float> overload,
 /// instead of indexing element 0.
 template<>
 inline void Communicate::allreduce(PooledData<double>& g)
 {
   PooledData<double> gt(g.size());
   MPI_Allreduce(g.data(), gt.data(), g.size(), MPI_DOUBLE, MPI_SUM, myMPI);
   g = gt;
 }

 /// Element-wise sum of a Matrix<float> over all ranks of myMPI; every rank
 /// receives the totals in g.
 template<>
 inline void Communicate::allreduce(qmcplusplus::Matrix<float>& g)
 {
   // Scratch receive buffer, seeded with the local values.
   std::vector<float> totals(g.size());
   std::copy(g.begin(), g.end(), totals.begin());
   float* const recv = &totals[0];
   MPI_Allreduce(g.data(), recv, g.size(), MPI_FLOAT, MPI_SUM, myMPI);
   // Write the reduced values back into the matrix storage.
   std::copy(totals.begin(), totals.end(), g.data());
 }

 /// Element-wise sum of a Matrix<double> over all ranks of myMPI; every rank
 /// receives the totals in g.
 /// std::copy is qualified explicitly, matching the Matrix<float> overload,
 /// instead of relying on argument-dependent lookup of an unqualified copy().
 template<>
 inline void Communicate::allreduce(qmcplusplus::Matrix<double>& g)
 {
   std::vector<double> gt(g.size());
   std::copy(g.begin(), g.end(), gt.begin());
   MPI_Allreduce(g.data(), gt.data(), g.size(), MPI_DOUBLE, MPI_SUM, myMPI);
   // Write the reduced values back into the matrix storage.
   std::copy(gt.begin(), gt.end(), g.data());
 }

 /// Element-wise sum of a std::vector<float> onto rank 0 of myMPI. Only rank 0
 /// (d_mycontext == 0) has g overwritten with the totals.
 /// Buffers are taken with data() so an empty vector is never indexed.
 template<>
 inline void Communicate::reduce(std::vector<float>& g)
 {
   std::vector<float> gt(g.size(), 0.0f);
   MPI_Reduce(g.data(), gt.data(), static_cast<int>(g.size()), MPI_FLOAT, MPI_SUM, 0, myMPI);
   if (!d_mycontext)
     g = gt;
 }

 /// Element-wise sum of a std::vector<double> onto rank 0 of myMPI. Only rank 0
 /// (d_mycontext == 0) has g overwritten with the totals.
 /// Buffers are taken with data() so an empty vector is never indexed.
 template<>
 inline void Communicate::reduce(std::vector<double>& g)
 {
   std::vector<double> gt(g.size(), 0.0);
   MPI_Reduce(g.data(), gt.data(), static_cast<int>(g.size()), MPI_DOUBLE, MPI_SUM, 0, myMPI);
   if (!d_mycontext)
     g = gt;
 }

 /// Element-wise sum of a std::vector<int> onto rank 0 of myMPI. Only rank 0
 /// (d_mycontext == 0) has g overwritten with the totals.
 /// The scratch buffer is filled with an integer 0 (previously the double
 /// literal 0.0), and buffers are taken with data() so an empty vector is
 /// never indexed.
 template<>
 inline void Communicate::reduce(std::vector<int>& g)
 {
   std::vector<int> gt(g.size(), 0);
   MPI_Reduce(g.data(), gt.data(), static_cast<int>(g.size()), MPI_INT, MPI_SUM, 0, myMPI);
   if (!d_mycontext)
     g = gt;
 }

 /// Element-wise sum of a std::vector<long> onto rank 0 of myMPI. Only rank 0
 /// (d_mycontext == 0) has g overwritten with the totals.
 /// The scratch buffer is filled with an integer 0 (previously the double
 /// literal 0.0), and buffers are taken with data() so an empty vector is
 /// never indexed.
 template<>
 inline void Communicate::reduce(std::vector<long>& g)
 {
   std::vector<long> gt(g.size(), 0L);
   MPI_Reduce(g.data(), gt.data(), static_cast<int>(g.size()), MPI_LONG, MPI_SUM, 0, myMPI);
   if (!d_mycontext)
     g = gt;
 }

 /// Sum n ints from g across myMPI into res on rank 0.
 template<>
 inline void Communicate::reduce(int* restrict g, int* restrict res, int n)
 {
   const int root = 0;
   MPI_Reduce(g, res, n, MPI_INT, MPI_SUM, root, myMPI);
 }

 /// Sum n doubles from g across myMPI into res on rank 0.
 template<>
 inline void Communicate::reduce(double* restrict g, double* restrict res, int n)
 {
   const int root = 0;
   MPI_Reduce(g, res, n, MPI_DOUBLE, MPI_SUM, root, myMPI);
 }

 /// Sum n doubles across myMPI onto rank 0 without a separate send buffer.
 /// Rank 0 passes MPI_IN_PLACE and receives into res; the other ranks send
 /// res and pass no receive buffer.
 template<>
 inline void Communicate::reduce_in_place(double* restrict res, int n)
 {
   const bool on_root = (d_mycontext == 0);
   if (on_root)
   {
     MPI_Reduce(MPI_IN_PLACE, res, n, MPI_DOUBLE, MPI_SUM, 0, myMPI);
   }
   else
   {
     MPI_Reduce(res, NULL, n, MPI_DOUBLE, MPI_SUM, 0, myMPI);
   }
 }

 /// Sum n floats across myMPI onto rank 0 without a separate send buffer.
 /// Rank 0 passes MPI_IN_PLACE and receives into res; the other ranks send
 /// res and pass no receive buffer.
 template<>
 inline void Communicate::reduce_in_place(float* restrict res, int n)
 {
   const bool on_root = (d_mycontext == 0);
   if (on_root)
   {
     MPI_Reduce(MPI_IN_PLACE, res, n, MPI_FLOAT, MPI_SUM, 0, myMPI);
   }
   else
   {
     MPI_Reduce(res, NULL, n, MPI_FLOAT, MPI_SUM, 0, myMPI);
   }
 }

 /// Broadcast a single int from rank 0 to every rank of myMPI.
 template<>
 inline void Communicate::bcast(int& g)
 {
   const int root = 0;
   MPI_Bcast(&g, 1, MPI_INT, root, myMPI);
 }

 /// Broadcast a single uint32_t (sent as MPI_UNSIGNED) from rank 0 to every rank of myMPI.
 template<>
 inline void Communicate::bcast(uint32_t& g)
 {
   const int root = 0;
   MPI_Bcast(&g, 1, MPI_UNSIGNED, root, myMPI);
 }

 /// Broadcast the elements of a std::vector<uint32_t> (sent as MPI_UNSIGNED)
 /// from rank 0 to every rank of myMPI. The vector is not resized here.
 /// The buffer is taken with data() so an empty vector is never indexed.
 template<>
 inline void Communicate::bcast(std::vector<uint32_t>& g)
 {
   MPI_Bcast(g.data(), static_cast<int>(g.size()), MPI_UNSIGNED, 0, myMPI);
 }


 /// Broadcast a single double from rank 0 to every rank of myMPI.
 template<>
 inline void Communicate::bcast(double& g)
 {
   const int root = 0;
   MPI_Bcast(&g, 1, MPI_DOUBLE, root, myMPI);
 }

 /// Broadcast a single float from rank 0 to every rank of myMPI.
 template<>
 inline void Communicate::bcast(float& g)
 {
   const int root = 0;
   MPI_Bcast(&g, 1, MPI_FLOAT, root, myMPI);
 }

 /// Broadcast a bool from rank 0 to every rank of myMPI. The flag is sent as
 /// an int (1 or 0) and converted back on return.
 template<>
 inline void Communicate::bcast(bool& g)
 {
   int as_int = 0;
   if (g)
     as_int = 1;
   MPI_Bcast(&as_int, 1, MPI_INT, 0, myMPI);
   g = (as_int != 0);
 }

 /// Broadcast the 2 components of a TinyVector<double, 2> from rank 0 over myMPI.
 template<>
 inline void Communicate::bcast(qmcplusplus::TinyVector<double, 2>& g)
 {
   const int num_components = 2;
   MPI_Bcast(g.begin(), num_components, MPI_DOUBLE, 0, myMPI);
 }

 /// Broadcast the 2 components of a TinyVector<int, 2> from rank 0 over myMPI.
 template<>
 inline void Communicate::bcast(qmcplusplus::TinyVector<int, 2>& g)
 {
   const int num_components = 2;
   MPI_Bcast(g.begin(), num_components, MPI_INT, 0, myMPI);
 }

 /// Broadcast the 3 components of a TinyVector<int, 3> from rank 0 over myMPI.
 template<>
 inline void Communicate::bcast(qmcplusplus::TinyVector<int, 3>& g)
 {
   const int num_components = 3;
   MPI_Bcast(g.begin(), num_components, MPI_INT, 0, myMPI);
 }

 /// Broadcast a std::vector of TinyVector<int, 3> from rank 0 over myMPI as
 /// 3 * size ints. The vector is not resized here.
 /// An empty vector is passed as a null buffer with count 0 instead of
 /// indexing element 0.
 template<>
 inline void Communicate::bcast(std::vector<qmcplusplus::TinyVector<int, 3>>& g)
 {
   int* first = g.empty() ? nullptr : &g[0][0];
   MPI_Bcast(first, static_cast<int>(3 * g.size()), MPI_INT, 0, myMPI);
 }

 /// Broadcast the 3 components of a TinyVector<double, 3> from rank 0 over myMPI.
 template<>
 inline void Communicate::bcast(qmcplusplus::TinyVector<double, 3>& g)
 {
   const int num_components = 3;
   MPI_Bcast(g.begin(), num_components, MPI_DOUBLE, 0, myMPI);
 }

 /// Broadcast the 3 components of a TinyVector<float, 3> from rank 0 over myMPI.
 template<>
 inline void Communicate::bcast(qmcplusplus::TinyVector<float, 3>& g)
 {
   const int num_components = 3;
   MPI_Bcast(g.begin(), num_components, MPI_FLOAT, 0, myMPI);
 }

 /// Broadcast the 4 components of a TinyVector<double, 4> from rank 0 over myMPI.
 template<>
 inline void Communicate::bcast(qmcplusplus::TinyVector<double, 4>& g)
 {
   const int num_components = 4;
   MPI_Bcast(g.begin(), num_components, MPI_DOUBLE, 0, myMPI);
 }

 /// Broadcast the 9 entries of a Tensor<double, 3> from rank 0 over myMPI.
 template<>
 inline void Communicate::bcast(qmcplusplus::Tensor<double, 3>& g)
 {
   const int num_entries = 9;
   MPI_Bcast(&(g[0]), num_entries, MPI_DOUBLE, 0, myMPI);
 }

 /// Broadcast the 9 entries of a Tensor<float, 3> from rank 0 over myMPI.
 template<>
 inline void Communicate::bcast(qmcplusplus::Tensor<float, 3>& g)
 {
   const int num_entries = 9;
   MPI_Bcast(&(g[0]), num_entries, MPI_FLOAT, 0, myMPI);
 }

 /// Broadcast the elements of a Vector<double> from rank 0 over myMPI.
 /// The vector is not resized here.
 template<>
 inline void Communicate::bcast(qmcplusplus::Vector<double>& g)
 {
   const int num_values = static_cast<int>(g.size());
   MPI_Bcast(&(g[0]), num_values, MPI_DOUBLE, 0, myMPI);
 }

 /// Broadcast the elements of a Vector<float> from rank 0 over myMPI.
 /// The vector is not resized here.
 template<>
 inline void Communicate::bcast(qmcplusplus::Vector<float>& g)
 {
   const int num_values = static_cast<int>(g.size());
   MPI_Bcast(&(g[0]), num_values, MPI_FLOAT, 0, myMPI);
 }

 /// Broadcast a Vector<std::complex<double>> from rank 0 over myMPI; each
 /// element is sent as two MPI_DOUBLE values.
 template<>
 inline void Communicate::bcast(qmcplusplus::Vector<std::complex<double>>& g)
 {
   const int num_values = static_cast<int>(2 * g.size());
   MPI_Bcast(&(g[0]), num_values, MPI_DOUBLE, 0, myMPI);
 }

 /// Broadcast a Vector<std::complex<float>> from rank 0 over myMPI; each
 /// element is sent as two MPI_FLOAT values.
 template<>
 inline void Communicate::bcast(qmcplusplus::Vector<std::complex<float>>& g)
 {
   const int num_values = static_cast<int>(2 * g.size());
   MPI_Bcast(&(g[0]), num_values, MPI_FLOAT, 0, myMPI);
 }

 /// Broadcast the elements of a Vector<int> from rank 0 over myMPI.
 /// The vector is not resized here.
 template<>
 inline void Communicate::bcast(qmcplusplus::Vector<int>& g)
 {
   const int num_values = static_cast<int>(g.size());
   MPI_Bcast(&(g[0]), num_values, MPI_INT, 0, myMPI);
 }


 /// Broadcast a Vector of TinyVector<double, 2> from rank 0 over myMPI as
 /// 2 * size doubles.
 template<>
 inline void Communicate::bcast(qmcplusplus::Vector<qmcplusplus::TinyVector<double, 2>>& g)
 {
   const int num_values = static_cast<int>(2 * g.size());
   MPI_Bcast(&(g[0]), num_values, MPI_DOUBLE, 0, myMPI);
 }

 /// Broadcast a Vector of TinyVector<double, 3> from rank 0 over myMPI as
 /// 3 * size doubles.
 template<>
 inline void Communicate::bcast(qmcplusplus::Vector<qmcplusplus::TinyVector<double, 3>>& g)
 {
   const int num_values = static_cast<int>(3 * g.size());
   MPI_Bcast(&(g[0]), num_values, MPI_DOUBLE, 0, myMPI);
 }

 /// Broadcast a Vector of TinyVector<float, 3> from rank 0 over myMPI as
 /// 3 * size floats.
 template<>
 inline void Communicate::bcast(qmcplusplus::Vector<qmcplusplus::TinyVector<float, 3>>& g)
 {
   const int num_values = static_cast<int>(3 * g.size());
   MPI_Bcast(&(g[0]), num_values, MPI_FLOAT, 0, myMPI);
 }

 /// Broadcast all elements of an Array<double, 3> from rank 0 over myMPI.
 template<>
 inline void Communicate::bcast(Array<double, 3>& g)
 {
   const int num_values = static_cast<int>(g.size());
   MPI_Bcast(g.data(), num_values, MPI_DOUBLE, 0, myMPI);
 }

 /// Broadcast all elements of an Array<float, 3> from rank 0 over myMPI.
 template<>
 inline void Communicate::bcast(Array<float, 3>& g)
 {
   const int num_values = static_cast<int>(g.size());
   MPI_Bcast(g.data(), num_values, MPI_FLOAT, 0, myMPI);
 }

 /// Broadcast all elements of an Array<int, 1> from rank 0 over myMPI.
 template<>
 inline void Communicate::bcast(Array<int, 1>& g)
 {
   const int num_values = static_cast<int>(g.size());
   MPI_Bcast(g.data(), num_values, MPI_INT, 0, myMPI);
 }


 /// Broadcast an Array<std::complex<double>, 1> from rank 0 over myMPI; each
 /// element is sent as two MPI_DOUBLE values.
 template<>
 inline void Communicate::bcast(Array<std::complex<double>, 1>& g)
 {
   const int num_values = static_cast<int>(2 * g.size());
   MPI_Bcast(g.data(), num_values, MPI_DOUBLE, 0, myMPI);
 }


 /// Broadcast an Array<std::complex<double>, 2> from rank 0 over myMPI; each
 /// element is sent as two MPI_DOUBLE values.
 template<>
 inline void Communicate::bcast(Array<std::complex<double>, 2>& g)
 {
   const int num_values = static_cast<int>(2 * g.size());
   MPI_Bcast(g.data(), num_values, MPI_DOUBLE, 0, myMPI);
 }

 /// Broadcast an Array<std::complex<double>, 3> from rank 0 over myMPI; each
 /// element is sent as two MPI_DOUBLE values.
 template<>
 inline void Communicate::bcast(Array<std::complex<double>, 3>& g)
 {
   const int num_values = static_cast<int>(2 * g.size());
   MPI_Bcast(g.data(), num_values, MPI_DOUBLE, 0, myMPI);
 }

 /// Broadcast an Array<std::complex<float>, 3> from rank 0 over myMPI; each
 /// element is sent as two MPI_FLOAT values.
 template<>
 inline void Communicate::bcast(Array<std::complex<float>, 3>& g)
 {
   const int num_values = static_cast<int>(2 * g.size());
   MPI_Bcast(g.data(), num_values, MPI_FLOAT, 0, myMPI);
 }


 /// Broadcast the elements of a std::vector<double> from rank 0 over myMPI.
 /// The vector is not resized here.
 /// The buffer is taken with data() so an empty vector is never indexed.
 template<>
 inline void Communicate::bcast(std::vector<double>& g)
 {
   MPI_Bcast(g.data(), static_cast<int>(g.size()), MPI_DOUBLE, 0, myMPI);
 }

 /// Broadcast a std::vector<std::complex<double>> from rank 0 over myMPI; each
 /// element is sent as two MPI_DOUBLE values. The vector is not resized here.
 /// The buffer is taken with data() so an empty vector is never indexed.
 template<>
 inline void Communicate::bcast(std::vector<std::complex<double>>& g)
 {
   MPI_Bcast(g.data(), static_cast<int>(2 * g.size()), MPI_DOUBLE, 0, myMPI);
 }

 /// Broadcast a std::vector<std::complex<float>> from rank 0 over myMPI; each
 /// element is sent as two MPI_FLOAT values. The vector is not resized here.
 /// The buffer is taken with data() so an empty vector is never indexed.
 template<>
 inline void Communicate::bcast(std::vector<std::complex<float>>& g)
 {
   MPI_Bcast(g.data(), static_cast<int>(2 * g.size()), MPI_FLOAT, 0, myMPI);
 }

 /// Broadcast the elements of a std::vector<float> from rank 0 over myMPI.
 /// The vector is not resized here.
 /// The buffer is taken with data() so an empty vector is never indexed.
 template<>
 inline void Communicate::bcast(std::vector<float>& g)
 {
   MPI_Bcast(g.data(), static_cast<int>(g.size()), MPI_FLOAT, 0, myMPI);
 }

 /// Broadcast the contents of a PooledData<double> buffer from rank 0 over myMPI.
 template<>
 inline void Communicate::bcast(PooledData<double>& g)
 {
   const int num_values = static_cast<int>(g.size());
   MPI_Bcast(g.data(), num_values, MPI_DOUBLE, 0, myMPI);
 }

 /// Broadcast the contents of a PooledData<float> buffer from rank 0 over myMPI.
 template<>
 inline void Communicate::bcast(PooledData<float>& g)
 {
   const int num_values = static_cast<int>(g.size());
   MPI_Bcast(g.data(), num_values, MPI_FLOAT, 0, myMPI);
 }

 /// Broadcast the contents of a PooledData<int> buffer from rank 0 over myMPI.
 template<>
 inline void Communicate::bcast(PooledData<int>& g)
 {
   const int num_values = static_cast<int>(g.size());
   MPI_Bcast(g.data(), num_values, MPI_INT, 0, myMPI);
 }

 /// Broadcast a std::vector of TinyVector<double, 2> from rank 0 over myMPI as
 /// 2 * size doubles. The vector is not resized here.
 /// An empty vector is passed as a null buffer with count 0 instead of
 /// indexing element 0.
 template<>
 inline void Communicate::bcast(std::vector<qmcplusplus::TinyVector<double, 2>>& g)
 {
   double* first = g.empty() ? nullptr : &(g[0][0]);
   MPI_Bcast(first, static_cast<int>(2 * g.size()), MPI_DOUBLE, 0, myMPI);
 }

 /// Broadcast a std::vector of TinyVector<double, 3> from rank 0 over myMPI as
 /// 3 * size doubles. The vector is not resized here.
 /// An empty vector is passed as a null buffer with count 0 instead of
 /// indexing element 0.
 template<>
 inline void Communicate::bcast(std::vector<qmcplusplus::TinyVector<double, 3>>& g)
 {
   double* first = g.empty() ? nullptr : &(g[0][0]);
   MPI_Bcast(first, static_cast<int>(3 * g.size()), MPI_DOUBLE, 0, myMPI);
 }

 /// Broadcast a std::vector of TinyVector<float, 3> from rank 0 over myMPI as
 /// 3 * size floats. The vector is not resized here.
 /// An empty vector is passed as a null buffer with count 0 instead of
 /// indexing element 0.
 template<>
 inline void Communicate::bcast(std::vector<qmcplusplus::TinyVector<float, 3>>& g)
 {
   float* first = g.empty() ? nullptr : &(g[0][0]);
   MPI_Bcast(first, static_cast<int>(3 * g.size()), MPI_FLOAT, 0, myMPI);
 }

 /// Broadcast the elements of a std::vector<int> from rank 0 over myMPI.
 /// The vector is not resized here.
 /// The buffer is taken with data() so an empty vector is never indexed.
 template<>
 inline void Communicate::bcast(std::vector<int>& g)
 {
   MPI_Bcast(g.data(), static_cast<int>(g.size()), MPI_INT, 0, myMPI);
 }

 /// Broadcast a std::vector<bool> from rank 0 over myMPI. The flags are copied
 /// into a temporary std::vector<int> (1 or 0), broadcast as MPI_INT, and
 /// converted back. The vector is not resized here.
 /// Loop indices use the container's size_type (no signed/unsigned comparison)
 /// and the buffer is taken with data() so an empty vector is never indexed.
 template<>
 inline void Communicate::bcast(std::vector<bool>& g)
 {
   typedef std::vector<bool>::size_type size_type;
   const size_type num_flags = g.size();
   std::vector<int> intVec(num_flags);
   for (size_type i = 0; i < num_flags; ++i)
     intVec[i] = g[i] ? 1 : 0;
   MPI_Bcast(intVec.data(), static_cast<int>(num_flags), MPI_INT, 0, myMPI);
   for (size_type i = 0; i < num_flags; ++i)
     g[i] = intVec[i] != 0;
 }

 /// Broadcast n doubles starting at x from rank 0 over myMPI.
 template<>
 inline void Communicate::bcast(double* restrict x, int n)
 {
   const int root = 0;
   MPI_Bcast(x, n, MPI_DOUBLE, root, myMPI);
 }

 /// Broadcast n complex<double> values starting at x from rank 0 over myMPI;
 /// they are sent as 2 * n MPI_DOUBLE values.
 template<>
 inline void Communicate::bcast(std::complex<double>* restrict x, int n)
 {
   const int num_reals = 2 * n;
   MPI_Bcast(x, num_reals, MPI_DOUBLE, 0, myMPI);
 }

 /// Broadcast n floats starting at x from rank 0 over myMPI.
 template<>
 inline void Communicate::bcast(float* restrict x, int n)
 {
   const int root = 0;
   MPI_Bcast(x, n, MPI_FLOAT, root, myMPI);
 }

 /// Broadcast n complex<float> values starting at x from rank 0 over myMPI;
 /// they are sent as 2 * n MPI_FLOAT values.
 template<>
 inline void Communicate::bcast(std::complex<float>* restrict x, int n)
 {
   const int num_reals = 2 * n;
   MPI_Bcast(x, num_reals, MPI_FLOAT, 0, myMPI);
 }

 /// Broadcast n ints starting at x from rank 0 over myMPI.
 template<>
 inline void Communicate::bcast(int* restrict x, int n)
 {
   const int root = 0;
   MPI_Bcast(x, n, MPI_INT, root, myMPI);
 }

 /// Broadcast n chars starting at x from rank 0 over myMPI.
 template<>
 inline void Communicate::bcast(char* restrict x, int n)
 {
   const int root = 0;
   MPI_Bcast(x, n, MPI_CHAR, root, myMPI);
 }

 /// Broadcast a std::string from rank 0. The length is broadcast first so that
 /// the other ranks can resize g before the characters are broadcast.
 template<>
 inline void Communicate::bcast(std::string& g)
 {
   // Step 1: agree on the length (rank 0's value wins).
   int num_chars = g.size();
   bcast(num_chars);
   // Step 2: ranks other than 0 make room for the incoming characters.
   const bool on_root = (rank() == 0);
   if (!on_root)
     g.resize(num_chars);
   // Step 3: send the characters through the char* overload.
   bcast(&g[0], g.size());
 }

 /// Blocking send of all elements of g to rank dest with the given tag over myMPI.
 /// The buffer is taken with data() so an empty vector is never indexed.
 template<>
 inline void Communicate::send(int dest, int tag, std::vector<double>& g)
 {
   MPI_Send(g.data(), static_cast<int>(g.size()), MPI_DOUBLE, dest, tag, myMPI);
 }

 /// Non-blocking send of all elements of g to rank dest with the given tag
 /// over myMPI. Returns the request handle filled in by MPI_Isend.
 /// The buffer is taken with data() so an empty vector is never indexed.
 template<>
 inline Communicate::request Communicate::isend(int dest, int tag, std::vector<double>& g)
 {
   request r;
   MPI_Isend(g.data(), static_cast<int>(g.size()), MPI_DOUBLE, dest, tag, myMPI, &r);
   return r;
 }

 /// Non-blocking receive of g.size() doubles from rank source with the given
 /// tag over myMPI. Returns the request handle filled in by MPI_Irecv.
 /// The buffer is taken with data() so an empty vector is never indexed.
 template<>
 inline Communicate::request Communicate::irecv(int source, int tag, std::vector<double>& g)
 {
   request r;
   MPI_Irecv(g.data(), static_cast<int>(g.size()), MPI_DOUBLE, source, tag, myMPI, &r);
   return r;
 }

 /// Gather variable-length char chunks: each rank contributes all of l, and
 /// rank dest receives them into g using the per-rank counts and displ arrays.
 /// Buffers are taken with data(), so vectors that are empty (e.g. g on ranks
 /// other than dest) are never indexed. The unused ierr local was removed.
 template<>
 inline void Communicate::gatherv(std::vector<char>& l,
                                  std::vector<char>& g,
                                  std::vector<int>& counts,
                                  std::vector<int>& displ,
                                  int dest)
 {
   MPI_Gatherv(l.data(), static_cast<int>(l.size()), MPI_CHAR, g.data(), counts.data(), displ.data(), MPI_CHAR, dest,
               myMPI);
 }


 /// Gather variable-length double chunks: each rank contributes all of l, and
 /// rank dest receives them into g using the per-rank counts and displ arrays.
 /// Buffers are taken with data(), so vectors that are empty (e.g. g on ranks
 /// other than dest) are never indexed. The unused ierr local was removed.
 template<>
 inline void Communicate::gatherv(std::vector<double>& l,
                                  std::vector<double>& g,
                                  std::vector<int>& counts,
                                  std::vector<int>& displ,
                                  int dest)
 {
   MPI_Gatherv(l.data(), static_cast<int>(l.size()), MPI_DOUBLE, g.data(), counts.data(), displ.data(), MPI_DOUBLE,
               dest, myMPI);
 }

 /// Gather variable-length float chunks: each rank contributes all of l, and
 /// rank dest receives them into g using the per-rank counts and displ arrays.
 /// Buffers are taken with data(), so vectors that are empty (e.g. g on ranks
 /// other than dest) are never indexed. The unused ierr local was removed.
 template<>
 inline void Communicate::gatherv(std::vector<float>& l,
                                  std::vector<float>& g,
                                  std::vector<int>& counts,
                                  std::vector<int>& displ,
                                  int dest)
 {
   MPI_Gatherv(l.data(), static_cast<int>(l.size()), MPI_FLOAT, g.data(), counts.data(), displ.data(), MPI_FLOAT, dest,
               myMPI);
 }

 /// Gather variable-length int chunks: each rank contributes all of l, and
 /// rank dest receives them into g using the per-rank counts and displ arrays.
 /// Buffers are taken with data(), so vectors that are empty (e.g. g on ranks
 /// other than dest) are never indexed. The unused ierr local was removed.
 template<>
 inline void Communicate::gatherv(std::vector<int>& l,
                                  std::vector<int>& g,
                                  std::vector<int>& counts,
                                  std::vector<int>& displ,
                                  int dest)
 {
   MPI_Gatherv(l.data(), static_cast<int>(l.size()), MPI_INT, g.data(), counts.data(), displ.data(), MPI_INT, dest,
               myMPI);
 }

 /// Allgather over myMPI: every rank contributes count chars from sb and
 /// receives count chars per rank into rb.
 /// Buffers are taken with data() so an empty vector is never indexed.
 template<>
 inline void Communicate::allgather(std::vector<char>& sb, std::vector<char>& rb, int count)
 {
   MPI_Allgather(sb.data(), count, MPI_CHAR, rb.data(), count, MPI_CHAR, myMPI);
 }

 /// Allgather over myMPI: every rank contributes count ints from sb and
 /// receives count ints per rank into rb.
 /// Buffers are taken with data() so an empty vector is never indexed.
 template<>
 inline void Communicate::allgather(std::vector<int>& sb, std::vector<int>& rb, int count)
 {
   MPI_Allgather(sb.data(), count, MPI_INT, rb.data(), count, MPI_INT, myMPI);
 }


 /// Variable-length allgather of ints over myMPI: each rank contributes all of
 /// l and every rank receives the pieces into g using counts and displ.
 /// Buffers are taken with data() so an empty vector is never indexed.
 /// The unused ierr local was removed.
 template<>
 inline void Communicate::allgatherv(std::vector<int>& l,
                                     std::vector<int>& g,
                                     std::vector<int>& counts,
                                     std::vector<int>& displ)
 {
   MPI_Allgatherv(l.data(), static_cast<int>(l.size()), MPI_INT, g.data(), counts.data(), displ.data(), MPI_INT, myMPI);
 }

 /// Gather variable-length long chunks: each rank contributes all of l, and
 /// rank dest receives them into g using the per-rank counts and displ arrays.
 /// Buffers are taken with data(), so vectors that are empty (e.g. g on ranks
 /// other than dest) are never indexed. The unused ierr local was removed.
 template<>
 inline void Communicate::gatherv(std::vector<long>& l,
                                  std::vector<long>& g,
                                  std::vector<int>& counts,
                                  std::vector<int>& displ,
                                  int dest)
 {
   MPI_Gatherv(l.data(), static_cast<int>(l.size()), MPI_LONG, g.data(), counts.data(), displ.data(), MPI_LONG, dest,
               myMPI);
 }

 /// Gather equal-sized double chunks: each rank sends l.size() values from l,
 /// and rank dest receives l.size() values per rank into g.
 /// Buffers are taken with data(), so an empty g (e.g. on ranks other than
 /// dest) is never indexed. The unused ierr local was removed.
 template<>
 inline void Communicate::gather(std::vector<double>& l, std::vector<double>& g, int dest)
 {
   const int chunk = static_cast<int>(l.size());
   MPI_Gather(l.data(), chunk, MPI_DOUBLE, g.data(), chunk, MPI_DOUBLE, dest, myMPI);
 }

 /// Gather equal-sized char chunks: each rank sends l.size() values from l,
 /// and rank dest receives l.size() values per rank into g.
 /// Buffers are taken with data(), so an empty g (e.g. on ranks other than
 /// dest) is never indexed. The unused ierr local was removed.
 template<>
 inline void Communicate::gather(std::vector<char>& l, std::vector<char>& g, int dest)
 {
   const int chunk = static_cast<int>(l.size());
   MPI_Gather(l.data(), chunk, MPI_CHAR, g.data(), chunk, MPI_CHAR, dest, myMPI);
 }

 /// Gather equal-sized int chunks: each rank sends l.size() values from l,
 /// and rank dest receives l.size() values per rank into g.
 /// Buffers are taken with data(), so an empty g (e.g. on ranks other than
 /// dest) is never indexed. The unused ierr local was removed.
 template<>
 inline void Communicate::gather(std::vector<int>& l, std::vector<int>& g, int dest)
 {
   const int chunk = static_cast<int>(l.size());
   MPI_Gather(l.data(), chunk, MPI_INT, g.data(), chunk, MPI_INT, dest, myMPI);
 }

 /// Gather variable-length PooledData<double> chunks: each rank contributes
 /// all of l, and rank dest receives them into g using counts and displ.
 /// counts/displ are taken with data() so empty vectors are never indexed.
 /// The unused ierr local was removed.
 template<>
 inline void Communicate::gatherv(PooledData<double>& l,
                                  PooledData<double>& g,
                                  std::vector<int>& counts,
                                  std::vector<int>& displ,
                                  int dest)
 {
   MPI_Gatherv(l.data(), l.size(), MPI_DOUBLE, g.data(), counts.data(), displ.data(), MPI_DOUBLE, dest, myMPI);
 }

 /// Gather equal-sized PooledData<double> chunks: each rank sends l.size()
 /// values from l, and rank dest receives l.size() values per rank into g.
 /// The unused ierr local was removed.
 template<>
 inline void Communicate::gather(PooledData<double>& l, PooledData<double>& g, int dest)
 {
   MPI_Gather(l.data(), l.size(), MPI_DOUBLE, g.data(), l.size(), MPI_DOUBLE, dest, myMPI);
 }

 /// Element-wise sum of a std::vector<int> over all ranks of myMPI; every rank
 /// receives the totals in g.
 /// The scratch buffer is filled with an integer 0 (previously the double
 /// literal 0.0), and buffers are taken with data() so an empty vector is
 /// never indexed.
 template<>
 inline void Communicate::gsum(std::vector<int>& g)
 {
   std::vector<int> gt(g.size(), 0);
   MPI_Allreduce(g.data(), gt.data(), static_cast<int>(g.size()), MPI_INT, MPI_SUM, myMPI);
   g = gt;
 }

 /// Element-wise sum of a std::vector<double> over all ranks of myMPI; every
 /// rank receives the totals in g.
 /// Buffers are taken with data() so an empty vector is never indexed.
 template<>
 inline void Communicate::gsum(std::vector<double>& g)
 {
   std::vector<double> gt(g.size(), 0.0);
   MPI_Allreduce(g.data(), gt.data(), static_cast<int>(g.size()), MPI_DOUBLE, MPI_SUM, myMPI);
   g = gt;
 }

 /// Element-wise sum of a std::vector<std::complex<double>> over all ranks of
 /// MPI_COMM_WORLD; each element is reduced as two MPI_DOUBLE values.
 /// The gid argument is not used.
 /// Buffers are taken with data() so an empty vector is never indexed.
 template<>
 inline void gsum(std::vector<std::complex<double>>& g, int gid)
 {
   std::vector<std::complex<double>> gt(g.size(), 0.0);
   MPI_Allreduce(g.data(), gt.data(), static_cast<int>(2 * g.size()), MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
   g = gt;
 }

 /// Element-wise sum of a std::vector<std::complex<double>> over all ranks of
 /// myMPI; each element is reduced as two MPI_DOUBLE values.
 /// Buffers are taken with data() so an empty vector is never indexed.
 template<>
 inline void Communicate::gsum(std::vector<std::complex<double>>& g)
 {
   std::vector<std::complex<double>> gt(g.size(), 0.0);
   MPI_Allreduce(g.data(), gt.data(), static_cast<int>(2 * g.size()), MPI_DOUBLE, MPI_SUM, myMPI);
   g = gt;
 }

 /// Gather variable-length char chunks from raw buffers: each rank sends n
 /// chars from l, and rank dest receives them into g using counts and displ.
 /// counts/displ are taken with data() so empty vectors are never indexed.
 /// The unused ierr local was removed.
 template<>
 inline void Communicate::gatherv(char* l, char* g, int n, std::vector<int>& counts, std::vector<int>& displ, int dest)
 {
   MPI_Gatherv(l, n, MPI_CHAR, g, counts.data(), displ.data(), MPI_CHAR, dest, myMPI);
 }

 /// Allgather over myMPI from raw buffers: every rank contributes count chars
 /// from sb and receives count chars per rank into rb.
 template<>
 inline void Communicate::allgather(char* sb, char* rb, int count)
 {
   const int per_rank = count;
   MPI_Allgather(sb, per_rank, MPI_CHAR, rb, per_rank, MPI_CHAR, myMPI);
 }

 /// Scatter variable-length char chunks from rank source: sb is split
 /// according to counts and displ, and each rank receives rb.size() chars into rb.
 /// Buffers are taken with data(), so vectors that are empty (e.g. sb on
 /// ranks other than source) are never indexed. The unused ierr local was removed.
 template<>
 inline void Communicate::scatterv(std::vector<char>& sb,
                                   std::vector<char>& rb,
                                   std::vector<int>& counts,
                                   std::vector<int>& displ,
                                   int source)
 {
   MPI_Scatterv(sb.data(), counts.data(), displ.data(), MPI_CHAR, rb.data(), static_cast<int>(rb.size()), MPI_CHAR,
                source, myMPI);
 }

 /// In-place gatherv into buf on rank dest.
 /// The root passes MPI_IN_PLACE and receives every rank's chunk into buf.
 /// Every other rank sends counts[rank] elements starting at buf + displ[rank].
 ///
 /// The root is identified by comparing d_mycontext with dest. The previous
 /// test (!d_mycontext) treated rank 0 as the root even when dest was not 0,
 /// which handed MPI_IN_PLACE to a non-root rank and a null receive buffer
 /// to the real root. Behaviour for dest == 0 is unchanged.
 template<typename T, typename TMPI, typename IT>
 inline void Communicate::gatherv_in_place(T* buf, TMPI& datatype, IT& counts, IT& displ, int dest)
 {
   if (d_mycontext == dest)
     MPI_Gatherv(MPI_IN_PLACE, 0, datatype, buf, counts.data(), displ.data(), datatype, dest, myMPI);
   else
     MPI_Gatherv(buf + displ[d_mycontext], counts[d_mycontext], datatype, nullptr, counts.data(), displ.data(),
                 datatype, dest, myMPI);
 }

 /// Element-wise sum of a Matrix<std::complex<double>> over all ranks of myMPI;
 /// each element is reduced as two MPI_DOUBLE values.
 template<>
 inline void Communicate::allreduce(qmcplusplus::Matrix<std::complex<double>>& g)
 {
   // Scratch receive buffer, seeded with the local values.
   std::vector<std::complex<double>> totals(g.size());
   std::copy(g.begin(), g.end(), totals.begin());
   std::complex<double>* const recv = &totals[0];
   MPI_Allreduce(g.data(), recv, 2 * g.size(), MPI_DOUBLE, MPI_SUM, myMPI);
   // Write the reduced values back into the matrix storage.
   std::copy(totals.begin(), totals.end(), g.data());
 }

 /// Element-wise sum of a Matrix<std::complex<float>> over all ranks of myMPI;
 /// each element is reduced as two MPI_FLOAT values.
 template<>
 inline void Communicate::allreduce(qmcplusplus::Matrix<std::complex<float>>& g)
 {
   // Scratch receive buffer, seeded with the local values.
   std::vector<std::complex<float>> totals(g.size());
   std::copy(g.begin(), g.end(), totals.begin());
   std::complex<float>* const recv = &totals[0];
   MPI_Allreduce(g.data(), recv, 2 * g.size(), MPI_FLOAT, MPI_SUM, myMPI);
   // Write the reduced values back into the matrix storage.
   std::copy(totals.begin(), totals.end(), g.data());
 }

 /// Broadcast one std::complex<double> from rank 0 over myMPI as two MPI_DOUBLE values.
 template<>
 inline void Communicate::bcast(std::complex<double>& g)
 {
   const int num_reals = 2;
   MPI_Bcast(&g, num_reals, MPI_DOUBLE, 0, myMPI);
 }

 /// Broadcast one std::complex<float> from rank 0 over myMPI as two MPI_FLOAT values.
 template<>
 inline void Communicate::bcast(std::complex<float>& g)
 {
   const int num_reals = 2;
   MPI_Bcast(&g, num_reals, MPI_FLOAT, 0, myMPI);
 }

 #endif
qmcplusplus::Matrix::begin
Container_t::iterator begin()
Definition: OhmmsMatrix.h:89

Communicate::isend
request isend(int dest, int tag, T &)
Definition: CommOperatorsMPI.h:108

qmcplusplus::TinyVector
Fixed-size array.
Definition: OhmmsTinyMeta.h:30

PooledData::size
size_type size() const
return the size of the data
Definition: PooledData.h:48

Communicate::irecv
request irecv(int source, int tag, T &)
Definition: CommOperatorsMPI.h:101

Communicate::reduce
void reduce(T &)
Definition: CommOperatorsMPI.h:35

Communicate::rank
int rank() const
return the rank
Definition: Communicate.h:116

Communicate::send
void send(int dest, int tag, T &)
Definition: CommOperatorsMPI.h:65

PooledData::data
T * data()
return the address of the first element
Definition: PooledData.h:212

gsum
void gsum(T &, int)
dummy declarations to be specialized
Definition: CommOperatorsMPI.h:23

Communicate::gatherv
void gatherv(T &sb, T &rb, IT &counts, IT &displ, int dest=0)
Definition: CommOperatorsMPI.h:83

Communicate::d_mycontext
int d_mycontext
Rank.
Definition: Communicate.h:218

Array::data
Type_t * data()
Definition: OhmmsArray.h:87

Communicate::myMPI
mpi_comm_type myMPI
Raw communicator.
Definition: Communicate.h:214

qmcplusplus::Vector
Definition: OhmmsVector.h:33

OHMMS_DIM
#define OHMMS_DIM
Definition: config.h:64

copy
void copy(const Array< T1, 3 > &src, Array< T2, 3 > &dest)
Definition: Blitz.h:639

Communicate::allreduce
void allreduce(T &)
Definition: CommOperatorsMPI.h:29

qmcplusplus::Matrix::size
size_type size() const
Definition: OhmmsMatrix.h:76

qmcplusplus::Vector::size
size_type size() const
return the current size
Definition: OhmmsVector.h:162

qmcplusplus::Tensor< double, 3 >

Communicate::allgather
void allgather(T &sb, T &rb, int count)
Definition: CommOperatorsMPI.h:77

Communicate::d_ncontexts
int d_ncontexts
Size.
Definition: Communicate.h:220

qmcplusplus::TinyVector::begin
Type_t * begin()
Definition: TinyVector.h:140

Communicate::gather
void gather(T &sb, T &rb, int dest=0)
Definition: CommOperatorsMPI.h:71

Array::size
size_t size() const
Definition: OhmmsArray.h:57

Communicate::gsum
void gsum(T &)
Definition: CommOperatorsMPI.h:141

Communicate::gatherv_in_place
void gatherv_in_place(T *buf, TMPI &datatype, IT &counts, IT &displ, int dest=0)
Definition: CommOperatorsMPI.h:940

Communicate::scatter
void scatter(T &sb, T &rb, int dest=0)
Definition: CommOperatorsMPI.h:89

qmcplusplus::n
int n
Definition: test_cuBLAS_LU.cpp:216

CommunicatorTraits::request
int request
Definition: Communicate.h:45

qmcplusplus::Matrix< double >

Communicate::reduce_in_place
void reduce_in_place(T *restrict, int n)
Definition: CommOperatorsMPI.h:47

CommunicatorTraits::MPI_REQUEST_NULL
static const int MPI_REQUEST_NULL
Definition: Communicate.h:47

Communicate::bcast
void bcast(T &)
Definition: CommOperatorsMPI.h:53

qmcplusplus::Matrix::data
pointer data()
Definition: OhmmsMatrix.h:182

qmcplusplus::Units::force::N
const real N
Definition: unit_conversion.h:92

Array< double, 3 >

PooledData
Definition: PooledData.h:30

qmcplusplus::Matrix::end
Container_t::iterator end()
Definition: OhmmsMatrix.h:90

PooledData.h
Define a serialized buffer to store anonymous data.

Communicate::allgatherv
void allgatherv(T &sb, T &rb, IT &counts, IT &displ)

Communicate::scatterv
void scatterv(T &sb, T &rb, IT &counts, IT &displ, int source=0)
Definition: CommOperatorsMPI.h:95