Manuals/CHOMBO-RELEASE-3.2/SPMDI_8H_source.html

 #ifdef CH_LANG_CC
 /*
  *      _______              __
  *     / ___/ /  ___  __ _  / /  ___
  *    / /__/ _ \/ _ \/  V \/ _ \/ _ \
  *    \___/_//_/\___/_/_/_/_.__/\___/
  *    Please refer to Copyright.txt, in Chombo's root directory.
  */
 #endif

 #ifndef _SPMDI_H_
 #define _SPMDI_H_

 #include <climits>
 #include <cstring>

 #include "memtrack.H"
 #include "parstream.H"
 #include "BaseNamespaceHeader.H"

 // default implementations for linearization routines.

 // Generic linearSize: asks the object itself, through its linearSize()
 // member, and hands back that answer converted to int.
 template <class T>
 int linearSize(const T& inputT)
 {
   const int sz = inputT.linearSize();
   return sz;
 }

 // Generic linearIn: the object rebuilds itself from inBuf through its own
 // linearIn(const void*) member.
 template <class T>
 void linearIn(T& a_outputT, const void* const inBuf)
 {
   T& target = a_outputT;
   target.linearIn(inBuf);
 }

 // Generic linearOut: the object writes itself into a_outBuf through its own
 // linearOut(void*) member.
 template <class T>
 void linearOut(void* const a_outBuf, const T& inputT)
 {
   const T& source = inputT;
   source.linearOut(a_outBuf);
 }

 #ifdef CH_MPI

 // Declaration only: AttachDebugger is defined outside this header and is
 // not called by any routine visible in it.
 extern void AttachDebugger(int);
 /*****************************/
 // Gather a_input from every rank into a_outVec on rank a_dest.
 //
 // a_outVec : on rank a_dest, resized to numProc() with entry iproc holding
 //            the value contributed by rank iproc; not touched on any
 //            other rank.
 // a_input  : this rank's contribution.
 // a_dest   : receiving rank; must satisfy 0 <= a_dest < numProc().
 //
 // Every rank takes part in one MPI_Gather (sizes) and one MPI_Gatherv
 // (linearized data) on Chombo_MPI::comm.  Allocation failures, MPI
 // failures and displacements that do not fit in an int are reported
 // through MayDay::Error.
 /*****************************/
 template <class T>
 inline void
 gather(Vector<T>& a_outVec, const T& a_input, int a_dest)
 {
   CH_assert(a_dest >= 0);
   CH_assert(a_dest <  numProc());
   //now THIS size lives on THIS processor
   int isize = linearSize(a_input);

   //make stuff for linearout
   void* loclBuf = mallocMT(isize);
   if (loclBuf == NULL)
     MayDay::Error("out of memory in gather 1");

   //put linearized T into its proper buffer
   linearOut(loclBuf, a_input);

   int nProcess = numProc();
   int sendCount = 1;
   int recdCount = 1;

   //need to gather isizes onto processor a_dest;
   //the size and displacement tables only exist there
   int* vectSize = NULL;
   int* vectDisp = NULL;
   void* sendBuf = static_cast<void*>(&isize);
   if (procID() == a_dest)
     {
       vectSize = new int[nProcess];
       vectDisp = new int[nProcess];
     }

   int result1 = MPI_Gather(sendBuf, sendCount, MPI_INT,
                            vectSize,recdCount, MPI_INT,
                            a_dest,  Chombo_MPI::comm);

   if (result1 != MPI_SUCCESS)
     MayDay::Error("Gather<T> failed in MPI_Gather 1");

   //make memory for gather, linearin
   void* recdBuf = NULL;
   if (procID() == a_dest)
     {
       size_t itotsize=0;
       for (int iproc = 0; iproc < nProcess; iproc++)
         {
           //MPI_Gatherv takes int displacements, so a running total
           //beyond INT_MAX would wrap and scatter the incoming data
           //over the wrong bytes; stop instead of wrapping silently
           if (itotsize > static_cast<size_t>(INT_MAX))
             {
               MayDay::Error("gather: receive displacement exceeds INT_MAX");
             }
           vectDisp[iproc] = static_cast<int>(itotsize);
           itotsize += vectSize[iproc];
         }
       recdBuf = mallocMT(itotsize);
       if (recdBuf == NULL)
         {
           MayDay::Error("out of memory in gather 2");
         }
     }

   //gather data
   int result2 = MPI_Gatherv(loclBuf, isize, MPI_BYTE,
                             recdBuf, vectSize, vectDisp, MPI_BYTE,
                             a_dest, Chombo_MPI::comm);
   if (result2 != MPI_SUCCESS)
     MayDay::Error("Gather<T> failed in MPI_Gather 2");

   if (procID() == a_dest)
     {
       a_outVec.resize(nProcess);
       //need to cast to char* to do pointer arithmetic
       char* arithPtr = static_cast<char*>(recdBuf);
       for (int iproc = 0; iproc < nProcess; iproc++)
         {
           //rank iproc's bytes start vectDisp[iproc] into recdBuf
           char* thisProcBuf = arithPtr + vectDisp[iproc];
           linearIn(a_outVec[iproc], thisProcBuf);
         }

       //delete memory for dest-specific arrays
       delete[] vectSize;
       delete[] vectDisp;
       freeMT(recdBuf);
     }

   //delete memory for local buffer
   freeMT(loclBuf);
 }

 /*****************************/
 //broadcast T everywhere
 /*****************************/
 template <class T>
 inline void
 broadcast(T& a_inAndOut,  int a_src)
 {
   CH_assert (a_src >= 0);
   CH_assert(a_src <  numProc());
   int isize;
   if (procID() == a_src)
   {
     isize = linearSize(a_inAndOut);
   }

   MPI_Bcast(&isize, 1, MPI_INT, a_src, Chombo_MPI::comm);

   void* broadBuf = mallocMT(isize);

   if (broadBuf == NULL)
   {
     MayDay::Error("out of memory in broadcast");
   }

   //take inAndOut from src and put it into broadBuf
   if (procID() == a_src)
   {
     linearOut(broadBuf, a_inAndOut);
   }

   //broadcast broadBuf to all procs
   MPI_Bcast(broadBuf, isize, MPI_BYTE, a_src, Chombo_MPI::comm);

   if (procID()==a_src)
   {
     CH_MaxMPISendSize = Max<long long>(CH_MaxMPISendSize, isize);
   }
   else
   {
     CH_MaxMPIRecvSize = Max<long long>(CH_MaxMPIRecvSize, isize);
   }
   //take broadBuf and put back into inAndOut if not src
   if (procID() != a_src)
   {
     linearIn(a_inAndOut, broadBuf);
   }

   //delete memory for buffer
   freeMT(broadBuf);
 }

 /*****************************/
 // MPI barrier on Chombo_MPI::comm.
 // The value returned by MPI_Barrier is not examined.
 /*****************************/
 inline void
 barrier()
 {
   MPI_Barrier(Chombo_MPI::comm);
 }

 #else
 /*****************************/
 // Serial (no CH_MPI) gather: a_outVec becomes a one-element vector
 // holding a copy of a_input.  a_dest is ignored.
 /*****************************/
 template <class T>
 inline void
 gather(Vector<T>& a_outVec, const T& a_input, int a_dest)
 {
   //a_dest is deliberately unused in the serial build
   (void)a_dest;

   a_outVec.resize(1);
   a_outVec[0] = a_input;
 }
 /*****************************/
 // Serial (no CH_MPI) broadcast: a no-op.  a_inAndOut is left exactly as
 // passed in and a_src is ignored.
 /*****************************/
 template <class T>
 inline void
 broadcast(T& a_inAndOut,  int a_src)
 {
   //a_src is deliberately unused in the serial build
   (void)a_src;
 }
 /*****************************/
 // Serial (no CH_MPI) barrier: returns immediately.
 /*****************************/
 inline void
 barrier()
 {
   // intentionally empty
 }

 #endif //the mpi thing

 //*************************************
 //These should work independent of MPI
 //*************************************

 //Vector<T> specialization of linearIn
 //
 // Rebuilds a_outputT from a buffer laid out as
 //   [int count][count int offsets][element data]
 // where each offset is a byte offset from the start of a_inBuf to the
 // linearized form of the matching element.
 //
 // The int header is read with memcpy rather than through an int*:
 // a_inBuf may sit at any byte offset inside a larger buffer (gather hands
 // out sub-buffers at byte displacements), so it need not be int-aligned.
 template <class T>
 void
 linearListIn(Vector<T>& a_outputT, const void* const a_inBuf)
 {
   const char* const charBuf = static_cast<const char*>(a_inBuf);

   //first entry is the size of the vector
   int vecsize = 0;
   std::memcpy(&vecsize, charBuf, sizeof(int));

   a_outputT.resize(vecsize);
   for (int ivec = 0; ivec < vecsize; ivec++)
     {
       //entry ivec+1 of the header is the byte offset of element ivec
       int dataOffset = 0;
       std::memcpy(&dataOffset, charBuf + (ivec + 1)*sizeof(int), sizeof(int));

       const char* const dataLoc = charBuf + dataOffset;
       linearIn(a_outputT[ivec], dataLoc);
     }
 }

 //Vector<T> specialization of linearOut
 //
 // Writes a_input into a_outBuf as
 //   [int count][count int offsets][element data]
 // where each offset is a byte offset from the start of a_outBuf to the
 // linearized form of the matching element.  Elements are packed back to
 // back in index order, each one taking linearSize(element) bytes.
 // a_outBuf is expected to provide linearListSize(a_input) bytes.
 //
 // The int header is written with memcpy rather than through an int*, so
 // a_outBuf does not have to be int-aligned.
 template <class T>
 void
 linearListOut(void* const a_outBuf, const Vector<T>& a_input)
 {
   char* const charBuf = static_cast<char*>(a_outBuf);

   //first entry is the size of the vector
   const int vecsize = static_cast<int>(a_input.size());
   std::memcpy(charBuf, &vecsize, sizeof(int));

   //element data starts right after the (vecsize+1)-int header
   int ioffset = static_cast<int>((vecsize+1)*sizeof(int));
   for (int ivec = 0; ivec < vecsize; ivec++)
     {
       //record where element ivec lives, then write it there
       std::memcpy(charBuf + (ivec + 1)*sizeof(int), &ioffset, sizeof(int));

       char* const dataLoc = charBuf + ioffset;
       linearOut(dataLoc, a_input[ivec]);

       ioffset += linearSize(a_input[ivec]);
     }
 }

 //Vector<T> specialization of linearSize
 //
 // Size of the buffer layout used for a Vector<T>:
 //   one int for the element count,
 //   one int offset per element,
 //   then linearSize(element) for every element.
 template <class T>
 int
 linearListSize(const Vector<T>& a_input)
 {
   const size_t numEntries = a_input.size();

   //header: count plus one offset per element
   int totalSize = static_cast<int>((numEntries + 1)*sizeof(int));

   //payload: each element's own linearized size, in index order
   unsigned int idx = 0;
   while (idx < numEntries)
     {
       totalSize += linearSize(a_input[idx]);
       ++idx;
     }
   return totalSize;
 }

 #include "BaseNamespaceFooter.H"

 #endif
freeMT
#define freeMT(a_a)
Definition: memtrack.H:160

CH_assert
#define CH_assert(cond)
Definition: CHArray.H:37

linearOut
void linearOut(void *const a_outBuf, const T &inputT)
Definition: SPMDI.H:33

memtrack.H

barrier
void barrier(void)
all ranks wait here to sync-up
Definition: SPMDI.H:215

Vector
one dimensional dynamic array
Definition: Vector.H:53

mallocMT
#define mallocMT(a_a)
Definition: memtrack.H:159

AttachDebugger
void AttachDebugger(int a_sig=4)

linearIn
void linearIn(T &a_outputT, const void *const inBuf)
Definition: SPMDI.H:27

CH_MaxMPIRecvSize
unsigned long long CH_MaxMPIRecvSize

CH_MaxMPISendSize
unsigned long long CH_MaxMPISendSize

numProc
unsigned int numProc()
number of parallel processes

linearSize
int linearSize(const T &inputT)
Definition: SPMDI.H:21

BaseNamespaceHeader.H

Vector::resize
void resize(unsigned int isize)
Definition: Vector.H:346

gather
void gather(Vector< T > &a_outVec, const T &a_input, int a_dest)
Definition: SPMDI.H:197

linearListIn
void linearListIn(Vector< T > &a_outputT, const void *const a_inBuf)
Definition: SPMDI.H:229

parstream.H

Vector::size
size_t size() const
Definition: Vector.H:192

MayDay::Error
static void Error(const char *const a_msg=m_nullString, int m_exitCode=CH_DEFAULT_ERROR_CODE)
Print out message to cerr and exit with the specified exit code.

linearListOut
void linearListOut(void *const a_outBuf, const Vector< T > &a_input)
Definition: SPMDI.H:258

linearListSize
int linearListSize(const Vector< T > &a_input)
Definition: SPMDI.H:290

procID
int procID()
local process ID

BaseNamespaceFooter.H

broadcast
void broadcast(T &a_inAndOut, int a_src)
broadcast to every process
Definition: SPMDI.H:207