Dendro 5.01
Dendro, from the Greek word for "tree", is a large-scale (262K cores on ORNL's Titan), distributed-memory, adaptive octree framework. Its main goal is to perform large-scale multiphysics simulations efficiently on modern supercomputers. Dendro provides efficient parallel data structures and algorithms for variational (finite element) and finite difference methods on 2:1 balanced, arbitrarily adaptive octrees, enabling simulations ranging from binary black hole mergers to blood flow in the human body, with applications spanning relativity, astrophysics, and biomedical engineering.
parUtils.h
#ifndef __PAR_UTILS_H_
#define __PAR_UTILS_H_

#define KEEP_HIGH 100
#define KEEP_LOW 101

#ifdef __DEBUG__
#ifndef __DEBUG_PAR__
#define __DEBUG_PAR__
#endif
#endif

#include "mpi.h"
#include <vector>
#include "dendro.h"

#ifndef KWAY
#define KWAY 128
#endif

// Data structure used to compute parallel rank.
template <typename T>
struct _T {
    unsigned int p;
    unsigned int idx;
    T val;
    DendroIntL rank;

    inline bool operator< (const _T<T> &c1) const {
        return (this->val < c1.val);
    }

    inline bool operator== (const _T<T> &c1) const {
        return (this->val == c1.val);
    }

    inline bool operator<= (const _T<T> &c1) const {
        return (this->val <= c1.val);
    }

    inline bool operator> (const _T<T> &c1) const {
        return (this->val > c1.val);
    }

    inline bool operator>= (const _T<T> &c1) const {
        return (this->val >= c1.val);
    }
};

namespace par
{
    template <typename T>
    class Mpi_datatype;

    template <>
    class Mpi_datatype<_T<double>>
    {
    public:
        static MPI_Datatype value()
        {
            static bool first = true;
            static MPI_Datatype datatype;

            if (first)
            {
                first = false;
                MPI_Type_contiguous(sizeof(_T<double>), MPI_BYTE, &datatype);
                MPI_Type_commit(&datatype);
            }

            return datatype;
        }
    };

    template <>
    class Mpi_datatype<_T<float>>
    {
    public:
        static MPI_Datatype value()
        {
            static bool first = true;
            static MPI_Datatype datatype;

            if (first)
            {
                first = false;
                MPI_Type_contiguous(sizeof(_T<float>), MPI_BYTE, &datatype);
                MPI_Type_commit(&datatype);
            }

            return datatype;
        }
    };

} // namespace par
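/*
  Usage sketch (illustrative addition, not part of the original header): the
  Mpi_datatype specializations above let _T<double> / _T<float> records be
  passed directly to MPI routines. The datatype is built once with
  MPI_Type_contiguous / MPI_Type_commit and cached in a function-local
  static, so repeated calls to value() are cheap. A hypothetical
  point-to-point exchange (variable names such as myRank are assumptions
  made for this example):

    _T<double> record;
    record.p = 0; record.idx = 0; record.rank = 0; record.val = 3.14;
    if (myRank == 0)
        MPI_Send(&record, 1, par::Mpi_datatype<_T<double>>::value(),
                 1, 0, MPI_COMM_WORLD);
    else if (myRank == 1)
        MPI_Recv(&record, 1, par::Mpi_datatype<_T<double>>::value(),
                 0, 0, MPI_COMM_WORLD, MPI_STATUS_IGNORE);
*/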

#ifdef PETSC_USE_LOG

#include "petscsys.h"

namespace par
{
extern int sortEvent;
extern int concatEvent;
extern int remdupEvent;
extern int partwEvent;
extern int searchEvent;
extern int parScatterEvent;
extern int a2avWaitEvent;
extern int all2AllvSparseEvent;
extern int all2AllvDenseEvent;
extern int allGatherEvent;
extern int reduceEvent;
extern int sendRecvEvent;
extern int allReduceEvent;
extern int all2AllEvent;
extern int allGathervEvent;
extern int gatherEvent;
extern int scanEvent;
extern int bcastEvent;
extern int splitComm2wayEvent;
extern int splitCommEvent;
} // namespace par

#define PROF_A2AV_WAIT_BEGIN PetscLogEventBegin(a2avWaitEvent, 0, 0, 0, 0);
#define PROF_A2AV_WAIT_END PetscLogEventEnd(a2avWaitEvent, 0, 0, 0, 0);

#define PROF_SPLIT_COMM_2WAY_BEGIN \
    PetscFunctionBegin;            \
    PetscLogEventBegin(splitComm2wayEvent, 0, 0, 0, 0);
#define PROF_SPLIT_COMM_2WAY_END                      \
    PetscLogEventEnd(splitComm2wayEvent, 0, 0, 0, 0); \
    PetscFunctionReturn(0);

#define PROF_SPLIT_COMM_BEGIN \
    PetscFunctionBegin;       \
    PetscLogEventBegin(splitCommEvent, 0, 0, 0, 0);
#define PROF_SPLIT_COMM_END                       \
    PetscLogEventEnd(splitCommEvent, 0, 0, 0, 0); \
    PetscFunctionReturn(0);

#define PROF_SEARCH_BEGIN \
    PetscFunctionBegin;   \
    PetscLogEventBegin(searchEvent, 0, 0, 0, 0);
#define PROF_SEARCH_END                        \
    PetscLogEventEnd(searchEvent, 0, 0, 0, 0); \
    PetscFunctionReturn(0);

#define PROF_PAR_CONCAT_BEGIN \
    PetscFunctionBegin;       \
    PetscLogEventBegin(concatEvent, 0, 0, 0, 0);
#define PROF_PAR_CONCAT_END                    \
    PetscLogEventEnd(concatEvent, 0, 0, 0, 0); \
    PetscFunctionReturn(0);

#define PROF_PAR_SCATTER_BEGIN \
    PetscFunctionBegin;        \
    PetscLogEventBegin(parScatterEvent, 0, 0, 0, 0);
#define PROF_PAR_SCATTER_END                       \
    PetscLogEventEnd(parScatterEvent, 0, 0, 0, 0); \
    PetscFunctionReturn(0);

#define PROF_PAR_SENDRECV_BEGIN \
    PetscFunctionBegin;         \
    PetscLogEventBegin(sendRecvEvent, 0, 0, 0, 0);
#define PROF_PAR_SENDRECV_END                    \
    PetscLogEventEnd(sendRecvEvent, 0, 0, 0, 0); \
    PetscFunctionReturn(0);

#define PROF_PAR_BCAST_BEGIN \
    PetscFunctionBegin;      \
    PetscLogEventBegin(bcastEvent, 0, 0, 0, 0);
#define PROF_PAR_BCAST_END                    \
    PetscLogEventEnd(bcastEvent, 0, 0, 0, 0); \
    PetscFunctionReturn(0);

#define PROF_PAR_SCAN_BEGIN \
    PetscFunctionBegin;     \
    PetscLogEventBegin(scanEvent, 0, 0, 0, 0);
#define PROF_PAR_SCAN_END                    \
    PetscLogEventEnd(scanEvent, 0, 0, 0, 0); \
    PetscFunctionReturn(0);

#define PROF_PAR_GATHER_BEGIN \
    PetscFunctionBegin;       \
    PetscLogEventBegin(gatherEvent, 0, 0, 0, 0);
#define PROF_PAR_GATHER_END                    \
    PetscLogEventEnd(gatherEvent, 0, 0, 0, 0); \
    PetscFunctionReturn(0);

#define PROF_PAR_REDUCE_BEGIN \
    PetscFunctionBegin;       \
    PetscLogEventBegin(reduceEvent, 0, 0, 0, 0);
#define PROF_PAR_REDUCE_END                    \
    PetscLogEventEnd(reduceEvent, 0, 0, 0, 0); \
    PetscFunctionReturn(0);

#define PROF_PAR_ALLREDUCE_BEGIN \
    PetscFunctionBegin;          \
    PetscLogEventBegin(allReduceEvent, 0, 0, 0, 0);
#define PROF_PAR_ALLREDUCE_END                    \
    PetscLogEventEnd(allReduceEvent, 0, 0, 0, 0); \
    PetscFunctionReturn(0);

#define PROF_PAR_ALL2ALL_BEGIN \
    PetscFunctionBegin;        \
    PetscLogEventBegin(all2AllEvent, 0, 0, 0, 0);
#define PROF_PAR_ALL2ALL_END                    \
    PetscLogEventEnd(all2AllEvent, 0, 0, 0, 0); \
    PetscFunctionReturn(0);

#define PROF_PAR_ALLGATHER_BEGIN \
    PetscFunctionBegin;          \
    PetscLogEventBegin(allGatherEvent, 0, 0, 0, 0);
#define PROF_PAR_ALLGATHER_END                    \
    PetscLogEventEnd(allGatherEvent, 0, 0, 0, 0); \
    PetscFunctionReturn(0);

#define PROF_PAR_ALLGATHERV_BEGIN \
    PetscFunctionBegin;           \
    PetscLogEventBegin(allGathervEvent, 0, 0, 0, 0);
#define PROF_PAR_ALLGATHERV_END                    \
    PetscLogEventEnd(allGathervEvent, 0, 0, 0, 0); \
    PetscFunctionReturn(0);

#define PROF_PAR_ALL2ALLV_SPARSE_BEGIN \
    PetscFunctionBegin;                \
    PetscLogEventBegin(all2AllvSparseEvent, 0, 0, 0, 0);
#define PROF_PAR_ALL2ALLV_SPARSE_END                   \
    PetscLogEventEnd(all2AllvSparseEvent, 0, 0, 0, 0); \
    PetscFunctionReturn(0);

#define PROF_PAR_ALL2ALLV_DENSE_BEGIN \
    PetscFunctionBegin;               \
    PetscLogEventBegin(all2AllvDenseEvent, 0, 0, 0, 0);
#define PROF_PAR_ALL2ALLV_DENSE_END                   \
    PetscLogEventEnd(all2AllvDenseEvent, 0, 0, 0, 0); \
    PetscFunctionReturn(0);

#define PROF_SORT_BEGIN \
    PetscFunctionBegin; \
    PetscLogEventBegin(sortEvent, 0, 0, 0, 0);
#define PROF_SORT_END                        \
    PetscLogEventEnd(sortEvent, 0, 0, 0, 0); \
    PetscFunctionReturn(0);

#define PROF_REMDUP_BEGIN \
    PetscFunctionBegin;   \
    PetscLogEventBegin(remdupEvent, 0, 0, 0, 0);
#define PROF_REMDUP_END                        \
    PetscLogEventEnd(remdupEvent, 0, 0, 0, 0); \
    PetscFunctionReturn(0);

#define PROF_PARTW_BEGIN \
    PetscFunctionBegin;  \
    PetscLogEventBegin(partwEvent, 0, 0, 0, 0);
#define PROF_PARTW_END                        \
    PetscLogEventEnd(partwEvent, 0, 0, 0, 0); \
    PetscFunctionReturn(0);

#else

#define PROF_A2AV_WAIT_BEGIN
#define PROF_SPLIT_COMM_2WAY_BEGIN
#define PROF_SPLIT_COMM_BEGIN
#define PROF_SEARCH_BEGIN
#define PROF_PAR_SCATTER_BEGIN
#define PROF_PAR_SENDRECV_BEGIN
#define PROF_PAR_BCAST_BEGIN
#define PROF_PAR_GATHER_BEGIN
#define PROF_PAR_SCAN_BEGIN
#define PROF_PAR_REDUCE_BEGIN
#define PROF_PAR_ALLREDUCE_BEGIN
#define PROF_PAR_ALL2ALL_BEGIN
#define PROF_PAR_ALLGATHERV_BEGIN
#define PROF_PAR_ALLGATHER_BEGIN
#define PROF_PAR_ALL2ALLV_SPARSE_BEGIN
#define PROF_PAR_ALL2ALLV_DENSE_BEGIN
#define PROF_PAR_CONCAT_BEGIN
#define PROF_SORT_BEGIN
#define PROF_REMDUP_BEGIN
#define PROF_PARTW_BEGIN

#define PROF_A2AV_WAIT_END
#define PROF_SPLIT_COMM_2WAY_END return 1;
#define PROF_SPLIT_COMM_END return 1;
#define PROF_SEARCH_END return 1;
#define PROF_PAR_SCATTER_END return 1;
#define PROF_PAR_SENDRECV_END return 1;
#define PROF_PAR_BCAST_END return 1;
#define PROF_PAR_GATHER_END return 1;
#define PROF_PAR_SCAN_END return 1;
#define PROF_PAR_REDUCE_END return 1;
#define PROF_PAR_ALLREDUCE_END return 1;
#define PROF_PAR_ALL2ALL_END return 1;
#define PROF_PAR_ALLGATHERV_END return 1;
#define PROF_PAR_ALLGATHER_END return 1;
#define PROF_PAR_ALL2ALLV_SPARSE_END return 1;
#define PROF_PAR_ALL2ALLV_DENSE_END return 1;
#define PROF_PAR_CONCAT_END return 1;
#define PROF_SORT_END return 1;
#define PROF_REMDUP_END return 1;
#define PROF_PARTW_END return 1;

#endif
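/*
  Usage sketch (illustrative addition, not part of the original header): the
  BEGIN/END macro pairs above are meant to bracket the bodies of the par::
  routines. With PETSC_USE_LOG they expand to PetscFunctionBegin /
  PetscLogEventBegin and PetscLogEventEnd / PetscFunctionReturn(0); without
  it the BEGIN macros are empty and the END macros simply return 1. A
  hypothetical wrapper (the function name is an assumption for the example):

    template <typename T>
    int mySortWrapper(std::vector<T> &in, MPI_Comm comm) {
        PROF_SORT_BEGIN
        // ... sorting work goes here ...
        PROF_SORT_END
    }

  Note that the END macros already contain the return statement, so no
  explicit return follows them.
*/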

namespace par
{

template <typename T>
int Mpi_Isend(T *buf, int count, int dest, int tag, MPI_Comm comm, MPI_Request *request);

template <typename T>
int Mpi_Issend(T *buf, int count, int dest, int tag, MPI_Comm comm, MPI_Request *request);

template <typename T>
int Mpi_Recv(T *buf, int count, int source, int tag, MPI_Comm comm, MPI_Status *status);

template <typename T>
int Mpi_Irecv(T *buf, int count, int source, int tag, MPI_Comm comm, MPI_Request *request);

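/*
  Usage sketch (illustrative addition, not part of the original header). The
  wrappers above mirror their MPI counterparts but take no explicit
  MPI_Datatype; the type is presumably deduced from the template parameter
  via par::Mpi_datatype. A ring exchange of doubles might look like the
  following (variable names are assumptions made for this example):

    int rank, npes;
    MPI_Comm_rank(comm, &rank);
    MPI_Comm_size(comm, &npes);

    double sendVal = (double)rank, recvVal = 0.0;
    MPI_Request sendReq, recvReq;
    MPI_Status status;

    par::Mpi_Irecv(&recvVal, 1, (rank + npes - 1) % npes, 0, comm, &recvReq);
    par::Mpi_Isend(&sendVal, 1, (rank + 1) % npes, 0, comm, &sendReq);
    MPI_Wait(&recvReq, &status);
    MPI_Wait(&sendReq, &status);
*/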
template <typename T>
int Mpi_Gather(T *sendBuffer, T *recvBuffer, int count, int root, MPI_Comm comm);

template <typename T, typename S>
int Mpi_Sendrecv(T *sendBuf, int sendCount, int dest, int sendTag,
                 S *recvBuf, int recvCount, int source, int recvTag,
                 MPI_Comm comm, MPI_Status *status);

template <typename T>
int Mpi_Bcast(T *buffer, int count, int root, MPI_Comm comm);

template <typename T>
int Mpi_Scan(T *sendbuf, T *recvbuf, int count, MPI_Op op, MPI_Comm comm);

template <typename T>
int Mpi_Reduce(T *sendbuf, T *recvbuf, int count, MPI_Op op, int root, MPI_Comm comm);

template <typename T>
int Mpi_Allreduce(T *sendbuf, T *recvbuf, int count, MPI_Op op, MPI_Comm comm);

template <typename T>
int Mpi_Alltoall(T *sendbuf, T *recvbuf, int count, MPI_Comm comm);

template <typename T>
int Mpi_Allgatherv(T *sendbuf, int sendcount, T *recvbuf,
                   int *recvcounts, int *displs, MPI_Comm comm);

template <typename T>
int Mpi_Allgather(T *sendbuf, T *recvbuf, int count, MPI_Comm comm);

template <typename T>
int Mpi_Alltoallv_sparse(T *sendbuf, int *sendcnts, int *sdispls,
                         T *recvbuf, int *recvcnts, int *rdispls, MPI_Comm comm);

template <typename T>
int Mpi_Alltoallv_dense(T *sendbuf, int *sendcnts, int *sdispls,
                        T *recvbuf, int *recvcnts, int *rdispls, MPI_Comm comm);

template <typename T>
int Mpi_Alltoallv_Kway(T *sbuff_, int *s_cnt_, int *sdisp_,
                       T *rbuff_, int *r_cnt_, int *rdisp_, MPI_Comm c);

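/*
  Usage sketch (illustrative addition, not part of the original header). The
  Mpi_Alltoallv_* wrappers follow the MPI_Alltoallv convention: per-rank send
  and receive counts plus displacements into contiguous buffers. Receive
  counts are typically obtained with an all-to-all of the send counts first.
  Variable names below are assumptions made for this example:

    int npes;
    MPI_Comm_size(comm, &npes);

    std::vector<int> sendcnts(npes, 0), recvcnts(npes, 0);
    std::vector<int> sdispls(npes, 0), rdispls(npes, 0);
    // ... fill sendcnts[i] with the number of values destined for rank i ...

    par::Mpi_Alltoall(sendcnts.data(), recvcnts.data(), 1, comm);

    for (int i = 1; i < npes; ++i) {
        sdispls[i] = sdispls[i - 1] + sendcnts[i - 1];
        rdispls[i] = rdispls[i - 1] + recvcnts[i - 1];
    }

    std::vector<double> sendbuf(sdispls[npes - 1] + sendcnts[npes - 1]);
    std::vector<double> recvbuf(rdispls[npes - 1] + recvcnts[npes - 1]);
    // ... pack sendbuf in destination order ...

    par::Mpi_Alltoallv_dense(sendbuf.data(), sendcnts.data(), sdispls.data(),
                             recvbuf.data(), recvcnts.data(), rdispls.data(), comm);

  Mpi_Alltoallv_sparse appears geared toward exchanges where most rank pairs
  communicate nothing, and Mpi_Alltoallv_Kway appears to stage the exchange
  in k-way rounds (see the KWAY define above); all three share this calling
  convention.
*/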
// Re-distributes an STL vector, preserving the relative ordering of the elements.
template <typename T>
int scatterValues(std::vector<T> &in, std::vector<T> &out,
                  DendroIntL outSz, MPI_Comm comm);

// A parallel search function.
template <typename T>
int maxLowerBound(const std::vector<T> &keys, const std::vector<T> &searchList,
                  std::vector<T> &results, MPI_Comm comm);

template <typename T>
unsigned int defaultWeight(const T *a);

// A parallel weighted partitioning function.
template <typename T>
int partitionW(std::vector<T> &vec,
               unsigned int (*getWeight)(const T *), MPI_Comm comm);

// A parallel concatenation function: listB is appended (globally) to listA.
template <typename T>
int concatenate(std::vector<T> &listA,
                std::vector<T> &listB, MPI_Comm comm);

// A parallel sample sort implementation.
template <typename T>
int sampleSort(std::vector<T> &in, std::vector<T> &out, std::vector<double> &stats, MPI_Comm comm);

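/*
  Usage sketch (illustrative addition, not part of the original header):
  sorting a distributed vector with sampleSort. Each process contributes its
  local chunk of `in`; on return `out` holds that process's portion of the
  globally sorted sequence. The contents of `stats` are assumed here to be
  implementation-defined statistics; see parUtils.tcc for the authoritative
  semantics.

    std::vector<double> in(1000);
    // ... fill `in` with this process's local, unsorted values ...
    std::vector<double> out;
    std::vector<double> stats;
    par::sampleSort(in, out, stats, MPI_COMM_WORLD);
*/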
/*template <typename T>
  int removeDuplicates(std::vector<T> &nodes, bool isSorted, MPI_Comm comm);*/

int splitComm2way(bool iAmEmpty, MPI_Comm *new_comm, MPI_Comm orig_comm);

// Splits a communication group into two depending on the values in isEmptyList.
int splitComm2way(const bool *isEmptyList, MPI_Comm *new_comm, MPI_Comm orig_comm);

/*
  @author Rahul Sampath
  @brief Splits a communication group into two: processors with ranks less
  than splittingRank form one group and the remaining processors form the
  second group. Both groups are sorted in ascending order of their ranks in
  the old comm.
  @param splittingRank The rank used for splitting the communicator
  @param orig_comm The comm group that needs to be split.
  @param new_comm The new comm group.
 */
int splitCommUsingSplittingRank(int splittingRank, MPI_Comm *new_comm, MPI_Comm orig_comm);

// Splits a communication group into two, the first having a power-of-2 number of processors.
unsigned int splitCommBinary(MPI_Comm orig_comm, MPI_Comm *new_comm);

// Splits a communication group into two, the first having a power-of-2 number of processors.
unsigned int splitCommBinaryNoFlip(MPI_Comm orig_comm, MPI_Comm *new_comm);

// Merges lists A and B, retaining either the low or the high elements in list A.
template <typename T>
void MergeLists(std::vector<T> &listA, std::vector<T> &listB, int KEEP_WHAT);

// The main operation in the parallel bitonic sort algorithm: the compare-split operation.
template <typename T>
void MergeSplit(std::vector<T> &local_list, int which_keys, int partner, MPI_Comm comm);

template <typename T>
void Par_bitonic_sort_incr(std::vector<T> &local_list, int proc_set_size, MPI_Comm comm);

template <typename T>
void Par_bitonic_sort_decr(std::vector<T> &local_list, int proc_set_size, MPI_Comm comm);

template <typename T>
void Par_bitonic_merge_incr(std::vector<T> &local_list, int proc_set_size, MPI_Comm comm);

// Parallel bitonic sort that expects the number of processors to be a power of 2.
template <typename T>
void bitonicSort_binary(std::vector<T> &in, MPI_Comm comm);

// Parallel bitonic sort that does not expect the number of processors to be a power of 2.
template <typename T>
void bitonicSort(std::vector<T> &in, MPI_Comm comm);

template <typename T>
void parallel_rank(const T *in, unsigned int sz, DendroIntL *out, MPI_Comm comm);

} // namespace par
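/*
  Usage sketch (illustrative addition, not part of the original header).
  bitonicSort sorts the distributed vector in place across the communicator;
  bitonicSort_binary is the variant that expects a power-of-2 process count.
  parallel_rank appears, from its signature, to write the global rank of
  each of the sz local entries of `in` into `out`; that reading is an
  assumption here, so consult parUtils.tcc for the authoritative semantics.

    std::vector<double> vals(100);
    // ... fill `vals` with this process's local values ...
    par::bitonicSort(vals, MPI_COMM_WORLD);

    std::vector<DendroIntL> gRank(vals.size());
    par::parallel_rank(vals.data(), (unsigned int)vals.size(), gRank.data(),
                       MPI_COMM_WORLD);
*/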

#ifdef USE_OLD_SORT
#include "parUtils_old.tcc"
#else
#include "parUtils.tcc"
#endif

#endif