ParallelAnalysis.hpp
// -*-Mode: C++;-*-

// * BeginRiceCopyright *****************************************************
//
// $HeadURL$
// $Id$
//
// --------------------------------------------------------------------------
// Part of HPCToolkit (hpctoolkit.org)
//
// Information about sources of support for research and development of
// HPCToolkit is at 'hpctoolkit.org' and in 'README.Acknowledgments'.
// --------------------------------------------------------------------------
//
// Copyright ((c)) 2002-2019, Rice University
// All rights reserved.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
// * Redistributions of source code must retain the above copyright
//   notice, this list of conditions and the following disclaimer.
//
// * Redistributions in binary form must reproduce the above copyright
//   notice, this list of conditions and the following disclaimer in the
//   documentation and/or other materials provided with the distribution.
//
// * Neither the name of Rice University (RICE) nor the names of its
//   contributors may be used to endorse or promote products derived from
//   this software without specific prior written permission.
//
// This software is provided by RICE and contributors "as is" and any
// express or implied warranties, including, but not limited to, the
// implied warranties of merchantability and fitness for a particular
// purpose are disclaimed. In no event shall RICE or contributors be
// liable for any direct, indirect, incidental, special, exemplary, or
// consequential damages (including, but not limited to, procurement of
// substitute goods or services; loss of use, data, or profits; or
// business interruption) however caused and on any theory of liability,
// whether in contract, strict liability, or tort (including negligence
// or otherwise) arising in any way out of the use of this software, even
// if advised of the possibility of such damage.
//
// ******************************************************* EndRiceCopyright *

//***************************************************************************
//
// File:
//   $HeadURL$
//
// Purpose:
//   Declares ParallelAnalysis::PackedMetrics, a packable metric matrix,
//   and MPI-based helpers for reducing and broadcasting CallPath profiles
//   across ranks.
//
// Description:
//   PackedMetrics flattens a node-by-metric matrix into a contiguous
//   buffer of doubles suitable for MPI transfer. packSend/recvMerge,
//   reduce, and broadcast combine per-rank profiles using a binary-tree
//   communication pattern.
//
//***************************************************************************

#ifndef ParallelAnalysis_hpp
#define ParallelAnalysis_hpp

//**************************** MPI Include Files ****************************

#include <mpi.h>

//************************* System Include Files ****************************

#include <iostream>
#include <string>
#include <vector>

#include <cstring> // for memset()

#include <stdint.h>

//*************************** User Include Files ****************************

#include <include/uint.h>

#include <lib/prof/CallPath-Profile.hpp>

#include <lib/support/Unique.hpp>

//*************************** Forward Declarations **************************

//***************************************************************************
// PackedMetrics: a packable matrix
//***************************************************************************

namespace ParallelAnalysis {

class PackedMetrics
  : public Unique // prevent copying
{
public:
  // [mBegId, mEndId)
  PackedMetrics(uint numNodes, uint mBegId, uint mEndId,
                uint mDrvdBegId, uint mDrvdEndId)
    : m_numNodes(numNodes), m_numMetrics(mEndId - mBegId),
      m_mBegId(mBegId), m_mEndId(mEndId),
      m_mDrvdBegId(mDrvdBegId), m_mDrvdEndId(mDrvdEndId)
  {
    size_t sz = dataSize();
    m_packedData = new double[sz];

    // initialize first (unused) row to avoid bogus valgrind warnings
    memset(m_packedData, 0, (m_numHdr + m_numMetrics) * sizeof(double));

    m_packedData[m_numNodesIdx] = (double)m_numNodes;
    m_packedData[m_mBegIdIdx] = (double)m_mBegId;
    m_packedData[m_mEndIdIdx] = (double)m_mEndId;
  }

  // PackedMetrics(double* packedMatrix) { }

  ~PackedMetrics()
  { delete[] m_packedData; }


  // 0-based indexing (row-major layout)
  double
  idx(uint idxNodes, uint idxMetrics) const
  { return m_packedData[m_numHdr + (m_numMetrics * idxNodes) + idxMetrics]; }


  double&
  idx(uint idxNodes, uint idxMetrics)
  { return m_packedData[m_numHdr + (m_numMetrics * idxNodes) + idxMetrics]; }


  uint
  numNodes() const
  { return m_numNodes; }

  uint
  numMetrics() const
  { return m_numMetrics; }


  uint
  mBegId() const
  { return m_mBegId; }

  uint
  mEndId() const
  { return m_mEndId; }


  uint
  mDrvdBegId() const
  { return m_mDrvdBegId; }

  uint
  mDrvdEndId() const
  { return m_mDrvdEndId; }


  // verify: check that the header written by the constructor survived
  // the transfer intact
  bool
  verify() const
  {
    return (m_numNodes == (uint)m_packedData[m_numNodesIdx]
            && m_mBegId == (uint)m_packedData[m_mBegIdIdx]
            && m_mEndId == (uint)m_packedData[m_mEndIdIdx]);
  }


  double*
  data() const
  { return m_packedData; }

  // dataSize: size in terms of elements
  uint
  dataSize() const
  { return (m_numNodes * m_numMetrics) + m_numHdr; }

private:
  static const uint m_numHdr = 4;
  static const uint m_numNodesIdx = 0;
  static const uint m_mBegIdIdx = 1;
  static const uint m_mEndIdIdx = 2;

  uint m_numNodes;   // rows
  uint m_numMetrics; // columns

  uint m_mBegId, m_mEndId;         // [mBegId, mEndId)

  uint m_mDrvdBegId, m_mDrvdEndId; // [mDrvdBegId, mDrvdEndId)

  double* m_packedData; // use row-major layout

};

} // namespace ParallelAnalysis
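

//***************************************************************************
// Example (editor's sketch, not part of the original header): the packed
// buffer holds an m_numHdr-double header (numNodes, mBegId, mEndId, one
// unused slot) followed by numNodes x numMetrics values in row-major
// order. A hypothetical round trip over MPI_DOUBLE might look like:
//
//   ParallelAnalysis::PackedMetrics pm(numNodes, mBegId, mEndId,
//                                      mDrvdBegId, mDrvdEndId);
//   pm.idx(0, 0) = 3.14; // node 0, first metric
//   MPI_Send(pm.data(), (int)pm.dataSize(), MPI_DOUBLE, dest, 0, comm);
//   // The receiver constructs a PackedMetrics with the same shape,
//   // MPI_Recv's into data(), then checks verify() before unpacking.
//***************************************************************************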


//***************************************************************************
// reduce/broadcast
//***************************************************************************

namespace ParallelAnalysis {

// ------------------------------------------------------------------------
// packSend/recvMerge: pack a profile and send it to rank 'dest';
// receive a packed profile from rank 'src' and merge it into 'profile'
// ------------------------------------------------------------------------

void
packSend(Prof::CallPath::Profile* profile,
         int dest, int myRank, MPI_Comm comm = MPI_COMM_WORLD);
void
recvMerge(Prof::CallPath::Profile* profile,
          int src, int myRank, MPI_Comm comm = MPI_COMM_WORLD);

void
packSend(std::pair<Prof::CallPath::Profile*,
                   ParallelAnalysis::PackedMetrics*> data,
         int dest, int myRank, MPI_Comm comm = MPI_COMM_WORLD);
void
recvMerge(std::pair<Prof::CallPath::Profile*,
                    ParallelAnalysis::PackedMetrics*> data,
          int src, int myRank, MPI_Comm comm = MPI_COMM_WORLD);

void
packSend(StringSet* stringSet,
         int dest, int myRank, MPI_Comm comm = MPI_COMM_WORLD);
void
recvMerge(StringSet* stringSet,
          int src, int myRank, MPI_Comm comm = MPI_COMM_WORLD);

// ------------------------------------------------------------------------
// reduce: Uses a tree-based reduction to reduce the profile at every
// rank into a canonical profile at the tree's root, rank 0. Assumes
// 0-based ranks.
//
// T: Prof::CallPath::Profile*
// T: std::pair<Prof::CallPath::Profile*, ParallelAnalysis::PackedMetrics*>
// ------------------------------------------------------------------------

template<typename T>
void
reduce(T object, int myRank, int numRanks, MPI_Comm comm = MPI_COMM_WORLD)
{
  // implicit binary tree: rank r's children are 2r+1 and 2r+2;
  // its parent is (r-1)/2
  int lchild = 2 * myRank + 1;
  if (lchild < numRanks) {
    recvMerge(object, lchild, myRank, comm);
    int rchild = 2 * myRank + 2;
    if (rchild < numRanks) {
      recvMerge(object, rchild, myRank, comm);
    }
  }
  if (myRank > 0) {
    int parent = (myRank - 1) / 2;
    packSend(object, parent, myRank, comm);
  }
}
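
// Example (editor's sketch): for numRanks = 7 the implicit reduction tree is
//
//            0
//          /   \
//         1     2
//        / \   / \
//       3   4 5   6
//
// Interior ranks first merge both children's profiles into their own,
// then send the merged result to their parent; rank 0 ends up with the
// canonical profile:
//
//   Prof::CallPath::Profile* profile = /* this rank's local profile */;
//   ParallelAnalysis::reduce(profile, myRank, numRanks);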


// ------------------------------------------------------------------------
// broadcast: Broadcast the profile at the tree's root (rank 0) to every
// other rank. Assumes 0-based ranks.
// ------------------------------------------------------------------------
void
broadcast(Prof::CallPath::Profile*& profile, int myRank,
          MPI_Comm comm = MPI_COMM_WORLD);
void
broadcast(StringSet& stringSet, int myRank,
          MPI_Comm comm = MPI_COMM_WORLD);
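
// Example (editor's sketch): a reduce followed by a broadcast leaves
// every rank holding the same canonical profile:
//
//   ParallelAnalysis::reduce(profile, myRank, numRanks);
//   ParallelAnalysis::broadcast(profile, myRank);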

// ------------------------------------------------------------------------
// pack/unpack a profile to/from a buffer
// ------------------------------------------------------------------------

// packProfile: serialize 'profile' into a byte buffer, returned through
// 'buffer' along with its size in 'bufferSz'
void
packProfile(const Prof::CallPath::Profile& profile,
            uint8_t** buffer, size_t* bufferSz);

// unpackProfile: deserialize a profile from 'buffer'
Prof::CallPath::Profile*
unpackProfile(uint8_t* buffer, size_t bufferSz);

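// Example (editor's sketch, one plausible way to pair these primitives
// with raw MPI; not necessarily how packSend()/recvMerge() are
// implemented internally):
//
//   uint8_t* buf = NULL;
//   size_t bufSz = 0;
//   packProfile(*profile, &buf, &bufSz);
//   MPI_Send(buf, (int)bufSz, MPI_BYTE, dest, /*tag=*/0, comm);
//   delete[] buf; // assumption: the caller owns the returned buffer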

// ------------------------------------------------------------------------
// pack/unpack metrics from/to a profile
// ------------------------------------------------------------------------

// packMetrics: pack the given metric values from 'profile' into
// 'packedMetrics'
void
packMetrics(const Prof::CallPath::Profile& profile,
            ParallelAnalysis::PackedMetrics& packedMetrics);

// unpackMetrics: unpack 'packedMetrics' into profile and apply metric update
void
unpackMetrics(Prof::CallPath::Profile& profile,
              const ParallelAnalysis::PackedMetrics& packedMetrics);

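// Example (editor's sketch): a round trip for metric ids [mBegId, mEndId),
// assuming the PackedMetrics is constructed with the profile's CCT node
// count and metric-id ranges:
//
//   ParallelAnalysis::PackedMetrics pm(numCCTNodes, mBegId, mEndId,
//                                      mDrvdBegId, mDrvdEndId);
//   packMetrics(*profile, pm);    // profile -> packed matrix
//   // ... ship pm.data() (pm.dataSize() doubles) between ranks ...
//   unpackMetrics(*profile, pm);  // packed matrix -> profile
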
} // namespace ParallelAnalysis


//***************************************************************************

#endif // ParallelAnalysis_hpp