docs/parallelization__util__impl_8h_source.html

 /*

  * Copyright (c) 2014:  G-CSC, Goethe University Frankfurt

  * Author: Sebastian Reiter

  *

  * This file is part of UG4.

  *

  * UG4 is free software: you can redistribute it and/or modify it under the

  * terms of the GNU Lesser General Public License version 3 (as published by the

  * Free Software Foundation) with the following additional attribution

  * requirements (according to LGPL/GPL v3 §7):

  *

  * (1) The following notice must be displayed in the Appropriate Legal Notices

  * of covered and combined works: "Based on UG4 (www.ug4.org/license)".

  *

  * (2) The following notice must be displayed at a prominent place in the

  * terminal output of covered works: "Based on UG4 (www.ug4.org/license)".

  *

  * (3) The following bibliography is recommended for citation and must be

  * preserved in all covered files:

  * "Reiter, S., Vogel, A., Heppner, I., Rupp, M., and Wittum, G. A massively

  *   parallel geometric multigrid solver on hierarchically distributed grids.

  *   Computing and visualization in science 16, 4 (2013), 151-164"

  * "Vogel, A., Reiter, S., Rupp, M., Nägel, A., and Wittum, G. UG4 -- a novel

  *   flexible software system for simulating pde based models on high performance

  *   computers. Computing and visualization in science 16, 4 (2013), 165-179"

  *

  * This program is distributed in the hope that it will be useful,

  * but WITHOUT ANY WARRANTY; without even the implied warranty of

  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

  * GNU Lesser General Public License for more details.

  */


 #ifndef __H__LIB_ALGEBRA__PARALLELIZATION__PARALLELIZATION_UTIL_IMPL__

 #define __H__LIB_ALGEBRA__PARALLELIZATION__PARALLELIZATION_UTIL_IMPL__


 #include <vector>

 #include "common/error.h"

 #include "parallelization_util.h"


 namespace ug{


 template <class TIndVec>

 void GenerateGlobalConsecutiveIndices(TIndVec& indsOut, size_t numLocalInds,

                     const AlgebraLayouts& layouts)

 {

   typedef typename TIndVec::value_type index_t;


   PU_PROFILE_FUNC();

   indsOut.clear();

   indsOut.resize(numLocalInds, 0);


 //  count local unique indices. Ignore vmasters and hslaves.

 //  we're using uint64 here to stay compatible with mpi

   uint64 numLocalUniqueInds = 0;

   const index_t invalidIndex = -1;

   SetLayoutValues(&indsOut, layouts.slave(), invalidIndex);

   SetLayoutValues(&indsOut, layouts.vertical_master(), invalidIndex);


   for(size_t i = 0; i < numLocalInds; ++i){

     if(indsOut[i] != invalidIndex){

       ++numLocalUniqueInds;

     }

   }


 //  we'll now gather the numbers of local unique indices on proces 0 and create

 //  an offset map for each process. This offset map will then be scattered to

 //  the separate processes again.

   const pcl::ProcessCommunicator& procCom = layouts.proc_comm();

   std::vector<uint64> p0_uniqueIndNumbers(procCom.size());


   procCom.gather(&numLocalUniqueInds, 1, PCL_DT_UNSIGNED_LONG_LONG,

           &p0_uniqueIndNumbers.front(), 1, PCL_DT_UNSIGNED_LONG_LONG, 0);


   if(procCom.get_local_proc_id() == 0){

   //  convert the number of unique indices of each process to offsets

     uint64 offset = 0;

     for(size_t i = 0; i < p0_uniqueIndNumbers.size(); ++i){

       size_t newOffset = offset + p0_uniqueIndNumbers[i];

       p0_uniqueIndNumbers[i] = offset;

       offset = newOffset;

     }

   }


   uint64 indOffset = 0;

   procCom.scatter(&p0_uniqueIndNumbers.front(), 1, PCL_DT_UNSIGNED_LONG_LONG,

           &indOffset, 1, PCL_DT_UNSIGNED_LONG_LONG, 0);


 //  using the local offset we can now assign the local unique indices to indsOut

   index_t newInd = static_cast<index_t>(indOffset);

   for(size_t i = 0; i < numLocalInds; ++i){

     if(indsOut[i] != invalidIndex){

       indsOut[i] = newInd;

       ++newInd;

     }

   }


 //  finally we have to copy the unique indices from hmasters to hslaves and

 //  afterwards from vslaves to vmasters.

   pcl::InterfaceCommunicator<IndexLayout>& icom = layouts.comm();

   ComPol_VecCopy<TIndVec> compolCopy(&indsOut);


   icom.send_data(layouts.master(), compolCopy);

   icom.receive_data(layouts.slave(), compolCopy);

   icom.communicate();


 //  Todo: This method is mainly used on surface-layouts.

 //      Currently a bug in those layouts prevents the execution of the following code

 //      which would be required for level-matrices.

 //      Since ghosts (pure v-masters) are ignored in surface-vectors and matrices,

 //      but pure v-slaves are considered, v-master and v-slave interfaces do not

 //      match. Fortunately they are not required for surface-index-generation.

 //      The following block should however be used as soon as those layouts are fixed.

   // icom.send_data(layouts.vertical_slave(), compolCopy);

   // icom.receive_data(layouts.vertical_master(), compolCopy);

   // icom.communicate();

 }


 template <class TMatrix>

 void TestHorizontalAlgebraLayouts(

       const TMatrix& mat,

       std::vector<AlgebraID>* algebraIDs,

       bool verbose)

 {

   const AlgebraLayouts& layouts = *mat.layouts();


   std::vector<AlgebraID> fallbackAlgebraIDs;

   if(!algebraIDs) {

     GenerateGlobalAlgebraIDs(layouts.comm(),

                              fallbackAlgebraIDs,

                              mat.num_rows(),

                              layouts.master(),

                              layouts.slave());

     algebraIDs = &fallbackAlgebraIDs;

   }


   struct IDByIndex {

     IDByIndex (const std::vector<AlgebraID>* algIDs) : m_algIDs(*algIDs) {}

     const AlgebraID& operator () (size_t idx) const   {return m_algIDs[idx];}

     const std::vector<AlgebraID>& m_algIDs;

   };


   IDByIndex idByIndex(algebraIDs);


   bool ok = pcl::TestLayout<IndexLayout, AlgebraID> (

               layouts.proc_comm(),

               layouts.comm(),

               layouts.master(),

               layouts.slave(),

               verbose,

               idByIndex,

               true);

   UG_COND_THROW(!ok, "H-Master <-> H-Slave mismatch in matrix layout");


 //  Global IDs do of course not match in overlap interfaces

   ok = pcl::TestLayout<IndexLayout> (

               layouts.proc_comm(),

               layouts.comm(),

               layouts.master_overlap(),

               layouts.slave_overlap(),

               verbose);

   UG_COND_THROW(!ok, "H-Master-Overlap <-> H-Slave-Overlap mismatch in matrix layout");

 }


 }// end of namespace


 #endif  //__H__LIB_ALGEBRA__PARALLELIZATION__PARALLELIZATION_UTIL_IMPL__

verbose
location verbose
Definition: checkpoint_util.lua:128

pcl::InterfaceCommunicator
Performs communication between interfaces on different processes.
Definition: pcl_interface_communicator.h:68

pcl::InterfaceCommunicator::communicate
bool communicate(int tag=749345)
sends and receives the collected data.
Definition: pcl_interface_communicator_impl.hpp:409

pcl::InterfaceCommunicator::send_data
void send_data(int targetProc, const Interface &interface, ICommunicationPolicy< TLayout > &commPol)
collects data that will be sent during communicate.
Definition: pcl_interface_communicator_impl.hpp:80

pcl::InterfaceCommunicator::receive_data
void receive_data(int srcProc, const Interface &interface, ICommunicationPolicy< TLayout > &commPol)
registers a communication-policy to receive data on communicate.
Definition: pcl_interface_communicator_impl.hpp:188

pcl::ProcessCommunicator
Definition: pcl_process_communicator.h:70

pcl::ProcessCommunicator::gather
void gather(const void *sendBuf, int sendCount, DataType sendType, void *recBuf, int recCount, DataType recType, int root) const
performs MPI_Gather on the processes of the communicator.
Definition: pcl_process_communicator.cpp:339

pcl::ProcessCommunicator::size
size_t size() const
returns the size of the communicator
Definition: pcl_process_communicator.cpp:71

pcl::ProcessCommunicator::scatter
void scatter(const void *sendBuf, int sendCount, DataType sendType, void *recBuf, int recCount, DataType recType, int root) const
performs MPI_Scatter on the processes of the communicator
Definition: pcl_process_communicator.cpp:392

pcl::ProcessCommunicator::get_local_proc_id
int get_local_proc_id(int globalProcID=pcl::ProcRank()) const
returns the proc-id relative to this communicator
Definition: pcl_process_communicator.cpp:95

ug::AlgebraLayouts
Extends the HorizontalAlgebraLayouts by vertical layouts.
Definition: algebra_layouts.h:121

ug::AlgebraLayouts::vertical_master
const IndexLayout & vertical_master() const
Definition: algebra_layouts.h:133

ug::ComPol_VecCopy
Communication Policy to copy values of a vector.
Definition: communication_policies.h:88

ug::HorizontalAlgebraLayouts::proc_comm
const pcl::ProcessCommunicator & proc_comm() const
returns process communicator
Definition: algebra_layouts.h:68

ug::HorizontalAlgebraLayouts::master_overlap
const IndexLayout & master_overlap() const
Definition: algebra_layouts.h:62

ug::HorizontalAlgebraLayouts::slave
const IndexLayout & slave() const
Definition: algebra_layouts.h:63

ug::HorizontalAlgebraLayouts::master
const IndexLayout & master() const
Definition: algebra_layouts.h:61

ug::HorizontalAlgebraLayouts::comm
pcl::InterfaceCommunicator< IndexLayout > & comm() const
returns (non-const !!!) communicator
Definition: algebra_layouts.h:78

ug::HorizontalAlgebraLayouts::slave_overlap
const IndexLayout & slave_overlap() const
Definition: algebra_layouts.h:64

error.h

ug::GenerateGlobalAlgebraIDs
void GenerateGlobalAlgebraIDs(pcl::InterfaceCommunicator< TLayout > &communicator, std::vector< AlgebraID > &idsOut, size_t numIDs, const TLayout &masterLayout, const TLayout &slaveLayout)
Generates a set of unique global algebra ids.
Definition: parallelization_util.h:81

ug::SetLayoutValues
void SetLayoutValues(TVector *pVec, const IndexLayout &layout, typename TVector::value_type val)
sets the values of a vector to a given number only on the layout indices
Definition: parallelization_util.h:315

PCL_DT_UNSIGNED_LONG_LONG
#define PCL_DT_UNSIGNED_LONG_LONG
Definition: pcl_datatype.h:55

UG_COND_THROW
#define UG_COND_THROW(cond, msg)
UG_COND_THROW(cond, msg) : performs a UG_THROW(msg) if cond == true.
Definition: error.h:61

uint64
ugtypes::uint64_t uint64
Definition: types.h:117

PU_PROFILE_FUNC
#define PU_PROFILE_FUNC()
Definition: parallelization_util.h:48

parallelization_util.h

ug
the ug namespace

ug::GenerateGlobalConsecutiveIndices
void GenerateGlobalConsecutiveIndices(TIndVec &indsOut, size_t numLocalInds, const AlgebraLayouts &layouts)
Generates a set of global consecutive indices.
Definition: parallelization_util_impl.h:44

ug::TestHorizontalAlgebraLayouts
void TestHorizontalAlgebraLayouts(const TMatrix &mat, std::vector< AlgebraID > *algebraIDs=NULL, bool verbose=false)
Tests layouts by matching master and slave interfaces and by comparing global ids.
Definition: parallelization_util_impl.h:121

value_type
T value_type
Definition: sparsematrix_interface.h:2

operator()
value_type & operator()(size_t r, size_t c)

ug::AlgebraID
this type is used to identify distributed objects.
Definition: algebra_id.h:46