collect_matrix.h
/*
 * Copyright (c) 2011-2015: G-CSC, Goethe University Frankfurt
 * Author: Martin Rupp
 *
 * This file is part of UG4.
 *
 * UG4 is free software: you can redistribute it and/or modify it under the
 * terms of the GNU Lesser General Public License version 3 (as published by the
 * Free Software Foundation) with the following additional attribution
 * requirements (according to LGPL/GPL v3 §7):
 *
 * (1) The following notice must be displayed in the Appropriate Legal Notices
 * of covered and combined works: "Based on UG4 (www.ug4.org/license)".
 *
 * (2) The following notice must be displayed at a prominent place in the
 * terminal output of covered works: "Based on UG4 (www.ug4.org/license)".
 *
 * (3) The following bibliography is recommended for citation and must be
 * preserved in all covered files:
 * "Reiter, S., Vogel, A., Heppner, I., Rupp, M., and Wittum, G. A massively
 * parallel geometric multigrid solver on hierarchically distributed grids.
 * Computing and visualization in science 16, 4 (2013), 151-164"
 * "Vogel, A., Reiter, S., Rupp, M., Nägel, A., and Wittum, G. UG4 -- a novel
 * flexible software system for simulating pde based models on high performance
 * computers. Computing and visualization in science 16, 4 (2013), 165-179"
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU Lesser General Public License for more details.
 */

#ifndef __H__LIB_ALGEBRA__COLLECT_MATRIX_H_
#define __H__LIB_ALGEBRA__COLLECT_MATRIX_H_

#include "parallel_nodes.h"
#include "serialize_interfaces.h"
#include "common/debug_print.h"

namespace ug{
template<typename matrix_type>
void SerializeRow(BinaryBuffer &stream, const matrix_type &mat, size_t localRowIndex, ParallelNodes &PN)
{
	PROFILE_FUNC_GROUP("algebra parallelization");
	const AlgebraID &globalRowIndex = PN.local_to_global(localRowIndex);
	UG_COND_THROW(globalRowIndex.master_proc() > pcl::NumProcs() || globalRowIndex.master_proc() < 0, globalRowIndex);

	// serialize global row index
	Serialize(stream, globalRowIndex);

	size_t num_connections = mat.num_connections(localRowIndex);

	// serialize number of connections
	Serialize(stream, num_connections);
	UG_DLOG(LIB_ALG_AMG, 4, "Sending row " << localRowIndex << " (" << globalRowIndex << "), " << num_connections << " cons: ");

	for(typename matrix_type::const_row_iterator conn = mat.begin_row(localRowIndex);
			conn != mat.end_row(localRowIndex); ++conn)
	{
		size_t localColIndex = conn.index();
		const AlgebraID &globalColIndex = PN.local_to_global(localColIndex);
		UG_COND_THROW(globalColIndex.master_proc() > pcl::NumProcs() || globalColIndex.master_proc() < 0, globalColIndex);

		UG_DLOG(LIB_ALG_AMG, 4, localColIndex << " (" << globalColIndex << ") -> " << conn.value() << " ");

		// serialize connection
		Serialize(stream, globalColIndex);
		Serialize(stream, conn.value());
	}
	UG_DLOG(LIB_ALG_AMG, 4, "\n");
}

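/// Serializes the whole matrix A (row count, all rows, master/slave layouts)
/// and sends it to 'destproc'. Every local row is also registered in the
/// vertical slave interface to destproc, so the receiver can address it later.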
template<typename matrix_type>
void SendMatrix(const matrix_type &A, IndexLayout &verticalSlaveLayout, int destproc, ParallelNodes &PN)
{
	PROFILE_FUNC_GROUP("algebra parallelization");
	UG_DLOG(LIB_ALG_AMG, 1, "\n*********** SendMatrix ************\n\n");

	pcl::InterfaceCommunicator<IndexLayout> &communicator = A.layouts()->comm();
	BinaryBuffer stream;

	Serialize(stream, A.num_rows());
	for(size_t i=0; i<A.num_rows(); i++)
		SerializeRow(stream, A, i, PN);

	SerializeLayout(stream, A.layouts()->master(), PN);
	SerializeLayout(stream, A.layouts()->slave(), PN);

	IndexLayout::Interface &verticalInterface = verticalSlaveLayout.interface(destproc);
	for(size_t i=0; i<A.num_rows(); i++)
		verticalInterface.push_back(i);

	UG_DLOG(LIB_ALG_AMG, 3, "Srcproc " << pcl::ProcRank() << " is sending " << stream.write_pos() << " bytes of data to destproc " << destproc << "\n");
	communicator.send_raw(destproc, stream.buffer(), stream.write_pos(), false);
	communicator.communicate();
}

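/// Reads one row from 'stream' (the counterpart to SerializeRow), translating
/// global indices back to local ones via PN. Fills 'cons' with the connections
/// and returns the local row index.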
template<typename TConnectionType>
size_t DeserializeRow(BinaryBuffer &stream, stdvector<TConnectionType> &cons, ParallelNodes &PN)
{
	PROFILE_FUNC_GROUP("algebra parallelization");
	AlgebraID globalRowIndex;

	// deserialize global row index
	Deserialize(stream, globalRowIndex);
	size_t localRowIndex = PN.global_to_local(globalRowIndex);

	UG_DLOG(LIB_ALG_AMG, 4, "Got row " << localRowIndex << " (" << globalRowIndex << "), ");
	size_t num_connections;

	// deserialize number of connections
	Deserialize(stream, num_connections);

	UG_DLOG(LIB_ALG_AMG, 4, num_connections << " connections: ");

	cons.resize(num_connections);
	for(size_t i=0; i<num_connections; i++)
	{
		AlgebraID globalColIndex;
		Deserialize(stream, globalColIndex);
		cons[i].iIndex = PN.global_to_local(globalColIndex);
		Deserialize(stream, cons[i].dValue);
		UG_DLOG(LIB_ALG_AMG, 4, cons[i].iIndex << " (" << globalColIndex << ") -> " << cons[i].dValue << " ");
	}
	UG_DLOG(LIB_ALG_AMG, 4, "\n");
	return localRowIndex;
}

// ReceiveMatrix
//---------------------------------------------------------------------------
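/// Receives the matrices sent via SendMatrix from all processes in 'srcprocs'
/// and merges them into M, starting from a copy of A. Unknown global indices
/// get fresh local indices through PN; each received row is registered in the
/// vertical master interface to its source process.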
template<typename matrix_type>
void ReceiveMatrix(const matrix_type &A, matrix_type &M, IndexLayout &verticalMasterLayout, const std::vector<int> &srcprocs,
		ParallelNodes &PN)
{
	PROFILE_FUNC_GROUP("algebra parallelization");
	UG_DLOG(LIB_ALG_AMG, 1, "\n*********** ReceiveMatrix ************\n\n");
	pcl::InterfaceCommunicator<IndexLayout> &communicator = A.layouts()->comm();

	M = A;
	//M.print();

	typedef std::map<int, BinaryBuffer> BufferMap;
	BufferMap streams;

	UG_DLOG(LIB_ALG_AMG, 3, "DestProc " << pcl::ProcRank() << " is waiting on data from ");
	for(size_t i=0; i<srcprocs.size(); i++)
	{
		UG_DLOG(LIB_ALG_AMG, 3, srcprocs[i] << " ");
		communicator.receive_raw(srcprocs[i], streams[srcprocs[i]]);
	}
	UG_DLOG(LIB_ALG_AMG, 3, "\n");
	communicator.communicate();

	AlgebraID globalRowIndex, globalColIndex;
	size_t num_connections, numRows;

	// first pass: create local indices for all received global row/column indices
	for(size_t i=0; i<srcprocs.size(); i++)
	{
		int pid = srcprocs[i];
		BinaryBuffer &stream = streams[pid];
		stream.set_read_pos(0);

		UG_DLOG(LIB_ALG_AMG, 4, "received " << stream.write_pos() << " bytes of data from process " << pid << "\n");
		IndexLayout::Interface &verticalInterface = verticalMasterLayout.interface(pid);
		typename matrix_type::connection con;

		Deserialize(stream, numRows);
		for(size_t i=0; i<numRows; i++)
		{
			// deserialize global row index, number of connections
			Deserialize(stream, globalRowIndex);
			Deserialize(stream, num_connections);
			UG_COND_THROW(globalRowIndex.master_proc() > pcl::NumProcs() || globalRowIndex.master_proc() < 0, i << " " << globalRowIndex << " " << pid);

			size_t localRowIndex = PN.get_local_index_or_create_new(globalRowIndex, 0);
			verticalInterface.push_back(localRowIndex);
			UG_DLOG(LIB_ALG_AMG, 4, "Got row " << localRowIndex << " (" << globalRowIndex << "), ");
			UG_DLOG(LIB_ALG_AMG, 4, num_connections << " connections: ");

			for(size_t j=0; j<num_connections; j++)
			{
				Deserialize(stream, globalColIndex);
				Deserialize(stream, con.dValue);

				con.iIndex = PN.get_local_index_or_create_new(globalColIndex, 0);
				UG_DLOG(LIB_ALG_AMG, 4, con.iIndex << " (" << globalColIndex << ") -> " << con.dValue << " ");
			}
			UG_DLOG(LIB_ALG_AMG, 4, "\n");
		}
	}

	M.resize_and_keep_values(PN.local_size(), PN.local_size());
	//M.print();

	// second pass: now that M is large enough, add the received rows
	for(size_t i=0; i<srcprocs.size(); i++)
	{
		int pid = srcprocs[i];
		BinaryBuffer &stream = streams[pid];
		stream.set_read_pos(0);
		stdvector<typename matrix_type::connection> cons;

		Deserialize(stream, numRows);
		for(size_t i=0; i<numRows; i++)
		{
			size_t localRowIndex = DeserializeRow(stream, cons, PN);
			if(cons.size())
				M.add_matrix_row(localRowIndex, &cons[0], cons.size());
		}
	}

	//UG_DLOG(LIB_ALG_AMG, 4, "\n** the matrix M: \n\n");
	//M.print();
	//UG_DLOG(LIB_ALG_AMG, 4, "\n");

	//UG_LOG("COLLECTED LAYOUT:\n");
	//PrintLayout(processCommunicator, communicator, masterLayout, slaveLayout);
}

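/// Collects the distributed matrix A on the first process of A's process
/// communicator: that process receives the parts of all other processes
/// (filling masterLayout), while every other process sends its part
/// (filling slaveLayout).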
template<typename matrix_type>
void CollectMatrixOnOneProc(const matrix_type &A, matrix_type &collectedA, IndexLayout &masterLayout, IndexLayout &slaveLayout)
{
	try{
		PROFILE_FUNC_GROUP("algebra parallelization");
		UG_DLOG(LIB_ALG_AMG, 1, "\n*********** CollectMatrixOnOneProc ************\n\n");
		std::vector<int> srcprocs;
		masterLayout.clear();
		slaveLayout.clear();

		const pcl::ProcessCommunicator &pc = A.layouts()->proc_comm();
		ParallelNodes PN(A.layouts(), A.num_rows());

		if(pcl::ProcRank() == pc.get_proc_id(0))
		{
			srcprocs.resize(pc.size()-1);
			for(size_t i=1; i<pc.size(); i++)
				srcprocs[i-1] = pc.get_proc_id(i);
			ReceiveMatrix(A, collectedA, masterLayout, srcprocs, PN);
		}
		else
			SendMatrix(A, slaveLayout, pc.get_proc_id(0), PN);
	}UG_CATCH_THROW(__FUNCTION__ << " failed");
}

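/* Usage sketch (illustrative; assumes a CPUAlgebra setup where `A` is the
 * local part of a distributed ParallelMatrix):
 *
 *	CPUAlgebra::matrix_type collectedA;
 *	IndexLayout masterLayout, slaveLayout;
 *	CollectMatrixOnOneProc(A, collectedA, masterLayout, slaveLayout);
 *	// afterwards, collectedA on the first process of A's process
 *	// communicator holds all rows of the distributed matrix
 */

/// Gathers the distributed vector 'vec' into 'collectedVec' on the root
/// process over the agglomeration layouts: non-root processes send their
/// entries through the slave interfaces; the root accumulates them
/// (PST_ADDITIVE) or copies them (PST_CONSISTENT).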
template<typename T>
void GatherVectorOnOne(IndexLayout &agglomeratedMaster, IndexLayout &agglomeratedSlave,
		pcl::InterfaceCommunicator<IndexLayout> &com,
		ParallelVector<T> &collectedVec,
		const ParallelVector<T> &vec,
		ParallelStorageType type, bool bRoot)
{
	try{
		PROFILE_FUNC_GROUP("algebra parallelization");
		typedef ParallelVector<T> vector_type;
		if(!bRoot)
		{
			ComPol_VecAdd<vector_type> compolAdd(&collectedVec, &vec);
			com.send_data(agglomeratedSlave, compolAdd);
			com.communicate();
		}
		else
		{
			//UG_LOG("gather_vertical: receiving data at level " << level << "\n");
			UG_COND_THROW(&vec == &collectedVec, "vec and collected vec may not be same");
			collectedVec.set(0.0);
			for(size_t i=0; i<vec.size(); i++)
				collectedVec[i] = vec[i];

			UG_COND_THROW(!vec.has_storage_type(type), "storage type is " << vec.get_storage_type() << ", not " << type);
			if(type == PST_ADDITIVE)
			{
				ComPol_VecAdd<vector_type> compolAdd(&collectedVec, &vec);
				com.receive_data(agglomeratedMaster, compolAdd);
				com.communicate();
				collectedVec.set_storage_type(PST_ADDITIVE);
			}
			else if(type == PST_CONSISTENT)
			{
				ComPol_VecCopy<vector_type> compolCopy(&collectedVec, &vec);
				com.receive_data(agglomeratedMaster, compolCopy);
				com.communicate();
				collectedVec.set_storage_type(PST_CONSISTENT);
			}
			else { UG_THROW("storage type " << type << " unsupported."); }
		}
	}UG_CATCH_THROW(__FUNCTION__ << " failed");
}

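/// Distributes 'collectedVec' from the root process back to all processes over
/// the agglomeration layouts: the root copies its entries and sends through the
/// master interfaces, non-root processes receive through the slave interfaces.
/// Only PST_CONSISTENT is supported (see the comment in the additive branch).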
template<typename T>
void BroadcastVectorFromOne(IndexLayout &agglomeratedMaster, IndexLayout &agglomeratedSlave,
		pcl::InterfaceCommunicator<IndexLayout> &com,
		ParallelVector<T> &vec,
		const ParallelVector<T> &collectedVec,
		ParallelStorageType type, bool bRoot)
{
	PROFILE_FUNC_GROUP("algebra parallelization");
	try{
		typedef ParallelVector<T> vector_type;
		if(!bRoot)
		{
			ComPol_VecCopy<vector_type> compolCopy(&vec, &collectedVec);
			com.receive_data(agglomeratedSlave, compolCopy);
			com.communicate();
			vec.set_storage_type(type);
		}
		else
		{
			UG_COND_THROW(&vec == &collectedVec, "vec and collected vec may not be same");
			for(size_t i=0; i<vec.size(); i++)
				vec[i] = collectedVec[i];

			UG_COND_THROW(!collectedVec.has_storage_type(type), "storage type is " << collectedVec.get_storage_type() << ", not " << type);
			vec.set_storage_type(type);

			ComPol_VecAdd<vector_type> compolCopy(&vec, &collectedVec);
			com.send_data(agglomeratedMaster, compolCopy);
			com.communicate();
		}

		if(type == PST_ADDITIVE)
		{
			UG_THROW("ONLY CONSISTENT!");
			// the problem is that the vector can still have slave interfaces to the
			// "outside"; those entries would then incorrectly be set to 0 as well.

			//vec.set_storage_type(PST_ADDITIVE);
		}
		else if(type == PST_CONSISTENT) { }
		else { UG_THROW("storage type " << type << " unsupported."); }

	}UG_CATCH_THROW(__FUNCTION__ << " failed");
}
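
/* Usage sketch for an agglomerated solve (illustrative; `com`, the layouts and
 * the vector names are the caller's, e.g. those built alongside
 * CollectMatrixOnOneProc):
 *
 *	// gather the additive defect on the root, solve there, then broadcast
 *	// the consistent correction back to all processes
 *	GatherVectorOnOne(masterLayout, slaveLayout, com, collectedD, d, PST_ADDITIVE, bRoot);
 *	// ... the root applies a solver to the collected system ...
 *	BroadcastVectorFromOne(masterLayout, slaveLayout, com, c, collectedC, PST_CONSISTENT, bRoot);
 */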

} // namespace ug

#endif /* __H__LIB_ALGEBRA__COLLECT_MATRIX_H_ */