dg/html/mpi__collective_8h_source.html

#pragma once

#include <cassert>

#include <thrust/sequence.h>

#include <thrust/sort.h>

#include <thrust/gather.h>

#include <thrust/scatter.h>


#include <thrust/host_vector.h>

#include <thrust/device_vector.h>

#include "blas1_dispatch_shared.h"

#include "dg/blas1.h"

#include "memory.h"

#include "mpi_communicator.h"


namespace dg{


template<class Index, class Vector>

struct Collective

{

    Collective(){

        m_comm = MPI_COMM_NULL;

    }

    Collective( const thrust::host_vector<int>& sendTo, MPI_Comm comm) {

        construct( sendTo, comm);

    }


    void construct( thrust::host_vector<int> sendTo, MPI_Comm comm){

        //sollte schnell sein

        thrust::host_vector<int> recvFrom(sendTo), accS(sendTo), accR(sendTo);

        m_comm=comm;

        int rank, size;

        MPI_Comm_rank( m_comm, &rank);

        MPI_Comm_size( m_comm, &size);

        assert( sendTo.size() == (unsigned)size);

        thrust::host_vector<unsigned> global( size*size);

        MPI_Allgather( sendTo.data(), size, MPI_UNSIGNED,

                       global.data(), size, MPI_UNSIGNED,

                       m_comm);

        for( unsigned i=0; i<(unsigned)size; i++)

            recvFrom[i] = global[i*size+rank];

        thrust::exclusive_scan( sendTo.begin(),   sendTo.end(),   accS.begin());

        thrust::exclusive_scan( recvFrom.begin(), recvFrom.end(), accR.begin());

        m_sendTo=sendTo, m_recvFrom=recvFrom, m_accS=accS, m_accR=accR;

    }

    unsigned size() const {return values_size();}

    MPI_Comm comm() const {return m_comm;}


    void transpose(){ m_sendTo.swap( m_recvFrom);}

    void invert(){ m_sendTo.swap( m_recvFrom);}


    void scatter( const Vector& values, Vector& store) const;

    void gather( const Vector& store, Vector& values) const;

    unsigned store_size() const{

        if( m_recvFrom.empty())

            return 0;

        return thrust::reduce( m_recvFrom.begin(), m_recvFrom.end() );

    }

    unsigned values_size() const{

        if( m_sendTo.empty())

            return 0;

        return thrust::reduce( m_sendTo.begin(), m_sendTo.end() );

    }

    MPI_Comm communicator() const{return m_comm;}

    private:

    unsigned sendTo( unsigned pid) const {return m_sendTo[pid];}

    unsigned recvFrom( unsigned pid) const {return m_recvFrom[pid];}

#ifdef _DG_CUDA_UNAWARE_MPI

    thrust::host_vector<int> m_sendTo,   m_accS;

    thrust::host_vector<int> m_recvFrom, m_accR;

    dg::Buffer<thrust::host_vector<get_value_type<Vector> >> m_values, m_store;

#else

//surprisingly MPI_Alltoallv wants the integers to be on the host, only

//the data is on the device (does this question the necessity of Index?)

    thrust::host_vector<int> m_sendTo,   m_accS; //accumulated send

    thrust::host_vector<int> m_recvFrom, m_accR; //accumulated recv

#endif // _DG_CUDA_UNAWARE_MPI

    MPI_Comm m_comm;

};


template< class Index, class Device>

void Collective<Index, Device>::scatter( const Device& values, Device& store) const

{

    //assert( store.size() == store_size() );

#if THRUST_DEVICE_SYSTEM==THRUST_DEVICE_SYSTEM_CUDA

    if( std::is_same< get_execution_policy<Device>, CudaTag>::value ) //could be serial tag

    {

        cudaError_t code = cudaGetLastError( );

        if( code != cudaSuccess)

            throw dg::Error(dg::Message(_ping_)<<cudaGetErrorString(code));

        code = cudaDeviceSynchronize(); //needs to be called

        if( code != cudaSuccess)

            throw dg::Error(dg::Message(_ping_)<<cudaGetErrorString(code));

    }

#endif //THRUST_DEVICE_SYSTEM

#ifdef _DG_CUDA_UNAWARE_MPI

    m_values.data() = values;

    m_store.data().resize( store.size());

    MPI_Alltoallv(

            thrust::raw_pointer_cast( m_values.data().data()),

            thrust::raw_pointer_cast( m_sendTo.data()),

            thrust::raw_pointer_cast( m_accS.data()), getMPIDataType<get_value_type<Device> >(),

            thrust::raw_pointer_cast( m_store.data().data()),

            thrust::raw_pointer_cast( m_recvFrom.data()),

            thrust::raw_pointer_cast( m_accR.data()), getMPIDataType<get_value_type<Device> >(), m_comm);

    store = m_store.data();

#else

    MPI_Alltoallv(

            thrust::raw_pointer_cast( values.data()),

            thrust::raw_pointer_cast( m_sendTo.data()),

            thrust::raw_pointer_cast( m_accS.data()), getMPIDataType<get_value_type<Device> >(),

            thrust::raw_pointer_cast( store.data()),

            thrust::raw_pointer_cast( m_recvFrom.data()),

            thrust::raw_pointer_cast( m_accR.data()), getMPIDataType<get_value_type<Device> >(), m_comm);

#endif //_DG_CUDA_UNAWARE_MPI

}


template< class Index, class Device>

void Collective<Index, Device>::gather( const Device& gatherFrom, Device& values) const

{

    //assert( gatherFrom.size() == store_size() );

    values.resize( values_size() );

#if THRUST_DEVICE_SYSTEM==THRUST_DEVICE_SYSTEM_CUDA

    if( std::is_same< get_execution_policy<Device>, CudaTag>::value ) //could be serial tag

    {

        cudaError_t code = cudaGetLastError( );

        if( code != cudaSuccess)

            throw dg::Error(dg::Message(_ping_)<<cudaGetErrorString(code));

        code = cudaDeviceSynchronize(); //needs to be called

        if( code != cudaSuccess)

            throw dg::Error(dg::Message(_ping_)<<cudaGetErrorString(code));

    }

#endif //THRUST_DEVICE_SYSTEM

#ifdef _DG_CUDA_UNAWARE_MPI

    m_store.data() = gatherFrom;

    m_values.data().resize( values.size());

    MPI_Alltoallv(

            thrust::raw_pointer_cast( m_store.data().data()),

            thrust::raw_pointer_cast( m_recvFrom.data()),

            thrust::raw_pointer_cast( m_accR.data()), getMPIDataType<get_value_type<Device> >(),

            thrust::raw_pointer_cast( m_values.data().data()),

            thrust::raw_pointer_cast( m_sendTo.data()),

            thrust::raw_pointer_cast( m_accS.data()), getMPIDataType<get_value_type<Device> >(), m_comm);

    values = m_values.data();

#else

    MPI_Alltoallv(

            thrust::raw_pointer_cast( gatherFrom.data()),

            thrust::raw_pointer_cast( m_recvFrom.data()),

            thrust::raw_pointer_cast( m_accR.data()), getMPIDataType<get_value_type<Device> >(),

            thrust::raw_pointer_cast( values.data()),

            thrust::raw_pointer_cast( m_sendTo.data()),

            thrust::raw_pointer_cast( m_accS.data()), getMPIDataType<get_value_type<Device> >(), m_comm);

#endif //_DG_CUDA_UNAWARE_MPI

}

//BijectiveComm ist der Spezialfall, dass jedes Element nur ein einziges Mal gebraucht wird.


template< class Index, class Vector>

struct BijectiveComm : public aCommunicator<Vector>

{

    BijectiveComm( ) = default;

    BijectiveComm( const thrust::host_vector<int>& pids, MPI_Comm comm) {

        construct( pids, comm);

    }

    BijectiveComm( unsigned local_size, thrust::host_vector<int> localIndexMap, thrust::host_vector<int> pidIndexMap, MPI_Comm comm)

    {

        construct( pidIndexMap, comm);

        m_p.transpose();

    }

    template<class ConversionPolicy>

    BijectiveComm( const thrust::host_vector<int>& globalIndexMap, const ConversionPolicy& p)

    {

        thrust::host_vector<int> local(globalIndexMap.size()), pids(globalIndexMap.size());

        bool success = true;

        for(unsigned i=0; i<local.size(); i++)

            if( !p.global2localIdx(globalIndexMap[i], local[i], pids[i]) ) success = false;

        assert( success);

        construct( pids, p.communicator());

        m_p.transpose();

    }


    template<class OtherIndex, class OtherVector>

    BijectiveComm( const BijectiveComm<OtherIndex, OtherVector>& src) {

        construct( src.get_pids(), src.communicator());

    }


    const thrust::host_vector<int>& get_pids()const{return m_pids;}

    virtual BijectiveComm* clone() const override final {return new BijectiveComm(*this);}

    private:

    void compute_global_comm(){

        if( m_p.communicator()  == MPI_COMM_NULL){

            m_global_comm = false;

            return;

        }

        int rank;

        MPI_Comm_rank( m_p.communicator(), &rank);

        bool local_communicating = false, global_communicating=false;

        for( unsigned i=0; i<m_pids.size(); i++)

            if( m_pids[i] != rank)

                local_communicating = true;

        MPI_Allreduce( &local_communicating, &global_communicating, 1,

                       MPI_C_BOOL, MPI_LOR, m_p.communicator());

        m_global_comm = global_communicating;

    }

    virtual bool do_isCommunicating() const override final{ return m_global_comm;}

    virtual MPI_Comm do_communicator() const override final {return m_p.communicator();}

    virtual unsigned do_size() const override final { return m_p.store_size();}

    virtual Vector do_make_buffer()const override final{

        Vector tmp( do_size() );

        return tmp;

    }

    void construct( thrust::host_vector<int> pids, MPI_Comm comm)

    {

        this->set_local_size( pids.size());

        m_pids = pids;

        dg::assign( pids, m_idx);

        int size;

        MPI_Comm_size( comm, &size);

        for( unsigned i=0; i<pids.size(); i++)

            assert( 0 <= pids[i] && pids[i] < size);

        thrust::host_vector<int> index(pids);

        thrust::sequence( index.begin(), index.end());

        thrust::stable_sort_by_key( pids.begin(), pids.end(), index.begin());//note: this also sorts the pids

        m_idx=index;

        //now we can repeat/invert the sort by a gather/scatter operation with index as map

        //i.e. we could sort pids by a gather


        //Now construct the collective object by getting the number of elements to send

        thrust::host_vector<int> one( pids.size(), 1), keys(one), number(one);

        typedef thrust::host_vector<int>::iterator iterator;

        thrust::pair< iterator, iterator> new_end =

            thrust::reduce_by_key( pids.begin(), pids.end(), //sorted!

                one.begin(), keys.begin(), number.begin() );

        unsigned distance = thrust::distance( keys.begin(), new_end.first);

        thrust::host_vector<int> sendTo( size, 0 );

        for( unsigned i=0; i<distance; i++)

            sendTo[keys[i]] = number[i];

        m_p.construct( sendTo, comm);

        m_values.data().resize( m_idx.size());

        compute_global_comm();

    }

    virtual void do_global_gather( const get_value_type<Vector>* values, Vector& store)const override final

    {

        //actually this is a scatter but we constructed it invertedly

        //we could maybe transpose the Collective object!?

        //assert( values.size() == m_idx.size());

        //nach PID ordnen

        typename Vector::const_pointer values_ptr(values);

        //senden

        if( m_global_comm)

        {

            thrust::gather( m_idx.begin(), m_idx.end(), values_ptr, m_values.data().begin());

            m_p.scatter( m_values.data(), store);

        }

        else

            thrust::gather( m_idx.begin(), m_idx.end(), values_ptr, store.begin());

    }


    virtual void do_global_scatter_reduce( const Vector& toScatter, get_value_type<Vector>* values) const override final

    {

        //actually this is a gather but we constructed it invertedly

        typename Vector::pointer values_ptr(values);

        if( m_global_comm)

        {

            m_p.gather( toScatter, m_values.data());

            //nach PID geordnete Werte wieder umsortieren

            thrust::scatter( m_values.data().begin(), m_values.data().end(), m_idx.begin(), values_ptr);

        }

        else

        {

            thrust::scatter( toScatter.begin(), toScatter.end(), m_idx.begin(), values_ptr);

        }

    }

    Buffer<Vector> m_values;

    Index m_idx;

    Collective<Index, Vector> m_p;

    thrust::host_vector<int> m_pids;

    bool m_global_comm = false;

};


template< class Index, class Vector>

struct SurjectiveComm : public aCommunicator<Vector>

{

    SurjectiveComm(){

        m_buffer_size = m_store_size = 0;

    }

    SurjectiveComm( unsigned local_size, const thrust::host_vector<int>& localIndexMap, const thrust::host_vector<int>& pidIndexMap, MPI_Comm comm)

    {

        construct( local_size, localIndexMap, pidIndexMap, comm);

    }


    template<class ConversionPolicy>

    SurjectiveComm( const thrust::host_vector<int>& globalIndexMap, const ConversionPolicy& p)

    {

        thrust::host_vector<int> local(globalIndexMap.size()), pids(globalIndexMap.size());

        bool success = true;

        for(unsigned i=0; i<local.size(); i++)

            if( !p.global2localIdx(globalIndexMap[i], local[i], pids[i]) ) success = false;


        assert( success);

        construct( p.local_size(), local, pids, p.communicator());

    }


    template<class OtherIndex, class OtherVector>

    SurjectiveComm( const SurjectiveComm<OtherIndex, OtherVector>& src)

    {

        construct( src.local_size(), src.getLocalIndexMap(), src.getPidIndexMap(), src.communicator());

    }


    const thrust::host_vector<int>& getLocalIndexMap() const {return m_localIndexMap;}

    const thrust::host_vector<int>& getPidIndexMap() const {return m_pidIndexMap;}

    const Index& getSortedIndexMap() const {return m_sortedIndexMap;}

    virtual SurjectiveComm* clone() const override final {return new SurjectiveComm(*this);}

    bool isLocalBijective() const {return !m_reduction;}

    private:

    virtual bool do_isCommunicating() const override final{

        return m_bijectiveComm.isCommunicating();

    }

    virtual Vector do_make_buffer()const override final{

        Vector tmp(do_size());

        return tmp;

    }

    virtual void do_global_gather( const get_value_type<Vector>* values, Vector& buffer)const override final

    {

        //gather values to store

        typename Vector::const_pointer values_ptr(values);

        thrust::gather( m_IndexMap.begin(), m_IndexMap.end(), values_ptr, m_store.data().begin());

        m_bijectiveComm.global_scatter_reduce( m_store.data(), thrust::raw_pointer_cast(buffer.data()));

    }

    virtual void do_global_scatter_reduce( const Vector& toScatter, get_value_type<Vector>* values)const override final

    {

        //now perform a local sort, reduce and scatter operation

        typename Vector::pointer values_ptr(values);

        if( m_reduction)

        {

            //first gather values into temporary store

            Vector storet = m_bijectiveComm.global_gather( thrust::raw_pointer_cast(toScatter.data()));

            thrust::gather( m_sortMap.begin(), m_sortMap.end(), storet.begin(), m_store.data().begin());

            thrust::reduce_by_key( m_sortedIndexMap.begin(), m_sortedIndexMap.end(), m_store.data().begin(), m_keys.data().begin(), values_ptr);

        }

        else

        {

            m_bijectiveComm.global_gather( thrust::raw_pointer_cast(toScatter.data()), m_store.data());

            thrust::gather( m_sortMap.begin(), m_sortMap.end(), m_store.data().begin(), values_ptr);

        }


    }

    virtual MPI_Comm do_communicator()const override final{return m_bijectiveComm.communicator();}

    virtual unsigned do_size() const override final {return m_buffer_size;}

    void construct( unsigned local_size, thrust::host_vector<int> localIndexMap, thrust::host_vector<int> pidIndexMap, MPI_Comm comm)

    {

        this->set_local_size(local_size);

        m_bijectiveComm = BijectiveComm<Index, Vector>( pidIndexMap, comm);

        m_localIndexMap = localIndexMap, m_pidIndexMap = pidIndexMap;

        m_buffer_size = localIndexMap.size();

        assert( m_buffer_size == pidIndexMap.size());

        //the bijectiveComm behaves as if we had given the index map for the store

        //now gather the localIndexMap from the buffer to the store to get the final index map

        Vector m_localIndexMapd = dg::construct<Vector>( localIndexMap);

        const typename aCommunicator<Vector>::value_type * v_ptr = thrust::raw_pointer_cast(m_localIndexMapd.data());

        Vector gatherMapV = m_bijectiveComm.global_gather( v_ptr); // a scatter wrt to the buffer

        m_sortMap = m_sortedIndexMap = m_IndexMap = dg::construct<Index>(gatherMapV);

        //now prepare a reduction map and a scatter map

        thrust::sequence( m_sortMap.begin(), m_sortMap.end());

        thrust::stable_sort_by_key( m_sortedIndexMap.begin(), m_sortedIndexMap.end(), m_sortMap.begin());//note: this sorts both keys and values (m_sortedIndexMap, m_sortMap)

        //now we can repeat/invert the sort by a gather/scatter operation with sortMap as map

        // if bijective, sortMap is the inverse of IndexMap

        m_store_size = m_IndexMap.size();

        m_store.data().resize( m_store_size);

        m_keys.data().resize( m_store_size);

        // Check if reduction is necessary

        Vector temp( m_store_size);

        auto new_end = thrust::reduce_by_key( m_sortedIndexMap.begin(), m_sortedIndexMap.end(), m_store.data().begin(), m_keys.data().begin(), temp.begin());

        if( new_end.second == temp.end())

            m_reduction = false;


    }

    unsigned m_buffer_size, m_store_size;

    BijectiveComm<Index, Vector> m_bijectiveComm;

    Index m_IndexMap, m_sortMap, m_sortedIndexMap;

    Buffer<Index> m_keys;

    Buffer<Vector> m_store;

    thrust::host_vector<int> m_localIndexMap, m_pidIndexMap;

    bool m_reduction = true;

};


template< class Index, class Vector>

struct GeneralComm : public aCommunicator<Vector>

{

    GeneralComm() = default;

    GeneralComm( unsigned local_size, const thrust::host_vector<int>& localIndexMap, const thrust::host_vector<int>& pidIndexMap, MPI_Comm comm) {

        construct(local_size, localIndexMap, pidIndexMap, comm);

    }


    template<class ConversionPolicy>

    GeneralComm( const thrust::host_vector<int>& globalIndexMap, const ConversionPolicy& p)

    {

        thrust::host_vector<int> local(globalIndexMap.size()), pids(globalIndexMap.size());

        bool success = true;

        for(unsigned i=0; i<local.size(); i++)

            if( !p.global2localIdx(globalIndexMap[i], local[i], pids[i]) ) success = false;

        assert( success);

        construct(p.local_size(), local, pids, p.communicator());

    }


    template<class OtherIndex, class OtherVector>

    GeneralComm( const GeneralComm<OtherIndex, OtherVector>& src){

        if( src.buffer_size() > 0)

            construct( src.local_size(), src.getLocalIndexMap(), src.getPidIndexMap(), src.communicator());

    }


    const thrust::host_vector<int>& getLocalIndexMap() const {return m_surjectiveComm.getLocalIndexMap();}

    const thrust::host_vector<int>& getPidIndexMap() const {return m_surjectiveComm.getPidIndexMap();}

    virtual GeneralComm* clone() const override final {return new GeneralComm(*this);}

    private:

    virtual bool do_isCommunicating() const override final{

        return m_surjectiveComm.isCommunicating();

    }

    virtual Vector do_make_buffer() const override final{

        Vector tmp(do_size());

        return tmp;

    }

    virtual MPI_Comm do_communicator()const override final{return m_surjectiveComm.communicator();}

    virtual void do_global_gather( const get_value_type<Vector>* values, Vector& sink)const override final {

        m_surjectiveComm.global_gather( values, sink);

    }

    virtual void do_global_scatter_reduce( const Vector& toScatter, get_value_type<Vector>* values)const override final {

        m_surjectiveComm.global_scatter_reduce( toScatter, thrust::raw_pointer_cast(m_store.data().data()));

        typename Vector::pointer values_ptr(values);

        dg::blas1::detail::doSubroutine_dispatch(

            get_execution_policy<Vector>(),

            this->local_size(),

            dg::equals(),

            0,

            values

        );

        thrust::scatter( m_store.data().begin(), m_store.data().end(), m_scatterMap.begin(), values_ptr);

    }


    virtual unsigned do_size() const override final{return m_surjectiveComm.buffer_size();}

    void construct( unsigned local_size, const thrust::host_vector<int>& localIndexMap, const thrust::host_vector<int>& pidIndexMap, MPI_Comm comm)

    {

        this->set_local_size( local_size);

        m_surjectiveComm = SurjectiveComm<Index,Vector>(local_size, localIndexMap, pidIndexMap, comm);


        const Index& m_sortedIndexMap = m_surjectiveComm.getSortedIndexMap();

        thrust::host_vector<int> gatherMap = dg::construct<thrust::host_vector<int>>( m_sortedIndexMap);

        thrust::host_vector<int> one( gatherMap.size(), 1), keys(one), number(one);

        typedef thrust::host_vector<int>::iterator iterator;

        thrust::pair< iterator, iterator> new_end =

            thrust::reduce_by_key( gatherMap.begin(), gatherMap.end(), //sorted!

                one.begin(), keys.begin(), number.begin() );

        unsigned distance = thrust::distance( keys.begin(), new_end.first);

        m_store.data().resize( distance);

        m_scatterMap.resize(distance);

        thrust::copy( keys.begin(), keys.begin() + distance, m_scatterMap.begin());

    }

    SurjectiveComm<Index, Vector> m_surjectiveComm;

    Buffer<Vector> m_store;

    Index m_scatterMap;

};


}//namespace dg

blas1.h

dg::Error
class intended for the use in throw statements
Definition: exceptions.h:83

dg::Message
small class holding a stringstream
Definition: exceptions.h:29

_ping_
#define _ping_
Definition: exceptions.h:12

dg::construct
ContainerType construct(const from_ContainerType &from, Params &&... ps)
Generic way to construct an object of ContainerType given a from_ContainerType object and optional ad...
Definition: blas1.h:696

dg::assign
void assign(const from_ContainerType &from, ContainerType &to, Params &&... ps)
Generic way to assign the contents of a from_ContainerType object to a ContainerType object optionall...
Definition: blas1.h:665

dg::one
static DG_DEVICE double one(double x)
Definition: functions.h:20

dg::blas1::copy
void copy(const ContainerTypeIn &source, ContainerTypeOut &target)
Definition: blas1.h:164

dg::blas1::reduce
OutputType reduce(const ContainerType &x, OutputType zero, BinaryOp binary_op, UnaryOp unary_op=UnaryOp())
Custom (transform) reduction
Definition: blas1.h:139

dg::invert
dg::Operator< T > invert(const dg::Operator< T > &in)
Alias for dg::create::inverse. Compute inverse of square matrix.
Definition: operator.h:695

dg::transpose
void transpose(unsigned nx, unsigned ny, const ContainerType &in, ContainerType &out)
Transpose vector.
Definition: average_dispatch.h:26

dg::is_same
bool is_same(double x, double y, double eps=1e-15)
Definition: runge_kutta.h:948

memory.h

mpi_communicator.h

dg
This is the namespace for all functions and classes defined and used by the discontinuous Galerkin li...

dg::BijectiveComm
Perform bijective gather and its transpose (scatter) operation across processes on distributed vector...
Definition: mpi_collective.h:208

dg::BijectiveComm::get_pids
const thrust::host_vector< int > & get_pids() const
These are the pids that were given in the Constructor.
Definition: mpi_collective.h:262

dg::BijectiveComm::BijectiveComm
BijectiveComm(const thrust::host_vector< int > &globalIndexMap, const ConversionPolicy &p)
Construct from global indices index map.
Definition: mpi_collective.h:241

dg::BijectiveComm::BijectiveComm
BijectiveComm(const BijectiveComm< OtherIndex, OtherVector > &src)
reconstruct from another type; if src is empty, same as default constructor
Definition: mpi_collective.h:254

dg::BijectiveComm::BijectiveComm
BijectiveComm(const thrust::host_vector< int > &pids, MPI_Comm comm)
Construct from a given scatter map (inverse index map) with respect to the source/data vector.
Definition: mpi_collective.h:226

dg::BijectiveComm::BijectiveComm
BijectiveComm()=default
no memory allocation; size 0

dg::BijectiveComm::clone
virtual BijectiveComm * clone() const override final
Generic copy method.
Definition: mpi_collective.h:263

dg::BijectiveComm::BijectiveComm
BijectiveComm(unsigned local_size, thrust::host_vector< int > localIndexMap, thrust::host_vector< int > pidIndexMap, MPI_Comm comm)
Construct from local indices and PIDs index map.
Definition: mpi_collective.h:232

dg::Buffer
a manager class that invokes the copy constructor on the managed ptr when copied (deep copy)
Definition: memory.h:152

dg::Buffer::data
T & data() const
Get write access to the data on the heap.
Definition: memory.h:187

dg::GeneralComm
Perform general gather and its transpose (scatter) operation across processes on distributed vectors ...
Definition: mpi_collective.h:504

dg::GeneralComm::GeneralComm
GeneralComm(unsigned local_size, const thrust::host_vector< int > &localIndexMap, const thrust::host_vector< int > &pidIndexMap, MPI_Comm comm)
Construct from local indices and PIDs index map.
Definition: mpi_collective.h:518

dg::GeneralComm::GeneralComm
GeneralComm(const thrust::host_vector< int > &globalIndexMap, const ConversionPolicy &p)
Construct from global indices index map.
Definition: mpi_collective.h:538

dg::GeneralComm::getPidIndexMap
const thrust::host_vector< int > & getPidIndexMap() const
read access to the pid index map given in constructor
Definition: mpi_collective.h:558

dg::GeneralComm::GeneralComm
GeneralComm()=default
no memory allocation; size 0

dg::GeneralComm::clone
virtual GeneralComm * clone() const override final
Generic copy method.
Definition: mpi_collective.h:559

dg::GeneralComm::GeneralComm
GeneralComm(const GeneralComm< OtherIndex, OtherVector > &src)
reconstruct from another type; if src is empty, same as default constructor
Definition: mpi_collective.h:550

dg::GeneralComm::getLocalIndexMap
const thrust::host_vector< int > & getLocalIndexMap() const
read access to the local index index map given in constructor
Definition: mpi_collective.h:556

dg::SurjectiveComm
Perform surjective gather and its transpose (scatter) operation across processes on distributed vecto...
Definition: mpi_collective.h:374

dg::SurjectiveComm::SurjectiveComm
SurjectiveComm(unsigned local_size, const thrust::host_vector< int > &localIndexMap, const thrust::host_vector< int > &pidIndexMap, MPI_Comm comm)
Construct from local indices and PIDs index map.
Definition: mpi_collective.h:381

dg::SurjectiveComm::SurjectiveComm
SurjectiveComm()
no memory allocation; size 0
Definition: mpi_collective.h:376

dg::SurjectiveComm::getPidIndexMap
const thrust::host_vector< int > & getPidIndexMap() const
read access to the pid index map given in constructor
Definition: mpi_collective.h:410

dg::SurjectiveComm::getSortedIndexMap
const Index & getSortedIndexMap() const
Definition: mpi_collective.h:411

dg::SurjectiveComm::isLocalBijective
bool isLocalBijective() const
No reduction on this process? True: no reduction, False: need to reduce.
Definition: mpi_collective.h:414

dg::SurjectiveComm::getLocalIndexMap
const thrust::host_vector< int > & getLocalIndexMap() const
read access to the local index index map given in constructor
Definition: mpi_collective.h:408

dg::SurjectiveComm::SurjectiveComm
SurjectiveComm(const SurjectiveComm< OtherIndex, OtherVector > &src)
reconstruct from another type; if src is empty, same as default constructor
Definition: mpi_collective.h:402

dg::SurjectiveComm::SurjectiveComm
SurjectiveComm(const thrust::host_vector< int > &globalIndexMap, const ConversionPolicy &p)
Construct from global indices index map.
Definition: mpi_collective.h:389

dg::SurjectiveComm::clone
virtual SurjectiveComm * clone() const override final
Generic copy method.
Definition: mpi_collective.h:412

dg::aCommunicator
Struct that performs collective scatter and gather operations across processes on distributed vectors...
Definition: mpi_communicator.h:98

dg::aCommunicator< Vector >::local_size
unsigned local_size() const
The local size of the source vector v = local size of the  dg::MPI_Vector
Definition: mpi_communicator.h:190

dg::aCommunicator< Vector >::value_type
get_value_type< Vector > value_type
reveal value type
Definition: mpi_communicator.h:99

dg::aCommunicator::buffer_size
unsigned buffer_size() const
The local size of the buffer vector w = local map size.
Definition: mpi_communicator.h:178

dg::aCommunicator< Vector >::set_local_size
void set_local_size(unsigned new_size)
Set the local size of the source vector v.
Definition: mpi_communicator.h:242

dg::aCommunicator::communicator
MPI_Comm communicator() const
The internal MPI communicator used.
Definition: mpi_communicator.h:220

dg::equals
Definition: subroutines.h:22