4#include <thrust/host_vector.h>
20template<
template<
typename>
typename Vector>
21struct MPIContiguousKroneckerGather
23 MPIContiguousKroneckerGather( MPI_Comm comm = MPI_COMM_NULL) : m_mpi_gather(comm){ }
24 MPIContiguousKroneckerGather(
25 const std::map<
int, thrust::host_vector<int>>& recvIdx,
28 : m_recvIdx(recvIdx), m_chunk_size(chunk_size)
31 MPI_Cartdim_get( comm_1d, &ndims);
34 MPI_Comm_rank( comm_1d, &rank);
36 "Only Shared vectors allowed");
37 auto recvChunks = detail::MPIContiguousGather::make_chunks(
39 m_mpi_gather = dg::detail::MPIContiguousGather( recvChunks, comm_1d);
40 m_buffer_size = m_mpi_gather.buffer_size(
false);
42 template<
template<
class>
class OtherVector>
43 friend class MPIContiguousKroneckerGather;
45 template<
template<
typename >
typename OtherVector>
46 MPIContiguousKroneckerGather(
const MPIContiguousKroneckerGather<OtherVector>& src)
47 : m_mpi_gather( src.m_mpi_gather),
48 m_recvIdx(src.m_recvIdx),
49 m_chunk_size(src.m_chunk_size),
50 m_buffer_size(src.m_buffer_size)
54 MPI_Comm communicator()
const{
return m_mpi_gather.communicator();}
56 unsigned buffer_size()
const {
return detail::flatten_map( m_recvIdx).size(); }
57 unsigned chunk_size()
const {
return m_chunk_size; }
58 bool isCommunicating()
const{
return m_mpi_gather.isCommunicating(); }
60 template<
class ContainerType>
61 void global_gather_init(
const ContainerType& gatherFrom)
const
64 m_buffer.template set<value_type>( m_buffer_size);
65 auto& buffer = m_buffer.template get<value_type>();
66 m_mpi_gather.global_gather_init( gatherFrom, buffer,
false);
68 template<
class ContainerType>
69 void global_gather_wait(
const ContainerType& gatherFrom,
73 auto& buffer = m_buffer.template get<value_type>();
74 m_mpi_gather.global_gather_wait( buffer);
77 MPI_Comm_rank( communicator(), &rank);
78 unsigned start = 0, buffer_start = 0;
79 for(
auto& idx : m_recvIdx)
80 for(
unsigned u=0; u<idx.second.size(); u++)
82 if( rank != idx.first)
84 buffer_ptrs[start] = thrust::raw_pointer_cast(
85 buffer.data()) + buffer_start*m_chunk_size;
89 buffer_ptrs[start] = thrust::raw_pointer_cast(
90 gatherFrom.data()) + idx.second[u]*m_chunk_size;
96 dg::detail::MPIContiguousGather m_mpi_gather;
97 std::map<int,thrust::host_vector<int>> m_recvIdx;
98 unsigned m_chunk_size = 0;
99 unsigned m_buffer_size = 0;
100 mutable detail::AnyVector<Vector> m_buffer;
142template<
template<
typename>
typename Vector>
165 const std::map<
int, thrust::host_vector<int>>& recvIdx,
171 m_contiguous = (left_size==1);
173 if( not m_contiguous)
177 detail::Unique<int> uni = detail::find_unique_order_preserving(
178 detail::flatten_map( sendIdx));
179 auto uni_sendIdx = detail::make_map_t<thrust::host_vector<int>>(
180 detail::combine_gather( uni.gather1, uni.gather2),
181 detail::get_size_map( sendIdx));
185 m_mpi_gather = detail::MPIContiguousKroneckerGather<Vector>(
186 uni_recvIdx, n*left_size*right_size, comm_1d);
190 thrust::host_vector<int> g2( uni.unique.size()*n*left_size*
192 for(
unsigned l=0; l<uni.unique.size(); l++)
193 for(
unsigned j=0; j<n; j++)
194 for(
unsigned i=0; i<left_size; i++)
195 for(
unsigned k=0; k<right_size; k++)
196 g2[((l*n+j)*left_size+i)*right_size + k] =
197 ((i*num_cols + uni.unique[l])*n + j)*right_size + k;
201 m_mpi_gather = detail::MPIContiguousKroneckerGather<Vector>(
202 recvIdx, n*left_size*right_size, comm_1d);
206 template<
template<
class>
class OtherVector>
210 template<
template<
typename >
typename OtherVector>
212 : m_contiguous( src.m_contiguous),
214 m_mpi_gather( src.m_mpi_gather)
222 unsigned buffer_size()
const {
return m_mpi_gather.buffer_size(); }
224 unsigned chunk_size()
const {
return m_mpi_gather.chunk_size(); }
241 template<
class ContainerType>
245 if( not m_contiguous)
247 m_store.template set<value_type>( m_g2.size());
248 auto& store = m_store.template get<value_type>();
249 thrust::gather( m_g2.begin(), m_g2.end(), gatherFrom.begin(),
251 m_mpi_gather.global_gather_init( store);
254 m_mpi_gather.global_gather_init( gatherFrom);
268 template<
class ContainerType>
272 if( not m_contiguous)
275 auto& store = m_store.template get<value_type>();
276 m_mpi_gather.global_gather_wait( store, buffer_ptrs);
279 m_mpi_gather.global_gather_wait( gatherFrom, buffer_ptrs);
283 bool m_contiguous=
false;
285 dg::detail::MPIContiguousKroneckerGather<Vector> m_mpi_gather;
286 mutable detail::AnyVector<Vector> m_store;
Error classes or the dg library.
constexpr bool is_vector_v
Utility typedef.
Definition predicate.h:75
typename TensorTraits< std::decay_t< Vector > >::value_type get_value_type
Definition tensor_traits.h:45
std::map< int, MessageType > mpi_permute(const std::map< int, MessageType > &messages, MPI_Comm comm)
Exchange messages between processes in a communicator.
Definition mpi_permutation.h:91
This is the namespace for all functions and classes defined and used by the discontinuous Galerkin li...
Communicator for asynchronous communication of MPISparseBlockMat.
Definition mpi_gather_kron.h:144
void global_gather_init(const ContainerType &gatherFrom) const
. Globally (across processes) asynchronously gather data into a buffer
Definition mpi_gather_kron.h:242
bool isCommunicating() const
True if the gather/scatter operation involves actual MPI communication.
Definition mpi_gather_kron.h:226
MPI_Comm communicator() const
The internal MPI communicator used.
Definition mpi_gather_kron.h:219
void global_gather_wait(const ContainerType &gatherFrom, Vector< const dg::get_value_type< ContainerType > * > &buffer_ptrs) const
Wait for asynchronous communication to finish and gather received data into buffer and return pointer...
Definition mpi_gather_kron.h:269
MPIKroneckerGather(unsigned left_size, const std::map< int, thrust::host_vector< int > > &recvIdx, unsigned n, unsigned num_cols, unsigned right_size, MPI_Comm comm_1d)
Construct from communication pattern.
Definition mpi_gather_kron.h:164
MPIKroneckerGather(const MPIKroneckerGather< OtherVector > &src)
Construct from other execution policy.
Definition mpi_gather_kron.h:211
unsigned chunk_size() const
n*left_size*right_size
Definition mpi_gather_kron.h:224
MPIKroneckerGather(MPI_Comm comm=MPI_COMM_NULL)
no communication
Definition mpi_gather_kron.h:146
unsigned buffer_size() const
Number of pointers in receive buffer equals number of indices in recvIdx.
Definition mpi_gather_kron.h:222