Arcane  4.1.12.0
Developer documentation
Loading...
Searching...
No Matches
ParallelDataWriter.cc
1// -*- tab-width: 2; indent-tabs-mode: nil; coding: utf-8-with-signature -*-
2//-----------------------------------------------------------------------------
3// Copyright 2000-2026 CEA (www.cea.fr) IFPEN (www.ifpenergiesnouvelles.com)
4// See the top-level COPYRIGHT file for details.
5// SPDX-License-Identifier: Apache-2.0
6//-----------------------------------------------------------------------------
7/*---------------------------------------------------------------------------*/
8/* ParallelDataWriter.cc (C) 2000-2025 */
9/* */
10/* Parallel IData Reader/Writer. */
11/*---------------------------------------------------------------------------*/
12/*---------------------------------------------------------------------------*/
13
14#include "arcane/std/internal/ParallelDataWriter.h"
15
16#include "arcane/utils/Ref.h"
17#include "arcane/utils/Math.h"
18
19#include "arcane/core/IParallelMng.h"
20#include "arcane/core/IParallelExchanger.h"
21#include "arcane/core/ISerializer.h"
22#include "arcane/core/ISerializeMessage.h"
23#include "arcane/core/SerializeBuffer.h"
24#include "arcane/core/IData.h"
25#include "arcane/core/parallel/BitonicSortT.H"
26#include "arcane/core/ParallelMngUtils.h"
27#include "arcane/core/ItemGroup.h"
28#include "arcane/core/IItemFamily.h"
30
31/*---------------------------------------------------------------------------*/
32/*---------------------------------------------------------------------------*/
33
34namespace Arcane
35{
36
37/*---------------------------------------------------------------------------*/
38/*---------------------------------------------------------------------------*/
39
// Private implementation of ParallelDataWriter: it stores the exchange
// pattern computed by sort() and replays it in getSortedValues().
// NOTE(review): the class head and the declarations of m_ranks_to_send /
// m_ranks_to_recv (both used by sort() and getSortedValues()) are not visible
// in this listing - confirm against the real file.
41: public TraceAccessor
42{
43 public:
44
 //! Stores \a pm and initializes TraceAccessor with pm->traceMng().
45 explicit Impl(IParallelMng* pm);
46
47 public:
48
 //! View on the keys stored by the last call to sort().
49 Int64ConstArrayView sortedUniqueIds() const;
 //! Sets the flag read by sort() to decide whether the sorted keys are gathered.
50 void setGatherAll(bool v);
51
52 private:
53
 //! Parallel manager given to the constructor; used by sort() and getSortedValues().
54 IParallelMng* m_parallel_mng = nullptr;
59 //TODO do not use an array dimensioned by commSize()
 //! For the i-th message sent by getSortedValues(): local ids of the values to serialize.
60 UniqueArray<UniqueArray<Int32>> m_indexes_to_send;
 //! For the i-th message received by getSortedValues(): positions written in the sorted data.
61 UniqueArray<UniqueArray<Int32>> m_indexes_to_recv;
 //! Number of sorted items held after sort(); size given to the sorted data.
62 Int32 m_nb_item = 0;
 //! Copy of the sorted keys (unique ids) made by sort().
63 Int64UniqueArray m_sorted_unique_ids;
64
 //! Local ids of the values that stay on this rank (source side of the local copy).
65 UniqueArray<Int32> m_local_indexes_to_send;
 //! Positions in the sorted data of the values that stay on this rank.
66 UniqueArray<Int32> m_local_indexes_to_recv;
67
 //! When true, sort() gathers the sorted keys of all ranks and keeps them on rank 0 only.
68 bool m_gather_all = false;
 //! Enables the debug traces of sort(); nothing in the visible code sets it to true.
69 bool m_is_verbose = false;
70
71 public:
72
 //! Sorts \a items_uid in parallel and records the resulting exchange pattern.
73 void sort(Int32ConstArrayView local_ids, Int64ConstArrayView items_uid);
74
 //! Returns a clone of \a data whose values follow the order computed by sort().
75 Ref<IData> getSortedValues(IData* data);
76};
77
78/*---------------------------------------------------------------------------*/
79/*---------------------------------------------------------------------------*/
80
81ParallelDataWriter::
82ParallelDataWriter(IParallelMng* pm)
83: m_p(new Impl(pm))
84{
85}
86
87ParallelDataWriter::
88~ParallelDataWriter()
89{
90 delete m_p;
91}
92
93Int64ConstArrayView ParallelDataWriter::
94sortedUniqueIds() const
95{
96 return m_p->sortedUniqueIds();
97}
98void ParallelDataWriter::
99setGatherAll(bool v)
100{
101 m_p->setGatherAll(v);
102}
103
104void ParallelDataWriter::
105sort(Int32ConstArrayView local_ids, Int64ConstArrayView items_uid)
106{
107 m_p->sort(local_ids, items_uid);
108}
109
110Ref<IData> ParallelDataWriter::
111getSortedValues(IData* data)
112{
113 return m_p->getSortedValues(data);
114}
115
116/*---------------------------------------------------------------------------*/
117/*---------------------------------------------------------------------------*/
118
119ParallelDataWriter::Impl::
120Impl(IParallelMng* pm)
121: TraceAccessor(pm->traceMng())
122, m_parallel_mng(pm)
123{
124}
125
126/*---------------------------------------------------------------------------*/
127/*---------------------------------------------------------------------------*/
128
129Int64ConstArrayView ParallelDataWriter::Impl::
130sortedUniqueIds() const
131{
132 return m_sorted_unique_ids;
133}
134
135/*---------------------------------------------------------------------------*/
136/*---------------------------------------------------------------------------*/
137
138void ParallelDataWriter::Impl::
139setGatherAll(bool v)
140{
141 m_gather_all = v;
142}
143
144/*---------------------------------------------------------------------------*/
145/*---------------------------------------------------------------------------*/
146
147void ParallelDataWriter::Impl::
148sort(Int32ConstArrayView local_ids, Int64ConstArrayView items_uid)
149{
150 IParallelMng* pm = m_parallel_mng;
151
152 Parallel::BitonicSort<Int64> uid_sorter(pm);
153 uid_sorter.sort(items_uid);
154
155 ConstArrayView<Int32> key_indexes = uid_sorter.keyIndexes();
156 ConstArrayView<Int32> key_ranks = uid_sorter.keyRanks();
157 ConstArrayView<Int64> keys = uid_sorter.keys();
158
159 UniqueArray<Int64> global_all_keys;
160 UniqueArray<Int32> global_all_key_indexes;
161 UniqueArray<Int32> global_all_key_ranks;
162
163 Int32 nb_item = keys.size();
164 const Int32 my_rank = pm->commRank();
165 const bool is_verbose = m_is_verbose;
166 if (is_verbose) {
167 for (Integer i = 0; i < math::min(nb_item, 20); ++i) {
168 info() << "ORIGINAL I=" << i << " UID=" << items_uid[i]
169 << " INDEX=" << key_indexes[i]
170 << " RANK=" << key_ranks[i]
171 << " KEY=" << keys[i];
172 }
173 }
174
175 if (m_gather_all) {
176 // Process 0 gathers everything
177 pm->allGatherVariable(keys, global_all_keys);
178 pm->allGatherVariable(key_indexes, global_all_key_indexes);
179 pm->allGatherVariable(key_ranks, global_all_key_ranks);
180 Int32 gather_rank = 0;
181
182 if (pm->commRank() != gather_rank) {
183 global_all_key_ranks.clear();
184 global_all_key_indexes.clear();
185 global_all_keys.clear();
186 }
187 nb_item = global_all_keys.size();
188
189 key_ranks = global_all_key_ranks.view();
190 key_indexes = global_all_key_indexes.view();
191 keys = global_all_keys.view();
192 }
193
194 m_nb_item = nb_item;
195
196 m_sorted_unique_ids.resize(nb_item);
197 m_sorted_unique_ids.copy(keys);
198
199 //info() << "END SORT SIZE=" << nb_item << " KEY_SIZE=" << keys.size();
200 if (is_verbose) {
201 for (Integer i = 0; i < math::min(nb_item, 20); ++i) {
202 info() << "I=" << i << " KEY=" << keys[i]
203 << " INDEX=" << key_indexes[i]
204 << " RANK=" << key_ranks[i];
205 }
206 }
207 {
208 UniqueArray<UniqueArray<Int32>> indexes_list(pm->commSize());
209 UniqueArray<UniqueArray<Int32>> own_indexes_list(pm->commSize());
210 auto sd_exchange{ ParallelMngUtils::createExchangerRef(pm) };
211
212 for (Integer i = 0; i < nb_item; ++i) {
213 Int32 index = key_indexes[i];
214 Int32 rank = key_ranks[i];
215 if (rank != my_rank && indexes_list[rank].empty())
216 sd_exchange->addSender(rank);
217 indexes_list[rank].add(index);
218 own_indexes_list[rank].add(i);
219 }
220 m_local_indexes_to_recv = own_indexes_list[my_rank];
221 m_local_indexes_to_send.resize(indexes_list[my_rank].size());
222
223 sd_exchange->initializeCommunicationsMessages();
224 //info() << "NB SEND=" << sd_exchange->nbSender()
225 // << " NB_RECV=" << sd_exchange->nbReceiver();
226 Int32ConstArrayView send_sd = sd_exchange->senderRanks();
227 Integer nb_send = send_sd.size();
228 m_indexes_to_recv.resize(nb_send);
229 m_ranks_to_recv.resize(nb_send);
230 for (Integer i = 0; i < nb_send; ++i) {
231 //info() << " SEND TO A: rank=" << send_sd[i];
232 ISerializeMessage* send_msg = sd_exchange->messageToSend(i);
233 Int32 dest_rank = send_sd[i];
234 ISerializer* serializer = send_msg->serializer();
235 m_indexes_to_recv[i] = own_indexes_list[dest_rank];
236 m_ranks_to_recv[i] = dest_rank;
237 serializer->setMode(ISerializer::ModeReserve);
238
239 serializer->reserveArray(indexes_list[dest_rank]);
240
241 serializer->allocateBuffer();
242 serializer->setMode(ISerializer::ModePut);
243
244 serializer->putArray(indexes_list[dest_rank]);
245 if (is_verbose) {
246 Integer nb_to_send = indexes_list[dest_rank].size();
247 for (Integer z = 0; z < nb_to_send; ++z) {
248 Integer index = indexes_list[dest_rank][z];
249 info() << " SEND Z=" << z << " RANK=" << dest_rank << " index=" << index;
250 }
251 }
252 }
253 sd_exchange->processExchange();
254
255 ConstArrayView<Int32> recv_sd = sd_exchange->receiverRanks();
256 const Int32 nb_recv = recv_sd.size();
257 m_indexes_to_send.resize(nb_recv);
258 m_ranks_to_send.resize(nb_recv);
259 for (Integer i = 0; i < nb_recv; ++i) {
260 //info() << " RECEIVE FROM A: rank=" << recv_sd[i];
261 ISerializeMessage* recv_msg = sd_exchange->messageToReceive(i);
262 Int32 orig_rank = recv_sd[i];
263 ISerializer* serializer = recv_msg->serializer();
264 serializer->setMode(ISerializer::ModeGet);
265 Int32Array& recv_indexes = m_indexes_to_send[i];
266 m_ranks_to_send[i] = orig_rank;
267 serializer->getArray(recv_indexes);
268 const Int32 nb_to_recv = recv_indexes.size();
269 //info() << " RECEIVE FROM A: NB_TO_RECEIVE " << nb_to_recv << " S2=" << own_group_local_ids.size();
270 for (Integer z = 0; z < nb_to_recv; ++z) {
271 Int32 index = recv_indexes[z];
272 //info() << " RECV Z=" << z << " RANK=" << orig_rank << " index=" << index
273 // << " index2=" << own_group_local_ids[index];
274 recv_indexes[z] = local_ids[index];
275 }
276 //info() << "END RECEIVE FROM A: NB_TO_RECEIVE " << nb_to_recv;
277 }
278
279 // Processes local entities
280 {
281 const Int32 nb_local = m_local_indexes_to_send.size();
282 for (Int32 z = 0; z < nb_local; ++z) {
283 Int32 index = indexes_list[my_rank][z];
284 //info() << " RECV Z=" << z << " RANK=" << orig_rank << " index=" << index
285 // << " index2=" << own_group_local_ids[index];
286 m_local_indexes_to_send[z] = local_ids[index];
287 }
288 }
289 }
290}
291
292/*---------------------------------------------------------------------------*/
293/*---------------------------------------------------------------------------*/
294
295Ref<IData> ParallelDataWriter::Impl::
296getSortedValues(IData* data)
297{
298 IParallelMng* pm = m_parallel_mng;
299 Ref<IData> sorted_data = data->cloneEmptyRef();
300
301 auto sd_exchange{ ParallelMngUtils::createExchangerRef(pm) };
302 for (Int32 rank_to_send : m_ranks_to_send)
303 sd_exchange->addSender(rank_to_send);
304
305 UniqueArray<Int32> ranks_to_recv2;
306 for (Int32 rank_to_receive : m_ranks_to_recv)
307 ranks_to_recv2.add(rank_to_receive);
308
309 sd_exchange->initializeCommunicationsMessages(ranks_to_recv2);
310 Int32ConstArrayView send_sd = sd_exchange->senderRanks();
311 const Int32 nb_send = send_sd.size();
312 for (Integer i = 0; i < nb_send; ++i) {
313 //info() << " SEND TO B: rank=" << send_sd[i];
314 ISerializeMessage* send_msg = sd_exchange->messageToSend(i);
315 //Int32 dest_rank = send_sd[i];
316 ISerializer* serializer = send_msg->serializer();
317 serializer->setMode(ISerializer::ModeReserve);
318 data->serialize(serializer, m_indexes_to_send[i], 0);
319 serializer->allocateBuffer();
320 serializer->setMode(ISerializer::ModePut);
321 data->serialize(serializer, m_indexes_to_send[i], 0);
322 }
323
324 sd_exchange->processExchange();
325
326 Int32ConstArrayView recv_sd = sd_exchange->receiverRanks();
327 const Int32 nb_recv = recv_sd.size();
328 sorted_data->resize(m_nb_item);
329 for (Integer i = 0; i < nb_recv; ++i) {
330 //info() << " RECEIVE FROM B: rank=" << recv_sd[i];
331 ISerializeMessage* recv_msg = sd_exchange->messageToReceive(i);
332 //Int32 orig_rank = recv_sd[i];
333 ISerializer* serializer = recv_msg->serializer();
334 serializer->setMode(ISerializer::ModeGet);
335 sorted_data->serialize(serializer, m_indexes_to_recv[i], 0);
336 }
337
338 // Processes data that is already present on this processor.
339 {
340 ConstArrayView<Int32> local_recv_indexes = m_local_indexes_to_recv;
341 const Int32 nb_local_index = local_recv_indexes.size();
342 if (nb_local_index > 0) {
343 SerializeBuffer sbuf;
344 sbuf.setMode(ISerializer::ModeReserve);
345 data->serialize(&sbuf, m_local_indexes_to_send, nullptr);
346 sbuf.allocateBuffer();
347 sbuf.setMode(ISerializer::ModePut);
348 data->serialize(&sbuf, m_local_indexes_to_send, nullptr);
349 sbuf.setMode(ISerializer::ModeGet);
350 sorted_data->serialize(&sbuf, local_recv_indexes, nullptr);
351 }
352 }
353 return sorted_data;
354}
355
356/*---------------------------------------------------------------------------*/
357/*---------------------------------------------------------------------------*/
358
359/*---------------------------------------------------------------------------*/
360/*---------------------------------------------------------------------------*/
361
362Ref<ParallelDataWriter> ParallelDataWriterList::
363getOrCreateWriter(const ItemGroup& group)
364{
365 auto i = m_data_writers.find(group);
366 if (i != m_data_writers.end())
367 return i->second;
368 IParallelMng* pm = group.itemFamily()->parallelMng();
369 Ref<ParallelDataWriter> writer = makeRef(new ParallelDataWriter(pm));
370 {
371 Int64UniqueArray items_uid;
372 ItemGroup own_group = group.own();
373 MeshUtils::fillUniqueIds(own_group.view(), items_uid);
374 Int32ConstArrayView local_ids = own_group.internal()->itemsLocalId();
375 writer->sort(local_ids, items_uid);
376 }
377 m_data_writers.try_emplace(group, writer);
378 return writer;
379}
380
381/*---------------------------------------------------------------------------*/
382/*---------------------------------------------------------------------------*/
383
384} // End namespace Arcane
385
386/*---------------------------------------------------------------------------*/
387/*---------------------------------------------------------------------------*/
Utility functions for the mesh.
Integer size() const
Number of elements in the vector.
constexpr Integer size() const noexcept
Number of elements in the array.
Interface of a data item.
Definition IData.h:34
Interface of the parallelism manager for a subdomain.
UniqueArray< Int32 > m_ranks_to_recv
Array indicating the ranks of processes to which we send information.
UniqueArray< Int32 > m_ranks_to_send
Array indicating the ranks of processes from which we receive information.
Reference to an instance.
TraceAccessor(ITraceMng *m)
Constructs an accessor via the trace manager m.
1D data vector with value semantics (STL style).
__host__ __device__ Real2 min(Real2 a, Real2 b)
Returns the minimum of two Real2.
Definition MathUtils.h:346
Ref< IParallelExchanger > createExchangerRef(IParallelMng *pm)
Returns an interface to transfer messages between ranks.
-- tab-width: 2; indent-tabs-mode: nil; coding: utf-8-with-signature --
UniqueArray< Int64 > Int64UniqueArray
Dynamic 1D array of 64-bit integers.
Definition UtilsTypes.h:339
Int32 Integer
Type representing an integer.
ConstArrayView< Int32 > Int32ConstArrayView
C equivalent of a 1D array of 32-bit integers.
Definition UtilsTypes.h:482
ConstArrayView< Int64 > Int64ConstArrayView
C equivalent of a 1D array of 64-bit integers.
Definition UtilsTypes.h:480
auto makeRef(InstanceType *t) -> Ref< InstanceType >
Creates a reference on a pointer.
Array< Int32 > Int32Array
Dynamic one-dimensional array of 32-bit integers.
Definition UtilsTypes.h:127
std::int32_t Int32
Signed integer type of 32 bits.