db/d5c/GatherGroup_8cc_source.html

// -*- tab-width: 2; indent-tabs-mode: nil; coding: utf-8-with-signature -*-

//-----------------------------------------------------------------------------

// Copyright 2000-2026 CEA (www.cea.fr) IFPEN (www.ifpenergiesnouvelles.com)

// See the top-level COPYRIGHT file for details.

// SPDX-License-Identifier: Apache-2.0

//-----------------------------------------------------------------------------

/*---------------------------------------------------------------------------*/

/* GatherGroup.cc                                              (C) 2000-2026 */

/*                                                                           */

/* Classe permettant de gérer les regroupements de données sur le ou les     */

/* sous-domaines écrivains.                                                  */

/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/


#include "arcane/core/internal/GatherGroup.h"


#include "arcane/utils/FatalErrorException.h"

#include "arcane/utils/Array2.h"


#include "arcane/core/IParallelMng.h"

#include "arcane/core/internal/IParallelMngInternal.h"


/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/


namespace Arcane

{


/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/


// Builds a gather group bound to already-computed gathering information.
//
// gather_group_info must be non-null (otherwise ARCANE_CHECK_POINTER throws)
// and its computeSize() must already have been called (otherwise a fatal
// error is raised).
GatherGroup::
GatherGroup(GatherGroupInfo* gather_group_info)
: m_gather_group_info(ARCANE_CHECK_POINTER(gather_group_info))
{
  // The initializer above has already rejected a null pointer, so the
  // parameter can be dereferenced safely here.
  const bool is_info_ready = gather_group_info->isComputed();
  ARCANE_FATAL_IF(!is_info_ready, "GatherGroupInfo is not computed");
}


/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/


// Default constructor.
//
// The resulting object has no gathering information attached:
// setGatherGroupInfo() must be called before isNeedGather() or
// gatherToMasterIO(), both of which check the pointer before using it.
GatherGroup::

GatherGroup() = default;


/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/


// Destructor. Defaulted: no explicit cleanup is performed here, in
// particular nothing is done with the GatherGroupInfo pointer.
GatherGroup::

~GatherGroup() = default;


/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/


bool GatherGroup::

isNeedGather()

{

  ARCANE_CHECK_POINTER(m_gather_group_info);

  IParallelMng* pm = m_gather_group_info->m_parallel_mng;

  // True si Thread ou Hybride ou MPI sans MPI-IO

  // False si Séquentiel ou MPI + MPI-IO.

  return pm->commSize() != 1 && (pm->isThreadImplementation() || !m_gather_group_info->m_use_collective_io);

}


/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/


// Gathers the bytes of every sender onto its writer rank.
//
// sizeof_elem : size in bytes of one element; it converts the per-sender
//               element counts stored in the GatherGroupInfo into byte counts.
// in          : bytes owned by the calling rank.
// out         : destination buffer. When no gathering is needed it receives a
//               plain copy of `in`. On a writer it receives `in` first, then
//               the data of each sender appended in increasing rank order.
//               On a non-writer rank it is left untouched.
//
// Throws (through ARCANE_CHECK_POINTER) if no GatherGroupInfo has been set.
void GatherGroup::
gatherToMasterIO(Int64 sizeof_elem, Span<const Byte> in, Span<Byte> out)
{
  ARCANE_CHECK_POINTER(m_gather_group_info);
  IParallelMng* parallel_mng = m_gather_group_info->m_parallel_mng;

  // Gathering is required unless the run is sequential or uses MPI + MPI-IO.
  const bool must_gather = (parallel_mng->commSize() != 1) &&
  (parallel_mng->isThreadImplementation() || !m_gather_group_info->m_use_collective_io);
  if (!must_gather) {
    out.copy(in);
    return;
  }

  const Int32 writer_rank = m_gather_group_info->m_writer;

  // Non-writer ranks only ship their data to the writer.
  if (parallel_mng->commRank() != writer_rank) {
    parallel_mng->send(in.constSmallView(), writer_rank);
    return;
  }

  // Writer: local data goes first in the output buffer.
  out.copy(in);

  // The writer counts itself among the senders, hence the "- 1".
  const Int32 nb_remote = m_gather_group_info->m_nb_sender_to_writer - 1;
  SmallSpan<const Int32> remote_counts = m_gather_group_info->m_nb_elem_recv.smallSpan();
  UniqueArray<Parallel::Request> pending(nb_remote);

  // Each remote sender (ranks writer_rank+1, writer_rank+2, ...) gets its own
  // slice of `out`, laid out right after the previous one.
  Int64 write_offset = in.size();
  for (Int32 idx = 0; idx < nb_remote; ++idx) {
    const Int64 nb_byte = remote_counts[idx] * sizeof_elem;
    ArrayView<Byte> destination = out.subSpan(write_offset, nb_byte).smallView();

    pending[idx] = parallel_mng->recv(destination, writer_rank + 1 + idx, false);
    write_offset += nb_byte;
  }

  // All receives were posted before waiting, so they can progress together.
  parallel_mng->waitAllRequests(pending);
}


/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/


// Attaches gathering information to this group.
//
// gather_group_info must be non-null (otherwise ARCANE_CHECK_POINTER throws)
// and already computed (otherwise a fatal error is raised). The member is
// only updated once both checks have passed.
void GatherGroup::
setGatherGroupInfo(GatherGroupInfo* gather_group_info)
{
  GatherGroupInfo* checked_info = ARCANE_CHECK_POINTER(gather_group_info);

  const bool is_info_ready = checked_info->isComputed();
  ARCANE_FATAL_IF(!is_info_ready, "GatherGroupInfo is not computed");

  m_gather_group_info = checked_info;
}


/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/


/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/


// Builds the holder for gathering information.
//
// parallel_mng      : parallel manager used for every communication; it is
//                     stored as is, without a null check at this point.
// use_collective_io : selects the writer used by computeSize() (the parallel
//                     I/O master when true, the regular I/O master when false)
//                     and whether a non-thread run writes without gathering.
//
// No communication happens here; computeSize() performs the actual work.
GatherGroupInfo::

GatherGroupInfo(IParallelMng* parallel_mng, bool use_collective_io)

: m_parallel_mng(parallel_mng)

, m_use_collective_io(use_collective_io)

{}


/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/


// Destructor. Defaulted: no explicit cleanup is performed here.
GatherGroupInfo::

~GatherGroupInfo() = default;


/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/


// Computes the gathering information for this rank.
//
// nb_elem_in : number of elements owned by the calling rank.
//
// After a successful call:
//  - m_writer is the rank that writes the data of the calling rank;
//  - m_nb_sender_to_writer is the number of ranks (writer included) feeding
//    that writer;
//  - m_nb_elem_output is the number of elements this rank will write (0 on a
//    rank that only sends);
//  - m_nb_elem_recv (writer only, gather mode) holds the element count
//    announced by each remote sender, in increasing rank order;
//  - m_nb_writer_global is the total number of writers.
//
// The work is done once: later calls return immediately. The "computed" flag
// is raised only when the computation has completed, so an exception thrown
// by a check or a communication never leaves the object reporting
// isComputed() == true with partially filled data.
//
// Throws (through ARCANE_CHECK_POINTER) if the parallel manager is null.
void GatherGroupInfo::
computeSize(Int32 nb_elem_in)
{
  if (m_is_computed)
    return;

  // Fail with an explicit exception instead of dereferencing a null manager.
  IParallelMng* pm = m_parallel_mng;
  ARCANE_CHECK_POINTER(pm);

  if (m_use_collective_io) {
    m_writer = pm->_internalApi()->masterParallelIORank();
    m_nb_sender_to_writer = pm->_internalApi()->nbSendersToMasterParallelIO();
  }
  else {
    m_writer = pm->masterIORank();
    m_nb_sender_to_writer = pm->commSize();
  }

  // Sequential, or MPI + MPI-IO: every rank writes its own elements, so there
  // is nothing to exchange and there are as many writers as ranks.
  if ((pm->commSize() == 1) || (!pm->isThreadImplementation() && m_use_collective_io)) {
    m_nb_elem_output = nb_elem_in;
    m_nb_writer_global = pm->commSize();
    m_is_computed = true;
    return;
  }

  if (m_writer != pm->commRank()) {
    // Sender: announce the local element count to the writer, write nothing.
    pm->send({ 1, &nb_elem_in }, m_writer);
    m_nb_elem_output = 0;
  }
  else {
    // Writer: one slot per remote sender (the writer itself is excluded).
    m_nb_elem_recv.resizeNoInit(m_nb_sender_to_writer - 1);

    {
      // Remote senders are the ranks immediately following the writer.
      // All receives are posted before waiting on them.
      UniqueArray<Parallel::Request> requests(m_nb_sender_to_writer - 1);
      for (Int32 i = 0; i < m_nb_sender_to_writer - 1; ++i) {
        const Int32 rank = i + m_writer + 1;
        requests[i] = pm->recv({ 1, &m_nb_elem_recv[i] }, rank, false);
      }
      pm->waitAllRequests(requests);
    }

    // The writer outputs its own elements plus those of every sender.
    m_nb_elem_output = nb_elem_in;
    for (const Int32 size : m_nb_elem_recv) {
      m_nb_elem_output += size;
    }
  }

  // Each writer contributes 1 and each sender 0: the sum is the writer count.
  m_nb_writer_global = pm->reduce(MessagePassing::ReduceSum, (m_writer == pm->commRank()));

  m_is_computed = true;
}


/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/


// Returns a view on the element counts announced by the remote senders.
//
// The underlying array is filled by computeSize() on a writer rank in gather
// mode, with one entry per remote sender in increasing rank order. The view
// refers to the internal array: no copy is made.
SmallSpan<Int32> GatherGroupInfo::
nbElemRecvGatherToMasterIO()
{
  SmallSpan<Int32> recv_counts = m_nb_elem_recv.smallSpan();
  return recv_counts;
}


/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/


} // End namespace Arcane


/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/

ARCANE_FATAL_IF
#define ARCANE_FATAL_IF(const,...)
Macro envoyant une exception FatalErrorException si cond est vrai.
Definition ArcaneGlobal.h:751

ARCANE_CHECK_POINTER
#define ARCANE_CHECK_POINTER(ptr)
Macro retournant le pointeur ptr s'il est non nul ou lançant une exception s'il est nul.
Definition ArcaneGlobal.h:810

Arcane::ArrayView
Vue modifiable d'un tableau d'un type T.
Definition arccore/src/base/arccore/base/ArrayView.h:94

Arcane::GatherGroupInfo
Classe permettant de calculer et de conserver les informations de regroupements.
Definition GatherGroup.h:128

Arcane::GatherGroupInfo::computeSize
void computeSize(Int32 nb_elem_in) override
Méthode permettant de calculer les informations de regroupements.
Definition GatherGroup.cc:140

Arcane::GatherGroupInfo::GatherGroupInfo
GatherGroupInfo(IParallelMng *parallel_mng, bool use_collective_io)
Constructeur.
Definition GatherGroup.cc:125

Arcane::GatherGroupInfo::nbElemRecvGatherToMasterIO
SmallSpan< Int32 > nbElemRecvGatherToMasterIO() override
Méthode permettant de connaître le nombre d'éléments que va nous envoyer chaque sous-domaine tiers.
Definition GatherGroup.cc:191

Arcane::GatherGroupInfo::isComputed
bool isComputed() override
Méthode permettant de savoir si la méthode computeSize() a déjà été appelée.
Definition GatherGroup.h:149

Arcane::GatherGroup::GatherGroup
GatherGroup()
Constructeur. Pour que l'objet soit utilisable, il est nécessaire d'appeler setGatherGroupInfo().

Arcane::GatherGroup::isNeedGather
bool isNeedGather() override
Méthode permettant de savoir si l'on doit effectuer le regroupement ou si l'on peut directement écrir...
Definition GatherGroup.cc:55

Arcane::GatherGroup::gatherToMasterIO
void gatherToMasterIO(Int64 sizeof_elem, Span< const Byte > in, Span< Byte > out) override
Méthode permettant de regrouper les données de plusieurs sous-domaines sur un ou plusieurs sous-domai...
Definition GatherGroup.cc:68

Arcane::GatherGroup::setGatherGroupInfo
void setGatherGroupInfo(GatherGroupInfo *gather_group_info)
Méthode permettant de définir les informations de regroupement.
Definition GatherGroup.cc:111

Arcane::IParallelMng
Interface du gestionnaire de parallélisme pour un sous-domaine.
Definition IParallelMng.h:52

Arcane::IParallelMng::isThreadImplementation
virtual bool isThreadImplementation() const =0
Indique si l'implémentation utilise les threads.

Arcane::IParallelMng::commRank
virtual Int32 commRank() const =0
Rang de cette instance dans le communicateur.

Arcane::IParallelMng::recv
virtual void recv(ArrayView< char > values, Int32 rank)=0

Arcane::IParallelMng::commSize
virtual Int32 commSize() const =0
Nombre d'instances dans le communicateur.

Arcane::IParallelMng::waitAllRequests
virtual void waitAllRequests(ArrayView< Request > rvalues)=0
Bloque en attendant que les requêtes rvalues soient terminées.

Arcane::SmallSpan
Vue d'un tableau d'éléments de type T.
Definition Span.h:801

Arcane::SpanImpl::copy
__host__ __device__ void copy(const U &copy_array)
Recopie le tableau copy_array dans l'instance.
Definition Span.h:475

Arcane::SpanImpl::constSmallView
constexpr ConstArrayView< value_type > constSmallView() const
Vue constante sur cette vue.
Definition Span.h:399

Arcane::SpanImpl::size
constexpr __host__ __device__ SizeType size() const noexcept
Retourne la taille du tableau.
Definition Span.h:325

Arcane::Span
Vue d'un tableau d'éléments de type T.
Definition Span.h:633

Arcane::Span::subSpan
constexpr __host__ __device__ Span< T, DynExtent > subSpan(Int64 abegin, Int64 asize) const
Sous-vue à partir de l'élément abegin et contenant asize éléments.
Definition Span.h:733

Arcane::UniqueArray
Vecteur 1D de données avec sémantique par valeur (style STL).
Definition arccore/src/common/arccore/common/Array.h:888

Arcane::MessagePassing::ReduceSum
@ ReduceSum
Somme des valeurs.
Definition MessagePassingGlobal.h:103

Arcane
-*- tab-width: 2; indent-tabs-mode: nil; coding: utf-8-with-signature -*-
Definition arcane/src/arcane/accelerator/AcceleratorGlobal.h:37

Arcane::Int64
std::int64_t Int64
Type entier signé sur 64 bits.
Definition ArccoreGlobal.h:227

Arcane::Int32
std::int32_t Int32
Type entier signé sur 32 bits.
Definition ArccoreGlobal.h:225