15#include "arccore/message_passing_mpi/internal/MpiMultiMachineShMemWinBaseInternal.h"
17#include "arccore/base/FatalErrorException.h"
22namespace Arcane::MessagePassing::Mpi
// Constructor (partial extraction: the signature, error-branch bodies and
// closing braces are missing from this view; all original tokens are kept
// verbatim, including the fused source line numbers).
//
// Sets up the multi-machine shared-memory window:
//  - one MPI shared window per (rank, segment) pair in m_all_mpi_win,
//  - three node-wide bookkeeping windows: m_win_need_resize (pending realloc
//    sizes), m_win_actual_sizeof (used byte count per segment) and
//    m_win_target_segments (cross-segment add requests).
32, m_win_actual_sizeof()
33, m_win_target_segments()
34, m_comm_machine(comm_machine)
35, m_comm_machine_size(comm_machine_size)
36, m_comm_machine_rank(comm_machine_rank)
37, m_sizeof_type(sizeof_type)
38, m_nb_segments_per_proc(nb_segments_per_proc)
39, m_machine_ranks(machine_ranks)
40, m_add_requests(nb_segments_per_proc)
41, m_resize_requests(nb_segments_per_proc)
// Argument validation: element size must be positive and every requested
// segment size must be a non-negative multiple of it (fatal bodies elided
// in this view).
43 if (m_sizeof_type <= 0) {
46 for (
Integer i = 0; i < m_nb_segments_per_proc; ++i) {
47 if (sizeof_segments[i] < 0 || sizeof_segments[i] % m_sizeof_type != 0) {
51 if (m_nb_segments_per_proc <= 0) {
// One MPI window per (rank, segment) pair; spans only for our own segments.
54 m_all_mpi_win.resize(m_comm_machine_size * m_nb_segments_per_proc);
55 m_reserved_part_span.resize(m_nb_segments_per_proc);
// -1 is the "no pending resize request" sentinel used throughout the class.
57 for (
Integer num_seg = 0; num_seg < m_nb_segments_per_proc; ++num_seg) {
59 m_resize_requests[num_seg] = -1;
// Two MPI_Info objects: segments may be laid out non-contiguously
// ("alloc_shared_noncontig"=true), the bookkeeping windows must stay
// contiguous (=false) so rank 0's base pointer addresses the whole array.
62 MPI_Info win_info_true;
63 MPI_Info_create(&win_info_true);
64 MPI_Info_set(win_info_true,
"alloc_shared_noncontig",
"true");
66 MPI_Info win_info_false;
67 MPI_Info_create(&win_info_false);
68 MPI_Info_set(win_info_false,
"alloc_shared_noncontig",
"false");
// Index of our first segment in the flattened (rank-major) layouts.
70 const Int32 pos_my_wins = m_comm_machine_rank * m_nb_segments_per_proc;
// Collective allocation of every segment window. Only the owning rank (i)
// contributes a non-zero size; a zero-sized request is bumped to one element
// so the allocation is never empty.
74 for (
Integer i = 0; i < m_comm_machine_size; ++i) {
75 for (
Integer j = 0; j < m_nb_segments_per_proc; ++j) {
77 if (m_comm_machine_rank == i) {
78 if (sizeof_segments[j] == 0)
79 size_seg = m_sizeof_type;
81 size_seg = sizeof_segments[j];
83 std::byte* ptr_seg =
nullptr;
84 int error = MPI_Win_allocate_shared(size_seg, m_sizeof_type, win_info_true, m_comm_machine, &ptr_seg, &m_all_mpi_win[j + i * m_nb_segments_per_proc]);
86 if (error != MPI_SUCCESS) {
// Query the local base pointer of each of our own segments (error bodies
// and the span assignments are elided in this view).
92 for (
Integer i = 0; i < m_nb_segments_per_proc; ++i) {
95 std::byte* ptr_seg =
nullptr;
96 int error = MPI_Win_shared_query(m_all_mpi_win[i + pos_my_wins], m_comm_machine_rank, &size_seg, &
size_type, &ptr_seg);
98 if (error != MPI_SUCCESS) {
// Bookkeeping window #1: per-segment pending resize sizes (Int64 each),
// contiguous so the rank-0 base pointer spans all ranks' entries.
110 Int64* ptr_seg =
nullptr;
111 Int64* ptr_win =
nullptr;
113 int error = MPI_Win_allocate_shared(
static_cast<Int64>(
sizeof(
Int64)) * m_nb_segments_per_proc,
sizeof(
Int64), win_info_false, m_comm_machine, &ptr_seg, &m_win_need_resize);
115 if (error != MPI_SUCCESS) {
122 int error = MPI_Win_shared_query(m_win_need_resize, 0, &size_seg, &
size_type, &ptr_win);
124 if (error != MPI_SUCCESS) {
128 m_need_resize =
Span<Int64>{ ptr_win, m_comm_machine_size * m_nb_segments_per_proc };
// Our entries start as -1 ("no resize requested").
130 for (
Integer i = 0; i < m_nb_segments_per_proc; ++i) {
131 m_need_resize[i + pos_my_wins] = -1;
// Sanity check: with "alloc_shared_noncontig"=false our slice must sit at
// base + pos_my_wins (fatal body elided).
134 if (ptr_win + pos_my_wins != ptr_seg) {
// Bookkeeping window #2: used byte count of each segment, initialised from
// the caller-provided sizeof_segments.
140 Int64* ptr_seg =
nullptr;
141 Int64* ptr_win =
nullptr;
143 int error = MPI_Win_allocate_shared(
static_cast<Int64>(
sizeof(
Int64)) * m_nb_segments_per_proc,
sizeof(
Int64), win_info_false, m_comm_machine, &ptr_seg, &m_win_actual_sizeof);
145 if (error != MPI_SUCCESS) {
152 int error = MPI_Win_shared_query(m_win_actual_sizeof, 0, &size_seg, &
size_type, &ptr_win);
154 if (error != MPI_SUCCESS) {
158 m_sizeof_used_part =
Span<Int64>{ ptr_win, m_comm_machine_size * m_nb_segments_per_proc };
160 for (
Integer i = 0; i < m_nb_segments_per_proc; ++i) {
161 m_sizeof_used_part[i + pos_my_wins] = sizeof_segments[i];
164 if (ptr_win + pos_my_wins != ptr_seg) {
// Bookkeeping window #3: target segment position of a pending
// addToAnotherSegment request (-1 = none), Int32 per entry.
170 Int32* ptr_seg =
nullptr;
171 Int32* ptr_win =
nullptr;
173 int error = MPI_Win_allocate_shared(
static_cast<Int64>(
sizeof(
Int32)) * m_nb_segments_per_proc,
sizeof(
Int32), win_info_false, m_comm_machine, &ptr_seg, &m_win_target_segments);
175 if (error != MPI_SUCCESS) {
182 int error = MPI_Win_shared_query(m_win_target_segments, 0, &size_seg, &
size_type, &ptr_win);
184 if (error != MPI_SUCCESS) {
188 m_target_segments =
Span<Int32>{ ptr_win, m_comm_machine_size * m_nb_segments_per_proc };
190 for (
Integer i = 0; i < m_nb_segments_per_proc; ++i) {
191 m_target_segments[i + pos_my_wins] = -1;
194 if (ptr_win + pos_my_wins != ptr_seg) {
// Release the info objects and synchronise the node before first use.
199 MPI_Info_free(&win_info_false);
200 MPI_Info_free(&win_info_true);
202 MPI_Barrier(m_comm_machine);
// Destructor: frees every per-segment shared window plus the three
// bookkeeping windows. MPI_Win_free is collective, so all ranks of
// m_comm_machine must reach this destructor together.
208MpiMultiMachineShMemWinBaseInternal::
209~MpiMultiMachineShMemWinBaseInternal()
211 for (
Integer i = 0; i < m_comm_machine_size * m_nb_segments_per_proc; ++i) {
212 MPI_Win_free(&m_all_mpi_win[i]);
214 MPI_Win_free(&m_win_need_resize);
215 MPI_Win_free(&m_win_actual_sizeof);
216 MPI_Win_free(&m_win_target_segments);
// sizeofOneElem(): size in bytes of one element of the window
// (signature elided in this extraction).
225 return m_sizeof_type;
// machineRanks(): world ranks owning a segment in this window
// (signature elided in this extraction).
234 return m_machine_ranks;
// barrier(): node-local synchronisation over the machine communicator
// (signature elided in this extraction).
243 MPI_Barrier(m_comm_machine);
// View of the *used* part of our own segment num_seg: the reserved span is
// trimmed to the current used byte count (signature elided in this view;
// this is one of segmentView/segmentConstView for the local rank).
252 const Int32 segment_infos_pos = num_seg + m_comm_machine_rank * m_nb_segments_per_proc;
253 return m_reserved_part_span[num_seg].subSpan(0, m_sizeof_used_part[segment_infos_pos]);
// View of segment num_seg owned by world rank `rank`: the owner's base
// pointer is obtained with MPI_Win_shared_query, then trimmed to the used
// byte count (signature and fatal body elided in this extraction).
// NOTE(review): `rank` is passed directly as the target of
// MPI_Win_shared_query while the window index uses _worldToMachine(rank) —
// verify both expect the same numbering.
262 const Int32 segment_infos_pos = num_seg + _worldToMachine(rank) * m_nb_segments_per_proc;
266 std::byte* ptr_seg =
nullptr;
267 int error = MPI_Win_shared_query(m_all_mpi_win[segment_infos_pos], rank, &size_seg, &
size_type, &ptr_seg);
269 if (error != MPI_SUCCESS) {
273 return Span<std::byte>{ ptr_seg, m_sizeof_used_part[segment_infos_pos] };
// Const variant of the local-segment view: same trimming of the reserved
// span to the used byte count (signature elided in this extraction).
282 const Int32 segment_infos_pos = num_seg + m_comm_machine_rank * m_nb_segments_per_proc;
283 return m_reserved_part_span[num_seg].subSpan(0, m_sizeof_used_part[segment_infos_pos]);
// Const variant of the remote-segment view: queries the owner's base
// pointer via MPI_Win_shared_query (signature, fatal body and return
// statement elided in this extraction).
292 const Int32 segment_infos_pos = num_seg + _worldToMachine(rank) * m_nb_segments_per_proc;
296 std::byte* ptr_seg =
nullptr;
297 int error = MPI_Win_shared_query(m_all_mpi_win[segment_infos_pos], rank, &size_seg, &
size_type, &ptr_seg);
299 if (error != MPI_SUCCESS) {
// requestAdd(num_seg, elem): records a request to append `elem` to our own
// segment. Validates that elem's byte size is a multiple of the element
// size and that elem is non-empty (fatal/early-return bodies elided).
// Posts a realloc request sized for the future content when the reserved
// capacity is insufficient, otherwise a no-op realloc marker so the
// collective realloc stays balanced. The actual copy happens in
// executeAdd(). `elem` must stay alive until then.
312 if (elem.
size() % m_sizeof_type) {
315 if (elem.
empty() || elem.
data() ==
nullptr) {
319 const Int32 segment_infos_pos = num_seg + m_comm_machine_rank * m_nb_segments_per_proc;
321 const Int64 actual_sizeof_win = m_sizeof_used_part[segment_infos_pos];
322 const Int64 future_sizeof_win = actual_sizeof_win + elem.
size();
323 const Int64 old_reserved = m_reserved_part_span[num_seg].size();
325 if (future_sizeof_win > old_reserved) {
326 _requestRealloc(segment_infos_pos, future_sizeof_win);
329 _requestRealloc(segment_infos_pos);
332 m_add_requests[num_seg] = elem;
333 m_add_requested =
true;
// executeAdd(): performs the appends recorded by requestAdd() after the
// collective realloc has run. For each pending request, verifies the
// reserved capacity now covers the future size, copies the bytes element
// by element, then publishes the new used size.
// (Partial extraction: early-return/fatal bodies and closing braces are
// elided; only the format string below was changed.)
344 if (!m_add_requested) {
347 m_add_requested =
false;
349 for (
Integer num_seg = 0; num_seg < m_nb_segments_per_proc; ++num_seg) {
350 if (m_add_requests[num_seg].empty() || m_add_requests[num_seg].data() ==
nullptr) {
354 const Int32 segment_infos_pos = num_seg + m_comm_machine_rank * m_nb_segments_per_proc;
356 const Int64 actual_sizeof_win = m_sizeof_used_part[segment_infos_pos];
357 const Int64 future_sizeof_win = actual_sizeof_win + m_add_requests[num_seg].size();
359 if (m_reserved_part_span[num_seg].size() < future_sizeof_win) {
// Fix: placeholders were {1}/{2} for two arguments; Arccore format
// indices are 0-based (see the identical message in executeResize),
// so {2} referenced a missing third argument.
360 ARCCORE_FATAL(
"Bad realloc -- New size : {0} -- Needed size : {1}", m_reserved_part_span[num_seg].size(), future_sizeof_win);
363 for (
Int64 pos_win = actual_sizeof_win, pos_elem = 0; pos_win < future_sizeof_win; ++pos_win, ++pos_elem) {
364 m_reserved_part_span[num_seg][pos_win] = m_add_requests[num_seg][pos_elem];
366 m_sizeof_used_part[segment_infos_pos] = future_sizeof_win;
// requestAddToAnotherSegment(thread, rank, num_seg, elem): records a
// request to append `elem` to segment num_seg of another process `rank`.
// Validation mirrors requestAdd (fatal bodies elided). The target segment's
// flattened position is published in m_target_segments under our own slot
// indexed by `thread`, so executeAddToAnotherSegment() can detect
// conflicting writers. A realloc request (sized or no-op) is posted on
// behalf of the target segment to keep the collective realloc balanced.
378 if (elem.
size() % m_sizeof_type) {
381 if (elem.
empty() || elem.
data() ==
nullptr) {
385 const Int32 machine_rank = _worldToMachine(rank);
386 const Int32 target_segment_infos_pos = num_seg + machine_rank * m_nb_segments_per_proc;
389 const Int32 segment_infos_pos = thread + m_comm_machine_rank * m_nb_segments_per_proc;
390 m_target_segments[segment_infos_pos] = target_segment_infos_pos;
// Query the target's current reserved span to decide whether a grow is
// needed (fatal body and the span construction are elided in this view).
396 std::byte* ptr_seg =
nullptr;
398 int error = MPI_Win_shared_query(m_all_mpi_win[target_segment_infos_pos], machine_rank, &size_seg, &
size_type, &ptr_seg);
400 if (error != MPI_SUCCESS) {
406 const Int64 actual_sizeof_win = m_sizeof_used_part[target_segment_infos_pos];
407 const Int64 future_sizeof_win = actual_sizeof_win + elem.
size();
408 const Int64 old_reserved = rank_reserved_part_span.
size();
410 if (future_sizeof_win > old_reserved) {
411 _requestRealloc(target_segment_infos_pos, future_sizeof_win);
414 _requestRealloc(target_segment_infos_pos);
// The pending payload is stored under the caller's thread slot.
417 m_add_requests[thread] = elem;
418 m_add_requested =
true;
// executeAddToAnotherSegment(): performs the cross-segment appends recorded
// by requestAddToAnotherSegment(). Flow: barrier; note which of our own
// segments other ranks will edit; detect duplicate writers targeting the
// same segment (fatal); copy each pending payload into the target rank's
// segment via MPI_Win_shared_query; clear the request slots; barrier; then
// refresh our own spans for segments edited by others.
// (Partial extraction: fatal/early-return bodies and closing braces are
// elided; only the two changes commented below were made.)
427 MPI_Barrier(m_comm_machine);
// Fix: this array is indexed by num_seg in [0, m_nb_segments_per_proc)
// (here and in the refresh loop below) but was allocated with
// m_comm_machine_size entries — out of bounds whenever
// nb_segments_per_proc > comm_machine_size. make_unique<bool[]> zero-fills.
429 auto is_my_seg_edited = std::make_unique<bool[]>(m_nb_segments_per_proc);
430 for (
Integer num_seg = 0; num_seg < m_nb_segments_per_proc; ++num_seg) {
431 for (
const Int32 rank_asked : m_target_segments) {
// NOTE(review): m_target_segments stores flattened segment positions
// (num_seg + rank * nb_segments_per_proc, see requestAddToAnotherSegment),
// yet this compares against the machine *rank* — confirm the intended
// comparand isn't num_seg + m_comm_machine_rank * m_nb_segments_per_proc.
432 if (rank_asked == m_comm_machine_rank) {
433 is_my_seg_edited[num_seg] =
true;
439 if (!m_add_requested) {
444 m_add_requested =
false;
// Conflict detection: two ranks must not append to the same target segment.
445 for (
Integer num_seg = 0; num_seg < m_nb_segments_per_proc; ++num_seg) {
446 const Int32 segment_infos_pos = num_seg + m_comm_machine_rank * m_nb_segments_per_proc;
447 const Int32 seg_needs_to_edit = m_target_segments[segment_infos_pos];
448 if (seg_needs_to_edit == -1)
451 bool is_found =
false;
452 for (
const Int32 rank_asked : m_target_segments) {
453 if (rank_asked == seg_needs_to_edit) {
458 ARCCORE_FATAL(
"Two subdomains ask same rank for addToAnotherSegment()");
// Perform the actual appends into the target segments.
466 for (
Integer num_seg = 0; num_seg < m_nb_segments_per_proc; ++num_seg) {
467 if (m_add_requests[num_seg].empty() || m_add_requests[num_seg].data() ==
nullptr) {
471 const Int32 segment_infos_pos = num_seg + m_comm_machine_rank * m_nb_segments_per_proc;
472 const Int32 target_segment_infos_pos = m_target_segments[segment_infos_pos];
473 if (target_segment_infos_pos == -1) {
477 const Int64 actual_sizeof_win = m_sizeof_used_part[target_segment_infos_pos];
478 const Int64 future_sizeof_win = actual_sizeof_win + m_add_requests[num_seg].size();
483 std::byte* ptr_seg =
nullptr;
// target_segment_infos_pos / m_nb_segments_per_proc recovers the owning
// machine rank from the flattened position.
485 int error = MPI_Win_shared_query(m_all_mpi_win[target_segment_infos_pos], target_segment_infos_pos / m_nb_segments_per_proc, &size_seg, &
size_type, &ptr_seg);
487 if (error != MPI_SUCCESS) {
493 if (rank_reserved_part_span.
size() < future_sizeof_win) {
// Fix: placeholders were {1}/{2} for two arguments; Arccore format
// indices are 0-based (see the identical message in executeResize).
494 ARCCORE_FATAL(
"Bad realloc -- New size : {0} -- Needed size : {1}", rank_reserved_part_span.
size(), future_sizeof_win);
497 for (
Int64 pos_win = actual_sizeof_win, pos_elem = 0; pos_win < future_sizeof_win; ++pos_win, ++pos_elem) {
498 rank_reserved_part_span[pos_win] = m_add_requests[num_seg][pos_elem];
500 m_sizeof_used_part[target_segment_infos_pos] = future_sizeof_win;
503 m_target_segments[segment_infos_pos] = -1;
506 MPI_Barrier(m_comm_machine);
// Refresh our cached spans for segments another rank just edited.
508 for (
Integer num_seg = 0; num_seg < m_nb_segments_per_proc; ++num_seg) {
509 if (is_my_seg_edited[num_seg]) {
510 const Int32 segment_infos_pos = num_seg + m_comm_machine_rank * m_nb_segments_per_proc;
513 std::byte* ptr_seg =
nullptr;
515 int error = MPI_Win_shared_query(m_all_mpi_win[segment_infos_pos], m_comm_machine_rank, &size_seg, &
size_type, &ptr_seg);
517 if (error != MPI_SUCCESS) {
// requestReserve(num_seg, new_capacity): posts a capacity-grow request for
// our segment. The capacity must be a multiple of the element size (fatal
// body elided). If the current reserve already suffices, a no-op realloc
// marker is posted instead so the collective realloc stays balanced.
531 if (new_capacity % m_sizeof_type) {
535 const Int32 segment_infos_pos = num_seg + m_comm_machine_rank * m_nb_segments_per_proc;
537 if (new_capacity <= m_reserved_part_span[num_seg].size()) {
538 _requestRealloc(segment_infos_pos);
541 _requestRealloc(segment_infos_pos, new_capacity);
// requestResize(num_seg, new_size): records a resize of the *used* part of
// our segment. -1 appears to be rejected up front and the size must be a
// non-negative multiple of the element size (fatal bodies elided). Grows
// past the reserve trigger a realloc request; otherwise a no-op marker is
// posted. The used size itself is applied later in executeResize().
559 if (new_size == -1) {
562 if (new_size < 0 || new_size % m_sizeof_type) {
566 const Int32 segment_infos_pos = num_seg + m_comm_machine_rank * m_nb_segments_per_proc;
568 if (new_size > m_reserved_part_span[num_seg].size()) {
569 _requestRealloc(segment_infos_pos, new_size);
572 _requestRealloc(segment_infos_pos);
575 m_resize_requests[num_seg] = new_size;
576 m_resize_requested =
true;
// executeResize(): applies pending requestResize() requests after the
// collective realloc has run: verifies the reserve now covers the new
// size (fatal otherwise), publishes the new used size, and resets the
// request slot to the -1 sentinel.
587 if (!m_resize_requested) {
590 m_resize_requested =
false;
592 for (
Integer num_seg = 0; num_seg < m_nb_segments_per_proc; ++num_seg) {
593 if (m_resize_requests[num_seg] == -1) {
597 const Int32 segment_infos_pos = num_seg + m_comm_machine_rank * m_nb_segments_per_proc;
599 if (m_reserved_part_span[num_seg].size() < m_resize_requests[num_seg]) {
600 ARCCORE_FATAL(
"Bad realloc -- New size : {0} -- Needed size : {1}", m_reserved_part_span[num_seg].size(), m_resize_requests[num_seg]);
603 m_sizeof_used_part[segment_infos_pos] = m_resize_requests[num_seg];
604 m_resize_requests[num_seg] = -1;
// executeShrink(): requests a realloc of every one of our segments down to
// its exact used size (no-op marker when reserve already equals used size),
// releasing the slack reserved memory.
614 for (
Integer num_seg = 0; num_seg < m_nb_segments_per_proc; ++num_seg) {
615 const Int32 segment_infos_pos = num_seg + m_comm_machine_rank * m_nb_segments_per_proc;
617 if (m_reserved_part_span[num_seg].size() == m_sizeof_used_part[segment_infos_pos]) {
618 _requestRealloc(segment_infos_pos);
621 _requestRealloc(segment_infos_pos, m_sizeof_used_part[segment_infos_pos]);
// _requestRealloc(owner_pos_segment, new_capacity): publishes a realloc
// request of new_capacity bytes for the given flattened segment position
// in the node-shared m_need_resize window.
630void MpiMultiMachineShMemWinBaseInternal::
631_requestRealloc(
Int32 owner_pos_segment,
Int64 new_capacity)
const
633 m_need_resize[owner_pos_segment] = new_capacity;
// _requestRealloc(owner_pos_segment): publishes the -1 "no realloc needed"
// marker, used to keep the collective realloc pass balanced across ranks.
639void MpiMultiMachineShMemWinBaseInternal::
640_requestRealloc(
Int32 owner_pos_segment)
const
642 m_need_resize[owner_pos_segment] = -1;
// Collective execution of pending realloc/reserve requests (method name and
// the call performing the realloc are elided in this extraction): barrier,
// process requests, reset our m_need_resize entries to the -1 sentinel,
// barrier again.
648void MpiMultiMachineShMemWinBaseInternal::
653 MPI_Barrier(m_comm_machine);
659 for (
Integer num_seg = 0; num_seg < m_nb_segments_per_proc; ++num_seg) {
660 const Int32 segment_infos_pos = num_seg + m_comm_machine_rank * m_nb_segments_per_proc;
661 m_need_resize[segment_infos_pos] = -1;
669 MPI_Barrier(m_comm_machine);
// Collective realloc worker (method name elided in this extraction).
// For every (rank, segment) pair with a pending size in m_need_resize,
// collectively allocates a replacement shared window (owner passes the new
// size, other ranks pass 0), copies min(new size, used size) bytes from the
// old allocation on the owner, and frees the old window. Finally refreshes
// our cached reserved spans. All ranks must execute the same sequence of
// MPI_Win_allocate_shared / MPI_Win_free calls.
675void MpiMultiMachineShMemWinBaseInternal::
// Segments may be laid out non-contiguously across ranks.
679 MPI_Info_create(&win_info);
680 MPI_Info_set(win_info,
"alloc_shared_noncontig",
"true");
683 for (
Integer rank = 0; rank < m_comm_machine_size; ++rank) {
684 for (
Integer num_seg = 0; num_seg < m_nb_segments_per_proc; ++num_seg) {
686 const Int32 local_segment_infos_pos = num_seg + rank * m_nb_segments_per_proc;
// -1 = no realloc requested for this segment; skip it on every rank so
// the collective calls below stay matched.
688 if (m_need_resize[local_segment_infos_pos] == -1)
691 ARCCORE_ASSERT(m_need_resize[local_segment_infos_pos] >= 0, (
"New size must be >= 0"));
692 ARCCORE_ASSERT(m_need_resize[local_segment_infos_pos] % m_sizeof_type == 0, (
"New size must be % sizeof type"));
// Owner contributes the requested size (bumped to one element when 0);
// every other rank contributes 0 bytes to the collective allocation.
696 const Int64 size_seg = (m_comm_machine_rank == rank ? (m_need_resize[local_segment_infos_pos] == 0 ? m_sizeof_type : m_need_resize[local_segment_infos_pos]) : 0);
699 MPI_Win old_win = m_all_mpi_win[local_segment_infos_pos];
700 std::byte* ptr_new_seg =
nullptr;
703 int error = MPI_Win_allocate_shared(size_seg, m_sizeof_type, win_info, m_comm_machine, &ptr_new_seg, &m_all_mpi_win[local_segment_infos_pos]);
704 if (error != MPI_SUCCESS) {
705 MPI_Win_free(&old_win);
// Only the owning rank migrates the data from the old allocation.
710 if (m_comm_machine_rank == rank) {
716 std::byte* ptr_old_seg =
nullptr;
717 MPI_Aint mpi_reserved_size_new_seg;
721 MPI_Aint size_old_seg;
725 error = MPI_Win_shared_query(old_win, m_comm_machine_rank, &size_old_seg, &size_type, &ptr_old_seg);
726 if (error != MPI_SUCCESS || ptr_old_seg ==
nullptr) {
727 MPI_Win_free(&old_win);
// Sanity check: the queried base of the new window must match the
// pointer returned by MPI_Win_allocate_shared.
734 std::byte* ptr_seg =
nullptr;
738 error = MPI_Win_shared_query(m_all_mpi_win[local_segment_infos_pos], m_comm_machine_rank, &mpi_reserved_size_new_seg, &size_type, &ptr_seg);
739 if (error != MPI_SUCCESS || ptr_seg ==
nullptr || ptr_seg != ptr_new_seg) {
740 MPI_Win_free(&old_win);
// Copy only the bytes that fit in both old used part and new capacity
// (shrinking truncates the tail).
748 const Int64 min_size = std::min(m_need_resize[local_segment_infos_pos], m_sizeof_used_part[local_segment_infos_pos]);
750 memcpy(ptr_new_seg, ptr_old_seg, min_size);
// Collective release of the superseded window.
753 MPI_Win_free(&old_win);
756 MPI_Info_free(&win_info);
// Refresh our cached reserved spans from the (possibly new) windows.
759 for (
Integer num_seg = 0; num_seg < m_nb_segments_per_proc; ++num_seg) {
760 const Int32 segment_infos_pos = num_seg + m_comm_machine_rank * m_nb_segments_per_proc;
764 std::byte* ptr_seg =
nullptr;
765 int error = MPI_Win_shared_query(m_all_mpi_win[segment_infos_pos], m_comm_machine_rank, &size_seg, &size_type, &ptr_seg);
767 if (error != MPI_SUCCESS) {
771 m_reserved_part_span[num_seg] = Span<std::byte>{ ptr_seg, size_seg };
// _worldToMachine(world): linear search mapping a world rank to its index
// in m_machine_ranks (the machine-communicator rank). The return inside
// the match branch and the not-found handling are elided in this view.
792Int32 MpiMultiMachineShMemWinBaseInternal::
793_worldToMachine(
Int32 world)
const
781 for (
Int32 i = 0; i < m_comm_machine_size; ++i) {
782 if (m_machine_ranks[i] == world) {
// _machineToWorld(machine): inverse mapping — direct lookup of the world
// rank stored for a machine-communicator rank. No bounds check visible;
// callers must pass machine in [0, m_comm_machine_size).
792Int32 MpiMultiMachineShMemWinBaseInternal::
793_machineToWorld(
Int32 machine)
const
795 return m_machine_ranks[machine];
#define ARCCORE_FATAL(...)
Macro envoyant une exception FatalErrorException.
Vue constante d'un tableau de type T.
void requestAdd(Int32 num_seg, Span< const std::byte > elem)
Méthode permettant de demander l'ajout d'éléments dans l'un de nos segments.
Span< const std::byte > segmentConstView(Int32 num_seg) const
Méthode permettant d'obtenir une vue sur l'un de nos segments.
void executeResize()
Méthode permettant d'exécuter les requêtes de redimensionnement.
void executeShrink()
Méthode permettant de réduire l'espace mémoire réservé pour les segments au minimum nécessaire.
void requestReserve(Int32 num_seg, Int64 new_capacity)
Méthode permettant de demander la réservation d'espace mémoire pour un de nos segments.
void requestAddToAnotherSegment(Int32 thread, Int32 rank, Int32 num_seg, Span< const std::byte > elem)
Méthode permettant de demander l'ajout d'éléments dans un des segments de la fenêtre.
void executeReserve()
Méthode permettant d'exécuter les requêtes de réservation.
MpiMultiMachineShMemWinBaseInternal(SmallSpan< Int64 > sizeof_segments, Int32 nb_segments_per_proc, Int32 sizeof_type, const MPI_Comm &comm_machine, Int32 comm_machine_rank, Int32 comm_machine_size, ConstArrayView< Int32 > machine_ranks)
Le sizeof_segments ne doit pas être conservé !
void executeAdd()
Méthode permettant d'exécuter les requêtes d'ajout.
void requestResize(Int32 num_seg, Int64 new_size)
Méthode permettant de demander le redimensionnement d'un de nos segments.
void barrier() const
Méthode permettant d'attendre que tous les processus du noeud appellent cette méthode pour continuer ...
void executeAddToAnotherSegment()
Méthode permettant d'exécuter les requêtes d'ajout dans les segments d'autres processus.
Int32 sizeofOneElem() const
Méthode permettant d'obtenir la taille d'un élement de la fenêtre.
Span< std::byte > segmentView(Int32 num_seg)
Méthode permettant d'obtenir une vue sur l'un de nos segments.
ConstArrayView< Int32 > machineRanks() const
Méthode permettant d'obtenir les rangs qui possèdent un segment dans la fenêtre.
Vue d'un tableau d'éléments de type T.
constexpr __host__ __device__ pointer data() const noexcept
Pointeur sur le début de la vue.
constexpr __host__ __device__ bool empty() const noexcept
Retourne true si le tableau est vide (dimension nulle)
constexpr __host__ __device__ SizeType size() const noexcept
Retourne la taille du tableau.
Vue d'un tableau d'éléments de type T.
std::int64_t Int64
Type entier signé sur 64 bits.
Int32 Integer
Type représentant un entier.
std::int32_t Int32
Type entier signé sur 32 bits.