df/d64/core_2RunCommandLaunchInfo_8h_source.html

// -*- tab-width: 2; indent-tabs-mode: nil; coding: utf-8-with-signature -*-

//-----------------------------------------------------------------------------

// Copyright 2000-2025 CEA (www.cea.fr) IFPEN (www.ifpenergiesnouvelles.com)

// See the top-level COPYRIGHT file for details.

// SPDX-License-Identifier: Apache-2.0

//-----------------------------------------------------------------------------

/*---------------------------------------------------------------------------*/

/* RunCommandLaunchInfo.h                                      (C) 2000-2025 */

/*                                                                           */

/* Informations pour l'exécution d'une 'RunCommand'.                         */

/*---------------------------------------------------------------------------*/

#ifndef ARCANE_ACCELERATOR_CORE_RUNCOMMANDLAUNCHINFO_H

#define ARCANE_ACCELERATOR_CORE_RUNCOMMANDLAUNCHINFO_H

/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/


#include "arcane/utils/ConcurrencyUtils.h"


#include "arcane/accelerator/core/KernelLaunchArgs.h"


/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/


namespace Arcane::Accelerator::impl

{


/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/


class ARCANE_ACCELERATOR_CORE_EXPORT RunCommandLaunchInfo

{

  // Les fonctions suivantes permettent de lancer les kernels.

  template <typename SyclKernel, typename Lambda, typename LambdaArgs, typename... ReducerArgs>

  friend void _applyKernelSYCL(impl::RunCommandLaunchInfo& launch_info, SyclKernel kernel, Lambda& func,

                               const LambdaArgs& args, const ReducerArgs&... reducer_args);

  template <typename CudaKernel, typename Lambda, typename LambdaArgs, typename... RemainingArgs>

  friend void _applyKernelCUDA(impl::RunCommandLaunchInfo& launch_info, const CudaKernel& kernel, Lambda& func,

                               const LambdaArgs& args, [[maybe_unused]] const RemainingArgs&... other_args);

  template <typename HipKernel, typename Lambda, typename LambdaArgs, typename... RemainingArgs>

  friend void _applyKernelHIP(impl::RunCommandLaunchInfo& launch_info, const HipKernel& kernel, const Lambda& func,

                              const LambdaArgs& args, [[maybe_unused]] const RemainingArgs&... other_args);


 public:


  using ThreadBlockInfo = KernelLaunchArgs;


 public:


  RunCommandLaunchInfo(RunCommand& command, Int64 total_loop_size);

  ~RunCommandLaunchInfo();

  RunCommandLaunchInfo(const RunCommandLaunchInfo&) = delete;

  RunCommandLaunchInfo operator=(const RunCommandLaunchInfo&) = delete;


 public:


  eExecutionPolicy executionPolicy() const { return m_exec_policy; }


  void beginExecute();


  void endExecute();


  KernelLaunchArgs kernelLaunchArgs() const { return m_kernel_launch_args; }


  ParallelLoopOptions computeParallelLoopOptions() const;


  const ForLoopRunInfo& loopRunInfo() const { return m_loop_run_info; }


  Int64 totalLoopSize() const { return m_total_loop_size; }


 private:


  RunCommand& m_command;

  bool m_has_exec_begun = false;

  bool m_is_notify_end_kernel_done = false;

  eExecutionPolicy m_exec_policy = eExecutionPolicy::Sequential;

  KernelLaunchArgs m_kernel_launch_args;

  ForLoopRunInfo m_loop_run_info;

  Int64 m_total_loop_size = 0;

  impl::RunQueueImpl* m_queue_impl = nullptr;


 private:


  KernelLaunchArgs _threadBlockInfo(const void* func, Int32 shared_memory_size) const;

  NativeStream _internalNativeStream();

  void _doEndKernelLaunch();

  KernelLaunchArgs _computeKernelLaunchArgs() const;


 private:


  void _computeLoopRunInfo();


  // Pour SYCL: enregistre l'évènement associé à la dernière commande de la file

  // \a sycl_event_ptr est de type 'sycl::event*'.

  void _addSyclEvent(void* sycl_event_ptr);

};


/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/


} // End namespace Arcane::Accelerator::impl


/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/


#endif

ConcurrencyUtils.h
Classes, Types et macros pour gérer la concurrence.

Arcane::Accelerator::RunCommand
Gestion d'une commande sur accélérateur.
Definition core/RunCommand.h:46

Arcane::Accelerator::impl::KernelLaunchArgs
Arguments pour lancer un kernel.
Definition KernelLaunchArgs.h:32

Arcane::Accelerator::impl::NativeStream
Type opaque pour encapsuler une 'stream' native.
Definition NativeStream.h:54

Arcane::Accelerator::impl::RunCommandLaunchInfo
Objet temporaire pour conserver les informations d'exécution d'une commande et regrouper les tests.
Definition core/RunCommandLaunchInfo.h:35

Arcane::Accelerator::impl::RunCommandLaunchInfo::totalLoopSize
Int64 totalLoopSize() const
Taille totale de la boucle.
Definition core/RunCommandLaunchInfo.h:97

Arcane::Accelerator::impl::RunCommandLaunchInfo::beginExecute
void beginExecute()
Indique qu'on commence l'exécution de la commande.
Definition RunCommandLaunchInfo.cc:62

Arcane::Accelerator::impl::RunCommandLaunchInfo::kernelLaunchArgs
KernelLaunchArgs kernelLaunchArgs() const
Informations sur le nombre de block/thread/grille du noyau à lancer.
Definition core/RunCommandLaunchInfo.h:83

Arcane::Accelerator::impl::RunCommandLaunchInfo::endExecute
void endExecute()
Signale la fin de l'exécution.
Definition RunCommandLaunchInfo.cc:81

Arcane::Accelerator::impl::RunCommandLaunchInfo::_applyKernelCUDA
friend void _applyKernelCUDA(impl::RunCommandLaunchInfo &launch_info, const CudaKernel &kernel, Lambda &func, const LambdaArgs &args, const RemainingArgs &... other_args)
Fonction générique pour exécuter un kernel CUDA.
Definition KernelLauncher.h:313

Arcane::Accelerator::impl::RunCommandLaunchInfo::loopRunInfo
const ForLoopRunInfo & loopRunInfo() const
Informations d'exécution de la boucle.
Definition core/RunCommandLaunchInfo.h:94

Arcane::Accelerator::impl::RunCommandLaunchInfo::_applyKernelHIP
friend void _applyKernelHIP(impl::RunCommandLaunchInfo &launch_info, const HipKernel &kernel, const Lambda &func, const LambdaArgs &args, const RemainingArgs &... other_args)
Fonction générique pour exécuter un kernel HIP.
Definition KernelLauncher.h:341

Arcane::Accelerator::impl::RunQueueImpl
File d'exécution pour accélérateur.
Definition core/internal/RunQueueImpl.h:42

Arcane::ForLoopRunInfo
Informations d'exécution d'une boucle.
Definition ConcurrencyUtils.h:56

Arcane::ParallelLoopOptions
Options d'exécution d'une boucle parallèle en multi-thread.
Definition ParallelLoopOptions.h:35

Arcane::Accelerator::eExecutionPolicy
eExecutionPolicy
Politique d'exécution pour un Runner.
Definition AcceleratorCoreGlobal.h:93

Arcane::Accelerator::eExecutionPolicy::Sequential
@ Sequential
Politique d'exécution séquentielle.
Definition AcceleratorCoreGlobal.h:97

Arcane::Int64
std::int64_t Int64
Type entier signé sur 64 bits.
Definition ArccoreGlobal.h:186

Arcane::Int32
std::int32_t Int32
Type entier signé sur 32 bits.
Definition ArccoreGlobal.h:184