14#include "arcane/accelerator/core/internal/RunQueueImpl.h"
16#include "arcane/utils/FatalErrorException.h"
18#include "arcane/utils/SmallArray.h"
20#include "arcane/accelerator/core/internal/IRunnerRuntime.h"
21#include "arcane/accelerator/core/internal/IRunQueueStream.h"
22#include "arcane/accelerator/core/internal/RunCommandImpl.h"
23#include "arcane/accelerator/core/internal/RunnerImpl.h"
24#include "arcane/accelerator/core/internal/IRunQueueEventImpl.h"
25#include "arcane/accelerator/core/Runner.h"
26#include "arcane/accelerator/core/RunQueueBuildInfo.h"
27#include "arcane/accelerator/core/DeviceId.h"
28#include "arcane/accelerator/core/RunQueueEvent.h"
30#include <unordered_set>
35namespace Arcane::Accelerator::impl
46 explicit Lock(RunQueueImpl* p)
48 if (p->m_use_pool_mutex) {
49 m_mutex = p->m_pool_mutex.get();
61 Lock& operator=(
const Lock&) =
delete;
65 std::mutex* m_mutex =
nullptr;
73: m_runner_impl(runner_impl)
74, m_execution_policy(runner_impl->executionPolicy())
75, m_runtime(runner_impl->runtime())
76, m_queue_stream(m_runtime->createStream(bi))
87 delete m_queue_stream;
100 std::unordered_set<RunCommandImpl*> command_set;
101 while (!m_run_command_pool.empty()) {
102 RunCommandImpl* c = m_run_command_pool.top();
104 if (command_set.find(c) != command_set.end())
105 std::cerr <<
"Command is present several times in the command pool\n";
106 command_set.insert(c);
108 RunCommand::_internalDestroyImpl(c);
109 m_run_command_pool.pop();
117_destroy(RunQueueImpl* q)
119 q->_freeCommandsInPool();
137 if (!m_active_run_command_list.empty()) {
138 if (!_internalStream()->_barrierNoException()) {
139 _internalFreeRunningCommands();
142 std::cerr <<
"WARNING: Error in internal accelerator barrier\n";
145 m_runner_impl->_internalPutRunQueueImplInPool(
this);
155_setDefaultMemoryRessource()
157 m_memory_ressource = eMemoryRessource::Host;
159 m_memory_ressource = eMemoryRessource::UnifiedMemory;
165MemoryAllocationOptions RunQueueImpl::
166allocationOptions()
const
169 Int16 device_id =
static_cast<Int16
>(m_runner_impl->deviceId().asInt32());
170 opt.setDevice(device_id);
178isAutoPrefetchCommand()
const
180 return m_runner_impl->isAutoPrefetchCommand();
187copyMemory(
const MemoryCopyArgs& args)
const
189 _internalStream()->copyMemory(args);
196prefetchMemory(
const MemoryPrefetchArgs& args)
const
198 _internalStream()->prefetchMemory(args);
205recordEvent(RunQueueEvent& event)
207 auto* p =
event._internalEventImpl();
208 return p->recordQueue(_internalStream());
215waitEvent(RunQueueEvent& event)
217 auto* p =
event._internalEventImpl();
218 return p->waitForEvent(_internalStream());
224RunQueueImpl* RunQueueImpl::
227 return _reset(r->_internalCreateOrGetRunQueueImpl());
233RunQueueImpl* RunQueueImpl::
234create(RunnerImpl* r,
const RunQueueBuildInfo& bi)
236 return _reset(r->_internalCreateOrGetRunQueueImpl(bi));
242RunCommandImpl* RunQueueImpl::
243_internalCreateOrGetRunCommandImpl()
245 RunCommandImpl* p =
nullptr;
248 auto& pool = m_run_command_pool;
256 p = RunCommand::_internalCreateImpl(
this);
270_internalFreeRunningCommands()
272 if (m_use_pool_mutex) {
273 SmallArray<RunCommandImpl*> command_list;
278 for (RunCommandImpl* p : m_active_run_command_list) {
281 m_active_run_command_list.clear();
283 for (RunCommandImpl* p : command_list) {
284 p->notifyEndExecuteKernel();
288 for (RunCommandImpl* p : command_list) {
289 _checkPutCommandInPoolNoLock(p);
294 for (RunCommandImpl* p : m_active_run_command_list) {
295 p->notifyEndExecuteKernel();
296 _checkPutCommandInPoolNoLock(p);
298 m_active_run_command_list.clear();
315_checkPutCommandInPoolNoLock(RunCommandImpl* p)
317 if (p->m_has_living_run_command)
318 p->m_may_be_put_in_pool =
true;
320 m_run_command_pool.push(p);
327_addRunningCommand(RunCommandImpl* p)
330 m_active_run_command_list.add(p);
337_putInCommandPool(RunCommandImpl* p)
340 m_run_command_pool.push(p);
351 _internalStream()->barrier();
352 _internalFreeRunningCommands();
364RunQueueImpl* RunQueueImpl::
365_reset(RunQueueImpl* p)
367 p->m_is_async =
false;
368 p->_setDefaultMemoryRessource();
376setConcurrentCommandCreation(
bool v)
378 m_use_pool_mutex = v;
379 if (!m_pool_mutex.get())
380 m_pool_mutex = std::make_unique<std::mutex>();
387dumpStats(std::ostream& ostr)
const
389 ostr <<
"nb_pool=" << m_run_command_pool.size()
390 <<
" nb_active=" << m_active_run_command_list.size() <<
"\n";
Fonctions de gestion mémoire et des allocateurs.
Informations pour créer une RunQueue.
Verrou pour le pool de RunCommand en multi-thread.
bool isAcceleratorPolicy(eExecutionPolicy exec_policy)
Indique si exec_policy correspond à un accélérateur.
MemoryAllocationOptions getAllocationOptions(eMemoryResource mem_resource)
Allocation par défaut pour la ressource mem_resource.
bool arcaneIsCheck()
Vrai si on est en mode vérification.
std::int32_t Int32
Type entier signé sur 32 bits.