8#include <gtest/gtest.h>
10#include "arccore/base/PlatformUtils.h"
12#include "arccore/common/accelerator/Runner.h"
13#include "arccore/common/accelerator/RunQueue.h"
28_testCooperativeLaunch_GridSync(
RunQueue queue, Int32 nb_value, Int32 nb_loop, Int32 nb_loop2)
32 for (
int j = 0; j < nb_loop; ++j) {
37 auto grid = iter.grid();
38 for (Int32 j = 0; j < nb_loop2; ++j) {
45 Real diff = (y - x) * 1000.0;
46 std::cout <<
"** TotalCooperativeLaunch_GridSync nb_value=" << nb_value
47 <<
" nb_loop2=" << nb_loop2 <<
" time(ms)=" << diff <<
"\n";
Types and macros for managing hierarchical parallelism on accelerators.
#define RUNCOMMAND_LAUNCH(iter_name, bounds,...)
Macro to launch a command using hierarchical, possibly cooperative, parallelism.
Iteration range of a loop using cooperative hierarchical parallelism.
Execution queue for an accelerator.
Namespace for accelerator usage.
RunCommand makeCommand(const RunQueue &run_queue)
Creates a command associated with the queue run_queue.
-*- tab-width: 2; indent-tabs-mode: nil; coding: utf-8-with-signature -*-