160class SpecificMemoryCopyList
165 using InterfaceType =
typename Traits::InterfaceType;
166 template <
typename DataType,
typename Extent>
using SpecificType =
typename Traits::template SpecificType<DataType, Extent>;
167 using RefType =
typename Traits::RefType;
171 static constexpr Int32 NB_COPIER = 128;
175 SpecificMemoryCopyList()
177 m_copier.fill(
nullptr);
188 m_copier[10] = &m_s10;
190 m_copier[12] = &m_s12;
191 m_copier[16] = &m_s16;
192 m_copier[24] = &m_s24;
193 m_copier[32] = &m_s32;
194 m_copier[40] = &m_s40;
195 m_copier[48] = &m_s48;
196 m_copier[56] = &m_s56;
197 m_copier[64] = &m_s64;
198 m_copier[72] = &m_s72;
205 std::cout <<
"SpecificMemory::nb_specialized=" << m_nb_specialized
206 <<
" nb_generic=" << m_nb_generic <<
"\n";
212 for (
Int32 i = 0; i < NB_COPIER; ++i) {
213 auto* x = m_copier[i];
214 if (x && (x->datatypeSize() != i))
215 ARCANE_FATAL(
"Incoherent datatype size v={0} expected={1}", x->datatypeSize(), i);
221 RefType _copier(
Int32 v)
226 InterfaceType* x =
nullptr;
230 if (x->datatypeSize() != v)
231 ARCANE_FATAL(
"Incoherent datatype size v={0} expected={1}", x->datatypeSize(), v);
236 return RefType(x, v);
243 auto c = _copier(datatype_size);
248 auto c = _copier(datatype_size);
253 auto c = _copier(datatype_size);
258 auto c = _copier(datatype_size);
263 auto c = _copier(datatype_size);
268 auto c = _copier(datatype_size);
274 SpecificType<std::byte, ExtentValue<1>> m_s1;
275 SpecificType<Int16, ExtentValue<1>> m_s2;
276 SpecificType<std::byte, ExtentValue<3>> m_s3;
277 SpecificType<Int32, ExtentValue<1>> m_s4;
278 SpecificType<std::byte, ExtentValue<5>> m_s5;
279 SpecificType<Int16, ExtentValue<3>> m_s6;
280 SpecificType<std::byte, ExtentValue<7>> m_s7;
281 SpecificType<Int64, ExtentValue<1>> m_s8;
282 SpecificType<std::byte, ExtentValue<9>> m_s9;
283 SpecificType<Int16, ExtentValue<5>> m_s10;
284 SpecificType<Int32, ExtentValue<3>> m_s12;
286 SpecificType<Int64, ExtentValue<2>> m_s16;
287 SpecificType<Int64, ExtentValue<3>> m_s24;
288 SpecificType<Int64, ExtentValue<4>> m_s32;
289 SpecificType<Int64, ExtentValue<5>> m_s40;
290 SpecificType<Int64, ExtentValue<6>> m_s48;
291 SpecificType<Int64, ExtentValue<7>> m_s56;
292 SpecificType<Int64, ExtentValue<8>> m_s64;
293 SpecificType<Int64, ExtentValue<9>> m_s72;
295 std::array<InterfaceType*, NB_COPIER> m_copier;
296 std::atomic<Int32> m_nb_specialized = 0;
297 std::atomic<Int32> m_nb_generic = 0;
337 using BaseClass::_toTrueType;
341 using BaseClass::m_extent;
347 _copyFrom(args.m_indexes, _toTrueType(args.m_source), _toTrueType(args.m_destination));
351 _copyTo(args.m_indexes, _toTrueType(args.m_source), _toTrueType(args.m_destination));
355 _fill(args.m_indexes, _toTrueType(args.m_source), _toTrueType(args.m_destination));
359 _copyFrom(args.m_indexes, args.m_multi_memory, _toTrueType(args.m_source_buffer));
363 _copyTo(args.m_indexes, args.m_const_multi_memory, _toTrueType(args.m_destination_buffer));
367 _fill(args.m_indexes, args.m_multi_memory, _toTrueType(args.m_source_buffer));
380 for (
Int32 i = 0; i < nb_index; ++i) {
383 for (
Int32 z = 0, n = m_extent.v; z < n; ++z)
384 destination[z_index + z] = source[zci + z];
394 const Int32 value_size = indexes.
size() / 2;
395 for (
Int32 i = 0; i < value_size; ++i) {
396 Int32 index0 = indexes[i * 2];
397 Int32 index1 = indexes[(i * 2) + 1];
399 auto* orig_view_data =
reinterpret_cast<DataType*
>(orig_view_bytes.data());
402 Span<DataType> orig_view = { orig_view_data, orig_view_bytes.size() / (
Int64)
sizeof(DataType) };
405 for (
Int32 z = 0, n = m_extent.v; z < n; ++z)
406 orig_view[zci + z] = source[z_index + z];
424 Int64 nb_value = destination.
size() / m_extent.v;
425 for (
Int64 i = 0; i < nb_value; ++i) {
426 Int64 zci = i * m_extent.v;
427 for (
Int32 z = 0, n = m_extent.v; z < n; ++z)
428 destination[zci + z] = source[z];
433 for (
Int32 i = 0; i < nb_index; ++i) {
435 for (
Int32 z = 0, n = m_extent.v; z < n; ++z)
436 destination[zci + z] = source[z];
447 const Int32 nb_index = indexes.
size() / 2;
450 const Int32 nb_dim1 = multi_views.size();
451 for (
Int32 zz = 0; zz < nb_dim1; ++zz) {
453 Int64 nb_value = orig_view_bytes.
size() / ((
Int64)
sizeof(DataType) * m_extent.v);
454 auto* orig_view_data =
reinterpret_cast<DataType*
>(orig_view_bytes.
data());
456 for (
Int64 i = 0; i < nb_value; i += m_extent.v) {
459 for (
Int32 z = 0, n = m_extent.v; z < n; ++z)
460 orig_view[i + z] = source[z];
466 for (
Int32 i = 0; i < nb_index; ++i) {
467 Int32 index0 = indexes[i * 2];
468 Int32 index1 = indexes[(i * 2) + 1];
469 Span<std::byte> orig_view_bytes = multi_views[index0];
470 auto* orig_view_data =
reinterpret_cast<DataType*
>(orig_view_bytes.data());
473 Span<DataType> orig_view = { orig_view_data, orig_view_bytes.size() / (
Int64)
sizeof(DataType) };
475 for (
Int32 z = 0, n = m_extent.v; z < n; ++z)
476 orig_view[zci + z] = source[z];
481 void _copyTo(SmallSpan<const Int32> indexes, Span<const DataType> source,
482 Span<DataType> destination)
488 Int32 nb_index = indexes.size();
490 for (
Int32 i = 0; i < nb_index; ++i) {
493 for (
Int32 z = 0, n = m_extent.v; z < n; ++z)
494 destination[zci + z] = source[z_index + z];
498 void _copyTo(SmallSpan<const Int32> indexes, SmallSpan<
const Span<const std::byte>> multi_views,
499 Span<DataType> destination)
505 const Int32 value_size = indexes.size() / 2;
506 for (
Int32 i = 0; i < value_size; ++i) {
507 Int32 index0 = indexes[i * 2];
508 Int32 index1 = indexes[(i * 2) + 1];
509 Span<const std::byte> orig_view_bytes = multi_views[index0];
510 auto* orig_view_data =
reinterpret_cast<const DataType*
>(orig_view_bytes.data());
513 Span<const DataType> orig_view = { orig_view_data, orig_view_bytes.size() / (
Int64)
sizeof(DataType) };
516 for (
Int32 z = 0, n = m_extent.v; z < n; ++z)
517 destination[z_index + z] = orig_view[zci + z];
526class SpecificMemoryCopyRef
528 template <
typename DataType,
typename Extent>
using SpecificType =
typename Traits::template SpecificType<DataType, Extent>;
533 : m_specialized_copier(specialized_copier)
534 , m_used_copier(specialized_copier)
536 m_generic_copier.m_extent.v = datatype_size;
538 m_used_copier = &m_generic_copier;
543 m_used_copier->copyFrom(args);
548 m_used_copier->copyTo(args);
553 m_used_copier->fill(args);
558 m_used_copier->copyFrom(args);
563 m_used_copier->copyTo(args);
568 m_used_copier->fill(args);
574 SpecificType<std::byte, ExtentValue<DynExtent>> m_generic_copier;