14#include "arcane/std/PapiPerformanceService.h"
16#include "arcane/utils/ValueConvert.h"
17#include "arcane/utils/PlatformUtils.h"
18#include "arcane/utils/FatalErrorException.h"
19#include "arcane/utils/CriticalSection.h"
20#include "arcane/utils/IPerformanceCounterService.h"
22#include "arcane/FactoryService.h"
23#include "arcane/IParallelSuperMng.h"
25#include "arcane/std/ProfilingInfo.h"
26#include "arcane/impl/TimerMng.h"
48 if (PAPI_is_initialized()==PAPI_NOT_INITED){
49 int retval = PAPI_library_init(PAPI_VER_CURRENT);
50 if (retval!=PAPI_VER_CURRENT && retval>0)
51 ARCANE_FATAL(
"PAPI version mismatch r={0} current={1}",retval,PAPI_VER_CURRENT);
53 ARCANE_FATAL(
"Error in PAPI_library_init r={0} msg={1}",retval,PAPI_strerror(retval));
77PapiPerformanceService::
81, m_event_set(PAPI_NULL)
82, m_application(sbi.application())
89PapiPerformanceService::
90~PapiPerformanceService()
100ProfInfos* global_infos =
nullptr;
101int global_nb_total_call = 0;
107void PapiPerformanceService::
108arcane_papi_handler(
int EventSet,
void *address, long_long overflow_vector,
void *context)
110 ARCANE_UNUSED(context);
111 static bool is_in_handler =
false;
117 if (Exception::hasPendingException()){
118 cout <<
"** WARNING: PapiHandler in pending exception\n";
124 is_in_handler =
true;
125 ++global_nb_total_call;
127 int overflow_event[MAX_COUNTER];
128 int nb_overflow_event = MAX_COUNTER;
129 PAPI_get_overflow_event_index(EventSet,overflow_vector,overflow_event,&nb_overflow_event);
130 global_infos->addEvent(address,overflow_event,nb_overflow_event);
131 is_in_handler =
false;
137bool PapiPerformanceService::
138_addEvent(
int event_code,
int event_index)
140 char event_name[PAPI_MAX_STR_LEN];
142 int retval = PAPI_add_event(m_event_set,event_code);
143 PAPI_event_code_to_name(event_code,event_name);
144 info() <<
"Adding Papi event name=" << event_name;
145 if (retval!=PAPI_OK){
146 pwarning() <<
"** ERROR in add_event (index=" << event_index <<
") r=" << retval
147 <<
" msg=" << PAPI_strerror(retval);
156void PapiPerformanceService::
160 if (m_is_initialized)
165 m_is_initialized =
true;
167 int major = PAPI_VERSION_MAJOR(PAPI_VERSION);
168 int minor = PAPI_VERSION_MINOR(PAPI_VERSION);
169 int sub_minor = PAPI_VERSION_REVISION(PAPI_VERSION);
170 info() <<
"PROFILING: start profiling using 'PAPI' version="
171 << major <<
"." << minor <<
"." << sub_minor;
176 global_infos->setNbEventBeforeGettingStack(2000);
177 global_infos->setFunctionDepth(5);
181 const PAPI_exe_info_t *prginfo;
185 retval = PAPI_thread_init((
unsigned long (*)(
void)) (pthread_self));
187 ARCANE_FATAL(
"Error in PAPI_thread_init r={0} msg={1}",retval,PAPI_strerror(retval));
189 prginfo = PAPI_get_executable_info();
191 start =
reinterpret_cast<caddr_t
>(prginfo->address_info.text_start);
192 end =
reinterpret_cast<caddr_t
>(prginfo->address_info.text_end);
194 info() <<
"** PROGRAM INFOS: start=" << (long)start <<
" end=" << (
long)end <<
" length=" << (end-start);
196 if ((retval=PAPI_create_eventset(&m_event_set))!=PAPI_OK)
197 ARCANE_FATAL(
"ERROR in PAPI_create_eventset r={0}",retval);
199 const int NB_EVENT = 3;
200 int papi_events[NB_EVENT];
204 papi_events[0] = PAPI_TOT_CYC;
206 papi_events[1] = PAPI_RES_STL;
207 papi_events[2] = PAPI_DP_OPS;
210 int nb_event = NB_EVENT;
211 if (!papi_user_events.
null()){
213 papi_user_events.
split(strs,
':');
214 int nb_str = strs.
size();
216 for(
Integer i=0; i<nb_str; ++i ){
217 const String& ename = strs[i];
218 info() <<
"USER_EVENT name=" << ename;
220 int retval = PAPI_event_name_to_code((
char*)ename.
localstr(), &new_event);
221 if (retval!=PAPI_OK){
222 pwarning() <<
"Can not set event from name=" << ename <<
" r=" << retval;
225 papi_events[i+1] = new_event;
229 bool is_valid_event[NB_EVENT];
231 for(
Integer i=0; i<nb_event; ++i )
232 is_valid_event[i] = _addEvent(papi_events[i],i);
237 if (!period_str.
null()){
238 bool is_bad = builtInGetValue(m_period,period_str);
240 pwarning() <<
"Can not convert '" << period_str <<
"' to int";
244 if (!only_str.
null())
255 for(
Integer i=0; i<nb_event; ++i ){
256 if (is_valid_event[i]){
257 retval = PAPI_overflow(m_event_set, papi_events[i], m_period, 0, arcane_papi_handler);
258 if (retval!=PAPI_OK){
261 fatal() <<
"** ERROR in papi_overflow i=" << i <<
" r=" << retval
262 <<
" msg=" << PAPI_strerror(retval);
265 pwarning() <<
"** ERROR in papi_overflow i=" << i <<
" r=" << retval
266 <<
" msg=" << PAPI_strerror(retval);
267 is_valid_event[i] =
false;
271 info() <<
"Période de sampling: (en évènements) " << m_period;
279void PapiPerformanceService::
285 global_infos->startProfiling();
287 int retval = PAPI_start(m_event_set);
288 if (retval!=PAPI_OK){
298void PapiPerformanceService::
306void PapiPerformanceService::
309 float real_time = 0.0f;
310 float proc_time = 0.0f;
311 long long flpins = 0.0;
317#if PAPI_VERSION >= PAPI_VERSION_NUMBER(6,0,0,0)
318 int retval = PAPI_flops_rate(PAPI_DP_OPS, &real_time, &proc_time, &flpins, &mflops);
320 int retval = PAPI_flops(&real_time, &proc_time, &flpins, &mflops);
323 error() <<
"** ERROR in PAPI_flops r=" << retval;
325 info() <<
"PAPI_Flops: real_time=" << real_time
326 <<
" proc_time=" << proc_time
327 <<
" flpins=" << flpins
328 <<
" mflips=" << mflops;
335void PapiPerformanceService::
349 int retval = PAPI_stop(m_event_set,0);
350 if (retval!=PAPI_OK){
353 m_is_running =
false;
355 global_infos->stopProfiling();
361void PapiPerformanceService::
362printInfos(
bool dump_file)
365 global_infos->printInfos(dump_file);
371void PapiPerformanceService::
375 global_infos->dumpJSON(writer);
381void PapiPerformanceService::
385 global_infos->getInfos(array);
391void PapiPerformanceService::
395 global_infos->reset();
409 :
TimerMng(tm), m_nb_event(0), m_event_set(PAPI_NULL), m_is_started(
false),
410 m_is_init(
false), m_elapsed_us(0), m_elapsed_cycle()
415 PAPI_stop(m_event_set,m_values.data());
419 void _addEvent(
int event);
421 Real stop(
const char* msg);
446 long_long m_elapsed_us;
447 long_long m_elapsed_cycle;
458 int retval = PAPI_thread_init((
unsigned long (*)(
void)) (pthread_self));
459 if (retval != PAPI_OK)
462 retval = PAPI_create_eventset(&m_event_set);
466 _addEvent(PAPI_TOT_CYC);
467 _addEvent(PAPI_DP_OPS);
468 m_values.resize(m_nb_event);
470 m_start_values.resize(m_nb_event);
471 m_start_values.fill(0);
473 retval = PAPI_start(m_event_set);
474 if (retval != PAPI_OK)
485 int retval = PAPI_add_event(m_event_set,event);
486 if (retval!=PAPI_OK){
487 cerr <<
"** CAN NOT FIND EVENT " <<
event <<
'\n';
499 int retval = PAPI_read(m_event_set,m_start_values.data());
500 if (retval!=PAPI_OK){
501 cerr <<
"** CAN NOT START EVENT\n";
503 m_elapsed_us = PAPI_get_real_usec();
504 m_elapsed_cycle = PAPI_get_real_cyc();
513 int retval = PAPI_read(m_event_set,m_values.data());
514 if (retval!=PAPI_OK){
515 cerr <<
"** CAN NOT STOP EVENT\n";
517 long_long elapsed_us = PAPI_get_real_usec() - m_elapsed_us;
520 double sec_time = ((double)elapsed_us) / 1.0e6;
522 std::cout <<
" -- -- Time: ";
524 std::cout << msg <<
" = ";
526 std::cout << sec_time <<
" ";
530 long_long nb_cycle = m_values[0]-m_start_values[0];
531 long_long nb_flop = m_values[1]-m_start_values[1];
534 std::cout << nb_cycle <<
" ";
536 std::cout << nb_flop;
540 std::cout << nb_flop/elapsed_us;
572class PapiPerformanceCounterService
579 m_event_set(PAPI_NULL), m_is_started(
false)
582 ~PapiPerformanceCounterService()
585 (void)PAPI_stop(m_event_set,
nullptr);
599 retval = PAPI_thread_init((
unsigned long (*)(
void)) (pthread_self));
600 if (retval != PAPI_OK)
601 ARCANE_FATAL(
"Error in 'PAPI_thread_init' r={0}",retval);
605 retval = PAPI_create_eventset(&m_event_set);
607 ARCANE_FATAL(
"Error in 'PAPI_createeventset' r={0}",retval);
609 _addEvent(PAPI_TOT_CYC);
610 _addEvent(PAPI_RES_STL);
611 _addEvent(PAPI_L2_TCM);
613 void _addEvent(
int event)
615 int retval = PAPI_add_event(m_event_set,event);
616 if (retval!=PAPI_OK){
617 error() <<
"** CAN NOT FIND EVENT " <<
event <<
'\n';
626 int retval = PAPI_start(m_event_set);
627 if (retval != PAPI_OK)
635 int retval = PAPI_stop(m_event_set,
nullptr);
636 if (retval != PAPI_OK)
638 m_is_started =
false;
648 int retval = PAPI_read(m_event_set,values);
649 if (retval!=PAPI_OK){
650 error() <<
"Error in 'PAPI_read' during getCounters() r=" << retval;
654 for(
int i=0; i<n; ++i )
655 counters[i] = (
Int64)values[i] - counters[i];
658 for(
int i=0; i<n; ++i )
659 counters[i] = values[i];
665 std::array<Int64,MIN_COUNTER_SIZE> values;
675 bool m_is_started =
false;
682 ServiceProperty(
"PapiPerformanceCounterService",ST_Application),
#define ARCANE_CHECK_POINTER(ptr)
Macro retournant le pointeur ptr s'il est non nul ou lancant une exception s'il est nul.
#define ARCANE_FATAL(...)
Macro envoyant une exception FatalErrorException.
#define ARCANE_SERVICE_INTERFACE(ainterface)
Macro pour déclarer une interface lors de l'enregistrement d'un service.
Integer size() const
Nombre d'éléments du vecteur.
Classe de base d'un service.
Section critique en multi-thread.
virtual ITraceMng * traceMng() const =0
Gestionnaire de traces.
Interface d'un service de profiling.
Interface d'un gestionnaire de timer.
Interface du gestionnaire de traces.
Real _getRealTime() override
Retourne le temps réel.
void _setRealTime() override
Positionne un timer réel.
IApplication * application() const
Accès à l'application IApplication associé.
Structure contenant les informations pour créer un service.
Propriétés de création d'un service.
Chaîne de caractères unicode.
bool null() const
Retourne true si la chaîne est nulle.
const char * localstr() const
Retourne la conversion de l'instance dans l'encodage UTF-8.
void split(StringContainer &str_array, char c) const
Découpe la chaîne suivant le caractère c.
TimerMng(ITraceMng *msg)
Construit un timer lié au gestionnaire mng.
TraceAccessor(ITraceMng *m)
Construit un accesseur via le gestionnaire de trace m.
TraceMessage fatal() const
Flot pour un message d'erreur fatale.
TraceMessage info() const
Flot pour un message d'information.
TraceMessage error() const
Flot pour un message d'erreur.
ITraceMng * traceMng() const
Gestionnaire de trace.
TraceMessage pwarning() const
Vecteur 1D de données avec sémantique par valeur (style STL).
__host__ __device__ Real2 min(Real2 a, Real2 b)
Retourne le minimum de deux Real2.
#define ARCANE_REGISTER_SERVICE(aclass, a_service_property,...)
Macro pour enregistrer un service.
-*- tab-width: 2; indent-tabs-mode: nil; coding: utf-8-with-signature -*-
Array< Int64 > Int64Array
Tableau dynamique à une dimension d'entiers 64 bits.
ArrayView< Int64 > Int64ArrayView
Equivalent C d'un tableau à une dimension d'entiers 64 bits.
std::int64_t Int64
Type entier signé sur 64 bits.
Int32 Integer
Type représentant un entier.
@ ST_Application
Le service s'utilise au niveau de l'application.
double Real
Type représentant un réel.
UniqueArray< String > StringUniqueArray
Tableau dynamique à une dimension de chaînes de caractères.