43 #define INTEL_ITTNOTIFY_API_PRIVATE
44 #include "ittnotify.h"
45 #include "legacy/ittnotify.h"
// __kmp_inline qualifies every hook declared in this header. Two alternative
// definitions follow: an empty expansion (so the hooks are ordinary functions) and
// `static inline`. The conditional that picks one of them is not visible in this
// excerpt.
48 #define __kmp_inline // Turn off inlining in debug mode.
50 #define __kmp_inline static inline
// Declared here and defined elsewhere. The KMP_FSYNC_SPIN_PREPARE and
// KMP_FSYNC_SPIN_ACQUIRED macros in this header compare sync_iters against it.
54 extern kmp_int32 __kmp_itt_prepare_delay;
// __kmp_itt_fini_ittlib is declared twice: once with C linkage and once with the
// default linkage. Presumably a __cplusplus-style guard selected one of the two;
// the guard itself is not visible in this excerpt.
56 extern "C" void __kmp_itt_fini_ittlib(
void);
58 extern void __kmp_itt_fini_ittlib(
void);
// Expands to a comma followed by x, i.e. it appends x as one more entry to an
// argument or parameter list. An alternative definition near the end of this header
// expands to nothing.
63 #define USE_ITT_BUILD_ARG(x) ,x
// The only two hooks declared without __kmp_inline. Judging by the names they set up
// and tear down the ITT support; their definitions are not visible in this excerpt.
65 void __kmp_itt_initialize();
66 void __kmp_itt_destroy();
// Parallel-region hooks. The names suggest they are reported around a region's fork
// and join (confirm against the definitions). `serialized` is optional and defaults
// to 0 in both declarations.
77 __kmp_inline
void __kmp_itt_region_forking(
int gtid,
int team_size,
int barriers,
int serialized = 0 );
78 __kmp_inline
void __kmp_itt_region_joined(
int gtid,
int serialized = 0 );
// Frame-submit hook. Takes a [begin, end] pair of __itt_timestamp values together
// with an imbalance value, a source location and a team size. `region` is optional
// and defaults to 0; its meaning is defined by the implementation, which is not
// visible in this excerpt.
83 __kmp_inline
void __kmp_itt_frame_submit(
int gtid, __itt_timestamp begin, __itt_timestamp end,
int imbalance,
ident_t *loc,
int team_size,
int region = 0 );
// Metadata hooks. All numeric payloads are passed as kmp_uint64.
// Imbalance record: begin, end, imbalance and reduction values for thread gtid.
87 __kmp_inline
void __kmp_itt_metadata_imbalance(
int gtid, kmp_uint64 begin, kmp_uint64 end, kmp_uint64 imbalance, kmp_uint64 reduction );
// Loop record: source location plus schedule type, iteration count and chunk.
89 __kmp_inline
void __kmp_itt_metadata_loop(
ident_t * loc, kmp_uint64
sched_type, kmp_uint64 iterations, kmp_uint64 chunk );
// Takes no arguments.
90 __kmp_inline
void __kmp_itt_metadata_single();
// Barrier hooks.
// Returns an opaque pointer for barrier type `bt` on thread `gtid`; `set_name` and
// `delta` are optional and default to 0. Presumably the returned pointer is what the
// three hooks below receive as `object` (confirm against the callers).
93 __kmp_inline
void * __kmp_itt_barrier_object(
int gtid,
int bt,
int set_name = 0,
int delta = 0 );
// The three barrier phases share one signature: thread id plus the opaque object.
94 __kmp_inline
void __kmp_itt_barrier_starting(
int gtid,
void *
object );
95 __kmp_inline
void __kmp_itt_barrier_middle(
int gtid,
void *
object );
96 __kmp_inline
void __kmp_itt_barrier_finished(
int gtid,
void *
object );
// Taskwait hooks.
// Returns an opaque pointer for thread `gtid`. Presumably it is the `object` later
// handed to the starting/finished hooks (confirm against the callers).
99 __kmp_inline
void * __kmp_itt_taskwait_object(
int gtid );
// Both phases take the thread id plus the opaque object.
100 __kmp_inline
void __kmp_itt_taskwait_starting(
int gtid,
void *
object );
101 __kmp_inline
void __kmp_itt_taskwait_finished(
int gtid,
void *
object );
// Task hooks. Unlike the barrier and taskwait hooks these take only an opaque
// object pointer and no thread id.
104 __kmp_inline
void __kmp_itt_task_starting(
void *
object );
105 __kmp_inline
void __kmp_itt_task_finished(
void *
object );
// User-lock hooks. Each takes the lock as a kmp_user_lock_p and returns nothing.
// Six events are declared: creating, acquiring, acquired, releasing, cancelled and
// destroyed.
108 __kmp_inline
void __kmp_itt_lock_creating( kmp_user_lock_p lock );
109 __kmp_inline
void __kmp_itt_lock_acquiring( kmp_user_lock_p lock );
110 __kmp_inline
void __kmp_itt_lock_acquired( kmp_user_lock_p lock );
111 __kmp_inline
void __kmp_itt_lock_releasing( kmp_user_lock_p lock );
112 __kmp_inline
void __kmp_itt_lock_cancelled( kmp_user_lock_p lock );
113 __kmp_inline
void __kmp_itt_lock_destroyed( kmp_user_lock_p lock );
// Critical-section hooks. Same signature as the lock hooks (a kmp_user_lock_p, no
// return value). Five events are declared; there is no "cancelled" counterpart here.
116 __kmp_inline
void __kmp_itt_critical_creating( kmp_user_lock_p lock );
117 __kmp_inline
void __kmp_itt_critical_acquiring( kmp_user_lock_p lock );
118 __kmp_inline
void __kmp_itt_critical_acquired( kmp_user_lock_p lock );
119 __kmp_inline
void __kmp_itt_critical_releasing( kmp_user_lock_p lock );
120 __kmp_inline
void __kmp_itt_critical_destroyed( kmp_user_lock_p lock );
// Start/end hook pair for a `single` construct (per the names); each takes only the
// thread id.
123 __kmp_inline
void __kmp_itt_single_start(
int gtid );
124 __kmp_inline
void __kmp_itt_single_end(
int gtid );
// Hooks for an `ordered` construct (per the names). Four events are declared: init,
// prep, start and end. Each takes only the thread id.
127 __kmp_inline
void __kmp_itt_ordered_init(
int gtid );
128 __kmp_inline
void __kmp_itt_ordered_prep(
int gtid );
129 __kmp_inline
void __kmp_itt_ordered_start(
int gtid );
130 __kmp_inline
void __kmp_itt_ordered_end(
int gtid );
// Thread hooks. __kmp_itt_thread_ignore takes no arguments (presumably it applies to
// the calling thread; confirm in the definition). __kmp_itt_thread_name takes the
// thread id.
133 __kmp_inline
void __kmp_itt_thread_ignore();
134 __kmp_inline
void __kmp_itt_thread_name(
int gtid );
// Hook taking an opaque object pointer together with a read-only C string `name`.
137 __kmp_inline
void __kmp_itt_system_object_created(
void *
object,
char const * name );
// Stack-stitching hooks built around an __itt_caller handle: create returns a
// handle, and destroy / callee_enter / callee_leave each take one by value.
// Parameter names are omitted in the last three declarations.
140 __kmp_inline __itt_caller __kmp_itt_stack_caller_create(
void);
141 __kmp_inline
void __kmp_itt_stack_caller_destroy(__itt_caller);
142 __kmp_inline
void __kmp_itt_stack_callee_enter(__itt_caller);
143 __kmp_inline
void __kmp_itt_stack_callee_leave(__itt_caller);
// SSC mark configuration.
// INCLUDE_SSC_MARKS defaults to (KMP_OS_LINUX && KMP_ARCH_X86_64) when the build has
// not defined it already. INSERT_SSC_MARK(tag) then has three candidate definitions:
//   - __SSC_MARK(tag), listed under the __INTEL_COMPILER check;
//   - an inline-asm sequence that moves the immediate `tag` into %ebx and emits the
//     bytes 0x64 0x67 0x90, with %ebx declared as clobbered;
//   - a no-op, ((void)0).
// The #else/#endif lines separating these branches are not visible in this excerpt.
157 #ifndef INCLUDE_SSC_MARKS
158 # define INCLUDE_SSC_MARKS (KMP_OS_LINUX && KMP_ARCH_X86_64)
162 #if (INCLUDE_SSC_MARKS && KMP_OS_LINUX && KMP_ARCH_X86_64)
165 #if defined( __INTEL_COMPILER )
166 # define INSERT_SSC_MARK(tag) __SSC_MARK(tag)
168 # define INSERT_SSC_MARK(tag) \
169 __asm__ __volatile__ ("movl %0, %%ebx; .byte 0x64, 0x67, 0x90 " ::"i"(tag):"%ebx")
172 # define INSERT_SSC_MARK(tag) ((void)0)
// Named markers. Each one passes a fixed tag to INSERT_SSC_MARK.
// Spin-wait start/end: tags 0x4376 and 0x4377.
181 #define SSC_MARK_SPIN_START() INSERT_SSC_MARK(0x4376)
182 #define SSC_MARK_SPIN_END() INSERT_SSC_MARK(0x4377)
// Forking, joining, invoking, dispatch-init, dispatch-next: consecutive tags
// 0xd693 through 0xd697.
190 #define SSC_MARK_FORKING() INSERT_SSC_MARK(0xd693)
191 #define SSC_MARK_JOINING() INSERT_SSC_MARK(0xd694)
192 #define SSC_MARK_INVOKING() INSERT_SSC_MARK(0xd695)
193 #define SSC_MARK_DISPATCH_INIT() INSERT_SSC_MARK(0xd696)
194 #define SSC_MARK_DISPATCH_NEXT() INSERT_SSC_MARK(0xd697)
// Thin wrappers over the ITT fsync notifications: each casts its (parenthesised)
// argument to void* and forwards it to the matching __itt_fsync_* call.
214 #define KMP_FSYNC_PREPARE( obj ) __itt_fsync_prepare( (void *)( obj ) )
215 #define KMP_FSYNC_CANCEL( obj ) __itt_fsync_cancel( (void *)( obj ) )
216 #define KMP_FSYNC_ACQUIRED( obj ) __itt_fsync_acquired( (void *)( obj ) )
217 #define KMP_FSYNC_RELEASING( obj ) __itt_fsync_releasing( (void *)( obj ) )
// KMP_FSYNC_SPIN_INIT( obj, spin ): opens a spin-wait sequence.
// It is not wrapped in do { } while (0): it declares `int sync_iters = 0;` directly
// in the caller's scope, and the SPIN_PREPARE / SPIN_ACQUIRED macros read that
// variable. When __itt_fsync_prepare_ptr is set it tests `obj == NULL`; the body of
// that test is not visible in this excerpt (and `spin` is not referenced in the
// visible lines). The expansion ends with SSC_MARK_SPIN_START() and no trailing
// semicolon, so the caller supplies it.
227 #undef KMP_FSYNC_SPIN_INIT
228 #define KMP_FSYNC_SPIN_INIT( obj, spin ) \
229 int sync_iters = 0; \
230 if ( __itt_fsync_prepare_ptr ) { \
231 if ( obj == NULL ) { \
235 SSC_MARK_SPIN_START()
// KMP_FSYNC_SPIN_PREPARE( obj ): intended for use inside the spin loop.
// It relies on the `sync_iters` variable introduced by KMP_FSYNC_SPIN_INIT. While
// __itt_fsync_prepare_ptr is set and sync_iters is still below
// __kmp_itt_prepare_delay, the outer branch is taken; once sync_iters has reached
// the delay, KMP_FSYNC_PREPARE is issued for obj. Several lines of the body
// (presumably including the counter update) are not visible in this excerpt.
237 #undef KMP_FSYNC_SPIN_PREPARE
238 #define KMP_FSYNC_SPIN_PREPARE( obj ) do { \
239 if ( __itt_fsync_prepare_ptr && sync_iters < __kmp_itt_prepare_delay ) { \
241 if ( sync_iters >= __kmp_itt_prepare_delay ) { \
242 KMP_FSYNC_PREPARE( (void*) obj ); \
246 #undef KMP_FSYNC_SPIN_ACQUIRED
247 #define KMP_FSYNC_SPIN_ACQUIRED( obj ) do { /* closes a spin-wait sequence; reads sync_iters from the enclosing scope */ \
248 SSC_MARK_SPIN_END(); /* the end marker is emitted unconditionally */ \
249 if ( sync_iters >= __kmp_itt_prepare_delay ) { /* report only when the spin reached the prepare delay */ \
250 KMP_FSYNC_ACQUIRED( (void*) obj ); \
259 #define KMP_ITT_IGNORE( statement ) do { /* brackets `statement` with an ITT state save/restore; the lines that run `statement` are not visible in this excerpt */ \
260 __itt_state_t __itt_state_; /* holds the saved state; assigned only when __itt_state_get_ptr is set */ \
261 if ( __itt_state_get_ptr ) { \
262 __itt_state_ = __itt_state_get(); /* remember the current state */ \
263 __itt_obj_mode_set( __itt_obj_prop_ignore, __itt_obj_state_set ); /* turn on the "ignore" object property */ \
266 if ( __itt_state_get_ptr ) { /* same guard as above, so the restore only runs if the save ran */ \
267 __itt_state_set( __itt_state_ ); \
271 const int KMP_MAX_FRAME_DOMAINS = 512; // capacity of each per-domain array declared below
// Counters for the barrier and region domains; declared here, defined elsewhere.
273 extern kmp_int32 __kmp_barrier_domain_count;
274 extern kmp_int32 __kmp_region_domain_count;
// Three tables of __itt_domain pointers (barrier, region, imbalance) and one table
// of team sizes, each with KMP_MAX_FRAME_DOMAINS entries. How the tables are indexed
// is decided by the implementation, which is not visible in this excerpt.
275 extern __itt_domain* __kmp_itt_barrier_domains[KMP_MAX_FRAME_DOMAINS];
276 extern __itt_domain* __kmp_itt_region_domains[KMP_MAX_FRAME_DOMAINS];
277 extern __itt_domain* __kmp_itt_imbalance_domains[KMP_MAX_FRAME_DOMAINS];
278 extern kmp_int32 __kmp_itt_region_team_size[KMP_MAX_FRAME_DOMAINS];
// A single domain pointer used for metadata (per its name).
279 extern __itt_domain * metadata_domain;
// No-op fallbacks. Every KMP_FSYNC_* macro expands to ((void)0), and KMP_ITT_IGNORE
// simply runs its statement inside do { } while (0). The closing
// `#endif // USE_ITT_NOTIFY` indicates that this is the branch taken when
// USE_ITT_NOTIFY is off; the matching #if/#else lines are not visible in this
// excerpt.
// Note: unlike the full KMP_FSYNC_SPIN_INIT, the no-op version declares no
// `sync_iters` variable.
284 # define KMP_FSYNC_PREPARE( obj ) ((void)0)
285 # define KMP_FSYNC_CANCEL( obj ) ((void)0)
286 # define KMP_FSYNC_ACQUIRED( obj ) ((void)0)
287 # define KMP_FSYNC_RELEASING( obj ) ((void)0)
289 # define KMP_FSYNC_SPIN_INIT( obj, spin ) ((void)0)
290 # define KMP_FSYNC_SPIN_PREPARE( obj ) ((void)0)
291 # define KMP_FSYNC_SPIN_ACQUIRED( obj ) ((void)0)
293 # define KMP_ITT_IGNORE(stmt ) do { stmt } while (0)
295 #endif // USE_ITT_NOTIFY
299 #include "kmp_itt.inl"
// A second copy of the no-op macro set, plus USE_ITT_BUILD_ARG(x) expanding to
// nothing (so the extra argument disappears from call sites). Presumably this is the
// branch for builds without ITT support; the guarding conditional is not visible in
// this excerpt.
309 # define KMP_FSYNC_PREPARE( obj ) ((void)0)
310 # define KMP_FSYNC_CANCEL( obj ) ((void)0)
311 # define KMP_FSYNC_ACQUIRED( obj ) ((void)0)
312 # define KMP_FSYNC_RELEASING( obj ) ((void)0)
314 # define KMP_FSYNC_SPIN_INIT( obj, spin ) ((void)0)
315 # define KMP_FSYNC_SPIN_PREPARE( obj ) ((void)0)
316 # define KMP_FSYNC_SPIN_ACQUIRED( obj ) ((void)0)
318 # define KMP_ITT_IGNORE(stmt ) do { stmt } while (0)
320 # define USE_ITT_BUILD_ARG(x)