41 #define INTEL_ITTNOTIFY_API_PRIVATE
42 #include "ittnotify.h"
43 #include "legacy/ittnotify.h"
// __kmp_inline: specifier placed in front of the ITT helper declarations in this header.
// Two alternative definitions are listed; the preprocessor conditional that selects
// between them is not visible in this excerpt.
46 #define __kmp_inline // Turn off inlining in debug mode.
// Alternative definition: helpers are declared `static inline`.
48 #define __kmp_inline static inline
// Threshold that the KMP_FSYNC_SPIN_PREPARE / KMP_FSYNC_SPIN_ACQUIRED macros in this
// header compare against their spin-iteration counter (sync_iters).
52 extern kmp_int32 __kmp_itt_prepare_delay;
// __kmp_itt_fini_ittlib is declared twice: once with C linkage and once without.
// NOTE(review): presumably these are the two arms of a __cplusplus check whose
// #if/#else/#endif lines are not visible in this excerpt -- confirm.
54 extern "C" void __kmp_itt_fini_ittlib(
void);
56 extern void __kmp_itt_fini_ittlib(
void);
// Expands to a comma followed by x, so it can append one extra argument to an
// argument list. A second definition near the end of this header expands to nothing.
61 #define USE_ITT_BUILD_ARG(x) ,x
// Declarations only; the definitions are not part of this excerpt.
// NOTE(review): judging by the names, these set up and tear down the ITT support --
// confirm against the definitions.
63 void __kmp_itt_initialize();
64 void __kmp_itt_destroy();
// Parallel-region notification helpers (declarations only).
// `serialized` defaults to 0 when the caller omits it.
// NOTE(review): `gtid` is presumably the global thread id, and the bodies presumably
// live in kmp_itt.inl (included further down in this header) -- confirm.
75 __kmp_inline
void __kmp_itt_region_forking(
int gtid,
int team_size,
int barriers,
int serialized = 0 );
76 __kmp_inline
void __kmp_itt_region_joined(
int gtid,
int serialized = 0 );
// Frame and metadata reporting helpers (declarations only).
// __kmp_itt_frame_submit takes a begin/end pair of __itt_timestamp values plus a
// source location (ident_t *) and team size; `region` defaults to 0 when omitted.
// NOTE(review): the meaning of `imbalance` and `region` is not visible here -- check
// the definitions before relying on them.
81 __kmp_inline
void __kmp_itt_frame_submit(
int gtid, __itt_timestamp begin, __itt_timestamp end,
int imbalance,
ident_t *loc,
int team_size,
int region = 0 );
// All values are passed as kmp_uint64; units are not stated in this header.
85 __kmp_inline
void __kmp_itt_metadata_imbalance(
int gtid, kmp_uint64 begin, kmp_uint64 end, kmp_uint64 imbalance, kmp_uint64 reduction );
// Takes a source location plus schedule type, iteration count and chunk as kmp_uint64.
87 __kmp_inline
void __kmp_itt_metadata_loop(
ident_t * loc, kmp_uint64
sched_type, kmp_uint64 iterations, kmp_uint64 chunk );
// Takes only the source location.
88 __kmp_inline
void __kmp_itt_metadata_single(
ident_t * loc );
// Barrier notification helpers (declarations only).
// __kmp_itt_barrier_object returns an opaque void * that the starting/middle/finished
// helpers accept as their `object` argument; `set_name` and `delta` default to 0.
// NOTE(review): `bt` is presumably a barrier-type selector -- confirm at the definition.
91 __kmp_inline
void * __kmp_itt_barrier_object(
int gtid,
int bt,
int set_name = 0,
int delta = 0 );
92 __kmp_inline
void __kmp_itt_barrier_starting(
int gtid,
void *
object );
93 __kmp_inline
void __kmp_itt_barrier_middle(
int gtid,
void *
object );
94 __kmp_inline
void __kmp_itt_barrier_finished(
int gtid,
void *
object );
// Taskwait notification helpers (declarations only).
// __kmp_itt_taskwait_object returns an opaque void * for the given gtid; the
// starting/finished helpers take a gtid together with such a pointer.
97 __kmp_inline
void * __kmp_itt_taskwait_object(
int gtid );
98 __kmp_inline
void __kmp_itt_taskwait_starting(
int gtid,
void *
object );
99 __kmp_inline
void __kmp_itt_taskwait_finished(
int gtid,
void *
object );
// Task start/finish notification helpers (declarations only). Both take just an
// opaque void * object; unlike the taskwait helpers, no gtid is passed.
102 __kmp_inline
void __kmp_itt_task_starting(
void *
object );
103 __kmp_inline
void __kmp_itt_task_finished(
void *
object );
// User-lock notification helpers (declarations only).
// __kmp_itt_lock_creating appears in two forms: with an extra `const ident_t *`
// parameter, listed directly under `#if KMP_USE_DYNAMIC_LOCK`, and without it.
// NOTE(review): the one-argument form is presumably the #else arm; the #else/#endif
// lines are not visible in this excerpt -- confirm.
106 #if KMP_USE_DYNAMIC_LOCK
107 __kmp_inline
void __kmp_itt_lock_creating( kmp_user_lock_p lock,
const ident_t * );
109 __kmp_inline
void __kmp_itt_lock_creating( kmp_user_lock_p lock );
// The remaining lock events all take only the lock pointer.
111 __kmp_inline
void __kmp_itt_lock_acquiring( kmp_user_lock_p lock );
112 __kmp_inline
void __kmp_itt_lock_acquired( kmp_user_lock_p lock );
113 __kmp_inline
void __kmp_itt_lock_releasing( kmp_user_lock_p lock );
114 __kmp_inline
void __kmp_itt_lock_cancelled( kmp_user_lock_p lock );
115 __kmp_inline
void __kmp_itt_lock_destroyed( kmp_user_lock_p lock );
// Critical-section notification helpers (declarations only); they mirror the lock
// helpers and likewise take a kmp_user_lock_p.
// __kmp_itt_critical_creating appears in two forms: with an extra `const ident_t *`
// parameter, listed directly under `#if KMP_USE_DYNAMIC_LOCK`, and without it.
// NOTE(review): the one-argument form is presumably the #else arm; the #else/#endif
// lines are not visible in this excerpt -- confirm.
118 #if KMP_USE_DYNAMIC_LOCK
119 __kmp_inline
void __kmp_itt_critical_creating( kmp_user_lock_p lock,
const ident_t * );
121 __kmp_inline
void __kmp_itt_critical_creating( kmp_user_lock_p lock );
// Note: there is no "cancelled" event declared for critical sections here.
123 __kmp_inline
void __kmp_itt_critical_acquiring( kmp_user_lock_p lock );
124 __kmp_inline
void __kmp_itt_critical_acquired( kmp_user_lock_p lock );
125 __kmp_inline
void __kmp_itt_critical_releasing( kmp_user_lock_p lock );
126 __kmp_inline
void __kmp_itt_critical_destroyed( kmp_user_lock_p lock );
// Start/end notification helpers for a `single` construct (declarations only).
// Each takes only a gtid.
129 __kmp_inline
void __kmp_itt_single_start(
int gtid );
130 __kmp_inline
void __kmp_itt_single_end(
int gtid );
// Notification helpers for `ordered` sections (declarations only): init, prep,
// start and end, each taking only a gtid.
// NOTE(review): the expected call order is not stated in this header -- see the callers.
133 __kmp_inline
void __kmp_itt_ordered_init(
int gtid );
134 __kmp_inline
void __kmp_itt_ordered_prep(
int gtid );
135 __kmp_inline
void __kmp_itt_ordered_start(
int gtid );
136 __kmp_inline
void __kmp_itt_ordered_end(
int gtid );
// Thread-level helpers (declarations only).
// NOTE(review): by name, thread_ignore marks the calling thread as ignored by the tool
// and thread_name assigns a name to the thread identified by gtid -- confirm at the
// definitions.
139 __kmp_inline
void __kmp_itt_thread_ignore();
140 __kmp_inline
void __kmp_itt_thread_name(
int gtid );
// Declaration only: takes an opaque object pointer and a read-only C string name.
// NOTE(review): ownership/lifetime requirements for `name` are not visible here.
143 __kmp_inline
void __kmp_itt_system_object_created(
void *
object,
char const * name );
// Stack caller/callee helpers (declarations only).
// __kmp_itt_stack_caller_create returns an __itt_caller handle; the destroy,
// callee_enter and callee_leave helpers each take such a handle by value.
146 __kmp_inline __itt_caller __kmp_itt_stack_caller_create(
void);
147 __kmp_inline
void __kmp_itt_stack_caller_destroy(__itt_caller);
148 __kmp_inline
void __kmp_itt_stack_callee_enter(__itt_caller);
149 __kmp_inline
void __kmp_itt_stack_callee_leave(__itt_caller);
// SSC mark support.
// INCLUDE_SSC_MARKS defaults to (KMP_OS_LINUX && KMP_ARCH_X86_64) unless it was
// already defined. INSERT_SSC_MARK(tag) then has three alternative definitions:
//   - with __INTEL_COMPILER defined: the __SSC_MARK(tag) intrinsic;
//   - an inline-asm form that moves the immediate tag into %ebx and emits the bytes
//     0x64, 0x67, 0x90, declaring %ebx as clobbered;
//   - a no-op, ((void)0).
// The #else/#endif lines that separate these arms are not visible in this excerpt.
163 #ifndef INCLUDE_SSC_MARKS
164 # define INCLUDE_SSC_MARKS (KMP_OS_LINUX && KMP_ARCH_X86_64)
168 #if (INCLUDE_SSC_MARKS && KMP_OS_LINUX && KMP_ARCH_X86_64)
171 #if defined( __INTEL_COMPILER )
172 # define INSERT_SSC_MARK(tag) __SSC_MARK(tag)
174 # define INSERT_SSC_MARK(tag) \
175 __asm__ __volatile__ ("movl %0, %%ebx; .byte 0x64, 0x67, 0x90 " ::"i"(tag):"%ebx")
178 # define INSERT_SSC_MARK(tag) ((void)0)
// Named SSC marks; each one expands to INSERT_SSC_MARK with a fixed tag value.
// Spin-wait start/end marks (used by the KMP_FSYNC_SPIN_* macros in this header):
187 #define SSC_MARK_SPIN_START() INSERT_SSC_MARK(0x4376)
188 #define SSC_MARK_SPIN_END() INSERT_SSC_MARK(0x4377)
// Marks with consecutive tags 0xd693..0xd697 for fork, join, invoke and dispatch events:
196 #define SSC_MARK_FORKING() INSERT_SSC_MARK(0xd693)
197 #define SSC_MARK_JOINING() INSERT_SSC_MARK(0xd694)
198 #define SSC_MARK_INVOKING() INSERT_SSC_MARK(0xd695)
199 #define SSC_MARK_DISPATCH_INIT() INSERT_SSC_MARK(0xd696)
200 #define SSC_MARK_DISPATCH_NEXT() INSERT_SSC_MARK(0xd697)
// Thin wrappers over the ITT fsync calls: each casts obj to void * and forwards it to
// the matching __itt_fsync_* call. No-op versions of the same macros appear later in
// this header.
220 #define KMP_FSYNC_PREPARE( obj ) __itt_fsync_prepare( (void *)( obj ) )
221 #define KMP_FSYNC_CANCEL( obj ) __itt_fsync_cancel( (void *)( obj ) )
222 #define KMP_FSYNC_ACQUIRED( obj ) __itt_fsync_acquired( (void *)( obj ) )
223 #define KMP_FSYNC_RELEASING( obj ) __itt_fsync_releasing( (void *)( obj ) )
// KMP_FSYNC_SPIN_INIT( obj, spin ): start of an instrumented spin-wait.
// Declares the local counter `sync_iters` (initialised to 0) directly in the scope
// where the macro is expanded; KMP_FSYNC_SPIN_PREPARE / KMP_FSYNC_SPIN_ACQUIRED read
// that same name. The visible lines test __itt_fsync_prepare_ptr and `obj == NULL`,
// and the macro ends with SSC_MARK_SPIN_START().
// NOTE(review): several continuation lines of this macro (the body of the NULL check
// and the closing braces) are missing from this excerpt; `obj` is presumably set from
// `spin` there -- confirm against the full header.
233 #undef KMP_FSYNC_SPIN_INIT
234 #define KMP_FSYNC_SPIN_INIT( obj, spin ) \
235 int sync_iters = 0; \
236 if ( __itt_fsync_prepare_ptr ) { \
237 if ( obj == NULL ) { \
241 SSC_MARK_SPIN_START()
// KMP_FSYNC_SPIN_PREPARE( obj ): intended to be used per spin iteration after
// KMP_FSYNC_SPIN_INIT (it reads the `sync_iters` local declared there).
// While __itt_fsync_prepare_ptr is set and sync_iters is still below
// __kmp_itt_prepare_delay the outer branch is taken; once sync_iters has reached the
// delay, KMP_FSYNC_PREPARE( obj ) is issued.
// NOTE(review): the line that advances sync_iters and the closing `} while (0)` are
// missing from this excerpt -- confirm against the full header.
243 #undef KMP_FSYNC_SPIN_PREPARE
244 #define KMP_FSYNC_SPIN_PREPARE( obj ) do { \
245 if ( __itt_fsync_prepare_ptr && sync_iters < __kmp_itt_prepare_delay ) { \
247 if ( sync_iters >= __kmp_itt_prepare_delay ) { \
248 KMP_FSYNC_PREPARE( (void*) obj ); \
// KMP_FSYNC_SPIN_ACQUIRED( obj ): end of an instrumented spin-wait.
// Always emits SSC_MARK_SPIN_END(); reports KMP_FSYNC_ACQUIRED( obj ) only when
// sync_iters has reached __kmp_itt_prepare_delay, i.e. the same condition under which
// KMP_FSYNC_SPIN_PREPARE issues its prepare notification.
// The closing lines of the macro are missing from this excerpt.
252 #undef KMP_FSYNC_SPIN_ACQUIRED
253 #define KMP_FSYNC_SPIN_ACQUIRED( obj ) do { \
254 SSC_MARK_SPIN_END(); \
255 if ( sync_iters >= __kmp_itt_prepare_delay ) { \
256 KMP_FSYNC_ACQUIRED( (void*) obj ); \
// KMP_ITT_IGNORE( statement ): wraps `statement` with a save/restore of the ITT state.
// When __itt_state_get_ptr is set, the current state is saved via __itt_state_get() and
// the object mode is switched with __itt_obj_prop_ignore; a second check of
// __itt_state_get_ptr then restores the saved state via __itt_state_set().
// NOTE(review): the lines that execute `statement` between the two checks, and the
// closing of the do/while, are missing from this excerpt -- confirm against the full header.
265 #define KMP_ITT_IGNORE( statement ) do { \
266 __itt_state_t __itt_state_; \
267 if ( __itt_state_get_ptr ) { \
268 __itt_state_ = __itt_state_get(); \
269 __itt_obj_mode_set( __itt_obj_prop_ignore, __itt_obj_state_set ); \
272 if ( __itt_state_get_ptr ) { \
273 __itt_state_set( __itt_state_ ); \
// Capacity (512 entries) shared by the per-frame tables declared below.
277 const int KMP_MAX_FRAME_DOMAINS = 512;
// Counters for the barrier and region domain tables.
// NOTE(review): presumably the number of entries currently in use -- confirm.
279 extern kmp_int32 __kmp_barrier_domain_count;
280 extern kmp_int32 __kmp_region_domain_count;
// Tables of ITT domain pointers, one slot per frame, each KMP_MAX_FRAME_DOMAINS long.
281 extern __itt_domain* __kmp_itt_barrier_domains[KMP_MAX_FRAME_DOMAINS];
282 extern __itt_domain* __kmp_itt_region_domains[KMP_MAX_FRAME_DOMAINS];
283 extern __itt_domain* __kmp_itt_imbalance_domains[KMP_MAX_FRAME_DOMAINS];
// Table of kmp_int32 team sizes with the same capacity as the domain tables.
284 extern kmp_int32 __kmp_itt_region_team_size[KMP_MAX_FRAME_DOMAINS];
// Single domain pointer; by name, the one used by the metadata helpers.
285 extern __itt_domain * metadata_domain;
// No-op versions of the fsync macros: each expands to ((void)0), so call sites compile
// unchanged. This group is closed by the `#endif // USE_ITT_NOTIFY` below, so it
// belongs to the USE_ITT_NOTIFY conditional; the matching #else line is not visible.
290 # define KMP_FSYNC_PREPARE( obj ) ((void)0)
291 # define KMP_FSYNC_CANCEL( obj ) ((void)0)
292 # define KMP_FSYNC_ACQUIRED( obj ) ((void)0)
293 # define KMP_FSYNC_RELEASING( obj ) ((void)0)
// Spin-wait macros likewise expand to nothing; no sync_iters local is declared here.
295 # define KMP_FSYNC_SPIN_INIT( obj, spin ) ((void)0)
296 # define KMP_FSYNC_SPIN_PREPARE( obj ) ((void)0)
297 # define KMP_FSYNC_SPIN_ACQUIRED( obj ) ((void)0)
// Runs stmt as-is, without any ITT state save/restore.
299 # define KMP_ITT_IGNORE(stmt ) do { stmt } while (0)
301 #endif // USE_ITT_NOTIFY
305 #include "kmp_itt.inl"
// Second set of no-op macro definitions, identical to the earlier no-op set.
// NOTE(review): presumably the fallback used when ITT support is compiled out
// entirely; the controlling #if/#else lines are not visible in this excerpt -- confirm.
315 # define KMP_FSYNC_PREPARE( obj ) ((void)0)
316 # define KMP_FSYNC_CANCEL( obj ) ((void)0)
317 # define KMP_FSYNC_ACQUIRED( obj ) ((void)0)
318 # define KMP_FSYNC_RELEASING( obj ) ((void)0)
320 # define KMP_FSYNC_SPIN_INIT( obj, spin ) ((void)0)
321 # define KMP_FSYNC_SPIN_PREPARE( obj ) ((void)0)
322 # define KMP_FSYNC_SPIN_ACQUIRED( obj ) ((void)0)
// Runs stmt as-is, without any ITT state save/restore.
324 # define KMP_ITT_IGNORE(stmt ) do { stmt } while (0)
// In this configuration the extra argument is dropped: the macro expands to nothing.
326 # define USE_ITT_BUILD_ARG(x)