22 #define INTEL_ITTNOTIFY_API_PRIVATE 23 #include "ittnotify.h" 24 #include "legacy/ittnotify.h" 27 #define __kmp_inline // Turn off inlining in debug mode. 29 #define __kmp_inline static inline 33 extern kmp_int32 __kmp_itt_prepare_delay;
// Declaration of __kmp_itt_fini_ittlib(); it takes no arguments and returns
// nothing. The two spellings are alternatives, not a pair: the `extern "C"`
// linkage specification only exists in C++, so it is selected by __cplusplus
// and a plain `extern` declaration is used when this header is compiled as C.
// NOTE(review): the definition is not visible in this header; judging by the
// name it shuts down the ITT library -- confirm against the implementation.
#ifdef __cplusplus
extern "C" void __kmp_itt_fini_ittlib(void);
#else
extern void __kmp_itt_fini_ittlib(void);
#endif
// Expands to a leading comma followed by its argument, so an extra argument
// can be appended to an existing parameter or argument list:
//   f(a USE_ITT_BUILD_ARG(b))   ->   f(a , b)
// The macro must end at the end of its own line; anything else placed on the
// #define line would become part of the replacement list.
#define USE_ITT_BUILD_ARG(x) , x

// Entry points that take no arguments and return nothing (declarations only;
// the bodies are not visible in this header).
// NOTE(review): presumably called once at ITT support start-up and shutdown
// respectively -- confirm against the definitions.
void __kmp_itt_initialize();
void __kmp_itt_destroy();
57 __kmp_itt_region_forking(
int gtid,
int team_size,
60 __kmp_itt_region_joined(
int gtid);
65 __kmp_inline
void __kmp_itt_frame_submit(
int gtid, __itt_timestamp begin,
66 __itt_timestamp end,
int imbalance,
73 __kmp_inline
void __kmp_itt_metadata_imbalance(
int gtid, kmp_uint64 begin,
76 kmp_uint64 reduction);
80 kmp_uint64 iterations,
82 __kmp_inline
void __kmp_itt_metadata_single(
ident_t *loc);
85 __kmp_inline
void *__kmp_itt_barrier_object(
int gtid,
int bt,
int set_name = 0,
87 __kmp_inline
void __kmp_itt_barrier_starting(
int gtid,
void *
object);
88 __kmp_inline
void __kmp_itt_barrier_middle(
int gtid,
void *
object);
89 __kmp_inline
void __kmp_itt_barrier_finished(
int gtid,
void *
object);
92 __kmp_inline
void *__kmp_itt_taskwait_object(
int gtid);
93 __kmp_inline
void __kmp_itt_taskwait_starting(
int gtid,
void *
object);
94 __kmp_inline
void __kmp_itt_taskwait_finished(
int gtid,
void *
object);
97 __kmp_inline
void __kmp_itt_task_starting(
void *
object);
98 __kmp_inline
void __kmp_itt_task_finished(
void *
object);
101 #if KMP_USE_DYNAMIC_LOCK 102 __kmp_inline
void __kmp_itt_lock_creating(kmp_user_lock_p lock,
105 __kmp_inline
void __kmp_itt_lock_creating(kmp_user_lock_p lock);
107 __kmp_inline
void __kmp_itt_lock_acquiring(kmp_user_lock_p lock);
108 __kmp_inline
void __kmp_itt_lock_acquired(kmp_user_lock_p lock);
109 __kmp_inline
void __kmp_itt_lock_releasing(kmp_user_lock_p lock);
110 __kmp_inline
void __kmp_itt_lock_cancelled(kmp_user_lock_p lock);
111 __kmp_inline
void __kmp_itt_lock_destroyed(kmp_user_lock_p lock);
114 #if KMP_USE_DYNAMIC_LOCK 115 __kmp_inline
void __kmp_itt_critical_creating(kmp_user_lock_p lock,
118 __kmp_inline
void __kmp_itt_critical_creating(kmp_user_lock_p lock);
120 __kmp_inline
void __kmp_itt_critical_acquiring(kmp_user_lock_p lock);
121 __kmp_inline
void __kmp_itt_critical_acquired(kmp_user_lock_p lock);
122 __kmp_inline
void __kmp_itt_critical_releasing(kmp_user_lock_p lock);
123 __kmp_inline
void __kmp_itt_critical_destroyed(kmp_user_lock_p lock);
126 __kmp_inline
void __kmp_itt_single_start(
int gtid);
127 __kmp_inline
void __kmp_itt_single_end(
int gtid);
130 __kmp_inline
void __kmp_itt_ordered_init(
int gtid);
131 __kmp_inline
void __kmp_itt_ordered_prep(
int gtid);
132 __kmp_inline
void __kmp_itt_ordered_start(
int gtid);
133 __kmp_inline
void __kmp_itt_ordered_end(
int gtid);
136 __kmp_inline
void __kmp_itt_thread_ignore();
137 __kmp_inline
void __kmp_itt_thread_name(
int gtid);
140 __kmp_inline
void __kmp_itt_system_object_created(
void *
object,
144 __kmp_inline __itt_caller __kmp_itt_stack_caller_create(
void);
145 __kmp_inline
void __kmp_itt_stack_caller_destroy(__itt_caller);
146 __kmp_inline
void __kmp_itt_stack_callee_enter(__itt_caller);
147 __kmp_inline
void __kmp_itt_stack_callee_leave(__itt_caller);
159 #ifndef INCLUDE_SSC_MARKS 160 #define INCLUDE_SSC_MARKS (KMP_OS_LINUX && KMP_ARCH_X86_64) 164 #if (INCLUDE_SSC_MARKS && KMP_OS_LINUX && KMP_ARCH_X86_64) 167 #if defined(__INTEL_COMPILER) 168 #define INSERT_SSC_MARK(tag) __SSC_MARK(tag) 170 #define INSERT_SSC_MARK(tag) \ 171 __asm__ __volatile__("movl %0, %%ebx; .byte 0x64, 0x67, 0x90 " ::"i"(tag) \ 175 #define INSERT_SSC_MARK(tag) ((void)0) 182 #define SSC_MARK_SPIN_START() INSERT_SSC_MARK(0x4376) 183 #define SSC_MARK_SPIN_END() INSERT_SSC_MARK(0x4377) 191 #define SSC_MARK_FORKING() INSERT_SSC_MARK(0xd693) 192 #define SSC_MARK_JOINING() INSERT_SSC_MARK(0xd694) 193 #define SSC_MARK_INVOKING() INSERT_SSC_MARK(0xd695) 194 #define SSC_MARK_DISPATCH_INIT() INSERT_SSC_MARK(0xd696) 195 #define SSC_MARK_DISPATCH_NEXT() INSERT_SSC_MARK(0xd697) 215 #define KMP_FSYNC_PREPARE(obj) __itt_fsync_prepare((void *)(obj)) 216 #define KMP_FSYNC_CANCEL(obj) __itt_fsync_cancel((void *)(obj)) 217 #define KMP_FSYNC_ACQUIRED(obj) __itt_fsync_acquired((void *)(obj)) 218 #define KMP_FSYNC_RELEASING(obj) __itt_fsync_releasing((void *)(obj)) 226 #undef KMP_FSYNC_SPIN_INIT 227 #define KMP_FSYNC_SPIN_INIT(obj, spin) \ 228 int sync_iters = 0; \ 229 if (__itt_fsync_prepare_ptr) { \ 234 SSC_MARK_SPIN_START() 236 #undef KMP_FSYNC_SPIN_PREPARE 237 #define KMP_FSYNC_SPIN_PREPARE(obj) \ 239 if (__itt_fsync_prepare_ptr && sync_iters < __kmp_itt_prepare_delay) { \ 241 if (sync_iters >= __kmp_itt_prepare_delay) { \ 242 KMP_FSYNC_PREPARE((void *)obj); \ 246 #undef KMP_FSYNC_SPIN_ACQUIRED 247 #define KMP_FSYNC_SPIN_ACQUIRED(obj) \ 249 SSC_MARK_SPIN_END(); \ 250 if (sync_iters >= __kmp_itt_prepare_delay) { \ 251 KMP_FSYNC_ACQUIRED((void *)obj); \ 260 #define KMP_ITT_IGNORE(statement) \ 262 __itt_state_t __itt_state_; \ 263 if (__itt_state_get_ptr) { \ 264 __itt_state_ = __itt_state_get(); \ 265 __itt_obj_mode_set(__itt_obj_prop_ignore, __itt_obj_state_set); \ 268 if (__itt_state_get_ptr) { \ 269 __itt_state_set(__itt_state_); \ 273 const int 
KMP_MAX_FRAME_DOMAINS =
276 extern kmp_int32 __kmp_barrier_domain_count;
277 extern kmp_int32 __kmp_region_domain_count;
278 extern __itt_domain *__kmp_itt_barrier_domains[KMP_MAX_FRAME_DOMAINS];
279 extern __itt_domain *__kmp_itt_region_domains[KMP_MAX_FRAME_DOMAINS];
280 extern __itt_domain *__kmp_itt_imbalance_domains[KMP_MAX_FRAME_DOMAINS];
281 extern kmp_int32 __kmp_itt_region_team_size[KMP_MAX_FRAME_DOMAINS];
282 extern __itt_domain *metadata_domain;
283 extern __itt_string_handle *string_handle_imbl;
284 extern __itt_string_handle *string_handle_loop;
285 extern __itt_string_handle *string_handle_sngl;
290 #define KMP_FSYNC_PREPARE(obj) ((void)0) 291 #define KMP_FSYNC_CANCEL(obj) ((void)0) 292 #define KMP_FSYNC_ACQUIRED(obj) ((void)0) 293 #define KMP_FSYNC_RELEASING(obj) ((void)0) 295 #define KMP_FSYNC_SPIN_INIT(obj, spin) ((void)0) 296 #define KMP_FSYNC_SPIN_PREPARE(obj) ((void)0) 297 #define KMP_FSYNC_SPIN_ACQUIRED(obj) ((void)0) 299 #define KMP_ITT_IGNORE(stmt) \ 304 #endif // USE_ITT_NOTIFY 308 #include "kmp_itt.inl" 318 #define KMP_FSYNC_PREPARE(obj) ((void)0) 319 #define KMP_FSYNC_CANCEL(obj) ((void)0) 320 #define KMP_FSYNC_ACQUIRED(obj) ((void)0) 321 #define KMP_FSYNC_RELEASING(obj) ((void)0) 323 #define KMP_FSYNC_SPIN_INIT(obj, spin) ((void)0) 324 #define KMP_FSYNC_SPIN_PREPARE(obj) ((void)0) 325 #define KMP_FSYNC_SPIN_ACQUIRED(obj) ((void)0) 327 #define KMP_ITT_IGNORE(stmt) \ 332 #define USE_ITT_BUILD_ARG(x)