17 #include "kmp_affinity.h" 19 kmp_key_t __kmp_gtid_threadprivate_key;
21 #if KMP_ARCH_X86 || KMP_ARCH_X86_64 22 kmp_cpuinfo_t __kmp_cpuinfo = {0};
26 #include "kmp_stats.h" 28 kmp_tas_lock_t __kmp_stats_lock;
32 kmp_stats_list *__kmp_stats_list;
35 __thread kmp_stats_list *__kmp_stats_thread_ptr = NULL;
38 tsc_tick_count __kmp_stats_start_time;
/* Five volatile int flags, every one of them starting out FALSE.
 * NOTE(review): the names suggest each flag records that one stage of
 * runtime initialization (serial, gtid, common, middle, parallel) has
 * completed -- confirm against the code that sets them. */
44 volatile int __kmp_init_serial = FALSE;
45 volatile int __kmp_init_gtid = FALSE;
46 volatile int __kmp_init_common = FALSE;
47 volatile int __kmp_init_middle = FALSE;
48 volatile int __kmp_init_parallel = FALSE;
50 volatile int __kmp_init_monitor =
53 volatile int __kmp_init_user_locks = FALSE;
/* Head pointer of a kmp_cached_addr_t list; starts out empty (NULL). */
56 kmp_cached_addr_t *__kmp_threadpriv_cache_list = NULL;
/* Plain int globals, all zero-initialized. */
58 int __kmp_init_counter = 0;
59 int __kmp_root_counter = 0;
60 int __kmp_version = 0;
/* Volatile 32-bit unsigned counters, both starting at zero.
 * NOTE(review): presumably used to hand out team / task ids -- confirm. */
62 volatile kmp_uint32 __kmp_team_counter = 0;
63 volatile kmp_uint32 __kmp_task_counter = 0;
/* Wait and stack-size tunables. Every value here is seeded from a
 * KMP_DEFAULT_* or KMP_MIN_* macro, except __kmp_monitor_stksize, which
 * starts at 0.
 * NOTE(review): units (bytes, spin iterations, ...) are not visible in this
 * file section -- check the macro definitions. */
65 unsigned int __kmp_init_wait =
66 KMP_DEFAULT_INIT_WAIT;
67 unsigned int __kmp_next_wait =
68 KMP_DEFAULT_NEXT_WAIT;
70 size_t __kmp_stksize = KMP_DEFAULT_STKSIZE;
72 size_t __kmp_monitor_stksize = 0;
74 size_t __kmp_stkoffset = KMP_DEFAULT_STKOFFSET;
75 int __kmp_stkpadding = KMP_MIN_STKPADDING;
77 size_t __kmp_malloc_pool_incr = KMP_DEFAULT_MALLOC_POOL_INCR;
82 kmp_uint32 __kmp_barrier_gather_bb_dflt = 2;
84 kmp_uint32 __kmp_barrier_release_bb_dflt = 2;
87 kmp_uint32 __kmp_barrier_gather_bb_dflt = 2;
89 kmp_uint32 __kmp_barrier_release_bb_dflt = 2;
91 #endif // KMP_ARCH_X86_64 93 kmp_bar_pat_e __kmp_barrier_gather_pat_dflt = bp_hyper_bar;
94 kmp_bar_pat_e __kmp_barrier_release_pat_dflt =
97 kmp_bar_pat_e __kmp_barrier_gather_pat_dflt = bp_linear_bar;
98 kmp_bar_pat_e __kmp_barrier_release_pat_dflt = bp_linear_bar;
100 kmp_uint32 __kmp_barrier_gather_branch_bits[bs_last_barrier] = {0};
101 kmp_uint32 __kmp_barrier_release_branch_bits[bs_last_barrier] = {0};
102 kmp_bar_pat_e __kmp_barrier_gather_pattern[bs_last_barrier] = {bp_linear_bar};
103 kmp_bar_pat_e __kmp_barrier_release_pattern[bs_last_barrier] = {bp_linear_bar};
104 char const *__kmp_barrier_branch_bit_env_name[bs_last_barrier] = {
105 "KMP_PLAIN_BARRIER",
"KMP_FORKJOIN_BARRIER" 106 #if KMP_FAST_REDUCTION_BARRIER 108 "KMP_REDUCTION_BARRIER" 109 #endif // KMP_FAST_REDUCTION_BARRIER 111 char const *__kmp_barrier_pattern_env_name[bs_last_barrier] = {
112 "KMP_PLAIN_BARRIER_PATTERN",
"KMP_FORKJOIN_BARRIER_PATTERN" 113 #if KMP_FAST_REDUCTION_BARRIER 115 "KMP_REDUCTION_BARRIER_PATTERN" 116 #endif // KMP_FAST_REDUCTION_BARRIER 118 char const *__kmp_barrier_type_name[bs_last_barrier] = {
"plain",
"forkjoin" 119 #if KMP_FAST_REDUCTION_BARRIER 122 #endif // KMP_FAST_REDUCTION_BARRIER 124 char const *__kmp_barrier_pattern_name[bp_last_bar] = {
"linear",
"tree",
125 "hyper",
"hierarchical"};
/* General runtime settings and limits. Most start at 0 / FALSE; the
 * exceptions are seeded from named constants (CACHE_LINE, kmp_warnings_low,
 * KMP_MIN_STKSIZE, KMP_MAX_NTH, KMP_DFLT_DISP_NUM_BUFF,
 * KMP_MAX_ACTIVE_LEVELS_LIMIT). */
127 int __kmp_allThreadsSpecified = 0;
128 size_t __kmp_align_alloc = CACHE_LINE;
131 int __kmp_generate_warnings = kmp_warnings_low;
132 int __kmp_reserve_warn = 0;
134 int __kmp_avail_proc = 0;
135 size_t __kmp_sys_min_stksize = KMP_MIN_STKSIZE;
136 int __kmp_sys_max_nth = KMP_MAX_NTH;
/* NOTE(review): the zero-initialized values below are presumably filled in
 * later during runtime start-up -- confirm where they are assigned. */
137 int __kmp_max_nth = 0;
138 int __kmp_threads_capacity = 0;
139 int __kmp_dflt_team_nth = 0;
140 int __kmp_dflt_team_nth_ub = 0;
141 int __kmp_tp_capacity = 0;
142 int __kmp_tp_cached = 0;
143 int __kmp_dflt_nested = FALSE;
144 int __kmp_dispatch_num_buffers = KMP_DFLT_DISP_NUM_BUFF;
145 int __kmp_dflt_max_active_levels =
146 KMP_MAX_ACTIVE_LEVELS_LIMIT;
147 #if KMP_NESTED_HOT_TEAMS 148 int __kmp_hot_teams_mode = 0;
150 int __kmp_hot_teams_max_level = 1;
152 enum library_type __kmp_library = library_none;
156 kmp_sch_static_greedy;
158 kmp_sch_guided_iterative_chunked;
160 kmp_sch_guided_analytical_chunked;
161 int __kmp_dflt_blocktime = KMP_DEFAULT_BLOCKTIME;
163 int __kmp_monitor_wakeups = KMP_MIN_MONITOR_WAKEUPS;
164 int __kmp_bt_intervals = KMP_INTERVALS_FROM_BLOCKTIME(KMP_DEFAULT_BLOCKTIME,
165 KMP_MIN_MONITOR_WAKEUPS);
167 #ifdef KMP_ADJUST_BLOCKTIME 168 int __kmp_zero_bt = FALSE;
170 #ifdef KMP_DFLT_NTH_CORES 171 int __kmp_ncores = 0;
174 int __kmp_abort_delay = 0;
175 #if KMP_OS_LINUX && defined(KMP_TDATA_GTID) 176 int __kmp_gtid_mode = 3;
177 int __kmp_adjust_gtid_mode = FALSE;
179 int __kmp_gtid_mode = 2;
180 int __kmp_adjust_gtid_mode = FALSE;
182 int __kmp_gtid_mode = 0;
183 int __kmp_adjust_gtid_mode = TRUE;
185 #ifdef KMP_TDATA_GTID 187 __declspec(thread)
int __kmp_gtid = KMP_GTID_DNE;
189 __thread
int __kmp_gtid = KMP_GTID_DNE;
193 int __kmp_tls_gtid_min = INT_MAX;
194 int __kmp_foreign_tp = TRUE;
195 #if KMP_ARCH_X86 || KMP_ARCH_X86_64 196 int __kmp_inherit_fp_control = TRUE;
197 kmp_int16 __kmp_init_x87_fpu_control_word = 0;
198 kmp_uint32 __kmp_init_mxcsr = 0;
201 #ifdef USE_LOAD_BALANCE 202 double __kmp_load_balance_interval = 1.0;
205 kmp_nested_nthreads_t __kmp_nested_nth = {NULL, 0, 0};
207 #if KMP_USE_ADAPTIVE_LOCKS 209 kmp_adaptive_backoff_params_t __kmp_adaptive_backoff_params = {
212 #if KMP_DEBUG_ADAPTIVE_LOCKS 213 char *__kmp_speculative_statsfile =
"-";
216 #endif // KMP_USE_ADAPTIVE_LOCKS 219 int __kmp_display_env = FALSE;
220 int __kmp_display_env_verbose = FALSE;
221 int __kmp_omp_cancellation = FALSE;
225 enum sched_type __kmp_sch_map[kmp_sched_upper - kmp_sched_lower_ext +
226 kmp_sched_upper_std - kmp_sched_lower - 2] = {
227 kmp_sch_static_chunked,
228 kmp_sch_dynamic_chunked,
237 enum clock_function_type __kmp_clock_function;
238 int __kmp_clock_function_param;
241 #if KMP_MIC_SUPPORTED 242 enum mic_type __kmp_mic_type = non_mic;
245 #if KMP_AFFINITY_SUPPORTED 247 KMPAffinity *__kmp_affinity_dispatch = NULL;
250 int __kmp_hwloc_error = FALSE;
251 hwloc_topology_t __kmp_hwloc_topology = NULL;
255 #if KMP_GROUP_AFFINITY 256 int __kmp_num_proc_groups = 1;
258 kmp_GetActiveProcessorCount_t __kmp_GetActiveProcessorCount = NULL;
259 kmp_GetActiveProcessorGroupCount_t __kmp_GetActiveProcessorGroupCount = NULL;
260 kmp_GetThreadGroupAffinity_t __kmp_GetThreadGroupAffinity = NULL;
261 kmp_SetThreadGroupAffinity_t __kmp_SetThreadGroupAffinity = NULL;
/* Affinity configuration state. The enum-typed settings start at their
 * *_default enumerators, pointers start NULL, and counts/offsets start at 0.
 * __kmp_affinity_gran_levels starts at -1, while __kmp_affinity_dups and
 * __kmp_affinity_warnings start TRUE.
 * NOTE(review): -1 for gran_levels looks like a "not yet computed" sentinel
 * -- confirm against the code that consumes it. */
264 size_t __kmp_affin_mask_size = 0;
265 enum affinity_type __kmp_affinity_type = affinity_default;
266 enum affinity_gran __kmp_affinity_gran = affinity_gran_default;
267 int __kmp_affinity_gran_levels = -1;
268 int __kmp_affinity_dups = TRUE;
269 enum affinity_top_method __kmp_affinity_top_method =
270 affinity_top_method_default;
271 int __kmp_affinity_compact = 0;
272 int __kmp_affinity_offset = 0;
273 int __kmp_affinity_verbose = FALSE;
274 int __kmp_affinity_warnings = TRUE;
275 int __kmp_affinity_respect_mask = affinity_respect_mask_default;
276 char *__kmp_affinity_proclist = NULL;
277 kmp_affin_mask_t *__kmp_affinity_masks = NULL;
278 unsigned __kmp_affinity_num_masks = 0;
280 char const *__kmp_cpuinfo_file = NULL;
285 kmp_nested_proc_bind_t __kmp_nested_proc_bind = {NULL, 0, 0};
286 int __kmp_affinity_num_places = 0;
/* One kmp_hws_item_t per level (socket, node, tile, core, proc), each
 * initialized to {0, 0}, followed by two int flags that start at 0.
 * NOTE(review): the meaning of the two kmp_hws_item_t fields is defined with
 * the type, not here -- check its declaration before relying on field order. */
289 kmp_hws_item_t __kmp_hws_socket = {0, 0};
290 kmp_hws_item_t __kmp_hws_node = {0, 0};
291 kmp_hws_item_t __kmp_hws_tile = {0, 0};
292 kmp_hws_item_t __kmp_hws_core = {0, 0};
293 kmp_hws_item_t __kmp_hws_proc = {0, 0};
294 int __kmp_hws_requested = 0;
295 int __kmp_hws_abs_flag = 0;
298 kmp_int32 __kmp_default_device = 0;
301 kmp_tasking_mode_t __kmp_tasking_mode = tskm_task_teams;
303 kmp_int32 __kmp_max_task_priority = 0;
304 kmp_uint64 __kmp_taskloop_min_tasks = 0;
312 KMP_BUILD_ASSERT(
sizeof(kmp_tasking_flags_t) == 4);
314 kmp_int32 __kmp_task_stealing_constraint =
318 int __kmp_suspend_count = 0;
321 int __kmp_settings = FALSE;
322 int __kmp_duplicate_library_ok = 0;
324 int __kmp_forkjoin_frames = 1;
325 int __kmp_forkjoin_frames_mode = 3;
327 PACKED_REDUCTION_METHOD_T __kmp_force_reduction_method =
328 reduction_method_not_defined;
329 int __kmp_determ_red = FALSE;
342 int __kmp_debug_buf =
344 int __kmp_debug_buf_lines =
345 KMP_DEBUG_BUF_LINES_INIT;
346 int __kmp_debug_buf_chars =
347 KMP_DEBUG_BUF_CHARS_INIT;
348 int __kmp_debug_buf_atomic =
351 char *__kmp_debug_buffer = NULL;
352 int __kmp_debug_count =
354 int __kmp_debug_buf_warn_chars =
361 char __kmp_par_range_routine[KMP_PAR_RANGE_ROUTINE_LEN] = {
'\0'};
362 char __kmp_par_range_filename[KMP_PAR_RANGE_FILENAME_LEN] = {
'\0'};
363 int __kmp_par_range_lb = 0;
364 int __kmp_par_range_ub = INT_MAX;
368 int __kmp_storage_map =
370 int __kmp_storage_map_verbose =
372 int __kmp_storage_map_verbose_specified = FALSE;
375 int __kmp_need_register_atfork =
377 int __kmp_need_register_atfork_specified = TRUE;
379 int __kmp_env_chunk = FALSE;
380 int __kmp_env_stksize = FALSE;
381 int __kmp_env_omp_stksize = FALSE;
382 int __kmp_env_all_threads =
384 int __kmp_env_omp_all_threads = FALSE;
385 int __kmp_env_blocktime = FALSE;
386 int __kmp_env_checks = FALSE;
387 int __kmp_env_consistency_check = FALSE;
/* Yield tunables: the init/next values come from KMP_INIT_WAIT and
 * KMP_NEXT_WAIT, and __kmp_yielding_on starts at 1. */
389 kmp_uint32 __kmp_yield_init = KMP_INIT_WAIT;
390 kmp_uint32 __kmp_yield_next = KMP_NEXT_WAIT;
393 kmp_uint32 __kmp_yielding_on = 1;
/* NOTE(review): __kmp_yield_cycle is defined twice below (0 and 1). These
 * look like the two arms of a preprocessor conditional whose directives are
 * not visible in this section -- confirm which condition selects each. */
396 kmp_uint32 __kmp_yield_cycle = 0;
398 kmp_uint32 __kmp_yield_cycle = 1;
400 kmp_int32 __kmp_yield_on_count =
402 kmp_int32 __kmp_yield_off_count =
/* Pointer-to-pointer tables of kmp_info_t and kmp_root_t; both start NULL. */
412 kmp_info_t **__kmp_threads = NULL;
413 kmp_root_t **__kmp_root = NULL;
/* Thread counts, all starting at 0. __kmp_nth and __kmp_all_nth are
 * volatile; __kmp_thread_pool_nth is not. */
417 volatile int __kmp_nth = 0;
418 volatile int __kmp_all_nth = 0;
419 int __kmp_thread_pool_nth = 0;
/* Pool head pointers, initially NULL. As written, `volatile` qualifies the
 * pointed-to kmp_info_t / kmp_team_t, not the pointer variable itself. */
420 volatile kmp_info_t *__kmp_thread_pool = NULL;
421 volatile kmp_team_t *__kmp_team_pool = NULL;
424 volatile int __kmp_thread_pool_active_nth = 0;
/* Aggregate global state, zero-initialized via nested braces. */
429 kmp_global_t __kmp_global = {{0}};
435 #if KMP_USE_INTERNODE_ALIGNMENT 438 KMP_ALIGN_CACHE_INTERNODE
440 kmp_bootstrap_lock_t __kmp_initz_lock = KMP_BOOTSTRAP_LOCK_INITIALIZER(
442 KMP_ALIGN_CACHE_INTERNODE
443 kmp_bootstrap_lock_t __kmp_forkjoin_lock;
444 KMP_ALIGN_CACHE_INTERNODE
445 kmp_bootstrap_lock_t __kmp_exit_lock;
447 KMP_ALIGN_CACHE_INTERNODE
448 kmp_bootstrap_lock_t __kmp_monitor_lock;
452 KMP_ALIGN_CACHE_INTERNODE
453 kmp_bootstrap_lock_t __kmp_tp_cached_lock;
455 KMP_ALIGN_CACHE_INTERNODE
456 kmp_lock_t __kmp_global_lock;
457 KMP_ALIGN_CACHE_INTERNODE
458 kmp_queuing_lock_t __kmp_dispatch_lock;
459 KMP_ALIGN_CACHE_INTERNODE
460 kmp_lock_t __kmp_debug_lock;
464 kmp_bootstrap_lock_t __kmp_initz_lock = KMP_BOOTSTRAP_LOCK_INITIALIZER(
/* Global lock objects, defined here without explicit initializers and
 * without an alignment macro. The same names are also defined earlier in the
 * file with KMP_ALIGN_CACHE_INTERNODE.
 * NOTE(review): these look like the two arms of a conditional on
 * KMP_USE_INTERNODE_ALIGNMENT -- confirm. Also verify where the locks are
 * initialized before first use. */
466 kmp_bootstrap_lock_t __kmp_forkjoin_lock;
467 kmp_bootstrap_lock_t __kmp_exit_lock;
469 kmp_bootstrap_lock_t __kmp_monitor_lock;
473 kmp_bootstrap_lock_t __kmp_tp_cached_lock;
476 kmp_lock_t __kmp_global_lock;
478 kmp_queuing_lock_t __kmp_dispatch_lock;
480 kmp_lock_t __kmp_debug_lock;
485 #if KMP_HANDLE_SIGNALS 505 int __kmp_handle_signals = FALSE;
510 kmp_key_t __kmp_tv_key = 0;
516 int get_suspend_count_(
void) {
517 int count = __kmp_suspend_count;
518 __kmp_suspend_count = 0;
521 void set_suspend_count_(
int *value) { __kmp_suspend_count = *value; }
/* Externally visible int symbols, both set to 1, whose names spell out a
 * link-time requirement.
 * NOTE(review): presumably these exist so that linking two OpenMP runtimes
 * (or the wrong one) yields a duplicate / unresolved symbol error with a
 * self-explanatory name -- confirm the intended mechanism. */
525 int _You_must_link_with_exactly_one_OpenMP_library = 1;
526 int _You_must_link_with_Intel_OpenMP_library = 1;
527 #if KMP_OS_WINDOWS && (KMP_VERSION_MAJOR > 4) 528 int _You_must_link_with_Microsoft_OpenMP_library = 1;