14 #include "kmp_affinity.h"
15 #if KMP_USE_HIER_SCHED
16 #include "kmp_dispatch_hier.h"
// Global key object of type kmp_key_t, default-initialized here.
// NOTE(review): presumably the thread-specific-storage key used to find a
// thread's gtid — confirm against its users.
19 kmp_key_t __kmp_gtid_threadprivate_key;
21 #if KMP_ARCH_X86 || KMP_ARCH_X86_64
// CPU information record, zero-initialized. Guarded by the x86 / x86_64 check
// above (the matching #endif is not visible in this excerpt).
22 kmp_cpuinfo_t __kmp_cpuinfo = {0};
26 #include "kmp_stats.h"
// Statistics support: a test-and-set lock object, a pointer to a
// kmp_stats_list, a per-thread (KMP_THREAD_LOCAL) pointer that starts NULL, and
// a tsc_tick_count start-time object.
28 kmp_tas_lock_t __kmp_stats_lock;
32 kmp_stats_list *__kmp_stats_list;
35 KMP_THREAD_LOCAL kmp_stats_list *__kmp_stats_thread_ptr = NULL;
38 tsc_tick_count __kmp_stats_start_time;
// Runtime initialization-state flags, all declared `volatile int`. Every flag
// with a visible initializer starts FALSE, except __kmp_need_register_serial,
// which starts TRUE.
44 volatile int __kmp_init_serial = FALSE;
45 volatile int __kmp_init_gtid = FALSE;
46 volatile int __kmp_init_common = FALSE;
47 volatile int __kmp_need_register_serial = TRUE;
48 volatile int __kmp_init_middle = FALSE;
49 volatile int __kmp_init_parallel = FALSE;
50 volatile int __kmp_init_hidden_helper = FALSE;
51 volatile int __kmp_init_hidden_helper_threads = FALSE;
52 volatile int __kmp_hidden_helper_team_done = FALSE;
// NOTE(review): the initializer of __kmp_init_monitor is not visible in this
// excerpt; the statement continues on lines that are not shown.
54 volatile int __kmp_init_monitor =
57 volatile int __kmp_init_user_locks = FALSE;
// Pointer to a kmp_cached_addr_t; starts NULL.
60 kmp_cached_addr_t *__kmp_threadpriv_cache_list = NULL;
// Plain int globals, all starting at 0.
62 int __kmp_init_counter = 0;
63 int __kmp_root_counter = 0;
64 int __kmp_version = 0;
// Atomic 32-bit counters, both starting at 0.
66 std::atomic<kmp_int32> __kmp_team_counter = 0;
67 std::atomic<kmp_int32> __kmp_task_counter = 0;
// Stack-related settings seeded from the KMP_DEFAULT_* / KMP_MIN_* macros;
// the monitor stack size starts at 0.
69 size_t __kmp_stksize = KMP_DEFAULT_STKSIZE;
71 size_t __kmp_monitor_stksize = 0;
73 size_t __kmp_stkoffset = KMP_DEFAULT_STKOFFSET;
74 int __kmp_stkpadding = KMP_MIN_STKPADDING;
// Seeded from KMP_DEFAULT_MALLOC_POOL_INCR.
76 size_t __kmp_malloc_pool_incr = KMP_DEFAULT_MALLOC_POOL_INCR;
// Barrier defaults: gather and release branch bits both default to 2, and the
// gather and release patterns both default to bp_hyper_bar.
80 kmp_uint32 __kmp_barrier_gather_bb_dflt = 2;
82 kmp_uint32 __kmp_barrier_release_bb_dflt = 2;
85 kmp_bar_pat_e __kmp_barrier_gather_pat_dflt = bp_hyper_bar;
87 kmp_bar_pat_e __kmp_barrier_release_pat_dflt = bp_hyper_bar;
// Per-barrier-type tables, each with bs_last_barrier entries. `{0}` zeroes
// every element. `{bp_linear_bar}` sets only element 0 explicitly; the
// remaining elements are value-initialized.
90 kmp_uint32 __kmp_barrier_gather_branch_bits[bs_last_barrier] = {0};
91 kmp_uint32 __kmp_barrier_release_branch_bits[bs_last_barrier] = {0};
92 kmp_bar_pat_e __kmp_barrier_gather_pattern[bs_last_barrier] = {bp_linear_bar};
93 kmp_bar_pat_e __kmp_barrier_release_pattern[bs_last_barrier] = {bp_linear_bar};
// String tables with bs_last_barrier entries each. The reduction-barrier entry
// appears after `#if KMP_FAST_REDUCTION_BARRIER`.
// NOTE(review): the closing `};` / #endif lines of these three tables are not
// visible in this excerpt.
94 char const *__kmp_barrier_branch_bit_env_name[bs_last_barrier] = {
95 "KMP_PLAIN_BARRIER",
"KMP_FORKJOIN_BARRIER"
96 #if KMP_FAST_REDUCTION_BARRIER
98 "KMP_REDUCTION_BARRIER"
101 char const *__kmp_barrier_pattern_env_name[bs_last_barrier] = {
102 "KMP_PLAIN_BARRIER_PATTERN",
"KMP_FORKJOIN_BARRIER_PATTERN"
103 #if KMP_FAST_REDUCTION_BARRIER
105 "KMP_REDUCTION_BARRIER_PATTERN"
108 char const *__kmp_barrier_type_name[bs_last_barrier] = {
"plain",
"forkjoin"
109 #if KMP_FAST_REDUCTION_BARRIER
// Names for the barrier patterns, bp_last_bar entries in this order: linear,
// tree, hyper, hierarchical, dist.
114 char const *__kmp_barrier_pattern_name[bp_last_bar] = {
115 "linear",
"tree",
"hyper",
"hierarchical",
"dist"};
// Miscellaneous defaults: allocation alignment is CACHE_LINE and the warning
// level starts at kmp_warnings_low.
117 int __kmp_allThreadsSpecified = 0;
118 size_t __kmp_align_alloc = CACHE_LINE;
120 int __kmp_generate_warnings = kmp_warnings_low;
121 int __kmp_reserve_warn = 0;
// Processor / thread-count settings. Only the two "sys" values have non-zero
// initial values (KMP_MIN_STKSIZE and KMP_MAX_NTH); the rest start at 0.
123 int __kmp_avail_proc = 0;
124 size_t __kmp_sys_min_stksize = KMP_MIN_STKSIZE;
125 int __kmp_sys_max_nth = KMP_MAX_NTH;
126 int __kmp_max_nth = 0;
127 int __kmp_cg_max_nth = 0;
128 int __kmp_task_max_nth = 0;
129 int __kmp_teams_max_nth = 0;
130 int __kmp_threads_capacity = 0;
131 int __kmp_dflt_team_nth = 0;
132 int __kmp_dflt_team_nth_ub = 0;
133 int __kmp_tp_capacity = 0;
134 int __kmp_tp_cached = 0;
135 int __kmp_dispatch_num_buffers = KMP_DFLT_DISP_NUM_BUFF;
// Default max-active-levels value is 1; the companion "_set" flag starts false.
136 int __kmp_dflt_max_active_levels = 1;
137 bool __kmp_dflt_max_active_levels_set =
false;
// Hot-team settings follow `#if KMP_NESTED_HOT_TEAMS` (matching #endif not
// visible in this excerpt).
138 #if KMP_NESTED_HOT_TEAMS
139 int __kmp_hot_teams_mode = 0;
141 int __kmp_hot_teams_max_level = 1;
// Library mode starts as library_none.
143 enum library_type __kmp_library = library_none;
// NOTE(review): the next three lines are only the trailing initializer parts of
// three declarations whose first lines are not visible in this excerpt.
147 kmp_sch_static_greedy;
149 kmp_sch_guided_iterative_chunked;
151 kmp_sch_guided_analytical_chunked;
// Hierarchical-scheduling state follows `#if KMP_USE_HIER_SCHED`. The two int
// arrays have kmp_hier_layer_e::LAYER_LAST + 1 entries and no explicit
// initializer.
152 #if KMP_USE_HIER_SCHED
153 int __kmp_dispatch_hand_threading = 0;
154 int __kmp_hier_max_units[kmp_hier_layer_e::LAYER_LAST + 1];
155 int __kmp_hier_threads_per[kmp_hier_layer_e::LAYER_LAST + 1];
156 kmp_hier_sched_env_t __kmp_hier_scheds = {0, 0, NULL, NULL, NULL};
// Blocktime defaults: value from KMP_DEFAULT_BLOCKTIME, units character 'm',
// passive wait policy off.
158 int __kmp_dflt_blocktime = KMP_DEFAULT_BLOCKTIME;
159 char __kmp_blocktime_units =
'm';
160 bool __kmp_wpolicy_passive =
false;
// Monitor wakeups start at KMP_MIN_MONITOR_WAKEUPS; the interval count is
// derived from the default blocktime and that same minimum via
// KMP_INTERVALS_FROM_BLOCKTIME.
162 int __kmp_monitor_wakeups = KMP_MIN_MONITOR_WAKEUPS;
163 int __kmp_bt_intervals = KMP_INTERVALS_FROM_BLOCKTIME(KMP_DEFAULT_BLOCKTIME,
164 KMP_MIN_MONITOR_WAKEUPS);
166 #ifdef KMP_ADJUST_BLOCKTIME
167 int __kmp_zero_bt = FALSE;
169 #ifdef KMP_DFLT_NTH_CORES
170 int __kmp_ncores = 0;
173 int __kmp_force_monotonic = 0;
174 int __kmp_abort_delay = 0;
// Three alternative definitions of the (__kmp_gtid_mode,
// __kmp_adjust_gtid_mode) pair: (3, FALSE), (2, FALSE) and (0, TRUE). The first
// is selected by the #if below.
// NOTE(review): the #elif / #else / #endif lines separating the alternatives
// are not visible in this excerpt.
175 #if (KMP_OS_LINUX || KMP_OS_AIX || KMP_OS_SOLARIS) && defined(KMP_TDATA_GTID)
176 int __kmp_gtid_mode = 3;
177 int __kmp_adjust_gtid_mode = FALSE;
179 int __kmp_gtid_mode = 2;
180 int __kmp_adjust_gtid_mode = FALSE;
182 int __kmp_gtid_mode = 0;
183 int __kmp_adjust_gtid_mode = TRUE;
// Thread-local gtid, initialized to KMP_GTID_DNE; follows
// `#ifdef KMP_TDATA_GTID`.
185 #ifdef KMP_TDATA_GTID
186 KMP_THREAD_LOCAL
int __kmp_gtid = KMP_GTID_DNE;
188 int __kmp_tls_gtid_min = INT_MAX;
189 int __kmp_foreign_tp = TRUE;
// x86 / x86_64 floating-point control state: inheritance flag starts TRUE, the
// saved x87 control word and MXCSR values start at 0.
190 #if KMP_ARCH_X86 || KMP_ARCH_X86_64
191 int __kmp_inherit_fp_control = TRUE;
192 kmp_int16 __kmp_init_x87_fpu_control_word = 0;
193 kmp_uint32 __kmp_init_mxcsr = 0;
// Load-balance interval defaults to 1.0; follows `#ifdef USE_LOAD_BALANCE`.
196 #ifdef USE_LOAD_BALANCE
197 double __kmp_load_balance_interval = 1.0;
// Nested thread-count record initialized to {NULL, 0, 0}.
200 kmp_nested_nthreads_t __kmp_nested_nth = {NULL, 0, 0};
202 #if KMP_USE_ADAPTIVE_LOCKS
// NOTE(review): the initializer list of __kmp_adaptive_backoff_params is not
// visible in this excerpt.
204 kmp_adaptive_backoff_params_t __kmp_adaptive_backoff_params = {
207 #if KMP_DEBUG_ADAPTIVE_LOCKS
// Default statistics file name is the string "-".
208 const char *__kmp_speculative_statsfile =
"-";
// Display / cancellation switches start FALSE; team counts start at 0.
213 int __kmp_display_env = FALSE;
214 int __kmp_display_env_verbose = FALSE;
215 int __kmp_omp_cancellation = FALSE;
216 int __kmp_nteams = 0;
217 int __kmp_teams_thread_limit = 0;
// mwait / umwait / tpause settings follow the KMP_HAVE_MWAIT ||
// KMP_HAVE_UMWAIT check. All start disabled (FALSE / 0) except
// __kmp_tpause_hint, which starts at 1.
219 #if KMP_HAVE_MWAIT || KMP_HAVE_UMWAIT
220 int __kmp_user_level_mwait = FALSE;
221 int __kmp_umwait_enabled = FALSE;
222 int __kmp_mwait_enabled = FALSE;
223 int __kmp_mwait_hints = 0;
227 int __kmp_waitpkg_enabled = 0;
228 int __kmp_tpause_state = 0;
229 int __kmp_tpause_hint = 1;
230 int __kmp_tpause_enabled = 0;
// Table of sched_type values whose length is computed from the kmp_sched_*
// range bounds:
//   (kmp_sched_upper - kmp_sched_lower_ext) +
//   (kmp_sched_upper_std - kmp_sched_lower) - 2
// NOTE(review): only the first two entries are visible in this excerpt; the
// remaining entries and the closing `};` are not shown.
234 enum sched_type __kmp_sch_map[kmp_sched_upper - kmp_sched_lower_ext +
235 kmp_sched_upper_std - kmp_sched_lower - 2] = {
236 kmp_sch_static_chunked,
237 kmp_sch_dynamic_chunked,
// MIC type defaults to non_mic; follows `#if KMP_MIC_SUPPORTED`.
245 #if KMP_MIC_SUPPORTED
246 enum mic_type __kmp_mic_type = non_mic;
// Affinity globals follow `#if KMP_AFFINITY_SUPPORTED` (nested conditionals and
// their #endif lines are only partly visible in this excerpt).
249 #if KMP_AFFINITY_SUPPORTED
// Pointer to a KMPAffinity object; starts NULL.
251 KMPAffinity *__kmp_affinity_dispatch = NULL;
// hwloc state: error flag FALSE, topology handle NULL.
254 int __kmp_hwloc_error = FALSE;
255 hwloc_topology_t __kmp_hwloc_topology = NULL;
// Processor-group support follows `#if KMP_GROUP_AFFINITY`: the group count
// starts at 1 and the four function pointers start NULL.
259 #if KMP_GROUP_AFFINITY
260 int __kmp_num_proc_groups = 1;
262 kmp_GetActiveProcessorCount_t __kmp_GetActiveProcessorCount = NULL;
263 kmp_GetActiveProcessorGroupCount_t __kmp_GetActiveProcessorGroupCount = NULL;
264 kmp_GetThreadGroupAffinity_t __kmp_GetThreadGroupAffinity = NULL;
265 kmp_SetThreadGroupAffinity_t __kmp_SetThreadGroupAffinity = NULL;
268 size_t __kmp_affin_mask_size = 0;
269 enum affinity_top_method __kmp_affinity_top_method =
270 affinity_top_method_default;
// Two affinity records built with KMP_AFFINITY_INIT, passing the strings
// "KMP_AFFINITY" and "KMP_HIDDEN_HELPER_AFFINITY", plus an array holding
// pointers to both.
273 kmp_affinity_t __kmp_affinity = KMP_AFFINITY_INIT(
"KMP_AFFINITY");
275 kmp_affinity_t __kmp_hh_affinity =
276 KMP_AFFINITY_INIT(
"KMP_HIDDEN_HELPER_AFFINITY");
277 kmp_affinity_t *__kmp_affinities[] = {&__kmp_affinity, &__kmp_hh_affinity};
279 char *__kmp_cpuinfo_file = NULL;
280 #if KMP_WEIGHTED_ITERATIONS_SUPPORTED
// Starts at -1.
281 int __kmp_first_osid_with_ecore = -1;
// Proc-bind settings: nested list {NULL, 0, 0}; teams binding defaults to
// proc_bind_spread.
286 kmp_nested_proc_bind_t __kmp_nested_proc_bind = {NULL, 0, 0};
287 kmp_proc_bind_t __kmp_teams_proc_bind = proc_bind_spread;
288 int __kmp_affinity_num_places = 0;
289 int __kmp_display_affinity = FALSE;
290 char *__kmp_affinity_format = NULL;
// Default device number starts at 0.
292 kmp_int32 __kmp_default_device = 0;
// Tasking defaults: mode tskm_task_teams, max task priority 0, taskloop
// minimum task count 0.
294 kmp_tasking_mode_t __kmp_tasking_mode = tskm_task_teams;
295 kmp_int32 __kmp_max_task_priority = 0;
296 kmp_uint64 __kmp_taskloop_min_tasks = 0;
// Availability flags for memkind and hwloc; both start off (0 / false).
298 int __kmp_memkind_available = 0;
299 bool __kmp_hwloc_available =
false;
// Predefined allocator handles. Each is a const omp_allocator_handle_t holding
// a small integer cast to the handle type:
//   omp_null_allocator              NULL
//   omp_default_mem_alloc ..
//   omp_thread_mem_alloc            1 .. 8
//   llvm_omp_target_{host,shared,
//                    device}_mem_alloc  100 .. 102
//   kmp_max_mem_alloc               1024
300 omp_allocator_handle_t
const omp_null_allocator = NULL;
301 omp_allocator_handle_t
const omp_default_mem_alloc =
302 (omp_allocator_handle_t
const)1;
303 omp_allocator_handle_t
const omp_large_cap_mem_alloc =
304 (omp_allocator_handle_t
const)2;
305 omp_allocator_handle_t
const omp_const_mem_alloc =
306 (omp_allocator_handle_t
const)3;
307 omp_allocator_handle_t
const omp_high_bw_mem_alloc =
308 (omp_allocator_handle_t
const)4;
309 omp_allocator_handle_t
const omp_low_lat_mem_alloc =
310 (omp_allocator_handle_t
const)5;
311 omp_allocator_handle_t
const omp_cgroup_mem_alloc =
312 (omp_allocator_handle_t
const)6;
313 omp_allocator_handle_t
const omp_pteam_mem_alloc =
314 (omp_allocator_handle_t
const)7;
315 omp_allocator_handle_t
const omp_thread_mem_alloc =
316 (omp_allocator_handle_t
const)8;
317 omp_allocator_handle_t
const llvm_omp_target_host_mem_alloc =
318 (omp_allocator_handle_t
const)100;
319 omp_allocator_handle_t
const llvm_omp_target_shared_mem_alloc =
320 (omp_allocator_handle_t
const)101;
321 omp_allocator_handle_t
const llvm_omp_target_device_mem_alloc =
322 (omp_allocator_handle_t
const)102;
323 omp_allocator_handle_t
const kmp_max_mem_alloc =
324 (omp_allocator_handle_t
const)1024;
// The (non-const) current default allocator starts as omp_default_mem_alloc.
325 omp_allocator_handle_t __kmp_def_allocator = omp_default_mem_alloc;
// Predefined memory-space handles. Each is a const omp_memspace_handle_t
// holding a small integer cast to the handle type:
//   omp_null_mem_space              0
//   omp_default_mem_space           99
//   omp_large_cap_mem_space ..
//   omp_low_lat_mem_space           1 .. 4
//   llvm_omp_target_{host,shared,
//                    device}_mem_space  100 .. 102
//   kmp_max_mem_space               1024
327 omp_memspace_handle_t
const omp_null_mem_space = (omp_memspace_handle_t
const)0;
328 omp_memspace_handle_t
const omp_default_mem_space =
329 (omp_memspace_handle_t
const)99;
330 omp_memspace_handle_t
const omp_large_cap_mem_space =
331 (omp_memspace_handle_t
const)1;
332 omp_memspace_handle_t
const omp_const_mem_space =
333 (omp_memspace_handle_t
const)2;
334 omp_memspace_handle_t
const omp_high_bw_mem_space =
335 (omp_memspace_handle_t
const)3;
336 omp_memspace_handle_t
const omp_low_lat_mem_space =
337 (omp_memspace_handle_t
const)4;
338 omp_memspace_handle_t
const llvm_omp_target_host_mem_space =
339 (omp_memspace_handle_t
const)100;
340 omp_memspace_handle_t
const llvm_omp_target_shared_mem_space =
341 (omp_memspace_handle_t
const)101;
342 omp_memspace_handle_t
const llvm_omp_target_device_mem_space =
343 (omp_memspace_handle_t
const)102;
344 omp_memspace_handle_t
const kmp_max_mem_space =
345 (omp_memspace_handle_t
const)1024;
// Build-time check that kmp_tasking_flags_t occupies exactly 4 bytes.
352 KMP_BUILD_ASSERT(
sizeof(kmp_tasking_flags_t) == 4);
// Task stealing constraint and task throttling both start enabled (1).
354 int __kmp_task_stealing_constraint = 1;
355 int __kmp_enable_task_throttling = 1;
// Read-and-reset by get_suspend_count_() and written by set_suspend_count_(),
// both defined later in this file.
358 int __kmp_suspend_count = 0;
361 int __kmp_settings = FALSE;
362 int __kmp_duplicate_library_ok = 0;
// Fork/join frame settings start at 1 and mode 3.
364 int __kmp_forkjoin_frames = 1;
365 int __kmp_forkjoin_frames_mode = 3;
// No reduction method is forced initially (reduction_method_not_defined).
367 PACKED_REDUCTION_METHOD_T __kmp_force_reduction_method =
368 reduction_method_not_defined;
369 int __kmp_determ_red = FALSE;
// Debug-buffer settings.
// NOTE(review): the initializers of __kmp_debug_buf, __kmp_debug_buf_atomic,
// __kmp_debug_count and __kmp_debug_buf_warn_chars are not visible in this
// excerpt; only the line/char limits (KMP_DEBUG_BUF_LINES_INIT /
// KMP_DEBUG_BUF_CHARS_INIT) and the NULL buffer pointer can be read here.
382 int __kmp_debug_buf =
384 int __kmp_debug_buf_lines =
385 KMP_DEBUG_BUF_LINES_INIT;
386 int __kmp_debug_buf_chars =
387 KMP_DEBUG_BUF_CHARS_INIT;
388 int __kmp_debug_buf_atomic =
391 char *__kmp_debug_buffer = NULL;
392 std::atomic<int> __kmp_debug_count =
394 int __kmp_debug_buf_warn_chars =
// Par-range filter: routine and filename buffers start as empty strings, and
// the bounds start as [0, INT_MAX].
401 char __kmp_par_range_routine[KMP_PAR_RANGE_ROUTINE_LEN] = {
'\0'};
402 char __kmp_par_range_filename[KMP_PAR_RANGE_FILENAME_LEN] = {
'\0'};
403 int __kmp_par_range_lb = 0;
404 int __kmp_par_range_ub = INT_MAX;
// NOTE(review): the initializers of __kmp_storage_map,
// __kmp_storage_map_verbose and __kmp_need_register_atfork are not visible in
// this excerpt.
408 int __kmp_storage_map =
410 int __kmp_storage_map_verbose =
412 int __kmp_storage_map_verbose_specified = FALSE;
415 int __kmp_need_register_atfork =
417 int __kmp_need_register_atfork_specified = TRUE;
// "env" flags, all starting FALSE.
419 int __kmp_env_stksize = FALSE;
420 int __kmp_env_blocktime = FALSE;
421 int __kmp_env_checks = FALSE;
422 int __kmp_env_consistency_check = FALSE;
// Two alternative defaults for __kmp_use_yield: 0 under the Darwin + AArch64
// check below, and 1 otherwise.
// NOTE(review): the #else / #endif lines are not visible in this excerpt.
428 #if KMP_OS_DARWIN && KMP_ARCH_AARCH64
430 kmp_int32 __kmp_use_yield = 0;
432 kmp_int32 __kmp_use_yield = 1;
436 kmp_int32 __kmp_use_yield_exp_set = 0;
// Yield / pause tuning values seeded from KMP_INIT_WAIT, KMP_NEXT_WAIT and 1.
438 kmp_uint32 __kmp_yield_init = KMP_INIT_WAIT;
439 kmp_uint32 __kmp_yield_next = KMP_NEXT_WAIT;
440 kmp_uint64 __kmp_pause_init = 1;
// Pointer tables / lists for threads, roots and old thread arrays; all start
// NULL.
449 kmp_info_t **__kmp_threads = NULL;
450 kmp_root_t **__kmp_root = NULL;
451 kmp_old_threads_list_t *__kmp_old_threads_list = NULL;
// Volatile thread counts (start 0) and pool head pointers (start NULL).
455 volatile int __kmp_nth = 0;
456 volatile int __kmp_all_nth = 0;
457 volatile kmp_info_t *__kmp_thread_pool = NULL;
458 volatile kmp_team_t *__kmp_team_pool = NULL;
// Atomic int, starts at 0.
461 std::atomic<int> __kmp_thread_pool_active_nth = 0;
// Global object of type kmp_global_t with no explicit initializer.
466 kmp_global_t __kmp_global;
// Lock definitions, given twice. The first set follows
// `#if KMP_USE_INTERNODE_ALIGNMENT` and prefixes each definition with
// KMP_ALIGN_CACHE_INTERNODE; the second set defines the same six locks without
// that prefix.
// NOTE(review): the #else / #endif separating the two sets, and any further
// conditionals around individual locks, are not visible in this excerpt.
472 #if KMP_USE_INTERNODE_ALIGNMENT
475 KMP_ALIGN_CACHE_INTERNODE
477 KMP_BOOTSTRAP_LOCK_INIT(__kmp_initz_lock);
478 KMP_ALIGN_CACHE_INTERNODE
479 KMP_BOOTSTRAP_LOCK_INIT(__kmp_forkjoin_lock);
480 KMP_ALIGN_CACHE_INTERNODE
481 KMP_BOOTSTRAP_LOCK_INIT(__kmp_exit_lock);
484 KMP_ALIGN_CACHE_INTERNODE
485 KMP_BOOTSTRAP_LOCK_INIT(__kmp_monitor_lock);
489 KMP_ALIGN_CACHE_INTERNODE
490 KMP_BOOTSTRAP_LOCK_INIT(__kmp_tp_cached_lock);
492 KMP_ALIGN_CACHE_INTERNODE
// The global lock uses KMP_LOCK_INIT rather than KMP_BOOTSTRAP_LOCK_INIT.
493 KMP_LOCK_INIT(__kmp_global_lock);
497 KMP_BOOTSTRAP_LOCK_INIT(__kmp_initz_lock);
498 KMP_BOOTSTRAP_LOCK_INIT(__kmp_forkjoin_lock);
499 KMP_BOOTSTRAP_LOCK_INIT(__kmp_exit_lock);
502 KMP_BOOTSTRAP_LOCK_INIT(__kmp_monitor_lock);
506 KMP_BOOTSTRAP_LOCK_INIT(__kmp_tp_cached_lock);
509 KMP_LOCK_INIT(__kmp_global_lock);
514 #if KMP_HANDLE_SIGNALS
// Signal-handling switch; starts FALSE.
// NOTE(review): original lines between the #if and this definition are not
// visible in this excerpt, so it is unclear whether this definition is inside
// the conditional.
534 int __kmp_handle_signals = FALSE;
// Copies the current value of __kmp_suspend_count into a local and then resets
// the global to 0.
// NOTE(review): the function is declared to return int, but its return
// statement and closing brace are not visible in this excerpt — presumably the
// saved `count` is returned; confirm against the full file.
538 int get_suspend_count_(
void) {
539 int count = __kmp_suspend_count;
540 __kmp_suspend_count = 0;
543 void set_suspend_count_(
int *value) { __kmp_suspend_count = *value; }
// Target-offload policy starts as tgt_default.
546 kmp_target_offload_kind_t __kmp_target_offload = tgt_default;
// Pause status starts as kmp_not_paused.
549 kmp_pause_status_t __kmp_pause_status = kmp_not_paused;
// Nesting-mode settings: mode 0, one level; the per-level array pointer has no
// explicit initializer.
552 int __kmp_nesting_mode = 0;
553 int __kmp_nesting_mode_nlevels = 1;
554 int *__kmp_nesting_nth_level;
// Task-dependency-graph (TDG) globals: dot output flag 0, at most 100 TDGs,
// table pointer NULL, TDG count 0, successors size 10, atomic task id 0.
// NOTE(review): the initializer of __kmp_curr_tdg_idx is not visible in this
// excerpt.
558 int __kmp_tdg_dot = 0;
559 kmp_int32 __kmp_max_tdgs = 100;
560 kmp_tdg_info_t **__kmp_global_tdgs = NULL;
561 kmp_int32 __kmp_curr_tdg_idx =
563 kmp_int32 __kmp_num_tdg = 0;
564 kmp_int32 __kmp_successors_size = 10;
566 std::atomic<kmp_int32> __kmp_tdg_task_id = 0;