14 #include "kmp_affinity.h"
15 #if KMP_USE_HIER_SCHED
16 #include "kmp_dispatch_hier.h"
// Key object (type kmp_key_t) named for gtid thread-private storage.
19 kmp_key_t __kmp_gtid_threadprivate_key;
// CPU information record, zero-initialized. It is guarded by an x86 / x86-64
// architecture check.
// NOTE(review): the directive closing this conditional is not visible in this
// excerpt.
21 #if KMP_ARCH_X86 || KMP_ARCH_X86_64
22 kmp_cpuinfo_t __kmp_cpuinfo = {0};
26 #include "kmp_stats.h"
// Statistics globals: a lock, a pointer to a kmp_stats_list, a thread-local
// kmp_stats_list pointer that starts out NULL, and a start-time tick count.
28 kmp_tas_lock_t __kmp_stats_lock;
32 kmp_stats_list *__kmp_stats_list;
35 KMP_THREAD_LOCAL kmp_stats_list *__kmp_stats_thread_ptr = NULL;
38 tsc_tick_count __kmp_stats_start_time;
// Initialization-stage flags. Each is a volatile int that starts out FALSE.
44 volatile int __kmp_init_serial = FALSE;
45 volatile int __kmp_init_gtid = FALSE;
46 volatile int __kmp_init_common = FALSE;
47 volatile int __kmp_init_middle = FALSE;
48 volatile int __kmp_init_parallel = FALSE;
// NOTE(review): the initializer of __kmp_init_monitor is not visible in this
// excerpt.
50 volatile int __kmp_init_monitor =
53 volatile int __kmp_init_user_locks = FALSE;
// Pointer to kmp_cached_addr_t, initially NULL (presumably the head of a list,
// going by its name -- confirm).
56 kmp_cached_addr_t *__kmp_threadpriv_cache_list = NULL;
// Plain int globals that all start at 0.
58 int __kmp_init_counter = 0;
59 int __kmp_root_counter = 0;
60 int __kmp_version = 0;
// Atomic 32-bit counters for teams and tasks, both initialized to 0.
62 std::atomic<kmp_int32> __kmp_team_counter = ATOMIC_VAR_INIT(0);
63 std::atomic<kmp_int32> __kmp_task_counter = ATOMIC_VAR_INIT(0);
// Stack-related settings, initialized from the corresponding KMP_* macros.
// The monitor stack size starts at 0.
65 size_t __kmp_stksize = KMP_DEFAULT_STKSIZE;
67 size_t __kmp_monitor_stksize = 0;
69 size_t __kmp_stkoffset = KMP_DEFAULT_STKOFFSET;
70 int __kmp_stkpadding = KMP_MIN_STKPADDING;
// Malloc pool increment, initialized from KMP_DEFAULT_MALLOC_POOL_INCR.
72 size_t __kmp_malloc_pool_incr = KMP_DEFAULT_MALLOC_POOL_INCR;
// Default barrier branch-bit values for gather and release (both 2).
76 kmp_uint32 __kmp_barrier_gather_bb_dflt = 2;
78 kmp_uint32 __kmp_barrier_release_bb_dflt = 2;
// Default barrier patterns for gather and release (both bp_hyper_bar).
81 kmp_bar_pat_e __kmp_barrier_gather_pat_dflt = bp_hyper_bar;
83 kmp_bar_pat_e __kmp_barrier_release_pat_dflt = bp_hyper_bar;
// Per-barrier-type tables with bs_last_barrier entries. Only the first element
// is given explicitly; the remaining elements are zero-initialized. Whether
// zero equals bp_linear_bar depends on the enum definition, which is not shown
// here.
86 kmp_uint32 __kmp_barrier_gather_branch_bits[bs_last_barrier] = {0};
87 kmp_uint32 __kmp_barrier_release_branch_bits[bs_last_barrier] = {0};
88 kmp_bar_pat_e __kmp_barrier_gather_pattern[bs_last_barrier] = {bp_linear_bar};
89 kmp_bar_pat_e __kmp_barrier_release_pattern[bs_last_barrier] = {bp_linear_bar};
// Name strings for the branch-bit setting of each barrier type. The reduction
// entry is only present when KMP_FAST_REDUCTION_BARRIER is enabled.
// NOTE(review): the end of this initializer list is not visible in this
// excerpt.
90 char const *__kmp_barrier_branch_bit_env_name[bs_last_barrier] = {
91 "KMP_PLAIN_BARRIER",
"KMP_FORKJOIN_BARRIER"
92 #if KMP_FAST_REDUCTION_BARRIER
94 "KMP_REDUCTION_BARRIER"
95 #endif // KMP_FAST_REDUCTION_BARRIER
// Name strings for the pattern setting of each barrier type, laid out like the
// table above.
// NOTE(review): the end of this initializer list is not visible in this
// excerpt.
97 char const *__kmp_barrier_pattern_env_name[bs_last_barrier] = {
98 "KMP_PLAIN_BARRIER_PATTERN",
"KMP_FORKJOIN_BARRIER_PATTERN"
99 #if KMP_FAST_REDUCTION_BARRIER
101 "KMP_REDUCTION_BARRIER_PATTERN"
102 #endif // KMP_FAST_REDUCTION_BARRIER
// Short names of the barrier types.
// NOTE(review): the conditional entry and the end of this initializer list are
// not visible in this excerpt.
104 char const *__kmp_barrier_type_name[bs_last_barrier] = {
"plain",
"forkjoin"
105 #if KMP_FAST_REDUCTION_BARRIER
108 #endif // KMP_FAST_REDUCTION_BARRIER
// Names of the barrier patterns; the table has bp_last_bar entries.
110 char const *__kmp_barrier_pattern_name[bp_last_bar] = {
"linear",
"tree",
111 "hyper",
"hierarchical"};
113 int __kmp_allThreadsSpecified = 0;
// Allocation alignment, initialized to CACHE_LINE.
114 size_t __kmp_align_alloc = CACHE_LINE;
// Warning settings: the warning level starts at kmp_warnings_low.
116 int __kmp_generate_warnings = kmp_warnings_low;
117 int __kmp_reserve_warn = 0;
// Processor count, minimum stack size and thread-count limits. Most start at 0
// and are presumably filled in during runtime initialization -- TODO confirm.
119 int __kmp_avail_proc = 0;
120 size_t __kmp_sys_min_stksize = KMP_MIN_STKSIZE;
121 int __kmp_sys_max_nth = KMP_MAX_NTH;
122 int __kmp_max_nth = 0;
123 int __kmp_cg_max_nth = 0;
124 int __kmp_teams_max_nth = 0;
125 int __kmp_threads_capacity = 0;
126 int __kmp_dflt_team_nth = 0;
127 int __kmp_dflt_team_nth_ub = 0;
128 int __kmp_tp_capacity = 0;
129 int __kmp_tp_cached = 0;
// Number of dispatch buffers, initialized from KMP_DFLT_DISP_NUM_BUFF.
130 int __kmp_dispatch_num_buffers = KMP_DFLT_DISP_NUM_BUFF;
// Default max-active-levels value (1) and a flag, initially false, that
// presumably records whether the value was set explicitly -- confirm.
131 int __kmp_dflt_max_active_levels = 1;
132 bool __kmp_dflt_max_active_levels_set =
false;
// Hot-teams settings, guarded by KMP_NESTED_HOT_TEAMS.
// NOTE(review): the directive closing this conditional is not visible in this
// excerpt.
133 #if KMP_NESTED_HOT_TEAMS
134 int __kmp_hot_teams_mode = 0;
136 int __kmp_hot_teams_max_level = 1;
// Library type, initialized to library_none.
138 enum library_type __kmp_library = library_none;
// NOTE(review): the next three lines are the tails of three initializers whose
// declaration lines are not visible in this excerpt. Only the initial values
// (three kmp_sch_* schedule kinds) can be seen.
142 kmp_sch_static_greedy;
144 kmp_sch_guided_iterative_chunked;
146 kmp_sch_guided_analytical_chunked;
// Hierarchical-scheduling globals, guarded by KMP_USE_HIER_SCHED. The two
// arrays have kmp_hier_layer_e::LAYER_LAST + 1 entries and no explicit
// initializer.
// NOTE(review): the directive closing this conditional is not visible in this
// excerpt.
147 #if KMP_USE_HIER_SCHED
148 int __kmp_dispatch_hand_threading = 0;
149 int __kmp_hier_max_units[kmp_hier_layer_e::LAYER_LAST + 1];
150 int __kmp_hier_threads_per[kmp_hier_layer_e::LAYER_LAST + 1];
151 kmp_hier_sched_env_t __kmp_hier_scheds = {0, 0, NULL, NULL, NULL};
// Blocktime defaults. The interval count is computed by
// KMP_INTERVALS_FROM_BLOCKTIME from the default blocktime and the minimum
// monitor wakeups.
153 int __kmp_dflt_blocktime = KMP_DEFAULT_BLOCKTIME;
155 int __kmp_monitor_wakeups = KMP_MIN_MONITOR_WAKEUPS;
156 int __kmp_bt_intervals = KMP_INTERVALS_FROM_BLOCKTIME(KMP_DEFAULT_BLOCKTIME,
157 KMP_MIN_MONITOR_WAKEUPS);
// NOTE(review): the directives closing the two conditionals below are not
// visible in this excerpt.
159 #ifdef KMP_ADJUST_BLOCKTIME
160 int __kmp_zero_bt = FALSE;
162 #ifdef KMP_DFLT_NTH_CORES
163 int __kmp_ncores = 0;
166 int __kmp_abort_delay = 0;
// Three alternative definitions of __kmp_gtid_mode and __kmp_adjust_gtid_mode
// (mode 3, mode 2, and mode 0 with adjustment enabled). The first alternative
// applies on Linux when KMP_TDATA_GTID is defined.
// NOTE(review): the directives that select the second and third alternatives
// and that close the conditional are not visible in this excerpt.
167 #if KMP_OS_LINUX && defined(KMP_TDATA_GTID)
168 int __kmp_gtid_mode = 3;
169 int __kmp_adjust_gtid_mode = FALSE;
171 int __kmp_gtid_mode = 2;
172 int __kmp_adjust_gtid_mode = FALSE;
174 int __kmp_gtid_mode = 0;
175 int __kmp_adjust_gtid_mode = TRUE;
// Thread-local gtid, initialized to KMP_GTID_DNE; guarded by KMP_TDATA_GTID.
// NOTE(review): the directive closing this conditional is not visible in this
// excerpt.
177 #ifdef KMP_TDATA_GTID
178 KMP_THREAD_LOCAL
int __kmp_gtid = KMP_GTID_DNE;
180 int __kmp_tls_gtid_min = INT_MAX;
181 int __kmp_foreign_tp = TRUE;
// Floating-point control state for x86 / x86-64: the inherit flag starts TRUE,
// and the saved x87 control word and MXCSR values start at 0.
// NOTE(review): the directive closing this conditional is not visible in this
// excerpt.
182 #if KMP_ARCH_X86 || KMP_ARCH_X86_64
183 int __kmp_inherit_fp_control = TRUE;
184 kmp_int16 __kmp_init_x87_fpu_control_word = 0;
185 kmp_uint32 __kmp_init_mxcsr = 0;
// Load-balance interval (1.0), guarded by USE_LOAD_BALANCE. The unit is not
// shown here.
188 #ifdef USE_LOAD_BALANCE
189 double __kmp_load_balance_interval = 1.0;
// Nested thread-count record, initialized to {NULL, 0, 0}.
192 kmp_nested_nthreads_t __kmp_nested_nth = {NULL, 0, 0};
// Adaptive-lock globals, guarded by KMP_USE_ADAPTIVE_LOCKS.
// NOTE(review): the initializer of __kmp_adaptive_backoff_params and the
// directive closing the inner KMP_DEBUG_ADAPTIVE_LOCKS conditional are not
// visible in this excerpt.
194 #if KMP_USE_ADAPTIVE_LOCKS
196 kmp_adaptive_backoff_params_t __kmp_adaptive_backoff_params = {
199 #if KMP_DEBUG_ADAPTIVE_LOCKS
// Statistics file name for speculative locks; the initial value is the
// one-character string shown below.
200 const char *__kmp_speculative_statsfile =
"-";
203 #endif // KMP_USE_ADAPTIVE_LOCKS
// Display-environment and cancellation flags, all initially FALSE.
205 int __kmp_display_env = FALSE;
206 int __kmp_display_env_verbose = FALSE;
207 int __kmp_omp_cancellation = FALSE;
// Schedule-kind map. Its size is computed from the kmp_sched_* bounds.
// NOTE(review): only the first two entries are visible in this excerpt; the
// rest of the initializer list is missing.
210 enum sched_type __kmp_sch_map[kmp_sched_upper - kmp_sched_lower_ext +
211 kmp_sched_upper_std - kmp_sched_lower - 2] = {
212 kmp_sch_static_chunked,
213 kmp_sch_dynamic_chunked,
// Clock function selection and its parameter; neither has an explicit
// initializer.
222 enum clock_function_type __kmp_clock_function;
223 int __kmp_clock_function_param;
// MIC type, initialized to non_mic; guarded by KMP_MIC_SUPPORTED.
// NOTE(review): the directives closing the conditionals in this section are
// not visible in this excerpt, so the exact extent of each guard is unknown.
226 #if KMP_MIC_SUPPORTED
227 enum mic_type __kmp_mic_type = non_mic;
// Affinity globals, guarded by KMP_AFFINITY_SUPPORTED.
230 #if KMP_AFFINITY_SUPPORTED
// Pointer to the KMPAffinity object, initially NULL.
232 KMPAffinity *__kmp_affinity_dispatch = NULL;
// hwloc-related state: error flag, topology handle (initially NULL), NUMA
// detection flag and tile depth.
235 int __kmp_hwloc_error = FALSE;
236 hwloc_topology_t __kmp_hwloc_topology = NULL;
237 int __kmp_numa_detected = FALSE;
238 int __kmp_tile_depth = 0;
// Processor-group support, guarded by KMP_GROUP_AFFINITY: the group count
// starts at 1 and the four function pointers start out NULL.
242 #if KMP_GROUP_AFFINITY
243 int __kmp_num_proc_groups = 1;
245 kmp_GetActiveProcessorCount_t __kmp_GetActiveProcessorCount = NULL;
246 kmp_GetActiveProcessorGroupCount_t __kmp_GetActiveProcessorGroupCount = NULL;
247 kmp_GetThreadGroupAffinity_t __kmp_GetThreadGroupAffinity = NULL;
248 kmp_SetThreadGroupAffinity_t __kmp_SetThreadGroupAffinity = NULL;
// Affinity configuration, set to its *_default enumerators or to neutral
// values (0, -1, NULL, TRUE or FALSE as shown).
251 size_t __kmp_affin_mask_size = 0;
252 enum affinity_type __kmp_affinity_type = affinity_default;
253 enum affinity_gran __kmp_affinity_gran = affinity_gran_default;
254 int __kmp_affinity_gran_levels = -1;
255 int __kmp_affinity_dups = TRUE;
256 enum affinity_top_method __kmp_affinity_top_method =
257 affinity_top_method_default;
258 int __kmp_affinity_compact = 0;
259 int __kmp_affinity_offset = 0;
260 int __kmp_affinity_verbose = FALSE;
261 int __kmp_affinity_warnings = TRUE;
262 int __kmp_affinity_respect_mask = affinity_respect_mask_default;
263 char *__kmp_affinity_proclist = NULL;
264 kmp_affin_mask_t *__kmp_affinity_masks = NULL;
265 unsigned __kmp_affinity_num_masks = 0;
267 char *__kmp_cpuinfo_file = NULL;
// Nested proc-bind record, place count, and affinity display settings.
271 kmp_nested_proc_bind_t __kmp_nested_proc_bind = {NULL, 0, 0};
272 int __kmp_affinity_num_places = 0;
273 int __kmp_display_affinity = FALSE;
274 char *__kmp_affinity_format = NULL;
// Items of type kmp_hws_item_t for socket, node, tile, core and proc, each
// initialized to {0, 0}, followed by two int flags that start at 0.
276 kmp_hws_item_t __kmp_hws_socket = {0, 0};
277 kmp_hws_item_t __kmp_hws_node = {0, 0};
278 kmp_hws_item_t __kmp_hws_tile = {0, 0};
279 kmp_hws_item_t __kmp_hws_core = {0, 0};
280 kmp_hws_item_t __kmp_hws_proc = {0, 0};
281 int __kmp_hws_requested = 0;
282 int __kmp_hws_abs_flag = 0;
// Default device number (0).
284 kmp_int32 __kmp_default_device = 0;
// Tasking mode (initially tskm_task_teams), maximum task priority (0) and
// taskloop minimum task count (0).
286 kmp_tasking_mode_t __kmp_tasking_mode = tskm_task_teams;
287 kmp_int32 __kmp_max_task_priority = 0;
288 kmp_uint64 __kmp_taskloop_min_tasks = 0;
290 int __kmp_memkind_available = 0;
// Allocator handles. Each is a constant handle: omp_null_allocator is NULL,
// the omp_*_mem_alloc handles are the integers 1 through 8 cast to the handle
// type, and kmp_max_mem_alloc is 1024 cast the same way.
291 omp_allocator_handle_t
const omp_null_allocator = NULL;
292 omp_allocator_handle_t
const omp_default_mem_alloc =
293 (omp_allocator_handle_t
const)1;
294 omp_allocator_handle_t
const omp_large_cap_mem_alloc =
295 (omp_allocator_handle_t
const)2;
296 omp_allocator_handle_t
const omp_const_mem_alloc =
297 (omp_allocator_handle_t
const)3;
298 omp_allocator_handle_t
const omp_high_bw_mem_alloc =
299 (omp_allocator_handle_t
const)4;
300 omp_allocator_handle_t
const omp_low_lat_mem_alloc =
301 (omp_allocator_handle_t
const)5;
302 omp_allocator_handle_t
const omp_cgroup_mem_alloc =
303 (omp_allocator_handle_t
const)6;
304 omp_allocator_handle_t
const omp_pteam_mem_alloc =
305 (omp_allocator_handle_t
const)7;
306 omp_allocator_handle_t
const omp_thread_mem_alloc =
307 (omp_allocator_handle_t
const)8;
308 omp_allocator_handle_t
const kmp_max_mem_alloc =
309 (omp_allocator_handle_t
const)1024;
// The default allocator starts out as omp_default_mem_alloc.
310 omp_allocator_handle_t __kmp_def_allocator = omp_default_mem_alloc;
// Memory-space handles: the integers 0 through 4 cast to the handle type.
312 omp_memspace_handle_t
const omp_default_mem_space =
313 (omp_memspace_handle_t
const)0;
314 omp_memspace_handle_t
const omp_large_cap_mem_space =
315 (omp_memspace_handle_t
const)1;
316 omp_memspace_handle_t
const omp_const_mem_space =
317 (omp_memspace_handle_t
const)2;
318 omp_memspace_handle_t
const omp_high_bw_mem_space =
319 (omp_memspace_handle_t
const)3;
320 omp_memspace_handle_t
const omp_low_lat_mem_space =
321 (omp_memspace_handle_t
const)4;
// Build-time check that kmp_tasking_flags_t occupies exactly 4 bytes.
328 KMP_BUILD_ASSERT(
sizeof(kmp_tasking_flags_t) == 4);
// Task stealing constraint and task throttling both start enabled (1).
330 int __kmp_task_stealing_constraint = 1;
331 int __kmp_enable_task_throttling = 1;
// Suspend count, initially 0. It is read and written by get_suspend_count_ and
// set_suspend_count_ elsewhere in this file.
334 int __kmp_suspend_count = 0;
337 int __kmp_settings = FALSE;
338 int __kmp_duplicate_library_ok = 0;
// Fork/join frame settings (enabled, mode 3). The meaning of the mode values
// is not shown here.
340 int __kmp_forkjoin_frames = 1;
341 int __kmp_forkjoin_frames_mode = 3;
// Forced reduction method, initially reduction_method_not_defined, and the
// deterministic-reduction flag, initially FALSE.
343 PACKED_REDUCTION_METHOD_T __kmp_force_reduction_method =
344 reduction_method_not_defined;
345 int __kmp_determ_red = FALSE;
// Debug-buffer globals.
// NOTE(review): several initializers in this section are cut off after the
// equals sign because their value lines are not visible in this excerpt
// (__kmp_debug_buf, __kmp_debug_buf_atomic, __kmp_debug_count and
// __kmp_debug_buf_warn_chars).
358 int __kmp_debug_buf =
360 int __kmp_debug_buf_lines =
361 KMP_DEBUG_BUF_LINES_INIT;
362 int __kmp_debug_buf_chars =
363 KMP_DEBUG_BUF_CHARS_INIT;
364 int __kmp_debug_buf_atomic =
367 char *__kmp_debug_buffer = NULL;
368 std::atomic<int> __kmp_debug_count =
370 int __kmp_debug_buf_warn_chars =
// Parallel-range filter: routine and file name buffers start as empty strings,
// and the bounds start as 0 and INT_MAX.
377 char __kmp_par_range_routine[KMP_PAR_RANGE_ROUTINE_LEN] = {
'\0'};
378 char __kmp_par_range_filename[KMP_PAR_RANGE_FILENAME_LEN] = {
'\0'};
379 int __kmp_par_range_lb = 0;
380 int __kmp_par_range_ub = INT_MAX;
// Storage-map and atfork settings.
// NOTE(review): the initializers of __kmp_storage_map,
// __kmp_storage_map_verbose and __kmp_need_register_atfork are not visible in
// this excerpt.
384 int __kmp_storage_map =
386 int __kmp_storage_map_verbose =
388 int __kmp_storage_map_verbose_specified = FALSE;
391 int __kmp_need_register_atfork =
393 int __kmp_need_register_atfork_specified = TRUE;
// Flags named for environment-provided settings; all start out FALSE.
395 int __kmp_env_stksize = FALSE;
396 int __kmp_env_blocktime = FALSE;
397 int __kmp_env_checks = FALSE;
398 int __kmp_env_consistency_check = FALSE;
// Yield settings: yielding starts enabled (1), and the init and next wait
// values come from KMP_INIT_WAIT and KMP_NEXT_WAIT.
404 kmp_int32 __kmp_use_yield = 1;
406 kmp_int32 __kmp_use_yield_exp_set = 0;
408 kmp_uint32 __kmp_yield_init = KMP_INIT_WAIT;
409 kmp_uint32 __kmp_yield_next = KMP_NEXT_WAIT;
// Tables of thread and root descriptor pointers; both start out NULL.
418 kmp_info_t **__kmp_threads = NULL;
419 kmp_root_t **__kmp_root = NULL;
// Thread counts (volatile, starting at 0) and the thread and team pool
// pointers (starting NULL).
423 volatile int __kmp_nth = 0;
424 volatile int __kmp_all_nth = 0;
425 volatile kmp_info_t *__kmp_thread_pool = NULL;
426 volatile kmp_team_t *__kmp_team_pool = NULL;
// Atomic count of active threads in the thread pool, initialized to 0.
429 std::atomic<int> __kmp_thread_pool_active_nth = ATOMIC_VAR_INIT(0);
// Global state object of type kmp_global_t, with no explicit initializer.
434 kmp_global_t __kmp_global;
// Runtime lock definitions. The same set of locks is defined twice: first with
// each definition preceded by KMP_ALIGN_CACHE_INTERNODE (when
// KMP_USE_INTERNODE_ALIGNMENT is enabled), and then without that prefix.
// NOTE(review): the directives that separate the two sets and close the
// conditional are not visible in this excerpt, and some lines inside each set
// appear to be missing as well.
440 #if KMP_USE_INTERNODE_ALIGNMENT
443 KMP_ALIGN_CACHE_INTERNODE
445 KMP_BOOTSTRAP_LOCK_INIT(__kmp_initz_lock);
446 KMP_ALIGN_CACHE_INTERNODE
447 KMP_BOOTSTRAP_LOCK_INIT(__kmp_forkjoin_lock);
448 KMP_ALIGN_CACHE_INTERNODE
449 KMP_BOOTSTRAP_LOCK_INIT(__kmp_exit_lock);
452 KMP_ALIGN_CACHE_INTERNODE
453 KMP_BOOTSTRAP_LOCK_INIT(__kmp_monitor_lock);
457 KMP_ALIGN_CACHE_INTERNODE
458 KMP_BOOTSTRAP_LOCK_INIT(__kmp_tp_cached_lock);
460 KMP_ALIGN_CACHE_INTERNODE
461 KMP_LOCK_INIT(__kmp_global_lock);
462 KMP_ALIGN_CACHE_INTERNODE
463 kmp_queuing_lock_t __kmp_dispatch_lock;
464 KMP_ALIGN_CACHE_INTERNODE
465 KMP_LOCK_INIT(__kmp_debug_lock);
// Second set: the same locks, defined without the alignment prefix.
469 KMP_BOOTSTRAP_LOCK_INIT(__kmp_initz_lock);
470 KMP_BOOTSTRAP_LOCK_INIT(__kmp_forkjoin_lock);
471 KMP_BOOTSTRAP_LOCK_INIT(__kmp_exit_lock);
474 KMP_BOOTSTRAP_LOCK_INIT(__kmp_monitor_lock);
478 KMP_BOOTSTRAP_LOCK_INIT(__kmp_tp_cached_lock);
481 KMP_LOCK_INIT(__kmp_global_lock);
483 kmp_queuing_lock_t __kmp_dispatch_lock;
485 KMP_LOCK_INIT(__kmp_debug_lock);
// Signal-handling flag, initially FALSE; guarded by KMP_HANDLE_SIGNALS.
// NOTE(review): the directive closing this conditional is not visible in this
// excerpt.
490 #if KMP_HANDLE_SIGNALS
510 int __kmp_handle_signals = FALSE;
// Copies the current value of __kmp_suspend_count into a local and then resets
// the global to 0.
// NOTE(review): the rest of this function after the reset is not visible in
// this excerpt; presumably it returns the saved count -- confirm.
514 int get_suspend_count_(
void) {
515 int count = __kmp_suspend_count;
516 __kmp_suspend_count = 0;
// Stores the int pointed to by value into __kmp_suspend_count.
// value is dereferenced without a null check, so it must point to a valid int.
519 void set_suspend_count_(
int *value) { __kmp_suspend_count = *value; }
// Int symbols, each set to 1, whose names spell out a linking requirement.
// Presumably they make duplicate or mismatched runtime libraries fail at link
// time with a readable symbol name -- confirm.
523 int _You_must_link_with_exactly_one_OpenMP_library = 1;
524 int _You_must_link_with_Intel_OpenMP_library = 1;
// The Microsoft variant is only defined on Windows when KMP_VERSION_MAJOR is
// greater than 4.
// NOTE(review): the directive closing this conditional is not visible in this
// excerpt.
525 #if KMP_OS_WINDOWS && (KMP_VERSION_MAJOR > 4)
526 int _You_must_link_with_Microsoft_OpenMP_library = 1;
// Target offload kind, initially tgt_default.
529 kmp_target_offload_kind_t __kmp_target_offload = tgt_default;
// Pause status, initially kmp_not_paused.
532 kmp_pause_status_t __kmp_pause_status = kmp_not_paused;