1*0b57cec5SDimitry Andric /* 2*0b57cec5SDimitry Andric * kmp_global.cpp -- KPTS global variables for runtime support library 3*0b57cec5SDimitry Andric */ 4*0b57cec5SDimitry Andric 5*0b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 6*0b57cec5SDimitry Andric // 7*0b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 8*0b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 9*0b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 10*0b57cec5SDimitry Andric // 11*0b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 12*0b57cec5SDimitry Andric 13*0b57cec5SDimitry Andric #include "kmp.h" 14*0b57cec5SDimitry Andric #include "kmp_affinity.h" 15*0b57cec5SDimitry Andric #if KMP_USE_HIER_SCHED 16*0b57cec5SDimitry Andric #include "kmp_dispatch_hier.h" 17*0b57cec5SDimitry Andric #endif 18*0b57cec5SDimitry Andric 19*0b57cec5SDimitry Andric kmp_key_t __kmp_gtid_threadprivate_key; 20*0b57cec5SDimitry Andric 21*0b57cec5SDimitry Andric #if KMP_ARCH_X86 || KMP_ARCH_X86_64 22*0b57cec5SDimitry Andric kmp_cpuinfo_t __kmp_cpuinfo = {0}; // Not initialized 23*0b57cec5SDimitry Andric #endif 24*0b57cec5SDimitry Andric 25*0b57cec5SDimitry Andric #if KMP_STATS_ENABLED 26*0b57cec5SDimitry Andric #include "kmp_stats.h" 27*0b57cec5SDimitry Andric // lock for modifying the global __kmp_stats_list 28*0b57cec5SDimitry Andric kmp_tas_lock_t __kmp_stats_lock; 29*0b57cec5SDimitry Andric 30*0b57cec5SDimitry Andric // global list of per thread stats, the head is a sentinel node which 31*0b57cec5SDimitry Andric // accumulates all stats produced before __kmp_create_worker is called. 32*0b57cec5SDimitry Andric kmp_stats_list *__kmp_stats_list; 33*0b57cec5SDimitry Andric 34*0b57cec5SDimitry Andric // thread local pointer to stats node within list 35*0b57cec5SDimitry Andric KMP_THREAD_LOCAL kmp_stats_list *__kmp_stats_thread_ptr = NULL; 36*0b57cec5SDimitry Andric 37*0b57cec5SDimitry Andric // gives reference tick for all events (considered the 0 tick) 38*0b57cec5SDimitry Andric tsc_tick_count __kmp_stats_start_time; 39*0b57cec5SDimitry Andric #endif 40*0b57cec5SDimitry Andric 41*0b57cec5SDimitry Andric /* ----------------------------------------------------- */ 42*0b57cec5SDimitry Andric /* INITIALIZATION VARIABLES */ 43*0b57cec5SDimitry Andric /* they are syncronized to write during init, but read anytime */ 44*0b57cec5SDimitry Andric volatile int __kmp_init_serial = FALSE; 45*0b57cec5SDimitry Andric volatile int __kmp_init_gtid = FALSE; 46*0b57cec5SDimitry Andric volatile int __kmp_init_common = FALSE; 47*0b57cec5SDimitry Andric volatile int __kmp_init_middle = FALSE; 48*0b57cec5SDimitry Andric volatile int __kmp_init_parallel = FALSE; 49*0b57cec5SDimitry Andric #if KMP_USE_MONITOR 50*0b57cec5SDimitry Andric volatile int __kmp_init_monitor = 51*0b57cec5SDimitry Andric 0; /* 1 - launched, 2 - actually started (Windows* OS only) */ 52*0b57cec5SDimitry Andric #endif 53*0b57cec5SDimitry Andric volatile int __kmp_init_user_locks = FALSE; 54*0b57cec5SDimitry Andric 55*0b57cec5SDimitry Andric /* list of address of allocated caches for commons */ 56*0b57cec5SDimitry Andric kmp_cached_addr_t *__kmp_threadpriv_cache_list = NULL; 57*0b57cec5SDimitry Andric 58*0b57cec5SDimitry Andric int __kmp_init_counter = 0; 59*0b57cec5SDimitry Andric int __kmp_root_counter = 0; 60*0b57cec5SDimitry Andric int __kmp_version = 0; 61*0b57cec5SDimitry Andric 62*0b57cec5SDimitry Andric std::atomic<kmp_int32> __kmp_team_counter = ATOMIC_VAR_INIT(0); 63*0b57cec5SDimitry Andric std::atomic<kmp_int32> __kmp_task_counter = ATOMIC_VAR_INIT(0); 64*0b57cec5SDimitry Andric 65*0b57cec5SDimitry Andric size_t __kmp_stksize = KMP_DEFAULT_STKSIZE; 66*0b57cec5SDimitry Andric #if KMP_USE_MONITOR 67*0b57cec5SDimitry Andric size_t __kmp_monitor_stksize = 0; // auto adjust 68*0b57cec5SDimitry Andric #endif 69*0b57cec5SDimitry Andric size_t __kmp_stkoffset = KMP_DEFAULT_STKOFFSET; 70*0b57cec5SDimitry Andric int __kmp_stkpadding = KMP_MIN_STKPADDING; 71*0b57cec5SDimitry Andric 72*0b57cec5SDimitry Andric size_t __kmp_malloc_pool_incr = KMP_DEFAULT_MALLOC_POOL_INCR; 73*0b57cec5SDimitry Andric 74*0b57cec5SDimitry Andric // Barrier method defaults, settings, and strings. 75*0b57cec5SDimitry Andric // branch factor = 2^branch_bits (only relevant for tree & hyper barrier types) 76*0b57cec5SDimitry Andric kmp_uint32 __kmp_barrier_gather_bb_dflt = 2; 77*0b57cec5SDimitry Andric /* branch_factor = 4 */ /* hyper2: C78980 */ 78*0b57cec5SDimitry Andric kmp_uint32 __kmp_barrier_release_bb_dflt = 2; 79*0b57cec5SDimitry Andric /* branch_factor = 4 */ /* hyper2: C78980 */ 80*0b57cec5SDimitry Andric 81*0b57cec5SDimitry Andric kmp_bar_pat_e __kmp_barrier_gather_pat_dflt = bp_hyper_bar; 82*0b57cec5SDimitry Andric /* hyper2: C78980 */ 83*0b57cec5SDimitry Andric kmp_bar_pat_e __kmp_barrier_release_pat_dflt = bp_hyper_bar; 84*0b57cec5SDimitry Andric /* hyper2: C78980 */ 85*0b57cec5SDimitry Andric 86*0b57cec5SDimitry Andric kmp_uint32 __kmp_barrier_gather_branch_bits[bs_last_barrier] = {0}; 87*0b57cec5SDimitry Andric kmp_uint32 __kmp_barrier_release_branch_bits[bs_last_barrier] = {0}; 88*0b57cec5SDimitry Andric kmp_bar_pat_e __kmp_barrier_gather_pattern[bs_last_barrier] = {bp_linear_bar}; 89*0b57cec5SDimitry Andric kmp_bar_pat_e __kmp_barrier_release_pattern[bs_last_barrier] = {bp_linear_bar}; 90*0b57cec5SDimitry Andric char const *__kmp_barrier_branch_bit_env_name[bs_last_barrier] = { 91*0b57cec5SDimitry Andric "KMP_PLAIN_BARRIER", "KMP_FORKJOIN_BARRIER" 92*0b57cec5SDimitry Andric #if KMP_FAST_REDUCTION_BARRIER 93*0b57cec5SDimitry Andric , 94*0b57cec5SDimitry Andric "KMP_REDUCTION_BARRIER" 95*0b57cec5SDimitry Andric #endif // KMP_FAST_REDUCTION_BARRIER 96*0b57cec5SDimitry Andric }; 97*0b57cec5SDimitry Andric char const *__kmp_barrier_pattern_env_name[bs_last_barrier] = { 98*0b57cec5SDimitry Andric "KMP_PLAIN_BARRIER_PATTERN", "KMP_FORKJOIN_BARRIER_PATTERN" 99*0b57cec5SDimitry Andric #if KMP_FAST_REDUCTION_BARRIER 100*0b57cec5SDimitry Andric , 101*0b57cec5SDimitry Andric "KMP_REDUCTION_BARRIER_PATTERN" 102*0b57cec5SDimitry Andric #endif // KMP_FAST_REDUCTION_BARRIER 103*0b57cec5SDimitry Andric }; 104*0b57cec5SDimitry Andric char const *__kmp_barrier_type_name[bs_last_barrier] = {"plain", "forkjoin" 105*0b57cec5SDimitry Andric #if KMP_FAST_REDUCTION_BARRIER 106*0b57cec5SDimitry Andric , 107*0b57cec5SDimitry Andric "reduction" 108*0b57cec5SDimitry Andric #endif // KMP_FAST_REDUCTION_BARRIER 109*0b57cec5SDimitry Andric }; 110*0b57cec5SDimitry Andric char const *__kmp_barrier_pattern_name[bp_last_bar] = {"linear", "tree", 111*0b57cec5SDimitry Andric "hyper", "hierarchical"}; 112*0b57cec5SDimitry Andric 113*0b57cec5SDimitry Andric int __kmp_allThreadsSpecified = 0; 114*0b57cec5SDimitry Andric size_t __kmp_align_alloc = CACHE_LINE; 115*0b57cec5SDimitry Andric 116*0b57cec5SDimitry Andric int __kmp_generate_warnings = kmp_warnings_low; 117*0b57cec5SDimitry Andric int __kmp_reserve_warn = 0; 118*0b57cec5SDimitry Andric int __kmp_xproc = 0; 119*0b57cec5SDimitry Andric int __kmp_avail_proc = 0; 120*0b57cec5SDimitry Andric size_t __kmp_sys_min_stksize = KMP_MIN_STKSIZE; 121*0b57cec5SDimitry Andric int __kmp_sys_max_nth = KMP_MAX_NTH; 122*0b57cec5SDimitry Andric int __kmp_max_nth = 0; 123*0b57cec5SDimitry Andric int __kmp_cg_max_nth = 0; 124*0b57cec5SDimitry Andric int __kmp_teams_max_nth = 0; 125*0b57cec5SDimitry Andric int __kmp_threads_capacity = 0; 126*0b57cec5SDimitry Andric int __kmp_dflt_team_nth = 0; 127*0b57cec5SDimitry Andric int __kmp_dflt_team_nth_ub = 0; 128*0b57cec5SDimitry Andric int __kmp_tp_capacity = 0; 129*0b57cec5SDimitry Andric int __kmp_tp_cached = 0; 130*0b57cec5SDimitry Andric int __kmp_dispatch_num_buffers = KMP_DFLT_DISP_NUM_BUFF; 131*0b57cec5SDimitry Andric int __kmp_dflt_max_active_levels = 1; // Nesting off by default 132*0b57cec5SDimitry Andric bool __kmp_dflt_max_active_levels_set = false; // Don't override set value 133*0b57cec5SDimitry Andric #if KMP_NESTED_HOT_TEAMS 134*0b57cec5SDimitry Andric int __kmp_hot_teams_mode = 0; /* 0 - free extra threads when reduced */ 135*0b57cec5SDimitry Andric /* 1 - keep extra threads when reduced */ 136*0b57cec5SDimitry Andric int __kmp_hot_teams_max_level = 1; /* nesting level of hot teams */ 137*0b57cec5SDimitry Andric #endif 138*0b57cec5SDimitry Andric enum library_type __kmp_library = library_none; 139*0b57cec5SDimitry Andric enum sched_type __kmp_sched = 140*0b57cec5SDimitry Andric kmp_sch_default; /* scheduling method for runtime scheduling */ 141*0b57cec5SDimitry Andric enum sched_type __kmp_static = 142*0b57cec5SDimitry Andric kmp_sch_static_greedy; /* default static scheduling method */ 143*0b57cec5SDimitry Andric enum sched_type __kmp_guided = 144*0b57cec5SDimitry Andric kmp_sch_guided_iterative_chunked; /* default guided scheduling method */ 145*0b57cec5SDimitry Andric enum sched_type __kmp_auto = 146*0b57cec5SDimitry Andric kmp_sch_guided_analytical_chunked; /* default auto scheduling method */ 147*0b57cec5SDimitry Andric #if KMP_USE_HIER_SCHED 148*0b57cec5SDimitry Andric int __kmp_dispatch_hand_threading = 0; 149*0b57cec5SDimitry Andric int __kmp_hier_max_units[kmp_hier_layer_e::LAYER_LAST + 1]; 150*0b57cec5SDimitry Andric int __kmp_hier_threads_per[kmp_hier_layer_e::LAYER_LAST + 1]; 151*0b57cec5SDimitry Andric kmp_hier_sched_env_t __kmp_hier_scheds = {0, 0, NULL, NULL, NULL}; 152*0b57cec5SDimitry Andric #endif 153*0b57cec5SDimitry Andric int __kmp_dflt_blocktime = KMP_DEFAULT_BLOCKTIME; 154*0b57cec5SDimitry Andric #if KMP_USE_MONITOR 155*0b57cec5SDimitry Andric int __kmp_monitor_wakeups = KMP_MIN_MONITOR_WAKEUPS; 156*0b57cec5SDimitry Andric int __kmp_bt_intervals = KMP_INTERVALS_FROM_BLOCKTIME(KMP_DEFAULT_BLOCKTIME, 157*0b57cec5SDimitry Andric KMP_MIN_MONITOR_WAKEUPS); 158*0b57cec5SDimitry Andric #endif 159*0b57cec5SDimitry Andric #ifdef KMP_ADJUST_BLOCKTIME 160*0b57cec5SDimitry Andric int __kmp_zero_bt = FALSE; 161*0b57cec5SDimitry Andric #endif /* KMP_ADJUST_BLOCKTIME */ 162*0b57cec5SDimitry Andric #ifdef KMP_DFLT_NTH_CORES 163*0b57cec5SDimitry Andric int __kmp_ncores = 0; 164*0b57cec5SDimitry Andric #endif 165*0b57cec5SDimitry Andric int __kmp_chunk = 0; 166*0b57cec5SDimitry Andric int __kmp_abort_delay = 0; 167*0b57cec5SDimitry Andric #if KMP_OS_LINUX && defined(KMP_TDATA_GTID) 168*0b57cec5SDimitry Andric int __kmp_gtid_mode = 3; /* use __declspec(thread) TLS to store gtid */ 169*0b57cec5SDimitry Andric int __kmp_adjust_gtid_mode = FALSE; 170*0b57cec5SDimitry Andric #elif KMP_OS_WINDOWS 171*0b57cec5SDimitry Andric int __kmp_gtid_mode = 2; /* use TLS functions to store gtid */ 172*0b57cec5SDimitry Andric int __kmp_adjust_gtid_mode = FALSE; 173*0b57cec5SDimitry Andric #else 174*0b57cec5SDimitry Andric int __kmp_gtid_mode = 0; /* select method to get gtid based on #threads */ 175*0b57cec5SDimitry Andric int __kmp_adjust_gtid_mode = TRUE; 176*0b57cec5SDimitry Andric #endif /* KMP_OS_LINUX && defined(KMP_TDATA_GTID) */ 177*0b57cec5SDimitry Andric #ifdef KMP_TDATA_GTID 178*0b57cec5SDimitry Andric KMP_THREAD_LOCAL int __kmp_gtid = KMP_GTID_DNE; 179*0b57cec5SDimitry Andric #endif /* KMP_TDATA_GTID */ 180*0b57cec5SDimitry Andric int __kmp_tls_gtid_min = INT_MAX; 181*0b57cec5SDimitry Andric int __kmp_foreign_tp = TRUE; 182*0b57cec5SDimitry Andric #if KMP_ARCH_X86 || KMP_ARCH_X86_64 183*0b57cec5SDimitry Andric int __kmp_inherit_fp_control = TRUE; 184*0b57cec5SDimitry Andric kmp_int16 __kmp_init_x87_fpu_control_word = 0; 185*0b57cec5SDimitry Andric kmp_uint32 __kmp_init_mxcsr = 0; 186*0b57cec5SDimitry Andric #endif /* KMP_ARCH_X86 || KMP_ARCH_X86_64 */ 187*0b57cec5SDimitry Andric 188*0b57cec5SDimitry Andric #ifdef USE_LOAD_BALANCE 189*0b57cec5SDimitry Andric double __kmp_load_balance_interval = 1.0; 190*0b57cec5SDimitry Andric #endif /* USE_LOAD_BALANCE */ 191*0b57cec5SDimitry Andric 192*0b57cec5SDimitry Andric kmp_nested_nthreads_t __kmp_nested_nth = {NULL, 0, 0}; 193*0b57cec5SDimitry Andric 194*0b57cec5SDimitry Andric #if KMP_USE_ADAPTIVE_LOCKS 195*0b57cec5SDimitry Andric 196*0b57cec5SDimitry Andric kmp_adaptive_backoff_params_t __kmp_adaptive_backoff_params = { 197*0b57cec5SDimitry Andric 1, 1024}; // TODO: tune it! 198*0b57cec5SDimitry Andric 199*0b57cec5SDimitry Andric #if KMP_DEBUG_ADAPTIVE_LOCKS 200*0b57cec5SDimitry Andric const char *__kmp_speculative_statsfile = "-"; 201*0b57cec5SDimitry Andric #endif 202*0b57cec5SDimitry Andric 203*0b57cec5SDimitry Andric #endif // KMP_USE_ADAPTIVE_LOCKS 204*0b57cec5SDimitry Andric 205*0b57cec5SDimitry Andric int __kmp_display_env = FALSE; 206*0b57cec5SDimitry Andric int __kmp_display_env_verbose = FALSE; 207*0b57cec5SDimitry Andric int __kmp_omp_cancellation = FALSE; 208*0b57cec5SDimitry Andric 209*0b57cec5SDimitry Andric /* map OMP 3.0 schedule types with our internal schedule types */ 210*0b57cec5SDimitry Andric enum sched_type __kmp_sch_map[kmp_sched_upper - kmp_sched_lower_ext + 211*0b57cec5SDimitry Andric kmp_sched_upper_std - kmp_sched_lower - 2] = { 212*0b57cec5SDimitry Andric kmp_sch_static_chunked, // ==> kmp_sched_static = 1 213*0b57cec5SDimitry Andric kmp_sch_dynamic_chunked, // ==> kmp_sched_dynamic = 2 214*0b57cec5SDimitry Andric kmp_sch_guided_chunked, // ==> kmp_sched_guided = 3 215*0b57cec5SDimitry Andric kmp_sch_auto, // ==> kmp_sched_auto = 4 216*0b57cec5SDimitry Andric kmp_sch_trapezoidal // ==> kmp_sched_trapezoidal = 101 217*0b57cec5SDimitry Andric // will likely not be used, introduced here just to debug the code 218*0b57cec5SDimitry Andric // of public intel extension schedules 219*0b57cec5SDimitry Andric }; 220*0b57cec5SDimitry Andric 221*0b57cec5SDimitry Andric #if KMP_OS_LINUX 222*0b57cec5SDimitry Andric enum clock_function_type __kmp_clock_function; 223*0b57cec5SDimitry Andric int __kmp_clock_function_param; 224*0b57cec5SDimitry Andric #endif /* KMP_OS_LINUX */ 225*0b57cec5SDimitry Andric 226*0b57cec5SDimitry Andric #if KMP_MIC_SUPPORTED 227*0b57cec5SDimitry Andric enum mic_type __kmp_mic_type = non_mic; 228*0b57cec5SDimitry Andric #endif 229*0b57cec5SDimitry Andric 230*0b57cec5SDimitry Andric #if KMP_AFFINITY_SUPPORTED 231*0b57cec5SDimitry Andric 232*0b57cec5SDimitry Andric KMPAffinity *__kmp_affinity_dispatch = NULL; 233*0b57cec5SDimitry Andric 234*0b57cec5SDimitry Andric #if KMP_USE_HWLOC 235*0b57cec5SDimitry Andric int __kmp_hwloc_error = FALSE; 236*0b57cec5SDimitry Andric hwloc_topology_t __kmp_hwloc_topology = NULL; 237*0b57cec5SDimitry Andric int __kmp_numa_detected = FALSE; 238*0b57cec5SDimitry Andric int __kmp_tile_depth = 0; 239*0b57cec5SDimitry Andric #endif 240*0b57cec5SDimitry Andric 241*0b57cec5SDimitry Andric #if KMP_OS_WINDOWS 242*0b57cec5SDimitry Andric #if KMP_GROUP_AFFINITY 243*0b57cec5SDimitry Andric int __kmp_num_proc_groups = 1; 244*0b57cec5SDimitry Andric #endif /* KMP_GROUP_AFFINITY */ 245*0b57cec5SDimitry Andric kmp_GetActiveProcessorCount_t __kmp_GetActiveProcessorCount = NULL; 246*0b57cec5SDimitry Andric kmp_GetActiveProcessorGroupCount_t __kmp_GetActiveProcessorGroupCount = NULL; 247*0b57cec5SDimitry Andric kmp_GetThreadGroupAffinity_t __kmp_GetThreadGroupAffinity = NULL; 248*0b57cec5SDimitry Andric kmp_SetThreadGroupAffinity_t __kmp_SetThreadGroupAffinity = NULL; 249*0b57cec5SDimitry Andric #endif /* KMP_OS_WINDOWS */ 250*0b57cec5SDimitry Andric 251*0b57cec5SDimitry Andric size_t __kmp_affin_mask_size = 0; 252*0b57cec5SDimitry Andric enum affinity_type __kmp_affinity_type = affinity_default; 253*0b57cec5SDimitry Andric enum affinity_gran __kmp_affinity_gran = affinity_gran_default; 254*0b57cec5SDimitry Andric int __kmp_affinity_gran_levels = -1; 255*0b57cec5SDimitry Andric int __kmp_affinity_dups = TRUE; 256*0b57cec5SDimitry Andric enum affinity_top_method __kmp_affinity_top_method = 257*0b57cec5SDimitry Andric affinity_top_method_default; 258*0b57cec5SDimitry Andric int __kmp_affinity_compact = 0; 259*0b57cec5SDimitry Andric int __kmp_affinity_offset = 0; 260*0b57cec5SDimitry Andric int __kmp_affinity_verbose = FALSE; 261*0b57cec5SDimitry Andric int __kmp_affinity_warnings = TRUE; 262*0b57cec5SDimitry Andric int __kmp_affinity_respect_mask = affinity_respect_mask_default; 263*0b57cec5SDimitry Andric char *__kmp_affinity_proclist = NULL; 264*0b57cec5SDimitry Andric kmp_affin_mask_t *__kmp_affinity_masks = NULL; 265*0b57cec5SDimitry Andric unsigned __kmp_affinity_num_masks = 0; 266*0b57cec5SDimitry Andric 267*0b57cec5SDimitry Andric char *__kmp_cpuinfo_file = NULL; 268*0b57cec5SDimitry Andric 269*0b57cec5SDimitry Andric #endif /* KMP_AFFINITY_SUPPORTED */ 270*0b57cec5SDimitry Andric 271*0b57cec5SDimitry Andric kmp_nested_proc_bind_t __kmp_nested_proc_bind = {NULL, 0, 0}; 272*0b57cec5SDimitry Andric int __kmp_affinity_num_places = 0; 273*0b57cec5SDimitry Andric int __kmp_display_affinity = FALSE; 274*0b57cec5SDimitry Andric char *__kmp_affinity_format = NULL; 275*0b57cec5SDimitry Andric 276*0b57cec5SDimitry Andric kmp_hws_item_t __kmp_hws_socket = {0, 0}; 277*0b57cec5SDimitry Andric kmp_hws_item_t __kmp_hws_node = {0, 0}; 278*0b57cec5SDimitry Andric kmp_hws_item_t __kmp_hws_tile = {0, 0}; 279*0b57cec5SDimitry Andric kmp_hws_item_t __kmp_hws_core = {0, 0}; 280*0b57cec5SDimitry Andric kmp_hws_item_t __kmp_hws_proc = {0, 0}; 281*0b57cec5SDimitry Andric int __kmp_hws_requested = 0; 282*0b57cec5SDimitry Andric int __kmp_hws_abs_flag = 0; // absolute or per-item number requested 283*0b57cec5SDimitry Andric 284*0b57cec5SDimitry Andric kmp_int32 __kmp_default_device = 0; 285*0b57cec5SDimitry Andric 286*0b57cec5SDimitry Andric kmp_tasking_mode_t __kmp_tasking_mode = tskm_task_teams; 287*0b57cec5SDimitry Andric kmp_int32 __kmp_max_task_priority = 0; 288*0b57cec5SDimitry Andric kmp_uint64 __kmp_taskloop_min_tasks = 0; 289*0b57cec5SDimitry Andric 290*0b57cec5SDimitry Andric int __kmp_memkind_available = 0; 291*0b57cec5SDimitry Andric omp_allocator_handle_t const omp_null_allocator = NULL; 292*0b57cec5SDimitry Andric omp_allocator_handle_t const omp_default_mem_alloc = 293*0b57cec5SDimitry Andric (omp_allocator_handle_t const)1; 294*0b57cec5SDimitry Andric omp_allocator_handle_t const omp_large_cap_mem_alloc = 295*0b57cec5SDimitry Andric (omp_allocator_handle_t const)2; 296*0b57cec5SDimitry Andric omp_allocator_handle_t const omp_const_mem_alloc = 297*0b57cec5SDimitry Andric (omp_allocator_handle_t const)3; 298*0b57cec5SDimitry Andric omp_allocator_handle_t const omp_high_bw_mem_alloc = 299*0b57cec5SDimitry Andric (omp_allocator_handle_t const)4; 300*0b57cec5SDimitry Andric omp_allocator_handle_t const omp_low_lat_mem_alloc = 301*0b57cec5SDimitry Andric (omp_allocator_handle_t const)5; 302*0b57cec5SDimitry Andric omp_allocator_handle_t const omp_cgroup_mem_alloc = 303*0b57cec5SDimitry Andric (omp_allocator_handle_t const)6; 304*0b57cec5SDimitry Andric omp_allocator_handle_t const omp_pteam_mem_alloc = 305*0b57cec5SDimitry Andric (omp_allocator_handle_t const)7; 306*0b57cec5SDimitry Andric omp_allocator_handle_t const omp_thread_mem_alloc = 307*0b57cec5SDimitry Andric (omp_allocator_handle_t const)8; 308*0b57cec5SDimitry Andric omp_allocator_handle_t const kmp_max_mem_alloc = 309*0b57cec5SDimitry Andric (omp_allocator_handle_t const)1024; 310*0b57cec5SDimitry Andric omp_allocator_handle_t __kmp_def_allocator = omp_default_mem_alloc; 311*0b57cec5SDimitry Andric 312*0b57cec5SDimitry Andric omp_memspace_handle_t const omp_default_mem_space = 313*0b57cec5SDimitry Andric (omp_memspace_handle_t const)0; 314*0b57cec5SDimitry Andric omp_memspace_handle_t const omp_large_cap_mem_space = 315*0b57cec5SDimitry Andric (omp_memspace_handle_t const)1; 316*0b57cec5SDimitry Andric omp_memspace_handle_t const omp_const_mem_space = 317*0b57cec5SDimitry Andric (omp_memspace_handle_t const)2; 318*0b57cec5SDimitry Andric omp_memspace_handle_t const omp_high_bw_mem_space = 319*0b57cec5SDimitry Andric (omp_memspace_handle_t const)3; 320*0b57cec5SDimitry Andric omp_memspace_handle_t const omp_low_lat_mem_space = 321*0b57cec5SDimitry Andric (omp_memspace_handle_t const)4; 322*0b57cec5SDimitry Andric 323*0b57cec5SDimitry Andric /* This check ensures that the compiler is passing the correct data type for the 324*0b57cec5SDimitry Andric flags formal parameter of the function kmpc_omp_task_alloc(). If the type is 325*0b57cec5SDimitry Andric not a 4-byte type, then give an error message about a non-positive length 326*0b57cec5SDimitry Andric array pointing here. If that happens, the kmp_tasking_flags_t structure must 327*0b57cec5SDimitry Andric be redefined to have exactly 32 bits. */ 328*0b57cec5SDimitry Andric KMP_BUILD_ASSERT(sizeof(kmp_tasking_flags_t) == 4); 329*0b57cec5SDimitry Andric 330*0b57cec5SDimitry Andric int __kmp_task_stealing_constraint = 1; /* Constrain task stealing by default */ 331*0b57cec5SDimitry Andric int __kmp_enable_task_throttling = 1; 332*0b57cec5SDimitry Andric 333*0b57cec5SDimitry Andric #ifdef DEBUG_SUSPEND 334*0b57cec5SDimitry Andric int __kmp_suspend_count = 0; 335*0b57cec5SDimitry Andric #endif 336*0b57cec5SDimitry Andric 337*0b57cec5SDimitry Andric int __kmp_settings = FALSE; 338*0b57cec5SDimitry Andric int __kmp_duplicate_library_ok = 0; 339*0b57cec5SDimitry Andric #if USE_ITT_BUILD 340*0b57cec5SDimitry Andric int __kmp_forkjoin_frames = 1; 341*0b57cec5SDimitry Andric int __kmp_forkjoin_frames_mode = 3; 342*0b57cec5SDimitry Andric #endif 343*0b57cec5SDimitry Andric PACKED_REDUCTION_METHOD_T __kmp_force_reduction_method = 344*0b57cec5SDimitry Andric reduction_method_not_defined; 345*0b57cec5SDimitry Andric int __kmp_determ_red = FALSE; 346*0b57cec5SDimitry Andric 347*0b57cec5SDimitry Andric #ifdef KMP_DEBUG 348*0b57cec5SDimitry Andric int kmp_a_debug = 0; 349*0b57cec5SDimitry Andric int kmp_b_debug = 0; 350*0b57cec5SDimitry Andric int kmp_c_debug = 0; 351*0b57cec5SDimitry Andric int kmp_d_debug = 0; 352*0b57cec5SDimitry Andric int kmp_e_debug = 0; 353*0b57cec5SDimitry Andric int kmp_f_debug = 0; 354*0b57cec5SDimitry Andric int kmp_diag = 0; 355*0b57cec5SDimitry Andric #endif 356*0b57cec5SDimitry Andric 357*0b57cec5SDimitry Andric /* For debug information logging using rotating buffer */ 358*0b57cec5SDimitry Andric int __kmp_debug_buf = 359*0b57cec5SDimitry Andric FALSE; /* TRUE means use buffer, FALSE means print to stderr */ 360*0b57cec5SDimitry Andric int __kmp_debug_buf_lines = 361*0b57cec5SDimitry Andric KMP_DEBUG_BUF_LINES_INIT; /* Lines of debug stored in buffer */ 362*0b57cec5SDimitry Andric int __kmp_debug_buf_chars = 363*0b57cec5SDimitry Andric KMP_DEBUG_BUF_CHARS_INIT; /* Characters allowed per line in buffer */ 364*0b57cec5SDimitry Andric int __kmp_debug_buf_atomic = 365*0b57cec5SDimitry Andric FALSE; /* TRUE means use atomic update of buffer entry pointer */ 366*0b57cec5SDimitry Andric 367*0b57cec5SDimitry Andric char *__kmp_debug_buffer = NULL; /* Debug buffer itself */ 368*0b57cec5SDimitry Andric std::atomic<int> __kmp_debug_count = 369*0b57cec5SDimitry Andric ATOMIC_VAR_INIT(0); /* number of lines printed in buffer so far */ 370*0b57cec5SDimitry Andric int __kmp_debug_buf_warn_chars = 371*0b57cec5SDimitry Andric 0; /* Keep track of char increase recommended in warnings */ 372*0b57cec5SDimitry Andric /* end rotating debug buffer */ 373*0b57cec5SDimitry Andric 374*0b57cec5SDimitry Andric #ifdef KMP_DEBUG 375*0b57cec5SDimitry Andric int __kmp_par_range; /* +1 => only go par for constructs in range */ 376*0b57cec5SDimitry Andric /* -1 => only go par for constructs outside range */ 377*0b57cec5SDimitry Andric char __kmp_par_range_routine[KMP_PAR_RANGE_ROUTINE_LEN] = {'\0'}; 378*0b57cec5SDimitry Andric char __kmp_par_range_filename[KMP_PAR_RANGE_FILENAME_LEN] = {'\0'}; 379*0b57cec5SDimitry Andric int __kmp_par_range_lb = 0; 380*0b57cec5SDimitry Andric int __kmp_par_range_ub = INT_MAX; 381*0b57cec5SDimitry Andric #endif /* KMP_DEBUG */ 382*0b57cec5SDimitry Andric 383*0b57cec5SDimitry Andric /* For printing out dynamic storage map for threads and teams */ 384*0b57cec5SDimitry Andric int __kmp_storage_map = 385*0b57cec5SDimitry Andric FALSE; /* True means print storage map for threads and teams */ 386*0b57cec5SDimitry Andric int __kmp_storage_map_verbose = 387*0b57cec5SDimitry Andric FALSE; /* True means storage map includes placement info */ 388*0b57cec5SDimitry Andric int __kmp_storage_map_verbose_specified = FALSE; 389*0b57cec5SDimitry Andric /* Initialize the library data structures when we fork a child process, defaults 390*0b57cec5SDimitry Andric * to TRUE */ 391*0b57cec5SDimitry Andric int __kmp_need_register_atfork = 392*0b57cec5SDimitry Andric TRUE; /* At initialization, call pthread_atfork to install fork handler */ 393*0b57cec5SDimitry Andric int __kmp_need_register_atfork_specified = TRUE; 394*0b57cec5SDimitry Andric 395*0b57cec5SDimitry Andric int __kmp_env_stksize = FALSE; /* KMP_STACKSIZE specified? */ 396*0b57cec5SDimitry Andric int __kmp_env_blocktime = FALSE; /* KMP_BLOCKTIME specified? */ 397*0b57cec5SDimitry Andric int __kmp_env_checks = FALSE; /* KMP_CHECKS specified? */ 398*0b57cec5SDimitry Andric int __kmp_env_consistency_check = FALSE; /* KMP_CONSISTENCY_CHECK specified? */ 399*0b57cec5SDimitry Andric 400*0b57cec5SDimitry Andric // From KMP_USE_YIELD: 401*0b57cec5SDimitry Andric // 0 = never yield; 402*0b57cec5SDimitry Andric // 1 = always yield (default); 403*0b57cec5SDimitry Andric // 2 = yield only if oversubscribed 404*0b57cec5SDimitry Andric kmp_int32 __kmp_use_yield = 1; 405*0b57cec5SDimitry Andric // This will be 1 if KMP_USE_YIELD environment variable was set explicitly 406*0b57cec5SDimitry Andric kmp_int32 __kmp_use_yield_exp_set = 0; 407*0b57cec5SDimitry Andric 408*0b57cec5SDimitry Andric kmp_uint32 __kmp_yield_init = KMP_INIT_WAIT; 409*0b57cec5SDimitry Andric kmp_uint32 __kmp_yield_next = KMP_NEXT_WAIT; 410*0b57cec5SDimitry Andric 411*0b57cec5SDimitry Andric /* ------------------------------------------------------ */ 412*0b57cec5SDimitry Andric /* STATE mostly syncronized with global lock */ 413*0b57cec5SDimitry Andric /* data written to rarely by masters, read often by workers */ 414*0b57cec5SDimitry Andric /* TODO: None of this global padding stuff works consistently because the order 415*0b57cec5SDimitry Andric of declaration is not necessarily correlated to storage order. To fix this, 416*0b57cec5SDimitry Andric all the important globals must be put in a big structure instead. */ 417*0b57cec5SDimitry Andric KMP_ALIGN_CACHE 418*0b57cec5SDimitry Andric kmp_info_t **__kmp_threads = NULL; 419*0b57cec5SDimitry Andric kmp_root_t **__kmp_root = NULL; 420*0b57cec5SDimitry Andric 421*0b57cec5SDimitry Andric /* data read/written to often by masters */ 422*0b57cec5SDimitry Andric KMP_ALIGN_CACHE 423*0b57cec5SDimitry Andric volatile int __kmp_nth = 0; 424*0b57cec5SDimitry Andric volatile int __kmp_all_nth = 0; 425*0b57cec5SDimitry Andric volatile kmp_info_t *__kmp_thread_pool = NULL; 426*0b57cec5SDimitry Andric volatile kmp_team_t *__kmp_team_pool = NULL; 427*0b57cec5SDimitry Andric 428*0b57cec5SDimitry Andric KMP_ALIGN_CACHE 429*0b57cec5SDimitry Andric std::atomic<int> __kmp_thread_pool_active_nth = ATOMIC_VAR_INIT(0); 430*0b57cec5SDimitry Andric 431*0b57cec5SDimitry Andric /* ------------------------------------------------- 432*0b57cec5SDimitry Andric * GLOBAL/ROOT STATE */ 433*0b57cec5SDimitry Andric KMP_ALIGN_CACHE 434*0b57cec5SDimitry Andric kmp_global_t __kmp_global = {{0}}; 435*0b57cec5SDimitry Andric 436*0b57cec5SDimitry Andric /* ----------------------------------------------- */ 437*0b57cec5SDimitry Andric /* GLOBAL SYNCHRONIZATION LOCKS */ 438*0b57cec5SDimitry Andric /* TODO verify the need for these locks and if they need to be global */ 439*0b57cec5SDimitry Andric 440*0b57cec5SDimitry Andric #if KMP_USE_INTERNODE_ALIGNMENT 441*0b57cec5SDimitry Andric /* Multinode systems have larger cache line granularity which can cause 442*0b57cec5SDimitry Andric * false sharing if the alignment is not large enough for these locks */ 443*0b57cec5SDimitry Andric KMP_ALIGN_CACHE_INTERNODE 444*0b57cec5SDimitry Andric 445*0b57cec5SDimitry Andric KMP_BOOTSTRAP_LOCK_INIT(__kmp_initz_lock); /* Control initializations */ 446*0b57cec5SDimitry Andric KMP_ALIGN_CACHE_INTERNODE 447*0b57cec5SDimitry Andric KMP_BOOTSTRAP_LOCK_INIT(__kmp_forkjoin_lock); /* control fork/join access */ 448*0b57cec5SDimitry Andric KMP_ALIGN_CACHE_INTERNODE 449*0b57cec5SDimitry Andric KMP_BOOTSTRAP_LOCK_INIT(__kmp_exit_lock); /* exit() is not always thread-safe */ 450*0b57cec5SDimitry Andric #if KMP_USE_MONITOR 451*0b57cec5SDimitry Andric /* control monitor thread creation */ 452*0b57cec5SDimitry Andric KMP_ALIGN_CACHE_INTERNODE 453*0b57cec5SDimitry Andric KMP_BOOTSTRAP_LOCK_INIT(__kmp_monitor_lock); 454*0b57cec5SDimitry Andric #endif 455*0b57cec5SDimitry Andric /* used for the hack to allow threadprivate cache and __kmp_threads expansion 456*0b57cec5SDimitry Andric to co-exist */ 457*0b57cec5SDimitry Andric KMP_ALIGN_CACHE_INTERNODE 458*0b57cec5SDimitry Andric KMP_BOOTSTRAP_LOCK_INIT(__kmp_tp_cached_lock); 459*0b57cec5SDimitry Andric 460*0b57cec5SDimitry Andric KMP_ALIGN_CACHE_INTERNODE 461*0b57cec5SDimitry Andric KMP_LOCK_INIT(__kmp_global_lock); /* Control OS/global access */ 462*0b57cec5SDimitry Andric KMP_ALIGN_CACHE_INTERNODE 463*0b57cec5SDimitry Andric kmp_queuing_lock_t __kmp_dispatch_lock; /* Control dispatch access */ 464*0b57cec5SDimitry Andric KMP_ALIGN_CACHE_INTERNODE 465*0b57cec5SDimitry Andric KMP_LOCK_INIT(__kmp_debug_lock); /* Control I/O access for KMP_DEBUG */ 466*0b57cec5SDimitry Andric #else 467*0b57cec5SDimitry Andric KMP_ALIGN_CACHE 468*0b57cec5SDimitry Andric 469*0b57cec5SDimitry Andric KMP_BOOTSTRAP_LOCK_INIT(__kmp_initz_lock); /* Control initializations */ 470*0b57cec5SDimitry Andric KMP_BOOTSTRAP_LOCK_INIT(__kmp_forkjoin_lock); /* control fork/join access */ 471*0b57cec5SDimitry Andric KMP_BOOTSTRAP_LOCK_INIT(__kmp_exit_lock); /* exit() is not always thread-safe */ 472*0b57cec5SDimitry Andric #if KMP_USE_MONITOR 473*0b57cec5SDimitry Andric /* control monitor thread creation */ 474*0b57cec5SDimitry Andric KMP_BOOTSTRAP_LOCK_INIT(__kmp_monitor_lock); 475*0b57cec5SDimitry Andric #endif 476*0b57cec5SDimitry Andric /* used for the hack to allow threadprivate cache and __kmp_threads expansion 477*0b57cec5SDimitry Andric to co-exist */ 478*0b57cec5SDimitry Andric KMP_BOOTSTRAP_LOCK_INIT(__kmp_tp_cached_lock); 479*0b57cec5SDimitry Andric 480*0b57cec5SDimitry Andric KMP_ALIGN(128) 481*0b57cec5SDimitry Andric KMP_LOCK_INIT(__kmp_global_lock); /* Control OS/global access */ 482*0b57cec5SDimitry Andric KMP_ALIGN(128) 483*0b57cec5SDimitry Andric kmp_queuing_lock_t __kmp_dispatch_lock; /* Control dispatch access */ 484*0b57cec5SDimitry Andric KMP_ALIGN(128) 485*0b57cec5SDimitry Andric KMP_LOCK_INIT(__kmp_debug_lock); /* Control I/O access for KMP_DEBUG */ 486*0b57cec5SDimitry Andric #endif 487*0b57cec5SDimitry Andric 488*0b57cec5SDimitry Andric /* ----------------------------------------------- */ 489*0b57cec5SDimitry Andric 490*0b57cec5SDimitry Andric #if KMP_HANDLE_SIGNALS 491*0b57cec5SDimitry Andric /* Signal handling is disabled by default, because it confuses users: In case of 492*0b57cec5SDimitry Andric sigsegv (or other trouble) in user code signal handler catches the signal, 493*0b57cec5SDimitry Andric which then "appears" in the monitor thread (when the monitor executes raise() 494*0b57cec5SDimitry Andric function). Users see signal in the monitor thread and blame OpenMP RTL. 495*0b57cec5SDimitry Andric 496*0b57cec5SDimitry Andric Grant said signal handling required on some older OSes (Irix?) supported by 497*0b57cec5SDimitry Andric KAI, because bad applications hung but not aborted. Currently it is not a 498*0b57cec5SDimitry Andric problem for Linux* OS, OS X* and Windows* OS. 499*0b57cec5SDimitry Andric 500*0b57cec5SDimitry Andric Grant: Found new hangs for EL4, EL5, and a Fedora Core machine. So I'm 501*0b57cec5SDimitry Andric putting the default back for now to see if that fixes hangs on those 502*0b57cec5SDimitry Andric machines. 503*0b57cec5SDimitry Andric 504*0b57cec5SDimitry Andric 2010-04013 Lev: It was a bug in Fortran RTL. Fortran RTL prints a kind of 505*0b57cec5SDimitry Andric stack backtrace when program is aborting, but the code is not signal-safe. 506*0b57cec5SDimitry Andric When multiple signals raised at the same time (which occurs in dynamic 507*0b57cec5SDimitry Andric negative tests because all the worker threads detects the same error), 508*0b57cec5SDimitry Andric Fortran RTL may hang. The bug finally fixed in Fortran RTL library provided 509*0b57cec5SDimitry Andric by Steve R., and will be available soon. */ 510*0b57cec5SDimitry Andric int __kmp_handle_signals = FALSE; 511*0b57cec5SDimitry Andric #endif 512*0b57cec5SDimitry Andric 513*0b57cec5SDimitry Andric #ifdef DEBUG_SUSPEND 514*0b57cec5SDimitry Andric int get_suspend_count_(void) { 515*0b57cec5SDimitry Andric int count = __kmp_suspend_count; 516*0b57cec5SDimitry Andric __kmp_suspend_count = 0; 517*0b57cec5SDimitry Andric return count; 518*0b57cec5SDimitry Andric } 519*0b57cec5SDimitry Andric void set_suspend_count_(int *value) { __kmp_suspend_count = *value; } 520*0b57cec5SDimitry Andric #endif 521*0b57cec5SDimitry Andric 522*0b57cec5SDimitry Andric // Symbols for MS mutual detection. 523*0b57cec5SDimitry Andric int _You_must_link_with_exactly_one_OpenMP_library = 1; 524*0b57cec5SDimitry Andric int _You_must_link_with_Intel_OpenMP_library = 1; 525*0b57cec5SDimitry Andric #if KMP_OS_WINDOWS && (KMP_VERSION_MAJOR > 4) 526*0b57cec5SDimitry Andric int _You_must_link_with_Microsoft_OpenMP_library = 1; 527*0b57cec5SDimitry Andric #endif 528*0b57cec5SDimitry Andric 529*0b57cec5SDimitry Andric kmp_target_offload_kind_t __kmp_target_offload = tgt_default; 530*0b57cec5SDimitry Andric 531*0b57cec5SDimitry Andric // OMP Pause Resources 532*0b57cec5SDimitry Andric kmp_pause_status_t __kmp_pause_status = kmp_not_paused; 533*0b57cec5SDimitry Andric 534*0b57cec5SDimitry Andric // end of file // 535