/*
 * kmp_global.c -- KPTS global variables for runtime support library
 * $Revision: 42816 $
 * $Date: 2013-11-11 15:33:37 -0600 (Mon, 11 Nov 2013) $
 */


//===----------------------------------------------------------------------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is dual licensed under the MIT and the University of Illinois Open
// Source Licenses. See LICENSE.txt for details.
//
//===----------------------------------------------------------------------===//


#include "kmp.h"

20#ifdef KMP_SETVERSION
21char __kmp_setversion_string[] = VERSION_STRING;
22#endif
23
24kmp_key_t __kmp_gtid_threadprivate_key;
25
26kmp_cpuinfo_t __kmp_cpuinfo = { 0 }; // Not initialized
Jim Cownie5e8470a2013-09-27 10:38:44 +000027
28
29/* ----------------------------------------------------- */
30/* INITIALIZATION VARIABLES */
31/* they are syncronized to write during init, but read anytime */
32volatile int __kmp_init_serial = FALSE;
33volatile int __kmp_init_gtid = FALSE;
34volatile int __kmp_init_common = FALSE;
35volatile int __kmp_init_middle = FALSE;
36volatile int __kmp_init_parallel = FALSE;
37volatile int __kmp_init_monitor = 0; /* 1 - launched, 2 - actually started (Windows* OS only) */
38volatile int __kmp_init_user_locks = FALSE;
39
40/* list of address of allocated caches for commons */
41kmp_cached_addr_t *__kmp_threadpriv_cache_list = NULL;
42
/* Plain integer globals, all starting at zero.
   NOTE(review): what each one counts or encodes is not visible in this file --
   see the code that updates them. */
int __kmp_init_counter = 0;
int __kmp_root_counter = 0;
int __kmp_version      = 0;

47volatile kmp_uint32 __kmp_team_counter = 0;
48volatile kmp_uint32 __kmp_task_counter = 0;
49
50unsigned int __kmp_init_wait = KMP_DEFAULT_INIT_WAIT; /* initial number of spin-tests */
51unsigned int __kmp_next_wait = KMP_DEFAULT_NEXT_WAIT; /* susequent number of spin-tests */
52
53size_t __kmp_stksize = KMP_DEFAULT_STKSIZE;
54size_t __kmp_monitor_stksize = 0; // auto adjust
55size_t __kmp_stkoffset = KMP_DEFAULT_STKOFFSET;
56
57size_t __kmp_malloc_pool_incr = KMP_DEFAULT_MALLOC_POOL_INCR;
58
59/* Barrier method defaults, settings, and strings */
60/* branch factor = 2^branch_bits (only relevant for tree and hyper barrier types) */
61#if KMP_ARCH_X86_64
62kmp_uint32 __kmp_barrier_gather_bb_dflt = 2; /* branch_factor = 4 */ /* hyper2: C78980 */
63kmp_uint32 __kmp_barrier_release_bb_dflt = 2; /* branch_factor = 4 */ /* hyper2: C78980 */
64#else
65kmp_uint32 __kmp_barrier_gather_bb_dflt = 2; /* branch_factor = 4 */ /* communication in core for MIC */
66kmp_uint32 __kmp_barrier_release_bb_dflt = 2; /* branch_factor = 4 */ /* communication in core for MIC */
67#endif // KMP_ARCH_X86_64
68#if KMP_ARCH_X86_64
69kmp_bar_pat_e __kmp_barrier_gather_pat_dflt = bp_hyper_bar; /* hyper2: C78980 */
70kmp_bar_pat_e __kmp_barrier_release_pat_dflt = bp_hyper_bar; /* hyper2: C78980 */
71#else
72kmp_bar_pat_e __kmp_barrier_gather_pat_dflt = bp_linear_bar;
73kmp_bar_pat_e __kmp_barrier_release_pat_dflt = bp_linear_bar;
74#endif
75kmp_uint32 __kmp_barrier_gather_branch_bits [ bs_last_barrier ] = { 0 };
76kmp_uint32 __kmp_barrier_release_branch_bits [ bs_last_barrier ] = { 0 };
77kmp_bar_pat_e __kmp_barrier_gather_pattern [ bs_last_barrier ] = { bp_linear_bar };
78kmp_bar_pat_e __kmp_barrier_release_pattern [ bs_last_barrier ] = { bp_linear_bar };
79char const *__kmp_barrier_branch_bit_env_name [ bs_last_barrier ] =
80 { "KMP_PLAIN_BARRIER", "KMP_FORKJOIN_BARRIER"
81 #if KMP_FAST_REDUCTION_BARRIER
82 , "KMP_REDUCTION_BARRIER"
83 #endif // KMP_FAST_REDUCTION_BARRIER
84 };
85char const *__kmp_barrier_pattern_env_name [ bs_last_barrier ] =
86 { "KMP_PLAIN_BARRIER_PATTERN", "KMP_FORKJOIN_BARRIER_PATTERN"
87 #if KMP_FAST_REDUCTION_BARRIER
88 , "KMP_REDUCTION_BARRIER_PATTERN"
89 #endif // KMP_FAST_REDUCTION_BARRIER
90 };
91char const *__kmp_barrier_type_name [ bs_last_barrier ] =
92 { "plain", "forkjoin"
93 #if KMP_FAST_REDUCTION_BARRIER
94 , "reduction"
95 #endif // KMP_FAST_REDUCTION_BARRIER
96 };
97char const *__kmp_barrier_pattern_name [ bp_last_bar ] = { "linear", "tree", "hyper" };
98
99
100int __kmp_allThreadsSpecified = 0;
101size_t __kmp_align_alloc = CACHE_LINE;
102
103
104int __kmp_generate_warnings = kmp_warnings_low;
105int __kmp_reserve_warn = 0;
106int __kmp_xproc = 0;
107int __kmp_avail_proc = 0;
108size_t __kmp_sys_min_stksize = KMP_MIN_STKSIZE;
109int __kmp_sys_max_nth = KMP_MAX_NTH;
110int __kmp_max_nth = 0;
111int __kmp_threads_capacity = 0;
112int __kmp_dflt_team_nth = 0;
113int __kmp_dflt_team_nth_ub = 0;
114int __kmp_tp_capacity = 0;
115int __kmp_tp_cached = 0;
116int __kmp_dflt_nested = FALSE;
117#if OMP_30_ENABLED
118int __kmp_dflt_max_active_levels = KMP_MAX_ACTIVE_LEVELS_LIMIT; /* max_active_levels limit */
119#endif // OMP_30_ENABLED
120enum library_type __kmp_library = library_none;
121enum sched_type __kmp_sched = kmp_sch_default; /* scheduling method for runtime scheduling */
122enum sched_type __kmp_static = kmp_sch_static_greedy; /* default static scheduling method */
123enum sched_type __kmp_guided = kmp_sch_guided_iterative_chunked; /* default guided scheduling method */
124#if OMP_30_ENABLED
125enum sched_type __kmp_auto = kmp_sch_guided_analytical_chunked; /* default auto scheduling method */
126#endif // OMP_30_ENABLED
127int __kmp_dflt_blocktime = KMP_DEFAULT_BLOCKTIME;
128int __kmp_monitor_wakeups = KMP_MIN_MONITOR_WAKEUPS;
129int __kmp_bt_intervals = KMP_INTERVALS_FROM_BLOCKTIME( KMP_DEFAULT_BLOCKTIME, KMP_MIN_MONITOR_WAKEUPS );
130#ifdef KMP_ADJUST_BLOCKTIME
131int __kmp_zero_bt = FALSE;
132#endif /* KMP_ADJUST_BLOCKTIME */
133int __kmp_ht_capable = FALSE;
134int __kmp_ht_enabled = FALSE;
135int __kmp_ht_log_per_phy = 1;
136int __kmp_ncores = 0;
137int __kmp_chunk = 0;
138int __kmp_abort_delay = 0;
139#if KMP_OS_LINUX && defined(KMP_TDATA_GTID)
140int __kmp_gtid_mode = 3; /* use __declspec(thread) TLS to store gtid */
141int __kmp_adjust_gtid_mode = FALSE;
142#elif KMP_OS_WINDOWS
143int __kmp_gtid_mode = 2; /* use TLS functions to store gtid */
144int __kmp_adjust_gtid_mode = FALSE;
145#else
146int __kmp_gtid_mode = 0; /* select method to get gtid based on #threads */
147int __kmp_adjust_gtid_mode = TRUE;
148#endif /* KMP_OS_LINUX && defined(KMP_TDATA_GTID) */
149#ifdef KMP_TDATA_GTID
150#if KMP_OS_WINDOWS
151__declspec(thread) int __kmp_gtid = KMP_GTID_DNE;
152#else
153__thread int __kmp_gtid = KMP_GTID_DNE;
154#endif /* KMP_OS_WINDOWS - workaround because Intel(R) Many Integrated Core compiler 20110316 doesn't accept __declspec */
155#endif /* KMP_TDATA_GTID */
156int __kmp_tls_gtid_min = INT_MAX;
157int __kmp_foreign_tp = TRUE;
158#if KMP_ARCH_X86 || KMP_ARCH_X86_64
159int __kmp_inherit_fp_control = TRUE;
160kmp_int16 __kmp_init_x87_fpu_control_word = 0;
161kmp_uint32 __kmp_init_mxcsr = 0;
162#endif /* KMP_ARCH_X86 || KMP_ARCH_X86_64 */
163
164#ifdef USE_LOAD_BALANCE
165double __kmp_load_balance_interval = 1.0;
166#endif /* USE_LOAD_BALANCE */
167
168kmp_nested_nthreads_t __kmp_nested_nth = { NULL, 0, 0 };
169
170#if KMP_USE_ADAPTIVE_LOCKS
171
172kmp_adaptive_backoff_params_t __kmp_adaptive_backoff_params = { 1, 1024 }; // TODO: tune it!
173
174#if KMP_DEBUG_ADAPTIVE_LOCKS
175char * __kmp_speculative_statsfile = "-";
176#endif
177
178#endif // KMP_USE_ADAPTIVE_LOCKS
179
180#if OMP_40_ENABLED
181int __kmp_display_env = FALSE;
182int __kmp_display_env_verbose = FALSE;
Jim Cownie181b4bb2013-12-23 17:28:57 +0000183int __kmp_omp_cancellation = FALSE;
Jim Cownie5e8470a2013-09-27 10:38:44 +0000184#endif
185
186/* map OMP 3.0 schedule types with our internal schedule types */
187enum sched_type __kmp_sch_map[ kmp_sched_upper - kmp_sched_lower_ext + kmp_sched_upper_std - kmp_sched_lower - 2 ] = {
188 kmp_sch_static_chunked, // ==> kmp_sched_static = 1
189 kmp_sch_dynamic_chunked, // ==> kmp_sched_dynamic = 2
190 kmp_sch_guided_chunked, // ==> kmp_sched_guided = 3
191 kmp_sch_auto, // ==> kmp_sched_auto = 4
192 kmp_sch_trapezoidal // ==> kmp_sched_trapezoidal = 101
193 // will likely not used, introduced here just to debug the code
194 // of public intel extension schedules
195};
196
/* Linux-only clock selection; both are left to default (zero) initialization. */
#if KMP_OS_LINUX
enum clock_function_type __kmp_clock_function;
int __kmp_clock_function_param;
#endif /* KMP_OS_LINUX */

/* Affinity state, compiled for Linux and Windows builds only. */
#if KMP_OS_LINUX || KMP_OS_WINDOWS

# if KMP_OS_WINDOWS && KMP_ARCH_X86_64

int __kmp_num_proc_groups = 1;

/* Function pointers, all NULL at load time.
   NOTE(review): presumably resolved at run time to the Windows processor-group
   APIs of the same names -- confirm where they are assigned. */
kmp_GetActiveProcessorCount_t      __kmp_GetActiveProcessorCount      = NULL;
kmp_GetActiveProcessorGroupCount_t __kmp_GetActiveProcessorGroupCount = NULL;
kmp_GetThreadGroupAffinity_t       __kmp_GetThreadGroupAffinity       = NULL;
kmp_SetThreadGroupAffinity_t       __kmp_SetThreadGroupAffinity       = NULL;

# endif /* KMP_OS_WINDOWS && KMP_ARCH_X86_64 */

size_t                   __kmp_affin_mask_size       = 0;
enum affinity_type       __kmp_affinity_type         = affinity_default;
enum affinity_gran       __kmp_affinity_gran         = affinity_gran_default;
int                      __kmp_affinity_gran_levels  = -1;
int                      __kmp_affinity_dups         = TRUE;
enum affinity_top_method __kmp_affinity_top_method   = affinity_top_method_default;
int                      __kmp_affinity_compact      = 0;
int                      __kmp_affinity_offset       = 0;
int                      __kmp_affinity_verbose      = FALSE;
int                      __kmp_affinity_warnings     = TRUE;
int                      __kmp_affinity_respect_mask = affinity_respect_mask_default;
char *                   __kmp_affinity_proclist     = NULL;
kmp_affin_mask_t *       __kmp_affinity_masks        = NULL;
unsigned                 __kmp_affinity_num_masks    = 0;

char const * __kmp_cpuinfo_file = NULL;

#endif /* KMP_OS_LINUX || KMP_OS_WINDOWS */

/* OMP 4.0 binding state; starts out empty (NULL pointer, zero fields). */
#if OMP_40_ENABLED
kmp_nested_proc_bind_t __kmp_nested_proc_bind = { NULL, 0, 0 };
int __kmp_affinity_num_places = 0;
#endif

/* MIC-only placement settings, all zero at load time. */
#if KMP_MIC
unsigned int __kmp_place_num_cores            = 0;
unsigned int __kmp_place_num_threads_per_core = 0;
unsigned int __kmp_place_core_offset          = 0;
#endif

/* Tasking defaults; present only in OMP 3.0-enabled builds. */
#if OMP_30_ENABLED
kmp_tasking_mode_t __kmp_tasking_mode = tskm_task_teams;

/* This check ensures that the compiler is passing the correct data type
 * for the flags formal parameter of the function kmpc_omp_task_alloc().
 * If the type is not a 4-byte type, then give an error message about
 * a non-positive length array pointing here.  If that happens, the
 * kmp_tasking_flags_t structure must be redefined to have exactly 32 bits.
 */
KMP_BUILD_ASSERT( sizeof(kmp_tasking_flags_t) == 4 );

kmp_int32 __kmp_task_stealing_constraint = 1;   /* Constrain task stealing by default */

#endif /* OMP_30_ENABLED */

260#ifdef DEBUG_SUSPEND
261int __kmp_suspend_count = 0;
262#endif
263
264int __kmp_settings = FALSE;
265int __kmp_duplicate_library_ok = 0;
266#if USE_ITT_BUILD
267int __kmp_forkjoin_frames = 1;
268int __kmp_forkjoin_frames_mode = 0;
Jim Cownie5e8470a2013-09-27 10:38:44 +0000269#endif
270PACKED_REDUCTION_METHOD_T __kmp_force_reduction_method = reduction_method_not_defined;
271int __kmp_determ_red = FALSE;
272
/* Debug-level knobs, present only in KMP_DEBUG builds; all start at zero. */
#ifdef KMP_DEBUG
int kmp_a_debug = 0;
int kmp_b_debug = 0;
int kmp_c_debug = 0;
int kmp_d_debug = 0;
int kmp_e_debug = 0;
int kmp_f_debug = 0;
int kmp_diag    = 0;
#endif

283/* For debug information logging using rotating buffer */
284int __kmp_debug_buf = FALSE; /* TRUE means use buffer, FALSE means print to stderr */
285int __kmp_debug_buf_lines = KMP_DEBUG_BUF_LINES_INIT; /* Lines of debug stored in buffer */
286int __kmp_debug_buf_chars = KMP_DEBUG_BUF_CHARS_INIT; /* Characters allowed per line in buffer */
287int __kmp_debug_buf_atomic = FALSE; /* TRUE means use atomic update of buffer entry pointer */
288
289char *__kmp_debug_buffer = NULL; /* Debug buffer itself */
290int __kmp_debug_count = 0; /* Counter for number of lines printed in buffer so far */
291int __kmp_debug_buf_warn_chars = 0; /* Keep track of char increase recommended in warnings */
292/* end rotating debug buffer */
293
294#ifdef KMP_DEBUG
295int __kmp_par_range; /* +1 => only go par for constructs in range */
296 /* -1 => only go par for constructs outside range */
297char __kmp_par_range_routine[KMP_PAR_RANGE_ROUTINE_LEN] = { '\0' };
298char __kmp_par_range_filename[KMP_PAR_RANGE_FILENAME_LEN] = { '\0' };
299int __kmp_par_range_lb = 0;
300int __kmp_par_range_ub = INT_MAX;
301#endif /* KMP_DEBUG */
302
303/* For printing out dynamic storage map for threads and teams */
304int __kmp_storage_map = FALSE; /* True means print storage map for threads and teams */
305int __kmp_storage_map_verbose = FALSE; /* True means storage map includes placement info */
306int __kmp_storage_map_verbose_specified = FALSE;
307/* Initialize the library data structures when we fork a child process, defaults to TRUE */
308int __kmp_need_register_atfork = TRUE; /* At initialization, call pthread_atfork to install fork handler */
309int __kmp_need_register_atfork_specified = TRUE;
310
311
312int __kmp_env_chunk = FALSE; /* KMP_CHUNK specified? */
313int __kmp_env_stksize = FALSE; /* KMP_STACKSIZE specified? */
314int __kmp_env_omp_stksize = FALSE; /* OMP_STACKSIZE specified? */
315int __kmp_env_all_threads = FALSE;/* KMP_ALL_THREADS or KMP_MAX_THREADS specified? */
316int __kmp_env_omp_all_threads = FALSE;/* OMP_THREAD_LIMIT specified? */
317int __kmp_env_blocktime = FALSE; /* KMP_BLOCKTIME specified? */
318int __kmp_env_checks = FALSE; /* KMP_CHECKS specified? */
319int __kmp_env_consistency_check = FALSE; /* KMP_CONSISTENCY_CHECK specified? */
320
321kmp_uint32 __kmp_yield_init = KMP_INIT_WAIT;
322kmp_uint32 __kmp_yield_next = KMP_NEXT_WAIT;
323kmp_uint32 __kmp_yielding_on = 1;
324kmp_uint32 __kmp_yield_cycle = 1; /* Yield-cycle is on by default */
325kmp_int32 __kmp_yield_on_count = 10; /* By default, yielding is on for 10 monitor periods. */
326kmp_int32 __kmp_yield_off_count = 1; /* By default, yielding is off for 1 monitor periods. */
327/* ----------------------------------------------------- */
328
329
330/* ------------------------------------------------------ */
331/* STATE mostly syncronized with global lock */
332/* data written to rarely by masters, read often by workers */
333/*
334 * SHALL WE EDIT THE COMMENT BELOW IN SOME WAY?
335 * TODO: None of this global padding stuff works consistently because
336 * the order of declaration is not necessarily correlated to storage order.
337 * To fix this, all the important globals must be put in a big structure
338 * instead.
339 */
340KMP_ALIGN_CACHE
341 kmp_info_t **__kmp_threads = NULL;
342 kmp_root_t **__kmp_root = NULL;
343
344/* data read/written to often by masters */
345KMP_ALIGN_CACHE
346volatile int __kmp_nth = 0;
347volatile int __kmp_all_nth = 0;
348int __kmp_thread_pool_nth = 0;
349volatile kmp_info_t *__kmp_thread_pool = NULL;
350volatile kmp_team_t *__kmp_team_pool = NULL;
351
352KMP_ALIGN_CACHE
353volatile int __kmp_thread_pool_active_nth = 0;
354
355/* -------------------------------------------------
356 * GLOBAL/ROOT STATE */
357KMP_ALIGN_CACHE
358kmp_global_t __kmp_global = {{ 0 }};
359
360/* ----------------------------------------------- */
Alp Toker8f2d3f02014-02-24 10:40:15 +0000361/* GLOBAL SYNCHRONIZATION LOCKS */
Jim Cownie5e8470a2013-09-27 10:38:44 +0000362/* TODO verify the need for these locks and if they need to be global */
363KMP_ALIGN_CACHE
364
365kmp_bootstrap_lock_t __kmp_initz_lock = KMP_BOOTSTRAP_LOCK_INITIALIZER( __kmp_initz_lock ); /* Control initializations */
366kmp_bootstrap_lock_t __kmp_forkjoin_lock; /* control fork/join access */
367kmp_bootstrap_lock_t __kmp_exit_lock; /* exit() is not always thread-safe */
368kmp_bootstrap_lock_t __kmp_monitor_lock; /* control monitor thread creation */
369kmp_bootstrap_lock_t __kmp_tp_cached_lock; /* used for the hack to allow threadprivate cache and __kmp_threads expansion to co-exist */
370
371KMP_ALIGN(128)
372kmp_lock_t __kmp_global_lock; /* Control OS/global access */
373KMP_ALIGN(128)
374kmp_queuing_lock_t __kmp_dispatch_lock; /* Control dispatch access */
375KMP_ALIGN(128)
376kmp_lock_t __kmp_debug_lock; /* Control I/O access for KMP_DEBUG */
377
378/* ----------------------------------------------- */
379
#if KMP_HANDLE_SIGNALS
    /*
        Signal handling is disabled by default, because it confuses users: In case of sigsegv
        (or other trouble) in user code signal handler catches the signal, which then "appears" in
        the monitor thread (when the monitor executes raise() function). Users see signal in the
        monitor thread and blame OpenMP RTL.

        Grant said signal handling required on some older OSes (Irix?) supported by KAI, because
        bad applications hung but not aborted. Currently it is not a problem for Linux* OS, OS X* and
        Windows* OS.

        Grant: Found new hangs for EL4, EL5, and a Fedora Core machine.  So I'm putting
        the default back for now to see if that fixes hangs on those machines.

        2010-04013 Lev: It was a bug in Fortran RTL. Fortran RTL prints a kind of stack backtrace
        when program is aborting, but the code is not signal-safe. When multiple signals raised at
        the same time (which occurs in dynamic negative tests because all the worker threads detects
        the same error), Fortran RTL may hang. The bug finally fixed in Fortran RTL library provided
        by Steve R., and will be available soon.
    */
    /* Net effect of the history above: the flag defaults to FALSE (handling off). */
    int __kmp_handle_signals = FALSE;
#endif

/* ----------------------------------------------- */
/* Extra key, defined only in BUILD_TV builds and starting at 0.
   NOTE(review): its purpose is not visible in this file. */
#ifdef BUILD_TV
kmp_key_t __kmp_tv_key = 0;
#endif

/* ------------------------------------------------------------------------ */
/* ------------------------------------------------------------------------ */

#ifdef DEBUG_SUSPEND
/*
 * Return the current value of __kmp_suspend_count and reset the counter to
 * zero, so each call reports what accumulated since the previous call.
 * The read and the reset are two separate plain accesses (no locking here).
 */
int
get_suspend_count_( void ) {
    int const snapshot = __kmp_suspend_count;
    __kmp_suspend_count = 0;
    return snapshot;
}

/*
 * Overwrite __kmp_suspend_count with the integer that `value` points to.
 * `value` is dereferenced unconditionally, so it must not be NULL.
 */
void
set_suspend_count_( int * value ) {
    __kmp_suspend_count = *value;
}
#endif /* DEBUG_SUSPEND */

// Symbols for MS mutual detection.
// Each is an ordinary external int set to 1; the Microsoft-named symbol is
// emitted only for Windows builds whose KMP_VERSION_MAJOR is above 4.
int _You_must_link_with_exactly_one_OpenMP_library = 1;
int _You_must_link_with_Intel_OpenMP_library       = 1;
#if KMP_OS_WINDOWS && ( KMP_VERSION_MAJOR > 4 )
    int _You_must_link_with_Microsoft_OpenMP_library = 1;
#endif

// end of file //