blob: a7b4eb12757ef4fa3bf14a58c2c57677b89f0973 [file] [log] [blame]
Jim Cownie5e8470a2013-09-27 10:38:44 +00001/*
2 * z_Linux_util.c -- platform specific routines.
Jim Cownie5e8470a2013-09-27 10:38:44 +00003 */
4
5
6//===----------------------------------------------------------------------===//
7//
8// The LLVM Compiler Infrastructure
9//
10// This file is dual licensed under the MIT and the University of Illinois Open
11// Source Licenses. See LICENSE.txt for details.
12//
13//===----------------------------------------------------------------------===//
14
15
16#include "kmp.h"
17#include "kmp_wrapper_getpid.h"
18#include "kmp_itt.h"
19#include "kmp_str.h"
20#include "kmp_i18n.h"
21#include "kmp_io.h"
Jim Cownie4cc4bb42014-10-07 16:25:50 +000022#include "kmp_stats.h"
23#include "kmp_wait_release.h"
Jim Cownie5e8470a2013-09-27 10:38:44 +000024
Alp Toker763b9392014-02-28 09:42:41 +000025#if !KMP_OS_FREEBSD
26# include <alloca.h>
27#endif
Jim Cownie5e8470a2013-09-27 10:38:44 +000028#include <unistd.h>
29#include <math.h> // HUGE_VAL.
30#include <sys/time.h>
31#include <sys/times.h>
32#include <sys/resource.h>
33#include <sys/syscall.h>
34
Jim Cownie3051f972014-08-07 10:12:54 +000035#if KMP_OS_LINUX && !KMP_OS_CNK
Jim Cownie5e8470a2013-09-27 10:38:44 +000036# include <sys/sysinfo.h>
Andrey Churbanovcbda8682015-01-13 14:43:35 +000037# if KMP_OS_LINUX && (KMP_ARCH_X86 || KMP_ARCH_X86_64 || KMP_ARCH_ARM || KMP_ARCH_AARCH64)
Jim Cownie5e8470a2013-09-27 10:38:44 +000038// We should really include <futex.h>, but that causes compatibility problems on different
39// Linux* OS distributions that either require that you include (or break when you try to include)
40// <pci/types.h>.
41// Since all we need is the two macros below (which are part of the kernel ABI, so can't change)
42// we just define the constants here and don't include <futex.h>
43# ifndef FUTEX_WAIT
44# define FUTEX_WAIT 0
45# endif
46# ifndef FUTEX_WAKE
47# define FUTEX_WAKE 1
48# endif
49# endif
50#elif KMP_OS_DARWIN
51# include <sys/sysctl.h>
52# include <mach/mach.h>
Alp Toker763b9392014-02-28 09:42:41 +000053#elif KMP_OS_FREEBSD
54# include <sys/sysctl.h>
55# include <pthread_np.h>
Jim Cownie5e8470a2013-09-27 10:38:44 +000056#endif
57
58
59#include <dirent.h>
60#include <ctype.h>
61#include <fcntl.h>
62
Jim Cownie181b4bb2013-12-23 17:28:57 +000063// For non-x86 architecture
Andrey Churbanovcbda8682015-01-13 14:43:35 +000064#if KMP_COMPILER_GCC && !(KMP_ARCH_X86 || KMP_ARCH_X86_64 || KMP_ARCH_PPC64 || KMP_ARCH_AARCH64)
Jim Cownie181b4bb2013-12-23 17:28:57 +000065# include <stdbool.h>
66# include <ffi.h>
67#endif
68
Jim Cownie5e8470a2013-09-27 10:38:44 +000069/* ------------------------------------------------------------------------ */
70/* ------------------------------------------------------------------------ */
71
72struct kmp_sys_timer {
73 struct timespec start;
74};
75
76// Convert timespec to nanoseconds.
77#define TS2NS(timespec) (((timespec).tv_sec * 1e9) + (timespec).tv_nsec)
78
79static struct kmp_sys_timer __kmp_sys_timer_data;
80
81#if KMP_HANDLE_SIGNALS
82 typedef void (* sig_func_t )( int );
83 STATIC_EFI2_WORKAROUND struct sigaction __kmp_sighldrs[ NSIG ];
84 static sigset_t __kmp_sigset;
85#endif
86
87static int __kmp_init_runtime = FALSE;
88
89static int __kmp_fork_count = 0;
90
91static pthread_condattr_t __kmp_suspend_cond_attr;
92static pthread_mutexattr_t __kmp_suspend_mutex_attr;
93
94static kmp_cond_align_t __kmp_wait_cv;
95static kmp_mutex_align_t __kmp_wait_mx;
96
97/* ------------------------------------------------------------------------ */
98/* ------------------------------------------------------------------------ */
99
100#ifdef DEBUG_SUSPEND
101static void
102__kmp_print_cond( char *buffer, kmp_cond_align_t *cond )
103{
104 sprintf( buffer, "(cond (lock (%ld, %d)), (descr (%p)))",
105 cond->c_cond.__c_lock.__status, cond->c_cond.__c_lock.__spinlock,
106 cond->c_cond.__c_waiting );
107}
108#endif
109
110/* ------------------------------------------------------------------------ */
111/* ------------------------------------------------------------------------ */
112
Jim Cownie3051f972014-08-07 10:12:54 +0000113#if ( KMP_OS_LINUX && KMP_AFFINITY_SUPPORTED)
Jim Cownie5e8470a2013-09-27 10:38:44 +0000114
115/*
116 * Affinity support
117 */
118
119/*
120 * On some of the older OS's that we build on, these constants aren't present
121 * in <asm/unistd.h> #included from <sys.syscall.h>. They must be the same on
122 * all systems of the same arch where they are defined, and they cannot change.
123 * stone forever.
124 */
125
Jim Cownie181b4bb2013-12-23 17:28:57 +0000126# if KMP_ARCH_X86 || KMP_ARCH_ARM
Jim Cownie5e8470a2013-09-27 10:38:44 +0000127# ifndef __NR_sched_setaffinity
128# define __NR_sched_setaffinity 241
129# elif __NR_sched_setaffinity != 241
130# error Wrong code for setaffinity system call.
131# endif /* __NR_sched_setaffinity */
132# ifndef __NR_sched_getaffinity
133# define __NR_sched_getaffinity 242
134# elif __NR_sched_getaffinity != 242
135# error Wrong code for getaffinity system call.
136# endif /* __NR_sched_getaffinity */
137
Andrey Churbanovcbda8682015-01-13 14:43:35 +0000138# elif KMP_ARCH_AARCH64
139# ifndef __NR_sched_setaffinity
140# define __NR_sched_setaffinity 122
141# elif __NR_sched_setaffinity != 122
142# error Wrong code for setaffinity system call.
143# endif /* __NR_sched_setaffinity */
144# ifndef __NR_sched_getaffinity
145# define __NR_sched_getaffinity 123
146# elif __NR_sched_getaffinity != 123
147# error Wrong code for getaffinity system call.
148# endif /* __NR_sched_getaffinity */
149
Jim Cownie5e8470a2013-09-27 10:38:44 +0000150# elif KMP_ARCH_X86_64
151# ifndef __NR_sched_setaffinity
152# define __NR_sched_setaffinity 203
153# elif __NR_sched_setaffinity != 203
154# error Wrong code for setaffinity system call.
155# endif /* __NR_sched_setaffinity */
156# ifndef __NR_sched_getaffinity
157# define __NR_sched_getaffinity 204
158# elif __NR_sched_getaffinity != 204
159# error Wrong code for getaffinity system call.
160# endif /* __NR_sched_getaffinity */
161
Jim Cownie3051f972014-08-07 10:12:54 +0000162# elif KMP_ARCH_PPC64
163# ifndef __NR_sched_setaffinity
164# define __NR_sched_setaffinity 222
165# elif __NR_sched_setaffinity != 222
166# error Wrong code for setaffinity system call.
167# endif /* __NR_sched_setaffinity */
168# ifndef __NR_sched_getaffinity
169# define __NR_sched_getaffinity 223
170# elif __NR_sched_getaffinity != 223
171# error Wrong code for getaffinity system call.
172# endif /* __NR_sched_getaffinity */
173
174
Jim Cownie5e8470a2013-09-27 10:38:44 +0000175# else
176# error Unknown or unsupported architecture
177
178# endif /* KMP_ARCH_* */
179
180int
181__kmp_set_system_affinity( kmp_affin_mask_t const *mask, int abort_on_error )
182{
183 KMP_ASSERT2(KMP_AFFINITY_CAPABLE(),
184 "Illegal set affinity operation when not capable");
185
186 int retval = syscall( __NR_sched_setaffinity, 0, __kmp_affin_mask_size, mask );
187 if (retval >= 0) {
188 return 0;
189 }
190 int error = errno;
191 if (abort_on_error) {
192 __kmp_msg(
193 kmp_ms_fatal,
194 KMP_MSG( FatalSysError ),
195 KMP_ERR( error ),
196 __kmp_msg_null
197 );
198 }
199 return error;
200}
201
202int
203__kmp_get_system_affinity( kmp_affin_mask_t *mask, int abort_on_error )
204{
205 KMP_ASSERT2(KMP_AFFINITY_CAPABLE(),
206 "Illegal get affinity operation when not capable");
207
208 int retval = syscall( __NR_sched_getaffinity, 0, __kmp_affin_mask_size, mask );
209 if (retval >= 0) {
210 return 0;
211 }
212 int error = errno;
213 if (abort_on_error) {
214 __kmp_msg(
215 kmp_ms_fatal,
216 KMP_MSG( FatalSysError ),
217 KMP_ERR( error ),
218 __kmp_msg_null
219 );
220 }
221 return error;
222}
223
224void
225__kmp_affinity_bind_thread( int which )
226{
227 KMP_ASSERT2(KMP_AFFINITY_CAPABLE(),
228 "Illegal set affinity operation when not capable");
229
230 kmp_affin_mask_t *mask = (kmp_affin_mask_t *)alloca(__kmp_affin_mask_size);
231 KMP_CPU_ZERO(mask);
232 KMP_CPU_SET(which, mask);
233 __kmp_set_system_affinity(mask, TRUE);
234}
235
236/*
237 * Determine if we can access affinity functionality on this version of
238 * Linux* OS by checking __NR_sched_{get,set}affinity system calls, and set
239 * __kmp_affin_mask_size to the appropriate value (0 means not capable).
240 */
241void
242__kmp_affinity_determine_capable(const char *env_var)
243{
244 //
245 // Check and see if the OS supports thread affinity.
246 //
247
248# define KMP_CPU_SET_SIZE_LIMIT (1024*1024)
249
250 int gCode;
251 int sCode;
252 kmp_affin_mask_t *buf;
253 buf = ( kmp_affin_mask_t * ) KMP_INTERNAL_MALLOC( KMP_CPU_SET_SIZE_LIMIT );
254
255 // If Linux* OS:
256 // If the syscall fails or returns a suggestion for the size,
257 // then we don't have to search for an appropriate size.
258 gCode = syscall( __NR_sched_getaffinity, 0, KMP_CPU_SET_SIZE_LIMIT, buf );
259 KA_TRACE(30, ( "__kmp_affinity_determine_capable: "
Alp Toker8f2d3f02014-02-24 10:40:15 +0000260 "initial getaffinity call returned %d errno = %d\n",
Jim Cownie5e8470a2013-09-27 10:38:44 +0000261 gCode, errno));
262
263 //if ((gCode < 0) && (errno == ENOSYS))
264 if (gCode < 0) {
265 //
266 // System call not supported
267 //
268 if (__kmp_affinity_verbose || (__kmp_affinity_warnings
269 && (__kmp_affinity_type != affinity_none)
270 && (__kmp_affinity_type != affinity_default)
271 && (__kmp_affinity_type != affinity_disabled))) {
272 int error = errno;
273 __kmp_msg(
274 kmp_ms_warning,
275 KMP_MSG( GetAffSysCallNotSupported, env_var ),
276 KMP_ERR( error ),
277 __kmp_msg_null
278 );
279 }
280 __kmp_affin_mask_size = 0; // should already be 0
281 KMP_INTERNAL_FREE(buf);
282 return;
283 }
284 if (gCode > 0) { // Linux* OS only
285 // The optimal situation: the OS returns the size of the buffer
286 // it expects.
287 //
288 // A verification of correct behavior is that Isetaffinity on a NULL
289 // buffer with the same size fails with errno set to EFAULT.
290 sCode = syscall( __NR_sched_setaffinity, 0, gCode, NULL );
291 KA_TRACE(30, ( "__kmp_affinity_determine_capable: "
292 "setaffinity for mask size %d returned %d errno = %d\n",
293 gCode, sCode, errno));
294 if (sCode < 0) {
295 if (errno == ENOSYS) {
296 if (__kmp_affinity_verbose || (__kmp_affinity_warnings
297 && (__kmp_affinity_type != affinity_none)
298 && (__kmp_affinity_type != affinity_default)
299 && (__kmp_affinity_type != affinity_disabled))) {
300 int error = errno;
301 __kmp_msg(
302 kmp_ms_warning,
303 KMP_MSG( SetAffSysCallNotSupported, env_var ),
304 KMP_ERR( error ),
305 __kmp_msg_null
306 );
307 }
308 __kmp_affin_mask_size = 0; // should already be 0
309 KMP_INTERNAL_FREE(buf);
310 }
311 if (errno == EFAULT) {
312 __kmp_affin_mask_size = gCode;
313 KA_TRACE(10, ( "__kmp_affinity_determine_capable: "
314 "affinity supported (mask size %d)\n",
315 (int)__kmp_affin_mask_size));
316 KMP_INTERNAL_FREE(buf);
317 return;
318 }
319 }
320 }
321
322 //
323 // Call the getaffinity system call repeatedly with increasing set sizes
324 // until we succeed, or reach an upper bound on the search.
325 //
326 KA_TRACE(30, ( "__kmp_affinity_determine_capable: "
327 "searching for proper set size\n"));
328 int size;
329 for (size = 1; size <= KMP_CPU_SET_SIZE_LIMIT; size *= 2) {
330 gCode = syscall( __NR_sched_getaffinity, 0, size, buf );
331 KA_TRACE(30, ( "__kmp_affinity_determine_capable: "
332 "getaffinity for mask size %d returned %d errno = %d\n", size,
333 gCode, errno));
334
335 if (gCode < 0) {
336 if ( errno == ENOSYS )
337 {
338 //
339 // We shouldn't get here
340 //
341 KA_TRACE(30, ( "__kmp_affinity_determine_capable: "
342 "inconsistent OS call behavior: errno == ENOSYS for mask size %d\n",
343 size));
344 if (__kmp_affinity_verbose || (__kmp_affinity_warnings
345 && (__kmp_affinity_type != affinity_none)
346 && (__kmp_affinity_type != affinity_default)
347 && (__kmp_affinity_type != affinity_disabled))) {
348 int error = errno;
349 __kmp_msg(
350 kmp_ms_warning,
351 KMP_MSG( GetAffSysCallNotSupported, env_var ),
352 KMP_ERR( error ),
353 __kmp_msg_null
354 );
355 }
356 __kmp_affin_mask_size = 0; // should already be 0
357 KMP_INTERNAL_FREE(buf);
358 return;
359 }
360 continue;
361 }
362
363 sCode = syscall( __NR_sched_setaffinity, 0, gCode, NULL );
364 KA_TRACE(30, ( "__kmp_affinity_determine_capable: "
365 "setaffinity for mask size %d returned %d errno = %d\n",
366 gCode, sCode, errno));
367 if (sCode < 0) {
368 if (errno == ENOSYS) { // Linux* OS only
369 //
370 // We shouldn't get here
371 //
372 KA_TRACE(30, ( "__kmp_affinity_determine_capable: "
373 "inconsistent OS call behavior: errno == ENOSYS for mask size %d\n",
374 size));
375 if (__kmp_affinity_verbose || (__kmp_affinity_warnings
376 && (__kmp_affinity_type != affinity_none)
377 && (__kmp_affinity_type != affinity_default)
378 && (__kmp_affinity_type != affinity_disabled))) {
379 int error = errno;
380 __kmp_msg(
381 kmp_ms_warning,
382 KMP_MSG( SetAffSysCallNotSupported, env_var ),
383 KMP_ERR( error ),
384 __kmp_msg_null
385 );
386 }
387 __kmp_affin_mask_size = 0; // should already be 0
388 KMP_INTERNAL_FREE(buf);
389 return;
390 }
391 if (errno == EFAULT) {
392 __kmp_affin_mask_size = gCode;
393 KA_TRACE(10, ( "__kmp_affinity_determine_capable: "
394 "affinity supported (mask size %d)\n",
395 (int)__kmp_affin_mask_size));
396 KMP_INTERNAL_FREE(buf);
397 return;
398 }
399 }
400 }
401 //int error = errno; // save uncaught error code
402 KMP_INTERNAL_FREE(buf);
403 // errno = error; // restore uncaught error code, will be printed at the next KMP_WARNING below
404
405 //
406 // Affinity is not supported
407 //
408 __kmp_affin_mask_size = 0;
409 KA_TRACE(10, ( "__kmp_affinity_determine_capable: "
410 "cannot determine mask size - affinity not supported\n"));
411 if (__kmp_affinity_verbose || (__kmp_affinity_warnings
412 && (__kmp_affinity_type != affinity_none)
413 && (__kmp_affinity_type != affinity_default)
414 && (__kmp_affinity_type != affinity_disabled))) {
415 KMP_WARNING( AffCantGetMaskSize, env_var );
416 }
417}
418
419
420/*
421 * Change thread to the affinity mask pointed to by affin_mask argument
422 * and return a pointer to the old value in the old_mask argument, if argument
423 * is non-NULL.
424 */
425
426void
427__kmp_change_thread_affinity_mask( int gtid, kmp_affin_mask_t *new_mask,
428 kmp_affin_mask_t *old_mask )
429{
430 KMP_DEBUG_ASSERT( gtid == __kmp_get_gtid() );
431 if ( KMP_AFFINITY_CAPABLE() ) {
432 int status;
433 kmp_info_t *th = __kmp_threads[ gtid ];
434
435 KMP_DEBUG_ASSERT( new_mask != NULL );
436
437 if ( old_mask != NULL ) {
438 status = __kmp_get_system_affinity( old_mask, TRUE );
439 int error = errno;
440 if ( status != 0 ) {
441 __kmp_msg(
442 kmp_ms_fatal,
443 KMP_MSG( ChangeThreadAffMaskError ),
444 KMP_ERR( error ),
445 __kmp_msg_null
446 );
447 }
448 }
449
450 __kmp_set_system_affinity( new_mask, TRUE );
451
452 if (__kmp_affinity_verbose) {
453 char old_buf[KMP_AFFIN_MASK_PRINT_LEN];
454 char new_buf[KMP_AFFIN_MASK_PRINT_LEN];
455 __kmp_affinity_print_mask(old_buf, KMP_AFFIN_MASK_PRINT_LEN, old_mask);
456 __kmp_affinity_print_mask(new_buf, KMP_AFFIN_MASK_PRINT_LEN, new_mask);
457 KMP_INFORM( ChangeAffMask, "KMP_AFFINITY (Bind)", gtid, old_buf, new_buf );
458
459 }
460
461 /* Make sure old value is correct in thread data structures */
462 KMP_DEBUG_ASSERT( old_mask != NULL && (memcmp(old_mask,
463 th->th.th_affin_mask, __kmp_affin_mask_size) == 0) );
464 KMP_CPU_COPY( th->th.th_affin_mask, new_mask );
465 }
466}
467
Alp Toker98758b02014-03-02 04:12:06 +0000468#endif // KMP_OS_LINUX && KMP_AFFINITY_SUPPORTED
Jim Cownie5e8470a2013-09-27 10:38:44 +0000469
470/* ------------------------------------------------------------------------ */
471/* ------------------------------------------------------------------------ */
472
Andrey Churbanovcbda8682015-01-13 14:43:35 +0000473#if KMP_OS_LINUX && (KMP_ARCH_X86 || KMP_ARCH_X86_64 || KMP_ARCH_ARM || KMP_ARCH_AARCH64) && !KMP_OS_CNK
Jim Cownie5e8470a2013-09-27 10:38:44 +0000474
475int
476__kmp_futex_determine_capable()
477{
478 int loc = 0;
479 int rc = syscall( __NR_futex, &loc, FUTEX_WAKE, 1, NULL, NULL, 0 );
480 int retval = ( rc == 0 ) || ( errno != ENOSYS );
481
482 KA_TRACE(10, ( "__kmp_futex_determine_capable: rc = %d errno = %d\n", rc,
483 errno ) );
484 KA_TRACE(10, ( "__kmp_futex_determine_capable: futex syscall%s supported\n",
485 retval ? "" : " not" ) );
486
487 return retval;
488}
489
Jim Cownie3051f972014-08-07 10:12:54 +0000490#endif // KMP_OS_LINUX && (KMP_ARCH_X86 || KMP_ARCH_X86_64 || KMP_ARCH_ARM) && !KMP_OS_CNK
Jim Cownie5e8470a2013-09-27 10:38:44 +0000491
492/* ------------------------------------------------------------------------ */
493/* ------------------------------------------------------------------------ */
494
495#if (KMP_ARCH_X86 || KMP_ARCH_X86_64) && (! KMP_ASM_INTRINS)
496/*
497 * Only 32-bit "add-exchange" instruction on IA-32 architecture causes us to
498 * use compare_and_store for these routines
499 */
500
501kmp_int32
502__kmp_test_then_or32( volatile kmp_int32 *p, kmp_int32 d )
503{
504 kmp_int32 old_value, new_value;
505
506 old_value = TCR_4( *p );
507 new_value = old_value | d;
508
Jim Cownie3051f972014-08-07 10:12:54 +0000509 while ( ! KMP_COMPARE_AND_STORE_REL32 ( p, old_value, new_value ) )
Jim Cownie5e8470a2013-09-27 10:38:44 +0000510 {
511 KMP_CPU_PAUSE();
512 old_value = TCR_4( *p );
513 new_value = old_value | d;
514 }
515 return old_value;
516}
517
518kmp_int32
519__kmp_test_then_and32( volatile kmp_int32 *p, kmp_int32 d )
520{
521 kmp_int32 old_value, new_value;
522
523 old_value = TCR_4( *p );
524 new_value = old_value & d;
525
Jim Cownie3051f972014-08-07 10:12:54 +0000526 while ( ! KMP_COMPARE_AND_STORE_REL32 ( p, old_value, new_value ) )
Jim Cownie5e8470a2013-09-27 10:38:44 +0000527 {
528 KMP_CPU_PAUSE();
529 old_value = TCR_4( *p );
530 new_value = old_value & d;
531 }
532 return old_value;
533}
534
Andrey Churbanovcbda8682015-01-13 14:43:35 +0000535# if KMP_ARCH_X86 || KMP_ARCH_PPC64 || KMP_ARCH_AARCH64
Jim Cownie5e8470a2013-09-27 10:38:44 +0000536kmp_int64
537__kmp_test_then_add64( volatile kmp_int64 *p, kmp_int64 d )
538{
539 kmp_int64 old_value, new_value;
540
541 old_value = TCR_8( *p );
542 new_value = old_value + d;
543
Jim Cownie3051f972014-08-07 10:12:54 +0000544 while ( ! KMP_COMPARE_AND_STORE_REL64 ( p, old_value, new_value ) )
Jim Cownie5e8470a2013-09-27 10:38:44 +0000545 {
546 KMP_CPU_PAUSE();
547 old_value = TCR_8( *p );
548 new_value = old_value + d;
549 }
550 return old_value;
551}
552# endif /* KMP_ARCH_X86 */
553
554kmp_int64
555__kmp_test_then_or64( volatile kmp_int64 *p, kmp_int64 d )
556{
557 kmp_int64 old_value, new_value;
558
559 old_value = TCR_8( *p );
560 new_value = old_value | d;
Jim Cownie3051f972014-08-07 10:12:54 +0000561 while ( ! KMP_COMPARE_AND_STORE_REL64 ( p, old_value, new_value ) )
Jim Cownie5e8470a2013-09-27 10:38:44 +0000562 {
563 KMP_CPU_PAUSE();
564 old_value = TCR_8( *p );
565 new_value = old_value | d;
566 }
567 return old_value;
568}
569
570kmp_int64
571__kmp_test_then_and64( volatile kmp_int64 *p, kmp_int64 d )
572{
573 kmp_int64 old_value, new_value;
574
575 old_value = TCR_8( *p );
576 new_value = old_value & d;
Jim Cownie3051f972014-08-07 10:12:54 +0000577 while ( ! KMP_COMPARE_AND_STORE_REL64 ( p, old_value, new_value ) )
Jim Cownie5e8470a2013-09-27 10:38:44 +0000578 {
579 KMP_CPU_PAUSE();
580 old_value = TCR_8( *p );
581 new_value = old_value & d;
582 }
583 return old_value;
584}
585
586#endif /* (KMP_ARCH_X86 || KMP_ARCH_X86_64) && (! KMP_ASM_INTRINS) */
587
588void
589__kmp_terminate_thread( int gtid )
590{
591 int status;
592 kmp_info_t *th = __kmp_threads[ gtid ];
593
594 if ( !th ) return;
595
596 #ifdef KMP_CANCEL_THREADS
597 KA_TRACE( 10, ("__kmp_terminate_thread: kill (%d)\n", gtid ) );
598 status = pthread_cancel( th->th.th_info.ds.ds_thread );
599 if ( status != 0 && status != ESRCH ) {
600 __kmp_msg(
601 kmp_ms_fatal,
602 KMP_MSG( CantTerminateWorkerThread ),
603 KMP_ERR( status ),
604 __kmp_msg_null
605 );
606 }; // if
607 #endif
608 __kmp_yield( TRUE );
609} //
610
611/* ------------------------------------------------------------------------ */
612/* ------------------------------------------------------------------------ */
613
614/* ------------------------------------------------------------------------ */
615/* ------------------------------------------------------------------------ */
616
617/*
618 * Set thread stack info according to values returned by
619 * pthread_getattr_np().
620 * If values are unreasonable, assume call failed and use
621 * incremental stack refinement method instead.
622 * Returns TRUE if the stack parameters could be determined exactly,
623 * FALSE if incremental refinement is necessary.
624 */
625static kmp_int32
626__kmp_set_stack_info( int gtid, kmp_info_t *th )
627{
628 int stack_data;
Alp Toker763b9392014-02-28 09:42:41 +0000629#if KMP_OS_LINUX || KMP_OS_FREEBSD
Jim Cownie5e8470a2013-09-27 10:38:44 +0000630 /* Linux* OS only -- no pthread_getattr_np support on OS X* */
631 pthread_attr_t attr;
632 int status;
633 size_t size = 0;
634 void * addr = 0;
635
636 /* Always do incremental stack refinement for ubermaster threads since the initial
637 thread stack range can be reduced by sibling thread creation so pthread_attr_getstack
638 may cause thread gtid aliasing */
639 if ( ! KMP_UBER_GTID(gtid) ) {
640
641 /* Fetch the real thread attributes */
642 status = pthread_attr_init( &attr );
643 KMP_CHECK_SYSFAIL( "pthread_attr_init", status );
Alp Toker763b9392014-02-28 09:42:41 +0000644#if KMP_OS_FREEBSD
645 status = pthread_attr_get_np( pthread_self(), &attr );
646 KMP_CHECK_SYSFAIL( "pthread_attr_get_np", status );
647#else
Jim Cownie5e8470a2013-09-27 10:38:44 +0000648 status = pthread_getattr_np( pthread_self(), &attr );
649 KMP_CHECK_SYSFAIL( "pthread_getattr_np", status );
Alp Toker763b9392014-02-28 09:42:41 +0000650#endif
Jim Cownie5e8470a2013-09-27 10:38:44 +0000651 status = pthread_attr_getstack( &attr, &addr, &size );
652 KMP_CHECK_SYSFAIL( "pthread_attr_getstack", status );
653 KA_TRACE( 60, ( "__kmp_set_stack_info: T#%d pthread_attr_getstack returned size: %lu, "
654 "low addr: %p\n",
655 gtid, size, addr ));
656
657 status = pthread_attr_destroy( &attr );
658 KMP_CHECK_SYSFAIL( "pthread_attr_destroy", status );
659 }
660
661 if ( size != 0 && addr != 0 ) { /* was stack parameter determination successful? */
662 /* Store the correct base and size */
663 TCW_PTR(th->th.th_info.ds.ds_stackbase, (((char *)addr) + size));
664 TCW_PTR(th->th.th_info.ds.ds_stacksize, size);
665 TCW_4(th->th.th_info.ds.ds_stackgrow, FALSE);
666 return TRUE;
Jim Cownie5e8470a2013-09-27 10:38:44 +0000667 }
Alp Toker763b9392014-02-28 09:42:41 +0000668#endif /* KMP_OS_LINUX || KMP_OS_FREEBSD */
Alp Toker763b9392014-02-28 09:42:41 +0000669 /* Use incremental refinement starting from initial conservative estimate */
670 TCW_PTR(th->th.th_info.ds.ds_stacksize, 0);
671 TCW_PTR(th -> th.th_info.ds.ds_stackbase, &stack_data);
672 TCW_4(th->th.th_info.ds.ds_stackgrow, TRUE);
673 return FALSE;
Jim Cownie5e8470a2013-09-27 10:38:44 +0000674}
675
676static void*
677__kmp_launch_worker( void *thr )
678{
679 int status, old_type, old_state;
680#ifdef KMP_BLOCK_SIGNALS
681 sigset_t new_set, old_set;
682#endif /* KMP_BLOCK_SIGNALS */
683 void *exit_val;
684 void *padding = 0;
685 int gtid;
686 int error;
687
688 gtid = ((kmp_info_t*)thr) -> th.th_info.ds.ds_gtid;
689 __kmp_gtid_set_specific( gtid );
690#ifdef KMP_TDATA_GTID
691 __kmp_gtid = gtid;
692#endif
Jim Cownie4cc4bb42014-10-07 16:25:50 +0000693#if KMP_STATS_ENABLED
694 // set __thread local index to point to thread-specific stats
695 __kmp_stats_thread_ptr = ((kmp_info_t*)thr)->th.th_stats;
696#endif
Jim Cownie5e8470a2013-09-27 10:38:44 +0000697
698#if USE_ITT_BUILD
699 __kmp_itt_thread_name( gtid );
700#endif /* USE_ITT_BUILD */
701
Alp Toker763b9392014-02-28 09:42:41 +0000702#if KMP_AFFINITY_SUPPORTED
Jim Cownie5e8470a2013-09-27 10:38:44 +0000703 __kmp_affinity_set_init_mask( gtid, FALSE );
Jim Cownie5e8470a2013-09-27 10:38:44 +0000704#endif
705
706#ifdef KMP_CANCEL_THREADS
707 status = pthread_setcanceltype( PTHREAD_CANCEL_ASYNCHRONOUS, & old_type );
708 KMP_CHECK_SYSFAIL( "pthread_setcanceltype", status );
709 /* josh todo: isn't PTHREAD_CANCEL_ENABLE default for newly-created threads? */
710 status = pthread_setcancelstate( PTHREAD_CANCEL_ENABLE, & old_state );
711 KMP_CHECK_SYSFAIL( "pthread_setcancelstate", status );
712#endif
713
714#if KMP_ARCH_X86 || KMP_ARCH_X86_64
715 //
716 // Set the FP control regs to be a copy of
717 // the parallel initialization thread's.
718 //
719 __kmp_clear_x87_fpu_status_word();
720 __kmp_load_x87_fpu_control_word( &__kmp_init_x87_fpu_control_word );
721 __kmp_load_mxcsr( &__kmp_init_mxcsr );
722#endif /* KMP_ARCH_X86 || KMP_ARCH_X86_64 */
723
724#ifdef KMP_BLOCK_SIGNALS
725 status = sigfillset( & new_set );
726 KMP_CHECK_SYSFAIL_ERRNO( "sigfillset", status );
727 status = pthread_sigmask( SIG_BLOCK, & new_set, & old_set );
728 KMP_CHECK_SYSFAIL( "pthread_sigmask", status );
729#endif /* KMP_BLOCK_SIGNALS */
730
Alp Toker763b9392014-02-28 09:42:41 +0000731#if KMP_OS_LINUX || KMP_OS_FREEBSD
Jim Cownie5e8470a2013-09-27 10:38:44 +0000732 if ( __kmp_stkoffset > 0 && gtid > 0 ) {
733 padding = alloca( gtid * __kmp_stkoffset );
734 }
735#endif
736
737 KMP_MB();
738 __kmp_set_stack_info( gtid, (kmp_info_t*)thr );
739
740 __kmp_check_stack_overlap( (kmp_info_t*)thr );
741
742 exit_val = __kmp_launch_thread( (kmp_info_t *) thr );
743
744#ifdef KMP_BLOCK_SIGNALS
745 status = pthread_sigmask( SIG_SETMASK, & old_set, NULL );
746 KMP_CHECK_SYSFAIL( "pthread_sigmask", status );
747#endif /* KMP_BLOCK_SIGNALS */
748
749 return exit_val;
750}
751
752
753/* The monitor thread controls all of the threads in the complex */
754
755static void*
756__kmp_launch_monitor( void *thr )
757{
758 int status, old_type, old_state;
759#ifdef KMP_BLOCK_SIGNALS
760 sigset_t new_set;
761#endif /* KMP_BLOCK_SIGNALS */
762 struct timespec interval;
763 int yield_count;
764 int yield_cycles = 0;
765 int error;
766
767 KMP_MB(); /* Flush all pending memory write invalidates. */
768
769 KA_TRACE( 10, ("__kmp_launch_monitor: #1 launched\n" ) );
770
771 /* register us as the monitor thread */
772 __kmp_gtid_set_specific( KMP_GTID_MONITOR );
773#ifdef KMP_TDATA_GTID
774 __kmp_gtid = KMP_GTID_MONITOR;
775#endif
776
777 KMP_MB();
778
779#if USE_ITT_BUILD
780 __kmp_itt_thread_ignore(); // Instruct Intel(R) Threading Tools to ignore monitor thread.
781#endif /* USE_ITT_BUILD */
782
783 __kmp_set_stack_info( ((kmp_info_t*)thr)->th.th_info.ds.ds_gtid, (kmp_info_t*)thr );
784
785 __kmp_check_stack_overlap( (kmp_info_t*)thr );
786
787#ifdef KMP_CANCEL_THREADS
788 status = pthread_setcanceltype( PTHREAD_CANCEL_ASYNCHRONOUS, & old_type );
789 KMP_CHECK_SYSFAIL( "pthread_setcanceltype", status );
790 /* josh todo: isn't PTHREAD_CANCEL_ENABLE default for newly-created threads? */
791 status = pthread_setcancelstate( PTHREAD_CANCEL_ENABLE, & old_state );
792 KMP_CHECK_SYSFAIL( "pthread_setcancelstate", status );
793#endif
794
795 #if KMP_REAL_TIME_FIX
796 // This is a potential fix which allows application with real-time scheduling policy work.
797 // However, decision about the fix is not made yet, so it is disabled by default.
798 { // Are program started with real-time scheduling policy?
799 int sched = sched_getscheduler( 0 );
800 if ( sched == SCHED_FIFO || sched == SCHED_RR ) {
801 // Yes, we are a part of real-time application. Try to increase the priority of the
802 // monitor.
803 struct sched_param param;
804 int max_priority = sched_get_priority_max( sched );
805 int rc;
806 KMP_WARNING( RealTimeSchedNotSupported );
807 sched_getparam( 0, & param );
808 if ( param.sched_priority < max_priority ) {
809 param.sched_priority += 1;
810 rc = sched_setscheduler( 0, sched, & param );
811 if ( rc != 0 ) {
812 int error = errno;
813 __kmp_msg(
814 kmp_ms_warning,
815 KMP_MSG( CantChangeMonitorPriority ),
816 KMP_ERR( error ),
817 KMP_MSG( MonitorWillStarve ),
818 __kmp_msg_null
819 );
820 }; // if
821 } else {
822 // We cannot abort here, because number of CPUs may be enough for all the threads,
823 // including the monitor thread, so application could potentially work...
824 __kmp_msg(
825 kmp_ms_warning,
826 KMP_MSG( RunningAtMaxPriority ),
827 KMP_MSG( MonitorWillStarve ),
828 KMP_HNT( RunningAtMaxPriority ),
829 __kmp_msg_null
830 );
831 }; // if
832 }; // if
Jim Cownie4cc4bb42014-10-07 16:25:50 +0000833 TCW_4( __kmp_global.g.g_time.dt.t_value, 0 ); // AC: free thread that waits for monitor started
Jim Cownie5e8470a2013-09-27 10:38:44 +0000834 }
835 #endif // KMP_REAL_TIME_FIX
836
837 KMP_MB(); /* Flush all pending memory write invalidates. */
838
839 if ( __kmp_monitor_wakeups == 1 ) {
840 interval.tv_sec = 1;
841 interval.tv_nsec = 0;
842 } else {
843 interval.tv_sec = 0;
844 interval.tv_nsec = (NSEC_PER_SEC / __kmp_monitor_wakeups);
845 }
846
847 KA_TRACE( 10, ("__kmp_launch_monitor: #2 monitor\n" ) );
848
849 if (__kmp_yield_cycle) {
850 __kmp_yielding_on = 0; /* Start out with yielding shut off */
851 yield_count = __kmp_yield_off_count;
852 } else {
853 __kmp_yielding_on = 1; /* Yielding is on permanently */
854 }
855
856 while( ! TCR_4( __kmp_global.g.g_done ) ) {
857 struct timespec now;
858 struct timeval tval;
859
860 /* This thread monitors the state of the system */
861
862 KA_TRACE( 15, ( "__kmp_launch_monitor: update\n" ) );
863
864 status = gettimeofday( &tval, NULL );
865 KMP_CHECK_SYSFAIL_ERRNO( "gettimeofday", status );
866 TIMEVAL_TO_TIMESPEC( &tval, &now );
867
868 now.tv_sec += interval.tv_sec;
869 now.tv_nsec += interval.tv_nsec;
870
871 if (now.tv_nsec >= NSEC_PER_SEC) {
872 now.tv_sec += 1;
873 now.tv_nsec -= NSEC_PER_SEC;
874 }
875
876 status = pthread_mutex_lock( & __kmp_wait_mx.m_mutex );
877 KMP_CHECK_SYSFAIL( "pthread_mutex_lock", status );
Jim Cownie07ea89f2014-09-03 11:10:54 +0000878 // AC: the monitor should not fall asleep if g_done has been set
879 if ( !TCR_4(__kmp_global.g.g_done) ) { // check once more under mutex
880 status = pthread_cond_timedwait( &__kmp_wait_cv.c_cond, &__kmp_wait_mx.m_mutex, &now );
881 if ( status != 0 ) {
882 if ( status != ETIMEDOUT && status != EINTR ) {
883 KMP_SYSFAIL( "pthread_cond_timedwait", status );
884 };
Jim Cownie5e8470a2013-09-27 10:38:44 +0000885 };
886 };
Jim Cownie5e8470a2013-09-27 10:38:44 +0000887 status = pthread_mutex_unlock( & __kmp_wait_mx.m_mutex );
888 KMP_CHECK_SYSFAIL( "pthread_mutex_unlock", status );
889
890 if (__kmp_yield_cycle) {
891 yield_cycles++;
892 if ( (yield_cycles % yield_count) == 0 ) {
893 if (__kmp_yielding_on) {
894 __kmp_yielding_on = 0; /* Turn it off now */
895 yield_count = __kmp_yield_off_count;
896 } else {
897 __kmp_yielding_on = 1; /* Turn it on now */
898 yield_count = __kmp_yield_on_count;
899 }
900 yield_cycles = 0;
901 }
902 } else {
903 __kmp_yielding_on = 1;
904 }
905
906 TCW_4( __kmp_global.g.g_time.dt.t_value,
907 TCR_4( __kmp_global.g.g_time.dt.t_value ) + 1 );
908
909 KMP_MB(); /* Flush all pending memory write invalidates. */
910 }
911
912 KA_TRACE( 10, ("__kmp_launch_monitor: #3 cleanup\n" ) );
913
914#ifdef KMP_BLOCK_SIGNALS
915 status = sigfillset( & new_set );
916 KMP_CHECK_SYSFAIL_ERRNO( "sigfillset", status );
917 status = pthread_sigmask( SIG_UNBLOCK, & new_set, NULL );
918 KMP_CHECK_SYSFAIL( "pthread_sigmask", status );
919#endif /* KMP_BLOCK_SIGNALS */
920
921 KA_TRACE( 10, ("__kmp_launch_monitor: #4 finished\n" ) );
922
923 if( __kmp_global.g.g_abort != 0 ) {
924 /* now we need to terminate the worker threads */
925 /* the value of t_abort is the signal we caught */
926
927 int gtid;
928
929 KA_TRACE( 10, ("__kmp_launch_monitor: #5 terminate sig=%d\n", __kmp_global.g.g_abort ) );
930
931 /* terminate the OpenMP worker threads */
932 /* TODO this is not valid for sibling threads!!
933 * the uber master might not be 0 anymore.. */
934 for (gtid = 1; gtid < __kmp_threads_capacity; ++gtid)
935 __kmp_terminate_thread( gtid );
936
937 __kmp_cleanup();
938
939 KA_TRACE( 10, ("__kmp_launch_monitor: #6 raise sig=%d\n", __kmp_global.g.g_abort ) );
940
941 if (__kmp_global.g.g_abort > 0)
942 raise( __kmp_global.g.g_abort );
943
944 }
945
946 KA_TRACE( 10, ("__kmp_launch_monitor: #7 exit\n" ) );
947
948 return thr;
949}
950
951void
952__kmp_create_worker( int gtid, kmp_info_t *th, size_t stack_size )
953{
954 pthread_t handle;
955 pthread_attr_t thread_attr;
956 int status;
957
958
959 th->th.th_info.ds.ds_gtid = gtid;
960
Jim Cownie4cc4bb42014-10-07 16:25:50 +0000961#if KMP_STATS_ENABLED
962 // sets up worker thread stats
963 __kmp_acquire_tas_lock(&__kmp_stats_lock, gtid);
964
965 // th->th.th_stats is used to transfer thread specific stats-pointer to __kmp_launch_worker
966 // So when thread is created (goes into __kmp_launch_worker) it will
967 // set it's __thread local pointer to th->th.th_stats
968 th->th.th_stats = __kmp_stats_list.push_back(gtid);
969 if(KMP_UBER_GTID(gtid)) {
970 __kmp_stats_start_time = tsc_tick_count::now();
971 __kmp_stats_thread_ptr = th->th.th_stats;
972 __kmp_stats_init();
973 KMP_START_EXPLICIT_TIMER(OMP_serial);
974 KMP_START_EXPLICIT_TIMER(OMP_start_end);
975 }
976 __kmp_release_tas_lock(&__kmp_stats_lock, gtid);
977
978#endif // KMP_STATS_ENABLED
979
Jim Cownie5e8470a2013-09-27 10:38:44 +0000980 if ( KMP_UBER_GTID(gtid) ) {
981 KA_TRACE( 10, ("__kmp_create_worker: uber thread (%d)\n", gtid ) );
982 th -> th.th_info.ds.ds_thread = pthread_self();
983 __kmp_set_stack_info( gtid, th );
984 __kmp_check_stack_overlap( th );
985 return;
986 }; // if
987
988 KA_TRACE( 10, ("__kmp_create_worker: try to create thread (%d)\n", gtid ) );
989
990 KMP_MB(); /* Flush all pending memory write invalidates. */
991
992#ifdef KMP_THREAD_ATTR
993 {
994 status = pthread_attr_init( &thread_attr );
995 if ( status != 0 ) {
996 __kmp_msg(
997 kmp_ms_fatal,
998 KMP_MSG( CantInitThreadAttrs ),
999 KMP_ERR( status ),
1000 __kmp_msg_null
1001 );
1002 }; // if
1003 status = pthread_attr_setdetachstate( & thread_attr, PTHREAD_CREATE_JOINABLE );
1004 if ( status != 0 ) {
1005 __kmp_msg(
1006 kmp_ms_fatal,
1007 KMP_MSG( CantSetWorkerState ),
1008 KMP_ERR( status ),
1009 __kmp_msg_null
1010 );
1011 }; // if
1012
1013 /* Set stack size for this thread now. */
1014 stack_size += gtid * __kmp_stkoffset;
1015
1016 KA_TRACE( 10, ( "__kmp_create_worker: T#%d, default stacksize = %lu bytes, "
1017 "__kmp_stksize = %lu bytes, final stacksize = %lu bytes\n",
1018 gtid, KMP_DEFAULT_STKSIZE, __kmp_stksize, stack_size ) );
1019
1020# ifdef _POSIX_THREAD_ATTR_STACKSIZE
1021 status = pthread_attr_setstacksize( & thread_attr, stack_size );
1022# ifdef KMP_BACKUP_STKSIZE
1023 if ( status != 0 ) {
1024 if ( ! __kmp_env_stksize ) {
1025 stack_size = KMP_BACKUP_STKSIZE + gtid * __kmp_stkoffset;
1026 __kmp_stksize = KMP_BACKUP_STKSIZE;
1027 KA_TRACE( 10, ("__kmp_create_worker: T#%d, default stacksize = %lu bytes, "
1028 "__kmp_stksize = %lu bytes, (backup) final stacksize = %lu "
1029 "bytes\n",
1030 gtid, KMP_DEFAULT_STKSIZE, __kmp_stksize, stack_size )
1031 );
1032 status = pthread_attr_setstacksize( &thread_attr, stack_size );
1033 }; // if
1034 }; // if
1035# endif /* KMP_BACKUP_STKSIZE */
1036 if ( status != 0 ) {
1037 __kmp_msg(
1038 kmp_ms_fatal,
1039 KMP_MSG( CantSetWorkerStackSize, stack_size ),
1040 KMP_ERR( status ),
1041 KMP_HNT( ChangeWorkerStackSize ),
1042 __kmp_msg_null
1043 );
1044 }; // if
1045# endif /* _POSIX_THREAD_ATTR_STACKSIZE */
1046 }
1047#endif /* KMP_THREAD_ATTR */
1048
1049 {
1050 status = pthread_create( & handle, & thread_attr, __kmp_launch_worker, (void *) th );
1051 if ( status != 0 || ! handle ) { // ??? Why do we check handle??
1052#ifdef _POSIX_THREAD_ATTR_STACKSIZE
1053 if ( status == EINVAL ) {
1054 __kmp_msg(
1055 kmp_ms_fatal,
1056 KMP_MSG( CantSetWorkerStackSize, stack_size ),
1057 KMP_ERR( status ),
1058 KMP_HNT( IncreaseWorkerStackSize ),
1059 __kmp_msg_null
1060 );
1061 };
1062 if ( status == ENOMEM ) {
1063 __kmp_msg(
1064 kmp_ms_fatal,
1065 KMP_MSG( CantSetWorkerStackSize, stack_size ),
1066 KMP_ERR( status ),
1067 KMP_HNT( DecreaseWorkerStackSize ),
1068 __kmp_msg_null
1069 );
1070 };
1071#endif /* _POSIX_THREAD_ATTR_STACKSIZE */
1072 if ( status == EAGAIN ) {
1073 __kmp_msg(
1074 kmp_ms_fatal,
1075 KMP_MSG( NoResourcesForWorkerThread ),
1076 KMP_ERR( status ),
1077 KMP_HNT( Decrease_NUM_THREADS ),
1078 __kmp_msg_null
1079 );
1080 }; // if
1081 KMP_SYSFAIL( "pthread_create", status );
1082 }; // if
1083
1084 th->th.th_info.ds.ds_thread = handle;
1085 }
1086
1087#ifdef KMP_THREAD_ATTR
1088 {
1089 status = pthread_attr_destroy( & thread_attr );
1090 if ( status ) {
1091 __kmp_msg(
1092 kmp_ms_warning,
1093 KMP_MSG( CantDestroyThreadAttrs ),
1094 KMP_ERR( status ),
1095 __kmp_msg_null
1096 );
1097 }; // if
1098 }
1099#endif /* KMP_THREAD_ATTR */
1100
1101 KMP_MB(); /* Flush all pending memory write invalidates. */
1102
1103 KA_TRACE( 10, ("__kmp_create_worker: done creating thread (%d)\n", gtid ) );
1104
1105} // __kmp_create_worker
1106
1107
1108void
1109__kmp_create_monitor( kmp_info_t *th )
1110{
1111 pthread_t handle;
1112 pthread_attr_t thread_attr;
1113 size_t size;
1114 int status;
1115 int caller_gtid = __kmp_get_gtid();
1116 int auto_adj_size = FALSE;
1117
1118 KA_TRACE( 10, ("__kmp_create_monitor: try to create monitor\n" ) );
1119
1120 KMP_MB(); /* Flush all pending memory write invalidates. */
1121
1122 th->th.th_info.ds.ds_tid = KMP_GTID_MONITOR;
1123 th->th.th_info.ds.ds_gtid = KMP_GTID_MONITOR;
1124 #if KMP_REAL_TIME_FIX
1125 TCW_4( __kmp_global.g.g_time.dt.t_value, -1 ); // Will use it for synchronization a bit later.
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001126 #else
1127 TCW_4( __kmp_global.g.g_time.dt.t_value, 0 );
Jim Cownie5e8470a2013-09-27 10:38:44 +00001128 #endif // KMP_REAL_TIME_FIX
1129
1130 #ifdef KMP_THREAD_ATTR
1131 if ( __kmp_monitor_stksize == 0 ) {
1132 __kmp_monitor_stksize = KMP_DEFAULT_MONITOR_STKSIZE;
1133 auto_adj_size = TRUE;
1134 }
1135 status = pthread_attr_init( &thread_attr );
1136 if ( status != 0 ) {
1137 __kmp_msg(
1138 kmp_ms_fatal,
1139 KMP_MSG( CantInitThreadAttrs ),
1140 KMP_ERR( status ),
1141 __kmp_msg_null
1142 );
1143 }; // if
1144 status = pthread_attr_setdetachstate( & thread_attr, PTHREAD_CREATE_JOINABLE );
1145 if ( status != 0 ) {
1146 __kmp_msg(
1147 kmp_ms_fatal,
1148 KMP_MSG( CantSetMonitorState ),
1149 KMP_ERR( status ),
1150 __kmp_msg_null
1151 );
1152 }; // if
1153
1154 #ifdef _POSIX_THREAD_ATTR_STACKSIZE
1155 status = pthread_attr_getstacksize( & thread_attr, & size );
1156 KMP_CHECK_SYSFAIL( "pthread_attr_getstacksize", status );
1157 #else
1158 size = __kmp_sys_min_stksize;
1159 #endif /* _POSIX_THREAD_ATTR_STACKSIZE */
1160 #endif /* KMP_THREAD_ATTR */
1161
1162 if ( __kmp_monitor_stksize == 0 ) {
1163 __kmp_monitor_stksize = KMP_DEFAULT_MONITOR_STKSIZE;
1164 }
1165 if ( __kmp_monitor_stksize < __kmp_sys_min_stksize ) {
1166 __kmp_monitor_stksize = __kmp_sys_min_stksize;
1167 }
1168
1169 KA_TRACE( 10, ( "__kmp_create_monitor: default stacksize = %lu bytes,"
1170 "requested stacksize = %lu bytes\n",
1171 size, __kmp_monitor_stksize ) );
1172
1173 retry:
1174
1175 /* Set stack size for this thread now. */
1176
1177 #ifdef _POSIX_THREAD_ATTR_STACKSIZE
1178 KA_TRACE( 10, ( "__kmp_create_monitor: setting stacksize = %lu bytes,",
1179 __kmp_monitor_stksize ) );
1180 status = pthread_attr_setstacksize( & thread_attr, __kmp_monitor_stksize );
1181 if ( status != 0 ) {
1182 if ( auto_adj_size ) {
1183 __kmp_monitor_stksize *= 2;
1184 goto retry;
1185 }
1186 __kmp_msg(
1187 kmp_ms_warning, // should this be fatal? BB
1188 KMP_MSG( CantSetMonitorStackSize, (long int) __kmp_monitor_stksize ),
1189 KMP_ERR( status ),
1190 KMP_HNT( ChangeMonitorStackSize ),
1191 __kmp_msg_null
1192 );
1193 }; // if
1194 #endif /* _POSIX_THREAD_ATTR_STACKSIZE */
1195
Jim Cownie5e8470a2013-09-27 10:38:44 +00001196 status = pthread_create( &handle, & thread_attr, __kmp_launch_monitor, (void *) th );
1197
1198 if ( status != 0 ) {
1199 #ifdef _POSIX_THREAD_ATTR_STACKSIZE
1200 if ( status == EINVAL ) {
1201 if ( auto_adj_size && ( __kmp_monitor_stksize < (size_t)0x40000000 ) ) {
1202 __kmp_monitor_stksize *= 2;
1203 goto retry;
1204 }
1205 __kmp_msg(
1206 kmp_ms_fatal,
1207 KMP_MSG( CantSetMonitorStackSize, __kmp_monitor_stksize ),
1208 KMP_ERR( status ),
1209 KMP_HNT( IncreaseMonitorStackSize ),
1210 __kmp_msg_null
1211 );
1212 }; // if
1213 if ( status == ENOMEM ) {
1214 __kmp_msg(
1215 kmp_ms_fatal,
1216 KMP_MSG( CantSetMonitorStackSize, __kmp_monitor_stksize ),
1217 KMP_ERR( status ),
1218 KMP_HNT( DecreaseMonitorStackSize ),
1219 __kmp_msg_null
1220 );
1221 }; // if
1222 #endif /* _POSIX_THREAD_ATTR_STACKSIZE */
1223 if ( status == EAGAIN ) {
1224 __kmp_msg(
1225 kmp_ms_fatal,
1226 KMP_MSG( NoResourcesForMonitorThread ),
1227 KMP_ERR( status ),
1228 KMP_HNT( DecreaseNumberOfThreadsInUse ),
1229 __kmp_msg_null
1230 );
1231 }; // if
1232 KMP_SYSFAIL( "pthread_create", status );
1233 }; // if
1234
1235 th->th.th_info.ds.ds_thread = handle;
1236
1237 #if KMP_REAL_TIME_FIX
1238 // Wait for the monitor thread is really started and set its *priority*.
1239 KMP_DEBUG_ASSERT( sizeof( kmp_uint32 ) == sizeof( __kmp_global.g.g_time.dt.t_value ) );
1240 __kmp_wait_yield_4(
1241 (kmp_uint32 volatile *) & __kmp_global.g.g_time.dt.t_value, -1, & __kmp_neq_4, NULL
1242 );
1243 #endif // KMP_REAL_TIME_FIX
1244
1245 #ifdef KMP_THREAD_ATTR
1246 status = pthread_attr_destroy( & thread_attr );
1247 if ( status != 0 ) {
1248 __kmp_msg( //
1249 kmp_ms_warning,
1250 KMP_MSG( CantDestroyThreadAttrs ),
1251 KMP_ERR( status ),
1252 __kmp_msg_null
1253 );
1254 }; // if
1255 #endif
1256
1257 KMP_MB(); /* Flush all pending memory write invalidates. */
1258
1259 KA_TRACE( 10, ( "__kmp_create_monitor: monitor created %#.8lx\n", th->th.th_info.ds.ds_thread ) );
1260
1261} // __kmp_create_monitor
1262
1263void
1264__kmp_exit_thread(
1265 int exit_status
1266) {
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001267 pthread_exit( (void *)(intptr_t) exit_status );
Jim Cownie5e8470a2013-09-27 10:38:44 +00001268} // __kmp_exit_thread
1269
Jim Cownie07ea89f2014-09-03 11:10:54 +00001270void __kmp_resume_monitor();
1271
Jim Cownie5e8470a2013-09-27 10:38:44 +00001272void
1273__kmp_reap_monitor( kmp_info_t *th )
1274{
1275 int status, i;
1276 void *exit_val;
1277
1278 KA_TRACE( 10, ("__kmp_reap_monitor: try to reap monitor thread with handle %#.8lx\n",
1279 th->th.th_info.ds.ds_thread ) );
1280
1281 // If monitor has been created, its tid and gtid should be KMP_GTID_MONITOR.
1282 // If both tid and gtid are 0, it means the monitor did not ever start.
1283 // If both tid and gtid are KMP_GTID_DNE, the monitor has been shut down.
1284 KMP_DEBUG_ASSERT( th->th.th_info.ds.ds_tid == th->th.th_info.ds.ds_gtid );
1285 if ( th->th.th_info.ds.ds_gtid != KMP_GTID_MONITOR ) {
1286 return;
1287 }; // if
1288
1289 KMP_MB(); /* Flush all pending memory write invalidates. */
1290
1291
1292 /* First, check to see whether the monitor thread exists. This could prevent a hang,
1293 but if the monitor dies after the pthread_kill call and before the pthread_join
1294 call, it will still hang. */
1295
1296 status = pthread_kill( th->th.th_info.ds.ds_thread, 0 );
1297 if (status == ESRCH) {
1298
1299 KA_TRACE( 10, ("__kmp_reap_monitor: monitor does not exist, returning\n") );
1300
1301 } else
1302 {
Jim Cownie07ea89f2014-09-03 11:10:54 +00001303 __kmp_resume_monitor(); // Wake up the monitor thread
Jim Cownie5e8470a2013-09-27 10:38:44 +00001304 status = pthread_join( th->th.th_info.ds.ds_thread, & exit_val);
1305 if (exit_val != th) {
1306 __kmp_msg(
1307 kmp_ms_fatal,
1308 KMP_MSG( ReapMonitorError ),
1309 KMP_ERR( status ),
1310 __kmp_msg_null
1311 );
1312 }
1313 }
1314
1315 th->th.th_info.ds.ds_tid = KMP_GTID_DNE;
1316 th->th.th_info.ds.ds_gtid = KMP_GTID_DNE;
1317
1318 KA_TRACE( 10, ("__kmp_reap_monitor: done reaping monitor thread with handle %#.8lx\n",
1319 th->th.th_info.ds.ds_thread ) );
1320
1321 KMP_MB(); /* Flush all pending memory write invalidates. */
1322
1323}
1324
1325void
1326__kmp_reap_worker( kmp_info_t *th )
1327{
1328 int status;
1329 void *exit_val;
1330
1331 KMP_MB(); /* Flush all pending memory write invalidates. */
1332
1333 KA_TRACE( 10, ("__kmp_reap_worker: try to reap T#%d\n", th->th.th_info.ds.ds_gtid ) );
1334
1335 /* First, check to see whether the worker thread exists. This could prevent a hang,
1336 but if the worker dies after the pthread_kill call and before the pthread_join
1337 call, it will still hang. */
1338
1339 {
1340 status = pthread_kill( th->th.th_info.ds.ds_thread, 0 );
1341 if (status == ESRCH) {
1342 KA_TRACE( 10, ("__kmp_reap_worker: worker T#%d does not exist, returning\n",
1343 th->th.th_info.ds.ds_gtid ) );
1344 }
1345 else {
1346 KA_TRACE( 10, ("__kmp_reap_worker: try to join with worker T#%d\n",
1347 th->th.th_info.ds.ds_gtid ) );
1348
1349 status = pthread_join( th->th.th_info.ds.ds_thread, & exit_val);
1350#ifdef KMP_DEBUG
1351 /* Don't expose these to the user until we understand when they trigger */
1352 if ( status != 0 ) {
1353 __kmp_msg(
1354 kmp_ms_fatal,
1355 KMP_MSG( ReapWorkerError ),
1356 KMP_ERR( status ),
1357 __kmp_msg_null
1358 );
1359 }
1360 if ( exit_val != th ) {
1361 KA_TRACE( 10, ( "__kmp_reap_worker: worker T#%d did not reap properly, "
1362 "exit_val = %p\n",
1363 th->th.th_info.ds.ds_gtid, exit_val ) );
1364 }
1365#endif /* KMP_DEBUG */
1366 }
1367 }
1368
1369 KA_TRACE( 10, ("__kmp_reap_worker: done reaping T#%d\n", th->th.th_info.ds.ds_gtid ) );
1370
1371 KMP_MB(); /* Flush all pending memory write invalidates. */
1372}
1373
1374
1375/* ------------------------------------------------------------------------ */
1376/* ------------------------------------------------------------------------ */
1377
1378#if KMP_HANDLE_SIGNALS
1379
1380
1381static void
1382__kmp_null_handler( int signo )
1383{
1384 // Do nothing, for doing SIG_IGN-type actions.
1385} // __kmp_null_handler
1386
1387
1388static void
1389__kmp_team_handler( int signo )
1390{
1391 if ( __kmp_global.g.g_abort == 0 ) {
1392 /* Stage 1 signal handler, let's shut down all of the threads */
1393 #ifdef KMP_DEBUG
1394 __kmp_debug_printf( "__kmp_team_handler: caught signal = %d\n", signo );
1395 #endif
1396 switch ( signo ) {
1397 case SIGHUP :
1398 case SIGINT :
1399 case SIGQUIT :
1400 case SIGILL :
1401 case SIGABRT :
1402 case SIGFPE :
1403 case SIGBUS :
1404 case SIGSEGV :
1405 #ifdef SIGSYS
1406 case SIGSYS :
1407 #endif
1408 case SIGTERM :
1409 if ( __kmp_debug_buf ) {
1410 __kmp_dump_debug_buffer( );
1411 }; // if
1412 KMP_MB(); // Flush all pending memory write invalidates.
1413 TCW_4( __kmp_global.g.g_abort, signo );
1414 KMP_MB(); // Flush all pending memory write invalidates.
1415 TCW_4( __kmp_global.g.g_done, TRUE );
1416 KMP_MB(); // Flush all pending memory write invalidates.
1417 break;
1418 default:
1419 #ifdef KMP_DEBUG
1420 __kmp_debug_printf( "__kmp_team_handler: unknown signal type" );
1421 #endif
1422 break;
1423 }; // switch
1424 }; // if
1425} // __kmp_team_handler
1426
1427
1428static
1429void __kmp_sigaction( int signum, const struct sigaction * act, struct sigaction * oldact ) {
1430 int rc = sigaction( signum, act, oldact );
1431 KMP_CHECK_SYSFAIL_ERRNO( "sigaction", rc );
1432}
1433
1434
1435static void
1436__kmp_install_one_handler( int sig, sig_func_t handler_func, int parallel_init )
1437{
1438 KMP_MB(); // Flush all pending memory write invalidates.
1439 KB_TRACE( 60, ( "__kmp_install_one_handler( %d, ..., %d )\n", sig, parallel_init ) );
1440 if ( parallel_init ) {
1441 struct sigaction new_action;
1442 struct sigaction old_action;
1443 new_action.sa_handler = handler_func;
1444 new_action.sa_flags = 0;
1445 sigfillset( & new_action.sa_mask );
1446 __kmp_sigaction( sig, & new_action, & old_action );
1447 if ( old_action.sa_handler == __kmp_sighldrs[ sig ].sa_handler ) {
1448 sigaddset( & __kmp_sigset, sig );
1449 } else {
1450 // Restore/keep user's handler if one previously installed.
1451 __kmp_sigaction( sig, & old_action, NULL );
1452 }; // if
1453 } else {
1454 // Save initial/system signal handlers to see if user handlers installed.
1455 __kmp_sigaction( sig, NULL, & __kmp_sighldrs[ sig ] );
1456 }; // if
1457 KMP_MB(); // Flush all pending memory write invalidates.
1458} // __kmp_install_one_handler
1459
1460
1461static void
1462__kmp_remove_one_handler( int sig )
1463{
1464 KB_TRACE( 60, ( "__kmp_remove_one_handler( %d )\n", sig ) );
1465 if ( sigismember( & __kmp_sigset, sig ) ) {
1466 struct sigaction old;
1467 KMP_MB(); // Flush all pending memory write invalidates.
1468 __kmp_sigaction( sig, & __kmp_sighldrs[ sig ], & old );
1469 if ( ( old.sa_handler != __kmp_team_handler ) && ( old.sa_handler != __kmp_null_handler ) ) {
1470 // Restore the users signal handler.
1471 KB_TRACE( 10, ( "__kmp_remove_one_handler: oops, not our handler, restoring: sig=%d\n", sig ) );
1472 __kmp_sigaction( sig, & old, NULL );
1473 }; // if
1474 sigdelset( & __kmp_sigset, sig );
1475 KMP_MB(); // Flush all pending memory write invalidates.
1476 }; // if
1477} // __kmp_remove_one_handler
1478
1479
1480void
1481__kmp_install_signals( int parallel_init )
1482{
1483 KB_TRACE( 10, ( "__kmp_install_signals( %d )\n", parallel_init ) );
1484 if ( __kmp_handle_signals || ! parallel_init ) {
1485 // If ! parallel_init, we do not install handlers, just save original handlers.
1486 // Let us do it even __handle_signals is 0.
1487 sigemptyset( & __kmp_sigset );
1488 __kmp_install_one_handler( SIGHUP, __kmp_team_handler, parallel_init );
1489 __kmp_install_one_handler( SIGINT, __kmp_team_handler, parallel_init );
1490 __kmp_install_one_handler( SIGQUIT, __kmp_team_handler, parallel_init );
1491 __kmp_install_one_handler( SIGILL, __kmp_team_handler, parallel_init );
1492 __kmp_install_one_handler( SIGABRT, __kmp_team_handler, parallel_init );
1493 __kmp_install_one_handler( SIGFPE, __kmp_team_handler, parallel_init );
1494 __kmp_install_one_handler( SIGBUS, __kmp_team_handler, parallel_init );
1495 __kmp_install_one_handler( SIGSEGV, __kmp_team_handler, parallel_init );
1496 #ifdef SIGSYS
1497 __kmp_install_one_handler( SIGSYS, __kmp_team_handler, parallel_init );
1498 #endif // SIGSYS
1499 __kmp_install_one_handler( SIGTERM, __kmp_team_handler, parallel_init );
1500 #ifdef SIGPIPE
1501 __kmp_install_one_handler( SIGPIPE, __kmp_team_handler, parallel_init );
1502 #endif // SIGPIPE
1503 }; // if
1504} // __kmp_install_signals
1505
1506
1507void
1508__kmp_remove_signals( void )
1509{
1510 int sig;
1511 KB_TRACE( 10, ( "__kmp_remove_signals()\n" ) );
1512 for ( sig = 1; sig < NSIG; ++ sig ) {
1513 __kmp_remove_one_handler( sig );
1514 }; // for sig
1515} // __kmp_remove_signals
1516
1517
1518#endif // KMP_HANDLE_SIGNALS
1519
1520/* ------------------------------------------------------------------------ */
1521/* ------------------------------------------------------------------------ */
1522
1523void
1524__kmp_enable( int new_state )
1525{
1526 #ifdef KMP_CANCEL_THREADS
1527 int status, old_state;
1528 status = pthread_setcancelstate( new_state, & old_state );
1529 KMP_CHECK_SYSFAIL( "pthread_setcancelstate", status );
1530 KMP_DEBUG_ASSERT( old_state == PTHREAD_CANCEL_DISABLE );
1531 #endif
1532}
1533
1534void
1535__kmp_disable( int * old_state )
1536{
1537 #ifdef KMP_CANCEL_THREADS
1538 int status;
1539 status = pthread_setcancelstate( PTHREAD_CANCEL_DISABLE, old_state );
1540 KMP_CHECK_SYSFAIL( "pthread_setcancelstate", status );
1541 #endif
1542}
1543
1544/* ------------------------------------------------------------------------ */
1545/* ------------------------------------------------------------------------ */
1546
1547static void
1548__kmp_atfork_prepare (void)
1549{
1550 /* nothing to do */
1551}
1552
1553static void
1554__kmp_atfork_parent (void)
1555{
1556 /* nothing to do */
1557}
1558
1559/*
1560 Reset the library so execution in the child starts "all over again" with
1561 clean data structures in initial states. Don't worry about freeing memory
1562 allocated by parent, just abandon it to be safe.
1563*/
1564static void
1565__kmp_atfork_child (void)
1566{
1567 /* TODO make sure this is done right for nested/sibling */
1568 // ATT: Memory leaks are here? TODO: Check it and fix.
1569 /* KMP_ASSERT( 0 ); */
1570
1571 ++__kmp_fork_count;
1572
1573 __kmp_init_runtime = FALSE;
1574 __kmp_init_monitor = 0;
1575 __kmp_init_parallel = FALSE;
1576 __kmp_init_middle = FALSE;
1577 __kmp_init_serial = FALSE;
1578 TCW_4(__kmp_init_gtid, FALSE);
1579 __kmp_init_common = FALSE;
1580
1581 TCW_4(__kmp_init_user_locks, FALSE);
Andrey Churbanov5c56fb52015-02-20 18:05:17 +00001582#if ! KMP_USE_DYNAMIC_LOCK
Jim Cownie07ea89f2014-09-03 11:10:54 +00001583 __kmp_user_lock_table.used = 1;
Jim Cownie5e8470a2013-09-27 10:38:44 +00001584 __kmp_user_lock_table.allocated = 0;
1585 __kmp_user_lock_table.table = NULL;
1586 __kmp_lock_blocks = NULL;
Andrey Churbanov5c56fb52015-02-20 18:05:17 +00001587#endif
Jim Cownie5e8470a2013-09-27 10:38:44 +00001588
1589 __kmp_all_nth = 0;
1590 TCW_4(__kmp_nth, 0);
1591
1592 /* Must actually zero all the *cache arguments passed to __kmpc_threadprivate here
1593 so threadprivate doesn't use stale data */
1594 KA_TRACE( 10, ( "__kmp_atfork_child: checking cache address list %p\n",
1595 __kmp_threadpriv_cache_list ) );
1596
1597 while ( __kmp_threadpriv_cache_list != NULL ) {
1598
1599 if ( *__kmp_threadpriv_cache_list -> addr != NULL ) {
1600 KC_TRACE( 50, ( "__kmp_atfork_child: zeroing cache at address %p\n",
1601 &(*__kmp_threadpriv_cache_list -> addr) ) );
1602
1603 *__kmp_threadpriv_cache_list -> addr = NULL;
1604 }
1605 __kmp_threadpriv_cache_list = __kmp_threadpriv_cache_list -> next;
1606 }
1607
1608 __kmp_init_runtime = FALSE;
1609
1610 /* reset statically initialized locks */
1611 __kmp_init_bootstrap_lock( &__kmp_initz_lock );
1612 __kmp_init_bootstrap_lock( &__kmp_stdio_lock );
1613 __kmp_init_bootstrap_lock( &__kmp_console_lock );
1614
1615 /* This is necessary to make sure no stale data is left around */
1616 /* AC: customers complain that we use unsafe routines in the atfork
1617 handler. Mathworks: dlsym() is unsafe. We call dlsym and dlopen
1618 in dynamic_link when check the presence of shared tbbmalloc library.
1619 Suggestion is to make the library initialization lazier, similar
1620 to what done for __kmpc_begin(). */
1621 // TODO: synchronize all static initializations with regular library
1622 // startup; look at kmp_global.c and etc.
1623 //__kmp_internal_begin ();
1624
1625}
1626
1627void
1628__kmp_register_atfork(void) {
1629 if ( __kmp_need_register_atfork ) {
1630 int status = pthread_atfork( __kmp_atfork_prepare, __kmp_atfork_parent, __kmp_atfork_child );
1631 KMP_CHECK_SYSFAIL( "pthread_atfork", status );
1632 __kmp_need_register_atfork = FALSE;
1633 }
1634}
1635
1636void
1637__kmp_suspend_initialize( void )
1638{
1639 int status;
1640 status = pthread_mutexattr_init( &__kmp_suspend_mutex_attr );
1641 KMP_CHECK_SYSFAIL( "pthread_mutexattr_init", status );
1642 status = pthread_condattr_init( &__kmp_suspend_cond_attr );
1643 KMP_CHECK_SYSFAIL( "pthread_condattr_init", status );
1644}
1645
1646static void
1647__kmp_suspend_initialize_thread( kmp_info_t *th )
1648{
1649 if ( th->th.th_suspend_init_count <= __kmp_fork_count ) {
1650 /* this means we haven't initialized the suspension pthread objects for this thread
1651 in this instance of the process */
1652 int status;
1653 status = pthread_cond_init( &th->th.th_suspend_cv.c_cond, &__kmp_suspend_cond_attr );
1654 KMP_CHECK_SYSFAIL( "pthread_cond_init", status );
1655 status = pthread_mutex_init( &th->th.th_suspend_mx.m_mutex, & __kmp_suspend_mutex_attr );
1656 KMP_CHECK_SYSFAIL( "pthread_mutex_init", status );
1657 *(volatile int*)&th->th.th_suspend_init_count = __kmp_fork_count + 1;
1658 };
1659}
1660
1661void
1662__kmp_suspend_uninitialize_thread( kmp_info_t *th )
1663{
1664 if(th->th.th_suspend_init_count > __kmp_fork_count) {
1665 /* this means we have initialize the suspension pthread objects for this thread
1666 in this instance of the process */
1667 int status;
1668
1669 status = pthread_cond_destroy( &th->th.th_suspend_cv.c_cond );
1670 if ( status != 0 && status != EBUSY ) {
1671 KMP_SYSFAIL( "pthread_cond_destroy", status );
1672 };
1673 status = pthread_mutex_destroy( &th->th.th_suspend_mx.m_mutex );
1674 if ( status != 0 && status != EBUSY ) {
1675 KMP_SYSFAIL( "pthread_mutex_destroy", status );
1676 };
1677 --th->th.th_suspend_init_count;
1678 KMP_DEBUG_ASSERT(th->th.th_suspend_init_count == __kmp_fork_count);
1679 }
1680}
1681
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001682/* This routine puts the calling thread to sleep after setting the
1683 * sleep bit for the indicated flag variable to true.
Jim Cownie5e8470a2013-09-27 10:38:44 +00001684 */
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001685template <class C>
1686static inline void __kmp_suspend_template( int th_gtid, C *flag )
Jim Cownie5e8470a2013-09-27 10:38:44 +00001687{
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001688 KMP_TIME_BLOCK(USER_suspend);
Jim Cownie5e8470a2013-09-27 10:38:44 +00001689 kmp_info_t *th = __kmp_threads[th_gtid];
1690 int status;
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001691 typename C::flag_t old_spin;
Jim Cownie5e8470a2013-09-27 10:38:44 +00001692
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001693 KF_TRACE( 30, ("__kmp_suspend_template: T#%d enter for flag = %p\n", th_gtid, flag->get() ) );
Jim Cownie5e8470a2013-09-27 10:38:44 +00001694
1695 __kmp_suspend_initialize_thread( th );
1696
1697 status = pthread_mutex_lock( &th->th.th_suspend_mx.m_mutex );
1698 KMP_CHECK_SYSFAIL( "pthread_mutex_lock", status );
1699
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001700 KF_TRACE( 10, ( "__kmp_suspend_template: T#%d setting sleep bit for spin(%p)\n",
1701 th_gtid, flag->get() ) );
Jim Cownie5e8470a2013-09-27 10:38:44 +00001702
1703 /* TODO: shouldn't this use release semantics to ensure that __kmp_suspend_initialize_thread
1704 gets called first?
1705 */
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001706 old_spin = flag->set_sleeping();
Jim Cownie5e8470a2013-09-27 10:38:44 +00001707
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001708 KF_TRACE( 5, ( "__kmp_suspend_template: T#%d set sleep bit for spin(%p)==%d\n",
1709 th_gtid, flag->get(), *(flag->get()) ) );
Jim Cownie5e8470a2013-09-27 10:38:44 +00001710
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001711 if ( flag->done_check_val(old_spin) ) {
1712 old_spin = flag->unset_sleeping();
1713 KF_TRACE( 5, ( "__kmp_suspend_template: T#%d false alarm, reset sleep bit for spin(%p)\n",
1714 th_gtid, flag->get()) );
Jim Cownie5e8470a2013-09-27 10:38:44 +00001715 } else {
Jim Cownie5e8470a2013-09-27 10:38:44 +00001716 /* Encapsulate in a loop as the documentation states that this may
1717 * "with low probability" return when the condition variable has
1718 * not been signaled or broadcast
1719 */
1720 int deactivated = FALSE;
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001721 TCW_PTR(th->th.th_sleep_loc, (void *)flag);
1722 while ( flag->is_sleeping() ) {
Jim Cownie5e8470a2013-09-27 10:38:44 +00001723#ifdef DEBUG_SUSPEND
1724 char buffer[128];
1725 __kmp_suspend_count++;
1726 __kmp_print_cond( buffer, &th->th.th_suspend_cv );
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001727 __kmp_printf( "__kmp_suspend_template: suspending T#%d: %s\n", th_gtid, buffer );
Jim Cownie5e8470a2013-09-27 10:38:44 +00001728#endif
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001729 // Mark the thread as no longer active (only in the first iteration of the loop).
Jim Cownie5e8470a2013-09-27 10:38:44 +00001730 if ( ! deactivated ) {
1731 th->th.th_active = FALSE;
1732 if ( th->th.th_active_in_pool ) {
1733 th->th.th_active_in_pool = FALSE;
1734 KMP_TEST_THEN_DEC32(
1735 (kmp_int32 *) &__kmp_thread_pool_active_nth );
1736 KMP_DEBUG_ASSERT( TCR_4(__kmp_thread_pool_active_nth) >= 0 );
1737 }
1738 deactivated = TRUE;
1739
1740
1741 }
1742
1743#if USE_SUSPEND_TIMEOUT
1744 struct timespec now;
1745 struct timeval tval;
1746 int msecs;
1747
1748 status = gettimeofday( &tval, NULL );
1749 KMP_CHECK_SYSFAIL_ERRNO( "gettimeofday", status );
1750 TIMEVAL_TO_TIMESPEC( &tval, &now );
1751
1752 msecs = (4*__kmp_dflt_blocktime) + 200;
1753 now.tv_sec += msecs / 1000;
1754 now.tv_nsec += (msecs % 1000)*1000;
1755
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001756 KF_TRACE( 15, ( "__kmp_suspend_template: T#%d about to perform pthread_cond_timedwait\n",
Jim Cownie5e8470a2013-09-27 10:38:44 +00001757 th_gtid ) );
1758 status = pthread_cond_timedwait( &th->th.th_suspend_cv.c_cond, &th->th.th_suspend_mx.m_mutex, & now );
1759#else
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001760 KF_TRACE( 15, ( "__kmp_suspend_template: T#%d about to perform pthread_cond_wait\n",
Jim Cownie5e8470a2013-09-27 10:38:44 +00001761 th_gtid ) );
1762
1763 status = pthread_cond_wait( &th->th.th_suspend_cv.c_cond, &th->th.th_suspend_mx.m_mutex );
1764#endif
1765
1766 if ( (status != 0) && (status != EINTR) && (status != ETIMEDOUT) ) {
1767 KMP_SYSFAIL( "pthread_cond_wait", status );
1768 }
1769#ifdef KMP_DEBUG
1770 if (status == ETIMEDOUT) {
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001771 if ( flag->is_sleeping() ) {
1772 KF_TRACE( 100, ( "__kmp_suspend_template: T#%d timeout wakeup\n", th_gtid ) );
Jim Cownie5e8470a2013-09-27 10:38:44 +00001773 } else {
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001774 KF_TRACE( 2, ( "__kmp_suspend_template: T#%d timeout wakeup, sleep bit not set!\n",
Jim Cownie5e8470a2013-09-27 10:38:44 +00001775 th_gtid ) );
1776 }
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001777 } else if ( flag->is_sleeping() ) {
1778 KF_TRACE( 100, ( "__kmp_suspend_template: T#%d spurious wakeup\n", th_gtid ) );
Jim Cownie5e8470a2013-09-27 10:38:44 +00001779 }
1780#endif
Jim Cownie5e8470a2013-09-27 10:38:44 +00001781 } // while
1782
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001783 // Mark the thread as active again (if it was previous marked as inactive)
Jim Cownie5e8470a2013-09-27 10:38:44 +00001784 if ( deactivated ) {
1785 th->th.th_active = TRUE;
1786 if ( TCR_4(th->th.th_in_pool) ) {
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001787 KMP_TEST_THEN_INC32( (kmp_int32 *) &__kmp_thread_pool_active_nth );
Jim Cownie5e8470a2013-09-27 10:38:44 +00001788 th->th.th_active_in_pool = TRUE;
1789 }
1790 }
1791 }
1792
1793#ifdef DEBUG_SUSPEND
1794 {
1795 char buffer[128];
1796 __kmp_print_cond( buffer, &th->th.th_suspend_cv);
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001797 __kmp_printf( "__kmp_suspend_template: T#%d has awakened: %s\n", th_gtid, buffer );
Jim Cownie5e8470a2013-09-27 10:38:44 +00001798 }
1799#endif
1800
1801
1802 status = pthread_mutex_unlock( &th->th.th_suspend_mx.m_mutex );
1803 KMP_CHECK_SYSFAIL( "pthread_mutex_unlock", status );
1804
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001805 KF_TRACE( 30, ("__kmp_suspend_template: T#%d exit\n", th_gtid ) );
1806}
1807
1808void __kmp_suspend_32(int th_gtid, kmp_flag_32 *flag) {
1809 __kmp_suspend_template(th_gtid, flag);
1810}
1811void __kmp_suspend_64(int th_gtid, kmp_flag_64 *flag) {
1812 __kmp_suspend_template(th_gtid, flag);
1813}
1814void __kmp_suspend_oncore(int th_gtid, kmp_flag_oncore *flag) {
1815 __kmp_suspend_template(th_gtid, flag);
Jim Cownie5e8470a2013-09-27 10:38:44 +00001816}
1817
1818
1819/* This routine signals the thread specified by target_gtid to wake up
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001820 * after setting the sleep bit indicated by the flag argument to FALSE.
1821 * The target thread must already have called __kmp_suspend_template()
Jim Cownie5e8470a2013-09-27 10:38:44 +00001822 */
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001823template <class C>
1824static inline void __kmp_resume_template( int target_gtid, C *flag )
Jim Cownie5e8470a2013-09-27 10:38:44 +00001825{
1826 kmp_info_t *th = __kmp_threads[target_gtid];
1827 int status;
Jim Cownie5e8470a2013-09-27 10:38:44 +00001828
1829#ifdef KMP_DEBUG
1830 int gtid = TCR_4(__kmp_init_gtid) ? __kmp_get_gtid() : -1;
1831#endif
1832
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001833 KF_TRACE( 30, ( "__kmp_resume_template: T#%d wants to wakeup T#%d enter\n", gtid, target_gtid ) );
Jim Cownie5e8470a2013-09-27 10:38:44 +00001834 KMP_DEBUG_ASSERT( gtid != target_gtid );
1835
1836 __kmp_suspend_initialize_thread( th );
1837
1838 status = pthread_mutex_lock( &th->th.th_suspend_mx.m_mutex );
1839 KMP_CHECK_SYSFAIL( "pthread_mutex_lock", status );
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001840
1841 if (!flag) {
1842 flag = (C *)th->th.th_sleep_loc;
1843 }
1844
1845 if (!flag) {
1846 KF_TRACE( 5, ( "__kmp_resume_template: T#%d exiting, thread T#%d already awake: flag(%p)\n",
1847 gtid, target_gtid, NULL ) );
1848 status = pthread_mutex_unlock( &th->th.th_suspend_mx.m_mutex );
1849 KMP_CHECK_SYSFAIL( "pthread_mutex_unlock", status );
1850 return;
1851 }
1852 else {
1853 typename C::flag_t old_spin = flag->unset_sleeping();
1854 if ( ! flag->is_sleeping_val(old_spin) ) {
1855 KF_TRACE( 5, ( "__kmp_resume_template: T#%d exiting, thread T#%d already awake: flag(%p): "
1856 "%u => %u\n",
1857 gtid, target_gtid, flag->get(), old_spin, *flag->get() ) );
Jim Cownie5e8470a2013-09-27 10:38:44 +00001858
1859 status = pthread_mutex_unlock( &th->th.th_suspend_mx.m_mutex );
1860 KMP_CHECK_SYSFAIL( "pthread_mutex_unlock", status );
1861 return;
1862 }
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001863 KF_TRACE( 5, ( "__kmp_resume_template: T#%d about to wakeup T#%d, reset sleep bit for flag's loc(%p): "
1864 "%u => %u\n",
1865 gtid, target_gtid, flag->get(), old_spin, *flag->get() ) );
Jim Cownie5e8470a2013-09-27 10:38:44 +00001866 }
1867 TCW_PTR(th->th.th_sleep_loc, NULL);
1868
Jim Cownie5e8470a2013-09-27 10:38:44 +00001869
1870#ifdef DEBUG_SUSPEND
1871 {
1872 char buffer[128];
1873 __kmp_print_cond( buffer, &th->th.th_suspend_cv );
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001874 __kmp_printf( "__kmp_resume_template: T#%d resuming T#%d: %s\n", gtid, target_gtid, buffer );
Jim Cownie5e8470a2013-09-27 10:38:44 +00001875 }
1876#endif
1877
1878
1879 status = pthread_cond_signal( &th->th.th_suspend_cv.c_cond );
1880 KMP_CHECK_SYSFAIL( "pthread_cond_signal", status );
1881 status = pthread_mutex_unlock( &th->th.th_suspend_mx.m_mutex );
1882 KMP_CHECK_SYSFAIL( "pthread_mutex_unlock", status );
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001883 KF_TRACE( 30, ( "__kmp_resume_template: T#%d exiting after signaling wake up for T#%d\n",
Jim Cownie5e8470a2013-09-27 10:38:44 +00001884 gtid, target_gtid ) );
1885}
1886
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001887void __kmp_resume_32(int target_gtid, kmp_flag_32 *flag) {
1888 __kmp_resume_template(target_gtid, flag);
1889}
1890void __kmp_resume_64(int target_gtid, kmp_flag_64 *flag) {
1891 __kmp_resume_template(target_gtid, flag);
1892}
1893void __kmp_resume_oncore(int target_gtid, kmp_flag_oncore *flag) {
1894 __kmp_resume_template(target_gtid, flag);
1895}
1896
Jim Cownie07ea89f2014-09-03 11:10:54 +00001897void
1898__kmp_resume_monitor()
1899{
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001900 KMP_TIME_BLOCK(USER_resume);
Jim Cownie07ea89f2014-09-03 11:10:54 +00001901 int status;
1902#ifdef KMP_DEBUG
1903 int gtid = TCR_4(__kmp_init_gtid) ? __kmp_get_gtid() : -1;
1904 KF_TRACE( 30, ( "__kmp_resume_monitor: T#%d wants to wakeup T#%d enter\n",
1905 gtid, KMP_GTID_MONITOR ) );
1906 KMP_DEBUG_ASSERT( gtid != KMP_GTID_MONITOR );
1907#endif
1908 status = pthread_mutex_lock( &__kmp_wait_mx.m_mutex );
1909 KMP_CHECK_SYSFAIL( "pthread_mutex_lock", status );
1910#ifdef DEBUG_SUSPEND
1911 {
1912 char buffer[128];
1913 __kmp_print_cond( buffer, &__kmp_wait_cv.c_cond );
1914 __kmp_printf( "__kmp_resume_monitor: T#%d resuming T#%d: %s\n", gtid, KMP_GTID_MONITOR, buffer );
1915 }
1916#endif
1917 status = pthread_cond_signal( &__kmp_wait_cv.c_cond );
1918 KMP_CHECK_SYSFAIL( "pthread_cond_signal", status );
1919 status = pthread_mutex_unlock( &__kmp_wait_mx.m_mutex );
1920 KMP_CHECK_SYSFAIL( "pthread_mutex_unlock", status );
1921 KF_TRACE( 30, ( "__kmp_resume_monitor: T#%d exiting after signaling wake up for T#%d\n",
1922 gtid, KMP_GTID_MONITOR ) );
1923}
Jim Cownie5e8470a2013-09-27 10:38:44 +00001924
1925/* ------------------------------------------------------------------------ */
1926/* ------------------------------------------------------------------------ */
1927
1928void
1929__kmp_yield( int cond )
1930{
1931 if (cond && __kmp_yielding_on) {
1932 sched_yield();
1933 }
1934}
1935
1936/* ------------------------------------------------------------------------ */
1937/* ------------------------------------------------------------------------ */
1938
1939void
1940__kmp_gtid_set_specific( int gtid )
1941{
1942 int status;
1943 KMP_ASSERT( __kmp_init_runtime );
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001944 status = pthread_setspecific( __kmp_gtid_threadprivate_key, (void*)(intptr_t)(gtid+1) );
Jim Cownie5e8470a2013-09-27 10:38:44 +00001945 KMP_CHECK_SYSFAIL( "pthread_setspecific", status );
1946}
1947
1948int
1949__kmp_gtid_get_specific()
1950{
1951 int gtid;
1952 if ( !__kmp_init_runtime ) {
1953 KA_TRACE( 50, ("__kmp_get_specific: runtime shutdown, returning KMP_GTID_SHUTDOWN\n" ) );
1954 return KMP_GTID_SHUTDOWN;
1955 }
1956 gtid = (int)(size_t)pthread_getspecific( __kmp_gtid_threadprivate_key );
1957 if ( gtid == 0 ) {
1958 gtid = KMP_GTID_DNE;
1959 }
1960 else {
1961 gtid--;
1962 }
1963 KA_TRACE( 50, ("__kmp_gtid_get_specific: key:%d gtid:%d\n",
1964 __kmp_gtid_threadprivate_key, gtid ));
1965 return gtid;
1966}
1967
1968/* ------------------------------------------------------------------------ */
1969/* ------------------------------------------------------------------------ */
1970
1971double
1972__kmp_read_cpu_time( void )
1973{
1974 /*clock_t t;*/
1975 struct tms buffer;
1976
1977 /*t =*/ times( & buffer );
1978
1979 return (buffer.tms_utime + buffer.tms_cutime) / (double) CLOCKS_PER_SEC;
1980}
1981
1982int
1983__kmp_read_system_info( struct kmp_sys_info *info )
1984{
1985 int status;
1986 struct rusage r_usage;
1987
1988 memset( info, 0, sizeof( *info ) );
1989
1990 status = getrusage( RUSAGE_SELF, &r_usage);
1991 KMP_CHECK_SYSFAIL_ERRNO( "getrusage", status );
1992
1993 info->maxrss = r_usage.ru_maxrss; /* the maximum resident set size utilized (in kilobytes) */
1994 info->minflt = r_usage.ru_minflt; /* the number of page faults serviced without any I/O */
1995 info->majflt = r_usage.ru_majflt; /* the number of page faults serviced that required I/O */
1996 info->nswap = r_usage.ru_nswap; /* the number of times a process was "swapped" out of memory */
1997 info->inblock = r_usage.ru_inblock; /* the number of times the file system had to perform input */
1998 info->oublock = r_usage.ru_oublock; /* the number of times the file system had to perform output */
1999 info->nvcsw = r_usage.ru_nvcsw; /* the number of times a context switch was voluntarily */
2000 info->nivcsw = r_usage.ru_nivcsw; /* the number of times a context switch was forced */
2001
2002 return (status != 0);
2003}
2004
2005/* ------------------------------------------------------------------------ */
2006/* ------------------------------------------------------------------------ */
2007
2008
2009void
2010__kmp_read_system_time( double *delta )
2011{
2012 double t_ns;
2013 struct timeval tval;
2014 struct timespec stop;
2015 int status;
2016
2017 status = gettimeofday( &tval, NULL );
2018 KMP_CHECK_SYSFAIL_ERRNO( "gettimeofday", status );
2019 TIMEVAL_TO_TIMESPEC( &tval, &stop );
2020 t_ns = TS2NS(stop) - TS2NS(__kmp_sys_timer_data.start);
2021 *delta = (t_ns * 1e-9);
2022}
2023
2024void
2025__kmp_clear_system_time( void )
2026{
2027 struct timeval tval;
2028 int status;
2029 status = gettimeofday( &tval, NULL );
2030 KMP_CHECK_SYSFAIL_ERRNO( "gettimeofday", status );
2031 TIMEVAL_TO_TIMESPEC( &tval, &__kmp_sys_timer_data.start );
2032}
2033
2034/* ------------------------------------------------------------------------ */
2035/* ------------------------------------------------------------------------ */
2036
2037#ifdef BUILD_TV
2038
2039void
2040__kmp_tv_threadprivate_store( kmp_info_t *th, void *global_addr, void *thread_addr )
2041{
2042 struct tv_data *p;
2043
2044 p = (struct tv_data *) __kmp_allocate( sizeof( *p ) );
2045
2046 p->u.tp.global_addr = global_addr;
2047 p->u.tp.thread_addr = thread_addr;
2048
2049 p->type = (void *) 1;
2050
2051 p->next = th->th.th_local.tv_data;
2052 th->th.th_local.tv_data = p;
2053
2054 if ( p->next == 0 ) {
2055 int rc = pthread_setspecific( __kmp_tv_key, p );
2056 KMP_CHECK_SYSFAIL( "pthread_setspecific", rc );
2057 }
2058}
2059
2060#endif /* BUILD_TV */
2061
2062/* ------------------------------------------------------------------------ */
2063/* ------------------------------------------------------------------------ */
2064
2065static int
2066__kmp_get_xproc( void ) {
2067
2068 int r = 0;
2069
2070 #if KMP_OS_LINUX
2071
2072 r = sysconf( _SC_NPROCESSORS_ONLN );
2073
2074 #elif KMP_OS_DARWIN
2075
2076 // Bug C77011 High "OpenMP Threads and number of active cores".
2077
2078 // Find the number of available CPUs.
2079 kern_return_t rc;
2080 host_basic_info_data_t info;
2081 mach_msg_type_number_t num = HOST_BASIC_INFO_COUNT;
2082 rc = host_info( mach_host_self(), HOST_BASIC_INFO, (host_info_t) & info, & num );
2083 if ( rc == 0 && num == HOST_BASIC_INFO_COUNT ) {
2084 // Cannot use KA_TRACE() here because this code works before trace support is
2085 // initialized.
2086 r = info.avail_cpus;
2087 } else {
2088 KMP_WARNING( CantGetNumAvailCPU );
2089 KMP_INFORM( AssumedNumCPU );
2090 }; // if
2091
Alp Toker763b9392014-02-28 09:42:41 +00002092 #elif KMP_OS_FREEBSD
2093
2094 int mib[] = { CTL_HW, HW_NCPU };
2095 size_t len = sizeof( r );
2096 if ( sysctl( mib, 2, &r, &len, NULL, 0 ) < 0 ) {
Jim Cownie4cc4bb42014-10-07 16:25:50 +00002097 r = 0;
2098 KMP_WARNING( CantGetNumAvailCPU );
2099 KMP_INFORM( AssumedNumCPU );
Alp Toker763b9392014-02-28 09:42:41 +00002100 }
2101
Jim Cownie5e8470a2013-09-27 10:38:44 +00002102 #else
2103
2104 #error "Unknown or unsupported OS."
2105
2106 #endif
2107
2108 return r > 0 ? r : 2; /* guess value of 2 if OS told us 0 */
2109
2110} // __kmp_get_xproc
2111
Jim Cownie181b4bb2013-12-23 17:28:57 +00002112int
2113__kmp_read_from_file( char const *path, char const *format, ... )
2114{
2115 int result;
2116 va_list args;
Jim Cownie5e8470a2013-09-27 10:38:44 +00002117
Jim Cownie181b4bb2013-12-23 17:28:57 +00002118 va_start(args, format);
2119 FILE *f = fopen(path, "rb");
2120 if ( f == NULL )
2121 return 0;
2122 result = vfscanf(f, format, args);
2123 fclose(f);
Jim Cownie5e8470a2013-09-27 10:38:44 +00002124
Jim Cownie5e8470a2013-09-27 10:38:44 +00002125 return result;
Jim Cownie181b4bb2013-12-23 17:28:57 +00002126}
Jim Cownie5e8470a2013-09-27 10:38:44 +00002127
2128void
2129__kmp_runtime_initialize( void )
2130{
2131 int status;
2132 pthread_mutexattr_t mutex_attr;
2133 pthread_condattr_t cond_attr;
2134
2135 if ( __kmp_init_runtime ) {
2136 return;
2137 }; // if
2138
2139 #if ( KMP_ARCH_X86 || KMP_ARCH_X86_64 )
2140 if ( ! __kmp_cpuinfo.initialized ) {
2141 __kmp_query_cpuid( &__kmp_cpuinfo );
2142 }; // if
2143 #endif /* KMP_ARCH_X86 || KMP_ARCH_X86_64 */
2144
Jim Cownie5e8470a2013-09-27 10:38:44 +00002145 __kmp_xproc = __kmp_get_xproc();
2146
2147 if ( sysconf( _SC_THREADS ) ) {
2148
2149 /* Query the maximum number of threads */
2150 __kmp_sys_max_nth = sysconf( _SC_THREAD_THREADS_MAX );
2151 if ( __kmp_sys_max_nth == -1 ) {
2152 /* Unlimited threads for NPTL */
2153 __kmp_sys_max_nth = INT_MAX;
2154 }
2155 else if ( __kmp_sys_max_nth <= 1 ) {
2156 /* Can't tell, just use PTHREAD_THREADS_MAX */
2157 __kmp_sys_max_nth = KMP_MAX_NTH;
2158 }
2159
2160 /* Query the minimum stack size */
2161 __kmp_sys_min_stksize = sysconf( _SC_THREAD_STACK_MIN );
2162 if ( __kmp_sys_min_stksize <= 1 ) {
2163 __kmp_sys_min_stksize = KMP_MIN_STKSIZE;
2164 }
2165 }
2166
2167 /* Set up minimum number of threads to switch to TLS gtid */
2168 __kmp_tls_gtid_min = KMP_TLS_GTID_MIN;
2169
2170
2171 #ifdef BUILD_TV
2172 {
2173 int rc = pthread_key_create( & __kmp_tv_key, 0 );
2174 KMP_CHECK_SYSFAIL( "pthread_key_create", rc );
2175 }
2176 #endif
2177
2178 status = pthread_key_create( &__kmp_gtid_threadprivate_key, __kmp_internal_end_dest );
2179 KMP_CHECK_SYSFAIL( "pthread_key_create", status );
2180 status = pthread_mutexattr_init( & mutex_attr );
2181 KMP_CHECK_SYSFAIL( "pthread_mutexattr_init", status );
2182 status = pthread_mutex_init( & __kmp_wait_mx.m_mutex, & mutex_attr );
2183 KMP_CHECK_SYSFAIL( "pthread_mutex_init", status );
2184 status = pthread_condattr_init( & cond_attr );
2185 KMP_CHECK_SYSFAIL( "pthread_condattr_init", status );
2186 status = pthread_cond_init( & __kmp_wait_cv.c_cond, & cond_attr );
2187 KMP_CHECK_SYSFAIL( "pthread_cond_init", status );
2188#if USE_ITT_BUILD
2189 __kmp_itt_initialize();
2190#endif /* USE_ITT_BUILD */
2191
2192 __kmp_init_runtime = TRUE;
2193}
2194
2195void
2196__kmp_runtime_destroy( void )
2197{
2198 int status;
2199
2200 if ( ! __kmp_init_runtime ) {
2201 return; // Nothing to do.
2202 };
2203
2204#if USE_ITT_BUILD
2205 __kmp_itt_destroy();
2206#endif /* USE_ITT_BUILD */
2207
2208 status = pthread_key_delete( __kmp_gtid_threadprivate_key );
2209 KMP_CHECK_SYSFAIL( "pthread_key_delete", status );
2210 #ifdef BUILD_TV
2211 status = pthread_key_delete( __kmp_tv_key );
2212 KMP_CHECK_SYSFAIL( "pthread_key_delete", status );
2213 #endif
2214
2215 status = pthread_mutex_destroy( & __kmp_wait_mx.m_mutex );
2216 if ( status != 0 && status != EBUSY ) {
2217 KMP_SYSFAIL( "pthread_mutex_destroy", status );
2218 }
2219 status = pthread_cond_destroy( & __kmp_wait_cv.c_cond );
2220 if ( status != 0 && status != EBUSY ) {
2221 KMP_SYSFAIL( "pthread_cond_destroy", status );
2222 }
Alp Toker763b9392014-02-28 09:42:41 +00002223 #if KMP_AFFINITY_SUPPORTED
Jim Cownie5e8470a2013-09-27 10:38:44 +00002224 __kmp_affinity_uninitialize();
Jim Cownie5e8470a2013-09-27 10:38:44 +00002225 #endif
2226
2227 __kmp_init_runtime = FALSE;
2228}
2229
2230
2231/* Put the thread to sleep for a time period */
2232/* NOTE: not currently used anywhere */
2233void
2234__kmp_thread_sleep( int millis )
2235{
2236 sleep( ( millis + 500 ) / 1000 );
2237}
2238
2239/* Calculate the elapsed wall clock time for the user */
2240void
2241__kmp_elapsed( double *t )
2242{
2243 int status;
2244# ifdef FIX_SGI_CLOCK
2245 struct timespec ts;
2246
2247 status = clock_gettime( CLOCK_PROCESS_CPUTIME_ID, &ts );
2248 KMP_CHECK_SYSFAIL_ERRNO( "clock_gettime", status );
2249 *t = (double) ts.tv_nsec * (1.0 / (double) NSEC_PER_SEC) +
2250 (double) ts.tv_sec;
2251# else
2252 struct timeval tv;
2253
2254 status = gettimeofday( & tv, NULL );
2255 KMP_CHECK_SYSFAIL_ERRNO( "gettimeofday", status );
2256 *t = (double) tv.tv_usec * (1.0 / (double) USEC_PER_SEC) +
2257 (double) tv.tv_sec;
2258# endif
2259}
2260
2261/* Calculate the elapsed wall clock tick for the user */
2262void
2263__kmp_elapsed_tick( double *t )
2264{
2265 *t = 1 / (double) CLOCKS_PER_SEC;
2266}
2267
2268/*
2269 Determine whether the given address is mapped into the current address space.
2270*/
2271
2272int
2273__kmp_is_address_mapped( void * addr ) {
2274
2275 int found = 0;
2276 int rc;
2277
2278 #if KMP_OS_LINUX
2279
2280 /*
2281 On Linux* OS, read the /proc/<pid>/maps pseudo-file to get all the address ranges mapped
2282 into the address space.
2283 */
2284
2285 char * name = __kmp_str_format( "/proc/%d/maps", getpid() );
2286 FILE * file = NULL;
2287
2288 file = fopen( name, "r" );
2289 KMP_ASSERT( file != NULL );
2290
2291 for ( ; ; ) {
2292
2293 void * beginning = NULL;
2294 void * ending = NULL;
2295 char perms[ 5 ];
2296
2297 rc = fscanf( file, "%p-%p %4s %*[^\n]\n", & beginning, & ending, perms );
2298 if ( rc == EOF ) {
2299 break;
2300 }; // if
2301 KMP_ASSERT( rc == 3 && strlen( perms ) == 4 ); // Make sure all fields are read.
2302
2303 // Ending address is not included in the region, but beginning is.
2304 if ( ( addr >= beginning ) && ( addr < ending ) ) {
2305 perms[ 2 ] = 0; // 3th and 4th character does not matter.
2306 if ( strcmp( perms, "rw" ) == 0 ) {
2307 // Memory we are looking for should be readable and writable.
2308 found = 1;
2309 }; // if
2310 break;
2311 }; // if
2312
2313 }; // forever
2314
2315 // Free resources.
2316 fclose( file );
2317 KMP_INTERNAL_FREE( name );
2318
2319 #elif KMP_OS_DARWIN
2320
2321 /*
2322 On OS X*, /proc pseudo filesystem is not available. Try to read memory using vm
2323 interface.
2324 */
2325
2326 int buffer;
2327 vm_size_t count;
2328 rc =
2329 vm_read_overwrite(
2330 mach_task_self(), // Task to read memory of.
2331 (vm_address_t)( addr ), // Address to read from.
2332 1, // Number of bytes to be read.
2333 (vm_address_t)( & buffer ), // Address of buffer to save read bytes in.
2334 & count // Address of var to save number of read bytes in.
2335 );
2336 if ( rc == 0 ) {
2337 // Memory successfully read.
2338 found = 1;
2339 }; // if
2340
Alp Toker763b9392014-02-28 09:42:41 +00002341 #elif KMP_OS_FREEBSD
2342
Jim Cownie4cc4bb42014-10-07 16:25:50 +00002343 // FIXME(FreeBSD*): Implement this
Alp Toker763b9392014-02-28 09:42:41 +00002344 found = 1;
2345
Jim Cownie5e8470a2013-09-27 10:38:44 +00002346 #else
2347
2348 #error "Unknown or unsupported OS"
2349
2350 #endif
2351
2352 return found;
2353
2354} // __kmp_is_address_mapped
2355
2356#ifdef USE_LOAD_BALANCE
2357
2358
2359# if KMP_OS_DARWIN
2360
2361// The function returns the rounded value of the system load average
2362// during given time interval which depends on the value of
2363// __kmp_load_balance_interval variable (default is 60 sec, other values
2364// may be 300 sec or 900 sec).
2365// It returns -1 in case of error.
2366int
2367__kmp_get_load_balance( int max )
2368{
2369 double averages[3];
2370 int ret_avg = 0;
2371
2372 int res = getloadavg( averages, 3 );
2373
2374 //Check __kmp_load_balance_interval to determine which of averages to use.
2375 // getloadavg() may return the number of samples less than requested that is
2376 // less than 3.
2377 if ( __kmp_load_balance_interval < 180 && ( res >= 1 ) ) {
2378 ret_avg = averages[0];// 1 min
2379 } else if ( ( __kmp_load_balance_interval >= 180
2380 && __kmp_load_balance_interval < 600 ) && ( res >= 2 ) ) {
2381 ret_avg = averages[1];// 5 min
2382 } else if ( ( __kmp_load_balance_interval >= 600 ) && ( res == 3 ) ) {
2383 ret_avg = averages[2];// 15 min
Alp Toker8f2d3f02014-02-24 10:40:15 +00002384 } else {// Error occurred
Jim Cownie5e8470a2013-09-27 10:38:44 +00002385 return -1;
2386 }
2387
2388 return ret_avg;
2389}
2390
2391# else // Linux* OS
2392
2393// The fuction returns number of running (not sleeping) threads, or -1 in case of error.
2394// Error could be reported if Linux* OS kernel too old (without "/proc" support).
2395// Counting running threads stops if max running threads encountered.
2396int
2397__kmp_get_load_balance( int max )
2398{
2399 static int permanent_error = 0;
2400
2401 static int glb_running_threads = 0; /* Saved count of the running threads for the thread balance algortihm */
2402 static double glb_call_time = 0; /* Thread balance algorithm call time */
2403
2404 int running_threads = 0; // Number of running threads in the system.
2405
2406 DIR * proc_dir = NULL; // Handle of "/proc/" directory.
2407 struct dirent * proc_entry = NULL;
2408
2409 kmp_str_buf_t task_path; // "/proc/<pid>/task/<tid>/" path.
2410 DIR * task_dir = NULL; // Handle of "/proc/<pid>/task/<tid>/" directory.
2411 struct dirent * task_entry = NULL;
2412 int task_path_fixed_len;
2413
2414 kmp_str_buf_t stat_path; // "/proc/<pid>/task/<tid>/stat" path.
2415 int stat_file = -1;
2416 int stat_path_fixed_len;
2417
2418 int total_processes = 0; // Total number of processes in system.
2419 int total_threads = 0; // Total number of threads in system.
2420
2421 double call_time = 0.0;
2422
2423 __kmp_str_buf_init( & task_path );
2424 __kmp_str_buf_init( & stat_path );
2425
2426 __kmp_elapsed( & call_time );
2427
2428 if ( glb_call_time &&
2429 ( call_time - glb_call_time < __kmp_load_balance_interval ) ) {
2430 running_threads = glb_running_threads;
2431 goto finish;
2432 }
2433
2434 glb_call_time = call_time;
2435
2436 // Do not spend time on scanning "/proc/" if we have a permanent error.
2437 if ( permanent_error ) {
2438 running_threads = -1;
2439 goto finish;
2440 }; // if
2441
2442 if ( max <= 0 ) {
2443 max = INT_MAX;
2444 }; // if
2445
2446 // Open "/proc/" directory.
2447 proc_dir = opendir( "/proc" );
2448 if ( proc_dir == NULL ) {
2449 // Cannot open "/prroc/". Probably the kernel does not support it. Return an error now and
2450 // in subsequent calls.
2451 running_threads = -1;
2452 permanent_error = 1;
2453 goto finish;
2454 }; // if
2455
2456 // Initialize fixed part of task_path. This part will not change.
2457 __kmp_str_buf_cat( & task_path, "/proc/", 6 );
2458 task_path_fixed_len = task_path.used; // Remember number of used characters.
2459
2460 proc_entry = readdir( proc_dir );
2461 while ( proc_entry != NULL ) {
2462 // Proc entry is a directory and name starts with a digit. Assume it is a process'
2463 // directory.
2464 if ( proc_entry->d_type == DT_DIR && isdigit( proc_entry->d_name[ 0 ] ) ) {
2465
2466 ++ total_processes;
2467 // Make sure init process is the very first in "/proc", so we can replace
2468 // strcmp( proc_entry->d_name, "1" ) == 0 with simpler total_processes == 1.
2469 // We are going to check that total_processes == 1 => d_name == "1" is true (where
2470 // "=>" is implication). Since C++ does not have => operator, let us replace it with its
2471 // equivalent: a => b == ! a || b.
2472 KMP_DEBUG_ASSERT( total_processes != 1 || strcmp( proc_entry->d_name, "1" ) == 0 );
2473
2474 // Construct task_path.
2475 task_path.used = task_path_fixed_len; // Reset task_path to "/proc/".
2476 __kmp_str_buf_cat( & task_path, proc_entry->d_name, strlen( proc_entry->d_name ) );
2477 __kmp_str_buf_cat( & task_path, "/task", 5 );
2478
2479 task_dir = opendir( task_path.str );
2480 if ( task_dir == NULL ) {
2481 // Process can finish between reading "/proc/" directory entry and opening process'
2482 // "task/" directory. So, in general case we should not complain, but have to skip
2483 // this process and read the next one.
2484 // But on systems with no "task/" support we will spend lot of time to scan "/proc/"
2485 // tree again and again without any benefit. "init" process (its pid is 1) should
2486 // exist always, so, if we cannot open "/proc/1/task/" directory, it means "task/"
2487 // is not supported by kernel. Report an error now and in the future.
2488 if ( strcmp( proc_entry->d_name, "1" ) == 0 ) {
2489 running_threads = -1;
2490 permanent_error = 1;
2491 goto finish;
2492 }; // if
2493 } else {
2494 // Construct fixed part of stat file path.
2495 __kmp_str_buf_clear( & stat_path );
2496 __kmp_str_buf_cat( & stat_path, task_path.str, task_path.used );
2497 __kmp_str_buf_cat( & stat_path, "/", 1 );
2498 stat_path_fixed_len = stat_path.used;
2499
2500 task_entry = readdir( task_dir );
2501 while ( task_entry != NULL ) {
2502 // It is a directory and name starts with a digit.
2503 if ( proc_entry->d_type == DT_DIR && isdigit( task_entry->d_name[ 0 ] ) ) {
2504
2505 ++ total_threads;
2506
2507 // Consruct complete stat file path. Easiest way would be:
2508 // __kmp_str_buf_print( & stat_path, "%s/%s/stat", task_path.str, task_entry->d_name );
2509 // but seriae of __kmp_str_buf_cat works a bit faster.
2510 stat_path.used = stat_path_fixed_len; // Reset stat path to its fixed part.
2511 __kmp_str_buf_cat( & stat_path, task_entry->d_name, strlen( task_entry->d_name ) );
2512 __kmp_str_buf_cat( & stat_path, "/stat", 5 );
2513
2514 // Note: Low-level API (open/read/close) is used. High-level API
2515 // (fopen/fclose) works ~ 30 % slower.
2516 stat_file = open( stat_path.str, O_RDONLY );
2517 if ( stat_file == -1 ) {
2518 // We cannot report an error because task (thread) can terminate just
2519 // before reading this file.
2520 } else {
2521 /*
2522 Content of "stat" file looks like:
2523
2524 24285 (program) S ...
2525
2526 It is a single line (if program name does not include fanny
2527 symbols). First number is a thread id, then name of executable file
2528 name in paretheses, then state of the thread. We need just thread
2529 state.
2530
2531 Good news: Length of program name is 15 characters max. Longer
2532 names are truncated.
2533
2534 Thus, we need rather short buffer: 15 chars for program name +
2535 2 parenthesis, + 3 spaces + ~7 digits of pid = 37.
2536
2537 Bad news: Program name may contain special symbols like space,
2538 closing parenthesis, or even new line. This makes parsing "stat"
2539 file not 100 % reliable. In case of fanny program names parsing
2540 may fail (report incorrect thread state).
2541
2542 Parsing "status" file looks more promissing (due to different
2543 file structure and escaping special symbols) but reading and
2544 parsing of "status" file works slower.
2545
2546 -- ln
2547 */
2548 char buffer[ 65 ];
2549 int len;
2550 len = read( stat_file, buffer, sizeof( buffer ) - 1 );
2551 if ( len >= 0 ) {
2552 buffer[ len ] = 0;
2553 // Using scanf:
2554 // sscanf( buffer, "%*d (%*s) %c ", & state );
2555 // looks very nice, but searching for a closing parenthesis works a
2556 // bit faster.
2557 char * close_parent = strstr( buffer, ") " );
2558 if ( close_parent != NULL ) {
2559 char state = * ( close_parent + 2 );
2560 if ( state == 'R' ) {
2561 ++ running_threads;
2562 if ( running_threads >= max ) {
2563 goto finish;
2564 }; // if
2565 }; // if
2566 }; // if
2567 }; // if
2568 close( stat_file );
2569 stat_file = -1;
2570 }; // if
2571 }; // if
2572 task_entry = readdir( task_dir );
2573 }; // while
2574 closedir( task_dir );
2575 task_dir = NULL;
2576 }; // if
2577 }; // if
2578 proc_entry = readdir( proc_dir );
2579 }; // while
2580
2581 //
2582 // There _might_ be a timing hole where the thread executing this
2583 // code get skipped in the load balance, and running_threads is 0.
2584 // Assert in the debug builds only!!!
2585 //
2586 KMP_DEBUG_ASSERT( running_threads > 0 );
2587 if ( running_threads <= 0 ) {
2588 running_threads = 1;
2589 }
2590
2591 finish: // Clean up and exit.
2592 if ( proc_dir != NULL ) {
2593 closedir( proc_dir );
2594 }; // if
2595 __kmp_str_buf_free( & task_path );
2596 if ( task_dir != NULL ) {
2597 closedir( task_dir );
2598 }; // if
2599 __kmp_str_buf_free( & stat_path );
2600 if ( stat_file != -1 ) {
2601 close( stat_file );
2602 }; // if
2603
2604 glb_running_threads = running_threads;
2605
2606 return running_threads;
2607
2608} // __kmp_get_load_balance
2609
2610# endif // KMP_OS_DARWIN
2611
2612#endif // USE_LOAD_BALANCE
2613
Jim Cownie181b4bb2013-12-23 17:28:57 +00002614
Andrey Churbanovcbda8682015-01-13 14:43:35 +00002615#if KMP_COMPILER_GCC && !(KMP_ARCH_X86 || KMP_ARCH_X86_64 || KMP_ARCH_PPC64 || KMP_ARCH_AARCH64)
Jim Cownie181b4bb2013-12-23 17:28:57 +00002616
2617int __kmp_invoke_microtask( microtask_t pkfn, int gtid, int tid, int argc,
2618 void *p_argv[] )
2619{
2620 int argc_full = argc + 2;
2621 int i;
2622 ffi_cif cif;
2623 ffi_type *types[argc_full];
2624 void *args[argc_full];
2625 void *idp[2];
2626
2627 /* We're only passing pointers to the target. */
2628 for (i = 0; i < argc_full; i++)
2629 types[i] = &ffi_type_pointer;
2630
2631 /* Ugly double-indirection, but that's how it goes... */
2632 idp[0] = &gtid;
2633 idp[1] = &tid;
2634 args[0] = &idp[0];
2635 args[1] = &idp[1];
2636
2637 for (i = 0; i < argc; i++)
2638 args[2 + i] = &p_argv[i];
2639
2640 if (ffi_prep_cif(&cif, FFI_DEFAULT_ABI, argc_full,
2641 &ffi_type_void, types) != FFI_OK)
2642 abort();
2643
2644 ffi_call(&cif, (void (*)(void))pkfn, NULL, args);
2645
2646 return 1;
2647}
2648
Jim Cownie3051f972014-08-07 10:12:54 +00002649#endif // KMP_COMPILER_GCC && !(KMP_ARCH_X86 || KMP_ARCH_X86_64 || KMP_ARCH_PPC64)
2650
Andrey Churbanovcbda8682015-01-13 14:43:35 +00002651#if KMP_ARCH_PPC64 || KMP_ARCH_AARCH64
Jim Cownie3051f972014-08-07 10:12:54 +00002652
2653// we really only need the case with 1 argument, because CLANG always build
2654// a struct of pointers to shared variables referenced in the outlined function
2655int
2656__kmp_invoke_microtask( microtask_t pkfn,
2657 int gtid, int tid,
2658 int argc, void *p_argv[] ) {
2659 switch (argc) {
2660 default:
2661 fprintf(stderr, "Too many args to microtask: %d!\n", argc);
2662 fflush(stderr);
2663 exit(-1);
2664 case 0:
2665 (*pkfn)(&gtid, &tid);
2666 break;
2667 case 1:
2668 (*pkfn)(&gtid, &tid, p_argv[0]);
2669 break;
2670 case 2:
2671 (*pkfn)(&gtid, &tid, p_argv[0], p_argv[1]);
2672 break;
2673 case 3:
2674 (*pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2]);
2675 break;
2676 case 4:
2677 (*pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2], p_argv[3]);
2678 break;
2679 case 5:
2680 (*pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2], p_argv[3], p_argv[4]);
2681 break;
2682 case 6:
2683 (*pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2], p_argv[3], p_argv[4],
2684 p_argv[5]);
2685 break;
2686 case 7:
2687 (*pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2], p_argv[3], p_argv[4],
2688 p_argv[5], p_argv[6]);
2689 break;
2690 case 8:
2691 (*pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2], p_argv[3], p_argv[4],
2692 p_argv[5], p_argv[6], p_argv[7]);
2693 break;
2694 case 9:
2695 (*pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2], p_argv[3], p_argv[4],
2696 p_argv[5], p_argv[6], p_argv[7], p_argv[8]);
2697 break;
2698 case 10:
2699 (*pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2], p_argv[3], p_argv[4],
2700 p_argv[5], p_argv[6], p_argv[7], p_argv[8], p_argv[9]);
2701 break;
2702 case 11:
2703 (*pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2], p_argv[3], p_argv[4],
2704 p_argv[5], p_argv[6], p_argv[7], p_argv[8], p_argv[9], p_argv[10]);
2705 break;
2706 case 12:
2707 (*pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2], p_argv[3], p_argv[4],
2708 p_argv[5], p_argv[6], p_argv[7], p_argv[8], p_argv[9], p_argv[10],
2709 p_argv[11]);
2710 break;
2711 case 13:
2712 (*pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2], p_argv[3], p_argv[4],
2713 p_argv[5], p_argv[6], p_argv[7], p_argv[8], p_argv[9], p_argv[10],
2714 p_argv[11], p_argv[12]);
2715 break;
2716 case 14:
2717 (*pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2], p_argv[3], p_argv[4],
2718 p_argv[5], p_argv[6], p_argv[7], p_argv[8], p_argv[9], p_argv[10],
2719 p_argv[11], p_argv[12], p_argv[13]);
2720 break;
2721 case 15:
2722 (*pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2], p_argv[3], p_argv[4],
2723 p_argv[5], p_argv[6], p_argv[7], p_argv[8], p_argv[9], p_argv[10],
2724 p_argv[11], p_argv[12], p_argv[13], p_argv[14]);
2725 break;
2726 }
2727
2728 return 1;
2729}
2730
2731#endif
Jim Cownie181b4bb2013-12-23 17:28:57 +00002732
Jim Cownie5e8470a2013-09-27 10:38:44 +00002733// end of file //
2734