blob: 3cce67c742c7cf35dd0e6ddc4005e0ba6016ca8e [file] [log] [blame]
Jim Cownie5e8470a2013-09-27 10:38:44 +00001/*
2 * kmp_gsupport.c
Jim Cownie4cc4bb42014-10-07 16:25:50 +00003 * $Revision: 43473 $
4 * $Date: 2014-09-26 15:02:57 -0500 (Fri, 26 Sep 2014) $
Jim Cownie5e8470a2013-09-27 10:38:44 +00005 */
6
7
8//===----------------------------------------------------------------------===//
9//
10// The LLVM Compiler Infrastructure
11//
12// This file is dual licensed under the MIT and the University of Illinois Open
13// Source Licenses. See LICENSE.txt for details.
14//
15//===----------------------------------------------------------------------===//
16
17
Jim Cownie3051f972014-08-07 10:12:54 +000018#if defined(__x86_64) || defined (__powerpc64__)
Jim Cownie5e8470a2013-09-27 10:38:44 +000019# define KMP_I8
20#endif
21#include "kmp.h"
22#include "kmp_atomic.h"
23
24#ifdef __cplusplus
25 extern "C" {
26#endif // __cplusplus
27
//
// MKLOC(loc, routine): define a static ident_t named `loc`, initialized with
// a placeholder location string.  The `routine` argument is accepted but is
// not used by the expansion.  The expansion already ends in a semicolon, so
// writing `MKLOC(x, "y");` produces one extra empty statement.
//
#define MKLOC(loc,routine) \
    static ident_t (loc) = { \
        0, KMP_IDENT_KMPC, 0, 0, ";unknown;unknown;0;0;;" \
    };
30
Jim Cownie181b4bb2013-12-23 17:28:57 +000031#include "kmp_ftn_os.h"
Jim Cownie5e8470a2013-09-27 10:38:44 +000032
33void
Jim Cownie181b4bb2013-12-23 17:28:57 +000034xexpand(KMP_API_NAME_GOMP_BARRIER)(void)
Jim Cownie5e8470a2013-09-27 10:38:44 +000035{
36 int gtid = __kmp_entry_gtid();
37 MKLOC(loc, "GOMP_barrier");
38 KA_TRACE(20, ("GOMP_barrier: T#%d\n", gtid));
39 __kmpc_barrier(&loc, gtid);
40}
41
42
43/* */
44//
45// Mutual exclusion
46//
47
48//
// The symbol that icc/ifort generates for unnamed critical
// sections - .gomp_critical_user_ - is defined using .comm in any objects
// that reference it.  We can't reference it directly here in C code, as the
// symbol contains a ".".
//
// The RTL contains an assembly language definition of .gomp_critical_user_
// with another symbol __kmp_unnamed_critical_addr initialized with its
// address.
57//
58extern kmp_critical_name *__kmp_unnamed_critical_addr;
59
60
61void
Jim Cownie181b4bb2013-12-23 17:28:57 +000062xexpand(KMP_API_NAME_GOMP_CRITICAL_START)(void)
Jim Cownie5e8470a2013-09-27 10:38:44 +000063{
64 int gtid = __kmp_entry_gtid();
65 MKLOC(loc, "GOMP_critical_start");
66 KA_TRACE(20, ("GOMP_critical_start: T#%d\n", gtid));
67 __kmpc_critical(&loc, gtid, __kmp_unnamed_critical_addr);
68}
69
70
71void
Jim Cownie181b4bb2013-12-23 17:28:57 +000072xexpand(KMP_API_NAME_GOMP_CRITICAL_END)(void)
Jim Cownie5e8470a2013-09-27 10:38:44 +000073{
74 int gtid = __kmp_get_gtid();
75 MKLOC(loc, "GOMP_critical_end");
76 KA_TRACE(20, ("GOMP_critical_end: T#%d\n", gtid));
77 __kmpc_end_critical(&loc, gtid, __kmp_unnamed_critical_addr);
78}
79
80
81void
Jim Cownie181b4bb2013-12-23 17:28:57 +000082xexpand(KMP_API_NAME_GOMP_CRITICAL_NAME_START)(void **pptr)
Jim Cownie5e8470a2013-09-27 10:38:44 +000083{
84 int gtid = __kmp_entry_gtid();
85 MKLOC(loc, "GOMP_critical_name_start");
86 KA_TRACE(20, ("GOMP_critical_name_start: T#%d\n", gtid));
87 __kmpc_critical(&loc, gtid, (kmp_critical_name *)pptr);
88}
89
90
91void
Jim Cownie181b4bb2013-12-23 17:28:57 +000092xexpand(KMP_API_NAME_GOMP_CRITICAL_NAME_END)(void **pptr)
Jim Cownie5e8470a2013-09-27 10:38:44 +000093{
94 int gtid = __kmp_get_gtid();
95 MKLOC(loc, "GOMP_critical_name_end");
96 KA_TRACE(20, ("GOMP_critical_name_end: T#%d\n", gtid));
97 __kmpc_end_critical(&loc, gtid, (kmp_critical_name *)pptr);
98}
99
100
101//
102// The Gnu codegen tries to use locked operations to perform atomic updates
103// inline. If it can't, then it calls GOMP_atomic_start() before performing
104// the update and GOMP_atomic_end() afterward, regardless of the data type.
105//
106
107void
Jim Cownie181b4bb2013-12-23 17:28:57 +0000108xexpand(KMP_API_NAME_GOMP_ATOMIC_START)(void)
Jim Cownie5e8470a2013-09-27 10:38:44 +0000109{
110 int gtid = __kmp_entry_gtid();
111 KA_TRACE(20, ("GOMP_atomic_start: T#%d\n", gtid));
112 __kmp_acquire_atomic_lock(&__kmp_atomic_lock, gtid);
113}
114
115
116void
Jim Cownie181b4bb2013-12-23 17:28:57 +0000117xexpand(KMP_API_NAME_GOMP_ATOMIC_END)(void)
Jim Cownie5e8470a2013-09-27 10:38:44 +0000118{
119 int gtid = __kmp_get_gtid();
120 KA_TRACE(20, ("GOMP_atomic_start: T#%d\n", gtid));
121 __kmp_release_atomic_lock(&__kmp_atomic_lock, gtid);
122}
123
124
125int
Jim Cownie181b4bb2013-12-23 17:28:57 +0000126xexpand(KMP_API_NAME_GOMP_SINGLE_START)(void)
Jim Cownie5e8470a2013-09-27 10:38:44 +0000127{
128 int gtid = __kmp_entry_gtid();
129 MKLOC(loc, "GOMP_single_start");
130 KA_TRACE(20, ("GOMP_single_start: T#%d\n", gtid));
131
132 if (! TCR_4(__kmp_init_parallel))
133 __kmp_parallel_initialize();
134
135 //
136 // 3rd parameter == FALSE prevents kmp_enter_single from pushing a
137 // workshare when USE_CHECKS is defined. We need to avoid the push,
138 // as there is no corresponding GOMP_single_end() call.
139 //
140 return __kmp_enter_single(gtid, &loc, FALSE);
141}
142
143
144void *
Jim Cownie181b4bb2013-12-23 17:28:57 +0000145xexpand(KMP_API_NAME_GOMP_SINGLE_COPY_START)(void)
Jim Cownie5e8470a2013-09-27 10:38:44 +0000146{
147 void *retval;
148 int gtid = __kmp_entry_gtid();
149 MKLOC(loc, "GOMP_single_copy_start");
150 KA_TRACE(20, ("GOMP_single_copy_start: T#%d\n", gtid));
151
152 if (! TCR_4(__kmp_init_parallel))
153 __kmp_parallel_initialize();
154
155 //
156 // If this is the first thread to enter, return NULL. The generated
157 // code will then call GOMP_single_copy_end() for this thread only,
158 // with the copyprivate data pointer as an argument.
159 //
160 if (__kmp_enter_single(gtid, &loc, FALSE))
161 return NULL;
162
163 //
164 // Wait for the first thread to set the copyprivate data pointer,
165 // and for all other threads to reach this point.
166 //
167 __kmp_barrier(bs_plain_barrier, gtid, FALSE, 0, NULL, NULL);
168
169 //
170 // Retrieve the value of the copyprivate data point, and wait for all
171 // threads to do likewise, then return.
172 //
173 retval = __kmp_team_from_gtid(gtid)->t.t_copypriv_data;
174 __kmp_barrier(bs_plain_barrier, gtid, FALSE, 0, NULL, NULL);
175 return retval;
176}
177
178
179void
Jim Cownie181b4bb2013-12-23 17:28:57 +0000180xexpand(KMP_API_NAME_GOMP_SINGLE_COPY_END)(void *data)
Jim Cownie5e8470a2013-09-27 10:38:44 +0000181{
182 int gtid = __kmp_get_gtid();
183 MKLOC(loc, "GOMP_single_copy_end");
184 KA_TRACE(20, ("GOMP_single_copy_end: T#%d\n", gtid));
185
186 //
187 // Set the copyprivate data pointer fo the team, then hit the barrier
188 // so that the other threads will continue on and read it. Hit another
189 // barrier before continuing, so that the know that the copyprivate
190 // data pointer has been propagated to all threads before trying to
191 // reuse the t_copypriv_data field.
192 //
193 __kmp_team_from_gtid(gtid)->t.t_copypriv_data = data;
194 __kmp_barrier(bs_plain_barrier, gtid, FALSE, 0, NULL, NULL);
195 __kmp_barrier(bs_plain_barrier, gtid, FALSE, 0, NULL, NULL);
196}
197
198
199void
Jim Cownie181b4bb2013-12-23 17:28:57 +0000200xexpand(KMP_API_NAME_GOMP_ORDERED_START)(void)
Jim Cownie5e8470a2013-09-27 10:38:44 +0000201{
202 int gtid = __kmp_entry_gtid();
203 MKLOC(loc, "GOMP_ordered_start");
204 KA_TRACE(20, ("GOMP_ordered_start: T#%d\n", gtid));
205 __kmpc_ordered(&loc, gtid);
206}
207
208
209void
Jim Cownie181b4bb2013-12-23 17:28:57 +0000210xexpand(KMP_API_NAME_GOMP_ORDERED_END)(void)
Jim Cownie5e8470a2013-09-27 10:38:44 +0000211{
212 int gtid = __kmp_get_gtid();
213 MKLOC(loc, "GOMP_ordered_end");
214 KA_TRACE(20, ("GOMP_ordered_start: T#%d\n", gtid));
215 __kmpc_end_ordered(&loc, gtid);
216}
217
218
219/* */
220//
221// Dispatch macro defs
222//
223// They come in two flavors: 64-bit unsigned, and either 32-bit signed
224// (IA-32 architecture) or 64-bit signed (Intel(R) 64).
225//
226
//
// Unsigned 64-bit dispatch entry points; these are the same regardless of
// the target architecture.
//
#define KMP_DISPATCH_INIT_ULL           __kmp_aux_dispatch_init_8u
#define KMP_DISPATCH_FINI_CHUNK_ULL     __kmp_aux_dispatch_fini_chunk_8u
#define KMP_DISPATCH_NEXT_ULL           __kmpc_dispatch_next_8u

//
// Signed dispatch entry points: the "_4" variants when KMP_ARCH_X86 or
// KMP_ARCH_ARM is set, the "_8" variants otherwise.
//
#if KMP_ARCH_X86 || KMP_ARCH_ARM
# define KMP_DISPATCH_INIT              __kmp_aux_dispatch_init_4
# define KMP_DISPATCH_FINI_CHUNK        __kmp_aux_dispatch_fini_chunk_4
# define KMP_DISPATCH_NEXT              __kmpc_dispatch_next_4
#else
# define KMP_DISPATCH_INIT              __kmp_aux_dispatch_init_8
# define KMP_DISPATCH_FINI_CHUNK        __kmp_aux_dispatch_fini_chunk_8
# define KMP_DISPATCH_NEXT              __kmpc_dispatch_next_8
#endif /* KMP_ARCH_X86 || KMP_ARCH_ARM */
240
241
242/* */
243//
// The parallel construct
245//
246
//
// Microtask wrapper for a plain parallel region: ignores `gtid` and `npr`
// and simply invokes the outlined routine on its data pointer.  The function
// has internal linkage unless KMP_DEBUG is defined.
//
#ifndef KMP_DEBUG
static
#endif /* KMP_DEBUG */
void
__kmp_GOMP_microtask_wrapper(int *gtid, int *npr, void (*task)(void *),
  void *data)
{
    (*task)(data);
}
256
257
Jim Cownie4cc4bb42014-10-07 16:25:50 +0000258#ifndef KMP_DEBUG
Jim Cownie5e8470a2013-09-27 10:38:44 +0000259static
260#endif /* KMP_DEBUG */
261void
262__kmp_GOMP_parallel_microtask_wrapper(int *gtid, int *npr,
263 void (*task)(void *), void *data, unsigned num_threads, ident_t *loc,
264 enum sched_type schedule, long start, long end, long incr, long chunk_size)
265{
266 //
267 // Intialize the loop worksharing construct.
268 //
269 KMP_DISPATCH_INIT(loc, *gtid, schedule, start, end, incr, chunk_size,
270 schedule != kmp_sch_static);
271
272 //
273 // Now invoke the microtask.
274 //
275 task(data);
276}
277
278
Jim Cownie4cc4bb42014-10-07 16:25:50 +0000279#ifndef KMP_DEBUG
Jim Cownie5e8470a2013-09-27 10:38:44 +0000280static
281#endif /* KMP_DEBUG */
282void
283__kmp_GOMP_fork_call(ident_t *loc, int gtid, microtask_t wrapper, int argc,...)
284{
285 int rc;
286
287 va_list ap;
288 va_start(ap, argc);
289
Jim Cownie4cc4bb42014-10-07 16:25:50 +0000290 rc = __kmp_fork_call(loc, gtid, fork_context_gnu, argc, wrapper, __kmp_invoke_task_func,
Jim Cownie181b4bb2013-12-23 17:28:57 +0000291#if (KMP_ARCH_X86_64 || KMP_ARCH_ARM) && KMP_OS_LINUX
Jim Cownie5e8470a2013-09-27 10:38:44 +0000292 &ap
293#else
294 ap
295#endif
296 );
297
298 va_end(ap);
299
300 if (rc) {
301 kmp_info_t *thr = __kmp_threads[gtid];
302 __kmp_run_before_invoked_task(gtid, __kmp_tid_from_gtid(gtid), thr,
303 thr->th.th_team);
304 }
305}
306
307
308void
Jim Cownie181b4bb2013-12-23 17:28:57 +0000309xexpand(KMP_API_NAME_GOMP_PARALLEL_START)(void (*task)(void *), void *data, unsigned num_threads)
Jim Cownie5e8470a2013-09-27 10:38:44 +0000310{
311 int gtid = __kmp_entry_gtid();
312 MKLOC(loc, "GOMP_parallel_start");
313 KA_TRACE(20, ("GOMP_parallel_start: T#%d\n", gtid));
314
315 if (__kmpc_ok_to_fork(&loc) && (num_threads != 1)) {
316 if (num_threads != 0) {
317 __kmp_push_num_threads(&loc, gtid, num_threads);
318 }
319 __kmp_GOMP_fork_call(&loc, gtid,
320 (microtask_t)__kmp_GOMP_microtask_wrapper, 2, task, data);
321 }
322 else {
323 __kmpc_serialized_parallel(&loc, gtid);
324 }
325}
326
327
328void
Jim Cownie181b4bb2013-12-23 17:28:57 +0000329xexpand(KMP_API_NAME_GOMP_PARALLEL_END)(void)
Jim Cownie5e8470a2013-09-27 10:38:44 +0000330{
331 int gtid = __kmp_get_gtid();
332 MKLOC(loc, "GOMP_parallel_end");
333 KA_TRACE(20, ("GOMP_parallel_end: T#%d\n", gtid));
334
335 if (! __kmp_threads[gtid]->th.th_team->t.t_serialized) {
336 kmp_info_t *thr = __kmp_threads[gtid];
337 __kmp_run_after_invoked_task(gtid, __kmp_tid_from_gtid(gtid), thr,
338 thr->th.th_team);
339 __kmp_join_call(&loc, gtid);
340 }
341 else {
342 __kmpc_end_serialized_parallel(&loc, gtid);
343 }
344}
345
346
347/* */
348//
349// Loop worksharing constructs
350//
351
352//
353// The Gnu codegen passes in an exclusive upper bound for the overall range,
354// but the libguide dispatch code expects an inclusive upper bound, hence the
355// "end - incr" 5th argument to KMP_DISPATCH_INIT (and the " ub - str" 11th
356// argument to __kmp_GOMP_fork_call).
357//
// Conversely, KMP_DISPATCH_NEXT returns an inclusive upper bound in *p_ub,
// but the Gnu codegen expects an exclusive upper bound, so the adjustment
// "*p_ub += stride" compensates for the discrepancy.
361//
362// Correction: the gnu codegen always adjusts the upper bound by +-1, not the
363// stride value. We adjust the dispatch parameters accordingly (by +-1), but
364// we still adjust p_ub by the actual stride value.
365//
366// The "runtime" versions do not take a chunk_sz parameter.
367//
// The profile lib cannot support construct checking of unordered loops that
// are predetermined by the compiler to be statically scheduled, as the gcc
// codegen will not always emit calls to GOMP_loop_static_next() to get the
// next iteration.  Instead, it emits inline code to call omp_get_thread_num()
// and calculate the iteration space using the result.  It doesn't do this
// with ordered static loops, so they can be checked.
374//
375
//
// LOOP_START(func, schedule): defines the entry point `func` that starts a
// loop worksharing construct with an explicit chunk size.
//
// The generated function returns 0 when the iteration range is empty for
// the sign of `str`.  Otherwise it initializes the dispatcher with an
// inclusive upper bound (ub - 1 or ub + 1), asks for the first chunk, and on
// success moves *p_ub back by one to make it exclusive again.  The return
// value is the status reported by KMP_DISPATCH_NEXT.
//
#define LOOP_START(func,schedule) \
    int func (long lb, long ub, long str, long chunk_sz, long *p_lb, \
      long *p_ub) \
    { \
        int status = 0; \
        long stride; \
        int gtid = __kmp_entry_gtid(); \
        MKLOC(loc, #func); \
        KA_TRACE(20, ( #func ": T#%d, lb 0x%lx, ub 0x%lx, str 0x%lx, chunk_sz 0x%lx\n", \
          gtid, lb, ub, str, chunk_sz )); \
        \
        if ((str > 0) ? (lb < ub) : (lb > ub)) { \
            const long last_iter = (str > 0) ? (ub - 1) : (ub + 1); \
            \
            KMP_DISPATCH_INIT(&loc, gtid, (schedule), lb, last_iter, str, \
              chunk_sz, (schedule) != kmp_sch_static); \
            status = KMP_DISPATCH_NEXT(&loc, gtid, NULL, (kmp_int *)p_lb, \
              (kmp_int *)p_ub, (kmp_int *)&stride); \
            if (status) { \
                KMP_DEBUG_ASSERT(stride == str); \
                *p_ub += (str > 0) ? 1 : -1; \
            } \
        } \
        \
        KA_TRACE(20, ( #func " exit: T#%d, *p_lb 0x%lx, *p_ub 0x%lx, returning %d\n", \
          gtid, *p_lb, *p_ub, status)); \
        return status; \
    }
406
407
//
// LOOP_RUNTIME_START(func, schedule): defines the entry point `func` that
// starts a loop worksharing construct whose schedule is chosen at run time.
// These entry points take no chunk size; 0 is passed to the dispatcher.
//
// The generated function returns 0 when the iteration range is empty for
// the sign of `str`.  Otherwise it initializes the dispatcher with an
// inclusive upper bound, asks for the first chunk, and on success moves
// *p_ub back by one to make it exclusive again.
//
// The entry trace prints chunk_sz with %ld because the variable is a long.
//
#define LOOP_RUNTIME_START(func,schedule) \
    int func (long lb, long ub, long str, long *p_lb, long *p_ub) \
    { \
        int status; \
        long stride; \
        long chunk_sz = 0; \
        int gtid = __kmp_entry_gtid(); \
        MKLOC(loc, #func); \
        KA_TRACE(20, ( #func ": T#%d, lb 0x%lx, ub 0x%lx, str 0x%lx, chunk_sz %ld\n", \
          gtid, lb, ub, str, chunk_sz )); \
        \
        if ((str > 0) ? (lb < ub) : (lb > ub)) { \
            KMP_DISPATCH_INIT(&loc, gtid, (schedule), lb, \
              (str > 0) ? (ub - 1) : (ub + 1), str, chunk_sz, TRUE); \
            status = KMP_DISPATCH_NEXT(&loc, gtid, NULL, (kmp_int *)p_lb, \
              (kmp_int *)p_ub, (kmp_int *)&stride); \
            if (status) { \
                KMP_DEBUG_ASSERT(stride == str); \
                *p_ub += (str > 0) ? 1 : -1; \
            } \
        } \
        else { \
            status = 0; \
        } \
        \
        KA_TRACE(20, ( #func " exit: T#%d, *p_lb 0x%lx, *p_ub 0x%lx, returning %d\n", \
          gtid, *p_lb, *p_ub, status)); \
        return status; \
    }
437
438
//
// LOOP_NEXT(func, fini_code): defines the entry point `func` that fetches
// the next chunk of a loop worksharing construct.
//
// `fini_code` is pasted in before the dispatcher is queried and may refer to
// the locals `loc` and `gtid`.  When a chunk is returned, *p_ub is moved by
// one in the direction of the stride so that it is an exclusive bound.  The
// return value is the status reported by KMP_DISPATCH_NEXT.
//
#define LOOP_NEXT(func,fini_code) \
    int func(long *p_lb, long *p_ub) \
    { \
        int status; \
        long stride; \
        int gtid = __kmp_get_gtid(); \
        MKLOC(loc, #func); \
        \
        KA_TRACE(20, ( #func ": T#%d\n", gtid)); \
        \
        fini_code \
        status = KMP_DISPATCH_NEXT(&loc, gtid, NULL, (kmp_int *)p_lb, \
          (kmp_int *)p_ub, (kmp_int *)&stride); \
        if (status) { \
            const long excl_adjust = (stride > 0) ? 1 : -1; \
            *p_ub += excl_adjust; \
        } \
        \
        KA_TRACE(20, ( #func " exit: T#%d, *p_lb 0x%lx, *p_ub 0x%lx, stride 0x%lx, " \
          "returning %d\n", gtid, *p_lb, *p_ub, stride, status)); \
        return status; \
    }
459
460
Jim Cownie181b4bb2013-12-23 17:28:57 +0000461LOOP_START(xexpand(KMP_API_NAME_GOMP_LOOP_STATIC_START), kmp_sch_static)
462LOOP_NEXT(xexpand(KMP_API_NAME_GOMP_LOOP_STATIC_NEXT), {})
463LOOP_START(xexpand(KMP_API_NAME_GOMP_LOOP_DYNAMIC_START), kmp_sch_dynamic_chunked)
464LOOP_NEXT(xexpand(KMP_API_NAME_GOMP_LOOP_DYNAMIC_NEXT), {})
465LOOP_START(xexpand(KMP_API_NAME_GOMP_LOOP_GUIDED_START), kmp_sch_guided_chunked)
466LOOP_NEXT(xexpand(KMP_API_NAME_GOMP_LOOP_GUIDED_NEXT), {})
467LOOP_RUNTIME_START(xexpand(KMP_API_NAME_GOMP_LOOP_RUNTIME_START), kmp_sch_runtime)
468LOOP_NEXT(xexpand(KMP_API_NAME_GOMP_LOOP_RUNTIME_NEXT), {})
Jim Cownie5e8470a2013-09-27 10:38:44 +0000469
Jim Cownie181b4bb2013-12-23 17:28:57 +0000470LOOP_START(xexpand(KMP_API_NAME_GOMP_LOOP_ORDERED_STATIC_START), kmp_ord_static)
471LOOP_NEXT(xexpand(KMP_API_NAME_GOMP_LOOP_ORDERED_STATIC_NEXT), \
Jim Cownie5e8470a2013-09-27 10:38:44 +0000472 { KMP_DISPATCH_FINI_CHUNK(&loc, gtid); })
Jim Cownie181b4bb2013-12-23 17:28:57 +0000473LOOP_START(xexpand(KMP_API_NAME_GOMP_LOOP_ORDERED_DYNAMIC_START), kmp_ord_dynamic_chunked)
474LOOP_NEXT(xexpand(KMP_API_NAME_GOMP_LOOP_ORDERED_DYNAMIC_NEXT), \
Jim Cownie5e8470a2013-09-27 10:38:44 +0000475 { KMP_DISPATCH_FINI_CHUNK(&loc, gtid); })
Jim Cownie181b4bb2013-12-23 17:28:57 +0000476LOOP_START(xexpand(KMP_API_NAME_GOMP_LOOP_ORDERED_GUIDED_START), kmp_ord_guided_chunked)
477LOOP_NEXT(xexpand(KMP_API_NAME_GOMP_LOOP_ORDERED_GUIDED_NEXT), \
Jim Cownie5e8470a2013-09-27 10:38:44 +0000478 { KMP_DISPATCH_FINI_CHUNK(&loc, gtid); })
Jim Cownie181b4bb2013-12-23 17:28:57 +0000479LOOP_RUNTIME_START(xexpand(KMP_API_NAME_GOMP_LOOP_ORDERED_RUNTIME_START), kmp_ord_runtime)
480LOOP_NEXT(xexpand(KMP_API_NAME_GOMP_LOOP_ORDERED_RUNTIME_NEXT), \
Jim Cownie5e8470a2013-09-27 10:38:44 +0000481 { KMP_DISPATCH_FINI_CHUNK(&loc, gtid); })
482
483
484void
Jim Cownie181b4bb2013-12-23 17:28:57 +0000485xexpand(KMP_API_NAME_GOMP_LOOP_END)(void)
Jim Cownie5e8470a2013-09-27 10:38:44 +0000486{
487 int gtid = __kmp_get_gtid();
488 KA_TRACE(20, ("GOMP_loop_end: T#%d\n", gtid))
489
490 __kmp_barrier(bs_plain_barrier, gtid, FALSE, 0, NULL, NULL);
491
492 KA_TRACE(20, ("GOMP_loop_end exit: T#%d\n", gtid))
493}
494
495
496void
Jim Cownie181b4bb2013-12-23 17:28:57 +0000497xexpand(KMP_API_NAME_GOMP_LOOP_END_NOWAIT)(void)
Jim Cownie5e8470a2013-09-27 10:38:44 +0000498{
499 KA_TRACE(20, ("GOMP_loop_end_nowait: T#%d\n", __kmp_get_gtid()))
500}
501
502
503/* */
504//
505// Unsigned long long loop worksharing constructs
506//
507// These are new with gcc 4.4
508//
509
//
// LOOP_START_ULL(func, schedule): unsigned long long counterpart of
// LOOP_START.  `up` selects the sign of the stride handed to the dispatcher:
// str2 is (long long)str when `up` is nonzero and its negation otherwise.
//
// The generated function returns 0 when the range test fails; otherwise it
// initializes the dispatcher with an inclusive upper bound, fetches the
// first chunk, and on success adjusts *p_ub by one.
//
// NOTE(review): `str` is unsigned, so the `str > 0` tests below are true for
// every nonzero stride regardless of `up`; only the bound passed to the
// dispatcher looks at the signed str2.  Confirm this is intended.
//
#define LOOP_START_ULL(func,schedule) \
    int func (int up, unsigned long long lb, unsigned long long ub, \
      unsigned long long str, unsigned long long chunk_sz, \
      unsigned long long *p_lb, unsigned long long *p_ub) \
    { \
        int status = 0; \
        long long str2 = up ? ((long long)str) : -((long long)str); \
        long long stride; \
        int gtid = __kmp_entry_gtid(); \
        MKLOC(loc, #func); \
        \
        KA_TRACE(20, ( #func ": T#%d, up %d, lb 0x%llx, ub 0x%llx, str 0x%llx, chunk_sz 0x%llx\n", \
          gtid, up, lb, ub, str, chunk_sz )); \
        \
        if ((str > 0) ? (lb < ub) : (lb > ub)) { \
            const unsigned long long last_iter = \
              (str2 > 0) ? (ub - 1) : (ub + 1); \
            \
            KMP_DISPATCH_INIT_ULL(&loc, gtid, (schedule), lb, last_iter, \
              str2, chunk_sz, (schedule) != kmp_sch_static); \
            status = KMP_DISPATCH_NEXT_ULL(&loc, gtid, NULL, \
              (kmp_uint64 *)p_lb, (kmp_uint64 *)p_ub, (kmp_int64 *)&stride); \
            if (status) { \
                KMP_DEBUG_ASSERT(stride == str2); \
                *p_ub += (str > 0) ? 1 : -1; \
            } \
        } \
        \
        KA_TRACE(20, ( #func " exit: T#%d, *p_lb 0x%llx, *p_ub 0x%llx, returning %d\n", \
          gtid, *p_lb, *p_ub, status)); \
        return status; \
    }
543
544
//
// LOOP_RUNTIME_START_ULL(func, schedule): unsigned long long counterpart of
// LOOP_RUNTIME_START.  No chunk size is taken; 0 is passed to the
// dispatcher.  `up` selects the sign of the stride handed to the dispatcher
// (str2).
//
// NOTE(review): `str` is unsigned, so the `str > 0` tests below are true for
// every nonzero stride regardless of `up`.  Confirm this is intended.
//
#define LOOP_RUNTIME_START_ULL(func,schedule) \
    int func (int up, unsigned long long lb, unsigned long long ub, \
      unsigned long long str, unsigned long long *p_lb, \
      unsigned long long *p_ub) \
    { \
        int status = 0; \
        long long str2 = up ? ((long long)str) : -((long long)str); \
        unsigned long long stride; \
        unsigned long long chunk_sz = 0; \
        int gtid = __kmp_entry_gtid(); \
        MKLOC(loc, #func); \
        \
        KA_TRACE(20, ( #func ": T#%d, up %d, lb 0x%llx, ub 0x%llx, str 0x%llx, chunk_sz 0x%llx\n", \
          gtid, up, lb, ub, str, chunk_sz )); \
        \
        if ((str > 0) ? (lb < ub) : (lb > ub)) { \
            const unsigned long long last_iter = \
              (str2 > 0) ? (ub - 1) : (ub + 1); \
            \
            KMP_DISPATCH_INIT_ULL(&loc, gtid, (schedule), lb, last_iter, \
              str2, chunk_sz, TRUE); \
            status = KMP_DISPATCH_NEXT_ULL(&loc, gtid, NULL, \
              (kmp_uint64 *)p_lb, (kmp_uint64 *)p_ub, (kmp_int64 *)&stride); \
            if (status) { \
                KMP_DEBUG_ASSERT((long long)stride == str2); \
                *p_ub += (str > 0) ? 1 : -1; \
            } \
        } \
        \
        KA_TRACE(20, ( #func " exit: T#%d, *p_lb 0x%llx, *p_ub 0x%llx, returning %d\n", \
          gtid, *p_lb, *p_ub, status)); \
        return status; \
    }
578
579
//
// LOOP_NEXT_ULL(func, fini_code): unsigned long long counterpart of
// LOOP_NEXT.  `fini_code` is pasted in before the dispatcher is queried and
// may refer to the locals `loc` and `gtid`.  When a chunk is returned, *p_ub
// is moved by one in the direction of the signed stride the dispatcher
// reported.
//
#define LOOP_NEXT_ULL(func,fini_code) \
    int func(unsigned long long *p_lb, unsigned long long *p_ub) \
    { \
        int status; \
        long long stride; \
        int gtid = __kmp_get_gtid(); \
        MKLOC(loc, #func); \
        \
        KA_TRACE(20, ( #func ": T#%d\n", gtid)); \
        \
        fini_code \
        status = KMP_DISPATCH_NEXT_ULL(&loc, gtid, NULL, (kmp_uint64 *)p_lb, \
          (kmp_uint64 *)p_ub, (kmp_int64 *)&stride); \
        if (status) { \
            const int excl_adjust = (stride > 0) ? 1 : -1; \
            *p_ub += excl_adjust; \
        } \
        \
        KA_TRACE(20, ( #func " exit: T#%d, *p_lb 0x%llx, *p_ub 0x%llx, stride 0x%llx, " \
          "returning %d\n", gtid, *p_lb, *p_ub, stride, status)); \
        return status; \
    }
600
601
Jim Cownie181b4bb2013-12-23 17:28:57 +0000602LOOP_START_ULL(xexpand(KMP_API_NAME_GOMP_LOOP_ULL_STATIC_START), kmp_sch_static)
603LOOP_NEXT_ULL(xexpand(KMP_API_NAME_GOMP_LOOP_ULL_STATIC_NEXT), {})
604LOOP_START_ULL(xexpand(KMP_API_NAME_GOMP_LOOP_ULL_DYNAMIC_START), kmp_sch_dynamic_chunked)
605LOOP_NEXT_ULL(xexpand(KMP_API_NAME_GOMP_LOOP_ULL_DYNAMIC_NEXT), {})
606LOOP_START_ULL(xexpand(KMP_API_NAME_GOMP_LOOP_ULL_GUIDED_START), kmp_sch_guided_chunked)
607LOOP_NEXT_ULL(xexpand(KMP_API_NAME_GOMP_LOOP_ULL_GUIDED_NEXT), {})
608LOOP_RUNTIME_START_ULL(xexpand(KMP_API_NAME_GOMP_LOOP_ULL_RUNTIME_START), kmp_sch_runtime)
609LOOP_NEXT_ULL(xexpand(KMP_API_NAME_GOMP_LOOP_ULL_RUNTIME_NEXT), {})
Jim Cownie5e8470a2013-09-27 10:38:44 +0000610
Jim Cownie181b4bb2013-12-23 17:28:57 +0000611LOOP_START_ULL(xexpand(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_STATIC_START), kmp_ord_static)
612LOOP_NEXT_ULL(xexpand(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_STATIC_NEXT), \
Jim Cownie5e8470a2013-09-27 10:38:44 +0000613 { KMP_DISPATCH_FINI_CHUNK_ULL(&loc, gtid); })
Jim Cownie181b4bb2013-12-23 17:28:57 +0000614LOOP_START_ULL(xexpand(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_DYNAMIC_START), kmp_ord_dynamic_chunked)
615LOOP_NEXT_ULL(xexpand(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_DYNAMIC_NEXT), \
Jim Cownie5e8470a2013-09-27 10:38:44 +0000616 { KMP_DISPATCH_FINI_CHUNK_ULL(&loc, gtid); })
Jim Cownie181b4bb2013-12-23 17:28:57 +0000617LOOP_START_ULL(xexpand(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_GUIDED_START), kmp_ord_guided_chunked)
618LOOP_NEXT_ULL(xexpand(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_GUIDED_NEXT), \
Jim Cownie5e8470a2013-09-27 10:38:44 +0000619 { KMP_DISPATCH_FINI_CHUNK_ULL(&loc, gtid); })
Jim Cownie181b4bb2013-12-23 17:28:57 +0000620LOOP_RUNTIME_START_ULL(xexpand(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_RUNTIME_START), kmp_ord_runtime)
621LOOP_NEXT_ULL(xexpand(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_RUNTIME_NEXT), \
Jim Cownie5e8470a2013-09-27 10:38:44 +0000622 { KMP_DISPATCH_FINI_CHUNK_ULL(&loc, gtid); })
623
624
625/* */
626//
627// Combined parallel / loop worksharing constructs
628//
629// There are no ull versions (yet).
630//
631
632#define PARALLEL_LOOP_START(func, schedule) \
633 void func (void (*task) (void *), void *data, unsigned num_threads, \
634 long lb, long ub, long str, long chunk_sz) \
635 { \
636 int gtid = __kmp_entry_gtid(); \
637 int last = FALSE; \
638 MKLOC(loc, #func); \
639 KA_TRACE(20, ( #func ": T#%d, lb 0x%lx, ub 0x%lx, str 0x%lx, chunk_sz 0x%lx\n", \
640 gtid, lb, ub, str, chunk_sz )); \
641 \
642 if (__kmpc_ok_to_fork(&loc) && (num_threads != 1)) { \
643 if (num_threads != 0) { \
644 __kmp_push_num_threads(&loc, gtid, num_threads); \
645 } \
646 __kmp_GOMP_fork_call(&loc, gtid, \
647 (microtask_t)__kmp_GOMP_parallel_microtask_wrapper, 9, \
648 task, data, num_threads, &loc, (schedule), lb, \
649 (str > 0) ? (ub - 1) : (ub + 1), str, chunk_sz); \
650 } \
651 else { \
652 __kmpc_serialized_parallel(&loc, gtid); \
653 } \
654 \
655 KMP_DISPATCH_INIT(&loc, gtid, (schedule), lb, \
656 (str > 0) ? (ub - 1) : (ub + 1), str, chunk_sz, \
657 (schedule) != kmp_sch_static); \
658 \
659 KA_TRACE(20, ( #func " exit: T#%d\n", gtid)); \
660 }
661
662
Jim Cownie181b4bb2013-12-23 17:28:57 +0000663PARALLEL_LOOP_START(xexpand(KMP_API_NAME_GOMP_PARALLEL_LOOP_STATIC_START), kmp_sch_static)
664PARALLEL_LOOP_START(xexpand(KMP_API_NAME_GOMP_PARALLEL_LOOP_DYNAMIC_START), kmp_sch_dynamic_chunked)
665PARALLEL_LOOP_START(xexpand(KMP_API_NAME_GOMP_PARALLEL_LOOP_GUIDED_START), kmp_sch_guided_chunked)
666PARALLEL_LOOP_START(xexpand(KMP_API_NAME_GOMP_PARALLEL_LOOP_RUNTIME_START), kmp_sch_runtime)
Jim Cownie5e8470a2013-09-27 10:38:44 +0000667
668
Jim Cownie5e8470a2013-09-27 10:38:44 +0000669/* */
670//
671// Tasking constructs
672//
673
674void
Jim Cownie181b4bb2013-12-23 17:28:57 +0000675xexpand(KMP_API_NAME_GOMP_TASK)(void (*func)(void *), void *data, void (*copy_func)(void *, void *),
Jim Cownie5e8470a2013-09-27 10:38:44 +0000676 long arg_size, long arg_align, int if_cond, unsigned gomp_flags)
677{
678 MKLOC(loc, "GOMP_task");
679 int gtid = __kmp_entry_gtid();
680 kmp_int32 flags = 0;
681 kmp_tasking_flags_t *input_flags = (kmp_tasking_flags_t *) & flags;
682
683 KA_TRACE(20, ("GOMP_task: T#%d\n", gtid));
684
685 // The low-order bit is the "tied" flag
686 if (gomp_flags & 1) {
687 input_flags->tiedness = 1;
688 }
689 input_flags->native = 1;
690 // __kmp_task_alloc() sets up all other flags
691
692 if (! if_cond) {
693 arg_size = 0;
694 }
695
696 kmp_task_t *task = __kmp_task_alloc(&loc, gtid, input_flags,
697 sizeof(kmp_task_t), arg_size ? arg_size + arg_align - 1 : 0,
698 (kmp_routine_entry_t)func);
699
700 if (arg_size > 0) {
701 if (arg_align > 0) {
702 task->shareds = (void *)((((size_t)task->shareds)
703 + arg_align - 1) / arg_align * arg_align);
704 }
705 //else error??
706
707 if (copy_func) {
708 (*copy_func)(task->shareds, data);
709 }
710 else {
711 memcpy(task->shareds, data, arg_size);
712 }
713 }
714
715 if (if_cond) {
716 __kmpc_omp_task(&loc, gtid, task);
717 }
718 else {
719 __kmpc_omp_task_begin_if0(&loc, gtid, task);
720 func(data);
721 __kmpc_omp_task_complete_if0(&loc, gtid, task);
722 }
723
724 KA_TRACE(20, ("GOMP_task exit: T#%d\n", gtid));
725}
726
727
728void
Jim Cownie181b4bb2013-12-23 17:28:57 +0000729xexpand(KMP_API_NAME_GOMP_TASKWAIT)(void)
Jim Cownie5e8470a2013-09-27 10:38:44 +0000730{
731 MKLOC(loc, "GOMP_taskwait");
732 int gtid = __kmp_entry_gtid();
733
734 KA_TRACE(20, ("GOMP_taskwait: T#%d\n", gtid));
735
736 __kmpc_omp_taskwait(&loc, gtid);
737
738 KA_TRACE(20, ("GOMP_taskwait exit: T#%d\n", gtid));
739}
740
741
Jim Cownie5e8470a2013-09-27 10:38:44 +0000742/* */
743//
744// Sections worksharing constructs
745//
746
747//
// For the sections construct, we initialize a dynamically scheduled loop
// worksharing construct with lb 1 and stride 1, and use the iteration numbers
// that it returns as section ids.
751//
752// There are no special entry points for ordered sections, so we always use
753// the dynamically scheduled workshare, even if the sections aren't ordered.
754//
755
756unsigned
Jim Cownie181b4bb2013-12-23 17:28:57 +0000757xexpand(KMP_API_NAME_GOMP_SECTIONS_START)(unsigned count)
Jim Cownie5e8470a2013-09-27 10:38:44 +0000758{
759 int status;
760 kmp_int lb, ub, stride;
761 int gtid = __kmp_entry_gtid();
762 MKLOC(loc, "GOMP_sections_start");
763 KA_TRACE(20, ("GOMP_sections_start: T#%d\n", gtid));
764
765 KMP_DISPATCH_INIT(&loc, gtid, kmp_nm_dynamic_chunked, 1, count, 1, 1, TRUE);
766
767 status = KMP_DISPATCH_NEXT(&loc, gtid, NULL, &lb, &ub, &stride);
768 if (status) {
769 KMP_DEBUG_ASSERT(stride == 1);
770 KMP_DEBUG_ASSERT(lb > 0);
771 KMP_ASSERT(lb == ub);
772 }
773 else {
774 lb = 0;
775 }
776
777 KA_TRACE(20, ("GOMP_sections_start exit: T#%d returning %u\n", gtid,
778 (unsigned)lb));
779 return (unsigned)lb;
780}
781
782
783unsigned
Jim Cownie181b4bb2013-12-23 17:28:57 +0000784xexpand(KMP_API_NAME_GOMP_SECTIONS_NEXT)(void)
Jim Cownie5e8470a2013-09-27 10:38:44 +0000785{
786 int status;
787 kmp_int lb, ub, stride;
788 int gtid = __kmp_get_gtid();
789 MKLOC(loc, "GOMP_sections_next");
790 KA_TRACE(20, ("GOMP_sections_next: T#%d\n", gtid));
791
792 status = KMP_DISPATCH_NEXT(&loc, gtid, NULL, &lb, &ub, &stride);
793 if (status) {
794 KMP_DEBUG_ASSERT(stride == 1);
795 KMP_DEBUG_ASSERT(lb > 0);
796 KMP_ASSERT(lb == ub);
797 }
798 else {
799 lb = 0;
800 }
801
802 KA_TRACE(20, ("GOMP_sections_next exit: T#%d returning %u\n", gtid,
803 (unsigned)lb));
804 return (unsigned)lb;
805}
806
807
808void
Jim Cownie181b4bb2013-12-23 17:28:57 +0000809xexpand(KMP_API_NAME_GOMP_PARALLEL_SECTIONS_START)(void (*task) (void *), void *data,
Jim Cownie5e8470a2013-09-27 10:38:44 +0000810 unsigned num_threads, unsigned count)
811{
812 int gtid = __kmp_entry_gtid();
813 int last = FALSE;
814 MKLOC(loc, "GOMP_parallel_sections_start");
815 KA_TRACE(20, ("GOMP_parallel_sections_start: T#%d\n", gtid));
816
817 if (__kmpc_ok_to_fork(&loc) && (num_threads != 1)) {
818 if (num_threads != 0) {
819 __kmp_push_num_threads(&loc, gtid, num_threads);
820 }
821 __kmp_GOMP_fork_call(&loc, gtid,
822 (microtask_t)__kmp_GOMP_parallel_microtask_wrapper, 9, task, data,
823 num_threads, &loc, kmp_nm_dynamic_chunked, (kmp_int)1,
824 (kmp_int)count, (kmp_int)1, (kmp_int)1);
825 }
826 else {
827 __kmpc_serialized_parallel(&loc, gtid);
828 }
829
830 KMP_DISPATCH_INIT(&loc, gtid, kmp_nm_dynamic_chunked, 1, count, 1, 1, TRUE);
831
832 KA_TRACE(20, ("GOMP_parallel_sections_start exit: T#%d\n", gtid));
833}
834
835
836void
Jim Cownie181b4bb2013-12-23 17:28:57 +0000837xexpand(KMP_API_NAME_GOMP_SECTIONS_END)(void)
Jim Cownie5e8470a2013-09-27 10:38:44 +0000838{
839 int gtid = __kmp_get_gtid();
840 KA_TRACE(20, ("GOMP_sections_end: T#%d\n", gtid))
841
842 __kmp_barrier(bs_plain_barrier, gtid, FALSE, 0, NULL, NULL);
843
844 KA_TRACE(20, ("GOMP_sections_end exit: T#%d\n", gtid))
845}
846
847
848void
Jim Cownie181b4bb2013-12-23 17:28:57 +0000849xexpand(KMP_API_NAME_GOMP_SECTIONS_END_NOWAIT)(void)
Jim Cownie5e8470a2013-09-27 10:38:44 +0000850{
851 KA_TRACE(20, ("GOMP_sections_end_nowait: T#%d\n", __kmp_get_gtid()))
852}
853
Jim Cownie181b4bb2013-12-23 17:28:57 +0000854// libgomp has an empty function for GOMP_taskyield as of 2013-10-10
855void
856xexpand(KMP_API_NAME_GOMP_TASKYIELD)(void)
857{
Jim Cownie4cc4bb42014-10-07 16:25:50 +0000858 KA_TRACE(20, ("GOMP_taskyield: T#%d\n", __kmp_get_gtid()))
859 return;
Jim Cownie181b4bb2013-12-23 17:28:57 +0000860}
861
Jim Cownie4cc4bb42014-10-07 16:25:50 +0000862#if OMP_40_ENABLED // these are new GOMP_4.0 entry points
863
864void
865xexpand(KMP_API_NAME_GOMP_PARALLEL)(void (*task)(void *), void *data, unsigned num_threads, unsigned int flags)
866{
867 int gtid = __kmp_entry_gtid();
868 MKLOC(loc, "GOMP_parallel");
869 KA_TRACE(20, ("GOMP_parallel: T#%d\n", gtid));
870
871 if (__kmpc_ok_to_fork(&loc) && (num_threads != 1)) {
872 if (num_threads != 0) {
873 __kmp_push_num_threads(&loc, gtid, num_threads);
874 }
875 if(flags != 0) {
876 __kmp_push_proc_bind(&loc, gtid, (kmp_proc_bind_t)flags);
877 }
878 __kmp_GOMP_fork_call(&loc, gtid,
879 (microtask_t)__kmp_GOMP_microtask_wrapper, 2, task, data);
880 }
881 else {
882 __kmpc_serialized_parallel(&loc, gtid);
883 }
884 task(data);
885 xexpand(KMP_API_NAME_GOMP_PARALLEL_END)();
886}
887
888void
889xexpand(KMP_API_NAME_GOMP_PARALLEL_SECTIONS)(void (*task) (void *), void *data,
890 unsigned num_threads, unsigned count, unsigned flags)
891{
892 int gtid = __kmp_entry_gtid();
893 int last = FALSE;
894 MKLOC(loc, "GOMP_parallel_sections");
895 KA_TRACE(20, ("GOMP_parallel_sections: T#%d\n", gtid));
896
897 if (__kmpc_ok_to_fork(&loc) && (num_threads != 1)) {
898 if (num_threads != 0) {
899 __kmp_push_num_threads(&loc, gtid, num_threads);
900 }
901 if(flags != 0) {
902 __kmp_push_proc_bind(&loc, gtid, (kmp_proc_bind_t)flags);
903 }
904 __kmp_GOMP_fork_call(&loc, gtid,
905 (microtask_t)__kmp_GOMP_parallel_microtask_wrapper, 9, task, data,
906 num_threads, &loc, kmp_nm_dynamic_chunked, (kmp_int)1,
907 (kmp_int)count, (kmp_int)1, (kmp_int)1);
908 }
909 else {
910 __kmpc_serialized_parallel(&loc, gtid);
911 }
912
913 KMP_DISPATCH_INIT(&loc, gtid, kmp_nm_dynamic_chunked, 1, count, 1, 1, TRUE);
914
915 task(data);
916 xexpand(KMP_API_NAME_GOMP_PARALLEL_END)();
917 KA_TRACE(20, ("GOMP_parallel_sections exit: T#%d\n", gtid));
918}
919
920#define PARALLEL_LOOP(func, schedule) \
921 void func (void (*task) (void *), void *data, unsigned num_threads, \
922 long lb, long ub, long str, long chunk_sz, unsigned flags) \
923 { \
924 int gtid = __kmp_entry_gtid(); \
925 int last = FALSE; \
926 MKLOC(loc, #func); \
927 KA_TRACE(20, ( #func ": T#%d, lb 0x%lx, ub 0x%lx, str 0x%lx, chunk_sz 0x%lx\n", \
928 gtid, lb, ub, str, chunk_sz )); \
929 \
930 if (__kmpc_ok_to_fork(&loc) && (num_threads != 1)) { \
931 if (num_threads != 0) { \
932 __kmp_push_num_threads(&loc, gtid, num_threads); \
933 } \
934 if (flags != 0) { \
935 __kmp_push_proc_bind(&loc, gtid, (kmp_proc_bind_t)flags); \
936 } \
937 __kmp_GOMP_fork_call(&loc, gtid, \
938 (microtask_t)__kmp_GOMP_parallel_microtask_wrapper, 9, \
939 task, data, num_threads, &loc, (schedule), lb, \
940 (str > 0) ? (ub - 1) : (ub + 1), str, chunk_sz); \
941 } \
942 else { \
943 __kmpc_serialized_parallel(&loc, gtid); \
944 } \
945 \
946 KMP_DISPATCH_INIT(&loc, gtid, (schedule), lb, \
947 (str > 0) ? (ub - 1) : (ub + 1), str, chunk_sz, \
948 (schedule) != kmp_sch_static); \
949 task(data); \
950 xexpand(KMP_API_NAME_GOMP_PARALLEL_END)(); \
951 \
952 KA_TRACE(20, ( #func " exit: T#%d\n", gtid)); \
953 }
954
955PARALLEL_LOOP(xexpand(KMP_API_NAME_GOMP_PARALLEL_LOOP_STATIC), kmp_sch_static)
956PARALLEL_LOOP(xexpand(KMP_API_NAME_GOMP_PARALLEL_LOOP_DYNAMIC), kmp_sch_dynamic_chunked)
957PARALLEL_LOOP(xexpand(KMP_API_NAME_GOMP_PARALLEL_LOOP_GUIDED), kmp_sch_guided_chunked)
958PARALLEL_LOOP(xexpand(KMP_API_NAME_GOMP_PARALLEL_LOOP_RUNTIME), kmp_sch_runtime)
959
960
961void
962xexpand(KMP_API_NAME_GOMP_TASKGROUP_START)(void)
963{
964 int gtid = __kmp_get_gtid();
965 MKLOC(loc, "GOMP_taskgroup_start");
966 KA_TRACE(20, ("GOMP_taskgroup_start: T#%d\n", gtid));
967
968 __kmpc_taskgroup(&loc, gtid);
969
970 return;
971}
972
973void
974xexpand(KMP_API_NAME_GOMP_TASKGROUP_END)(void)
975{
976 int gtid = __kmp_get_gtid();
977 MKLOC(loc, "GOMP_taskgroup_end");
978 KA_TRACE(20, ("GOMP_taskgroup_end: T#%d\n", gtid));
979
980 __kmpc_end_taskgroup(&loc, gtid);
981
982 return;
983}
984
985#ifndef KMP_DEBUG
986static
987#endif /* KMP_DEBUG */
988kmp_int32 __kmp_gomp_to_iomp_cancellation_kind(int gomp_kind) {
989 kmp_int32 cncl_kind = 0;
990 switch(gomp_kind) {
991 case 1:
992 cncl_kind = cancel_parallel;
993 break;
994 case 2:
995 cncl_kind = cancel_loop;
996 break;
997 case 4:
998 cncl_kind = cancel_sections;
999 break;
1000 case 8:
1001 cncl_kind = cancel_taskgroup;
1002 break;
1003 }
1004 return cncl_kind;
1005}
1006
1007bool
1008xexpand(KMP_API_NAME_GOMP_CANCELLATION_POINT)(int which)
1009{
1010 if(__kmp_omp_cancellation) {
1011 KMP_FATAL(NoGompCancellation);
1012 }
1013 int gtid = __kmp_get_gtid();
1014 MKLOC(loc, "GOMP_cancellation_point");
1015 KA_TRACE(20, ("GOMP_cancellation_point: T#%d\n", gtid));
1016
1017 kmp_int32 cncl_kind = __kmp_gomp_to_iomp_cancellation_kind(which);
1018
1019 return __kmpc_cancellationpoint(&loc, gtid, cncl_kind);
1020}
1021
1022bool
1023xexpand(KMP_API_NAME_GOMP_BARRIER_CANCEL)(void)
1024{
1025 if(__kmp_omp_cancellation) {
1026 KMP_FATAL(NoGompCancellation);
1027 }
1028 KMP_FATAL(NoGompCancellation);
1029 int gtid = __kmp_get_gtid();
1030 MKLOC(loc, "GOMP_barrier_cancel");
1031 KA_TRACE(20, ("GOMP_barrier_cancel: T#%d\n", gtid));
1032
1033 return __kmpc_cancel_barrier(&loc, gtid);
1034}
1035
1036bool
1037xexpand(KMP_API_NAME_GOMP_CANCEL)(int which, bool do_cancel)
1038{
1039 if(__kmp_omp_cancellation) {
1040 KMP_FATAL(NoGompCancellation);
1041 } else {
1042 return FALSE;
1043 }
1044
1045 int gtid = __kmp_get_gtid();
1046 MKLOC(loc, "GOMP_cancel");
1047 KA_TRACE(20, ("GOMP_cancel: T#%d\n", gtid));
1048
1049 kmp_int32 cncl_kind = __kmp_gomp_to_iomp_cancellation_kind(which);
1050
1051 if(do_cancel == FALSE) {
1052 return xexpand(KMP_API_NAME_GOMP_CANCELLATION_POINT)(which);
1053 } else {
1054 return __kmpc_cancel(&loc, gtid, cncl_kind);
1055 }
1056}
1057
1058bool
1059xexpand(KMP_API_NAME_GOMP_SECTIONS_END_CANCEL)(void)
1060{
1061 if(__kmp_omp_cancellation) {
1062 KMP_FATAL(NoGompCancellation);
1063 }
1064 int gtid = __kmp_get_gtid();
1065 MKLOC(loc, "GOMP_sections_end_cancel");
1066 KA_TRACE(20, ("GOMP_sections_end_cancel: T#%d\n", gtid));
1067
1068 return __kmpc_cancel_barrier(&loc, gtid);
1069}
1070
1071bool
1072xexpand(KMP_API_NAME_GOMP_LOOP_END_CANCEL)(void)
1073{
1074 if(__kmp_omp_cancellation) {
1075 KMP_FATAL(NoGompCancellation);
1076 }
1077 int gtid = __kmp_get_gtid();
1078 MKLOC(loc, "GOMP_loop_end_cancel");
1079 KA_TRACE(20, ("GOMP_loop_end_cancel: T#%d\n", gtid));
1080
1081 return __kmpc_cancel_barrier(&loc, gtid);
1082}
1083
1084// All target functions are empty as of 2014-05-29
1085void
1086xexpand(KMP_API_NAME_GOMP_TARGET)(int device, void (*fn) (void *), const void *openmp_target,
1087 size_t mapnum, void **hostaddrs, size_t *sizes, unsigned char *kinds)
1088{
1089 return;
1090}
1091
1092void
1093xexpand(KMP_API_NAME_GOMP_TARGET_DATA)(int device, const void *openmp_target, size_t mapnum,
1094 void **hostaddrs, size_t *sizes, unsigned char *kinds)
1095{
1096 return;
1097}
1098
1099void
1100xexpand(KMP_API_NAME_GOMP_TARGET_END_DATA)(void)
1101{
1102 return;
1103}
1104
1105void
1106xexpand(KMP_API_NAME_GOMP_TARGET_UPDATE)(int device, const void *openmp_target, size_t mapnum,
1107 void **hostaddrs, size_t *sizes, unsigned char *kinds)
1108{
1109 return;
1110}
1111
1112void
1113xexpand(KMP_API_NAME_GOMP_TEAMS)(unsigned int num_teams, unsigned int thread_limit)
1114{
1115 return;
1116}
1117#endif // OMP_40_ENABLED
1118
1119
/*
    The following sections of code create aliases for the GOMP_* functions,
    then create versioned symbols using the assembler directive .symver.
    This is only pertinent for ELF shared libraries (.so).
    xaliasify and xversionify are defined in kmp_ftn_os.h.
*/
1126
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001127#ifdef KMP_USE_VERSION_SYMBOLS
Jim Cownie181b4bb2013-12-23 17:28:57 +00001128
1129// GOMP_1.0 aliases
1130xaliasify(KMP_API_NAME_GOMP_ATOMIC_END, 10);
1131xaliasify(KMP_API_NAME_GOMP_ATOMIC_START, 10);
1132xaliasify(KMP_API_NAME_GOMP_BARRIER, 10);
1133xaliasify(KMP_API_NAME_GOMP_CRITICAL_END, 10);
1134xaliasify(KMP_API_NAME_GOMP_CRITICAL_NAME_END, 10);
1135xaliasify(KMP_API_NAME_GOMP_CRITICAL_NAME_START, 10);
1136xaliasify(KMP_API_NAME_GOMP_CRITICAL_START, 10);
1137xaliasify(KMP_API_NAME_GOMP_LOOP_DYNAMIC_NEXT, 10);
1138xaliasify(KMP_API_NAME_GOMP_LOOP_DYNAMIC_START, 10);
1139xaliasify(KMP_API_NAME_GOMP_LOOP_END, 10);
1140xaliasify(KMP_API_NAME_GOMP_LOOP_END_NOWAIT, 10);
1141xaliasify(KMP_API_NAME_GOMP_LOOP_GUIDED_NEXT, 10);
1142xaliasify(KMP_API_NAME_GOMP_LOOP_GUIDED_START, 10);
1143xaliasify(KMP_API_NAME_GOMP_LOOP_ORDERED_DYNAMIC_NEXT, 10);
1144xaliasify(KMP_API_NAME_GOMP_LOOP_ORDERED_DYNAMIC_START, 10);
1145xaliasify(KMP_API_NAME_GOMP_LOOP_ORDERED_GUIDED_NEXT, 10);
1146xaliasify(KMP_API_NAME_GOMP_LOOP_ORDERED_GUIDED_START, 10);
1147xaliasify(KMP_API_NAME_GOMP_LOOP_ORDERED_RUNTIME_NEXT, 10);
1148xaliasify(KMP_API_NAME_GOMP_LOOP_ORDERED_RUNTIME_START, 10);
1149xaliasify(KMP_API_NAME_GOMP_LOOP_ORDERED_STATIC_NEXT, 10);
1150xaliasify(KMP_API_NAME_GOMP_LOOP_ORDERED_STATIC_START, 10);
1151xaliasify(KMP_API_NAME_GOMP_LOOP_RUNTIME_NEXT, 10);
1152xaliasify(KMP_API_NAME_GOMP_LOOP_RUNTIME_START, 10);
1153xaliasify(KMP_API_NAME_GOMP_LOOP_STATIC_NEXT, 10);
1154xaliasify(KMP_API_NAME_GOMP_LOOP_STATIC_START, 10);
1155xaliasify(KMP_API_NAME_GOMP_ORDERED_END, 10);
1156xaliasify(KMP_API_NAME_GOMP_ORDERED_START, 10);
1157xaliasify(KMP_API_NAME_GOMP_PARALLEL_END, 10);
1158xaliasify(KMP_API_NAME_GOMP_PARALLEL_LOOP_DYNAMIC_START, 10);
1159xaliasify(KMP_API_NAME_GOMP_PARALLEL_LOOP_GUIDED_START, 10);
1160xaliasify(KMP_API_NAME_GOMP_PARALLEL_LOOP_RUNTIME_START, 10);
1161xaliasify(KMP_API_NAME_GOMP_PARALLEL_LOOP_STATIC_START, 10);
1162xaliasify(KMP_API_NAME_GOMP_PARALLEL_SECTIONS_START, 10);
1163xaliasify(KMP_API_NAME_GOMP_PARALLEL_START, 10);
1164xaliasify(KMP_API_NAME_GOMP_SECTIONS_END, 10);
1165xaliasify(KMP_API_NAME_GOMP_SECTIONS_END_NOWAIT, 10);
1166xaliasify(KMP_API_NAME_GOMP_SECTIONS_NEXT, 10);
1167xaliasify(KMP_API_NAME_GOMP_SECTIONS_START, 10);
1168xaliasify(KMP_API_NAME_GOMP_SINGLE_COPY_END, 10);
1169xaliasify(KMP_API_NAME_GOMP_SINGLE_COPY_START, 10);
1170xaliasify(KMP_API_NAME_GOMP_SINGLE_START, 10);
1171
1172// GOMP_2.0 aliases
Jim Cownie181b4bb2013-12-23 17:28:57 +00001173xaliasify(KMP_API_NAME_GOMP_TASK, 20);
1174xaliasify(KMP_API_NAME_GOMP_TASKWAIT, 20);
Jim Cownie181b4bb2013-12-23 17:28:57 +00001175xaliasify(KMP_API_NAME_GOMP_LOOP_ULL_DYNAMIC_NEXT, 20);
1176xaliasify(KMP_API_NAME_GOMP_LOOP_ULL_DYNAMIC_START, 20);
1177xaliasify(KMP_API_NAME_GOMP_LOOP_ULL_GUIDED_NEXT, 20);
1178xaliasify(KMP_API_NAME_GOMP_LOOP_ULL_GUIDED_START, 20);
1179xaliasify(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_DYNAMIC_NEXT, 20);
1180xaliasify(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_DYNAMIC_START, 20);
1181xaliasify(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_GUIDED_NEXT, 20);
1182xaliasify(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_GUIDED_START, 20);
1183xaliasify(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_RUNTIME_NEXT, 20);
1184xaliasify(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_RUNTIME_START, 20);
1185xaliasify(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_STATIC_NEXT, 20);
1186xaliasify(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_STATIC_START, 20);
1187xaliasify(KMP_API_NAME_GOMP_LOOP_ULL_RUNTIME_NEXT, 20);
1188xaliasify(KMP_API_NAME_GOMP_LOOP_ULL_RUNTIME_START, 20);
1189xaliasify(KMP_API_NAME_GOMP_LOOP_ULL_STATIC_NEXT, 20);
1190xaliasify(KMP_API_NAME_GOMP_LOOP_ULL_STATIC_START, 20);
1191
1192// GOMP_3.0 aliases
1193xaliasify(KMP_API_NAME_GOMP_TASKYIELD, 30);
1194
// Aliases for the GOMP_4.0 entry points.
// Note: the GOMP_parallel* entry points in this group are not OpenMP 4.0
// features, yet they are compiled only when OMP_40_ENABLED is set.
#if OMP_40_ENABLED
xaliasify(KMP_API_NAME_GOMP_PARALLEL, 40);
xaliasify(KMP_API_NAME_GOMP_PARALLEL_SECTIONS, 40);
xaliasify(KMP_API_NAME_GOMP_PARALLEL_LOOP_DYNAMIC, 40);
xaliasify(KMP_API_NAME_GOMP_PARALLEL_LOOP_GUIDED, 40);
xaliasify(KMP_API_NAME_GOMP_PARALLEL_LOOP_RUNTIME, 40);
xaliasify(KMP_API_NAME_GOMP_PARALLEL_LOOP_STATIC, 40);
xaliasify(KMP_API_NAME_GOMP_TASKGROUP_START, 40);
xaliasify(KMP_API_NAME_GOMP_TASKGROUP_END, 40);
xaliasify(KMP_API_NAME_GOMP_BARRIER_CANCEL, 40);
xaliasify(KMP_API_NAME_GOMP_CANCEL, 40);
xaliasify(KMP_API_NAME_GOMP_CANCELLATION_POINT, 40);
xaliasify(KMP_API_NAME_GOMP_LOOP_END_CANCEL, 40);
xaliasify(KMP_API_NAME_GOMP_SECTIONS_END_CANCEL, 40);
xaliasify(KMP_API_NAME_GOMP_TARGET, 40);
xaliasify(KMP_API_NAME_GOMP_TARGET_DATA, 40);
xaliasify(KMP_API_NAME_GOMP_TARGET_END_DATA, 40);
xaliasify(KMP_API_NAME_GOMP_TARGET_UPDATE, 40);
xaliasify(KMP_API_NAME_GOMP_TEAMS, 40);
#endif // OMP_40_ENABLED
Jim Cownie181b4bb2013-12-23 17:28:57 +00001217
1218// GOMP_1.0 versioned symbols
1219xversionify(KMP_API_NAME_GOMP_ATOMIC_END, 10, "GOMP_1.0");
1220xversionify(KMP_API_NAME_GOMP_ATOMIC_START, 10, "GOMP_1.0");
1221xversionify(KMP_API_NAME_GOMP_BARRIER, 10, "GOMP_1.0");
1222xversionify(KMP_API_NAME_GOMP_CRITICAL_END, 10, "GOMP_1.0");
1223xversionify(KMP_API_NAME_GOMP_CRITICAL_NAME_END, 10, "GOMP_1.0");
1224xversionify(KMP_API_NAME_GOMP_CRITICAL_NAME_START, 10, "GOMP_1.0");
1225xversionify(KMP_API_NAME_GOMP_CRITICAL_START, 10, "GOMP_1.0");
1226xversionify(KMP_API_NAME_GOMP_LOOP_DYNAMIC_NEXT, 10, "GOMP_1.0");
1227xversionify(KMP_API_NAME_GOMP_LOOP_DYNAMIC_START, 10, "GOMP_1.0");
1228xversionify(KMP_API_NAME_GOMP_LOOP_END, 10, "GOMP_1.0");
1229xversionify(KMP_API_NAME_GOMP_LOOP_END_NOWAIT, 10, "GOMP_1.0");
1230xversionify(KMP_API_NAME_GOMP_LOOP_GUIDED_NEXT, 10, "GOMP_1.0");
1231xversionify(KMP_API_NAME_GOMP_LOOP_GUIDED_START, 10, "GOMP_1.0");
1232xversionify(KMP_API_NAME_GOMP_LOOP_ORDERED_DYNAMIC_NEXT, 10, "GOMP_1.0");
1233xversionify(KMP_API_NAME_GOMP_LOOP_ORDERED_DYNAMIC_START, 10, "GOMP_1.0");
1234xversionify(KMP_API_NAME_GOMP_LOOP_ORDERED_GUIDED_NEXT, 10, "GOMP_1.0");
1235xversionify(KMP_API_NAME_GOMP_LOOP_ORDERED_GUIDED_START, 10, "GOMP_1.0");
1236xversionify(KMP_API_NAME_GOMP_LOOP_ORDERED_RUNTIME_NEXT, 10, "GOMP_1.0");
1237xversionify(KMP_API_NAME_GOMP_LOOP_ORDERED_RUNTIME_START, 10, "GOMP_1.0");
1238xversionify(KMP_API_NAME_GOMP_LOOP_ORDERED_STATIC_NEXT, 10, "GOMP_1.0");
1239xversionify(KMP_API_NAME_GOMP_LOOP_ORDERED_STATIC_START, 10, "GOMP_1.0");
1240xversionify(KMP_API_NAME_GOMP_LOOP_RUNTIME_NEXT, 10, "GOMP_1.0");
1241xversionify(KMP_API_NAME_GOMP_LOOP_RUNTIME_START, 10, "GOMP_1.0");
1242xversionify(KMP_API_NAME_GOMP_LOOP_STATIC_NEXT, 10, "GOMP_1.0");
1243xversionify(KMP_API_NAME_GOMP_LOOP_STATIC_START, 10, "GOMP_1.0");
1244xversionify(KMP_API_NAME_GOMP_ORDERED_END, 10, "GOMP_1.0");
1245xversionify(KMP_API_NAME_GOMP_ORDERED_START, 10, "GOMP_1.0");
1246xversionify(KMP_API_NAME_GOMP_PARALLEL_END, 10, "GOMP_1.0");
1247xversionify(KMP_API_NAME_GOMP_PARALLEL_LOOP_DYNAMIC_START, 10, "GOMP_1.0");
1248xversionify(KMP_API_NAME_GOMP_PARALLEL_LOOP_GUIDED_START, 10, "GOMP_1.0");
1249xversionify(KMP_API_NAME_GOMP_PARALLEL_LOOP_RUNTIME_START, 10, "GOMP_1.0");
1250xversionify(KMP_API_NAME_GOMP_PARALLEL_LOOP_STATIC_START, 10, "GOMP_1.0");
1251xversionify(KMP_API_NAME_GOMP_PARALLEL_SECTIONS_START, 10, "GOMP_1.0");
1252xversionify(KMP_API_NAME_GOMP_PARALLEL_START, 10, "GOMP_1.0");
1253xversionify(KMP_API_NAME_GOMP_SECTIONS_END, 10, "GOMP_1.0");
1254xversionify(KMP_API_NAME_GOMP_SECTIONS_END_NOWAIT, 10, "GOMP_1.0");
1255xversionify(KMP_API_NAME_GOMP_SECTIONS_NEXT, 10, "GOMP_1.0");
1256xversionify(KMP_API_NAME_GOMP_SECTIONS_START, 10, "GOMP_1.0");
1257xversionify(KMP_API_NAME_GOMP_SINGLE_COPY_END, 10, "GOMP_1.0");
1258xversionify(KMP_API_NAME_GOMP_SINGLE_COPY_START, 10, "GOMP_1.0");
1259xversionify(KMP_API_NAME_GOMP_SINGLE_START, 10, "GOMP_1.0");
1260
1261// GOMP_2.0 versioned symbols
Jim Cownie181b4bb2013-12-23 17:28:57 +00001262xversionify(KMP_API_NAME_GOMP_TASK, 20, "GOMP_2.0");
1263xversionify(KMP_API_NAME_GOMP_TASKWAIT, 20, "GOMP_2.0");
Jim Cownie181b4bb2013-12-23 17:28:57 +00001264xversionify(KMP_API_NAME_GOMP_LOOP_ULL_DYNAMIC_NEXT, 20, "GOMP_2.0");
1265xversionify(KMP_API_NAME_GOMP_LOOP_ULL_DYNAMIC_START, 20, "GOMP_2.0");
1266xversionify(KMP_API_NAME_GOMP_LOOP_ULL_GUIDED_NEXT, 20, "GOMP_2.0");
1267xversionify(KMP_API_NAME_GOMP_LOOP_ULL_GUIDED_START, 20, "GOMP_2.0");
1268xversionify(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_DYNAMIC_NEXT, 20, "GOMP_2.0");
1269xversionify(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_DYNAMIC_START, 20, "GOMP_2.0");
1270xversionify(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_GUIDED_NEXT, 20, "GOMP_2.0");
1271xversionify(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_GUIDED_START, 20, "GOMP_2.0");
1272xversionify(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_RUNTIME_NEXT, 20, "GOMP_2.0");
1273xversionify(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_RUNTIME_START, 20, "GOMP_2.0");
1274xversionify(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_STATIC_NEXT, 20, "GOMP_2.0");
1275xversionify(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_STATIC_START, 20, "GOMP_2.0");
1276xversionify(KMP_API_NAME_GOMP_LOOP_ULL_RUNTIME_NEXT, 20, "GOMP_2.0");
1277xversionify(KMP_API_NAME_GOMP_LOOP_ULL_RUNTIME_START, 20, "GOMP_2.0");
1278xversionify(KMP_API_NAME_GOMP_LOOP_ULL_STATIC_NEXT, 20, "GOMP_2.0");
1279xversionify(KMP_API_NAME_GOMP_LOOP_ULL_STATIC_START, 20, "GOMP_2.0");
1280
1281// GOMP_3.0 versioned symbols
1282xversionify(KMP_API_NAME_GOMP_TASKYIELD, 30, "GOMP_3.0");
1283
// Versioned symbols for the entry points published under "GOMP_4.0";
// compiled only when OMP_40_ENABLED is set.
#if OMP_40_ENABLED
xversionify(KMP_API_NAME_GOMP_PARALLEL, 40, "GOMP_4.0");
xversionify(KMP_API_NAME_GOMP_PARALLEL_SECTIONS, 40, "GOMP_4.0");
xversionify(KMP_API_NAME_GOMP_PARALLEL_LOOP_DYNAMIC, 40, "GOMP_4.0");
xversionify(KMP_API_NAME_GOMP_PARALLEL_LOOP_GUIDED, 40, "GOMP_4.0");
xversionify(KMP_API_NAME_GOMP_PARALLEL_LOOP_RUNTIME, 40, "GOMP_4.0");
xversionify(KMP_API_NAME_GOMP_PARALLEL_LOOP_STATIC, 40, "GOMP_4.0");
xversionify(KMP_API_NAME_GOMP_TASKGROUP_START, 40, "GOMP_4.0");
xversionify(KMP_API_NAME_GOMP_TASKGROUP_END, 40, "GOMP_4.0");
xversionify(KMP_API_NAME_GOMP_BARRIER_CANCEL, 40, "GOMP_4.0");
xversionify(KMP_API_NAME_GOMP_CANCEL, 40, "GOMP_4.0");
xversionify(KMP_API_NAME_GOMP_CANCELLATION_POINT, 40, "GOMP_4.0");
xversionify(KMP_API_NAME_GOMP_LOOP_END_CANCEL, 40, "GOMP_4.0");
xversionify(KMP_API_NAME_GOMP_SECTIONS_END_CANCEL, 40, "GOMP_4.0");
xversionify(KMP_API_NAME_GOMP_TARGET, 40, "GOMP_4.0");
xversionify(KMP_API_NAME_GOMP_TARGET_DATA, 40, "GOMP_4.0");
xversionify(KMP_API_NAME_GOMP_TARGET_END_DATA, 40, "GOMP_4.0");
xversionify(KMP_API_NAME_GOMP_TARGET_UPDATE, 40, "GOMP_4.0");
xversionify(KMP_API_NAME_GOMP_TEAMS, 40, "GOMP_4.0");
#endif // OMP_40_ENABLED
Jim Cownie181b4bb2013-12-23 17:28:57 +00001305
Jim Cownie4cc4bb42014-10-07 16:25:50 +00001306#endif // KMP_USE_VERSION_SYMBOLS
Jim Cownie181b4bb2013-12-23 17:28:57 +00001307
Jim Cownie5e8470a2013-09-27 10:38:44 +00001308#ifdef __cplusplus
1309 } //extern "C"
1310#endif // __cplusplus
1311
1312