// Preamble: includes the atomic, OMPT and name-mapping headers and defines
// MKLOC, which declares a static ident_t initialised with the placeholder
// location string ";unknown;unknown;0;0;;" (the `routine` argument does not
// appear in the expansion shown).
//
// GOMP_barrier entry point: obtains the caller's gtid with
// __kmp_entry_gtid() and traces it. In OMPT builds with a tool enabled, the
// current task's enter_frame is set to OMPT_GET_FRAME_ADDRESS(1) and later
// reset to NULL.
// NOTE(review): the barrier call between those two OMPT sections is not
// visible in this listing.
15 #include "kmp_atomic.h" 18 #include "ompt-specific.h" 25 #define MKLOC(loc, routine) \ 26 static ident_t(loc) = {0, KMP_IDENT_KMPC, 0, 0, ";unknown;unknown;0;0;;"}; 28 #include "kmp_ftn_os.h" 30 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_BARRIER)(void) {
31 int gtid = __kmp_entry_gtid();
32 MKLOC(loc,
"GOMP_barrier");
33 KA_TRACE(20, (
"GOMP_barrier: T#%d\n", gtid));
34 #if OMPT_SUPPORT && OMPT_OPTIONAL 35 omp_frame_t *ompt_frame;
36 if (ompt_enabled.enabled) {
37 __ompt_get_task_info_internal(0, NULL, NULL, &ompt_frame, NULL, NULL);
38 ompt_frame->enter_frame = OMPT_GET_FRAME_ADDRESS(1);
39 OMPT_STORE_RETURN_ADDRESS(gtid);
43 #if OMPT_SUPPORT && OMPT_OPTIONAL 44 if (ompt_enabled.enabled) {
45 ompt_frame->enter_frame = NULL;
// Pointer to a kmp_critical_name defined elsewhere; presumably the lock name
// shared by all unnamed critical sections -- confirm against its definition.
//
// GOMP_critical_start entry point: obtains the gtid with
// __kmp_entry_gtid(), traces the call and, in OMPT builds, invokes
// OMPT_STORE_RETURN_ADDRESS(gtid).
// NOTE(review): the call that actually enters the critical section is not
// visible in this listing.
59 extern kmp_critical_name *__kmp_unnamed_critical_addr;
61 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_CRITICAL_START)(void) {
62 int gtid = __kmp_entry_gtid();
63 MKLOC(loc,
"GOMP_critical_start");
64 KA_TRACE(20, (
"GOMP_critical_start: T#%d\n", gtid));
65 #if OMPT_SUPPORT && OMPT_OPTIONAL 66 OMPT_STORE_RETURN_ADDRESS(gtid);
// GOMP_critical_end entry point: uses __kmp_get_gtid() (not the "entry"
// variant used by the start routine), traces the call and, in OMPT builds,
// invokes OMPT_STORE_RETURN_ADDRESS(gtid).
// NOTE(review): the call that leaves the critical section is not visible in
// this listing.
71 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_CRITICAL_END)(void) {
72 int gtid = __kmp_get_gtid();
73 MKLOC(loc,
"GOMP_critical_end");
74 KA_TRACE(20, (
"GOMP_critical_end: T#%d\n", gtid));
75 #if OMPT_SUPPORT && OMPT_OPTIONAL 76 OMPT_STORE_RETURN_ADDRESS(gtid);
// GOMP_critical_name_start entry point.
// pptr: caller-supplied pointer slot; presumably identifies the named
//       critical section -- its use is not visible in this listing.
// Obtains the gtid with __kmp_entry_gtid() and traces the call.
81 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_CRITICAL_NAME_START)(
void **pptr) {
82 int gtid = __kmp_entry_gtid();
83 MKLOC(loc,
"GOMP_critical_name_start");
84 KA_TRACE(20, (
"GOMP_critical_name_start: T#%d\n", gtid));
// GOMP_critical_name_end entry point.
// pptr: caller-supplied pointer slot; presumably the same one passed to the
//       matching start call -- its use is not visible in this listing.
// Obtains the gtid with __kmp_get_gtid() and traces the call.
88 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_CRITICAL_NAME_END)(
void **pptr) {
89 int gtid = __kmp_get_gtid();
90 MKLOC(loc,
"GOMP_critical_name_end");
91 KA_TRACE(20, (
"GOMP_critical_name_end: T#%d\n", gtid));
// GOMP_atomic_start entry point: obtains the gtid, traces the call, calls
// __ompt_thread_assign_wait_id(0) and then acquires the global
// __kmp_atomic_lock on behalf of this thread.
// NOTE(review): the OMPT call is presumably wrapped in a preprocessor guard
// that this listing does not show.
98 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_ATOMIC_START)(void) {
99 int gtid = __kmp_entry_gtid();
100 KA_TRACE(20, (
"GOMP_atomic_start: T#%d\n", gtid));
103 __ompt_thread_assign_wait_id(0);
106 __kmp_acquire_atomic_lock(&__kmp_atomic_lock, gtid);
// GOMP_atomic_end entry point: obtains the gtid with __kmp_get_gtid(),
// traces the call and releases the global __kmp_atomic_lock that
// GOMP_atomic_start acquires.
109 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_ATOMIC_END)(void) {
110 int gtid = __kmp_get_gtid();
111 KA_TRACE(20, (
"GOMP_atomic_end: T#%d\n", gtid));
112 __kmp_release_atomic_lock(&__kmp_atomic_lock, gtid);
// GOMP_single_start entry point.
// Runs __kmp_parallel_initialize() if __kmp_init_parallel is not yet set,
// then stores the result of __kmp_enter_single(gtid, &loc, FALSE) in rc.
// In OMPT builds with the work callback registered, it reports either a
// single_executor scope-begin, or a single_other scope-begin immediately
// followed by scope-end, against the team's parallel data and this thread's
// implicit task data.
// NOTE(review): the branch choosing between the two callback groups and the
// final return statement are not visible in this listing; presumably both
// depend on rc -- confirm.
115 int KMP_EXPAND_NAME(KMP_API_NAME_GOMP_SINGLE_START)(void) {
116 int gtid = __kmp_entry_gtid();
117 MKLOC(loc,
"GOMP_single_start");
118 KA_TRACE(20, (
"GOMP_single_start: T#%d\n", gtid));
120 if (!TCR_4(__kmp_init_parallel))
121 __kmp_parallel_initialize();
126 kmp_int32 rc = __kmp_enter_single(gtid, &loc, FALSE);
128 #if OMPT_SUPPORT && OMPT_OPTIONAL 129 kmp_info_t *this_thr = __kmp_threads[gtid];
130 kmp_team_t *team = this_thr->th.th_team;
131 int tid = __kmp_tid_from_gtid(gtid);
133 if (ompt_enabled.enabled) {
135 if (ompt_enabled.ompt_callback_work) {
136 ompt_callbacks.ompt_callback(ompt_callback_work)(
137 ompt_work_single_executor, ompt_scope_begin,
138 &(team->t.ompt_team_info.parallel_data),
139 &(team->t.t_implicit_task_taskdata[tid].ompt_task_info.task_data),
140 1, OMPT_GET_RETURN_ADDRESS(0));
143 if (ompt_enabled.ompt_callback_work) {
144 ompt_callbacks.ompt_callback(ompt_callback_work)(
145 ompt_work_single_other, ompt_scope_begin,
146 &(team->t.ompt_team_info.parallel_data),
147 &(team->t.t_implicit_task_taskdata[tid].ompt_task_info.task_data),
148 1, OMPT_GET_RETURN_ADDRESS(0));
149 ompt_callbacks.ompt_callback(ompt_callback_work)(
150 ompt_work_single_other, ompt_scope_end,
151 &(team->t.ompt_team_info.parallel_data),
152 &(team->t.t_implicit_task_taskdata[tid].ompt_task_info.task_data),
153 1, OMPT_GET_RETURN_ADDRESS(0));
// GOMP_single_copy_start entry point (single construct with copyprivate).
// Initialises the parallel runtime if needed and calls __kmp_enter_single().
// The remaining visible path performs a plain barrier, reads the team's
// t_copypriv_data into retval, then performs a second plain barrier; OMPT
// builds bracket the barriers by setting and clearing the task's enter_frame.
// NOTE(review): the body of the `if (__kmp_enter_single(...))` branch, the
// declaration of retval and the return statement are not visible in this
// listing.
162 void *KMP_EXPAND_NAME(KMP_API_NAME_GOMP_SINGLE_COPY_START)(void) {
164 int gtid = __kmp_entry_gtid();
165 MKLOC(loc,
"GOMP_single_copy_start");
166 KA_TRACE(20, (
"GOMP_single_copy_start: T#%d\n", gtid));
168 if (!TCR_4(__kmp_init_parallel))
169 __kmp_parallel_initialize();
174 if (__kmp_enter_single(gtid, &loc, FALSE))
180 #if OMPT_SUPPORT && OMPT_OPTIONAL 181 omp_frame_t *ompt_frame;
182 if (ompt_enabled.enabled) {
183 __ompt_get_task_info_internal(0, NULL, NULL, &ompt_frame, NULL, NULL);
184 ompt_frame->enter_frame = OMPT_GET_FRAME_ADDRESS(1);
185 OMPT_STORE_RETURN_ADDRESS(gtid);
188 __kmp_barrier(bs_plain_barrier, gtid, FALSE, 0, NULL, NULL);
192 retval = __kmp_team_from_gtid(gtid)->t.t_copypriv_data;
193 #if OMPT_SUPPORT && OMPT_OPTIONAL 194 if (ompt_enabled.enabled) {
195 OMPT_STORE_RETURN_ADDRESS(gtid);
198 __kmp_barrier(bs_plain_barrier, gtid, FALSE, 0, NULL, NULL);
199 #if OMPT_SUPPORT && OMPT_OPTIONAL 200 if (ompt_enabled.enabled) {
201 ompt_frame->enter_frame = NULL;
// GOMP_single_copy_end entry point.
// data: pointer published to the team through t_copypriv_data.
// Stores `data` in the team structure and then executes two plain barriers,
// mirroring the two barriers in GOMP_single_copy_start. OMPT builds set the
// task's enter_frame before the first barrier and clear it after the second.
207 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_SINGLE_COPY_END)(
void *data) {
208 int gtid = __kmp_get_gtid();
209 KA_TRACE(20, (
"GOMP_single_copy_end: T#%d\n", gtid));
215 __kmp_team_from_gtid(gtid)->t.t_copypriv_data = data;
216 #if OMPT_SUPPORT && OMPT_OPTIONAL 217 omp_frame_t *ompt_frame;
218 if (ompt_enabled.enabled) {
219 __ompt_get_task_info_internal(0, NULL, NULL, &ompt_frame, NULL, NULL);
220 ompt_frame->enter_frame = OMPT_GET_FRAME_ADDRESS(1);
221 OMPT_STORE_RETURN_ADDRESS(gtid);
224 __kmp_barrier(bs_plain_barrier, gtid, FALSE, 0, NULL, NULL);
225 #if OMPT_SUPPORT && OMPT_OPTIONAL 226 if (ompt_enabled.enabled) {
227 OMPT_STORE_RETURN_ADDRESS(gtid);
230 __kmp_barrier(bs_plain_barrier, gtid, FALSE, 0, NULL, NULL);
231 #if OMPT_SUPPORT && OMPT_OPTIONAL 232 if (ompt_enabled.enabled) {
233 ompt_frame->enter_frame = NULL;
// GOMP_ordered_start entry point: obtains the gtid with
// __kmp_entry_gtid(), traces the call and, in OMPT builds, invokes
// OMPT_STORE_RETURN_ADDRESS(gtid).
// NOTE(review): the call that enters the ordered region is not visible in
// this listing.
238 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_ORDERED_START)(void) {
239 int gtid = __kmp_entry_gtid();
240 MKLOC(loc,
"GOMP_ordered_start");
241 KA_TRACE(20, (
"GOMP_ordered_start: T#%d\n", gtid));
242 #if OMPT_SUPPORT && OMPT_OPTIONAL 243 OMPT_STORE_RETURN_ADDRESS(gtid);
// GOMP_ordered_end entry point: obtains the gtid with __kmp_get_gtid(),
// traces the call and, in OMPT builds, invokes
// OMPT_STORE_RETURN_ADDRESS(gtid).
// The trace message names this routine ("GOMP_ordered_end"); it previously
// printed "GOMP_ordered_start", which made debug traces of ordered regions
// show two consecutive "start" events and no "end".
// NOTE(review): the call that leaves the ordered region is not visible in
// this listing.
248 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_ORDERED_END)(void) {
249 int gtid = __kmp_get_gtid();
250 MKLOC(loc,
"GOMP_ordered_end");
251 KA_TRACE(20, (
"GOMP_ordered_end: T#%d\n", gtid));
252 #if OMPT_SUPPORT && OMPT_OPTIONAL 253 OMPT_STORE_RETURN_ADDRESS(gtid);
// Dispatch helper selection: on KMP_ARCH_X86 / KMP_ARCH_ARM / KMP_ARCH_MIPS
// the KMP_DISPATCH_* macros map to the 4-byte dispatch routines; a second set
// of definitions maps them to the 8-byte routines (presumably the #else
// branch, which this listing does not show). The *_ULL macros always map to
// the unsigned 8-byte routines.
//
// __kmp_GOMP_microtask_wrapper: wrapper invoked for each thread of a GOMP
// parallel region.
// gtid, npr: pointers supplied by the runtime (global thread id; `npr` is not
//            used in the visible lines).
// task:      the outlined GOMP function taking a single void* argument.
// With OMPT enabled, it saves the thread's OMPT state, switches it to
// omp_state_work_parallel and records exit_frame before the task runs, then
// clears exit_frame and restores the saved state afterwards.
// NOTE(review): the remaining parameter(s) and the call to `task` are not
// visible in this listing.
263 #if KMP_ARCH_X86 || KMP_ARCH_ARM || KMP_ARCH_MIPS 264 #define KMP_DISPATCH_INIT __kmp_aux_dispatch_init_4 265 #define KMP_DISPATCH_FINI_CHUNK __kmp_aux_dispatch_fini_chunk_4 266 #define KMP_DISPATCH_NEXT __kmpc_dispatch_next_4 268 #define KMP_DISPATCH_INIT __kmp_aux_dispatch_init_8 269 #define KMP_DISPATCH_FINI_CHUNK __kmp_aux_dispatch_fini_chunk_8 270 #define KMP_DISPATCH_NEXT __kmpc_dispatch_next_8 273 #define KMP_DISPATCH_INIT_ULL __kmp_aux_dispatch_init_8u 274 #define KMP_DISPATCH_FINI_CHUNK_ULL __kmp_aux_dispatch_fini_chunk_8u 275 #define KMP_DISPATCH_NEXT_ULL __kmpc_dispatch_next_8u 283 __kmp_GOMP_microtask_wrapper(
int *gtid,
int *npr,
void (*task)(
void *),
287 omp_frame_t *ompt_frame;
288 omp_state_t enclosing_state;
290 if (ompt_enabled.enabled) {
292 thr = __kmp_threads[*gtid];
295 enclosing_state = thr->th.ompt_thread_info.state;
296 thr->th.ompt_thread_info.state = omp_state_work_parallel;
299 __ompt_get_task_info_internal(0, NULL, NULL, &ompt_frame, NULL, NULL);
300 ompt_frame->exit_frame = OMPT_GET_FRAME_ADDRESS(0);
307 if (ompt_enabled.enabled) {
309 ompt_frame->exit_frame = NULL;
312 thr->th.ompt_thread_info.state = enclosing_state;
// __kmp_GOMP_parallel_microtask_wrapper: per-thread wrapper for combined
// parallel + worksharing constructs.
// gtid, npr:   pointers supplied by the runtime.
// task, data:  outlined GOMP function and its argument.
// num_threads: requested team size as passed by the GOMP entry point.
// loc:         source-location descriptor forwarded to the dispatcher.
// Calls KMP_DISPATCH_INIT with the schedule and loop bounds before the task
// body, so that each thread's dispatch state is set up. OMPT handling mirrors
// __kmp_GOMP_microtask_wrapper: save/override the thread state, set
// exit_frame, then undo both.
// NOTE(review): the trailing parameters (schedule, start, end, incr,
// chunk_size) and the call to `task` are not visible in this listing.
321 __kmp_GOMP_parallel_microtask_wrapper(
int *gtid,
int *npr,
322 void (*task)(
void *),
void *data,
323 unsigned num_threads,
ident_t *loc,
329 KMP_DISPATCH_INIT(loc, *gtid, schedule, start, end, incr, chunk_size,
334 omp_frame_t *ompt_frame;
335 omp_state_t enclosing_state;
337 if (ompt_enabled.enabled) {
338 thr = __kmp_threads[*gtid];
340 enclosing_state = thr->th.ompt_thread_info.state;
341 thr->th.ompt_thread_info.state = omp_state_work_parallel;
344 __ompt_get_task_info_internal(0, NULL, NULL, &ompt_frame, NULL, NULL);
345 ompt_frame->exit_frame = OMPT_GET_FRAME_ADDRESS(0);
353 if (ompt_enabled.enabled) {
355 ompt_frame->exit_frame = NULL;
358 thr->th.ompt_thread_info.state = enclosing_state;
// __kmp_GOMP_fork_call: forks a team for a GOMP parallel construct.
// loc:            source-location descriptor.
// gtid:           global thread id of the forking thread.
// unwrapped_task: the user's outlined function (not used in the visible
//                 lines).
// wrapper:        microtask that the runtime invokes on every team thread.
// argc, ...:      number of variadic arguments, followed by the arguments
//                 themselves, forwarded to __kmp_fork_call.
// Calls __kmp_fork_call with fork_context_gnu and __kmp_invoke_task_func,
// then __kmp_run_before_invoked_task for the calling thread. With OMPT
// enabled it raises the implicit-task scope-begin callback with the team
// size and thread number, records thread_num in the task info and sets the
// thread state to omp_state_work_parallel.
// NOTE(review): the va_list handling, the use of `rc` and the remaining
// __kmp_fork_call arguments are not visible in this listing.
367 __kmp_GOMP_fork_call(
ident_t *loc,
int gtid,
void (*unwrapped_task)(
void *),
368 microtask_t wrapper,
int argc, ...) {
370 kmp_info_t *thr = __kmp_threads[gtid];
371 kmp_team_t *team = thr->th.th_team;
372 int tid = __kmp_tid_from_gtid(gtid);
377 rc = __kmp_fork_call(loc, gtid, fork_context_gnu, argc, wrapper,
378 __kmp_invoke_task_func,
379 #
if (KMP_ARCH_X86_64 || KMP_ARCH_ARM || KMP_ARCH_AARCH64) && KMP_OS_LINUX
389 __kmp_run_before_invoked_task(gtid, tid, thr, team);
394 if (ompt_enabled.enabled) {
395 ompt_team_info_t *team_info = __ompt_get_teaminfo(0, NULL);
396 ompt_task_info_t *task_info = __ompt_get_task_info_object(0);
399 if (ompt_enabled.ompt_callback_implicit_task) {
400 ompt_team_size = __kmp_team_from_gtid(gtid)->t.t_nproc;
401 ompt_callbacks.ompt_callback(ompt_callback_implicit_task)(
402 ompt_scope_begin, &(team_info->parallel_data),
403 &(task_info->task_data), ompt_team_size, __kmp_tid_from_gtid(gtid));
404 task_info->thread_num = __kmp_tid_from_gtid(gtid);
406 thr->th.ompt_thread_info.state = omp_state_work_parallel;
// __kmp_GOMP_serialized_parallel: starts a serialized (single-thread)
// parallel region.
// loc:  source-location descriptor.
// gtid: global thread id of the caller.
// task: the user's outlined function (not used in the visible lines).
// Invokes OMPT_STORE_RETURN_ADDRESS(gtid) and then
// __kmp_serialized_parallel(loc, gtid).
// NOTE(review): the preprocessor guard around the OMPT call, if any, is not
// visible in this listing.
411 static void __kmp_GOMP_serialized_parallel(
ident_t *loc, kmp_int32 gtid,
412 void (*task)(
void *)) {
414 OMPT_STORE_RETURN_ADDRESS(gtid);
416 __kmp_serialized_parallel(loc, gtid);
// GOMP_parallel_start entry point.
// task:        outlined function executed by the team.
// num_threads: requested team size; 0 leaves the runtime default in place
//              (only non-zero values are pushed via __kmp_push_num_threads).
// Either forks a real team through __kmp_GOMP_fork_call with
// __kmp_GOMP_microtask_wrapper, or falls back to
// __kmp_GOMP_serialized_parallel. With OMPT enabled, the parent task's
// enter_frame is set on entry and the new task's exit_frame is set after the
// region has been started.
// NOTE(review): the `data` parameter and the condition choosing between the
// fork and serialized paths are not visible in this listing.
419 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_PARALLEL_START)(void (*task)(
void *),
421 unsigned num_threads) {
422 int gtid = __kmp_entry_gtid();
425 omp_frame_t *parent_frame, *frame;
427 if (ompt_enabled.enabled) {
428 __ompt_get_task_info_internal(0, NULL, NULL, &parent_frame, NULL, NULL);
429 parent_frame->enter_frame = OMPT_GET_FRAME_ADDRESS(1);
430 OMPT_STORE_RETURN_ADDRESS(gtid);
434 MKLOC(loc,
"GOMP_parallel_start");
435 KA_TRACE(20, (
"GOMP_parallel_start: T#%d\n", gtid));
438 if (num_threads != 0) {
439 __kmp_push_num_threads(&loc, gtid, num_threads);
441 __kmp_GOMP_fork_call(&loc, gtid, task,
442 (microtask_t)__kmp_GOMP_microtask_wrapper, 2, task,
445 __kmp_GOMP_serialized_parallel(&loc, gtid, task);
449 if (ompt_enabled.enabled) {
450 __ompt_get_task_info_internal(0, NULL, NULL, &frame, NULL, NULL);
451 frame->exit_frame = OMPT_GET_FRAME_ADDRESS(1);
// GOMP_parallel_end entry point: closes the region opened by one of the
// GOMP parallel start routines.
// Reads the team size (for OMPT reporting), and when the current team is not
// serialized calls __kmp_run_after_invoked_task for this thread. With OMPT
// enabled the current task's exit_frame is cleared. __kmp_join_call is then
// invoked to join the team.
// NOTE(review): the declaration of `thr`, the serialized-team branch and the
// remaining __kmp_join_call arguments are not visible in this listing.
456 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_PARALLEL_END)(void) {
457 int gtid = __kmp_get_gtid();
459 int ompt_team_size = __kmp_team_from_gtid(gtid)->t.t_nproc;
461 thr = __kmp_threads[gtid];
463 MKLOC(loc,
"GOMP_parallel_end");
464 KA_TRACE(20, (
"GOMP_parallel_end: T#%d\n", gtid));
466 if (!thr->th.th_team->t.t_serialized) {
467 __kmp_run_after_invoked_task(gtid, __kmp_tid_from_gtid(gtid), thr,
471 if (ompt_enabled.enabled) {
475 OMPT_CUR_TASK_INFO(thr)->frame.exit_frame = NULL;
479 __kmp_join_call(&loc, gtid
// Loop worksharing entry points for `long` iteration variables.
//
// IF_OMPT_SUPPORT(code): expands to `code` or to nothing (two definitions,
// presumably selected by an OMPT preprocessor guard not shown here).
//
// LOOP_START(func, schedule): defines
//   int func(long lb, long ub, long str, long chunk_sz, long *p_lb, ...)
// When the iteration space is non-empty it initialises the dispatcher with an
// inclusive upper bound (ub - 1 for positive stride, ub + 1 otherwise),
// fetches the first chunk with KMP_DISPATCH_NEXT and converts *p_ub back to
// an exclusive bound by adding +1 / -1.
//
// LOOP_RUNTIME_START(func, schedule): same shape without a chunk_sz
// parameter; chunk_sz is a local and dispatch init is called with TRUE as
// its final argument.
//
// LOOP_NEXT(func, fini_code): defines int func(long *p_lb, long *p_ub); runs
// `fini_code`, fetches the next chunk and adjusts *p_ub by the sign of the
// returned stride.
//
// The instantiations below generate the static/dynamic/guided/runtime start
// and next routines; the ordered variants pass a KMP_DISPATCH_FINI_CHUNK call
// as fini_code.
// NOTE(review): several macro lines and instantiation arguments are elided
// from this listing.
515 #define IF_OMPT_SUPPORT(code) code 517 #define IF_OMPT_SUPPORT(code) 520 #define LOOP_START(func, schedule) \ 521 int func(long lb, long ub, long str, long chunk_sz, long *p_lb, \ 525 int gtid = __kmp_entry_gtid(); \ 528 (#func ": T#%d, lb 0x%lx, ub 0x%lx, str 0x%lx, chunk_sz 0x%lx\n", \ 529 gtid, lb, ub, str, chunk_sz)); \ 531 if ((str > 0) ? (lb < ub) : (lb > ub)) { \ 532 IF_OMPT_SUPPORT(OMPT_STORE_RETURN_ADDRESS(gtid);) \ 533 KMP_DISPATCH_INIT(&loc, gtid, (schedule), lb, \ 534 (str > 0) ? (ub - 1) : (ub + 1), str, chunk_sz, \ 535 (schedule) != kmp_sch_static); \ 536 IF_OMPT_SUPPORT(OMPT_STORE_RETURN_ADDRESS(gtid);) \ 537 status = KMP_DISPATCH_NEXT(&loc, gtid, NULL, (kmp_int *)p_lb, \ 538 (kmp_int *)p_ub, (kmp_int *)&stride); \ 540 KMP_DEBUG_ASSERT(stride == str); \ 541 *p_ub += (str > 0) ? 1 : -1; \ 548 (#func " exit: T#%d, *p_lb 0x%lx, *p_ub 0x%lx, returning %d\n", \ 549 gtid, *p_lb, *p_ub, status)); \ 553 #define LOOP_RUNTIME_START(func, schedule) \ 554 int func(long lb, long ub, long str, long *p_lb, long *p_ub) { \ 558 int gtid = __kmp_entry_gtid(); \ 561 (#func ": T#%d, lb 0x%lx, ub 0x%lx, str 0x%lx, chunk_sz %d\n", \ 562 gtid, lb, ub, str, chunk_sz)); \ 564 if ((str > 0) ? (lb < ub) : (lb > ub)) { \ 565 IF_OMPT_SUPPORT(OMPT_STORE_RETURN_ADDRESS(gtid);) \ 566 KMP_DISPATCH_INIT(&loc, gtid, (schedule), lb, \ 567 (str > 0) ? (ub - 1) : (ub + 1), str, chunk_sz, TRUE); \ 568 IF_OMPT_SUPPORT(OMPT_STORE_RETURN_ADDRESS(gtid);) \ 569 status = KMP_DISPATCH_NEXT(&loc, gtid, NULL, (kmp_int *)p_lb, \ 570 (kmp_int *)p_ub, (kmp_int *)&stride); \ 572 KMP_DEBUG_ASSERT(stride == str); \ 573 *p_ub += (str > 0) ? 
1 : -1; \ 580 (#func " exit: T#%d, *p_lb 0x%lx, *p_ub 0x%lx, returning %d\n", \ 581 gtid, *p_lb, *p_ub, status)); \ 585 #define LOOP_NEXT(func, fini_code) \ 586 int func(long *p_lb, long *p_ub) { \ 589 int gtid = __kmp_get_gtid(); \ 591 KA_TRACE(20, (#func ": T#%d\n", gtid)); \ 593 IF_OMPT_SUPPORT(OMPT_STORE_RETURN_ADDRESS(gtid);) \ 594 fini_code status = KMP_DISPATCH_NEXT(&loc, gtid, NULL, (kmp_int *)p_lb, \ 595 (kmp_int *)p_ub, (kmp_int *)&stride); \ 597 *p_ub += (stride > 0) ? 1 : -1; \ 601 (#func " exit: T#%d, *p_lb 0x%lx, *p_ub 0x%lx, stride 0x%lx, " \ 603 gtid, *p_lb, *p_ub, stride, status)); \ 607 LOOP_START(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_STATIC_START),
kmp_sch_static)
608 LOOP_NEXT(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_STATIC_NEXT), {})
609 LOOP_START(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_DYNAMIC_START),
610 kmp_sch_dynamic_chunked)
611 LOOP_NEXT(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_DYNAMIC_NEXT), {})
612 LOOP_START(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_GUIDED_START),
614 LOOP_NEXT(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_GUIDED_NEXT), {})
615 LOOP_RUNTIME_START(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_RUNTIME_START),
617 LOOP_NEXT(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_RUNTIME_NEXT), {})
619 LOOP_START(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ORDERED_STATIC_START),
621 LOOP_NEXT(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ORDERED_STATIC_NEXT),
622 { KMP_DISPATCH_FINI_CHUNK(&loc, gtid); })
623 LOOP_START(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ORDERED_DYNAMIC_START),
624 kmp_ord_dynamic_chunked)
625 LOOP_NEXT(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ORDERED_DYNAMIC_NEXT),
626 { KMP_DISPATCH_FINI_CHUNK(&loc, gtid); })
627 LOOP_START(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ORDERED_GUIDED_START),
628 kmp_ord_guided_chunked)
629 LOOP_NEXT(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ORDERED_GUIDED_NEXT),
630 { KMP_DISPATCH_FINI_CHUNK(&loc, gtid); })
632 KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ORDERED_RUNTIME_START),
634 LOOP_NEXT(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ORDERED_RUNTIME_NEXT),
635 { KMP_DISPATCH_FINI_CHUNK(&loc, gtid); })
// GOMP_loop_end entry point: ends a worksharing loop with an implicit
// barrier. Traces entry, executes a plain barrier for the calling thread and
// traces exit. In OMPT builds with a tool enabled, the task's enter_frame is
// set before the barrier and cleared after it.
637 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_END)(void) {
638 int gtid = __kmp_get_gtid();
639 KA_TRACE(20, (
"GOMP_loop_end: T#%d\n", gtid))
641 #if OMPT_SUPPORT && OMPT_OPTIONAL 642 omp_frame_t *ompt_frame;
643 if (ompt_enabled.enabled) {
644 __ompt_get_task_info_internal(0, NULL, NULL, &ompt_frame, NULL, NULL);
645 ompt_frame->enter_frame = OMPT_GET_FRAME_ADDRESS(1);
646 OMPT_STORE_RETURN_ADDRESS(gtid);
649 __kmp_barrier(bs_plain_barrier, gtid, FALSE, 0, NULL, NULL);
650 #if OMPT_SUPPORT && OMPT_OPTIONAL 651 if (ompt_enabled.enabled) {
652 ompt_frame->enter_frame = NULL;
656 KA_TRACE(20, (
"GOMP_loop_end exit: T#%d\n", gtid))
// GOMP_loop_end_nowait entry point: the visible body only emits a trace
// message with the caller's gtid; no barrier is executed.
659 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_END_NOWAIT)(void) {
660 KA_TRACE(20, (
"GOMP_loop_end_nowait: T#%d\n", __kmp_get_gtid()))
// Loop worksharing entry points for `unsigned long long` iteration
// variables.
//
// LOOP_START_ULL(func, schedule): defines
//   int func(int up, unsigned long long lb, unsigned long long ub,
//            unsigned long long str, unsigned long long chunk_sz,
//            unsigned long long *p_lb, unsigned long long *p_ub)
// `str2` is the signed stride: +str when `up` is non-zero, -str otherwise.
// Dispatch is initialised with an inclusive upper bound and str2; the first
// chunk is fetched with KMP_DISPATCH_NEXT_ULL and *p_ub is then adjusted by
// +1 / -1.
//
// LOOP_RUNTIME_START_ULL(func, schedule): same without a chunk_sz parameter
// (a local chunk_sz of 0 is used).
//
// LOOP_NEXT_ULL(func, fini_code): fetches the next chunk and adjusts *p_ub by
// the sign of the returned stride.
//
// NOTE(review): `str` is unsigned, so the tests `(str > 0)` in the
// iteration-space check and in the `*p_ub +=` adjustment are true for every
// non-zero stride regardless of `up`; only the dispatch-init bound uses the
// signed `str2`. Confirm whether those tests were meant to use `str2`.
// NOTE(review): several macro lines and instantiation arguments are elided
// from this listing.
667 #define LOOP_START_ULL(func, schedule) \ 668 int func(int up, unsigned long long lb, unsigned long long ub, \ 669 unsigned long long str, unsigned long long chunk_sz, \ 670 unsigned long long *p_lb, unsigned long long *p_ub) { \ 672 long long str2 = up ? ((long long)str) : -((long long)str); \ 674 int gtid = __kmp_entry_gtid(); \ 680 ": T#%d, up %d, lb 0x%llx, ub 0x%llx, str 0x%llx, chunk_sz 0x%llx\n", \ 681 gtid, up, lb, ub, str, chunk_sz)); \ 683 if ((str > 0) ? (lb < ub) : (lb > ub)) { \ 684 KMP_DISPATCH_INIT_ULL(&loc, gtid, (schedule), lb, \ 685 (str2 > 0) ? (ub - 1) : (ub + 1), str2, chunk_sz, \ 686 (schedule) != kmp_sch_static); \ 688 KMP_DISPATCH_NEXT_ULL(&loc, gtid, NULL, (kmp_uint64 *)p_lb, \ 689 (kmp_uint64 *)p_ub, (kmp_int64 *)&stride); \ 691 KMP_DEBUG_ASSERT(stride == str2); \ 692 *p_ub += (str > 0) ? 1 : -1; \ 699 (#func " exit: T#%d, *p_lb 0x%llx, *p_ub 0x%llx, returning %d\n", \ 700 gtid, *p_lb, *p_ub, status)); \ 704 #define LOOP_RUNTIME_START_ULL(func, schedule) \ 705 int func(int up, unsigned long long lb, unsigned long long ub, \ 706 unsigned long long str, unsigned long long *p_lb, \ 707 unsigned long long *p_ub) { \ 709 long long str2 = up ? ((long long)str) : -((long long)str); \ 710 unsigned long long stride; \ 711 unsigned long long chunk_sz = 0; \ 712 int gtid = __kmp_entry_gtid(); \ 718 ": T#%d, up %d, lb 0x%llx, ub 0x%llx, str 0x%llx, chunk_sz 0x%llx\n", \ 719 gtid, up, lb, ub, str, chunk_sz)); \ 721 if ((str > 0) ? (lb < ub) : (lb > ub)) { \ 722 KMP_DISPATCH_INIT_ULL(&loc, gtid, (schedule), lb, \ 723 (str2 > 0) ? (ub - 1) : (ub + 1), str2, chunk_sz, \ 726 KMP_DISPATCH_NEXT_ULL(&loc, gtid, NULL, (kmp_uint64 *)p_lb, \ 727 (kmp_uint64 *)p_ub, (kmp_int64 *)&stride); \ 729 KMP_DEBUG_ASSERT((long long)stride == str2); \ 730 *p_ub += (str > 0) ? 
1 : -1; \ 737 (#func " exit: T#%d, *p_lb 0x%llx, *p_ub 0x%llx, returning %d\n", \ 738 gtid, *p_lb, *p_ub, status)); \ 742 #define LOOP_NEXT_ULL(func, fini_code) \ 743 int func(unsigned long long *p_lb, unsigned long long *p_ub) { \ 746 int gtid = __kmp_get_gtid(); \ 748 KA_TRACE(20, (#func ": T#%d\n", gtid)); \ 751 KMP_DISPATCH_NEXT_ULL(&loc, gtid, NULL, (kmp_uint64 *)p_lb, \ 752 (kmp_uint64 *)p_ub, (kmp_int64 *)&stride); \ 754 *p_ub += (stride > 0) ? 1 : -1; \ 758 (#func " exit: T#%d, *p_lb 0x%llx, *p_ub 0x%llx, stride 0x%llx, " \ 760 gtid, *p_lb, *p_ub, stride, status)); \ 764 LOOP_START_ULL(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ULL_STATIC_START),
766 LOOP_NEXT_ULL(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ULL_STATIC_NEXT), {})
767 LOOP_START_ULL(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ULL_DYNAMIC_START),
768 kmp_sch_dynamic_chunked)
769 LOOP_NEXT_ULL(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ULL_DYNAMIC_NEXT), {})
770 LOOP_START_ULL(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ULL_GUIDED_START),
772 LOOP_NEXT_ULL(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ULL_GUIDED_NEXT), {})
773 LOOP_RUNTIME_START_ULL(
774 KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ULL_RUNTIME_START), kmp_sch_runtime)
775 LOOP_NEXT_ULL(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ULL_RUNTIME_NEXT), {})
777 LOOP_START_ULL(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_STATIC_START),
779 LOOP_NEXT_ULL(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_STATIC_NEXT),
780 { KMP_DISPATCH_FINI_CHUNK_ULL(&loc, gtid); })
782 KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_DYNAMIC_START),
783 kmp_ord_dynamic_chunked)
784 LOOP_NEXT_ULL(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_DYNAMIC_NEXT),
785 { KMP_DISPATCH_FINI_CHUNK_ULL(&loc, gtid); })
786 LOOP_START_ULL(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_GUIDED_START),
787 kmp_ord_guided_chunked)
788 LOOP_NEXT_ULL(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_GUIDED_NEXT),
789 { KMP_DISPATCH_FINI_CHUNK_ULL(&loc, gtid); })
790 LOOP_RUNTIME_START_ULL(
791 KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_RUNTIME_START),
793 LOOP_NEXT_ULL(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_RUNTIME_NEXT),
794 { KMP_DISPATCH_FINI_CHUNK_ULL(&loc, gtid); })
// PARALLEL_LOOP_START(func, schedule, ompt_pre, ompt_post): defines
//   void func(void (*task)(void *), void *data, unsigned num_threads,
//             long lb, long ub, long str, long chunk_sz)
// the combined "parallel + loop" start routine. A non-zero num_threads is
// pushed to the runtime; the region is then started either through
// __kmp_GOMP_fork_call (9 forwarded arguments, upper bound made inclusive)
// or through __kmp_GOMP_serialized_parallel, and the calling thread
// initialises its own dispatch state with KMP_DISPATCH_INIT.
// NOTE(review): the uses of ompt_pre / ompt_post and the fork-vs-serialized
// condition are not visible in this listing.
800 #define PARALLEL_LOOP_START(func, schedule, ompt_pre, ompt_post) \
801 void func(
void (*task)(
void *),
void *data,
unsigned num_threads,
long lb, \
802 long ub,
long str,
long chunk_sz) { \
803 int gtid = __kmp_entry_gtid(); \
806 (#func
": T#%d, lb 0x%lx, ub 0x%lx, str 0x%lx, chunk_sz 0x%lx\n", \
807 gtid, lb, ub, str, chunk_sz)); \
812 if (num_threads != 0) { \
813 __kmp_push_num_threads(&loc, gtid, num_threads); \
815 __kmp_GOMP_fork_call(&loc, gtid, task, \
816 (microtask_t)__kmp_GOMP_parallel_microtask_wrapper, \
817 9, task, data, num_threads, &loc, (schedule), lb, \
818 (str > 0) ? (ub - 1) : (ub + 1), str, chunk_sz); \
819 IF_OMPT_SUPPORT(OMPT_STORE_RETURN_ADDRESS(gtid)); \
821 __kmp_GOMP_serialized_parallel(&loc, gtid, task); \
822 IF_OMPT_SUPPORT(OMPT_STORE_RETURN_ADDRESS(gtid)); \
825 KMP_DISPATCH_INIT(&loc, gtid, (schedule), lb, \
826 (str > 0) ? (ub - 1) : (ub + 1), str, chunk_sz, \
831 KA_TRACE(20, (#func
" exit: T#%d\n", gtid)); \
// OMPT hooks for the combined parallel-loop entry points.
// In OMPT builds, OMPT_LOOP_PRE() declares `parent_frame` and, when a tool is
// enabled, sets the parent task's enter_frame and stores the return address;
// OMPT_LOOP_POST() clears that enter_frame again. Both macros are also
// defined empty (presumably in the non-OMPT branch, not shown here).
// The lines that follow instantiate PARALLEL_LOOP_START for the static,
// dynamic, guided and runtime schedules.
// NOTE(review): the PARALLEL_LOOP_START( openers and some schedule arguments
// are elided from this listing.
834 #if OMPT_SUPPORT && OMPT_OPTIONAL 836 #define OMPT_LOOP_PRE() \ 837 omp_frame_t *parent_frame; \ 838 if (ompt_enabled.enabled) { \ 839 __ompt_get_task_info_internal(0, NULL, NULL, &parent_frame, NULL, NULL); \ 840 parent_frame->enter_frame = OMPT_GET_FRAME_ADDRESS(1); \ 841 OMPT_STORE_RETURN_ADDRESS(gtid); \ 844 #define OMPT_LOOP_POST() \ 845 if (ompt_enabled.enabled) { \ 846 parent_frame->enter_frame = NULL; \ 851 #define OMPT_LOOP_PRE() 853 #define OMPT_LOOP_POST() 858 KMP_EXPAND_NAME(KMP_API_NAME_GOMP_PARALLEL_LOOP_STATIC_START),
861 KMP_EXPAND_NAME(KMP_API_NAME_GOMP_PARALLEL_LOOP_DYNAMIC_START),
862 kmp_sch_dynamic_chunked, OMPT_LOOP_PRE, OMPT_LOOP_POST)
864 KMP_EXPAND_NAME(KMP_API_NAME_GOMP_PARALLEL_LOOP_GUIDED_START),
867 KMP_EXPAND_NAME(KMP_API_NAME_GOMP_PARALLEL_LOOP_RUNTIME_START),
868 kmp_sch_runtime, OMPT_LOOP_PRE, OMPT_LOOP_POST)
// GOMP_task entry point: creates and runs/enqueues an explicit task.
// func:       task body, called with a pointer to the task's data block.
// data:       caller's argument block to be copied into the task.
// copy_func:  optional copy routine (dest, src); a raw KMP_MEMCPY of arg_size
//             bytes is the visible alternative.
// arg_size:   size in bytes of the argument block.
// arg_align:  required alignment of the argument block inside the task.
// if_cond:    value of the task's `if` clause (its test is not visible here).
// gomp_flags: bit 0 clear => task is marked tied; bit 1 => final; bit 3 (8)
//             => a dependence list is supplied.
//
// The task is allocated with arg_size + arg_align - 1 bytes of shared space
// so that task->shareds can be rounded up to a multiple of arg_align.
// For dependences, depend[0] is the total count, depend[1] the number of
// "out" entries, and depend[2..] the addresses; every entry is flagged `in`
// and the first `nout` are additionally flagged `out`.
// The visible non-deferred path brackets the task with
// __kmpc_omp_task_begin_if0 / __kmpc_omp_task_complete_if0, saving and
// restoring the thread's OMPT info around it.
// NOTE(review): the trailing `depend` parameter, the if_cond branch, the
// direct call to func and the dependent-task submission call are not visible
// in this listing. dep_list is a variable-length array sized by ndeps, which
// comes from the caller.
872 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_TASK)(void (*func)(
void *),
void *data,
873 void (*copy_func)(
void *,
void *),
874 long arg_size,
long arg_align,
875 bool if_cond,
unsigned gomp_flags
881 MKLOC(loc,
"GOMP_task");
882 int gtid = __kmp_entry_gtid();
884 kmp_tasking_flags_t *input_flags = (kmp_tasking_flags_t *)&flags;
886 KA_TRACE(20, (
"GOMP_task: T#%d\n", gtid));
889 if (!(gomp_flags & 1)) {
890 input_flags->tiedness = 1;
893 if (gomp_flags & 2) {
894 input_flags->final = 1;
896 input_flags->native = 1;
903 kmp_task_t *task = __kmp_task_alloc(
904 &loc, gtid, input_flags,
sizeof(kmp_task_t),
905 arg_size ? arg_size + arg_align - 1 : 0, (kmp_routine_entry_t)func);
909 task->shareds = (
void *)((((
size_t)task->shareds) + arg_align - 1) /
910 arg_align * arg_align);
915 (*copy_func)(task->shareds, data);
917 KMP_MEMCPY(task->shareds, data, arg_size);
922 kmp_taskdata_t *current_task;
923 if (ompt_enabled.enabled) {
924 OMPT_STORE_RETURN_ADDRESS(gtid);
925 current_task = __kmp_threads[gtid]->th.th_current_task;
926 current_task->ompt_task_info.frame.enter_frame = OMPT_GET_FRAME_ADDRESS(1);
932 if (gomp_flags & 8) {
934 const size_t ndeps = (kmp_intptr_t)depend[0];
935 const size_t nout = (kmp_intptr_t)depend[1];
936 kmp_depend_info_t dep_list[ndeps];
938 for (
size_t i = 0U; i < ndeps; i++) {
939 dep_list[i].base_addr = (kmp_intptr_t)depend[2U + i];
940 dep_list[i].len = 0U;
941 dep_list[i].flags.in = 1;
942 dep_list[i].flags.out = (i < nout);
947 __kmpc_omp_task(&loc, gtid, task);
951 ompt_thread_info_t oldInfo;
953 kmp_taskdata_t *taskdata;
954 kmp_taskdata_t *current_task;
955 if (ompt_enabled.enabled) {
957 thread = __kmp_threads[gtid];
958 taskdata = KMP_TASK_TO_TASKDATA(task);
959 oldInfo = thread->th.ompt_thread_info;
960 thread->th.ompt_thread_info.wait_id = 0;
961 thread->th.ompt_thread_info.state = omp_state_work_parallel;
962 taskdata->ompt_task_info.frame.exit_frame = OMPT_GET_FRAME_ADDRESS(0);
963 OMPT_STORE_RETURN_ADDRESS(gtid);
967 __kmpc_omp_task_begin_if0(&loc, gtid, task);
969 __kmpc_omp_task_complete_if0(&loc, gtid, task);
972 if (ompt_enabled.enabled) {
973 thread->th.ompt_thread_info = oldInfo;
974 taskdata->ompt_task_info.frame.exit_frame = NULL;
979 if (ompt_enabled.enabled) {
980 current_task->ompt_task_info.frame.enter_frame = NULL;
984 KA_TRACE(20, (
"GOMP_task exit: T#%d\n", gtid));
// GOMP_taskwait entry point: obtains the gtid, stores the return address for
// OMPT when a tool is enabled, then forwards to __kmpc_omp_taskwait with
// trace messages on entry and exit.
987 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_TASKWAIT)(void) {
988 MKLOC(loc,
"GOMP_taskwait");
989 int gtid = __kmp_entry_gtid();
992 if (ompt_enabled.enabled)
993 OMPT_STORE_RETURN_ADDRESS(gtid);
996 KA_TRACE(20, (
"GOMP_taskwait: T#%d\n", gtid));
998 __kmpc_omp_taskwait(&loc, gtid);
1000 KA_TRACE(20, (
"GOMP_taskwait exit: T#%d\n", gtid));
// GOMP_sections_start entry point.
// count: number of sections in the construct.
// Models the sections as a dynamically scheduled loop over 1..count with
// chunk size 1 (kmp_nm_dynamic_chunked) and fetches the first chunk. A
// successful fetch must yield exactly one iteration (lb == ub, lb > 0,
// stride == 1).
// Returns lb cast to unsigned, i.e. the 1-based section number to run.
// NOTE(review): the declaration of `status` and the handling of a failed
// fetch (presumably lb is set to 0) are not visible in this listing.
1012 unsigned KMP_EXPAND_NAME(KMP_API_NAME_GOMP_SECTIONS_START)(
unsigned count) {
1014 kmp_int lb, ub, stride;
1015 int gtid = __kmp_entry_gtid();
1016 MKLOC(loc,
"GOMP_sections_start");
1017 KA_TRACE(20, (
"GOMP_sections_start: T#%d\n", gtid));
1019 KMP_DISPATCH_INIT(&loc, gtid, kmp_nm_dynamic_chunked, 1, count, 1, 1, TRUE);
1021 status = KMP_DISPATCH_NEXT(&loc, gtid, NULL, &lb, &ub, &stride);
1023 KMP_DEBUG_ASSERT(stride == 1);
1024 KMP_DEBUG_ASSERT(lb > 0);
1025 KMP_ASSERT(lb == ub);
1030 KA_TRACE(20, (
"GOMP_sections_start exit: T#%d returning %u\n", gtid,
1032 return (
unsigned)lb;
// GOMP_sections_next entry point: fetches the next section for the calling
// thread from the dispatcher set up by the sections start routine.
// A successful fetch must yield exactly one iteration (lb == ub, lb > 0,
// stride == 1).
// Returns lb cast to unsigned, i.e. the 1-based section number to run.
// NOTE(review): the declaration of `status` and the handling of a failed
// fetch (presumably lb is set to 0) are not visible in this listing.
1035 unsigned KMP_EXPAND_NAME(KMP_API_NAME_GOMP_SECTIONS_NEXT)(void) {
1037 kmp_int lb, ub, stride;
1038 int gtid = __kmp_get_gtid();
1039 MKLOC(loc,
"GOMP_sections_next");
1040 KA_TRACE(20, (
"GOMP_sections_next: T#%d\n", gtid));
1043 OMPT_STORE_RETURN_ADDRESS(gtid);
1046 status = KMP_DISPATCH_NEXT(&loc, gtid, NULL, &lb, &ub, &stride);
1048 KMP_DEBUG_ASSERT(stride == 1);
1049 KMP_DEBUG_ASSERT(lb > 0);
1050 KMP_ASSERT(lb == ub);
1056 20, (
"GOMP_sections_next exit: T#%d returning %u\n", gtid, (
unsigned)lb));
1057 return (
unsigned)lb;
// GOMP_parallel_sections_start entry point (combined parallel + sections).
// task, data:  outlined function and its argument.
// num_threads: requested team size; only non-zero values are pushed.
// count:       number of sections.
// Starts the region through __kmp_GOMP_fork_call (forwarding a dynamic
// schedule over 1..count with chunk 1) or through
// __kmp_GOMP_serialized_parallel, then initialises the calling thread's own
// dispatch state. With OMPT enabled, the parent task's enter_frame is set on
// entry and cleared once the region has been started.
// NOTE(review): the fork-vs-serialized condition is not visible in this
// listing.
1060 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_PARALLEL_SECTIONS_START)(
1061 void (*task)(
void *),
void *data,
unsigned num_threads,
unsigned count) {
1062 int gtid = __kmp_entry_gtid();
1065 omp_frame_t *parent_frame;
1067 if (ompt_enabled.enabled) {
1068 __ompt_get_task_info_internal(0, NULL, NULL, &parent_frame, NULL, NULL);
1069 parent_frame->enter_frame = OMPT_GET_FRAME_ADDRESS(1);
1070 OMPT_STORE_RETURN_ADDRESS(gtid);
1074 MKLOC(loc,
"GOMP_parallel_sections_start");
1075 KA_TRACE(20, (
"GOMP_parallel_sections_start: T#%d\n", gtid));
1078 if (num_threads != 0) {
1079 __kmp_push_num_threads(&loc, gtid, num_threads);
1081 __kmp_GOMP_fork_call(&loc, gtid, task,
1082 (microtask_t)__kmp_GOMP_parallel_microtask_wrapper, 9,
1083 task, data, num_threads, &loc, kmp_nm_dynamic_chunked,
1084 (kmp_int)1, (kmp_int)count, (kmp_int)1, (kmp_int)1);
1086 __kmp_GOMP_serialized_parallel(&loc, gtid, task);
1090 if (ompt_enabled.enabled) {
1091 parent_frame->enter_frame = NULL;
1095 KMP_DISPATCH_INIT(&loc, gtid, kmp_nm_dynamic_chunked, 1, count, 1, 1, TRUE);
1097 KA_TRACE(20, (
"GOMP_parallel_sections_start exit: T#%d\n", gtid));
// GOMP_sections_end entry point: ends a sections construct with an implicit
// barrier. Traces entry, executes a plain barrier for the calling thread and
// traces exit. With OMPT enabled, the task's enter_frame is set before the
// barrier and cleared after it.
1100 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_SECTIONS_END)(void) {
1101 int gtid = __kmp_get_gtid();
1102 KA_TRACE(20, (
"GOMP_sections_end: T#%d\n", gtid))
1105 omp_frame_t *ompt_frame;
1106 if (ompt_enabled.enabled) {
1107 __ompt_get_task_info_internal(0, NULL, NULL, &ompt_frame, NULL, NULL);
1108 ompt_frame->enter_frame = OMPT_GET_FRAME_ADDRESS(1);
1109 OMPT_STORE_RETURN_ADDRESS(gtid);
1112 __kmp_barrier(bs_plain_barrier, gtid, FALSE, 0, NULL, NULL);
1114 if (ompt_enabled.enabled) {
1115 ompt_frame->enter_frame = NULL;
1119 KA_TRACE(20, (
"GOMP_sections_end exit: T#%d\n", gtid))
// GOMP_sections_end_nowait entry point: the visible body only emits a trace
// message with the caller's gtid; no barrier is executed.
1122 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_SECTIONS_END_NOWAIT)(void) {
1123 KA_TRACE(20, (
"GOMP_sections_end_nowait: T#%d\n", __kmp_get_gtid()))
// GOMP_taskyield entry point: the visible body only emits a trace message
// with the caller's gtid.
// NOTE(review): any further body lines are not visible in this listing.
1127 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_TASKYIELD)(void) {
1128 KA_TRACE(20, (
"GOMP_taskyield: T#%d\n", __kmp_get_gtid()))
// GOMP_parallel entry point (GOMP 4.0 combined start + body + end).
// task:        outlined function executed by the team.
// num_threads: requested team size; only non-zero values are pushed.
// flags:       cast to kmp_proc_bind_t and pushed as the proc-bind policy.
// Starts the region through __kmp_GOMP_fork_call or
// __kmp_GOMP_serialized_parallel and then closes it by calling the
// GOMP_parallel_end entry point. With OMPT enabled, the parent task's
// enter_frame and the new task's exit_frame are set around the region and
// both are cleared after GOMP_parallel_end returns.
// NOTE(review): the `data` parameter, the fork-vs-serialized condition, the
// condition guarding the proc-bind push and the direct call to task(data)
// are not visible in this listing.
1132 #if OMP_40_ENABLED // these are new GOMP_4.0 entry points 1134 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_PARALLEL)(void (*task)(
void *),
1136 unsigned num_threads,
1137 unsigned int flags) {
1138 int gtid = __kmp_entry_gtid();
1139 MKLOC(loc,
"GOMP_parallel");
1140 KA_TRACE(20, (
"GOMP_parallel: T#%d\n", gtid));
1143 ompt_task_info_t *parent_task_info, *task_info;
1144 if (ompt_enabled.enabled) {
1145 parent_task_info = __ompt_get_task_info_object(0);
1146 parent_task_info->frame.enter_frame = OMPT_GET_FRAME_ADDRESS(1);
1147 OMPT_STORE_RETURN_ADDRESS(gtid);
1151 if (num_threads != 0) {
1152 __kmp_push_num_threads(&loc, gtid, num_threads);
1155 __kmp_push_proc_bind(&loc, gtid, (kmp_proc_bind_t)flags);
1157 __kmp_GOMP_fork_call(&loc, gtid, task,
1158 (microtask_t)__kmp_GOMP_microtask_wrapper, 2, task,
1161 __kmp_GOMP_serialized_parallel(&loc, gtid, task);
1164 if (ompt_enabled.enabled) {
1165 task_info = __ompt_get_task_info_object(0);
1166 task_info->frame.exit_frame = OMPT_GET_FRAME_ADDRESS(0);
1171 if (ompt_enabled.enabled) {
1172 OMPT_STORE_RETURN_ADDRESS(gtid);
1175 KMP_EXPAND_NAME(KMP_API_NAME_GOMP_PARALLEL_END)();
1177 if (ompt_enabled.enabled) {
1178 task_info->frame.exit_frame = NULL;
1179 parent_task_info->frame.enter_frame = NULL;
// GOMP_parallel_sections entry point (GOMP 4.0 combined parallel sections).
// task:        outlined function executed by the team.
// num_threads: requested team size; only non-zero values are pushed.
// Starts the region through __kmp_GOMP_fork_call (dynamic schedule over
// 1..count with chunk 1) or __kmp_GOMP_serialized_parallel, initialises the
// calling thread's dispatch state and then closes the region by calling the
// GOMP_parallel_end entry point.
// NOTE(review): the `data`, `count` and `flags` parameters, the
// fork-vs-serialized condition and the direct call to task(data) are not
// visible in this listing.
1184 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_PARALLEL_SECTIONS)(void (*task)(
void *),
1186 unsigned num_threads,
1189 int gtid = __kmp_entry_gtid();
1190 MKLOC(loc,
"GOMP_parallel_sections");
1191 KA_TRACE(20, (
"GOMP_parallel_sections: T#%d\n", gtid));
1194 OMPT_STORE_RETURN_ADDRESS(gtid);
1198 if (num_threads != 0) {
1199 __kmp_push_num_threads(&loc, gtid, num_threads);
1202 __kmp_push_proc_bind(&loc, gtid, (kmp_proc_bind_t)flags);
1204 __kmp_GOMP_fork_call(&loc, gtid, task,
1205 (microtask_t)__kmp_GOMP_parallel_microtask_wrapper, 9,
1206 task, data, num_threads, &loc, kmp_nm_dynamic_chunked,
1207 (kmp_int)1, (kmp_int)count, (kmp_int)1, (kmp_int)1);
1209 __kmp_GOMP_serialized_parallel(&loc, gtid, task);
1213 OMPT_STORE_RETURN_ADDRESS(gtid);
1216 KMP_DISPATCH_INIT(&loc, gtid, kmp_nm_dynamic_chunked, 1, count, 1, 1, TRUE);
1219 KMP_EXPAND_NAME(KMP_API_NAME_GOMP_PARALLEL_END)();
1220 KA_TRACE(20, (
"GOMP_parallel_sections exit: T#%d\n", gtid));
// PARALLEL_LOOP(func, schedule, ompt_pre, ompt_post): defines
//   void func(void (*task)(void *), void *data, unsigned num_threads,
//             long lb, long ub, long str, long chunk_sz, unsigned flags)
// the GOMP 4.0 combined "parallel loop" routine. When __kmpc_ok_to_fork()
// allows it and num_threads != 1, it pushes a non-zero num_threads and the
// proc-bind policy taken from `flags`, then forks through
// __kmp_GOMP_fork_call; otherwise it runs __kmp_GOMP_serialized_parallel.
// The calling thread then initialises its dispatch state and the region is
// closed with the GOMP_parallel_end entry point.
// Instantiated below for the static, dynamic, guided and runtime schedules.
// NOTE(review): the uses of ompt_pre / ompt_post, the call to task(data) and
// some instantiation arguments are elided from this listing.
1223 #define PARALLEL_LOOP(func, schedule, ompt_pre, ompt_post) \ 1224 void func(void (*task)(void *), void *data, unsigned num_threads, long lb, \ 1225 long ub, long str, long chunk_sz, unsigned flags) { \ 1226 int gtid = __kmp_entry_gtid(); \ 1227 MKLOC(loc, #func); \ 1229 (#func ": T#%d, lb 0x%lx, ub 0x%lx, str 0x%lx, chunk_sz 0x%lx\n", \ 1230 gtid, lb, ub, str, chunk_sz)); \ 1233 if (__kmpc_ok_to_fork(&loc) && (num_threads != 1)) { \ 1234 if (num_threads != 0) { \ 1235 __kmp_push_num_threads(&loc, gtid, num_threads); \ 1238 __kmp_push_proc_bind(&loc, gtid, (kmp_proc_bind_t)flags); \ 1240 __kmp_GOMP_fork_call(&loc, gtid, task, \ 1241 (microtask_t)__kmp_GOMP_parallel_microtask_wrapper, \ 1242 9, task, data, num_threads, &loc, (schedule), lb, \ 1243 (str > 0) ? (ub - 1) : (ub + 1), str, chunk_sz); \ 1245 __kmp_GOMP_serialized_parallel(&loc, gtid, task); \ 1248 IF_OMPT_SUPPORT(OMPT_STORE_RETURN_ADDRESS(gtid);) \ 1249 KMP_DISPATCH_INIT(&loc, gtid, (schedule), lb, \ 1250 (str > 0) ? (ub - 1) : (ub + 1), str, chunk_sz, \ 1251 (schedule) != kmp_sch_static); \ 1253 KMP_EXPAND_NAME(KMP_API_NAME_GOMP_PARALLEL_END)(); \ 1256 KA_TRACE(20, (#func " exit: T#%d\n", gtid)); \ 1259 PARALLEL_LOOP(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_PARALLEL_LOOP_STATIC),
1261 PARALLEL_LOOP(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_PARALLEL_LOOP_DYNAMIC),
1262 kmp_sch_dynamic_chunked, OMPT_LOOP_PRE, OMPT_LOOP_POST)
1263 PARALLEL_LOOP(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_PARALLEL_LOOP_GUIDED),
1265 PARALLEL_LOOP(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_PARALLEL_LOOP_RUNTIME),
1266 kmp_sch_runtime, OMPT_LOOP_PRE, OMPT_LOOP_POST)
// GOMP_taskgroup_start entry point: obtains the gtid, traces the call,
// stores the return address for OMPT when a tool is enabled, and forwards to
// __kmpc_taskgroup.
1268 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_TASKGROUP_START)(void) {
1269 int gtid = __kmp_entry_gtid();
1270 MKLOC(loc,
"GOMP_taskgroup_start");
1271 KA_TRACE(20, (
"GOMP_taskgroup_start: T#%d\n", gtid));
1274 if (ompt_enabled.enabled)
1275 OMPT_STORE_RETURN_ADDRESS(gtid);
1278 __kmpc_taskgroup(&loc, gtid);
// GOMP_taskgroup_end entry point: obtains the gtid, traces the call, stores
// the return address for OMPT when a tool is enabled, and forwards to
// __kmpc_end_taskgroup.
1283 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_TASKGROUP_END)(void) {
1284 int gtid = __kmp_get_gtid();
1285 MKLOC(loc,
"GOMP_taskgroup_end");
1286 KA_TRACE(20, (
"GOMP_taskgroup_end: T#%d\n", gtid));
1289 if (ompt_enabled.enabled)
1290 OMPT_STORE_RETURN_ADDRESS(gtid);
1293 __kmpc_end_taskgroup(&loc, gtid);
// __kmp_gomp_to_omp_cancellation_kind: translates a GOMP cancellation-kind
// value into the runtime's kmp_int32 kind.
// gomp_kind: GOMP encoding of the construct being cancelled.
// The switch assigns cancel_parallel, cancel_loop, cancel_sections or
// cancel_taskgroup; cncl_kind starts at 0, so an unmatched value maps to 0.
// NOTE(review): the case labels, return type and return statement are not
// visible in this listing.
1302 __kmp_gomp_to_omp_cancellation_kind(
int gomp_kind) {
1303 kmp_int32 cncl_kind = 0;
1304 switch (gomp_kind) {
1306 cncl_kind = cancel_parallel;
1309 cncl_kind = cancel_loop;
1312 cncl_kind = cancel_sections;
1315 cncl_kind = cancel_taskgroup;
// GOMP_cancellation_point entry point.
// which: GOMP encoding of the construct kind to test.
// Raises KMP_FATAL(NoGompCancellation) when __kmp_omp_cancellation is set.
// The remaining visible path translates `which` with
// __kmp_gomp_to_omp_cancellation_kind and returns the result of
// __kmpc_cancellationpoint.
// NOTE(review): the branch taken when cancellation is disabled is not
// visible in this listing.
1321 bool KMP_EXPAND_NAME(KMP_API_NAME_GOMP_CANCELLATION_POINT)(
int which) {
1322 if (__kmp_omp_cancellation) {
1323 KMP_FATAL(NoGompCancellation);
1325 int gtid = __kmp_get_gtid();
1326 MKLOC(loc,
"GOMP_cancellation_point");
1327 KA_TRACE(20, (
"GOMP_cancellation_point: T#%d\n", gtid));
1329 kmp_int32 cncl_kind = __kmp_gomp_to_omp_cancellation_kind(which);
1331 return __kmpc_cancellationpoint(&loc, gtid, cncl_kind);
// GOMP_barrier_cancel entry point.
// Raises KMP_FATAL(NoGompCancellation) when __kmp_omp_cancellation is set,
// and then raises it again unconditionally.
// NOTE(review): if KMP_FATAL does not return, the second call makes the
// gtid lookup, trace and __kmpc_cancel_barrier call below unreachable.
// Confirm whether this is a deliberate "not supported" marker or a leftover
// duplicate before relying on the return value.
1334 bool KMP_EXPAND_NAME(KMP_API_NAME_GOMP_BARRIER_CANCEL)(void) {
1335 if (__kmp_omp_cancellation) {
1336 KMP_FATAL(NoGompCancellation);
1338 KMP_FATAL(NoGompCancellation);
1339 int gtid = __kmp_get_gtid();
1340 MKLOC(loc,
"GOMP_barrier_cancel");
1341 KA_TRACE(20, (
"GOMP_barrier_cancel: T#%d\n", gtid));
1343 return __kmpc_cancel_barrier(&loc, gtid);
// GOMP_cancel entry point.
// which:     GOMP encoding of the construct kind to cancel.
// do_cancel: when FALSE the call degrades to a cancellation-point check via
//            the GOMP_cancellation_point entry point; otherwise the result
//            of __kmpc_cancel for the translated kind is returned.
// Raises KMP_FATAL(NoGompCancellation) when __kmp_omp_cancellation is set.
// NOTE(review): the branch taken when cancellation is disabled is not
// visible in this listing.
1346 bool KMP_EXPAND_NAME(KMP_API_NAME_GOMP_CANCEL)(
int which,
bool do_cancel) {
1347 if (__kmp_omp_cancellation) {
1348 KMP_FATAL(NoGompCancellation);
1353 int gtid = __kmp_get_gtid();
1354 MKLOC(loc,
"GOMP_cancel");
1355 KA_TRACE(20, (
"GOMP_cancel: T#%d\n", gtid));
1357 kmp_int32 cncl_kind = __kmp_gomp_to_omp_cancellation_kind(which);
1359 if (do_cancel == FALSE) {
1360 return KMP_EXPAND_NAME(KMP_API_NAME_GOMP_CANCELLATION_POINT)(which);
1362 return __kmpc_cancel(&loc, gtid, cncl_kind);
// GOMP_sections_end_cancel entry point.
// Issues KMP_FATAL(NoGompCancellation) when __kmp_omp_cancellation is set;
// otherwise returns the result of __kmpc_cancel_barrier() for the calling
// thread's global id.
1366 bool KMP_EXPAND_NAME(KMP_API_NAME_GOMP_SECTIONS_END_CANCEL)(void) {
1367 if (__kmp_omp_cancellation) {
1368 KMP_FATAL(NoGompCancellation);
1370 int gtid = __kmp_get_gtid();
1371 MKLOC(loc,
"GOMP_sections_end_cancel");
1372 KA_TRACE(20, (
"GOMP_sections_end_cancel: T#%d\n", gtid));
1374 return __kmpc_cancel_barrier(&loc, gtid);
// GOMP_loop_end_cancel entry point.
// Same shape as the sections-end variant: KMP_FATAL(NoGompCancellation) when
// __kmp_omp_cancellation is set, otherwise the return value comes from
// __kmpc_cancel_barrier().
1377 bool KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_END_CANCEL)(void) {
1378 if (__kmp_omp_cancellation) {
1379 KMP_FATAL(NoGompCancellation);
1381 int gtid = __kmp_get_gtid();
1382 MKLOC(loc,
"GOMP_loop_end_cancel");
1383 KA_TRACE(20, (
"GOMP_loop_end_cancel: T#%d\n", gtid));
1385 return __kmpc_cancel_barrier(&loc, gtid);
// GOMP_target entry point. Takes a device number, the target routine `fn`,
// an opaque openmp_target pointer and the mapping description (mapnum,
// hostaddrs, kinds).
// NOTE(review): no statement of the body is visible here; presumably an
// empty stub kept only so the symbol exists -- confirm.
1389 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_TARGET)(
int device, void (*fn)(
void *),
1390 const void *openmp_target,
1391 size_t mapnum,
void **hostaddrs,
1393 unsigned char *kinds) {
// GOMP_target_data entry point. Receives the device number, an opaque
// openmp_target pointer and the mapping arrays (mapnum entries of hostaddrs,
// sizes and kinds).
// NOTE(review): no statement of the body is visible here; presumably an
// empty stub -- confirm.
1397 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_TARGET_DATA)(
1398 int device,
const void *openmp_target,
size_t mapnum,
void **hostaddrs,
1399 size_t *sizes,
unsigned char *kinds) {
// GOMP_target_end_data entry point: takes no arguments and returns
// immediately without doing any work.
1403 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_TARGET_END_DATA)(void) {
return; }
// GOMP_target_update entry point. Same parameter list as the target-data
// entry point: device, opaque openmp_target pointer, and the mapnum /
// hostaddrs / sizes / kinds mapping arrays.
// NOTE(review): no statement of the body is visible here; presumably an
// empty stub -- confirm.
1405 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_TARGET_UPDATE)(
1406 int device,
const void *openmp_target,
size_t mapnum,
void **hostaddrs,
1407 size_t *sizes,
unsigned char *kinds) {
// GOMP_teams entry point, taking the requested number of teams and the
// per-team thread limit.
// NOTE(review): no statement of the body is visible here; presumably an
// empty stub -- confirm.
1411 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_TEAMS)(
unsigned int num_teams,
1412 unsigned int thread_limit) {
// __kmp_gomp_task_dup: task-duplication callback handed to __kmpc_taskloop
// by __GOMP_taskloop. It fetches the kmp_taskdata_t of `src` and, when that
// taskdata carries a td_copy_func, calls it with dest->shareds and
// src->shareds. last_private is not used by the visible statements.
1415 #endif // OMP_40_ENABLED 1421 static void __kmp_gomp_task_dup(kmp_task_t *dest, kmp_task_t *src,
1422 kmp_int32 last_private) {
1423 kmp_taskdata_t *taskdata = KMP_TASK_TO_TASKDATA(src);
1424 if (taskdata->td_copy_func) {
1425 (taskdata->td_copy_func)(dest->shareds, src->shareds);
// Shared implementation behind the GOMP_taskloop entry points, templated on
// the loop-bound type T.
//   func                 - task routine, passed to __kmp_task_alloc()
//   data                 - argument block; arg_size bytes are copied into the
//                          task's shareds
//   copy_func            - stored in the task's td_copy_func
//   arg_size, arg_align  - size and alignment of the argument block
//   gomp_flags           - bit field decoded below
//   num_tasks            - forwarded to __kmpc_taskloop() as kmp_uint64
//   priority             - only appears in the trace call in the visible code
//   start, end           - loop bounds written into the first two T-sized
//                          slots of the task's shareds
// `step` is forwarded to __kmpc_taskloop() as kmp_int64.
1433 template <
typename T>
1434 void __GOMP_taskloop(
void (*func)(
void *),
void *data,
1435 void (*copy_func)(
void *,
void *),
long arg_size,
1436 long arg_align,
unsigned gomp_flags,
1437 unsigned long num_tasks,
int priority, T start, T end,
1439 typedef void (*p_task_dup_t)(kmp_task_t *, kmp_task_t *, kmp_int32);
1440 MKLOC(loc,
"GOMP_taskloop");
1443 int gtid = __kmp_entry_gtid();
1444 kmp_int32 flags = 0;
// Decode gomp_flags: bit 10 -> if_val, bit 11 -> nogroup, bit 8 -> up.
// The values are the masked bits themselves (zero / non-zero), not 0 / 1.
1445 int if_val = gomp_flags & (1u << 10);
1446 int nogroup = gomp_flags & (1u << 11);
1447 int up = gomp_flags & (1u << 8);
1448 p_task_dup_t task_dup = NULL;
// The 32-bit `flags` word is viewed through a kmp_tasking_flags_t pointer so
// individual tasking flag fields can be set by name.
1449 kmp_tasking_flags_t *input_flags = (kmp_tasking_flags_t *)&flags;
1453 buff = __kmp_str_format(
1454 "GOMP_taskloop: T#%%d: func:%%p data:%%p copy_func:%%p " 1455 "arg_size:%%ld arg_align:%%ld gomp_flags:0x%%x num_tasks:%%lu " 1456 "priority:%%d start:%%%s end:%%%s step:%%%s\n",
1457 traits_t<T>::spec, traits_t<T>::spec, traits_t<T>::spec);
1458 KA_TRACE(20, (buff, gtid, func, data, copy_func, arg_size, arg_align,
1459 gomp_flags, num_tasks, priority, start, end, step));
1460 __kmp_str_free(&buff);
// The argument block must hold at least two T values because its first two
// T-sized slots are overwritten with the loop bounds further down.
1463 KMP_ASSERT((
size_t)arg_size >= 2 *
sizeof(T));
1464 KMP_ASSERT(arg_align > 0);
// gomp_flags bit 0 clear -> mark the task as tied.
1466 if (!(gomp_flags & 1)) {
1467 input_flags->tiedness = 1;
// gomp_flags bit 1 set -> mark the task as final.
1470 if (gomp_flags & 2) {
1471 input_flags->final = 1;
// Walks the bits of `step` from the most significant one downwards and ORs
// bits into it.
// NOTE(review): presumably a sign extension of `step` for downward loops that
// stops at the first set bit; the guarding condition and loop exit are not
// visible here -- confirm.
1479 for (
int i =
sizeof(T) * CHAR_BIT - 1; i >= 0L; --i) {
1481 if (step & ((T)1 << i))
1483 step |= ((T)1 << i);
1487 input_flags->native = 1;
1489 if (num_tasks > 0) {
1490 if (gomp_flags & (1u << 9))
1501 __kmp_task_alloc(&loc, gtid, input_flags,
sizeof(kmp_task_t),
1502 arg_size + arg_align - 1, (kmp_routine_entry_t)func);
1503 kmp_taskdata_t *taskdata = KMP_TASK_TO_TASKDATA(task);
1504 taskdata->td_copy_func = copy_func;
1505 taskdata->td_size_loop_bounds =
sizeof(T);
// Round task->shareds up to the next multiple of arg_align; the allocation
// above requested arg_align - 1 extra bytes to leave room for this.
1509 task->shareds = (
void *)((((
size_t)task->shareds) + arg_align - 1) /
1510 arg_align * arg_align);
1512 task_dup = __kmp_gomp_task_dup;
1514 KMP_MEMCPY(task->shareds, data, arg_size);
// Overwrite the first two T slots of the copied block with the bounds. `end`
// is adjusted by -1 when the `up` bit is set and by +1 otherwise.
1516 loop_bounds = (T *)task->shareds;
1517 loop_bounds[0] = start;
1518 loop_bounds[1] = end + (up ? -1 : 1);
1519 __kmpc_taskloop(&loc, gtid, task, if_val, (kmp_uint64 *)&(loop_bounds[0]),
1520 (kmp_uint64 *)&(loop_bounds[1]), (kmp_int64)step, nogroup,
1521 sched, (kmp_uint64)num_tasks, (
void *)task_dup);
// GOMP_taskloop entry point for `long` loop bounds: forwards every argument
// unchanged to __GOMP_taskloop<long>().
1526 #endif // __cplusplus 1528 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_TASKLOOP)(
1529 void (*func)(
void *),
void *data,
void (*copy_func)(
void *,
void *),
1530 long arg_size,
long arg_align,
unsigned gomp_flags,
unsigned long num_tasks,
1531 int priority,
long start,
long end,
long step) {
1532 __GOMP_taskloop<long>(func, data, copy_func, arg_size, arg_align, gomp_flags,
1533 num_tasks, priority, start, end, step);
// GOMP_taskloop_ull entry point for `unsigned long long` loop bounds:
// forwards every argument unchanged to __GOMP_taskloop<unsigned long long>().
1536 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_TASKLOOP_ULL)(
1537 void (*func)(
void *),
void *data,
void (*copy_func)(
void *,
void *),
1538 long arg_size,
long arg_align,
unsigned gomp_flags,
unsigned long num_tasks,
1539 int priority,
unsigned long long start,
unsigned long long end,
1540 unsigned long long step) {
1541 __GOMP_taskloop<unsigned long long>(func, data, copy_func, arg_size,
1542 arg_align, gomp_flags, num_tasks,
1543 priority, start, end, step);
// Versioned-symbol table, compiled only when KMP_USE_VERSION_SYMBOLS is
// defined. This first group lists the API names tagged with version number
// 10 and version string "GOMP_1.0".
// NOTE(review): KMP_VERSION_SYMBOL is defined outside this section;
// presumably it emits a symbol-version alias for each entry point -- confirm.
1553 #ifdef KMP_USE_VERSION_SYMBOLS 1555 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_ATOMIC_END, 10,
"GOMP_1.0");
1556 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_ATOMIC_START, 10,
"GOMP_1.0");
1557 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_BARRIER, 10,
"GOMP_1.0");
1558 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_CRITICAL_END, 10,
"GOMP_1.0");
1559 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_CRITICAL_NAME_END, 10,
"GOMP_1.0");
1560 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_CRITICAL_NAME_START, 10,
"GOMP_1.0");
1561 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_CRITICAL_START, 10,
"GOMP_1.0");
1562 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_DYNAMIC_NEXT, 10,
"GOMP_1.0");
1563 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_DYNAMIC_START, 10,
"GOMP_1.0");
1564 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_END, 10,
"GOMP_1.0");
1565 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_END_NOWAIT, 10,
"GOMP_1.0");
1566 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_GUIDED_NEXT, 10,
"GOMP_1.0");
1567 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_GUIDED_START, 10,
"GOMP_1.0");
1568 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_ORDERED_DYNAMIC_NEXT, 10,
"GOMP_1.0");
1569 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_ORDERED_DYNAMIC_START, 10,
1571 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_ORDERED_GUIDED_NEXT, 10,
"GOMP_1.0");
1572 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_ORDERED_GUIDED_START, 10,
"GOMP_1.0");
1573 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_ORDERED_RUNTIME_NEXT, 10,
"GOMP_1.0");
1574 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_ORDERED_RUNTIME_START, 10,
1576 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_ORDERED_STATIC_NEXT, 10,
"GOMP_1.0");
1577 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_ORDERED_STATIC_START, 10,
"GOMP_1.0");
1578 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_RUNTIME_NEXT, 10,
"GOMP_1.0");
1579 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_RUNTIME_START, 10,
"GOMP_1.0");
1580 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_STATIC_NEXT, 10,
"GOMP_1.0");
1581 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_STATIC_START, 10,
"GOMP_1.0");
1582 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_ORDERED_END, 10,
"GOMP_1.0");
1583 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_ORDERED_START, 10,
"GOMP_1.0");
1584 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_PARALLEL_END, 10,
"GOMP_1.0");
1585 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_PARALLEL_LOOP_DYNAMIC_START, 10,
1587 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_PARALLEL_LOOP_GUIDED_START, 10,
1589 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_PARALLEL_LOOP_RUNTIME_START, 10,
1591 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_PARALLEL_LOOP_STATIC_START, 10,
1593 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_PARALLEL_SECTIONS_START, 10,
"GOMP_1.0");
1594 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_PARALLEL_START, 10,
"GOMP_1.0");
1595 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_SECTIONS_END, 10,
"GOMP_1.0");
1596 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_SECTIONS_END_NOWAIT, 10,
"GOMP_1.0");
1597 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_SECTIONS_NEXT, 10,
"GOMP_1.0");
1598 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_SECTIONS_START, 10,
"GOMP_1.0");
1599 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_SINGLE_COPY_END, 10,
"GOMP_1.0");
1600 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_SINGLE_COPY_START, 10,
"GOMP_1.0");
1601 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_SINGLE_START, 10,
"GOMP_1.0");
// API names tagged with version number 20 and version string "GOMP_2.0":
// the task / taskwait entry points and the unsigned-long-long loop family.
1604 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_TASK, 20,
"GOMP_2.0");
1605 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_TASKWAIT, 20,
"GOMP_2.0");
1606 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_ULL_DYNAMIC_NEXT, 20,
"GOMP_2.0");
1607 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_ULL_DYNAMIC_START, 20,
"GOMP_2.0");
1608 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_ULL_GUIDED_NEXT, 20,
"GOMP_2.0");
1609 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_ULL_GUIDED_START, 20,
"GOMP_2.0");
1610 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_DYNAMIC_NEXT, 20,
1612 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_DYNAMIC_START, 20,
1614 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_GUIDED_NEXT, 20,
1616 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_GUIDED_START, 20,
1618 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_RUNTIME_NEXT, 20,
1620 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_RUNTIME_START, 20,
1622 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_STATIC_NEXT, 20,
1624 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_ULL_ORDERED_STATIC_START, 20,
1626 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_ULL_RUNTIME_NEXT, 20,
"GOMP_2.0");
1627 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_ULL_RUNTIME_START, 20,
"GOMP_2.0");
1628 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_ULL_STATIC_NEXT, 20,
"GOMP_2.0");
1629 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_ULL_STATIC_START, 20,
"GOMP_2.0");
// API name tagged with version number 30 and version string "GOMP_3.0".
1632 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_TASKYIELD, 30,
"GOMP_3.0");
// API names tagged with version number 40 and version string "GOMP_4.0":
// combined parallel constructs, taskgroup, cancellation, target and teams
// entry points.
1636 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_PARALLEL, 40,
"GOMP_4.0");
1637 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_PARALLEL_SECTIONS, 40,
"GOMP_4.0");
1638 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_PARALLEL_LOOP_DYNAMIC, 40,
"GOMP_4.0");
1639 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_PARALLEL_LOOP_GUIDED, 40,
"GOMP_4.0");
1640 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_PARALLEL_LOOP_RUNTIME, 40,
"GOMP_4.0");
1641 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_PARALLEL_LOOP_STATIC, 40,
"GOMP_4.0");
1642 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_TASKGROUP_START, 40,
"GOMP_4.0");
1643 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_TASKGROUP_END, 40,
"GOMP_4.0");
1644 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_BARRIER_CANCEL, 40,
"GOMP_4.0");
1645 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_CANCEL, 40,
"GOMP_4.0");
1646 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_CANCELLATION_POINT, 40,
"GOMP_4.0");
1647 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_LOOP_END_CANCEL, 40,
"GOMP_4.0");
1648 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_SECTIONS_END_CANCEL, 40,
"GOMP_4.0");
1649 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_TARGET, 40,
"GOMP_4.0");
1650 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_TARGET_DATA, 40,
"GOMP_4.0");
1651 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_TARGET_END_DATA, 40,
"GOMP_4.0");
1652 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_TARGET_UPDATE, 40,
"GOMP_4.0");
1653 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_TEAMS, 40,
"GOMP_4.0");
// API names tagged with version number 45 and version string "GOMP_4.5":
// the two taskloop entry points. The last line closes the
// KMP_USE_VERSION_SYMBOLS conditional.
1657 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_TASKLOOP, 45,
"GOMP_4.5");
1658 KMP_VERSION_SYMBOL(KMP_API_NAME_GOMP_TASKLOOP_ULL, 45,
"GOMP_4.5");
1661 #endif // KMP_USE_VERSION_SYMBOLS 1665 #endif // __cplusplus
// Prototypes of __kmpc_* runtime entry points. Every one takes an ident_t
// pointer; all except __kmpc_ok_to_fork also take a global thread id, and the
// critical pair additionally takes a kmp_critical_name pointer.
// NOTE(review): these declarations carry no terminating semicolons as they
// appear here -- confirm against the header that declares them.
KMP_EXPORT void __kmpc_end_ordered(ident_t *, kmp_int32 global_tid)
KMP_EXPORT void __kmpc_end_serialized_parallel(ident_t *, kmp_int32 global_tid)
KMP_EXPORT kmp_int32 __kmpc_omp_task_with_deps(ident_t *loc_ref, kmp_int32 gtid, kmp_task_t *new_task, kmp_int32 ndeps, kmp_depend_info_t *dep_list, kmp_int32 ndeps_noalias, kmp_depend_info_t *noalias_dep_list)
KMP_EXPORT void __kmpc_ordered(ident_t *, kmp_int32 global_tid)
KMP_EXPORT void __kmpc_critical(ident_t *, kmp_int32 global_tid, kmp_critical_name *)
KMP_EXPORT kmp_int32 __kmpc_ok_to_fork(ident_t *)
KMP_EXPORT void __kmpc_barrier(ident_t *, kmp_int32 global_tid)
KMP_EXPORT void __kmpc_end_critical(ident_t *, kmp_int32 global_tid, kmp_critical_name *)