15 #include "kmp_atomic.h" 18 #include "ompt-specific.h" 25 #define MKLOC(loc, routine) \ 26 static ident_t(loc) = {0, KMP_IDENT_KMPC, 0, 0, ";unknown;unknown;0;0;;"}; 28 #include "kmp_ftn_os.h" 30 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_BARRIER)(void) {
31 int gtid = __kmp_entry_gtid();
32 MKLOC(loc,
"GOMP_barrier");
33 KA_TRACE(20, (
"GOMP_barrier: T#%d\n", gtid));
34 #if OMPT_SUPPORT && OMPT_OPTIONAL 35 omp_frame_t *ompt_frame;
36 if (ompt_enabled.enabled) {
37 __ompt_get_task_info_internal(0, NULL, NULL, &ompt_frame, NULL, NULL);
38 ompt_frame->enter_frame = OMPT_GET_FRAME_ADDRESS(1);
39 OMPT_STORE_RETURN_ADDRESS(gtid);
43 #if OMPT_SUPPORT && OMPT_OPTIONAL 44 if (ompt_enabled.enabled) {
45 ompt_frame->enter_frame = NULL;
59 extern kmp_critical_name *__kmp_unnamed_critical_addr;
61 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_CRITICAL_START)(void) {
62 int gtid = __kmp_entry_gtid();
63 MKLOC(loc,
"GOMP_critical_start");
64 KA_TRACE(20, (
"GOMP_critical_start: T#%d\n", gtid));
65 #if OMPT_SUPPORT && OMPT_OPTIONAL 66 OMPT_STORE_RETURN_ADDRESS(gtid);
71 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_CRITICAL_END)(void) {
72 int gtid = __kmp_get_gtid();
73 MKLOC(loc,
"GOMP_critical_end");
74 KA_TRACE(20, (
"GOMP_critical_end: T#%d\n", gtid));
75 #if OMPT_SUPPORT && OMPT_OPTIONAL 76 OMPT_STORE_RETURN_ADDRESS(gtid);
81 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_CRITICAL_NAME_START)(
void **pptr) {
82 int gtid = __kmp_entry_gtid();
83 MKLOC(loc,
"GOMP_critical_name_start");
84 KA_TRACE(20, (
"GOMP_critical_name_start: T#%d\n", gtid));
88 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_CRITICAL_NAME_END)(
void **pptr) {
89 int gtid = __kmp_get_gtid();
90 MKLOC(loc,
"GOMP_critical_name_end");
91 KA_TRACE(20, (
"GOMP_critical_name_end: T#%d\n", gtid));
98 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_ATOMIC_START)(void) {
99 int gtid = __kmp_entry_gtid();
100 KA_TRACE(20, (
"GOMP_atomic_start: T#%d\n", gtid));
103 __ompt_thread_assign_wait_id(0);
106 __kmp_acquire_atomic_lock(&__kmp_atomic_lock, gtid);
109 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_ATOMIC_END)(void) {
110 int gtid = __kmp_get_gtid();
111 KA_TRACE(20, (
"GOMP_atomic_end: T#%d\n", gtid));
112 __kmp_release_atomic_lock(&__kmp_atomic_lock, gtid);
115 int KMP_EXPAND_NAME(KMP_API_NAME_GOMP_SINGLE_START)(void) {
116 int gtid = __kmp_entry_gtid();
117 MKLOC(loc,
"GOMP_single_start");
118 KA_TRACE(20, (
"GOMP_single_start: T#%d\n", gtid));
120 if (!TCR_4(__kmp_init_parallel))
121 __kmp_parallel_initialize();
126 kmp_int32 rc = __kmp_enter_single(gtid, &loc, FALSE);
128 #if OMPT_SUPPORT && OMPT_OPTIONAL 129 kmp_info_t *this_thr = __kmp_threads[gtid];
130 kmp_team_t *team = this_thr->th.th_team;
131 int tid = __kmp_tid_from_gtid(gtid);
133 if (ompt_enabled.enabled) {
135 if (ompt_enabled.ompt_callback_work) {
136 ompt_callbacks.ompt_callback(ompt_callback_work)(
137 ompt_work_single_executor, ompt_scope_begin,
138 &(team->t.ompt_team_info.parallel_data),
139 &(team->t.t_implicit_task_taskdata[tid].ompt_task_info.task_data),
140 1, OMPT_GET_RETURN_ADDRESS(0));
143 if (ompt_enabled.ompt_callback_work) {
144 ompt_callbacks.ompt_callback(ompt_callback_work)(
145 ompt_work_single_other, ompt_scope_begin,
146 &(team->t.ompt_team_info.parallel_data),
147 &(team->t.t_implicit_task_taskdata[tid].ompt_task_info.task_data),
148 1, OMPT_GET_RETURN_ADDRESS(0));
149 ompt_callbacks.ompt_callback(ompt_callback_work)(
150 ompt_work_single_other, ompt_scope_end,
151 &(team->t.ompt_team_info.parallel_data),
152 &(team->t.t_implicit_task_taskdata[tid].ompt_task_info.task_data),
153 1, OMPT_GET_RETURN_ADDRESS(0));
162 void *KMP_EXPAND_NAME(KMP_API_NAME_GOMP_SINGLE_COPY_START)(void) {
164 int gtid = __kmp_entry_gtid();
165 MKLOC(loc,
"GOMP_single_copy_start");
166 KA_TRACE(20, (
"GOMP_single_copy_start: T#%d\n", gtid));
168 if (!TCR_4(__kmp_init_parallel))
169 __kmp_parallel_initialize();
174 if (__kmp_enter_single(gtid, &loc, FALSE))
180 #if OMPT_SUPPORT && OMPT_OPTIONAL 181 omp_frame_t *ompt_frame;
182 if (ompt_enabled.enabled) {
183 __ompt_get_task_info_internal(0, NULL, NULL, &ompt_frame, NULL, NULL);
184 ompt_frame->enter_frame = OMPT_GET_FRAME_ADDRESS(1);
185 OMPT_STORE_RETURN_ADDRESS(gtid);
188 __kmp_barrier(bs_plain_barrier, gtid, FALSE, 0, NULL, NULL);
192 retval = __kmp_team_from_gtid(gtid)->t.t_copypriv_data;
193 #if OMPT_SUPPORT && OMPT_OPTIONAL 194 if (ompt_enabled.enabled) {
195 OMPT_STORE_RETURN_ADDRESS(gtid);
198 __kmp_barrier(bs_plain_barrier, gtid, FALSE, 0, NULL, NULL);
199 #if OMPT_SUPPORT && OMPT_OPTIONAL 200 if (ompt_enabled.enabled) {
201 ompt_frame->enter_frame = NULL;
207 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_SINGLE_COPY_END)(
void *data) {
208 int gtid = __kmp_get_gtid();
209 KA_TRACE(20, (
"GOMP_single_copy_end: T#%d\n", gtid));
215 __kmp_team_from_gtid(gtid)->t.t_copypriv_data = data;
216 #if OMPT_SUPPORT && OMPT_OPTIONAL 217 omp_frame_t *ompt_frame;
218 if (ompt_enabled.enabled) {
219 __ompt_get_task_info_internal(0, NULL, NULL, &ompt_frame, NULL, NULL);
220 ompt_frame->enter_frame = OMPT_GET_FRAME_ADDRESS(1);
221 OMPT_STORE_RETURN_ADDRESS(gtid);
224 __kmp_barrier(bs_plain_barrier, gtid, FALSE, 0, NULL, NULL);
225 #if OMPT_SUPPORT && OMPT_OPTIONAL 226 if (ompt_enabled.enabled) {
227 OMPT_STORE_RETURN_ADDRESS(gtid);
230 __kmp_barrier(bs_plain_barrier, gtid, FALSE, 0, NULL, NULL);
231 #if OMPT_SUPPORT && OMPT_OPTIONAL 232 if (ompt_enabled.enabled) {
233 ompt_frame->enter_frame = NULL;
238 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_ORDERED_START)(void) {
239 int gtid = __kmp_entry_gtid();
240 MKLOC(loc,
"GOMP_ordered_start");
241 KA_TRACE(20, (
"GOMP_ordered_start: T#%d\n", gtid));
242 #if OMPT_SUPPORT && OMPT_OPTIONAL 243 OMPT_STORE_RETURN_ADDRESS(gtid);
248 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_ORDERED_END)(void) {
249 int gtid = __kmp_get_gtid();
250 MKLOC(loc,
"GOMP_ordered_end");
251 KA_TRACE(20, (
"GOMP_ordered_start: T#%d\n", gtid));
252 #if OMPT_SUPPORT && OMPT_OPTIONAL 253 OMPT_STORE_RETURN_ADDRESS(gtid);
263 #if KMP_ARCH_X86 || KMP_ARCH_ARM || KMP_ARCH_MIPS 264 #define KMP_DISPATCH_INIT __kmp_aux_dispatch_init_4 265 #define KMP_DISPATCH_FINI_CHUNK __kmp_aux_dispatch_fini_chunk_4 266 #define KMP_DISPATCH_NEXT __kmpc_dispatch_next_4 268 #define KMP_DISPATCH_INIT __kmp_aux_dispatch_init_8 269 #define KMP_DISPATCH_FINI_CHUNK __kmp_aux_dispatch_fini_chunk_8 270 #define KMP_DISPATCH_NEXT __kmpc_dispatch_next_8 273 #define KMP_DISPATCH_INIT_ULL __kmp_aux_dispatch_init_8u 274 #define KMP_DISPATCH_FINI_CHUNK_ULL __kmp_aux_dispatch_fini_chunk_8u 275 #define KMP_DISPATCH_NEXT_ULL __kmpc_dispatch_next_8u 283 __kmp_GOMP_microtask_wrapper(
int *gtid,
int *npr,
void (*task)(
void *),
287 omp_frame_t *ompt_frame;
288 omp_state_t enclosing_state;
290 if (ompt_enabled.enabled) {
292 thr = __kmp_threads[*gtid];
295 enclosing_state = thr->th.ompt_thread_info.state;
296 thr->th.ompt_thread_info.state = omp_state_work_parallel;
299 __ompt_get_task_info_internal(0, NULL, NULL, &ompt_frame, NULL, NULL);
300 ompt_frame->exit_frame = OMPT_GET_FRAME_ADDRESS(0);
307 if (ompt_enabled.enabled) {
309 ompt_frame->exit_frame = NULL;
312 thr->th.ompt_thread_info.state = enclosing_state;
321 __kmp_GOMP_parallel_microtask_wrapper(
int *gtid,
int *npr,
322 void (*task)(
void *),
void *data,
323 unsigned num_threads,
ident_t *loc,
329 KMP_DISPATCH_INIT(loc, *gtid, schedule, start, end, incr, chunk_size,
334 omp_frame_t *ompt_frame;
335 omp_state_t enclosing_state;
337 if (ompt_enabled.enabled) {
338 thr = __kmp_threads[*gtid];
340 enclosing_state = thr->th.ompt_thread_info.state;
341 thr->th.ompt_thread_info.state = omp_state_work_parallel;
344 __ompt_get_task_info_internal(0, NULL, NULL, &ompt_frame, NULL, NULL);
345 ompt_frame->exit_frame = OMPT_GET_FRAME_ADDRESS(0);
353 if (ompt_enabled.enabled) {
355 ompt_frame->exit_frame = NULL;
358 thr->th.ompt_thread_info.state = enclosing_state;
367 __kmp_GOMP_fork_call(
ident_t *loc,
int gtid,
void (*unwrapped_task)(
void *),
368 microtask_t wrapper,
int argc, ...) {
370 kmp_info_t *thr = __kmp_threads[gtid];
371 kmp_team_t *team = thr->th.th_team;
372 int tid = __kmp_tid_from_gtid(gtid);
377 rc = __kmp_fork_call(loc, gtid, fork_context_gnu, argc, wrapper,
378 __kmp_invoke_task_func,
379 #
if (KMP_ARCH_X86_64 || KMP_ARCH_ARM || KMP_ARCH_AARCH64) && KMP_OS_LINUX
389 __kmp_run_before_invoked_task(gtid, tid, thr, team);
394 if (ompt_enabled.enabled) {
395 ompt_team_info_t *team_info = __ompt_get_teaminfo(0, NULL);
396 ompt_task_info_t *task_info = __ompt_get_task_info_object(0);
399 if (ompt_enabled.ompt_callback_implicit_task) {
400 ompt_team_size = __kmp_team_from_gtid(gtid)->t.t_nproc;
401 ompt_callbacks.ompt_callback(ompt_callback_implicit_task)(
402 ompt_scope_begin, &(team_info->parallel_data),
403 &(task_info->task_data), ompt_team_size, __kmp_tid_from_gtid(gtid));
404 task_info->thread_num = __kmp_tid_from_gtid(gtid);
406 thr->th.ompt_thread_info.state = omp_state_work_parallel;
411 static void __kmp_GOMP_serialized_parallel(
ident_t *loc, kmp_int32 gtid,
412 void (*task)(
void *)) {
414 OMPT_STORE_RETURN_ADDRESS(gtid);
416 __kmp_serialized_parallel(loc, gtid);
419 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_PARALLEL_START)(void (*task)(
void *),
421 unsigned num_threads) {
422 int gtid = __kmp_entry_gtid();
425 omp_frame_t *parent_frame, *frame;
427 if (ompt_enabled.enabled) {
428 __ompt_get_task_info_internal(0, NULL, NULL, &parent_frame, NULL, NULL);
429 parent_frame->enter_frame = OMPT_GET_FRAME_ADDRESS(1);
430 OMPT_STORE_RETURN_ADDRESS(gtid);
434 MKLOC(loc,
"GOMP_parallel_start");
435 KA_TRACE(20, (
"GOMP_parallel_start: T#%d\n", gtid));
438 if (num_threads != 0) {
439 __kmp_push_num_threads(&loc, gtid, num_threads);
441 __kmp_GOMP_fork_call(&loc, gtid, task,
442 (microtask_t)__kmp_GOMP_microtask_wrapper, 2, task,
445 __kmp_GOMP_serialized_parallel(&loc, gtid, task);
449 if (ompt_enabled.enabled) {
450 __ompt_get_task_info_internal(0, NULL, NULL, &frame, NULL, NULL);
451 frame->exit_frame = OMPT_GET_FRAME_ADDRESS(1);
456 void KMP_EXPAND_NAME(KMP_API_NAME_GOMP_PARALLEL_END)(void) {
457 int gtid = __kmp_get_gtid();
459 int ompt_team_size = __kmp_team_from_gtid(gtid)->t.t_nproc;
461 thr = __kmp_threads[gtid];
463 MKLOC(loc,
"GOMP_parallel_end");
464 KA_TRACE(20, (
"GOMP_parallel_end: T#%d\n", gtid));
466 if (!thr->th.th_team->t.t_serialized) {
467 __kmp_run_after_invoked_task(gtid, __kmp_tid_from_gtid(gtid), thr,
471 if (ompt_enabled.enabled) {
475 OMPT_CUR_TASK_INFO(thr)->frame.exit_frame = NULL;
479 __kmp_join_call(&loc, gtid
515 #define IF_OMPT_SUPPORT(code) code 517 #define IF_OMPT_SUPPORT(code) 520 #define LOOP_START(func, schedule) \ 521 int func(long lb, long ub, long str, long chunk_sz, long *p_lb, \ 525 int gtid = __kmp_entry_gtid(); \ 526 MKLOC(loc, KMP_STR(func)); \ 530 func) ": T#%d, lb 0x%lx, ub 0x%lx, str 0x%lx, chunk_sz 0x%lx\n", \ 531 gtid, lb, ub, str, chunk_sz)); \ 533 if ((str > 0) ? (lb < ub) : (lb > ub)) { \ 534 IF_OMPT_SUPPORT(OMPT_STORE_RETURN_ADDRESS(gtid);) \ 535 KMP_DISPATCH_INIT(&loc, gtid, (schedule), lb, \ 536 (str > 0) ? (ub - 1) : (ub + 1), str, chunk_sz, \ 537 (schedule) != kmp_sch_static); \ 538 IF_OMPT_SUPPORT(OMPT_STORE_RETURN_ADDRESS(gtid);) \ 539 status = KMP_DISPATCH_NEXT(&loc, gtid, NULL, (kmp_int *)p_lb, \ 540 (kmp_int *)p_ub, (kmp_int *)&stride); \ 542 KMP_DEBUG_ASSERT(stride == str); \ 543 *p_ub += (str > 0) ? 1 : -1; \ 552 func) " exit: T#%d, *p_lb 0x%lx, *p_ub 0x%lx, returning %d\n", \ 553 gtid, *p_lb, *p_ub, status)); \ 557 #define LOOP_RUNTIME_START(func, schedule) \ 558 int func(long lb, long ub, long str, long *p_lb, long *p_ub) { \ 562 int gtid = __kmp_entry_gtid(); \ 563 MKLOC(loc, KMP_STR(func)); \ 566 (KMP_STR(func) ": T#%d, lb 0x%lx, ub 0x%lx, str 0x%lx, chunk_sz %d\n", \ 567 gtid, lb, ub, str, chunk_sz)); \ 569 if ((str > 0) ? (lb < ub) : (lb > ub)) { \ 570 IF_OMPT_SUPPORT(OMPT_STORE_RETURN_ADDRESS(gtid);) \ 571 KMP_DISPATCH_INIT(&loc, gtid, (schedule), lb, \ 572 (str > 0) ? (ub - 1) : (ub + 1), str, chunk_sz, TRUE); \ 573 IF_OMPT_SUPPORT(OMPT_STORE_RETURN_ADDRESS(gtid);) \ 574 status = KMP_DISPATCH_NEXT(&loc, gtid, NULL, (kmp_int *)p_lb, \ 575 (kmp_int *)p_ub, (kmp_int *)&stride); \ 577 KMP_DEBUG_ASSERT(stride == str); \ 578 *p_ub += (str > 0) ? 1 : -1; \ 587 func) " exit: T#%d, *p_lb 0x%lx, *p_ub 0x%lx, returning %d\n", \ 588 gtid, *p_lb, *p_ub, status)); \ 593 #define KMP_DOACROSS_FINI(status, gtid) \ 594 if (!status && __kmp_threads[gtid]->th.th_dispatch->th_doacross_flags) { \ 595 __kmpc_doacross_fini(NULL, gtid); \ 598 #define KMP_DOACROSS_FINI(status, gtid) 601 #define LOOP_NEXT(func, fini_code) \ 602 int func(long *p_lb, long *p_ub) { \ 605 int gtid = __kmp_get_gtid(); \ 606 MKLOC(loc, KMP_STR(func)); \ 607 KA_TRACE(20, (KMP_STR(func) ": T#%d\n", gtid)); \ 609 IF_OMPT_SUPPORT(OMPT_STORE_RETURN_ADDRESS(gtid);) \ 610 fini_code status = KMP_DISPATCH_NEXT(&loc, gtid, NULL, (kmp_int *)p_lb, \ 611 (kmp_int *)p_ub, (kmp_int *)&stride); \ 613 *p_ub += (stride > 0) ? 1 : -1; \ 615 KMP_DOACROSS_FINI(status, gtid) \ 619 (KMP_STR(func) " exit: T#%d, *p_lb 0x%lx, *p_ub 0x%lx, stride 0x%lx, " \ 621 gtid, *p_lb, *p_ub, stride, status)); \ 625 LOOP_START(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_STATIC_START),
kmp_sch_static)
626 LOOP_NEXT(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_STATIC_NEXT), {})
627 LOOP_START(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_DYNAMIC_START),
628 kmp_sch_dynamic_chunked)
629 LOOP_NEXT(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_DYNAMIC_NEXT), {})
630 LOOP_START(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_GUIDED_START),
632 LOOP_NEXT(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_GUIDED_NEXT), {})
633 LOOP_RUNTIME_START(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_RUNTIME_START),
635 LOOP_NEXT(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_RUNTIME_NEXT), {})
637 LOOP_START(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ORDERED_STATIC_START),
639 LOOP_NEXT(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ORDERED_STATIC_NEXT),
640 { KMP_DISPATCH_FINI_CHUNK(&loc, gtid); })
641 LOOP_START(KMP_EXPAND_NAME(KMP_API_NAME_GOMP_LOOP_ORDERED_DYNAMIC_START),