14 #include "kmp_affinity.h"
19 #include "kmp_stats.h"
21 #include "kmp_wait_release.h"
22 #include "kmp_wrapper_getpid.h"
24 #if !KMP_OS_DRAGONFLY && !KMP_OS_FREEBSD && !KMP_OS_NETBSD && !KMP_OS_OPENBSD
29 #include <semaphore.h>
31 #include <sys/resource.h>
34 #include <libperfstat.h>
36 #include <sys/syscall.h>
39 #include <sys/times.h>
43 #include <sys/sysinfo.h>
58 #include <mach/mach.h>
59 #include <sys/sysctl.h>
60 #elif KMP_OS_DRAGONFLY || KMP_OS_FREEBSD
61 #include <sys/types.h>
62 #include <sys/sysctl.h>
64 #include <pthread_np.h>
68 #elif KMP_OS_NETBSD || KMP_OS_OPENBSD
69 #include <sys/types.h>
70 #include <sys/sysctl.h>
75 #include <pthread_np.h>
81 #include <sys/loadavg.h>
// State for the system timer; the only member visible here is the `start`
// timestamp. The single instance is __kmp_sys_timer_data.
88 struct kmp_sys_timer {
89 struct timespec start;
// Fallback definition, used only when the platform headers have not already
// defined TIMEVAL_TO_TIMESPEC. Copies the seconds field unchanged and converts
// the microsecond field to nanoseconds (tv_usec * 1000).
92 #ifndef TIMEVAL_TO_TIMESPEC
94 #define TIMEVAL_TO_TIMESPEC(tv, ts) \
96 (ts)->tv_sec = (tv)->tv_sec; \
97 (ts)->tv_nsec = (tv)->tv_usec * 1000; \
// Flattens a timespec into a single nanosecond count:
// tv_sec * 1e9 + tv_nsec. The multiplier is cast to `long int`.
// NOTE(review): where `long int` is 32 bits the product may overflow -- confirm
// the supported targets.
102 #define TS2NS(timespec) \
103 (((timespec).tv_sec * (long int)1e9) + (timespec).tv_nsec)
// The one instance of the system timer state.
105 static struct kmp_sys_timer __kmp_sys_timer_data;
107 #if KMP_HANDLE_SIGNALS
// Signature of a plain signal handler.
108 typedef void (*sig_func_t)(int);
// Per-signal saved sigaction records; __kmp_install_one_handler stores the
// pre-existing disposition here and __kmp_remove_one_handler restores from it.
109 STATIC_EFI2_WORKAROUND
struct sigaction __kmp_sighldrs[NSIG];
// Set of signals for which the runtime's handler was left installed.
110 static sigset_t __kmp_sigset;
// Reset to FALSE in the fork child (see __kmp_atfork_child).
113 static int __kmp_init_runtime = FALSE;
// Compared against each thread's th_suspend_init_count to decide whether its
// suspend mutex/condvar are initialized (see __kmp_suspend_initialize_thread).
115 static int __kmp_fork_count = 0;
// Attributes used when creating per-thread suspend condvars and mutexes.
117 static pthread_condattr_t __kmp_suspend_cond_attr;
118 static pthread_mutexattr_t __kmp_suspend_mutex_attr;
// Condvar/mutex pair the monitor thread sleeps on between wakeups.
120 static kmp_cond_align_t __kmp_wait_cv;
121 static kmp_mutex_align_t __kmp_wait_mx;
// Tick conversion factors, initialized to 1000000 per msec and 1000 per usec.
123 kmp_uint64 __kmp_ticks_per_msec = 1000000;
124 kmp_uint64 __kmp_ticks_per_usec = 1000;
// Debug helper: formats a description of `cond` into `buffer`, printing the
// condvar's internal lock status, spinlock and waiting-list fields.
// The write is bounded to 128 bytes, so `buffer` is assumed to be at least
// that large -- confirm against callers.
// NOTE(review): reads pthread implementation-private members
// (__c_lock, __c_waiting), so it only builds against a matching libc layout.
127 static void __kmp_print_cond(
char *buffer, kmp_cond_align_t *cond) {
128 KMP_SNPRINTF(buffer, 128,
"(cond (lock (%ld, %d)), (descr (%p)))",
129 cond->c_cond.__c_lock.__status, cond->c_cond.__c_lock.__spinlock,
130 cond->c_cond.__c_waiting);
134 #if ((KMP_OS_LINUX || KMP_OS_FREEBSD || KMP_OS_NETBSD || KMP_OS_DRAGONFLY || \
136 KMP_AFFINITY_SUPPORTED)
// Applies an affinity mask containing OS processor `which` by calling
// __kmp_set_system_affinity(mask, TRUE).
// Asserts first that affinity is usable (KMP_AFFINITY_CAPABLE). The mask is
// allocated on the stack and released before returning.
140 void __kmp_affinity_bind_thread(
int which) {
141 KMP_ASSERT2(KMP_AFFINITY_CAPABLE(),
142 "Illegal set affinity operation when not capable");
144 kmp_affin_mask_t *mask;
145 KMP_CPU_ALLOC_ON_STACK(mask);
147 KMP_CPU_SET(which, mask);
148 __kmp_set_system_affinity(mask, TRUE);
149 KMP_CPU_FREE_FROM_STACK(mask);
// Variant whose trace message names the AIX bindprocessor interface.
// Derives the affinity mask size in bytes from the processor count
// (__kmp_xproc / CHAR_BIT), pads it up to a multiple of
// sizeof(__kmp_affin_mask_size), and enables affinity with that size.
// `env_var` is not referenced in the lines visible here.
153 void __kmp_affinity_determine_capable(
const char *env_var) {
156 size_t mask_size = __kmp_xproc / CHAR_BIT;
158 if (__kmp_xproc % CHAR_BIT)
// Pad up to the next multiple of sizeof(__kmp_affin_mask_size).
162 if (mask_size %
sizeof(__kmp_affin_mask_size))
163 mask_size +=
sizeof(__kmp_affin_mask_size) -
164 mask_size %
sizeof(__kmp_affin_mask_size);
165 KMP_AFFINITY_ENABLE(mask_size);
167 (
"__kmp_affinity_determine_capable: "
168 "AIX OS affinity interface bindprocessor functional (mask size = "
169 "%" KMP_SIZE_T_SPEC
").\n",
170 __kmp_affin_mask_size));
// Probes whether the OS affinity calls work and which mask size they accept,
// then enables affinity with that size or disables it.
// `env_var` is the name of the controlling environment variable; it is only
// used in the warning messages.
// Warnings are emitted only when verbose is set, or when warnings are on and
// the affinity type is not none/default/disabled.
178 void __kmp_affinity_determine_capable(
const char *env_var) {
// Upper bound (in bytes) for the probe buffer, chosen per OS.
182 #define KMP_CPU_SET_SIZE_LIMIT (1024 * 1024)
183 #define KMP_CPU_SET_TRY_SIZE CACHE_LINE
184 #elif KMP_OS_FREEBSD || KMP_OS_DRAGONFLY
185 #define KMP_CPU_SET_SIZE_LIMIT (sizeof(cpuset_t))
187 #define KMP_CPU_SET_SIZE_LIMIT (256)
190 int verbose = __kmp_affinity.flags.verbose;
191 int warnings = __kmp_affinity.flags.warnings;
192 enum affinity_type type = __kmp_affinity.type;
197 buf = (
unsigned char *)KMP_INTERNAL_MALLOC(KMP_CPU_SET_SIZE_LIMIT);
// First attempt: raw sched_getaffinity syscall with KMP_CPU_SET_TRY_SIZE.
201 gCode = syscall(__NR_sched_getaffinity, 0, KMP_CPU_SET_TRY_SIZE, buf);
202 KA_TRACE(30, (
"__kmp_affinity_determine_capable: "
203 "initial getaffinity call returned %ld errno = %d\n",
// Any failure other than EINVAL: warn if requested, disable affinity, and
// release the buffer.
206 if (gCode < 0 && errno != EINVAL) {
209 (warnings && (type != affinity_none) && (type != affinity_default) &&
210 (type != affinity_disabled))) {
212 kmp_msg_t err_code = KMP_ERR(error);
213 __kmp_msg(kmp_ms_warning, KMP_MSG(GetAffSysCallNotSupported, env_var),
214 err_code, __kmp_msg_null);
215 if (__kmp_generate_warnings == kmp_warnings_off) {
216 __kmp_str_free(&err_code.str);
219 KMP_AFFINITY_DISABLE();
220 KMP_INTERNAL_FREE(buf);
222 }
else if (gCode > 0) {
// A positive return value is used directly as the mask size.
224 KMP_AFFINITY_ENABLE(gCode);
225 KA_TRACE(10, (
"__kmp_affinity_determine_capable: "
226 "affinity supported (mask size %d)\n",
227 (
int)__kmp_affin_mask_size));
228 KMP_INTERNAL_FREE(buf);
// Otherwise search: retry with sizes 1, 2, 4, ... up to the limit.
234 KA_TRACE(30, (
"__kmp_affinity_determine_capable: "
235 "searching for proper set size\n"));
237 for (size = 1; size <= KMP_CPU_SET_SIZE_LIMIT; size *= 2) {
238 gCode = syscall(__NR_sched_getaffinity, 0, size, buf);
239 KA_TRACE(30, (
"__kmp_affinity_determine_capable: "
240 "getaffinity for mask size %ld returned %ld errno = %d\n",
241 size, gCode, errno));
// ENOSYS during the search is treated as inconsistent OS behaviour:
// warn if requested, disable affinity, and release the buffer.
244 if (errno == ENOSYS) {
246 KA_TRACE(30, (
"__kmp_affinity_determine_capable: "
247 "inconsistent OS call behavior: errno == ENOSYS for mask "
251 (warnings && (type != affinity_none) &&
252 (type != affinity_default) && (type != affinity_disabled))) {
254 kmp_msg_t err_code = KMP_ERR(error);
255 __kmp_msg(kmp_ms_warning, KMP_MSG(GetAffSysCallNotSupported, env_var),
256 err_code, __kmp_msg_null);
257 if (__kmp_generate_warnings == kmp_warnings_off) {
258 __kmp_str_free(&err_code.str);
261 KMP_AFFINITY_DISABLE();
262 KMP_INTERNAL_FREE(buf);
268 KMP_AFFINITY_ENABLE(gCode);
269 KA_TRACE(10, (
"__kmp_affinity_determine_capable: "
270 "affinity supported (mask size %d)\n",
271 (
int)__kmp_affin_mask_size));
272 KMP_INTERNAL_FREE(buf);
// BSD path: one pthread_getaffinity_np call with the fixed size limit.
275 #elif KMP_OS_FREEBSD || KMP_OS_NETBSD || KMP_OS_DRAGONFLY
278 buf = (
unsigned char *)KMP_INTERNAL_MALLOC(KMP_CPU_SET_SIZE_LIMIT);
279 gCode = pthread_getaffinity_np(pthread_self(), KMP_CPU_SET_SIZE_LIMIT,
280 reinterpret_cast<cpuset_t *
>(buf));
281 KA_TRACE(30, (
"__kmp_affinity_determine_capable: "
282 "initial getaffinity call returned %d errno = %d\n",
285 KMP_AFFINITY_ENABLE(KMP_CPU_SET_SIZE_LIMIT);
286 KA_TRACE(10, (
"__kmp_affinity_determine_capable: "
287 "affinity supported (mask size %d)\n",
288 (
int)__kmp_affin_mask_size));
289 KMP_INTERNAL_FREE(buf);
293 KMP_INTERNAL_FREE(buf);
// No usable mask size was found: disable affinity and optionally warn.
296 KMP_AFFINITY_DISABLE();
297 KA_TRACE(10, (
"__kmp_affinity_determine_capable: "
298 "cannot determine mask size - affinity not supported\n"));
299 if (verbose || (warnings && (type != affinity_none) &&
300 (type != affinity_default) && (type != affinity_disabled))) {
301 KMP_WARNING(AffCantGetMaskSize, env_var);
// Tests whether the futex system call is available by issuing a FUTEX_WAKE.
// `retval` is non-zero when the call succeeded or failed with anything other
// than ENOSYS. The return statement is not visible here; presumably `retval`
// is returned -- confirm.
// NOTE(review): `rc` is a long but the trace format prints it with %d.
310 int __kmp_futex_determine_capable() {
312 long rc = syscall(__NR_futex, &loc, FUTEX_WAKE, 1, NULL, NULL, 0);
313 int retval = (rc == 0) || (errno != ENOSYS);
316 (
"__kmp_futex_determine_capable: rc = %d errno = %d\n", rc, errno));
317 KA_TRACE(10, (
"__kmp_futex_determine_capable: futex syscall%s supported\n",
318 retval ?
"" :
" not"));
325 #if (KMP_ARCH_X86 || KMP_ARCH_X86_64 || KMP_ARCH_WASM) && (!KMP_ASM_INTRINS)
// Atomically ORs `d` into the 8-bit value at `p`.
// Reads the current value, computes value | d, and retries the
// compare-and-store until it succeeds against an unchanged value.
// The return statement is not visible here; the name suggests the value
// observed before the update is returned -- confirm.
329 kmp_int8 __kmp_test_then_or8(
volatile kmp_int8 *p, kmp_int8 d) {
330 kmp_int8 old_value, new_value;
332 old_value = TCR_1(*p);
333 new_value = old_value | d;
335 while (!KMP_COMPARE_AND_STORE_REL8(p, old_value, new_value)) {
// Lost the race: reload and recompute before retrying.
337 old_value = TCR_1(*p);
338 new_value = old_value | d;
// Atomically ANDs `d` into the 8-bit value at `p`.
// Reads the current value, computes value & d, and retries the
// compare-and-store until it succeeds against an unchanged value.
// The return statement is not visible here; the name suggests the value
// observed before the update is returned -- confirm.
343 kmp_int8 __kmp_test_then_and8(
volatile kmp_int8 *p, kmp_int8 d) {
344 kmp_int8 old_value, new_value;
346 old_value = TCR_1(*p);
347 new_value = old_value & d;
349 while (!KMP_COMPARE_AND_STORE_REL8(p, old_value, new_value)) {
// Lost the race: reload and recompute before retrying.
351 old_value = TCR_1(*p);
352 new_value = old_value & d;
// Atomically ORs `d` into the 32-bit value at `p`.
// Reads the current value, computes value | d, and retries the
// compare-and-store until it succeeds against an unchanged value.
// The return statement is not visible here; the name suggests the value
// observed before the update is returned -- confirm.
357 kmp_uint32 __kmp_test_then_or32(
volatile kmp_uint32 *p, kmp_uint32 d) {
358 kmp_uint32 old_value, new_value;
360 old_value = TCR_4(*p);
361 new_value = old_value | d;
363 while (!KMP_COMPARE_AND_STORE_REL32(p, old_value, new_value)) {
// Lost the race: reload and recompute before retrying.
365 old_value = TCR_4(*p);
366 new_value = old_value | d;
// Atomically ANDs `d` into the 32-bit value at `p`.
// Reads the current value, computes value & d, and retries the
// compare-and-store until it succeeds against an unchanged value.
// The return statement is not visible here; the name suggests the value
// observed before the update is returned -- confirm.
371 kmp_uint32 __kmp_test_then_and32(
volatile kmp_uint32 *p, kmp_uint32 d) {
372 kmp_uint32 old_value, new_value;
374 old_value = TCR_4(*p);
375 new_value = old_value & d;
377 while (!KMP_COMPARE_AND_STORE_REL32(p, old_value, new_value)) {
// Lost the race: reload and recompute before retrying.
379 old_value = TCR_4(*p);
380 new_value = old_value & d;
385 #if KMP_ARCH_X86 || KMP_ARCH_WASM
// Atomically adds `d` to the 8-bit value at `p`.
// Reads the current value, computes value + d, and retries the
// compare-and-store until it succeeds against an unchanged value.
// The return statement is not visible here; the name suggests the value
// observed before the update is returned -- confirm.
386 kmp_int8 __kmp_test_then_add8(
volatile kmp_int8 *p, kmp_int8 d) {
387 kmp_int8 old_value, new_value;
389 old_value = TCR_1(*p);
390 new_value = old_value + d;
392 while (!KMP_COMPARE_AND_STORE_REL8(p, old_value, new_value)) {
// Lost the race: reload and recompute before retrying.
394 old_value = TCR_1(*p);
395 new_value = old_value + d;
// Atomically adds `d` to the 64-bit value at `p`.
// Reads the current value, computes value + d, and retries the
// compare-and-store until it succeeds against an unchanged value.
// The return statement is not visible here; the name suggests the value
// observed before the update is returned -- confirm.
400 kmp_int64 __kmp_test_then_add64(
volatile kmp_int64 *p, kmp_int64 d) {
401 kmp_int64 old_value, new_value;
403 old_value = TCR_8(*p);
404 new_value = old_value + d;
406 while (!KMP_COMPARE_AND_STORE_REL64(p, old_value, new_value)) {
// Lost the race: reload and recompute before retrying.
408 old_value = TCR_8(*p);
409 new_value = old_value + d;
// Atomically ORs `d` into the 64-bit value at `p`.
// Reads the current value, computes value | d, and retries the
// compare-and-store until it succeeds against an unchanged value.
// The return statement is not visible here; the name suggests the value
// observed before the update is returned -- confirm.
415 kmp_uint64 __kmp_test_then_or64(
volatile kmp_uint64 *p, kmp_uint64 d) {
416 kmp_uint64 old_value, new_value;
418 old_value = TCR_8(*p);
419 new_value = old_value | d;
420 while (!KMP_COMPARE_AND_STORE_REL64(p, old_value, new_value)) {
// Lost the race: reload and recompute before retrying.
422 old_value = TCR_8(*p);
423 new_value = old_value | d;
// Atomically ANDs `d` into the 64-bit value at `p`.
// Reads the current value, computes value & d, and retries the
// compare-and-store until it succeeds against an unchanged value.
// The return statement is not visible here; the name suggests the value
// observed before the update is returned -- confirm.
428 kmp_uint64 __kmp_test_then_and64(
volatile kmp_uint64 *p, kmp_uint64 d) {
429 kmp_uint64 old_value, new_value;
431 old_value = TCR_8(*p);
432 new_value = old_value & d;
433 while (!KMP_COMPARE_AND_STORE_REL64(p, old_value, new_value)) {
// Lost the race: reload and recompute before retrying.
435 old_value = TCR_8(*p);
436 new_value = old_value & d;
// Requests cancellation of the thread registered under global id `gtid`.
// Only active when KMP_CANCEL_THREADS is defined: calls pthread_cancel on the
// thread's handle. A non-zero result other than ESRCH is fatal
// (CantTerminateWorkerThread); ESRCH is tolerated.
443 void __kmp_terminate_thread(
int gtid) {
445 kmp_info_t *th = __kmp_threads[gtid];
450 #ifdef KMP_CANCEL_THREADS
451 KA_TRACE(10, (
"__kmp_terminate_thread: kill (%d)\n", gtid));
452 status = pthread_cancel(th->th.th_info.ds.ds_thread);
453 if (status != 0 && status != ESRCH) {
454 __kmp_fatal(KMP_MSG(CantTerminateWorkerThread), KMP_ERR(status),
// Records the stack base, size and "may grow" flag of a thread in `th`.
// On the listed OSes, for a non-uber `gtid`, the stack extent is queried from
// the system: via thr_stksegment in one branch, otherwise via the thread's
// pthread attributes (pthread_attr_get_np on DragonFly/FreeBSD/NetBSD,
// pthread_getattr_np elsewhere) followed by pthread_attr_getstack.
// When a non-zero size and address were obtained, the base is stored as
// addr + size with stackgrow = FALSE. Otherwise the size is stored as 0, the
// base as the address of a local (`stack_data`), and stackgrow = TRUE.
// Return statements are not visible in this listing.
465 static kmp_int32 __kmp_set_stack_info(
int gtid, kmp_info_t *th) {
467 #if KMP_OS_LINUX || KMP_OS_DRAGONFLY || KMP_OS_FREEBSD || KMP_OS_NETBSD || \
468 KMP_OS_HURD || KMP_OS_SOLARIS || KMP_OS_AIX
476 if (!KMP_UBER_GTID(gtid)) {
480 if ((status = thr_stksegment(&s)) < 0) {
481 KMP_CHECK_SYSFAIL(
"thr_stksegment", status);
486 KA_TRACE(60, (
"__kmp_set_stack_info: T#%d thr_stksegment returned size:"
487 " %lu, low addr: %p\n",
// pthread-attribute based query.
492 status = pthread_attr_init(&attr);
493 KMP_CHECK_SYSFAIL(
"pthread_attr_init", status);
494 #if KMP_OS_DRAGONFLY || KMP_OS_FREEBSD || KMP_OS_NETBSD
495 status = pthread_attr_get_np(pthread_self(), &attr);
496 KMP_CHECK_SYSFAIL(
"pthread_attr_get_np", status);
498 status = pthread_getattr_np(pthread_self(), &attr);
499 KMP_CHECK_SYSFAIL(
"pthread_getattr_np", status);
501 status = pthread_attr_getstack(&attr, &addr, &size);
502 KMP_CHECK_SYSFAIL(
"pthread_attr_getstack", status);
504 (
"__kmp_set_stack_info: T#%d pthread_attr_getstack returned size:"
505 " %lu, low addr: %p\n",
507 status = pthread_attr_destroy(&attr);
508 KMP_CHECK_SYSFAIL(
"pthread_attr_destroy", status);
// `addr` is the low address, so the stored base is the high end.
512 if (size != 0 && addr != 0) {
514 TCW_PTR(th->th.th_info.ds.ds_stackbase, (((
char *)addr) + size));
515 TCW_PTR(th->th.th_info.ds.ds_stacksize, size);
516 TCW_4(th->th.th_info.ds.ds_stackgrow, FALSE);
// Fallback: size unknown, base approximated by a local's address.
522 TCW_PTR(th->th.th_info.ds.ds_stacksize, 0);
523 TCW_PTR(th->th.th_info.ds.ds_stackbase, &stack_data);
524 TCW_4(th->th.th_info.ds.ds_stackgrow, TRUE);
// pthread start routine for worker threads; `thr` is the worker's kmp_info_t.
// Performs per-thread setup (gtid, stats, ITT name, affinity, cancellation
// mode, x86 FP state, signal blocking, stack offset and stack bookkeeping),
// runs __kmp_launch_thread, and restores the signal mask afterwards.
// The return statement is not visible; `exit_val` holds the result of
// __kmp_launch_thread.
528 static void *__kmp_launch_worker(
void *thr) {
529 int status, old_type, old_state;
530 #ifdef KMP_BLOCK_SIGNALS
531 sigset_t new_set, old_set;
534 #if KMP_OS_LINUX || KMP_OS_DRAGONFLY || KMP_OS_FREEBSD || KMP_OS_NETBSD || \
535 KMP_OS_OPENBSD || KMP_OS_HURD || KMP_OS_SOLARIS || KMP_OS_AIX
536 void *
volatile padding = 0;
// Publish this thread's global id.
540 gtid = ((kmp_info_t *)thr)->th.th_info.ds.ds_gtid;
541 __kmp_gtid_set_specific(gtid);
542 #ifdef KMP_TDATA_GTID
545 #if KMP_STATS_ENABLED
547 __kmp_stats_thread_ptr = ((kmp_info_t *)thr)->th.th_stats;
548 __kmp_stats_thread_ptr->startLife();
549 KMP_SET_THREAD_STATE(IDLE);
554 __kmp_itt_thread_name(gtid);
557 #if KMP_AFFINITY_SUPPORTED
558 __kmp_affinity_bind_init_mask(gtid);
// Make the thread asynchronously cancellable (see __kmp_terminate_thread).
561 #ifdef KMP_CANCEL_THREADS
562 status = pthread_setcanceltype(PTHREAD_CANCEL_ASYNCHRONOUS, &old_type);
563 KMP_CHECK_SYSFAIL(
"pthread_setcanceltype", status);
565 status = pthread_setcancelstate(PTHREAD_CANCEL_ENABLE, &old_state);
566 KMP_CHECK_SYSFAIL(
"pthread_setcancelstate", status);
// Load the runtime's initial x87 control word and MXCSR into this thread.
569 #if KMP_ARCH_X86 || KMP_ARCH_X86_64
571 __kmp_clear_x87_fpu_status_word();
572 __kmp_load_x87_fpu_control_word(&__kmp_init_x87_fpu_control_word);
573 __kmp_load_mxcsr(&__kmp_init_mxcsr);
// Block every signal in the worker, remembering the previous mask.
576 #ifdef KMP_BLOCK_SIGNALS
577 status = sigfillset(&new_set);
578 KMP_CHECK_SYSFAIL_ERRNO(
"sigfillset", status);
579 status = pthread_sigmask(SIG_BLOCK, &new_set, &old_set);
580 KMP_CHECK_SYSFAIL(
"pthread_sigmask", status);
// Consume gtid * __kmp_stkoffset bytes of stack so later frames start at a
// per-thread offset.
583 #if KMP_OS_LINUX || KMP_OS_DRAGONFLY || KMP_OS_FREEBSD || KMP_OS_NETBSD || \
584 KMP_OS_OPENBSD || KMP_OS_HURD || KMP_OS_SOLARIS || KMP_OS_AIX
585 if (__kmp_stkoffset > 0 && gtid > 0) {
586 padding = KMP_ALLOCA(gtid * __kmp_stkoffset);
592 __kmp_set_stack_info(gtid, (kmp_info_t *)thr);
594 __kmp_check_stack_overlap((kmp_info_t *)thr);
596 exit_val = __kmp_launch_thread((kmp_info_t *)thr);
// Restore the signal mask saved above.
598 #ifdef KMP_BLOCK_SIGNALS
599 status = pthread_sigmask(SIG_SETMASK, &old_set, NULL);
600 KMP_CHECK_SYSFAIL(
"pthread_sigmask", status);
// pthread start routine for the monitor thread; `thr` is its kmp_info_t.
// After setup it loops until __kmp_global.g.g_done is set, sleeping on
// __kmp_wait_cv for one interval per iteration and then incrementing the
// global time counter (g_time.dt.t_value). On exit it unblocks signals and,
// if g_abort is non-zero, terminates the other threads and re-raises the
// signal.
609 static void *__kmp_launch_monitor(
void *thr) {
610 int status, old_type, old_state;
611 #ifdef KMP_BLOCK_SIGNALS
614 struct timespec interval;
618 KA_TRACE(10, (
"__kmp_launch_monitor: #1 launched\n"));
621 __kmp_gtid_set_specific(KMP_GTID_MONITOR);
622 #ifdef KMP_TDATA_GTID
623 __kmp_gtid = KMP_GTID_MONITOR;
630 __kmp_itt_thread_ignore();
633 __kmp_set_stack_info(((kmp_info_t *)thr)->th.th_info.ds.ds_gtid,
636 __kmp_check_stack_overlap((kmp_info_t *)thr);
638 #ifdef KMP_CANCEL_THREADS
639 status = pthread_setcanceltype(PTHREAD_CANCEL_ASYNCHRONOUS, &old_type);
640 KMP_CHECK_SYSFAIL(
"pthread_setcanceltype", status);
642 status = pthread_setcancelstate(PTHREAD_CANCEL_ENABLE, &old_state);
643 KMP_CHECK_SYSFAIL(
"pthread_setcancelstate", status);
// Under a real-time policy (SCHED_FIFO / SCHED_RR): warn, then try to raise
// this thread's priority by one if it is below the policy maximum; otherwise
// warn that the monitor is already at maximum priority.
646 #if KMP_REAL_TIME_FIX
651 int sched = sched_getscheduler(0);
652 if (sched == SCHED_FIFO || sched == SCHED_RR) {
655 struct sched_param param;
656 int max_priority = sched_get_priority_max(sched);
658 KMP_WARNING(RealTimeSchedNotSupported);
// NOTE(review): "¶m" below (twice) looks like a mis-encoded "&param" --
// confirm against the upstream file.
659 sched_getparam(0, ¶m);
660 if (param.sched_priority < max_priority) {
661 param.sched_priority += 1;
662 rc = sched_setscheduler(0, sched, ¶m);
665 kmp_msg_t err_code = KMP_ERR(error);
666 __kmp_msg(kmp_ms_warning, KMP_MSG(CantChangeMonitorPriority),
667 err_code, KMP_MSG(MonitorWillStarve), __kmp_msg_null);
668 if (__kmp_generate_warnings == kmp_warnings_off) {
669 __kmp_str_free(&err_code.str);
676 __kmp_msg(kmp_ms_warning, KMP_MSG(RunningAtMaxPriority),
677 KMP_MSG(MonitorWillStarve), KMP_HNT(RunningAtMaxPriority),
682 TCW_4(__kmp_global.g.g_time.dt.t_value, 0);
// Sleep interval: with one wakeup per second the nanosecond part is 0;
// otherwise it is one second divided by the number of wakeups.
688 if (__kmp_monitor_wakeups == 1) {
690 interval.tv_nsec = 0;
693 interval.tv_nsec = (KMP_NSEC_PER_SEC / __kmp_monitor_wakeups);
696 KA_TRACE(10, (
"__kmp_launch_monitor: #2 monitor\n"));
698 while (!TCR_4(__kmp_global.g.g_done)) {
704 KA_TRACE(15, (
"__kmp_launch_monitor: update\n"));
// Absolute deadline = current time + interval, with nanosecond carry.
706 status = gettimeofday(&tval, NULL);
707 KMP_CHECK_SYSFAIL_ERRNO(
"gettimeofday", status);
708 TIMEVAL_TO_TIMESPEC(&tval, &now);
710 now.tv_sec += interval.tv_sec;
711 now.tv_nsec += interval.tv_nsec;
713 if (now.tv_nsec >= KMP_NSEC_PER_SEC) {
715 now.tv_nsec -= KMP_NSEC_PER_SEC;
718 status = pthread_mutex_lock(&__kmp_wait_mx.m_mutex);
719 KMP_CHECK_SYSFAIL(
"pthread_mutex_lock", status);
// Re-check g_done under the mutex before waiting.
721 if (!TCR_4(__kmp_global.g.g_done)) {
722 status = pthread_cond_timedwait(&__kmp_wait_cv.c_cond,
723 &__kmp_wait_mx.m_mutex, &now);
// Timeout and EINTR are not reported as failures.
725 if (status != ETIMEDOUT && status != EINTR) {
726 KMP_SYSFAIL(
"pthread_cond_timedwait", status);
730 status = pthread_mutex_unlock(&__kmp_wait_mx.m_mutex);
731 KMP_CHECK_SYSFAIL(
"pthread_mutex_unlock", status);
// Advance the global time counter by one tick.
733 TCW_4(__kmp_global.g.g_time.dt.t_value,
734 TCR_4(__kmp_global.g.g_time.dt.t_value) + 1);
739 KA_TRACE(10, (
"__kmp_launch_monitor: #3 cleanup\n"));
// Unblock all signals before finishing.
741 #ifdef KMP_BLOCK_SIGNALS
742 status = sigfillset(&new_set);
743 KMP_CHECK_SYSFAIL_ERRNO(
"sigfillset", status);
744 status = pthread_sigmask(SIG_UNBLOCK, &new_set, NULL);
745 KMP_CHECK_SYSFAIL(
"pthread_sigmask", status);
748 KA_TRACE(10, (
"__kmp_launch_monitor: #4 finished\n"));
// Abort path: cancel every thread with gtid >= 1, then raise the recorded
// signal when it is positive.
750 if (__kmp_global.g.g_abort != 0) {
756 KA_TRACE(10, (
"__kmp_launch_monitor: #5 terminate sig=%d\n",
757 __kmp_global.g.g_abort));
762 for (gtid = 1; gtid < __kmp_threads_capacity; ++gtid)
763 __kmp_terminate_thread(gtid);
767 KA_TRACE(10, (
"__kmp_launch_monitor: #6 raise sig=%d\n",
768 __kmp_global.g.g_abort));
770 if (__kmp_global.g.g_abort > 0)
771 raise(__kmp_global.g.g_abort);
774 KA_TRACE(10, (
"__kmp_launch_monitor: #7 exit\n"));
// Creates the OS thread for worker `gtid`, or adopts the calling thread when
// `gtid` is an uber (root) gtid.
//   gtid       - global thread id; stored into th's descriptor.
//   th         - runtime thread structure, passed to __kmp_launch_worker.
//   stack_size - requested stack size in bytes, before the per-thread offset
//                is added.
// Failures to configure attributes or create the thread are fatal; a failure
// to destroy the attributes only produces a warning.
780 void __kmp_create_worker(
int gtid, kmp_info_t *th,
size_t stack_size) {
782 pthread_attr_t thread_attr;
785 th->th.th_info.ds.ds_gtid = gtid;
// Attach a stats node under the stats lock: a new list entry for workers,
// the current thread's node for an uber thread.
787 #if KMP_STATS_ENABLED
789 __kmp_acquire_tas_lock(&__kmp_stats_lock, gtid);
795 if (!KMP_UBER_GTID(gtid)) {
796 th->th.th_stats = __kmp_stats_list->push_back(gtid);
800 th->th.th_stats = __kmp_stats_thread_ptr;
802 __kmp_release_tas_lock(&__kmp_stats_lock, gtid);
// Uber thread: no new OS thread, record the calling thread's handle and stack.
806 if (KMP_UBER_GTID(gtid)) {
807 KA_TRACE(10, (
"__kmp_create_worker: uber thread (%d)\n", gtid));
808 th->th.th_info.ds.ds_thread = pthread_self();
809 __kmp_set_stack_info(gtid, th);
810 __kmp_check_stack_overlap(th);
814 KA_TRACE(10, (
"__kmp_create_worker: try to create thread (%d)\n", gtid));
818 #ifdef KMP_THREAD_ATTR
819 status = pthread_attr_init(&thread_attr);
821 __kmp_fatal(KMP_MSG(CantInitThreadAttrs), KMP_ERR(status), __kmp_msg_null);
823 status = pthread_attr_setdetachstate(&thread_attr, PTHREAD_CREATE_JOINABLE);
825 __kmp_fatal(KMP_MSG(CantSetWorkerState), KMP_ERR(status), __kmp_msg_null);
// Grow the request by a per-thread amount proportional to gtid.
835 stack_size += gtid * __kmp_stkoffset * 2;
837 KA_TRACE(10, (
"__kmp_create_worker: T#%d, default stacksize = %lu bytes, "
838 "__kmp_stksize = %lu bytes, final stacksize = %lu bytes\n",
839 gtid, KMP_DEFAULT_STKSIZE, __kmp_stksize, stack_size));
841 #ifdef _POSIX_THREAD_ATTR_STACKSIZE
842 status = pthread_attr_setstacksize(&thread_attr, stack_size);
// Backup size: used only when the stack size did not come from the
// environment (__kmp_env_stksize is false).
843 #ifdef KMP_BACKUP_STKSIZE
845 if (!__kmp_env_stksize) {
846 stack_size = KMP_BACKUP_STKSIZE + gtid * __kmp_stkoffset;
847 __kmp_stksize = KMP_BACKUP_STKSIZE;
848 KA_TRACE(10, (
"__kmp_create_worker: T#%d, default stacksize = %lu bytes, "
849 "__kmp_stksize = %lu bytes, (backup) final stacksize = %lu "
851 gtid, KMP_DEFAULT_STKSIZE, __kmp_stksize, stack_size));
852 status = pthread_attr_setstacksize(&thread_attr, stack_size);
857 __kmp_fatal(KMP_MSG(CantSetWorkerStackSize, stack_size), KMP_ERR(status),
858 KMP_HNT(ChangeWorkerStackSize), __kmp_msg_null);
865 pthread_create(&handle, &thread_attr, __kmp_launch_worker, (
void *)th);
// Map common pthread_create errors to specific fatal messages with hints.
866 if (status != 0 || !handle) {
867 #ifdef _POSIX_THREAD_ATTR_STACKSIZE
868 if (status == EINVAL) {
869 __kmp_fatal(KMP_MSG(CantSetWorkerStackSize, stack_size), KMP_ERR(status),
870 KMP_HNT(IncreaseWorkerStackSize), __kmp_msg_null);
872 if (status == ENOMEM) {
873 __kmp_fatal(KMP_MSG(CantSetWorkerStackSize, stack_size), KMP_ERR(status),
874 KMP_HNT(DecreaseWorkerStackSize), __kmp_msg_null);
877 if (status == EAGAIN) {
878 __kmp_fatal(KMP_MSG(NoResourcesForWorkerThread), KMP_ERR(status),
879 KMP_HNT(Decrease_NUM_THREADS), __kmp_msg_null);
881 KMP_SYSFAIL(
"pthread_create", status);
// Name the new thread "openmp_worker" using whichever API variant exists.
885 if (!KMP_UBER_GTID(gtid)) {
886 #if defined(LIBOMP_HAVE_PTHREAD_SET_NAME_NP)
887 pthread_set_name_np(handle,
"openmp_worker");
888 #elif defined(LIBOMP_HAVE_PTHREAD_SETNAME_NP) && !KMP_OS_DARWIN
890 pthread_setname_np(handle,
"%s",
const_cast<char *
>(
"openmp_worker"));
892 pthread_setname_np(handle,
"openmp_worker");
897 th->th.th_info.ds.ds_thread = handle;
899 #ifdef KMP_THREAD_ATTR
900 status = pthread_attr_destroy(&thread_attr);
902 kmp_msg_t err_code = KMP_ERR(status);
903 __kmp_msg(kmp_ms_warning, KMP_MSG(CantDestroyThreadAttrs), err_code,
905 if (__kmp_generate_warnings == kmp_warnings_off) {
906 __kmp_str_free(&err_code.str);
913 KA_TRACE(10, (
"__kmp_create_worker: done creating thread (%d)\n", gtid));
// Creates the monitor thread, described by `th`, running
// __kmp_launch_monitor.
// When the default blocktime is KMP_MAX_BLOCKTIME no monitor is created and
// th's tid/gtid are set to 0. Otherwise th is tagged KMP_GTID_MONITOR, a
// stack size is chosen (doubling on some failures when the size was chosen
// automatically), and the thread is created as joinable.
918 void __kmp_create_monitor(kmp_info_t *th) {
920 pthread_attr_t thread_attr;
// TRUE when the stack size was defaulted here rather than supplied.
923 int auto_adj_size = FALSE;
925 if (__kmp_dflt_blocktime == KMP_MAX_BLOCKTIME) {
927 KA_TRACE(10, (
"__kmp_create_monitor: skipping monitor thread because of "
929 th->th.th_info.ds.ds_tid = 0;
930 th->th.th_info.ds.ds_gtid = 0;
933 KA_TRACE(10, (
"__kmp_create_monitor: try to create monitor\n"));
937 th->th.th_info.ds.ds_tid = KMP_GTID_MONITOR;
938 th->th.th_info.ds.ds_gtid = KMP_GTID_MONITOR;
939 #if KMP_REAL_TIME_FIX
940 TCW_4(__kmp_global.g.g_time.dt.t_value,
943 TCW_4(__kmp_global.g.g_time.dt.t_value, 0);
946 #ifdef KMP_THREAD_ATTR
947 if (__kmp_monitor_stksize == 0) {
948 __kmp_monitor_stksize = KMP_DEFAULT_MONITOR_STKSIZE;
949 auto_adj_size = TRUE;
951 status = pthread_attr_init(&thread_attr);
953 __kmp_fatal(KMP_MSG(CantInitThreadAttrs), KMP_ERR(status), __kmp_msg_null);
955 status = pthread_attr_setdetachstate(&thread_attr, PTHREAD_CREATE_JOINABLE);
957 __kmp_fatal(KMP_MSG(CantSetMonitorState), KMP_ERR(status), __kmp_msg_null);
// `size` is only used for the trace message below.
960 #ifdef _POSIX_THREAD_ATTR_STACKSIZE
961 status = pthread_attr_getstacksize(&thread_attr, &size);
962 KMP_CHECK_SYSFAIL(
"pthread_attr_getstacksize", status);
964 size = __kmp_sys_min_stksize;
968 if (__kmp_monitor_stksize == 0) {
969 __kmp_monitor_stksize = KMP_DEFAULT_MONITOR_STKSIZE;
// Never request less than the system minimum.
971 if (__kmp_monitor_stksize < __kmp_sys_min_stksize) {
972 __kmp_monitor_stksize = __kmp_sys_min_stksize;
975 KA_TRACE(10, (
"__kmp_create_monitor: default stacksize = %lu bytes,"
976 "requested stacksize = %lu bytes\n",
977 size, __kmp_monitor_stksize));
982 #ifdef _POSIX_THREAD_ATTR_STACKSIZE
983 KA_TRACE(10, (
"__kmp_create_monitor: setting stacksize = %lu bytes,",
984 __kmp_monitor_stksize));
985 status = pthread_attr_setstacksize(&thread_attr, __kmp_monitor_stksize);
// The condition guarding this doubling is not visible in this listing.
988 __kmp_monitor_stksize *= 2;
991 kmp_msg_t err_code = KMP_ERR(status);
992 __kmp_msg(kmp_ms_warning,
993 KMP_MSG(CantSetMonitorStackSize, (
long int)__kmp_monitor_stksize),
994 err_code, KMP_HNT(ChangeMonitorStackSize), __kmp_msg_null);
995 if (__kmp_generate_warnings == kmp_warnings_off) {
996 __kmp_str_free(&err_code.str);
1002 pthread_create(&handle, &thread_attr, __kmp_launch_monitor, (
void *)th);
// EINVAL with an auto-chosen size below 0x40000000 bytes doubles the size;
// other cases are fatal with a hint.
1005 #ifdef _POSIX_THREAD_ATTR_STACKSIZE
1006 if (status == EINVAL) {
1007 if (auto_adj_size && (__kmp_monitor_stksize < (
size_t)0x40000000)) {
1008 __kmp_monitor_stksize *= 2;
1011 __kmp_fatal(KMP_MSG(CantSetMonitorStackSize, __kmp_monitor_stksize),
1012 KMP_ERR(status), KMP_HNT(IncreaseMonitorStackSize),
1015 if (status == ENOMEM) {
1016 __kmp_fatal(KMP_MSG(CantSetMonitorStackSize, __kmp_monitor_stksize),
1017 KMP_ERR(status), KMP_HNT(DecreaseMonitorStackSize),
1021 if (status == EAGAIN) {
1022 __kmp_fatal(KMP_MSG(NoResourcesForMonitorThread), KMP_ERR(status),
1023 KMP_HNT(DecreaseNumberOfThreadsInUse), __kmp_msg_null);
1025 KMP_SYSFAIL(
"pthread_create", status);
1028 th->th.th_info.ds.ds_thread = handle;
// Wait until the global time counter is no longer -1.
1030 #if KMP_REAL_TIME_FIX
1032 KMP_DEBUG_ASSERT(
sizeof(kmp_uint32) ==
1033 sizeof(__kmp_global.g.g_time.dt.t_value));
1034 __kmp_wait_4((kmp_uint32
volatile *)&__kmp_global.g.g_time.dt.t_value, -1,
1035 &__kmp_neq_4, NULL);
1038 #ifdef KMP_THREAD_ATTR
1039 status = pthread_attr_destroy(&thread_attr);
1041 kmp_msg_t err_code = KMP_ERR(status);
1042 __kmp_msg(kmp_ms_warning, KMP_MSG(CantDestroyThreadAttrs), err_code,
1044 if (__kmp_generate_warnings == kmp_warnings_off) {
1045 __kmp_str_free(&err_code.str);
1052 KA_TRACE(10, (
"__kmp_create_monitor: monitor created %#.8lx\n",
1053 th->th.th_info.ds.ds_thread));
// Terminates the calling thread via pthread_exit, passing `exit_status`
// (widened through intptr_t) as the thread's exit value.
1058 void __kmp_exit_thread(
int exit_status) {
1062 pthread_exit((
void *)(intptr_t)exit_status);
1067 void __kmp_resume_monitor();
// Joins the monitor thread described by `th` and marks it as gone.
// If th's gtid is not KMP_GTID_MONITOR the monitor never started and there is
// nothing to reap. Otherwise the thread is probed with pthread_kill(…, 0);
// unless that reports ESRCH it is woken via __kmp_resume_monitor and joined.
// Afterwards th's tid/gtid are set to KMP_GTID_DNE.
// NOTE(review): in the visible lines the pthread_join status is not checked
// before `exit_val` is compared with `th` -- confirm exit_val is initialized.
1069 extern "C" void __kmp_reap_monitor(kmp_info_t *th) {
1073 KA_TRACE(10, (
"__kmp_reap_monitor: try to reap monitor thread with handle"
1075 th->th.th_info.ds.ds_thread));
1080 KMP_DEBUG_ASSERT(th->th.th_info.ds.ds_tid == th->th.th_info.ds.ds_gtid);
1081 if (th->th.th_info.ds.ds_gtid != KMP_GTID_MONITOR) {
1082 KA_TRACE(10, (
"__kmp_reap_monitor: monitor did not start, returning\n"));
// Signal 0 sends nothing; it only tests whether the thread still exists.
1092 status = pthread_kill(th->th.th_info.ds.ds_thread, 0);
1093 if (status != ESRCH) {
1094 __kmp_resume_monitor();
1096 KA_TRACE(10, (
"__kmp_reap_monitor: try to join with monitor\n"));
1097 status = pthread_join(th->th.th_info.ds.ds_thread, &exit_val);
1098 if (exit_val != th) {
1099 __kmp_fatal(KMP_MSG(ReapMonitorError), KMP_ERR(status), __kmp_msg_null);
1102 th->th.th_info.ds.ds_tid = KMP_GTID_DNE;
1103 th->th.th_info.ds.ds_gtid = KMP_GTID_DNE;
1105 KA_TRACE(10, (
"__kmp_reap_monitor: done reaping monitor thread with handle"
1107 th->th.th_info.ds.ds_thread));
// No-op variant of __kmp_reap_monitor: the argument is explicitly discarded.
// The preprocessor condition selecting it is not visible in this listing.
1114 extern "C" void __kmp_reap_monitor(kmp_info_t *th) { (void)th; }
// Joins the worker thread described by `th`.
// A join failure is fatal (ReapWorkerError); the guarding condition is not
// visible in this listing. An exit value different from `th` is only traced.
1117 void __kmp_reap_worker(kmp_info_t *th) {
1124 10, (
"__kmp_reap_worker: try to reap T#%d\n", th->th.th_info.ds.ds_gtid));
1126 status = pthread_join(th->th.th_info.ds.ds_thread, &exit_val);
1130 __kmp_fatal(KMP_MSG(ReapWorkerError), KMP_ERR(status), __kmp_msg_null);
1132 if (exit_val != th) {
1133 KA_TRACE(10, (
"__kmp_reap_worker: worker T#%d did not reap properly, "
1135 th->th.th_info.ds.ds_gtid, exit_val));
1141 KA_TRACE(10, (
"__kmp_reap_worker: done reaping T#%d\n",
1142 th->th.th_info.ds.ds_gtid));
1147 #if KMP_HANDLE_SIGNALS
// Signal handler with no visible body; __kmp_remove_one_handler recognizes it
// as one of the runtime's own handlers.
1149 static void __kmp_null_handler(
int signo) {
// Signal handler installed by __kmp_install_signals.
// Acts only while no abort is in progress (g_abort == 0): in the visible
// lines it dumps the debug buffer if one is in use, unregisters the library,
// records the signal number in g_abort and sets g_done so runtime loops stop.
// The dispatch on `signo` is not visible in this listing.
1153 static void __kmp_team_handler(
int signo) {
1154 if (__kmp_global.g.g_abort == 0) {
1157 __kmp_debug_printf(
"__kmp_team_handler: caught signal = %d\n", signo);
1172 if (__kmp_debug_buf) {
1173 __kmp_dump_debug_buffer();
1175 __kmp_unregister_library();
1177 TCW_4(__kmp_global.g.g_abort, signo);
1179 TCW_4(__kmp_global.g.g_done, TRUE);
1184 __kmp_debug_printf(
"__kmp_team_handler: unknown signal type");
// Thin wrapper around sigaction() that routes the result through
// KMP_CHECK_SYSFAIL_ERRNO. Arguments are passed through unchanged.
1191 static void __kmp_sigaction(
int signum,
const struct sigaction *act,
1192 struct sigaction *oldact) {
1193 int rc = sigaction(signum, act, oldact);
1194 KMP_CHECK_SYSFAIL_ERRNO(
"sigaction", rc);
// Installs `handler_func` for signal `sig`, or just records the current
// disposition.
//   parallel_init != 0: install the handler (all signals masked while it
//     runs, no flags). It is kept, and `sig` added to __kmp_sigset, only if
//     the previous handler equals the one saved in __kmp_sighldrs[sig];
//     otherwise the previous action is put back.
//   parallel_init == 0: only save the current action into
//     __kmp_sighldrs[sig].
1197 static void __kmp_install_one_handler(
int sig, sig_func_t handler_func,
1198 int parallel_init) {
1201 (
"__kmp_install_one_handler( %d, ..., %d )\n", sig, parallel_init));
1202 if (parallel_init) {
1203 struct sigaction new_action;
1204 struct sigaction old_action;
1205 new_action.sa_handler = handler_func;
1206 new_action.sa_flags = 0;
1207 sigfillset(&new_action.sa_mask);
1208 __kmp_sigaction(sig, &new_action, &old_action);
1209 if (old_action.sa_handler == __kmp_sighldrs[sig].sa_handler) {
1210 sigaddset(&__kmp_sigset, sig);
// The handler changed since it was saved: restore what was there.
1213 __kmp_sigaction(sig, &old_action, NULL);
// Passing NULL as the new action only queries the current one.
1217 __kmp_sigaction(sig, NULL, &__kmp_sighldrs[sig]);
// Restores the saved disposition for `sig` if the runtime installed a handler
// for it (i.e. `sig` is in __kmp_sigset).
// If the handler being replaced turns out not to be one of the runtime's
// (__kmp_team_handler / __kmp_null_handler), that handler is put back.
// `sig` is then removed from __kmp_sigset.
1222 static void __kmp_remove_one_handler(
int sig) {
1223 KB_TRACE(60, (
"__kmp_remove_one_handler( %d )\n", sig));
1224 if (sigismember(&__kmp_sigset, sig)) {
1225 struct sigaction old;
1227 __kmp_sigaction(sig, &__kmp_sighldrs[sig], &old);
1228 if ((old.sa_handler != __kmp_team_handler) &&
1229 (old.sa_handler != __kmp_null_handler)) {
1231 KB_TRACE(10, (
"__kmp_remove_one_handler: oops, not our handler, "
1232 "restoring: sig=%d\n",
1234 __kmp_sigaction(sig, &old, NULL);
1236 sigdelset(&__kmp_sigset, sig);
// Runs __kmp_install_one_handler with __kmp_team_handler for each signal
// listed below.
// Proceeds when signal handling is enabled (__kmp_handle_signals) or when
// `parallel_init` is zero (in which case the per-signal call only saves the
// current dispositions). __kmp_sigset is cleared first.
1241 void __kmp_install_signals(
int parallel_init) {
1242 KB_TRACE(10, (
"__kmp_install_signals( %d )\n", parallel_init));
1243 if (__kmp_handle_signals || !parallel_init) {
1246 sigemptyset(&__kmp_sigset);
1247 __kmp_install_one_handler(SIGHUP, __kmp_team_handler, parallel_init);
1248 __kmp_install_one_handler(SIGINT, __kmp_team_handler, parallel_init);
1249 __kmp_install_one_handler(SIGQUIT, __kmp_team_handler, parallel_init);
1250 __kmp_install_one_handler(SIGILL, __kmp_team_handler, parallel_init);
1251 __kmp_install_one_handler(SIGABRT, __kmp_team_handler, parallel_init);
1252 __kmp_install_one_handler(SIGFPE, __kmp_team_handler, parallel_init);
1253 __kmp_install_one_handler(SIGBUS, __kmp_team_handler, parallel_init);
1254 __kmp_install_one_handler(SIGSEGV, __kmp_team_handler, parallel_init);
1256 __kmp_install_one_handler(SIGSYS, __kmp_team_handler, parallel_init);
1258 __kmp_install_one_handler(SIGTERM, __kmp_team_handler, parallel_init);
1260 __kmp_install_one_handler(SIGPIPE, __kmp_team_handler, parallel_init);
// Calls __kmp_remove_one_handler for every signal number from 1 to NSIG - 1;
// that helper ignores signals the runtime did not install a handler for.
1265 void __kmp_remove_signals(
void) {
1267 KB_TRACE(10, (
"__kmp_remove_signals()\n"));
1268 for (sig = 1; sig < NSIG; ++sig) {
1269 __kmp_remove_one_handler(sig);
// Sets the calling thread's cancel state to `new_state` (only when
// KMP_CANCEL_THREADS is defined). Debug builds assert that cancellation was
// disabled beforehand, i.e. that this pairs with a prior __kmp_disable.
1275 void __kmp_enable(
int new_state) {
1276 #ifdef KMP_CANCEL_THREADS
1277 int status, old_state;
1278 status = pthread_setcancelstate(new_state, &old_state);
1279 KMP_CHECK_SYSFAIL(
"pthread_setcancelstate", status);
1280 KMP_DEBUG_ASSERT(old_state == PTHREAD_CANCEL_DISABLE);
// Disables cancellation for the calling thread (only when KMP_CANCEL_THREADS
// is defined) and stores the previous cancel state in *old_state, so it can
// later be handed to __kmp_enable.
1284 void __kmp_disable(
int *old_state) {
1285 #ifdef KMP_CANCEL_THREADS
1287 status = pthread_setcancelstate(PTHREAD_CANCEL_DISABLE, old_state);
1288 KMP_CHECK_SYSFAIL(
"pthread_setcancelstate", status);
// pthread_atfork "prepare" hook: takes the initialization lock and then the
// fork/join lock so both are held across fork().
1292 static void __kmp_atfork_prepare(
void) {
1293 __kmp_acquire_bootstrap_lock(&__kmp_initz_lock);
1294 __kmp_acquire_bootstrap_lock(&__kmp_forkjoin_lock);
// pthread_atfork "parent" hook: releases the locks taken in
// __kmp_atfork_prepare, in reverse order.
1297 static void __kmp_atfork_parent(
void) {
1298 __kmp_release_bootstrap_lock(&__kmp_forkjoin_lock);
1299 __kmp_release_bootstrap_lock(&__kmp_initz_lock);
// pthread_atfork "child" hook: releases the locks inherited from the parent
// and resets the runtime's global state so the child starts uninitialized,
// then re-runs serial initialization.
1305 static void __kmp_atfork_child(
void) {
1306 __kmp_release_bootstrap_lock(&__kmp_forkjoin_lock);
1307 __kmp_release_bootstrap_lock(&__kmp_initz_lock);
// Reset affinity state: binding off, settings back to defaults, cached
// masks and topology dropped.
1314 #if KMP_AFFINITY_SUPPORTED
1315 #if KMP_OS_LINUX || KMP_OS_FREEBSD || KMP_OS_NETBSD || KMP_OS_DRAGONFLY || \
1319 kmp_set_thread_affinity_mask_initial();
1324 if (__kmp_nested_proc_bind.bind_types != NULL) {
1325 __kmp_nested_proc_bind.bind_types[0] = proc_bind_false;
1327 for (kmp_affinity_t *affinity : __kmp_affinities)
1328 *affinity = KMP_AFFINITY_INIT(affinity->env_var);
1329 __kmp_affin_fullMask =
nullptr;
1330 __kmp_affin_origMask =
nullptr;
1331 __kmp_topology =
nullptr;
// Clear every "initialized" flag.
1335 __kmp_init_monitor = 0;
1337 __kmp_init_parallel = FALSE;
1338 __kmp_init_middle = FALSE;
1339 __kmp_init_serial = FALSE;
1340 TCW_4(__kmp_init_gtid, FALSE);
1341 __kmp_init_common = FALSE;
1343 TCW_4(__kmp_init_user_locks, FALSE);
1344 #if !KMP_USE_DYNAMIC_LOCK
1345 __kmp_user_lock_table.used = 1;
1346 __kmp_user_lock_table.allocated = 0;
1347 __kmp_user_lock_table.table = NULL;
1348 __kmp_lock_blocks = NULL;
// Thread count and pools are reset to empty.
1352 TCW_4(__kmp_nth, 0);
1354 __kmp_thread_pool = NULL;
1355 __kmp_thread_pool_insert_pt = NULL;
1356 __kmp_team_pool = NULL;
// Walk the threadprivate cache list, nulling each non-null cache pointer.
1360 KA_TRACE(10, (
"__kmp_atfork_child: checking cache address list %p\n",
1361 __kmp_threadpriv_cache_list));
1363 while (__kmp_threadpriv_cache_list != NULL) {
1365 if (*__kmp_threadpriv_cache_list->addr != NULL) {
1366 KC_TRACE(50, (
"__kmp_atfork_child: zeroing cache at address %p\n",
1367 &(*__kmp_threadpriv_cache_list->addr)));
1369 *__kmp_threadpriv_cache_list->addr = NULL;
1371 __kmp_threadpriv_cache_list = __kmp_threadpriv_cache_list->next;
1374 __kmp_init_runtime = FALSE;
// Re-create the bootstrap locks in a fresh state.
1377 __kmp_init_bootstrap_lock(&__kmp_initz_lock);
1378 __kmp_init_bootstrap_lock(&__kmp_stdio_lock);
1379 __kmp_init_bootstrap_lock(&__kmp_console_lock);
1380 __kmp_init_bootstrap_lock(&__kmp_task_team_lock);
1390 __kmp_need_register_serial = FALSE;
1391 __kmp_serial_initialize();
// Registers the three fork hooks with pthread_atfork, once: the
// __kmp_need_register_atfork flag gates the call and is cleared afterwards.
1405 void __kmp_register_atfork(
void) {
1406 if (__kmp_need_register_atfork) {
1408 int status = pthread_atfork(__kmp_atfork_prepare, __kmp_atfork_parent,
1409 __kmp_atfork_child);
1410 KMP_CHECK_SYSFAIL(
"pthread_atfork", status);
1412 __kmp_need_register_atfork = FALSE;
// Initializes the shared mutex and condvar attribute objects that are later
// used when creating each thread's suspend mutex/condvar.
1416 void __kmp_suspend_initialize(
void) {
1418 status = pthread_mutexattr_init(&__kmp_suspend_mutex_attr);
1419 KMP_CHECK_SYSFAIL(
"pthread_mutexattr_init", status);
1420 status = pthread_condattr_init(&__kmp_suspend_cond_attr);
1421 KMP_CHECK_SYSFAIL(
"pthread_condattr_init", status);
// Ensures th's suspend condvar and mutex are initialized.
// th_suspend_init_count encodes the state: a value of __kmp_fork_count + 1
// means "initialized", and -1 is stored while an initialization is in
// progress. A thread that sees -1, or loses the compare-and-store to -1,
// waits for the count to reach the target; the winner creates the condvar
// and mutex and then publishes the target value with a release store.
1424 void __kmp_suspend_initialize_thread(kmp_info_t *th) {
1425 int old_value = KMP_ATOMIC_LD_RLX(&th->th.th_suspend_init_count);
1426 int new_value = __kmp_fork_count + 1;
// Already initialized.
1428 if (old_value == new_value)
1431 if (old_value == -1 || !__kmp_atomic_compare_store(
1432 &th->th.th_suspend_init_count, old_value, -1)) {
// Someone else is initializing: wait until they publish.
1433 while (KMP_ATOMIC_LD_ACQ(&th->th.th_suspend_init_count) != new_value) {
1439 status = pthread_cond_init(&th->th.th_suspend_cv.c_cond,
1440 &__kmp_suspend_cond_attr);
1441 KMP_CHECK_SYSFAIL(
"pthread_cond_init", status);
1442 status = pthread_mutex_init(&th->th.th_suspend_mx.m_mutex,
1443 &__kmp_suspend_mutex_attr);
1444 KMP_CHECK_SYSFAIL(
"pthread_mutex_init", status);
1445 KMP_ATOMIC_ST_REL(&th->th.th_suspend_init_count, new_value);
// Destroys th's suspend condvar and mutex if they are currently initialized
// (init count greater than __kmp_fork_count), then decrements the count.
// EBUSY from either destroy call is tolerated; any other error goes to
// KMP_SYSFAIL.
1449 void __kmp_suspend_uninitialize_thread(kmp_info_t *th) {
1450 if (KMP_ATOMIC_LD_ACQ(&th->th.th_suspend_init_count) > __kmp_fork_count) {
1455 status = pthread_cond_destroy(&th->th.th_suspend_cv.c_cond);
1456 if (status != 0 && status != EBUSY) {
1457 KMP_SYSFAIL(
"pthread_cond_destroy", status);
1459 status = pthread_mutex_destroy(&th->th.th_suspend_mx.m_mutex);
1460 if (status != 0 && status != EBUSY) {
1461 KMP_SYSFAIL(
"pthread_mutex_destroy", status);
1463 --th->th.th_suspend_init_count;
1464 KMP_DEBUG_ASSERT(KMP_ATOMIC_LD_RLX(&th->th.th_suspend_init_count) ==
// Tries to take th's suspend mutex without blocking.
// Returns non-zero if the lock was acquired, 0 otherwise.
1470 int __kmp_try_suspend_mx(kmp_info_t *th) {
1471 return (pthread_mutex_trylock(&th->th.th_suspend_mx.m_mutex) == 0);
// Locks th's suspend mutex; the result is checked with KMP_CHECK_SYSFAIL.
1474 void __kmp_lock_suspend_mx(kmp_info_t *th) {
1475 int status = pthread_mutex_lock(&th->th.th_suspend_mx.m_mutex);
1476 KMP_CHECK_SYSFAIL(
"pthread_mutex_lock", status);
// Unlocks th's suspend mutex; the result is checked with KMP_CHECK_SYSFAIL.
1479 void __kmp_unlock_suspend_mx(kmp_info_t *th) {
1480 int status = pthread_mutex_unlock(&th->th.th_suspend_mx.m_mutex);
1481 KMP_CHECK_SYSFAIL(
"pthread_mutex_unlock", status);
// Puts thread th_gtid to sleep on its suspend condition variable until the
// sleep bit of `flag` is cleared.
//   th_gtid: index into __kmp_threads of the thread to suspend.
//   flag:    flag object whose sleep bit is set here and re-tested through
//            is_sleeping() around every wait.
// The thread's suspend mutex is taken near the top and released before
// returning.
1487 static inline void __kmp_suspend_template(
int th_gtid, C *flag) {
1488 KMP_TIME_DEVELOPER_PARTITIONED_BLOCK(USER_suspend);
1489 kmp_info_t *th = __kmp_threads[th_gtid];
1491 typename C::flag_t old_spin;
1493 KF_TRACE(30, (
"__kmp_suspend_template: T#%d enter for flag = %p\n", th_gtid,
1496 __kmp_suspend_initialize_thread(th);
1498 __kmp_lock_suspend_mx(th);
1500 KF_TRACE(10, (
"__kmp_suspend_template: T#%d setting sleep bit for spin(%p)\n",
1501 th_gtid, flag->get()));
// Set the sleep bit and record which flag (and flag type) this thread is
// about to sleep on.
1505 old_spin = flag->set_sleeping();
1506 TCW_PTR(th->th.th_sleep_loc, (
void *)flag);
1507 th->th.th_sleep_loc_type = flag->get_type();
// With the maximum blocktime configured and no soft pause in effect, the
// sleep state is rolled back and the mutex released.
1508 if (__kmp_dflt_blocktime == KMP_MAX_BLOCKTIME &&
1509 __kmp_pause_status != kmp_soft_paused) {
1510 flag->unset_sleeping();
1511 TCW_PTR(th->th.th_sleep_loc, NULL);
1512 th->th.th_sleep_loc_type = flag_unset;
1513 __kmp_unlock_suspend_mx(th);
1516 KF_TRACE(5, (
"__kmp_suspend_template: T#%d set sleep bit for spin(%p)==%x,"
1518 th_gtid, flag->get(), flag->load(), old_spin));
// The flag may already be satisfied (checked against both the value seen
// before setting the sleep bit and the current value); if so undo the sleep
// state instead of waiting.
1520 if (flag->done_check_val(old_spin) || flag->done_check()) {
1521 flag->unset_sleeping();
1522 TCW_PTR(th->th.th_sleep_loc, NULL);
1523 th->th.th_sleep_loc_type = flag_unset;
1524 KF_TRACE(5, (
"__kmp_suspend_template: T#%d false alarm, reset sleep bit "
1526 th_gtid, flag->get()));
1531 int deactivated = FALSE;
// Wait in a loop: the condition wait is repeated for as long as the sleep
// bit is still set.
1533 while (flag->is_sleeping()) {
1534 #ifdef DEBUG_SUSPEND
1536 __kmp_suspend_count++;
1537 __kmp_print_cond(buffer, &th->th.th_suspend_cv);
1538 __kmp_printf(
"__kmp_suspend_template: suspending T#%d: %s\n", th_gtid,
// Mark the thread inactive and, if it was counted as active in the pool,
// remove it from __kmp_thread_pool_active_nth.
1544 th->th.th_active = FALSE;
1545 if (th->th.th_active_in_pool) {
1546 th->th.th_active_in_pool = FALSE;
1547 KMP_ATOMIC_DEC(&__kmp_thread_pool_active_nth);
1548 KMP_DEBUG_ASSERT(TCR_4(__kmp_thread_pool_active_nth) >= 0);
1553 KMP_DEBUG_ASSERT(th->th.th_sleep_loc);
1554 KMP_DEBUG_ASSERT(flag->get_type() == th->th.th_sleep_loc_type);
1556 #if USE_SUSPEND_TIMEOUT
1557 struct timespec now;
1558 struct timeval tval;
1561 status = gettimeofday(&tval, NULL);
1562 KMP_CHECK_SYSFAIL_ERRNO(
"gettimeofday", status);
1563 TIMEVAL_TO_TIMESPEC(&tval, &now);
// Absolute deadline = current time + msecs. The sub-second remainder is in
// milliseconds, so it is scaled by 1,000,000 to obtain nanoseconds.
1565 msecs = (4 * __kmp_dflt_blocktime) + 200;
1566 now.tv_sec += msecs / 1000;
1567 now.tv_nsec += (msecs % 1000) * 1000000;
// Carry into tv_sec: pthread_cond_timedwait rejects an abstime whose tv_nsec
// is not below one billion.
if (now.tv_nsec >= 1000000000L) {
now.tv_sec += 1;
now.tv_nsec -= 1000000000L;
}
1569 KF_TRACE(15, (
"__kmp_suspend_template: T#%d about to perform "
1570 "pthread_cond_timedwait\n",
1572 status = pthread_cond_timedwait(&th->th.th_suspend_cv.c_cond,
1573 &th->th.th_suspend_mx.m_mutex, &now);
1575 KF_TRACE(15, (
"__kmp_suspend_template: T#%d about to perform"
1576 " pthread_cond_wait\n",
1578 status = pthread_cond_wait(&th->th.th_suspend_cv.c_cond,
1579 &th->th.th_suspend_mx.m_mutex);
// EINTR and ETIMEDOUT are expected outcomes of the wait; anything else that
// is non-zero is fatal.
1582 if ((status != 0) && (status != EINTR) && (status != ETIMEDOUT)) {
1583 KMP_SYSFAIL(
"pthread_cond_wait", status);
1586 KMP_DEBUG_ASSERT(flag->get_type() == flag->get_ptr_type());
1588 if (!flag->is_sleeping() &&
1589 ((status == EINTR) || (status == ETIMEDOUT))) {
1593 flag->unset_sleeping();
1594 TCW_PTR(th->th.th_sleep_loc, NULL);
1595 th->th.th_sleep_loc_type = flag_unset;
1598 if (status == ETIMEDOUT) {
1599 if (flag->is_sleeping()) {
1601 (
"__kmp_suspend_template: T#%d timeout wakeup\n", th_gtid));
1603 KF_TRACE(2, (
"__kmp_suspend_template: T#%d timeout wakeup, sleep bit "
1606 TCW_PTR(th->th.th_sleep_loc, NULL);
1607 th->th.th_sleep_loc_type = flag_unset;
1609 }
else if (flag->is_sleeping()) {
1611 (
"__kmp_suspend_template: T#%d spurious wakeup\n", th_gtid));
// Mark the thread active again and, when it is in the pool, count it back
// into __kmp_thread_pool_active_nth.
1618 th->th.th_active = TRUE;
1619 if (TCR_4(th->th.th_in_pool)) {
1620 KMP_ATOMIC_INC(&__kmp_thread_pool_active_nth);
1621 th->th.th_active_in_pool = TRUE;
1627 TCW_PTR(th->th.th_sleep_loc, NULL);
1628 th->th.th_sleep_loc_type = flag_unset;
1630 KMP_DEBUG_ASSERT(!flag->is_sleeping());
1631 KMP_DEBUG_ASSERT(!th->th.th_sleep_loc);
1632 #ifdef DEBUG_SUSPEND
1635 __kmp_print_cond(buffer, &th->th.th_suspend_cv);
1636 __kmp_printf(
"__kmp_suspend_template: T#%d has awakened: %s\n", th_gtid,
1641 __kmp_unlock_suspend_mx(th);
1642 KF_TRACE(30, (
"__kmp_suspend_template: T#%d exit\n", th_gtid));
1645 template <
bool C,
bool S>
1646 void __kmp_suspend_32(
int th_gtid, kmp_flag_32<C, S> *flag) {
1647 __kmp_suspend_template(th_gtid, flag);
1649 template <
bool C,
bool S>
1650 void __kmp_suspend_64(
int th_gtid, kmp_flag_64<C, S> *flag) {
1651 __kmp_suspend_template(th_gtid, flag);
1653 template <
bool C,
bool S>
1654 void __kmp_atomic_suspend_64(
int th_gtid, kmp_atomic_flag_64<C, S> *flag) {
1655 __kmp_suspend_template(th_gtid, flag);
1657 void __kmp_suspend_oncore(
int th_gtid, kmp_flag_oncore *flag) {
1658 __kmp_suspend_template(th_gtid, flag);
// Explicit instantiations of the suspend entry points for the flag
// parameter combinations listed below.
1661 template void __kmp_suspend_32<false, false>(
int, kmp_flag_32<false, false> *);
1662 template void __kmp_suspend_64<false, true>(
int, kmp_flag_64<false, true> *);
1663 template void __kmp_suspend_64<true, false>(
int, kmp_flag_64<true, false> *);
1665 __kmp_atomic_suspend_64<false, true>(
int, kmp_atomic_flag_64<false, true> *);
1667 __kmp_atomic_suspend_64<true, false>(
int, kmp_atomic_flag_64<true, false> *);
// Wakes thread target_gtid if it is sleeping on a flag: clears the sleep
// bit, resets th_sleep_loc / th_sleep_loc_type and signals the thread's
// suspend condition variable, all while holding its suspend mutex.
//   target_gtid: index into __kmp_threads of the thread to wake.
//   flag:        flag the caller expects the target to sleep on; when it is
//                NULL or differs from th_sleep_loc, th_sleep_loc is used.
1673 static inline void __kmp_resume_template(
int target_gtid, C *flag) {
1674 KMP_TIME_DEVELOPER_PARTITIONED_BLOCK(USER_resume);
1675 kmp_info_t *th = __kmp_threads[target_gtid];
// Result of __kmp_get_gtid(), or -1 when __kmp_init_gtid is not set; a thread
// is not expected to resume itself (asserted below).
1679 int gtid = TCR_4(__kmp_init_gtid) ? __kmp_get_gtid() : -1;
1682 KF_TRACE(30, (
"__kmp_resume_template: T#%d wants to wakeup T#%d enter\n",
1683 gtid, target_gtid));
1684 KMP_DEBUG_ASSERT(gtid != target_gtid);
1686 __kmp_suspend_initialize_thread(th);
1688 __kmp_lock_suspend_mx(th);
// Prefer the sleep location the target recorded over the caller's argument.
1690 if (!flag || flag != th->th.th_sleep_loc) {
1693 flag = (C *)CCAST(
void *, th->th.th_sleep_loc);
1699 KF_TRACE(5, (
"__kmp_resume_template: T#%d exiting, thread T#%d already "
1700 "awake: flag(%p)\n",
1701 gtid, target_gtid, (
void *)NULL));
1702 __kmp_unlock_suspend_mx(th);
// Flag type does not match the recorded sleep-location type: drop the mutex
// and hand off to __kmp_null_resume_wrapper.
1704 }
else if (flag->get_type() != th->th.th_sleep_loc_type) {
1709 (
"__kmp_resume_template: T#%d retrying, thread T#%d Mismatch flag(%p), "
1710 "spin(%p) type=%d ptr_type=%d\n",
1711 gtid, target_gtid, flag, flag->get(), flag->get_type(),
1712 th->th.th_sleep_loc_type));
1713 __kmp_unlock_suspend_mx(th);
1714 __kmp_null_resume_wrapper(th);
// Sleep bit not set: the target is already awake, nothing to signal.
1718 if (!flag->is_sleeping()) {
1719 KF_TRACE(5, (
"__kmp_resume_template: T#%d exiting, thread T#%d already "
1720 "awake: flag(%p): %u\n",
1721 gtid, target_gtid, flag->get(), (
unsigned int)flag->load()));
1722 __kmp_unlock_suspend_mx(th);
// Clear the sleep state before signalling the condition variable.
1726 KMP_DEBUG_ASSERT(flag);
1727 flag->unset_sleeping();
1728 TCW_PTR(th->th.th_sleep_loc, NULL);
1729 th->th.th_sleep_loc_type = flag_unset;
1731 KF_TRACE(5, (
"__kmp_resume_template: T#%d about to wakeup T#%d, reset "
1732 "sleep bit for flag's loc(%p): %u\n",
1733 gtid, target_gtid, flag->get(), (
unsigned int)flag->load()));
1735 #ifdef DEBUG_SUSPEND
1738 __kmp_print_cond(buffer, &th->th.th_suspend_cv);
1739 __kmp_printf(
"__kmp_resume_template: T#%d resuming T#%d: %s\n", gtid,
1740 target_gtid, buffer);
1743 status = pthread_cond_signal(&th->th.th_suspend_cv.c_cond);
1744 KMP_CHECK_SYSFAIL(
"pthread_cond_signal", status);
1745 __kmp_unlock_suspend_mx(th);
1746 KF_TRACE(30, (
"__kmp_resume_template: T#%d exiting after signaling wake up"
1748 gtid, target_gtid));
1751 template <
bool C,
bool S>
1752 void __kmp_resume_32(
int target_gtid, kmp_flag_32<C, S> *flag) {
1753 __kmp_resume_template(target_gtid, flag);
1755 template <
bool C,
bool S>
1756 void __kmp_resume_64(
int target_gtid, kmp_flag_64<C, S> *flag) {
1757 __kmp_resume_template(target_gtid, flag);
1759 template <
bool C,
bool S>
1760 void __kmp_atomic_resume_64(
int target_gtid, kmp_atomic_flag_64<C, S> *flag) {
1761 __kmp_resume_template(target_gtid, flag);
1763 void __kmp_resume_oncore(
int target_gtid, kmp_flag_oncore *flag) {
1764 __kmp_resume_template(target_gtid, flag);
// Explicit instantiations of the resume entry points for the flag
// parameter combinations listed below.
1767 template void __kmp_resume_32<false, true>(
int, kmp_flag_32<false, true> *);
1768 template void __kmp_resume_32<false, false>(
int, kmp_flag_32<false, false> *);
1769 template void __kmp_resume_64<false, true>(
int, kmp_flag_64<false, true> *);
1771 __kmp_atomic_resume_64<false, true>(
int, kmp_atomic_flag_64<false, true> *);
// Signals the condition variable __kmp_wait_cv while holding __kmp_wait_mx.
// The trace messages describe this as waking thread KMP_GTID_MONITOR.
1774 void __kmp_resume_monitor() {
1775 KMP_TIME_DEVELOPER_PARTITIONED_BLOCK(USER_resume);
// Result of __kmp_get_gtid(), or -1 when __kmp_init_gtid is not set; it must
// not be the monitor's own gtid (asserted below).
1778 int gtid = TCR_4(__kmp_init_gtid) ? __kmp_get_gtid() : -1;
1779 KF_TRACE(30, (
"__kmp_resume_monitor: T#%d wants to wakeup T#%d enter\n", gtid,
1781 KMP_DEBUG_ASSERT(gtid != KMP_GTID_MONITOR);
// Lock, signal, unlock; each pthread call is checked with KMP_CHECK_SYSFAIL.
1783 status = pthread_mutex_lock(&__kmp_wait_mx.m_mutex);
1784 KMP_CHECK_SYSFAIL(
"pthread_mutex_lock", status);
1785 #ifdef DEBUG_SUSPEND
1788 __kmp_print_cond(buffer, &__kmp_wait_cv.c_cond);
1789 __kmp_printf(
"__kmp_resume_monitor: T#%d resuming T#%d: %s\n", gtid,
1790 KMP_GTID_MONITOR, buffer);
1793 status = pthread_cond_signal(&__kmp_wait_cv.c_cond);
1794 KMP_CHECK_SYSFAIL(
"pthread_cond_signal", status);
1795 status = pthread_mutex_unlock(&__kmp_wait_mx.m_mutex);
1796 KMP_CHECK_SYSFAIL(
"pthread_mutex_unlock", status);
1797 KF_TRACE(30, (
"__kmp_resume_monitor: T#%d exiting after signaling wake up"
1799 gtid, KMP_GTID_MONITOR));
// Offers the processor to another runnable thread via sched_yield(); the
// call's return value is not examined.
void __kmp_yield() {
  (void)sched_yield();
}
// Stores gtid in the thread-specific slot __kmp_gtid_threadprivate_key when
// __kmp_init_gtid is set; otherwise only a trace message is emitted.
//   gtid: value to record; it is stored as gtid + 1.
// NOTE(review): the +1 offset presumably lets an empty (NULL) slot be told
// apart from gtid 0 -- confirm against __kmp_gtid_get_specific.
1805 void __kmp_gtid_set_specific(
int gtid) {
1806 if (__kmp_init_gtid) {
1808 status = pthread_setspecific(__kmp_gtid_threadprivate_key,
1809 (
void *)(intptr_t)(gtid + 1));
1810 KMP_CHECK_SYSFAIL(
"pthread_setspecific", status);
1812 KA_TRACE(50, (
"__kmp_gtid_set_specific: runtime shutdown, returning\n"));
// Reads the value kept in the thread-specific slot
// __kmp_gtid_threadprivate_key. Returns KMP_GTID_SHUTDOWN when
// __kmp_init_gtid is not set.
1816 int __kmp_gtid_get_specific() {
1818 if (!__kmp_init_gtid) {
1819 KA_TRACE(50, (
"__kmp_gtid_get_specific: runtime shutdown, returning "
1820 "KMP_GTID_SHUTDOWN\n"));
1821 return KMP_GTID_SHUTDOWN;
// The slot's pointer value is narrowed through size_t to int.
// NOTE(review): KMP_GTID_DNE is presumably used when the slot is empty, and
// other values are presumably adjusted for the +1 applied on store -- confirm.
1823 gtid = (int)(
size_t)pthread_getspecific(__kmp_gtid_threadprivate_key);
1825 gtid = KMP_GTID_DNE;
1829 KA_TRACE(50, (
"__kmp_gtid_get_specific: key:%d gtid:%d\n",
1830 __kmp_gtid_threadprivate_key, gtid));
// Returns (buffer.tms_utime + buffer.tms_cutime) divided by CLOCKS_PER_SEC,
// as a double.
// NOTE(review): if buffer is filled by times(), its fields are counted in
// sysconf(_SC_CLK_TCK) ticks rather than CLOCKS_PER_SEC units -- confirm the
// divisor.
1834 double __kmp_read_cpu_time(
void) {
1840 return (
double)(buffer.tms_utime + buffer.tms_cutime) /
1841 (
double)CLOCKS_PER_SEC;
// Fills *info with resource-usage counters of the current process.
//   info: output structure; it is zeroed first, then selected fields are
//         copied from getrusage(RUSAGE_SELF).
// Returns 1 when getrusage() reported a non-zero status, 0 otherwise.
1844 int __kmp_read_system_info(
struct kmp_sys_info *info) {
1846 struct rusage r_usage;
1848 memset(info, 0,
sizeof(*info));
1850 status = getrusage(RUSAGE_SELF, &r_usage);
1851 KMP_CHECK_SYSFAIL_ERRNO(
"getrusage", status);
// Field-by-field copy from struct rusage.
1855 info->maxrss = r_usage.ru_maxrss;
1857 info->minflt = r_usage.ru_minflt;
1859 info->majflt = r_usage.ru_majflt;
1861 info->nswap = r_usage.ru_nswap;
1863 info->inblock = r_usage.ru_inblock;
1865 info->oublock = r_usage.ru_oublock;
1867 info->nvcsw = r_usage.ru_nvcsw;
1869 info->nivcsw = r_usage.ru_nivcsw;
1872 return (status != 0);
// Writes to *delta the time, in seconds, between the reading stored in
// __kmp_sys_timer_data.start and the current gettimeofday() reading.
1875 void __kmp_read_system_time(
double *delta) {
1877 struct timeval tval;
1878 struct timespec stop;
1881 status = gettimeofday(&tval, NULL);
1882 KMP_CHECK_SYSFAIL_ERRNO(
"gettimeofday", status);
// Difference is taken in nanoseconds (TS2NS) and then scaled to seconds.
1883 TIMEVAL_TO_TIMESPEC(&tval, &stop);
1884 t_ns = (double)(TS2NS(stop) - TS2NS(__kmp_sys_timer_data.start));
1885 *delta = (t_ns * 1e-9);
// Stores the current gettimeofday() reading, converted to a timespec, in
// __kmp_sys_timer_data.start.
1888 void __kmp_clear_system_time(
void) {
1889 struct timeval tval;
1891 status = gettimeofday(&tval, NULL);
1892 KMP_CHECK_SYSFAIL_ERRNO(
"gettimeofday", status);
1893 TIMEVAL_TO_TIMESPEC(&tval, &__kmp_sys_timer_data.start);
// Returns the processor count obtained through a platform-specific query:
// sysconf(_SC_NPROCESSORS_CONF), sysconf(_SC_NPROCESSORS_ONLN) or
// sysctlbyname("hw.logicalcpu"), depending on the preprocessor branch.
// When the query leaves r <= 0 the function returns 2 instead.
1896 static int __kmp_get_xproc(
void) {
1902 __kmp_type_convert(sysconf(_SC_NPROCESSORS_CONF), &(r));
1904 #elif KMP_OS_DRAGONFLY || KMP_OS_FREEBSD || KMP_OS_NETBSD || KMP_OS_OPENBSD || \
1905 KMP_OS_HURD || KMP_OS_SOLARIS || KMP_OS_WASI || KMP_OS_AIX
1907 __kmp_type_convert(sysconf(_SC_NPROCESSORS_ONLN), &(r));
1911 size_t len =
sizeof(r);
1912 sysctlbyname(
"hw.logicalcpu", &r, &len, NULL, 0);
1916 #error "Unknown or unsupported OS."
1920 return r > 0 ? r : 2;
// Opens `path` in "rb" mode and parses it with vfscanf.
//   path:   file to open.
//   format: scanf-style format; the variadic arguments receive the parsed
//           values.
// `result` receives vfscanf's return value.
1924 int __kmp_read_from_file(
char const *path,
char const *format, ...) {
1928 va_start(args, format);
1929 FILE *f = fopen(path,
"rb");
1934 result = vfscanf(f, format, args);
// Process-level setup for the runtime: queries CPU information and the
// processor count, derives stack-size and thread-count limits, creates the
// gtid thread-specific key and initializes __kmp_wait_mx / __kmp_wait_cv.
// __kmp_init_runtime is tested on entry and set to TRUE at the end.
1941 void __kmp_runtime_initialize(
void) {
1943 pthread_mutexattr_t mutex_attr;
1944 pthread_condattr_t cond_attr;
1946 if (__kmp_init_runtime) {
1950 #if (KMP_ARCH_X86 || KMP_ARCH_X86_64)
1951 if (!__kmp_cpuinfo.initialized) {
1952 __kmp_query_cpuid(&__kmp_cpuinfo);
1956 __kmp_xproc = __kmp_get_xproc();
1958 #if !KMP_32_BIT_ARCH
// __kmp_stksize is taken from the RLIMIT_STACK soft limit (rlim_cur) and then
// passed through __kmp_check_stksize.
1962 status = getrlimit(RLIMIT_STACK, &rlim);
1964 __kmp_stksize = rlim.rlim_cur;
1965 __kmp_check_stksize(&__kmp_stksize);
1969 if (sysconf(_SC_THREADS)) {
// Thread-count limit from _SC_THREAD_THREADS_MAX: -1 maps to KMP_MAX_NTH or
// INT_MAX depending on the branch; values <= 1 fall back to KMP_MAX_NTH.
1972 __kmp_type_convert(sysconf(_SC_THREAD_THREADS_MAX), &(__kmp_sys_max_nth));
1974 if (__kmp_sys_max_nth == -1) {
1977 __kmp_sys_max_nth = KMP_MAX_NTH;
1980 if (__kmp_sys_max_nth == -1) {
1982 __kmp_sys_max_nth = INT_MAX;
1983 }
else if (__kmp_sys_max_nth <= 1) {
1985 __kmp_sys_max_nth = KMP_MAX_NTH;
// Minimum stack size from _SC_THREAD_STACK_MIN, with KMP_MIN_STKSIZE as the
// fallback when the reported value is <= 1.
1990 __kmp_sys_min_stksize = sysconf(_SC_THREAD_STACK_MIN);
1991 if (__kmp_sys_min_stksize <= 1) {
1992 __kmp_sys_min_stksize = KMP_MIN_STKSIZE;
1997 __kmp_tls_gtid_min = KMP_TLS_GTID_MIN;
// The key is created with __kmp_internal_end_dest as its destructor.
1999 status = pthread_key_create(&__kmp_gtid_threadprivate_key,
2000 __kmp_internal_end_dest);
2001 KMP_CHECK_SYSFAIL(
"pthread_key_create", status);
// The attribute objects are only needed while the mutex and condition
// variable are created; each is destroyed right afterwards.
2002 status = pthread_mutexattr_init(&mutex_attr);
2003 KMP_CHECK_SYSFAIL(
"pthread_mutexattr_init", status);
2004 status = pthread_mutex_init(&__kmp_wait_mx.m_mutex, &mutex_attr);
2005 KMP_CHECK_SYSFAIL(
"pthread_mutex_init", status);
2006 status = pthread_mutexattr_destroy(&mutex_attr);
2007 KMP_CHECK_SYSFAIL(
"pthread_mutexattr_destroy", status);
2008 status = pthread_condattr_init(&cond_attr);
2009 KMP_CHECK_SYSFAIL(
"pthread_condattr_init", status);
2010 status = pthread_cond_init(&__kmp_wait_cv.c_cond, &cond_attr);
2011 KMP_CHECK_SYSFAIL(
"pthread_cond_init", status);
2012 status = pthread_condattr_destroy(&cond_attr);
2013 KMP_CHECK_SYSFAIL(
"pthread_condattr_destroy", status);
2015 __kmp_itt_initialize();
2018 __kmp_init_runtime = TRUE;
// Reverses __kmp_runtime_initialize: deletes the gtid thread-specific key,
// destroys __kmp_wait_mx and __kmp_wait_cv, uninitializes affinity where
// supported, and clears __kmp_init_runtime. __kmp_init_runtime is tested on
// entry.
2021 void __kmp_runtime_destroy(
void) {
2024 if (!__kmp_init_runtime) {
2029 __kmp_itt_destroy();
2032 status = pthread_key_delete(__kmp_gtid_threadprivate_key);
2033 KMP_CHECK_SYSFAIL(
"pthread_key_delete", status);
// EBUSY from either destroy call is tolerated; any other non-zero status is
// reported through KMP_SYSFAIL.
2035 status = pthread_mutex_destroy(&__kmp_wait_mx.m_mutex);
2036 if (status != 0 && status != EBUSY) {
2037 KMP_SYSFAIL(
"pthread_mutex_destroy", status);
2039 status = pthread_cond_destroy(&__kmp_wait_cv.c_cond);
2040 if (status != 0 && status != EBUSY) {
2041 KMP_SYSFAIL(
"pthread_cond_destroy", status);
2043 #if KMP_AFFINITY_SUPPORTED
2044 __kmp_affinity_uninitialize();
2047 __kmp_init_runtime = FALSE;
// Sleeps for `millis` milliseconds rounded to the nearest whole second,
// because sleep() only has one-second resolution. For non-negative input
// below 500 ms the computed duration is 0 seconds.
void __kmp_thread_sleep(int millis) {
  int whole_seconds = (millis + 500) / 1000;
  sleep(whole_seconds);
}
// Produces a time reading in seconds as a double, computed as whole seconds
// plus the fractional part. With FIX_SGI_CLOCK the source is
// clock_gettime(CLOCK_PROCESS_CPUTIME_ID); otherwise it is gettimeofday().
//   t: output location (the assignment target is outside the lines shown).
2055 void __kmp_elapsed(
double *t) {
2057 #ifdef FIX_SGI_CLOCK
2060 status = clock_gettime(CLOCK_PROCESS_CPUTIME_ID, &ts);
2061 KMP_CHECK_SYSFAIL_ERRNO(
"clock_gettime", status);
2063 (double)ts.tv_nsec * (1.0 / (
double)KMP_NSEC_PER_SEC) + (
double)ts.tv_sec;
2067 status = gettimeofday(&tv, NULL);
2068 KMP_CHECK_SYSFAIL_ERRNO(
"gettimeofday", status);
2070 (double)tv.tv_usec * (1.0 / (
double)KMP_USEC_PER_SEC) + (
double)tv.tv_sec;
// Reports the length of one clock tick in seconds.
//   t: output; receives 1 / CLOCKS_PER_SEC as a double.
void __kmp_elapsed_tick(double *t) {
  const double ticks_per_second = (double)CLOCKS_PER_SEC;
  *t = 1 / ticks_per_second;
}
// Computes a nanosecond count from gettimeofday(): seconds scaled by
// KMP_NSEC_PER_SEC plus microseconds scaled by 1000. The return value of
// gettimeofday() is not checked here.
2078 kmp_uint64 __kmp_now_nsec() {
2080 gettimeofday(&t, NULL);
2081 kmp_uint64 nsec = (kmp_uint64)KMP_NSEC_PER_SEC * (kmp_uint64)t.tv_sec +
2082 (kmp_uint64)1000 * (kmp_uint64)t.tv_usec;
2086 #if KMP_ARCH_X86 || KMP_ARCH_X86_64
// Calibrates __kmp_ticks_per_msec and __kmp_ticks_per_usec: the hardware
// timestamp is polled until it has advanced by at least `delay` ticks, the
// wall-clock nanoseconds spent doing so are measured with __kmp_now_nsec(),
// and the ratio gives ticks per microsecond.
2088 void __kmp_initialize_system_tick() {
2089 kmp_uint64 now, nsec2, diff;
2090 kmp_uint64 delay = 1000000;
2091 kmp_uint64 nsec = __kmp_now_nsec();
2092 kmp_uint64 goal = __kmp_hardware_timestamp() + delay;
2093 while ((now = __kmp_hardware_timestamp()) < goal)
2095 nsec2 = __kmp_now_nsec();
2096 diff = nsec2 - nsec;
// delay + (now - goal) is the number of ticks actually elapsed; diff is in
// nanoseconds, hence the factor 1000 to express the result per microsecond.
2098 double tpus = 1000.0 * (double)(delay + (now - goal)) / (
double)diff;
2100 __kmp_ticks_per_msec = (kmp_uint64)(tpus * 1000.0);
2101 __kmp_ticks_per_usec = (kmp_uint64)tpus;
// Determines whether `addr` lies inside a mapped region of the current
// process, using a different mechanism per operating system. Several branches
// additionally require the region to be both readable and writable.
//   addr: address to look up.
2110 int __kmp_is_address_mapped(
void *addr) {
// Linux / Hurd: scan the text of /proc/<pid>/maps line by line.
2115 #if KMP_OS_LINUX || KMP_OS_HURD
2120 char *name = __kmp_str_format(
"/proc/%d/maps", getpid());
2123 file = fopen(name,
"r");
2124 KMP_ASSERT(file != NULL);
2128 void *beginning = NULL;
2129 void *ending = NULL;
2132 rc = fscanf(file,
"%p-%p %4s %*[^\n]\n", &beginning, &ending, perms);
2136 KMP_ASSERT(rc == 3 &&
2137 KMP_STRLEN(perms) == 4);
2140 if ((addr >= beginning) && (addr < ending)) {
// perms always holds four characters (asserted above), so only its first two
// are compared against "rw"; a whole-string comparison could never match.
2142 if (strncmp(perms,
"rw", 2) == 0) {
2152 KMP_INTERNAL_FREE(name);
// FreeBSD: fetch the VM map through sysctl(KERN_PROC_VMMAP) and walk the
// variable-sized kinfo_vmentry records.
2153 #elif KMP_OS_FREEBSD
2156 int mib[] = {CTL_KERN, KERN_PROC, KERN_PROC_VMMAP, getpid()};
2157 rc = sysctl(mib, 4, NULL, &lstsz, NULL, 0);
// The size reported by the first call is enlarged by a third before the
// buffer is allocated for the second call.
2162 lstsz = lstsz * 4 / 3;
2163 buf =
reinterpret_cast<char *
>(KMP_INTERNAL_MALLOC(lstsz));
2164 rc = sysctl(mib, 4, buf, &lstsz, NULL, 0);
2166 KMP_INTERNAL_FREE(buf);
2171 char *up = buf + lstsz;
2174 struct kinfo_vmentry *cur =
reinterpret_cast<struct kinfo_vmentry *
>(lw);
2175 size_t cursz = cur->kve_structsize;
2178 void *start =
reinterpret_cast<void *
>(cur->kve_start);
2179 void *end =
reinterpret_cast<void *
>(cur->kve_end);
2181 if ((addr >= start) && (addr < end)) {
2182 if ((cur->kve_protection & KVME_PROT_READ) != 0 &&
2183 (cur->kve_protection & KVME_PROT_WRITE) != 0) {
2190 KMP_INTERNAL_FREE(buf);
// DragonFly: read the process' vmspace through libkvm and iterate its map
// entries.
2191 #elif KMP_OS_DRAGONFLY
2192 char err[_POSIX2_LINE_MAX];
2196 vm_map_entry entry, *c;
2202 fd = kvm_openfiles(
nullptr,
nullptr,
nullptr, O_RDONLY, err);
2207 proc = kvm_getprocs(fd, KERN_PROC_PID, getpid(), &num);
2209 if (kvm_read(fd,
static_cast<uintptr_t
>(proc->kp_paddr), &p,
sizeof(p)) !=
2211 kvm_read(fd,
reinterpret_cast<uintptr_t
>(p.p_vmspace), &sp,
sizeof(sp)) !=
2219 uaddr =
reinterpret_cast<uintptr_t
>(addr);
2220 for (c = kvm_vm_map_entry_first(fd, cur, &entry); c;
2221 c = kvm_vm_map_entry_next(fd, c, &entry)) {
2222 if ((uaddr >= entry.ba.start) && (uaddr <= entry.ba.end)) {
2223 if ((entry.protection & VM_PROT_READ) != 0 &&
2224 (entry.protection & VM_PROT_WRITE) != 0) {
// Solaris: read the prmap_t array from /proc/<pid>/map.
2232 #elif KMP_OS_SOLARIS
2240 pid_t pid = getpid();
2241 struct ps_prochandle *fd = Pgrab(pid, PGRAB_RDONLY, &err);
2248 char *name = __kmp_str_format(
"/proc/%d/map", pid);
2249 size_t sz = (1 << 20);
2250 file = open(name, O_RDONLY);
2252 KMP_INTERNAL_FREE(name);
2256 buf = KMP_INTERNAL_MALLOC(sz);
2258 while (sz > 0 && (rd = pread(file, buf, sz, 0)) == sz) {
2261 newbuf = KMP_INTERNAL_REALLOC(buf, sz);
2265 map =
reinterpret_cast<prmap_t *
>(buf);
2266 uaddr =
reinterpret_cast<uintptr_t
>(addr);
// rd counts the bytes still to be examined, so it is decremented by one
// record per iteration. Each mapping covers [pr_vaddr, pr_vaddr + pr_size).
2268 for (cur = map; rd > 0; cur++, rd -=
sizeof(*map)) {
2269 if ((uaddr >= cur->pr_vaddr) && (uaddr < cur->pr_vaddr + cur->pr_size)) {
2270 if ((cur->pr_mflags & MA_READ) != 0 && (cur->pr_mflags & MA_WRITE) != 0) {
2277 KMP_INTERNAL_FREE(map);
2279 KMP_INTERNAL_FREE(name);
2287 rc = vm_read_overwrite(
2289 (vm_address_t)(addr),
2291 (vm_address_t)(&buffer),
2304 mib[2] = VM_PROC_MAP;
2306 mib[4] =
sizeof(
struct kinfo_vmentry);
2309 rc = sysctl(mib, __arraycount(mib), NULL, &size, NULL, 0);
2313 size = size * 4 / 3;
2314 struct kinfo_vmentry *kiv = (
struct kinfo_vmentry *)KMP_INTERNAL_MALLOC(size);
2317 rc = sysctl(mib, __arraycount(mib), kiv, &size, NULL, 0);
// size is a byte count, so it is divided by the record size to get the number
// of entries. addr is inside an entry when kve_start <= addr < kve_end.
2321 for (
size_t i = 0; i < size / sizeof(struct kinfo_vmentry); i++) {
2322 if (kiv[i].kve_start <= (uint64_t)addr &&
2323 (uint64_t)addr < kiv[i].kve_end) {
2328 KMP_INTERNAL_FREE(kiv);
2329 #elif KMP_OS_OPENBSD
2333 mib[1] = KERN_PROC_VMMAP;
2338 rc = sysctl(mib, 3, NULL, &size, NULL, 0);
2343 struct kinfo_vmentry kiv = {.kve_start = 0};
2345 while ((rc = sysctl(mib, 3, &kiv, &size, NULL, 0)) == 0) {
2347 if (kiv.kve_end == end)
// addr is inside the entry when kve_start <= addr < kve_end.
2350 if (kiv.kve_start <= (uint64_t)addr && (uint64_t)addr < kiv.kve_end) {
2357 found = (int)addr < (__builtin_wasm_memory_size(0) * PAGESIZE);
// loadquery() branch: the buffer starts at 4096 bytes and is doubled each
// time the call fails with ENOMEM.
2360 uint32_t loadQueryBufSize = 4096u;
2364 loadQueryBuf = (
char *)KMP_INTERNAL_MALLOC(loadQueryBufSize);
2365 if (loadQueryBuf == NULL) {
2369 rc = loadquery(L_GETXINFO | L_IGNOREUNLOAD, loadQueryBuf, loadQueryBufSize);
2371 KMP_INTERNAL_FREE(loadQueryBuf);
2372 if (errno != ENOMEM) {
2376 loadQueryBufSize <<= 1;
// Walk the chain of ld_xinfo records; ldinfo_next is a byte offset to the
// next record and 0 terminates the chain.
2383 struct ld_xinfo *curLdInfo = (
struct ld_xinfo *)loadQueryBuf;
2387 uintptr_t curDataStart = (uintptr_t)curLdInfo->ldinfo_dataorg;
2388 uintptr_t curDataEnd = curDataStart + curLdInfo->ldinfo_datasize;
2391 if (curDataStart <= (uintptr_t)addr && (uintptr_t)addr < curDataEnd) {
2395 if (curLdInfo->ldinfo_next == 0u) {
2399 curLdInfo = (
struct ld_xinfo *)((
char *)curLdInfo + curLdInfo->ldinfo_next);
2401 KMP_INTERNAL_FREE(loadQueryBuf);
2405 #error "Unknown or unsupported OS"
2413 #ifdef USE_LOAD_BALANCE
2415 #if KMP_OS_DARWIN || KMP_OS_DRAGONFLY || KMP_OS_FREEBSD || KMP_OS_NETBSD || \
2416 KMP_OS_OPENBSD || KMP_OS_SOLARIS
// getloadavg()-based variant: picks one of the system load averages
// according to __kmp_load_balance_interval.
//   max: not referenced on the lines shown.
2423 int __kmp_get_load_balance(
int max) {
// res is the number of samples getloadavg() actually returned; a slot is only
// used when that many samples are available.
2427 int res = getloadavg(averages, 3);
// interval < 180 uses averages[0]; 180 <= interval < 600 uses averages[1];
// interval >= 600 uses averages[2].
2432 if (__kmp_load_balance_interval < 180 && (res >= 1)) {
2433 ret_avg = (int)averages[0];
2434 }
else if ((__kmp_load_balance_interval >= 180 &&
2435 __kmp_load_balance_interval < 600) &&
2437 ret_avg = (int)averages[1];
2438 }
else if ((__kmp_load_balance_interval >= 600) && (res == 3)) {
2439 ret_avg = (int)averages[2];
// perfstat-based variant: sums the run-queue length (runque) reported for
// each logical CPU.
//   max: summation stops being extended once the running total reaches max.
// The previous result is cached in glb_running_threads and returned as-is
// when less than __kmp_load_balance_interval has elapsed (per __kmp_elapsed)
// since the last measurement.
2451 int __kmp_get_load_balance(
int max) {
2453 static int glb_running_threads = 0;
2455 static double glb_call_time = 0;
2456 int running_threads = 0;
2458 double call_time = 0.0;
2460 __kmp_elapsed(&call_time);
2462 if (glb_call_time &&
2463 (call_time - glb_call_time < __kmp_load_balance_interval))
2464 return glb_running_threads;
2466 glb_call_time = call_time;
// First perfstat_cpu call (NULL buffers) yields the number of logical CPUs.
2473 int logical_cpus = perfstat_cpu(NULL, NULL,
sizeof(perfstat_cpu_t), 0);
2474 if (logical_cpus <= 0) {
2479 perfstat_cpu_t *cpu_stat = (perfstat_cpu_t *)KMP_INTERNAL_MALLOC(
2480 logical_cpus *
sizeof(perfstat_cpu_t));
2481 if (cpu_stat == NULL) {
// Second call fills cpu_stat starting from FIRST_CPU.
2488 perfstat_id_t first_cpu_name;
2489 strcpy(first_cpu_name.name, FIRST_CPU);
2492 int rc = perfstat_cpu(&first_cpu_name, cpu_stat,
sizeof(perfstat_cpu_t),
2494 KMP_DEBUG_ASSERT(rc == logical_cpus);
2496 KMP_INTERNAL_FREE(cpu_stat);
2500 for (
int i = 0; i < logical_cpus; ++i) {
2501 running_threads += cpu_stat[i].runque;
2502 if (running_threads >= max)
// A non-positive total is replaced by 1.
2509 KMP_DEBUG_ASSERT(running_threads > 0);
2510 if (running_threads <= 0)
2511 running_threads = 1;
2513 KMP_INTERNAL_FREE(cpu_stat);
2515 glb_running_threads = running_threads;
2517 return running_threads;
// /proc-based variant: walks /proc/<pid>/task/<tid>/stat for every numeric
// process directory and inspects each thread's state character.
//   max: compared against the running count while scanning.
// The previous result is cached in glb_running_threads and reused when less
// than __kmp_load_balance_interval has elapsed (per __kmp_elapsed) since the
// last scan. Once permanent_error is set, running_threads is -1.
2526 int __kmp_get_load_balance(
int max) {
2527 static int permanent_error = 0;
2528 static int glb_running_threads = 0;
2530 static double glb_call_time = 0;
2532 int running_threads = 0;
2534 DIR *proc_dir = NULL;
2535 struct dirent *proc_entry = NULL;
2537 kmp_str_buf_t task_path;
2538 DIR *task_dir = NULL;
2539 struct dirent *task_entry = NULL;
2540 int task_path_fixed_len;
2542 kmp_str_buf_t stat_path;
2544 int stat_path_fixed_len;
2547 int total_processes = 0;
2550 double call_time = 0.0;
2552 __kmp_str_buf_init(&task_path);
2553 __kmp_str_buf_init(&stat_path);
2555 __kmp_elapsed(&call_time);
2557 if (glb_call_time &&
2558 (call_time - glb_call_time < __kmp_load_balance_interval)) {
2559 running_threads = glb_running_threads;
2563 glb_call_time = call_time;
2566 if (permanent_error) {
2567 running_threads = -1;
// Failure to open /proc is treated as permanent.
2576 proc_dir = opendir(
"/proc");
2577 if (proc_dir == NULL) {
2580 running_threads = -1;
2581 permanent_error = 1;
// task_path keeps the fixed "/proc/" prefix; its length is remembered so the
// per-process suffix can be overwritten on every iteration.
2586 __kmp_str_buf_cat(&task_path,
"/proc/", 6);
2587 task_path_fixed_len = task_path.used;
2589 proc_entry = readdir(proc_dir);
2590 while (proc_entry != NULL) {
// Only directories whose name starts with a digit are considered.
2593 if (proc_entry->d_type == DT_DIR && isdigit(proc_entry->d_name[0])) {
2603 KMP_DEBUG_ASSERT(total_processes != 1 ||
2604 strcmp(proc_entry->d_name,
"1") == 0);
2607 task_path.used = task_path_fixed_len;
2608 __kmp_str_buf_cat(&task_path, proc_entry->d_name,
2609 KMP_STRLEN(proc_entry->d_name));
2610 __kmp_str_buf_cat(&task_path,
"/task", 5);
2612 task_dir = opendir(task_path.str);
2613 if (task_dir == NULL) {
// Failing to open the task directory of process "1" is treated as permanent.
2622 if (strcmp(proc_entry->d_name,
"1") == 0) {
2623 running_threads = -1;
2624 permanent_error = 1;
2629 __kmp_str_buf_clear(&stat_path);
2630 __kmp_str_buf_cat(&stat_path, task_path.str, task_path.used);
2631 __kmp_str_buf_cat(&stat_path,
"/", 1);
2632 stat_path_fixed_len = stat_path.used;
2634 task_entry = readdir(task_dir);
2635 while (task_entry != NULL) {
// NOTE(review): the d_type test below reads proc_entry, while the name test
// reads task_entry; the outer branch already established
// proc_entry->d_type == DT_DIR, so this half is always true here. Probably
// meant task_entry->d_type -- confirm.
2637 if (proc_entry->d_type == DT_DIR && isdigit(task_entry->d_name[0])) {
2644 stat_path_fixed_len;
2645 __kmp_str_buf_cat(&stat_path, task_entry->d_name,
2646 KMP_STRLEN(task_entry->d_name));
2647 __kmp_str_buf_cat(&stat_path,
"/stat", 5);
2651 stat_file = open(stat_path.str, O_RDONLY);
2652 if (stat_file == -1) {
// One byte of the buffer is held back from read().
2682 len = read(stat_file, buffer,
sizeof(buffer) - 1);
// The state character is the one located two bytes past the first ") " found
// in the buffer.
2689 char *close_parent = strstr(buffer,
") ");
2690 if (close_parent != NULL) {
2691 char state = *(close_parent + 2);
2694 if (running_threads >= max) {
2704 task_entry = readdir(task_dir);
2710 proc_entry = readdir(proc_dir);
// A non-positive total is replaced by 1.
2716 KMP_DEBUG_ASSERT(running_threads > 0);
2717 if (running_threads <= 0) {
2718 running_threads = 1;
// Cleanup of directory handles, string buffers and the stat file descriptor.
2722 if (proc_dir != NULL) {
2725 __kmp_str_buf_free(&task_path);
2726 if (task_dir != NULL) {
2729 __kmp_str_buf_free(&stat_path);
2730 if (stat_file != -1) {
2734 glb_running_threads = running_threads;
2736 return running_threads;
// Compiled only when none of the architecture/OS combinations named in the
// guard below is selected. Declares one function-pointer type per supported
// argument count: microtask_tN takes two int pointers followed by N void
// pointers and returns void.
2744 #if !(KMP_ARCH_X86 || KMP_ARCH_X86_64 || KMP_MIC || \
2745 ((KMP_OS_LINUX || KMP_OS_DARWIN) && KMP_ARCH_AARCH64) || \
2746 KMP_ARCH_PPC64 || KMP_ARCH_RISCV64 || KMP_ARCH_LOONGARCH64 || \
2747 KMP_ARCH_ARM || KMP_ARCH_VE || KMP_ARCH_S390X || KMP_ARCH_PPC_XCOFF || \
2748 KMP_ARCH_AARCH64_32)
2754 typedef void (*microtask_t0)(
int *,
int *);
2755 typedef void (*microtask_t1)(
int *,
int *,
void *);
2756 typedef void (*microtask_t2)(
int *,
int *,
void *,
void *);
2757 typedef void (*microtask_t3)(
int *,
int *,
void *,
void *,
void *);
2758 typedef void (*microtask_t4)(
int *,
int *,
void *,
void *,
void *,
void *);
2759 typedef void (*microtask_t5)(
int *,
int *,
void *,
void *,
void *,
void *,
2761 typedef void (*microtask_t6)(
int *,
int *,
void *,
void *,
void *,
void *,
2763 typedef void (*microtask_t7)(
int *,
int *,
void *,
void *,
void *,
void *,
2764 void *,
void *,
void *);
2765 typedef void (*microtask_t8)(
int *,
int *,
void *,
void *,
void *,
void *,
2766 void *,
void *,
void *,
void *);
2767 typedef void (*microtask_t9)(
int *,
int *,
void *,
void *,
void *,
void *,
2768 void *,
void *,
void *,
void *,
void *);
2769 typedef void (*microtask_t10)(
int *,
int *,
void *,
void *,
void *,
void *,
2770 void *,
void *,
void *,
void *,
void *,
void *);
2771 typedef void (*microtask_t11)(
int *,
int *,
void *,
void *,
void *,
void *,
2772 void *,
void *,
void *,
void *,
void *,
void *,
2774 typedef void (*microtask_t12)(
int *,
int *,
void *,
void *,
void *,
void *,
2775 void *,
void *,
void *,
void *,
void *,
void *,
2777 typedef void (*microtask_t13)(
int *,
int *,
void *,
void *,
void *,
void *,
2778 void *,
void *,
void *,
void *,
void *,
void *,
2779 void *,
void *,
void *);
2780 typedef void (*microtask_t14)(
int *,
int *,
void *,
void *,
void *,
void *,
2781 void *,
void *,
void *,
void *,
void *,
void *,
2782 void *,
void *,
void *,
void *);
2783 typedef void (*microtask_t15)(
int *,
int *,
void *,
void *,
void *,
void *,
2784 void *,
void *,
void *,
void *,
void *,
void *,
2785 void *,
void *,
void *,
void *,
void *);
// Calls the microtask `pkfn`, passing the addresses of gtid and tid followed
// by the first `argc` entries of p_argv as individual arguments.
//   pkfn: microtask entry point; cast to the microtask_tN type matching argc.
//   gtid: global thread id, passed by address.
//   tid:  thread id, passed by address.
//   argc: number of p_argv entries to forward (0 through 15); a larger value
//         produces the "Too many args" message on stderr.
//   exit_frame_ptr: receives OMPT_GET_FRAME_ADDRESS(0).
2789 int __kmp_invoke_microtask(microtask_t pkfn,
int gtid,
int tid,
int argc,
2793 void **exit_frame_ptr
2797 *exit_frame_ptr = OMPT_GET_FRAME_ADDRESS(0);
2802 fprintf(stderr,
"Too many args to microtask: %d!\n", argc);
// One call per argument count; the first argument is always &gtid.
2806 (*(microtask_t0)pkfn)(&gtid, &tid);
2809 (*(microtask_t1)pkfn)(&gtid, &tid, p_argv[0]);
2812 (*(microtask_t2)pkfn)(&gtid, &tid, p_argv[0], p_argv[1]);
2815 (*(microtask_t3)pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2]);
2818 (*(microtask_t4)pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2],
2822 (*(microtask_t5)pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2],
2823 p_argv[3], p_argv[4]);
2826 (*(microtask_t6)pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2],
2827 p_argv[3], p_argv[4], p_argv[5]);
2830 (*(microtask_t7)pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2],
2831 p_argv[3], p_argv[4], p_argv[5], p_argv[6]);
2834 (*(microtask_t8)pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2],
2835 p_argv[3], p_argv[4], p_argv[5], p_argv[6],
2839 (*(microtask_t9)pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2],
2840 p_argv[3], p_argv[4], p_argv[5], p_argv[6], p_argv[7],
2844 (*(microtask_t10)pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2],
2845 p_argv[3], p_argv[4], p_argv[5], p_argv[6],
2846 p_argv[7], p_argv[8], p_argv[9]);
2849 (*(microtask_t11)pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2],
2850 p_argv[3], p_argv[4], p_argv[5], p_argv[6],
2851 p_argv[7], p_argv[8], p_argv[9], p_argv[10]);
2854 (*(microtask_t12)pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2],
2855 p_argv[3], p_argv[4], p_argv[5], p_argv[6],
2856 p_argv[7], p_argv[8], p_argv[9], p_argv[10],
2860 (*(microtask_t13)pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2],
2861 p_argv[3], p_argv[4], p_argv[5], p_argv[6],
2862 p_argv[7], p_argv[8], p_argv[9], p_argv[10],
2863 p_argv[11], p_argv[12]);
2866 (*(microtask_t14)pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2],
2867 p_argv[3], p_argv[4], p_argv[5], p_argv[6],
2868 p_argv[7], p_argv[8], p_argv[9], p_argv[10],
2869 p_argv[11], p_argv[12], p_argv[13]);
2872 (*(microtask_t15)pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2],
2873 p_argv[3], p_argv[4], p_argv[5], p_argv[6],
2874 p_argv[7], p_argv[8], p_argv[9], p_argv[10],
2875 p_argv[11], p_argv[12], p_argv[13], p_argv[14]);
// Synchronization state for the hidden helper threads. Each group is a
// condition variable, the mutex used with it, and the flag that records
// whether the corresponding release has happened.
// Group used by the "initz" wait/release pair.
2888 pthread_cond_t hidden_helper_threads_initz_cond_var;
2889 pthread_mutex_t hidden_helper_threads_initz_lock;
2890 volatile int hidden_helper_initz_signaled = FALSE;
// Group for "deinitz"; its users are outside the lines shown here.
2893 pthread_cond_t hidden_helper_threads_deinitz_cond_var;
2894 pthread_mutex_t hidden_helper_threads_deinitz_lock;
2895 volatile int hidden_helper_deinitz_signaled = FALSE;
// Group used by the main-thread wait/release pair.
2898 pthread_cond_t hidden_helper_main_thread_cond_var;
2899 pthread_mutex_t hidden_helper_main_thread_lock;
2900 volatile int hidden_helper_main_thread_signaled = FALSE;
// Semaphore that hidden helper worker threads block on via sem_wait().
2905 sem_t hidden_helper_task_sem;
2908 void __kmp_hidden_helper_worker_thread_wait() {
2909 int status = sem_wait(&hidden_helper_task_sem);
2910 KMP_CHECK_SYSFAIL(
"sem_wait", status);
// Initializes the hidden helper synchronization objects (three condition
// variables, three mutexes, one semaphore) with default attributes and then
// starts a thread that runs __kmp_hidden_helper_threads_initz_routine().
// Every call's status is passed to KMP_CHECK_SYSFAIL.
2913 void __kmp_do_initialize_hidden_helper_threads() {
2916 pthread_cond_init(&hidden_helper_threads_initz_cond_var,
nullptr);
2917 KMP_CHECK_SYSFAIL(
"pthread_cond_init", status);
2919 status = pthread_cond_init(&hidden_helper_threads_deinitz_cond_var,
nullptr);
2920 KMP_CHECK_SYSFAIL(
"pthread_cond_init", status);
2922 status = pthread_cond_init(&hidden_helper_main_thread_cond_var,
nullptr);
2923 KMP_CHECK_SYSFAIL(
"pthread_cond_init", status);
2925 status = pthread_mutex_init(&hidden_helper_threads_initz_lock,
nullptr);
2926 KMP_CHECK_SYSFAIL(
"pthread_mutex_init", status);
2928 status = pthread_mutex_init(&hidden_helper_threads_deinitz_lock,
nullptr);
2929 KMP_CHECK_SYSFAIL(
"pthread_mutex_init", status);
2931 status = pthread_mutex_init(&hidden_helper_main_thread_lock,
nullptr);
2932 KMP_CHECK_SYSFAIL(
"pthread_mutex_init", status);
// Semaphore starts at 0 and is not shared between processes (pshared == 0).
// NOTE(review): sem_init() reports failure as -1 with the cause in errno, so
// KMP_CHECK_SYSFAIL would be handed -1 rather than an error code; the
// _ERRNO variant of the macro looks more appropriate -- confirm.
2935 status = sem_init(&hidden_helper_task_sem, 0, 0);
2936 KMP_CHECK_SYSFAIL(
"sem_init", status);
2940 status = pthread_create(
2942 [](
void *) ->
void * {
2943 __kmp_hidden_helper_threads_initz_routine();
2947 KMP_CHECK_SYSFAIL(
"pthread_create", status);
2950 void __kmp_hidden_helper_threads_initz_wait() {
2953 int status = pthread_mutex_lock(&hidden_helper_threads_initz_lock);
2954 KMP_CHECK_SYSFAIL(
"pthread_mutex_lock", status);
2956 if (!TCR_4(hidden_helper_initz_signaled)) {
2957 status = pthread_cond_wait(&hidden_helper_threads_initz_cond_var,
2958 &hidden_helper_threads_initz_lock);
2959 KMP_CHECK_SYSFAIL(
"pthread_cond_wait", status);
2962 status = pthread_mutex_unlock(&hidden_helper_threads_initz_lock);
2963 KMP_CHECK_SYSFAIL(
"pthread_mutex_unlock", status);
2966 void __kmp_hidden_helper_initz_release() {
2968 int status = pthread_mutex_lock(&hidden_helper_threads_initz_lock);
2969 KMP_CHECK_SYSFAIL(
"pthread_mutex_lock", status);
2971 status = pthread_cond_signal(&hidden_helper_threads_initz_cond_var);
2972 KMP_CHECK_SYSFAIL(
"pthread_cond_wait", status);
2974 TCW_SYNC_4(hidden_helper_initz_signaled, TRUE);
2976 status = pthread_mutex_unlock(&hidden_helper_threads_initz_lock);
2977 KMP_CHECK_SYSFAIL(
"pthread_mutex_unlock", status);
2980 void __kmp_hidden_helper_main_thread_wait() {
2983 int status = pthread_mutex_lock(&hidden_helper_main_thread_lock);
2984 KMP_CHECK_SYSFAIL(
"pthread_mutex_lock", status);
2986 if (!TCR_4(hidden_helper_main_thread_signaled)) {
2987 status = pthread_cond_wait(&hidden_helper_main_thread_cond_var,
2988 &hidden_helper_main_thread_lock);
2989 KMP_CHECK_SYSFAIL(
"pthread_cond_wait", status);
2992 status = pthread_mutex_unlock(&hidden_helper_main_thread_lock);
2993 KMP_CHECK_SYSFAIL(
"pthread_mutex_unlock", status);
2996 void __kmp_hidden_helper_main_thread_release() {
2999 int status = pthread_mutex_lock(&hidden_helper_main_thread_lock);
3000 KMP_CHECK_SYSFAIL(
"pthread_mutex_lock", status);
3002 status = pthread_cond_signal(&hidden_helper_main_thread_cond_var);
3003 KMP_CHECK_SYSFAIL(
"pthread_cond_signal", status);
3006 TCW_SYNC_4(hidden_helper_main_thread_signaled, TRUE);
3008 status = pthread_mutex_unlock(&hidden_helper_main_thread_lock);
3009 KMP_CHECK_SYSFAIL(
"pthread_mutex_unlock", status);
3012 void __kmp_hidden_helper_worker_thread_signal() {
3013 int status = sem_post(&hidden_helper_task_sem);
3014 KMP_CHECK_SYSFAIL(
"sem_post", status);
3017 void __kmp_hidden_helper_threads_deinitz_wait() {
3020 int status = pthread_mutex_lock(&hidden_helper_threads_deinitz_lock);
3021 KMP_CHECK_SYSFAIL(
"pthread_mutex_lock", status);
3023 if (!TCR_4(hidden_helper_deinitz_signaled)) {
3024 status = pthread_cond_wait(&hidden_helper_threads_deinitz_cond_var,
3025 &hidden_helper_threads_deinitz_lock);
3026 KMP_CHECK_SYSFAIL(
"pthread_cond_wait", status);
3029 status = pthread_mutex_unlock(&hidden_helper_threads_deinitz_lock);
3030 KMP_CHECK_SYSFAIL(
"pthread_mutex_unlock", status);
3033 void __kmp_hidden_helper_threads_deinitz_release() {
3034 int status = pthread_mutex_lock(&hidden_helper_threads_deinitz_lock);
3035 KMP_CHECK_SYSFAIL(
"pthread_mutex_lock", status);
3037 status = pthread_cond_signal(&hidden_helper_threads_deinitz_cond_var);
3038 KMP_CHECK_SYSFAIL(
"pthread_cond_wait", status);
3040 TCW_SYNC_4(hidden_helper_deinitz_signaled, TRUE);
3042 status = pthread_mutex_unlock(&hidden_helper_threads_deinitz_lock);
3043 KMP_CHECK_SYSFAIL(
"pthread_mutex_unlock", status);
3046 void __kmp_hidden_helper_worker_thread_wait() {
3047 KMP_ASSERT(0 &&
"Hidden helper task is not supported on this OS");
3050 void __kmp_do_initialize_hidden_helper_threads() {
3051 KMP_ASSERT(0 &&
"Hidden helper task is not supported on this OS");
3054 void __kmp_hidden_helper_threads_initz_wait() {
3055 KMP_ASSERT(0 &&
"Hidden helper task is not supported on this OS");
3058 void __kmp_hidden_helper_initz_release() {
3059 KMP_ASSERT(0 &&
"Hidden helper task is not supported on this OS");
3062 void __kmp_hidden_helper_main_thread_wait() {
3063 KMP_ASSERT(0 &&
"Hidden helper task is not supported on this OS");
3066 void __kmp_hidden_helper_main_thread_release() {
3067 KMP_ASSERT(0 &&
"Hidden helper task is not supported on this OS");
3070 void __kmp_hidden_helper_worker_thread_signal() {
3071 KMP_ASSERT(0 &&
"Hidden helper task is not supported on this OS");
3074 void __kmp_hidden_helper_threads_deinitz_wait() {
3075 KMP_ASSERT(0 &&
"Hidden helper task is not supported on this OS");
3078 void __kmp_hidden_helper_threads_deinitz_release() {
3079 KMP_ASSERT(0 &&
"Hidden helper task is not supported on this OS");
// Probes for the /dev/shm directory by trying to open it with opendir().
// NOTE(review): the first branch condition, the branch bodies and the return
// statements are not visible here; presumably the result is true only when the
// directory could be opened -- confirm against the full definition.
3083 bool __kmp_detect_shm() {
3084 DIR *dir = opendir(
"/dev/shm");
3088 }
// Taken when errno equals ENOENT, i.e. the path does not exist.
else if (ENOENT == errno) {
// Probes for the /tmp directory by trying to open it with opendir().
// NOTE(review): the first branch condition, the branch bodies and the return
// statements are not visible here; presumably the result is true only when the
// directory could be opened -- confirm against the full definition.
3095 bool __kmp_detect_tmp() {
3096 DIR *dir = opendir(
"/tmp");
3100 }
// Taken when errno equals ENOENT, i.e. the path does not exist.
else if (ENOENT == errno) {
#define KMP_INIT_PARTITIONED_TIMERS(name)
Initializes the partitioned timers to begin with name.