14#include "kmp_affinity.h"
21#include "kmp_wait_release.h"
22#include "kmp_wrapper_getpid.h"
24#if !KMP_OS_DRAGONFLY && !KMP_OS_FREEBSD && !KMP_OS_NETBSD && !KMP_OS_OPENBSD
31#include <sys/resource.h>
34#include <libperfstat.h>
36#include <sys/syscall.h>
43#include <sys/sysinfo.h>
59#include <sys/sysctl.h>
60#elif KMP_OS_DRAGONFLY || KMP_OS_FREEBSD
62#include <sys/sysctl.h>
64#include <pthread_np.h>
68#elif KMP_OS_NETBSD || KMP_OS_OPENBSD
70#include <sys/sysctl.h>
75#include <pthread_np.h>
81#include <sys/loadavg.h>
// Member of a struct whose opening line is not visible here; presumably
// struct kmp_sys_timer, which is instantiated below -- confirm.
89 struct timespec start;
// TIMEVAL_TO_TIMESPEC is only defined here when the platform headers do not
// already provide it: it copies tv_sec and scales tv_usec by 1000 to get
// nanoseconds. TS2NS flattens a timespec into one nanosecond count.
92#ifndef TIMEVAL_TO_TIMESPEC
94#define TIMEVAL_TO_TIMESPEC(tv, ts) \
96 (ts)->tv_sec = (tv)->tv_sec; \
97 (ts)->tv_nsec = (tv)->tv_usec * 1000; \
102#define TS2NS(timespec) \
103 (((timespec).tv_sec * (long int)1e9) + (timespec).tv_nsec)
105static struct kmp_sys_timer __kmp_sys_timer_data;
107#if KMP_HANDLE_SIGNALS
108typedef void (*sig_func_t)(int);
// Per-signal dispositions captured by __kmp_install_one_handler and restored
// by __kmp_remove_one_handler.
109STATIC_EFI2_WORKAROUND
struct sigaction __kmp_sighldrs[NSIG];
// Set of signals for which the runtime currently has its own handler
// installed (maintained with sigaddset/sigdelset in the handler helpers).
110static sigset_t __kmp_sigset;
// Cleared again in __kmp_atfork_child.
113static int __kmp_init_runtime = FALSE;
// Compared against each thread's th_suspend_init_count to decide whether its
// suspend condvar/mutex are initialized for the current process.
115static int __kmp_fork_count = 0;
// Attribute objects initialized by __kmp_suspend_initialize and passed to
// pthread_cond_init / pthread_mutex_init for every thread.
117static pthread_condattr_t __kmp_suspend_cond_attr;
118static pthread_mutexattr_t __kmp_suspend_mutex_attr;
// Condition variable / mutex pair the monitor thread blocks on between ticks.
120static kmp_cond_align_t __kmp_wait_cv;
121static kmp_mutex_align_t __kmp_wait_mx;
// Initial tick-conversion factors (1,000,000 ticks per ms, 1,000 per us).
123kmp_uint64 __kmp_ticks_per_msec = 1000000;
124kmp_uint64 __kmp_ticks_per_usec = 1000;
// Debug helper: formats the internal lock status, spinlock and waiting
// descriptor of a condition variable into `buffer`.
//   buffer - destination; the size passed to KMP_SNPRINTF is hard-coded to
//            128, so the buffer is expected to be at least that large.
//   cond   - condition variable wrapper whose c_cond internals are printed.
// The field names (__c_lock, __c_waiting) are pthread-implementation
// internals, not part of the public pthread API.
127static void __kmp_print_cond(
char *buffer, kmp_cond_align_t *cond) {
128 KMP_SNPRINTF(buffer, 128,
"(cond (lock (%ld, %d)), (descr (%p)))",
129 cond->c_cond.__c_lock.__status, cond->c_cond.__c_lock.__spinlock,
130 cond->c_cond.__c_waiting);
134#if ((KMP_OS_LINUX || KMP_OS_FREEBSD || KMP_OS_NETBSD || KMP_OS_DRAGONFLY || \
136 KMP_AFFINITY_SUPPORTED)
// Builds an affinity mask with bit `which` set and applies it through
// __kmp_set_system_affinity(mask, TRUE).
//   which - index of the processor to set in the mask.
// Asserts that affinity is capable before doing anything.
140void __kmp_affinity_bind_thread(
int which) {
141 KMP_ASSERT2(KMP_AFFINITY_CAPABLE(),
142 "Illegal set affinity operation when not capable");
144 kmp_affin_mask_t *mask;
145 KMP_CPU_ALLOC_ON_STACK(mask);
// NOTE(review): no KMP_CPU_ZERO(mask) is visible before the bit is set --
// confirm the mask is cleared so that only `which` ends up in it.
147 KMP_CPU_SET(which, mask);
148 __kmp_set_system_affinity(mask, TRUE);
149 KMP_CPU_FREE_FROM_STACK(mask);
// Variant that sizes the affinity mask from the processor count (the trace
// text identifies it as the AIX bindprocessor path).
//   env_var - not referenced by any line visible in this variant.
// The mask size starts as __kmp_xproc / CHAR_BIT bytes, is adjusted when
// __kmp_xproc is not a multiple of CHAR_BIT (adjustment statement not visible
// here), and is then rounded up to a multiple of
// sizeof(__kmp_affin_mask_size) before affinity is enabled with it.
153void __kmp_affinity_determine_capable(
const char *env_var) {
156 size_t mask_size = __kmp_xproc / CHAR_BIT;
158 if (__kmp_xproc % CHAR_BIT)
// Round mask_size up to the next multiple of sizeof(__kmp_affin_mask_size).
162 if (mask_size %
sizeof(__kmp_affin_mask_size))
163 mask_size +=
sizeof(__kmp_affin_mask_size) -
164 mask_size %
sizeof(__kmp_affin_mask_size);
165 KMP_AFFINITY_ENABLE(mask_size);
167 (
"__kmp_affinity_determine_capable: "
168 "AIX OS affinity interface bindprocessor functional (mask size = "
169 "%" KMP_SIZE_T_SPEC
").\n",
170 __kmp_affin_mask_size));
// Probes the OS to decide whether thread affinity can be used and, if so,
// which mask size to use; the result is recorded with KMP_AFFINITY_ENABLE(size)
// or KMP_AFFINITY_DISABLE().
//   env_var - name of the controlling environment variable, used only in
//             warning messages.
// Two probing strategies are visible:
//   * a raw sched_getaffinity syscall, first with KMP_CPU_SET_TRY_SIZE and
//     then with sizes doubling from 1 up to KMP_CPU_SET_SIZE_LIMIT;
//   * pthread_getaffinity_np with KMP_CPU_SET_SIZE_LIMIT (BSD branch).
// If neither path enables affinity, it is disabled and AffCantGetMaskSize is
// warned about (subject to the verbose/warnings/type filter).
178void __kmp_affinity_determine_capable(
const char *env_var) {
// Upper bound on the probe buffer, chosen per OS.
182#define KMP_CPU_SET_SIZE_LIMIT (1024 * 1024)
183#define KMP_CPU_SET_TRY_SIZE CACHE_LINE
184#elif KMP_OS_FREEBSD || KMP_OS_DRAGONFLY
185#define KMP_CPU_SET_SIZE_LIMIT (sizeof(cpuset_t))
187#define KMP_CPU_SET_SIZE_LIMIT (256)
190 int verbose = __kmp_affinity.flags.verbose;
191 int warnings = __kmp_affinity.flags.warnings;
192 enum affinity_type type = __kmp_affinity.type;
197 buf = (
unsigned char *)KMP_INTERNAL_MALLOC(KMP_CPU_SET_SIZE_LIMIT);
// First attempt: a single call with the "try" size.
201 gCode = syscall(__NR_sched_getaffinity, 0, KMP_CPU_SET_TRY_SIZE, buf);
202 KA_TRACE(30, (
"__kmp_affinity_determine_capable: "
203 "initial getaffinity call returned %ld errno = %d\n",
// Any failure other than EINVAL means the syscall itself is unusable.
206 if (gCode < 0 && errno != EINVAL) {
209 (warnings && (type != affinity_none) && (type != affinity_default) &&
210 (type != affinity_disabled))) {
212 kmp_msg_t err_code = KMP_ERR(error);
213 __kmp_msg(kmp_ms_warning, KMP_MSG(GetAffSysCallNotSupported, env_var),
214 err_code, __kmp_msg_null);
// When warnings are off the message string is freed here explicitly.
215 if (__kmp_generate_warnings == kmp_warnings_off) {
216 __kmp_str_free(&err_code.str);
219 KMP_AFFINITY_DISABLE();
220 KMP_INTERNAL_FREE(buf);
222 }
else if (gCode > 0) {
// A positive return value is used directly as the mask size.
224 KMP_AFFINITY_ENABLE(gCode);
225 KA_TRACE(10, (
"__kmp_affinity_determine_capable: "
226 "affinity supported (mask size %d)\n",
227 (
int)__kmp_affin_mask_size));
228 KMP_INTERNAL_FREE(buf);
234 KA_TRACE(30, (
"__kmp_affinity_determine_capable: "
235 "searching for proper set size\n"));
// Second attempt: retry with sizes 1, 2, 4, ... up to the limit.
237 for (size = 1; size <= KMP_CPU_SET_SIZE_LIMIT; size *= 2) {
238 gCode = syscall(__NR_sched_getaffinity, 0, size, buf);
239 KA_TRACE(30, (
"__kmp_affinity_determine_capable: "
240 "getaffinity for mask size %ld returned %ld errno = %d\n",
241 size, gCode, errno));
244 if (errno == ENOSYS) {
246 KA_TRACE(30, (
"__kmp_affinity_determine_capable: "
247 "inconsistent OS call behavior: errno == ENOSYS for mask "
251 (warnings && (type != affinity_none) &&
252 (type != affinity_default) && (type != affinity_disabled))) {
254 kmp_msg_t err_code = KMP_ERR(error);
255 __kmp_msg(kmp_ms_warning, KMP_MSG(GetAffSysCallNotSupported, env_var),
256 err_code, __kmp_msg_null);
257 if (__kmp_generate_warnings == kmp_warnings_off) {
258 __kmp_str_free(&err_code.str);
261 KMP_AFFINITY_DISABLE();
262 KMP_INTERNAL_FREE(buf);
268 KMP_AFFINITY_ENABLE(gCode);
269 KA_TRACE(10, (
"__kmp_affinity_determine_capable: "
270 "affinity supported (mask size %d)\n",
271 (
int)__kmp_affin_mask_size));
272 KMP_INTERNAL_FREE(buf);
// BSD branch: one pthread_getaffinity_np call with the fixed limit.
275#elif KMP_OS_FREEBSD || KMP_OS_NETBSD || KMP_OS_DRAGONFLY
278 buf = (
unsigned char *)KMP_INTERNAL_MALLOC(KMP_CPU_SET_SIZE_LIMIT);
279 gCode = pthread_getaffinity_np(pthread_self(), KMP_CPU_SET_SIZE_LIMIT,
280 reinterpret_cast<cpuset_t *
>(buf));
281 KA_TRACE(30, (
"__kmp_affinity_determine_capable: "
282 "initial getaffinity call returned %d errno = %d\n",
285 KMP_AFFINITY_ENABLE(KMP_CPU_SET_SIZE_LIMIT);
286 KA_TRACE(10, (
"__kmp_affinity_determine_capable: "
287 "affinity supported (mask size %d)\n",
288 (
int)__kmp_affin_mask_size));
289 KMP_INTERNAL_FREE(buf);
293 KMP_INTERNAL_FREE(buf);
// Fallback when no probe produced a usable mask size.
296 KMP_AFFINITY_DISABLE();
297 KA_TRACE(10, (
"__kmp_affinity_determine_capable: "
298 "cannot determine mask size - affinity not supported\n"));
299 if (verbose || (warnings && (type != affinity_none) &&
300 (type != affinity_default) && (type != affinity_disabled))) {
301 KMP_WARNING(AffCantGetMaskSize, env_var);
// Probes whether the futex syscall is available by issuing a FUTEX_WAKE on a
// local word. The call counts as supported when it returns 0 or fails with
// anything other than ENOSYS; the outcome is stored in `retval` and traced.
// NOTE(review): the declaration of `loc` and the final return are not visible
// here; presumably `retval` is returned -- confirm.
310int __kmp_futex_determine_capable() {
312 long rc = syscall(__NR_futex, &loc, FUTEX_WAKE, 1, NULL, NULL, 0);
313 int retval = (rc == 0) || (errno != ENOSYS);
316 (
// rc is a long, so it must be formatted with %ld (was %d).
"__kmp_futex_determine_capable: rc = %ld errno = %d\n", rc, errno));
317 KA_TRACE(10, (
"__kmp_futex_determine_capable: futex syscall%s supported\n",
318 retval ?
"" :
" not"));
// The helpers below are compiled only for x86 / x86_64 / WASM builds without
// assembly intrinsics (see the guard).
325#if (KMP_ARCH_X86 || KMP_ARCH_X86_64 || KMP_ARCH_WASM) && (!KMP_ASM_INTRINS)
// OR `d` into the 8-bit location `p` using a compare-and-store retry loop:
// read *p, compute old | d, and re-read/recompute for as long as
// KMP_COMPARE_AND_STORE_REL8 reports failure.
// NOTE(review): the return statement is not visible here; presumably the
// value read before the successful store is returned -- confirm.
329kmp_int8 __kmp_test_then_or8(
volatile kmp_int8 *p, kmp_int8 d) {
330 kmp_int8 old_value, new_value;
332 old_value = TCR_1(*p);
333 new_value = old_value | d;
335 while (!KMP_COMPARE_AND_STORE_REL8(p, old_value, new_value)) {
337 old_value = TCR_1(*p);
338 new_value = old_value | d;
// AND `d` into the 8-bit location `p` using a compare-and-store retry loop:
// read *p, compute old & d, and re-read/recompute for as long as
// KMP_COMPARE_AND_STORE_REL8 reports failure.
// NOTE(review): the return statement is not visible here; presumably the
// value read before the successful store is returned -- confirm.
343kmp_int8 __kmp_test_then_and8(
volatile kmp_int8 *p, kmp_int8 d) {
344 kmp_int8 old_value, new_value;
346 old_value = TCR_1(*p);
347 new_value = old_value & d;
349 while (!KMP_COMPARE_AND_STORE_REL8(p, old_value, new_value)) {
351 old_value = TCR_1(*p);
352 new_value = old_value & d;
// OR `d` into the 32-bit location `p` using a compare-and-store retry loop:
// read *p, compute old | d, and re-read/recompute for as long as
// KMP_COMPARE_AND_STORE_REL32 reports failure.
// NOTE(review): the return statement is not visible here; presumably the
// value read before the successful store is returned -- confirm.
357kmp_uint32 __kmp_test_then_or32(
volatile kmp_uint32 *p, kmp_uint32 d) {
358 kmp_uint32 old_value, new_value;
360 old_value = TCR_4(*p);
361 new_value = old_value | d;
363 while (!KMP_COMPARE_AND_STORE_REL32(p, old_value, new_value)) {
365 old_value = TCR_4(*p);
366 new_value = old_value | d;
// AND `d` into the 32-bit location `p` using a compare-and-store retry loop:
// read *p, compute old & d, and re-read/recompute for as long as
// KMP_COMPARE_AND_STORE_REL32 reports failure.
// NOTE(review): the return statement is not visible here; presumably the
// value read before the successful store is returned -- confirm.
371kmp_uint32 __kmp_test_then_and32(
volatile kmp_uint32 *p, kmp_uint32 d) {
372 kmp_uint32 old_value, new_value;
374 old_value = TCR_4(*p);
375 new_value = old_value & d;
377 while (!KMP_COMPARE_AND_STORE_REL32(p, old_value, new_value)) {
379 old_value = TCR_4(*p);
380 new_value = old_value & d;
385#if KMP_ARCH_X86 || KMP_ARCH_WASM
// Add `d` to the 8-bit location `p` using a compare-and-store retry loop:
// read *p, compute old + d, and re-read/recompute for as long as
// KMP_COMPARE_AND_STORE_REL8 reports failure.
// NOTE(review): the return statement is not visible here; presumably the
// value read before the successful store is returned -- confirm.
386kmp_int8 __kmp_test_then_add8(
volatile kmp_int8 *p, kmp_int8 d) {
387 kmp_int8 old_value, new_value;
389 old_value = TCR_1(*p);
390 new_value = old_value + d;
392 while (!KMP_COMPARE_AND_STORE_REL8(p, old_value, new_value)) {
394 old_value = TCR_1(*p);
395 new_value = old_value + d;
// Add `d` to the 64-bit location `p` using a compare-and-store retry loop:
// read *p, compute old + d, and re-read/recompute for as long as
// KMP_COMPARE_AND_STORE_REL64 reports failure.
// NOTE(review): the return statement is not visible here; presumably the
// value read before the successful store is returned -- confirm.
400kmp_int64 __kmp_test_then_add64(
volatile kmp_int64 *p, kmp_int64 d) {
401 kmp_int64 old_value, new_value;
403 old_value = TCR_8(*p);
404 new_value = old_value + d;
406 while (!KMP_COMPARE_AND_STORE_REL64(p, old_value, new_value)) {
408 old_value = TCR_8(*p);
409 new_value = old_value + d;
// OR `d` into the 64-bit location `p` using a compare-and-store retry loop:
// read *p, compute old | d, and re-read/recompute for as long as
// KMP_COMPARE_AND_STORE_REL64 reports failure.
// NOTE(review): the return statement is not visible here; presumably the
// value read before the successful store is returned -- confirm.
415kmp_uint64 __kmp_test_then_or64(
volatile kmp_uint64 *p, kmp_uint64 d) {
416 kmp_uint64 old_value, new_value;
418 old_value = TCR_8(*p);
419 new_value = old_value | d;
420 while (!KMP_COMPARE_AND_STORE_REL64(p, old_value, new_value)) {
422 old_value = TCR_8(*p);
423 new_value = old_value | d;
// AND `d` into the 64-bit location `p` using a compare-and-store retry loop:
// read *p, compute old & d, and re-read/recompute for as long as
// KMP_COMPARE_AND_STORE_REL64 reports failure.
// NOTE(review): the return statement is not visible here; presumably the
// value read before the successful store is returned -- confirm.
428kmp_uint64 __kmp_test_then_and64(
volatile kmp_uint64 *p, kmp_uint64 d) {
429 kmp_uint64 old_value, new_value;
431 old_value = TCR_8(*p);
432 new_value = old_value & d;
433 while (!KMP_COMPARE_AND_STORE_REL64(p, old_value, new_value)) {
435 old_value = TCR_8(*p);
436 new_value = old_value & d;
// Requests cancellation of the thread registered under `gtid`.
//   gtid - global thread id, used to index __kmp_threads.
// Only does the cancel when KMP_CANCEL_THREADS is defined. A pthread_cancel
// result of 0 or ESRCH is tolerated; any other status is reported through
// __kmp_fatal(CantTerminateWorkerThread).
443void __kmp_terminate_thread(
int gtid) {
445 kmp_info_t *th = __kmp_threads[gtid];
450#ifdef KMP_CANCEL_THREADS
451 KA_TRACE(10, (
"__kmp_terminate_thread: kill (%d)\n", gtid));
452 status = pthread_cancel(th->th.th_info.ds.ds_thread);
453 if (status != 0 && status != ESRCH) {
454 __kmp_fatal(KMP_MSG(CantTerminateWorkerThread), KMP_ERR(status),
// Records the stack base, stack size and "may grow" flag for thread `th`.
//   gtid - global thread id; the OS query is only made for non-uber threads.
//   th   - thread descriptor whose ds_stackbase / ds_stacksize / ds_stackgrow
//          fields are written.
// On the listed OSes the stack is queried either with thr_stksegment or with
// the pthread attribute API (pthread_attr_get_np or pthread_getattr_np, then
// pthread_attr_getstack). When both size and address are non-zero the base is
// stored as addr + size and growth is marked FALSE. Otherwise the fallback
// stores size 0, uses the address of a local (`stack_data`) as the base and
// marks growth TRUE.
// NOTE(review): the return statements are not visible here -- confirm which
// value each path returns.
465static kmp_int32 __kmp_set_stack_info(
int gtid, kmp_info_t *th) {
467#if KMP_OS_LINUX || KMP_OS_DRAGONFLY || KMP_OS_FREEBSD || KMP_OS_NETBSD || \
468 KMP_OS_HAIKU || KMP_OS_HURD || KMP_OS_SOLARIS || KMP_OS_AIX
476 if (!KMP_UBER_GTID(gtid)) {
480 if ((status = thr_stksegment(&s)) < 0) {
481 KMP_CHECK_SYSFAIL(
"thr_stksegment", status);
486 KA_TRACE(60, (
"__kmp_set_stack_info: T#%d thr_stksegment returned size:"
487 " %lu, low addr: %p\n",
492 status = pthread_attr_init(&attr);
493 KMP_CHECK_SYSFAIL(
"pthread_attr_init", status);
494#if KMP_OS_DRAGONFLY || KMP_OS_FREEBSD || KMP_OS_NETBSD
495 status = pthread_attr_get_np(pthread_self(), &attr);
496 KMP_CHECK_SYSFAIL(
"pthread_attr_get_np", status);
498 status = pthread_getattr_np(pthread_self(), &attr);
499 KMP_CHECK_SYSFAIL(
"pthread_getattr_np", status);
501 status = pthread_attr_getstack(&attr, &addr, &size);
502 KMP_CHECK_SYSFAIL(
"pthread_attr_getstack", status);
504 (
"__kmp_set_stack_info: T#%d pthread_attr_getstack returned size:"
505 " %lu, low addr: %p\n",
507 status = pthread_attr_destroy(&attr);
508 KMP_CHECK_SYSFAIL(
"pthread_attr_destroy", status);
512 if (size != 0 && addr != 0) {
// The stored base is the high end of the region: low address + size.
514 TCW_PTR(th->th.th_info.ds.ds_stackbase, (((
char *)addr) + size));
515 TCW_PTR(th->th.th_info.ds.ds_stacksize, size);
516 TCW_4(th->th.th_info.ds.ds_stackgrow, FALSE);
// Fallback when the OS query was not made or gave no usable result.
522 TCW_PTR(th->th.th_info.ds.ds_stacksize, 0);
523 TCW_PTR(th->th.th_info.ds.ds_stackbase, &stack_data);
524 TCW_4(th->th.th_info.ds.ds_stackgrow, TRUE);
// pthread start routine for worker threads (passed to pthread_create by
// __kmp_create_worker).
//   thr - the worker's kmp_info_t*, passed as void*.
// Visible steps, in order: publish the gtid as thread-specific data, hook up
// stats and the ITT thread name, bind the initial affinity mask, enable
// asynchronous cancellation, reset x87/MXCSR state on x86, block all signals,
// optionally offset the stack with an alloca of gtid * __kmp_stkoffset bytes,
// record and check stack info, run __kmp_launch_thread, then restore the
// previous signal mask.
// NOTE(review): the return statement is not visible here; presumably
// exit_val is returned -- confirm.
528static void *__kmp_launch_worker(
void *thr) {
529 int status, old_type, old_state;
530#ifdef KMP_BLOCK_SIGNALS
531 sigset_t new_set, old_set;
534#if KMP_OS_LINUX || KMP_OS_DRAGONFLY || KMP_OS_FREEBSD || KMP_OS_NETBSD || \
535 KMP_OS_OPENBSD || KMP_OS_HAIKU || KMP_OS_HURD || KMP_OS_SOLARIS || \
537 void *
volatile padding = 0;
541 gtid = ((kmp_info_t *)thr)->th.th_info.ds.ds_gtid;
542 __kmp_gtid_set_specific(gtid);
548 __kmp_stats_thread_ptr = ((kmp_info_t *)thr)->th.th_stats;
549 __kmp_stats_thread_ptr->startLife();
550 KMP_SET_THREAD_STATE(IDLE);
555 __kmp_itt_thread_name(gtid);
558#if KMP_AFFINITY_SUPPORTED
559 __kmp_affinity_bind_init_mask(gtid);
562#ifdef KMP_CANCEL_THREADS
563 status = pthread_setcanceltype(PTHREAD_CANCEL_ASYNCHRONOUS, &old_type);
564 KMP_CHECK_SYSFAIL(
"pthread_setcanceltype", status);
566 status = pthread_setcancelstate(PTHREAD_CANCEL_ENABLE, &old_state);
567 KMP_CHECK_SYSFAIL(
"pthread_setcancelstate", status);
570#if KMP_ARCH_X86 || KMP_ARCH_X86_64
// Load the floating-point control state captured in the __kmp_init_* globals.
572 __kmp_clear_x87_fpu_status_word();
573 __kmp_load_x87_fpu_control_word(&__kmp_init_x87_fpu_control_word);
574 __kmp_load_mxcsr(&__kmp_init_mxcsr);
577#ifdef KMP_BLOCK_SIGNALS
578 status = sigfillset(&new_set);
579 KMP_CHECK_SYSFAIL_ERRNO(
"sigfillset", status);
580 status = pthread_sigmask(SIG_BLOCK, &new_set, &old_set);
581 KMP_CHECK_SYSFAIL(
"pthread_sigmask", status);
584#if KMP_OS_LINUX || KMP_OS_DRAGONFLY || KMP_OS_FREEBSD || KMP_OS_NETBSD || \
585 KMP_OS_OPENBSD || KMP_OS_HAIKU || KMP_OS_HURD || KMP_OS_SOLARIS || \
// Stack offset grows with gtid; the volatile `padding` holds the alloca result.
587 if (__kmp_stkoffset > 0 && gtid > 0) {
588 padding = KMP_ALLOCA(gtid * __kmp_stkoffset);
594 __kmp_set_stack_info(gtid, (kmp_info_t *)thr);
596 __kmp_check_stack_overlap((kmp_info_t *)thr);
598 exit_val = __kmp_launch_thread((kmp_info_t *)thr);
600#ifdef KMP_BLOCK_SIGNALS
601 status = pthread_sigmask(SIG_SETMASK, &old_set, NULL);
602 KMP_CHECK_SYSFAIL(
"pthread_sigmask", status);
// pthread start routine for the monitor thread (passed to pthread_create by
// __kmp_create_monitor).
//   thr - the monitor's kmp_info_t*, passed as void*.
// Phases, matching the numbered trace messages:
//   #1 register as KMP_GTID_MONITOR, record stack info, enable async cancel;
//      when the process runs under SCHED_FIFO / SCHED_RR, warn and try to
//      raise this thread's priority by one;
//   #2 until g_done is set, sleep on __kmp_wait_cv for one interval and then
//      increment the global time counter;
//   #3 unblock all signals;
//   #4-#6 if g_abort is non-zero, terminate threads 1..capacity-1 and, when
//      g_abort > 0, raise it as a signal;
//   #7 exit.
// NOTE(review): several declarations (new_set, tval, now, rc, gtid), the
// interval.tv_sec assignments and the return are not visible here.
611static void *__kmp_launch_monitor(
void *thr) {
612 int status, old_type, old_state;
613#ifdef KMP_BLOCK_SIGNALS
616 struct timespec interval;
620 KA_TRACE(10, (
"__kmp_launch_monitor: #1 launched\n"));
623 __kmp_gtid_set_specific(KMP_GTID_MONITOR);
625 __kmp_gtid = KMP_GTID_MONITOR;
632 __kmp_itt_thread_ignore();
635 __kmp_set_stack_info(((kmp_info_t *)thr)->th.th_info.ds.ds_gtid,
638 __kmp_check_stack_overlap((kmp_info_t *)thr);
640#ifdef KMP_CANCEL_THREADS
641 status = pthread_setcanceltype(PTHREAD_CANCEL_ASYNCHRONOUS, &old_type);
642 KMP_CHECK_SYSFAIL(
"pthread_setcanceltype", status);
644 status = pthread_setcancelstate(PTHREAD_CANCEL_ENABLE, &old_state);
645 KMP_CHECK_SYSFAIL(
"pthread_setcancelstate", status);
// Real-time scheduling: bump the monitor one priority level, or warn that it
// will starve if that is not possible.
653 int sched = sched_getscheduler(0);
654 if (sched == SCHED_FIFO || sched == SCHED_RR) {
657 struct sched_param param;
658 int max_priority = sched_get_priority_max(sched);
660 KMP_WARNING(RealTimeSchedNotSupported);
// Address-of operator restored here and below (the text had been corrupted
// into a pilcrow character).
661 sched_getparam(0, &param);
662 if (param.sched_priority < max_priority) {
663 param.sched_priority += 1;
664 rc = sched_setscheduler(0, sched, &param);
667 kmp_msg_t err_code = KMP_ERR(error);
668 __kmp_msg(kmp_ms_warning, KMP_MSG(CantChangeMonitorPriority),
669 err_code, KMP_MSG(MonitorWillStarve), __kmp_msg_null);
670 if (__kmp_generate_warnings == kmp_warnings_off) {
671 __kmp_str_free(&err_code.str);
678 __kmp_msg(kmp_ms_warning, KMP_MSG(RunningAtMaxPriority),
679 KMP_MSG(MonitorWillStarve), KMP_HNT(RunningAtMaxPriority),
// Reset the global time counter before ticking starts.
684 TCW_4(__kmp_global.g.g_time.dt.t_value, 0);
// One wakeup per second uses a whole-second interval; otherwise the interval
// is the matching fraction of a second in nanoseconds.
690 if (__kmp_monitor_wakeups == 1) {
692 interval.tv_nsec = 0;
695 interval.tv_nsec = (KMP_NSEC_PER_SEC / __kmp_monitor_wakeups);
698 KA_TRACE(10, (
"__kmp_launch_monitor: #2 monitor\n"));
700 while (!TCR_4(__kmp_global.g.g_done)) {
706 KA_TRACE(15, (
"__kmp_launch_monitor: update\n"));
// Build the absolute deadline: current time plus one interval.
708 status = gettimeofday(&tval, NULL);
709 KMP_CHECK_SYSFAIL_ERRNO(
"gettimeofday", status);
710 TIMEVAL_TO_TIMESPEC(&tval, &now);
712 now.tv_sec += interval.tv_sec;
713 now.tv_nsec += interval.tv_nsec;
// Normalize when the nanosecond field overflows one second.
715 if (now.tv_nsec >= KMP_NSEC_PER_SEC) {
717 now.tv_nsec -= KMP_NSEC_PER_SEC;
720 status = pthread_mutex_lock(&__kmp_wait_mx.m_mutex);
721 KMP_CHECK_SYSFAIL(
"pthread_mutex_lock", status);
// Re-check g_done under the mutex before going to sleep.
723 if (!TCR_4(__kmp_global.g.g_done)) {
724 status = pthread_cond_timedwait(&__kmp_wait_cv.c_cond,
725 &__kmp_wait_mx.m_mutex, &now);
// Timeouts and interruptions are expected; other non-zero codes are failures.
727 if (status != ETIMEDOUT && status != EINTR) {
728 KMP_SYSFAIL(
"pthread_cond_timedwait", status);
732 status = pthread_mutex_unlock(&__kmp_wait_mx.m_mutex);
733 KMP_CHECK_SYSFAIL(
"pthread_mutex_unlock", status);
// Advance the global time counter by one tick.
735 TCW_4(__kmp_global.g.g_time.dt.t_value,
736 TCR_4(__kmp_global.g.g_time.dt.t_value) + 1);
741 KA_TRACE(10, (
"__kmp_launch_monitor: #3 cleanup\n"));
743#ifdef KMP_BLOCK_SIGNALS
744 status = sigfillset(&new_set);
745 KMP_CHECK_SYSFAIL_ERRNO(
"sigfillset", status);
746 status = pthread_sigmask(SIG_UNBLOCK, &new_set, NULL);
747 KMP_CHECK_SYSFAIL(
"pthread_sigmask", status);
750 KA_TRACE(10, (
"__kmp_launch_monitor: #4 finished\n"));
752 if (__kmp_global.g.g_abort != 0) {
758 KA_TRACE(10, (
"__kmp_launch_monitor: #5 terminate sig=%d\n",
759 __kmp_global.g.g_abort));
// gtid 0 is skipped by this loop.
764 for (gtid = 1; gtid < __kmp_threads_capacity; ++gtid)
765 __kmp_terminate_thread(gtid);
769 KA_TRACE(10, (
"__kmp_launch_monitor: #6 raise sig=%d\n",
770 __kmp_global.g.g_abort));
772 if (__kmp_global.g.g_abort > 0)
773 raise(__kmp_global.g.g_abort);
776 KA_TRACE(10, (
"__kmp_launch_monitor: #7 exit\n"));
// Creates the OS thread for worker `gtid`, or adopts the calling thread when
// `gtid` is an uber (root) gtid.
//   gtid       - global thread id to assign to `th`.
//   th         - thread descriptor; ds_gtid, th_stats and ds_thread are set.
//   stack_size - requested stack size; increased by gtid * __kmp_stkoffset * 2
//                before being applied.
// Uber threads: record pthread_self(), capture stack info and check overlap
// (no new thread is created on that path as far as the visible code shows).
// Other threads: build joinable thread attributes, set the stack size (with a
// KMP_BACKUP_STKSIZE retry when the user did not set a stack size), call
// pthread_create with __kmp_launch_worker, map EINVAL / ENOMEM / EAGAIN to
// specific fatal messages, name the thread "openmp_worker" where supported,
// and destroy the attributes (a failure there is only a warning).
782void __kmp_create_worker(
int gtid, kmp_info_t *th,
size_t stack_size) {
784 pthread_attr_t thread_attr;
787 th->th.th_info.ds.ds_gtid = gtid;
// Stats bookkeeping is done under __kmp_stats_lock.
791 __kmp_acquire_tas_lock(&__kmp_stats_lock, gtid);
797 if (!KMP_UBER_GTID(gtid)) {
798 th->th.th_stats = __kmp_stats_list->push_back(gtid);
802 th->th.th_stats = __kmp_stats_thread_ptr;
804 __kmp_release_tas_lock(&__kmp_stats_lock, gtid);
808 if (KMP_UBER_GTID(gtid)) {
809 KA_TRACE(10, (
"__kmp_create_worker: uber thread (%d)\n", gtid));
810 th->th.th_info.ds.ds_thread = pthread_self();
811 __kmp_set_stack_info(gtid, th);
812 __kmp_check_stack_overlap(th);
816 KA_TRACE(10, (
"__kmp_create_worker: try to create thread (%d)\n", gtid));
820#ifdef KMP_THREAD_ATTR
821 status = pthread_attr_init(&thread_attr);
823 __kmp_fatal(KMP_MSG(CantInitThreadAttrs), KMP_ERR(status), __kmp_msg_null);
825 status = pthread_attr_setdetachstate(&thread_attr, PTHREAD_CREATE_JOINABLE);
827 __kmp_fatal(KMP_MSG(CantSetWorkerState), KMP_ERR(status), __kmp_msg_null);
// The extra room scales with gtid, as does the alloca offset in
// __kmp_launch_worker.
837 stack_size += gtid * __kmp_stkoffset * 2;
839 KA_TRACE(10, (
"__kmp_create_worker: T#%d, default stacksize = %lu bytes, "
840 "__kmp_stksize = %lu bytes, final stacksize = %lu bytes\n",
841 gtid, KMP_DEFAULT_STKSIZE, __kmp_stksize, stack_size));
843#ifdef _POSIX_THREAD_ATTR_STACKSIZE
844 status = pthread_attr_setstacksize(&thread_attr, stack_size);
845#ifdef KMP_BACKUP_STKSIZE
// Retry with the backup size only when no stack size came from the
// environment (__kmp_env_stksize is false).
847 if (!__kmp_env_stksize) {
848 stack_size = KMP_BACKUP_STKSIZE + gtid * __kmp_stkoffset;
849 __kmp_stksize = KMP_BACKUP_STKSIZE;
850 KA_TRACE(10, (
"__kmp_create_worker: T#%d, default stacksize = %lu bytes, "
851 "__kmp_stksize = %lu bytes, (backup) final stacksize = %lu "
853 gtid, KMP_DEFAULT_STKSIZE, __kmp_stksize, stack_size));
854 status = pthread_attr_setstacksize(&thread_attr, stack_size);
859 __kmp_fatal(KMP_MSG(CantSetWorkerStackSize, stack_size), KMP_ERR(status),
860 KMP_HNT(ChangeWorkerStackSize), __kmp_msg_null);
867 pthread_create(&handle, &thread_attr, __kmp_launch_worker, (
void *)th);
868 if (status != 0 || !handle) {
869#ifdef _POSIX_THREAD_ATTR_STACKSIZE
870 if (status == EINVAL) {
871 __kmp_fatal(KMP_MSG(CantSetWorkerStackSize, stack_size), KMP_ERR(status),
872 KMP_HNT(IncreaseWorkerStackSize), __kmp_msg_null);
874 if (status == ENOMEM) {
875 __kmp_fatal(KMP_MSG(CantSetWorkerStackSize, stack_size), KMP_ERR(status),
876 KMP_HNT(DecreaseWorkerStackSize), __kmp_msg_null);
879 if (status == EAGAIN) {
880 __kmp_fatal(KMP_MSG(NoResourcesForWorkerThread), KMP_ERR(status),
881 KMP_HNT(Decrease_NUM_THREADS), __kmp_msg_null);
883 KMP_SYSFAIL(
"pthread_create", status);
// Thread naming: the call signature differs between the platform variants.
887 if (!KMP_UBER_GTID(gtid)) {
888#if defined(LIBOMP_HAVE_PTHREAD_SET_NAME_NP)
889 pthread_set_name_np(handle,
"openmp_worker");
890#elif defined(LIBOMP_HAVE_PTHREAD_SETNAME_NP) && !KMP_OS_DARWIN
892 pthread_setname_np(handle,
"%s",
const_cast<char *
>(
"openmp_worker"));
894 pthread_setname_np(handle,
"openmp_worker");
899 th->th.th_info.ds.ds_thread = handle;
901#ifdef KMP_THREAD_ATTR
902 status = pthread_attr_destroy(&thread_attr);
904 kmp_msg_t err_code = KMP_ERR(status);
905 __kmp_msg(kmp_ms_warning, KMP_MSG(CantDestroyThreadAttrs), err_code,
907 if (__kmp_generate_warnings == kmp_warnings_off) {
908 __kmp_str_free(&err_code.str);
915 KA_TRACE(10, (
"__kmp_create_worker: done creating thread (%d)\n", gtid));
// Creates the monitor thread, unless the default blocktime is
// KMP_MAX_BLOCKTIME, in which case the monitor is skipped and th's tid/gtid
// are set to 0.
//   th - descriptor for the monitor thread; ds_tid, ds_gtid and ds_thread are
//        written.
// Otherwise: mark th as KMP_GTID_MONITOR, reset the global time counter, pick
// a stack size (KMP_DEFAULT_MONITOR_STKSIZE when none was set, never below
// __kmp_sys_min_stksize), build joinable attributes, and start
// __kmp_launch_monitor. When the size was auto-selected, EINVAL from
// pthread_create leads to doubling the stack size while it is below
// 0x40000000; other failures map to specific fatal messages. With
// KMP_REAL_TIME_FIX the creator then waits for the time counter to differ
// from -1.
// NOTE(review): the retry control flow (label/goto or loop) is not visible
// here -- confirm how the doubled size is re-applied.
920void __kmp_create_monitor(kmp_info_t *th) {
922 pthread_attr_t thread_attr;
925 int auto_adj_size = FALSE;
927 if (__kmp_dflt_blocktime == KMP_MAX_BLOCKTIME) {
929 KA_TRACE(10, (
"__kmp_create_monitor: skipping monitor thread because of "
931 th->th.th_info.ds.ds_tid = 0;
932 th->th.th_info.ds.ds_gtid = 0;
935 KA_TRACE(10, (
"__kmp_create_monitor: try to create monitor\n"));
939 th->th.th_info.ds.ds_tid = KMP_GTID_MONITOR;
940 th->th.th_info.ds.ds_gtid = KMP_GTID_MONITOR;
942 TCW_4(__kmp_global.g.g_time.dt.t_value,
945 TCW_4(__kmp_global.g.g_time.dt.t_value, 0);
948#ifdef KMP_THREAD_ATTR
// A zero stack size means "not configured": use the default and remember
// that it may be auto-adjusted later.
949 if (__kmp_monitor_stksize == 0) {
950 __kmp_monitor_stksize = KMP_DEFAULT_MONITOR_STKSIZE;
951 auto_adj_size = TRUE;
953 status = pthread_attr_init(&thread_attr);
955 __kmp_fatal(KMP_MSG(CantInitThreadAttrs), KMP_ERR(status), __kmp_msg_null);
957 status = pthread_attr_setdetachstate(&thread_attr, PTHREAD_CREATE_JOINABLE);
959 __kmp_fatal(KMP_MSG(CantSetMonitorState), KMP_ERR(status), __kmp_msg_null);
962#ifdef _POSIX_THREAD_ATTR_STACKSIZE
963 status = pthread_attr_getstacksize(&thread_attr, &size);
964 KMP_CHECK_SYSFAIL(
"pthread_attr_getstacksize", status);
966 size = __kmp_sys_min_stksize;
970 if (__kmp_monitor_stksize == 0) {
971 __kmp_monitor_stksize = KMP_DEFAULT_MONITOR_STKSIZE;
// Clamp to the system minimum.
973 if (__kmp_monitor_stksize < __kmp_sys_min_stksize) {
974 __kmp_monitor_stksize = __kmp_sys_min_stksize;
977 KA_TRACE(10, (
"__kmp_create_monitor: default stacksize = %lu bytes,"
978 "requested stacksize = %lu bytes\n",
979 size, __kmp_monitor_stksize));
984#ifdef _POSIX_THREAD_ATTR_STACKSIZE
985 KA_TRACE(10, (
"__kmp_create_monitor: setting stacksize = %lu bytes,",
986 __kmp_monitor_stksize));
987 status = pthread_attr_setstacksize(&thread_attr, __kmp_monitor_stksize);
990 __kmp_monitor_stksize *= 2;
993 kmp_msg_t err_code = KMP_ERR(status);
994 __kmp_msg(kmp_ms_warning,
995 KMP_MSG(CantSetMonitorStackSize, (
long int)__kmp_monitor_stksize),
996 err_code, KMP_HNT(ChangeMonitorStackSize), __kmp_msg_null);
997 if (__kmp_generate_warnings == kmp_warnings_off) {
998 __kmp_str_free(&err_code.str);
1004 pthread_create(&handle, &thread_attr, __kmp_launch_monitor, (
void *)th);
1007#ifdef _POSIX_THREAD_ATTR_STACKSIZE
1008 if (status == EINVAL) {
// Only auto-selected sizes are doubled, and only below 0x40000000.
1009 if (auto_adj_size && (__kmp_monitor_stksize < (
size_t)0x40000000)) {
1010 __kmp_monitor_stksize *= 2;
1013 __kmp_fatal(KMP_MSG(CantSetMonitorStackSize, __kmp_monitor_stksize),
1014 KMP_ERR(status), KMP_HNT(IncreaseMonitorStackSize),
1017 if (status == ENOMEM) {
1018 __kmp_fatal(KMP_MSG(CantSetMonitorStackSize, __kmp_monitor_stksize),
1019 KMP_ERR(status), KMP_HNT(DecreaseMonitorStackSize),
1023 if (status == EAGAIN) {
1024 __kmp_fatal(KMP_MSG(NoResourcesForMonitorThread), KMP_ERR(status),
1025 KMP_HNT(DecreaseNumberOfThreadsInUse), __kmp_msg_null);
1027 KMP_SYSFAIL(
"pthread_create", status);
1030 th->th.th_info.ds.ds_thread = handle;
1032#if KMP_REAL_TIME_FIX
// Block until the time counter is no longer -1.
1034 KMP_DEBUG_ASSERT(
sizeof(kmp_uint32) ==
1035 sizeof(__kmp_global.g.g_time.dt.t_value));
1036 __kmp_wait_4((kmp_uint32
volatile *)&__kmp_global.g.g_time.dt.t_value, -1,
1037 &__kmp_neq_4, NULL);
1040#ifdef KMP_THREAD_ATTR
1041 status = pthread_attr_destroy(&thread_attr);
1043 kmp_msg_t err_code = KMP_ERR(status);
1044 __kmp_msg(kmp_ms_warning, KMP_MSG(CantDestroyThreadAttrs), err_code,
1046 if (__kmp_generate_warnings == kmp_warnings_off) {
1047 __kmp_str_free(&err_code.str);
1054 KA_TRACE(10, (
"__kmp_create_monitor: monitor created %#.8lx\n",
1055 th->th.th_info.ds.ds_thread));
// Terminates the calling thread via pthread_exit.
//   exit_status - integer status, widened through intptr_t and handed to
//                 pthread_exit as the thread's void* exit value.
1060void __kmp_exit_thread(
int exit_status) {
1064 pthread_exit((
void *)(intptr_t)exit_status);
// Forward declaration; called below to wake the monitor before joining it.
1069void __kmp_resume_monitor();
// Joins the monitor thread and marks its descriptor as non-existent.
//   th - monitor thread descriptor.
// If th's gtid is not KMP_GTID_MONITOR the monitor never started (see the
// trace message) and nothing is joined. Otherwise pthread_kill(thread, 0) is
// used as an existence probe; unless it reports ESRCH the monitor is woken via
// __kmp_resume_monitor(). The thread is then joined, and an exit value
// different from `th` is treated as fatal (ReapMonitorError). Finally ds_tid
// and ds_gtid are set to KMP_GTID_DNE.
1071extern "C" void __kmp_reap_monitor(kmp_info_t *th) {
1075 KA_TRACE(10, (
"__kmp_reap_monitor: try to reap monitor thread with handle"
1077 th->th.th_info.ds.ds_thread));
1082 KMP_DEBUG_ASSERT(th->th.th_info.ds.ds_tid == th->th.th_info.ds.ds_gtid);
1083 if (th->th.th_info.ds.ds_gtid != KMP_GTID_MONITOR) {
1084 KA_TRACE(10, (
"__kmp_reap_monitor: monitor did not start, returning\n"));
// Signal 0 sends nothing; only the error status is of interest.
1094 status = pthread_kill(th->th.th_info.ds.ds_thread, 0);
1095 if (status != ESRCH) {
1096 __kmp_resume_monitor();
1098 KA_TRACE(10, (
"__kmp_reap_monitor: try to join with monitor\n"));
1099 status = pthread_join(th->th.th_info.ds.ds_thread, &exit_val);
1100 if (exit_val != th) {
1101 __kmp_fatal(KMP_MSG(ReapMonitorError), KMP_ERR(status), __kmp_msg_null);
1104 th->th.th_info.ds.ds_tid = KMP_GTID_DNE;
1105 th->th.th_info.ds.ds_gtid = KMP_GTID_DNE;
1107 KA_TRACE(10, (
"__kmp_reap_monitor: done reaping monitor thread with handle"
1109 th->th.th_info.ds.ds_thread));
// No-op variant of __kmp_reap_monitor: ignores `th`. Presumably selected by a
// preprocessor branch for builds without a monitor thread -- confirm.
1116extern "C" void __kmp_reap_monitor(kmp_info_t *th) { (void)th; }
// Joins the OS thread behind worker `th`.
//   th - worker thread descriptor; ds_thread is the handle that is joined.
// A join failure is reported with __kmp_fatal(ReapWorkerError). An exit value
// different from `th` is only traced.
1119void __kmp_reap_worker(kmp_info_t *th) {
1126 10, (
"__kmp_reap_worker: try to reap T#%d\n", th->th.th_info.ds.ds_gtid));
1128 status = pthread_join(th->th.th_info.ds.ds_thread, &exit_val);
1132 __kmp_fatal(KMP_MSG(ReapWorkerError), KMP_ERR(status), __kmp_msg_null);
1134 if (exit_val != th) {
1135 KA_TRACE(10, (
"__kmp_reap_worker: worker T#%d did not reap properly, "
1137 th->th.th_info.ds.ds_gtid, exit_val));
1143 KA_TRACE(10, (
"__kmp_reap_worker: done reaping T#%d\n",
1144 th->th.th_info.ds.ds_gtid));
1149#if KMP_HANDLE_SIGNALS
// Signal handler with no visible body. __kmp_remove_one_handler recognizes it
// as one of the runtime's own handlers.
//   signo - delivered signal number.
1151static void __kmp_null_handler(
int signo) {
// Signal handler installed by __kmp_install_signals for the handled signals.
//   signo - delivered signal number.
// Acts only while g_abort is still 0: it dumps the debug buffer when one is
// in use, unregisters the library, records `signo` in g_abort and sets g_done
// to TRUE (the monitor loop in __kmp_launch_monitor watches g_done).
// NOTE(review): the signal dispatch (switch/cases) around these statements is
// not visible here.
1155static void __kmp_team_handler(
int signo) {
1156 if (__kmp_global.g.g_abort == 0) {
1159 __kmp_debug_printf(
"__kmp_team_handler: caught signal = %d\n", signo);
1174 if (__kmp_debug_buf) {
1175 __kmp_dump_debug_buffer();
1177 __kmp_unregister_library();
1179 TCW_4(__kmp_global.g.g_abort, signo);
1181 TCW_4(__kmp_global.g.g_done, TRUE);
1186 __kmp_debug_printf(
"__kmp_team_handler: unknown signal type");
// Thin wrapper around sigaction() that routes the result through
// KMP_CHECK_SYSFAIL_ERRNO instead of returning it.
//   signum - signal number.
//   act    - new disposition, or NULL to only query.
//   oldact - receives the previous disposition, or NULL.
1193static void __kmp_sigaction(
int signum,
const struct sigaction *act,
1194 struct sigaction *oldact) {
1195 int rc = sigaction(signum, act, oldact);
1196 KMP_CHECK_SYSFAIL_ERRNO(
"sigaction", rc);
// Installs `handler_func` for `sig`, or just records the current disposition.
//   sig           - signal number.
//   handler_func  - handler to install.
//   parallel_init - non-zero: install the handler (all signals masked while
//                   it runs, sa_flags 0). If the disposition that was replaced
//                   equals the one saved in __kmp_sighldrs[sig], the signal is
//                   added to __kmp_sigset. A call restoring the replaced
//                   disposition is also visible, presumably the branch for a
//                   mismatch (handler changed by the user) -- confirm.
//                   zero: presumably the branch that only saves the current
//                   disposition into __kmp_sighldrs[sig] -- confirm.
1199static void __kmp_install_one_handler(
int sig, sig_func_t handler_func,
1200 int parallel_init) {
1203 (
"__kmp_install_one_handler( %d, ..., %d )\n", sig, parallel_init));
1204 if (parallel_init) {
1205 struct sigaction new_action;
1206 struct sigaction old_action;
1207 new_action.sa_handler = handler_func;
1208 new_action.sa_flags = 0;
1209 sigfillset(&new_action.sa_mask);
1210 __kmp_sigaction(sig, &new_action, &old_action);
1211 if (old_action.sa_handler == __kmp_sighldrs[sig].sa_handler) {
1212 sigaddset(&__kmp_sigset, sig);
1215 __kmp_sigaction(sig, &old_action, NULL);
1219 __kmp_sigaction(sig, NULL, &__kmp_sighldrs[sig]);
// Restores the saved disposition for `sig` if the runtime installed a handler
// for it (i.e. `sig` is a member of __kmp_sigset).
//   sig - signal number.
// After restoring, the disposition that was in place is inspected: if it was
// neither __kmp_team_handler nor __kmp_null_handler, it is not ours, so it is
// put back. The signal is then removed from __kmp_sigset.
1224static void __kmp_remove_one_handler(
int sig) {
1225 KB_TRACE(60, (
"__kmp_remove_one_handler( %d )\n", sig));
1226 if (sigismember(&__kmp_sigset, sig)) {
1227 struct sigaction old;
1229 __kmp_sigaction(sig, &__kmp_sighldrs[sig], &old);
1230 if ((old.sa_handler != __kmp_team_handler) &&
1231 (old.sa_handler != __kmp_null_handler)) {
1233 KB_TRACE(10, (
"__kmp_remove_one_handler: oops, not our handler, "
1234 "restoring: sig=%d\n",
1236 __kmp_sigaction(sig, &old, NULL);
1238 sigdelset(&__kmp_sigset, sig);
// Processes the fixed list of signals below through
// __kmp_install_one_handler with __kmp_team_handler.
//   parallel_init - forwarded to __kmp_install_one_handler. The body runs when
//                   signal handling is enabled (__kmp_handle_signals) or when
//                   parallel_init is zero.
// __kmp_sigset is emptied first, so it reflects only this call's installs.
1243void __kmp_install_signals(
int parallel_init) {
1244 KB_TRACE(10, (
"__kmp_install_signals( %d )\n", parallel_init));
1245 if (__kmp_handle_signals || !parallel_init) {
1248 sigemptyset(&__kmp_sigset);
1249 __kmp_install_one_handler(SIGHUP, __kmp_team_handler, parallel_init);
1250 __kmp_install_one_handler(SIGINT, __kmp_team_handler, parallel_init);
1251 __kmp_install_one_handler(SIGQUIT, __kmp_team_handler, parallel_init);
1252 __kmp_install_one_handler(SIGILL, __kmp_team_handler, parallel_init);
1253 __kmp_install_one_handler(SIGABRT, __kmp_team_handler, parallel_init);
1254 __kmp_install_one_handler(SIGFPE, __kmp_team_handler, parallel_init);
1255 __kmp_install_one_handler(SIGBUS, __kmp_team_handler, parallel_init);
1256 __kmp_install_one_handler(SIGSEGV, __kmp_team_handler, parallel_init);
1258 __kmp_install_one_handler(SIGSYS, __kmp_team_handler, parallel_init);
1260 __kmp_install_one_handler(SIGTERM, __kmp_team_handler, parallel_init);
1262 __kmp_install_one_handler(SIGPIPE, __kmp_team_handler, parallel_init);
// Calls __kmp_remove_one_handler for every signal number from 1 to NSIG - 1;
// that helper ignores signals the runtime did not install a handler for.
1267void __kmp_remove_signals(
void) {
1269 KB_TRACE(10, (
"__kmp_remove_signals()\n"));
1270 for (sig = 1; sig < NSIG; ++sig) {
1271 __kmp_remove_one_handler(sig);
// Sets the calling thread's cancelability state to `new_state` (only when
// KMP_CANCEL_THREADS is defined).
//   new_state - value passed to pthread_setcancelstate, typically the value
//               previously obtained from __kmp_disable.
// Debug builds assert that cancellation was disabled beforehand.
1277void __kmp_enable(
int new_state) {
1278#ifdef KMP_CANCEL_THREADS
1279 int status, old_state;
1280 status = pthread_setcancelstate(new_state, &old_state);
1281 KMP_CHECK_SYSFAIL(
"pthread_setcancelstate", status);
1282 KMP_DEBUG_ASSERT(old_state == PTHREAD_CANCEL_DISABLE);
// Disables cancellation for the calling thread (only when KMP_CANCEL_THREADS
// is defined).
//   old_state - out: receives the previous cancelability state.
1286void __kmp_disable(
int *old_state) {
1287#ifdef KMP_CANCEL_THREADS
1289 status = pthread_setcancelstate(PTHREAD_CANCEL_DISABLE, old_state);
1290 KMP_CHECK_SYSFAIL(
"pthread_setcancelstate", status);
// pthread_atfork "prepare" hook (registered in __kmp_register_atfork):
// acquires the initz lock and then the forkjoin lock. Both are released, in
// the opposite order, by the parent and child hooks.
1294static void __kmp_atfork_prepare(
void) {
1295 __kmp_acquire_bootstrap_lock(&__kmp_initz_lock);
1296 __kmp_acquire_bootstrap_lock(&__kmp_forkjoin_lock);
// pthread_atfork "parent" hook: releases the locks taken by
// __kmp_atfork_prepare, in reverse acquisition order.
1299static void __kmp_atfork_parent(
void) {
1300 __kmp_release_bootstrap_lock(&__kmp_forkjoin_lock);
1301 __kmp_release_bootstrap_lock(&__kmp_initz_lock);
// pthread_atfork "child" hook: releases the locks taken by
// __kmp_atfork_prepare and then resets runtime state in the child.
// Visible resets: affinity settings and masks, the monitor/parallel/middle/
// serial/gtid/common/user-lock init flags, the user lock table (non-dynamic
// lock builds), the thread count, the thread and team pools, every
// threadprivate cache pointer on the cache list, __kmp_init_runtime, and four
// bootstrap locks (re-initialized). It ends by clearing
// __kmp_need_register_serial and calling __kmp_serial_initialize().
// NOTE(review): other statements of this function are not visible here.
1307static void __kmp_atfork_child(
void) {
1308 __kmp_release_bootstrap_lock(&__kmp_forkjoin_lock);
1309 __kmp_release_bootstrap_lock(&__kmp_initz_lock);
1316#if KMP_AFFINITY_SUPPORTED
1317#if KMP_OS_LINUX || KMP_OS_FREEBSD || KMP_OS_NETBSD || KMP_OS_DRAGONFLY || \
1321 kmp_set_thread_affinity_mask_initial();
1326 if (__kmp_nested_proc_bind.bind_types != NULL) {
1327 __kmp_nested_proc_bind.bind_types[0] = proc_bind_false;
// Reset every affinity descriptor to its initial value, keeping its env_var.
1329 for (kmp_affinity_t *affinity : __kmp_affinities)
1330 *affinity = KMP_AFFINITY_INIT(affinity->env_var);
1331 __kmp_affin_fullMask =
nullptr;
1332 __kmp_affin_origMask =
nullptr;
1333 __kmp_topology =
nullptr;
1337 __kmp_init_monitor = 0;
1339 __kmp_init_parallel = FALSE;
1340 __kmp_init_middle = FALSE;
1341 __kmp_init_serial = FALSE;
1342 TCW_4(__kmp_init_gtid, FALSE);
1343 __kmp_init_common = FALSE;
1345 TCW_4(__kmp_init_user_locks, FALSE);
1346#if !KMP_USE_DYNAMIC_LOCK
1347 __kmp_user_lock_table.used = 1;
1348 __kmp_user_lock_table.allocated = 0;
1349 __kmp_user_lock_table.table = NULL;
1350 __kmp_lock_blocks = NULL;
1354 TCW_4(__kmp_nth, 0);
1356 __kmp_thread_pool = NULL;
1357 __kmp_thread_pool_insert_pt = NULL;
1358 __kmp_team_pool = NULL;
1362 KA_TRACE(10, (
"__kmp_atfork_child: checking cache address list %p\n",
1363 __kmp_threadpriv_cache_list));
// Walk the list, nulling each referenced cache pointer; the list head is
// advanced as it goes, so the list is empty afterwards.
1365 while (__kmp_threadpriv_cache_list != NULL) {
1367 if (*__kmp_threadpriv_cache_list->addr != NULL) {
1368 KC_TRACE(50, (
"__kmp_atfork_child: zeroing cache at address %p\n",
1369 &(*__kmp_threadpriv_cache_list->addr)));
1371 *__kmp_threadpriv_cache_list->addr = NULL;
1373 __kmp_threadpriv_cache_list = __kmp_threadpriv_cache_list->next;
1376 __kmp_init_runtime = FALSE;
1379 __kmp_init_bootstrap_lock(&__kmp_initz_lock);
1380 __kmp_init_bootstrap_lock(&__kmp_stdio_lock);
1381 __kmp_init_bootstrap_lock(&__kmp_console_lock);
1382 __kmp_init_bootstrap_lock(&__kmp_task_team_lock);
1392 __kmp_need_register_serial = FALSE;
1393 __kmp_serial_initialize();
// Registers the prepare/parent/child fork hooks with pthread_atfork, but only
// while __kmp_need_register_atfork is set; the flag is cleared afterwards so
// the hooks are registered once.
1407void __kmp_register_atfork(
void) {
1408 if (__kmp_need_register_atfork) {
1410 int status = pthread_atfork(__kmp_atfork_prepare, __kmp_atfork_parent,
1411 __kmp_atfork_child);
1412 KMP_CHECK_SYSFAIL(
"pthread_atfork", status);
1414 __kmp_need_register_atfork = FALSE;
// Initializes the shared mutex and condition-variable attribute objects that
// __kmp_suspend_initialize_thread later passes to pthread_mutex_init and
// pthread_cond_init.
1418void __kmp_suspend_initialize(
void) {
1420 status = pthread_mutexattr_init(&__kmp_suspend_mutex_attr);
1421 KMP_CHECK_SYSFAIL(
"pthread_mutexattr_init", status);
1422 status = pthread_condattr_init(&__kmp_suspend_cond_attr);
1423 KMP_CHECK_SYSFAIL(
"pthread_condattr_init", status);
// Ensures th's suspend condition variable and mutex are initialized for the
// current process, using th_suspend_init_count as a small state word:
//   __kmp_fork_count + 1  -> already initialized for the current fork count;
//   -1                    -> another thread is initializing right now.
//   th - thread whose th_suspend_cv / th_suspend_mx are initialized.
// When the count already equals __kmp_fork_count + 1 nothing needs doing
// (the early-exit statement itself is not visible here). When the count is -1
// or the compare-and-store to -1 fails, the caller waits until the count
// reaches the target value. The cond/mutex init followed by the release-store
// of the target value is presumably the branch taken by the thread that won
// the compare-and-store -- confirm.
1426void __kmp_suspend_initialize_thread(kmp_info_t *th) {
1427 int old_value = KMP_ATOMIC_LD_RLX(&th->th.th_suspend_init_count);
1428 int new_value = __kmp_fork_count + 1;
1430 if (old_value == new_value)
1433 if (old_value == -1 || !__kmp_atomic_compare_store(
1434 &th->th.th_suspend_init_count, old_value, -1)) {
1435 while (KMP_ATOMIC_LD_ACQ(&th->th.th_suspend_init_count) != new_value) {
1441 status = pthread_cond_init(&th->th.th_suspend_cv.c_cond,
1442 &__kmp_suspend_cond_attr);
1443 KMP_CHECK_SYSFAIL(
"pthread_cond_init", status);
1444 status = pthread_mutex_init(&th->th.th_suspend_mx.m_mutex,
1445 &__kmp_suspend_mutex_attr);
1446 KMP_CHECK_SYSFAIL(
"pthread_mutex_init", status);
// Publish "initialized" only after both objects exist.
1447 KMP_ATOMIC_ST_REL(&th->th.th_suspend_init_count, new_value);
// Destroys th's suspend condition variable and mutex if they were initialized
// for the current fork count (init count greater than __kmp_fork_count), then
// decrements the init count.
//   th - thread whose th_suspend_cv / th_suspend_mx are destroyed.
// EBUSY from either destroy call is tolerated; other non-zero statuses are
// reported through KMP_SYSFAIL.
1451void __kmp_suspend_uninitialize_thread(kmp_info_t *th) {
1452 if (KMP_ATOMIC_LD_ACQ(&th->th.th_suspend_init_count) > __kmp_fork_count) {
1457 status = pthread_cond_destroy(&th->th.th_suspend_cv.c_cond);
1458 if (status != 0 && status != EBUSY) {
1459 KMP_SYSFAIL(
"pthread_cond_destroy", status);
1461 status = pthread_mutex_destroy(&th->th.th_suspend_mx.m_mutex);
1462 if (status != 0 && status != EBUSY) {
1463 KMP_SYSFAIL(
"pthread_mutex_destroy", status);
1465 --th->th.th_suspend_init_count;
1466 KMP_DEBUG_ASSERT(KMP_ATOMIC_LD_RLX(&th->th.th_suspend_init_count) ==
// Non-blocking attempt to take th's suspend mutex.
// Returns non-zero when pthread_mutex_trylock succeeded, 0 otherwise.
1472int __kmp_try_suspend_mx(kmp_info_t *th) {
1473 return (pthread_mutex_trylock(&th->th.th_suspend_mx.m_mutex) == 0);
// Locks th's suspend mutex; the pthread status goes through
// KMP_CHECK_SYSFAIL.
1476void __kmp_lock_suspend_mx(kmp_info_t *th) {
1477 int status = pthread_mutex_lock(&th->th.th_suspend_mx.m_mutex);
1478 KMP_CHECK_SYSFAIL(
"pthread_mutex_lock", status);
// Unlocks th's suspend mutex; the pthread status goes through
// KMP_CHECK_SYSFAIL.
1481void __kmp_unlock_suspend_mx(kmp_info_t *th) {
1482 int status = pthread_mutex_unlock(&th->th.th_suspend_mx.m_mutex);
1483 KMP_CHECK_SYSFAIL(
"pthread_mutex_unlock", status);
// Suspends thread `th_gtid` on its suspend condition variable for as long as
// the sleep bit of `flag` stays set.
//   th_gtid - index into __kmp_threads of the thread being suspended.
//   flag    - flag object the thread sleeps on; its sleep bit is set here and
//             the flag is recorded in th_sleep_loc / th_sleep_loc_type.
// The thread's suspend mutex is taken before the sleep bit is set and is held
// across the condition wait.
1489static inline void __kmp_suspend_template(
int th_gtid, C *flag) {
1490 KMP_TIME_DEVELOPER_PARTITIONED_BLOCK(USER_suspend);
1491 kmp_info_t *th = __kmp_threads[th_gtid];
1493 typename C::flag_t old_spin;
1495 KF_TRACE(30, (
"__kmp_suspend_template: T#%d enter for flag = %p\n", th_gtid,
1498 __kmp_suspend_initialize_thread(th);
1500 __kmp_lock_suspend_mx(th);
1502 KF_TRACE(10, (
"__kmp_suspend_template: T#%d setting sleep bit for spin(%p)\n",
1503 th_gtid, flag->get()));
// Set the sleep bit, keep the previous flag value, and record where this
// thread sleeps.
1507 old_spin = flag->set_sleeping();
1508 TCW_PTR(th->th.th_sleep_loc, (
void *)flag);
1509 th->th.th_sleep_loc_type = flag->get_type();
// With the maximum blocktime and no soft pause, undo the sleep bit and
// release the mutex instead of sleeping.
1510 if (__kmp_dflt_blocktime == KMP_MAX_BLOCKTIME &&
1511 __kmp_pause_status != kmp_soft_paused) {
1512 flag->unset_sleeping();
1513 TCW_PTR(th->th.th_sleep_loc, NULL);
1514 th->th.th_sleep_loc_type = flag_unset;
1515 __kmp_unlock_suspend_mx(th);
1518 KF_TRACE(5, (
"__kmp_suspend_template: T#%d set sleep bit for spin(%p)==%x,"
1520 th_gtid, flag->get(), flag->load(), old_spin));
// The flag was already satisfied: clear the sleep bit again, no sleep needed.
1522 if (flag->done_check_val(old_spin) || flag->done_check()) {
1523 flag->unset_sleeping();
1524 TCW_PTR(th->th.th_sleep_loc, NULL);
1525 th->th.th_sleep_loc_type = flag_unset;
1526 KF_TRACE(5, (
"__kmp_suspend_template: T#%d false alarm, reset sleep bit "
1528 th_gtid, flag->get()));
1533 int deactivated = FALSE;
// Wait in a loop: the sleep bit is re-checked after every wakeup.
1535 while (flag->is_sleeping()) {
1538 __kmp_suspend_count++;
1539 __kmp_print_cond(buffer, &th->th.th_suspend_cv);
1540 __kmp_printf(
"__kmp_suspend_template: suspending T#%d: %s\n", th_gtid,
// Mark the thread inactive and, when it was counted as active in the pool,
// remove it from the active-thread count.
1546 th->th.th_active = FALSE;
1547 if (th->th.th_active_in_pool) {
1548 th->th.th_active_in_pool = FALSE;
1549 KMP_ATOMIC_DEC(&__kmp_thread_pool_active_nth);
1550 KMP_DEBUG_ASSERT(TCR_4(__kmp_thread_pool_active_nth) >= 0);
1555 KMP_DEBUG_ASSERT(th->th.th_sleep_loc);
1556 KMP_DEBUG_ASSERT(flag->get_type() == th->th.th_sleep_loc_type);
1558#if USE_SUSPEND_TIMEOUT
1559 struct timespec now;
1560 struct timeval tval;
1563 status = gettimeofday(&tval, NULL);
1564 KMP_CHECK_SYSFAIL_ERRNO(
"gettimeofday", status);
1565 TIMEVAL_TO_TIMESPEC(&tval, &now);
// Absolute deadline = now + msecs.
1567 msecs = (4 * __kmp_dflt_blocktime) + 200;
1568 now.tv_sec += msecs / 1000;
// The millisecond remainder is converted to nanoseconds (1 ms == 1000000 ns);
// the previous factor of 1000 produced microseconds and shortened the wait.
1569 now.tv_nsec += (msecs % 1000) * 1000000;
// pthread_cond_timedwait rejects tv_nsec >= 1e9 with EINVAL, so carry the
// overflow into tv_sec.
if (now.tv_nsec >= 1000000000) {
now.tv_sec += 1;
now.tv_nsec -= 1000000000;
}
1571 KF_TRACE(15, (
"__kmp_suspend_template: T#%d about to perform "
1572 "pthread_cond_timedwait\n",
1574 status = pthread_cond_timedwait(&th->th.th_suspend_cv.c_cond,
1575 &th->th.th_suspend_mx.m_mutex, &now);
1577 KF_TRACE(15, (
"__kmp_suspend_template: T#%d about to perform"
1578 " pthread_cond_wait\n",
1580 status = pthread_cond_wait(&th->th.th_suspend_cv.c_cond,
1581 &th->th.th_suspend_mx.m_mutex);
// EINTR and ETIMEDOUT are expected outcomes; anything else is fatal.
1584 if ((status != 0) && (status != EINTR) && (status != ETIMEDOUT)) {
1585 KMP_SYSFAIL(
"pthread_cond_wait", status);
1588 KMP_DEBUG_ASSERT(flag->get_type() == flag->get_ptr_type());
1590 if (!flag->is_sleeping() &&
1591 ((status == EINTR) || (status == ETIMEDOUT))) {
1595 flag->unset_sleeping();
1596 TCW_PTR(th->th.th_sleep_loc, NULL);
1597 th->th.th_sleep_loc_type = flag_unset;
1600 if (status == ETIMEDOUT) {
1601 if (flag->is_sleeping()) {
1603 (
"__kmp_suspend_template: T#%d timeout wakeup\n", th_gtid));
1605 KF_TRACE(2, (
"__kmp_suspend_template: T#%d timeout wakeup, sleep bit "
1608 TCW_PTR(th->th.th_sleep_loc, NULL);
1609 th->th.th_sleep_loc_type = flag_unset;
1611 }
else if (flag->is_sleeping()) {
1613 (
"__kmp_suspend_template: T#%d spurious wakeup\n", th_gtid));
// Awake again: mark the thread active and, when it is in the pool, count it
// as an active pool thread.
1620 th->th.th_active = TRUE;
1621 if (TCR_4(th->th.th_in_pool)) {
1622 KMP_ATOMIC_INC(&__kmp_thread_pool_active_nth);
1623 th->th.th_active_in_pool = TRUE;
1629 TCW_PTR(th->th.th_sleep_loc, NULL);
1630 th->th.th_sleep_loc_type = flag_unset;
1632 KMP_DEBUG_ASSERT(!flag->is_sleeping());
1633 KMP_DEBUG_ASSERT(!th->th.th_sleep_loc);
1637 __kmp_print_cond(buffer, &th->th.th_suspend_cv);
1638 __kmp_printf(
"__kmp_suspend_template: T#%d has awakened: %s\n", th_gtid,
1643 __kmp_unlock_suspend_mx(th);
1644 KF_TRACE(30, (
"__kmp_suspend_template: T#%d exit\n", th_gtid));
1647template <
bool C,
bool S>
1648void __kmp_suspend_32(
int th_gtid, kmp_flag_32<C, S> *flag) {
1649 __kmp_suspend_template(th_gtid, flag);
1651template <
bool C,
bool S>
1652void __kmp_suspend_64(
int th_gtid, kmp_flag_64<C, S> *flag) {
1653 __kmp_suspend_template(th_gtid, flag);
1655template <
bool C,
bool S>
1656void __kmp_atomic_suspend_64(
int th_gtid, kmp_atomic_flag_64<C, S> *flag) {
1657 __kmp_suspend_template(th_gtid, flag);
1659void __kmp_suspend_oncore(
int th_gtid, kmp_flag_oncore *flag) {
1660 __kmp_suspend_template(th_gtid, flag);
// Explicit instantiations of the suspend entry points for the listed
// <C, S> template-argument combinations.
1663template void __kmp_suspend_32<false, false>(
int, kmp_flag_32<false, false> *);
1664template void __kmp_suspend_64<false, true>(
int, kmp_flag_64<false, true> *);
1665template void __kmp_suspend_64<true, false>(
int, kmp_flag_64<true, false> *);
1667__kmp_atomic_suspend_64<false, true>(
int, kmp_atomic_flag_64<false, true> *);
1669__kmp_atomic_suspend_64<true, false>(
int, kmp_atomic_flag_64<true, false> *);
// Wakes thread `target_gtid` if it is sleeping on a flag.
//   target_gtid - index into __kmp_threads of the thread to wake.
//   flag        - flag the target is expected to sleep on; when it is NULL or
//                 differs from the target's th_sleep_loc, the recorded
//                 th_sleep_loc is used instead.
// Everything happens under the target's suspend mutex: the sleep bit is
// cleared, th_sleep_loc is reset, and the target's condition variable is
// signaled.
1675static inline void __kmp_resume_template(
int target_gtid, C *flag) {
1676 KMP_TIME_DEVELOPER_PARTITIONED_BLOCK(USER_resume);
1677 kmp_info_t *th = __kmp_threads[target_gtid];
// gtid of the calling thread, or -1 while __kmp_init_gtid is not set.
1681 int gtid = TCR_4(__kmp_init_gtid) ? __kmp_get_gtid() : -1;
1684 KF_TRACE(30, (
"__kmp_resume_template: T#%d wants to wakeup T#%d enter\n",
1685 gtid, target_gtid));
1686 KMP_DEBUG_ASSERT(gtid != target_gtid);
1688 __kmp_suspend_initialize_thread(th);
1690 __kmp_lock_suspend_mx(th);
// Fall back to the location the target itself recorded.
1692 if (!flag || flag != th->th.th_sleep_loc) {
1695 flag = (C *)CCAST(
void *, th->th.th_sleep_loc);
1701 KF_TRACE(5, (
"__kmp_resume_template: T#%d exiting, thread T#%d already "
1702 "awake: flag(%p)\n",
1703 gtid, target_gtid, (
void *)NULL));
1704 __kmp_unlock_suspend_mx(th);
// The flag's type differs from the recorded sleep-location type: release the
// mutex and go through __kmp_null_resume_wrapper.
1706 }
else if (flag->get_type() != th->th.th_sleep_loc_type) {
1711 (
"__kmp_resume_template: T#%d retrying, thread T#%d Mismatch flag(%p), "
1712 "spin(%p) type=%d ptr_type=%d\n",
1713 gtid, target_gtid, flag, flag->get(), flag->get_type(),
1714 th->th.th_sleep_loc_type));
1715 __kmp_unlock_suspend_mx(th);
1716 __kmp_null_resume_wrapper(th);
// Sleep bit already clear: the target is awake.
1720 if (!flag->is_sleeping()) {
1721 KF_TRACE(5, (
"__kmp_resume_template: T#%d exiting, thread T#%d already "
1722 "awake: flag(%p): %u\n",
1723 gtid, target_gtid, flag->get(), (
unsigned int)flag->load()));
1724 __kmp_unlock_suspend_mx(th);
// Clear the sleep bit and the recorded sleep location before signaling.
1728 KMP_DEBUG_ASSERT(flag);
1729 flag->unset_sleeping();
1730 TCW_PTR(th->th.th_sleep_loc, NULL);
1731 th->th.th_sleep_loc_type = flag_unset;
1733 KF_TRACE(5, (
"__kmp_resume_template: T#%d about to wakeup T#%d, reset "
1734 "sleep bit for flag's loc(%p): %u\n",
1735 gtid, target_gtid, flag->get(), (
unsigned int)flag->load()));
1740 __kmp_print_cond(buffer, &th->th.th_suspend_cv);
1741 __kmp_printf(
"__kmp_resume_template: T#%d resuming T#%d: %s\n", gtid,
1742 target_gtid, buffer);
// Signal while still holding the target's suspend mutex, then release it.
1745 status = pthread_cond_signal(&th->th.th_suspend_cv.c_cond);
1746 KMP_CHECK_SYSFAIL(
"pthread_cond_signal", status);
1747 __kmp_unlock_suspend_mx(th);
1748 KF_TRACE(30, (
"__kmp_resume_template: T#%d exiting after signaling wake up"
1750 gtid, target_gtid));
1753template <
bool C,
bool S>
1754void __kmp_resume_32(
int target_gtid, kmp_flag_32<C, S> *flag) {
1755 __kmp_resume_template(target_gtid, flag);
1757template <
bool C,
bool S>
1758void __kmp_resume_64(
int target_gtid, kmp_flag_64<C, S> *flag) {
1759 __kmp_resume_template(target_gtid, flag);
1761template <
bool C,
bool S>
1762void __kmp_atomic_resume_64(
int target_gtid, kmp_atomic_flag_64<C, S> *flag) {
1763 __kmp_resume_template(target_gtid, flag);
1765void __kmp_resume_oncore(
int target_gtid, kmp_flag_oncore *flag) {
1766 __kmp_resume_template(target_gtid, flag);
// Explicit instantiations of the resume entry points for the listed
// <C, S> template-argument combinations.
1769template void __kmp_resume_32<false, true>(
int, kmp_flag_32<false, true> *);
1770template void __kmp_resume_32<false, false>(
int, kmp_flag_32<false, false> *);
1771template void __kmp_resume_64<false, true>(
int, kmp_flag_64<false, true> *);
1773__kmp_atomic_resume_64<false, true>(
int, kmp_atomic_flag_64<false, true> *);
// Signals the condition variable __kmp_wait_cv while holding __kmp_wait_mx.
// The trace messages identify the signaled thread as KMP_GTID_MONITOR.
1776void __kmp_resume_monitor() {
1777 KMP_TIME_DEVELOPER_PARTITIONED_BLOCK(USER_resume);
// gtid of the calling thread, or -1 while __kmp_init_gtid is not set.
1780 int gtid = TCR_4(__kmp_init_gtid) ? __kmp_get_gtid() : -1;
1781 KF_TRACE(30, (
"__kmp_resume_monitor: T#%d wants to wakeup T#%d enter\n", gtid,
1783 KMP_DEBUG_ASSERT(gtid != KMP_GTID_MONITOR);
1785 status = pthread_mutex_lock(&__kmp_wait_mx.m_mutex);
1786 KMP_CHECK_SYSFAIL(
"pthread_mutex_lock", status);
1790 __kmp_print_cond(buffer, &__kmp_wait_cv.c_cond);
1791 __kmp_printf(
"__kmp_resume_monitor: T#%d resuming T#%d: %s\n", gtid,
1792 KMP_GTID_MONITOR, buffer);
// Signal under the mutex, then release it.
1795 status = pthread_cond_signal(&__kmp_wait_cv.c_cond);
1796 KMP_CHECK_SYSFAIL(
"pthread_cond_signal", status);
1797 status = pthread_mutex_unlock(&__kmp_wait_mx.m_mutex);
1798 KMP_CHECK_SYSFAIL(
"pthread_mutex_unlock", status);
1799 KF_TRACE(30, (
"__kmp_resume_monitor: T#%d exiting after signaling wake up"
1801 gtid, KMP_GTID_MONITOR));
// Yields the processor by calling sched_yield(); its result is ignored.
void __kmp_yield() {
  (void)sched_yield();
}
// Stores `gtid` in the calling thread's slot of __kmp_gtid_threadprivate_key.
// The stored value is gtid + 1, cast to a pointer.
// NOTE(review): the +1 presumably keeps gtid 0 distinct from an unset (NULL)
// slot - confirm.
1807void __kmp_gtid_set_specific(
int gtid) {
// Only touch the key while __kmp_init_gtid is set.
1808 if (__kmp_init_gtid) {
1810 status = pthread_setspecific(__kmp_gtid_threadprivate_key,
1811 (
void *)(intptr_t)(gtid + 1));
1812 KMP_CHECK_SYSFAIL(
"pthread_setspecific", status);
1814 KA_TRACE(50, (
"__kmp_gtid_set_specific: runtime shutdown, returning\n"));
// Reads the calling thread's value from __kmp_gtid_threadprivate_key.
// Returns KMP_GTID_SHUTDOWN when __kmp_init_gtid is not set.
1818int __kmp_gtid_get_specific() {
1820 if (!__kmp_init_gtid) {
1821 KA_TRACE(50, (
"__kmp_gtid_get_specific: runtime shutdown, returning "
1822 "KMP_GTID_SHUTDOWN\n"));
1823 return KMP_GTID_SHUTDOWN;
// The slot value is a pointer-sized integer narrowed to int.
1825 gtid = (int)(
size_t)pthread_getspecific(__kmp_gtid_threadprivate_key);
// NOTE(review): KMP_GTID_DNE is presumably assigned when the slot is empty;
// the guarding condition is not visible here - confirm.
1827 gtid = KMP_GTID_DNE;
1831 KA_TRACE(50, (
"__kmp_gtid_get_specific: key:%d gtid:%d\n",
1832 __kmp_gtid_threadprivate_key, gtid));
// Returns the user CPU time, in seconds, consumed by this process plus its
// waited-for children (tms_utime + tms_cutime).
double __kmp_read_cpu_time(void) {
  struct tms buffer;

  times(&buffer);

  // times() counts in clock ticks whose rate is sysconf(_SC_CLK_TCK), not
  // CLOCKS_PER_SEC (that constant scales clock()). Dividing by CLOCKS_PER_SEC
  // under-reports the time wherever the two rates differ.
  long ticks_per_sec = sysconf(_SC_CLK_TCK);
  if (ticks_per_sec <= 0) {
    // Tick rate unavailable: keep the historical divisor.
    ticks_per_sec = (long)CLOCKS_PER_SEC;
  }

  return (double)(buffer.tms_utime + buffer.tms_cutime) /
         (double)ticks_per_sec;
}
// Fills *info with resource-usage figures for the current process.
//   info - output structure; zeroed first, then populated from
//          getrusage(RUSAGE_SELF).
// Returns nonzero when getrusage reported a failure, zero otherwise.
1846int __kmp_read_system_info(
struct kmp_sys_info *info) {
1848 struct rusage r_usage;
1850 memset(info, 0,
sizeof(*info));
1852 status = getrusage(RUSAGE_SELF, &r_usage);
1853 KMP_CHECK_SYSFAIL_ERRNO(
"getrusage", status);
// Copy the rusage fields one-to-one into the runtime's own structure.
1857 info->maxrss = r_usage.ru_maxrss;
1859 info->minflt = r_usage.ru_minflt;
1861 info->majflt = r_usage.ru_majflt;
1863 info->nswap = r_usage.ru_nswap;
1865 info->inblock = r_usage.ru_inblock;
1867 info->oublock = r_usage.ru_oublock;
1869 info->nvcsw = r_usage.ru_nvcsw;
1871 info->nivcsw = r_usage.ru_nivcsw;
1874 return (status != 0);
// Stores in *delta the wall-clock time, in seconds, elapsed since the start
// point kept in __kmp_sys_timer_data.start.
1877void __kmp_read_system_time(
double *delta) {
1879 struct timeval tval;
1880 struct timespec stop;
1883 status = gettimeofday(&tval, NULL);
1884 KMP_CHECK_SYSFAIL_ERRNO(
"gettimeofday", status);
1885 TIMEVAL_TO_TIMESPEC(&tval, &stop);
// Difference in nanoseconds, then scaled to seconds.
1886 t_ns = (double)(TS2NS(stop) - TS2NS(__kmp_sys_timer_data.start));
1887 *delta = (t_ns * 1e-9);
// Records the current gettimeofday() time in __kmp_sys_timer_data.start, the
// reference point that __kmp_read_system_time measures from.
1890void __kmp_clear_system_time(
void) {
1891 struct timeval tval;
1893 status = gettimeofday(&tval, NULL);
1894 KMP_CHECK_SYSFAIL_ERRNO(
"gettimeofday", status);
1895 TIMEVAL_TO_TIMESPEC(&tval, &__kmp_sys_timer_data.start);
// Returns a processor count for the machine, using a per-OS query selected by
// the preprocessor. Falls back to 2 when the query yields no positive value.
1898static int __kmp_get_xproc(
void) {
// This branch asks sysconf for the number of configured processors.
1904 __kmp_type_convert(sysconf(_SC_NPROCESSORS_CONF), &(r));
// These systems ask sysconf for the number of online processors instead.
1906#elif KMP_OS_DRAGONFLY || KMP_OS_FREEBSD || KMP_OS_NETBSD || KMP_OS_OPENBSD || \
1907 KMP_OS_HAIKU || KMP_OS_HURD || KMP_OS_SOLARIS || KMP_OS_WASI || KMP_OS_AIX
1909 __kmp_type_convert(sysconf(_SC_NPROCESSORS_ONLN), &(r));
// This branch reads the "hw.logicalcpu" sysctl; its result is not checked.
1913 size_t len =
sizeof(r);
1914 sysctlbyname(
"hw.logicalcpu", &r, &len, NULL, 0);
1918#error "Unknown or unsupported OS."
1922 return r > 0 ? r : 2;
// Opens `path` and parses its contents with a scanf-style `format`.
//   path   - file to open (opened in "rb" mode).
//   format - vfscanf format string; the variadic arguments receive the
//            converted values.
// `result` holds the vfscanf return value.
// NOTE(review): presumably `result` is what the function returns - confirm.
1926int __kmp_read_from_file(
char const *path,
char const *format, ...) {
1930 va_start(args, format);
1931 FILE *f = fopen(path,
"rb");
1936 result = vfscanf(f, format, args);
// One-time, OS-level initialization of the runtime: processor count, stack
// size, thread limits, the gtid thread-specific key, and the __kmp_wait_mx /
// __kmp_wait_cv pair. Guarded by __kmp_init_runtime, which is set to TRUE
// at the end.
1943void __kmp_runtime_initialize(
void) {
1945 pthread_mutexattr_t mutex_attr;
1946 pthread_condattr_t cond_attr;
1948 if (__kmp_init_runtime) {
// On x86 / x86-64, fill in __kmp_cpuinfo if that has not been done yet.
1952#if (KMP_ARCH_X86 || KMP_ARCH_X86_64)
1953 if (!__kmp_cpuinfo.initialized) {
1954 __kmp_query_cpuid(&__kmp_cpuinfo);
1958 __kmp_xproc = __kmp_get_xproc();
// Take the stack size from the current RLIMIT_STACK soft limit.
1964 status = getrlimit(RLIMIT_STACK, &rlim);
1966 __kmp_stksize = rlim.rlim_cur;
1967 __kmp_check_stksize(&__kmp_stksize);
1971 if (sysconf(_SC_THREADS)) {
// Thread limit: start from sysconf(_SC_THREAD_THREADS_MAX); -1 and values
// <= 1 are replaced by the constants assigned below.
1974 __kmp_type_convert(sysconf(_SC_THREAD_THREADS_MAX), &(__kmp_sys_max_nth));
1976 if (__kmp_sys_max_nth == -1) {
1979 __kmp_sys_max_nth = KMP_MAX_NTH;
1982 if (__kmp_sys_max_nth == -1) {
1984 __kmp_sys_max_nth = INT_MAX;
1985 }
else if (__kmp_sys_max_nth <= 1) {
1987 __kmp_sys_max_nth = KMP_MAX_NTH;
// Minimum thread stack size, with KMP_MIN_STKSIZE as the fallback.
1992 __kmp_sys_min_stksize = sysconf(_SC_THREAD_STACK_MIN);
1993 if (__kmp_sys_min_stksize <= 1) {
1994 __kmp_sys_min_stksize = KMP_MIN_STKSIZE;
1999 __kmp_tls_gtid_min = KMP_TLS_GTID_MIN;
// Thread-specific key for the gtid; __kmp_internal_end_dest is registered as
// the key's destructor.
2001 status = pthread_key_create(&__kmp_gtid_threadprivate_key,
2002 __kmp_internal_end_dest);
2003 KMP_CHECK_SYSFAIL(
"pthread_key_create", status);
// Create __kmp_wait_mx and __kmp_wait_cv; each temporary attribute object is
// destroyed right after use.
2004 status = pthread_mutexattr_init(&mutex_attr);
2005 KMP_CHECK_SYSFAIL(
"pthread_mutexattr_init", status);
2006 status = pthread_mutex_init(&__kmp_wait_mx.m_mutex, &mutex_attr);
2007 KMP_CHECK_SYSFAIL(
"pthread_mutex_init", status);
2008 status = pthread_mutexattr_destroy(&mutex_attr);
2009 KMP_CHECK_SYSFAIL(
"pthread_mutexattr_destroy", status);
2010 status = pthread_condattr_init(&cond_attr);
2011 KMP_CHECK_SYSFAIL(
"pthread_condattr_init", status);
2012 status = pthread_cond_init(&__kmp_wait_cv.c_cond, &cond_attr);
2013 KMP_CHECK_SYSFAIL(
"pthread_cond_init", status);
2014 status = pthread_condattr_destroy(&cond_attr);
2015 KMP_CHECK_SYSFAIL(
"pthread_condattr_destroy", status);
2017 __kmp_itt_initialize();
2020 __kmp_init_runtime = TRUE;
// Tears down what __kmp_runtime_initialize set up: the gtid key and the
// __kmp_wait_mx / __kmp_wait_cv pair. Guarded by __kmp_init_runtime, which is
// reset to FALSE at the end.
2023void __kmp_runtime_destroy(
void) {
2026 if (!__kmp_init_runtime) {
2031 __kmp_itt_destroy();
2034 status = pthread_key_delete(__kmp_gtid_threadprivate_key);
2035 KMP_CHECK_SYSFAIL(
"pthread_key_delete", status);
// EBUSY from either destroy call is tolerated; other failures are fatal.
2037 status = pthread_mutex_destroy(&__kmp_wait_mx.m_mutex);
2038 if (status != 0 && status != EBUSY) {
2039 KMP_SYSFAIL(
"pthread_mutex_destroy", status);
2041 status = pthread_cond_destroy(&__kmp_wait_cv.c_cond);
2042 if (status != 0 && status != EBUSY) {
2043 KMP_SYSFAIL(
"pthread_cond_destroy", status);
2045#if KMP_AFFINITY_SUPPORTED
2046 __kmp_affinity_uninitialize();
2049 __kmp_init_runtime = FALSE;
// Sleeps for `millis` milliseconds, rounded to the nearest whole second
// because sleep() only accepts seconds (values below 500 ms do not sleep).
void __kmp_thread_sleep(int millis) {
  const int whole_seconds = (millis + 500) / 1000;
  sleep(whole_seconds);
}
// Stores a timestamp, in seconds as a double, into *t.
// Two variants are visible: one based on
// clock_gettime(CLOCK_PROCESS_CPUTIME_ID) and one based on gettimeofday().
// NOTE(review): the preprocessor condition choosing between them is not
// visible here.
2057void __kmp_elapsed(
double *t) {
2062 status = clock_gettime(CLOCK_PROCESS_CPUTIME_ID, &ts);
2063 KMP_CHECK_SYSFAIL_ERRNO(
"clock_gettime", status);
// seconds + nanoseconds scaled to seconds
2065 (double)ts.tv_nsec * (1.0 / (
double)KMP_NSEC_PER_SEC) + (
double)ts.tv_sec;
2069 status = gettimeofday(&tv, NULL);
2070 KMP_CHECK_SYSFAIL_ERRNO(
"gettimeofday", status);
// seconds + microseconds scaled to seconds
2072 (double)tv.tv_usec * (1.0 / (
double)KMP_USEC_PER_SEC) + (
double)tv.tv_sec;
// Stores into *t the length of one CLOCKS_PER_SEC tick, in seconds.
void __kmp_elapsed_tick(double *t) {
  const double ticks_per_second = (double)CLOCKS_PER_SEC;
  *t = 1 / ticks_per_second;
}
// Computes the current gettimeofday() time in nanoseconds:
// seconds * KMP_NSEC_PER_SEC + microseconds * 1000.
// The gettimeofday() result is not checked.
2080kmp_uint64 __kmp_now_nsec() {
2082 gettimeofday(&t, NULL);
2083 kmp_uint64 nsec = (kmp_uint64)KMP_NSEC_PER_SEC * (kmp_uint64)t.tv_sec +
2084 (kmp_uint64)1000 * (kmp_uint64)t.tv_usec;
2088#if KMP_ARCH_X86 || KMP_ARCH_X86_64
// Calibrates __kmp_ticks_per_msec / __kmp_ticks_per_usec by spinning for
// `delay` hardware-timestamp ticks and measuring how many nanoseconds of
// __kmp_now_nsec() time passed meanwhile.
2090void __kmp_initialize_system_tick() {
2091 kmp_uint64 now, nsec2, diff;
2092 kmp_uint64 delay = 1000000;
2093 kmp_uint64 nsec = __kmp_now_nsec();
2094 kmp_uint64 goal = __kmp_hardware_timestamp() + delay;
// Busy-wait until the hardware timestamp reaches the goal.
2095 while ((now = __kmp_hardware_timestamp()) < goal)
2097 nsec2 = __kmp_now_nsec();
2098 diff = nsec2 - nsec;
// Ticks per microsecond = 1000 * elapsed ticks / elapsed nanoseconds, where
// elapsed ticks = delay plus the overshoot past the goal.
2100 double tpus = 1000.0 * (double)(delay + (now - goal)) / (
double)diff;
2102 __kmp_ticks_per_msec = (kmp_uint64)(tpus * 1000.0);
2103 __kmp_ticks_per_usec = (kmp_uint64)tpus;
// Determines whether `addr` lies inside a region of the current process's
// address space; most per-OS branches also require the region to be readable
// and writable. Each OS has its own implementation, selected by the
// preprocessor.
//   addr - address to look up.
// NOTE(review): the result is presumably returned through `found` (see the
// wasm branch); the return statement is not visible here.
//
// Range checks use the half-open interval [start, end) on every platform.
2112int __kmp_is_address_mapped(
void *addr) {
// Linux / Hurd: scan /proc/<pid>/maps line by line.
2117#if KMP_OS_LINUX || KMP_OS_HURD
2122 char *name = __kmp_str_format(
"/proc/%d/maps", getpid());
2125 file = fopen(name,
"r");
2126 KMP_ASSERT(file != NULL);
2130 void *beginning = NULL;
2131 void *ending = NULL;
2134 rc = fscanf(file,
"%p-%p %4s %*[^\n]\n", &beginning, &ending, perms);
2138 KMP_ASSERT(rc == 3 &&
2139 KMP_STRLEN(perms) == 4);
2142 if ((addr >= beginning) && (addr < ending)) {
2144 if (strcmp(perms,
"rw") == 0) {
2154 KMP_INTERNAL_FREE(name);
// KERN_PROC_VMMAP sysctl branch: query the size, over-allocate by 4/3, then
// fetch the entries and walk them by their kve_structsize.
2158 int mib[] = {CTL_KERN, KERN_PROC, KERN_PROC_VMMAP, getpid()};
2159 rc = sysctl(mib, 4, NULL, &lstsz, NULL, 0);
2164 lstsz = lstsz * 4 / 3;
2165 buf =
reinterpret_cast<char *
>(KMP_INTERNAL_MALLOC(lstsz));
2166 rc = sysctl(mib, 4, buf, &lstsz, NULL, 0);
2168 KMP_INTERNAL_FREE(buf);
2173 char *up = buf + lstsz;
2176 struct kinfo_vmentry *cur =
reinterpret_cast<struct kinfo_vmentry *
>(lw);
2177 size_t cursz = cur->kve_structsize;
2180 void *start =
reinterpret_cast<void *
>(cur->kve_start);
2181 void *end =
reinterpret_cast<void *
>(cur->kve_end);
2183 if ((addr >= start) && (addr < end)) {
2184 if ((cur->kve_protection & KVME_PROT_READ) != 0 &&
2185 (cur->kve_protection & KVME_PROT_WRITE) != 0) {
2192 KMP_INTERNAL_FREE(buf);
// DragonFly: walk the process's VM map entries through libkvm.
2193#elif KMP_OS_DRAGONFLY
2194 char err[_POSIX2_LINE_MAX];
2198 vm_map_entry entry, *c;
2204 fd = kvm_openfiles(
nullptr,
nullptr,
nullptr, O_RDONLY, err);
2209 proc = kvm_getprocs(fd, KERN_PROC_PID, getpid(), &num);
2211 if (kvm_read(fd,
static_cast<uintptr_t
>(proc->kp_paddr), &p,
sizeof(p)) !=
2213 kvm_read(fd,
reinterpret_cast<uintptr_t
>(p.p_vmspace), &sp,
sizeof(sp)) !=
2221 uaddr =
reinterpret_cast<uintptr_t
>(addr);
2222 for (c = kvm_vm_map_entry_first(fd, cur, &entry); c;
2223 c = kvm_vm_map_entry_next(fd, c, &entry)) {
// The end address is exclusive, matching the other branches (was `<=`).
2224 if ((uaddr >= entry.ba.start) && (uaddr < entry.ba.end)) {
2225 if ((entry.protection & VM_PROT_READ) != 0 &&
2226 (entry.protection & VM_PROT_WRITE) != 0) {
// Solaris: read the prmap_t array from /proc/<pid>/map.
2242 pid_t pid = getpid();
2243 struct ps_prochandle *fd = Pgrab(pid, PGRAB_RDONLY, &err);
2250 char *name = __kmp_str_format(
"/proc/%d/map", pid);
2251 size_t sz = (1 << 20);
2252 file = open(name, O_RDONLY);
2254 KMP_INTERNAL_FREE(name);
2258 buf = KMP_INTERNAL_MALLOC(sz);
2260 while (sz > 0 && (rd = pread(file, buf, sz, 0)) == sz) {
2263 newbuf = KMP_INTERNAL_REALLOC(buf, sz);
2267 map =
reinterpret_cast<prmap_t *
>(buf);
2268 uaddr =
reinterpret_cast<uintptr_t
>(addr);
// Consume one prmap_t per iteration. The previous `rd = -sizeof(*map)`
// overwrote the remaining byte count, so only the first entry was examined.
2270 for (cur = map; rd > 0; cur++, rd -=
sizeof(*map)) {
// A mapping covers [pr_vaddr, pr_vaddr + pr_size). The previous test compared
// against pr_vaddr on both sides and could never be true.
2271 if ((uaddr >= cur->pr_vaddr) && (uaddr < cur->pr_vaddr + cur->pr_size)) {
2272 if ((cur->pr_mflags & MA_READ) != 0 && (cur->pr_mflags & MA_WRITE) != 0) {
2279 KMP_INTERNAL_FREE(map);
2281 KMP_INTERNAL_FREE(name);
// vm_read_overwrite branch: try to read from `addr` into a local buffer.
2289 rc = vm_read_overwrite(
2291 (vm_address_t)(addr),
2293 (vm_address_t)(&buffer),
// VM_PROC_MAP sysctl branch: fetch an array of kinfo_vmentry records.
2306 mib[2] = VM_PROC_MAP;
2308 mib[4] =
sizeof(
struct kinfo_vmentry);
2311 rc = sysctl(mib, __arraycount(mib), NULL, &size, NULL, 0);
2315 size = size * 4 / 3;
2316 struct kinfo_vmentry *kiv = (
struct kinfo_vmentry *)KMP_INTERNAL_MALLOC(size);
2319 rc = sysctl(mib, __arraycount(mib), kiv, &size, NULL, 0);
// `size` is a byte count, so convert it to an element count before indexing.
2323 for (
size_t i = 0; i < size / sizeof(*kiv); i++) {
// addr is inside the entry when kve_start <= addr < kve_end (the previous
// comparisons were inverted).
2324 if (kiv[i].kve_start <= (uint64_t)addr &&
2325 (uint64_t)addr < kiv[i].kve_end) {
2330 KMP_INTERNAL_FREE(kiv);
// Single-entry KERN_PROC_VMMAP sysctl branch: iterate one kinfo_vmentry at a
// time.
2335 mib[1] = KERN_PROC_VMMAP;
2340 rc = sysctl(mib, 3, NULL, &size, NULL, 0);
2345 struct kinfo_vmentry kiv = {.kve_start = 0};
2347 while ((rc = sysctl(mib, 3, &kiv, &size, NULL, 0)) == 0) {
2349 if (kiv.kve_end == end)
// Same half-open containment test as above (previously inverted).
2352 if (kiv.kve_start <= (uint64_t)addr && (uint64_t)addr < kiv.kve_end) {
// wasm: addr is mapped when it falls below the current linear-memory size.
2359 found = (int)addr < (__builtin_wasm_memory_size(0) * PAGESIZE);
// loadquery branch: fetch the loaded-module list, doubling the buffer while
// the call fails with ENOMEM, then test addr against each module's data range.
2362 uint32_t loadQueryBufSize = 4096u;
2366 loadQueryBuf = (
char *)KMP_INTERNAL_MALLOC(loadQueryBufSize);
2367 if (loadQueryBuf == NULL) {
2371 rc = loadquery(L_GETXINFO | L_IGNOREUNLOAD, loadQueryBuf, loadQueryBufSize);
2373 KMP_INTERNAL_FREE(loadQueryBuf);
2374 if (errno != ENOMEM) {
2378 loadQueryBufSize <<= 1;
2385 struct ld_xinfo *curLdInfo = (
struct ld_xinfo *)loadQueryBuf;
2389 uintptr_t curDataStart = (uintptr_t)curLdInfo->ldinfo_dataorg;
2390 uintptr_t curDataEnd = curDataStart + curLdInfo->ldinfo_datasize;
2393 if (curDataStart <= (uintptr_t)addr && (uintptr_t)addr < curDataEnd) {
// ldinfo_next == 0 marks the last record; otherwise it is the byte offset to
// the next one.
2397 if (curLdInfo->ldinfo_next == 0u) {
2401 curLdInfo = (
struct ld_xinfo *)((
char *)curLdInfo + curLdInfo->ldinfo_next);
2403 KMP_INTERNAL_FREE(loadQueryBuf);
2410#error "Unknown or unsupported OS"
2418#ifdef USE_LOAD_BALANCE
2420#if KMP_OS_DARWIN || KMP_OS_DRAGONFLY || KMP_OS_FREEBSD || KMP_OS_NETBSD || \
2421 KMP_OS_OPENBSD || KMP_OS_SOLARIS
// getloadavg()-based variant: picks the load-average sample according to
// __kmp_load_balance_interval.
//   interval < 180        -> averages[0]
//   180 <= interval < 600 -> averages[1]
//   interval >= 600       -> averages[2]
// A sample is only used when getloadavg() returned enough values (`res`).
// `max` is not referenced in the lines visible here.
2428int __kmp_get_load_balance(
int max) {
2432 int res = getloadavg(averages, 3);
2437 if (__kmp_load_balance_interval < 180 && (res >= 1)) {
2438 ret_avg = (int)averages[0];
2439 }
else if ((__kmp_load_balance_interval >= 180 &&
2440 __kmp_load_balance_interval < 600) &&
2442 ret_avg = (int)averages[1];
2443 }
else if ((__kmp_load_balance_interval >= 600) && (res == 3)) {
2444 ret_avg = (int)averages[2];
// perfstat-based variant: sums the `runque` field of every logical CPU.
//   max - the summation loop checks running_threads >= max after each CPU.
// The result is cached in function-local statics and reused while fewer than
// __kmp_load_balance_interval seconds have passed since the last measurement.
2456int __kmp_get_load_balance(
int max) {
2458 static int glb_running_threads = 0;
2460 static double glb_call_time = 0;
2461 int running_threads = 0;
2463 double call_time = 0.0;
2465 __kmp_elapsed(&call_time);
// Serve the cached value while it is still fresh.
2467 if (glb_call_time &&
2468 (call_time - glb_call_time < __kmp_load_balance_interval))
2469 return glb_running_threads;
2471 glb_call_time = call_time;
// First call with NULL buffers: returns the number of logical CPUs.
2478 int logical_cpus = perfstat_cpu(NULL, NULL,
sizeof(perfstat_cpu_t), 0);
2479 if (logical_cpus <= 0) {
2484 perfstat_cpu_t *cpu_stat = (perfstat_cpu_t *)KMP_INTERNAL_MALLOC(
2485 logical_cpus *
sizeof(perfstat_cpu_t));
2486 if (cpu_stat == NULL) {
// Second call: fetch the statistics, starting from FIRST_CPU.
2493 perfstat_id_t first_cpu_name;
2494 strcpy(first_cpu_name.name, FIRST_CPU);
2497 int rc = perfstat_cpu(&first_cpu_name, cpu_stat,
sizeof(perfstat_cpu_t),
2499 KMP_DEBUG_ASSERT(rc == logical_cpus);
2501 KMP_INTERNAL_FREE(cpu_stat);
2505 for (
int i = 0; i < logical_cpus; ++i) {
2506 running_threads += cpu_stat[i].runque;
2507 if (running_threads >= max)
// Never report fewer than one running thread.
2514 KMP_DEBUG_ASSERT(running_threads > 0);
2515 if (running_threads <= 0)
2516 running_threads = 1;
2518 KMP_INTERNAL_FREE(cpu_stat);
2520 glb_running_threads = running_threads;
2522 return running_threads;
// /proc-based variant: walks /proc/<pid>/task/<tid>/stat for every process
// and inspects the state character that follows ") " in each stat file.
//   max - the scan checks running_threads >= max while iterating.
// Returns the running-thread count (at least 1), or -1 when /proc cannot be
// used; a permanent failure is remembered in `permanent_error`. The result is
// cached and reused while fewer than __kmp_load_balance_interval seconds have
// passed since the last measurement.
2531int __kmp_get_load_balance(
int max) {
2532 static int permanent_error = 0;
2533 static int glb_running_threads = 0;
2535 static double glb_call_time = 0;
2537 int running_threads = 0;
2539 DIR *proc_dir = NULL;
2540 struct dirent *proc_entry = NULL;
2542 kmp_str_buf_t task_path;
2543 DIR *task_dir = NULL;
2544 struct dirent *task_entry = NULL;
2545 int task_path_fixed_len;
2547 kmp_str_buf_t stat_path;
2549 int stat_path_fixed_len;
2552 int total_processes = 0;
2555 double call_time = 0.0;
2557 __kmp_str_buf_init(&task_path);
2558 __kmp_str_buf_init(&stat_path);
2560 __kmp_elapsed(&call_time);
// Serve the cached value while it is still fresh.
2562 if (glb_call_time &&
2563 (call_time - glb_call_time < __kmp_load_balance_interval)) {
2564 running_threads = glb_running_threads;
2568 glb_call_time = call_time;
2571 if (permanent_error) {
2572 running_threads = -1;
2581 proc_dir = opendir(
"/proc");
2582 if (proc_dir == NULL) {
2585 running_threads = -1;
2586 permanent_error = 1;
// task_path keeps the fixed "/proc/" prefix; the per-process part is
// rewritten on every iteration by resetting `used`.
2591 __kmp_str_buf_cat(&task_path,
"/proc/", 6);
2592 task_path_fixed_len = task_path.used;
2594 proc_entry = readdir(proc_dir);
2595 while (proc_entry != NULL) {
// Only numeric directory names are processes.
2598 if (proc_entry->d_type == DT_DIR && isdigit(proc_entry->d_name[0])) {
2608 KMP_DEBUG_ASSERT(total_processes != 1 ||
2609 strcmp(proc_entry->d_name,
"1") == 0);
2612 task_path.used = task_path_fixed_len;
2613 __kmp_str_buf_cat(&task_path, proc_entry->d_name,
2614 KMP_STRLEN(proc_entry->d_name));
2615 __kmp_str_buf_cat(&task_path,
"/task", 5);
2617 task_dir = opendir(task_path.str);
2618 if (task_dir == NULL) {
// Failing to open the task directory of process "1" is treated as a
// permanent error.
2627 if (strcmp(proc_entry->d_name,
"1") == 0) {
2628 running_threads = -1;
2629 permanent_error = 1;
2634 __kmp_str_buf_clear(&stat_path);
2635 __kmp_str_buf_cat(&stat_path, task_path.str, task_path.used);
2636 __kmp_str_buf_cat(&stat_path,
"/", 1);
2637 stat_path_fixed_len = stat_path.used;
2639 task_entry = readdir(task_dir);
2640 while (task_entry != NULL) {
// Check the type of the task entry itself. The previous code tested
// proc_entry->d_type, which is always DT_DIR at this point and so filtered
// nothing.
2642 if (task_entry->d_type == DT_DIR && isdigit(task_entry->d_name[0])) {
2649 stat_path_fixed_len;
2650 __kmp_str_buf_cat(&stat_path, task_entry->d_name,
2651 KMP_STRLEN(task_entry->d_name));
2652 __kmp_str_buf_cat(&stat_path,
"/stat", 5);
2656 stat_file = open(stat_path.str, O_RDONLY);
2657 if (stat_file == -1) {
2687 len = read(stat_file, buffer,
sizeof(buffer) - 1);
// The state character is the one following ") " in the stat line.
2694 char *close_parent = strstr(buffer,
") ");
2695 if (close_parent != NULL) {
2696 char state = *(close_parent + 2);
2699 if (running_threads >= max) {
2709 task_entry = readdir(task_dir);
2715 proc_entry = readdir(proc_dir);
// Never report fewer than one running thread.
2721 KMP_DEBUG_ASSERT(running_threads > 0);
2722 if (running_threads <= 0) {
2723 running_threads = 1;
// Cleanup of directories, string buffers and the stat file descriptor.
2727 if (proc_dir != NULL) {
2730 __kmp_str_buf_free(&task_path);
2731 if (task_dir != NULL) {
2734 __kmp_str_buf_free(&stat_path);
2735 if (stat_file != -1) {
2739 glb_running_threads = running_threads;
2741 return running_threads;
2749#if !(KMP_ARCH_X86 || KMP_ARCH_X86_64 || KMP_MIC || \
2750 ((KMP_OS_LINUX || KMP_OS_DARWIN) && KMP_ARCH_AARCH64) || \
2751 KMP_ARCH_PPC64 || KMP_ARCH_RISCV64 || KMP_ARCH_LOONGARCH64 || \
2752 KMP_ARCH_ARM || KMP_ARCH_VE || KMP_ARCH_S390X || KMP_ARCH_PPC_XCOFF || \
2753 KMP_ARCH_AARCH64_32)
// Function-pointer types microtask_t0 .. microtask_t15. Each takes two int *
// arguments followed by a growing list of void * arguments;
// __kmp_invoke_microtask casts `pkfn` to one of them according to argc.
2759typedef void (*microtask_t0)(
int *,
int *);
2760typedef void (*microtask_t1)(
int *,
int *,
void *);
2761typedef void (*microtask_t2)(
int *,
int *,
void *,
void *);
2762typedef void (*microtask_t3)(
int *,
int *,
void *,
void *,
void *);
2763typedef void (*microtask_t4)(
int *,
int *,
void *,
void *,
void *,
void *);
2764typedef void (*microtask_t5)(
int *,
int *,
void *,
void *,
void *,
void *,
2766typedef void (*microtask_t6)(
int *,
int *,
void *,
void *,
void *,
void *,
2768typedef void (*microtask_t7)(
int *,
int *,
void *,
void *,
void *,
void *,
2769 void *,
void *,
void *);
2770typedef void (*microtask_t8)(
int *,
int *,
void *,
void *,
void *,
void *,
2771 void *,
void *,
void *,
void *);
2772typedef void (*microtask_t9)(
int *,
int *,
void *,
void *,
void *,
void *,
2773 void *,
void *,
void *,
void *,
void *);
2774typedef void (*microtask_t10)(
int *,
int *,
void *,
void *,
void *,
void *,
2775 void *,
void *,
void *,
void *,
void *,
void *);
2776typedef void (*microtask_t11)(
int *,
int *,
void *,
void *,
void *,
void *,
2777 void *,
void *,
void *,
void *,
void *,
void *,
2779typedef void (*microtask_t12)(
int *,
int *,
void *,
void *,
void *,
void *,
2780 void *,
void *,
void *,
void *,
void *,
void *,
2782typedef void (*microtask_t13)(
int *,
int *,
void *,
void *,
void *,
void *,
2783 void *,
void *,
void *,
void *,
void *,
void *,
2784 void *,
void *,
void *);
2785typedef void (*microtask_t14)(
int *,
int *,
void *,
void *,
void *,
void *,
2786 void *,
void *,
void *,
void *,
void *,
void *,
2787 void *,
void *,
void *,
void *);
2788typedef void (*microtask_t15)(
int *,
int *,
void *,
void *,
void *,
void *,
2789 void *,
void *,
void *,
void *,
void *,
void *,
2790 void *,
void *,
void *,
void *,
void *);
// Generic C++ fallback for invoking an outlined microtask.
//   pkfn           - microtask entry point, cast to microtask_tN for the
//                    matching number of extra arguments.
//   gtid, tid      - passed to the microtask by address as its first two
//                    arguments.
//   argc           - number of entries of p_argv forwarded to the microtask;
//                    unsupported counts print "Too many args to microtask".
//   exit_frame_ptr - receives OMPT_GET_FRAME_ADDRESS(0) before the call.
//
// Every call passes `&gtid`. The text previously read `>id`, an HTML-entity
// corruption of `&gtid` ("&gt;" decoded to ">"), which is not valid C++.
2794int __kmp_invoke_microtask(microtask_t pkfn,
int gtid,
int tid,
int argc,
2798 void **exit_frame_ptr
2802 *exit_frame_ptr = OMPT_GET_FRAME_ADDRESS(0);
2807 fprintf(stderr,
"Too many args to microtask: %d!\n", argc);
2811 (*(microtask_t0)pkfn)(&gtid, &tid);
2814 (*(microtask_t1)pkfn)(&gtid, &tid, p_argv[0]);
2817 (*(microtask_t2)pkfn)(&gtid, &tid, p_argv[0], p_argv[1]);
2820 (*(microtask_t3)pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2]);
2823 (*(microtask_t4)pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2],
2827 (*(microtask_t5)pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2],
2828 p_argv[3], p_argv[4]);
2831 (*(microtask_t6)pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2],
2832 p_argv[3], p_argv[4], p_argv[5]);
2835 (*(microtask_t7)pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2],
2836 p_argv[3], p_argv[4], p_argv[5], p_argv[6]);
2839 (*(microtask_t8)pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2],
2840 p_argv[3], p_argv[4], p_argv[5], p_argv[6],
2844 (*(microtask_t9)pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2],
2845 p_argv[3], p_argv[4], p_argv[5], p_argv[6], p_argv[7],
2849 (*(microtask_t10)pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2],
2850 p_argv[3], p_argv[4], p_argv[5], p_argv[6],
2851 p_argv[7], p_argv[8], p_argv[9]);
2854 (*(microtask_t11)pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2],
2855 p_argv[3], p_argv[4], p_argv[5], p_argv[6],
2856 p_argv[7], p_argv[8], p_argv[9], p_argv[10]);
2859 (*(microtask_t12)pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2],
2860 p_argv[3], p_argv[4], p_argv[5], p_argv[6],
2861 p_argv[7], p_argv[8], p_argv[9], p_argv[10],
2865 (*(microtask_t13)pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2],
2866 p_argv[3], p_argv[4], p_argv[5], p_argv[6],
2867 p_argv[7], p_argv[8], p_argv[9], p_argv[10],
2868 p_argv[11], p_argv[12]);
2871 (*(microtask_t14)pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2],
2872 p_argv[3], p_argv[4], p_argv[5], p_argv[6],
2873 p_argv[7], p_argv[8], p_argv[9], p_argv[10],
2874 p_argv[11], p_argv[12], p_argv[13]);
2877 (*(microtask_t15)pkfn)(&gtid, &tid, p_argv[0], p_argv[1], p_argv[2],
2878 p_argv[3], p_argv[4], p_argv[5], p_argv[6],
2879 p_argv[7], p_argv[8], p_argv[9], p_argv[10],
2880 p_argv[11], p_argv[12], p_argv[13], p_argv[14]);
// Synchronization state for the hidden helper threads. Each group is a
// condition variable, the mutex that protects it, and a "signaled" flag.

// Initialization group: used by __kmp_hidden_helper_threads_initz_wait and
// __kmp_hidden_helper_initz_release.
2893pthread_cond_t hidden_helper_threads_initz_cond_var;
2894pthread_mutex_t hidden_helper_threads_initz_lock;
2895volatile int hidden_helper_initz_signaled = FALSE;
// De-initialization group.
2898pthread_cond_t hidden_helper_threads_deinitz_cond_var;
2899pthread_mutex_t hidden_helper_threads_deinitz_lock;
2900volatile int hidden_helper_deinitz_signaled = FALSE;
// Main-thread group: used by __kmp_hidden_helper_main_thread_wait and
// __kmp_hidden_helper_main_thread_release.
2903pthread_cond_t hidden_helper_main_thread_cond_var;
2904pthread_mutex_t hidden_helper_main_thread_lock;
2905volatile int hidden_helper_main_thread_signaled = FALSE;
// Semaphore that __kmp_hidden_helper_worker_thread_wait blocks on.
2910sem_t hidden_helper_task_sem;
2913void __kmp_hidden_helper_worker_thread_wait() {
2914 int status = sem_wait(&hidden_helper_task_sem);
2915 KMP_CHECK_SYSFAIL(
"sem_wait", status);
// Creates the synchronization objects used by the hidden helper threads
// (three condition variables, three mutexes, one semaphore) and then starts a
// thread that runs __kmp_hidden_helper_threads_initz_routine().
2918void __kmp_do_initialize_hidden_helper_threads() {
// Condition variables, all with default attributes.
2921 pthread_cond_init(&hidden_helper_threads_initz_cond_var,
nullptr);
2922 KMP_CHECK_SYSFAIL(
"pthread_cond_init", status);
2924 status = pthread_cond_init(&hidden_helper_threads_deinitz_cond_var,
nullptr);
2925 KMP_CHECK_SYSFAIL(
"pthread_cond_init", status);
2927 status = pthread_cond_init(&hidden_helper_main_thread_cond_var,
nullptr);
2928 KMP_CHECK_SYSFAIL(
"pthread_cond_init", status);
// Matching mutexes, all with default attributes.
2930 status = pthread_mutex_init(&hidden_helper_threads_initz_lock,
nullptr);
2931 KMP_CHECK_SYSFAIL(
"pthread_mutex_init", status);
2933 status = pthread_mutex_init(&hidden_helper_threads_deinitz_lock,
nullptr);
2934 KMP_CHECK_SYSFAIL(
"pthread_mutex_init", status);
2936 status = pthread_mutex_init(&hidden_helper_main_thread_lock,
nullptr);
2937 KMP_CHECK_SYSFAIL(
"pthread_mutex_init", status);
// Process-private semaphore with an initial count of 0. sem_init() reports
// failure as -1 with the cause in errno (unlike the pthread_* calls above,
// which return the error code), so the errno-aware check is used here.
2940 status = sem_init(&hidden_helper_task_sem, 0, 0);
2941 KMP_CHECK_SYSFAIL_ERRNO(
"sem_init", status);
// Start the thread that performs the hidden helper initialization.
2945 status = pthread_create(
2947 [](
void *) ->
void * {
2948 __kmp_hidden_helper_threads_initz_routine();
2952 KMP_CHECK_SYSFAIL(
"pthread_create", status);
2955void __kmp_hidden_helper_threads_initz_wait() {
2958 int status = pthread_mutex_lock(&hidden_helper_threads_initz_lock);
2959 KMP_CHECK_SYSFAIL(
"pthread_mutex_lock", status);
2961 if (!TCR_4(hidden_helper_initz_signaled)) {
2962 status = pthread_cond_wait(&hidden_helper_threads_initz_cond_var,
2963 &hidden_helper_threads_initz_lock);
2964 KMP_CHECK_SYSFAIL(
"pthread_cond_wait", status);
2967 status = pthread_mutex_unlock(&hidden_helper_threads_initz_lock);
2968 KMP_CHECK_SYSFAIL(
"pthread_mutex_unlock", status);
2971void __kmp_hidden_helper_initz_release() {
2973 int status = pthread_mutex_lock(&hidden_helper_threads_initz_lock);
2974 KMP_CHECK_SYSFAIL(
"pthread_mutex_lock", status);
2976 status = pthread_cond_signal(&hidden_helper_threads_initz_cond_var);
2977 KMP_CHECK_SYSFAIL(
"pthread_cond_wait", status);
2979 TCW_SYNC_4(hidden_helper_initz_signaled, TRUE);
2981 status = pthread_mutex_unlock(&hidden_helper_threads_initz_lock);
2982 KMP_CHECK_SYSFAIL(
"pthread_mutex_unlock", status);
2985void __kmp_hidden_helper_main_thread_wait() {
2988 int status = pthread_mutex_lock(&hidden_helper_main_thread_lock);
2989 KMP_CHECK_SYSFAIL(
"pthread_mutex_lock", status);
2991 if (!TCR_4(hidden_helper_main_thread_signaled)) {
2992 status = pthread_cond_wait(&hidden_helper_main_thread_cond_var,
2993 &hidden_helper_main_thread_lock);
2994 KMP_CHECK_SYSFAIL(
"pthread_cond_wait", status);
2997 status = pthread_mutex_unlock(&hidden_helper_main_thread_lock);
2998 KMP_CHECK_SYSFAIL(
"pthread_mutex_unlock", status);
3001void __kmp_hidden_helper_main_thread_release() {
3004 int status = pthread_mutex_lock(&hidden_helper_main_thread_lock);
3005 KMP_CHECK_SYSFAIL(
"pthread_mutex_lock", status);
3007 status = pthread_cond_signal(&hidden_helper_main_thread_cond_var);
3008 KMP_CHECK_SYSFAIL(
"pthread_cond_signal", status);
3011 TCW_SYNC_4(hidden_helper_main_thread_signaled, TRUE);
3013 status = pthread_mutex_unlock(&hidden_helper_main_thread_lock);
3014 KMP_CHECK_SYSFAIL(
"pthread_mutex_unlock", status);
3017void __kmp_hidden_helper_worker_thread_signal() {
3018 int status = sem_post(&hidden_helper_task_sem);
3019 KMP_CHECK_SYSFAIL(
"sem_post", status);
3022void __kmp_hidden_helper_threads_deinitz_wait() {
3025 int status = pthread_mutex_lock(&hidden_helper_threads_deinitz_lock);
3026 KMP_CHECK_SYSFAIL(
"pthread_mutex_lock", status);
3028 if (!TCR_4(hidden_helper_deinitz_signaled)) {
3029 status = pthread_cond_wait(&hidden_helper_threads_deinitz_cond_var,
3030 &hidden_helper_threads_deinitz_lock);
3031 KMP_CHECK_SYSFAIL(
"pthread_cond_wait", status);
3034 status = pthread_mutex_unlock(&hidden_helper_threads_deinitz_lock);
3035 KMP_CHECK_SYSFAIL(
"pthread_mutex_unlock", status);
3038void __kmp_hidden_helper_threads_deinitz_release() {
3039 int status = pthread_mutex_lock(&hidden_helper_threads_deinitz_lock);
3040 KMP_CHECK_SYSFAIL(
"pthread_mutex_lock", status);
3042 status = pthread_cond_signal(&hidden_helper_threads_deinitz_cond_var);
3043 KMP_CHECK_SYSFAIL(
"pthread_cond_wait", status);
3045 TCW_SYNC_4(hidden_helper_deinitz_signaled, TRUE);
3047 status = pthread_mutex_unlock(&hidden_helper_threads_deinitz_lock);
3048 KMP_CHECK_SYSFAIL(
"pthread_mutex_unlock", status);
3051void __kmp_hidden_helper_worker_thread_wait() {
3052 KMP_ASSERT(0 &&
"Hidden helper task is not supported on this OS");
3055void __kmp_do_initialize_hidden_helper_threads() {
3056 KMP_ASSERT(0 &&
"Hidden helper task is not supported on this OS");
3059void __kmp_hidden_helper_threads_initz_wait() {
3060 KMP_ASSERT(0 &&
"Hidden helper task is not supported on this OS");
3063void __kmp_hidden_helper_initz_release() {
3064 KMP_ASSERT(0 &&
"Hidden helper task is not supported on this OS");
3067void __kmp_hidden_helper_main_thread_wait() {
3068 KMP_ASSERT(0 &&
"Hidden helper task is not supported on this OS");
3071void __kmp_hidden_helper_main_thread_release() {
3072 KMP_ASSERT(0 &&
"Hidden helper task is not supported on this OS");
3075void __kmp_hidden_helper_worker_thread_signal() {
3076 KMP_ASSERT(0 &&
"Hidden helper task is not supported on this OS");
3079void __kmp_hidden_helper_threads_deinitz_wait() {
3080 KMP_ASSERT(0 &&
"Hidden helper task is not supported on this OS");
3083void __kmp_hidden_helper_threads_deinitz_release() {
3084 KMP_ASSERT(0 &&
"Hidden helper task is not supported on this OS");
// Probes for the /dev/shm directory by trying to open it with opendir().
// One of the visible branches tests errno against ENOENT, i.e. the case where
// the directory does not exist.
// NOTE(review): the branch bodies and return statements are not visible in
// this excerpt; presumably the result is true only when the directory could
// be opened -- confirm against the full file.
3088bool __kmp_detect_shm() {
3089 DIR *dir = opendir(
"/dev/shm");
3093 }
else if (ENOENT == errno) {
// Probes for the /tmp directory by trying to open it with opendir().
// One of the visible branches tests errno against ENOENT, i.e. the case where
// the directory does not exist.
// NOTE(review): the branch bodies and return statements are not visible in
// this excerpt; presumably the result is true only when the directory could
// be opened -- confirm against the full file.
3100bool __kmp_detect_tmp() {
3101 DIR *dir = opendir(
"/tmp");
3105 }
else if (ENOENT == errno) {
#define KMP_INIT_PARTITIONED_TIMERS(name)
Initializes the partitioned timers to begin with name.