48 # ifndef KMP_STATIC_STEAL_ENABLED
49 # define KMP_STATIC_STEAL_ENABLED 1
/* Flag values for "current task queued" state (NOTE(review): meaning inferred from the names; confirm at the use sites). */
52 #define TASK_CURRENT_NOT_QUEUED 0
53 #define TASK_CURRENT_QUEUED 1
/* Task deque geometry: TASK_DEQUE_SIZE is 2^TASK_DEQUE_BITS (256) and TASK_DEQUE_MASK is SIZE-1 (0xFF),
   i.e. a mask of the low TASK_DEQUE_BITS bits. */
55 #define TASK_DEQUE_BITS 8 // Used solely to define TASK_DEQUE_SIZE and TASK_DEQUE_MASK.
56 #define TASK_DEQUE_SIZE ( 1 << TASK_DEQUE_BITS )
57 #define TASK_DEQUE_MASK ( TASK_DEQUE_SIZE - 1 )
59 #ifdef BUILD_TIED_TASK_STACK
60 #define TASK_STACK_EMPTY 0 // entries when the stack is empty
62 #define TASK_STACK_BLOCK_BITS 5 // Used to define TASK_STACK_SIZE and TASK_STACK_MASK
63 #define TASK_STACK_BLOCK_SIZE ( 1 << TASK_STACK_BLOCK_BITS ) // Number of entries in each task stack array
64 #define TASK_STACK_INDEX_MASK ( TASK_STACK_BLOCK_SIZE - 1 ) // Mask for determining index into stack block
65 #endif // BUILD_TIED_TASK_STACK
67 #define TASK_NOT_PUSHED 1
68 #define TASK_SUCCESSFULLY_PUSHED 0
71 #define TASK_EXPLICIT 1
72 #define TASK_IMPLICIT 0
76 #define KMP_CANCEL_THREADS
77 #define KMP_THREAD_ATTR
88 #include <sys/types.h>
101 #if KMP_ARCH_X86 || KMP_ARCH_X86_64
102 #include <xmmintrin.h>
105 #include "kmp_version.h"
106 #include "kmp_debug.h"
107 #include "kmp_lock.h"
109 #include "kmp_debugger.h"
111 #include "kmp_i18n.h"
113 #define KMP_HANDLE_SIGNALS (KMP_OS_LINUX || KMP_OS_FREEBSD || KMP_OS_WINDOWS || KMP_OS_DARWIN)
115 #ifdef KMP_SETVERSION
117 #include "kaiconfig.h"
120 #include "setversion.h"
123 #include "kmp_wrapper_malloc.h"
126 # if !defined NSIG && defined _NSIG
132 # pragma weak clock_gettime
136 #include "ompt-internal.h"
140 #define NO_FIRST_TOUCH 0
141 #define FIRST_TOUCH 1
145 #define BUILD_MEMORY NO_FIRST_TOUCH
150 #ifndef USE_FAST_MEMORY
151 #define USE_FAST_MEMORY 3
154 #ifndef KMP_NESTED_HOT_TEAMS
155 # define KMP_NESTED_HOT_TEAMS 0
156 # define USE_NESTED_HOT_ARG(x)
158 # if KMP_NESTED_HOT_TEAMS
160 # define USE_NESTED_HOT_ARG(x) ,x
163 # undef KMP_NESTED_HOT_TEAMS
164 # define KMP_NESTED_HOT_TEAMS 0
165 # define USE_NESTED_HOT_ARG(x)
168 # define USE_NESTED_HOT_ARG(x)
173 #ifndef USE_CMP_XCHG_FOR_BGET
174 #define USE_CMP_XCHG_FOR_BGET 1
182 #define KMP_NSEC_PER_SEC 1000000000L
183 #define KMP_USEC_PER_SEC 1000000L
196 #define KMP_IDENT_IMB 0x01
198 #define KMP_IDENT_KMPC 0x02
201 #define KMP_IDENT_AUTOPAR 0x08
203 #define KMP_IDENT_ATOMIC_REDUCE 0x10
205 #define KMP_IDENT_BARRIER_EXPL 0x20
207 #define KMP_IDENT_BARRIER_IMPL 0x0040
208 #define KMP_IDENT_BARRIER_IMPL_MASK 0x01C0
209 #define KMP_IDENT_BARRIER_IMPL_FOR 0x0040
210 #define KMP_IDENT_BARRIER_IMPL_SECTIONS 0x00C0
212 #define KMP_IDENT_BARRIER_IMPL_SINGLE 0x0140
213 #define KMP_IDENT_BARRIER_IMPL_WORKSHARE 0x01C0
238 typedef union kmp_team kmp_team_t;
239 typedef struct kmp_taskdata kmp_taskdata_t;
240 typedef union kmp_task_team kmp_task_team_t;
241 typedef union kmp_team kmp_team_p;
242 typedef union kmp_info kmp_info_p;
243 typedef union kmp_root kmp_root_p;
255 #define KMP_PACK_64(HIGH_32,LOW_32) \
256 ( (kmp_int64) ((((kmp_uint64)(HIGH_32))<<32) | (kmp_uint64)(LOW_32)) )
/* Character-scanning helpers. Each one advances the pointer lvalue _x in place and expands to a braced
   block (not an expression), so _x is evaluated repeatedly and must have no side effects.
   SKIP_WS     - step over spaces and tabs.
   SKIP_DIGITS - step over the characters '0'..'9'.
   SKIP_TO     - step forward until *_x equals _c or the terminating '\0' is reached. */
263 #define SKIP_WS(_x) { while (*(_x) == ' ' || *(_x) == '\t') (_x)++; }
264 #define SKIP_DIGITS(_x) { while (*(_x) >= '0' && *(_x) <= '9') (_x)++; }
265 #define SKIP_TO(_x,_c) { while (*(_x) != '\0' && *(_x) != (_c)) (_x)++; }
/* Larger / smaller of two values. The selected argument is evaluated twice, so do not pass
   expressions with side effects (e.g. i++). */
270 #define KMP_MAX( x, y ) ( (x) > (y) ? (x) : (y) )
271 #define KMP_MIN( x, y ) ( (x) < (y) ? (x) : (y) )
279 enum kmp_state_timer {
289 #ifdef USE_LOAD_BALANCE
290 dynamic_load_balance,
293 dynamic_thread_limit,
298 #ifndef KMP_SCHED_TYPE_DEFINED
299 #define KMP_SCHED_TYPE_DEFINED
300 typedef enum kmp_sched {
303 kmp_sched_static = 1,
304 kmp_sched_dynamic = 2,
305 kmp_sched_guided = 3,
307 kmp_sched_upper_std = 5,
308 kmp_sched_lower_ext = 100,
309 kmp_sched_trapezoidal = 101,
311 kmp_sched_upper = 102,
312 kmp_sched_default = kmp_sched_static
322 kmp_sch_static_chunked = 33,
324 kmp_sch_dynamic_chunked = 35,
326 kmp_sch_runtime = 37,
328 kmp_sch_trapezoidal = 39,
331 kmp_sch_static_greedy = 40,
332 kmp_sch_static_balanced = 41,
334 kmp_sch_guided_iterative_chunked = 42,
335 kmp_sch_guided_analytical_chunked = 43,
343 kmp_ord_static_chunked = 65,
345 kmp_ord_dynamic_chunked = 67,
346 kmp_ord_guided_chunked = 68,
347 kmp_ord_runtime = 69,
349 kmp_ord_trapezoidal = 71,
368 kmp_nm_dynamic_chunked = 163,
370 kmp_nm_runtime = 165,
372 kmp_nm_trapezoidal = 167,
375 kmp_nm_static_greedy = 168,
376 kmp_nm_static_balanced = 169,
378 kmp_nm_guided_iterative_chunked = 170,
379 kmp_nm_guided_analytical_chunked = 171,
380 kmp_nm_static_steal = 172,
382 kmp_nm_ord_static_chunked = 193,
384 kmp_nm_ord_dynamic_chunked = 195,
385 kmp_nm_ord_guided_chunked = 196,
386 kmp_nm_ord_runtime = 197,
388 kmp_nm_ord_trapezoidal = 199,
395 typedef struct kmp_r_sched {
410 enum clock_function_type {
411 clock_function_gettimeofday,
412 clock_function_clock_gettime
416 #if KMP_ARCH_X86_64 && (KMP_OS_LINUX || KMP_OS_WINDOWS)
429 #undef KMP_FAST_REDUCTION_BARRIER
430 #define KMP_FAST_REDUCTION_BARRIER 1
432 #undef KMP_FAST_REDUCTION_CORE_DUO
433 #if KMP_ARCH_X86 || KMP_ARCH_X86_64
434 #define KMP_FAST_REDUCTION_CORE_DUO 1
437 enum _reduction_method {
438 reduction_method_not_defined = 0,
439 critical_reduce_block = ( 1 << 8 ),
440 atomic_reduce_block = ( 2 << 8 ),
441 tree_reduce_block = ( 3 << 8 ),
442 empty_reduce_block = ( 4 << 8 )
452 #if KMP_FAST_REDUCTION_BARRIER
/* Packed form used when KMP_FAST_REDUCTION_BARRIER is enabled: the reduction method and the barrier
   type are OR-ed into one integer. */
453 #define PACK_REDUCTION_METHOD_AND_BARRIER(reduction_method,barrier_type) \
454 ( ( reduction_method ) | ( barrier_type ) )
/* Extract the reduction method: bits 8..15 of the packed value (the _reduction_method enumerators
   are all of the form k << 8). */
456 #define UNPACK_REDUCTION_METHOD(packed_reduction_method) \
457 ( ( enum _reduction_method )( ( packed_reduction_method ) & ( 0x0000FF00 ) ) )
/* Extract the barrier type: the low 8 bits of the packed value. */
459 #define UNPACK_REDUCTION_BARRIER(packed_reduction_method) \
460 ( ( enum barrier_type )( ( packed_reduction_method ) & ( 0x000000FF ) ) )
462 #define PACK_REDUCTION_METHOD_AND_BARRIER(reduction_method,barrier_type) \
465 #define UNPACK_REDUCTION_METHOD(packed_reduction_method) \
466 ( packed_reduction_method )
468 #define UNPACK_REDUCTION_BARRIER(packed_reduction_method) \
472 #define TEST_REDUCTION_METHOD(packed_reduction_method,which_reduction_block) \
473 ( ( UNPACK_REDUCTION_METHOD( packed_reduction_method ) ) == ( which_reduction_block ) )
475 #if KMP_FAST_REDUCTION_BARRIER
476 #define TREE_REDUCE_BLOCK_WITH_REDUCTION_BARRIER \
477 ( PACK_REDUCTION_METHOD_AND_BARRIER( tree_reduce_block, bs_reduction_barrier ) )
479 #define TREE_REDUCE_BLOCK_WITH_PLAIN_BARRIER \
480 ( PACK_REDUCTION_METHOD_AND_BARRIER( tree_reduce_block, bs_plain_barrier ) )
483 typedef int PACKED_REDUCTION_METHOD_T;
491 # define USE_CBLKDATA
492 # pragma warning( push )
493 # pragma warning( disable: 271 310 )
494 # include <windows.h>
495 # pragma warning( pop )
499 # include <pthread.h>
509 #if KMP_AFFINITY_SUPPORTED
511 extern size_t __kmp_affin_mask_size;
512 # define KMP_AFFINITY_CAPABLE() (__kmp_affin_mask_size > 0)
513 # define KMP_AFFINITY_DISABLE() (__kmp_affin_mask_size = 0)
514 # define KMP_AFFINITY_ENABLE(mask_size) (__kmp_affin_mask_size = mask_size)
515 # define KMP_CPU_SETSIZE (__kmp_affin_mask_size * CHAR_BIT)
/* Byte-array affinity mask: bit (i % CHAR_BIT) of byte (i / CHAR_BIT) represents CPU i. */
typedef unsigned char kmp_affin_mask_t;

/*
 * Set / test / clear the bit for CPU i in mask.
 * The KMP_CPU_* forms accept any pointer and cast it to (kmp_affin_mask_t *);
 * the _KMP_CPU_* forms expect a kmp_affin_mask_t pointer already.
 * Both i and mask are fully parenthesized so that expression arguments
 * (e.g. base + offset) index and shift correctly. i is evaluated twice.
 * KMP_CPU_ISSET yields exactly 0 or 1.
 */
# define _KMP_CPU_SET(i,mask)   ((mask)[(i)/CHAR_BIT] |= (((kmp_affin_mask_t)1) << ((i) % CHAR_BIT)))
# define KMP_CPU_SET(i,mask)    _KMP_CPU_SET((i), ((kmp_affin_mask_t *)(mask)))
# define _KMP_CPU_ISSET(i,mask) (!!((mask)[(i)/CHAR_BIT] & (((kmp_affin_mask_t)1) << ((i) % CHAR_BIT))))
# define KMP_CPU_ISSET(i,mask)  _KMP_CPU_ISSET((i), ((kmp_affin_mask_t *)(mask)))
# define _KMP_CPU_CLR(i,mask)   ((mask)[(i)/CHAR_BIT] &= ~(((kmp_affin_mask_t)1) << ((i) % CHAR_BIT)))
# define KMP_CPU_CLR(i,mask)    _KMP_CPU_CLR((i), ((kmp_affin_mask_t *)(mask)))
538 # define KMP_CPU_ZERO(mask) \
541 for (__i = 0; __i < __kmp_affin_mask_size; __i++) { \
542 ((kmp_affin_mask_t *)(mask))[__i] = 0; \
546 # define KMP_CPU_COPY(dest, src) \
549 for (__i = 0; __i < __kmp_affin_mask_size; __i++) { \
550 ((kmp_affin_mask_t *)(dest))[__i] \
551 = ((kmp_affin_mask_t *)(src))[__i]; \
555 # define KMP_CPU_COMPLEMENT(mask) \
558 for (__i = 0; __i < __kmp_affin_mask_size; __i++) { \
559 ((kmp_affin_mask_t *)(mask))[__i] \
560 = ~((kmp_affin_mask_t *)(mask))[__i]; \
564 # define KMP_CPU_UNION(dest, src) \
567 for (__i = 0; __i < __kmp_affin_mask_size; __i++) { \
568 ((kmp_affin_mask_t *)(dest))[__i] \
569 |= ((kmp_affin_mask_t *)(src))[__i]; \
581 # if KMP_GROUP_AFFINITY
585 typedef struct GROUP_AFFINITY {
592 typedef DWORD_PTR kmp_affin_mask_t;
594 extern int __kmp_num_proc_groups;
/*
 * Word-array affinity mask (processor-group build): CPU i lives in word
 * i / (bits per kmp_affin_mask_t), at bit i % (bits per kmp_affin_mask_t).
 * The KMP_CPU_* forms cast mask to (kmp_affin_mask_t *); the _KMP_CPU_* forms
 * expect that pointer type already. Arguments are fully parenthesized so
 * expression arguments index and shift correctly. i is evaluated twice.
 * KMP_CPU_ISSET yields exactly 0 or 1.
 */
# define _KMP_CPU_SET(i,mask) \
    ((mask)[(i)/(CHAR_BIT * sizeof(kmp_affin_mask_t))] |= \
    (((kmp_affin_mask_t)1) << ((i) % (CHAR_BIT * sizeof(kmp_affin_mask_t)))))

# define KMP_CPU_SET(i,mask) \
    _KMP_CPU_SET((i), ((kmp_affin_mask_t *)(mask)))

# define _KMP_CPU_ISSET(i,mask) \
    (!!((mask)[(i)/(CHAR_BIT * sizeof(kmp_affin_mask_t))] & \
    (((kmp_affin_mask_t)1) << ((i) % (CHAR_BIT * sizeof(kmp_affin_mask_t))))))

# define KMP_CPU_ISSET(i,mask) \
    _KMP_CPU_ISSET((i), ((kmp_affin_mask_t *)(mask)))

# define _KMP_CPU_CLR(i,mask) \
    ((mask)[(i)/(CHAR_BIT * sizeof(kmp_affin_mask_t))] &= \
    ~(((kmp_affin_mask_t)1) << ((i) % (CHAR_BIT * sizeof(kmp_affin_mask_t)))))

# define KMP_CPU_CLR(i,mask) \
    _KMP_CPU_CLR((i), ((kmp_affin_mask_t *)(mask)))
617 # define KMP_CPU_ZERO(mask) \
620 for (__i = 0; __i < __kmp_num_proc_groups; __i++) { \
621 ((kmp_affin_mask_t *)(mask))[__i] = 0; \
625 # define KMP_CPU_COPY(dest, src) \
628 for (__i = 0; __i < __kmp_num_proc_groups; __i++) { \
629 ((kmp_affin_mask_t *)(dest))[__i] \
630 = ((kmp_affin_mask_t *)(src))[__i]; \
634 # define KMP_CPU_COMPLEMENT(mask) \
637 for (__i = 0; __i < __kmp_num_proc_groups; __i++) { \
638 ((kmp_affin_mask_t *)(mask))[__i] \
639 = ~((kmp_affin_mask_t *)(mask))[__i]; \
643 # define KMP_CPU_UNION(dest, src) \
646 for (__i = 0; __i < __kmp_num_proc_groups; __i++) { \
647 ((kmp_affin_mask_t *)(dest))[__i] \
648 |= ((kmp_affin_mask_t *)(src))[__i]; \
652 typedef DWORD (*kmp_GetActiveProcessorCount_t)(WORD);
653 extern kmp_GetActiveProcessorCount_t __kmp_GetActiveProcessorCount;
655 typedef WORD (*kmp_GetActiveProcessorGroupCount_t)(void);
656 extern kmp_GetActiveProcessorGroupCount_t __kmp_GetActiveProcessorGroupCount;
658 typedef BOOL (*kmp_GetThreadGroupAffinity_t)(HANDLE, GROUP_AFFINITY *);
659 extern kmp_GetThreadGroupAffinity_t __kmp_GetThreadGroupAffinity;
661 typedef BOOL (*kmp_SetThreadGroupAffinity_t)(HANDLE,
const GROUP_AFFINITY *, GROUP_AFFINITY *);
662 extern kmp_SetThreadGroupAffinity_t __kmp_SetThreadGroupAffinity;
664 extern int __kmp_get_proc_group(kmp_affin_mask_t
const *mask);
668 typedef DWORD kmp_affin_mask_t;
670 # define KMP_CPU_SET(i,mask) (*(mask) |= (((kmp_affin_mask_t)1) << (i)))
671 # define KMP_CPU_ISSET(i,mask) (!!(*(mask) & (((kmp_affin_mask_t)1) << (i))))
672 # define KMP_CPU_CLR(i,mask) (*(mask) &= ~(((kmp_affin_mask_t)1) << (i)))
673 # define KMP_CPU_ZERO(mask) (*(mask) = 0)
674 # define KMP_CPU_COPY(dest, src) (*(dest) = *(src))
675 # define KMP_CPU_COMPLEMENT(mask) (*(mask) = ~*(mask))
676 # define KMP_CPU_UNION(dest, src) (*(dest) |= *(src))
686 # define KMP_CPU_ALLOC(ptr) \
687 (ptr = ((kmp_affin_mask_t *)__kmp_allocate(__kmp_affin_mask_size)))
688 # define KMP_CPU_FREE(ptr) __kmp_free(ptr)
697 # define KMP_CPU_INDEX(array,i) \
698 ((kmp_affin_mask_t *)(((char *)(array)) + (i) * __kmp_affin_mask_size))
704 #define KMP_AFFIN_MASK_PRINT_LEN 1024
719 affinity_gran_fine = 0,
720 affinity_gran_thread,
722 affinity_gran_package,
724 #if KMP_GROUP_AFFINITY
731 affinity_gran_default
734 enum affinity_top_method {
735 affinity_top_method_all = 0,
736 #if KMP_ARCH_X86 || KMP_ARCH_X86_64
737 affinity_top_method_apicid,
738 affinity_top_method_x2apicid,
740 affinity_top_method_cpuinfo,
741 #if KMP_GROUP_AFFINITY
742 affinity_top_method_group,
744 affinity_top_method_flat,
745 affinity_top_method_default
748 #define affinity_respect_mask_default (-1)
750 extern enum affinity_type __kmp_affinity_type;
751 extern enum affinity_gran __kmp_affinity_gran;
752 extern int __kmp_affinity_gran_levels;
753 extern int __kmp_affinity_dups;
754 extern enum affinity_top_method __kmp_affinity_top_method;
755 extern int __kmp_affinity_compact;
756 extern int __kmp_affinity_offset;
757 extern int __kmp_affinity_verbose;
758 extern int __kmp_affinity_warnings;
759 extern int __kmp_affinity_respect_mask;
760 extern char * __kmp_affinity_proclist;
761 extern kmp_affin_mask_t *__kmp_affinity_masks;
762 extern unsigned __kmp_affinity_num_masks;
763 extern int __kmp_get_system_affinity(kmp_affin_mask_t *mask,
int abort_on_error);
764 extern int __kmp_set_system_affinity(kmp_affin_mask_t
const *mask,
int abort_on_error);
765 extern void __kmp_affinity_bind_thread(
int which);
768 extern kmp_affin_mask_t *__kmp_affinity_get_fullMask();
770 extern char const * __kmp_cpuinfo_file;
779 typedef enum kmp_proc_bind_t {
789 typedef struct kmp_nested_proc_bind_t {
790 kmp_proc_bind_t *bind_types;
793 } kmp_nested_proc_bind_t;
795 extern kmp_nested_proc_bind_t __kmp_nested_proc_bind;
799 # if KMP_AFFINITY_SUPPORTED
800 # define KMP_PLACE_ALL (-1)
801 # define KMP_PLACE_UNDEFINED (-2)
804 extern int __kmp_affinity_num_places;
808 typedef enum kmp_cancel_kind_t {
815 #endif // OMP_40_ENABLED
817 extern int __kmp_place_num_sockets;
818 extern int __kmp_place_socket_offset;
819 extern int __kmp_place_num_cores;
820 extern int __kmp_place_core_offset;
821 extern int __kmp_place_num_threads_per_core;
/*
 * Size of `type` rounded up to the next multiple of `sz` (unchanged when it is
 * already a multiple). Intended for sizing padding arrays, e.g.
 * char pad[ KMP_PAD(T, CACHE_LINE) ].
 * `sz` is parenthesized at every use so that an expression such as `1 << 3`
 * is not torn apart by the surrounding subtraction. `sz` must be non-zero.
 */
#define KMP_PAD(type, sz)     (sizeof(type) + ((sz) - ((sizeof(type) - 1) % (sz)) - 1))
832 #define KMP_GTID_DNE (-2)
833 #define KMP_GTID_SHUTDOWN (-3)
834 #define KMP_GTID_MONITOR (-4)
835 #define KMP_GTID_UNKNOWN (-5)
836 #define KMP_GTID_MIN (-6)
838 #define __kmp_get_gtid() __kmp_get_global_thread_id()
839 #define __kmp_entry_gtid() __kmp_get_global_thread_id_reg()
841 #define __kmp_tid_from_gtid(gtid) ( KMP_DEBUG_ASSERT( (gtid) >= 0 ), \
842 __kmp_threads[ (gtid) ]->th.th_info.ds.ds_tid )
844 #define __kmp_get_tid() ( __kmp_tid_from_gtid( __kmp_get_gtid() ) )
/*
 * Global thread id of the thread occupying slot `tid` of `team`.
 * Debug builds assert tid >= 0 and team != NULL first (comma expression, so
 * the macro still yields the ds_gtid value). `team` is parenthesized before
 * `->` so that an expression argument (e.g. teams + 1) is dereferenced as a whole.
 */
#define __kmp_gtid_from_tid(tid,team) ( KMP_DEBUG_ASSERT( (tid) >= 0 && (team) != NULL ), \
                                        (team) -> t.t_threads[ (tid) ] -> th.th_info .ds.ds_gtid )
848 #define __kmp_get_team() ( __kmp_threads[ (__kmp_get_gtid()) ]-> th.th_team )
849 #define __kmp_team_from_gtid(gtid) ( KMP_DEBUG_ASSERT( (gtid) >= 0 ), \
850 __kmp_threads[ (gtid) ]-> th.th_team )
852 #define __kmp_thread_from_gtid(gtid) ( KMP_DEBUG_ASSERT( (gtid) >= 0 ), __kmp_threads[ (gtid) ] )
853 #define __kmp_get_thread() ( __kmp_thread_from_gtid( __kmp_get_gtid() ) )
857 #define __kmp_gtid_from_thread(thr) ( KMP_DEBUG_ASSERT( (thr) != NULL ), \
858 (thr)->th.th_info.ds.ds_gtid )
863 #define __kmp_get_team_num_threads(gtid) ( __kmp_threads[ ( gtid ) ] -> th.th_team -> t.t_nproc )
/* All bits of kmp_uint64 set except the most significant one: the expression shifts 1 into the top
   bit position (sizeof * 8 - 1) and complements it.
   NOTE(review): for a 64-bit kmp_uint64 this is 0x7FFFFFFFFFFFFFFF, i.e. the signed 64-bit maximum,
   not the unsigned maximum the name suggests - confirm whether users rely on this value before changing it. */
869 #define KMP_UINT64_MAX (~((kmp_uint64)1<<((sizeof(kmp_uint64)*(1<<3))-1)))
871 #define KMP_MIN_NTH 1
874 # ifdef PTHREAD_THREADS_MAX
875 # define KMP_MAX_NTH PTHREAD_THREADS_MAX
877 # define KMP_MAX_NTH (32 * 1024)
881 #ifdef PTHREAD_STACK_MIN
882 # define KMP_MIN_STKSIZE PTHREAD_STACK_MIN
884 # define KMP_MIN_STKSIZE ((size_t)(32 * 1024))
/* Upper bound for a stack size: every bit of size_t set except the most significant one
   (1 is shifted into bit sizeof(size_t)*8 - 1 and the result is complemented). */
887 #define KMP_MAX_STKSIZE (~((size_t)1<<((sizeof(size_t)*(1<<3))-1)))
890 # define KMP_DEFAULT_STKSIZE ((size_t)(2 * 1024 * 1024))
891 #elif KMP_ARCH_X86_64
892 # define KMP_DEFAULT_STKSIZE ((size_t)(4 * 1024 * 1024))
893 # define KMP_BACKUP_STKSIZE ((size_t)(2 * 1024 * 1024))
895 # define KMP_DEFAULT_STKSIZE ((size_t)(1024 * 1024))
898 #define KMP_DEFAULT_MONITOR_STKSIZE ((size_t)(64 * 1024))
900 #define KMP_DEFAULT_MALLOC_POOL_INCR ((size_t) (1024 * 1024))
901 #define KMP_MIN_MALLOC_POOL_INCR ((size_t) (4 * 1024))
902 #define KMP_MAX_MALLOC_POOL_INCR (~((size_t)1<<((sizeof(size_t)*(1<<3))-1)))
904 #define KMP_MIN_STKOFFSET (0)
905 #define KMP_MAX_STKOFFSET KMP_MAX_STKSIZE
907 # define KMP_DEFAULT_STKOFFSET KMP_MIN_STKOFFSET
909 # define KMP_DEFAULT_STKOFFSET CACHE_LINE
912 #define KMP_MIN_STKPADDING (0)
913 #define KMP_MAX_STKPADDING (2 * 1024 * 1024)
915 #define KMP_MIN_MONITOR_WAKEUPS (1)
916 #define KMP_MAX_MONITOR_WAKEUPS (1000)
917 #define KMP_BLOCKTIME_MULTIPLIER (1000)
918 #define KMP_MIN_BLOCKTIME (0)
919 #define KMP_MAX_BLOCKTIME (INT_MAX)
920 #define KMP_DEFAULT_BLOCKTIME (200)
/* Choose a monitor wakeup rate from a blocktime:
     blocktime == KMP_MAX_BLOCKTIME -> monitor_wakeups unchanged;
     blocktime == KMP_MIN_BLOCKTIME -> KMP_MAX_MONITOR_WAKEUPS;
     otherwise                      -> the larger of monitor_wakeups and KMP_BLOCKTIME_MULTIPLIER / blocktime.
   The KMP_MIN_BLOCKTIME (0) test precedes both divisions, so blocktime is non-zero when they are evaluated.
   Arguments are evaluated more than once. */
923 #define KMP_WAKEUPS_FROM_BLOCKTIME(blocktime, monitor_wakeups) \
924 ( ((blocktime) == KMP_MAX_BLOCKTIME) ? (monitor_wakeups) : \
925 ((blocktime) == KMP_MIN_BLOCKTIME) ? KMP_MAX_MONITOR_WAKEUPS : \
926 ((monitor_wakeups) > (KMP_BLOCKTIME_MULTIPLIER / (blocktime))) ? (monitor_wakeups) : \
927 (KMP_BLOCKTIME_MULTIPLIER) / (blocktime) )
/* Number of monitor intervals covering blocktime: blocktime divided by the interval length
   (KMP_BLOCKTIME_MULTIPLIER / monitor_wakeups), rounded up, all in integer arithmetic.
   NOTE(review): the interval length truncates to 0 if monitor_wakeups exceeds KMP_BLOCKTIME_MULTIPLIER,
   which would divide by zero; presumably callers keep monitor_wakeups <= KMP_MAX_MONITOR_WAKEUPS - confirm. */
930 #define KMP_INTERVALS_FROM_BLOCKTIME(blocktime, monitor_wakeups) \
931 ( ( (blocktime) + (KMP_BLOCKTIME_MULTIPLIER / (monitor_wakeups)) - 1 ) / \
932 (KMP_BLOCKTIME_MULTIPLIER / (monitor_wakeups)) )
934 #define KMP_MIN_STATSCOLS 40
935 #define KMP_MAX_STATSCOLS 4096
936 #define KMP_DEFAULT_STATSCOLS 80
938 #define KMP_MIN_INTERVAL 0
939 #define KMP_MAX_INTERVAL (INT_MAX-1)
940 #define KMP_DEFAULT_INTERVAL 0
942 #define KMP_MIN_CHUNK 1
943 #define KMP_MAX_CHUNK (INT_MAX-1)
944 #define KMP_DEFAULT_CHUNK 1
946 #define KMP_MIN_INIT_WAIT 1
947 #define KMP_MAX_INIT_WAIT (INT_MAX/2)
948 #define KMP_DEFAULT_INIT_WAIT 2048U
950 #define KMP_MIN_NEXT_WAIT 1
951 #define KMP_MAX_NEXT_WAIT (INT_MAX/2)
952 #define KMP_DEFAULT_NEXT_WAIT 1024U
955 #define KMP_MAX_DISP_BUF 7
956 #define KMP_MAX_ORDERED 8
958 #define KMP_MAX_FIELDS 32
960 #define KMP_MAX_BRANCH_BITS 31
962 #define KMP_MAX_ACTIVE_LEVELS_LIMIT INT_MAX
966 #if KMP_ARCH_X86 || KMP_ARCH_X86_64
967 # define KMP_TLS_GTID_MIN 5
969 # define KMP_TLS_GTID_MIN INT_MAX
/* Team-local id predicates: tid 0 is treated as the master, any other tid as a worker. */
972 #define KMP_MASTER_TID(tid) ( (tid) == 0 )
973 #define KMP_WORKER_TID(tid) ( (tid) != 0 )
/* Same predicates for a global thread id; the gtid is first mapped to its team-local id
   with __kmp_tid_from_gtid(). */
975 #define KMP_MASTER_GTID(gtid) ( __kmp_tid_from_gtid((gtid)) == 0 )
976 #define KMP_WORKER_GTID(gtid) ( __kmp_tid_from_gtid((gtid)) != 0 )
977 #define KMP_UBER_GTID(gtid) \
979 KMP_DEBUG_ASSERT( (gtid) >= KMP_GTID_MIN ), \
980 KMP_DEBUG_ASSERT( (gtid) < __kmp_threads_capacity ), \
981 (gtid) >= 0 && __kmp_root[(gtid)] && __kmp_threads[(gtid)] && \
982 (__kmp_threads[(gtid)] == __kmp_root[(gtid)]->r.r_uber_thread)\
984 #define KMP_INITIAL_GTID(gtid) ( (gtid) == 0 )
988 #define TRUE (! FALSE)
994 # define KMP_INIT_WAIT 64U
995 # define KMP_NEXT_WAIT 32U
997 # define KMP_INIT_WAIT 16U
998 # define KMP_NEXT_WAIT 8U
1000 # define KMP_INIT_WAIT 1024U
1001 # define KMP_NEXT_WAIT 512U
1004 # define KMP_INIT_WAIT 1024U
1005 # define KMP_NEXT_WAIT 512U
1006 #elif KMP_OS_FREEBSD
1008 # define KMP_INIT_WAIT 1024U
1009 # define KMP_NEXT_WAIT 512U
1012 #if KMP_ARCH_X86 || KMP_ARCH_X86_64
1013 typedef struct kmp_cpuid {
1019 extern void __kmp_x86_cpuid(
int mode,
int mode2,
struct kmp_cpuid *p );
1021 extern void __kmp_x86_pause(
void );
/* Spin-wait pause implemented as _mm_delay_32( 100 ).
   (The stray ';' that followed the function body was an empty file-scope declaration and has been removed.) */
static void __kmp_x86_pause( void ) { _mm_delay_32( 100 ); }
/* Spin-wait pause implemented with the _mm_pause() intrinsic.
   (The stray ';' that followed the function body was an empty file-scope declaration and has been removed.) */
static void __kmp_x86_pause( void ) { _mm_pause(); }
1027 # define KMP_CPU_PAUSE() __kmp_x86_pause()
1028 #elif KMP_ARCH_PPC64
1029 # define KMP_PPC64_PRI_LOW() __asm__ volatile ("or 1, 1, 1")
1030 # define KMP_PPC64_PRI_MED() __asm__ volatile ("or 2, 2, 2")
1031 # define KMP_PPC64_PRI_LOC_MB() __asm__ volatile ("" : : : "memory")
1032 # define KMP_CPU_PAUSE() do { KMP_PPC64_PRI_LOW(); KMP_PPC64_PRI_MED(); KMP_PPC64_PRI_LOC_MB(); } while (0)
1034 # define KMP_CPU_PAUSE()
/* Spin/yield helpers. All of them expand to braced blocks (statements, not expressions), and
   `count` must be a modifiable lvalue. */
/* Load the spin countdown with its initial value, __kmp_yield_init. */
1037 #define KMP_INIT_YIELD(count) { (count) = __kmp_yield_init; }
/* Issue a CPU pause, then call __kmp_yield() with the given condition. */
1039 #define KMP_YIELD(cond) { KMP_CPU_PAUSE(); __kmp_yield( (cond) ); }
/* Pause and decrement the countdown by 2; only when it reaches exactly 0, perform KMP_YIELD(cond)
   and reload the countdown from __kmp_yield_next.
   NOTE(review): an odd starting count would step over 0 - presumably the init/next values are kept even; confirm. */
1044 #define KMP_YIELD_WHEN(cond,count) { KMP_CPU_PAUSE(); (count) -= 2; \
1045 if (!(count)) { KMP_YIELD(cond); (count) = __kmp_yield_next; } }
/* Same countdown as KMP_YIELD_WHEN, but the yield is requested with a constant condition of 1. */
1046 #define KMP_YIELD_SPIN(count) { KMP_CPU_PAUSE(); (count) -=2; \
1047 if (!(count)) { KMP_YIELD(1); (count) = __kmp_yield_next; } }
1068 ct_ordered_in_parallel,
1070 ct_ordered_in_taskq,
1077 # define IS_CONS_TYPE_TASKQ( ct ) ( ((int)(ct)) >= ((int)ct_taskq) && ((int)(ct)) <= ((int)ct_task_ordered) )
1078 # define IS_CONS_TYPE_ORDERED( ct ) ((ct) == ct_pdo_ordered || (ct) == ct_task_ordered)
1082 enum cons_type type;
1084 kmp_user_lock_p name;
1087 struct cons_header {
1088 int p_top, w_top, s_top;
1089 int stack_size, stack_top;
1090 struct cons_data *stack_data;
1093 struct kmp_region_info {
1095 int offset[KMP_MAX_FIELDS];
1096 int length[KMP_MAX_FIELDS];
1104 typedef HANDLE kmp_thread_t;
1105 typedef DWORD kmp_key_t;
1109 typedef pthread_t kmp_thread_t;
1110 typedef pthread_key_t kmp_key_t;
1113 extern kmp_key_t __kmp_gtid_threadprivate_key;
1115 typedef struct kmp_sys_info {
1126 typedef struct kmp_cpuinfo {
1134 int cpu_stackoffset;
1138 kmp_uint64 frequency;
1144 struct tv_threadprivate {
1151 struct tv_data *next;
1154 struct tv_threadprivate tp;
1158 extern kmp_key_t __kmp_tv_key;
1167 typedef int kmp_itt_mark_t;
1168 #define KMP_ITT_DEBUG 0
/* Three quarters of nslots, computed as (nslots * 3) / 4 with integer truncation. */
1177 #define HIGH_WATER_MARK(nslots) (((nslots) * 3) / 4)
1178 #define __KMP_TASKQ_THUNKS_PER_TH 1
1182 #define TQF_IS_ORDERED 0x0001
1183 #define TQF_IS_LASTPRIVATE 0x0002
1184 #define TQF_IS_NOWAIT 0x0004
1185 #define TQF_HEURISTICS 0x0008
1186 #define TQF_INTERFACE_RESERVED1 0x0010
1187 #define TQF_INTERFACE_RESERVED2 0x0020
1188 #define TQF_INTERFACE_RESERVED3 0x0040
1189 #define TQF_INTERFACE_RESERVED4 0x0080
1191 #define TQF_INTERFACE_FLAGS 0x00ff
1193 #define TQF_IS_LAST_TASK 0x0100
1194 #define TQF_TASKQ_TASK 0x0200
1195 #define TQF_RELEASE_WORKERS 0x0400
1196 #define TQF_ALL_TASKS_QUEUED 0x0800
1197 #define TQF_PARALLEL_CONTEXT 0x1000
1198 #define TQF_DEALLOCATED 0x2000
1200 #define TQF_INTERNAL_FLAGS 0x3f00
1202 typedef struct KMP_ALIGN_CACHE kmpc_aligned_int32_t {
1204 } kmpc_aligned_int32_t;
1206 typedef struct KMP_ALIGN_CACHE kmpc_aligned_queue_slot_t {
1207 struct kmpc_thunk_t *qs_thunk;
1208 } kmpc_aligned_queue_slot_t;
1210 typedef struct kmpc_task_queue_t {
1212 kmp_lock_t tq_link_lck;
1214 struct kmpc_task_queue_t *tq_parent;
1215 struct kmpc_task_queue_t *tq_next_free;
1217 volatile struct kmpc_task_queue_t *tq_first_child;
1218 struct kmpc_task_queue_t *tq_next_child;
1219 struct kmpc_task_queue_t *tq_prev_child;
1220 volatile kmp_int32 tq_ref_count;
1225 struct kmpc_aligned_shared_vars_t *tq_shareds;
1229 kmp_uint32 tq_tasknum_queuing;
1230 volatile kmp_uint32 tq_tasknum_serving;
1233 kmp_lock_t tq_free_thunks_lck;
1234 struct kmpc_thunk_t *tq_free_thunks;
1235 struct kmpc_thunk_t *tq_thunk_space;
1238 kmp_lock_t tq_queue_lck;
1239 kmpc_aligned_queue_slot_t *tq_queue;
1240 volatile struct kmpc_thunk_t *tq_taskq_slot;
1241 kmp_int32 tq_nslots;
1244 volatile kmp_int32 tq_nfull;
1246 volatile kmp_int32 tq_flags;
1249 struct kmpc_aligned_int32_t *tq_th_thunks;
1254 } kmpc_task_queue_t;
1256 typedef void (*kmpc_task_t) (kmp_int32 global_tid,
struct kmpc_thunk_t *thunk);
1259 typedef struct kmpc_shared_vars_t {
1260 kmpc_task_queue_t *sv_queue;
1262 } kmpc_shared_vars_t;
1264 typedef struct KMP_ALIGN_CACHE kmpc_aligned_shared_vars_t {
1265 volatile struct kmpc_shared_vars_t *ai_data;
1266 } kmpc_aligned_shared_vars_t;
1269 typedef struct kmpc_thunk_t {
1271 kmpc_shared_vars_t *th_shareds;
1272 struct kmpc_thunk_t *th_next_free;
1274 kmpc_task_t th_task;
1275 struct kmpc_thunk_t *th_encl_thunk;
1277 kmp_int32 th_status;
1278 kmp_uint32 th_tasknum;
1282 typedef struct KMP_ALIGN_CACHE kmp_taskq {
1283 int tq_curr_thunk_capacity;
1285 kmpc_task_queue_t *tq_root;
1286 kmp_int32 tq_global_flags;
1288 kmp_lock_t tq_freelist_lck;
1289 kmpc_task_queue_t *tq_freelist;
1291 kmpc_thunk_t **tq_curr_thunk;
1297 typedef kmp_int32 kmp_critical_name[8];
1307 typedef void (*
kmpc_micro) ( kmp_int32 * global_tid, kmp_int32 * bound_tid, ... );
1308 typedef void (*kmpc_micro_bound) ( kmp_int32 * bound_tid, kmp_int32 * bound_nth, ... );
1323 typedef void *(*kmpc_ctor) (
void *);
1334 typedef void *(*kmpc_cctor) (
void *,
void *);
1344 typedef void *(*kmpc_ctor_vec) (
void *, size_t);
1356 typedef void *(*kmpc_cctor_vec) (
void *,
void *, size_t);
1366 typedef struct kmp_cached_addr {
1368 struct kmp_cached_addr *next;
1369 } kmp_cached_addr_t;
1371 struct private_data {
1372 struct private_data *next;
1378 struct private_common {
1379 struct private_common *next;
1380 struct private_common *link;
1386 struct shared_common
1388 struct shared_common *next;
1389 struct private_data *pod_init;
/* Hash table geometry: 2^KMP_HASH_TABLE_LOG2 (512) buckets. */
#define KMP_HASH_TABLE_LOG2     9
#define KMP_HASH_TABLE_SIZE     (1 << KMP_HASH_TABLE_LOG2)
/* Number of low bits discarded before masking. */
#define KMP_HASH_SHIFT          3
/*
 * Bucket index for address/value x: convert to kmp_uintptr_t, drop the low
 * KMP_HASH_SHIFT bits, and keep the low KMP_HASH_TABLE_LOG2 bits of the rest.
 * x is parenthesized inside the cast so that an expression argument such as
 * `ptr + n` is converted as a whole rather than having the cast bind to `ptr` only.
 */
#define KMP_HASH(x)             ((((kmp_uintptr_t)(x)) >> KMP_HASH_SHIFT) & (KMP_HASH_TABLE_SIZE-1))
1414 struct common_table {
1415 struct private_common *data[ KMP_HASH_TABLE_SIZE ];
1418 struct shared_table {
1419 struct shared_common *data[ KMP_HASH_TABLE_SIZE ];
1424 #ifdef KMP_STATIC_STEAL_ENABLED
1425 typedef struct KMP_ALIGN_CACHE dispatch_private_info32 {
1432 kmp_int32 static_steal_counter;
1440 struct KMP_ALIGN( 32 ) {
1447 kmp_uint32 ordered_lower;
1448 kmp_uint32 ordered_upper;
1453 kmp_int32 last_upper;
1455 } dispatch_private_info32_t;
1457 typedef struct KMP_ALIGN_CACHE dispatch_private_info64 {
1464 kmp_int64 static_steal_counter;
1474 struct KMP_ALIGN( 32 ) {
1481 kmp_uint64 ordered_lower;
1482 kmp_uint64 ordered_upper;
1487 kmp_int64 last_upper;
1489 } dispatch_private_info64_t;
1491 typedef struct KMP_ALIGN_CACHE dispatch_private_info32 {
1504 kmp_uint32 ordered_lower;
1505 kmp_uint32 ordered_upper;
1507 kmp_int32 last_upper;
1509 } dispatch_private_info32_t;
1511 typedef struct KMP_ALIGN_CACHE dispatch_private_info64 {
1525 kmp_uint64 ordered_lower;
1526 kmp_uint64 ordered_upper;
1528 kmp_int64 last_upper;
1530 } dispatch_private_info64_t;
1533 typedef struct KMP_ALIGN_CACHE dispatch_private_info {
1534 union private_info {
1535 dispatch_private_info32_t p32;
1536 dispatch_private_info64_t p64;
1540 kmp_int32 ordered_bumped;
1541 kmp_int32 ordered_dummy[KMP_MAX_ORDERED-3];
1542 struct dispatch_private_info * next;
1544 kmp_int32 type_size;
1545 enum cons_type pushed_ws;
1546 } dispatch_private_info_t;
1548 typedef struct dispatch_shared_info32 {
1551 volatile kmp_uint32 iteration;
1552 volatile kmp_uint32 num_done;
1553 volatile kmp_uint32 ordered_iteration;
1554 kmp_int32 ordered_dummy[KMP_MAX_ORDERED-1];
1555 } dispatch_shared_info32_t;
1557 typedef struct dispatch_shared_info64 {
1560 volatile kmp_uint64 iteration;
1561 volatile kmp_uint64 num_done;
1562 volatile kmp_uint64 ordered_iteration;
1563 kmp_int64 ordered_dummy[KMP_MAX_ORDERED-1];
1564 } dispatch_shared_info64_t;
1566 typedef struct dispatch_shared_info {
1568 dispatch_shared_info32_t s32;
1569 dispatch_shared_info64_t s64;
1572 volatile kmp_uint32 buffer_index;
1573 } dispatch_shared_info_t;
1575 typedef struct kmp_disp {
1577 void (*th_deo_fcn)(
int * gtid,
int * cid,
ident_t *);
1579 void (*th_dxo_fcn)(
int * gtid,
int * cid,
ident_t *);
1581 dispatch_shared_info_t *th_dispatch_sh_current;
1582 dispatch_private_info_t *th_dispatch_pr_current;
1584 dispatch_private_info_t *th_disp_buffer;
1585 kmp_int32 th_disp_index;
1586 void* dummy_padding[2];
1587 #if KMP_USE_INTERNODE_ALIGNMENT
1588 char more_padding[INTERNODE_CACHE_LINE];
/* Initial value of a barrier state word. */
1598 #define KMP_INIT_BARRIER_STATE 0
/* Bit positions inside a barrier state word: bit 0 = sleep, bit 1 = unused, bit 2 = bump. */
1599 #define KMP_BARRIER_SLEEP_BIT 0
1600 #define KMP_BARRIER_UNUSED_BIT 1
1601 #define KMP_BARRIER_BUMP_BIT 2
/* The corresponding single-bit masks as kmp_uint: 1, 2 and 4. KMP_BARRIER_STATE_BUMP is the
   lowest value above the two flag bits (presumably the per-barrier increment - confirm at use sites). */
1603 #define KMP_BARRIER_SLEEP_STATE ((kmp_uint) (1 << KMP_BARRIER_SLEEP_BIT))
1604 #define KMP_BARRIER_UNUSED_STATE ((kmp_uint) (1 << KMP_BARRIER_UNUSED_BIT))
1605 #define KMP_BARRIER_STATE_BUMP ((kmp_uint) (1 << KMP_BARRIER_BUMP_BIT))
1607 #if (KMP_BARRIER_SLEEP_BIT >= KMP_BARRIER_BUMP_BIT)
1608 # error "Barrier sleep bit must be smaller than barrier bump bit"
1610 #if (KMP_BARRIER_UNUSED_BIT >= KMP_BARRIER_BUMP_BIT)
1611 # error "Barrier unused bit must be smaller than barrier bump bit"
1615 #define KMP_BARRIER_NOT_WAITING 0 // Normal state; worker not in wait_sleep
1616 #define KMP_BARRIER_OWN_FLAG 1 // Normal state; worker waiting on own b_go flag in release
1617 #define KMP_BARRIER_PARENT_FLAG 2 // Special state; worker waiting on parent's b_go flag in release
1618 #define KMP_BARRIER_SWITCH_TO_OWN_FLAG 3 // Special state; tells worker to shift from parent to own b_go
1619 #define KMP_BARRIER_SWITCHING 4 // Special state; worker resets appropriate flag on wake-up
1622 bs_plain_barrier = 0,
1623 bs_forkjoin_barrier,
1624 #if KMP_FAST_REDUCTION_BARRIER
1625 bs_reduction_barrier,
1626 #endif // KMP_FAST_REDUCTION_BARRIER
1631 #if !KMP_FAST_REDUCTION_BARRIER
1632 #define bs_reduction_barrier bs_plain_barrier
1633 #endif // KMP_FAST_REDUCTION_BARRIER
1635 typedef enum kmp_bar_pat {
1639 bp_hierarchical_bar = 3,
1643 # define KMP_BARRIER_ICV_PUSH 1
1646 typedef struct kmp_internal_control {
1647 int serial_nesting_level;
1654 int max_active_levels;
1655 kmp_r_sched_t sched;
1657 kmp_proc_bind_t proc_bind;
1658 #endif // OMP_40_ENABLED
1659 struct kmp_internal_control *next;
1660 } kmp_internal_control_t;
1663 copy_icvs( kmp_internal_control_t *dst, kmp_internal_control_t *src ) {
1668 typedef struct KMP_ALIGN_CACHE kmp_bstate {
1673 kmp_internal_control_t th_fixed_icvs;
1675 volatile kmp_uint64 b_go;
1676 KMP_ALIGN_CACHE
volatile kmp_uint64 b_arrived;
1677 kmp_uint32 *skip_per_level;
1678 kmp_uint32 my_level;
1679 kmp_int32 parent_tid;
1682 struct kmp_bstate *parent_bar;
1684 kmp_uint64 leaf_state;
1686 kmp_uint8 base_leaf_kids;
1687 kmp_uint8 leaf_kids;
1689 kmp_uint8 wait_flag;
1690 kmp_uint8 use_oncore_barrier;
1694 KMP_ALIGN_CACHE kmp_uint b_worker_arrived;
1698 union KMP_ALIGN_CACHE kmp_barrier_union {
1700 char b_pad[ KMP_PAD(kmp_bstate_t, CACHE_LINE) ];
1704 typedef union kmp_barrier_union kmp_balign_t;
1707 union KMP_ALIGN_CACHE kmp_barrier_team_union {
1709 char b_pad[ CACHE_LINE ];
1711 kmp_uint64 b_arrived;
1716 kmp_uint b_master_arrived;
1717 kmp_uint b_team_arrived;
1722 typedef union kmp_barrier_team_union kmp_balign_team_t;
1732 typedef struct kmp_win32_mutex
1735 CRITICAL_SECTION cs;
1736 } kmp_win32_mutex_t;
1738 typedef struct kmp_win32_cond
1744 kmp_win32_mutex_t waiters_count_lock_;
1752 int wait_generation_count_;
1762 union KMP_ALIGN_CACHE kmp_cond_union {
1764 char c_pad[ CACHE_LINE ];
1765 pthread_cond_t c_cond;
1768 typedef union kmp_cond_union kmp_cond_align_t;
1770 union KMP_ALIGN_CACHE kmp_mutex_union {
1772 char m_pad[ CACHE_LINE ];
1773 pthread_mutex_t m_mutex;
1776 typedef union kmp_mutex_union kmp_mutex_align_t;
1780 typedef struct kmp_desc_base {
1782 size_t ds_stacksize;
1784 kmp_thread_t ds_thread;
1785 volatile int ds_tid;
1788 volatile int ds_alive;
1806 typedef union KMP_ALIGN_CACHE kmp_desc {
1808 char ds_pad[ KMP_PAD(kmp_desc_base_t, CACHE_LINE) ];
1813 typedef struct kmp_local {
1814 volatile int this_construct;
1819 #if ! USE_CMP_XCHG_FOR_BGET
1820 #ifdef USE_QUEUING_LOCK_FOR_BGET
1821 kmp_lock_t bget_lock;
1823 kmp_bootstrap_lock_t bget_lock;
1830 struct tv_data *tv_data;
1833 PACKED_REDUCTION_METHOD_T packed_reduction_method;
1837 #define get__blocktime( xteam, xtid ) ((xteam)->t.t_threads[(xtid)]->th.th_current_task->td_icvs.blocktime)
1838 #define get__bt_set( xteam, xtid ) ((xteam)->t.t_threads[(xtid)]->th.th_current_task->td_icvs.bt_set)
1839 #define get__bt_intervals( xteam, xtid ) ((xteam)->t.t_threads[(xtid)]->th.th_current_task->td_icvs.bt_intervals)
1841 #define get__nested_2(xteam,xtid) ((xteam)->t.t_threads[(xtid)]->th.th_current_task->td_icvs.nested)
1842 #define get__dynamic_2(xteam,xtid) ((xteam)->t.t_threads[(xtid)]->th.th_current_task->td_icvs.dynamic)
1843 #define get__nproc_2(xteam,xtid) ((xteam)->t.t_threads[(xtid)]->th.th_current_task->td_icvs.nproc)
1844 #define get__sched_2(xteam,xtid) ((xteam)->t.t_threads[(xtid)]->th.th_current_task->td_icvs.sched)
1846 #define set__blocktime_team( xteam, xtid, xval ) \
1847 ( ( (xteam)->t.t_threads[(xtid)]->th.th_current_task->td_icvs.blocktime ) = (xval) )
1849 #define set__bt_intervals_team( xteam, xtid, xval ) \
1850 ( ( (xteam)->t.t_threads[(xtid)]->th.th_current_task->td_icvs.bt_intervals ) = (xval) )
1852 #define set__bt_set_team( xteam, xtid, xval ) \
1853 ( ( (xteam)->t.t_threads[(xtid)]->th.th_current_task->td_icvs.bt_set ) = (xval) )
1856 #define set__nested( xthread, xval ) \
1857 ( ( (xthread)->th.th_current_task->td_icvs.nested ) = (xval) )
1858 #define get__nested( xthread ) \
1859 ( ( (xthread)->th.th_current_task->td_icvs.nested ) ? (FTN_TRUE) : (FTN_FALSE) )
1861 #define set__dynamic( xthread, xval ) \
1862 ( ( (xthread)->th.th_current_task->td_icvs.dynamic ) = (xval) )
1863 #define get__dynamic( xthread ) \
1864 ( ( (xthread)->th.th_current_task->td_icvs.dynamic ) ? (FTN_TRUE) : (FTN_FALSE) )
1866 #define set__nproc( xthread, xval ) \
1867 ( ( (xthread)->th.th_current_task->td_icvs.nproc ) = (xval) )
1869 #define set__max_active_levels( xthread, xval ) \
1870 ( ( (xthread)->th.th_current_task->td_icvs.max_active_levels ) = (xval) )
1872 #define set__sched( xthread, xval ) \
1873 ( ( (xthread)->th.th_current_task->td_icvs.sched ) = (xval) )
1877 #define set__proc_bind( xthread, xval ) \
1878 ( ( (xthread)->th.th_current_task->td_icvs.proc_bind ) = (xval) )
1879 #define get__proc_bind( xthread ) \
1880 ( (xthread)->th.th_current_task->td_icvs.proc_bind )
1889 typedef enum kmp_tasking_mode {
1890 tskm_immediate_exec = 0,
1891 tskm_extra_barrier = 1,
1892 tskm_task_teams = 2,
1894 } kmp_tasking_mode_t;
1896 extern kmp_tasking_mode_t __kmp_tasking_mode;
1897 extern kmp_int32 __kmp_task_stealing_constraint;
/*
 * Convert between a kmp_task_t pointer and its kmp_taskdata_t pointer.
 * The arithmetic places the kmp_taskdata_t immediately before the kmp_task_t:
 *   KMP_TASK_TO_TASKDATA(task) - reinterpret task as kmp_taskdata_t * and step back one element;
 *   KMP_TASKDATA_TO_TASK(td)   - step forward one kmp_taskdata_t and reinterpret as kmp_task_t *.
 * Arguments and the whole expansion are parenthesized so that expression
 * arguments and postfix uses such as KMP_TASKDATA_TO_TASK(td)->routine
 * apply to the converted pointer.
 */
#define KMP_TASK_TO_TASKDATA(task)     (((kmp_taskdata_t *)(task)) - 1)
#define KMP_TASKDATA_TO_TASK(taskdata) ((kmp_task_t *)((taskdata) + 1))
1905 #define KMP_TASKING_ENABLED(task_team) \
1906 (TCR_SYNC_4((task_team)->tt.tt_found_tasks) == TRUE)
1914 typedef kmp_int32 (* kmp_routine_entry_t)( kmp_int32,
void * );
1919 typedef struct kmp_task {
1921 kmp_routine_entry_t routine;
1924 kmp_routine_entry_t destructors;
1925 #endif // OMP_40_ENABLED
1934 typedef struct kmp_taskgroup {
1936 kmp_int32 cancel_request;
1937 struct kmp_taskgroup *parent;
/*
 * Forward typedefs for the task-dependence types so that they can refer to
 * one another by pointer before their bodies are defined.  kmp_depnode is a
 * union; kmp_depnode_list and kmp_dephash_entry are structs.
 */
1942 typedef union kmp_depnode kmp_depnode_t;
1943 typedef struct kmp_depnode_list kmp_depnode_list_t;
1944 typedef struct kmp_dephash_entry kmp_dephash_entry_t;
1946 typedef struct kmp_depend_info {
1947 kmp_intptr_t base_addr;
1953 } kmp_depend_info_t;
1955 struct kmp_depnode_list {
1956 kmp_depnode_t * node;
1957 kmp_depnode_list_t * next;
1960 typedef struct kmp_base_depnode {
1961 kmp_depnode_list_t * successors;
1966 #if KMP_SUPPORT_GRAPH_OUTPUT
1970 volatile kmp_int32 npredecessors;
1971 volatile kmp_int32 nrefs;
1972 } kmp_base_depnode_t;
1974 union KMP_ALIGN_CACHE kmp_depnode {
1976 char dn_pad[ KMP_PAD(kmp_base_depnode_t, CACHE_LINE) ];
1977 kmp_base_depnode_t dn;
1980 struct kmp_dephash_entry {
1982 kmp_depnode_t * last_out;
1983 kmp_depnode_list_t * last_ins;
1984 kmp_dephash_entry_t * next_in_bucket;
1987 typedef struct kmp_dephash {
1988 kmp_dephash_entry_t ** buckets;
1990 kmp_uint32 nelements;
1991 kmp_uint32 nconflicts;
1997 #ifdef BUILD_TIED_TASK_STACK
/*
 * One block of the tied-task stack (only built when BUILD_TIED_TASK_STACK is
 * defined).  Blocks hold a fixed number of task-data pointers and carry
 * forward and backward links to blocks of the same type.
 */
2000 typedef struct kmp_stack_block {
/* TASK_STACK_BLOCK_SIZE task-data pointer slots (1 << TASK_STACK_BLOCK_BITS entries). */
2001 kmp_taskdata_t * sb_block[ TASK_STACK_BLOCK_SIZE ];
/* Link to the next block. */
2002 struct kmp_stack_block * sb_next;
/* Link to the previous block. */
2003 struct kmp_stack_block * sb_prev;
2004 } kmp_stack_block_t;
2006 typedef struct kmp_task_stack {
2007 kmp_stack_block_t ts_first_block;
2008 kmp_taskdata_t ** ts_top;
2009 kmp_int32 ts_entries;
2012 #endif // BUILD_TIED_TASK_STACK
2014 typedef struct kmp_tasking_flags {
2016 unsigned tiedness : 1;
2018 unsigned merged_if0 : 1;
2020 unsigned destructors_thunk : 1;
2023 unsigned reserved : 11;
2025 unsigned reserved : 12;
2027 #else // OMP_40_ENABLED
2028 unsigned reserved : 13;
2029 #endif // OMP_40_ENABLED
2032 unsigned tasktype : 1;
2033 unsigned task_serial : 1;
2034 unsigned tasking_ser : 1;
2035 unsigned team_serial : 1;
2038 unsigned started : 1;
2039 unsigned executing : 1;
2040 unsigned complete : 1;
2042 unsigned native : 1;
2043 unsigned reserved31 : 7;
2045 } kmp_tasking_flags_t;
2048 struct kmp_taskdata {
2049 kmp_int32 td_task_id;
2050 kmp_tasking_flags_t td_flags;
2051 kmp_team_t * td_team;
2052 kmp_info_p * td_alloc_thread;
2054 kmp_taskdata_t * td_parent;
2059 kmp_uint32 td_taskwait_counter;
2060 kmp_int32 td_taskwait_thread;
2061 KMP_ALIGN_CACHE kmp_internal_control_t td_icvs;
2062 volatile kmp_uint32 td_allocated_child_tasks;
2063 volatile kmp_uint32 td_incomplete_child_tasks;
2065 kmp_taskgroup_t * td_taskgroup;
2066 kmp_dephash_t * td_dephash;
2067 kmp_depnode_t * td_depnode;
2070 ompt_task_info_t ompt_task_info;
2075 kmp_uint32 td_dummy[2];
2080 KMP_BUILD_ASSERT(
sizeof(kmp_taskdata_t) %
sizeof(
void *) == 0 );
/*
 * Per-thread tasking data: a back-pointer to the thread plus the state of a
 * deque of task-data pointers (lock, storage, head/tail indices, count).
 * Wrapped by the cache-aligned union kmp_thread_data.
 */
2083 typedef struct kmp_base_thread_data {
/* Thread descriptor this record is associated with. */
2084 kmp_info_p * td_thr;
/* Bootstrap lock; presumably guards the deque fields below - confirm against users. */
2086 kmp_bootstrap_lock_t td_deque_lock;
/* Deque storage: array of kmp_taskdata_t pointers. */
2087 kmp_taskdata_t ** td_deque;
/* Head index into td_deque. */
2088 kmp_uint32 td_deque_head;
/* Tail index into td_deque. */
2089 kmp_uint32 td_deque_tail;
/* Number of tasks currently counted in the deque. */
2090 kmp_int32 td_deque_ntasks;
/* NOTE(review): name suggests the id of the thread last stolen from - confirm. */
2092 kmp_int32 td_deque_last_stolen;
2093 #ifdef BUILD_TIED_TASK_STACK
/* Stack of tied tasks; only present in BUILD_TIED_TASK_STACK builds. */
2094 kmp_task_stack_t td_susp_tied_tasks;
2095 #endif // BUILD_TIED_TASK_STACK
2096 } kmp_base_thread_data_t;
/*
 * Cache-aligned wrapper around kmp_base_thread_data_t.  The char array
 * overlays the real data and is sized by KMP_PAD(..., CACHE_LINE).
 */
2098 typedef union KMP_ALIGN_CACHE kmp_thread_data {
/* The actual per-thread tasking data. */
2099 kmp_base_thread_data_t td;
/* Padding member; only its size matters. */
2101 char td_pad[ KMP_PAD(kmp_base_thread_data_t, CACHE_LINE) ];
2102 } kmp_thread_data_t;
2106 typedef struct kmp_base_task_team {
2107 kmp_bootstrap_lock_t tt_threads_lock;
2109 kmp_task_team_t * tt_next;
2110 kmp_thread_data_t * tt_threads_data;
2112 kmp_int32 tt_found_tasks;
2115 kmp_int32 tt_max_threads;
2117 kmp_int32 tt_found_proxy_tasks;
2121 volatile kmp_uint32 tt_unfinished_threads;
2124 volatile kmp_uint32 tt_active;
2127 #if KMP_USE_INTERNODE_ALIGNMENT
2128 kmp_int32 tt_padme[INTERNODE_CACHE_LINE/
sizeof(kmp_int32)];
2131 volatile kmp_uint32 tt_ref_ct;
2133 } kmp_base_task_team_t;
2135 union KMP_ALIGN_CACHE kmp_task_team {
2136 kmp_base_task_team_t tt;
2138 char tt_pad[ KMP_PAD(kmp_base_task_team_t, CACHE_LINE) ];
2141 #if ( USE_FAST_MEMORY == 3 ) || ( USE_FAST_MEMORY == 5 )
2143 typedef struct kmp_free_list {
2144 void *th_free_list_self;
2145 void *th_free_list_sync;
2146 void *th_free_list_other;
2149 #if KMP_NESTED_HOT_TEAMS
2152 typedef struct kmp_hot_team_ptr {
2153 kmp_team_p *hot_team;
2154 kmp_int32 hot_team_nth;
2155 } kmp_hot_team_ptr_t;
2158 typedef struct kmp_teams_size {
2168 typedef struct KMP_ALIGN_CACHE kmp_base_info {
2176 kmp_team_p *th_team;
2177 kmp_root_p *th_root;
2178 kmp_info_p *th_next_pool;
2179 kmp_disp_t *th_dispatch;
2185 kmp_info_p *th_team_master;
2186 int th_team_serialized;
2188 microtask_t th_teams_microtask;
2197 int th_team_bt_intervals;
2201 #if KMP_AFFINITY_SUPPORTED
2202 kmp_affin_mask_t *th_affin_mask;
2208 KMP_ALIGN_CACHE
int th_set_nproc;
2209 #if KMP_NESTED_HOT_TEAMS
2210 kmp_hot_team_ptr_t *th_hot_teams;
2213 kmp_proc_bind_t th_set_proc_bind;
2214 kmp_teams_size_t th_teams_size;
2215 # if KMP_AFFINITY_SUPPORTED
2216 int th_current_place;
2223 kmp_uint64 th_bar_arrive_time;
2224 kmp_uint64 th_bar_min_time;
2225 kmp_uint64 th_frame_time;
2226 kmp_uint64 th_frame_time_serialized;
2228 kmp_local_t th_local;
2229 struct private_common *th_pri_head;
2236 KMP_ALIGN_CACHE kmp_team_p *th_serial_team;
2239 ompt_thread_info_t ompt_thread_info;
2243 struct common_table *th_pri_common;
2245 volatile kmp_uint32 th_spin_here;
2248 volatile void *th_sleep_loc;
2257 kmp_task_team_t * th_task_team;
2258 kmp_taskdata_t * th_current_task;
2259 kmp_uint8 th_task_state;
2260 kmp_uint8 * th_task_state_memo_stack;
2261 kmp_uint32 th_task_state_top;
2262 kmp_uint32 th_task_state_stack_sz;
2268 kmp_uint8 th_active_in_pool;
2274 struct cons_header * th_cons;
2279 KMP_ALIGN_CACHE kmp_balign_t th_bar[ bs_last_barrier ];
2281 KMP_ALIGN_CACHE
volatile kmp_int32 th_next_waiting;
2283 #if ( USE_FAST_MEMORY == 3 ) || ( USE_FAST_MEMORY == 5 )
2285 kmp_free_list_t th_free_lists[NUM_LISTS];
2289 kmp_win32_cond_t th_suspend_cv;
2290 kmp_win32_mutex_t th_suspend_mx;
2291 int th_suspend_init;
2294 kmp_cond_align_t th_suspend_cv;
2295 kmp_mutex_align_t th_suspend_mx;
2296 int th_suspend_init_count;
2300 kmp_itt_mark_t th_itt_mark_single;
2303 #if KMP_STATS_ENABLED
2304 kmp_stats_list* th_stats;
2308 typedef union KMP_ALIGN_CACHE kmp_info {
2310 char th_pad[ KMP_PAD(kmp_base_info_t, CACHE_LINE) ];
2317 typedef struct kmp_base_data {
2318 volatile kmp_uint32 t_value;
2321 typedef union KMP_ALIGN_CACHE kmp_sleep_team {
2323 char dt_pad[ KMP_PAD(kmp_base_data_t, CACHE_LINE) ];
2327 typedef union KMP_ALIGN_CACHE kmp_ordered_team {
2329 char dt_pad[ KMP_PAD(kmp_base_data_t, CACHE_LINE) ];
2331 } kmp_ordered_team_t;
/* Pointer to a launch routine: receives a global thread id, returns an int. */
typedef int (*launch_t)(int gtid);
2336 #define KMP_MIN_MALLOC_ARGV_ENTRIES 100
2341 #if KMP_ARCH_X86 || KMP_ARCH_X86_64
2342 # define KMP_INLINE_ARGV_BYTES ( 4 * CACHE_LINE - ( ( 3 * KMP_PTR_SKIP + 2 * sizeof(int) + 2 * sizeof(kmp_int8) + sizeof(kmp_int16) + sizeof(kmp_uint32) ) % CACHE_LINE ) )
2344 # define KMP_INLINE_ARGV_BYTES ( 2 * CACHE_LINE - ( ( 3 * KMP_PTR_SKIP + 2 * sizeof(int) ) % CACHE_LINE ) )
2346 #define KMP_INLINE_ARGV_ENTRIES (int)( KMP_INLINE_ARGV_BYTES / KMP_PTR_SKIP )
2348 typedef struct KMP_ALIGN_CACHE kmp_base_team {
2350 KMP_ALIGN_CACHE kmp_ordered_team_t t_ordered;
2351 kmp_balign_team_t t_bar[ bs_last_barrier ];
2352 volatile int t_construct;
2353 kmp_lock_t t_single_lock;
2356 KMP_ALIGN_CACHE
int t_master_tid;
2357 int t_master_this_cons;
2359 kmp_team_p *t_parent;
2360 kmp_team_p *t_next_pool;
2361 kmp_disp_t *t_dispatch;
2362 kmp_task_team_t *t_task_team[2];
2364 kmp_proc_bind_t t_proc_bind;
2365 #endif // OMP_40_ENABLED
2367 kmp_uint64 t_region_time;
2371 KMP_ALIGN_CACHE
void **t_argv;
2378 ompt_team_info_t ompt_team_info;
2379 ompt_lw_taskteam_t *ompt_serialized_team_info;
2382 #if KMP_ARCH_X86 || KMP_ARCH_X86_64
2383 kmp_int8 t_fp_control_saved;
2385 kmp_int16 t_x87_fpu_control_word;
2389 void *t_inline_argv[ KMP_INLINE_ARGV_ENTRIES ];
2391 KMP_ALIGN_CACHE kmp_info_t **t_threads;
2395 dispatch_shared_info_t *t_disp_buffer;
2399 kmp_r_sched_t t_sched;
2400 #if OMP_40_ENABLED && KMP_AFFINITY_SUPPORTED
2403 #endif // OMP_40_ENABLED && KMP_AFFINITY_SUPPORTED
2407 #if KMP_ARCH_X86 || KMP_ARCH_X86_64
2411 char dummy_padding[1024];
2413 KMP_ALIGN_CACHE kmp_taskdata_t *t_implicit_task_taskdata;
2414 kmp_internal_control_t *t_control_stack_top;
2417 kmp_int32 t_cancel_request;
2419 int t_master_active;
2420 kmp_taskq_t t_taskq;
2421 void *t_copypriv_data;
2422 kmp_uint32 t_copyin_counter;
2428 union KMP_ALIGN_CACHE kmp_team {
2431 char t_pad[ KMP_PAD(kmp_base_team_t, CACHE_LINE) ];
/*
 * Cache-aligned union used for the g_time member of kmp_base_global.  The
 * padding array is sized from kmp_base_data_t via KMP_PAD(..., CACHE_LINE).
 */
2435 typedef union KMP_ALIGN_CACHE kmp_time_global {
/* Padding member; only its size matters. */
2437 char dt_pad[ KMP_PAD(kmp_base_data_t, CACHE_LINE) ];
2439 } kmp_time_global_t;
/*
 * Process-wide runtime state, wrapped by the cache-aligned union kmp_global
 * and exposed through the global __kmp_global.
 */
2441 typedef struct kmp_base_global {
/* Global time value (cache-aligned union). */
2443 kmp_time_global_t g_time;
/* Volatile flag; by its name signals that the runtime is aborting - confirm semantics with users. */
2446 volatile int g_abort;
/* Volatile flag; by its name signals that the runtime is finished - confirm semantics with users. */
2447 volatile int g_done;
/* Selected dynamic-adjustment mode (enum dynamic_mode). */
2450 enum dynamic_mode g_dynamic_mode;
2452 } kmp_base_global_t;
2454 typedef union KMP_ALIGN_CACHE kmp_global {
2455 kmp_base_global_t g;
2457 char g_pad[ KMP_PAD(kmp_base_global_t, CACHE_LINE) ];
2461 typedef struct kmp_base_root {
2466 volatile int r_active;
2468 volatile int r_nested;
2471 kmp_team_t *r_root_team;
2472 kmp_team_t *r_hot_team;
2473 kmp_info_t *r_uber_thread;
2474 kmp_lock_t r_begin_lock;
2475 volatile int r_begin;
2479 typedef union KMP_ALIGN_CACHE kmp_root {
2482 char r_pad[ KMP_PAD(kmp_base_root_t, CACHE_LINE) ];
2485 struct fortran_inx_info {
2494 extern int __kmp_settings;
2495 extern int __kmp_duplicate_library_ok;
2497 extern int __kmp_forkjoin_frames;
2498 extern int __kmp_forkjoin_frames_mode;
2500 extern PACKED_REDUCTION_METHOD_T __kmp_force_reduction_method;
2501 extern int __kmp_determ_red;
2504 extern int kmp_a_debug;
2505 extern int kmp_b_debug;
2506 extern int kmp_c_debug;
2507 extern int kmp_d_debug;
2508 extern int kmp_e_debug;
2509 extern int kmp_f_debug;
/* Debug buffer sizing: initial and minimum number of lines. */
2513 #define KMP_DEBUG_BUF_LINES_INIT 512
2514 #define KMP_DEBUG_BUF_LINES_MIN 1
/* Debug buffer sizing: initial and minimum number of characters (presumably per line - confirm). */
2516 #define KMP_DEBUG_BUF_CHARS_INIT 128
2517 #define KMP_DEBUG_BUF_CHARS_MIN 2
/*
 * Debug buffer state, declared here and defined elsewhere.
 * NOTE(review): meanings below are inferred from the names only.
 */
/* Flag controlling use of the debug buffer. */
2519 extern int __kmp_debug_buf;
/* Configured line count. */
2520 extern int __kmp_debug_buf_lines;
/* Configured character count. */
2521 extern int __kmp_debug_buf_chars;
/* Flag related to atomic buffer updates. */
2522 extern int __kmp_debug_buf_atomic;
/* The buffer storage itself. */
2524 extern char *__kmp_debug_buffer;
/* Running count associated with the buffer. */
2525 extern int __kmp_debug_count;
/* Character-count value associated with warnings. */
2526 extern int __kmp_debug_buf_warn_chars;
/*
 * "par_range" settings, declared here and defined elsewhere: an int selector,
 * a routine-name buffer, a file-name buffer, and lower/upper bounds.
 * NOTE(review): how these are interpreted is not visible in this header.
 */
2530 extern int __kmp_par_range;
/* Capacity in bytes of __kmp_par_range_routine. */
2532 #define KMP_PAR_RANGE_ROUTINE_LEN 1024
2533 extern char __kmp_par_range_routine[KMP_PAR_RANGE_ROUTINE_LEN];
/* Capacity in bytes of __kmp_par_range_filename. */
2534 #define KMP_PAR_RANGE_FILENAME_LEN 1024
2535 extern char __kmp_par_range_filename[KMP_PAR_RANGE_FILENAME_LEN];
/* Lower and upper bound of the range. */
2536 extern int __kmp_par_range_lb;
2537 extern int __kmp_par_range_ub;
2541 extern int __kmp_storage_map;
2542 extern int __kmp_storage_map_verbose;
2543 extern int __kmp_storage_map_verbose_specified;
2545 extern kmp_cpuinfo_t __kmp_cpuinfo;
/*
 * Initialisation-state variables, declared here and defined elsewhere.  The
 * __kmp_init_* flags are volatile ints, one per subsystem/stage named in the
 * identifier (serial, gtid, common, middle, parallel, monitor, user locks).
 * NOTE(review): presumably non-zero means "initialised" - confirm at the
 * definition site.
 */
2547 extern volatile int __kmp_init_serial;
2548 extern volatile int __kmp_init_gtid;
2549 extern volatile int __kmp_init_common;
2550 extern volatile int __kmp_init_middle;
2551 extern volatile int __kmp_init_parallel;
2552 extern volatile int __kmp_init_monitor;
2553 extern volatile int __kmp_init_user_locks;
/* Plain (non-volatile) counters and version setting. */
2554 extern int __kmp_init_counter;
2555 extern int __kmp_root_counter;
2556 extern int __kmp_version;
2559 extern kmp_cached_addr_t *__kmp_threadpriv_cache_list;
2562 extern kmp_uint32 __kmp_barrier_gather_bb_dflt;
2563 extern kmp_uint32 __kmp_barrier_release_bb_dflt;
2564 extern kmp_bar_pat_e __kmp_barrier_gather_pat_dflt;
2565 extern kmp_bar_pat_e __kmp_barrier_release_pat_dflt;
2566 extern kmp_uint32 __kmp_barrier_gather_branch_bits [ bs_last_barrier ];
2567 extern kmp_uint32 __kmp_barrier_release_branch_bits [ bs_last_barrier ];
2568 extern kmp_bar_pat_e __kmp_barrier_gather_pattern [ bs_last_barrier ];
2569 extern kmp_bar_pat_e __kmp_barrier_release_pattern [ bs_last_barrier ];
2570 extern char const *__kmp_barrier_branch_bit_env_name [ bs_last_barrier ];
2571 extern char const *__kmp_barrier_pattern_env_name [ bs_last_barrier ];
2572 extern char const *__kmp_barrier_type_name [ bs_last_barrier ];
2573 extern char const *__kmp_barrier_pattern_name [ bp_last_bar ];
2576 extern kmp_bootstrap_lock_t __kmp_initz_lock;
2577 extern kmp_bootstrap_lock_t __kmp_forkjoin_lock;
2578 extern kmp_bootstrap_lock_t __kmp_exit_lock;
2579 extern kmp_bootstrap_lock_t __kmp_monitor_lock;
2580 extern kmp_bootstrap_lock_t __kmp_tp_cached_lock;
2582 extern kmp_lock_t __kmp_global_lock;
2583 extern kmp_queuing_lock_t __kmp_dispatch_lock;
2584 extern kmp_lock_t __kmp_debug_lock;
2587 extern unsigned int __kmp_init_wait;
2588 extern unsigned int __kmp_next_wait;
2590 extern enum library_type __kmp_library;
2596 extern int __kmp_chunk;
2598 extern size_t __kmp_stksize;
2599 extern size_t __kmp_monitor_stksize;
2600 extern size_t __kmp_stkoffset;
2601 extern int __kmp_stkpadding;
2603 extern size_t __kmp_malloc_pool_incr;
2604 extern int __kmp_env_chunk;
2605 extern int __kmp_env_stksize;
2606 extern int __kmp_env_omp_stksize;
2607 extern int __kmp_env_all_threads;
2608 extern int __kmp_env_omp_all_threads;
2609 extern int __kmp_env_blocktime;
2610 extern int __kmp_env_checks;
2611 extern int __kmp_env_consistency_check;
2612 extern int __kmp_generate_warnings;
2613 extern int __kmp_reserve_warn;
2615 #ifdef DEBUG_SUSPEND
2616 extern int __kmp_suspend_count;
2619 extern kmp_uint32 __kmp_yield_init;
2620 extern kmp_uint32 __kmp_yield_next;
2621 extern kmp_uint32 __kmp_yielding_on;
2622 extern kmp_uint32 __kmp_yield_cycle;
2623 extern kmp_int32 __kmp_yield_on_count;
2624 extern kmp_int32 __kmp_yield_off_count;
2628 extern int __kmp_allThreadsSpecified;
2630 extern size_t __kmp_align_alloc;
2632 extern int __kmp_xproc;
2633 extern int __kmp_avail_proc;
2634 extern size_t __kmp_sys_min_stksize;
2635 extern int __kmp_sys_max_nth;
2636 extern int __kmp_max_nth;
2637 extern int __kmp_threads_capacity;
2638 extern int __kmp_dflt_team_nth;
2639 extern int __kmp_dflt_team_nth_ub;
2640 extern int __kmp_tp_capacity;
2641 extern int __kmp_tp_cached;
2642 extern int __kmp_dflt_nested;
2643 extern int __kmp_dflt_blocktime;
2644 extern int __kmp_monitor_wakeups;
2645 extern int __kmp_bt_intervals;
2646 #ifdef KMP_ADJUST_BLOCKTIME
2647 extern int __kmp_zero_bt;
2649 #ifdef KMP_DFLT_NTH_CORES
2650 extern int __kmp_ncores;
2652 extern int __kmp_abort_delay;
2654 extern int __kmp_need_register_atfork_specified;
2655 extern int __kmp_need_register_atfork;
2656 extern int __kmp_gtid_mode;
2662 extern int __kmp_adjust_gtid_mode;
2663 #ifdef KMP_TDATA_GTID
2665 extern __declspec(thread) int __kmp_gtid;
2667 extern __thread
int __kmp_gtid;
2670 extern int __kmp_tls_gtid_min;
2671 extern int __kmp_foreign_tp;
2672 #if KMP_ARCH_X86 || KMP_ARCH_X86_64
2673 extern int __kmp_inherit_fp_control;
2674 extern kmp_int16 __kmp_init_x87_fpu_control_word;
2675 extern kmp_uint32 __kmp_init_mxcsr;
2678 extern int __kmp_dflt_max_active_levels;
2679 #if KMP_NESTED_HOT_TEAMS
2680 extern int __kmp_hot_teams_mode;
2681 extern int __kmp_hot_teams_max_level;
2685 extern enum clock_function_type __kmp_clock_function;
2686 extern int __kmp_clock_function_param;
2689 #if KMP_ARCH_X86_64 && (KMP_OS_LINUX || KMP_OS_WINDOWS)
2690 extern enum mic_type __kmp_mic_type;
2693 # ifdef USE_LOAD_BALANCE
2694 extern double __kmp_load_balance_interval;
2698 typedef struct kmp_nested_nthreads_t {
2702 } kmp_nested_nthreads_t;
2704 extern kmp_nested_nthreads_t __kmp_nested_nth;
2706 #if KMP_USE_ADAPTIVE_LOCKS
2709 struct kmp_adaptive_backoff_params_t {
2711 kmp_uint32 max_soft_retries;
2713 kmp_uint32 max_badness;
2716 extern kmp_adaptive_backoff_params_t __kmp_adaptive_backoff_params;
2718 #if KMP_DEBUG_ADAPTIVE_LOCKS
2719 extern char * __kmp_speculative_statsfile;
2722 #endif // KMP_USE_ADAPTIVE_LOCKS
2725 extern int __kmp_display_env;
2726 extern int __kmp_display_env_verbose;
2727 extern int __kmp_omp_cancellation;
2736 extern kmp_info_t **__kmp_threads;
2738 extern volatile kmp_team_t * __kmp_team_pool;
2739 extern volatile kmp_info_t * __kmp_thread_pool;
2742 extern volatile int __kmp_nth;
2745 extern volatile int __kmp_all_nth;
2746 extern int __kmp_thread_pool_nth;
2747 extern volatile int __kmp_thread_pool_active_nth;
2749 extern kmp_root_t **__kmp_root;
2753 extern kmp_global_t __kmp_global;
2755 extern kmp_info_t __kmp_monitor;
2756 extern volatile kmp_uint32 __kmp_team_counter;
2757 extern volatile kmp_uint32 __kmp_task_counter;
2761 #define _KMP_GEN_ID( counter ) \
2765 KMP_TEST_THEN_INC32( (volatile kmp_int32 *) & counter ) + 1 \
2770 #define _KMP_GEN_ID( counter ) \
/*
 * Id generators: each applies _KMP_GEN_ID to the matching global counter
 * (__kmp_task_counter for tasks, __kmp_team_counter for teams).
 */
2776 #define KMP_GEN_TASK_ID() _KMP_GEN_ID( __kmp_task_counter )
2777 #define KMP_GEN_TEAM_ID() _KMP_GEN_ID( __kmp_team_counter )
2782 extern void __kmp_print_storage_map_gtid(
int gtid,
void *p1,
void* p2,
size_t size,
char const *format, ... );
/* Staged runtime initialisation (serial, middle, parallel). */
extern void __kmp_serial_initialize( void );
extern void __kmp_middle_initialize( void );
extern void __kmp_parallel_initialize( void );

/* Runtime begin/end hooks; the *_library and *_thread variants take a global thread id. */
extern void __kmp_internal_begin( void );
extern void __kmp_internal_end_library( int gtid );
extern void __kmp_internal_end_thread( int gtid );
extern void __kmp_internal_end_atexit( void );
extern void __kmp_internal_end_fini( void );
extern void __kmp_internal_end_dtor( void );
extern void __kmp_internal_end_dest( void* );

/* Root registration: register returns an int, unregister takes a global thread id. */
extern int  __kmp_register_root( int initial_thread );
extern void __kmp_unregister_root( int gtid );

/* Queries returning an int; no arguments. */
extern int  __kmp_ignore_mppbeg( void );
extern int  __kmp_ignore_mppend( void );
2802 extern int __kmp_enter_single(
int gtid,
ident_t *id_ref,
int push_ws );
2803 extern void __kmp_exit_single(
int gtid );
2805 extern void __kmp_parallel_deo(
int *gtid_ref,
int *cid_ref,
ident_t *loc_ref );
2806 extern void __kmp_parallel_dxo(
int *gtid_ref,
int *cid_ref,
ident_t *loc_ref );
2809 #ifdef USE_LOAD_BALANCE
2810 extern int __kmp_get_load_balance(
int );
2814 extern void __kmp_tv_threadprivate_store( kmp_info_t *th,
void *global_addr,
void *thread_addr );
2817 extern int __kmp_get_global_thread_id(
void );
2818 extern int __kmp_get_global_thread_id_reg(
void );
2819 extern void __kmp_exit_thread(
int exit_status );
2820 extern void __kmp_abort(
char const * format, ... );
2821 extern void __kmp_abort_thread(
void );
2822 extern void __kmp_abort_process(
void );
2823 extern void __kmp_warn(
char const * format, ... );
2825 extern void __kmp_set_num_threads(
int new_nth,
int gtid );
2828 static inline kmp_info_t * __kmp_entry_thread()
2830 int gtid = __kmp_entry_gtid();
2832 return __kmp_threads[gtid];
2835 extern void __kmp_set_max_active_levels(
int gtid,
int new_max_active_levels );
2836 extern int __kmp_get_max_active_levels(
int gtid );
2837 extern int __kmp_get_ancestor_thread_num(
int gtid,
int level );
2838 extern int __kmp_get_team_size(
int gtid,
int level );
2839 extern void __kmp_set_schedule(
int gtid, kmp_sched_t new_sched,
int chunk );
2840 extern void __kmp_get_schedule(
int gtid, kmp_sched_t * sched,
int * chunk );
2842 extern unsigned short __kmp_get_random( kmp_info_t * thread );
2843 extern void __kmp_init_random( kmp_info_t * thread );
2845 extern kmp_r_sched_t __kmp_get_schedule_global(
void );
2846 extern void __kmp_adjust_num_threads(
int new_nproc );
2848 extern void * ___kmp_allocate(
size_t size KMP_SRC_LOC_DECL );
2849 extern void * ___kmp_page_allocate(
size_t size KMP_SRC_LOC_DECL );
2850 extern void ___kmp_free(
void * ptr KMP_SRC_LOC_DECL );
/*
 * Convenience wrappers over ___kmp_allocate / ___kmp_page_allocate /
 * ___kmp_free.  Each forwards its single argument and appends
 * KMP_SRC_LOC_CURR, which fills the trailing KMP_SRC_LOC_DECL parameter of
 * the underlying function.
 */
#define __kmp_allocate(nbytes)      ___kmp_allocate((nbytes) KMP_SRC_LOC_CURR)
#define __kmp_page_allocate(nbytes) ___kmp_page_allocate((nbytes) KMP_SRC_LOC_CURR)
#define __kmp_free(mem)             ___kmp_free((mem) KMP_SRC_LOC_CURR)
2856 extern void * ___kmp_fast_allocate( kmp_info_t *this_thr,
size_t size KMP_SRC_LOC_DECL );
2857 extern void ___kmp_fast_free( kmp_info_t *this_thr,
void *ptr KMP_SRC_LOC_DECL );
2858 extern void __kmp_free_fast_memory( kmp_info_t *this_thr );
2859 extern void __kmp_initialize_fast_memory( kmp_info_t *this_thr );
/*
 * Wrappers over ___kmp_fast_allocate / ___kmp_fast_free: forward the thread
 * and the size/pointer, appending KMP_SRC_LOC_CURR for the trailing
 * KMP_SRC_LOC_DECL parameter.
 */
#define __kmp_fast_allocate(thr, nbytes) \
    ___kmp_fast_allocate((thr), (nbytes) KMP_SRC_LOC_CURR)
#define __kmp_fast_free(thr, mem) \
    ___kmp_fast_free((thr), (mem) KMP_SRC_LOC_CURR)
2864 extern void * ___kmp_thread_malloc( kmp_info_t *th,
size_t size KMP_SRC_LOC_DECL );
2865 extern void * ___kmp_thread_calloc( kmp_info_t *th,
size_t nelem,
size_t elsize KMP_SRC_LOC_DECL );
2866 extern void * ___kmp_thread_realloc( kmp_info_t *th,
void *ptr,
size_t size KMP_SRC_LOC_DECL );
2867 extern void ___kmp_thread_free( kmp_info_t *th,
void *ptr KMP_SRC_LOC_DECL );
/*
 * Wrappers over the ___kmp_thread_{malloc,calloc,realloc,free} functions.
 * Arguments are forwarded in order; KMP_SRC_LOC_CURR is appended to supply
 * the trailing KMP_SRC_LOC_DECL parameter.
 */
#define __kmp_thread_malloc(thr, nbytes) \
    ___kmp_thread_malloc((thr), (nbytes) KMP_SRC_LOC_CURR)
#define __kmp_thread_calloc(thr, count, each) \
    ___kmp_thread_calloc((thr), (count), (each) KMP_SRC_LOC_CURR)
#define __kmp_thread_realloc(thr, mem, nbytes) \
    ___kmp_thread_realloc((thr), (mem), (nbytes) KMP_SRC_LOC_CURR)
#define __kmp_thread_free(thr, mem) \
    ___kmp_thread_free((thr), (mem) KMP_SRC_LOC_CURR)
/* Thin aliases for the C library allocator (malloc / free / realloc / calloc). */
#define KMP_INTERNAL_MALLOC(nbytes)       malloc((nbytes))
#define KMP_INTERNAL_FREE(mem)            free((mem))
#define KMP_INTERNAL_REALLOC(mem, nbytes) realloc((mem), (nbytes))
#define KMP_INTERNAL_CALLOC(count, each)  calloc((count), (each))
2878 extern void __kmp_push_num_threads(
ident_t *loc,
int gtid,
int num_threads );
2881 extern void __kmp_push_proc_bind(
ident_t *loc,
int gtid, kmp_proc_bind_t proc_bind );
2882 extern void __kmp_push_num_teams(
ident_t *loc,
int gtid,
int num_teams,
int num_threads );
2885 extern void __kmp_yield(
int cond );
2888 enum sched_type schedule, kmp_int32 lb, kmp_int32 ub, kmp_int32 st,
2891 enum sched_type schedule, kmp_uint32 lb, kmp_uint32 ub, kmp_int32 st,
2894 enum sched_type schedule, kmp_int64 lb, kmp_int64 ub, kmp_int64 st,
2897 enum sched_type schedule, kmp_uint64 lb, kmp_uint64 ub, kmp_int64 st,
2901 kmp_int32 *p_last, kmp_int32 *p_lb, kmp_int32 *p_ub, kmp_int32 *p_st );
2903 kmp_int32 *p_last, kmp_uint32 *p_lb, kmp_uint32 *p_ub, kmp_int32 *p_st );
2905 kmp_int32 *p_last, kmp_int64 *p_lb, kmp_int64 *p_ub, kmp_int64 *p_st );
2907 kmp_int32 *p_last, kmp_uint64 *p_lb, kmp_uint64 *p_ub, kmp_int64 *p_st );
2915 #ifdef KMP_GOMP_COMPAT
2917 extern void __kmp_aux_dispatch_init_4(
ident_t *loc, kmp_int32 gtid,
2918 enum sched_type schedule, kmp_int32 lb, kmp_int32 ub, kmp_int32 st,
2919 kmp_int32 chunk,
int push_ws );
2920 extern void __kmp_aux_dispatch_init_4u(
ident_t *loc, kmp_int32 gtid,
2921 enum sched_type schedule, kmp_uint32 lb, kmp_uint32 ub, kmp_int32 st,
2922 kmp_int32 chunk,
int push_ws );
2923 extern void __kmp_aux_dispatch_init_8(
ident_t *loc, kmp_int32 gtid,
2924 enum sched_type schedule, kmp_int64 lb, kmp_int64 ub, kmp_int64 st,
2925 kmp_int64 chunk,
int push_ws );
2926 extern void __kmp_aux_dispatch_init_8u(
ident_t *loc, kmp_int32 gtid,
2927 enum sched_type schedule, kmp_uint64 lb, kmp_uint64 ub, kmp_int64 st,
2928 kmp_int64 chunk,
int push_ws );
2929 extern void __kmp_aux_dispatch_fini_chunk_4(
ident_t *loc, kmp_int32 gtid );
2930 extern void __kmp_aux_dispatch_fini_chunk_8(
ident_t *loc, kmp_int32 gtid );
2931 extern void __kmp_aux_dispatch_fini_chunk_4u(
ident_t *loc, kmp_int32 gtid );
2932 extern void __kmp_aux_dispatch_fini_chunk_8u(
ident_t *loc, kmp_int32 gtid );
/*
 * Comparison predicates over 32-bit operands.  Each takes (value, checker)
 * and returns a kmp_uint32; the signature matches the `pred` callback
 * parameter of __kmp_wait_yield_4.
 * NOTE(review): the relation tested (eq/neq/lt/ge/le) is taken from the name;
 * the operand order of the comparison is not visible here.
 */
2937 extern kmp_uint32 __kmp_eq_4( kmp_uint32 value, kmp_uint32 checker );
2938 extern kmp_uint32 __kmp_neq_4( kmp_uint32 value, kmp_uint32 checker );
2939 extern kmp_uint32 __kmp_lt_4( kmp_uint32 value, kmp_uint32 checker );
2940 extern kmp_uint32 __kmp_ge_4( kmp_uint32 value, kmp_uint32 checker );
2941 extern kmp_uint32 __kmp_le_4( kmp_uint32 value, kmp_uint32 checker );
/*
 * 64-bit counterparts: same shape with kmp_uint64 operands, still returning
 * kmp_uint32; the signature matches the `pred` parameter of __kmp_wait_yield_8.
 */
2943 extern kmp_uint32 __kmp_eq_8( kmp_uint64 value, kmp_uint64 checker );
2944 extern kmp_uint32 __kmp_neq_8( kmp_uint64 value, kmp_uint64 checker );
2945 extern kmp_uint32 __kmp_lt_8( kmp_uint64 value, kmp_uint64 checker );
2946 extern kmp_uint32 __kmp_ge_8( kmp_uint64 value, kmp_uint64 checker );
2947 extern kmp_uint32 __kmp_le_8( kmp_uint64 value, kmp_uint64 checker );
2949 extern kmp_uint32 __kmp_wait_yield_4( kmp_uint32
volatile * spinner, kmp_uint32 checker, kmp_uint32 (*pred) (kmp_uint32, kmp_uint32),
void * obj );
2950 extern kmp_uint64 __kmp_wait_yield_8( kmp_uint64
volatile * spinner, kmp_uint64 checker, kmp_uint32 (*pred) (kmp_uint64, kmp_uint64),
void * obj );
2954 class kmp_flag_oncore;
2955 extern void __kmp_wait_32(kmp_info_t *this_thr, kmp_flag_32 *flag,
int final_spin
2957 ,
void * itt_sync_obj
2960 extern void __kmp_release_32(kmp_flag_32 *flag);
2961 extern void __kmp_wait_64(kmp_info_t *this_thr, kmp_flag_64 *flag,
int final_spin
2963 ,
void * itt_sync_obj
2966 extern void __kmp_release_64(kmp_flag_64 *flag);
2967 extern void __kmp_wait_oncore(kmp_info_t *this_thr, kmp_flag_oncore *flag,
int final_spin
2969 ,
void * itt_sync_obj
2972 extern void __kmp_release_oncore(kmp_flag_oncore *flag);
2974 extern void __kmp_infinite_loop(
void );
2976 extern void __kmp_cleanup(
void );
2978 #if KMP_HANDLE_SIGNALS
2979 extern int __kmp_handle_signals;
2980 extern void __kmp_install_signals(
int parallel_init );
2981 extern void __kmp_remove_signals(
void );
2984 extern void __kmp_clear_system_time(
void );
2985 extern void __kmp_read_system_time(
double *delta );
2987 extern void __kmp_check_stack_overlap( kmp_info_t *thr );
2989 extern void __kmp_expand_host_name(
char *buffer,
size_t size );
2990 extern void __kmp_expand_file_name(
char *result,
size_t rlen,
char *pattern );
2993 extern void __kmp_initialize_system_tick(
void );
2996 extern void __kmp_runtime_initialize(
void );
2997 extern void __kmp_runtime_destroy(
void );
2999 #if KMP_AFFINITY_SUPPORTED
3000 extern char *__kmp_affinity_print_mask(
char *buf,
int buf_len, kmp_affin_mask_t *mask);
3001 extern void __kmp_affinity_initialize(
void);
3002 extern void __kmp_affinity_uninitialize(
void);
3003 extern void __kmp_affinity_set_init_mask(
int gtid,
int isa_root);
3005 extern void __kmp_affinity_set_place(
int gtid);
3007 extern void __kmp_affinity_determine_capable(
const char *env_var );
3008 extern int __kmp_aux_set_affinity(
void **mask);
3009 extern int __kmp_aux_get_affinity(
void **mask);
3010 extern int __kmp_aux_set_affinity_mask_proc(
int proc,
void **mask);
3011 extern int __kmp_aux_unset_affinity_mask_proc(
int proc,
void **mask);
3012 extern int __kmp_aux_get_affinity_mask_proc(
int proc,
void **mask);
3013 extern void __kmp_balanced_affinity(
int tid,
int team_size );
3016 extern void __kmp_cleanup_hierarchy();
3017 extern void __kmp_get_hierarchy(kmp_uint32 nproc, kmp_bstate_t *thr_bar);
3019 #if KMP_OS_LINUX && (KMP_ARCH_X86 || KMP_ARCH_X86_64 || KMP_ARCH_ARM || KMP_ARCH_AARCH64)
3021 extern int __kmp_futex_determine_capable(
void );
3023 #endif // KMP_OS_LINUX && (KMP_ARCH_X86 || KMP_ARCH_X86_64 || KMP_ARCH_ARM || KMP_ARCH_AARCH64)
3025 extern void __kmp_gtid_set_specific(
int gtid );
3026 extern int __kmp_gtid_get_specific(
void );
3028 extern double __kmp_read_cpu_time(
void );
3030 extern int __kmp_read_system_info(
struct kmp_sys_info *info );
3032 extern void __kmp_create_monitor( kmp_info_t *th );
3034 extern void *__kmp_launch_thread( kmp_info_t *thr );
3036 extern void __kmp_create_worker(
int gtid, kmp_info_t *th,
size_t stack_size );
3039 extern int __kmp_still_running(kmp_info_t *th);
3040 extern int __kmp_is_thread_alive( kmp_info_t * th, DWORD *exit_val );
3041 extern void __kmp_free_handle( kmp_thread_t tHandle );
3044 extern void __kmp_reap_monitor( kmp_info_t *th );
3045 extern void __kmp_reap_worker( kmp_info_t *th );
3046 extern void __kmp_terminate_thread(
int gtid );
3048 extern void __kmp_suspend_32(
int th_gtid, kmp_flag_32 *flag );
3049 extern void __kmp_suspend_64(
int th_gtid, kmp_flag_64 *flag );
3050 extern void __kmp_suspend_oncore(
int th_gtid, kmp_flag_oncore *flag );
3051 extern void __kmp_resume_32(
int target_gtid, kmp_flag_32 *flag );
3052 extern void __kmp_resume_64(
int target_gtid, kmp_flag_64 *flag );
3053 extern void __kmp_resume_oncore(
int target_gtid, kmp_flag_oncore *flag );
3055 extern void __kmp_elapsed(
double * );
3056 extern void __kmp_elapsed_tick(
double * );
3058 extern void __kmp_enable(
int old_state );
3059 extern void __kmp_disable(
int *old_state );
3061 extern void __kmp_thread_sleep(
int millis );
3063 extern void __kmp_common_initialize(
void );
3064 extern void __kmp_common_destroy(
void );
3065 extern void __kmp_common_destroy_gtid(
int gtid );
3068 extern void __kmp_register_atfork(
void );
3070 extern void __kmp_suspend_initialize(
void );
3071 extern void __kmp_suspend_uninitialize_thread( kmp_info_t *th );
3073 extern kmp_info_t * __kmp_allocate_thread( kmp_root_t *root,
3074 kmp_team_t *team,
int tid);
3076 extern kmp_team_t * __kmp_allocate_team( kmp_root_t *root,
int new_nproc,
int max_nproc,
3078 ompt_parallel_id_t ompt_parallel_id,
3080 kmp_proc_bind_t proc_bind,
3081 kmp_internal_control_t *new_icvs,
3082 int argc USE_NESTED_HOT_ARG(kmp_info_t *thr) );
3084 extern kmp_team_t * __kmp_allocate_team( kmp_root_t *root,
int new_nproc,
int max_nproc,
3086 ompt_parallel_id_t ompt_parallel_id,
3088 kmp_internal_control_t *new_icvs,
3089 int argc USE_NESTED_HOT_ARG(kmp_info_t *thr) );
3090 #endif // OMP_40_ENABLED
3091 extern void __kmp_free_thread( kmp_info_t * );
3092 extern void __kmp_free_team( kmp_root_t *, kmp_team_t * USE_NESTED_HOT_ARG(kmp_info_t *) );
3093 extern kmp_team_t * __kmp_reap_team( kmp_team_t * );
3097 extern void __kmp_initialize_bget( kmp_info_t *th );
3098 extern void __kmp_finalize_bget( kmp_info_t *th );
3100 KMP_EXPORT
void *kmpc_malloc(
size_t size );
3101 KMP_EXPORT
void *kmpc_calloc(
size_t nelem,
size_t elsize );
3102 KMP_EXPORT
void *kmpc_realloc(
void *ptr,
size_t size );
3103 KMP_EXPORT
void kmpc_free(
void *ptr );
3108 extern int __kmp_barrier(
enum barrier_type bt,
int gtid,
int is_split,
3109 size_t reduce_size,
void *reduce_data,
void (*reduce)(
void *,
void *) );
3110 extern void __kmp_end_split_barrier (
enum barrier_type bt,
int gtid );
3121 extern int __kmp_fork_call(
ident_t *loc,
int gtid,
enum fork_context_e fork_context,
3124 void *unwrapped_task,
3126 microtask_t microtask, launch_t invoker,
3128 #
if (KMP_ARCH_ARM || KMP_ARCH_X86_64 || KMP_ARCH_AARCH64) && KMP_OS_LINUX
3135 extern void __kmp_join_call(
ident_t *loc,
int gtid
3137 ,
int exit_teams = 0
3141 extern void __kmp_serialized_parallel(
ident_t *
id, kmp_int32 gtid);
3142 extern void __kmp_internal_fork(
ident_t *
id,
int gtid, kmp_team_t *team );
3143 extern void __kmp_internal_join(
ident_t *
id,
int gtid, kmp_team_t *team );
3144 extern int __kmp_invoke_task_func(
int gtid );
3145 extern void __kmp_run_before_invoked_task(
int gtid,
int tid, kmp_info_t *this_thr, kmp_team_t *team );
3146 extern void __kmp_run_after_invoked_task(
int gtid,
int tid, kmp_info_t *this_thr, kmp_team_t *team );
3149 KMP_EXPORT
int __kmpc_invoke_task_func(
int gtid );
3151 extern int __kmp_invoke_teams_master(
int gtid );
3152 extern void __kmp_teams_master(
int gtid );
3154 extern void __kmp_save_internal_controls( kmp_info_t * thread );
3155 extern void __kmp_user_set_library (
enum library_type arg);
3156 extern void __kmp_aux_set_library (
enum library_type arg);
3157 extern void __kmp_aux_set_stacksize(
size_t arg);
3158 extern void __kmp_aux_set_blocktime (
int arg, kmp_info_t *thread,
int tid);
3159 extern void __kmp_aux_set_defaults(
char const * str,
int len );
3162 void kmpc_set_blocktime (
int arg);
3163 void ompc_set_nested(
int flag );
3164 void ompc_set_dynamic(
int flag );
3165 void ompc_set_num_threads(
int arg );
// Prototypes named after current-task bookkeeping, task allocation and
// implicit-task initialisation. All are `extern`.
// NOTE(review): the bare integers embedded in these lines (3167, 3168, ...)
// are not valid C/C++ tokens in those positions; they look like line numbers
// carried over from a source listing -- confirm and strip before compiling.
// Returns void; takes the thread's kmp_info_t, a kmp_team_t and an int tid.
3167 extern void __kmp_push_current_task_to_thread( kmp_info_t *this_thr,
3168 kmp_team_t *team,
int tid );
// Returns void; takes only the thread's kmp_info_t.
3169 extern void __kmp_pop_current_task_from_thread( kmp_info_t *this_thr );
// Returns a kmp_task_t pointer. Takes two separate size_t sizes
// (sizeof_kmp_task_t, sizeof_shareds), a flags pointer and a
// kmp_routine_entry_t.
3170 extern kmp_task_t* __kmp_task_alloc(
ident_t *loc_ref, kmp_int32 gtid,
3171 kmp_tasking_flags_t *flags,
size_t sizeof_kmp_task_t,
size_t sizeof_shareds,
3172 kmp_routine_entry_t task_entry );
// Returns void; takes a kmp_taskdata_t pointer and an int tid.
// NOTE(review): the listing numbers jump from 3172 to 3174 to 3176 around this
// declaration, so adjacent lines (possibly preprocessor guards) may have been
// dropped -- check against the full header.
3174 extern void __kmp_task_init_ompt( kmp_taskdata_t * task,
int tid );
// Returns void; the last parameter, set_curr_task, is a plain int.
3176 extern void __kmp_init_implicit_task(
ident_t *loc_ref, kmp_info_t *this_thr,
3177 kmp_team_t *team,
int tid,
int set_curr_task );
// Three prototypes that are identical apart from the type of `flag`
// (kmp_flag_32 *, kmp_flag_64 *, kmp_flag_oncore *). Each returns int and is
// declared without `extern` or KMP_EXPORT. `thread_finished` is an int
// pointer; `itt_sync_obj` is an untyped (void *) pointer.
// NOTE(review): the bare integers embedded in these lines (3178, 3179, ...)
// are not valid C/C++ tokens in those positions; they look like line numbers
// carried over from a source listing. The numbering skips around itt_sync_obj
// (3179 -> 3181 -> 3183), so lines -- possibly preprocessor guards -- may have
// been dropped there; check against the full header.
3178 int __kmp_execute_tasks_32(kmp_info_t *thread, kmp_int32 gtid, kmp_flag_32 *flag,
int final_spin,
3179 int *thread_finished,
3181 void * itt_sync_obj,
3183 kmp_int32 is_constrained);
// 64-bit flag variant.
3184 int __kmp_execute_tasks_64(kmp_info_t *thread, kmp_int32 gtid, kmp_flag_64 *flag,
int final_spin,
3185 int *thread_finished,
3187 void * itt_sync_obj,
3189 kmp_int32 is_constrained);
// kmp_flag_oncore variant.
3190 int __kmp_execute_tasks_oncore(kmp_info_t *thread, kmp_int32 gtid, kmp_flag_oncore *flag,
int final_spin,
3191 int *thread_finished,
3193 void * itt_sync_obj,
3195 kmp_int32 is_constrained);
// Task-team prototypes; all are `extern` and return void.
// NOTE(review): the bare integer that opens each declaration (3197, 3198, ...)
// is not a valid C/C++ token in that position; it looks like a line number
// carried over from a source listing -- confirm and strip before compiling.
// Takes no arguments.
3197 extern void __kmp_reap_task_teams(
void );
// Takes the task team and a thread's kmp_info_t.
3198 extern void __kmp_unref_task_team( kmp_task_team_t *task_team, kmp_info_t *thread );
// Takes no arguments.
3199 extern void __kmp_wait_to_unref_task_teams(
void );
// `both` and `always` are plain ints; their accepted values are not visible
// in this excerpt.
3200 extern void __kmp_task_team_setup ( kmp_info_t *this_thr, kmp_team_t *team,
int both,
int always );
// Takes the thread's kmp_info_t and a kmp_team_t.
3201 extern void __kmp_task_team_sync ( kmp_info_t *this_thr, kmp_team_t *team );
3202 extern void __kmp_task_team_wait ( kmp_info_t *this_thr, kmp_team_t *team
3204 ,
void * itt_sync_obj
// Miscellaneous `extern` prototypes.
// NOTE(review): the bare integer that opens each declaration (3207, 3209, ...)
// is not a valid C/C++ token in that position; it looks like a line number
// carried over from a source listing -- confirm and strip before compiling.
// Returns void; takes a kmp_team_t, a thread's kmp_info_t and an int gtid.
3207 extern void __kmp_tasking_barrier( kmp_team_t *team, kmp_info_t *thread,
int gtid );
// Returns int for a given untyped address.
3209 extern int __kmp_is_address_mapped(
void *addr );
// Returns a kmp_uint64; takes no arguments.
3210 extern kmp_uint64 __kmp_hardware_timestamp(
void);
// Variadic: a path, a format string, then `...`. Returns int.
// NOTE(review): the path/format/... shape suggests scanf-style parsing, but
// the format conventions and the meaning of the result are not visible here.
3213 extern int __kmp_read_from_file(
char const *path,
char const *format, ... );
3221 #if KMP_ARCH_X86 || KMP_ARCH_X86_64
// CPUID, MXCSR and x87 control/status-word helpers. These lines follow an
// `#if KMP_ARCH_X86 || KMP_ARCH_X86_64` line; its matching #endif is not
// visible in this excerpt.
// NOTE(review): the bare integer that opens each line (3223, 3225, ...) is not
// a valid C/C++ token in that position; it looks like a line number carried
// over from a source listing -- confirm and strip before compiling.
// Returns void; takes a kmp_cpuinfo_t pointer.
3223 extern void __kmp_query_cpuid( kmp_cpuinfo_t *p );
// Macro: dereferences p and passes the value to _mm_setcsr().
3225 #define __kmp_load_mxcsr(p) _mm_setcsr(*(p))
// Stores the value returned by _mm_getcsr() into *p.
3226 static inline void __kmp_store_mxcsr( kmp_uint32 *p ) { *p = _mm_getcsr(); }
// Load/store pair for the x87 control word; both take a kmp_int16 pointer.
3228 extern void __kmp_load_x87_fpu_control_word( kmp_int16 *p );
3229 extern void __kmp_store_x87_fpu_control_word( kmp_int16 *p );
// Empty parameter list: "no parameters" in C++, "unspecified parameters" in
// pre-C23 C.
3230 extern void __kmp_clear_x87_fpu_status_word();
// 0xffffffc0 has every bit of a 32-bit value set except the low six.
3231 # define KMP_X86_MXCSR_MASK 0xffffffc0
3235 extern int __kmp_invoke_microtask( microtask_t pkfn,
int gtid,
int npr,
int argc,
void *argv[]
3237 ,
void **exit_frame_ptr
// NOTE(review): the bare integers embedded in these lines (3250, 3280, ...)
// are not valid C/C++ tokens in those positions; they look like line numbers
// carried over from a source listing -- confirm and strip before compiling.
// Exported; returns an untyped pointer. Takes an unnamed ident_t pointer, the
// caller's global_tid, a data pointer and a size.
3250 KMP_EXPORT
void * __kmpc_threadprivate (
ident_t *, kmp_int32 global_tid,
void * data,
size_t size );
// Exported; returns void. plastiter, plower, pupper and pstride are pointers,
// while incr and chunk are passed by value.
// NOTE(review): the upper-case name is presumably a macro that expands to the
// real entry-point name -- its definition is not visible here; confirm.
3280 KMP_EXPORT
void KMPC_FOR_STATIC_INIT (
ident_t *loc, kmp_int32 global_tid, kmp_int32 schedtype, kmp_int32 *plastiter,
3281 kmp_int *plower, kmp_int *pupper, kmp_int *pstride, kmp_int incr, kmp_int chunk );
// Exported; returns void. cpy_func is a pointer to a function taking two
// void * arguments and returning void; didit is a kmp_int32.
3285 KMP_EXPORT
void __kmpc_copyprivate(
ident_t *loc, kmp_int32 global_tid,
size_t cpy_size,
void *cpy_data,
void(*cpy_func)(
void*,
void*), kmp_int32 didit );
// Three `extern` prototypes, each taking one int and returning void.
// NOTE(review): upper-case names -- presumably macros as well; confirm.
3287 extern void KMPC_SET_NUM_THREADS (
int arg );
3288 extern void KMPC_SET_DYNAMIC (
int flag );
3289 extern void KMPC_SET_NESTED (
int flag );
// Exported taskq entry points. Every one starts with (ident_t *loc,
// kmp_int32 global_tid, ...).
// NOTE(review): the bare integers embedded in these lines (3297, 3298, ...)
// are not valid C/C++ tokens in those positions; they look like line numbers
// carried over from a source listing -- confirm and strip before compiling.
// Returns a kmpc_thunk_t pointer; `shareds` is a pointer to a
// kmpc_shared_vars_t pointer.
3297 KMP_EXPORT kmpc_thunk_t * __kmpc_taskq (
ident_t *loc, kmp_int32 global_tid, kmpc_task_t taskq_task,
size_t sizeof_thunk,
3298 size_t sizeof_shareds, kmp_int32 flags, kmpc_shared_vars_t **shareds);
// Returns void; takes a thunk pointer.
3299 KMP_EXPORT
void __kmpc_end_taskq (
ident_t *loc, kmp_int32 global_tid, kmpc_thunk_t *thunk);
// Returns kmp_int32; takes a thunk pointer.
3300 KMP_EXPORT kmp_int32 __kmpc_task (
ident_t *loc, kmp_int32 global_tid, kmpc_thunk_t *thunk);
// Returns void; takes a thunk pointer plus a kmp_int32 status.
3301 KMP_EXPORT
void __kmpc_taskq_task (
ident_t *loc, kmp_int32 global_tid, kmpc_thunk_t *thunk, kmp_int32 status);
// Returns void; takes a thunk pointer.
3302 KMP_EXPORT
void __kmpc_end_taskq_task (
ident_t *loc, kmp_int32 global_tid, kmpc_thunk_t *thunk);
// Returns a kmpc_thunk_t pointer; takes a taskq thunk and a kmpc_task_t.
3303 KMP_EXPORT kmpc_thunk_t * __kmpc_task_buffer (
ident_t *loc, kmp_int32 global_tid, kmpc_thunk_t *taskq_thunk, kmpc_task_t task);
// NOTE(review): the bare integers embedded in these lines (3311, 3312, ...)
// are not valid C/C++ tokens in those positions; they look like line numbers
// carried over from a source listing -- confirm and strip before compiling.
// Exported; returns kmp_int32. Takes a kmp_task_t pointer named new_task.
3311 KMP_EXPORT kmp_int32
3312 __kmpc_omp_task(
ident_t *loc_ref, kmp_int32 gtid, kmp_task_t * new_task );
// Exported; returns a kmp_task_t pointer. `flags` is passed by value as a
// kmp_int32, followed by two size_t sizes and a kmp_routine_entry_t.
3313 KMP_EXPORT kmp_task_t*
3314 __kmpc_omp_task_alloc(
ident_t *loc_ref, kmp_int32 gtid, kmp_int32 flags,
3315 size_t sizeof_kmp_task_t,
size_t sizeof_shareds,
3316 kmp_routine_entry_t task_entry );
3318 __kmpc_omp_task_begin_if0(
ident_t *loc_ref, kmp_int32 gtid, kmp_task_t * task );
3320 __kmpc_omp_task_complete_if0(
ident_t *loc_ref, kmp_int32 gtid, kmp_task_t *task );
// NOTE(review): the bare integers embedded in these lines (3321, 3322, ...)
// are not valid C/C++ tokens in those positions; they look like line numbers
// carried over from a source listing -- confirm and strip before compiling.
// The three exported prototypes below all return kmp_int32.
// Takes a kmp_task_t pointer named new_task.
3321 KMP_EXPORT kmp_int32
3322 __kmpc_omp_task_parts(
ident_t *loc_ref, kmp_int32 gtid, kmp_task_t * new_task );
// Takes only loc_ref and gtid.
3323 KMP_EXPORT kmp_int32
3324 __kmpc_omp_taskwait(
ident_t *loc_ref, kmp_int32 gtid );
// Takes loc_ref and gtid plus an int end_part.
3326 KMP_EXPORT kmp_int32
3327 __kmpc_omp_taskyield(
ident_t *loc_ref, kmp_int32 gtid,
int end_part );
// The two declarations below return void and carry neither `extern` nor
// KMP_EXPORT.
// NOTE(review): the #endif after them closes a TASK_UNUSED conditional whose
// opening #if is not visible in this excerpt, so they are presumably compiled
// only under that condition -- confirm against the full header.
3330 void __kmpc_omp_task_begin(
ident_t *loc_ref, kmp_int32 gtid, kmp_task_t * task );
3331 void __kmpc_omp_task_complete(
ident_t *loc_ref, kmp_int32 gtid, kmp_task_t *task );
3332 #endif // TASK_UNUSED
// Exported begin/end pair for taskgroup. Both return void and take
// (ident_t *loc, int gtid); here gtid is a plain int rather than kmp_int32.
// NOTE(review): the bare integer that opens each declaration (3338, 3339) is
// not a valid C/C++ token in that position; it looks like a line number
// carried over from a source listing -- confirm and strip before compiling.
3338 KMP_EXPORT
void __kmpc_taskgroup(
ident_t * loc,
int gtid );
3339 KMP_EXPORT
void __kmpc_end_taskgroup(
ident_t * loc,
int gtid );
3342 kmp_int32 ndeps, kmp_depend_info_t *dep_list,
3343 kmp_int32 ndeps_noalias, kmp_depend_info_t *noalias_dep_list );
3345 kmp_int32 ndeps_noalias, kmp_depend_info_t *noalias_dep_list );
// NOTE(review): the bare integer that opens each declaration (3346, 3348, ...)
// is not a valid C/C++ token in that position; it looks like a line number
// carried over from a source listing -- confirm and strip before compiling.
// Returns void; takes a gtid and a kmp_taskdata_t pointer.
3346 extern void __kmp_release_deps ( kmp_int32 gtid, kmp_taskdata_t *task );
// Returns kmp_int32. The `bool` parameter means this prototype needs C++ or
// <stdbool.h>.
3348 extern kmp_int32 __kmp_omp_task( kmp_int32 gtid, kmp_task_t * new_task,
bool serialize_immediate );
// Exported cancellation entry points. The first two take a kmp_int32
// cncl_kind and return kmp_int32.
3350 KMP_EXPORT kmp_int32 __kmpc_cancel(
ident_t* loc_ref, kmp_int32 gtid, kmp_int32 cncl_kind);
3351 KMP_EXPORT kmp_int32 __kmpc_cancellationpoint(
ident_t* loc_ref, kmp_int32 gtid, kmp_int32 cncl_kind);
// Returns kmp_int32; takes only loc_ref and gtid.
3352 KMP_EXPORT kmp_int32 __kmpc_cancel_barrier(
ident_t* loc_ref, kmp_int32 gtid);
// Returns int; takes a plain int cancel_kind and no ident_t or gtid.
3353 KMP_EXPORT
int __kmp_get_cancellation_status(
int cancel_kind);
// Exported proxy-task completion entry points; both return void. The first
// takes a gtid plus the task, the `_ooo` variant takes the task only.
3357 KMP_EXPORT
void __kmpc_proxy_task_completed( kmp_int32 gtid, kmp_task_t *ptask );
3358 KMP_EXPORT
void __kmpc_proxy_task_completed_ooo ( kmp_task_t *ptask );
// Exported lock entry points. All ten share the parameter list
// (ident_t *loc, kmp_int32 gtid, void **user_lock), and each operation has a
// plain and a `_nest_` variant. init/destroy/set/unset return void; the two
// test variants return int.
// NOTE(review): the bare integer that opens each declaration (3368, 3369, ...)
// is not a valid C/C++ token in that position; it looks like a line number
// carried over from a source listing -- confirm and strip before compiling.
// init
3368 KMP_EXPORT
void __kmpc_init_lock(
ident_t *loc, kmp_int32 gtid,
void **user_lock );
3369 KMP_EXPORT
void __kmpc_init_nest_lock(
ident_t *loc, kmp_int32 gtid,
void **user_lock );
// destroy
3370 KMP_EXPORT
void __kmpc_destroy_lock(
ident_t *loc, kmp_int32 gtid,
void **user_lock );
3371 KMP_EXPORT
void __kmpc_destroy_nest_lock(
ident_t *loc, kmp_int32 gtid,
void **user_lock );
// set
3372 KMP_EXPORT
void __kmpc_set_lock(
ident_t *loc, kmp_int32 gtid,
void **user_lock );
3373 KMP_EXPORT
void __kmpc_set_nest_lock(
ident_t *loc, kmp_int32 gtid,
void **user_lock );
// unset
3374 KMP_EXPORT
void __kmpc_unset_lock(
ident_t *loc, kmp_int32 gtid,
void **user_lock );
3375 KMP_EXPORT
void __kmpc_unset_nest_lock(
ident_t *loc, kmp_int32 gtid,
void **user_lock );
// test (the meaning of the int result is not visible in this excerpt)
3376 KMP_EXPORT
int __kmpc_test_lock(
ident_t *loc, kmp_int32 gtid,
void **user_lock );
3377 KMP_EXPORT
int __kmpc_test_nest_lock(
ident_t *loc, kmp_int32 gtid,
void **user_lock );
3386 kmp_int32 num_vars,
size_t reduce_size,
3387 void *reduce_data,
void (*reduce_func)(
void *lhs_data,
void *rhs_data),
3388 kmp_critical_name *lck );
3391 kmp_int32 num_vars,
size_t reduce_size,
3392 void *reduce_data,
void (*reduce_func)(
void *lhs_data,
void *rhs_data),
3393 kmp_critical_name *lck );
// NOTE(review): the bare integers embedded in these lines (3400, 3401, ...)
// are not valid C/C++ tokens in those positions; they look like line numbers
// carried over from a source listing -- confirm and strip before compiling.
// Returns a PACKED_REDUCTION_METHOD_T. reduce_func is a pointer to a function
// taking (void *lhs_data, void *rhs_data) and returning void; lck is a
// kmp_critical_name pointer.
3400 extern PACKED_REDUCTION_METHOD_T
3401 __kmp_determine_reduction_method(
ident_t *loc, kmp_int32 global_tid,
3402 kmp_int32 num_vars,
size_t reduce_size,
3403 void *reduce_data,
void (*reduce_func)(
void *lhs_data,
void *rhs_data),
3404 kmp_critical_name *lck );
// Exported; returns kmp_int32 and takes no arguments.
3407 KMP_EXPORT kmp_int32 __kmp_get_reduce_method(
void );
// Exported getters returning kmp_uint64. The empty parameter lists mean "no
// parameters" in C++ but "unspecified parameters" in pre-C23 C.
3409 KMP_EXPORT kmp_uint64 __kmpc_get_taskid();
3410 KMP_EXPORT kmp_uint64 __kmpc_get_parent_taskid();
// Exported prototypes; all return void.
// NOTE(review): the bare integer that opens each declaration (3413, 3422, ...)
// is not a valid C/C++ token in that position; it looks like a line number
// carried over from a source listing -- confirm and strip before compiling.
// Five unnamed int parameters; their meaning cannot be read off this
// prototype.
3413 KMP_EXPORT
void __kmpc_place_threads(
int,
int,
int,
int,
int);
// Takes only loc and global_tid.
3422 KMP_EXPORT
void __kmpc_pop_num_threads(
ident_t *loc, kmp_int32 global_tid );
// Takes loc and global_tid plus proc_bind, which is passed as a plain int.
3426 KMP_EXPORT
void __kmpc_push_proc_bind(
ident_t *loc, kmp_int32 global_tid,
int proc_bind );
3434 void * data,
size_t size,
void *** cache );
// `extern int` objects whose identifiers spell out a linking requirement.
// NOTE(review): presumably they exist so that a wrong link line fails with a
// readable unresolved/duplicate-symbol message -- confirm where they are
// defined. The #endif for the #if below is not visible in this excerpt.
// NOTE(review): the bare integer that opens each line (3437, 3438, ...) is not
// a valid C/C++ token in that position; it looks like a line number carried
// over from a source listing -- confirm and strip before compiling.
3437 extern int _You_must_link_with_exactly_one_OpenMP_library;
3438 extern int _You_must_link_with_Intel_OpenMP_library;
// Declared only when KMP_OS_WINDOWS is set and KMP_VERSION_MAJOR exceeds 4.
3439 #if KMP_OS_WINDOWS && ( KMP_VERSION_MAJOR > 4 )
3440 extern int _You_must_link_with_Microsoft_OpenMP_library;
3447 kmp_threadprivate_insert_private_data(
int gtid,
void *pc_addr,
void *data_addr,
size_t pc_size );
// Returns a `struct private_common` pointer. Takes a gtid, two untyped
// addresses (pc_addr, data_addr) and a size (pc_size). Declared without
// `extern` or KMP_EXPORT.
// NOTE(review): the bare integers that open the first two lines (3448, 3449)
// are not valid C/C++ tokens in those positions; they look like line numbers
// carried over from a source listing -- confirm and strip before compiling.
3448 struct private_common *
3449 kmp_threadprivate_insert(
int gtid,
void *pc_addr,
void *data_addr,
size_t pc_size );
3455 # define KMPC_CONVENTION __cdecl
3457 # define KMPC_CONVENTION
3461 typedef enum omp_sched_t {
3462 omp_sched_static = 1,
3463 omp_sched_dynamic = 2,
3464 omp_sched_guided = 3,
// NOTE(review): the bare integer that opens each declaration (3467, 3470, ...)
// is not a valid C/C++ token in that position; it looks like a line number
// carried over from a source listing -- confirm and strip before compiling.
// Affinity masks are handled through an untyped pointer.
3467 typedef void * kmp_affinity_mask_t;
// Exported entry points declared with KMPC_CONVENTION between the return type
// and the name. All parameters are unnamed, so only their types can be read
// off here.
// (int) -> void
3470 KMP_EXPORT
void KMPC_CONVENTION ompc_set_max_active_levels(
int);
// (omp_sched_t, int) -> void
3471 KMP_EXPORT
void KMPC_CONVENTION ompc_set_schedule(omp_sched_t,
int);
// (int) -> int
3472 KMP_EXPORT
int KMPC_CONVENTION ompc_get_ancestor_thread_num(
int);
// (int) -> int
3473 KMP_EXPORT
int KMPC_CONVENTION ompc_get_team_size(
int);
// The set/unset/get affinity-mask trio shares one signature:
// (int, kmp_affinity_mask_t *) -> int.
3474 KMP_EXPORT
int KMPC_CONVENTION kmpc_set_affinity_mask_proc(
int, kmp_affinity_mask_t *);
3475 KMP_EXPORT
int KMPC_CONVENTION kmpc_unset_affinity_mask_proc(
int, kmp_affinity_mask_t *);
3476 KMP_EXPORT
int KMPC_CONVENTION kmpc_get_affinity_mask_proc(
int, kmp_affinity_mask_t *);
// Two stack-size setters: one takes int, the `_s` one takes size_t.
3478 KMP_EXPORT
void KMPC_CONVENTION kmpc_set_stacksize(
int);
3479 KMP_EXPORT
void KMPC_CONVENTION kmpc_set_stacksize_s(
size_t);
// (int) -> void
3480 KMP_EXPORT
void KMPC_CONVENTION kmpc_set_library(
int);
// (char const *) -> void
3481 KMP_EXPORT
void KMPC_CONVENTION kmpc_set_defaults(
char const *);
// NOTE(review): the entries from here on have no terminating ';', are not in
// any visible order, and at least one (__kmpc_copyprivate) repeats a prototype
// that appears earlier in this file. The function-pointer entries (kmpc_dtor,
// kmpc_ctor, kmpc_cctor, kmpc_micro and the `_vec` forms) lack a `typedef`
// keyword even though other entries use those names as parameter types. This
// reads like a generated signature index, not compilable declarations --
// confirm before treating it as code.
KMP_EXPORT kmp_int32 __kmpc_master(ident_t *, kmp_int32 global_tid)
KMP_EXPORT kmp_int32 __kmpc_barrier_master(ident_t *, kmp_int32 global_tid)
void __kmpc_dispatch_fini_4(ident_t *loc, kmp_int32 gtid)
KMP_EXPORT void __kmpc_end_single(ident_t *, kmp_int32 global_tid)
void(* kmpc_dtor)(void *)
void __kmpc_dispatch_init_4(ident_t *loc, kmp_int32 gtid, enum sched_type schedule, kmp_int32 lb, kmp_int32 ub, kmp_int32 st, kmp_int32 chunk)
KMP_EXPORT kmp_int32 __kmpc_reduce(ident_t *loc, kmp_int32 global_tid, kmp_int32 num_vars, size_t reduce_size, void *reduce_data, void(*reduce_func)(void *lhs_data, void *rhs_data), kmp_critical_name *lck)
KMP_EXPORT kmp_int32 __kmpc_global_thread_num(ident_t *)
int __kmpc_dispatch_next_4u(ident_t *loc, kmp_int32 gtid, kmp_int32 *p_last, kmp_uint32 *p_lb, kmp_uint32 *p_ub, kmp_int32 *p_st)
void(* kmpc_dtor_vec)(void *, size_t)
KMP_EXPORT void __kmpc_for_static_fini(ident_t *loc, kmp_int32 global_tid)
KMP_EXPORT void __kmpc_omp_wait_deps(ident_t *loc_ref, kmp_int32 gtid, kmp_int32 ndeps, kmp_depend_info_t *dep_list, kmp_int32 ndeps_noalias, kmp_depend_info_t *noalias_dep_list)
void *(* kmpc_ctor_vec)(void *, size_t)
KMP_EXPORT void * __kmpc_threadprivate_cached(ident_t *loc, kmp_int32 global_tid, void *data, size_t size, void ***cache)
void *(* kmpc_cctor_vec)(void *, void *, size_t)
KMP_EXPORT void __kmpc_flush(ident_t *)
void __kmpc_dispatch_init_8u(ident_t *loc, kmp_int32 gtid, enum sched_type schedule, kmp_uint64 lb, kmp_uint64 ub, kmp_int64 st, kmp_int64 chunk)
KMP_EXPORT kmp_int32 __kmpc_single(ident_t *, kmp_int32 global_tid)
int __kmpc_dispatch_next_4(ident_t *loc, kmp_int32 gtid, kmp_int32 *p_last, kmp_int32 *p_lb, kmp_int32 *p_ub, kmp_int32 *p_st)
KMP_EXPORT void __kmpc_end(ident_t *)
KMP_EXPORT void __kmpc_end_ordered(ident_t *, kmp_int32 global_tid)
KMP_EXPORT void __kmpc_end_serialized_parallel(ident_t *, kmp_int32 global_tid)
void *(* kmpc_cctor)(void *, void *)
KMP_EXPORT void __kmpc_threadprivate_register(ident_t *, void *data, kmpc_ctor ctor, kmpc_cctor cctor, kmpc_dtor dtor)
KMP_EXPORT kmp_int32 __kmpc_omp_task_with_deps(ident_t *loc_ref, kmp_int32 gtid, kmp_task_t *new_task, kmp_int32 ndeps, kmp_depend_info_t *dep_list, kmp_int32 ndeps_noalias, kmp_depend_info_t *noalias_dep_list)
KMP_EXPORT void __kmpc_begin(ident_t *, kmp_int32 flags)
KMP_EXPORT kmp_int32 __kmpc_bound_thread_num(ident_t *)
KMP_EXPORT kmp_int32 __kmpc_reduce_nowait(ident_t *loc, kmp_int32 global_tid, kmp_int32 num_vars, size_t reduce_size, void *reduce_data, void(*reduce_func)(void *lhs_data, void *rhs_data), kmp_critical_name *lck)
int __kmpc_dispatch_next_8(ident_t *loc, kmp_int32 gtid, kmp_int32 *p_last, kmp_int64 *p_lb, kmp_int64 *p_ub, kmp_int64 *p_st)
KMP_EXPORT void __kmpc_copyprivate(ident_t *loc, kmp_int32 global_tid, size_t cpy_size, void *cpy_data, void(*cpy_func)(void *, void *), kmp_int32 didit)
KMP_EXPORT void __kmpc_ordered(ident_t *, kmp_int32 global_tid)
KMP_EXPORT void __kmpc_critical(ident_t *, kmp_int32 global_tid, kmp_critical_name *)
KMP_EXPORT void __kmpc_end_barrier_master(ident_t *, kmp_int32 global_tid)
KMP_EXPORT void __kmpc_end_master(ident_t *, kmp_int32 global_tid)
KMP_EXPORT void __kmpc_push_num_threads(ident_t *loc, kmp_int32 global_tid, kmp_int32 num_threads)
KMP_EXPORT void __kmpc_fork_teams(ident_t *loc, kmp_int32 argc, kmpc_micro microtask,...)
KMP_EXPORT kmp_int32 __kmpc_in_parallel(ident_t *loc)
KMP_EXPORT kmp_int32 __kmpc_ok_to_fork(ident_t *)
KMP_EXPORT kmp_int32 __kmpc_global_num_threads(ident_t *)
void __kmpc_dispatch_fini_8u(ident_t *loc, kmp_int32 gtid)
KMP_EXPORT kmp_int32 __kmpc_bound_num_threads(ident_t *)
KMP_EXPORT void __kmpc_end_reduce(ident_t *loc, kmp_int32 global_tid, kmp_critical_name *lck)
void __kmpc_dispatch_fini_4u(ident_t *loc, kmp_int32 gtid)
KMP_EXPORT void __kmpc_barrier(ident_t *, kmp_int32 global_tid)
KMP_EXPORT void __kmpc_end_reduce_nowait(ident_t *loc, kmp_int32 global_tid, kmp_critical_name *lck)
KMP_EXPORT void __kmpc_end_critical(ident_t *, kmp_int32 global_tid, kmp_critical_name *)
void *(* kmpc_ctor)(void *)
KMP_EXPORT void __kmpc_push_num_teams(ident_t *loc, kmp_int32 global_tid, kmp_int32 num_teams, kmp_int32 num_threads)
void __kmpc_dispatch_fini_8(ident_t *loc, kmp_int32 gtid)
void __kmpc_dispatch_init_4u(ident_t *loc, kmp_int32 gtid, enum sched_type schedule, kmp_uint32 lb, kmp_uint32 ub, kmp_int32 st, kmp_int32 chunk)
void(* kmpc_micro)(kmp_int32 *global_tid, kmp_int32 *bound_tid,...)
KMP_EXPORT kmp_int32 __kmpc_barrier_master_nowait(ident_t *, kmp_int32 global_tid)
int __kmpc_dispatch_next_8u(ident_t *loc, kmp_int32 gtid, kmp_int32 *p_last, kmp_uint64 *p_lb, kmp_uint64 *p_ub, kmp_int64 *p_st)
KMP_EXPORT void __kmpc_serialized_parallel(ident_t *, kmp_int32 global_tid)
KMP_EXPORT void __kmpc_fork_call(ident_t *, kmp_int32 nargs, kmpc_micro microtask,...)
KMP_EXPORT void __kmpc_threadprivate_register_vec(ident_t *, void *data, kmpc_ctor_vec ctor, kmpc_cctor_vec cctor, kmpc_dtor_vec dtor, size_t vector_length)
void __kmpc_dispatch_init_8(ident_t *loc, kmp_int32 gtid, enum sched_type schedule, kmp_int64 lb, kmp_int64 ub, kmp_int64 st, kmp_int64 chunk)