
Update contrib/libs/cxxsupp/openmp to 15.0.2

thegeorg committed 2 years ago · commit da5ee816c1

+ 62 - 16
contrib/libs/cxxsupp/openmp/kmp.h

@@ -100,18 +100,18 @@ class kmp_stats_list;
 #ifndef HWLOC_OBJ_PACKAGE
 #define HWLOC_OBJ_PACKAGE HWLOC_OBJ_SOCKET
 #endif
-#if HWLOC_API_VERSION >= 0x00020000
-// hwloc 2.0 changed type of depth of object from unsigned to int
-typedef int kmp_hwloc_depth_t;
-#else
-typedef unsigned int kmp_hwloc_depth_t;
-#endif
 #endif
 
 #if KMP_ARCH_X86 || KMP_ARCH_X86_64
 #include <xmmintrin.h>
 #endif
 
+// The below has to be defined before including "kmp_barrier.h".
+#define KMP_INTERNAL_MALLOC(sz) malloc(sz)
+#define KMP_INTERNAL_FREE(p) free(p)
+#define KMP_INTERNAL_REALLOC(p, sz) realloc((p), (sz))
+#define KMP_INTERNAL_CALLOC(n, sz) calloc((n), (sz))
+
 #include "kmp_debug.h"
 #include "kmp_lock.h"
 #include "kmp_version.h"
@@ -841,7 +841,9 @@ extern unsigned __kmp_affinity_num_masks;
 extern void __kmp_affinity_bind_thread(int which);
 
 extern kmp_affin_mask_t *__kmp_affin_fullMask;
+extern kmp_affin_mask_t *__kmp_affin_origMask;
 extern char *__kmp_cpuinfo_file;
+extern bool __kmp_affin_reset;
 
 #endif /* KMP_AFFINITY_SUPPORTED */
 
@@ -967,7 +969,6 @@ extern omp_memspace_handle_t const omp_large_cap_mem_space;
 extern omp_memspace_handle_t const omp_const_mem_space;
 extern omp_memspace_handle_t const omp_high_bw_mem_space;
 extern omp_memspace_handle_t const omp_low_lat_mem_space;
-// Preview of target memory support
 extern omp_memspace_handle_t const llvm_omp_target_host_mem_space;
 extern omp_memspace_handle_t const llvm_omp_target_shared_mem_space;
 extern omp_memspace_handle_t const llvm_omp_target_device_mem_space;
@@ -987,7 +988,6 @@ extern omp_allocator_handle_t const omp_low_lat_mem_alloc;
 extern omp_allocator_handle_t const omp_cgroup_mem_alloc;
 extern omp_allocator_handle_t const omp_pteam_mem_alloc;
 extern omp_allocator_handle_t const omp_thread_mem_alloc;
-// Preview of target memory support
 extern omp_allocator_handle_t const llvm_omp_target_host_mem_alloc;
 extern omp_allocator_handle_t const llvm_omp_target_shared_mem_alloc;
 extern omp_allocator_handle_t const llvm_omp_target_device_mem_alloc;
@@ -1124,7 +1124,7 @@ extern void __kmp_init_target_mem();
 #if KMP_OS_UNIX && (KMP_ARCH_X86 || KMP_ARCH_X86_64)
 // HW TSC is used to reduce overhead (clock tick instead of nanosecond).
 extern kmp_uint64 __kmp_ticks_per_msec;
-#if KMP_COMPILER_ICC
+#if KMP_COMPILER_ICC || KMP_COMPILER_ICX
 #define KMP_NOW() ((kmp_uint64)_rdtsc())
 #else
 #define KMP_NOW() __kmp_hardware_timestamp()
@@ -1334,7 +1334,10 @@ static inline int __kmp_tpause(uint32_t hint, uint64_t counter) {
   char flag;
   __asm__ volatile("#tpause\n.byte 0x66, 0x0F, 0xAE, 0xF1\n"
                    "setb   %0"
-                   : "=r"(flag)
+                   // The "=q" restraint means any register accessible as rl
+                   //   in 32-bit mode: a, b, c, and d;
+                   //   in 64-bit mode: any integer register
+                   : "=q"(flag)
                    : "a"(timeLo), "d"(timeHi), "c"(hint)
                    :);
   return flag;
@@ -1361,7 +1364,10 @@ static inline int __kmp_umwait(uint32_t hint, uint64_t counter) {
   char flag;
   __asm__ volatile("#umwait\n.byte 0xF2, 0x0F, 0xAE, 0xF1\n"
                    "setb   %0"
-                   : "=r"(flag)
+                   // The "=q" restraint means any register accessible as rl
+                   //   in 32-bit mode: a, b, c, and d;
+                   //   in 64-bit mode: any integer register
+                   : "=q"(flag)
                    : "a"(timeLo), "d"(timeHi), "c"(hint)
                    :);
   return flag;
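
A note on the "=r" → "=q" change in the two hunks above: setb writes an 8-bit register, and with "=r" the compiler may pick esi or edi on 32-bit x86, which have no byte-sized form, so the asm can fail to assemble. Below is a minimal standalone sketch (x86/x86-64 only, not part of this commit; function and operands are illustrative) showing the same output-constraint pattern:

#include <stdint.h>

// Returns 1 if the 32-bit addition a + b carried, else 0.
static inline int add_carried(uint32_t a, uint32_t b) {
  char flag;
  __asm__ volatile("addl %2, %1\n\t"
                   "setb  %0"            // setb needs a byte-accessible register
                   : "=q"(flag), "+r"(a) // "=q": a/b/c/d on 32-bit, any GPR on 64-bit
                   : "r"(b)
                   : "cc");
  return flag;
}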
@@ -2548,11 +2554,22 @@ typedef union KMP_ALIGN_CACHE kmp_thread_data {
   char td_pad[KMP_PAD(kmp_base_thread_data_t, CACHE_LINE)];
 } kmp_thread_data_t;
 
+typedef struct kmp_task_pri {
+  kmp_thread_data_t td;
+  kmp_int32 priority;
+  kmp_task_pri *next;
+} kmp_task_pri_t;
+
 // Data for task teams which are used when tasking is enabled for the team
 typedef struct kmp_base_task_team {
   kmp_bootstrap_lock_t
       tt_threads_lock; /* Lock used to allocate per-thread part of task team */
   /* must be bootstrap lock since used at library shutdown*/
+
+  // TODO: check performance vs kmp_tas_lock_t
+  kmp_bootstrap_lock_t tt_task_pri_lock; /* Lock to access priority tasks */
+  kmp_task_pri_t *tt_task_pri_list;
+
   kmp_task_team_t *tt_next; /* For linking the task team free list */
   kmp_thread_data_t
       *tt_threads_data; /* Array of per-thread structures for task team */
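
The new kmp_task_pri_t above pairs a priority value with its own per-thread queue, linked into tt_task_pri_list under tt_task_pri_lock. As a rough sketch (invented names, heavily simplified; the real enqueue/steal logic lives elsewhere in the tasking code), one plausible shape is a list kept sorted with the highest priority first:

// Hypothetical illustration of a priority-sorted task-queue list.
typedef struct pri_node {
  int priority;            // analogue of kmp_task_pri_t::priority
  struct pri_node *next;   // analogue of kmp_task_pri_t::next
} pri_node_t;

// Insert keeping descending priority order; in the runtime this would run
// under tt_task_pri_lock, and each node would also carry its task deque (td).
static void insert_sorted(pri_node_t **head, pri_node_t *node) {
  pri_node_t **pp = head;
  while (*pp && (*pp)->priority > node->priority)
    pp = &(*pp)->next;
  node->next = *pp;
  *pp = node;
}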
@@ -2564,6 +2581,7 @@ typedef struct kmp_base_task_team {
   kmp_int32 tt_max_threads; // # entries allocated for threads_data array
   kmp_int32 tt_found_proxy_tasks; // found proxy tasks since last barrier
   kmp_int32 tt_untied_task_encountered;
+  std::atomic<kmp_int32> tt_num_task_pri; // number of priority tasks enqueued
   // There is hidden helper thread encountered in this task team so that we must
   // wait when waiting on task team
   kmp_int32 tt_hidden_helper_task_encountered;
@@ -2973,6 +2991,15 @@ struct fortran_inx_info {
   kmp_int32 data;
 };
 
+// This list type exists to hold old __kmp_threads arrays so that
+// old references to them may complete while reallocation takes place when
+// expanding the array. The items in this list are kept alive until library
+// shutdown.
+typedef struct kmp_old_threads_list_t {
+  kmp_info_t **threads;
+  struct kmp_old_threads_list_t *next;
+} kmp_old_threads_list_t;
+
 /* ------------------------------------------------------------------------ */
 
 extern int __kmp_settings;
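
The comment above describes a retire-instead-of-free scheme for growing __kmp_threads: the old array stays reachable from a list until library shutdown, so a thread that loaded the old pointer just before the resize still dereferences valid memory. A minimal sketch of that pattern (generic names, not the runtime's actual resize code):

#include <stdlib.h>

typedef struct retired_arrays {
  void **arr;
  struct retired_arrays *next;
} retired_arrays_t;

// Grow an array of pointers without freeing the old storage: the old block is
// pushed onto a retire list (freed only at shutdown), so concurrent readers
// holding the old pointer remain safe.
static void **grow_retaining_old(void **cur, size_t old_cap, size_t new_cap,
                                 retired_arrays_t **retire_list) {
  void **bigger = (void **)calloc(new_cap, sizeof(void *));
  for (size_t i = 0; i < old_cap; ++i)
    bigger[i] = cur[i];
  retired_arrays_t *node = (retired_arrays_t *)malloc(sizeof(*node));
  node->arr = cur;            // retired, not freed
  node->next = *retire_list;
  *retire_list = node;
  return bigger;              // caller publishes this as the new array
}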
@@ -3036,6 +3063,8 @@ extern int __kmp_storage_map_verbose_specified;
 #if KMP_ARCH_X86 || KMP_ARCH_X86_64
 extern kmp_cpuinfo_t __kmp_cpuinfo;
 static inline bool __kmp_is_hybrid_cpu() { return __kmp_cpuinfo.flags.hybrid; }
+#elif KMP_OS_DARWIN && KMP_ARCH_AARCH64
+static inline bool __kmp_is_hybrid_cpu() { return true; }
 #else
 static inline bool __kmp_is_hybrid_cpu() { return false; }
 #endif
@@ -3043,6 +3072,7 @@ static inline bool __kmp_is_hybrid_cpu() { return false; }
 extern volatile int __kmp_init_serial;
 extern volatile int __kmp_init_gtid;
 extern volatile int __kmp_init_common;
+extern volatile int __kmp_need_register_serial;
 extern volatile int __kmp_init_middle;
 extern volatile int __kmp_init_parallel;
 #if KMP_USE_MONITOR
@@ -3150,6 +3180,7 @@ extern int __kmp_tp_cached; /* whether threadprivate cache has been created
                                (__kmpc_threadprivate_cached()) */
 extern int __kmp_dflt_blocktime; /* number of milliseconds to wait before
                                     blocking (env setting) */
+extern bool __kmp_wpolicy_passive; /* explicitly set passive wait policy */
 #if KMP_USE_MONITOR
 extern int
     __kmp_monitor_wakeups; /* number of times monitor wakes up per second */
@@ -3253,6 +3284,8 @@ extern int __kmp_teams_thread_limit;
 /* the following are protected by the fork/join lock */
 /* write: lock  read: anytime */
 extern kmp_info_t **__kmp_threads; /* Descriptors for the threads */
+/* Holds old arrays of __kmp_threads until library shutdown */
+extern kmp_old_threads_list_t *__kmp_old_threads_list;
 /* read/write: lock */
 extern volatile kmp_team_t *__kmp_team_pool;
 extern volatile kmp_info_t *__kmp_thread_pool;
@@ -3451,11 +3484,6 @@ extern void ___kmp_thread_free(kmp_info_t *th, void *ptr KMP_SRC_LOC_DECL);
 #define __kmp_thread_free(th, ptr)                                             \
   ___kmp_thread_free((th), (ptr)KMP_SRC_LOC_CURR)
 
-#define KMP_INTERNAL_MALLOC(sz) malloc(sz)
-#define KMP_INTERNAL_FREE(p) free(p)
-#define KMP_INTERNAL_REALLOC(p, sz) realloc((p), (sz))
-#define KMP_INTERNAL_CALLOC(n, sz) calloc((n), (sz))
-
 extern void __kmp_push_num_threads(ident_t *loc, int gtid, int num_threads);
 
 extern void __kmp_push_proc_bind(ident_t *loc, int gtid,
@@ -3601,8 +3629,18 @@ static inline void __kmp_assign_root_init_mask() {
     r->r.r_affinity_assigned = TRUE;
   }
 }
+static inline void __kmp_reset_root_init_mask(int gtid) {
+  kmp_info_t *th = __kmp_threads[gtid];
+  kmp_root_t *r = th->th.th_root;
+  if (r->r.r_uber_thread == th && r->r.r_affinity_assigned) {
+    __kmp_set_system_affinity(__kmp_affin_origMask, FALSE);
+    KMP_CPU_COPY(th->th.th_affin_mask, __kmp_affin_origMask);
+    r->r.r_affinity_assigned = FALSE;
+  }
+}
 #else /* KMP_AFFINITY_SUPPORTED */
 #define __kmp_assign_root_init_mask() /* Nothing */
+static inline void __kmp_reset_root_init_mask(int gtid) {}
 #endif /* KMP_AFFINITY_SUPPORTED */
 // No need for KMP_AFFINITY_SUPPORTED guard as only one field in the
 // format string is for affinity, so platforms that do not support
@@ -3865,6 +3903,11 @@ KMP_EXPORT kmp_int32 __kmpc_barrier_master_nowait(ident_t *,
 KMP_EXPORT kmp_int32 __kmpc_single(ident_t *, kmp_int32 global_tid);
 KMP_EXPORT void __kmpc_end_single(ident_t *, kmp_int32 global_tid);
 
+KMP_EXPORT kmp_int32 __kmpc_sections_init(ident_t *loc, kmp_int32 global_tid);
+KMP_EXPORT kmp_int32 __kmpc_next_section(ident_t *loc, kmp_int32 global_tid,
+                                         kmp_int32 numberOfSections);
+KMP_EXPORT void __kmpc_end_sections(ident_t *loc, kmp_int32 global_tid);
+
 KMP_EXPORT void KMPC_FOR_STATIC_INIT(ident_t *loc, kmp_int32 global_tid,
                                      kmp_int32 schedtype, kmp_int32 *plastiter,
                                      kmp_int *plower, kmp_int *pupper,
@@ -3878,6 +3921,9 @@ KMP_EXPORT void __kmpc_copyprivate(ident_t *loc, kmp_int32 global_tid,
                                    void (*cpy_func)(void *, void *),
                                    kmp_int32 didit);
 
+KMP_EXPORT void *__kmpc_copyprivate_light(ident_t *loc, kmp_int32 gtid,
+                                          void *cpy_data);
+
 extern void KMPC_SET_NUM_THREADS(int arg);
 extern void KMPC_SET_DYNAMIC(int flag);
 extern void KMPC_SET_NESTED(int flag);

+ 74 - 86
contrib/libs/cxxsupp/openmp/kmp_affinity.cpp

@@ -138,6 +138,18 @@ const char *__kmp_hw_get_core_type_string(kmp_hw_core_type_t type) {
   return "unknown";
 }
 
+#if KMP_AFFINITY_SUPPORTED
+// If affinity is supported, check the affinity
+// verbose and warning flags before printing warning
+#define KMP_AFF_WARNING(...)                                                   \
+  if (__kmp_affinity_verbose ||                                                \
+      (__kmp_affinity_warnings && (__kmp_affinity_type != affinity_none))) {   \
+    KMP_WARNING(__VA_ARGS__);                                                  \
+  }
+#else
+#define KMP_AFF_WARNING KMP_WARNING
+#endif
+
 ////////////////////////////////////////////////////////////////////////////////
 // kmp_hw_thread_t methods
 int kmp_hw_thread_t::compare_ids(const void *a, const void *b) {
@@ -818,16 +830,16 @@ void kmp_topology_t::canonicalize() {
       // First try core, then thread, then package
       kmp_hw_t gran_types[3] = {KMP_HW_CORE, KMP_HW_THREAD, KMP_HW_SOCKET};
       for (auto g : gran_types) {
-        if (__kmp_topology->get_equivalent_type(g) != KMP_HW_UNKNOWN) {
+        if (get_equivalent_type(g) != KMP_HW_UNKNOWN) {
           gran_type = g;
           break;
         }
       }
       KMP_ASSERT(gran_type != KMP_HW_UNKNOWN);
       // Warn user what granularity setting will be used instead
-      KMP_WARNING(AffGranularityBad, "KMP_AFFINITY",
-                  __kmp_hw_get_catalog_string(__kmp_affinity_gran),
-                  __kmp_hw_get_catalog_string(gran_type));
+      KMP_AFF_WARNING(AffGranularityBad, "KMP_AFFINITY",
+                      __kmp_hw_get_catalog_string(__kmp_affinity_gran),
+                      __kmp_hw_get_catalog_string(gran_type));
       __kmp_affinity_gran = gran_type;
     }
 #if KMP_GROUP_AFFINITY
@@ -839,12 +851,12 @@ void kmp_topology_t::canonicalize() {
     // processor groups that cover a socket, then the runtime must
     // restrict the granularity down to the processor group level.
     if (__kmp_num_proc_groups > 1) {
-      int gran_depth = __kmp_topology->get_level(gran_type);
-      int proc_group_depth = __kmp_topology->get_level(KMP_HW_PROC_GROUP);
+      int gran_depth = get_level(gran_type);
+      int proc_group_depth = get_level(KMP_HW_PROC_GROUP);
       if (gran_depth >= 0 && proc_group_depth >= 0 &&
           gran_depth < proc_group_depth) {
-        KMP_WARNING(AffGranTooCoarseProcGroup, "KMP_AFFINITY",
-                    __kmp_hw_get_catalog_string(__kmp_affinity_gran));
+        KMP_AFF_WARNING(AffGranTooCoarseProcGroup, "KMP_AFFINITY",
+                        __kmp_hw_get_catalog_string(__kmp_affinity_gran));
         __kmp_affinity_gran = gran_type = KMP_HW_PROC_GROUP;
       }
     }
@@ -966,16 +978,16 @@ bool kmp_topology_t::filter_hw_subset() {
     if (equivalent_type != KMP_HW_UNKNOWN) {
       __kmp_hw_subset->at(i).type = equivalent_type;
     } else {
-      KMP_WARNING(AffHWSubsetNotExistGeneric,
-                  __kmp_hw_get_catalog_string(type));
+      KMP_AFF_WARNING(AffHWSubsetNotExistGeneric,
+                      __kmp_hw_get_catalog_string(type));
       return false;
     }
 
     // Check to see if current layer has already been
     // specified either directly or through an equivalent type
     if (specified[equivalent_type] != KMP_HW_UNKNOWN) {
-      KMP_WARNING(AffHWSubsetEqvLayers, __kmp_hw_get_catalog_string(type),
-                  __kmp_hw_get_catalog_string(specified[equivalent_type]));
+      KMP_AFF_WARNING(AffHWSubsetEqvLayers, __kmp_hw_get_catalog_string(type),
+                      __kmp_hw_get_catalog_string(specified[equivalent_type]));
       return false;
     }
     specified[equivalent_type] = type;
@@ -985,8 +997,8 @@ bool kmp_topology_t::filter_hw_subset() {
     if (max_count < 0 ||
         (num != kmp_hw_subset_t::USE_ALL && num + offset > max_count)) {
       bool plural = (num > 1);
-      KMP_WARNING(AffHWSubsetManyGeneric,
-                  __kmp_hw_get_catalog_string(type, plural));
+      KMP_AFF_WARNING(AffHWSubsetManyGeneric,
+                      __kmp_hw_get_catalog_string(type, plural));
       return false;
     }
 
@@ -1008,21 +1020,21 @@ bool kmp_topology_t::filter_hw_subset() {
       if ((using_core_effs || using_core_types) && !__kmp_is_hybrid_cpu()) {
         if (item.num_attrs == 1) {
           if (using_core_effs) {
-            KMP_WARNING(AffHWSubsetIgnoringAttr, "efficiency");
+            KMP_AFF_WARNING(AffHWSubsetIgnoringAttr, "efficiency");
           } else {
-            KMP_WARNING(AffHWSubsetIgnoringAttr, "core_type");
+            KMP_AFF_WARNING(AffHWSubsetIgnoringAttr, "core_type");
           }
           using_core_effs = false;
           using_core_types = false;
         } else {
-          KMP_WARNING(AffHWSubsetAttrsNonHybrid);
+          KMP_AFF_WARNING(AffHWSubsetAttrsNonHybrid);
           return false;
         }
       }
 
       // Check if using both core types and core efficiencies together
       if (using_core_types && using_core_effs) {
-        KMP_WARNING(AffHWSubsetIncompat, "core_type", "efficiency");
+        KMP_AFF_WARNING(AffHWSubsetIncompat, "core_type", "efficiency");
         return false;
       }
 
@@ -1058,7 +1070,7 @@ bool kmp_topology_t::filter_hw_subset() {
                 (num != kmp_hw_subset_t::USE_ALL && num + offset > max_count)) {
               kmp_str_buf_t buf;
               __kmp_hw_get_catalog_core_string(item.attr[j], &buf, num > 0);
-              KMP_WARNING(AffHWSubsetManyGeneric, buf.str);
+              KMP_AFF_WARNING(AffHWSubsetManyGeneric, buf.str);
               __kmp_str_buf_free(&buf);
               return false;
             }
@@ -1080,8 +1092,8 @@ bool kmp_topology_t::filter_hw_subset() {
             }
             kmp_str_buf_t buf;
             __kmp_hw_get_catalog_core_string(other_attr, &buf, item.num[j] > 0);
-            KMP_WARNING(AffHWSubsetIncompat,
-                        __kmp_hw_get_catalog_string(KMP_HW_CORE), buf.str);
+            KMP_AFF_WARNING(AffHWSubsetIncompat,
+                            __kmp_hw_get_catalog_string(KMP_HW_CORE), buf.str);
             __kmp_str_buf_free(&buf);
             return false;
           }
@@ -1093,7 +1105,7 @@ bool kmp_topology_t::filter_hw_subset() {
               kmp_str_buf_t buf;
               __kmp_hw_get_catalog_core_string(item.attr[j], &buf,
                                                item.num[j] > 0);
-              KMP_WARNING(AffHWSubsetAttrRepeat, buf.str);
+              KMP_AFF_WARNING(AffHWSubsetAttrRepeat, buf.str);
               __kmp_str_buf_free(&buf);
               return false;
             }
@@ -1201,7 +1213,7 @@ bool kmp_topology_t::filter_hw_subset() {
 
   // One last check that we shouldn't allow filtering entire machine
   if (num_filtered == num_hw_threads) {
-    KMP_WARNING(AffHWSubsetAllFiltered);
+    KMP_AFF_WARNING(AffHWSubsetAllFiltered);
     __kmp_free(filtered);
     return false;
   }
@@ -1536,6 +1548,8 @@ int __kmp_affinity_entire_machine_mask(kmp_affin_mask_t *mask) {
 // internal topology object and set the layer ids for it.  Each routine
 // returns a boolean on whether it was successful at doing so.
 kmp_affin_mask_t *__kmp_affin_fullMask = NULL;
+// Original mask is a subset of full mask in multiple processor groups topology
+kmp_affin_mask_t *__kmp_affin_origMask = NULL;
 
 #if KMP_USE_HWLOC
 static inline bool __kmp_hwloc_is_cache_type(hwloc_obj_t obj) {
@@ -1765,7 +1779,7 @@ static bool __kmp_affinity_create_hwloc_map(kmp_i18n_id_t *const msg_id) {
 
   hw_thread_index = 0;
   pu = NULL;
-  while (pu = hwloc_get_next_obj_by_type(tp, HWLOC_OBJ_PU, pu)) {
+  while ((pu = hwloc_get_next_obj_by_type(tp, HWLOC_OBJ_PU, pu))) {
     int index = depth - 1;
     bool included = KMP_CPU_ISSET(pu->os_index, __kmp_affin_fullMask);
     kmp_hw_thread_t &hw_thread = __kmp_topology->at(hw_thread_index);
@@ -3353,10 +3367,7 @@ static kmp_affin_mask_t *__kmp_create_masks(unsigned *maxIndex,
     KMP_INFORM(ThreadsMigrate, "KMP_AFFINITY", __kmp_affinity_gran_levels);
   }
   if (__kmp_affinity_gran_levels >= (int)depth) {
-    if (__kmp_affinity_verbose ||
-        (__kmp_affinity_warnings && (__kmp_affinity_type != affinity_none))) {
-      KMP_WARNING(AffThreadsMayMigrate);
-    }
+    KMP_AFF_WARNING(AffThreadsMayMigrate);
   }
 
   // Run through the table, forming the masks for all threads on each core.
@@ -3443,11 +3454,7 @@ static int nextNewMask;
   {                                                                            \
     if (((_osId) > _maxOsId) ||                                                \
         (!KMP_CPU_ISSET((_osId), KMP_CPU_INDEX((_osId2Mask), (_osId))))) {     \
-      if (__kmp_affinity_verbose ||                                            \
-          (__kmp_affinity_warnings &&                                          \
-           (__kmp_affinity_type != affinity_none))) {                          \
-        KMP_WARNING(AffIgnoreInvalidProcID, _osId);                            \
-      }                                                                        \
+      KMP_AFF_WARNING(AffIgnoreInvalidProcID, _osId);                          \
     } else {                                                                   \
       ADD_MASK(KMP_CPU_INDEX(_osId2Mask, (_osId)));                            \
     }                                                                          \
@@ -3498,11 +3505,7 @@ static void __kmp_affinity_process_proclist(kmp_affin_mask_t **out_masks,
       // Copy the mask for that osId to the sum (union) mask.
       if ((num > maxOsId) ||
           (!KMP_CPU_ISSET(num, KMP_CPU_INDEX(osId2Mask, num)))) {
-        if (__kmp_affinity_verbose ||
-            (__kmp_affinity_warnings &&
-             (__kmp_affinity_type != affinity_none))) {
-          KMP_WARNING(AffIgnoreInvalidProcID, num);
-        }
+        KMP_AFF_WARNING(AffIgnoreInvalidProcID, num);
         KMP_CPU_ZERO(sumMask);
       } else {
         KMP_CPU_COPY(sumMask, KMP_CPU_INDEX(osId2Mask, num));
@@ -3534,11 +3537,7 @@ static void __kmp_affinity_process_proclist(kmp_affin_mask_t **out_masks,
         // Add the mask for that osId to the sum mask.
         if ((num > maxOsId) ||
             (!KMP_CPU_ISSET(num, KMP_CPU_INDEX(osId2Mask, num)))) {
-          if (__kmp_affinity_verbose ||
-              (__kmp_affinity_warnings &&
-               (__kmp_affinity_type != affinity_none))) {
-            KMP_WARNING(AffIgnoreInvalidProcID, num);
-          }
+          KMP_AFF_WARNING(AffIgnoreInvalidProcID, num);
         } else {
           KMP_CPU_UNION(sumMask, KMP_CPU_INDEX(osId2Mask, num));
           setSize++;
@@ -3695,11 +3694,7 @@ static void __kmp_process_subplace_list(const char **scan,
     if (**scan == '}' || **scan == ',') {
       if ((start > maxOsId) ||
           (!KMP_CPU_ISSET(start, KMP_CPU_INDEX(osId2Mask, start)))) {
-        if (__kmp_affinity_verbose ||
-            (__kmp_affinity_warnings &&
-             (__kmp_affinity_type != affinity_none))) {
-          KMP_WARNING(AffIgnoreInvalidProcID, start);
-        }
+        KMP_AFF_WARNING(AffIgnoreInvalidProcID, start);
       } else {
         KMP_CPU_UNION(tempMask, KMP_CPU_INDEX(osId2Mask, start));
         (*setSize)++;
@@ -3728,11 +3723,7 @@ static void __kmp_process_subplace_list(const char **scan,
       for (i = 0; i < count; i++) {
         if ((start > maxOsId) ||
             (!KMP_CPU_ISSET(start, KMP_CPU_INDEX(osId2Mask, start)))) {
-          if (__kmp_affinity_verbose ||
-              (__kmp_affinity_warnings &&
-               (__kmp_affinity_type != affinity_none))) {
-            KMP_WARNING(AffIgnoreInvalidProcID, start);
-          }
+          KMP_AFF_WARNING(AffIgnoreInvalidProcID, start);
           break; // don't proliferate warnings for large count
         } else {
           KMP_CPU_UNION(tempMask, KMP_CPU_INDEX(osId2Mask, start));
@@ -3779,11 +3770,7 @@ static void __kmp_process_subplace_list(const char **scan,
       for (i = 0; i < count; i++) {
         if ((start > maxOsId) ||
             (!KMP_CPU_ISSET(start, KMP_CPU_INDEX(osId2Mask, start)))) {
-          if (__kmp_affinity_verbose ||
-              (__kmp_affinity_warnings &&
-               (__kmp_affinity_type != affinity_none))) {
-            KMP_WARNING(AffIgnoreInvalidProcID, start);
-          }
+          KMP_AFF_WARNING(AffIgnoreInvalidProcID, start);
           break; // don't proliferate warnings for large count
         } else {
           KMP_CPU_UNION(tempMask, KMP_CPU_INDEX(osId2Mask, start));
@@ -3825,10 +3812,7 @@ static void __kmp_process_place(const char **scan, kmp_affin_mask_t *osId2Mask,
     KMP_ASSERT(num >= 0);
     if ((num > maxOsId) ||
         (!KMP_CPU_ISSET(num, KMP_CPU_INDEX(osId2Mask, num)))) {
-      if (__kmp_affinity_verbose ||
-          (__kmp_affinity_warnings && (__kmp_affinity_type != affinity_none))) {
-        KMP_WARNING(AffIgnoreInvalidProcID, num);
-      }
+      KMP_AFF_WARNING(AffIgnoreInvalidProcID, num);
     } else {
       KMP_CPU_UNION(tempMask, KMP_CPU_INDEX(osId2Mask, num));
       (*setSize)++;
@@ -3945,11 +3929,8 @@ void __kmp_affinity_process_placelist(kmp_affin_mask_t **out_masks,
             (!KMP_CPU_ISSET(j, __kmp_affin_fullMask)) ||
             (!KMP_CPU_ISSET(j + stride,
                             KMP_CPU_INDEX(osId2Mask, j + stride)))) {
-          if ((__kmp_affinity_verbose ||
-               (__kmp_affinity_warnings &&
-                (__kmp_affinity_type != affinity_none))) &&
-              i < count - 1) {
-            KMP_WARNING(AffIgnoreInvalidProcID, j + stride);
+          if (i < count - 1) {
+            KMP_AFF_WARNING(AffIgnoreInvalidProcID, j + stride);
           }
           continue;
         }
@@ -4072,8 +4053,13 @@ static void __kmp_aux_affinity_initialize(void) {
   if (__kmp_affin_fullMask == NULL) {
     KMP_CPU_ALLOC(__kmp_affin_fullMask);
   }
+  if (__kmp_affin_origMask == NULL) {
+    KMP_CPU_ALLOC(__kmp_affin_origMask);
+  }
   if (KMP_AFFINITY_CAPABLE()) {
     __kmp_get_system_affinity(__kmp_affin_fullMask, TRUE);
+    // Make a copy before possible expanding to the entire machine mask
+    __kmp_affin_origMask->copy(__kmp_affin_fullMask);
     if (__kmp_affinity_respect_mask) {
       // Count the number of available processors.
       unsigned i;
@@ -4085,11 +4071,7 @@ static void __kmp_aux_affinity_initialize(void) {
         __kmp_avail_proc++;
       }
       if (__kmp_avail_proc > __kmp_xproc) {
-        if (__kmp_affinity_verbose ||
-            (__kmp_affinity_warnings &&
-             (__kmp_affinity_type != affinity_none))) {
-          KMP_WARNING(ErrorInitializeAffinity);
-        }
+        KMP_AFF_WARNING(ErrorInitializeAffinity);
         __kmp_affinity_type = affinity_none;
         KMP_AFFINITY_DISABLE();
         return;
@@ -4111,6 +4093,10 @@ static void __kmp_aux_affinity_initialize(void) {
       __kmp_avail_proc =
           __kmp_affinity_entire_machine_mask(__kmp_affin_fullMask);
 #if KMP_OS_WINDOWS
+      if (__kmp_num_proc_groups <= 1) {
+        // Copy expanded full mask if topology has single processor group
+        __kmp_affin_origMask->copy(__kmp_affin_fullMask);
+      }
       // Set the process affinity mask since threads' affinity
       // masks must be subset of process mask in Windows* OS
       __kmp_affin_fullMask->set_process_affinity(true);
@@ -4254,10 +4240,8 @@ static void __kmp_aux_affinity_initialize(void) {
 
   // Early exit if topology could not be created
   if (!__kmp_topology) {
-    if (KMP_AFFINITY_CAPABLE() &&
-        (__kmp_affinity_verbose ||
-         (__kmp_affinity_warnings && (__kmp_affinity_type != affinity_none)))) {
-      KMP_WARNING(ErrorInitializeAffinity);
+    if (KMP_AFFINITY_CAPABLE()) {
+      KMP_AFF_WARNING(ErrorInitializeAffinity);
     }
     if (nPackages > 0 && nCoresPerPkg > 0 && __kmp_nThreadsPerCore > 0 &&
         __kmp_ncores > 0) {
@@ -4283,6 +4267,13 @@ static void __kmp_aux_affinity_initialize(void) {
   if (__kmp_affinity_verbose)
     __kmp_topology->print("KMP_AFFINITY");
   bool filtered = __kmp_topology->filter_hw_subset();
+  if (filtered) {
+#if KMP_OS_WINDOWS
+    // Copy filtered full mask if topology has single processor group
+    if (__kmp_num_proc_groups <= 1)
+#endif
+      __kmp_affin_origMask->copy(__kmp_affin_fullMask);
+  }
   if (filtered && __kmp_affinity_verbose)
     __kmp_topology->print("KMP_HW_SUBSET");
   machine_hierarchy.init(__kmp_topology->get_num_hw_threads());
@@ -4321,10 +4312,7 @@ static void __kmp_aux_affinity_initialize(void) {
           __kmp_affinity_proclist, osId2Mask, maxIndex);
     }
     if (__kmp_affinity_num_masks == 0) {
-      if (__kmp_affinity_verbose ||
-          (__kmp_affinity_warnings && (__kmp_affinity_type != affinity_none))) {
-        KMP_WARNING(AffNoValidProcID);
-      }
+      KMP_AFF_WARNING(AffNoValidProcID);
       __kmp_affinity_type = affinity_none;
       __kmp_create_affinity_none_places();
       return;
@@ -4374,9 +4362,7 @@ static void __kmp_aux_affinity_initialize(void) {
 
   case affinity_balanced:
     if (depth <= 1) {
-      if (__kmp_affinity_verbose || __kmp_affinity_warnings) {
-        KMP_WARNING(AffBalancedNotAvail, "KMP_AFFINITY");
-      }
+      KMP_AFF_WARNING(AffBalancedNotAvail, "KMP_AFFINITY");
       __kmp_affinity_type = affinity_none;
       __kmp_create_affinity_none_places();
       return;
@@ -4393,9 +4379,7 @@ static void __kmp_aux_affinity_initialize(void) {
 
       int nproc = ncores * maxprocpercore;
       if ((nproc < 2) || (nproc < __kmp_avail_proc)) {
-        if (__kmp_affinity_verbose || __kmp_affinity_warnings) {
-          KMP_WARNING(AffBalancedNotAvail, "KMP_AFFINITY");
-        }
+        KMP_AFF_WARNING(AffBalancedNotAvail, "KMP_AFFINITY");
         __kmp_affinity_type = affinity_none;
         return;
       }
@@ -4506,6 +4490,10 @@ void __kmp_affinity_uninitialize(void) {
     KMP_CPU_FREE(__kmp_affin_fullMask);
     __kmp_affin_fullMask = NULL;
   }
+  if (__kmp_affin_origMask != NULL) {
+    KMP_CPU_FREE(__kmp_affin_origMask);
+    __kmp_affin_origMask = NULL;
+  }
   __kmp_affinity_num_masks = 0;
   __kmp_affinity_type = affinity_default;
   __kmp_affinity_num_places = 0;

+ 3 - 4
contrib/libs/cxxsupp/openmp/kmp_alloc.cpp

@@ -1254,7 +1254,6 @@ static void **mk_hbw_preferred_hugetlb;
 static void **mk_dax_kmem;
 static void **mk_dax_kmem_all;
 static void **mk_dax_kmem_preferred;
-// Preview of target memory support
 static void *(*kmp_target_alloc_host)(size_t size, int device);
 static void *(*kmp_target_alloc_shared)(size_t size, int device);
 static void *(*kmp_target_alloc_device)(size_t size, int device);
@@ -1269,7 +1268,7 @@ static bool __kmp_target_mem_available;
    MA == llvm_omp_target_shared_mem_alloc ||                                   \
    MA == llvm_omp_target_device_mem_alloc)
 
-#if KMP_OS_UNIX && KMP_DYNAMIC_LIB
+#if KMP_OS_UNIX && KMP_DYNAMIC_LIB && !KMP_OS_DARWIN
 static inline void chk_kind(void ***pkind) {
   KMP_DEBUG_ASSERT(pkind);
   if (*pkind) // symbol found
@@ -1280,7 +1279,7 @@ static inline void chk_kind(void ***pkind) {
 
 void __kmp_init_memkind() {
 // as of 2018-07-31 memkind does not support Windows*, exclude it for now
-#if KMP_OS_UNIX && KMP_DYNAMIC_LIB
+#if KMP_OS_UNIX && KMP_DYNAMIC_LIB && !KMP_OS_DARWIN
   // use of statically linked memkind is problematic, as it depends on libnuma
   kmp_mk_lib_name = "libmemkind.so";
   h_memkind = dlopen(kmp_mk_lib_name, RTLD_LAZY);
@@ -1364,7 +1363,7 @@ void __kmp_fini_memkind() {
   mk_dax_kmem_preferred = NULL;
 #endif
 }
-// Preview of target memory support
+
 void __kmp_init_target_mem() {
   *(void **)(&kmp_target_alloc_host) = KMP_DLSYM("llvm_omp_target_alloc_host");
   *(void **)(&kmp_target_alloc_shared) =

+ 4 - 0
contrib/libs/cxxsupp/openmp/kmp_atomic.cpp

@@ -2452,6 +2452,7 @@ ATOMIC_CMPXCHG_CPT(float8, mul_cpt, kmp_real64, 64, *,
                                RTYPE, LCK_ID, MASK, GOMP_FLAG)                 \
   ATOMIC_BEGIN_CPT_MIX(TYPE_ID, OP_ID, TYPE, RTYPE_ID, RTYPE)                  \
   TYPE new_value;                                                              \
+  (void)new_value;                                                             \
   OP_GOMP_CRITICAL_CPT(TYPE, OP, GOMP_FLAG)                                    \
   OP_CMPXCHG_CPT(TYPE, BITS, OP)                                               \
   }
@@ -2461,6 +2462,7 @@ ATOMIC_CMPXCHG_CPT(float8, mul_cpt, kmp_real64, 64, *,
                                 LCK_ID, GOMP_FLAG)                             \
   ATOMIC_BEGIN_CPT_MIX(TYPE_ID, OP_ID, TYPE, RTYPE_ID, RTYPE)                  \
   TYPE new_value;                                                              \
+  (void)new_value;                                                             \
   OP_GOMP_CRITICAL_CPT(TYPE, OP, GOMP_FLAG) /* send assignment */              \
   OP_UPDATE_CRITICAL_CPT(TYPE, OP, LCK_ID) /* send assignment */               \
   }
@@ -3162,6 +3164,7 @@ ATOMIC_CRITICAL_CPT_REV(cmplx16, div_a16_cpt_rev, kmp_cmplx128_a16_t, /, 32c,
                                    RTYPE, LCK_ID, MASK, GOMP_FLAG)             \
   ATOMIC_BEGIN_CPT_MIX(TYPE_ID, OP_ID, TYPE, RTYPE_ID, RTYPE)                  \
   TYPE new_value;                                                              \
+  (void)new_value;                                                             \
   OP_GOMP_CRITICAL_CPT_REV(TYPE, OP, GOMP_FLAG)                                \
   OP_CMPXCHG_CPT_REV(TYPE, BITS, OP)                                           \
   }
@@ -3171,6 +3174,7 @@ ATOMIC_CRITICAL_CPT_REV(cmplx16, div_a16_cpt_rev, kmp_cmplx128_a16_t, /, 32c,
                                     LCK_ID, GOMP_FLAG)                         \
   ATOMIC_BEGIN_CPT_MIX(TYPE_ID, OP_ID, TYPE, RTYPE_ID, RTYPE)                  \
   TYPE new_value;                                                              \
+  (void)new_value;                                                             \
   OP_GOMP_CRITICAL_CPT_REV(TYPE, OP, GOMP_FLAG) /* send assignment */          \
   OP_CRITICAL_CPT_REV(TYPE, OP, LCK_ID) /* send assignment */                  \
   }

+ 6 - 0
contrib/libs/cxxsupp/openmp/kmp_atomic.h

@@ -251,6 +251,9 @@ struct KMP_DO_ALIGN(4) kmp_cmplx128_a4_t {
 
   kmp_cmplx128_a4_t() : q() {}
 
+#if defined(__cplusplus) && (KMP_OS_WINDOWS)
+  kmp_cmplx128_a4_t(const std::complex<_Quad> &c128) : q(c128) {}
+#endif
   kmp_cmplx128_a4_t(const kmp_cmplx128 &c128) : q(c128) {}
 
   kmp_cmplx128_a4_t operator+(const kmp_cmplx128_a4_t &b) {
@@ -314,6 +317,9 @@ struct KMP_DO_ALIGN(16) kmp_cmplx128_a16_t {
 
   kmp_cmplx128_a16_t() : q() {}
 
+#if defined(__cplusplus) && (KMP_OS_WINDOWS)
+  kmp_cmplx128_a16_t(const std::complex<_Quad> &c128) : q(c128) {}
+#endif
   kmp_cmplx128_a16_t(const kmp_cmplx128 &c128) : q(c128) {}
 
   kmp_cmplx128_a16_t operator+(const kmp_cmplx128_a16_t &b) {

+ 5 - 4
contrib/libs/cxxsupp/openmp/kmp_barrier.cpp

@@ -2163,7 +2163,6 @@ void __kmp_join_barrier(int gtid) {
 
   kmp_info_t *this_thr = __kmp_threads[gtid];
   kmp_team_t *team;
-  kmp_uint nproc;
   int tid;
 #ifdef KMP_DEBUG
   int team_id;
@@ -2176,12 +2175,14 @@ void __kmp_join_barrier(int gtid) {
     itt_sync_obj = __kmp_itt_barrier_object(gtid, bs_forkjoin_barrier);
 #endif
 #endif /* USE_ITT_BUILD */
+#if ((USE_ITT_BUILD && USE_ITT_NOTIFY) || defined KMP_DEBUG)
+  int nproc = this_thr->th.th_team_nproc;
+#endif
   KMP_MB();
 
   // Get current info
   team = this_thr->th.th_team;
-  nproc = this_thr->th.th_team_nproc;
-  KMP_DEBUG_ASSERT((int)nproc == team->t.t_nproc);
+  KMP_DEBUG_ASSERT(nproc == team->t.t_nproc);
   tid = __kmp_tid_from_gtid(gtid);
 #ifdef KMP_DEBUG
   team_id = team->t.t_id;
@@ -2354,7 +2355,7 @@ void __kmp_join_barrier(int gtid) {
           // Set arrive time to zero to be able to check it in
           // __kmp_invoke_task(); the same is done inside the loop below
           this_thr->th.th_bar_arrive_time = 0;
-          for (kmp_uint i = 1; i < nproc; ++i) {
+          for (int i = 1; i < nproc; ++i) {
             delta += (cur_time - other_threads[i]->th.th_bar_arrive_time);
             other_threads[i]->th.th_bar_arrive_time = 0;
           }

+ 75 - 5
contrib/libs/cxxsupp/openmp/kmp_csupport.cpp

@@ -354,9 +354,9 @@ void __kmpc_push_num_teams(ident_t *loc, kmp_int32 global_tid,
 @ingroup PARALLEL
 @param loc source location information
 @param global_tid global thread number
-@param num_teams_lo lower bound on number of teams requested for the teams
+@param num_teams_lb lower bound on number of teams requested for the teams
 construct
-@param num_teams_up upper bound on number of teams requested for the teams
+@param num_teams_ub upper bound on number of teams requested for the teams
 construct
 @param num_threads number of threads per team requested for the teams construct
 
@@ -632,6 +632,11 @@ void __kmpc_end_serialized_parallel(ident_t *loc, kmp_int32 global_tid) {
                 "team %p\n",
                 global_tid, this_thr->th.th_task_team, this_thr->th.th_team));
     }
+#if KMP_AFFINITY_SUPPORTED
+    if (this_thr->th.th_team->t.t_level == 0 && __kmp_affin_reset) {
+      __kmp_reset_root_init_mask(global_tid);
+    }
+#endif
   } else {
     if (__kmp_tasking_mode != tskm_immediate_exec) {
       KA_TRACE(20, ("__kmpc_end_serialized_parallel: T#%d decreasing nesting "
@@ -685,13 +690,13 @@ void __kmpc_flush(ident_t *loc) {
   if (!__kmp_cpuinfo.flags.sse2) {
     // CPU cannot execute SSE2 instructions.
   } else {
-#if KMP_COMPILER_ICC
+#if KMP_COMPILER_ICC || KMP_COMPILER_ICX
     _mm_mfence();
 #elif KMP_COMPILER_MSVC
     MemoryBarrier();
 #else
     __sync_synchronize();
-#endif // KMP_COMPILER_ICC
+#endif // KMP_COMPILER_ICC || KMP_COMPILER_ICX
   }
 #endif // KMP_MIC
 #elif (KMP_ARCH_ARM || KMP_ARCH_AARCH64 || KMP_ARCH_MIPS || KMP_ARCH_MIPS64 || \
@@ -2021,6 +2026,11 @@ void KMP_EXPAND_NAME(ompc_display_affinity)(char const *format) {
   }
   __kmp_assign_root_init_mask();
   gtid = __kmp_get_gtid();
+#if KMP_AFFINITY_SUPPORTED
+  if (__kmp_threads[gtid]->th.th_team->t.t_level == 0 && __kmp_affin_reset) {
+    __kmp_reset_root_init_mask(gtid);
+  }
+#endif
   __kmp_aux_display_affinity(gtid, format);
 }
 
@@ -2034,6 +2044,11 @@ size_t KMP_EXPAND_NAME(ompc_capture_affinity)(char *buffer, size_t buf_size,
   }
   __kmp_assign_root_init_mask();
   gtid = __kmp_get_gtid();
+#if KMP_AFFINITY_SUPPORTED
+  if (__kmp_threads[gtid]->th.th_team->t.t_level == 0 && __kmp_affin_reset) {
+    __kmp_reset_root_init_mask(gtid);
+  }
+#endif
   __kmp_str_buf_init(&capture_buf);
   num_required = __kmp_aux_capture_affinity(gtid, format, &capture_buf);
   if (buffer && buf_size) {
@@ -2224,6 +2239,61 @@ void __kmpc_copyprivate(ident_t *loc, kmp_int32 gtid, size_t cpy_size,
   }
 }
 
+/* --------------------------------------------------------------------------*/
+/*!
+@ingroup THREADPRIVATE
+@param loc       source location information
+@param gtid      global thread number
+@param cpy_data  pointer to the data to be saved/copied or 0
+@return          the saved pointer to the data
+
+__kmpc_copyprivate_light is a lighter version of __kmpc_copyprivate:
+__kmpc_copyprivate_light only saves the pointer it's given (if it's not 0, so
+coming from single), and returns that pointer in all calls (for single thread
+it's not needed). This version doesn't do any actual data copying. Data copying
+has to be done somewhere else, e.g. inline in the generated code. Due to this,
+this function doesn't have any barrier at the end of the function, like
+__kmpc_copyprivate does, so generated code needs barrier after copying of all
+data was done.
+*/
+void *__kmpc_copyprivate_light(ident_t *loc, kmp_int32 gtid, void *cpy_data) {
+  void **data_ptr;
+
+  KC_TRACE(10, ("__kmpc_copyprivate_light: called T#%d\n", gtid));
+
+  KMP_MB();
+
+  data_ptr = &__kmp_team_from_gtid(gtid)->t.t_copypriv_data;
+
+  if (__kmp_env_consistency_check) {
+    if (loc == 0) {
+      KMP_WARNING(ConstructIdentInvalid);
+    }
+  }
+
+  // ToDo: Optimize the following barrier
+
+  if (cpy_data)
+    *data_ptr = cpy_data;
+
+#if OMPT_SUPPORT
+  ompt_frame_t *ompt_frame;
+  if (ompt_enabled.enabled) {
+    __ompt_get_task_info_internal(0, NULL, NULL, &ompt_frame, NULL, NULL);
+    if (ompt_frame->enter_frame.ptr == NULL)
+      ompt_frame->enter_frame.ptr = OMPT_GET_FRAME_ADDRESS(0);
+    OMPT_STORE_RETURN_ADDRESS(gtid);
+  }
+#endif
+/* This barrier is not a barrier region boundary */
+#if USE_ITT_NOTIFY
+  __kmp_threads[gtid]->th.th_ident = loc;
+#endif
+  __kmp_barrier(bs_plain_barrier, gtid, FALSE, 0, NULL, NULL);
+
+  return *data_ptr;
+}
+
 /* -------------------------------------------------------------------------- */
 
 #define INIT_LOCK __kmp_init_user_lock_with_checks
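
For orientation, here is a rough sketch of how a compiler might lower a single/copyprivate pair onto the new __kmpc_copyprivate_light entry point added above. The helper compute_value() and the exact sequence are illustrative only; real codegen differs, and the trailing barrier is the caller's responsibility because the routine only publishes the pointer.

// Hypothetical lowering of:
//   #pragma omp single copyprivate(v)
//   v = compute_value();
static void lowered_single_copyprivate(ident_t *loc, kmp_int32 gtid, int *v) {
  void *src = NULL;
  if (__kmpc_single(loc, gtid)) {
    *v = compute_value();            // single body (compute_value is made up)
    src = v;                         // only the executing thread passes data
    __kmpc_end_single(loc, gtid);
  }
  // Every thread gets back the pointer saved by the single thread.
  int *shared = (int *)__kmpc_copyprivate_light(loc, gtid, src);
  *v = *shared;                      // inline copy done by the generated code
  __kmpc_barrier(loc, gtid);         // required: the copy above is unsynchronized
}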
@@ -4348,7 +4418,7 @@ void *omp_aligned_calloc(size_t align, size_t nmemb, size_t size,
 void *omp_realloc(void *ptr, size_t size, omp_allocator_handle_t allocator,
                   omp_allocator_handle_t free_allocator) {
   return __kmp_realloc(__kmp_entry_gtid(), ptr, size, allocator,
-                        free_allocator);
+                       free_allocator);
 }
 
 void omp_free(void *ptr, omp_allocator_handle_t allocator) {

+ 228 - 0
contrib/libs/cxxsupp/openmp/kmp_dispatch.cpp

@@ -1964,9 +1964,22 @@ int __kmp_dispatch_next_algorithm(int gtid,
           &(task_info->task_data), 0, codeptr);                                \
     }                                                                          \
   }
+#define OMPT_LOOP_DISPATCH(lb, ub, st, status)                                 \
+  if (ompt_enabled.ompt_callback_dispatch && status) {                         \
+    ompt_team_info_t *team_info = __ompt_get_teaminfo(0, NULL);                \
+    ompt_task_info_t *task_info = __ompt_get_task_info_object(0);              \
+    ompt_dispatch_chunk_t chunk;                                               \
+    ompt_data_t instance = ompt_data_none;                                     \
+    OMPT_GET_DISPATCH_CHUNK(chunk, lb, ub, st);                                \
+    instance.ptr = &chunk;                                                     \
+    ompt_callbacks.ompt_callback(ompt_callback_dispatch)(                      \
+        &(team_info->parallel_data), &(task_info->task_data),                  \
+        ompt_dispatch_ws_loop_chunk, instance);                                \
+  }
 // TODO: implement count
 #else
 #define OMPT_LOOP_END // no-op
+#define OMPT_LOOP_DISPATCH(lb, ub, st, status) // no-op
 #endif
 
 #if KMP_STATS_ENABLED
@@ -2142,6 +2155,7 @@ static int __kmp_dispatch_next(ident_t *loc, int gtid, kmp_int32 *p_last,
 #if INCLUDE_SSC_MARKS
     SSC_MARK_DISPATCH_NEXT();
 #endif
+    OMPT_LOOP_DISPATCH(*p_lb, *p_ub, pr->u.p.st, status);
     OMPT_LOOP_END;
     KMP_STATS_LOOP_END;
     return status;
@@ -2265,11 +2279,225 @@ static int __kmp_dispatch_next(ident_t *loc, int gtid, kmp_int32 *p_last,
 #if INCLUDE_SSC_MARKS
   SSC_MARK_DISPATCH_NEXT();
 #endif
+  OMPT_LOOP_DISPATCH(*p_lb, *p_ub, pr->u.p.st, status);
   OMPT_LOOP_END;
   KMP_STATS_LOOP_END;
   return status;
 }
 
+/*!
+@ingroup WORK_SHARING
+@param loc  source location information
+@param global_tid  global thread number
+@return Zero if the parallel region is not active and this thread should execute
+all sections, non-zero otherwise.
+
+Beginning of sections construct.
+There are no implicit barriers in the "sections" calls, rather the compiler
+should introduce an explicit barrier if it is required.
+
+This implementation is based on __kmp_dispatch_init, using same constructs for
+shared data (we can't have sections nested directly in omp for loop, there
+should be a parallel region in between)
+*/
+kmp_int32 __kmpc_sections_init(ident_t *loc, kmp_int32 gtid) {
+
+  int active;
+  kmp_info_t *th;
+  kmp_team_t *team;
+  kmp_uint32 my_buffer_index;
+  dispatch_shared_info_template<kmp_int32> volatile *sh;
+
+  KMP_DEBUG_ASSERT(__kmp_init_serial);
+
+  if (!TCR_4(__kmp_init_parallel))
+    __kmp_parallel_initialize();
+  __kmp_resume_if_soft_paused();
+
+  /* setup data */
+  th = __kmp_threads[gtid];
+  team = th->th.th_team;
+  active = !team->t.t_serialized;
+  th->th.th_ident = loc;
+
+  KMP_COUNT_BLOCK(OMP_SECTIONS);
+  KD_TRACE(10, ("__kmpc_sections: called by T#%d\n", gtid));
+
+  if (active) {
+    // Setup sections in the same way as dynamic scheduled loops.
+    // We need one shared data: which section is to execute next.
+    // (in case parallel is not active, all sections will be executed on the
+    // same thread)
+    KMP_DEBUG_ASSERT(th->th.th_dispatch ==
+                     &th->th.th_team->t.t_dispatch[th->th.th_info.ds.ds_tid]);
+
+    my_buffer_index = th->th.th_dispatch->th_disp_index++;
+
+    // reuse shared data structures from dynamic sched loops:
+    sh = reinterpret_cast<dispatch_shared_info_template<kmp_int32> volatile *>(
+        &team->t.t_disp_buffer[my_buffer_index % __kmp_dispatch_num_buffers]);
+    KD_TRACE(10, ("__kmpc_sections_init: T#%d my_buffer_index:%d\n", gtid,
+                  my_buffer_index));
+
+    th->th.th_dispatch->th_deo_fcn = __kmp_dispatch_deo_error;
+    th->th.th_dispatch->th_dxo_fcn = __kmp_dispatch_dxo_error;
+
+    KD_TRACE(100, ("__kmpc_sections_init: T#%d before wait: my_buffer_index:%d "
+                   "sh->buffer_index:%d\n",
+                   gtid, my_buffer_index, sh->buffer_index));
+    __kmp_wait<kmp_uint32>(&sh->buffer_index, my_buffer_index,
+                           __kmp_eq<kmp_uint32> USE_ITT_BUILD_ARG(NULL));
+    // Note: KMP_WAIT() cannot be used there: buffer index and
+    // my_buffer_index are *always* 32-bit integers.
+    KMP_MB();
+    KD_TRACE(100, ("__kmpc_sections_init: T#%d after wait: my_buffer_index:%d "
+                   "sh->buffer_index:%d\n",
+                   gtid, my_buffer_index, sh->buffer_index));
+
+    th->th.th_dispatch->th_dispatch_pr_current =
+        nullptr; // sections construct doesn't need private data
+    th->th.th_dispatch->th_dispatch_sh_current =
+        CCAST(dispatch_shared_info_t *, (volatile dispatch_shared_info_t *)sh);
+  }
+
+#if OMPT_SUPPORT && OMPT_OPTIONAL
+  if (ompt_enabled.ompt_callback_work) {
+    ompt_team_info_t *team_info = __ompt_get_teaminfo(0, NULL);
+    ompt_task_info_t *task_info = __ompt_get_task_info_object(0);
+    ompt_callbacks.ompt_callback(ompt_callback_work)(
+        ompt_work_sections, ompt_scope_begin, &(team_info->parallel_data),
+        &(task_info->task_data), 0, OMPT_GET_RETURN_ADDRESS(0));
+  }
+#endif
+  KMP_PUSH_PARTITIONED_TIMER(OMP_sections);
+
+  return active;
+}
+
+/*!
+@ingroup WORK_SHARING
+@param loc  source location information
+@param global_tid  global thread number
+@param numberOfSections  number of sections in the 'sections' construct
+@return unsigned [from 0 to n) - number (id) of the section to execute next on
+this thread. n (or any other number not in range) - nothing to execute on this
+thread
+*/
+
+kmp_int32 __kmpc_next_section(ident_t *loc, kmp_int32 gtid,
+                              kmp_int32 numberOfSections) {
+
+  KMP_TIME_PARTITIONED_BLOCK(OMP_sections);
+
+  kmp_info_t *th = __kmp_threads[gtid];
+#ifdef KMP_DEBUG
+  kmp_team_t *team = th->th.th_team;
+#endif
+
+  KD_TRACE(1000, ("__kmp_dispatch_next: T#%d; number of sections:%d\n", gtid,
+                  numberOfSections));
+
+  // For serialized case we should not call this function:
+  KMP_DEBUG_ASSERT(!team->t.t_serialized);
+
+  dispatch_shared_info_template<kmp_int32> volatile *sh;
+
+  KMP_DEBUG_ASSERT(th->th.th_dispatch ==
+                   &th->th.th_team->t.t_dispatch[th->th.th_info.ds.ds_tid]);
+
+  KMP_DEBUG_ASSERT(!(th->th.th_dispatch->th_dispatch_pr_current));
+  sh = reinterpret_cast<dispatch_shared_info_template<kmp_int32> volatile *>(
+      th->th.th_dispatch->th_dispatch_sh_current);
+  KMP_DEBUG_ASSERT(sh);
+
+  kmp_int32 sectionIndex = 0;
+  bool moreSectionsToExecute = true;
+
+  // Find section to execute:
+  sectionIndex = test_then_inc<kmp_int32>((kmp_int32 *)&sh->u.s.iteration);
+  if (sectionIndex >= numberOfSections) {
+    moreSectionsToExecute = false;
+  }
+
+  // status == 0: no more sections to execute;
+  // OMPTODO: __kmpc_end_sections could be bypassed?
+  if (!moreSectionsToExecute) {
+    kmp_int32 num_done;
+
+    num_done = test_then_inc<kmp_int32>((kmp_int32 *)(&sh->u.s.num_done));
+
+    if (num_done == th->th.th_team_nproc - 1) {
+      /* NOTE: release this buffer to be reused */
+
+      KMP_MB(); /* Flush all pending memory write invalidates.  */
+
+      sh->u.s.num_done = 0;
+      sh->u.s.iteration = 0;
+
+      KMP_MB(); /* Flush all pending memory write invalidates.  */
+
+      sh->buffer_index += __kmp_dispatch_num_buffers;
+      KD_TRACE(100, ("__kmpc_next_section: T#%d change buffer_index:%d\n", gtid,
+                     sh->buffer_index));
+
+      KMP_MB(); /* Flush all pending memory write invalidates.  */
+
+    } // if
+
+    th->th.th_dispatch->th_deo_fcn = NULL;
+    th->th.th_dispatch->th_dxo_fcn = NULL;
+    th->th.th_dispatch->th_dispatch_sh_current = NULL;
+    th->th.th_dispatch->th_dispatch_pr_current = NULL;
+
+#if OMPT_SUPPORT && OMPT_OPTIONAL
+    if (ompt_enabled.ompt_callback_dispatch) {
+      ompt_team_info_t *team_info = __ompt_get_teaminfo(0, NULL);
+      ompt_task_info_t *task_info = __ompt_get_task_info_object(0);
+      ompt_data_t instance = ompt_data_none;
+      instance.ptr = OMPT_GET_RETURN_ADDRESS(0);
+      ompt_callbacks.ompt_callback(ompt_callback_dispatch)(
+          &(team_info->parallel_data), &(task_info->task_data),
+          ompt_dispatch_section, instance);
+    }
+#endif
+    KMP_POP_PARTITIONED_TIMER();
+  }
+
+  return sectionIndex;
+}
+
+/*!
+@ingroup WORK_SHARING
+@param loc  source location information
+@param global_tid  global thread number
+
+End of "sections" construct.
+Don't need to wait here: barrier is added separately when needed.
+*/
+void __kmpc_end_sections(ident_t *loc, kmp_int32 gtid) {
+
+  kmp_info_t *th = __kmp_threads[gtid];
+  int active = !th->th.th_team->t.t_serialized;
+
+  KD_TRACE(100, ("__kmpc_end_sections: T#%d called\n", gtid));
+
+  if (!active) {
+    // In active case call finalization is done in __kmpc_next_section
+#if OMPT_SUPPORT && OMPT_OPTIONAL
+    if (ompt_enabled.ompt_callback_work) {
+      ompt_team_info_t *team_info = __ompt_get_teaminfo(0, NULL);
+      ompt_task_info_t *task_info = __ompt_get_task_info_object(0);
+      ompt_callbacks.ompt_callback(ompt_callback_work)(
+          ompt_work_sections, ompt_scope_end, &(team_info->parallel_data),
+          &(task_info->task_data), 0, OMPT_GET_RETURN_ADDRESS(0));
+    }
+#endif
+    KMP_POP_PARTITIONED_TIMER();
+  }
+
+  KD_TRACE(100, ("__kmpc_end_sections: T#%d returned\n", gtid));
+}
+
 template <typename T>
 static void __kmp_dist_get_bounds(ident_t *loc, kmp_int32 gtid,
                                   kmp_int32 *plastiter, T *plower, T *pupper,
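
Taken together, the three entry points above give the compiler what it needs for #pragma omp sections. A hedged sketch of the expected lowering for a two-section construct (A() and B() are placeholder section bodies; actual codegen varies):

static void lowered_sections(ident_t *loc, kmp_int32 gtid) {
  if (__kmpc_sections_init(loc, gtid)) {
    // Parallel region active: repeatedly claim the next unexecuted section.
    kmp_int32 id;
    while ((id = __kmpc_next_section(loc, gtid, 2)) < 2) { // < 2: a section was claimed
      if (id == 0)
        A();                         // body of the first section
      else
        B();                         // body of the second section
    }
  } else {
    A();                             // serialized: this thread runs every section
    B();
  }
  __kmpc_end_sections(loc, gtid);
  __kmpc_barrier(loc, gtid);         // unless the construct had nowait
}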

+ 71 - 8
contrib/libs/cxxsupp/openmp/kmp_ftn_entry.h

@@ -238,6 +238,10 @@ int FTN_STDCALL FTN_GET_AFFINITY(void **mask) {
     __kmp_middle_initialize();
   }
   __kmp_assign_root_init_mask();
+  int gtid = __kmp_get_gtid();
+  if (__kmp_threads[gtid]->th.th_team->t.t_level == 0 && __kmp_affin_reset) {
+    __kmp_reset_root_init_mask(gtid);
+  }
   return __kmp_aux_get_affinity(mask);
 #endif
 }
@@ -358,9 +362,13 @@ int FTN_STDCALL KMP_EXPAND_NAME(FTN_GET_MAX_THREADS)(void) {
   if (!TCR_4(__kmp_init_middle)) {
     __kmp_middle_initialize();
   }
-  __kmp_assign_root_init_mask();
   gtid = __kmp_entry_gtid();
   thread = __kmp_threads[gtid];
+#if KMP_AFFINITY_SUPPORTED
+  if (thread->th.th_team->t.t_level == 0 && !__kmp_affin_reset) {
+    __kmp_assign_root_init_mask();
+  }
+#endif
   // return thread -> th.th_team -> t.t_current_task[
   // thread->th.th_info.ds.ds_tid ] -> icvs.nproc;
   return thread->th.th_current_task->td_icvs.nproc;
@@ -509,6 +517,11 @@ void FTN_STDCALL KMP_EXPAND_NAME_IF_APPEND(FTN_DISPLAY_AFFINITY)(
   }
   __kmp_assign_root_init_mask();
   gtid = __kmp_get_gtid();
+#if KMP_AFFINITY_SUPPORTED
+  if (__kmp_threads[gtid]->th.th_team->t.t_level == 0 && __kmp_affin_reset) {
+    __kmp_reset_root_init_mask(gtid);
+  }
+#endif
   ConvertedString cformat(format, size);
   __kmp_aux_display_affinity(gtid, cformat.get());
 #endif
@@ -537,6 +550,11 @@ size_t FTN_STDCALL KMP_EXPAND_NAME_IF_APPEND(FTN_CAPTURE_AFFINITY)(
   }
   __kmp_assign_root_init_mask();
   gtid = __kmp_get_gtid();
+#if KMP_AFFINITY_SUPPORTED
+  if (__kmp_threads[gtid]->th.th_team->t.t_level == 0 && __kmp_affin_reset) {
+    __kmp_reset_root_init_mask(gtid);
+  }
+#endif
   __kmp_str_buf_init(&capture_buf);
   ConvertedString cformat(format, for_size);
   num_required = __kmp_aux_capture_affinity(gtid, cformat.get(), &capture_buf);
@@ -612,7 +630,16 @@ int FTN_STDCALL KMP_EXPAND_NAME(FTN_GET_NUM_PROCS)(void) {
   if (!TCR_4(__kmp_init_middle)) {
     __kmp_middle_initialize();
   }
-  __kmp_assign_root_init_mask();
+#if KMP_AFFINITY_SUPPORTED
+  if (!__kmp_affin_reset) {
+    // only bind root here if its affinity reset is not requested
+    int gtid = __kmp_entry_gtid();
+    kmp_info_t *thread = __kmp_threads[gtid];
+    if (thread->th.th_team->t.t_level == 0) {
+      __kmp_assign_root_init_mask();
+    }
+  }
+#endif
   return __kmp_avail_proc;
 #endif
 }
@@ -802,9 +829,16 @@ int FTN_STDCALL KMP_EXPAND_NAME(FTN_GET_NUM_PLACES)(void) {
   if (!TCR_4(__kmp_init_middle)) {
     __kmp_middle_initialize();
   }
-  __kmp_assign_root_init_mask();
   if (!KMP_AFFINITY_CAPABLE())
     return 0;
+  if (!__kmp_affin_reset) {
+    // only bind root here if its affinity reset is not requested
+    int gtid = __kmp_entry_gtid();
+    kmp_info_t *thread = __kmp_threads[gtid];
+    if (thread->th.th_team->t.t_level == 0) {
+      __kmp_assign_root_init_mask();
+    }
+  }
   return __kmp_affinity_num_masks;
 #endif
 }
@@ -818,9 +852,16 @@ int FTN_STDCALL KMP_EXPAND_NAME(FTN_GET_PLACE_NUM_PROCS)(int place_num) {
   if (!TCR_4(__kmp_init_middle)) {
     __kmp_middle_initialize();
   }
-  __kmp_assign_root_init_mask();
   if (!KMP_AFFINITY_CAPABLE())
     return 0;
+  if (!__kmp_affin_reset) {
+    // only bind root here if its affinity reset is not requested
+    int gtid = __kmp_entry_gtid();
+    kmp_info_t *thread = __kmp_threads[gtid];
+    if (thread->th.th_team->t.t_level == 0) {
+      __kmp_assign_root_init_mask();
+    }
+  }
   if (place_num < 0 || place_num >= (int)__kmp_affinity_num_masks)
     return 0;
   kmp_affin_mask_t *mask = KMP_CPU_INDEX(__kmp_affinity_masks, place_num);
@@ -844,9 +885,16 @@ void FTN_STDCALL KMP_EXPAND_NAME(FTN_GET_PLACE_PROC_IDS)(int place_num,
   if (!TCR_4(__kmp_init_middle)) {
     __kmp_middle_initialize();
   }
-  __kmp_assign_root_init_mask();
   if (!KMP_AFFINITY_CAPABLE())
     return;
+  if (!__kmp_affin_reset) {
+    // only bind root here if its affinity reset is not requested
+    int gtid = __kmp_entry_gtid();
+    kmp_info_t *thread = __kmp_threads[gtid];
+    if (thread->th.th_team->t.t_level == 0) {
+      __kmp_assign_root_init_mask();
+    }
+  }
   if (place_num < 0 || place_num >= (int)__kmp_affinity_num_masks)
     return;
   kmp_affin_mask_t *mask = KMP_CPU_INDEX(__kmp_affinity_masks, place_num);
@@ -870,11 +918,13 @@ int FTN_STDCALL KMP_EXPAND_NAME(FTN_GET_PLACE_NUM)(void) {
   if (!TCR_4(__kmp_init_middle)) {
     __kmp_middle_initialize();
   }
-  __kmp_assign_root_init_mask();
   if (!KMP_AFFINITY_CAPABLE())
     return -1;
   gtid = __kmp_entry_gtid();
   thread = __kmp_thread_from_gtid(gtid);
+  if (thread->th.th_team->t.t_level == 0 && !__kmp_affin_reset) {
+    __kmp_assign_root_init_mask();
+  }
   if (thread->th.th_current_place < 0)
     return -1;
   return thread->th.th_current_place;
@@ -890,11 +940,13 @@ int FTN_STDCALL KMP_EXPAND_NAME(FTN_GET_PARTITION_NUM_PLACES)(void) {
   if (!TCR_4(__kmp_init_middle)) {
     __kmp_middle_initialize();
   }
-  __kmp_assign_root_init_mask();
   if (!KMP_AFFINITY_CAPABLE())
     return 0;
   gtid = __kmp_entry_gtid();
   thread = __kmp_thread_from_gtid(gtid);
+  if (thread->th.th_team->t.t_level == 0 && !__kmp_affin_reset) {
+    __kmp_assign_root_init_mask();
+  }
   first_place = thread->th.th_first_place;
   last_place = thread->th.th_last_place;
   if (first_place < 0 || last_place < 0)
@@ -917,11 +969,13 @@ KMP_EXPAND_NAME(FTN_GET_PARTITION_PLACE_NUMS)(int *place_nums) {
   if (!TCR_4(__kmp_init_middle)) {
     __kmp_middle_initialize();
   }
-  __kmp_assign_root_init_mask();
   if (!KMP_AFFINITY_CAPABLE())
     return;
   gtid = __kmp_entry_gtid();
   thread = __kmp_thread_from_gtid(gtid);
+  if (thread->th.th_team->t.t_level == 0 && !__kmp_affin_reset) {
+    __kmp_assign_root_init_mask();
+  }
   first_place = thread->th.th_first_place;
   last_place = thread->th.th_last_place;
   if (first_place < 0 || last_place < 0)
@@ -1567,6 +1621,15 @@ void FTN_STDCALL FTN_DISPLAY_ENV(int verbose) {
 #endif
 }
 
+int FTN_STDCALL FTN_IN_EXPLICIT_TASK(void) {
+#ifdef KMP_STUB
+  return 0;
+#else
+  int gtid = __kmp_entry_gtid();
+  return __kmp_thread_from_gtid(gtid)->th.th_current_task->td_flags.tasktype;
+#endif
+}
+
 // GCC compatibility (versioned symbols)
 #ifdef KMP_USE_VERSION_SYMBOLS
 

+ 4 - 0
contrib/libs/cxxsupp/openmp/kmp_ftn_os.h

@@ -134,6 +134,7 @@
 #define FTN_PAUSE_RESOURCE_ALL omp_pause_resource_all
 #define FTN_GET_SUPPORTED_ACTIVE_LEVELS omp_get_supported_active_levels
 #define FTN_DISPLAY_ENV omp_display_env
+#define FTN_IN_EXPLICIT_TASK omp_in_explicit_task
 #define FTN_FULFILL_EVENT omp_fulfill_event
 #define FTN_SET_NUM_TEAMS omp_set_num_teams
 #define FTN_GET_MAX_TEAMS omp_get_max_teams
@@ -270,6 +271,7 @@
 #define FTN_PAUSE_RESOURCE_ALL omp_pause_resource_all_
 #define FTN_GET_SUPPORTED_ACTIVE_LEVELS omp_get_supported_active_levels_
 #define FTN_DISPLAY_ENV omp_display_env_
+#define FTN_IN_EXPLICIT_TASK omp_in_explicit_task_
 #define FTN_FULFILL_EVENT omp_fulfill_event_
 #define FTN_SET_NUM_TEAMS omp_set_num_teams_
 #define FTN_GET_MAX_TEAMS omp_get_max_teams_
@@ -404,6 +406,7 @@
 #define FTN_PAUSE_RESOURCE_ALL OMP_PAUSE_RESOURCE_ALL
 #define FTN_GET_SUPPORTED_ACTIVE_LEVELS OMP_GET_SUPPORTED_ACTIVE_LEVELS
 #define FTN_DISPLAY_ENV OMP_DISPLAY_ENV
+#define FTN_IN_EXPLICIT_TASK OMP_IN_EXPLICIT_TASK
 #define FTN_FULFILL_EVENT OMP_FULFILL_EVENT
 #define FTN_SET_NUM_TEAMS OMP_SET_NUM_TEAMS
 #define FTN_GET_MAX_TEAMS OMP_GET_MAX_TEAMS
@@ -540,6 +543,7 @@
 #define FTN_PAUSE_RESOURCE_ALL OMP_PAUSE_RESOURCE_ALL_
 #define FTN_GET_SUPPORTED_ACTIVE_LEVELS OMP_GET_SUPPORTED_ACTIVE_LEVELS_
 #define FTN_DISPLAY_ENV OMP_DISPLAY_ENV_
+#define FTN_IN_EXPLICIT_TASK OMP_IN_EXPLICIT_TASK_
 #define FTN_FULFILL_EVENT OMP_FULFILL_EVENT_
 #define FTN_SET_NUM_TEAMS OMP_SET_NUM_TEAMS_
 #define FTN_GET_MAX_TEAMS OMP_GET_MAX_TEAMS_
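
The FTN_IN_EXPLICIT_TASK plumbing added in kmp_ftn_entry.h and kmp_ftn_os.h above backs the OpenMP 5.2 routine omp_in_explicit_task(), which reports whether the caller is running inside an explicit task. A small usage sketch (the prototype is spelled out directly in case the installed omp.h predates the routine):

#include <stdio.h>

extern int omp_in_explicit_task(void);   // provided by the runtime

int main(void) {
#pragma omp parallel num_threads(2)
#pragma omp single
  {
    printf("implicit task: %d\n", omp_in_explicit_task());     // prints 0
#pragma omp task
    { printf("explicit task: %d\n", omp_in_explicit_task()); } // prints 1
  }
  return 0;
}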

Some files were not shown because too many files changed in this diff