From: "Zhang, Jun" <jun.zh...@intel.com>

By test, we find in hybrid platform spincount 1 is better.

Use '-march=native -Ofast -funroll-loops -flto',
results as follows:

spec2017 speed   RPL     ADL
657.xz_s         0.00%   0.50%
603.bwaves_s     10.90%  26.20%
607.cactuBSSN_s  5.50%   72.50%
619.lbm_s        2.40%   2.50%
621.wrf_s        -7.70%  2.40%
627.cam4_s       0.50%   0.70%
628.pop2_s       48.20%  153.00%
638.imagick_s    -0.10%  0.20%
644.nab_s        2.30%   1.40%
649.fotonik3d_s  8.00%   13.80%
654.roms_s       1.20%   1.10%
Geomean-int      0.00%   0.50%
Geomean-fp       6.30%   21.10%
Geomean-all      5.70%   19.10%

omp2012          RPL     ADL
350.md           -1.81%  -1.75%
351.bwaves       7.72%   12.50%
352.nab          14.63%  19.71%
357.bt331        -0.20%  1.77%
358.botsalgn     0.00%   0.00%
359.botsspar     0.00%   0.65%
360.ilbdc        0.00%   0.25%
362.fma3d        2.66%   -0.51%
363.swim         10.44%  0.00%
367.imagick      0.00%   0.12%
370.mgrid331     2.49%   25.56%
371.applu331     1.06%   4.22%
372.smithwa      0.74%   3.34%
376.kdtree       10.67%  16.03%
GEOMEAN          3.34%   5.53%

include/ChangeLog:

        * omphook.h: define RUNOMPHOOK macro.

libgomp/ChangeLog:

        * env.c (initialize_env): add RUNOMPHOOK macro.
        * config/linux/x86/omphook.h: define RUNOMPHOOK macro.
---
 include/omphook.h                  |  1 +
 libgomp/config/linux/x86/omphook.h | 19 +++++++++++++++++++
 libgomp/env.c                      |  3 +++
 3 files changed, 23 insertions(+)
 create mode 100644 include/omphook.h
 create mode 100644 libgomp/config/linux/x86/omphook.h

diff --git a/include/omphook.h b/include/omphook.h
new file mode 100644
index 00000000000..2ebe3ad57e6
--- /dev/null
+++ b/include/omphook.h
@@ -0,0 +1 @@
+#define RUNOMPHOOK()
diff --git a/libgomp/config/linux/x86/omphook.h 
b/libgomp/config/linux/x86/omphook.h
new file mode 100644
index 00000000000..aefb311cc07
--- /dev/null
+++ b/libgomp/config/linux/x86/omphook.h
@@ -0,0 +1,19 @@
+#ifdef __x86_64__
+#include "cpuid.h"
+
+/* only for x86 hybrid platform */
+#define RUNOMPHOOK()  \
+  do \
+    { \
+      unsigned int eax, ebx, ecx, edx; \
+      if ((getenv ("GOMP_SPINCOUNT") == NULL) && (wait_policy < 0) \
+         && __get_cpuid_count (7, 0, &eax, &ebx, &ecx, &edx) \
+         && ((edx >> 15) & 1)) \
+       gomp_spin_count_var = 1LL; \
+      if (gomp_throttled_spin_count_var > gomp_spin_count_var) \
+       gomp_throttled_spin_count_var = gomp_spin_count_var; \
+    } \
+  while (0)
+#else
+# include "../../../../include/omphook.h"
+#endif
diff --git a/libgomp/env.c b/libgomp/env.c
index a21adb3fd4b..1f13a148694 100644
--- a/libgomp/env.c
+++ b/libgomp/env.c
@@ -61,6 +61,7 @@
 
 #include "secure_getenv.h"
 #include "environ.h"
+#include "omphook.h"
 
 /* Default values of ICVs according to the OpenMP standard,
    except for default-device-var.  */
@@ -2496,5 +2497,7 @@ initialize_env (void)
   goacc_runtime_initialize ();
 
   goacc_profiling_initialize ();
+
+  RUNOMPHOOK ();
 }
 #endif /* LIBGOMP_OFFLOADED_ONLY */
-- 
2.31.1

Reply via email to