!8 Backport some SPR patches to GCC-12
From: @github-27907959 Reviewed-by: @li-yancheng, @eastb233 Signed-off-by: @eastb233
This commit is contained in:
commit
e586fcabde
77
0002-i386-Add-syscall-to-enable-AMX-for-latest-kernels.patch
Normal file
77
0002-i386-Add-syscall-to-enable-AMX-for-latest-kernels.patch
Normal file
@ -0,0 +1,77 @@
|
|||||||
|
From 5e377d21f1f345d8b157b9bc306e02bb9bd45e01 Mon Sep 17 00:00:00 2001
|
||||||
|
From: Haochen Jiang <haochen.jiang@intel.com>
|
||||||
|
Date: Thu, 16 Jun 2022 00:15:53 -0700
|
||||||
|
Subject: [PATCH] i386: Add syscall to enable AMX for latest kernels
|
||||||
|
|
||||||
|
gcc/testsuite/ChangeLog:
|
||||||
|
|
||||||
|
* gcc.target/i386/amx-check.h (request_perm_xtile_data):
|
||||||
|
New function to check if AMX is usable and enable AMX.
|
||||||
|
(main): Run test if AMX is usable.
|
||||||
|
---
|
||||||
|
gcc/testsuite/gcc.target/i386/amx-check.h | 30 +++++++++++++++++++++++
|
||||||
|
1 file changed, 30 insertions(+)
|
||||||
|
|
||||||
|
diff --git a/gcc/testsuite/gcc.target/i386/amx-check.h b/gcc/testsuite/gcc.target/i386/amx-check.h
|
||||||
|
index 434b0e59703..6fff5ff4631 100644
|
||||||
|
--- a/gcc/testsuite/gcc.target/i386/amx-check.h
|
||||||
|
+++ b/gcc/testsuite/gcc.target/i386/amx-check.h
|
||||||
|
@@ -4,11 +4,24 @@
|
||||||
|
#include <stdlib.h>
|
||||||
|
#include <string.h>
|
||||||
|
#include <stdint.h>
|
||||||
|
+#include <unistd.h>
|
||||||
|
+#ifdef __linux__
|
||||||
|
+#include <sys/syscall.h>
|
||||||
|
+#endif
|
||||||
|
#ifdef DEBUG
|
||||||
|
#include <stdio.h>
|
||||||
|
#endif
|
||||||
|
#include "cpuid.h"
|
||||||
|
|
||||||
|
+#define XFEATURE_XTILECFG 17
|
||||||
|
+#define XFEATURE_XTILEDATA 18
|
||||||
|
+#define XFEATURE_MASK_XTILECFG (1 << XFEATURE_XTILECFG)
|
||||||
|
+#define XFEATURE_MASK_XTILEDATA (1 << XFEATURE_XTILEDATA)
|
||||||
|
+#define XFEATURE_MASK_XTILE (XFEATURE_MASK_XTILECFG | XFEATURE_MASK_XTILEDATA)
|
||||||
|
+
|
||||||
|
+#define ARCH_GET_XCOMP_PERM 0x1022
|
||||||
|
+#define ARCH_REQ_XCOMP_PERM 0x1023
|
||||||
|
+
|
||||||
|
/* TODO: The tmm emulation is temporary for current
|
||||||
|
AMX implementation with no tmm regclass, should
|
||||||
|
be changed in the future. */
|
||||||
|
@@ -44,6 +57,20 @@ typedef struct __tile
|
||||||
|
/* Stride (colum width in byte) used for tileload/store */
|
||||||
|
#define _STRIDE 64
|
||||||
|
|
||||||
|
+#ifdef __linux__
|
||||||
|
+/* We need syscall to use amx functions */
|
||||||
|
+int request_perm_xtile_data()
|
||||||
|
+{
|
||||||
|
+ unsigned long bitmask;
|
||||||
|
+
|
||||||
|
+ if (syscall (SYS_arch_prctl, ARCH_REQ_XCOMP_PERM, XFEATURE_XTILEDATA) ||
|
||||||
|
+ syscall (SYS_arch_prctl, ARCH_GET_XCOMP_PERM, &bitmask))
|
||||||
|
+ return 0;
|
||||||
|
+
|
||||||
|
+ return (bitmask & XFEATURE_MASK_XTILE) != 0;
|
||||||
|
+}
|
||||||
|
+#endif
|
||||||
|
+
|
||||||
|
/* Initialize tile config by setting all tmm size to 16x64 */
|
||||||
|
void init_tile_config (__tilecfg_u *dst)
|
||||||
|
{
|
||||||
|
@@ -185,6 +212,9 @@ main ()
|
||||||
|
#endif
|
||||||
|
#ifdef AMX_BF16
|
||||||
|
&& __builtin_cpu_supports ("amx-bf16")
|
||||||
|
+#endif
|
||||||
|
+#ifdef __linux__
|
||||||
|
+ && request_perm_xtile_data ()
|
||||||
|
#endif
|
||||||
|
)
|
||||||
|
{
|
||||||
|
--
|
||||||
|
2.18.2
|
||||||
|
|
||||||
@ -0,0 +1,83 @@
|
|||||||
|
From 11c72f20d4d7ba1862a257cef05dc3a5e84a276d Mon Sep 17 00:00:00 2001
|
||||||
|
From: "Cui,Lili" <lili.cui@intel.com>
|
||||||
|
Date: Thu, 29 Sep 2022 14:28:06 +0800
|
||||||
|
Subject: [PATCH] Remove AVX512_VP2INTERSECT from PTA_SAPPHIRERAPIDS
|
||||||
|
|
||||||
|
gcc/ChangeLog:
|
||||||
|
|
||||||
|
* config/i386/driver-i386.cc (host_detect_local_cpu):
|
||||||
|
Move sapphirerapids out of AVX512_VP2INTERSECT.
|
||||||
|
* config/i386/i386.h: Remove AVX512_VP2INTERSECT from PTA_SAPPHIRERAPIDS
|
||||||
|
* doc/invoke.texi: Remove AVX512_VP2INTERSECT from SAPPHIRERAPIDS
|
||||||
|
---
|
||||||
|
gcc/config/i386/driver-i386.cc | 13 +++++--------
|
||||||
|
gcc/config/i386/i386.h | 7 +++----
|
||||||
|
gcc/doc/invoke.texi | 8 ++++----
|
||||||
|
3 files changed, 12 insertions(+), 16 deletions(-)
|
||||||
|
|
||||||
|
diff --git a/gcc/config/i386/driver-i386.cc b/gcc/config/i386/driver-i386.cc
|
||||||
|
index 3c702fdca33..ef567045c67 100644
|
||||||
|
--- a/gcc/config/i386/driver-i386.cc
|
||||||
|
+++ b/gcc/config/i386/driver-i386.cc
|
||||||
|
@@ -589,15 +589,12 @@ const char *host_detect_local_cpu (int argc, const char **argv)
|
||||||
|
/* This is unknown family 0x6 CPU. */
|
||||||
|
if (has_feature (FEATURE_AVX))
|
||||||
|
{
|
||||||
|
+ /* Assume Tiger Lake */
|
||||||
|
if (has_feature (FEATURE_AVX512VP2INTERSECT))
|
||||||
|
- {
|
||||||
|
- if (has_feature (FEATURE_TSXLDTRK))
|
||||||
|
- /* Assume Sapphire Rapids. */
|
||||||
|
- cpu = "sapphirerapids";
|
||||||
|
- else
|
||||||
|
- /* Assume Tiger Lake */
|
||||||
|
- cpu = "tigerlake";
|
||||||
|
- }
|
||||||
|
+ cpu = "tigerlake";
|
||||||
|
+ /* Assume Sapphire Rapids. */
|
||||||
|
+ else if (has_feature (FEATURE_TSXLDTRK))
|
||||||
|
+ cpu = "sapphirerapids";
|
||||||
|
/* Assume Cooper Lake */
|
||||||
|
else if (has_feature (FEATURE_AVX512BF16))
|
||||||
|
cpu = "cooperlake";
|
||||||
|
diff --git a/gcc/config/i386/i386.h b/gcc/config/i386/i386.h
|
||||||
|
index 900a3bc3673..372a2cff8fe 100644
|
||||||
|
--- a/gcc/config/i386/i386.h
|
||||||
|
+++ b/gcc/config/i386/i386.h
|
||||||
|
@@ -2326,10 +2326,9 @@ constexpr wide_int_bitmask PTA_ICELAKE_SERVER = PTA_ICELAKE_CLIENT
|
||||||
|
constexpr wide_int_bitmask PTA_TIGERLAKE = PTA_ICELAKE_CLIENT | PTA_MOVDIRI
|
||||||
|
| PTA_MOVDIR64B | PTA_CLWB | PTA_AVX512VP2INTERSECT | PTA_KL | PTA_WIDEKL;
|
||||||
|
constexpr wide_int_bitmask PTA_SAPPHIRERAPIDS = PTA_ICELAKE_SERVER | PTA_MOVDIRI
|
||||||
|
- | PTA_MOVDIR64B | PTA_AVX512VP2INTERSECT | PTA_ENQCMD | PTA_CLDEMOTE
|
||||||
|
- | PTA_PTWRITE | PTA_WAITPKG | PTA_SERIALIZE | PTA_TSXLDTRK | PTA_AMX_TILE
|
||||||
|
- | PTA_AMX_INT8 | PTA_AMX_BF16 | PTA_UINTR | PTA_AVXVNNI | PTA_AVX512FP16
|
||||||
|
- | PTA_AVX512BF16;
|
||||||
|
+ | PTA_MOVDIR64B | PTA_ENQCMD | PTA_CLDEMOTE | PTA_PTWRITE | PTA_WAITPKG
|
||||||
|
+ | PTA_SERIALIZE | PTA_TSXLDTRK | PTA_AMX_TILE | PTA_AMX_INT8 | PTA_AMX_BF16
|
||||||
|
+ | PTA_UINTR | PTA_AVXVNNI | PTA_AVX512FP16 | PTA_AVX512BF16;
|
||||||
|
constexpr wide_int_bitmask PTA_KNL = PTA_BROADWELL | PTA_AVX512PF
|
||||||
|
| PTA_AVX512ER | PTA_AVX512F | PTA_AVX512CD | PTA_PREFETCHWT1;
|
||||||
|
constexpr wide_int_bitmask PTA_BONNELL = PTA_CORE2 | PTA_MOVBE;
|
||||||
|
diff --git a/gcc/doc/invoke.texi b/gcc/doc/invoke.texi
|
||||||
|
index 271c8bb8468..a9ecc4426a4 100644
|
||||||
|
--- a/gcc/doc/invoke.texi
|
||||||
|
+++ b/gcc/doc/invoke.texi
|
||||||
|
@@ -32057,11 +32057,11 @@ Intel sapphirerapids CPU with 64-bit extensions, MOVBE, MMX, SSE, SSE2, SSE3,
|
||||||
|
SSSE3, SSE4.1, SSE4.2, POPCNT, CX16, SAHF, FXSR, AVX, XSAVE, PCLMUL, FSGSBASE,
|
||||||
|
RDRND, F16C, AVX2, BMI, BMI2, LZCNT, FMA, MOVBE, HLE, RDSEED, ADCX, PREFETCHW,
|
||||||
|
AES, CLFLUSHOPT, XSAVEC, XSAVES, SGX, AVX512F, AVX512VL, AVX512BW, AVX512DQ,
|
||||||
|
-AVX512CD, PKU, AVX512VBMI, AVX512IFMA, SHA, AVX512VNNI, GFNI, VAES, AVX512VBMI2
|
||||||
|
+AVX512CD, PKU, AVX512VBMI, AVX512IFMA, SHA, AVX512VNNI, GFNI, VAES, AVX512VBMI2,
|
||||||
|
VPCLMULQDQ, AVX512BITALG, RDPID, AVX512VPOPCNTDQ, PCONFIG, WBNOINVD, CLWB,
|
||||||
|
-MOVDIRI, MOVDIR64B, AVX512VP2INTERSECT, ENQCMD, CLDEMOTE, PTWRITE, WAITPKG,
|
||||||
|
-SERIALIZE, TSXLDTRK, UINTR, AMX-BF16, AMX-TILE, AMX-INT8, AVX-VNNI, AVX512FP16
|
||||||
|
-and AVX512BF16 instruction set support.
|
||||||
|
+MOVDIRI, MOVDIR64B, ENQCMD, CLDEMOTE, PTWRITE, WAITPKG, SERIALIZE, TSXLDTRK,
|
||||||
|
+UINTR, AMX-BF16, AMX-TILE, AMX-INT8, AVX-VNNI, AVX512FP16 and AVX512BF16
|
||||||
|
+instruction set support.
|
||||||
|
|
||||||
|
@item alderlake
|
||||||
|
Intel Alderlake CPU with 64-bit extensions, MOVBE, MMX, SSE, SSE2, SSE3, SSSE3,
|
||||||
|
--
|
||||||
|
2.18.2
|
||||||
|
|
||||||
123
0004-Add-attribute-hot-judgement-for-INLINE_HINT_known_ho.patch
Normal file
123
0004-Add-attribute-hot-judgement-for-INLINE_HINT_known_ho.patch
Normal file
@ -0,0 +1,123 @@
|
|||||||
|
From 1b9a5cc9ec08e9f239dd2096edcc447b7a72f64a Mon Sep 17 00:00:00 2001
|
||||||
|
From: "Cui,Lili" <lili.cui@intel.com>
|
||||||
|
Date: Tue, 1 Nov 2022 09:16:49 +0800
|
||||||
|
Subject: [PATCH] Add attribute hot judgement for INLINE_HINT_known_hot hint.
|
||||||
|
|
||||||
|
We set up INLINE_HINT_known_hot hint only when we have profile feedback,
|
||||||
|
now add function attribute judgement for it, when both caller and callee
|
||||||
|
have __attribute__((hot)), we will also set up INLINE_HINT_known_hot hint
|
||||||
|
for it.
|
||||||
|
|
||||||
|
With this patch applied,
|
||||||
|
ADL Multi-copy: 538.imagic_r 16.7%
|
||||||
|
ICX Multi-copy: 538.imagic_r 15.2%
|
||||||
|
CLX Multi-copy: 538.imagic_r 12.7%
|
||||||
|
Znver3 Multi-copy: 538.imagic_r 10.6%
|
||||||
|
Arm Multi-copy: 538.imagic_r 13.4%
|
||||||
|
|
||||||
|
gcc/ChangeLog
|
||||||
|
|
||||||
|
* ipa-inline-analysis.cc (do_estimate_edge_time): Add function attribute
|
||||||
|
judgement for INLINE_HINT_known_hot hint.
|
||||||
|
|
||||||
|
gcc/testsuite/ChangeLog:
|
||||||
|
|
||||||
|
* gcc.dg/ipa/inlinehint-6.c: New test.
|
||||||
|
---
|
||||||
|
gcc/ipa-inline-analysis.cc | 13 ++++---
|
||||||
|
gcc/testsuite/gcc.dg/ipa/inlinehint-6.c | 47 +++++++++++++++++++++++++
|
||||||
|
2 files changed, 56 insertions(+), 4 deletions(-)
|
||||||
|
create mode 100644 gcc/testsuite/gcc.dg/ipa/inlinehint-6.c
|
||||||
|
|
||||||
|
diff --git a/gcc/ipa-inline-analysis.cc b/gcc/ipa-inline-analysis.cc
|
||||||
|
index 1ca685d1b0e..7bd29c36590 100644
|
||||||
|
--- a/gcc/ipa-inline-analysis.cc
|
||||||
|
+++ b/gcc/ipa-inline-analysis.cc
|
||||||
|
@@ -48,6 +48,7 @@ along with GCC; see the file COPYING3. If not see
|
||||||
|
#include "ipa-utils.h"
|
||||||
|
#include "cfgexpand.h"
|
||||||
|
#include "gimplify.h"
|
||||||
|
+#include "attribs.h"
|
||||||
|
|
||||||
|
/* Cached node/edge growths. */
|
||||||
|
fast_call_summary<edge_growth_cache_entry *, va_heap> *edge_growth_cache = NULL;
|
||||||
|
@@ -249,15 +250,19 @@ do_estimate_edge_time (struct cgraph_edge *edge, sreal *ret_nonspec_time)
|
||||||
|
hints = estimates.hints;
|
||||||
|
}
|
||||||
|
|
||||||
|
- /* When we have profile feedback, we can quite safely identify hot
|
||||||
|
- edges and for those we disable size limits. Don't do that when
|
||||||
|
- probability that caller will call the callee is low however, since it
|
||||||
|
+ /* When we have profile feedback or function attribute, we can quite safely
|
||||||
|
+ identify hot edges and for those we disable size limits. Don't do that
|
||||||
|
+ when probability that caller will call the callee is low however, since it
|
||||||
|
may hurt optimization of the caller's hot path. */
|
||||||
|
- if (edge->count.ipa ().initialized_p () && edge->maybe_hot_p ()
|
||||||
|
+ if ((edge->count.ipa ().initialized_p () && edge->maybe_hot_p ()
|
||||||
|
&& (edge->count.ipa ().apply_scale (2, 1)
|
||||||
|
> (edge->caller->inlined_to
|
||||||
|
? edge->caller->inlined_to->count.ipa ()
|
||||||
|
: edge->caller->count.ipa ())))
|
||||||
|
+ || (lookup_attribute ("hot", DECL_ATTRIBUTES (edge->caller->decl))
|
||||||
|
+ != NULL
|
||||||
|
+ && lookup_attribute ("hot", DECL_ATTRIBUTES (edge->callee->decl))
|
||||||
|
+ != NULL))
|
||||||
|
hints |= INLINE_HINT_known_hot;
|
||||||
|
|
||||||
|
gcc_checking_assert (size >= 0);
|
||||||
|
diff --git a/gcc/testsuite/gcc.dg/ipa/inlinehint-6.c b/gcc/testsuite/gcc.dg/ipa/inlinehint-6.c
|
||||||
|
new file mode 100644
|
||||||
|
index 00000000000..1f3be641c6d
|
||||||
|
--- /dev/null
|
||||||
|
+++ b/gcc/testsuite/gcc.dg/ipa/inlinehint-6.c
|
||||||
|
@@ -0,0 +1,47 @@
|
||||||
|
+/* { dg-options "-O3 -c -fdump-ipa-inline-details -fno-early-inlining -fno-ipa-cp" } */
|
||||||
|
+/* { dg-add-options bind_pic_locally } */
|
||||||
|
+
|
||||||
|
+#define size_t long long int
|
||||||
|
+
|
||||||
|
+struct A
|
||||||
|
+{
|
||||||
|
+ size_t f1, f2, f3, f4;
|
||||||
|
+};
|
||||||
|
+struct C
|
||||||
|
+{
|
||||||
|
+ struct A a;
|
||||||
|
+ size_t b;
|
||||||
|
+};
|
||||||
|
+struct C x;
|
||||||
|
+
|
||||||
|
+__attribute__((hot)) struct C callee (struct A *a, struct C *c)
|
||||||
|
+{
|
||||||
|
+ c->a=(*a);
|
||||||
|
+
|
||||||
|
+ if((c->b + 7) & 17)
|
||||||
|
+ {
|
||||||
|
+ c->a.f1 = c->a.f2 + c->a.f1;
|
||||||
|
+ c->a.f2 = c->a.f3 - c->a.f2;
|
||||||
|
+ c->a.f3 = c->a.f2 + c->a.f3;
|
||||||
|
+ c->a.f4 = c->a.f2 - c->a.f4;
|
||||||
|
+ c->b = c->a.f2;
|
||||||
|
+
|
||||||
|
+ }
|
||||||
|
+ return *c;
|
||||||
|
+}
|
||||||
|
+
|
||||||
|
+__attribute__((hot)) struct C caller (size_t d, size_t e, size_t f, size_t g, struct C *c)
|
||||||
|
+{
|
||||||
|
+ struct A a;
|
||||||
|
+ a.f1 = 1 + d;
|
||||||
|
+ a.f2 = e;
|
||||||
|
+ a.f3 = 12 + f;
|
||||||
|
+ a.f4 = 68 + g;
|
||||||
|
+ if (c->b > 0)
|
||||||
|
+ return callee (&a, c);
|
||||||
|
+ else
|
||||||
|
+ return *c;
|
||||||
|
+}
|
||||||
|
+
|
||||||
|
+/* { dg-final { scan-ipa-dump "known_hot" "inline" } } */
|
||||||
|
+
|
||||||
|
--
|
||||||
|
2.18.2
|
||||||
|
|
||||||
17
gcc-12.spec
17
gcc-12.spec
@ -84,7 +84,7 @@
|
|||||||
Summary: Various compilers (C, C++, Objective-C, ...)
|
Summary: Various compilers (C, C++, Objective-C, ...)
|
||||||
Name: %{?scl_prefix}gcc
|
Name: %{?scl_prefix}gcc
|
||||||
Version: 12.2.1
|
Version: 12.2.1
|
||||||
Release: 5
|
Release: 8
|
||||||
# libgcc, libgfortran, libgomp, libstdc++ and crtstuff have
|
# libgcc, libgfortran, libgomp, libstdc++ and crtstuff have
|
||||||
# GCC Runtime Exception.
|
# GCC Runtime Exception.
|
||||||
License: GPLv3+ and GPLv3+ with exceptions and GPLv2+ with exceptions and LGPLv2+ and BSD
|
License: GPLv3+ and GPLv3+ with exceptions and GPLv2+ with exceptions and LGPLv2+ and BSD
|
||||||
@ -133,6 +133,9 @@ Provides: %{?scl_prefix}gcc(major) = %{gcc_major}
|
|||||||
|
|
||||||
|
|
||||||
Patch0: 0001-change-gcc-version.patch
|
Patch0: 0001-change-gcc-version.patch
|
||||||
|
Patch1: 0002-i386-Add-syscall-to-enable-AMX-for-latest-kernels.patch
|
||||||
|
Patch2: 0003-Remove-AVX512_VP2INTERSECT-from-PTA_SAPPHIRERAPIDS.patch
|
||||||
|
Patch3: 0004-Add-attribute-hot-judgement-for-INLINE_HINT_known_ho.patch
|
||||||
|
|
||||||
|
|
||||||
# On ARM EABI systems, we do want -gnueabi to be part of the
|
# On ARM EABI systems, we do want -gnueabi to be part of the
|
||||||
@ -591,6 +594,9 @@ not stable, so plugins must be rebuilt any time GCC is updated.
|
|||||||
%setup -q -n gcc-12.2.0
|
%setup -q -n gcc-12.2.0
|
||||||
|
|
||||||
%patch0 -p1
|
%patch0 -p1
|
||||||
|
%patch1 -p1
|
||||||
|
%patch2 -p1
|
||||||
|
%patch3 -p1
|
||||||
|
|
||||||
echo 'openEuler %{version}-%{release}' > gcc/DEV-PHASE
|
echo 'openEuler %{version}-%{release}' > gcc/DEV-PHASE
|
||||||
|
|
||||||
@ -2647,6 +2653,15 @@ end
|
|||||||
%doc rpm.doc/changelogs/libcc1/ChangeLog*
|
%doc rpm.doc/changelogs/libcc1/ChangeLog*
|
||||||
|
|
||||||
%changelog
|
%changelog
|
||||||
|
* Wed Nov 09 2022 Cui Lili <lili.cui@intel.com> 12.2.1-8
|
||||||
|
- Add attribute hot judgement for INLINE_HINT_known_hot hint
|
||||||
|
|
||||||
|
* Wed Nov 09 2022 Cui Lili <lili.cui@intel.com> 12.2.1-7
|
||||||
|
- Remove AVX512_VP2INTERSECT from PTA_SAPPHIRERAPIDS
|
||||||
|
|
||||||
|
* Wed Nov 09 2022 Haochen Jiang <haochen.jiang@intel.com> 12.2.1-6
|
||||||
|
- i386: Add syscall to enable AMX for latest kernels
|
||||||
|
|
||||||
* Wed Nov 02 2022 liyancheng <412998149@qq.com> 12.2.1-5
|
* Wed Nov 02 2022 liyancheng <412998149@qq.com> 12.2.1-5
|
||||||
- Change isl dependency from Source to BuildRequire
|
- Change isl dependency from Source to BuildRequire
|
||||||
|
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user