Reduce cost of aligned sse register store.

author    liuhongt <hongtao.liu@intel.com>  Sat, 9 Oct 2021 01:42:10 +0000 (09:42 +0800)
committer liuhongt <hongtao.liu@intel.com>  Fri, 19 Nov 2021 01:22:48 +0000 (09:22 +0800)
diff --git a/gcc/config/i386/x86-tune-costs.h b/gcc/config/i386/x86-tune-costs.h

index dd5563d2e641e078853cc20bff6c82c8bd511d92..60d50c97fca70070827bd12c1f67db8b47e3221a 100644 (file)
--- a/gcc/config/i386/x86-tune-costs.h
+++ b/gcc/config/i386/x86-tune-costs.h
@@ -1903,7 +1903,7 @@ struct processor_costs skylake_cost = {
    {6, 6, 6},                           /* cost of storing integer registers */
    {6, 6, 6, 10, 20},                   /* cost of loading SSE register
                                            in 32bit, 64bit, 128bit, 256bit and 512bit */
-  {8, 8, 8, 12, 24},                   /* cost of storing SSE register
+  {8, 8, 8, 8, 16},                    /* cost of storing SSE register
                                            in 32bit, 64bit, 128bit, 256bit and 512bit */
    {6, 6, 6, 10, 20},                   /* cost of unaligned loads.  */
    {8, 8, 8, 8, 16},                    /* cost of unaligned stores.  */
@@ -2029,7 +2029,7 @@ struct processor_costs icelake_cost = {
    {6, 6, 6},                           /* cost of storing integer registers */
    {6, 6, 6, 10, 20},                   /* cost of loading SSE register
                                            in 32bit, 64bit, 128bit, 256bit and 512bit */
-  {8, 8, 8, 12, 24},                   /* cost of storing SSE register
+  {8, 8, 8, 8, 16},                    /* cost of storing SSE register
                                            in 32bit, 64bit, 128bit, 256bit and 512bit */
    {6, 6, 6, 10, 20},                   /* cost of unaligned loads.  */
    {8, 8, 8, 8, 16},                    /* cost of unaligned stores.  */
diff --git a/gcc/testsuite/gcc.target/i386/pr102543.c b/gcc/testsuite/gcc.target/i386/pr102543.c

new file mode 100644 (file)

index 0000000..893eb9a
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/pr102543.c
@@ -0,0 +1,35 @@
+/* PR target/102543 */
+/* { dg-do compile } */
+/* { dg-options "-Ofast -march=skylake-avx512 -fdump-tree-optimized" } */
+/* { dg-final { scan-tree-dump-not "MEM\\\[" "optimized" } } */
+
+struct a
+{
+  int a[100];
+};
+typedef struct a misaligned_t __attribute__ ((aligned (8)));
+typedef struct a aligned_t __attribute__ ((aligned (32)));
+
+__attribute__ ((used))
+__attribute__ ((noinline))
+void
+t(void *a, int misaligned, aligned_t *d)
+{
+  int i,v;
+  for (i=0;i<100;i++)
+    {
+      if (misaligned)
+       v=((misaligned_t *)a)->a[i];
+      else
+       v=((aligned_t *)a)->a[i];
+      d->a[i]+=v;
+    }
+}
+struct b {int v; misaligned_t m;aligned_t aa;} b;
+aligned_t d;
+int
+main()
+{
+  t(&b.m, 1, &d);
+  return 0;
+}
author	liuhongt <hongtao.liu@intel.com>
	Sat, 9 Oct 2021 01:42:10 +0000 (09:42 +0800)
committer	liuhongt <hongtao.liu@intel.com>
	Fri, 19 Nov 2021 01:22:48 +0000 (09:22 +0800)
gcc/config/i386/x86-tune-costs.h		patch | blob | blame | history
gcc/testsuite/gcc.target/i386/pr102543.c	[new file with mode: 0644]	patch | blob