i386: Tweak cost of SSE fabs/fneg in ix86_insn_cost.

author Roger Sayle <roger@nextmovesoftware.com>

Mon, 15 Jun 2026 19:09:55 +0000 (20:09 +0100)

committer Roger Sayle <roger@nextmovesoftware.com>

Mon, 15 Jun 2026 19:12:31 +0000 (20:12 +0100)
author Roger Sayle <roger@nextmovesoftware.com>
Mon, 15 Jun 2026 19:09:55 +0000 (20:09 +0100)
committer Roger Sayle <roger@nextmovesoftware.com>
Mon, 15 Jun 2026 19:12:31 +0000 (20:12 +0100)
diff --git a/gcc/config/i386/i386.cc b/gcc/config/i386/i386.cc

index 2945081234b3c5c073684aacf69f4a173822d571..b1fd86c2b320e3ce191fb4dd314a4f97782664f4 100644 (file)
--- a/gcc/config/i386/i386.cc
+++ b/gcc/config/i386/i386.cc
@@ -22462,7 +22462,22 @@ ix86_insn_cost (rtx_insn *insn, bool speed)
        == AVX_PARTIAL_XMM_UPDATE_TRUE)
      insn_cost += COSTS_N_INSNS (3);
  
-  return insn_cost + pattern_cost (PATTERN (insn), speed);
+  rtx pat = PATTERN (insn);
+  /* A USE of a memory is more expensive than a use of a REG.
+     For example *<absneg>mode2_1's use of a signbit mask.  */
+  if (GET_CODE (pat) == PARALLEL)
+    {
+      for (int i = 0; i < XVECLEN (pat, 0); i++)
+       {
+         rtx x = XVECEXP (pat, 0, i);
+         if (GET_CODE (x) == USE && MEM_P (XEXP (x, 0)))
+           insn_cost += !speed ? COSTS_N_BYTES (4)
+                               : TARGET_64BIT ? COSTS_N_INSNS (1) + 1
+                                              : COSTS_N_INSNS (3) + 1;
+       }
+    }
+
+  return insn_cost + pattern_cost (pat, speed);
  }
  
  /* Return cost of SSE/AVX FP->FP conversion (extensions and truncates).  */
diff --git a/gcc/testsuite/gcc.target/i386/fabsneg-2.c b/gcc/testsuite/gcc.target/i386/fabsneg-2.c

new file mode 100644 (file)

index 0000000..dd40c75
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/fabsneg-2.c
@@ -0,0 +1,23 @@
+/* { dg-do compile } */
+/* { dg-options "-O2 -mfpmath=sse -march=skylake" } */
+
+float x;  /* File-scope floats that foo() and bar() below update in place.  */
+float y;
+float z;
+
+void foo()  /* Negates the float globals x, y and z in place.  */
+{
+  x = -x;  /* Three negations in a row; the dg-final scans at the end of  */
+  y = -y;  /* this file expect LC0 and LC1 to be referenced once each  */
+  z = -z;  /* (presumably one shared sign-bit mask per function; confirm).  */
+}
+
+void bar()  /* Replaces the float globals x, y and z by their absolute values.  */
+{
+  x = __builtin_fabsf(x);  /* Same shape as foo, with fabsf in place of  */
+  y = __builtin_fabsf(y);  /* negation; checked by the dg-final scans below.  */
+  z = __builtin_fabsf(z);
+}
+
+/* { dg-final { scan-assembler-times "LC0\[,(\]" 1 } } */
+/* { dg-final { scan-assembler-times "LC1\[,(\]" 1 } } */
author	Roger Sayle <roger@nextmovesoftware.com>
	Mon, 15 Jun 2026 19:09:55 +0000 (20:09 +0100)
committer	Roger Sayle <roger@nextmovesoftware.com>
	Mon, 15 Jun 2026 19:12:31 +0000 (20:12 +0100)
gcc/config/i386/i386.cc		patch \| blob \| blame \| history
gcc/testsuite/gcc.target/i386/fabsneg-2.c	[new file with mode: 0644]	patch \| blob