sched1: parameterize pressure scheduling spilling aggressiveness [PR/114729]

author Vineet Gupta <vineetg@rivosinc.com>

Wed, 4 Dec 2024 18:42:37 +0000 (10:42 -0800)

committer Vineet Gupta <vineetg@rivosinc.com>

Wed, 4 Dec 2024 18:59:46 +0000 (10:59 -0800)
author Vineet Gupta <vineetg@rivosinc.com>
Wed, 4 Dec 2024 18:42:37 +0000 (10:42 -0800)
committer Vineet Gupta <vineetg@rivosinc.com>
Wed, 4 Dec 2024 18:59:46 +0000 (10:59 -0800)
diff --git a/gcc/config/riscv/riscv.cc b/gcc/config/riscv/riscv.cc

index 0a6c00926b31e1135aee325c7daa1c7e7dc13f8a..b9ddf7caee1039c0a37cbf807a0cf7aa4d62895c 100644 (file)
--- a/gcc/config/riscv/riscv.cc
+++ b/gcc/config/riscv/riscv.cc
@@ -10616,6 +10616,10 @@ riscv_option_override (void)
                        param_sched_pressure_algorithm,
                        SCHED_PRESSURE_MODEL);
  
+  SET_OPTION_IF_UNSET (&global_options, &global_options_set,
+                      param_cycle_accurate_model,
+                      0);
+
    /* Function to allocate machine-dependent function status.  */
    init_machine_status = &riscv_init_machine_status;
  
diff --git a/gcc/doc/invoke.texi b/gcc/doc/invoke.texi

index e3c2adc2507730339fbaef3a88f80e5c525ded34..d2409a41d50aa0bab9988e6ecf7fd1d672b0a2b0 100644 (file)
--- a/gcc/doc/invoke.texi
+++ b/gcc/doc/invoke.texi
@@ -17211,6 +17211,16 @@ With @option{--param=openacc-privatization=quiet}, don't diagnose.
  This is the current default.
  With @option{--param=openacc-privatization=noisy}, do diagnose.
  
+@item cycle-accurate-model
+Specifies whether GCC should assume that the scheduling description is mostly
+a cycle-accurate model of the target processor on which the code is intended
+to run, in the absence of cache misses.  Nonzero means that the selected
+scheduling model is accurate and likely describes an in-order processor,
+and that scheduling will aggressively spill to try and fill any pipeline
+bubbles.  This is the current default.  Zero means that the scheduling
+description might not be available or accurate, or might not be applicable
+at all, such as for modern out-of-order processors.
+
  @end table
  
  The following choices of @var{name} are available on AArch64 targets:
diff --git a/gcc/haifa-sched.cc b/gcc/haifa-sched.cc

index 02c893ec5cd3e50f638ce55fa871c20c53f9a6d1..cd4b6baddcd2fe508430cfc69b534f5a1f6c9406 100644 (file)
--- a/gcc/haifa-sched.cc
+++ b/gcc/haifa-sched.cc
@@ -2398,11 +2398,18 @@ model_excess_group_cost (struct model_pressure_group *group,
    int pressure, cl;
  
    cl = ira_pressure_classes[pci];
-  if (delta < 0 && point >= group->limits[pci].point)
+  if (delta < 0)
      {
-      pressure = MAX (group->limits[pci].orig_pressure,
-                     curr_reg_pressure[cl] + delta);
-      return -model_spill_cost (cl, pressure, curr_reg_pressure[cl]);
+      if (point >= group->limits[pci].point)
+       {
+         pressure = MAX (group->limits[pci].orig_pressure,
+                         curr_reg_pressure[cl] + delta);
+         return -model_spill_cost (cl, pressure, curr_reg_pressure[cl]);
+       }
+      /* If the target prefers fewer spills, return the negative delta,
+        indicating pressure reduction.  */
+      else if (!param_cycle_accurate_model)
+         return delta;
      }
  
    if (delta > 0)
@@ -2453,7 +2460,7 @@ model_excess_cost (rtx_insn *insn, bool print_p)
      }
  
    if (print_p)
-    fprintf (sched_dump, "\n");
+    fprintf (sched_dump, " ECC %d\n", cost);
  
    return cost;
  }
@@ -2489,8 +2496,9 @@ model_set_excess_costs (rtx_insn **insns, int count)
    bool print_p;
  
    /* Record the baseECC value for each instruction in the model schedule,
-     except that negative costs are converted to zero ones now rather than
-     later.  Do not assign a cost to debug instructions, since they must
+     except that for targets which prefer wider schedules (more spills)
+     negative costs are converted to zero ones now rather than later.
+     Do not assign a cost to debug instructions, since they must
       not change code-generation decisions.  Experiments suggest we also
       get better results by not assigning a cost to instructions from
       a different block.
@@ -2512,7 +2520,7 @@ model_set_excess_costs (rtx_insn **insns, int count)
             print_p = true;
           }
         cost = model_excess_cost (insns[i], print_p);
-       if (cost <= 0)
+       if (param_cycle_accurate_model && cost <= 0)
           {
             priority = INSN_PRIORITY (insns[i]) - insn_delay (insns[i]) - cost;
             priority_base = MAX (priority_base, priority);
@@ -2523,6 +2531,14 @@ model_set_excess_costs (rtx_insn **insns, int count)
    if (print_p)
      fprintf (sched_dump, MODEL_BAR);
  
+  /* Typically in-order cores have a good pipeline scheduling model and the
+     algorithm would try to use that to minimize bubbles, favoring spills.
+     MAX (baseECC, 0) below changes negative baseECC (pressure reduction)
+     to 0 (pressure neutral) thus tending to more spills.
+     Otherwise return.  */
+  if (!param_cycle_accurate_model)
+    return;
+
    /* Use MAX (baseECC, 0) and baseP to calculcate ECC for each
       instruction.  */
    for (i = 0; i < count; i++)
diff --git a/gcc/params.opt b/gcc/params.opt

index 6efadd8ca163fa1d233fda980321c1abed87a81c..f5cc71d0f493d621bc90d35dfcc708e23facba63 100644 (file)
--- a/gcc/params.opt
+++ b/gcc/params.opt
@@ -66,6 +66,10 @@ Enable asan stack protection.
  Common Joined UInteger Var(param_asan_use_after_return) Init(1) IntegerRange(0, 1) Param Optimization
  Enable asan detection of use-after-return bugs.
  
+-param=cycle-accurate-model
+Common Joined UInteger Var(param_cycle_accurate_model) Init(1) IntegerRange(0, 1) Param Optimization
+Whether the scheduling description is mostly a cycle-accurate model of the target processor, in which case the scheduler is likely to spill aggressively to fill any pipeline bubbles.
+
  -param=hwasan-instrument-stack=
  Common Joined UInteger Var(param_hwasan_instrument_stack) Init(1) IntegerRange(0, 1) Param Optimization
  Enable hwasan instrumentation of statically sized stack-allocated variables.
diff --git a/gcc/testsuite/gcc.target/riscv/riscv.exp b/gcc/testsuite/gcc.target/riscv/riscv.exp

index 3620ece47582f05c93d096ac21198c178eca17bd..ce84081183f8fd712d8203b0e0dc02c1ce97d8e6 100644 (file)
--- a/gcc/testsuite/gcc.target/riscv/riscv.exp
+++ b/gcc/testsuite/gcc.target/riscv/riscv.exp
@@ -38,6 +38,8 @@ dg-init
  # Main loop.
  gcc-dg-runtest [lsort [glob -nocomplain $srcdir/$subdir/*.\[cS\]]] \
         "" $DEFAULT_CFLAGS
+gcc-dg-runtest [lsort [glob -nocomplain $srcdir/$subdir/sched1-spills/*.{\[cS\],cpp}]] \
+       "" $DEFAULT_CFLAGS
  
  # Saturation alu
  foreach opt {
diff --git a/gcc/testsuite/gcc.target/riscv/sched1-spills/spill1.cpp b/gcc/testsuite/gcc.target/riscv/sched1-spills/spill1.cpp

new file mode 100644 (file)

index 0000000..8060ec2
--- /dev/null
+++ b/gcc/testsuite/gcc.target/riscv/sched1-spills/spill1.cpp
@@ -0,0 +1,32 @@
+/* { dg-options "-O2 -march=rv64gc -mabi=lp64d -save-temps -fverbose-asm" } */
+/* { dg-skip-if "" { *-*-* } { "-O0" "-O1" "-Og" "-Os" "-Oz" } } */
+
+/* Reduced from SPEC2017 Cactu ML_BSSN_Advect.cpp
+   by comparing -fschedule-insns and -fno-schedule-insns builds.
+   Shows up one extra spill (pair of spill markers "sfp") in verbose asm
+   output which the patch fixes.  */
+
+void s();
+double b, c, d, e, f, g, h, k, l, m, n, o, p, q, t, u, v;
+int *j;
+double *r, *w;
+long x;
+void y() {
+  double *a((double *)s);
+  for (;;)
+    for (; j[1];)
+      for (int i = 1; i < j[0]; i++) {
+        k = l;
+        m = n;
+        o = p = q;
+        r[0] = t;
+        a[0] = u;
+        x = g;
+        e = f;
+        v = w[x];
+        b = c;
+        d = h;
+        }
+}
+
+/* { dg-final { scan-assembler-not "%sfp" } } */
author	Vineet Gupta <vineetg@rivosinc.com>
	Wed, 4 Dec 2024 18:42:37 +0000 (10:42 -0800)
committer	Vineet Gupta <vineetg@rivosinc.com>
	Wed, 4 Dec 2024 18:59:46 +0000 (10:59 -0800)
gcc/config/riscv/riscv.cc		patch \| blob \| blame \| history
gcc/doc/invoke.texi		patch \| blob \| blame \| history
gcc/haifa-sched.cc		patch \| blob \| blame \| history
gcc/params.opt		patch \| blob \| blame \| history
gcc/testsuite/gcc.target/riscv/riscv.exp		patch \| blob \| blame \| history
gcc/testsuite/gcc.target/riscv/sched1-spills/spill1.cpp	[new file with mode: 0644]	patch \| blob