For fast unaligned access targets, by pieces uses up to UNITS_PER_WORD-size
pieces, resulting in more store instructions than needed.  For
example gcc.target/riscv/rvv/base/setmem-1.c:f1 built with
`-O3 -march=rv64gcv -mtune=thead-c906`:
```
f1:
vsetivli zero,8,e8,mf2,ta,ma
vmv.v.x v1,a1
vsetivli zero,0,e32,mf2,ta,ma
sb a1,14(a0)
vmv.x.s a4,v1
vsetivli zero,8,e16,m1,ta,ma
vmv.x.s a5,v1
vse8.v v1,0(a0)
sw a4,8(a0)
sh a5,12(a0)
ret
```
The slow unaligned access version built with `-O3 -march=rv64gcv` used
15 sb instructions:
```
f1:
sb a1,0(a0)
sb a1,1(a0)
sb a1,2(a0)
sb a1,3(a0)
sb a1,4(a0)
sb a1,5(a0)
sb a1,6(a0)
sb a1,7(a0)
sb a1,8(a0)
sb a1,9(a0)
sb a1,10(a0)
sb a1,11(a0)
sb a1,12(a0)
sb a1,13(a0)
sb a1,14(a0)
ret
```
After this patch, the following is generated in both cases:
```
f1:
vsetivli zero,15,e8,m1,ta,ma
vmv.v.x v1,a1
vse8.v v1,0(a0)
ret
```
gcc/ChangeLog:
* config/riscv/riscv.cc (riscv_use_by_pieces_infrastructure_p):
New function.
(TARGET_USE_BY_PIECES_INFRASTRUCTURE_P): Define.
gcc/testsuite/ChangeLog:
* gcc.target/riscv/rvv/autovec/pr113469.c: Expect mf2 setmem.
* gcc.target/riscv/rvv/base/setmem-2.c: Update f1 to expect
straight-line vector memset.
* gcc.target/riscv/rvv/base/setmem-3.c: Likewise.
return STACK_CLASH_CALLER_GUARD;
}
+/* Implement TARGET_USE_BY_PIECES_INFRASTRUCTURE_P.  */
+
+static bool
+riscv_use_by_pieces_infrastructure_p (unsigned HOST_WIDE_INT size,
+ unsigned alignment,
+ enum by_pieces_operation op, bool speed_p)
+{
+ /* For set/clear with size > UNITS_PER_WORD, by pieces uses vector broadcasts
+ with UNITS_PER_WORD size pieces. Use setmem<mode> instead which can use
+ bigger chunks. */
+ if (TARGET_VECTOR && stringop_strategy & STRATEGY_VECTOR
+ && (op == CLEAR_BY_PIECES || op == SET_BY_PIECES)
+ && speed_p && size > UNITS_PER_WORD)
+ return false;
+
+ return default_use_by_pieces_infrastructure_p (size, alignment, op, speed_p);
+}
+
/* Initialize the GCC target structure. */
#undef TARGET_ASM_ALIGNED_HI_OP
#define TARGET_ASM_ALIGNED_HI_OP "\t.half\t"
#undef TARGET_C_MODE_FOR_FLOATING_TYPE
#define TARGET_C_MODE_FOR_FLOATING_TYPE riscv_c_mode_for_floating_type
+#undef TARGET_USE_BY_PIECES_INFRASTRUCTURE_P
+#define TARGET_USE_BY_PIECES_INFRASTRUCTURE_P riscv_use_by_pieces_infrastructure_p
+
struct gcc_target targetm = TARGET_INITIALIZER;
#include "gt-riscv.h"
} while (k);
}
-/* { dg-final { scan-assembler-times {vsetivli\tzero,\s*4,\s*e8,\s*mf4,\s*t[au],\s*m[au]} 2 } } */
+/* { dg-final { scan-assembler-times {vsetivli\tzero,\s*4,\s*e8,\s*mf4,\s*t[au],\s*m[au]} 1 } } */
+/* { dg-final { scan-assembler-times {vsetivli\tzero,\s*8,\s*e8,\s*mf2,\s*t[au],\s*m[au]} 1 } } */
#define MIN_VECTOR_BYTES (__riscv_v_min_vlen / 8)
-/* Small memsets shouldn't be vectorised.
+/* Vectorise with no loop.
** f1:
** (
-** sb\s+a1,0\(a0\)
-** ...
+** vsetivli\s+zero,\d+,e8,m1,ta,ma
** |
-** li\s+a2,\d+
-** tail\s+memset
+** li\s+a\d+,\d+
+** vsetvli\s+zero,a\d+,e8,m1,ta,ma
** )
+** vmv\.v\.x\s+v\d+,a1
+** vse8\.v\s+v\d+,0\(a0\)
+** ret
*/
void *
f1 (void *a, int const b)
#define MIN_VECTOR_BYTES (__riscv_v_min_vlen / 8)
-/* Small memsets shouldn't be vectorised.
+/* Vectorise with no loop.
** f1:
** (
-** sb\s+a1,0\(a0\)
-** ...
+** vsetivli\s+zero,\d+,e8,m1,ta,ma
** |
-** li\s+a2,\d+
-** tail\s+memset
+** li\s+a\d+,\d+
+** vsetvli\s+zero,a\d+,e8,m1,ta,ma
** )
+** vmv\.v\.x\s+v\d+,a1
+** vse8\.v\s+v\d+,0\(a0\)
+** ret
*/
void *
f1 (void *a, int const b)