[PR target/113666] Simplify VEC_EXTRACT from a uniform vector

author Jeff Law <jeffrey.law@oss.qualcomm.com>

Mon, 19 Jan 2026 14:44:54 +0000 (07:44 -0700)

committer Jeff Law <jeffrey.law@oss.qualcomm.com>

Mon, 19 Jan 2026 14:44:54 +0000 (07:44 -0700)
author Jeff Law <jeffrey.law@oss.qualcomm.com>
Mon, 19 Jan 2026 14:44:54 +0000 (07:44 -0700)
committer Jeff Law <jeffrey.law@oss.qualcomm.com>
Mon, 19 Jan 2026 14:44:54 +0000 (07:44 -0700)
diff --git a/gcc/fold-const-call.cc b/gcc/fold-const-call.cc

index 464d162cf550bcd38c1a7924d0b7cef9d891f252..aa63ced00bbabdf2ed383fba4f53bd1b39d78f25 100644 (file)
--- a/gcc/fold-const-call.cc
+++ b/gcc/fold-const-call.cc
@@ -1459,6 +1459,26 @@ fold_const_vec_shl_insert (tree, tree arg0, tree arg1)
    return NULL_TREE;
  }
  
+/* Fold a call to IFN_VEC_EXTRACT (ARG0, ARG1), returning a value
+   of type TYPE, or NULL_TREE if the call cannot be folded.
+
+   Right now this only handles uniform vectors, so ARG1 is not
+   used.  But it could easily be adjusted in the future to handle
+   non-uniform vectors by extracting the relevant element.  */
+
+static tree
+fold_const_vec_extract (tree, tree arg0, tree)
+{
+  if (TREE_CODE (arg0) != VECTOR_CST)
+    return NULL_TREE;
+
+  /* vec_extract (dup (CST), CST) -> CST.  */
+  if (tree elem = uniform_vector_p (arg0))
+    return elem;
+
+  return NULL_TREE;
+}
+
  /* Try to evaluate:
  
        *RESULT = FN (*ARG0, *ARG1)
@@ -1865,6 +1885,9 @@ fold_const_call (combined_fn fn, tree type, tree arg0, tree arg1)
      case CFN_VEC_SHL_INSERT:
        return fold_const_vec_shl_insert (type, arg0, arg1);
  
+    case CFN_VEC_EXTRACT:
+      return fold_const_vec_extract (type, arg0, arg1);
+
      case CFN_UBSAN_CHECK_ADD:
      case CFN_ADD_OVERFLOW:
        subcode = PLUS_EXPR;
diff --git a/gcc/match.pd b/gcc/match.pd

index ea840502640bd957a9e549a90d8dc1d35a6dc9bf..e0a2399ca65d64ce536c58684f87ae3c62a26674 100644 (file)
--- a/gcc/match.pd
+++ b/gcc/match.pd
@@ -12226,3 +12226,8 @@ and,
          && TYPE_UNSIGNED (type)
          && @0 == @3)
      (bit_xor (rrotate @0 @4) @2)))
+
+/* Optimize extraction from a uniform vector to a representative element.
+   The index must be an INTEGER_CST; its range is not checked here.  */
+(simplify (IFN_VEC_EXTRACT (vec_duplicate @0) INTEGER_CST@1)
+ @0)
diff --git a/gcc/testsuite/gcc.target/riscv/rvv/base/pr113666.c b/gcc/testsuite/gcc.target/riscv/rvv/base/pr113666.c

new file mode 100644 (file)

index 0000000..b1034d7
--- /dev/null
+++ b/gcc/testsuite/gcc.target/riscv/rvv/base/pr113666.c
@@ -0,0 +1,24 @@
+/* { dg-do compile } */
+/* { dg-options "-march=rv64gcv -mabi=lp64 -O3" { target rv64} } */
+/* { dg-options "-march=rv32gcv -mabi=ilp32 -O3" { target rv32} } */
+
+unsigned char a;
+
+int main() {
+  short b = a = 0;
+  for (; a != 19; a++)
+    if (a)
+      b = 32872 >> a;  /* Last store is at a == 18: 32872 >> 18 == 0.  */
+
+  if (b == 0)  /* Always true after the loop, so main returns 0.  */
+    return 0;
+  else
+    return 1;
+}
+
+/* If we vectorized, we should still be able to collapse away the VEC_EXTRACT,
+   leaving no vector code in the final assembly.  So there should be no
+   vsetivli instructions.  */
+/* { dg-final { scan-assembler-not {vsetivli} } } */
+
+
author	Jeff Law <jeffrey.law@oss.qualcomm.com>
	Mon, 19 Jan 2026 14:44:54 +0000 (07:44 -0700)
committer	Jeff Law <jeffrey.law@oss.qualcomm.com>
	Mon, 19 Jan 2026 14:44:54 +0000 (07:44 -0700)
gcc/fold-const-call.cc		patch \| blob \| blame \| history
gcc/match.pd		patch \| blob \| blame \| history
gcc/testsuite/gcc.target/riscv/rvv/base/pr113666.c	[new file with mode: 0644]	patch \| blob