RISC-V: Expand VLS mode to scalar mode move[PR111391]

author Juzhe-Zhong <juzhe.zhong@rivai.ai>

Thu, 14 Sep 2023 10:49:52 +0000 (18:49 +0800)

committer Pan Li <pan2.li@intel.com>

Sat, 16 Sep 2023 09:55:01 +0000 (17:55 +0800)
author Juzhe-Zhong <juzhe.zhong@rivai.ai>
Thu, 14 Sep 2023 10:49:52 +0000 (18:49 +0800)
committer Pan Li <pan2.li@intel.com>
Sat, 16 Sep 2023 09:55:01 +0000 (17:55 +0800)
diff --git a/gcc/config/riscv/autovec.md b/gcc/config/riscv/autovec.md

index c6175a3b1f60f6ac621fcc89968fc3abc9604fef..aca86554a94e5072c3d2c506dae60821b58b0430 100644 (file)
--- a/gcc/config/riscv/autovec.md
+++ b/gcc/config/riscv/autovec.md
@@ -1442,7 +1442,7 @@
  ;; -------------------------------------------------------------------------
  ;; ---- [INT,FP] Extract a vector element.
  ;; -------------------------------------------------------------------------
-(define_expand "@vec_extract<mode><vel>"
+(define_expand "vec_extract<mode><vel>"
    [(set (match_operand:<VEL>     0 "register_operand")
       (vec_select:<VEL>
         (match_operand:V_VLS      1 "register_operand")
diff --git a/gcc/config/riscv/riscv-vsetvl.cc b/gcc/config/riscv/riscv-vsetvl.cc

index dc02246756d6c4c0aba93375298b8b61469ae950..5f031c18df5149aa26ec0b0e6624a51eb53c23b9 100644 (file)
--- a/gcc/config/riscv/riscv-vsetvl.cc
+++ b/gcc/config/riscv/riscv-vsetvl.cc
@@ -649,6 +649,8 @@ emit_vsetvl_insn (enum vsetvl_type insn_type, enum emit_type emit_type,
      {
        fprintf (dump_file, "\nInsert vsetvl insn PATTERN:\n");
        print_rtl_single (dump_file, pat);
+      fprintf (dump_file, "\nfor insn:\n");
+      print_rtl_single (dump_file, rinsn);
      }
  
    if (emit_type == EMIT_DIRECT)
@@ -3867,7 +3869,7 @@ pass_vsetvl::local_eliminate_vsetvl_insn (const bb_info *bb) const
               skip_one = true;
             }
  
-         curr_avl = get_avl (rinsn);
+         curr_avl = curr_dem.get_avl ();
  
           /* Some instrucion like pred_extract_first<mode> don't reqruie avl, so
              the avl is null, use vl_placeholder for unify the handling
diff --git a/gcc/config/riscv/riscv.cc b/gcc/config/riscv/riscv.cc

index 762937b0e373796d30cdeb0831606a8b3f657fea..8c766e2e2be4e05086b4a820381ea7ec9e83cb7f 100644 (file)
--- a/gcc/config/riscv/riscv.cc
+++ b/gcc/config/riscv/riscv.cc
@@ -2513,6 +2513,70 @@ riscv_legitimize_move (machine_mode mode, rtx dest, rtx src)
         }
        return true;
      }
+  /* Expand
+       (set (reg:DI target) (subreg:DI (reg:V8QI reg) 0))
+     Expand this data movement instead of simply forbidding it, since
+     doing so improves the code generation for the following scenario
+     produced by RVV auto-vectorization:
+       (set (reg:V8QI 149) (vec_duplicate:V8QI (reg:QI)))
+       (set (reg:DI target) (subreg:DI (reg:V8QI reg) 0))
+     Since RVV mode and scalar mode are in different REG_CLASS,
+     we need to explicitly move data from V_REGS to GR_REGS by scalar move.  */
+  if (SUBREG_P (src) && riscv_v_ext_mode_p (GET_MODE (SUBREG_REG (src))))
+    {
+      machine_mode vmode = GET_MODE (SUBREG_REG (src));
+      unsigned int mode_size = GET_MODE_SIZE (mode).to_constant ();
+      unsigned int vmode_size = GET_MODE_SIZE (vmode).to_constant ();
+      unsigned int nunits = vmode_size / mode_size;
+      scalar_mode smode = as_a<scalar_mode> (mode);
+      unsigned int index = SUBREG_BYTE (src).to_constant () / mode_size;
+      unsigned int num = smode == DImode && !TARGET_VECTOR_ELEN_64 ? 2 : 1;
+
+      if (num == 2)
+       {
+         /* If we want to extract 64bit value but ELEN < 64,
+            we use RVV vector mode with EEW = 32 to extract
+            the highpart and lowpart.  */
+         smode = SImode;
+         nunits = nunits * 2;
+       }
+      vmode = riscv_vector::get_vector_mode (smode, nunits).require ();
+      enum insn_code icode
+       = convert_optab_handler (vec_extract_optab, vmode, smode);
+      gcc_assert (icode != CODE_FOR_nothing);
+      rtx v = gen_lowpart (vmode, SUBREG_REG (src));
+
+      for (unsigned int i = 0; i < num; i++)
+       {
+         class expand_operand ops[3];
+         rtx result;
+         if (num == 1)
+           result = dest;
+         else if (i == 0)
+           result = gen_lowpart (smode, dest);
+         else
+           result = gen_reg_rtx (smode);
+         create_output_operand (&ops[0], result, smode);
+         ops[0].target = 1;
+         create_input_operand (&ops[1], v, vmode);
+         create_integer_operand (&ops[2], index + i);
+         expand_insn (icode, 3, ops);
+         if (ops[0].value != result)
+           emit_move_insn (result, ops[0].value);
+
+         if (i == 1)
+           {
+             rtx tmp
+               = expand_binop (Pmode, ashl_optab, gen_lowpart (Pmode, result),
+                               gen_int_mode (32, Pmode), NULL_RTX, 0,
+                               OPTAB_DIRECT);
+             rtx tmp2 = expand_binop (Pmode, ior_optab, tmp, dest, NULL_RTX, 0,
+                                      OPTAB_DIRECT);
+             emit_move_insn (dest, tmp2);
+           }
+       }
+      return true;
+    }
    /* Expand
         (set (reg:QI target) (mem:QI (address)))
       to
diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/partial/slp-9.c b/gcc/testsuite/gcc.target/riscv/rvv/autovec/partial/slp-9.c

index 5fba27c7a3583398feefb648fddbfcd6df11decb..7c42438c9d9ac021cbabc76d57af58bb08e8aaa9 100644 (file)
--- a/gcc/testsuite/gcc.target/riscv/rvv/autovec/partial/slp-9.c
+++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/partial/slp-9.c
@@ -29,4 +29,3 @@
  TEST_ALL (VEC_PERM)
  
  /* { dg-final { scan-assembler-times {viota.m} 2 } } */
-/* { dg-final { scan-assembler-not {vmv\.v\.i} } } */
diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/pr111391-1.c b/gcc/testsuite/gcc.target/riscv/rvv/autovec/pr111391-1.c

new file mode 100644 (file)

index 0000000..a7f64c9
--- /dev/null
+++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/pr111391-1.c
@@ -0,0 +1,28 @@
+/* { dg-do compile } */
+/* { dg-options "-march=rv64gcv -mabi=lp64d -Wno-int-conversion -Wno-implicit-function -Wno-incompatible-pointer-types -Wno-implicit-function-declaration -Ofast -ftree-vectorize" } */
+
+int d ();
+typedef struct
+{
+  int b;
+} c;
+int
+e (char *f, long g)
+{
+  f += g;
+  while (g--)
+    *--f = d;
+}
+
+int
+d (c * f)
+{
+  while (h ())
+    switch (f->b)
+      case 'Q':
+      {
+       long a;
+       e (&a, sizeof (a));
+       i (a);
+      }
+}
diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/pr111391-2.c b/gcc/testsuite/gcc.target/riscv/rvv/autovec/pr111391-2.c

new file mode 100644 (file)

index 0000000..1f170c9
--- /dev/null
+++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/pr111391-2.c
@@ -0,0 +1,10 @@
+/* { dg-do compile } */
+/* { dg-options "-march=rv64gc_zve32x_zvl128b -mabi=lp64d -Wno-int-conversion -Wno-implicit-function -Wno-incompatible-pointer-types -Wno-implicit-function-declaration -Ofast -ftree-vectorize" } */
+
+#include "pr111391-1.c"
+
+/* { dg-final { scan-assembler-times {vsetivli\s+zero,\s*2,\s*e32,\s*mf2,\s*t[au],\s*m[au]} 1 } } */
+/* { dg-final { scan-assembler-times {vmv\.x\.s} 2 } } */
+/* { dg-final { scan-assembler-times {vslidedown.vi\s+v[0-9]+,\s*v[0-9]+,\s*1} 1 } } */
+/* { dg-final { scan-assembler-times {slli\s+[a-x0-9]+,[a-x0-9]+,32} 1 } } */
+/* { dg-final { scan-assembler-times {or\s+[a-x0-9]+,[a-x0-9]+,[a-x0-9]+} 1 } } */
author	Juzhe-Zhong <juzhe.zhong@rivai.ai>
	Thu, 14 Sep 2023 10:49:52 +0000 (18:49 +0800)
committer	Pan Li <pan2.li@intel.com>
	Sat, 16 Sep 2023 09:55:01 +0000 (17:55 +0800)
gcc/config/riscv/autovec.md		patch \| blob \| blame \| history
gcc/config/riscv/riscv-vsetvl.cc		patch \| blob \| blame \| history
gcc/config/riscv/riscv.cc		patch \| blob \| blame \| history
gcc/testsuite/gcc.target/riscv/rvv/autovec/partial/slp-9.c		patch \| blob \| blame \| history
gcc/testsuite/gcc.target/riscv/rvv/autovec/pr111391-1.c	[new file with mode: 0644]	patch \| blob
gcc/testsuite/gcc.target/riscv/rvv/autovec/pr111391-2.c	[new file with mode: 0644]	patch \| blob