RISC-V: Disallow transformation into VLMAX AVL for cond_len_xxx when length is in...

author Juzhe-Zhong <juzhe.zhong@rivai.ai>

Wed, 27 Dec 2023 02:38:26 +0000 (10:38 +0800)

committer Pan Li <pan2.li@intel.com>

Fri, 29 Dec 2023 00:38:03 +0000 (08:38 +0800)
author Juzhe-Zhong <juzhe.zhong@rivai.ai>
Wed, 27 Dec 2023 02:38:26 +0000 (10:38 +0800)
committer Pan Li <pan2.li@intel.com>
Fri, 29 Dec 2023 00:38:03 +0000 (08:38 +0800)
diff --git a/gcc/config/riscv/riscv-v.cc b/gcc/config/riscv/riscv-v.cc

index 038ab084a37248f871b70c1574269ecc94b47c40..b4c7e0f0126eb68412628fccb8c8379c46427f5b 100644 (file)
--- a/gcc/config/riscv/riscv-v.cc
+++ b/gcc/config/riscv/riscv-v.cc
@@ -68,6 +68,16 @@ imm_avl_p (machine_mode mode)
            : false;
  }
  
+/* Return true if LEN equals NUNITS of MODE and is out of range [0, 31].  */
+static bool
+is_vlmax_len_p (machine_mode mode, rtx len)
+{
+  poly_int64 value;
+  return poly_int_rtx_p (len, &value)
+        && known_eq (value, GET_MODE_NUNITS (mode))
+        && !satisfies_constraint_K (len);
+}
+
  /* Helper functions for insn_flags && insn_types */
  
  /* Return true if caller need pass mask operand for insn pattern with
@@ -3776,7 +3786,7 @@ expand_load_store (rtx *ops, bool is_load)
    rtx len = ops[3];
    machine_mode mode = GET_MODE (ops[0]);
  
-  if (poly_int_rtx_p (len, &value) && known_eq (value, GET_MODE_NUNITS (mode)))
+  if (is_vlmax_len_p (mode, len))
      {
        /* If the length operand is equal to VF, it is VLMAX load/store.  */
        if (is_load)
@@ -3842,8 +3852,7 @@ expand_cond_len_op (unsigned icode, insn_flags op_type, rtx *ops, rtx len)
    machine_mode mask_mode = GET_MODE (mask);
    poly_int64 value;
    bool is_dummy_mask = rtx_equal_p (mask, CONSTM1_RTX (mask_mode));
-  bool is_vlmax_len
-    = poly_int_rtx_p (len, &value) && known_eq (value, GET_MODE_NUNITS (mode));
+  bool is_vlmax_len = is_vlmax_len_p (mode, len);
  
    unsigned insn_flags = HAS_DEST_P | HAS_MASK_P | HAS_MERGE_P | op_type;
    if (is_dummy_mask)
@@ -4012,7 +4021,7 @@ expand_gather_scatter (rtx *ops, bool is_load)
    unsigned inner_offsize = GET_MODE_BITSIZE (inner_idx_mode);
    poly_int64 nunits = GET_MODE_NUNITS (vec_mode);
    poly_int64 value;
-  bool is_vlmax = poly_int_rtx_p (len, &value) && known_eq (value, nunits);
+  bool is_vlmax = is_vlmax_len_p (vec_mode, len);
  
    /* Extend the offset element to address width.  */
    if (inner_offsize < BITS_PER_WORD)
@@ -4199,7 +4208,7 @@ expand_lanes_load_store (rtx *ops, bool is_load)
    rtx reg = is_load ? ops[0] : ops[1];
    machine_mode mode = GET_MODE (ops[0]);
  
-  if (poly_int_rtx_p (len, &value) && known_eq (value, GET_MODE_NUNITS (mode)))
+  if (is_vlmax_len_p (mode, len))
      {
        /* If the length operand is equal to VF, it is VLMAX load/store.  */
        if (is_load)
@@ -4252,7 +4261,7 @@ expand_fold_extract_last (rtx *ops)
    rtx slide_vect = gen_reg_rtx (mode);
    insn_code icode;
  
-  if (poly_int_rtx_p (len, &value) && known_eq (value, GET_MODE_NUNITS (mode)))
+  if (is_vlmax_len_p (mode, len))
      len = NULL_RTX;
  
    /* Calculate the number of 1-bit in mask. */
diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/post-ra-avl.c b/gcc/testsuite/gcc.target/riscv/rvv/autovec/post-ra-avl.c

index f3d12bac7cd0389402fe699c9853ebdf2b1e5162..bff6dcb1c387020520e2f38baf744bb143f239e9 100644 (file)
--- a/gcc/testsuite/gcc.target/riscv/rvv/autovec/post-ra-avl.c
+++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/post-ra-avl.c
@@ -13,4 +13,4 @@ int foo() {
    return a;
  }
  
-/* { dg-final { scan-assembler-times {vsetvli\s+[a-x0-9]+,\s*zero} 1 } } */
+/* { dg-final { scan-assembler-not {vsetvli\s+[a-x0-9]+,\s*zero} } } */
diff --git a/gcc/testsuite/gcc.target/riscv/rvv/base/vf_avl-2.c b/gcc/testsuite/gcc.target/riscv/rvv/base/vf_avl-2.c

new file mode 100644 (file)

index 0000000..5a94a51
--- /dev/null
+++ b/gcc/testsuite/gcc.target/riscv/rvv/base/vf_avl-2.c
@@ -0,0 +1,21 @@
+/* { dg-do compile } */
+/* { dg-options "-O3 -march=rv64gcv -mabi=lp64d --param riscv-autovec-preference=fixed-vlmax" } */
+
+float f[12][100];
+
+void bad1(float v1, float v2)
+{
+  for (int r = 0; r < 100; r += 4)
+    {
+      int i = r + 1;
+      f[0][r] = f[1][r] * (f[2][r] + v2) - f[1][i] * (f[2][i] + v1);
+      f[0][i] = f[1][r] * (f[2][i] + v1) + f[1][i] * (f[2][r] + v2);
+      f[0][r+2] = f[1][r+2] * (f[2][r+2] + v2) - f[1][i+2] * (f[2][i+2] + v1);
+      f[0][i+2] = f[1][r+2] * (f[2][i+2] + v1) + f[1][i+2] * (f[2][r+2] + v2);
+    }
+}
+
+/* { dg-final { scan-assembler-times {vsetivli\s+zero,\s*4,\s*e32,\s*m1,\s*t[au],\s*m[au]} 1 } } */
+/* { dg-final { scan-assembler-times {vsetivli\s+zero,\s*1,\s*e32,\s*m1,\s*t[au],\s*m[au]} 1 } } */
+/* { dg-final { scan-assembler-times {vsetivli} 2 } } */
+/* { dg-final { scan-assembler-not {vsetvli} } } */
author	Juzhe-Zhong <juzhe.zhong@rivai.ai>
	Wed, 27 Dec 2023 02:38:26 +0000 (10:38 +0800)
committer	Pan Li <pan2.li@intel.com>
	Fri, 29 Dec 2023 00:38:03 +0000 (08:38 +0800)
gcc/config/riscv/riscv-v.cc		patch \| blob \| blame \| history
gcc/testsuite/gcc.target/riscv/rvv/autovec/post-ra-avl.c		patch \| blob \| blame \| history
gcc/testsuite/gcc.target/riscv/rvv/base/vf_avl-2.c	[new file with mode: 0644]	patch \| blob