RISC-V: VLA preempts VLS on unknown NITERS loop

author Juzhe-Zhong <juzhe.zhong@rivai.ai>

Thu, 11 Jan 2024 02:42:23 +0000 (10:42 +0800)

committer Pan Li <pan2.li@intel.com>

Thu, 11 Jan 2024 06:08:37 +0000 (14:08 +0800)
author Juzhe-Zhong <juzhe.zhong@rivai.ai>
Thu, 11 Jan 2024 02:42:23 +0000 (10:42 +0800)
committer Pan Li <pan2.li@intel.com>
Thu, 11 Jan 2024 06:08:37 +0000 (14:08 +0800)
diff --git a/gcc/config/riscv/riscv-vector-costs.cc b/gcc/config/riscv/riscv-vector-costs.cc

index e53f4a186f3234e6f4deab05dd00864b2e3efabb..58ec0b9b5035bb6347820f7ae95ce11c1ee11483 100644 (file)
--- a/gcc/config/riscv/riscv-vector-costs.cc
+++ b/gcc/config/riscv/riscv-vector-costs.cc
@@ -1042,6 +1042,15 @@ costs::better_main_loop_than_p (const vector_costs *uncast_other) const
             }
         }
      }
+  /* If NITERS is unknown, we should not use VLS modes to vectorize
+     the loop, since we don't support partial vectors for VLS modes.
+     Otherwise we would have full vectors (VLS modes) in the loop body
+     and partial vectors (VLA modes) in the loop epilogue, which is
+     very inefficient.  Instead, we should apply partial vectors (VLA
+     modes) to the loop body, with no epilogue, when NITERS is unknown.  */
+  else if (!LOOP_VINFO_NITERS_KNOWN_P (this_loop_vinfo)
+          && m_cost_type == VLS_VECTOR_COST)
+    return false;
  
    return vector_costs::better_main_loop_than_p (other);
  }
diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/partial/slp-1.c b/gcc/testsuite/gcc.target/riscv/rvv/autovec/partial/slp-1.c

index 948b20b68d31f6f4ff814ad96bd109ca5fb86c20..0a1d1f72e6b177704f460a211209df5d54b0be8d 100644 (file)
--- a/gcc/testsuite/gcc.target/riscv/rvv/autovec/partial/slp-1.c
+++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/partial/slp-1.c
@@ -21,6 +21,6 @@ f (int8_t *restrict a, int8_t *restrict b, int n)
  
  /* FIXME: Since we don't have VECT cost model yet, LOAD_LANES/STORE_LANES are chosen
     instead of SLP when riscv-autovec-lmul=m1.  */
-/* { dg-final { scan-tree-dump-times "\.VEC_PERM" 1 "optimized" { xfail { any-opts "--param riscv-autovec-lmul=m1" "--param riscv-autovec-lmul=m8" } } } } */
+/* { dg-final { scan-tree-dump-times "\.VEC_PERM" 1 "optimized" { xfail { any-opts "--param riscv-autovec-lmul=m1" } } } } */
  /* { dg-final { scan-assembler {\tvid\.v} { xfail { any-opts "--param riscv-autovec-lmul=m1" } } } } */
  /* { dg-final { scan-assembler {\tvand} { xfail { any-opts "--param riscv-autovec-lmul=m1" } } } } */
diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/partial/slp-16.c b/gcc/testsuite/gcc.target/riscv/rvv/autovec/partial/slp-16.c

index 7b23cafab3fa228ac070c58c681ee03c23f2d4b6..05220c32c5d208a1f653f21a044a50e6c2f2d5cf 100644 (file)
--- a/gcc/testsuite/gcc.target/riscv/rvv/autovec/partial/slp-16.c
+++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/partial/slp-16.c
@@ -21,6 +21,6 @@ f (uint8_t *restrict a, uint8_t *restrict b, int n)
  
  /* FIXME: Since we don't have VECT cost model yet, LOAD_LANES/STORE_LANES are chosen
     instead of SLP when riscv-autovec-lmul=m1.  */
-/* { dg-final { scan-tree-dump-times "\.VEC_PERM" 1 "optimized" { xfail { any-opts "--param riscv-autovec-lmul=m1" "--param riscv-autovec-lmul=m8" } } } } */
+/* { dg-final { scan-tree-dump-times "\.VEC_PERM" 1 "optimized" { xfail { any-opts "--param riscv-autovec-lmul=m1" } } } } */
  /* { dg-final { scan-assembler {\tvid\.v} { xfail { any-opts "--param riscv-autovec-lmul=m1"} } } } */
  /* { dg-final { scan-assembler-not {\tvmul} } } */
diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/partial/slp-3.c b/gcc/testsuite/gcc.target/riscv/rvv/autovec/partial/slp-3.c

index 3622c59c4392974d549283cda95743f8b59d74d3..5e64231b37d77535c68bc063065b85fae63696e1 100644 (file)
--- a/gcc/testsuite/gcc.target/riscv/rvv/autovec/partial/slp-3.c
+++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/partial/slp-3.c
@@ -21,4 +21,4 @@ f (int8_t *restrict a, int8_t *restrict b, int n)
  
  /* FIXME: Since we don't have VECT cost model yet, LOAD_LANES/STORE_LANES are chosen
     instead of SLP when riscv-autovec-lmul=m1.  */
-/* { dg-final { scan-tree-dump-times "\.VEC_PERM" 1 "optimized" { xfail { any-opts "--param riscv-autovec-lmul=m1" "--param riscv-autovec-lmul=m8" } } } } */
+/* { dg-final { scan-tree-dump-times "\.VEC_PERM" 1 "optimized" { xfail { any-opts "--param riscv-autovec-lmul=m1" } } } } */
diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/partial/slp-5.c b/gcc/testsuite/gcc.target/riscv/rvv/autovec/partial/slp-5.c

index 5c0a6775474e3cd435f95061ca99451d319c4f5e..c78b3709078ccc4583405102598cae426e75e454 100644 (file)
--- a/gcc/testsuite/gcc.target/riscv/rvv/autovec/partial/slp-5.c
+++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/partial/slp-5.c
@@ -21,4 +21,4 @@ f (int8_t *restrict a, int8_t *restrict b, int n)
  
  /* FIXME: Since we don't have VECT cost model yet, LOAD_LANES/STORE_LANES are chosen
     instead of SLP when riscv-autovec-lmul=m1.  */
-/* { dg-final { scan-tree-dump-times "\.VEC_PERM" 1 "optimized" { xfail { any-opts "--param riscv-autovec-lmul=m1" "--param riscv-autovec-lmul=m8" } } } } */
+/* { dg-final { scan-tree-dump-times "\.VEC_PERM" 1 "optimized" { xfail { any-opts "--param riscv-autovec-lmul=m1" } } } } */
author	Juzhe-Zhong <juzhe.zhong@rivai.ai>
	Thu, 11 Jan 2024 02:42:23 +0000 (10:42 +0800)
committer	Pan Li <pan2.li@intel.com>
	Thu, 11 Jan 2024 06:08:37 +0000 (14:08 +0800)
gcc/config/riscv/riscv-vector-costs.cc		patch \| blob \| blame \| history
gcc/testsuite/gcc.target/riscv/rvv/autovec/partial/slp-1.c		patch \| blob \| blame \| history
gcc/testsuite/gcc.target/riscv/rvv/autovec/partial/slp-16.c		patch \| blob \| blame \| history
gcc/testsuite/gcc.target/riscv/rvv/autovec/partial/slp-3.c		patch \| blob \| blame \| history
gcc/testsuite/gcc.target/riscv/rvv/autovec/partial/slp-5.c		patch \| blob \| blame \| history