git.ipfire.org Git - thirdparty/gcc.git/commitdiff
Add UNSPEC_MASKOP to vpbroadcastm pattern.
author liuhongt <hongtao.liu@intel.com>
Thu, 27 Jul 2023 07:14:39 +0000 (15:14 +0800)
committer liuhongt <hongtao.liu@intel.com>
Fri, 28 Jul 2023 02:06:44 +0000 (10:06 +0800)
Prevent rtl optimization of vec_duplicate + zero_extend to
vpbroadcastm since there could be an extra kmov after RA.

gcc/ChangeLog:

PR target/110788
* config/i386/sse.md (avx512cd_maskb_vec_dup<mode>): Add
UNSPEC_MASKOP.
(avx512cd_maskw_vec_dup<mode>): Ditto.

gcc/testsuite/ChangeLog:

* gcc.target/i386/pr110788.c: New test.

gcc/config/i386/sse.md
gcc/testsuite/gcc.target/i386/pr110788.c [new file with mode: 0644]

index 35fd66ed4aa0bcda35fe54888eb8a9da06a2d55a..51961bbfc0b535b80e772bcd2ded9578862e39fd 100644 (file)
    (set_attr "prefix" "evex")
    (set_attr "mode" "<sseinsnmode>")])
 
+;; Use an unspec to prevent the RTL optimizers from combining zero_extend +
+;; vec_duplicate into vpbroadcastm, which could need an extra kmov after RA.
 (define_insn "avx512cd_maskb_vec_dup<mode>"
   [(set (match_operand:VI8_AVX512VL 0 "register_operand" "=v")
        (vec_duplicate:VI8_AVX512VL
          (zero_extend:DI
-           (match_operand:QI 1 "register_operand" "k"))))]
+           (match_operand:QI 1 "register_operand" "k"))))
+   (unspec [(const_int 0)] UNSPEC_MASKOP)]
   "TARGET_AVX512CD"
   "vpbroadcastmb2q\t{%1, %0|%0, %1}"
   [(set_attr "type" "mskmov")
   [(set (match_operand:VI4_AVX512VL 0 "register_operand" "=v")
        (vec_duplicate:VI4_AVX512VL
          (zero_extend:SI
-           (match_operand:HI 1 "register_operand" "k"))))]
+           (match_operand:HI 1 "register_operand" "k"))))
+   (unspec [(const_int 0)] UNSPEC_MASKOP)]
   "TARGET_AVX512CD"
   "vpbroadcastmw2d\t{%1, %0|%0, %1}"
   [(set_attr "type" "mskmov")
diff --git a/gcc/testsuite/gcc.target/i386/pr110788.c b/gcc/testsuite/gcc.target/i386/pr110788.c
new file mode 100644 (file)
index 0000000..4cf1676
--- /dev/null
@@ -0,0 +1,11 @@
+/* { dg-do compile } */
+/* { dg-options "-O3 -march=cascadelake --param vect-partial-vector-usage=2" } */
+/* { dg-final { scan-assembler-not "vpbroadcastm" } } */
+
+double a[1024], b[1024];
+
+void foo (int n)
+{
+  for (int i = 0; i < n; ++i)
+    a[i] = b[i] * 3.;
+}