]> git.ipfire.org Git - thirdparty/gcc.git/commitdiff
x86: yet more PR target/100711-like splitting
authorJan Beulich <jbeulich@suse.com>
Wed, 5 Jul 2023 07:49:16 +0000 (09:49 +0200)
committerJan Beulich <jbeulich@suse.com>
Wed, 5 Jul 2023 07:49:16 +0000 (09:49 +0200)
Following two-operand bitwise operations, add another splitter to also
deal with not followed by broadcast all on its own, which can be
expressed as simple embedded broadcast instead once a broadcast operand
is actually permitted in the respective insn. While there also permit
a broadcast operand in the corresponding expander.

gcc/

PR target/100711
* config/i386/sse.md: New splitters to simplify
not;vec_duplicate as a singular vpternlog.
(one_cmpl<mode>2): Allow broadcast for operand 1.
(<mask_codefor>one_cmpl<mode>2<mask_name>): Likewise.

gcc/testsuite/

PR target/100711
* gcc.target/i386/pr100711-6.c: New test.

gcc/config/i386/sse.md
gcc/testsuite/gcc.target/i386/pr100711-6.c [new file with mode: 0644]

index d828143c189f5cba5ed7183f9ad25438d190f747..418c337a77529426032928e4b3fe6a8216e9020e 100644 (file)
 
 (define_expand "one_cmpl<mode>2"
   [(set (match_operand:VI 0 "register_operand")
-       (xor:VI (match_operand:VI 1 "vector_operand")
+       (xor:VI (match_operand:VI 1 "bcst_vector_operand")
                (match_dup 2)))]
   "TARGET_SSE"
 {
 
 (define_insn "<mask_codefor>one_cmpl<mode>2<mask_name>"
   [(set (match_operand:VI 0 "register_operand" "=v,v")
-       (xor:VI (match_operand:VI 1 "nonimmediate_operand" "v,m")
+       (xor:VI (match_operand:VI 1 "bcst_vector_operand" "vBr,m")
                (match_operand:VI 2 "vector_all_ones_operand" "BC,BC")))]
   "TARGET_AVX512F
    && (!<mask_applied>
                      (symbol_ref "<MODE_SIZE> == 64 || TARGET_AVX512VL")
                      (const_int 1)))])
 
+(define_split
+  [(set (match_operand:VI48_AVX512F 0 "register_operand")
+       (vec_duplicate:VI48_AVX512F
+         (not:<ssescalarmode>
+           (match_operand:<ssescalarmode> 1 "nonimmediate_operand"))))]
+  "<MODE_SIZE> == 64 || TARGET_AVX512VL
+   || (TARGET_AVX512F && !TARGET_PREFER_AVX256)"
+  [(set (match_dup 0)
+       (xor:VI48_AVX512F
+         (vec_duplicate:VI48_AVX512F (match_dup 1))
+         (match_dup 2)))]
+  "operands[2] = CONSTM1_RTX (<MODE>mode);")
+
 (define_expand "<sse2_avx2>_andnot<mode>3"
   [(set (match_operand:VI_AVX2 0 "register_operand")
        (and:VI_AVX2
diff --git a/gcc/testsuite/gcc.target/i386/pr100711-6.c b/gcc/testsuite/gcc.target/i386/pr100711-6.c
new file mode 100644 (file)
index 0000000..7142a98
--- /dev/null
@@ -0,0 +1,18 @@
+/* { dg-do compile } */
+/* { dg-options "-mavx512f -mno-avx512vl -mprefer-vector-width=512 -O2" } */
+
+typedef int v16si __attribute__ ((vector_size (64)));
+typedef long long v8di __attribute__((vector_size (64)));
+
+v16si foo_v16si (const int *a)
+{
+    return (__extension__ (v16si) {~*a, ~*a, ~*a, ~*a, ~*a, ~*a, ~*a, ~*a,
+                                  ~*a, ~*a, ~*a, ~*a, ~*a, ~*a, ~*a, ~*a});
+}
+
+v8di foo_v8di (const long long *a)
+{
+    return (__extension__ (v8di) {~*a, ~*a, ~*a, ~*a, ~*a, ~*a, ~*a, ~*a});
+}
+
+/* { dg-final { scan-assembler-times "vpternlog\[dq\]\[ \\t\]+\\\$0x55, \\(%(?:eax|rdi|edi)\\)\\\{1to\[1-8\]+\\\}" 2 } } */