]> git.ipfire.org Git - thirdparty/gcc.git/commitdiff
Lower AVX512 kmask comparison back to AVX2 comparison when op_{true,false} is vector...
authorliuhongt <hongtao.liu@intel.com>
Tue, 18 Jun 2024 06:03:42 +0000 (14:03 +0800)
committerliuhongt <hongtao.liu@intel.com>
Mon, 1 Jul 2024 05:20:08 +0000 (13:20 +0800)
gcc/ChangeLog
PR target/115517
* config/i386/sse.md
(*<avx512>_cvtmask2<ssemodesuffix><mode>_not): New pre_reload
splitter.
(*<avx512>_cvtmask2<ssemodesuffix><mode>_not): Ditto.
(*avx2_pcmp<mode>3_6): Ditto.
(*avx2_pcmp<mode>3_7): Ditto.

gcc/config/i386/sse.md

index 423f13d3982f41a650f351a47c17bf096eb40a56..3d790af3a2c87ddc82962c429429e71d77f5d7a1 100644 (file)
   [(set_attr "prefix" "evex")
    (set_attr "mode" "<sseinsnmode>")])
 
+(define_insn_and_split "*<avx512>_cvtmask2<ssemodesuffix><mode>_not"
+  [(set (match_operand:VI12_AVX512VL 0 "register_operand")
+       (vec_merge:VI12_AVX512VL
+         (match_operand:VI12_AVX512VL 2 "const0_operand")
+         (match_operand:VI12_AVX512VL 3 "vector_all_ones_operand")
+         (match_operand:<avx512fmaskmode> 1 "register_operand")))]
+  "TARGET_AVX512BW && ix86_pre_reload_split ()"
+  "#"
+  "&& 1"
+  [(set (match_dup 4)
+       (not:<avx512fmaskmode> (match_dup 1)))
+   (set (match_dup 0)
+       (vec_merge:VI12_AVX512VL
+         (match_dup 3)
+         (match_dup 2)
+         (match_dup 4)))]
+  "operands[4] = gen_reg_rtx (<avx512fmaskmode>mode);")
+
 (define_expand "<avx512>_cvtmask2<ssemodesuffix><mode>"
   [(set (match_operand:VI48_AVX512VL 0 "register_operand")
        (vec_merge:VI48_AVX512VL
    (set_attr "prefix" "evex")
    (set_attr "mode" "<sseinsnmode>")])
 
+(define_insn_and_split "*<avx512>_cvtmask2<ssemodesuffix><mode>_not"
+  [(set (match_operand:VI48_AVX512VL 0 "register_operand")
+       (vec_merge:VI48_AVX512VL
+         (match_operand:VI48_AVX512VL 2 "const0_operand")
+         (match_operand:VI48_AVX512VL 3 "vector_all_ones_operand")
+         (match_operand:<avx512fmaskmode> 1 "register_operand")))]
+  "TARGET_AVX512F && ix86_pre_reload_split ()"
+  "#"
+  "&& 1"
+  [(set (match_dup 4)
+       (not:<avx512fmaskmode> (match_dup 1)))
+   (set (match_dup 0)
+       (vec_merge:VI48_AVX512VL
+         (match_dup 3)
+         (match_dup 2)
+         (match_dup 4)))]
+  "operands[4] = gen_reg_rtx (<avx512fmaskmode>mode);")
+
 (define_insn "*<avx512>_cvtmask2<ssemodesuffix><mode>_pternlog_false_dep"
   [(set (match_operand:VI48_AVX512VL 0 "register_operand" "=v")
        (vec_merge:VI48_AVX512VL
     std::swap (operands[1], operands[2]);
 })
 
+(define_int_attr pcmp_usmin
+  [(UNSPEC_PCMP "smin") (UNSPEC_UNSIGNED_PCMP "umin")])
+
+(define_insn_and_split "*avx2_pcmp<mode>3_6"
+ [(set (match_operand:VI_128_256  0 "register_operand")
+       (vec_merge:VI_128_256
+         (match_operand:VI_128_256 1 "vector_all_ones_operand")
+         (match_operand:VI_128_256 2 "const0_operand")
+         (unspec:<avx512fmaskmode>
+           [(match_operand:VI_128_256 3 "nonimmediate_operand")
+            (match_operand:VI_128_256 4 "nonimmediate_operand")
+            (match_operand:SI 5 "const_0_to_7_operand")]
+            UNSPEC_PCMP_ITER)))]
+  "TARGET_AVX512VL && ix86_pre_reload_split ()
+   && (INTVAL (operands[5]) == 2 || INTVAL (operands[5]) == 5)"
+  "#"
+  "&& 1"
+  [(const_int 0)]
+{
+  rtx dst_min = gen_reg_rtx (<MODE>mode);
+
+  if (MEM_P (operands[3]) && MEM_P (operands[4]))
+    operands[3] = force_reg (<MODE>mode, operands[3]);
+  emit_insn (gen_<pcmp_usmin><mode>3 (dst_min, operands[3], operands[4]));
+  rtx eq_op = INTVAL (operands[5]) == 2 ? operands[3] : operands[4];
+  emit_move_insn (operands[0], gen_rtx_EQ (<MODE>mode, eq_op, dst_min));
+  DONE;
+})
+
+(define_insn_and_split "*avx2_pcmp<mode>3_7"
+ [(set (match_operand:VI_128_256  0 "register_operand")
+       (vec_merge:VI_128_256
+         (match_operand:VI_128_256 1 "const0_operand")
+         (match_operand:VI_128_256 2 "vector_all_ones_operand")
+         (unspec:<avx512fmaskmode>
+           [(match_operand:VI_128_256 3 "nonimmediate_operand")
+            (match_operand:VI_128_256 4 "nonimmediate_operand")
+            (match_operand:SI 5 "const_0_to_7_operand")]
+            UNSPEC_PCMP_ITER)))]
+  "TARGET_AVX512VL && ix86_pre_reload_split ()
+     /* NE is commutative.  */
+   && (INTVAL (operands[5]) == 4
+         /* LE, 3 must be register.  */
+       || INTVAL (operands[5]) == 2
+         /* NLT aka GE, 4 must be register and we swap operands.  */
+       || INTVAL (operands[5]) == 5)"
+  "#"
+  "&& 1"
+  [(const_int 0)]
+{
+  if (INTVAL (operands[5]) == 5)
+    std::swap (operands[3], operands[4]);
+
+  if (MEM_P (operands[3]))
+    operands[3] = force_reg (<MODE>mode, operands[3]);
+  enum rtx_code code = INTVAL (operands[5]) != 4 ? GT : EQ;
+  emit_move_insn (operands[0], gen_rtx_fmt_ee (code, <MODE>mode,
+                                              operands[3], operands[4]));
+  DONE;
+})
+
 (define_expand "<avx512>_eq<mode>3<mask_scalar_merge_name>"
   [(set (match_operand:<avx512fmaskmode> 0 "register_operand")
        (unspec:<avx512fmaskmode>