]> git.ipfire.org Git - thirdparty/gcc.git/commitdiff
LoongArch: Accept ADD, IOR or XOR when combining objects with no bits in common ...
authorXi Ruoyao <xry111@xry111.site>
Mon, 10 Feb 2025 15:39:24 +0000 (23:39 +0800)
committerXi Ruoyao <xry111@xry111.site>
Wed, 19 Feb 2025 06:34:25 +0000 (14:34 +0800)
Since r15-1120, multi-word shifts/rotates produces PLUS instead of IOR.
It's generally a good thing (allowing to use our alsl instruction or
similar instrunction on other architectures), but it's preventing us
from using bytepick.  For example, if we shift a __int128 by 16 bits,
the higher word can be produced via a single bytepick.d instruction with
immediate 2, but we got:

srli.d $r12,$r4,48
slli.d $r5,$r5,16
slli.d $r4,$r4,16
add.d $r5,$r12,$r5
jr $r1

This wasn't work with GCC 14, but after r15-6490 it's supposed to work
if IOR was used instead of PLUS.

To fix this, add a code iterator to match IOR, XOR, and PLUS and use it
instead of just IOR if we know the operands have no overlapping bits.

gcc/ChangeLog:

PR target/115478
* config/loongarch/loongarch.md (any_or_plus): New
define_code_iterator.
(bstrins_<mode>_for_ior_mask): Use any_or_plus instead of ior.
(bytepick_w_<bytepick_imm>): Likewise.
(bytepick_d_<bytepick_imm>): Likewise.
(bytepick_d_<bytepick_imm>_rev): Likewise.

gcc/testsuite/ChangeLog:

PR target/115478
* gcc.target/loongarch/bytepick_shift_128.c: New test.

gcc/config/loongarch/loongarch.md
gcc/testsuite/gcc.target/loongarch/bytepick_shift_128.c [new file with mode: 0644]

index 36d140a9e942334f18166f376fe3cd7468d2e6d4..6c3fdfea00a29245bd722f384d9bf83caea4b420 100644 (file)
                                   (xor "uns_arith_operand")])
 (define_code_attr is_and [(and "true") (ior "false") (xor "false")])
 
+;; If we know the operands does not have overlapping bits, use this
+;; instead of just ior to cover more cases.
+(define_code_iterator any_or_plus [any_or plus])
+
 ;; This code iterator allows unsigned and signed division to be generated
 ;; from the same template.
 (define_code_iterator any_div [div udiv mod umod])
 
 (define_insn_and_split "*bstrins_<mode>_for_ior_mask"
   [(set (match_operand:GPR 0 "register_operand" "=r")
-       (ior:GPR (and:GPR (match_operand:GPR 1 "register_operand" "r")
-                         (match_operand:GPR 2 "const_int_operand" "i"))
-                (and:GPR (match_operand:GPR 3 "register_operand" "r")
-                         (match_operand:GPR 4 "const_int_operand" "i"))))]
+       (any_or_plus:GPR
+         (and:GPR (match_operand:GPR 1 "register_operand" "r")
+                  (match_operand:GPR 2 "const_int_operand" "i"))
+         (and:GPR (match_operand:GPR 3 "register_operand" "r")
+                  (match_operand:GPR 4 "const_int_operand" "i"))))]
   "loongarch_pre_reload_split ()
    && loongarch_use_bstrins_for_ior_with_mask (<MODE>mode, operands)"
   "#"
     DONE;
   })
 
-(define_insn "bytepick_w_<bytepick_imm>"
+(define_insn "*bytepick_w_<bytepick_imm>"
   [(set (match_operand:SI 0 "register_operand" "=r")
-       (ior:SI (lshiftrt:SI (match_operand:SI 1 "register_operand" "r")
-                            (const_int <bytepick_w_lshiftrt_amount>))
-               (ashift:SI (match_operand:SI 2 "register_operand" "r")
-                          (const_int bytepick_w_ashift_amount))))]
+       (any_or_plus:SI
+         (lshiftrt:SI (match_operand:SI 1 "register_operand" "r")
+                      (const_int <bytepick_w_lshiftrt_amount>))
+         (ashift:SI (match_operand:SI 2 "register_operand" "r")
+                    (const_int bytepick_w_ashift_amount))))]
   ""
   "bytepick.w\t%0,%1,%2,<bytepick_imm>"
   [(set_attr "mode" "SI")])
   "bytepick.w\t%0,%2,%1,1"
   [(set_attr "mode" "SI")])
 
-(define_insn "bytepick_d_<bytepick_imm>"
+(define_insn "*bytepick_d_<bytepick_imm>"
   [(set (match_operand:DI 0 "register_operand" "=r")
-       (ior:DI (lshiftrt (match_operand:DI 1 "register_operand" "r")
-                         (const_int <bytepick_d_lshiftrt_amount>))
-               (ashift (match_operand:DI 2 "register_operand" "r")
-                       (const_int bytepick_d_ashift_amount))))]
+       (any_or_plus:DI
+         (lshiftrt (match_operand:DI 1 "register_operand" "r")
+                   (const_int <bytepick_d_lshiftrt_amount>))
+         (ashift (match_operand:DI 2 "register_operand" "r")
+                 (const_int bytepick_d_ashift_amount))))]
   "TARGET_64BIT"
   "bytepick.d\t%0,%1,%2,<bytepick_imm>"
   [(set_attr "mode" "DI")])
 
-(define_insn "bytepick_d_<bytepick_imm>_rev"
+(define_insn "*bytepick_d_<bytepick_imm>_rev"
   [(set (match_operand:DI 0 "register_operand" "=r")
-       (ior:DI (ashift (match_operand:DI 1 "register_operand" "r")
-                       (const_int bytepick_d_ashift_amount))
-               (lshiftrt (match_operand:DI 2 "register_operand" "r")
-                         (const_int <bytepick_d_lshiftrt_amount>))))]
+       (any_or_plus:DI
+         (ashift (match_operand:DI 1 "register_operand" "r")
+                 (const_int bytepick_d_ashift_amount))
+         (lshiftrt (match_operand:DI 2 "register_operand" "r")
+                   (const_int <bytepick_d_lshiftrt_amount>))))]
   "TARGET_64BIT"
   "bytepick.d\t%0,%2,%1,<bytepick_imm>"
   [(set_attr "mode" "DI")])
diff --git a/gcc/testsuite/gcc.target/loongarch/bytepick_shift_128.c b/gcc/testsuite/gcc.target/loongarch/bytepick_shift_128.c
new file mode 100644 (file)
index 0000000..d3a9772
--- /dev/null
@@ -0,0 +1,9 @@
+/* { dg-do compile } */
+/* { dg-options "-O2 -march=loongarch64 -mabi=lp64d" } */
+/* { dg-final { scan-assembler "bytepick\\.d" } } */
+
+__int128
+test (__int128 a)
+{
+  return a << 16;
+}