]> git.ipfire.org Git - thirdparty/gcc.git/commitdiff
rs6000: Generates permute index directly for little endian targets (PR100866)
authorHaochen Gui <guihaoc@gcc.gnu.org>
Wed, 30 Nov 2022 07:05:59 +0000 (15:05 +0800)
committerHaochen Gui <guihaoc@gcc.gnu.org>
Thu, 1 Dec 2022 02:06:11 +0000 (10:06 +0800)
2022-10-11  Haochen Gui <guihaoc@linux.ibm.com>

gcc/
PR target/100866
* config/rs6000/rs6000-call.cc (swap_endian_selector_for_mode):
Generate permute index directly for little endian targets.
* config/rs6000/vsx.md (revb_<mode>): Call vprem directly with
corresponding permute indexes.

gcc/testsuite/
PR target/100866
* gcc.target/powerpc/pr100866-1.c: New.

gcc/config/rs6000/rs6000-call.cc
gcc/config/rs6000/vsx.md
gcc/testsuite/gcc.target/powerpc/pr100866-1.c [new file with mode: 0644]

index 6da4de67137871ee887f052ec87a937b9c1c8a88..c2a4e4f4e27116436a066870c85c5f493d9fa46a 100644 (file)
@@ -2802,6 +2802,8 @@ rs6000_gimplify_va_arg (tree valist, tree type, gimple_seq *pre_p,
   return build_va_arg_indirect_ref (addr);
 }
 
+/* The selector (perm) is expected to be used with vperm direct as the
+   function generates reversed perm for little endian with this patch.  */
 rtx
 swap_endian_selector_for_mode (machine_mode mode)
 {
@@ -2834,7 +2836,11 @@ swap_endian_selector_for_mode (machine_mode mode)
     }
 
   for (i = 0; i < 16; ++i)
-    perm[i] = GEN_INT (swaparray[i]);
+    if (BYTES_BIG_ENDIAN)
+      perm[i] = GEN_INT (swaparray[i]);
+    else
+      /* Generates the reversed perm for little endian.  */
+      perm[i] = GEN_INT (~swaparray[i] & 0x0000001f);
 
   return force_reg (V16QImode, gen_rtx_CONST_VECTOR (V16QImode,
                                                     gen_rtvec_v (16, perm)));
index fb5cf04147e5eb8e8be22cd175ea8de3ff340c47..992fbc983be52368973b6f688cf4f31ebe574427 100644 (file)
             to the endian mode in use, i.e. in LE mode, put elements
             in BE order.  */
          rtx sel = swap_endian_selector_for_mode (<MODE>mode);
-         emit_insn (gen_altivec_vperm_<mode> (operands[0], operands[1],
-                                              operands[1], sel));
+         emit_insn (gen_altivec_vperm_<mode>_direct (operands[0], operands[1],
+                                                     operands[1], sel));
        }
     }
 
diff --git a/gcc/testsuite/gcc.target/powerpc/pr100866-1.c b/gcc/testsuite/gcc.target/powerpc/pr100866-1.c
new file mode 100644 (file)
index 0000000..63872f2
--- /dev/null
@@ -0,0 +1,11 @@
+/* { dg-do compile } */
+/* { dg-require-effective-target powerpc_p8vector_ok } */
+/* { dg-options "-O2 -mdejagnu-cpu=power8" } */
+/* { dg-final { scan-assembler-not {\mxxlnor\M} } } */
+
+#include <altivec.h>
+
+vector unsigned int revb (vector unsigned int a)
+{
+   return vec_revb(a);
+}