From: Haochen Gui Date: Wed, 30 Nov 2022 07:05:59 +0000 (+0800) Subject: rs6000: Generates permute index directly for little endian targets (PR100866) X-Git-Tag: basepoints/gcc-14~2784 X-Git-Url: http://git.ipfire.org/cgi-bin/gitweb.cgi?a=commitdiff_plain;h=9d68cba5eb20442f8075b8f92d1b20a00022852f;p=thirdparty%2Fgcc.git rs6000: Generates permute index directly for little endian targets (PR100866) 2022-10-11 Haochen Gui gcc/ PR target/100866 * config/rs6000/rs6000-call.cc (swap_endian_selector_for_mode): Generate permute index directly for little endian targets. * config/rs6000/vsx.md (revb_): Call vprem directly with corresponding permute indexes. gcc/testsuite/ PR target/100866 * gcc.target/powerpc/pr100866-1.c: New. --- diff --git a/gcc/config/rs6000/rs6000-call.cc b/gcc/config/rs6000/rs6000-call.cc index 6da4de671378..c2a4e4f4e271 100644 --- a/gcc/config/rs6000/rs6000-call.cc +++ b/gcc/config/rs6000/rs6000-call.cc @@ -2802,6 +2802,8 @@ rs6000_gimplify_va_arg (tree valist, tree type, gimple_seq *pre_p, return build_va_arg_indirect_ref (addr); } +/* The selector (perm) is expected to be used with vperm direct as the + function generates reversed perm for little endian with this patch. */ rtx swap_endian_selector_for_mode (machine_mode mode) { @@ -2834,7 +2836,11 @@ swap_endian_selector_for_mode (machine_mode mode) } for (i = 0; i < 16; ++i) - perm[i] = GEN_INT (swaparray[i]); + if (BYTES_BIG_ENDIAN) + perm[i] = GEN_INT (swaparray[i]); + else + /* Generates the reversed perm for little endian. */ + perm[i] = GEN_INT (~swaparray[i] & 0x0000001f); return force_reg (V16QImode, gen_rtx_CONST_VECTOR (V16QImode, gen_rtvec_v (16, perm))); diff --git a/gcc/config/rs6000/vsx.md b/gcc/config/rs6000/vsx.md index fb5cf04147e5..992fbc983be5 100644 --- a/gcc/config/rs6000/vsx.md +++ b/gcc/config/rs6000/vsx.md @@ -6099,8 +6099,8 @@ to the endian mode in use, i.e. in LE mode, put elements in BE order. */ rtx sel = swap_endian_selector_for_mode (mode); - emit_insn (gen_altivec_vperm_ (operands[0], operands[1], - operands[1], sel)); + emit_insn (gen_altivec_vperm__direct (operands[0], operands[1], + operands[1], sel)); } } diff --git a/gcc/testsuite/gcc.target/powerpc/pr100866-1.c b/gcc/testsuite/gcc.target/powerpc/pr100866-1.c new file mode 100644 index 000000000000..63872f21bf8b --- /dev/null +++ b/gcc/testsuite/gcc.target/powerpc/pr100866-1.c @@ -0,0 +1,11 @@ +/* { dg-do compile } */ +/* { dg-require-effective-target powerpc_p8vector_ok } */ +/* { dg-options "-O2 -mdejagnu-cpu=power8" } */ +/* { dg-final { scan-assembler-not {\mxxlnor\M} } } */ + +#include + +vector unsigned int revb (vector unsigned int a) +{ + return vec_revb(a); +}