rtx *, rtx *, rtx *);
void aarch64_expand_subvti (rtx, rtx, rtx,
rtx, rtx, rtx, rtx, bool);
+int aarch64_exact_log2_inverse (unsigned int, rtx);
/* Initialize builtins for SIMD intrinsics. */
(define_insn "aarch64_simd_vec_set_zero<mode>"
[(set (match_operand:VALL_F16 0 "register_operand" "=w")
(vec_merge:VALL_F16
- (match_operand:VALL_F16 1 "aarch64_simd_imm_zero" "")
- (match_operand:VALL_F16 3 "register_operand" "0")
+ (match_operand:VALL_F16 1 "register_operand" "0")
+ (match_operand:VALL_F16 3 "aarch64_simd_imm_zero" "")
(match_operand:SI 2 "immediate_operand" "i")))]
- "TARGET_SIMD && exact_log2 (INTVAL (operands[2])) >= 0"
+ "TARGET_SIMD && aarch64_exact_log2_inverse (<nunits>, operands[2]) >= 0"
{
- int elt = ENDIAN_LANE_N (<nunits>, exact_log2 (INTVAL (operands[2])));
+ int elt = ENDIAN_LANE_N (<nunits>,
+ aarch64_exact_log2_inverse (<nunits>,
+ operands[2]));
operands[2] = GEN_INT ((HOST_WIDE_INT) 1 << elt);
return "ins\\t%0.<Vetype>[%p2], <vwcore>zr";
}
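As an illustration of what this pattern is meant to match (a hedged sketch, not part of the patch; the function name zero_lane_2 is made up): zeroing a single lane through the ACLE intrinsic vsetq_lane_s16 should, once the canonicalized vec_merge reaches this pattern, still emit a single ins from the zero register, with %p2 printing the index of the zeroed lane.

    #include <arm_neon.h>

    /* Compiled for AArch64, this is expected to produce something like
         ins  v0.h[2], wzr
       on both little- and big-endian targets.  */
    int16x8_t
    zero_lane_2 (int16x8_t x)
    {
      return vsetq_lane_s16 (0, x, 2);
    }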
return true;
}
+/* Return the base 2 logarithm of the bit inverse of OP masked by the lowest
+ NELTS bits, if that masked inverse is a power of 2. Otherwise, return -1. */
+
+int
+aarch64_exact_log2_inverse (unsigned int nelts, rtx op)
+{
+ return exact_log2 ((~INTVAL (op))
+ & ((HOST_WIDE_INT_1U << nelts) - 1));
+}
+
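A quick worked check of the masked-inverse computation, as a standalone C sketch (my_exact_log2 and log2_inverse below are stand-ins for GCC's exact_log2 and the new aarch64_exact_log2_inverse; they are not part of the patch):

    #include <stdio.h>

    /* Stand-in for exact_log2: log2 of X if X is a power of 2, else -1.  */
    static int
    my_exact_log2 (unsigned long long x)
    {
      return (x != 0 && (x & (x - 1)) == 0) ? __builtin_ctzll (x) : -1;
    }

    /* Mirrors aarch64_exact_log2_inverse for an integer mask OP.  */
    static int
    log2_inverse (unsigned int nelts, unsigned long long op)
    {
      return my_exact_log2 (~op & ((1ULL << nelts) - 1));
    }

    int
    main (void)
    {
      printf ("%d\n", log2_inverse (4, 0xb)); /* 2: ~0b1011 & 0xf == 0b0100.  */
      printf ("%d\n", log2_inverse (4, 0x9)); /* -1: ~0b1001 & 0xf == 0b0110.  */
      return 0;
    }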
/* Bounds-check lanes. Ensure OPERAND lies between LOW (inclusive) and
HIGH (exclusive). */
void
return gen_rtx_CONST_VECTOR (mode, v);
}
+ if (swap_commutative_operands_p (op0, op1)
+ /* If the two operands have the same precedence, canonicalize so that
+ the first bit of the mask selects the first operand. */
+ || (!swap_commutative_operands_p (op1, op0) && !(sel & 1)))
+ return simplify_gen_ternary (code, mode, mode, op1, op0,
+ GEN_INT (~sel & mask));
+
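For concreteness, an illustrative example of the new canonicalization (not taken from the patch): with a four-element mode such as V4HI,

    (vec_merge (const_vector:V4HI [0 0 0 0])
               (reg:V4HI x)
               (const_int 4))

is rewritten to

    (vec_merge (reg:V4HI x)
               (const_vector:V4HI [0 0 0 0])
               (const_int 11))

because the constant vector has lower commutative-operand precedence than the register, and the mask 4 (0b0100) becomes ~4 & 0xf == 11 (0b1011). This is the form that the updated aarch64_simd_vec_set_zero<mode> pattern above expects.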
/* Replace (vec_merge (vec_merge a b m) c n) with (vec_merge b c n)
if no element from a appears in the result. */
if (GET_CODE (op0) == VEC_MERGE)