git.ipfire.org Git - thirdparty/gcc.git/commitdiff
i386: Optimize pinsrq of 0 with index 1 into movq [PR94866]
author: Uros Bizjak <ubizjak@gmail.com>
Thu, 24 Aug 2023 20:23:52 +0000 (22:23 +0200)
committer: Uros Bizjak <ubizjak@gmail.com>
Thu, 24 Aug 2023 20:24:43 +0000 (22:24 +0200)
Add new pattern involving vec_merge RTX that is produced by combine from the
combination of sse4_1_pinsrq and *movdi_internal:

    7: r86:DI=0
    8: r85:V2DI=vec_merge(vec_duplicate(r86:DI),r87:V2DI,0x2)
      REG_DEAD r87:V2DI
      REG_DEAD r86:DI
Successfully matched this instruction:
(set (reg:V2DI 85 [ a ])
    (vec_merge:V2DI (reg:V2DI 87)
        (const_vector:V2DI [
                (const_int 0 [0]) repeated x2
            ])
        (const_int 1 [0x1])))

PR target/94866

gcc/ChangeLog:

* config/i386/sse.md (*sse2_movq128_<mode>_1): New insn pattern.

gcc/testsuite/ChangeLog:

* g++.target/i386/pr94866.C: New test.

gcc/config/i386/sse.md
gcc/testsuite/g++.target/i386/pr94866.C [new file with mode: 0644]

index fb3db940d3d23fdeb023025f7d22628acf3941df..59a0eb1c63f32e64dec71ecc5d907ffe4cbb81fa 100644 (file)
    (set_attr "prefix" "maybe_vex")
    (set_attr "mode" "TI")])
 
+;; Match a vec_merge of operand 1 with an all-zero operand 2 under mask 1
+;; and emit it as a single movq.  Combine produces this RTX from
+;; sse4_1_pinsrq and *movdi_internal when zero is inserted at index 1
+;; (PR target/94866).
+;; NOTE(review): VI8F_128 is a mode iterator defined elsewhere in sse.md;
+;; presumably the 128-bit modes with 64-bit elements -- confirm.
+(define_insn "*sse2_movq128_<mode>_1"
+  [(set (match_operand:VI8F_128 0 "register_operand" "=v")
+       (vec_merge:VI8F_128
+         (match_operand:VI8F_128 1 "nonimmediate_operand" "vm")
+         (match_operand:VI8F_128 2 "const0_operand")
+         (const_int 1)))]
+  "TARGET_SSE2"
+  "%vmovq\t{%1, %0|%0, %q1}"
+  [(set_attr "type" "ssemov")
+   (set_attr "prefix" "maybe_vex")
+   (set_attr "mode" "TI")])
+
 ;; Move a DI from a 32-bit register pair (e.g. %edx:%eax) to an xmm.
 ;; We'd rather avoid this entirely; if the 32-bit reg pair was loaded
 ;; from memory, we'd prefer to load the memory directly into the %xmm
diff --git a/gcc/testsuite/g++.target/i386/pr94866.C b/gcc/testsuite/g++.target/i386/pr94866.C
new file mode 100644 (file)
index 0000000..eb0f5ef
--- /dev/null
@@ -0,0 +1,13 @@
+// PR target/94866
+// { dg-do compile }
+// { dg-options "-O2 -msse4.1" }
+// { dg-require-effective-target c++11 }
+
+typedef long long v2di __attribute__((vector_size(16)));  // 16-byte vector of long long elements
+
+v2di _mm_move_epi64(v2di a)  // keeps a[0] and zeroes the other element; the dg-final scan expects one movq using %xmm
+{
+    return v2di{a[0], 0LL};
+}
+
+// { dg-final { scan-assembler-times "movq\[ \\t\]+\[^\n\]*%xmm" 1 } }