git.ipfire.org Git - thirdparty/gcc.git/commitdiff
backport: re PR target/79932 (_mm512_packus_epi32 does not compile under -O0)
author Jakub Jelinek <jakub@redhat.com>
Tue, 30 May 2017 08:08:59 +0000 (10:08 +0200)
committer Jakub Jelinek <jakub@gcc.gnu.org>
Tue, 30 May 2017 08:08:59 +0000 (10:08 +0200)
Backported from mainline
2017-03-09  Jakub Jelinek  <jakub@redhat.com>

PR target/79932
* config/i386/avx512bwintrin.h (_mm512_packs_epi32,
_mm512_maskz_packs_epi32, _mm512_mask_packs_epi32,
_mm512_packus_epi32, _mm512_maskz_packus_epi32,
_mm512_mask_packus_epi32): Move definitions outside of __OPTIMIZE__
guarded section.

* gcc.target/i386/pr79932-1.c: New test.

From-SVN: r248656

gcc/ChangeLog
gcc/config/i386/avx512bwintrin.h
gcc/testsuite/ChangeLog
gcc/testsuite/gcc.target/i386/pr79932-1.c [new file with mode: 0644]

diff --git a/gcc/ChangeLog b/gcc/ChangeLog
index 25502207240df1948a8008bfef13f21e109a11a0..335f83aaf858134307d0067282f718272b65e301 100644 (file)
@@ -1,6 +1,15 @@
 2017-05-30  Jakub Jelinek  <jakub@redhat.com>
 
        Backported from mainline
+       2017-03-09  Jakub Jelinek  <jakub@redhat.com>
+
+       PR target/79932
+       * config/i386/avx512bwintrin.h (_mm512_packs_epi32,
+       _mm512_maskz_packs_epi32, _mm512_mask_packs_epi32,
+       _mm512_packus_epi32, _mm512_maskz_packus_epi32,
+       _mm512_mask_packus_epi32): Move definitions outside of __OPTIMIZE__
+       guarded section.
+
        2017-03-07  Jakub Jelinek  <jakub@redhat.com>
 
        PR rtl-optimization/79901
diff --git a/gcc/config/i386/avx512bwintrin.h b/gcc/config/i386/avx512bwintrin.h
index 7a7ed68c997ca3949f78a9021432a00ceca41265..56c59a9c6dd94404f0851fdab2b87a047afbc086 100644 (file)
@@ -2420,6 +2420,72 @@ _mm512_cmple_epi16_mask (__m512i __X, __m512i __Y)
                                                  (__mmask32) -1);
 }
 
+extern __inline __m512i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm512_packs_epi32 (__m512i __A, __m512i __B)
+{
+  return (__m512i) __builtin_ia32_packssdw512_mask ((__v16si) __A,
+                                                   (__v16si) __B,
+                                                   (__v32hi)
+                                                   _mm512_setzero_hi (),
+                                                   (__mmask32) -1);
+}
+
+extern __inline __m512i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm512_maskz_packs_epi32 (__mmask32 __M, __m512i __A, __m512i __B)
+{
+  return (__m512i) __builtin_ia32_packssdw512_mask ((__v16si) __A,
+                                                   (__v16si) __B,
+                                                   (__v32hi)
+                                                   _mm512_setzero_hi (),
+                                                   __M);
+}
+
+extern __inline __m512i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm512_mask_packs_epi32 (__m512i __W, __mmask32 __M, __m512i __A,
+                        __m512i __B)
+{
+  return (__m512i) __builtin_ia32_packssdw512_mask ((__v16si) __A,
+                                                   (__v16si) __B,
+                                                   (__v32hi) __W,
+                                                   __M);
+}
+
+extern __inline __m512i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm512_packus_epi32 (__m512i __A, __m512i __B)
+{
+  return (__m512i) __builtin_ia32_packusdw512_mask ((__v16si) __A,
+                                                   (__v16si) __B,
+                                                   (__v32hi)
+                                                   _mm512_setzero_hi (),
+                                                   (__mmask32) -1);
+}
+
+extern __inline __m512i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm512_maskz_packus_epi32 (__mmask32 __M, __m512i __A, __m512i __B)
+{
+  return (__m512i) __builtin_ia32_packusdw512_mask ((__v16si) __A,
+                                                   (__v16si) __B,
+                                                   (__v32hi)
+                                                   _mm512_setzero_hi (),
+                                                   __M);
+}
+
+extern __inline __m512i
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
+_mm512_mask_packus_epi32 (__m512i __W, __mmask32 __M, __m512i __A,
+                         __m512i __B)
+{
+  return (__m512i) __builtin_ia32_packusdw512_mask ((__v16si) __A,
+                                                   (__v16si) __B,
+                                                   (__v32hi) __W,
+                                                   __M);
+}
+
 #ifdef __OPTIMIZE__
 extern __inline __m512i
 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
@@ -2743,72 +2809,6 @@ _mm512_cmp_epu8_mask (__m512i __X, __m512i __Y, const int __P)
                                                   (__mmask64) -1);
 }
 
-extern __inline __m512i
-__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
-_mm512_packs_epi32 (__m512i __A, __m512i __B)
-{
-  return (__m512i) __builtin_ia32_packssdw512_mask ((__v16si) __A,
-                                                   (__v16si) __B,
-                                                   (__v32hi)
-                                                   _mm512_setzero_hi (),
-                                                   (__mmask32) -1);
-}
-
-extern __inline __m512i
-__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
-_mm512_maskz_packs_epi32 (__mmask32 __M, __m512i __A, __m512i __B)
-{
-  return (__m512i) __builtin_ia32_packssdw512_mask ((__v16si) __A,
-                                                   (__v16si) __B,
-                                                   (__v32hi)
-                                                   _mm512_setzero_hi(),
-                                                   __M);
-}
-
-extern __inline __m512i
-__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
-_mm512_mask_packs_epi32 (__m512i __W, __mmask32 __M, __m512i __A,
-                        __m512i __B)
-{
-  return (__m512i) __builtin_ia32_packssdw512_mask ((__v16si) __A,
-                                                   (__v16si) __B,
-                                                   (__v32hi) __W,
-                                                   __M);
-}
-
-extern __inline __m512i
-__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
-_mm512_packus_epi32 (__m512i __A, __m512i __B)
-{
-  return (__m512i) __builtin_ia32_packusdw512_mask ((__v16si) __A,
-                                                   (__v16si) __B,
-                                                   (__v32hi)
-                                                   _mm512_setzero_hi (),
-                                                   (__mmask32) -1);
-}
-
-extern __inline __m512i
-__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
-_mm512_maskz_packus_epi32 (__mmask32 __M, __m512i __A, __m512i __B)
-{
-  return (__m512i) __builtin_ia32_packusdw512_mask ((__v16si) __A,
-                                                   (__v16si) __B,
-                                                   (__v32hi)
-                                                   _mm512_setzero_hi(),
-                                                   __M);
-}
-
-extern __inline __m512i
-__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
-_mm512_mask_packus_epi32 (__m512i __W, __mmask32 __M, __m512i __A,
-                         __m512i __B)
-{
-  return (__m512i) __builtin_ia32_packusdw512_mask ((__v16si) __A,
-                                                   (__v16si) __B,
-                                                   (__v32hi) __W,
-                                                   __M);
-}
-
 extern __inline __m512i
 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
 _mm512_bslli_epi128 (__m512i __A, const int __N)
diff --git a/gcc/testsuite/ChangeLog b/gcc/testsuite/ChangeLog
index 656f9ca647b959617ddb2f924a374f28532a2214..a1b4ea59b5376951bf2461736293ed1c790d9866 100644 (file)
@@ -1,6 +1,11 @@
 2017-05-30  Jakub Jelinek  <jakub@redhat.com>
 
        Backported from mainline
+       2017-03-09  Jakub Jelinek  <jakub@redhat.com>
+
+       PR target/79932
+       * gcc.target/i386/pr79932-1.c: New test.
+
        2017-03-07  Jakub Jelinek  <jakub@redhat.com>
 
        PR rtl-optimization/79901
diff --git a/gcc/testsuite/gcc.target/i386/pr79932-1.c b/gcc/testsuite/gcc.target/i386/pr79932-1.c
new file mode 100644 (file)
index 0000000..fee42b9
--- /dev/null
@@ -0,0 +1,19 @@
+/* PR target/79932 */
+/* { dg-do compile } */
+/* { dg-options "-O0 -mavx512bw" } */
+
+#include <x86intrin.h>
+
+__m512i a, b, c, d, e, f, g, h, i;
+__mmask32 m;
+
+void
+foo (void)
+{
+  d = _mm512_packs_epi32 (a, b);
+  e = _mm512_maskz_packs_epi32 (m, a, b);
+  f = _mm512_mask_packs_epi32 (c, m, a, b);
+  g = _mm512_packus_epi32 (a, b);
+  h = _mm512_maskz_packus_epi32 (m, a, b);
+  i = _mm512_mask_packus_epi32 (c, m, a, b);
+}