182 lines
5.4 KiB
Diff
182 lines
5.4 KiB
Diff
2017-03-07  Jakub Jelinek  <jakub@redhat.com>

	PR target/79932
	* config/i386/avx512bwintrin.h (_mm512_packs_epi32,
	_mm512_maskz_packs_epi32, _mm512_mask_packs_epi32,
	_mm512_packus_epi32, _mm512_maskz_packus_epi32,
	_mm512_mask_packus_epi32): Move definitions outside of __OPTIMIZE__
	guarded section.

	* gcc.target/i386/pr79932-1.c: New test.
|
|
|
|
--- gcc/config/i386/avx512bwintrin.h.jj 2017-01-23 18:09:48.000000000 +0100
|
|
+++ gcc/config/i386/avx512bwintrin.h 2017-03-07 07:47:28.900049849 +0100
|
|
@@ -2656,6 +2656,72 @@ _mm512_cmple_epi16_mask (__m512i __X, __
|
|
(__mmask32) -1);
|
|
}
|
|
|
|
+extern __inline __m512i
|
|
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
+_mm512_packs_epi32 (__m512i __A, __m512i __B)
|
|
+{
|
|
+ return (__m512i) __builtin_ia32_packssdw512_mask ((__v16si) __A,
|
|
+ (__v16si) __B,
|
|
+ (__v32hi)
|
|
+ _mm512_setzero_si512 (),
|
|
+ (__mmask32) -1);
|
|
+}
|
|
+
|
|
+extern __inline __m512i
|
|
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
+_mm512_maskz_packs_epi32 (__mmask32 __M, __m512i __A, __m512i __B)
|
|
+{
|
|
+ return (__m512i) __builtin_ia32_packssdw512_mask ((__v16si) __A,
|
|
+ (__v16si) __B,
|
|
+ (__v32hi)
|
|
+ _mm512_setzero_si512 (),
|
|
+ __M);
|
|
+}
|
|
+
|
|
+extern __inline __m512i
|
|
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
+_mm512_mask_packs_epi32 (__m512i __W, __mmask32 __M, __m512i __A,
|
|
+ __m512i __B)
|
|
+{
|
|
+ return (__m512i) __builtin_ia32_packssdw512_mask ((__v16si) __A,
|
|
+ (__v16si) __B,
|
|
+ (__v32hi) __W,
|
|
+ __M);
|
|
+}
|
|
+
|
|
+extern __inline __m512i
|
|
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
+_mm512_packus_epi32 (__m512i __A, __m512i __B)
|
|
+{
|
|
+ return (__m512i) __builtin_ia32_packusdw512_mask ((__v16si) __A,
|
|
+ (__v16si) __B,
|
|
+ (__v32hi)
|
|
+ _mm512_setzero_si512 (),
|
|
+ (__mmask32) -1);
|
|
+}
|
|
+
|
|
+extern __inline __m512i
|
|
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
+_mm512_maskz_packus_epi32 (__mmask32 __M, __m512i __A, __m512i __B)
|
|
+{
|
|
+ return (__m512i) __builtin_ia32_packusdw512_mask ((__v16si) __A,
|
|
+ (__v16si) __B,
|
|
+ (__v32hi)
|
|
+ _mm512_setzero_si512 (),
|
|
+ __M);
|
|
+}
|
|
+
|
|
+extern __inline __m512i
|
|
+__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
+_mm512_mask_packus_epi32 (__m512i __W, __mmask32 __M, __m512i __A,
|
|
+ __m512i __B)
|
|
+{
|
|
+ return (__m512i) __builtin_ia32_packusdw512_mask ((__v16si) __A,
|
|
+ (__v16si) __B,
|
|
+ (__v32hi) __W,
|
|
+ __M);
|
|
+}
|
|
+
|
|
#ifdef __OPTIMIZE__
|
|
extern __inline __mmask32
|
|
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
@@ -3012,72 +3078,6 @@ _mm512_cmp_epu8_mask (__m512i __X, __m51
|
|
}
|
|
|
|
extern __inline __m512i
|
|
-__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
-_mm512_packs_epi32 (__m512i __A, __m512i __B)
|
|
-{
|
|
- return (__m512i) __builtin_ia32_packssdw512_mask ((__v16si) __A,
|
|
- (__v16si) __B,
|
|
- (__v32hi)
|
|
- _mm512_setzero_si512 (),
|
|
- (__mmask32) -1);
|
|
-}
|
|
-
|
|
-extern __inline __m512i
|
|
-__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
-_mm512_maskz_packs_epi32 (__mmask32 __M, __m512i __A, __m512i __B)
|
|
-{
|
|
- return (__m512i) __builtin_ia32_packssdw512_mask ((__v16si) __A,
|
|
- (__v16si) __B,
|
|
- (__v32hi)
|
|
- _mm512_setzero_si512 (),
|
|
- __M);
|
|
-}
|
|
-
|
|
-extern __inline __m512i
|
|
-__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
-_mm512_mask_packs_epi32 (__m512i __W, __mmask32 __M, __m512i __A,
|
|
- __m512i __B)
|
|
-{
|
|
- return (__m512i) __builtin_ia32_packssdw512_mask ((__v16si) __A,
|
|
- (__v16si) __B,
|
|
- (__v32hi) __W,
|
|
- __M);
|
|
-}
|
|
-
|
|
-extern __inline __m512i
|
|
-__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
-_mm512_packus_epi32 (__m512i __A, __m512i __B)
|
|
-{
|
|
- return (__m512i) __builtin_ia32_packusdw512_mask ((__v16si) __A,
|
|
- (__v16si) __B,
|
|
- (__v32hi)
|
|
- _mm512_setzero_si512 (),
|
|
- (__mmask32) -1);
|
|
-}
|
|
-
|
|
-extern __inline __m512i
|
|
-__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
-_mm512_maskz_packus_epi32 (__mmask32 __M, __m512i __A, __m512i __B)
|
|
-{
|
|
- return (__m512i) __builtin_ia32_packusdw512_mask ((__v16si) __A,
|
|
- (__v16si) __B,
|
|
- (__v32hi)
|
|
- _mm512_setzero_si512 (),
|
|
- __M);
|
|
-}
|
|
-
|
|
-extern __inline __m512i
|
|
-__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
-_mm512_mask_packus_epi32 (__m512i __W, __mmask32 __M, __m512i __A,
|
|
- __m512i __B)
|
|
-{
|
|
- return (__m512i) __builtin_ia32_packusdw512_mask ((__v16si) __A,
|
|
- (__v16si) __B,
|
|
- (__v32hi) __W,
|
|
- __M);
|
|
-}
|
|
-
|
|
-extern __inline __m512i
|
|
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
_mm512_bslli_epi128 (__m512i __A, const int __N)
|
|
{
|
|
--- gcc/testsuite/gcc.target/i386/pr79932-1.c.jj 2017-03-07 07:54:45.181339418 +0100
|
|
+++ gcc/testsuite/gcc.target/i386/pr79932-1.c 2017-03-07 07:54:24.000000000 +0100
|
|
@@ -0,0 +1,19 @@
|
|
+/* PR target/79932 */
|
|
+/* { dg-do compile } */
|
|
+/* { dg-options "-O0 -mavx512bw" } */
|
|
+
|
|
+#include <x86intrin.h>
|
|
+
|
|
+__m512i a, b, c, d, e, f, g, h, i;
|
|
+__mmask32 m;
|
|
+
|
|
+void
|
|
+foo (void)
|
|
+{
|
|
+ d = _mm512_packs_epi32 (a, b);
|
|
+ e = _mm512_maskz_packs_epi32 (m, a, b);
|
|
+ f = _mm512_mask_packs_epi32 (c, m, a, b);
|
|
+ g = _mm512_packus_epi32 (a, b);
|
|
+ h = _mm512_maskz_packus_epi32 (m, a, b);
|
|
+ i = _mm512_mask_packus_epi32 (c, m, a, b);
|
|
+}
|