/* xref: /dflybsd-src/contrib/gcc-8.0/gcc/config/i386/avx512ifmaintrin.h (revision 38fd149817dfbff97799f62fcb70be98c4e32523) */
/* Copyright (C) 2013-2018 Free Software Foundation, Inc.

   This file is part of GCC.

   GCC is free software; you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation; either version 3, or (at your option)
   any later version.

   GCC is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   Under Section 7 of GPL version 3, you are granted additional
   permissions described in the GCC Runtime Library Exception, version
   3.1, as published by the Free Software Foundation.

   You should have received a copy of the GNU General Public License and
   a copy of the GCC Runtime Library Exception along with this program;
   see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see
   <http://www.gnu.org/licenses/>.  */

24*38fd1498Szrj #ifndef _IMMINTRIN_H_INCLUDED
25*38fd1498Szrj #error "Never use <avx512ifmaintrin.h> directly; include <immintrin.h> instead."
26*38fd1498Szrj #endif
27*38fd1498Szrj 
28*38fd1498Szrj #ifndef _AVX512IFMAINTRIN_H_INCLUDED
29*38fd1498Szrj #define _AVX512IFMAINTRIN_H_INCLUDED
30*38fd1498Szrj 
31*38fd1498Szrj #ifndef __AVX512IFMA__
32*38fd1498Szrj #pragma GCC push_options
33*38fd1498Szrj #pragma GCC target("avx512ifma")
34*38fd1498Szrj #define __DISABLE_AVX512IFMA__
35*38fd1498Szrj #endif /* __AVX512IFMA__ */
36*38fd1498Szrj 
37*38fd1498Szrj extern __inline __m512i
38*38fd1498Szrj __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_madd52lo_epu64(__m512i __X,__m512i __Y,__m512i __Z)39*38fd1498Szrj _mm512_madd52lo_epu64 (__m512i __X, __m512i __Y, __m512i __Z)
40*38fd1498Szrj {
41*38fd1498Szrj   return (__m512i) __builtin_ia32_vpmadd52luq512_mask ((__v8di) __X,
42*38fd1498Szrj 						       (__v8di) __Y,
43*38fd1498Szrj 						       (__v8di) __Z,
44*38fd1498Szrj 						       (__mmask8) -1);
45*38fd1498Szrj }
46*38fd1498Szrj 
47*38fd1498Szrj extern __inline __m512i
48*38fd1498Szrj __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_madd52hi_epu64(__m512i __X,__m512i __Y,__m512i __Z)49*38fd1498Szrj _mm512_madd52hi_epu64 (__m512i __X, __m512i __Y, __m512i __Z)
50*38fd1498Szrj {
51*38fd1498Szrj   return (__m512i) __builtin_ia32_vpmadd52huq512_mask ((__v8di) __X,
52*38fd1498Szrj 						       (__v8di) __Y,
53*38fd1498Szrj 						       (__v8di) __Z,
54*38fd1498Szrj 						       (__mmask8) -1);
55*38fd1498Szrj }
56*38fd1498Szrj 
57*38fd1498Szrj extern __inline __m512i
58*38fd1498Szrj __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_mask_madd52lo_epu64(__m512i __W,__mmask8 __M,__m512i __X,__m512i __Y)59*38fd1498Szrj _mm512_mask_madd52lo_epu64 (__m512i __W, __mmask8 __M, __m512i __X,
60*38fd1498Szrj 			    __m512i __Y)
61*38fd1498Szrj {
62*38fd1498Szrj   return (__m512i) __builtin_ia32_vpmadd52luq512_mask ((__v8di) __W,
63*38fd1498Szrj 						       (__v8di) __X,
64*38fd1498Szrj 						       (__v8di) __Y,
65*38fd1498Szrj 						       (__mmask8) __M);
66*38fd1498Szrj }
67*38fd1498Szrj 
68*38fd1498Szrj extern __inline __m512i
69*38fd1498Szrj __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_mask_madd52hi_epu64(__m512i __W,__mmask8 __M,__m512i __X,__m512i __Y)70*38fd1498Szrj _mm512_mask_madd52hi_epu64 (__m512i __W, __mmask8 __M, __m512i __X,
71*38fd1498Szrj 			    __m512i __Y)
72*38fd1498Szrj {
73*38fd1498Szrj   return (__m512i) __builtin_ia32_vpmadd52huq512_mask ((__v8di) __W,
74*38fd1498Szrj 						       (__v8di) __X,
75*38fd1498Szrj 						       (__v8di) __Y,
76*38fd1498Szrj 						       (__mmask8) __M);
77*38fd1498Szrj }
78*38fd1498Szrj 
79*38fd1498Szrj extern __inline __m512i
80*38fd1498Szrj __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_maskz_madd52lo_epu64(__mmask8 __M,__m512i __X,__m512i __Y,__m512i __Z)81*38fd1498Szrj _mm512_maskz_madd52lo_epu64 (__mmask8 __M, __m512i __X, __m512i __Y, __m512i __Z)
82*38fd1498Szrj {
83*38fd1498Szrj   return (__m512i) __builtin_ia32_vpmadd52luq512_maskz ((__v8di) __X,
84*38fd1498Szrj 							(__v8di) __Y,
85*38fd1498Szrj 							(__v8di) __Z,
86*38fd1498Szrj 							(__mmask8) __M);
87*38fd1498Szrj }
88*38fd1498Szrj 
89*38fd1498Szrj extern __inline __m512i
90*38fd1498Szrj __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_maskz_madd52hi_epu64(__mmask8 __M,__m512i __X,__m512i __Y,__m512i __Z)91*38fd1498Szrj _mm512_maskz_madd52hi_epu64 (__mmask8 __M, __m512i __X, __m512i __Y, __m512i __Z)
92*38fd1498Szrj {
93*38fd1498Szrj   return (__m512i) __builtin_ia32_vpmadd52huq512_maskz ((__v8di) __X,
94*38fd1498Szrj 							(__v8di) __Y,
95*38fd1498Szrj 							(__v8di) __Z,
96*38fd1498Szrj 							(__mmask8) __M);
97*38fd1498Szrj }
98*38fd1498Szrj 
99*38fd1498Szrj #ifdef __DISABLE_AVX512IFMA__
100*38fd1498Szrj #undef __DISABLE_AVX512IFMA__
101*38fd1498Szrj #pragma GCC pop_options
102*38fd1498Szrj #endif /* __DISABLE_AVX512IFMA__ */
103*38fd1498Szrj 
104*38fd1498Szrj #endif /* _AVX512IFMAINTRIN_H_INCLUDED */
105