xref: /netbsd-src/external/gpl3/gcc.old/dist/gcc/config/i386/avx512pfintrin.h (revision f3cfa6f6ce31685c6c4a758bc430e69eb99f50a4)
1 /* Copyright (C) 2013-2016 Free Software Foundation, Inc.
2 
3    This file is part of GCC.
4 
5    GCC is free software; you can redistribute it and/or modify
6    it under the terms of the GNU General Public License as published by
7    the Free Software Foundation; either version 3, or (at your option)
8    any later version.
9 
10    GCC is distributed in the hope that it will be useful,
11    but WITHOUT ANY WARRANTY; without even the implied warranty of
12    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
13    GNU General Public License for more details.
14 
15    Under Section 7 of GPL version 3, you are granted additional
16    permissions described in the GCC Runtime Library Exception, version
17    3.1, as published by the Free Software Foundation.
18 
19    You should have received a copy of the GNU General Public License and
20    a copy of the GCC Runtime Library Exception along with this program;
21    see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see
22    <http://www.gnu.org/licenses/>.  */
23 
24 #ifndef _IMMINTRIN_H_INCLUDED
25 #error "Never use <avx512pfintrin.h> directly; include <immintrin.h> instead."
26 #endif
27 
28 #ifndef _AVX512PFINTRIN_H_INCLUDED
29 #define _AVX512PFINTRIN_H_INCLUDED
30 
31 #ifndef __AVX512PF__
32 #pragma GCC push_options
33 #pragma GCC target("avx512pf")
34 #define __DISABLE_AVX512PF__
35 #endif /* __AVX512PF__ */
36 
/* Mask types taken by the intrinsics in this header.  */
typedef unsigned char  __mmask8;
typedef unsigned short __mmask16;

/* Internal 64-byte vector types; index vectors are cast to these before
   they are handed to the builtins.  */
typedef int __v16si
  __attribute__ ((__vector_size__ (64)));
typedef long long __v8di
  __attribute__ ((__vector_size__ (64)));

/* Public 64-byte integer vector type.  The Intel API is flexible enough
   that aliasing with other vector types, and with their scalar components,
   has to be allowed, hence __may_alias__.  */
typedef long long __m512i
  __attribute__ ((__vector_size__ (64), __may_alias__));
47 
48 #ifdef __OPTIMIZE__
49 extern __inline void
50 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
51 _mm512_mask_prefetch_i32gather_pd (__m256i __index, __mmask8 __mask,
52 				   void const *__addr, int __scale, int __hint)
53 {
54   __builtin_ia32_gatherpfdpd (__mask, (__v8si) __index,
55 			      __addr, __scale, __hint);
56 }
57 
58 extern __inline void
59 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
60 _mm512_mask_prefetch_i32gather_ps (__m512i __index, __mmask16 __mask,
61 				   void const *__addr, int __scale, int __hint)
62 {
63   __builtin_ia32_gatherpfdps (__mask, (__v16si) __index, __addr,
64 			      __scale, __hint);
65 }
66 
67 extern __inline void
68 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
69 _mm512_mask_prefetch_i64gather_pd (__m512i __index, __mmask8 __mask,
70 				   void const *__addr, int __scale, int __hint)
71 {
72   __builtin_ia32_gatherpfqpd (__mask, (__v8di) __index,
73 			      __addr, __scale, __hint);
74 }
75 
76 extern __inline void
77 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
78 _mm512_mask_prefetch_i64gather_ps (__m512i __index, __mmask8 __mask,
79 				   void const *__addr, int __scale, int __hint)
80 {
81   __builtin_ia32_gatherpfqps (__mask, (__v8di) __index, __addr,
82 			      __scale, __hint);
83 }
84 
85 extern __inline void
86 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
87 _mm512_prefetch_i32scatter_pd (void *__addr, __m256i __index, int __scale,
88 			       int __hint)
89 {
90   __builtin_ia32_scatterpfdpd ((__mmask8) 0xFF, (__v8si) __index,
91 			       __addr, __scale, __hint);
92 }
93 
94 extern __inline void
95 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
96 _mm512_prefetch_i32scatter_ps (void *__addr, __m512i __index, int __scale,
97 			       int __hint)
98 {
99   __builtin_ia32_scatterpfdps ((__mmask16) 0xFFFF, (__v16si) __index,
100 			       __addr, __scale, __hint);
101 }
102 
103 extern __inline void
104 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
105 _mm512_mask_prefetch_i32scatter_pd (void *__addr, __mmask8 __mask,
106 				    __m256i __index, int __scale, int __hint)
107 {
108   __builtin_ia32_scatterpfdpd (__mask, (__v8si) __index,
109 			       __addr, __scale, __hint);
110 }
111 
112 extern __inline void
113 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
114 _mm512_mask_prefetch_i32scatter_ps (void *__addr, __mmask16 __mask,
115 				    __m512i __index, int __scale, int __hint)
116 {
117   __builtin_ia32_scatterpfdps (__mask, (__v16si) __index, __addr,
118 			       __scale, __hint);
119 }
120 
121 extern __inline void
122 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
123 _mm512_prefetch_i64scatter_pd (void *__addr, __m512i __index, int __scale,
124 			       int __hint)
125 {
126   __builtin_ia32_scatterpfqpd ((__mmask8) 0xFF, (__v8di) __index,
127 			       __addr, __scale, __hint);
128 }
129 
130 extern __inline void
131 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
132 _mm512_prefetch_i64scatter_ps (void *__addr, __m512i __index, int __scale,
133 			       int __hint)
134 {
135   __builtin_ia32_scatterpfqps ((__mmask8) 0xFF, (__v8di) __index,
136 			       __addr, __scale, __hint);
137 }
138 
139 extern __inline void
140 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
141 _mm512_mask_prefetch_i64scatter_pd (void *__addr, __mmask16 __mask,
142 				    __m512i __index, int __scale, int __hint)
143 {
144   __builtin_ia32_scatterpfqpd (__mask, (__v8di) __index,
145 			       __addr, __scale, __hint);
146 }
147 
148 extern __inline void
149 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
150 _mm512_mask_prefetch_i64scatter_ps (void *__addr, __mmask16 __mask,
151 				    __m512i __index, int __scale, int __hint)
152 {
153   __builtin_ia32_scatterpfqps (__mask, (__v8di) __index, __addr,
154 			       __scale, __hint);
155 }
156 
157 #else
/* Macro form of _mm512_mask_prefetch_i32gather_pd, used when __OPTIMIZE__
   is not defined.  Every argument is parenthesized before it is cast, so an
   expression argument (e.g. ADDR written as `p + 1') is converted as a
   whole instead of having the cast bind to its first operand only.  */
#define _mm512_mask_prefetch_i32gather_pd(INDEX, MASK, ADDR, SCALE, HINT)    \
  __builtin_ia32_gatherpfdpd ((__mmask8) (MASK), (__v8si)(__m256i) (INDEX),  \
			      (void const *) (ADDR), (int) (SCALE),	     \
			      (int) (HINT))
161 
/* Macro form of _mm512_mask_prefetch_i32gather_ps, used when __OPTIMIZE__
   is not defined.  Every argument is parenthesized before it is cast, so an
   expression argument (e.g. ADDR written as `p + 1') is converted as a
   whole instead of having the cast bind to its first operand only.  */
#define _mm512_mask_prefetch_i32gather_ps(INDEX, MASK, ADDR, SCALE, HINT)    \
  __builtin_ia32_gatherpfdps ((__mmask16) (MASK),			     \
			      (__v16si)(__m512i) (INDEX),		     \
			      (void const *) (ADDR), (int) (SCALE),	     \
			      (int) (HINT))
165 
/* Macro form of _mm512_mask_prefetch_i64gather_pd, used when __OPTIMIZE__
   is not defined.  Every argument is parenthesized before it is cast, so an
   expression argument (e.g. ADDR written as `p + 1') is converted as a
   whole instead of having the cast bind to its first operand only.  ADDR is
   cast to `void const *', matching the parameter type of the inline form,
   so constness is not dropped.  */
#define _mm512_mask_prefetch_i64gather_pd(INDEX, MASK, ADDR, SCALE, HINT)    \
  __builtin_ia32_gatherpfqpd ((__mmask8) (MASK), (__v8di)(__m512i) (INDEX),  \
			      (void const *) (ADDR), (int) (SCALE),	     \
			      (int) (HINT))
169 
/* Macro form of _mm512_mask_prefetch_i64gather_ps, used when __OPTIMIZE__
   is not defined.  Every argument is parenthesized before it is cast, so an
   expression argument (e.g. ADDR written as `p + 1') is converted as a
   whole instead of having the cast bind to its first operand only.  ADDR is
   cast to `void const *', matching the parameter type of the inline form,
   so constness is not dropped.  */
#define _mm512_mask_prefetch_i64gather_ps(INDEX, MASK, ADDR, SCALE, HINT)    \
  __builtin_ia32_gatherpfqps ((__mmask8) (MASK), (__v8di)(__m512i) (INDEX),  \
			      (void const *) (ADDR), (int) (SCALE),	     \
			      (int) (HINT))
173 
/* Macro form of _mm512_prefetch_i32scatter_pd, used when __OPTIMIZE__ is
   not defined; the mask is the constant 0xFF.  Every argument is
   parenthesized before it is cast, so an expression argument (e.g. ADDR
   written as `p + 1') is converted as a whole instead of having the cast
   bind to its first operand only.  */
#define _mm512_prefetch_i32scatter_pd(ADDR, INDEX, SCALE, HINT)              \
  __builtin_ia32_scatterpfdpd ((__mmask8) 0xFF, (__v8si)(__m256i) (INDEX),   \
			       (void *) (ADDR), (int) (SCALE),		     \
			       (int) (HINT))
177 
/* Macro form of _mm512_prefetch_i32scatter_ps, used when __OPTIMIZE__ is
   not defined; the mask is the constant 0xFFFF.  Every argument is
   parenthesized before it is cast, so an expression argument (e.g. ADDR
   written as `p + 1') is converted as a whole instead of having the cast
   bind to its first operand only.  */
#define _mm512_prefetch_i32scatter_ps(ADDR, INDEX, SCALE, HINT)              \
  __builtin_ia32_scatterpfdps ((__mmask16) 0xFFFF,			     \
			       (__v16si)(__m512i) (INDEX),		     \
			       (void *) (ADDR), (int) (SCALE),		     \
			       (int) (HINT))
181 
/* Macro form of _mm512_mask_prefetch_i32scatter_pd, used when __OPTIMIZE__
   is not defined.  Every argument is parenthesized before it is cast, so an
   expression argument (e.g. ADDR written as `p + 1') is converted as a
   whole instead of having the cast bind to its first operand only.  */
#define _mm512_mask_prefetch_i32scatter_pd(ADDR, MASK, INDEX, SCALE, HINT)   \
  __builtin_ia32_scatterpfdpd ((__mmask8) (MASK), (__v8si)(__m256i) (INDEX), \
			       (void *) (ADDR), (int) (SCALE),		     \
			       (int) (HINT))
185 
/* Macro form of _mm512_mask_prefetch_i32scatter_ps, used when __OPTIMIZE__
   is not defined.  Every argument is parenthesized before it is cast, so an
   expression argument (e.g. ADDR written as `p + 1') is converted as a
   whole instead of having the cast bind to its first operand only.  */
#define _mm512_mask_prefetch_i32scatter_ps(ADDR, MASK, INDEX, SCALE, HINT)   \
  __builtin_ia32_scatterpfdps ((__mmask16) (MASK),			     \
			       (__v16si)(__m512i) (INDEX),		     \
			       (void *) (ADDR), (int) (SCALE),		     \
			       (int) (HINT))
189 
/* Macro form of _mm512_prefetch_i64scatter_pd, used when __OPTIMIZE__ is
   not defined; the mask is the constant 0xFF.  Every argument is
   parenthesized before it is cast, so an expression argument (e.g. ADDR
   written as `p + 1') is converted as a whole instead of having the cast
   bind to its first operand only.  */
#define _mm512_prefetch_i64scatter_pd(ADDR, INDEX, SCALE, HINT)              \
  __builtin_ia32_scatterpfqpd ((__mmask8) 0xFF, (__v8di)(__m512i) (INDEX),   \
			       (void *) (ADDR), (int) (SCALE),		     \
			       (int) (HINT))
193 
/* Macro form of _mm512_prefetch_i64scatter_ps, used when __OPTIMIZE__ is
   not defined; the mask is the constant 0xFF.  Every argument is
   parenthesized before it is cast, so an expression argument (e.g. ADDR
   written as `p + 1') is converted as a whole instead of having the cast
   bind to its first operand only.  */
#define _mm512_prefetch_i64scatter_ps(ADDR, INDEX, SCALE, HINT)              \
  __builtin_ia32_scatterpfqps ((__mmask8) 0xFF, (__v8di)(__m512i) (INDEX),   \
			       (void *) (ADDR), (int) (SCALE),		     \
			       (int) (HINT))
197 
/* Macro form of _mm512_mask_prefetch_i64scatter_pd, used when __OPTIMIZE__
   is not defined.  Every argument is parenthesized before it is cast, so an
   expression argument (e.g. ADDR written as `p + 1') is converted as a
   whole instead of having the cast bind to its first operand only.  */
#define _mm512_mask_prefetch_i64scatter_pd(ADDR, MASK, INDEX, SCALE, HINT)   \
  __builtin_ia32_scatterpfqpd ((__mmask8) (MASK), (__v8di)(__m512i) (INDEX), \
			       (void *) (ADDR), (int) (SCALE),		     \
			       (int) (HINT))
201 
/* Macro form of _mm512_mask_prefetch_i64scatter_ps, used when __OPTIMIZE__
   is not defined.  Every argument is parenthesized before it is cast, so an
   expression argument (e.g. ADDR written as `p + 1') is converted as a
   whole instead of having the cast bind to its first operand only.  */
#define _mm512_mask_prefetch_i64scatter_ps(ADDR, MASK, INDEX, SCALE, HINT)   \
  __builtin_ia32_scatterpfqps ((__mmask8) (MASK), (__v8di)(__m512i) (INDEX), \
			       (void *) (ADDR), (int) (SCALE),		     \
			       (int) (HINT))
205 #endif
206 
207 #ifdef __DISABLE_AVX512PF__
208 #undef __DISABLE_AVX512PF__
209 #pragma GCC pop_options
210 #endif /* __DISABLE_AVX512PF__ */
211 
212 #endif /* _AVX512PFINTRIN_H_INCLUDED */
213