131
|
1 /* Copyright (C) 2013-2018 Free Software Foundation, Inc.
|
111
|
2
|
|
3 This file is part of GCC.
|
|
4
|
|
5 GCC is free software; you can redistribute it and/or modify
|
|
6 it under the terms of the GNU General Public License as published by
|
|
7 the Free Software Foundation; either version 3, or (at your option)
|
|
8 any later version.
|
|
9
|
|
10 GCC is distributed in the hope that it will be useful,
|
|
11 but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
12 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
13 GNU General Public License for more details.
|
|
14
|
|
15 Under Section 7 of GPL version 3, you are granted additional
|
|
16 permissions described in the GCC Runtime Library Exception, version
|
|
17 3.1, as published by the Free Software Foundation.
|
|
18
|
|
19 You should have received a copy of the GNU General Public License and
|
|
20 a copy of the GCC Runtime Library Exception along with this program;
|
|
21 see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
|
|
22 <http://www.gnu.org/licenses/>. */
|
|
23
|
|
24 #ifndef _IMMINTRIN_H_INCLUDED
|
|
25 #error "Never use <avx512pfintrin.h> directly; include <immintrin.h> instead."
|
|
26 #endif
|
|
27
|
|
28 #ifndef _AVX512PFINTRIN_H_INCLUDED
|
|
29 #define _AVX512PFINTRIN_H_INCLUDED
|
|
30
|
|
31 #ifndef __AVX512PF__
|
|
32 #pragma GCC push_options
|
|
33 #pragma GCC target("avx512pf")
|
|
34 #define __DISABLE_AVX512PF__
|
|
35 #endif /* __AVX512PF__ */
|
|
36
|
|
37 /* Internal data types for implementing the intrinsics. */
|
|
38 typedef long long __v8di __attribute__ ((__vector_size__ (64)));
|
|
39 typedef int __v16si __attribute__ ((__vector_size__ (64)));
|
|
40
|
|
41 /* The Intel API is flexible enough that we must allow aliasing with other
|
|
42 vector types, and their scalar components. */
|
|
43 typedef long long __m512i __attribute__ ((__vector_size__ (64), __may_alias__));
|
|
44
|
|
45 typedef unsigned char __mmask8;
|
|
46 typedef unsigned short __mmask16;
|
|
47
|
|
48 #ifdef __OPTIMIZE__
|
|
49 extern __inline void
|
|
50 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
51 _mm512_prefetch_i32gather_pd (__m256i __index, void const *__addr,
|
|
52 int __scale, int __hint)
|
|
53 {
|
|
54 __builtin_ia32_gatherpfdpd ((__mmask8) 0xFF, (__v8si) __index, __addr,
|
|
55 __scale, __hint);
|
|
56 }
|
|
57
|
|
58 extern __inline void
|
|
59 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
60 _mm512_prefetch_i32gather_ps (__m512i __index, void const *__addr,
|
|
61 int __scale, int __hint)
|
|
62 {
|
|
63 __builtin_ia32_gatherpfdps ((__mmask16) 0xFFFF, (__v16si) __index, __addr,
|
|
64 __scale, __hint);
|
|
65 }
|
|
66
|
|
67 extern __inline void
|
|
68 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
69 _mm512_mask_prefetch_i32gather_pd (__m256i __index, __mmask8 __mask,
|
|
70 void const *__addr, int __scale, int __hint)
|
|
71 {
|
|
72 __builtin_ia32_gatherpfdpd (__mask, (__v8si) __index, __addr, __scale,
|
|
73 __hint);
|
|
74 }
|
|
75
|
|
76 extern __inline void
|
|
77 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
78 _mm512_mask_prefetch_i32gather_ps (__m512i __index, __mmask16 __mask,
|
|
79 void const *__addr, int __scale, int __hint)
|
|
80 {
|
|
81 __builtin_ia32_gatherpfdps (__mask, (__v16si) __index, __addr, __scale,
|
|
82 __hint);
|
|
83 }
|
|
84
|
|
85 extern __inline void
|
|
86 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
87 _mm512_prefetch_i64gather_pd (__m512i __index, void const *__addr,
|
|
88 int __scale, int __hint)
|
|
89 {
|
|
90 __builtin_ia32_gatherpfqpd ((__mmask8) 0xFF, (__v8di) __index, __addr,
|
|
91 __scale, __hint);
|
|
92 }
|
|
93
|
|
94 extern __inline void
|
|
95 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
96 _mm512_prefetch_i64gather_ps (__m512i __index, void const *__addr,
|
|
97 int __scale, int __hint)
|
|
98 {
|
|
99 __builtin_ia32_gatherpfqps ((__mmask8) 0xFF, (__v8di) __index, __addr,
|
|
100 __scale, __hint);
|
|
101 }
|
|
102
|
|
103 extern __inline void
|
|
104 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
105 _mm512_mask_prefetch_i64gather_pd (__m512i __index, __mmask8 __mask,
|
|
106 void const *__addr, int __scale, int __hint)
|
|
107 {
|
|
108 __builtin_ia32_gatherpfqpd (__mask, (__v8di) __index, __addr, __scale,
|
|
109 __hint);
|
|
110 }
|
|
111
|
|
112 extern __inline void
|
|
113 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
114 _mm512_mask_prefetch_i64gather_ps (__m512i __index, __mmask8 __mask,
|
|
115 void const *__addr, int __scale, int __hint)
|
|
116 {
|
|
117 __builtin_ia32_gatherpfqps (__mask, (__v8di) __index, __addr, __scale,
|
|
118 __hint);
|
|
119 }
|
|
120
|
|
121 extern __inline void
|
|
122 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
123 _mm512_prefetch_i32scatter_pd (void *__addr, __m256i __index, int __scale,
|
|
124 int __hint)
|
|
125 {
|
|
126 __builtin_ia32_scatterpfdpd ((__mmask8) 0xFF, (__v8si) __index, __addr,
|
|
127 __scale, __hint);
|
|
128 }
|
|
129
|
|
130 extern __inline void
|
|
131 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
132 _mm512_prefetch_i32scatter_ps (void *__addr, __m512i __index, int __scale,
|
|
133 int __hint)
|
|
134 {
|
|
135 __builtin_ia32_scatterpfdps ((__mmask16) 0xFFFF, (__v16si) __index, __addr,
|
|
136 __scale, __hint);
|
|
137 }
|
|
138
|
|
139 extern __inline void
|
|
140 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
141 _mm512_mask_prefetch_i32scatter_pd (void *__addr, __mmask8 __mask,
|
|
142 __m256i __index, int __scale, int __hint)
|
|
143 {
|
|
144 __builtin_ia32_scatterpfdpd (__mask, (__v8si) __index, __addr, __scale,
|
|
145 __hint);
|
|
146 }
|
|
147
|
|
148 extern __inline void
|
|
149 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
150 _mm512_mask_prefetch_i32scatter_ps (void *__addr, __mmask16 __mask,
|
|
151 __m512i __index, int __scale, int __hint)
|
|
152 {
|
|
153 __builtin_ia32_scatterpfdps (__mask, (__v16si) __index, __addr, __scale,
|
|
154 __hint);
|
|
155 }
|
|
156
|
|
157 extern __inline void
|
|
158 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
159 _mm512_prefetch_i64scatter_pd (void *__addr, __m512i __index, int __scale,
|
|
160 int __hint)
|
|
161 {
|
|
162 __builtin_ia32_scatterpfqpd ((__mmask8) 0xFF, (__v8di) __index,__addr,
|
|
163 __scale, __hint);
|
|
164 }
|
|
165
|
|
166 extern __inline void
|
|
167 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
|
168 _mm512_prefetch_i64scatter_ps (void *__addr, __m512i __index, int __scale,
|
|
169 int __hint)
|
|
170 {
|
|
171 __builtin_ia32_scatterpfqps ((__mmask8) 0xFF, (__v8di) __index, __addr,
|
|
172 __scale, __hint);
|
|
173 }
|
|
174
|
|
175 extern __inline void
|
|
176 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
131
|
177 _mm512_mask_prefetch_i64scatter_pd (void *__addr, __mmask8 __mask,
|
111
|
178 __m512i __index, int __scale, int __hint)
|
|
179 {
|
|
180 __builtin_ia32_scatterpfqpd (__mask, (__v8di) __index, __addr, __scale,
|
131
|
181 __hint);
|
111
|
182 }
|
|
183
|
|
184 extern __inline void
|
|
185 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
|
131
|
186 _mm512_mask_prefetch_i64scatter_ps (void *__addr, __mmask8 __mask,
|
111
|
187 __m512i __index, int __scale, int __hint)
|
|
188 {
|
|
189 __builtin_ia32_scatterpfqps (__mask, (__v8di) __index, __addr, __scale,
|
|
190 __hint);
|
|
191 }
|
|
192
|
|
193 #else
|
|
194 #define _mm512_prefetch_i32gather_pd(INDEX, ADDR, SCALE, HINT) \
|
|
195 __builtin_ia32_gatherpfdpd ((__mmask8)0xFF, (__v8si)(__m256i)INDEX, \
|
|
196 (void const *)ADDR, (int)SCALE, (int)HINT)
|
|
197
|
|
198 #define _mm512_prefetch_i32gather_ps(INDEX, ADDR, SCALE, HINT) \
|
|
199 __builtin_ia32_gatherpfdps ((__mmask16)0xFFFF, (__v16si)(__m512i)INDEX, \
|
|
200 (void const *)ADDR, (int)SCALE, (int)HINT)
|
|
201
|
|
202 #define _mm512_mask_prefetch_i32gather_pd(INDEX, MASK, ADDR, SCALE, HINT) \
|
|
203 __builtin_ia32_gatherpfdpd ((__mmask8)MASK, (__v8si)(__m256i)INDEX, \
|
|
204 (void const *)ADDR, (int)SCALE, (int)HINT)
|
|
205
|
|
206 #define _mm512_mask_prefetch_i32gather_ps(INDEX, MASK, ADDR, SCALE, HINT) \
|
|
207 __builtin_ia32_gatherpfdps ((__mmask16)MASK, (__v16si)(__m512i)INDEX, \
|
|
208 (void const *)ADDR, (int)SCALE, (int)HINT)
|
|
209
|
|
210 #define _mm512_prefetch_i64gather_pd(INDEX, ADDR, SCALE, HINT) \
|
|
211 __builtin_ia32_gatherpfqpd ((__mmask8)0xFF, (__v8di)(__m512i)INDEX, \
|
|
212 (void *)ADDR, (int)SCALE, (int)HINT)
|
|
213
|
|
214 #define _mm512_prefetch_i64gather_ps(INDEX, ADDR, SCALE, HINT) \
|
|
215 __builtin_ia32_gatherpfqps ((__mmask8)0xFF, (__v8di)(__m512i)INDEX, \
|
|
216 (void *)ADDR, (int)SCALE, (int)HINT)
|
|
217
|
|
218 #define _mm512_mask_prefetch_i64gather_pd(INDEX, MASK, ADDR, SCALE, HINT) \
|
|
219 __builtin_ia32_gatherpfqpd ((__mmask8)MASK, (__v8di)(__m512i)INDEX, \
|
|
220 (void *)ADDR, (int)SCALE, (int)HINT)
|
|
221
|
|
222 #define _mm512_mask_prefetch_i64gather_ps(INDEX, MASK, ADDR, SCALE, HINT) \
|
|
223 __builtin_ia32_gatherpfqps ((__mmask8)MASK, (__v8di)(__m512i)INDEX, \
|
|
224 (void *)ADDR, (int)SCALE, (int)HINT)
|
|
225
|
|
226 #define _mm512_prefetch_i32scatter_pd(ADDR, INDEX, SCALE, HINT) \
|
|
227 __builtin_ia32_scatterpfdpd ((__mmask8)0xFF, (__v8si)(__m256i)INDEX, \
|
|
228 (void *)ADDR, (int)SCALE, (int)HINT)
|
|
229
|
|
230 #define _mm512_prefetch_i32scatter_ps(ADDR, INDEX, SCALE, HINT) \
|
|
231 __builtin_ia32_scatterpfdps ((__mmask16)0xFFFF, (__v16si)(__m512i)INDEX, \
|
|
232 (void *)ADDR, (int)SCALE, (int)HINT)
|
|
233
|
|
234 #define _mm512_mask_prefetch_i32scatter_pd(ADDR, MASK, INDEX, SCALE, HINT) \
|
|
235 __builtin_ia32_scatterpfdpd ((__mmask8)MASK, (__v8si)(__m256i)INDEX, \
|
|
236 (void *)ADDR, (int)SCALE, (int)HINT)
|
|
237
|
|
238 #define _mm512_mask_prefetch_i32scatter_ps(ADDR, MASK, INDEX, SCALE, HINT) \
|
|
239 __builtin_ia32_scatterpfdps ((__mmask16)MASK, (__v16si)(__m512i)INDEX, \
|
|
240 (void *)ADDR, (int)SCALE, (int)HINT)
|
|
241
|
|
242 #define _mm512_prefetch_i64scatter_pd(ADDR, INDEX, SCALE, HINT) \
|
|
243 __builtin_ia32_scatterpfqpd ((__mmask8)0xFF, (__v8di)(__m512i)INDEX, \
|
|
244 (void *)ADDR, (int)SCALE, (int)HINT)
|
|
245
|
|
246 #define _mm512_prefetch_i64scatter_ps(ADDR, INDEX, SCALE, HINT) \
|
|
247 __builtin_ia32_scatterpfqps ((__mmask8)0xFF, (__v8di)(__m512i)INDEX, \
|
|
248 (void *)ADDR, (int)SCALE, (int)HINT)
|
|
249
|
|
250 #define _mm512_mask_prefetch_i64scatter_pd(ADDR, MASK, INDEX, SCALE, HINT) \
|
|
251 __builtin_ia32_scatterpfqpd ((__mmask8)MASK, (__v8di)(__m512i)INDEX, \
|
|
252 (void *)ADDR, (int)SCALE, (int)HINT)
|
|
253
|
|
254 #define _mm512_mask_prefetch_i64scatter_ps(ADDR, MASK, INDEX, SCALE, HINT) \
|
|
255 __builtin_ia32_scatterpfqps ((__mmask8)MASK, (__v8di)(__m512i)INDEX, \
|
|
256 (void *)ADDR, (int)SCALE, (int)HINT)
|
|
257 #endif
|
|
258
|
|
259 #ifdef __DISABLE_AVX512PF__
|
|
260 #undef __DISABLE_AVX512PF__
|
|
261 #pragma GCC pop_options
|
|
262 #endif /* __DISABLE_AVX512PF__ */
|
|
263
|
|
264 #endif /* _AVX512PFINTRIN_H_INCLUDED */
|