Mercurial > hg > CbC > CbC_gcc
annotate gcc/config/rs6000/altivec.h @ 131:84e7813d76e9
gcc-8.2
author | mir3636 |
---|---|
date | Thu, 25 Oct 2018 07:37:49 +0900 |
parents | 04ced10e8804 |
children | 1830386684a0 |
rev | line source |
---|---|
0 | 1 /* PowerPC AltiVec include file. |
131 | 2 Copyright (C) 2002-2018 Free Software Foundation, Inc. |
0 | 3 Contributed by Aldy Hernandez (aldyh@redhat.com). |
4 Rewritten by Paolo Bonzini (bonzini@gnu.org). | |
5 | |
6 This file is part of GCC. | |
7 | |
8 GCC is free software; you can redistribute it and/or modify it | |
9 under the terms of the GNU General Public License as published | |
10 by the Free Software Foundation; either version 3, or (at your | |
11 option) any later version. | |
12 | |
13 GCC is distributed in the hope that it will be useful, but WITHOUT | |
14 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY | |
15 or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public | |
16 License for more details. | |
17 | |
18 Under Section 7 of GPL version 3, you are granted additional | |
19 permissions described in the GCC Runtime Library Exception, version | |
20 3.1, as published by the Free Software Foundation. | |
21 | |
22 You should have received a copy of the GNU General Public License and | |
23 a copy of the GCC Runtime Library Exception along with this program; | |
24 see the files COPYING3 and COPYING.RUNTIME respectively. If not, see | |
25 <http://www.gnu.org/licenses/>. */ | |
26 | |
27 /* Implemented to conform to the specification included in the AltiVec | |
28 Technology Programming Interface Manual (ALTIVECPIM/D 6/1999 Rev 0). */ | |
29 | |
30 #ifndef _ALTIVEC_H | |
31 #define _ALTIVEC_H 1 | |
32 | |
/* Stop with a diagnostic unless both __VEC__ and __ALTIVEC__ are defined;
   the #error text directs the user to the -maltivec flag.  */
33 #if !defined(__VEC__) || !defined(__ALTIVEC__) | |
34 #error Use the "-maltivec" flag to enable PowerPC AltiVec support | |
35 #endif | |
36 | |
37 /* If __APPLE_ALTIVEC__ is defined, the compiler supports 'vector', | |
38 'pixel' and 'bool' as context-sensitive AltiVec keywords (in | |
39 non-AltiVec contexts, they revert to their original meanings, | |
40 if any), so we do not need to define them as macros. */ | |
41 | |
42 #if !defined(__APPLE_ALTIVEC__) | |
43 /* You are allowed to undef these for C++ compatibility. */ | |
44 #define vector __vector | |
45 #define pixel __pixel | |
46 #define bool __bool | |
47 #endif | |
48 | |
49 /* Condition register codes for AltiVec predicates. */ | |
50 | |
/* Selector values passed as the first argument to most of the *_p
   predicate builtins used by the vec_all_* and vec_any_* definitions later
   in this header.
   NOTE(review): which CR6 bit each code tests, and what the _REV variants
   invert, is not visible in this file -- confirm against the rs6000
   back end.  */
51 #define __CR6_EQ 0 | |
52 #define __CR6_EQ_REV 1 | |
53 #define __CR6_LT 2 | |
54 #define __CR6_LT_REV 3 | |
55 | |
56 /* Synonyms.
   Each name on the left is an alternative spelling that expands to another
   vec_* macro defined in this header (for example vec_vand -> vec_and,
   which is itself defined as __builtin_vec_and further down).  The one
   exception in this list is vec_permxor, which expands directly to
   __builtin_vec_vpermxor.  */ | |
57 #define vec_vaddcuw vec_addc | |
58 #define vec_vand vec_and | |
59 #define vec_vandc vec_andc | |
60 #define vec_vrfip vec_ceil | |
61 #define vec_vcmpbfp vec_cmpb | |
62 #define vec_vcmpgefp vec_cmpge | |
63 #define vec_vctsxs vec_cts | |
64 #define vec_vctuxs vec_ctu | |
65 #define vec_vexptefp vec_expte | |
66 #define vec_vrfim vec_floor | |
67 #define vec_lvx vec_ld | |
68 #define vec_lvxl vec_ldl | |
69 #define vec_vlogefp vec_loge | |
70 #define vec_vmaddfp vec_madd | |
71 #define vec_vmhaddshs vec_madds | |
72 #define vec_vmladduhm vec_mladd | |
73 #define vec_vmhraddshs vec_mradds | |
74 #define vec_vnmsubfp vec_nmsub | |
75 #define vec_vnor vec_nor | |
76 #define vec_vor vec_or | |
77 #define vec_vpkpx vec_packpx | |
78 #define vec_vperm vec_perm | |
131 | 79 #define vec_permxor __builtin_vec_vpermxor |
0 | 80 #define vec_vrefp vec_re |
81 #define vec_vrfin vec_round | |
82 #define vec_vrsqrtefp vec_rsqrte | |
83 #define vec_vsel vec_sel | |
84 #define vec_vsldoi vec_sld | |
85 #define vec_vsl vec_sll | |
86 #define vec_vslo vec_slo | |
87 #define vec_vspltisb vec_splat_s8 | |
88 #define vec_vspltish vec_splat_s16 | |
89 #define vec_vspltisw vec_splat_s32 | |
90 #define vec_vsr vec_srl | |
91 #define vec_vsro vec_sro | |
92 #define vec_stvx vec_st | |
93 #define vec_stvxl vec_stl | |
94 #define vec_vsubcuw vec_subc | |
95 #define vec_vsum2sws vec_sum2s | |
96 #define vec_vsumsws vec_sums | |
97 #define vec_vrfiz vec_trunc | |
98 #define vec_vxor vec_xor | |
99 | |
100 /* Functions that are resolved by the backend to one of the | |
101 typed builtins. */ | |
102 #define vec_vaddfp __builtin_vec_vaddfp | |
103 #define vec_addc __builtin_vec_addc | |
111 | 104 #define vec_adde __builtin_vec_adde |
105 #define vec_addec __builtin_vec_addec | |
0 | 106 #define vec_vaddsws __builtin_vec_vaddsws |
107 #define vec_vaddshs __builtin_vec_vaddshs | |
108 #define vec_vaddsbs __builtin_vec_vaddsbs | |
109 #define vec_vavgsw __builtin_vec_vavgsw | |
110 #define vec_vavguw __builtin_vec_vavguw | |
111 #define vec_vavgsh __builtin_vec_vavgsh | |
112 #define vec_vavguh __builtin_vec_vavguh | |
113 #define vec_vavgsb __builtin_vec_vavgsb | |
114 #define vec_vavgub __builtin_vec_vavgub | |
115 #define vec_ceil __builtin_vec_ceil | |
116 #define vec_cmpb __builtin_vec_cmpb | |
117 #define vec_vcmpeqfp __builtin_vec_vcmpeqfp | |
118 #define vec_cmpge __builtin_vec_cmpge | |
119 #define vec_vcmpgtfp __builtin_vec_vcmpgtfp | |
120 #define vec_vcmpgtsw __builtin_vec_vcmpgtsw | |
121 #define vec_vcmpgtuw __builtin_vec_vcmpgtuw | |
122 #define vec_vcmpgtsh __builtin_vec_vcmpgtsh | |
123 #define vec_vcmpgtuh __builtin_vec_vcmpgtuh | |
124 #define vec_vcmpgtsb __builtin_vec_vcmpgtsb | |
125 #define vec_vcmpgtub __builtin_vec_vcmpgtub | |
126 #define vec_vcfsx __builtin_vec_vcfsx | |
127 #define vec_vcfux __builtin_vec_vcfux | |
128 #define vec_cts __builtin_vec_cts | |
129 #define vec_ctu __builtin_vec_ctu | |
111 | 130 #define vec_cpsgn __builtin_vec_copysign |
131 #define vec_double __builtin_vec_double | |
132 #define vec_doublee __builtin_vec_doublee | |
133 #define vec_doubleo __builtin_vec_doubleo | |
134 #define vec_doublel __builtin_vec_doublel | |
135 #define vec_doubleh __builtin_vec_doubleh | |
0 | 136 #define vec_expte __builtin_vec_expte |
111 | 137 #define vec_float __builtin_vec_float |
138 #define vec_float2 __builtin_vec_float2 | |
139 #define vec_floate __builtin_vec_floate | |
140 #define vec_floato __builtin_vec_floato | |
0 | 141 #define vec_floor __builtin_vec_floor |
142 #define vec_loge __builtin_vec_loge | |
143 #define vec_madd __builtin_vec_madd | |
144 #define vec_madds __builtin_vec_madds | |
145 #define vec_mtvscr __builtin_vec_mtvscr | |
111 | 146 #define vec_reve __builtin_vec_vreve |
0 | 147 #define vec_vmaxfp __builtin_vec_vmaxfp |
148 #define vec_vmaxsw __builtin_vec_vmaxsw | |
149 #define vec_vmaxsh __builtin_vec_vmaxsh | |
150 #define vec_vmaxsb __builtin_vec_vmaxsb | |
151 #define vec_vminfp __builtin_vec_vminfp | |
152 #define vec_vminsw __builtin_vec_vminsw | |
153 #define vec_vminsh __builtin_vec_vminsh | |
154 #define vec_vminsb __builtin_vec_vminsb | |
155 #define vec_mradds __builtin_vec_mradds | |
156 #define vec_vmsumshm __builtin_vec_vmsumshm | |
157 #define vec_vmsumuhm __builtin_vec_vmsumuhm | |
158 #define vec_vmsummbm __builtin_vec_vmsummbm | |
159 #define vec_vmsumubm __builtin_vec_vmsumubm | |
160 #define vec_vmsumshs __builtin_vec_vmsumshs | |
161 #define vec_vmsumuhs __builtin_vec_vmsumuhs | |
162 #define vec_vmulesb __builtin_vec_vmulesb | |
163 #define vec_vmulesh __builtin_vec_vmulesh | |
164 #define vec_vmuleuh __builtin_vec_vmuleuh | |
165 #define vec_vmuleub __builtin_vec_vmuleub | |
166 #define vec_vmulosh __builtin_vec_vmulosh | |
167 #define vec_vmulouh __builtin_vec_vmulouh | |
168 #define vec_vmulosb __builtin_vec_vmulosb | |
169 #define vec_vmuloub __builtin_vec_vmuloub | |
170 #define vec_nmsub __builtin_vec_nmsub | |
171 #define vec_packpx __builtin_vec_packpx | |
172 #define vec_vpkswss __builtin_vec_vpkswss | |
173 #define vec_vpkuwus __builtin_vec_vpkuwus | |
174 #define vec_vpkshss __builtin_vec_vpkshss | |
175 #define vec_vpkuhus __builtin_vec_vpkuhus | |
176 #define vec_vpkswus __builtin_vec_vpkswus | |
177 #define vec_vpkshus __builtin_vec_vpkshus | |
178 #define vec_re __builtin_vec_re | |
179 #define vec_round __builtin_vec_round | |
67
f6334be47118
update gcc from gcc-4.6-20100522 to gcc-4.6-20110318
nobuyasu <dimolto@cr.ie.u-ryukyu.ac.jp>
parents:
55
diff
changeset
|
180 #define vec_recipdiv __builtin_vec_recipdiv |
/* vec_rlmi and vec_vrlnm are plain aliases for their builtins.  vec_rlnm is
   a three-argument convenience form over the same __builtin_vec_rlnm that
   vec_vrlnm names: it folds b and c into the builtin's single second
   operand as ((b) << 8) | (c).  */
111 | 181 #define vec_rlmi __builtin_vec_rlmi |
182 #define vec_vrlnm __builtin_vec_rlnm | |
183 #define vec_rlnm(a,b,c) (__builtin_vec_rlnm((a),((b)<<8)|(c))) | |
67
f6334be47118
update gcc from gcc-4.6-20100522 to gcc-4.6-20110318
nobuyasu <dimolto@cr.ie.u-ryukyu.ac.jp>
parents:
55
diff
changeset
|
184 #define vec_rsqrt __builtin_vec_rsqrt |
0 | 185 #define vec_rsqrte __builtin_vec_rsqrte |
111 | 186 #define vec_signed __builtin_vec_vsigned |
187 #define vec_signed2 __builtin_vec_vsigned2 | |
188 #define vec_signede __builtin_vec_vsignede | |
189 #define vec_signedo __builtin_vec_vsignedo | |
190 #define vec_unsigned __builtin_vec_vunsigned | |
191 #define vec_unsigned2 __builtin_vec_vunsigned2 | |
192 #define vec_unsignede __builtin_vec_vunsignede | |
193 #define vec_unsignedo __builtin_vec_vunsignedo | |
0 | 194 #define vec_vsubfp __builtin_vec_vsubfp |
195 #define vec_subc __builtin_vec_subc | |
111 | 196 #define vec_sube __builtin_vec_sube |
197 #define vec_subec __builtin_vec_subec | |
0 | 198 #define vec_vsubsws __builtin_vec_vsubsws |
199 #define vec_vsubshs __builtin_vec_vsubshs | |
200 #define vec_vsubsbs __builtin_vec_vsubsbs | |
201 #define vec_sum4s __builtin_vec_sum4s | |
202 #define vec_vsum4shs __builtin_vec_vsum4shs | |
203 #define vec_vsum4sbs __builtin_vec_vsum4sbs | |
204 #define vec_vsum4ubs __builtin_vec_vsum4ubs | |
205 #define vec_sum2s __builtin_vec_sum2s | |
206 #define vec_sums __builtin_vec_sums | |
207 #define vec_trunc __builtin_vec_trunc | |
208 #define vec_vupkhpx __builtin_vec_vupkhpx | |
209 #define vec_vupkhsh __builtin_vec_vupkhsh | |
210 #define vec_vupkhsb __builtin_vec_vupkhsb | |
211 #define vec_vupklpx __builtin_vec_vupklpx | |
212 #define vec_vupklsh __builtin_vec_vupklsh | |
213 #define vec_vupklsb __builtin_vec_vupklsb | |
214 #define vec_abs __builtin_vec_abs | |
111 | 215 #define vec_nabs __builtin_vec_nabs |
0 | 216 #define vec_abss __builtin_vec_abss |
217 #define vec_add __builtin_vec_add | |
218 #define vec_adds __builtin_vec_adds | |
219 #define vec_and __builtin_vec_and | |
220 #define vec_andc __builtin_vec_andc | |
221 #define vec_avg __builtin_vec_avg | |
222 #define vec_cmpeq __builtin_vec_cmpeq | |
111 | 223 #define vec_cmpne __builtin_vec_cmpne |
0 | 224 #define vec_cmpgt __builtin_vec_cmpgt |
225 #define vec_ctf __builtin_vec_ctf | |
226 #define vec_dst __builtin_vec_dst | |
227 #define vec_dstst __builtin_vec_dstst | |
228 #define vec_dststt __builtin_vec_dststt | |
229 #define vec_dstt __builtin_vec_dstt | |
230 #define vec_ld __builtin_vec_ld | |
231 #define vec_lde __builtin_vec_lde | |
232 #define vec_ldl __builtin_vec_ldl | |
233 #define vec_lvebx __builtin_vec_lvebx | |
234 #define vec_lvehx __builtin_vec_lvehx | |
235 #define vec_lvewx __builtin_vec_lvewx | |
111 | 236 #define vec_neg __builtin_vec_neg |
237 #define vec_pmsum_be __builtin_vec_vpmsum | |
238 #define vec_shasigma_be __builtin_crypto_vshasigma | |
0 | 239 /* Cell only intrinsics. */ |
240 #ifdef __PPU__ | |
241 #define vec_lvlx __builtin_vec_lvlx | |
242 #define vec_lvlxl __builtin_vec_lvlxl | |
243 #define vec_lvrx __builtin_vec_lvrx | |
244 #define vec_lvrxl __builtin_vec_lvrxl | |
245 #endif | |
246 #define vec_lvsl __builtin_vec_lvsl | |
247 #define vec_lvsr __builtin_vec_lvsr | |
248 #define vec_max __builtin_vec_max | |
111 | 249 #define vec_mergee __builtin_vec_vmrgew |
0 | 250 #define vec_mergeh __builtin_vec_mergeh |
251 #define vec_mergel __builtin_vec_mergel | |
111 | 252 #define vec_mergeo __builtin_vec_vmrgow |
0 | 253 #define vec_min __builtin_vec_min |
254 #define vec_mladd __builtin_vec_mladd | |
255 #define vec_msum __builtin_vec_msum | |
256 #define vec_msums __builtin_vec_msums | |
111 | 257 #define vec_mul __builtin_vec_mul |
0 | 258 #define vec_mule __builtin_vec_mule |
259 #define vec_mulo __builtin_vec_mulo | |
260 #define vec_nor __builtin_vec_nor | |
261 #define vec_or __builtin_vec_or | |
262 #define vec_pack __builtin_vec_pack | |
263 #define vec_packs __builtin_vec_packs | |
264 #define vec_packsu __builtin_vec_packsu | |
265 #define vec_perm __builtin_vec_perm | |
266 #define vec_rl __builtin_vec_rl | |
267 #define vec_sel __builtin_vec_sel | |
268 #define vec_sl __builtin_vec_sl | |
269 #define vec_sld __builtin_vec_sld | |
111 | 270 #define vec_sldw __builtin_vsx_xxsldwi |
0 | 271 #define vec_sll __builtin_vec_sll |
272 #define vec_slo __builtin_vec_slo | |
273 #define vec_splat __builtin_vec_splat | |
274 #define vec_sr __builtin_vec_sr | |
275 #define vec_sra __builtin_vec_sra | |
276 #define vec_srl __builtin_vec_srl | |
277 #define vec_sro __builtin_vec_sro | |
278 #define vec_st __builtin_vec_st | |
279 #define vec_ste __builtin_vec_ste | |
280 #define vec_stl __builtin_vec_stl | |
281 #define vec_stvebx __builtin_vec_stvebx | |
282 #define vec_stvehx __builtin_vec_stvehx | |
283 #define vec_stvewx __builtin_vec_stvewx | |
284 /* Cell only intrinsics. */ | |
285 #ifdef __PPU__ | |
286 #define vec_stvlx __builtin_vec_stvlx | |
287 #define vec_stvlxl __builtin_vec_stvlxl | |
288 #define vec_stvrx __builtin_vec_stvrx | |
289 #define vec_stvrxl __builtin_vec_stvrxl | |
290 #endif | |
291 #define vec_sub __builtin_vec_sub | |
292 #define vec_subs __builtin_vec_subs | |
293 #define vec_sum __builtin_vec_sum | |
294 #define vec_unpackh __builtin_vec_unpackh | |
295 #define vec_unpackl __builtin_vec_unpackl | |
296 #define vec_vaddubm __builtin_vec_vaddubm | |
297 #define vec_vaddubs __builtin_vec_vaddubs | |
298 #define vec_vadduhm __builtin_vec_vadduhm | |
299 #define vec_vadduhs __builtin_vec_vadduhs | |
300 #define vec_vadduwm __builtin_vec_vadduwm | |
301 #define vec_vadduws __builtin_vec_vadduws | |
302 #define vec_vcmpequb __builtin_vec_vcmpequb | |
303 #define vec_vcmpequh __builtin_vec_vcmpequh | |
304 #define vec_vcmpequw __builtin_vec_vcmpequw | |
305 #define vec_vmaxub __builtin_vec_vmaxub | |
306 #define vec_vmaxuh __builtin_vec_vmaxuh | |
307 #define vec_vmaxuw __builtin_vec_vmaxuw | |
308 #define vec_vminub __builtin_vec_vminub | |
309 #define vec_vminuh __builtin_vec_vminuh | |
310 #define vec_vminuw __builtin_vec_vminuw | |
311 #define vec_vmrghb __builtin_vec_vmrghb | |
312 #define vec_vmrghh __builtin_vec_vmrghh | |
313 #define vec_vmrghw __builtin_vec_vmrghw | |
314 #define vec_vmrglb __builtin_vec_vmrglb | |
315 #define vec_vmrglh __builtin_vec_vmrglh | |
316 #define vec_vmrglw __builtin_vec_vmrglw | |
317 #define vec_vpkuhum __builtin_vec_vpkuhum | |
318 #define vec_vpkuwum __builtin_vec_vpkuwum | |
319 #define vec_vrlb __builtin_vec_vrlb | |
320 #define vec_vrlh __builtin_vec_vrlh | |
321 #define vec_vrlw __builtin_vec_vrlw | |
322 #define vec_vslb __builtin_vec_vslb | |
323 #define vec_vslh __builtin_vec_vslh | |
324 #define vec_vslw __builtin_vec_vslw | |
325 #define vec_vspltb __builtin_vec_vspltb | |
326 #define vec_vsplth __builtin_vec_vsplth | |
327 #define vec_vspltw __builtin_vec_vspltw | |
328 #define vec_vsrab __builtin_vec_vsrab | |
329 #define vec_vsrah __builtin_vec_vsrah | |
330 #define vec_vsraw __builtin_vec_vsraw | |
331 #define vec_vsrb __builtin_vec_vsrb | |
332 #define vec_vsrh __builtin_vec_vsrh | |
333 #define vec_vsrw __builtin_vec_vsrw | |
334 #define vec_vsububs __builtin_vec_vsububs | |
335 #define vec_vsububm __builtin_vec_vsububm | |
336 #define vec_vsubuhm __builtin_vec_vsubuhm | |
337 #define vec_vsubuhs __builtin_vec_vsubuhs | |
338 #define vec_vsubuwm __builtin_vec_vsubuwm | |
339 #define vec_vsubuws __builtin_vec_vsubuws | |
340 #define vec_xor __builtin_vec_xor | |
341 | |
342 #define vec_extract __builtin_vec_extract | |
343 #define vec_insert __builtin_vec_insert | |
344 #define vec_splats __builtin_vec_splats | |
345 #define vec_promote __builtin_vec_promote | |
346 | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
347 #ifdef __VSX__ |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
348 /* VSX additions */ |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
349 #define vec_div __builtin_vec_div |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
/* Redundant: vec_mul is already defined unconditionally, with this same
   expansion, earlier in this header.  The identical redefinition is
   harmless.  */
350 #define vec_mul __builtin_vec_mul |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
351 #define vec_msub __builtin_vec_msub |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
352 #define vec_nmadd __builtin_vec_nmadd |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
353 #define vec_nearbyint __builtin_vec_nearbyint |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
354 #define vec_rint __builtin_vec_rint |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
355 #define vec_sqrt __builtin_vec_sqrt |
67
f6334be47118
update gcc from gcc-4.6-20100522 to gcc-4.6-20110318
nobuyasu <dimolto@cr.ie.u-ryukyu.ac.jp>
parents:
55
diff
changeset
|
356 #define vec_vsx_ld __builtin_vec_vsx_ld |
f6334be47118
update gcc from gcc-4.6-20100522 to gcc-4.6-20110318
nobuyasu <dimolto@cr.ie.u-ryukyu.ac.jp>
parents:
55
diff
changeset
|
357 #define vec_vsx_st __builtin_vec_vsx_st |
111 | 358 #define vec_xl __builtin_vec_vsx_ld |
359 #define vec_xl_be __builtin_vec_xl_be | |
360 #define vec_xst __builtin_vec_vsx_st | |
131 | 361 #define vec_xst_be __builtin_vec_xst_be |
111 | 362 |
363 /* Note, xxsldwi and xxpermdi were added as __builtin_vsx_<xxx> functions | |
364 instead of __builtin_vec_<xxx>. */ | |
365 #define vec_xxsldwi __builtin_vsx_xxsldwi | |
366 #define vec_xxpermdi __builtin_vsx_xxpermdi | |
367 #endif | |
368 | |
369 #ifdef _ARCH_PWR8 | |
370 /* Vector additions added in ISA 2.07. */ | |
371 #define vec_eqv __builtin_vec_eqv | |
372 #define vec_nand __builtin_vec_nand | |
373 #define vec_orc __builtin_vec_orc | |
374 #define vec_vaddcuq __builtin_vec_vaddcuq | |
375 #define vec_vaddudm __builtin_vec_vaddudm | |
376 #define vec_vadduqm __builtin_vec_vadduqm | |
377 #define vec_vbpermq __builtin_vec_vbpermq | |
378 #define vec_bperm __builtin_vec_vbperm_api | |
379 #define vec_vclz __builtin_vec_vclz | |
380 #define vec_cntlz __builtin_vec_vclz | |
381 #define vec_vclzb __builtin_vec_vclzb | |
382 #define vec_vclzd __builtin_vec_vclzd | |
383 #define vec_vclzh __builtin_vec_vclzh | |
384 #define vec_vclzw __builtin_vec_vclzw | |
385 #define vec_vaddecuq __builtin_vec_vaddecuq | |
386 #define vec_vaddeuqm __builtin_vec_vaddeuqm | |
387 #define vec_vsubecuq __builtin_vec_vsubecuq | |
388 #define vec_vsubeuqm __builtin_vec_vsubeuqm | |
389 #define vec_vgbbd __builtin_vec_vgbbd | |
390 #define vec_gb __builtin_vec_vgbbd | |
391 #define vec_vmaxsd __builtin_vec_vmaxsd | |
392 #define vec_vmaxud __builtin_vec_vmaxud | |
393 #define vec_vminsd __builtin_vec_vminsd | |
394 #define vec_vminud __builtin_vec_vminud | |
395 #define vec_vmrgew __builtin_vec_vmrgew | |
396 #define vec_vmrgow __builtin_vec_vmrgow | |
397 #define vec_vpksdss __builtin_vec_vpksdss | |
398 #define vec_vpksdus __builtin_vec_vpksdus | |
399 #define vec_vpkudum __builtin_vec_vpkudum | |
400 #define vec_vpkudus __builtin_vec_vpkudus | |
401 #define vec_vpopcnt __builtin_vec_vpopcnt | |
402 #define vec_vpopcntb __builtin_vec_vpopcntb | |
403 #define vec_vpopcntd __builtin_vec_vpopcntd | |
404 #define vec_vpopcnth __builtin_vec_vpopcnth | |
405 #define vec_vpopcntw __builtin_vec_vpopcntw | |
406 #define vec_popcnt __builtin_vec_vpopcntu | |
407 #define vec_popcntb __builtin_vec_vpopcntub | |
408 #define vec_popcnth __builtin_vec_vpopcntuh | |
409 #define vec_popcntw __builtin_vec_vpopcntuw | |
410 #define vec_popcntd __builtin_vec_vpopcntud | |
411 #define vec_vrld __builtin_vec_vrld | |
412 #define vec_vsld __builtin_vec_vsld | |
413 #define vec_vsrad __builtin_vec_vsrad | |
414 #define vec_vsrd __builtin_vec_vsrd | |
415 #define vec_vsubcuq __builtin_vec_vsubcuq | |
416 #define vec_vsubudm __builtin_vec_vsubudm | |
417 #define vec_vsubuqm __builtin_vec_vsubuqm | |
418 #define vec_vupkhsw __builtin_vec_vupkhsw | |
419 #define vec_vupklsw __builtin_vec_vupklsw | |
131 | 420 #define vec_revb __builtin_vec_revb |
111 | 421 #endif |
422 | |
423 #ifdef __POWER9_VECTOR__ | |
424 /* Vector additions added in ISA 3.0. */ | |
131 | 425 #define vec_first_match_index __builtin_vec_first_match_index |
426 #define vec_first_match_or_eos_index __builtin_vec_first_match_or_eos_index | |
427 #define vec_first_mismatch_index __builtin_vec_first_mismatch_index | |
428 #define vec_first_mismatch_or_eos_index __builtin_vec_first_mismatch_or_eos_index | |
111 | 429 #define vec_pack_to_short_fp32 __builtin_vec_convert_4f32_8i16 |
430 #define vec_parity_lsbb __builtin_vec_vparity_lsbb | |
431 #define vec_vctz __builtin_vec_vctz | |
432 #define vec_cnttz __builtin_vec_vctz | |
433 #define vec_vctzb __builtin_vec_vctzb | |
434 #define vec_vctzd __builtin_vec_vctzd | |
435 #define vec_vctzh __builtin_vec_vctzh | |
436 #define vec_vctzw __builtin_vec_vctzw | |
131 | 437 #define vec_extract4b __builtin_vec_extract4b |
438 #define vec_insert4b __builtin_vec_insert4b | |
111 | 439 #define vec_vprtyb __builtin_vec_vprtyb |
440 #define vec_vprtybd __builtin_vec_vprtybd | |
441 #define vec_vprtybw __builtin_vec_vprtybw | |
442 | |
443 #ifdef _ARCH_PPC64 | |
444 #define vec_vprtybq __builtin_vec_vprtybq | |
445 #endif | |
446 | |
447 #define vec_absd __builtin_vec_vadu | |
448 #define vec_absdb __builtin_vec_vadub | |
449 #define vec_absdh __builtin_vec_vaduh | |
450 #define vec_absdw __builtin_vec_vaduw | |
451 | |
452 #define vec_slv __builtin_vec_vslv | |
453 #define vec_srv __builtin_vec_vsrv | |
454 | |
455 #define vec_extract_exp __builtin_vec_extract_exp | |
456 #define vec_extract_sig __builtin_vec_extract_sig | |
457 #define vec_insert_exp __builtin_vec_insert_exp | |
458 #define vec_test_data_class __builtin_vec_test_data_class | |
459 | |
460 #define vec_extract_fp_from_shorth __builtin_vec_vextract_fp_from_shorth | |
461 #define vec_extract_fp_from_shortl __builtin_vec_vextract_fp_from_shortl | |
131 | 462 #define vec_extract_fp32_from_shorth __builtin_vec_vextract_fp_from_shorth |
463 #define vec_extract_fp32_from_shortl __builtin_vec_vextract_fp_from_shortl | |
111 | 464 |
465 #define scalar_extract_exp __builtin_vec_scalar_extract_exp | |
466 #define scalar_extract_sig __builtin_vec_scalar_extract_sig | |
467 #define scalar_insert_exp __builtin_vec_scalar_insert_exp | |
468 #define scalar_test_data_class __builtin_vec_scalar_test_data_class | |
469 #define scalar_test_neg __builtin_vec_scalar_test_neg | |
470 | |
471 #define scalar_cmp_exp_gt __builtin_vec_scalar_cmp_exp_gt | |
472 #define scalar_cmp_exp_lt __builtin_vec_scalar_cmp_exp_lt | |
473 #define scalar_cmp_exp_eq __builtin_vec_scalar_cmp_exp_eq | |
474 #define scalar_cmp_exp_unordered __builtin_vec_scalar_cmp_exp_unordered | |
475 | |
476 #ifdef _ARCH_PPC64 | |
477 #define vec_xl_len __builtin_vec_lxvl | |
478 #define vec_xst_len __builtin_vec_stxvl | |
479 #define vec_xl_len_r __builtin_vec_xl_len_r | |
480 #define vec_xst_len_r __builtin_vec_xst_len_r | |
481 #endif | |
482 | |
483 #define vec_cmpnez __builtin_vec_vcmpnez | |
484 | |
485 #define vec_cntlz_lsbb __builtin_vec_vclzlsbb | |
486 #define vec_cnttz_lsbb __builtin_vec_vctzlsbb | |
487 | |
488 #define vec_xlx __builtin_vec_vextulx | |
489 #define vec_xrx __builtin_vec_vexturx | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
490 #endif |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
491 |
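0 | 492 /* Predicates. |
493 For C++, we use templates in order to allow non-parenthesized arguments. | |
494 For C, instead, we use macros since non-parenthesized arguments were | |
495 not allowed even in older GCC implementations of AltiVec. | |
496 | |
497 In the future, we may add more magic to the back-end, so that no | |
498 one- or two-argument macros are used. | |
NOTE(review): the template branch below is guarded by `__cplusplus__', | |
not the standard `__cplusplus' macro -- confirm whether that branch is | |
ever selected; if it is not, C++ code also gets the macro versions. */ | |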
499 | |
500 #ifdef __cplusplus__ | |
/* Define a function template NAME that takes one argument, a1, and returns
   int.  CALL is the expression returned; it may refer to a1.  */
501 #define __altivec_unary_pred(NAME, CALL) \ | |
502 template <class T> int NAME (T a1) { return CALL; } | |
503 | |
/* Same as above for two arguments, a1 and a2, whose types are deduced
   independently (T and U).  The result is still a scalar int.  */
504 #define __altivec_scalar_pred(NAME, CALL) \ | |
505 template <class T, class U> int NAME (T a1, U a2) { return CALL; } | |
506 | |
507 /* Given the vec_step of a type, return the corresponding bool type.
   The primary template is empty; the specializations for STEP values 4, 8
   and 16 expose the matching __vector __bool type as the member typedef
   __ret.  These are structs rather than classes so that __ret is publicly
   accessible: __altivec_binary_pred names
   __altivec_bool_ret <...>::__ret as its return type from outside the
   type, which a default-private class member would not permit.  */ | |
508 template <int STEP> struct __altivec_bool_ret { }; | |
509 template <> struct __altivec_bool_ret <4> { | |
510 typedef __vector __bool int __ret; | |
511 }; | |
512 template <> struct __altivec_bool_ret <8> { | |
513 typedef __vector __bool short __ret; | |
514 }; | |
515 template <> struct __altivec_bool_ret <16> { | |
516 typedef __vector __bool char __ret; | |
517 }; | |
518 | |
519 /* Be very liberal in the pairs we accept. Mistakes such as passing | |
520 a `vector char' and `vector short' will be caught by the middle-end, | |
521 while any attempt to detect them here would produce hard to understand | |
522 error messages involving the implementation details of AltiVec. */ | |
/* Define a two-argument function template NAME.  Its return type is
   __altivec_bool_ret <vec_step (T)>::__ret, so it is selected from the
   first argument's type T only; U does not take part.  CALL is the
   expression returned and may refer to a1 and a2.  */
523 #define __altivec_binary_pred(NAME, CALL) \ | |
524 template <class T, class U> \ | |
525 typename __altivec_bool_ret <vec_step (T)>::__ret \ | |
526 NAME (T a1, U a2) \ | |
527 { \ | |
528 return CALL; \ | |
529 } | |
530 | |
531 __altivec_binary_pred(vec_cmplt, | |
532 __builtin_vec_cmpgt (a2, a1)) | |
533 __altivec_binary_pred(vec_cmple, | |
534 __builtin_vec_cmpge (a2, a1)) | |
535 | |
536 __altivec_scalar_pred(vec_all_in, | |
537 __builtin_altivec_vcmpbfp_p (__CR6_EQ, a1, a2)) | |
538 __altivec_scalar_pred(vec_any_out, | |
539 __builtin_altivec_vcmpbfp_p (__CR6_EQ_REV, a1, a2)) | |
540 | |
541 __altivec_unary_pred(vec_all_nan, | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
542 __builtin_altivec_vcmpeq_p (__CR6_EQ, a1, a1)) |
0 | 543 __altivec_unary_pred(vec_any_nan, |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
544 __builtin_altivec_vcmpeq_p (__CR6_LT_REV, a1, a1)) |
0 | 545 |
546 __altivec_unary_pred(vec_all_numeric, | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
547 __builtin_altivec_vcmpeq_p (__CR6_LT, a1, a1)) |
0 | 548 __altivec_unary_pred(vec_any_numeric, |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
549 __builtin_altivec_vcmpeq_p (__CR6_EQ_REV, a1, a1)) |
0 | 550 |
551 __altivec_scalar_pred(vec_all_eq, | |
552 __builtin_vec_vcmpeq_p (__CR6_LT, a1, a2)) | |
111 | 553 |
554 #ifndef __POWER9_VECTOR__ | |
0 | 555 __altivec_scalar_pred(vec_all_ne, |
556 __builtin_vec_vcmpeq_p (__CR6_EQ, a1, a2)) | |
557 __altivec_scalar_pred(vec_any_eq, | |
558 __builtin_vec_vcmpeq_p (__CR6_EQ_REV, a1, a2)) | |
111 | 559 #else |
560 __altivec_scalar_pred(vec_all_nez, | |
561 __builtin_vec_vcmpnez_p (__CR6_LT, a1, a2)) | |
562 __altivec_scalar_pred(vec_any_eqz, | |
563 __builtin_vec_vcmpnez_p (__CR6_LT_REV, a1, a2)) | |
564 __altivec_scalar_pred(vec_all_ne, | |
565 __builtin_vec_vcmpne_p (a1, a2)) | |
566 __altivec_scalar_pred(vec_any_eq, | |
567 __builtin_vec_vcmpae_p (a1, a2)) | |
568 #endif | |
569 | |
0 | 570 __altivec_scalar_pred(vec_any_ne, |
571 __builtin_vec_vcmpeq_p (__CR6_LT_REV, a1, a2)) | |
572 | |
573 __altivec_scalar_pred(vec_all_gt, | |
574 __builtin_vec_vcmpgt_p (__CR6_LT, a1, a2)) | |
575 __altivec_scalar_pred(vec_all_lt, | |
576 __builtin_vec_vcmpgt_p (__CR6_LT, a2, a1)) | |
577 __altivec_scalar_pred(vec_any_gt, | |
578 __builtin_vec_vcmpgt_p (__CR6_EQ_REV, a1, a2)) | |
579 __altivec_scalar_pred(vec_any_lt, | |
580 __builtin_vec_vcmpgt_p (__CR6_EQ_REV, a2, a1)) | |
581 | |
582 __altivec_scalar_pred(vec_all_ngt, | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
583 __builtin_altivec_vcmpgt_p (__CR6_EQ, a1, a2)) |
0 | 584 __altivec_scalar_pred(vec_all_nlt, |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
585 __builtin_altivec_vcmpgt_p (__CR6_EQ, a2, a1)) |
0 | 586 __altivec_scalar_pred(vec_any_ngt, |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
587 __builtin_altivec_vcmpgt_p (__CR6_LT_REV, a1, a2)) |
0 | 588 __altivec_scalar_pred(vec_any_nlt, |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
589 __builtin_altivec_vcmpgt_p (__CR6_LT_REV, a2, a1)) |
0 | 590 |
591 /* __builtin_vec_vcmpge_p is vcmpgefp for floating-point vector types, | |
592 while for integer types it is converted to __builtin_vec_vcmpgt_p, | |
593 with inverted args and condition code. */ | |
594 __altivec_scalar_pred(vec_all_le, | |
595 __builtin_vec_vcmpge_p (__CR6_LT, a2, a1)) | |
596 __altivec_scalar_pred(vec_all_ge, | |
597 __builtin_vec_vcmpge_p (__CR6_LT, a1, a2)) | |
598 __altivec_scalar_pred(vec_any_le, | |
599 __builtin_vec_vcmpge_p (__CR6_EQ_REV, a2, a1)) | |
600 __altivec_scalar_pred(vec_any_ge, | |
601 __builtin_vec_vcmpge_p (__CR6_EQ_REV, a1, a2)) | |
602 | |
603 __altivec_scalar_pred(vec_all_nge, | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
604 __builtin_altivec_vcmpge_p (__CR6_EQ, a1, a2)) |
0 | 605 __altivec_scalar_pred(vec_all_nle, |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
606 __builtin_altivec_vcmpge_p (__CR6_EQ, a2, a1)) |
0 | 607 __altivec_scalar_pred(vec_any_nge, |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
608 __builtin_altivec_vcmpge_p (__CR6_LT_REV, a1, a2)) |
0 | 609 __altivec_scalar_pred(vec_any_nle, |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
610 __builtin_altivec_vcmpge_p (__CR6_LT_REV, a2, a1)) |
0 | 611 |
612 #undef __altivec_scalar_pred | |
613 #undef __altivec_unary_pred | |
614 #undef __altivec_binary_pred | |
615 #else | |
616 #define vec_cmplt(a1, a2) __builtin_vec_cmpgt ((a2), (a1)) | |
617 #define vec_cmple(a1, a2) __builtin_vec_cmpge ((a2), (a1)) | |
618 | |
619 #define vec_all_in(a1, a2) __builtin_altivec_vcmpbfp_p (__CR6_EQ, (a1), (a2)) | |
620 #define vec_any_out(a1, a2) __builtin_altivec_vcmpbfp_p (__CR6_EQ_REV, (a1), (a2)) | |
621 | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
622 #define vec_all_nan(a1) __builtin_vec_vcmpeq_p (__CR6_EQ, (a1), (a1)) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
623 #define vec_any_nan(a1) __builtin_vec_vcmpeq_p (__CR6_LT_REV, (a1), (a1)) |
0 | 624 |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
625 #define vec_all_numeric(a1) __builtin_vec_vcmpeq_p (__CR6_LT, (a1), (a1)) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
626 #define vec_any_numeric(a1) __builtin_vec_vcmpeq_p (__CR6_EQ_REV, (a1), (a1)) |
0 | 627 |
628 #define vec_all_eq(a1, a2) __builtin_vec_vcmpeq_p (__CR6_LT, (a1), (a2)) | |
111 | 629 |
/* vec_all_ne and vec_any_eq have two alternative definitions.  When
   __POWER9_VECTOR__ is defined they expand to the dedicated
   __builtin_vec_vcmpne_p / __builtin_vec_vcmpae_p builtins, which take no
   CR6 code, and vec_all_nez / vec_any_eqz are provided as well.  Otherwise
   they are expressed through __builtin_vec_vcmpeq_p with __CR6_EQ and
   __CR6_EQ_REV respectively.  */
630 #ifdef __POWER9_VECTOR__ | |
631 #define vec_all_nez(a1, a2) __builtin_vec_vcmpnez_p (__CR6_LT, (a1), (a2)) | |
632 #define vec_any_eqz(a1, a2) __builtin_vec_vcmpnez_p (__CR6_LT_REV, (a1), (a2)) | |
633 #define vec_all_ne(a1, a2) __builtin_vec_vcmpne_p ((a1), (a2)) | |
634 #define vec_any_eq(a1, a2) __builtin_vec_vcmpae_p ((a1), (a2)) | |
635 #else | |
0 | 636 #define vec_all_ne(a1, a2) __builtin_vec_vcmpeq_p (__CR6_EQ, (a1), (a2)) |
637 #define vec_any_eq(a1, a2) __builtin_vec_vcmpeq_p (__CR6_EQ_REV, (a1), (a2)) | |
111 | 638 #endif |
639 | |
0 | 640 #define vec_any_ne(a1, a2) __builtin_vec_vcmpeq_p (__CR6_LT_REV, (a1), (a2)) |
641 | |
642 #define vec_all_gt(a1, a2) __builtin_vec_vcmpgt_p (__CR6_LT, (a1), (a2)) | |
643 #define vec_all_lt(a1, a2) __builtin_vec_vcmpgt_p (__CR6_LT, (a2), (a1)) | |
644 #define vec_any_gt(a1, a2) __builtin_vec_vcmpgt_p (__CR6_EQ_REV, (a1), (a2)) | |
645 #define vec_any_lt(a1, a2) __builtin_vec_vcmpgt_p (__CR6_EQ_REV, (a2), (a1)) | |
646 | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
647 #define vec_all_ngt(a1, a2) __builtin_vec_vcmpgt_p (__CR6_EQ, (a1), (a2)) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
648 #define vec_all_nlt(a1, a2) __builtin_vec_vcmpgt_p (__CR6_EQ, (a2), (a1)) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
649 #define vec_any_ngt(a1, a2) __builtin_vec_vcmpgt_p (__CR6_LT_REV, (a1), (a2)) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
650 #define vec_any_nlt(a1, a2) __builtin_vec_vcmpgt_p (__CR6_LT_REV, (a2), (a1)) |
0 | 651 |
652 /* __builtin_vec_vcmpge_p is vcmpgefp for floating-point vector types, | |
653 while for integer types it is converted to __builtin_vec_vcmpgt_p, | |
654 with inverted args and condition code. */ | |
655 #define vec_all_le(a1, a2) __builtin_vec_vcmpge_p (__CR6_LT, (a2), (a1)) | |
656 #define vec_all_ge(a1, a2) __builtin_vec_vcmpge_p (__CR6_LT, (a1), (a2)) | |
657 #define vec_any_le(a1, a2) __builtin_vec_vcmpge_p (__CR6_EQ_REV, (a2), (a1)) | |
658 #define vec_any_ge(a1, a2) __builtin_vec_vcmpge_p (__CR6_EQ_REV, (a1), (a2)) | |
659 | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
660 #define vec_all_nge(a1, a2) __builtin_vec_vcmpge_p (__CR6_EQ, (a1), (a2)) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
661 #define vec_all_nle(a1, a2) __builtin_vec_vcmpge_p (__CR6_EQ, (a2), (a1)) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
662 #define vec_any_nge(a1, a2) __builtin_vec_vcmpge_p (__CR6_LT_REV, (a1), (a2)) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
663 #define vec_any_nle(a1, a2) __builtin_vec_vcmpge_p (__CR6_LT_REV, (a2), (a1)) |
0 | 664 #endif |
665 | |
666 /* The macros below have no __builtin_vec_* counterpart because they do | |
667 not accept vectors; they call the __builtin_altivec_* functions directly.
   The vec_splat_u* forms reuse the matching vec_splat_s* macro and cast its
   result to the unsigned vector type. */ | |
668 #define vec_dss(arg) __builtin_altivec_dss (arg) | |
669 #define vec_dssall() __builtin_altivec_dssall () | |
670 #define vec_mfvscr() ((__vector unsigned short) __builtin_altivec_mfvscr ()) | |
671 #define vec_splat_s8(arg) __builtin_altivec_vspltisb (arg) | |
672 #define vec_splat_s16(arg) __builtin_altivec_vspltish (arg) | |
673 #define vec_splat_s32(arg) __builtin_altivec_vspltisw (arg) | |
674 #define vec_splat_u8(arg) ((__vector unsigned char) vec_splat_s8 (arg)) | |
675 #define vec_splat_u16(arg) ((__vector unsigned short) vec_splat_s16 (arg)) | |
676 #define vec_splat_u32(arg) ((__vector unsigned int) vec_splat_s32 (arg)) | |
677 | |
678 /* This also accepts a type for its parameter, so it is not enough | |
679 to #define vec_step to __builtin_vec_step. */ | |
/* Wrap the argument in __typeof__ and dereference a null pointer to that
   type, so the builtin always receives an expression whether x was written
   as a type name or as an expression.
   NOTE(review): this relies on __builtin_vec_step looking only at the type
   of its operand and never evaluating it -- confirm.  */
680 #define vec_step(x) __builtin_vec_step (* (__typeof__ (x) *) 0) | |
681 | |
682 #endif /* _ALTIVEC_H */ |