1 /* PowerPC AltiVec include file.
2    Copyright (C) 2002-2018 Free Software Foundation, Inc.
3    Contributed by Aldy Hernandez (aldyh@redhat.com).
4    Rewritten by Paolo Bonzini (bonzini@gnu.org).
5 
6    This file is part of GCC.
7 
8    GCC is free software; you can redistribute it and/or modify it
9    under the terms of the GNU General Public License as published
10    by the Free Software Foundation; either version 3, or (at your
11    option) any later version.
12 
13    GCC is distributed in the hope that it will be useful, but WITHOUT
14    ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
15    or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public
16    License for more details.
17 
18    Under Section 7 of GPL version 3, you are granted additional
19    permissions described in the GCC Runtime Library Exception, version
20    3.1, as published by the Free Software Foundation.
21 
22    You should have received a copy of the GNU General Public License and
23    a copy of the GCC Runtime Library Exception along with this program;
24    see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see
25    <http://www.gnu.org/licenses/>.  */
26 
27 /* Implemented to conform to the specification included in the AltiVec
28    Technology Programming Interface Manual (ALTIVECPIM/D 6/1999 Rev 0).  */
29 
30 #ifndef _ALTIVEC_H
31 #define _ALTIVEC_H 1
32 
/* Stop the build with a hint unless the compiler has predefined both
   __VEC__ and __ALTIVEC__.  */
33 #if !(defined (__VEC__) && defined (__ALTIVEC__))
34 #error Use the "-maltivec" flag to enable PowerPC AltiVec support
35 #endif
36 
37 /* If __APPLE_ALTIVEC__ is defined, the compiler supports 'vector',
38    'pixel' and 'bool' as context-sensitive AltiVec keywords (in
39    non-AltiVec contexts, they revert to their original meanings,
40    if any), so we do not need to define them as macros.  */
41 
42 #ifndef __APPLE_ALTIVEC__
43 /* Plain spellings of the AltiVec keywords, mapped onto their
   double-underscore forms.  C++ code may undefine any of them if they
   get in the way.  */
44 #define vector __vector
45 #define pixel __pixel
46 #define bool __bool
47 #endif /* !__APPLE_ALTIVEC__ */
48 
49 /* Condition register codes for AltiVec predicates.
   Each code is passed as the first argument of the predicate builtins
   (the ones whose names end in _p) used by the vec_all_xxx and
   vec_any_xxx definitions later in this header.  Every _REV name is
   numbered one above its base code.  */
50 
51 #define __CR6_EQ		0
52 #define __CR6_EQ_REV		1
53 #define __CR6_LT		2
54 #define __CR6_LT_REV		3
55 
56 /* Synonyms.
   Alternative spellings mapped onto the generic vec_ names.  Each
   right-hand side is itself a macro defined further down in this header,
   so these aliases resolve in two expansion steps.  The one exception is
   vec_permxor, which names its builtin directly.  */
57 #define vec_vaddcuw vec_addc
58 #define vec_vand vec_and
59 #define vec_vandc vec_andc
60 #define vec_vrfip vec_ceil
61 #define vec_vcmpbfp vec_cmpb
62 #define vec_vcmpgefp vec_cmpge
63 #define vec_vctsxs vec_cts
64 #define vec_vctuxs vec_ctu
65 #define vec_vexptefp vec_expte
66 #define vec_vrfim vec_floor
67 #define vec_lvx vec_ld
68 #define vec_lvxl vec_ldl
69 #define vec_vlogefp vec_loge
70 #define vec_vmaddfp vec_madd
71 #define vec_vmhaddshs vec_madds
72 #define vec_vmladduhm vec_mladd
73 #define vec_vmhraddshs vec_mradds
74 #define vec_vnmsubfp vec_nmsub
75 #define vec_vnor vec_nor
76 #define vec_vor vec_or
77 #define vec_vpkpx vec_packpx
78 #define vec_vperm vec_perm
79 #define vec_permxor __builtin_vec_vpermxor
80 #define vec_vrefp vec_re
81 #define vec_vrfin vec_round
82 #define vec_vrsqrtefp vec_rsqrte
83 #define vec_vsel vec_sel
84 #define vec_vsldoi vec_sld
85 #define vec_vsl vec_sll
86 #define vec_vslo vec_slo
87 #define vec_vspltisb vec_splat_s8
88 #define vec_vspltish vec_splat_s16
89 #define vec_vspltisw vec_splat_s32
90 #define vec_vsr vec_srl
91 #define vec_vsro vec_sro
92 #define vec_stvx vec_st
93 #define vec_stvxl vec_stl
94 #define vec_vsubcuw vec_subc
95 #define vec_vsum2sws vec_sum2s
96 #define vec_vsumsws vec_sums
97 #define vec_vrfiz vec_trunc
98 #define vec_vxor vec_xor
99 
100 /* Functions that are resolved by the backend to one of the
101    typed builtins.  */
/* Object-like aliases: each name on the left is replaced by the builtin
   name on the right, and the caller's argument list is passed through
   unchanged.  Most expansions repeat the macro's own suffix; a few do
   not (vec_cpsgn, vec_reve, vec_vrlnm).  */
102 #define vec_vaddfp __builtin_vec_vaddfp
103 #define vec_addc __builtin_vec_addc
104 #define vec_adde __builtin_vec_adde
105 #define vec_addec __builtin_vec_addec
106 #define vec_vaddsws __builtin_vec_vaddsws
107 #define vec_vaddshs __builtin_vec_vaddshs
108 #define vec_vaddsbs __builtin_vec_vaddsbs
109 #define vec_vavgsw __builtin_vec_vavgsw
110 #define vec_vavguw __builtin_vec_vavguw
111 #define vec_vavgsh __builtin_vec_vavgsh
112 #define vec_vavguh __builtin_vec_vavguh
113 #define vec_vavgsb __builtin_vec_vavgsb
114 #define vec_vavgub __builtin_vec_vavgub
115 #define vec_ceil __builtin_vec_ceil
116 #define vec_cmpb __builtin_vec_cmpb
117 #define vec_vcmpeqfp __builtin_vec_vcmpeqfp
118 #define vec_cmpge __builtin_vec_cmpge
119 #define vec_vcmpgtfp __builtin_vec_vcmpgtfp
120 #define vec_vcmpgtsw __builtin_vec_vcmpgtsw
121 #define vec_vcmpgtuw __builtin_vec_vcmpgtuw
122 #define vec_vcmpgtsh __builtin_vec_vcmpgtsh
123 #define vec_vcmpgtuh __builtin_vec_vcmpgtuh
124 #define vec_vcmpgtsb __builtin_vec_vcmpgtsb
125 #define vec_vcmpgtub __builtin_vec_vcmpgtub
126 #define vec_vcfsx __builtin_vec_vcfsx
127 #define vec_vcfux __builtin_vec_vcfux
128 #define vec_cts __builtin_vec_cts
129 #define vec_ctu __builtin_vec_ctu
130 #define vec_cpsgn __builtin_vec_copysign
131 #define vec_double __builtin_vec_double
132 #define vec_doublee __builtin_vec_doublee
133 #define vec_doubleo __builtin_vec_doubleo
134 #define vec_doublel __builtin_vec_doublel
135 #define vec_doubleh __builtin_vec_doubleh
136 #define vec_expte __builtin_vec_expte
137 #define vec_float __builtin_vec_float
138 #define vec_float2 __builtin_vec_float2
139 #define vec_floate __builtin_vec_floate
140 #define vec_floato __builtin_vec_floato
141 #define vec_floor __builtin_vec_floor
142 #define vec_loge __builtin_vec_loge
143 #define vec_madd __builtin_vec_madd
144 #define vec_madds __builtin_vec_madds
145 #define vec_mtvscr __builtin_vec_mtvscr
146 #define vec_reve __builtin_vec_vreve
147 #define vec_vmaxfp __builtin_vec_vmaxfp
148 #define vec_vmaxsw __builtin_vec_vmaxsw
149 #define vec_vmaxsh __builtin_vec_vmaxsh
150 #define vec_vmaxsb __builtin_vec_vmaxsb
151 #define vec_vminfp __builtin_vec_vminfp
152 #define vec_vminsw __builtin_vec_vminsw
153 #define vec_vminsh __builtin_vec_vminsh
154 #define vec_vminsb __builtin_vec_vminsb
155 #define vec_mradds __builtin_vec_mradds
156 #define vec_vmsumshm __builtin_vec_vmsumshm
157 #define vec_vmsumuhm __builtin_vec_vmsumuhm
158 #define vec_vmsummbm __builtin_vec_vmsummbm
159 #define vec_vmsumubm __builtin_vec_vmsumubm
160 #define vec_vmsumshs __builtin_vec_vmsumshs
161 #define vec_vmsumuhs __builtin_vec_vmsumuhs
162 #define vec_vmulesb __builtin_vec_vmulesb
163 #define vec_vmulesh __builtin_vec_vmulesh
164 #define vec_vmuleuh __builtin_vec_vmuleuh
165 #define vec_vmuleub __builtin_vec_vmuleub
166 #define vec_vmulosh __builtin_vec_vmulosh
167 #define vec_vmulouh __builtin_vec_vmulouh
168 #define vec_vmulosb __builtin_vec_vmulosb
169 #define vec_vmuloub __builtin_vec_vmuloub
170 #define vec_nmsub __builtin_vec_nmsub
171 #define vec_packpx __builtin_vec_packpx
172 #define vec_vpkswss __builtin_vec_vpkswss
173 #define vec_vpkuwus __builtin_vec_vpkuwus
174 #define vec_vpkshss __builtin_vec_vpkshss
175 #define vec_vpkuhus __builtin_vec_vpkuhus
176 #define vec_vpkswus __builtin_vec_vpkswus
177 #define vec_vpkshus __builtin_vec_vpkshus
178 #define vec_re __builtin_vec_re
179 #define vec_round __builtin_vec_round
180 #define vec_recipdiv __builtin_vec_recipdiv
181 #define vec_rlmi __builtin_vec_rlmi
182 #define vec_vrlnm __builtin_vec_rlnm
/* vec_rlnm (a, b, c): rotate each element of A left, then AND it with a
   mask.  The builtin takes the rotate count and the mask bounds packed
   into one operand: the rotate count from B stays in the low-order byte,
   and the mask bytes from C are moved up by eight bits so they sit in
   the next higher bytes.  */
183 #define vec_rlnm(a,b,c) (__builtin_vec_rlnm((a),((c)<<8)|(b)))
/* More pass-through aliases; arguments are forwarded unchanged to the
   builtin on the right.  vec_pmsum_be and vec_shasigma_be expand to
   builtins whose names differ from the macro name.  */
184 #define vec_rsqrt __builtin_vec_rsqrt
185 #define vec_rsqrte __builtin_vec_rsqrte
186 #define vec_signed __builtin_vec_vsigned
187 #define vec_signed2 __builtin_vec_vsigned2
188 #define vec_signede __builtin_vec_vsignede
189 #define vec_signedo __builtin_vec_vsignedo
190 #define vec_unsigned __builtin_vec_vunsigned
191 #define vec_unsigned2 __builtin_vec_vunsigned2
192 #define vec_unsignede __builtin_vec_vunsignede
193 #define vec_unsignedo __builtin_vec_vunsignedo
194 #define vec_vsubfp __builtin_vec_vsubfp
195 #define vec_subc __builtin_vec_subc
196 #define vec_sube __builtin_vec_sube
197 #define vec_subec __builtin_vec_subec
198 #define vec_vsubsws __builtin_vec_vsubsws
199 #define vec_vsubshs __builtin_vec_vsubshs
200 #define vec_vsubsbs __builtin_vec_vsubsbs
201 #define vec_sum4s __builtin_vec_sum4s
202 #define vec_vsum4shs __builtin_vec_vsum4shs
203 #define vec_vsum4sbs __builtin_vec_vsum4sbs
204 #define vec_vsum4ubs __builtin_vec_vsum4ubs
205 #define vec_sum2s __builtin_vec_sum2s
206 #define vec_sums __builtin_vec_sums
207 #define vec_trunc __builtin_vec_trunc
208 #define vec_vupkhpx __builtin_vec_vupkhpx
209 #define vec_vupkhsh __builtin_vec_vupkhsh
210 #define vec_vupkhsb __builtin_vec_vupkhsb
211 #define vec_vupklpx __builtin_vec_vupklpx
212 #define vec_vupklsh __builtin_vec_vupklsh
213 #define vec_vupklsb __builtin_vec_vupklsb
214 #define vec_abs __builtin_vec_abs
215 #define vec_nabs __builtin_vec_nabs
216 #define vec_abss __builtin_vec_abss
217 #define vec_add __builtin_vec_add
218 #define vec_adds __builtin_vec_adds
219 #define vec_and __builtin_vec_and
220 #define vec_andc __builtin_vec_andc
221 #define vec_avg __builtin_vec_avg
222 #define vec_cmpeq __builtin_vec_cmpeq
223 #define vec_cmpne __builtin_vec_cmpne
224 #define vec_cmpgt __builtin_vec_cmpgt
225 #define vec_ctf __builtin_vec_ctf
226 #define vec_dst __builtin_vec_dst
227 #define vec_dstst __builtin_vec_dstst
228 #define vec_dststt __builtin_vec_dststt
229 #define vec_dstt __builtin_vec_dstt
230 #define vec_ld __builtin_vec_ld
231 #define vec_lde __builtin_vec_lde
232 #define vec_ldl __builtin_vec_ldl
233 #define vec_lvebx __builtin_vec_lvebx
234 #define vec_lvehx __builtin_vec_lvehx
235 #define vec_lvewx __builtin_vec_lvewx
236 #define vec_neg __builtin_vec_neg
237 #define vec_pmsum_be __builtin_vec_vpmsum
238 #define vec_shasigma_be __builtin_crypto_vshasigma
239 /* Cell only intrinsics.  These four aliases are defined only when
   __PPU__ is defined; otherwise this header leaves the names alone.  */
240 #ifdef __PPU__
241 #define vec_lvlx __builtin_vec_lvlx
242 #define vec_lvlxl __builtin_vec_lvlxl
243 #define vec_lvrx __builtin_vec_lvrx
244 #define vec_lvrxl __builtin_vec_lvrxl
245 #endif
/* Pass-through aliases, continued.  vec_mergee and vec_mergeo expand to
   the vmrgew and vmrgow builtins, and vec_sldw expands to a
   __builtin_vsx_ name although it sits outside the __VSX__ guard.  */
246 #define vec_lvsl __builtin_vec_lvsl
247 #define vec_lvsr __builtin_vec_lvsr
248 #define vec_max __builtin_vec_max
249 #define vec_mergee __builtin_vec_vmrgew
250 #define vec_mergeh __builtin_vec_mergeh
251 #define vec_mergel __builtin_vec_mergel
252 #define vec_mergeo __builtin_vec_vmrgow
253 #define vec_min __builtin_vec_min
254 #define vec_mladd __builtin_vec_mladd
255 #define vec_msum __builtin_vec_msum
256 #define vec_msums __builtin_vec_msums
257 #define vec_mul __builtin_vec_mul
258 #define vec_mule __builtin_vec_mule
259 #define vec_mulo __builtin_vec_mulo
260 #define vec_nor __builtin_vec_nor
261 #define vec_or __builtin_vec_or
262 #define vec_pack __builtin_vec_pack
263 #define vec_packs __builtin_vec_packs
264 #define vec_packsu __builtin_vec_packsu
265 #define vec_perm __builtin_vec_perm
266 #define vec_rl __builtin_vec_rl
267 #define vec_sel __builtin_vec_sel
268 #define vec_sl __builtin_vec_sl
269 #define vec_sld __builtin_vec_sld
270 #define vec_sldw __builtin_vsx_xxsldwi
271 #define vec_sll __builtin_vec_sll
272 #define vec_slo __builtin_vec_slo
273 #define vec_splat __builtin_vec_splat
274 #define vec_sr __builtin_vec_sr
275 #define vec_sra __builtin_vec_sra
276 #define vec_srl __builtin_vec_srl
277 #define vec_sro __builtin_vec_sro
278 #define vec_st __builtin_vec_st
279 #define vec_ste __builtin_vec_ste
280 #define vec_stl __builtin_vec_stl
281 #define vec_stvebx __builtin_vec_stvebx
282 #define vec_stvehx __builtin_vec_stvehx
283 #define vec_stvewx __builtin_vec_stvewx
284 /* Cell only intrinsics.  These four aliases are defined only when
   __PPU__ is defined; otherwise this header leaves the names alone.  */
285 #ifdef __PPU__
286 #define vec_stvlx __builtin_vec_stvlx
287 #define vec_stvlxl __builtin_vec_stvlxl
288 #define vec_stvrx __builtin_vec_stvrx
289 #define vec_stvrxl __builtin_vec_stvrxl
290 #endif
/* Remaining pass-through aliases.  Every macro from vec_vaddubm onward
   expands to the builtin carrying the same suffix.  */
291 #define vec_sub __builtin_vec_sub
292 #define vec_subs __builtin_vec_subs
293 #define vec_sum __builtin_vec_sum
294 #define vec_unpackh __builtin_vec_unpackh
295 #define vec_unpackl __builtin_vec_unpackl
296 #define vec_vaddubm __builtin_vec_vaddubm
297 #define vec_vaddubs __builtin_vec_vaddubs
298 #define vec_vadduhm __builtin_vec_vadduhm
299 #define vec_vadduhs __builtin_vec_vadduhs
300 #define vec_vadduwm __builtin_vec_vadduwm
301 #define vec_vadduws __builtin_vec_vadduws
302 #define vec_vcmpequb __builtin_vec_vcmpequb
303 #define vec_vcmpequh __builtin_vec_vcmpequh
304 #define vec_vcmpequw __builtin_vec_vcmpequw
305 #define vec_vmaxub __builtin_vec_vmaxub
306 #define vec_vmaxuh __builtin_vec_vmaxuh
307 #define vec_vmaxuw __builtin_vec_vmaxuw
308 #define vec_vminub __builtin_vec_vminub
309 #define vec_vminuh __builtin_vec_vminuh
310 #define vec_vminuw __builtin_vec_vminuw
311 #define vec_vmrghb __builtin_vec_vmrghb
312 #define vec_vmrghh __builtin_vec_vmrghh
313 #define vec_vmrghw __builtin_vec_vmrghw
314 #define vec_vmrglb __builtin_vec_vmrglb
315 #define vec_vmrglh __builtin_vec_vmrglh
316 #define vec_vmrglw __builtin_vec_vmrglw
317 #define vec_vpkuhum __builtin_vec_vpkuhum
318 #define vec_vpkuwum __builtin_vec_vpkuwum
319 #define vec_vrlb __builtin_vec_vrlb
320 #define vec_vrlh __builtin_vec_vrlh
321 #define vec_vrlw __builtin_vec_vrlw
322 #define vec_vslb __builtin_vec_vslb
323 #define vec_vslh __builtin_vec_vslh
324 #define vec_vslw __builtin_vec_vslw
325 #define vec_vspltb __builtin_vec_vspltb
326 #define vec_vsplth __builtin_vec_vsplth
327 #define vec_vspltw __builtin_vec_vspltw
328 #define vec_vsrab __builtin_vec_vsrab
329 #define vec_vsrah __builtin_vec_vsrah
330 #define vec_vsraw __builtin_vec_vsraw
331 #define vec_vsrb __builtin_vec_vsrb
332 #define vec_vsrh __builtin_vec_vsrh
333 #define vec_vsrw __builtin_vec_vsrw
334 #define vec_vsububs __builtin_vec_vsububs
335 #define vec_vsububm __builtin_vec_vsububm
336 #define vec_vsubuhm __builtin_vec_vsubuhm
337 #define vec_vsubuhs __builtin_vec_vsubuhs
338 #define vec_vsubuwm __builtin_vec_vsubuwm
339 #define vec_vsubuws __builtin_vec_vsubuws
340 #define vec_xor __builtin_vec_xor
341 
/* Aliases for the extract, insert, splats and promote builtins; like the
   table above, they are defined unconditionally and forward their
   arguments unchanged.  */
342 #define vec_extract __builtin_vec_extract
343 #define vec_insert __builtin_vec_insert
344 #define vec_splats __builtin_vec_splats
345 #define vec_promote __builtin_vec_promote
346 
347 #ifdef __VSX__
348 /* VSX additions: defined only when __VSX__ is defined.
   vec_mul repeats, with an identical expansion, the unconditional
   definition earlier in this header.  vec_xl and vec_xst are second
   names for the builtins behind vec_vsx_ld and vec_vsx_st.  */
349 #define vec_div __builtin_vec_div
350 #define vec_mul __builtin_vec_mul
351 #define vec_msub __builtin_vec_msub
352 #define vec_nmadd __builtin_vec_nmadd
353 #define vec_nearbyint __builtin_vec_nearbyint
354 #define vec_rint __builtin_vec_rint
355 #define vec_sqrt __builtin_vec_sqrt
356 #define vec_vsx_ld __builtin_vec_vsx_ld
357 #define vec_vsx_st __builtin_vec_vsx_st
358 #define vec_xl __builtin_vec_vsx_ld
359 #define vec_xl_be __builtin_vec_xl_be
360 #define vec_xst __builtin_vec_vsx_st
361 #define vec_xst_be __builtin_vec_xst_be
362 
363 /* Note, xxsldwi and xxpermdi were added as __builtin_vsx_<xxx> functions
364    instead of __builtin_vec_<xxx>  */
365 #define vec_xxsldwi __builtin_vsx_xxsldwi
366 #define vec_xxpermdi __builtin_vsx_xxpermdi
367 #endif
368 
369 #ifdef _ARCH_PWR8
370 /* Vector additions added in ISA 2.07.
   Defined only when _ARCH_PWR8 is defined.  Some builtins are reachable
   under two names: vec_cntlz and vec_vclz, vec_gb and vec_vgbbd, and
   vec_vmrgew/vec_vmrgow alongside the unconditional
   vec_mergee/vec_mergeo.  The vec_popcnt family expands to the builtins
   with a trailing "u" in the name (vpopcntu, vpopcntub, ...), which are
   distinct from the ones behind the vec_vpopcnt family.  */
371 #define vec_eqv __builtin_vec_eqv
372 #define vec_nand __builtin_vec_nand
373 #define vec_orc __builtin_vec_orc
374 #define vec_vaddcuq __builtin_vec_vaddcuq
375 #define vec_vaddudm __builtin_vec_vaddudm
376 #define vec_vadduqm __builtin_vec_vadduqm
377 #define vec_vbpermq __builtin_vec_vbpermq
378 #define vec_bperm __builtin_vec_vbperm_api
379 #define vec_vclz __builtin_vec_vclz
380 #define vec_cntlz __builtin_vec_vclz
381 #define vec_vclzb __builtin_vec_vclzb
382 #define vec_vclzd __builtin_vec_vclzd
383 #define vec_vclzh __builtin_vec_vclzh
384 #define vec_vclzw __builtin_vec_vclzw
385 #define vec_vaddecuq __builtin_vec_vaddecuq
386 #define vec_vaddeuqm __builtin_vec_vaddeuqm
387 #define vec_vsubecuq __builtin_vec_vsubecuq
388 #define vec_vsubeuqm __builtin_vec_vsubeuqm
389 #define vec_vgbbd __builtin_vec_vgbbd
390 #define vec_gb __builtin_vec_vgbbd
391 #define vec_vmaxsd __builtin_vec_vmaxsd
392 #define vec_vmaxud __builtin_vec_vmaxud
393 #define vec_vminsd __builtin_vec_vminsd
394 #define vec_vminud __builtin_vec_vminud
395 #define vec_vmrgew __builtin_vec_vmrgew
396 #define vec_vmrgow __builtin_vec_vmrgow
397 #define vec_vpksdss __builtin_vec_vpksdss
398 #define vec_vpksdus __builtin_vec_vpksdus
399 #define vec_vpkudum __builtin_vec_vpkudum
400 #define vec_vpkudus __builtin_vec_vpkudus
401 #define vec_vpopcnt __builtin_vec_vpopcnt
402 #define vec_vpopcntb __builtin_vec_vpopcntb
403 #define vec_vpopcntd __builtin_vec_vpopcntd
404 #define vec_vpopcnth __builtin_vec_vpopcnth
405 #define vec_vpopcntw __builtin_vec_vpopcntw
406 #define vec_popcnt __builtin_vec_vpopcntu
407 #define vec_popcntb __builtin_vec_vpopcntub
408 #define vec_popcnth __builtin_vec_vpopcntuh
409 #define vec_popcntw __builtin_vec_vpopcntuw
410 #define vec_popcntd __builtin_vec_vpopcntud
411 #define vec_vrld __builtin_vec_vrld
412 #define vec_vsld __builtin_vec_vsld
413 #define vec_vsrad __builtin_vec_vsrad
414 #define vec_vsrd __builtin_vec_vsrd
415 #define vec_vsubcuq __builtin_vec_vsubcuq
416 #define vec_vsubudm __builtin_vec_vsubudm
417 #define vec_vsubuqm __builtin_vec_vsubuqm
418 #define vec_vupkhsw __builtin_vec_vupkhsw
419 #define vec_vupklsw __builtin_vec_vupklsw
420 #define vec_revb __builtin_vec_revb
421 #define vec_sbox_be __builtin_crypto_vsbox_be
422 #define vec_cipher_be __builtin_crypto_vcipher_be
423 #define vec_cipherlast_be __builtin_crypto_vcipherlast_be
424 #define vec_ncipher_be __builtin_crypto_vncipher_be
425 #define vec_ncipherlast_be __builtin_crypto_vncipherlast_be
426 #endif
427 
428 #ifdef __POWER9_VECTOR__
429 /* Vector additions added in ISA 3.0.
   Defined only when __POWER9_VECTOR__ is defined.  vec_vprtybq and the
   vec_xl_len/vec_xst_len family additionally require _ARCH_PPC64.
   vec_cnttz is a second name for the vec_vctz builtin, and the
   vec_extract_fp32_from_short{h,l} names expand to the same builtins as
   vec_extract_fp_from_short{h,l}.  */
430 #define vec_first_match_index __builtin_vec_first_match_index
431 #define vec_first_match_or_eos_index __builtin_vec_first_match_or_eos_index
432 #define vec_first_mismatch_index __builtin_vec_first_mismatch_index
433 #define vec_first_mismatch_or_eos_index __builtin_vec_first_mismatch_or_eos_index
434 #define vec_pack_to_short_fp32 __builtin_vec_convert_4f32_8i16
435 #define vec_parity_lsbb __builtin_vec_vparity_lsbb
436 #define vec_vctz __builtin_vec_vctz
437 #define vec_cnttz __builtin_vec_vctz
438 #define vec_vctzb __builtin_vec_vctzb
439 #define vec_vctzd __builtin_vec_vctzd
440 #define vec_vctzh __builtin_vec_vctzh
441 #define vec_vctzw __builtin_vec_vctzw
442 #define vec_extract4b __builtin_vec_extract4b
443 #define vec_insert4b __builtin_vec_insert4b
444 #define vec_vprtyb __builtin_vec_vprtyb
445 #define vec_vprtybd __builtin_vec_vprtybd
446 #define vec_vprtybw __builtin_vec_vprtybw
447 
448 #ifdef _ARCH_PPC64
449 #define vec_vprtybq __builtin_vec_vprtybq
450 #endif
451 
452 #define vec_absd __builtin_vec_vadu
453 #define vec_absdb __builtin_vec_vadub
454 #define vec_absdh __builtin_vec_vaduh
455 #define vec_absdw __builtin_vec_vaduw
456 
457 #define vec_slv __builtin_vec_vslv
458 #define vec_srv __builtin_vec_vsrv
459 
460 #define vec_extract_exp __builtin_vec_extract_exp
461 #define vec_extract_sig __builtin_vec_extract_sig
462 #define vec_insert_exp __builtin_vec_insert_exp
463 #define vec_test_data_class __builtin_vec_test_data_class
464 
465 #define vec_extract_fp_from_shorth __builtin_vec_vextract_fp_from_shorth
466 #define vec_extract_fp_from_shortl __builtin_vec_vextract_fp_from_shortl
467 #define vec_extract_fp32_from_shorth __builtin_vec_vextract_fp_from_shorth
468 #define vec_extract_fp32_from_shortl __builtin_vec_vextract_fp_from_shortl
469 
470 #define scalar_extract_exp __builtin_vec_scalar_extract_exp
471 #define scalar_extract_sig __builtin_vec_scalar_extract_sig
472 #define scalar_insert_exp __builtin_vec_scalar_insert_exp
473 #define scalar_test_data_class __builtin_vec_scalar_test_data_class
474 #define scalar_test_neg __builtin_vec_scalar_test_neg
475 
476 #define scalar_cmp_exp_gt __builtin_vec_scalar_cmp_exp_gt
477 #define scalar_cmp_exp_lt __builtin_vec_scalar_cmp_exp_lt
478 #define scalar_cmp_exp_eq __builtin_vec_scalar_cmp_exp_eq
479 #define scalar_cmp_exp_unordered __builtin_vec_scalar_cmp_exp_unordered
480 
481 #ifdef _ARCH_PPC64
482 #define vec_xl_len __builtin_vec_lxvl
483 #define vec_xst_len __builtin_vec_stxvl
484 #define vec_xl_len_r __builtin_vec_xl_len_r
485 #define vec_xst_len_r __builtin_vec_xst_len_r
486 #endif
487 
488 #define vec_cmpnez __builtin_vec_vcmpnez
489 
490 #define vec_cntlz_lsbb __builtin_vec_vclzlsbb
491 #define vec_cnttz_lsbb __builtin_vec_vctzlsbb
492 
493 #define vec_xlx __builtin_vec_vextulx
494 #define vec_xrx __builtin_vec_vexturx
495 #endif
496 
497 /* Predicates.
498    For C++, we use templates in order to allow non-parenthesized arguments.
499    For C, instead, we use macros since non-parenthesized arguments were
500    not allowed even in older GCC implementations of AltiVec.
501 
502    In the future, we may add more magic to the back-end, so that no
503    one- or two-argument macros are used.  */
504 
/* Two alternative definitions of vec_cmplt, vec_cmple and the vec_all_xxx
   and vec_any_xxx predicates: function templates in the first branch,
   function-like macros in the #else branch.  Both branches pass a __CR6_
   code plus the operands to a predicate builtin; the "less than" and
   "less or equal" forms are obtained by swapping a1 and a2.
   NOTE(review): the guard tests __cplusplus__ (with trailing
   underscores), not __cplusplus.  If the compiler does not predefine
   __cplusplus__, the template branch is never compiled and the macro
   branch is used for C++ as well.  The two branches are not textually
   equivalent (for example, the template branch calls __builtin_altivec_
   builtins where the macro branch calls __builtin_vec_ ones), so confirm
   intent before changing the guard.  */
505 #ifdef __cplusplus__
506 #define __altivec_unary_pred(NAME, CALL) \
507 template <class T> int NAME (T a1) { return CALL; }
508 
509 #define __altivec_scalar_pred(NAME, CALL) \
510 template <class T, class U> int NAME (T a1, U a2) { return CALL; }
511 
512 /* Given the vec_step of a type, return the corresponding bool type.  */
513 template <int STEP> class __altivec_bool_ret { };
514 template <> class __altivec_bool_ret <4> {
515   typedef __vector __bool int __ret;
516 };
517 template <> class __altivec_bool_ret <8> {
518   typedef __vector __bool short __ret;
519 };
520 template <> class __altivec_bool_ret <16> {
521   typedef __vector __bool char __ret;
522 };
523 
524 /* Be very liberal in the pairs we accept.  Mistakes such as passing
525    a `vector char' and `vector short' will be caught by the middle-end,
526    while any attempt to detect them here would produce hard to understand
527    error messages involving the implementation details of AltiVec.  */
528 #define __altivec_binary_pred(NAME, CALL) \
529 template <class T, class U> \
530 typename __altivec_bool_ret <vec_step (T)>::__ret \
531 NAME (T a1, U a2) \
532 { \
533   return CALL; \
534 }
535 
536 __altivec_binary_pred(vec_cmplt,
537   __builtin_vec_cmpgt (a2, a1))
538 __altivec_binary_pred(vec_cmple,
539   __builtin_vec_cmpge (a2, a1))
540 
541 __altivec_scalar_pred(vec_all_in,
542   __builtin_altivec_vcmpbfp_p (__CR6_EQ, a1, a2))
543 __altivec_scalar_pred(vec_any_out,
544   __builtin_altivec_vcmpbfp_p (__CR6_EQ_REV, a1, a2))
545 
/* The NaN and numeric tests compare a1 with itself.  */
546 __altivec_unary_pred(vec_all_nan,
547   __builtin_altivec_vcmpeq_p (__CR6_EQ, a1, a1))
548 __altivec_unary_pred(vec_any_nan,
549   __builtin_altivec_vcmpeq_p (__CR6_LT_REV, a1, a1))
550 
551 __altivec_unary_pred(vec_all_numeric,
552   __builtin_altivec_vcmpeq_p (__CR6_LT, a1, a1))
553 __altivec_unary_pred(vec_any_numeric,
554   __builtin_altivec_vcmpeq_p (__CR6_EQ_REV, a1, a1))
555 
556 __altivec_scalar_pred(vec_all_eq,
557   __builtin_vec_vcmpeq_p (__CR6_LT, a1, a2))
558 
/* Without __POWER9_VECTOR__, vec_all_ne and vec_any_eq are built on
   vcmpeq_p; with it, they use dedicated builtins that take no __CR6_
   code, and vec_all_nez / vec_any_eqz become available.  */
559 #ifndef __POWER9_VECTOR__
560 __altivec_scalar_pred(vec_all_ne,
561   __builtin_vec_vcmpeq_p (__CR6_EQ, a1, a2))
562 __altivec_scalar_pred(vec_any_eq,
563   __builtin_vec_vcmpeq_p (__CR6_EQ_REV, a1, a2))
564 #else
565 __altivec_scalar_pred(vec_all_nez,
566   __builtin_vec_vcmpnez_p (__CR6_LT, a1, a2))
567 __altivec_scalar_pred(vec_any_eqz,
568   __builtin_vec_vcmpnez_p (__CR6_LT_REV, a1, a2))
569 __altivec_scalar_pred(vec_all_ne,
570   __builtin_vec_vcmpne_p (a1, a2))
571 __altivec_scalar_pred(vec_any_eq,
572   __builtin_vec_vcmpae_p (a1, a2))
573 #endif
574 
575 __altivec_scalar_pred(vec_any_ne,
576   __builtin_vec_vcmpeq_p (__CR6_LT_REV, a1, a2))
577 
578 __altivec_scalar_pred(vec_all_gt,
579   __builtin_vec_vcmpgt_p (__CR6_LT, a1, a2))
580 __altivec_scalar_pred(vec_all_lt,
581   __builtin_vec_vcmpgt_p (__CR6_LT, a2, a1))
582 __altivec_scalar_pred(vec_any_gt,
583   __builtin_vec_vcmpgt_p (__CR6_EQ_REV, a1, a2))
584 __altivec_scalar_pred(vec_any_lt,
585   __builtin_vec_vcmpgt_p (__CR6_EQ_REV, a2, a1))
586 
587 __altivec_scalar_pred(vec_all_ngt,
588   __builtin_altivec_vcmpgt_p (__CR6_EQ, a1, a2))
589 __altivec_scalar_pred(vec_all_nlt,
590   __builtin_altivec_vcmpgt_p (__CR6_EQ, a2, a1))
591 __altivec_scalar_pred(vec_any_ngt,
592   __builtin_altivec_vcmpgt_p (__CR6_LT_REV, a1, a2))
593 __altivec_scalar_pred(vec_any_nlt,
594   __builtin_altivec_vcmpgt_p (__CR6_LT_REV, a2, a1))
595 
596 /* __builtin_vec_vcmpge_p is vcmpgefp for floating-point vector types,
597    while for integer types it is converted to __builtin_vec_vcmpgt_p,
598    with inverted args and condition code.  */
599 __altivec_scalar_pred(vec_all_le,
600   __builtin_vec_vcmpge_p (__CR6_LT, a2, a1))
601 __altivec_scalar_pred(vec_all_ge,
602   __builtin_vec_vcmpge_p (__CR6_LT, a1, a2))
603 __altivec_scalar_pred(vec_any_le,
604   __builtin_vec_vcmpge_p (__CR6_EQ_REV, a2, a1))
605 __altivec_scalar_pred(vec_any_ge,
606   __builtin_vec_vcmpge_p (__CR6_EQ_REV, a1, a2))
607 
608 __altivec_scalar_pred(vec_all_nge,
609   __builtin_altivec_vcmpge_p (__CR6_EQ, a1, a2))
610 __altivec_scalar_pred(vec_all_nle,
611   __builtin_altivec_vcmpge_p (__CR6_EQ, a2, a1))
612 __altivec_scalar_pred(vec_any_nge,
613   __builtin_altivec_vcmpge_p (__CR6_LT_REV, a1, a2))
614 __altivec_scalar_pred(vec_any_nle,
615   __builtin_altivec_vcmpge_p (__CR6_LT_REV, a2, a1))
616 
/* The generator macros are private to this section.  */
617 #undef __altivec_scalar_pred
618 #undef __altivec_unary_pred
619 #undef __altivec_binary_pred
620 #else
/* Macro forms: every argument is parenthesized before being handed to
   the builtin.  */
621 #define vec_cmplt(a1, a2) __builtin_vec_cmpgt ((a2), (a1))
622 #define vec_cmple(a1, a2) __builtin_vec_cmpge ((a2), (a1))
623 
624 #define vec_all_in(a1, a2) __builtin_altivec_vcmpbfp_p (__CR6_EQ, (a1), (a2))
625 #define vec_any_out(a1, a2) __builtin_altivec_vcmpbfp_p (__CR6_EQ_REV, (a1), (a2))
626 
/* The NaN and numeric tests compare a1 with itself, so the argument
   expression appears twice in the expansion.  */
627 #define vec_all_nan(a1) __builtin_vec_vcmpeq_p (__CR6_EQ, (a1), (a1))
628 #define vec_any_nan(a1) __builtin_vec_vcmpeq_p (__CR6_LT_REV, (a1), (a1))
629 
630 #define vec_all_numeric(a1) __builtin_vec_vcmpeq_p (__CR6_LT, (a1), (a1))
631 #define vec_any_numeric(a1) __builtin_vec_vcmpeq_p (__CR6_EQ_REV, (a1), (a1))
632 
633 #define vec_all_eq(a1, a2) __builtin_vec_vcmpeq_p (__CR6_LT, (a1), (a2))
634 
635 #ifdef __POWER9_VECTOR__
636 #define vec_all_nez(a1, a2) __builtin_vec_vcmpnez_p (__CR6_LT, (a1), (a2))
637 #define vec_any_eqz(a1, a2) __builtin_vec_vcmpnez_p (__CR6_LT_REV, (a1), (a2))
638 #define vec_all_ne(a1, a2) __builtin_vec_vcmpne_p ((a1), (a2))
639 #define vec_any_eq(a1, a2) __builtin_vec_vcmpae_p ((a1), (a2))
640 #else
641 #define vec_all_ne(a1, a2) __builtin_vec_vcmpeq_p (__CR6_EQ, (a1), (a2))
642 #define vec_any_eq(a1, a2) __builtin_vec_vcmpeq_p (__CR6_EQ_REV, (a1), (a2))
643 #endif
644 
645 #define vec_any_ne(a1, a2) __builtin_vec_vcmpeq_p (__CR6_LT_REV, (a1), (a2))
646 
647 #define vec_all_gt(a1, a2) __builtin_vec_vcmpgt_p (__CR6_LT, (a1), (a2))
648 #define vec_all_lt(a1, a2) __builtin_vec_vcmpgt_p (__CR6_LT, (a2), (a1))
649 #define vec_any_gt(a1, a2) __builtin_vec_vcmpgt_p (__CR6_EQ_REV, (a1), (a2))
650 #define vec_any_lt(a1, a2) __builtin_vec_vcmpgt_p (__CR6_EQ_REV, (a2), (a1))
651 
652 #define vec_all_ngt(a1, a2) __builtin_vec_vcmpgt_p (__CR6_EQ, (a1), (a2))
653 #define vec_all_nlt(a1, a2) __builtin_vec_vcmpgt_p (__CR6_EQ, (a2), (a1))
654 #define vec_any_ngt(a1, a2) __builtin_vec_vcmpgt_p (__CR6_LT_REV, (a1), (a2))
655 #define vec_any_nlt(a1, a2) __builtin_vec_vcmpgt_p (__CR6_LT_REV, (a2), (a1))
656 
657 /* __builtin_vec_vcmpge_p is vcmpgefp for floating-point vector types,
658    while for integer types it is converted to __builtin_vec_vcmpgt_p,
659    with inverted args and condition code.  */
660 #define vec_all_le(a1, a2) __builtin_vec_vcmpge_p (__CR6_LT, (a2), (a1))
661 #define vec_all_ge(a1, a2) __builtin_vec_vcmpge_p (__CR6_LT, (a1), (a2))
662 #define vec_any_le(a1, a2) __builtin_vec_vcmpge_p (__CR6_EQ_REV, (a2), (a1))
663 #define vec_any_ge(a1, a2) __builtin_vec_vcmpge_p (__CR6_EQ_REV, (a1), (a2))
664 
665 #define vec_all_nge(a1, a2) __builtin_vec_vcmpge_p (__CR6_EQ, (a1), (a2))
666 #define vec_all_nle(a1, a2) __builtin_vec_vcmpge_p (__CR6_EQ, (a2), (a1))
667 #define vec_any_nge(a1, a2) __builtin_vec_vcmpge_p (__CR6_LT_REV, (a1), (a2))
668 #define vec_any_nle(a1, a2) __builtin_vec_vcmpge_p (__CR6_LT_REV, (a2), (a1))
669 #endif
670 
671 /* These do not accept vectors, so they do not have a __builtin_vec_*
672    counterpart.
   They are function-like macros over __builtin_altivec_ builtins.
   vec_mfvscr casts the builtin's result to __vector unsigned short, and
   the vec_splat_u8/u16/u32 forms reuse the signed splat macros and cast
   the result to the unsigned vector type of the same element width.  */
673 #define vec_dss(x) __builtin_altivec_dss((x))
674 #define vec_dssall() __builtin_altivec_dssall ()
675 #define vec_mfvscr() ((__vector unsigned short) __builtin_altivec_mfvscr ())
676 #define vec_splat_s8(x) __builtin_altivec_vspltisb ((x))
677 #define vec_splat_s16(x) __builtin_altivec_vspltish ((x))
678 #define vec_splat_s32(x) __builtin_altivec_vspltisw ((x))
679 #define vec_splat_u8(x) ((__vector unsigned char) vec_splat_s8 ((x)))
680 #define vec_splat_u16(x) ((__vector unsigned short) vec_splat_s16 ((x)))
681 #define vec_splat_u32(x) ((__vector unsigned int) vec_splat_s32 ((x)))
682 
683 /* This also accepts a type for its parameter, so it is not enough
684    to #define vec_step to __builtin_vec_step.
   The argument is only ever used inside __typeof__; the expansion then
   forms an operand of that type by dereferencing a null pointer cast to
   "pointer to that type" and hands it to the builtin.
   NOTE(review): presumably the builtin inspects only the operand's type
   and never evaluates the dereference -- confirm against the builtin's
   definition.  */
685 #define vec_step(x) __builtin_vec_step (* (__typeof__ (x) *) 0)
686 
687 #endif /* _ALTIVEC_H */
688