/* { dg-do compile { target { powerpc*-*-* } } } */
/* { dg-options "-mdejagnu-cpu=power8 -O0 -mno-fold-gimple -dp" } */
/* { dg-prune-output "gimple folding of rs6000 builtins has been disabled." } */
4 
#include <altivec.h>
6 
7 vector double y = { 2.0, 4.0 };
8 vector double z;
9 
main()10 int main ()
11 {
12   vector float fa = {1.0, 2.0, 3.0, -4.0};
13   vector float fb = {-2.0, -3.0, -4.0, -5.0};
14   vector float fd = vec_and (fa, fb);
15   vector float fc = vec_cpsgn (fa, fb);
16   vector float fe = vec_mergeh (fa, fb);
17   vector float ff = vec_mergel (fa, fb);
18 
19   vector double da = {1.0, 2.0};
20   vector double db = {-2.0, -3.0};
21   vector double dz = vec_and (da, db);
22 
23   vector signed int si_a = {1, 2, 3, 4};
24   vector unsigned int ui_a = {1, 2, 3, 4};
25 
26   vector long long la = {5L, 14L};
27   vector long long lb = {3L, 86L};
28   vector long long lc = vec_and (la, lb);
29   vector bool long long ld = {0, -1};
30   vector long long le = vec_and (la, ld);
31   vector long long lf = vec_and (ld, lb);
32 
33   vector unsigned long long ua = {5L, 14L};
34   vector unsigned long long ub = {3L, 86L};
35   vector unsigned long long uc = vec_and (ua, ub);
36   vector bool long long ud = {0, -1};
37   vector unsigned long long ue = vec_and (ua, ud);
38   vector unsigned long long uf = vec_and (ud, ub);
39 
40   vector long long lg = vec_andc (la, lb);
41   vector long long lh = vec_andc (la, ld);
42   vector long long li = vec_andc (ld, lb);
43 
44   vector unsigned long long ug = vec_andc (ua, ub);
45   vector unsigned long long uh = vec_andc (ua, ud);
46   vector unsigned long long ui = vec_andc (ud, ub);
47 
48   vector double de = {1.0, -4.0};
49   vector double df = {-2.0, 5.0};
50   vector double dg = vec_cpsgn (de, df);
51   vector double dzw = vec_mergeh (de, df);
52   vector double dze = vec_mergel (de, df);
53 
54   vector long long lj = vec_mergeh (la, lb);
55   vector long long lk = vec_mergeh (la, ld);
56   vector long long ll = vec_mergeh (ld, la);
57 
58   vector unsigned long long uj = vec_mergeh (ua, ub);
59   vector unsigned long long uk = vec_mergeh (ua, ud);
60   vector unsigned long long ul = vec_mergeh (ud, ua);
61 
62   vector pixel pa = {9, 16, 25, 36, 1, 2, 3, 4};
63   vector pixel pb = {25, 36, 1, 2, 45, 3, 4, 99};
64   vector pixel pc = vec_mergeh (pa, pb);
65   vector pixel pd = vec_mergel (pa, pb);
66 
67   vector long long lm = vec_mergel (la, lb);
68   vector long long ln = vec_mergel (la, ld);
69   vector long long lo = vec_mergel (ld, la);
70 
71   vector unsigned long long um = vec_mergel (ua, ub);
72   vector unsigned long long un = vec_mergel (ua, ud);
73   vector unsigned long long uo = vec_mergel (ud, ua);
74 
75   vector long long lp = vec_nor (la, lb);
76   vector long long lq = vec_nor (la, ld);
77   vector long long lr = vec_nor (ld, la);
78 
79   vector unsigned long long up = vec_nor (ua, ub);
80   vector unsigned long long uq = vec_nor (ua, ud);
81   vector unsigned long long ur = vec_nor (ud, ua);
82 
83   vector unsigned char ca = {0,4,8,1,5,9,2,6,10,3,7,11,15,12,14,13};
84   vector unsigned char cbb = {5,4,8,3,1,9,2,6,10,3,7,11,15,12,14,13};
85 
86   vector unsigned char ucba = {5,4,8,3,1,9,2,6,10,3,7,11,15,12,14,13};
87   vector unsigned char ucbb = {5,4,8,3,1,9,2,6,10,3,7,11,15,12,14,13};
88   vector unsigned char ucbc = {5,4,8,3,1,9,2,6,10,3,7,11,15,12,14,13};
89 
90   vector long long lv = vec_perm (la, lb, ca);
91 
92   vector unsigned char  ucm = vec_and (ca, cbb);
93   vector unsigned char  ucn = vec_andc (ca, cbb);
94   vector unsigned char  uco = vec_mergel (ca, cbb);
95 
96   vector unsigned long long uv = vec_perm (ua, ub, ca);
97 
98   vector long long lx = vec_sel (la, lb, uc);
99   vector long long ly = vec_sel (la, lb, ld);
100 
101   vector unsigned long long uw = vec_sel (ua, ub, lc);
102   vector unsigned long long ux = vec_sel (ua, ub, uc);
103   vector unsigned long long uy = vec_sel (ua, ub, ld);
104 
105   vector long long lz = vec_xor (la, lb);
106   vector long long l0 = vec_xor (la, ld);
107   vector long long l1 = vec_xor (ld, la);
108 
109   vector unsigned long long uz = vec_xor (ua, ub);
110   vector unsigned long long u0 = vec_xor (ua, ud);
111   vector unsigned long long u1 = vec_xor (ud, ua);
112 
113   int ia = vec_all_eq (ua, ub);
114   int ib = vec_all_ge (ua, ub);
115   int ic = vec_all_gt (ua, ub);
116   int id = vec_all_le (ua, ub);
117   int ie = vec_all_lt (ua, ub);
118   int ig = vec_all_ne (ua, ub);
119 
120   int ih = vec_any_eq (ua, ub);
121   int ii = vec_any_ge (ua, ub);
122   int ij = vec_any_gt (ua, ub);
123   int ik = vec_any_le (ua, ub);
124   int il = vec_any_lt (ua, ub);
125   int im = vec_any_ne (ua, ub);
126 
127   vector short ssa = {9, 16, 25, 36, 1, 2, 3, 4};
128   vector short ssb = {-8, -27, -64, -125, 2, 3, 5, 3};
129   vector short sscc = vec_and (ssa, ssb);
130   vector short sscd = vec_mergeh (ssa, ssb);
131   vector short ssce = vec_mergel (ssa, ssb);
132 
133   vector int sia = {9, 16, 25, 36};
134   vector int sib = {-8, -27, -64, -125};
135   vector int sicc = vec_and (sia, sib);
136   vector int sicd = vec_andc (sia, sib);
137   vector int sig = vec_mergel (sia, sib);
138 
139   vector unsigned int uia = {9, 16, 25, 36};
140   vector unsigned int uib = {8, 27, 64, 125};
141   vector unsigned int uicc = vec_and (uia, uib);
142   vector unsigned int uidd = vec_andc (uia, uib);
143   vector unsigned int uig = vec_mergel (uia, uib);
144 
145   vector bool char bca = {0, 1, 4, 7};
146   vector bool char bcb = {-8, 9, 2, 9};
147   vector bool char bcc = vec_and (bca, bcb);
148   vector bool char bcd = vec_andc (bca, bcb);
149   vector bool char bce = vec_mergel (bca, bcb);
150 
151   vector bool short bsa = {0, -1, -1, 0, 3, 4, 6, 7};
152   vector bool short bsb = {-1, -1, 0, -1, 0, 0, 0, 0};
153   vector bool short bscc = vec_and (bsa, bsb);
154   vector bool short bscd = vec_andc (bsa, bsb);
155   vector bool short bsce = vec_mergel (bsa, bsb);
156 
157   vector bool int bia = {0, -1, -1, 0};
158   vector bool int bib = {-1, -1, 0, -1};
159   vector bool int bicc = vec_and (bia, bib);
160   vector bool int bicd = vec_andc (bia, bib);
161   vector bool int bide = vec_mergel (bia, bib);
162 
163   vector unsigned int uie = vec_packsu (ua, ub);
164 
165   vector long long l2 = vec_cntlz (la);
166   vector unsigned long long u2 = vec_cntlz (ua);
167   vector int sie = vec_cntlz (sia);
168   vector unsigned int uif = vec_cntlz (uia);
169   vector short sszz = vec_cntlz (ssa);
170 
171   vector unsigned short usa = {81, 72, 63, 54, 45, 36, 27, 18};
172   vector unsigned short usb = {81, 72, 63, 54, 45, 36, 27, 18};
173   vector unsigned short usd = vec_and (usa, usb);
174   vector unsigned short use = vec_andc (usa, usb);
175   vector unsigned short usc = vec_cntlz (usa);
176   vector unsigned short uscd = vec_mergeh (usa, usb);
177   vector unsigned short usce = vec_mergel (usa, usb);
178 
179   vector signed char sca = {-4, 3, -9, 15, -31, 31, 0, 0,
180 		            1, 117, -36, 99, 98, 97, 96, 95};
181   vector signed char scb = vec_cntlz (sca);
182   vector signed char scc = vec_mergel (sca, scb);
183 
184   vector unsigned char uca = {4, 3, 9, 15, 30, 31, 0, 0,
185 			      1, 117, 36, 99, 98, 97, 96, 95};
186   vector unsigned char cb = vec_cntlz (ca);
187 
188   vector double dd = vec_xl (0, &y);
189   vec_xst (dd, 0, &z);
190 
191   vector double dzz = vec_round (dd);
192   vector double dzz1 = vec_rsqrt (dd);
193   vector double dzz2 = vec_rsqrte (dd);
194 
195   vector float ff1 = vec_round (fa);
196   vector float ff2 = vec_rsqrt (fa);
197   vector float ff3 = vec_rsqrte (fa);
198 
199   vector double dff = vec_splat (de, 0);
200   vector double dgg = vec_splat (de, 1);
201   vector long long l3 = vec_splat (l2, 0);
202   vector long long l4 = vec_splat (l2, 1);
203   vector unsigned long long u3 = vec_splat (u2, 0);
204   vector unsigned long long u4 = vec_splat (u2, 1);
205   vector bool long long l5 = vec_splat (ld, 0);
206   vector bool long long l6 = vec_splat (ld, 1);
207   vector bool long long l10 = vec_mergee (ld, ld);
208   vector bool long long l11 = vec_mergeo (ld, ld);
209   vector bool long long l15 = vec_and (ld, ld);
210 
211   vector long long l7 = vec_div (l3, l4);
212   vector unsigned long long u5 = vec_div (u3, u4);
213   vector long long l12 = vec_mergee (la, lb);
214   vector long long l13 = vec_mergeo (la, lb);
215   vector unsigned long long u8 = vec_mergee (u3, u4);
216   vector unsigned long long u9 = vec_mergeo (u3, u4);
217 
218   vector long long l8 = vec_mul (l3, l4);
219   vector unsigned long long u6 = vec_mul (u3, u4);
220 
221   vector int sz = vec_cts (fa, 0x1F);
222   vector unsigned int usz = vec_ctu (fa, 0x1F);
223 
224   vector float f1 = vec_mergee (fa, fb);
225   vector float f2 = vec_mergeo (fa, fb);
226 
227   vector double d1 = vec_mergee (da, db);
228   vector double d2 = vec_mergeo (da, db);
229 
230   vector float f3 = vec_ctf (si_a, 1);
231   vector float f4 = vec_ctf (ui_a, 2);
232 
233   vector bool char z_vbc2 = vec_splat (bca, 0);
234   vector signed char z_vsc1 = vec_splat (sca, 1);
235   vector unsigned char z_vuc1 = vec_splat (ucbc, 2);
236 
237   vector bool int z_vbi1 = vec_splat (bia, 3);
238   vector signed int z_vsi1 = vec_splat (sia, 1);
239   vector unsigned int z_vui1 = vec_splat (uia, 2);
240 
241   vector bool int z_bi2 = vec_mergee (bia, bib);
242   vector signed int z_si2 = vec_mergee (sia, sib);
243   vector unsigned int z_ui2 = vec_mergee (uia, uib);
244 
245   vector bool char z_bc2 = vec_mergeh (bca, bcb);
246   vector signed char z_sc2 = vec_mergeh (sca, scb);
247   vector bool int z_bi3 = vec_mergeh (bia, bib);
248   vector signed int z_si3 = vec_mergeh (sia, sib);
249   vector unsigned int z_ui3 = vec_mergeh (uia, uib);
250   vector bool short z_bs1 = vec_mergeh (bsa, bsb);
251 
252   vector bool int z_bi4 = vec_mergeo (bia, bib);
253   vector signed int z_si4 = vec_mergeo (sia, sib);
254   vector unsigned int z_ui4 = vec_mergeo (uia, uib);
255 
256   vector pixel int z_vp1 = vec_splat (pa, 1);
257   vector bool short z_bs2 = vec_splat (bsa, 0);
258   vector short signed int z_vss1 = vec_splat (ssa, 2);
259   vector unsigned short int z_vuss1 = vec_splat (usa, 1);
260 
261   return 0;
262 }
263 
/* Expected results:
   vec_all_eq          vcmpequd.
   vec_all_ge          vcmpgtud.
   vec_all_ne          vcmpequd.
   vec_any_eq          vcmpequd.
   vec_any_ne          vcmpequd.
   vec_all_gt          vcmpgtud.
   vec_all_le          vcmpgtud.
   vec_all_lt          vcmpgtud.
   vec_any_ge          vcmpgtud.
   vec_any_gt          vcmpgtud.
   vec_any_lt          vcmpgtud.
   vec_any_le          vcmpgtud.
   vec_and             xxland
   vec_andc            xxlandc
   vec_cntlz           vclzd, vclzb, vclzw, vclzh
   vec_cpsgn           xvcpsgnsp
   vec_ctf             xvmuldp
   vec_cts             vctsxs
   vec_ctu             vctuxs
   vec_div             divd, divdu | __divdi3(), __udivdi3()
   vec_mergel          vmrghb, vmrghh, xxmrghw
   vec_mergeh          xxmrglw, vmrglh, vmrglb
   vec_mul             mulld | mullw, mulhwu
   vec_nor             xxlnor
   vec_packsu          vpkudus
   vec_perm            vperm
   vec_round           xvrdpi
   vec_sel             xxsel
   vec_xor             xxlxor
   vec_rsqrt           xvrsqrtesp
   vec_rsqrte          xvrsqrtesp
   vec_xl              lxvd2x
   vec_xst             stxvd2x
   vec_splat           xxspltb, xxspltw, vsplth
   vec_mergee          xxmrgld, vmrgow
   vec_mergeo          xxmrghd, vmrgew  */
301 
/* { dg-final { scan-assembler-times "vcmpequd" 8 } } */
/* { dg-final { scan-assembler-times "vcmpgtud" 16 } } */
/* { dg-final { scan-assembler-times "xxland" 30 } } */
/* { dg-final { scan-assembler-times "xxlandc" 13 } } */
/* { dg-final { scan-assembler-times "vclzb" 2 } } */
/* { dg-final { scan-assembler-times "vclzd" 2 } } */
/* { dg-final { scan-assembler-times "vclzw" 2 } } */
/* { dg-final { scan-assembler-times "vclzh" 2 } } */
/* { dg-final { scan-assembler-times "xvcpsgnsp" 1 } } */
/* { dg-final { scan-assembler-times "xvcpsgndp" 1 } } */
/* { dg-final { scan-assembler-times "xvmuldp" 2 } } */
/* { dg-final { scan-assembler-times "xvcvdpsxds" 0 } } */
/* { dg-final { scan-assembler-times "vctsxs" 2 } } */
/* { dg-final { scan-assembler-times "xvcvdpuxds" 0 } } */
/* { dg-final { scan-assembler-times "vctuxs" 2 } } */
317 
/* { dg-final { scan-assembler-times "vmrghb" 4 { target be } } } */
/* { dg-final { scan-assembler-times "vmrghb" 5 { target le } } } */
/* { dg-final { scan-assembler-times "vmrghh" 8 } } */
/* { dg-final { scan-assembler-times "xxmrghw" 8 } } */
/* { dg-final { scan-assembler-times "xxmrglw" 8 } } */
/* { dg-final { scan-assembler-times "vmrglh" 8 } } */
/* { dg-final { scan-assembler-times "xxlnor" 6 } } */
/* { dg-final { scan-assembler-times {\mvpkudus\M} 1 } } */
/* { dg-final { scan-assembler-times "vperm" 4 } } */
/* { dg-final { scan-assembler-times "xvrdpi" 2 } } */
/* { dg-final { scan-assembler-times "xxsel" 10 } } */
/* { dg-final { scan-assembler-times "xxlxor" 6 } } */
/* { dg-final { scan-assembler-times "divd" 8  { target lp64 } } } */
/* { dg-final { scan-assembler-times "divdu" 2  { target lp64 } } } */
/* { dg-final { scan-assembler-times "mulld" 4  { target lp64 } } } */
/* check for .__divdi3 (AIX), __divdi3 (Linux) and ___divdi3 (Darwin) */
/* { dg-final { scan-assembler-times {\mbl \.?_?__divdi3\M} 2   { target { ilp32 } } } } */
/* check for .__udivdi3 (AIX), __udivdi3 (Linux) and ___udivdi3 (Darwin) */
/* { dg-final { scan-assembler-times {\mbl \.?_?__udivdi3\M} 2  { target { ilp32 } } } } */
/* { dg-final { scan-assembler-times "mullw" 12  { target ilp32 } } } */
/* { dg-final { scan-assembler-times "mulhwu" 4  { target ilp32 } } } */
/* { dg-final { scan-assembler-times "xxmrgld" 0 } } */
/* { dg-final { scan-assembler-times "xxmrghd" 0 } } */
/* { dg-final { scan-assembler-times "xvrsqrtesp" 2 } } */
/* { dg-final { scan-assembler-times "xvrsqrtedp" 2 } } */
/* { dg-final { scan-assembler-times "xxspltd" 8 } } */
/* { dg-final { scan-assembler-times "vcfsx" 2 } } */
/* { dg-final { scan-assembler-times "vcfux" 2 } } */
/* { dg-final { scan-assembler-times "vspltb" 6 } } */
/* { dg-final { scan-assembler-times "vspltw" 0 } } */
/* { dg-final { scan-assembler-times "vmrgow" 8 } } */
/* { dg-final { scan-assembler-times "vmrglb" 5 { target le } } } */
/* { dg-final { scan-assembler-times "vmrglb" 6 { target be } } } */
/* { dg-final { scan-assembler-times "vmrgew" 8 } } */
/* { dg-final { scan-assembler-times "vsplth" 8 } } */
/* { dg-final { scan-assembler-times "vcmpequd." 8 } } */
/* { dg-final { scan-assembler-times "vcmpgtud." 16 } } */
/* { dg-final { scan-assembler-times "vrfin" 2 } } */
356 
357