1 /* { dg-do run { target aarch64_sve_hw } } */
2 /* { dg-options "-O" } */
3 /* { dg-options "-O -msve-vector-bits=256" { target aarch64_sve256_hw } } */
4 
5 #include "vec_perm_1.c"
6 
/* Run one permutation check.

   TYPE            - vector type of the data operands and of the result;
		     also selects the function under test, vec_perm_<TYPE>.
   MASK_TYPE       - vector type of the selector operand.
   EXPECTED_RESULT - initializer for the value the permute must produce.
   VALUES1,
   VALUES2         - initializers for the two data operands.
   MASK            - initializer for the selector operand.

   The result is compared with __builtin_memcmp over sizeof (TYPE), so
   floating-point vectors are checked bit-for-bit rather than with ==.
   Any mismatch calls __builtin_abort.

   The body is wrapped in do { ... } while (0) so that an invocation
   followed by ';' forms exactly one statement and can be used safely as
   the unbraced body of an if/else.  */
#define TEST_VEC_PERM(TYPE, MASK_TYPE, EXPECTED_RESULT,			\
		      VALUES1, VALUES2, MASK)				\
  do									\
    {									\
      TYPE expected_result = EXPECTED_RESULT;				\
      TYPE values1 = VALUES1;						\
      TYPE values2 = VALUES2;						\
      MASK_TYPE mask = MASK;						\
      TYPE dest;							\
      dest = vec_perm_##TYPE (values1, values2, mask);			\
      if (__builtin_memcmp (&dest, &expected_result,			\
			    sizeof (TYPE)) != 0)			\
	__builtin_abort ();						\
    }									\
  while (0)
19 
main(void)20 int main (void)
21 {
22   TEST_VEC_PERM (vnx2di, vnx2di,
23 		 ((vnx2di) { 5, 36, 7, 48 }),
24 		 ((vnx2di) { 4, 5, 6, 7 }),
25 		 ((vnx2di) { 12, 24, 36, 48 }),
26 		 ((vnx2di) { 1 + (8 * 1), 6 + (8 * 3),
27 			     3 + (8 * 1), 7 + (8 * 5) }));
28   TEST_VEC_PERM (vnx4si, vnx4si,
29 		 ((vnx4si) { 34, 38, 40, 10, 9, 8, 7, 35 }),
30 		 ((vnx4si) { 3, 4, 5, 6, 7, 8, 9, 10 }),
31 		 ((vnx4si) { 33, 34, 35, 36, 37, 38, 39, 40 }),
32 		 ((vnx4si) { 9 + (16 * 2), 13 + (16 * 5),
33 			     15 + (16 * 1), 7 + (16 * 0),
34 			     6 + (16 * 8), 5 + (16 * 2),
35 			     4 + (16 * 3), 10 + (16 * 2) }));
36   TEST_VEC_PERM (vnx8hi, vnx8hi,
37 		 ((vnx8hi) { 12, 16, 18, 10, 42, 43, 44, 34,
38 			     7, 48, 3, 35, 9, 8, 7, 13 }),
39 		 ((vnx8hi) { 3, 4, 5, 6, 7, 8, 9, 10,
40 			     11, 12, 13, 14, 15, 16, 17, 18 }),
41 		 ((vnx8hi) { 33, 34, 35, 36, 37, 38, 39, 40,
42 			     41, 42, 43, 44, 45, 46, 47, 48 }),
43 		 ((vnx8hi) { 9 + (32 * 2), 13 + (32 * 2),
44 			     15 + (32 * 8), 7 + (32 * 9),
45 			     25 + (32 * 4), 26 + (32 * 3),
46 			     27 + (32 * 1), 17 + (32 * 2),
47 			     4 + (32 * 6), 31 + (32 * 7),
48 			     0 + (32 * 8), 18 + (32 * 9),
49 			     6 + (32 * 6), 5 + (32 * 7),
50 			     4 + (32 * 2), 10 + (32 * 2) }));
51   TEST_VEC_PERM (vnx16qi, vnx16qi,
52 		 ((vnx16qi) { 5, 6, 7, 4, 5, 6, 4, 5,
53 			      6, 7, 12, 24, 36, 48, 12, 24,
54 			      5, 6, 7, 4, 5, 6, 4, 5,
55 			      6, 7, 12, 24, 36, 48, 12, 24 }),
56 		 ((vnx16qi) { 4, 5, 6, 7, 4, 5, 6, 7,
57 			      4, 5, 6, 7, 4, 5, 6, 7,
58 			      4, 5, 6, 7, 4, 5, 6, 7,
59 			      4, 5, 6, 7, 4, 5, 6, 7 }),
60 		 ((vnx16qi) { 12, 24, 36, 48, 12, 24, 36, 48,
61 			      12, 24, 36, 48, 12, 24, 36, 48,
62 			      12, 24, 36, 48, 12, 24, 36, 48,
63 			      12, 24, 36, 48, 12, 24, 36, 48 }),
64 		 ((vnx16qi) { 5 + (64 * 3), 6 + (64 * 1),
65 			      7 + (64 * 2), 8 + (64 * 1),
66 			      9 + (64 * 3), 10 + (64 * 1),
67 			      28 + (64 * 3), 29 + (64 * 3),
68 			      30 + (64 * 1), 31 + (64 * 1),
69 			      32 + (64 * 3), 33 + (64 * 2),
70 			      54 + (64 * 2), 55 + (64 * 2),
71 			      56 + (64 * 1), 61 + (64 * 2),
72 			      5 + (64 * 2), 6 + (64 * 1),
73 			      7 + (64 * 2), 8 + (64 * 2),
74 			      9 + (64 * 2), 10 + (64 * 1),
75 			      28 + (64 * 3), 29 + (64 * 1),
76 			      30 + (64 * 3), 31 + (64 * 3),
77 			      32 + (64 * 1), 33 + (64 * 1),
78 			      54 + (64 * 2), 55 + (64 * 2),
79 			      56 + (64 * 2), 61 + (64 * 2) }));
80   TEST_VEC_PERM (vnx2df, vnx2di,
81 		 ((vnx2df) { 5.1, 36.1, 7.1, 48.1 }),
82 		 ((vnx2df) { 4.1, 5.1, 6.1, 7.1 }),
83 		 ((vnx2df) { 12.1, 24.1, 36.1, 48.1 }),
84 		 ((vnx2di) { 1 + (8 * 3), 6 + (8 * 10),
85 			     3 + (8 * 8), 7 + (8 * 2) }));
86   TEST_VEC_PERM (vnx4sf, vnx4si,
87 		 ((vnx4sf) { 34.2, 38.2, 40.2, 10.2, 9.2, 8.2, 7.2, 35.2 }),
88 		 ((vnx4sf) { 3.2, 4.2, 5.2, 6.2, 7.2, 8.2, 9.2, 10.2 }),
89 		 ((vnx4sf) { 33.2, 34.2, 35.2, 36.2,
90 			     37.2, 38.2, 39.2, 40.2 }),
91 		 ((vnx4si) { 9 + (16 * 1), 13 + (16 * 5),
92 			     15 + (16 * 4), 7 + (16 * 4),
93 			     6 + (16 * 3), 5 + (16 * 2),
94 			     4 + (16 * 1), 10 + (16 * 0) }));
95   TEST_VEC_PERM (vnx8hf, vnx8hi,
96 		 ((vnx8hf) { 12.0, 16.0, 18.0, 10.0, 42.0, 43.0, 44.0, 34.0,
97 			     7.0, 48.0, 3.0, 35.0, 9.0, 8.0, 7.0, 13.0 }),
98 		 ((vnx8hf) { 3.0, 4.0, 5.0, 6.0, 7.0, 8.0, 9.0, 10.0,
99 			     11.0, 12.0, 13.0, 14.0, 15.0, 16.0, 17.0, 18.0 }),
100 		 ((vnx8hf) { 33.0, 34.0, 35.0, 36.0, 37.0, 38.0, 39.0, 40.0,
101 			     41.0, 42.0, 43.0, 44.0, 45.0, 46.0, 47.0, 48.0 }),
102 		 ((vnx8hi) { 9 + (32 * 2), 13 + (32 * 2),
103 			     15 + (32 * 8), 7 + (32 * 9),
104 			     25 + (32 * 4), 26 + (32 * 3),
105 			     27 + (32 * 1), 17 + (32 * 2),
106 			     4 + (32 * 6), 31 + (32 * 7),
107 			     0 + (32 * 8), 18 + (32 * 9),
108 			     6 + (32 * 6), 5 + (32 * 7),
109 			     4 + (32 * 2), 10 + (32 * 2) }));
110   return 0;
111 }
112