/* { dg-do compile { target { ! ia32 } } } */
/* { dg-options "-O2 -mavx512vl -mno-avx512bw -masm=att" } */

4 typedef char V1 __attribute__((vector_size (16)));
5 
6 void
f1(V1 x)7 f1 (V1 x)
8 {
9   register V1 a __asm ("xmm16");
10   a = x;
11   asm volatile ("" : "+v" (a));
12   a = __builtin_shuffle (a, (V1) { 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 0, 1, 2, 3, 4, 5 });
13   asm volatile ("" : "+v" (a));
14 }
15 
/* { dg-final { scan-assembler-not "vpalignr\[^\n\r]*\\\$6\[^\n\r]*%xmm16\[^\n\r]*%xmm16\[^\n\r]*%xmm16" } } */

18 typedef short V2 __attribute__((vector_size (16)));
19 
20 void
f2(V2 x)21 f2 (V2 x)
22 {
23   register V2 a __asm ("xmm16");
24   a = x;
25   asm volatile ("" : "+v" (a));
26   a = __builtin_shuffle (a, (V2) { 5, 6, 7, 0, 1, 2, 3, 4 });
27   asm volatile ("" : "+v" (a));
28 }
29 
/* { dg-final { scan-assembler-not "vpalignr\[^\n\r]*\\\$10\[^\n\r]*%xmm16\[^\n\r]*%xmm16\[^\n\r]*%xmm16" } } */

32 typedef int V3 __attribute__((vector_size (16)));
33 
34 void
f3(V3 x)35 f3 (V3 x)
36 {
37   register V3 a __asm ("xmm16");
38   a = x;
39   asm volatile ("" : "+v" (a));
40   a = __builtin_shuffle (a, (V3) { 3, 0, 1, 2 });
41   asm volatile ("" : "+v" (a));
42 }
43 
/* { dg-final { scan-assembler-times "vpshufd\[^\n\r]*\\\$147\[^\n\r]*%xmm16\[^\n\r]*%xmm16" 1 } } */

46 typedef long long V4 __attribute__((vector_size (16)));
47 
48 void
f4(V4 x)49 f4 (V4 x)
50 {
51   register V4 a __asm ("xmm16");
52   a = x;
53   asm volatile ("" : "+v" (a));
54   a = __builtin_shuffle (a, (V4) { 1, 0 });
55   asm volatile ("" : "+v" (a));
56 }
57 
/* { dg-final { scan-assembler-not "vpalignr\[^\n\r]*\\\$8\[^\n\r]*%xmm16\[^\n\r]*%xmm16\[^\n\r]*%xmm16" } } */

60 typedef float V5 __attribute__((vector_size (16)));
61 
62 void
f5(V5 x)63 f5 (V5 x)
64 {
65   register V5 a __asm ("xmm16");
66   a = x;
67   asm volatile ("" : "+v" (a));
68   a = __builtin_shuffle (a, (V3) { 3, 0, 1, 2 });
69   asm volatile ("" : "+v" (a));
70 }
71 
/* { dg-final { scan-assembler-times "vpermilps\[^\n\r]*\\\$147\[^\n\r]*%xmm16\[^\n\r]*%xmm16" 1 } } */

74 typedef double V6 __attribute__((vector_size (16)));
75 
76 void
f6(V6 x)77 f6 (V6 x)
78 {
79   register V6 a __asm ("xmm16");
80   a = x;
81   asm volatile ("" : "+v" (a));
82   a = __builtin_shuffle (a, (V4) { 1, 0 });
83   asm volatile ("" : "+v" (a));
84 }
85 
/* { dg-final { scan-assembler-times "vpermilpd\[^\n\r]*\\\$1\[^\n\r]*%xmm16\[^\n\r]*%xmm16" 1 } } */
