1 /* { dg-do run } */
2 /* { dg-options "-mavx2 -O2" } */
3 /* { dg-require-effective-target avx2 } */
4
5 #include "avx2-check.h"
6 #include "ssse3-vals.h"
7
/* Saturate X to the signed 16-bit range [-0x8000, 0x7fff].

   Values above 0x7fff clamp to 0x7fff, values below -0x8000 clamp to
   -0x8000, and everything in between is returned unchanged.  */
static short
signed_saturate_to_word (int x)
{
  if (x > 0x7fff)
    return 0x7fff;

  /* The bound is spelled -0x8000 instead of (int) 0xffff8000, and the
     clamp value -0x8000 instead of 0x8000, so that neither relies on an
     implementation-defined conversion of an out-of-range value.  */
  if (x < -0x8000)
    return -0x8000;

  return (short) x;
}
19
/* Scalar reference for a 256-bit horizontal subtract with signed
   saturation on 16-bit elements.

   I1 and I2 each hold 16 input words and R receives 16 result words.
   The data is handled as two halves of 8 words.  Within each half, the
   first four results are the saturated differences of adjacent pairs
   from I1 (even element minus odd element) and the next four are the
   same for I2.  */
static void
compute_phsubsw256 (short *i1, short *i2, short *r)
{
  int half, pair;

  for (half = 0; half < 2; half++)
    {
      /* Offset of this 8-word half in all three arrays.  */
      int base = 8 * half;

      /* Results 0..3 of the half: adjacent pairs taken from I1.  */
      for (pair = 0; pair < 4; pair++)
	r[base + pair]
	  = signed_saturate_to_word (i1[base + 2 * pair]
				     - i1[base + 2 * pair + 1]);

      /* Results 4..7 of the half: adjacent pairs taken from I2.  */
      for (pair = 0; pair < 4; pair++)
	r[base + 4 + pair]
	  = signed_saturate_to_word (i2[base + 2 * pair]
				     - i2[base + 2 * pair + 1]);
    }
}
37
38 static void
avx2_test(void)39 avx2_test (void)
40 {
41 union256i_w s1, s2, res;
42 short res_ref[16];
43 int i;
44 int fail = 0;
45
46 for (i = 0; i < 256; i += 16)
47 {
48 s1.x = _mm256_loadu_si256 ((__m256i *) & vals[i]);
49 s2.x = _mm256_loadu_si256 ((__m256i *) & vals[i + 8]);
50
51 res.x = _mm256_hsubs_epi16 (s1.x, s2.x);
52
53 compute_phsubsw256 (s1.a, s2.a, res_ref);
54
55 fail += check_union256i_w (res, res_ref);
56 }
57
58 if (fail != 0)
59 abort ();
60 }
61