1 /* { dg-do run } */
2 /* { dg-require-effective-target ssse3 } */
3 /* { dg-options "-O2 -fno-strict-aliasing -mssse3" } */
4 
5 #ifndef CHECK_H
6 #define CHECK_H "ssse3-check.h"
7 #endif
8 
9 #ifndef TEST
10 #define TEST ssse3_test
11 #endif
12 
13 #include CHECK_H
14 #include "ssse3-vals.h"
15 
16 #include <tmmintrin.h>
17 
18 #ifndef __AVX__
/* Test the 64-bit form.

   Reinterprets I1 and I2 as one __m64 each, applies _mm_sign_pi16 and
   stores the 64-bit result through R.  Going by the manual reference
   model in this file, each 16-bit lane of the result is the I1 lane
   negated, zeroed or kept according to whether the matching I2 lane is
   negative, zero or positive.  */
static void
ssse3_test_psignw (int *i1, int *i2, int *r)
{
  __m64 *src = (__m64 *) i1;
  __m64 *sign = (__m64 *) i2;
  __m64 *dst = (__m64 *) r;

  *dst = _mm_sign_pi16 (*src, *sign);

  /* The __m64 form goes through the MMX registers; clear the MMX state
     before returning to ordinary code.  */
  _mm_empty ();
}
28 #endif
29 
/* Test the 128-bit form.

   Reinterprets I1 and I2 as one __m128i each, applies _mm_sign_epi16
   and stores the 128-bit result through R.  All three pointers are
   dereferenced as __m128i, so the caller must pass 16-byte aligned
   addresses.  */
static void
ssse3_test_psignw128 (int *i1, int *i2, int *r)
{
  /* Assumes incoming pointers are 16-byte aligned */
  __m128i *src = (__m128i *) i1;
  __m128i *sign = (__m128i *) i2;
  __m128i *dst = (__m128i *) r;

  *dst = _mm_sign_epi16 (*src, *sign);
}
39 
/* Routine to manually compute the results.

   I1, I2 and R are each viewed as eight consecutive short lanes.  Each
   output lane is the matching I1 lane negated when the I2 lane is
   negative, zero when the I2 lane is zero, and the I1 lane unchanged
   otherwise.  The int buffers are accessed through short pointers, so
   this relies on the file being built with -fno-strict-aliasing.  */
static void
compute_correct_result (int *i1, int *i2, int *r)
{
  short *s1 = (short *) i1;
  short *s2 = (short *) i2;
  short *sout = (short *) r;
  int i;

  for (i = 0; i < 8; i++)
    {
      if (s2[i] < 0)
        {
          /* The negation is evaluated in int and then narrowed back to
             short.  For a lane holding -32768 the int result 32768 does
             not fit; GCC reduces it modulo 2^16, giving -32768 again.  */
          sout[i] = (short) -s1[i];
        }
      else if (s2[i] == 0)
        {
          sout[i] = 0;
        }
      else
        {
          sout[i] = s1[i];
        }
    }
}
57 
58 static void
TEST(void)59 TEST (void)
60 {
61   int i;
62   int r [4] __attribute__ ((aligned(16)));
63   int ck [4];
64   int fail = 0;
65 
66   for (i = 0; i < 256; i += 8)
67     {
68       /* Manually compute the result */
69       compute_correct_result (&vals[i + 0], &vals[i + 4], ck);
70 
71 #ifndef __AVX__
72       /* Run the 64-bit tests */
73       ssse3_test_psignw (&vals[i + 0], &vals[i + 4], &r[0]);
74       ssse3_test_psignw (&vals[i + 2], &vals[i + 6], &r[2]);
75       fail += chk_128 (ck, r);
76 #endif
77 
78       /* Run the 128-bit tests */
79       ssse3_test_psignw128 (&vals[i + 0], &vals[i + 4], r);
80       fail += chk_128 (ck, r);
81     }
82 
83   if (fail != 0)
84     abort ();
85 }
86