1 /* { dg-do run } */
2 /* { dg-require-effective-target sse4 } */
3 /* { dg-options "-O2 -msse4.1" } */
4 
5 #ifndef CHECK_H
6 #define CHECK_H "sse4_1-check.h"
7 #endif
8 
9 #ifndef TEST
10 #define TEST sse4_1_test
11 #endif
12 
13 #include CHECK_H
14 
15 #include <smmintrin.h>
16 
17 #define lmskN  0x00
18 #define lmsk0  0x01
19 #define lmsk1  0x02
20 #define lmsk01 0x03
21 
22 #define hmskA  0x30
23 #define hmsk0  0x10
24 #define hmsk1  0x20
25 #define hmsk01 0x30
26 #define hmskN  0x00
27 
28 #ifndef HIMASK
29 #define HIMASK hmskA
30 #endif
31 
32 static void
TEST(void)33 TEST (void)
34 {
35   union
36     {
37       __m128d x;
38       double d[2];
39     } val1, val2, res[4];
40   int masks[4];
41   int i, j;
42 
43   val1.d[0] = 2.;
44   val1.d[1] = 3.;
45 
46   val2.d[0] = 10.;
47   val2.d[1] = 100.;
48 
49   res[0].x = _mm_dp_pd (val1.x, val2.x, HIMASK | lmskN);
50   res[1].x = _mm_dp_pd (val1.x, val2.x, HIMASK | lmsk0);
51   res[2].x = _mm_dp_pd (val1.x, val2.x, HIMASK | lmsk1);
52   res[3].x = _mm_dp_pd (val1.x, val2.x, HIMASK | lmsk01);
53 
54   masks[0] = HIMASK | lmskN;
55   masks[1] = HIMASK | lmsk0;
56   masks[2] = HIMASK | lmsk1;
57   masks[3] = HIMASK | lmsk01;
58 
59   for (i = 0; i < 4; i++)
60     {
61       double tmp = 0.;
62 
63       for (j = 0; j < 2; j++)
64 	if (HIMASK & (0x10 << j))
65 	  tmp = tmp + (val1.d[j] * val2.d[j]);
66 
67       for (j = 0; j < 2; j++)
68 	if ((masks[i] & (1 << j)) && res[i].d[j] != tmp)
69 	  abort ();
70    }
71 }
72