1 /* { dg-do run } */
2 /* { dg-options "-O2 -mavx512f -std=c99" } */
3 /* { dg-require-effective-target avx512f } */
4 /* { dg-require-effective-target c99_runtime } */
5
6 #define AVX512F
7
8 #include "avx512f-helper.h"
9
10 #include <math.h>
11 #define SIZE (AVX512F_LEN / 64)
12 #include "avx512f-mask-type.h"
13
/* Drop any earlier definitions of the per-length helper macros before
   they are redefined below.  */
#undef SUF
#undef SSIZE
#undef GEN_CMP
#undef CHECK_CMP

/* Per-vector-length configuration, selected by AVX512F_LEN:

     SUF(fun)        pastes the intrinsic prefix for the selected width
                     (_mm512, _mm256 or _mm) in front of FUN.
     SSIZE           number of double lanes the CMP loop walks (8, 4 or 2).
     GEN_CMP(type)   512-bit only: calls the predicate-named intrinsics
                     _mm512_cmp<type>_pd_mask and
                     _mm512_mask_cmp<type>_pd_mask and aborts unless their
                     results equal dst1 and dst2 respectively.
     CHECK_CMP(imm)  512-bit only: picks the GEN_CMP variant that matches
                     IMM for the eight predicates listed below.

   For the 256-bit and 128-bit variants GEN_CMP and CHECK_CMP expand to
   nothing.  GEN_CMP is a brace block and CHECK_CMP ends in one, so neither
   needs a trailing semicolon at the point of use.  Both rely on dst1..dst4,
   mask, source1 and source2 being declared where they are expanded.  */
#if AVX512F_LEN == 512

#define SSIZE 8
#define SUF(fun) _mm512##fun

#define GEN_CMP(type)                                                     \
  {                                                                       \
    dst3 = _mm512_cmp##type##_pd_mask (source1.x, source2.x);             \
    if (dst1 != dst3)                                                     \
      abort ();                                                           \
    dst4 = _mm512_mask_cmp##type##_pd_mask (mask, source1.x, source2.x);  \
    if (dst2 != dst4)                                                     \
      abort ();                                                           \
  }

#define CHECK_CMP(imm)                          \
  if ((imm) == _CMP_EQ_OQ)                      \
    GEN_CMP(eq)                                 \
  else if ((imm) == _CMP_LT_OS)                 \
    GEN_CMP(lt)                                 \
  else if ((imm) == _CMP_LE_OS)                 \
    GEN_CMP(le)                                 \
  else if ((imm) == _CMP_UNORD_Q)               \
    GEN_CMP(unord)                              \
  else if ((imm) == _CMP_NEQ_UQ)                \
    GEN_CMP(neq)                                \
  else if ((imm) == _CMP_NLT_US)                \
    GEN_CMP(nlt)                                \
  else if ((imm) == _CMP_NLE_US)                \
    GEN_CMP(nle)                                \
  else if ((imm) == _CMP_ORD_Q)                 \
    GEN_CMP(ord)

#elif AVX512F_LEN == 256

#define SSIZE 4
#define SUF(fun) _mm256##fun
#define GEN_CMP(type)
#define CHECK_CMP(imm)

#elif AVX512F_LEN == 128

#define SSIZE 2
#define SUF(fun) _mm##fun
#define GEN_CMP(type)
#define CHECK_CMP(imm)

#endif
56
/* CMP(imm, rel): check the immediate-form compare intrinsics for
   predicate IMM.

   REL is a C expression written in terms of s1[i] and s2[i].  It is
   evaluated once per lane i in [0, SSIZE) and bit i of the reference mask
   dst_ref is set when it is true.  The vectors are then loaded from s1 and
   s2, and the results of the unmasked and masked intrinsics are compared
   against dst_ref and (dst_ref & mask); any mismatch aborts.  Finally
   CHECK_CMP(imm) runs whatever extra checks the selected vector length
   defines.

   REL is parenthesised before the int cast so the cast applies to the
   whole relation rather than only to its first operand.

   This expands to a plain statement sequence, not a single statement: it
   must not be used as the unbraced body of an if/for/while.  It relies on
   i, s1, s2, source1, source2, mask, dst1, dst2 and dst_ref being declared
   at the expansion site.  */
#undef CMP
#define CMP(imm, rel)                                                     \
  dst_ref = 0;                                                            \
  for (i = 0; i < SSIZE; i++)                                             \
    {                                                                     \
      dst_ref = (((int) (rel)) << i) | dst_ref;                           \
    }                                                                     \
  source1.x = SUF(_loadu_pd) (s1);                                        \
  source2.x = SUF(_loadu_pd) (s2);                                        \
  dst1 = SUF(_cmp_pd_mask) (source1.x, source2.x, imm);                   \
  dst2 = SUF(_mask_cmp_pd_mask) (mask, source1.x, source2.x, imm);        \
  if (dst_ref != dst1) abort ();                                          \
  if ((dst_ref & mask) != dst2) abort ();                                 \
  CHECK_CMP(imm)
71
72 void
TEST()73 TEST ()
74 {
75 UNION_TYPE (AVX512F_LEN, d) source1, source2;
76 MASK_TYPE dst1, dst2, dst3, dst4, dst_ref;
77 MASK_TYPE mask = MASK_VALUE;
78 int i;
79 double s1[8]={2134.3343, 6678.346, 453.345635, 54646.464,
80 231.23311, 5674.455, 111.111111, 23241.152};
81 double s2[8]={41124.234, 6678.346, 8653.65635, 856.43576,
82 231.23311, 4646.123, 111.111111, 124.12455};
83
84 CMP(_CMP_EQ_OQ, !isunordered(s1[i], s2[i]) && s1[i] == s2[i]);
85 CMP(_CMP_LT_OS, !isunordered(s1[i], s2[i]) && s1[i] < s2[i]);
86 CMP(_CMP_LE_OS, !isunordered(s1[i], s2[i]) && s1[i] <= s2[i]);
87 CMP(_CMP_UNORD_Q, isunordered(s1[i], s2[i]));
88 CMP(_CMP_NEQ_UQ, isunordered(s1[i], s2[i]) || s1[i] != s2[i]);
89 CMP(_CMP_NLT_US, isunordered(s1[i], s2[i]) || s1[i] >= s2[i]);
90 CMP(_CMP_NLE_US, isunordered(s1[i], s2[i]) || s1[i] > s2[i]);
91 CMP(_CMP_ORD_Q, !isunordered(s1[i], s2[i]));
92
93 CMP(_CMP_EQ_UQ, isunordered(s1[i], s2[i]) || s1[i] == s2[i]);
94 CMP(_CMP_NGE_US, isunordered(s1[i], s2[i]) || s1[i] < s2[i]);
95 CMP(_CMP_NGT_US, isunordered(s1[i], s2[i]) || s1[i] <= s2[i]);
96
97 CMP(_CMP_FALSE_OQ, 0);
98 CMP(_CMP_NEQ_OQ, !isunordered(s1[i], s2[i]) && s1[i] != s2[i]);
99 CMP(_CMP_GE_OS, !isunordered(s1[i], s2[i]) && s1[i] >= s2[i]);
100 CMP(_CMP_GT_OS, !isunordered(s1[i], s2[i]) && s1[i] > s2[i]);
101 CMP(_CMP_TRUE_UQ, 1);
102
103 CMP(_CMP_EQ_OS, !isunordered(s1[i], s2[i]) && s1[i] == s2[i]);
104 CMP(_CMP_LT_OQ, !isunordered(s1[i], s2[i]) && s1[i] < s2[i]);
105 CMP(_CMP_LE_OQ, !isunordered(s1[i], s2[i]) && s1[i] <= s2[i]);
106 CMP(_CMP_UNORD_S, isunordered(s1[i], s2[i]));
107 CMP(_CMP_NEQ_US, isunordered(s1[i], s2[i]) || s1[i] != s2[i]);
108 CMP(_CMP_NLT_UQ, isunordered(s1[i], s2[i]) || s1[i] >= s2[i]);
109 CMP(_CMP_NLE_UQ, isunordered(s1[i], s2[i]) || s1[i] > s2[i]);
110 CMP(_CMP_ORD_S, !isunordered(s1[i], s2[i]));
111 CMP(_CMP_EQ_US, isunordered(s1[i], s2[i]) || s1[i] == s2[i]);
112 CMP(_CMP_NGE_UQ, isunordered(s1[i], s2[i]) || s1[i] < s2[i]);
113 CMP(_CMP_NGT_UQ, isunordered(s1[i], s2[i]) || s1[i] <= s2[i]);
114 CMP(_CMP_FALSE_OS, 0);
115 CMP(_CMP_NEQ_OS, !isunordered(s1[i], s2[i]) && s1[i] != s2[i]);
116 CMP(_CMP_GE_OQ, !isunordered(s1[i], s2[i]) && s1[i] >= s2[i]);
117 CMP(_CMP_GT_OQ, !isunordered(s1[i], s2[i]) && s1[i] > s2[i]);
118 CMP(_CMP_TRUE_US, 1)
119 }
120