/* { dg-options "-O2 -mavx512f -std=c99" } */
/* { dg-require-effective-target avx512f } */
/* { dg-require-effective-target c99_runtime } */
8 #include "avx512f-helper.h"
11 #define SIZE (AVX512F_LEN / 32)
12 #include "avx512f-mask-type.h"
/* CMP(imm, rel) -- 512-bit variant (16 float lanes).

   Builds a reference mask by evaluating the scalar expression REL once per
   lane (REL is expected to mention the loop index `i`), then checks it
   against the result of the vector compare with predicate IMM:
     - the unmasked compare must equal the reference mask exactly;
     - the masked compare must equal the reference mask ANDed with `mask`.
   Any mismatch calls abort().

   The expansion site must have these names in scope: i, s1, s2, source1,
   source2, mask, dst1, dst2, dst_ref.

   dst_ref is cleared at the start of every expansion so that bits from a
   previous predicate cannot leak into this one.  REL is normalised with
   `!= 0` because isunordered() is only specified to return a nonzero value,
   not necessarily 1.  The do/while(0) wrapper makes `CMP(...);` a single
   statement.  */
#if AVX512F_LEN == 512
/* NOTE(review): the #undef only matters if this file can be included more
   than once with different AVX512F_LEN values -- confirm against the
   helper header.  It is harmless otherwise.  */
#undef CMP
#define CMP(imm, rel) \
  do \
    { \
      dst_ref = 0; \
      for (i = 0; i < 16; i++) \
        dst_ref = (((rel) != 0) << i) | dst_ref; \
      source1.x = _mm512_loadu_ps(s1); \
      source2.x = _mm512_loadu_ps(s2); \
      dst1 = _mm512_cmp_ps_mask(source1.x, source2.x, imm); \
      dst2 = _mm512_mask_cmp_ps_mask(mask, source1.x, source2.x, imm); \
      if (dst_ref != dst1) \
        abort(); \
      if ((dst_ref & mask) != dst2) \
        abort(); \
    } \
  while (0)
#endif
/* CMP(imm, rel) -- 256-bit variant (8 float lanes).

   Builds a reference mask by evaluating the scalar expression REL once per
   lane (REL is expected to mention the loop index `i`), then checks it
   against the result of the vector compare with predicate IMM:
     - the unmasked compare must equal the reference mask exactly;
     - the masked compare must equal the reference mask ANDed with `mask`.
   Any mismatch calls abort().

   The expansion site must have these names in scope: i, s1, s2, source1,
   source2, mask, dst1, dst2, dst_ref.

   dst_ref is cleared at the start of every expansion so that bits from a
   previous predicate cannot leak into this one.  REL is normalised with
   `!= 0` because isunordered() is only specified to return a nonzero value,
   not necessarily 1.  The do/while(0) wrapper makes `CMP(...);` a single
   statement.  */
#if AVX512F_LEN == 256
/* NOTE(review): the #undef only matters if this file can be included more
   than once with different AVX512F_LEN values -- confirm against the
   helper header.  It is harmless otherwise.  */
#undef CMP
#define CMP(imm, rel) \
  do \
    { \
      dst_ref = 0; \
      for (i = 0; i < 8; i++) \
        dst_ref = (((rel) != 0) << i) | dst_ref; \
      source1.x = _mm256_loadu_ps(s1); \
      source2.x = _mm256_loadu_ps(s2); \
      dst1 = _mm256_cmp_ps_mask(source1.x, source2.x, imm); \
      dst2 = _mm256_mask_cmp_ps_mask(mask, source1.x, source2.x, imm); \
      if (dst_ref != dst1) \
        abort(); \
      if ((dst_ref & mask) != dst2) \
        abort(); \
    } \
  while (0)
#endif
/* CMP(imm, rel) -- 128-bit variant (4 float lanes).

   Builds a reference mask by evaluating the scalar expression REL once per
   lane (REL is expected to mention the loop index `i`), then checks it
   against the result of the vector compare with predicate IMM:
     - the unmasked compare must equal the reference mask exactly;
     - the masked compare must equal the reference mask ANDed with `mask`.
   Any mismatch calls abort().

   The expansion site must have these names in scope: i, s1, s2, source1,
   source2, mask, dst1, dst2, dst_ref.

   dst_ref is cleared at the start of every expansion so that bits from a
   previous predicate cannot leak into this one.  REL is normalised with
   `!= 0` because isunordered() is only specified to return a nonzero value,
   not necessarily 1.  The do/while(0) wrapper makes `CMP(...);` a single
   statement.  */
#if AVX512F_LEN == 128
/* NOTE(review): the #undef only matters if this file can be included more
   than once with different AVX512F_LEN values -- confirm against the
   helper header.  It is harmless otherwise.  */
#undef CMP
#define CMP(imm, rel) \
  do \
    { \
      dst_ref = 0; \
      for (i = 0; i < 4; i++) \
        dst_ref = (((rel) != 0) << i) | dst_ref; \
      source1.x = _mm_loadu_ps(s1); \
      source2.x = _mm_loadu_ps(s2); \
      dst1 = _mm_cmp_ps_mask(source1.x, source2.x, imm); \
      dst2 = _mm_mask_cmp_ps_mask(mask, source1.x, source2.x, imm); \
      if (dst_ref != dst1) \
        abort(); \
      if ((dst_ref & mask) != dst2) \
        abort(); \
    } \
  while (0)
#endif
65 UNION_TYPE (AVX512F_LEN
,) source1
, source2
;
66 MASK_TYPE dst1
, dst2
, dst_ref
;
67 MASK_TYPE mask
= MASK_VALUE
;
/* Input operands for the comparisons, 16 floats each (only the leading
   lanes are consumed by the narrower CMP variants, whose loops stop at
   8 or 4).  The two arrays mix equal pairs (e.g. indices 1, 4, 6, 8-11),
   pairs where s1 < s2 (e.g. 0, 2, 12-15) and pairs where s1 > s2
   (e.g. 3, 5, 7), so each predicate sees both true and false lanes.
   Neither array contains a NaN, so the unordered case is never hit.  */
float s1[16] = {2134.3343, 6678.346, 453.345635, 54646.464,
                231.23311, 5674.455, 111.111111, 23241.152,
                123.14811, 1245.124, 244.151353, 53454.141,
                926.16717, 3733.261, 643.161644, 23514.633};
float s2[16] = {41124.234, 6678.346, 8653.65635, 856.43576,
                231.23311, 4646.123, 111.111111, 124.12455,
                123.14811, 1245.124, 244.151353, 53454.141,
                2134.3343, 6678.346, 453.345635, 54646.464};
78 CMP(_CMP_EQ_OQ
, !isunordered(s1
[i
], s2
[i
]) && s1
[i
] == s2
[i
]);
79 CMP(_CMP_LT_OS
, !isunordered(s1
[i
], s2
[i
]) && s1
[i
] < s2
[i
]);
80 CMP(_CMP_LE_OS
, !isunordered(s1
[i
], s2
[i
]) && s1
[i
] <= s2
[i
]);
81 CMP(_CMP_UNORD_Q
, isunordered(s1
[i
], s2
[i
]));
82 CMP(_CMP_NEQ_UQ
, isunordered(s1
[i
], s2
[i
]) || s1
[i
] != s2
[i
]);
83 CMP(_CMP_NLT_US
, isunordered(s1
[i
], s2
[i
]) || s1
[i
] >= s2
[i
]);
84 CMP(_CMP_NLE_US
, isunordered(s1
[i
], s2
[i
]) || s1
[i
] > s2
[i
]);
85 CMP(_CMP_ORD_Q
, !isunordered(s1
[i
], s2
[i
]));
87 CMP(_CMP_EQ_UQ
, isunordered(s1
[i
], s2
[i
]) || s1
[i
] == s2
[i
]);
88 CMP(_CMP_NGE_US
, isunordered(s1
[i
], s2
[i
]) || s1
[i
] < s2
[i
]);
89 CMP(_CMP_NGT_US
, isunordered(s1
[i
], s2
[i
]) || s1
[i
] <= s2
[i
]);
91 CMP(_CMP_FALSE_OQ
, 0);
92 CMP(_CMP_NEQ_OQ
, !isunordered(s1
[i
], s2
[i
]) && s1
[i
] != s2
[i
]);
93 CMP(_CMP_GE_OS
, !isunordered(s1
[i
], s2
[i
]) && s1
[i
] >= s2
[i
]);
94 CMP(_CMP_GT_OS
, !isunordered(s1
[i
], s2
[i
]) && s1
[i
] > s2
[i
]);
97 CMP(_CMP_EQ_OS
, !isunordered(s1
[i
], s2
[i
]) && s1
[i
] == s2
[i
]);
98 CMP(_CMP_LT_OQ
, !isunordered(s1
[i
], s2
[i
]) && s1
[i
] < s2
[i
]);
99 CMP(_CMP_LE_OQ
, !isunordered(s1
[i
], s2
[i
]) && s1
[i
] <= s2
[i
]);
100 CMP(_CMP_UNORD_S
, isunordered(s1
[i
], s2
[i
]));
101 CMP(_CMP_NEQ_US
, isunordered(s1
[i
], s2
[i
]) || s1
[i
] != s2
[i
]);
102 CMP(_CMP_NLT_UQ
, isunordered(s1
[i
], s2
[i
]) || s1
[i
] >= s2
[i
]);
103 CMP(_CMP_NLE_UQ
, isunordered(s1
[i
], s2
[i
]) || s1
[i
] > s2
[i
]);
104 CMP(_CMP_ORD_S
, !isunordered(s1
[i
], s2
[i
]));
105 CMP(_CMP_EQ_US
, isunordered(s1
[i
], s2
[i
]) || s1
[i
] == s2
[i
]);
106 CMP(_CMP_NGE_UQ
, isunordered(s1
[i
], s2
[i
]) || s1
[i
] < s2
[i
]);
107 CMP(_CMP_NGT_UQ
, isunordered(s1
[i
], s2
[i
]) || s1
[i
] <= s2
[i
]);
108 CMP(_CMP_FALSE_OS
, 0);
109 CMP(_CMP_NEQ_OS
, !isunordered(s1
[i
], s2
[i
]) && s1
[i
] != s2
[i
]);
110 CMP(_CMP_GE_OQ
, !isunordered(s1
[i
], s2
[i
]) && s1
[i
] >= s2
[i
]);
111 CMP(_CMP_GT_OQ
, !isunordered(s1
[i
], s2
[i
]) && s1
[i
] > s2
[i
]);