2 /* { dg-options "-O2 -mavx512f" } */
3 /* { dg-require-effective-target avx512f } */
5 #include "avx512f-check.h"
7 #include "avx512f-helper.h"
9 #define SIZE (128 / 32)
10 #include "avx512f-mask-type.h"
13 calc_add (float *r
, float *s1
, float *s2
)
18 for (i
= 1; i
< SIZE
; i
++)
26 union128 res1
, res2
, res3
, res4
, res5
, src1
, src2
;
27 MASK_TYPE mask
= MASK_VALUE
;
31 for (i
= 0; i
< SIZE
; i
++)
33 src1
.a
[i
] = 1.5 + 34.67 * i
* sign
;
34 src2
.a
[i
] = -22.17 * i
* sign
+ 1.0;
37 for (i
= 0; i
< SIZE
; i
++)
39 res1
.a
[i
] = DEFAULT_VALUE
;
40 res4
.a
[i
] = DEFAULT_VALUE
;
43 res1
.x
= _mm_mask_add_ss (res1
.x
, mask
, src1
.x
, src2
.x
);
44 res2
.x
= _mm_maskz_add_ss (mask
, src1
.x
, src2
.x
);
45 res3
.x
= _mm_add_round_ss (src1
.x
, src2
.x
, _MM_FROUND_NO_EXC
);
46 res4
.x
= _mm_mask_add_round_ss (res4
.x
, mask
, src1
.x
, src2
.x
, _MM_FROUND_NO_EXC
);
47 res5
.x
= _mm_maskz_add_round_ss (mask
, src1
.x
, src2
.x
, _MM_FROUND_NO_EXC
);
49 calc_add (res_ref
, src1
.a
, src2
.a
);
51 MASK_MERGE () (res_ref
, mask
, 1);
52 if (check_union128 (res1
, res_ref
))
55 MASK_ZERO () (res_ref
, mask
, 1);
56 if (check_union128 (res2
, res_ref
))
59 calc_add (res_ref
, src1
.a
, src2
.a
);
61 if (check_union128 (res3
, res_ref
))
64 MASK_MERGE () (res_ref
, mask
, 1);
65 if (check_union128 (res4
, res_ref
))
68 MASK_ZERO () (res_ref
, mask
, 1);
69 if (check_union128 (res5
, res_ref
))