2 /* { dg-options "-O2 -mavx512bw" } */
3 /* { dg-require-effective-target avx512bw } */
6 #include "avx512f-helper.h"
8 #define DST_SIZE (AVX512F_LEN / 16)
9 #define SRC_SIZE (AVX512F_LEN / 32)
13 #include "avx512f-mask-type.h"
16 EVAL(int_to_ushort
, AVX512F_LEN
,) (int iVal
)
22 else if (iVal
> USHRT_MAX
)
31 CALC (int *src1
, int *src2
, unsigned short *dst
)
36 for (i
= 0; i
< DST_SIZE
; i
++)
38 ptr
= (i
/ 4) % 2 ? src2
: src1
;
39 dst
[i
] = EVAL(int_to_ushort
, AVX512F_LEN
,) (ptr
[i
% 4 + (i
/ 8) * 4]);
46 UNION_TYPE (AVX512F_LEN
, i_d
) s1
, s2
;
47 UNION_TYPE (AVX512F_LEN
, i_w
) res1
, res2
, res3
;
48 MASK_TYPE mask
= MASK_VALUE
;
49 unsigned short dst_ref
[DST_SIZE
];
52 for (i
= 0; i
< DST_SIZE
; i
++)
53 res2
.a
[i
] = DEFAULT_VALUE
;
55 for (i
= 0; i
< SRC_SIZE
; i
++)
61 res1
.x
= INTRINSIC (_packus_epi32
) (s1
.x
, s2
.x
);
62 res2
.x
= INTRINSIC (_mask_packus_epi32
) (res2
.x
, mask
, s1
.x
, s2
.x
);
63 res3
.x
= INTRINSIC (_maskz_packus_epi32
) (mask
, s1
.x
, s2
.x
);
65 CALC (s1
.a
, s2
.a
, dst_ref
);
67 if (UNION_CHECK (AVX512F_LEN
, i_w
) (res1
, dst_ref
))
70 MASK_MERGE (i_w
) (dst_ref
, mask
, DST_SIZE
);
71 if (UNION_CHECK (AVX512F_LEN
, i_w
) (res2
, dst_ref
))
74 MASK_ZERO (i_w
) (dst_ref
, mask
, DST_SIZE
);
75 if (UNION_CHECK (AVX512F_LEN
, i_w
) (res3
, dst_ref
))