2 /* { dg-options "-mavx2 -O2" } */
3 /* { dg-require-effective-target avx2 } */
5 #include "avx2-check.h"
6 #include "ssse3-vals.h"
9 compute_phaddw256 (short *i1
, short *i2
, short *r
)
13 for (i
= 0; i
< 4; i
++)
14 r
[i
+ 0] = i1
[2 * i
] + i1
[2 * i
+ 1];
16 for (i
= 0; i
< 4; i
++)
17 r
[i
+ 4] = i2
[2 * i
] + i2
[2 * i
+ 1];
19 for (i
= 0; i
< 4; i
++)
20 r
[i
+ 8] = i1
[2 * i
+ 8] + i1
[2 * i
+ 9];
22 for (i
= 0; i
< 4; i
++)
23 r
[i
+ 12] = i2
[2 * i
+ 8] + i2
[2 * i
+ 9];
29 union256i_w s1
, s2
, res
;
34 for (i
= 0; i
< 256; i
+= 16)
36 s1
.x
= _mm256_loadu_si256 ((__m256i
*) & vals
[i
]);
37 s2
.x
= _mm256_loadu_si256 ((__m256i
*) & vals
[i
+ 8]);
39 res
.x
= _mm256_hadd_epi16 (s1
.x
, s2
.x
);
41 compute_phaddw256 (s1
.a
, s2
.a
, res_ref
);
43 fail
+= check_union256i_w (res
, res_ref
);