Add support for conditional reductions using SVE CLASTB
[official-gcc.git] / gcc / testsuite / gcc.target / aarch64 / sve / vec_perm_1_overrange_run.c
blob317cae6010c4318554c6ee1f38ecda50e30a715e
1 /* { dg-do run { target aarch64_sve_hw } } */
2 /* { dg-options "-O" } */
3 /* { dg-options "-O -msve-vector-bits=256" { target aarch64_sve256_hw } } */
5 #include "vec_perm_1.c"
/* Check one vec_perm_<TYPE> call against a known answer.

   TYPE             type of the two inputs and of the result; it is also
                    pasted onto "vec_perm_" to select the function called.
   MASK_TYPE        type of the selector passed as the third argument.
   EXPECTED_RESULT  value the call is required to produce.
   VALUES1/VALUES2  first and second input operands.
   MASK             selector operand.

   The result is compared with EXPECTED_RESULT as raw bytes, so this works
   for integer and floating-point TYPEs alike; any difference aborts the
   program.  The body is wrapped in do/while (0) so that an invocation
   followed by ';' is exactly one statement, even under an unbraced
   if/else.  */
#define TEST_VEC_PERM(TYPE, MASK_TYPE, EXPECTED_RESULT,                 \
                      VALUES1, VALUES2, MASK)                           \
  do                                                                    \
    {                                                                   \
      TYPE expected_result = EXPECTED_RESULT;                           \
      TYPE values1 = VALUES1;                                           \
      TYPE values2 = VALUES2;                                           \
      MASK_TYPE mask = MASK;                                            \
      TYPE dest;                                                        \
      dest = vec_perm_##TYPE (values1, values2, mask);                  \
      if (__builtin_memcmp (&dest, &expected_result, sizeof (TYPE)) != 0) \
        __builtin_abort ();                                             \
    }                                                                   \
  while (0)
20 int main (void)
22 TEST_VEC_PERM (vnx2di, vnx2di,
23 ((vnx2di) { 5, 36, 7, 48 }),
24 ((vnx2di) { 4, 5, 6, 7 }),
25 ((vnx2di) { 12, 24, 36, 48 }),
26 ((vnx2di) { 1 + (8 * 1), 6 + (8 * 3),
27 3 + (8 * 1), 7 + (8 * 5) }));
28 TEST_VEC_PERM (vnx4si, vnx4si,
29 ((vnx4si) { 34, 38, 40, 10, 9, 8, 7, 35 }),
30 ((vnx4si) { 3, 4, 5, 6, 7, 8, 9, 10 }),
31 ((vnx4si) { 33, 34, 35, 36, 37, 38, 39, 40 }),
32 ((vnx4si) { 9 + (16 * 2), 13 + (16 * 5),
33 15 + (16 * 1), 7 + (16 * 0),
34 6 + (16 * 8), 5 + (16 * 2),
35 4 + (16 * 3), 10 + (16 * 2) }));
36 TEST_VEC_PERM (vnx8hi, vnx8hi,
37 ((vnx8hi) { 12, 16, 18, 10, 42, 43, 44, 34,
38 7, 48, 3, 35, 9, 8, 7, 13 }),
39 ((vnx8hi) { 3, 4, 5, 6, 7, 8, 9, 10,
40 11, 12, 13, 14, 15, 16, 17, 18 }),
41 ((vnx8hi) { 33, 34, 35, 36, 37, 38, 39, 40,
42 41, 42, 43, 44, 45, 46, 47, 48 }),
43 ((vnx8hi) { 9 + (32 * 2), 13 + (32 * 2),
44 15 + (32 * 8), 7 + (32 * 9),
45 25 + (32 * 4), 26 + (32 * 3),
46 27 + (32 * 1), 17 + (32 * 2),
47 4 + (32 * 6), 31 + (32 * 7),
48 0 + (32 * 8), 18 + (32 * 9),
49 6 + (32 * 6), 5 + (32 * 7),
50 4 + (32 * 2), 10 + (32 * 2) }));
51 TEST_VEC_PERM (vnx16qi, vnx16qi,
52 ((vnx16qi) { 5, 6, 7, 4, 5, 6, 4, 5,
53 6, 7, 12, 24, 36, 48, 12, 24,
54 5, 6, 7, 4, 5, 6, 4, 5,
55 6, 7, 12, 24, 36, 48, 12, 24 }),
56 ((vnx16qi) { 4, 5, 6, 7, 4, 5, 6, 7,
57 4, 5, 6, 7, 4, 5, 6, 7,
58 4, 5, 6, 7, 4, 5, 6, 7,
59 4, 5, 6, 7, 4, 5, 6, 7 }),
60 ((vnx16qi) { 12, 24, 36, 48, 12, 24, 36, 48,
61 12, 24, 36, 48, 12, 24, 36, 48,
62 12, 24, 36, 48, 12, 24, 36, 48,
63 12, 24, 36, 48, 12, 24, 36, 48 }),
64 ((vnx16qi) { 5 + (64 * 3), 6 + (64 * 1),
65 7 + (64 * 2), 8 + (64 * 1),
66 9 + (64 * 3), 10 + (64 * 1),
67 28 + (64 * 3), 29 + (64 * 3),
68 30 + (64 * 1), 31 + (64 * 1),
69 32 + (64 * 3), 33 + (64 * 2),
70 54 + (64 * 2), 55 + (64 * 2),
71 56 + (64 * 1), 61 + (64 * 2),
72 5 + (64 * 2), 6 + (64 * 1),
73 7 + (64 * 2), 8 + (64 * 2),
74 9 + (64 * 2), 10 + (64 * 1),
75 28 + (64 * 3), 29 + (64 * 1),
76 30 + (64 * 3), 31 + (64 * 3),
77 32 + (64 * 1), 33 + (64 * 1),
78 54 + (64 * 2), 55 + (64 * 2),
79 56 + (64 * 2), 61 + (64 * 2) }));
80 TEST_VEC_PERM (vnx2df, vnx2di,
81 ((vnx2df) { 5.1, 36.1, 7.1, 48.1 }),
82 ((vnx2df) { 4.1, 5.1, 6.1, 7.1 }),
83 ((vnx2df) { 12.1, 24.1, 36.1, 48.1 }),
84 ((vnx2di) { 1 + (8 * 3), 6 + (8 * 10),
85 3 + (8 * 8), 7 + (8 * 2) }));
86 TEST_VEC_PERM (vnx4sf, vnx4si,
87 ((vnx4sf) { 34.2, 38.2, 40.2, 10.2, 9.2, 8.2, 7.2, 35.2 }),
88 ((vnx4sf) { 3.2, 4.2, 5.2, 6.2, 7.2, 8.2, 9.2, 10.2 }),
89 ((vnx4sf) { 33.2, 34.2, 35.2, 36.2,
90 37.2, 38.2, 39.2, 40.2 }),
91 ((vnx4si) { 9 + (16 * 1), 13 + (16 * 5),
92 15 + (16 * 4), 7 + (16 * 4),
93 6 + (16 * 3), 5 + (16 * 2),
94 4 + (16 * 1), 10 + (16 * 0) }));
95 TEST_VEC_PERM (vnx8hf, vnx8hi,
96 ((vnx8hf) { 12.0, 16.0, 18.0, 10.0, 42.0, 43.0, 44.0, 34.0,
97 7.0, 48.0, 3.0, 35.0, 9.0, 8.0, 7.0, 13.0 }),
98 ((vnx8hf) { 3.0, 4.0, 5.0, 6.0, 7.0, 8.0, 9.0, 10.0,
99 11.0, 12.0, 13.0, 14.0, 15.0, 16.0, 17.0, 18.0 }),
100 ((vnx8hf) { 33.0, 34.0, 35.0, 36.0, 37.0, 38.0, 39.0, 40.0,
101 41.0, 42.0, 43.0, 44.0, 45.0, 46.0, 47.0, 48.0 }),
102 ((vnx8hi) { 9 + (32 * 2), 13 + (32 * 2),
103 15 + (32 * 8), 7 + (32 * 9),
104 25 + (32 * 4), 26 + (32 * 3),
105 27 + (32 * 1), 17 + (32 * 2),
106 4 + (32 * 6), 31 + (32 * 7),
107 0 + (32 * 8), 18 + (32 * 9),
108 6 + (32 * 6), 5 + (32 * 7),
109 4 + (32 * 2), 10 + (32 * 2) }));
110 return 0;