IVOPT performance tuning patch. The main problem is a variant of maximal weight
[official-gcc.git] / gcc / testsuite / gcc.dg / vect / slp-multitypes-3.c
blob926cc28a4f64e73300fbc4ac5b25cd085a1554d1
/* { dg-require-effective-target vect_int } */
3 #include <stdarg.h>
4 #include <stdio.h>
5 #include "tree-vect.h"
#define N 8

/* Input data for the test: in[k] == k and in2[k] == k for every
   k in 0 .. N*8 - 1.  */
unsigned int in[N*8] = {0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63};
unsigned char in2[N*8] = {0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63};

/* Run N/2 iterations that each store 8 unsigned int elements into OUT
   and 16 unsigned char elements into OUT2, every element being the
   matching IN/IN2 element plus a per-position constant.  A second loop
   then re-reads every stored element and calls abort () on the first
   mismatch.  Returns 0 when all stored values are as expected.

   Only out[0 .. 31] and out2[0 .. 63] are written and checked; the
   upper half of OUT is never touched.

   NOTE(review): the statements are presumably kept unrolled on purpose,
   because the dg-final directives of this file scan the vectorizer
   dump -- confirm before restructuring the loop body.  */
__attribute__ ((noinline)) int
main1 (void)
{
  int i;
  unsigned int out[N*8];
  unsigned char out2[N*8];

  for (i = 0; i < N/2; i++)
    {
      /* Group of 8 unsigned int elements.  */
      out[i*8] = in[i*8] + 5;
      out[i*8 + 1] = in[i*8 + 1] + 6;
      out[i*8 + 2] = in[i*8 + 2] + 7;
      out[i*8 + 3] = in[i*8 + 3] + 8;
      out[i*8 + 4] = in[i*8 + 4] + 9;
      out[i*8 + 5] = in[i*8 + 5] + 10;
      out[i*8 + 6] = in[i*8 + 6] + 11;
      out[i*8 + 7] = in[i*8 + 7] + 12;

      /* Group of 16 unsigned char elements.  */
      out2[i*16] = in2[i*16] + 2;
      out2[i*16 + 1] = in2[i*16 + 1] + 3;
      out2[i*16 + 2] = in2[i*16 + 2] + 4;
      out2[i*16 + 3] = in2[i*16 + 3] + 3;
      out2[i*16 + 4] = in2[i*16 + 4] + 2;
      out2[i*16 + 5] = in2[i*16 + 5] + 3;
      out2[i*16 + 6] = in2[i*16 + 6] + 2;
      out2[i*16 + 7] = in2[i*16 + 7] + 4;
      out2[i*16 + 8] = in2[i*16 + 8] + 2;
      out2[i*16 + 9] = in2[i*16 + 9] + 5;
      out2[i*16 + 10] = in2[i*16 + 10] + 2;
      out2[i*16 + 11] = in2[i*16 + 11] + 3;
      out2[i*16 + 12] = in2[i*16 + 12] + 4;
      out2[i*16 + 13] = in2[i*16 + 13] + 4;
      out2[i*16 + 14] = in2[i*16 + 14] + 3;
      out2[i*16 + 15] = in2[i*16 + 15] + 2;
    }

  /* check results:  */
  for (i = 0; i < N/2; i++)
    {
      if (out[i*8] != in[i*8] + 5
          || out[i*8 + 1] != in[i*8 + 1] + 6
          || out[i*8 + 2] != in[i*8 + 2] + 7
          || out[i*8 + 3] != in[i*8 + 3] + 8
          || out[i*8 + 4] != in[i*8 + 4] + 9
          || out[i*8 + 5] != in[i*8 + 5] + 10
          || out[i*8 + 6] != in[i*8 + 6] + 11
          || out[i*8 + 7] != in[i*8 + 7] + 12
          || out2[i*16] != in2[i*16] + 2
          || out2[i*16 + 1] != in2[i*16 + 1] + 3
          || out2[i*16 + 2] != in2[i*16 + 2] + 4
          || out2[i*16 + 3] != in2[i*16 + 3] + 3
          || out2[i*16 + 4] != in2[i*16 + 4] + 2
          || out2[i*16 + 5] != in2[i*16 + 5] + 3
          || out2[i*16 + 6] != in2[i*16 + 6] + 2
          || out2[i*16 + 7] != in2[i*16 + 7] + 4
          || out2[i*16 + 8] != in2[i*16 + 8] + 2
          || out2[i*16 + 9] != in2[i*16 + 9] + 5
          || out2[i*16 + 10] != in2[i*16 + 10] + 2
          || out2[i*16 + 11] != in2[i*16 + 11] + 3
          || out2[i*16 + 12] != in2[i*16 + 12] + 4
          || out2[i*16 + 13] != in2[i*16 + 13] + 4
          || out2[i*16 + 14] != in2[i*16 + 14] + 3
          || out2[i*16 + 15] != in2[i*16 + 15] + 2)
        abort ();
    }

  return 0;
}
/* Test entry point: call check_vect () first, then run main1 ().
   The value returned by main1 () is ignored; a failed check inside
   main1 () calls abort () instead.
   NOTE(review): check_vect is not defined in this file; it presumably
   comes from "tree-vect.h" and guards against targets without the
   required vector support -- confirm against that header.  */
int main (void)
{
  check_vect ();

  main1 ();

  return 0;
}
/* { dg-final { scan-tree-dump-times "vectorized 1 loops" 1 "vect" { xfail { sparc*-*-* && ilp32 } } } } */
/* { dg-final { scan-tree-dump-times "vectorizing stmts using SLP" 2 "vect" { xfail { sparc*-*-* && ilp32 } }} } */
/* { dg-final { cleanup-tree-dump "vect" } } */