1 ; RUN: opt %loadPolly %defaultOpts -polly-codegen -enable-polly-vector -dce -S %s | FileCheck %s
2 ; Obtained from C source as:
3 ; clang -S -emit-llvm -O0 slp-9.c
4 ; opt -correlated-propagation -mem2reg -instcombine -loop-simplify -indvars -instnamer slp-9.s > slp-9.ll
7 target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64"
8 target triple = "x86_64-unknown-linux-gnu"
; Global data shared by @foo1 and @main: X and Y are 64-element i16 arrays,
; result is a 64-element i32 array. All three are zero-initialized and
; 16-byte aligned.
10 @X = common global [64 x i16] zeroinitializer, align 16
11 @Y = common global [64 x i16] zeroinitializer, align 16
12 @result = common global [64 x i32] zeroinitializer, align 16
; foo1(%len): loop kernel over the globals X, Y and result.
; For each counter value i, starting at 0 and stepping by 1 while
; i < %len / 2 (signed compare), the body handles two adjacent elements:
;   result[2*i]   = sext(X[2*i])   * sext(Y[2*i])
;   result[2*i+1] = sext(X[2*i+1]) * sext(Y[2*i+1])
; The i16 inputs are sign-extended to i32 before the multiply.
14 define i32 @foo1(i32 %len) nounwind uwtable {
; Loop header: %tmp is the iteration counter i; %mul = 2*i and %add1 = 2*i+1
; are the even/odd element indices used in the body.
18 for.cond: ; preds = %for.inc, %entry
19 %tmp = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
20 %mul = mul i32 %tmp, 2
21 %add1 = add i32 %mul, 1
; The trip bound %len / 2 is recomputed in the header on every iteration.
22 %div = sdiv i32 %len, 2
23 %cmp = icmp slt i32 %tmp, %div
24 br i1 %cmp, label %for.body, label %for.end
26 for.body: ; preds = %for.cond
; Even element: load X[2*i] and Y[2*i], widen to i32, multiply, store to
; result[2*i].
27 %idxprom = sext i32 %mul to i64
28 %arrayidx = getelementptr inbounds [64 x i16]* @X, i64 0, i64 %idxprom
29 %tmp3 = load i16* %arrayidx, align 4
30 %conv = sext i16 %tmp3 to i32
31 %idxprom6 = sext i32 %mul to i64
32 %arrayidx7 = getelementptr inbounds [64 x i16]* @Y, i64 0, i64 %idxprom6
33 %tmp8 = load i16* %arrayidx7, align 4
34 %conv9 = sext i16 %tmp8 to i32
35 %mul10 = mul nsw i32 %conv, %conv9
36 %idxprom13 = sext i32 %mul to i64
37 %arrayidx14 = getelementptr inbounds [64 x i32]* @result, i64 0, i64 %idxprom13
38 store i32 %mul10, i32* %arrayidx14, align 8
; Odd element: same computation at index 2*i+1; note the smaller alignments
; (2 for the i16 loads, 4 for the i32 store) compared to the even element.
39 %idxprom17 = sext i32 %add1 to i64
40 %arrayidx18 = getelementptr inbounds [64 x i16]* @X, i64 0, i64 %idxprom17
41 %tmp19 = load i16* %arrayidx18, align 2
42 %conv20 = sext i16 %tmp19 to i32
43 %idxprom24 = sext i32 %add1 to i64
44 %arrayidx25 = getelementptr inbounds [64 x i16]* @Y, i64 0, i64 %idxprom24
45 %tmp26 = load i16* %arrayidx25, align 2
46 %conv27 = sext i16 %tmp26 to i32
47 %mul28 = mul nsw i32 %conv20, %conv27
48 %idxprom32 = sext i32 %add1 to i64
49 %arrayidx33 = getelementptr inbounds [64 x i32]* @result, i64 0, i64 %idxprom32
50 store i32 %mul28, i32* %arrayidx33, align 4
; Loop latch: advance the iteration counter by one.
53 for.inc: ; preds = %for.body
54 %inc = add nsw i32 %tmp, 1
57 for.end: ; preds = %for.cond
; main: test driver.
;   1. Calls @check_vect.
;   2. Initialization loop: for i = 0 .. 63 stores X[i] = trunc(i) and
;      Y[i] = trunc(64 - i), both as i16.
;   3. Calls @foo1(64).
;   4. Verification loop: for each i with trunc(i) < 64, compares result[i]
;      against sext(X[i]) * sext(Y[i]) and calls @abort on a mismatch.
61 define i32 @main() nounwind uwtable {
63 call void @check_vect()
; Initialization loop header: addresses and the values to store are computed
; here, before the exit test; the stores themselves happen in for.body.
66 for.cond: ; preds = %for.inc, %entry
67 %indvar1 = phi i64 [ %indvar.next2, %for.inc ], [ 0, %entry ]
68 %arrayidx7 = getelementptr [64 x i16]* @Y, i64 0, i64 %indvar1
; %tmp3 = 64 - i, truncated to i16 as the value for Y[i].
69 %tmp = mul i64 %indvar1, -1
70 %tmp3 = add i64 %tmp, 64
71 %conv4 = trunc i64 %tmp3 to i16
72 %arrayidx = getelementptr [64 x i16]* @X, i64 0, i64 %indvar1
; %conv = i truncated to i16, the value for X[i].
73 %conv = trunc i64 %indvar1 to i16
; Loop continues while i != 64.
74 %exitcond = icmp ne i64 %indvar1, 64
75 br i1 %exitcond, label %for.body, label %for.end
77 for.body: ; preds = %for.cond
78 store i16 %conv, i16* %arrayidx, align 2
79 store i16 %conv4, i16* %arrayidx7, align 2
; Empty inline asm marked sideeffect; presumably present to keep this
; initialization loop from being optimized/vectorized - TODO confirm.
80 call void asm sideeffect "", "~{dirflag},~{fpsr},~{flags}"() nounwind, !srcloc !0
83 for.inc: ; preds = %for.body
84 %indvar.next2 = add i64 %indvar1, 1
; Run the kernel under test with %len = 64; the returned value %call is not
; used by any instruction visible in this function.
87 for.end: ; preds = %for.cond
88 %call = call i32 @foo1(i32 64)
; Verification loop header: element addresses for index %indvar are formed
; here; the exit test is a signed compare on the i32 truncation of %indvar.
91 for.cond9: ; preds = %for.inc30, %for.end
92 %indvar = phi i64 [ %indvar.next, %for.inc30 ], [ 0, %for.end ]
93 %arrayidx25 = getelementptr [64 x i16]* @Y, i64 0, i64 %indvar
94 %arrayidx20 = getelementptr [64 x i16]* @X, i64 0, i64 %indvar
95 %arrayidx16 = getelementptr [64 x i32]* @result, i64 0, i64 %indvar
96 %i.1 = trunc i64 %indvar to i32
97 %cmp11 = icmp slt i32 %i.1, 64
98 br i1 %cmp11, label %for.body13, label %for.end33
; Recompute the expected product from X[i] and Y[i] and compare it with the
; value stored in result[i].
100 for.body13: ; preds = %for.cond9
101 %tmp17 = load i32* %arrayidx16, align 4
102 %tmp21 = load i16* %arrayidx20, align 2
103 %conv22 = sext i16 %tmp21 to i32
104 %tmp26 = load i16* %arrayidx25, align 2
105 %conv27 = sext i16 %tmp26 to i32
106 %mul = mul nsw i32 %conv22, %conv27
107 %cmp28 = icmp eq i32 %tmp17, %mul
108 br i1 %cmp28, label %if.end, label %if.then
; Mismatch path: terminate via @abort (declared noreturn).
110 if.then: ; preds = %for.body13
111 call void @abort() noreturn nounwind
114 if.end: ; preds = %for.body13
117 for.inc30: ; preds = %if.end
118 %indvar.next = add i64 %indvar, 1
121 for.end33: ; preds = %for.cond9
; check_vect: CPU capability guard executed at the start of @main.
; Installs @sig_ill_handler for signal number 4, queries CPUID level 1 via
; @__get_cpuid, and calls exit(0) if the query reports failure (returns 0) or
; if bit 26 (mask 67108864) of the value written to %d is clear. Otherwise it
; calls signal(4, null) to replace the handler installed above.
125 define internal void @check_vect() nounwind uwtable noinline {
; Stack slots receiving the four CPUID output values.
127 %a = alloca i32, align 4
128 %b = alloca i32, align 4
129 %c = alloca i32, align 4
130 %d = alloca i32, align 4
; Signal 4 is presumably SIGILL (matches the handler's name) - TODO confirm
; for the target platform.
131 %call = call void (i32)* (i32, void (i32)*)* @signal(i32 4, void (i32)* @sig_ill_handler) nounwind
132 %call1 = call i32 @__get_cpuid(i32 1, i32* %a, i32* %b, i32* %c, i32* %d)
; A zero result from @__get_cpuid takes the exit path.
133 %tobool = icmp eq i32 %call1, 0
134 br i1 %tobool, label %if.then, label %lor.lhs.false
136 lor.lhs.false: ; preds = %entry
; %d is the slot passed as @__get_cpuid's %__edx argument. 67108864 == 1 << 26;
; presumably the SSE2 feature flag of CPUID leaf 1 - TODO confirm.
137 %tmp4 = load i32* %d, align 4
138 %and6 = and i32 %tmp4, 67108864
139 %cmp = icmp eq i32 %and6, 0
140 br i1 %cmp, label %if.then, label %if.end
; Required capability missing or query failed: exit with status 0.
142 if.then: ; preds = %entry, %lor.lhs.false
143 call void @exit(i32 0) noreturn nounwind
; Capability present: call signal(4, null) in place of the earlier handler.
146 if.end: ; preds = %lor.lhs.false
147 %call7 = call void (i32)* (i32, void (i32)*)* @signal(i32 4, void (i32)* null) nounwind
; External functions: @abort is called by @main when a result mismatches;
; @signal is called by @check_vect to install and later replace a handler.
151 declare void @abort() noreturn
153 declare void (i32)* @signal(i32, void (i32)*) nounwind
; sig_ill_handler(%sig): signal handler registered by @check_vect for signal
; number 4. It ignores %sig and calls exit(0).
155 define internal void @sig_ill_handler(i32 %sig) nounwind uwtable {
157 call void @exit(i32 0) noreturn nounwind
; Block with no predecessors, left after the noreturn call above.
160 return: ; No predecessors!
; __get_cpuid(%__level, %__eax, %__ebx, %__ecx, %__edx):
; Queries the maximum CPUID level for the range selected by the top bit of
; %__level (via @__get_cpuid_max). If that maximum is below %__level
; (unsigned compare), nothing is written and %retval.0 is 0. Otherwise the
; cpuid instruction is executed with %__level as input, the ax/bx/cx/dx
; results are stored through the four pointer arguments, and %retval.0 is 1.
; %retval.0 is presumably the function's return value (the ret instruction is
; not visible here) - TODO confirm.
164 define internal i32 @__get_cpuid(i32 %__level, i32* %__eax, i32* %__ebx, i32* %__ecx, i32* %__edx) nounwind uwtable inlinehint {
; -2147483648 == 0x80000000: keep only the top bit of the requested level.
166 %and = and i32 %__level, -2147483648
; Null signature pointer: the bx output of the max-level query is not stored.
167 %call = call i32 @__get_cpuid_max(i32 %and, i32* null)
168 %cmp = icmp ult i32 %call, %__level
169 br i1 %cmp, label %if.then, label %if.end
; Requested level exceeds the reported maximum: contributes 0 to %retval.0.
171 if.then: ; preds = %entry
174 if.end: ; preds = %entry
; The "0" constraint ties the input %__level to the first output (ax).
175 %tmp = call { i32, i32, i32, i32 } asm "cpuid\0A\09", "={ax},={bx},={cx},={dx},0,~{dirflag},~{fpsr},~{flags}"(i32 %__level) nounwind, !srcloc !1
176 %asmresult = extractvalue { i32, i32, i32, i32 } %tmp, 0
177 %asmresult8 = extractvalue { i32, i32, i32, i32 } %tmp, 1
178 %asmresult9 = extractvalue { i32, i32, i32, i32 } %tmp, 2
179 %asmresult10 = extractvalue { i32, i32, i32, i32 } %tmp, 3
; Write the four register values to the caller-provided locations.
180 store i32 %asmresult, i32* %__eax, align 4
181 store i32 %asmresult8, i32* %__ebx, align 4
182 store i32 %asmresult9, i32* %__ecx, align 4
183 store i32 %asmresult10, i32* %__edx, align 4
; Merge point: 0 from the unsupported path, 1 after a successful query.
186 return: ; preds = %if.end, %if.then
187 %retval.0 = phi i32 [ 0, %if.then ], [ 1, %if.end ]
; External @exit, called with status 0 by @check_vect and @sig_ill_handler.
191 declare void @exit(i32) noreturn
; __get_cpuid_max(%__ext, %__sig):
; Executes the cpuid instruction with %__ext as input and extracts the ax
; result (%asmresult). If %__sig is non-null, the bx result is additionally
; stored through it. %asmresult is presumably the returned value (the ret
; instruction is not visible here) - TODO confirm.
193 define internal i32 @__get_cpuid_max(i32 %__ext, i32* %__sig) nounwind uwtable inlinehint {
; The "0" constraint ties the input %__ext to the first output (ax).
195 %tmp = call { i32, i32, i32, i32 } asm "cpuid\0A\09", "={ax},={bx},={cx},={dx},0,~{dirflag},~{fpsr},~{flags}"(i32 %__ext) nounwind, !srcloc !2
196 %asmresult = extractvalue { i32, i32, i32, i32 } %tmp, 0
; Skip the signature store when the caller passed a null pointer.
197 %tobool = icmp eq i32* %__sig, null
198 br i1 %tobool, label %if.end, label %if.then
200 if.then: ; preds = %entry
201 %asmresult1 = extractvalue { i32, i32, i32, i32 } %tmp, 1
202 store i32 %asmresult1, i32* %__sig, align 4
205 if.end: ; preds = %entry, %if.then
; Metadata nodes referenced through !srcloc on the inline asm calls:
; !0 by the empty asm in @main, !1 by the cpuid asm in @__get_cpuid,
; !2 by the cpuid asm in @__get_cpuid_max.
209 !0 = metadata !{i32 549}
210 !1 = metadata !{i32 -2147343379, i32 -2147343371}
211 !2 = metadata !{i32 -2147343502, i32 -2147343494}