1 ; RUN: opt %loadPolly %defaultOpts -polly-codegen -enable-polly-vector -dce -S %s | FileCheck %s
2 ; Obtained from C source as:
3 ; clang -S -emit-llvm -O0 slp-widen-mult-u8.c
4 ; opt -correlated-propagation -mem2reg -instcombine -loop-simplify -indvars -instnamer slp-widen-mult-u8.s > slp-widen-mult-u8.ll
6 ; ModuleID = 'slp-widen-mult-u8.s'
7 target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64"
8 target triple = "x86_64-unknown-linux-gnu"
; Test data. @X holds the byte values 0, 1, ..., 63 and @Y holds 64, 63, ..., 1
; (both written as 64-byte string constants). @result is a zero-initialized
; array of 64 i16 elements that @foo1 stores into and @main reads back.
10 @X = global [64 x i8] c"\00\01\02\03\04\05\06\07\08\09\0A\0B\0C\0D\0E\0F\10\11\12\13\14\15\16\17\18\19\1A\1B\1C\1D\1E\1F !\22#$%&'()*+,-./0123456789:;<=>?", align 16
11 @Y = global [64 x i8] c"@?>=<;:9876543210/.-,+*)('&%$#\22! \1F\1E\1D\1C\1B\1A\19\18\17\16\15\14\13\12\11\10\0F\0E\0D\0C\0B\0A\09\08\07\06\05\04\03\02\01", align 16
12 @result = common global [64 x i16] zeroinitializer, align 16
; foo1(len): widening multiply kernel.
; For every i with 0 <= i < len/2 (signed division, signed compare) the loop
; body handles two consecutive elements:
;   result[2*i]   = zext(X[2*i])   * zext(Y[2*i])
;   result[2*i+1] = zext(X[2*i+1]) * zext(Y[2*i+1])
; The i8 inputs are zero-extended to i16 before the i16 multiply.
14 define i32 @foo1(i32 %len) nounwind uwtable noinline {
18 for.cond: ; preds = %for.inc, %entry
; %tmp is the loop counter i: 0 on entry, %inc (i + 1) from the latch.
19 %tmp = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
; %mul = 2*i (even element index), %add1 = 2*i + 1 (odd element index).
20 %mul = mul i32 %tmp, 2
21 %add1 = add i32 %mul, 1
; The trip bound len/2 is computed in the loop header on every iteration.
22 %div = sdiv i32 %len, 2
23 %cmp = icmp slt i32 %tmp, %div
24 br i1 %cmp, label %for.body, label %for.end
26 for.body: ; preds = %for.cond
; Even element: load X[2*i] and Y[2*i], widen both to i16, multiply,
; and store the product to result[2*i].
27 %idxprom = sext i32 %mul to i64
28 %arrayidx = getelementptr inbounds [64 x i8]* @X, i64 0, i64 %idxprom
29 %tmp3 = load i8* %arrayidx, align 2
30 %conv = zext i8 %tmp3 to i16
31 %idxprom6 = sext i32 %mul to i64
32 %arrayidx7 = getelementptr inbounds [64 x i8]* @Y, i64 0, i64 %idxprom6
33 %tmp8 = load i8* %arrayidx7, align 2
34 %conv9 = zext i8 %tmp8 to i16
35 %mul10 = mul i16 %conv, %conv9
36 %idxprom14 = sext i32 %mul to i64
37 %arrayidx15 = getelementptr inbounds [64 x i16]* @result, i64 0, i64 %idxprom14
38 store i16 %mul10, i16* %arrayidx15, align 4
; Odd element: the same load / widen / multiply / store sequence at index 2*i + 1.
39 %idxprom18 = sext i32 %add1 to i64
40 %arrayidx19 = getelementptr inbounds [64 x i8]* @X, i64 0, i64 %idxprom18
41 %tmp20 = load i8* %arrayidx19, align 1
42 %conv21 = zext i8 %tmp20 to i16
43 %idxprom25 = sext i32 %add1 to i64
44 %arrayidx26 = getelementptr inbounds [64 x i8]* @Y, i64 0, i64 %idxprom25
45 %tmp27 = load i8* %arrayidx26, align 1
46 %conv28 = zext i8 %tmp27 to i16
47 %mul29 = mul i16 %conv21, %conv28
48 %idxprom34 = sext i32 %add1 to i64
49 %arrayidx35 = getelementptr inbounds [64 x i16]* @result, i64 0, i64 %idxprom34
50 store i16 %mul29, i16* %arrayidx35, align 2
53 for.inc: ; preds = %for.body
; Loop latch: advance the counter by one (marked nsw: no signed wrap).
54 %inc = add nsw i32 %tmp, 1
57 for.end: ; preds = %for.cond
; main: test driver.
; Calls @check_vect, runs @foo1 with len = 64, then walks i = 0 .. 63 and
; verifies result[i] == X[i] * Y[i] (operands zero-extended to i32).
; A mismatch branches to if.then, which calls @abort.
61 define i32 @main() nounwind uwtable {
63 call void @check_vect()
64 %call = call i32 @foo1(i32 64)
67 for.cond: ; preds = %for.inc, %entry
; %indvar is a 64-bit induction variable starting at 0; the three element
; addresses for this iteration are formed up front in the loop header.
68 %indvar = phi i64 [ %indvar.next, %for.inc ], [ 0, %entry ]
69 %arrayidx10 = getelementptr [64 x i8]* @Y, i64 0, i64 %indvar
70 %arrayidx5 = getelementptr [64 x i8]* @X, i64 0, i64 %indvar
71 %arrayidx = getelementptr [64 x i16]* @result, i64 0, i64 %indvar
; The exit test is done on the induction variable truncated to i32: i < 64.
72 %i.0 = trunc i64 %indvar to i32
73 %cmp = icmp slt i32 %i.0, 64
74 br i1 %cmp, label %for.body, label %for.end
76 for.body: ; preds = %for.cond
; Recompute the expected product in i32 and compare it with the stored value.
77 %tmp2 = load i16* %arrayidx, align 2
78 %conv = zext i16 %tmp2 to i32
79 %tmp6 = load i8* %arrayidx5, align 1
80 %conv7 = zext i8 %tmp6 to i32
81 %tmp11 = load i8* %arrayidx10, align 1
82 %conv12 = zext i8 %tmp11 to i32
83 %mul = mul nsw i32 %conv7, %conv12
84 %cmp13 = icmp eq i32 %conv, %mul
85 br i1 %cmp13, label %if.end, label %if.then
87 if.then: ; preds = %for.body
; Mismatch path: terminate via abort().
88 call void @abort() noreturn nounwind
91 if.end: ; preds = %for.body
94 for.inc: ; preds = %if.end
95 %indvar.next = add i64 %indvar, 1
98 for.end: ; preds = %for.cond
; check_vect: runtime guard executed before the kernel.
; Installs @sig_ill_handler for signal number 4, queries CPUID leaf 1 through
; @__get_cpuid, and calls exit(0) if the query reports failure (returns 0) or
; if bit 26 of the value written to %d (the EDX output) is clear. Otherwise it
; calls signal(4, null) again before finishing.
; NOTE(review): signal 4 is SIGILL on Linux and CPUID.1:EDX bit 26 is the SSE2
; feature flag on x86 -- confirm that this is the intended check.
102 define internal void @check_vect() nounwind uwtable noinline {
; Stack slots that receive the four CPUID output registers.
104 %a = alloca i32, align 4
105 %b = alloca i32, align 4
106 %c = alloca i32, align 4
107 %d = alloca i32, align 4
108 %call = call void (i32)* (i32, void (i32)*)* @signal(i32 4, void (i32)* @sig_ill_handler) nounwind
109 %call1 = call i32 @__get_cpuid(i32 1, i32* %a, i32* %b, i32* %c, i32* %d)
; A zero return from __get_cpuid means the requested leaf was not available.
110 %tobool = icmp eq i32 %call1, 0
111 br i1 %tobool, label %if.then, label %lor.lhs.false
113 lor.lhs.false: ; preds = %entry
; 67108864 == 0x04000000 == 1 << 26: test a single feature bit of %d.
114 %tmp4 = load i32* %d, align 4
115 %and6 = and i32 %tmp4, 67108864
116 %cmp = icmp eq i32 %and6, 0
117 br i1 %cmp, label %if.then, label %if.end
119 if.then: ; preds = %entry, %lor.lhs.false
; Requirement not met: exit with status 0 rather than running the test.
120 call void @exit(i32 0) noreturn nounwind
123 if.end: ; preds = %lor.lhs.false
; Replace the handler for signal 4 with a null handler pointer.
124 %call7 = call void (i32)* (i32, void (i32)*)* @signal(i32 4, void (i32)* null) nounwind
; External declarations: @abort is called by @main on a result mismatch;
; @signal is called by @check_vect and takes a signal number and a handler
; pointer, returning a handler pointer.
128 declare void @abort() noreturn
130 declare void (i32)* @signal(i32, void (i32)*) nounwind
; sig_ill_handler(sig): handler that @check_vect registers for signal 4.
; It ignores %sig and calls exit(0).
132 define internal void @sig_ill_handler(i32 %sig) nounwind uwtable {
134 call void @exit(i32 0) noreturn nounwind
; Block with no predecessors, as its own annotation states.
137 return: ; No predecessors!
; __get_cpuid(level, eax, ebx, ecx, edx): guarded CPUID query.
; Asks @__get_cpuid_max for the highest leaf available in the range selected
; by the top bit of %__level. If that maximum is below %__level (unsigned
; compare) the if.then path is taken and %retval.0 is 0. Otherwise the cpuid
; instruction is executed with %__level as input, its four outputs are stored
; through the four pointer arguments, and %retval.0 is 1.
141 define internal i32 @__get_cpuid(i32 %__level, i32* %__eax, i32* %__ebx, i32* %__ecx, i32* %__edx) nounwind uwtable inlinehint {
; -2147483648 == 0x80000000: keep only the top bit of the requested level.
143 %and = and i32 %__level, -2147483648
144 %call = call i32 @__get_cpuid_max(i32 %and, i32* null)
145 %cmp = icmp ult i32 %call, %__level
146 br i1 %cmp, label %if.then, label %if.end
148 if.then: ; preds = %entry
151 if.end: ; preds = %entry
; Inline asm: outputs are ax, bx, cx, dx; the "0" constraint ties the input
; operand (%__level) to output 0, i.e. the ax register.
152 %tmp = call { i32, i32, i32, i32 } asm "cpuid\0A\09", "={ax},={bx},={cx},={dx},0,~{dirflag},~{fpsr},~{flags}"(i32 %__level) nounwind, !srcloc !0
153 %asmresult = extractvalue { i32, i32, i32, i32 } %tmp, 0
154 %asmresult8 = extractvalue { i32, i32, i32, i32 } %tmp, 1
155 %asmresult9 = extractvalue { i32, i32, i32, i32 } %tmp, 2
156 %asmresult10 = extractvalue { i32, i32, i32, i32 } %tmp, 3
157 store i32 %asmresult, i32* %__eax, align 4
158 store i32 %asmresult8, i32* %__ebx, align 4
159 store i32 %asmresult9, i32* %__ecx, align 4
160 store i32 %asmresult10, i32* %__edx, align 4
163 return: ; preds = %if.end, %if.then
; Status value: 0 when the leaf was unavailable, 1 after a successful query.
164 %retval.0 = phi i32 [ 0, %if.then ], [ 1, %if.end ]
; External declaration: @exit is called with status 0 by @check_vect and
; @sig_ill_handler.
168 declare void @exit(i32) noreturn
; __get_cpuid_max(ext, sig): executes cpuid with %__ext as input.
; Output 0 (the ax register) is extracted as %asmresult. When %__sig is
; non-null, output 1 (the bx register) is stored through it.
; NOTE(review): %asmresult is presumably the return value (the highest
; supported leaf); no return instruction appears in this listing -- confirm.
170 define internal i32 @__get_cpuid_max(i32 %__ext, i32* %__sig) nounwind uwtable inlinehint {
172 %tmp = call { i32, i32, i32, i32 } asm "cpuid\0A\09", "={ax},={bx},={cx},={dx},0,~{dirflag},~{fpsr},~{flags}"(i32 %__ext) nounwind, !srcloc !1
173 %asmresult = extractvalue { i32, i32, i32, i32 } %tmp, 0
; Skip the optional store when the caller passed a null %__sig.
174 %tobool = icmp eq i32* %__sig, null
175 br i1 %tobool, label %if.end, label %if.then
177 if.then: ; preds = %entry
178 %asmresult1 = extractvalue { i32, i32, i32, i32 } %tmp, 1
179 store i32 %asmresult1, i32* %__sig, align 4
182 if.end: ; preds = %entry, %if.then
; Metadata nodes attached as !srcloc to the two inline-asm cpuid calls:
; !0 is used in @__get_cpuid and !1 in @__get_cpuid_max.
186 !0 = metadata !{i32 -2147342998, i32 -2147342990}
187 !1 = metadata !{i32 -2147343121, i32 -2147343113}