1 ; RUN: opt %loadPolly %defaultOpts -polly-codegen -enable-polly-vector -dce -S %s | FileCheck %s
2 ; Obtained from C source as:
3 ; clang -S -emit-llvm -O0 vect-strided-a-u32-mult.c
4 ; opt -correlated-propagation -mem2reg -instcombine -loop-simplify -indvars -instnamer vect-strided-a-u32-mult.s > vect-strided-a-u32-mult.ll
6 ; ModuleID = 'vect-strided-a-u32-mult.s'
; Module-level target description: little-endian layout with 64-bit pointers,
; for the x86_64 Linux triple below.
7 target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64"
8 target triple = "x86_64-unknown-linux-gnu"
; Two-field i32 record. @main1 reaches field 0 by bitcasting the element
; pointer to i32* and field 1 through a GEP with a trailing "i32 1" index.
10 %struct.ii = type { i32, i32 }
; main1: self-checking kernel over four 128-element stack arrays.
;   Loop 1 (for.cond / for.body / for.inc)        fills %arr and %iarr.
;   Loop 2 (for.cond13 / for.body17 / for.inc46)  derives %ires and %res from them.
;   Loop 3 (for.cond50 .. for.inc104)             recomputes the expected values and
;                                                 calls @abort on any mismatch.
; Takes no arguments; declared to return i32.
12 define i32 @main1() nounwind uwtable noinline {
; %arr / %res hold i16 elements, %iarr / %ires hold %struct.ii elements.
14 %arr = alloca [128 x i16], align 16
15 %iarr = alloca [128 x %struct.ii], align 16
16 %res = alloca [128 x i16], align 16
17 %ires = alloca [128 x %struct.ii], align 16
; ---- Loop 1 header: %indvar18 counts up from 0; the body runs while it != 128.
; All addresses and values used by the body are computed here in the header.
20 for.cond: ; preds = %for.inc, %entry
21 %indvar18 = phi i64 [ %indvar.next19, %for.inc ], [ 0, %entry ]
; %b = address of field 1 of iarr[i]
22 %b = getelementptr [128 x %struct.ii]* %iarr, i64 0, i64 %indvar18, i32 1
; %mul = (i32)(i * 3)
23 %tmp = mul i64 %indvar18, 3
24 %mul = trunc i64 %tmp to i32
; %a = address of iarr[i] reinterpreted as i32*, i.e. its first field
25 %scevgep23 = getelementptr [128 x %struct.ii]* %iarr, i64 0, i64 %indvar18
26 %a = bitcast %struct.ii* %scevgep23 to i32*
27 %i.0 = trunc i64 %indvar18 to i32
28 %arrayidx = getelementptr [128 x i16]* %arr, i64 0, i64 %indvar18
29 %conv = trunc i64 %indvar18 to i16
30 %exitcond20 = icmp ne i64 %indvar18, 128
31 br i1 %exitcond20, label %for.body, label %for.end
; ---- Loop 1 body: arr[i] = (i16)i; iarr[i].field0 = (i32)i; iarr[i].field1 = (i32)(3*i).
33 for.body: ; preds = %for.cond
34 store i16 %conv, i16* %arrayidx, align 2
35 store i32 %i.0, i32* %a, align 8
36 store i32 %mul, i32* %b, align 4
; Empty inline asm string marked sideeffect, with flag-register clobbers only.
; NOTE(review): presumably carried over from the C source to keep this
; initialization loop from being optimized — confirm against the original test.
37 call void asm sideeffect "", "~{dirflag},~{fpsr},~{flags}"() nounwind, !srcloc !0
40 for.inc: ; preds = %for.body
41 %indvar.next19 = add i64 %indvar18, 1
44 for.end: ; preds = %for.cond
; ---- Loop 2 header: %indvar8 counts up from 0; the body runs while it != 128.
47 for.cond13: ; preds = %for.inc46, %for.end
48 %indvar8 = phi i64 [ %indvar.next9, %for.inc46 ], [ 0, %for.end ]
; Destinations: res[i], ires[i] field 1 (%b37) and ires[i] field 0 (%a27).
49 %arrayidx42 = getelementptr [128 x i16]* %res, i64 0, i64 %indvar8
50 %b37 = getelementptr [128 x %struct.ii]* %ires, i64 0, i64 %indvar8, i32 1
51 %scevgep12 = getelementptr [128 x %struct.ii]* %ires, i64 0, i64 %indvar8
52 %a27 = bitcast %struct.ii* %scevgep12 to i32*
; Sources: iarr[i] field 0 (%a22), iarr[i] field 1 (%b19) and arr[i] (%ptr.0).
53 %scevgep14 = getelementptr [128 x %struct.ii]* %iarr, i64 0, i64 %indvar8
54 %a22 = bitcast %struct.ii* %scevgep14 to i32*
55 %b19 = getelementptr [128 x %struct.ii]* %iarr, i64 0, i64 %indvar8, i32 1
56 %ptr.0 = getelementptr [128 x i16]* %arr, i64 0, i64 %indvar8
57 %exitcond = icmp ne i64 %indvar8, 128
58 br i1 %exitcond, label %for.body17, label %for.end49
; ---- Loop 2 body:
;   ires[i].field0 = iarr[i].field1 - iarr[i].field0
;   ires[i].field1 = iarr[i].field1 + iarr[i].field0
;   res[i]         = arr[i]
; Both fields of iarr[i] are loaded twice, once for the difference and once for the sum.
60 for.body17: ; preds = %for.cond13
61 %tmp20 = load i32* %b19, align 4
62 %tmp23 = load i32* %a22, align 4
63 %sub = sub i32 %tmp20, %tmp23
64 store i32 %sub, i32* %a27, align 8
65 %tmp30 = load i32* %b19, align 4
66 %tmp33 = load i32* %a22, align 4
67 %add = add i32 %tmp30, %tmp33
68 store i32 %add, i32* %b37, align 4
69 %tmp39 = load i16* %ptr.0, align 2
70 store i16 %tmp39, i16* %arrayidx42, align 2
73 for.inc46: ; preds = %for.body17
74 %indvar.next9 = add i64 %indvar8, 1
77 for.end49: ; preds = %for.cond13
; ---- Loop 3 header: unlike loops 1 and 2, the exit test truncates the counter
; to i32 and uses a signed less-than comparison against 128.
80 for.cond50: ; preds = %for.inc104, %for.end49
81 %indvar = phi i64 [ %indvar.next, %for.inc104 ], [ 0, %for.end49 ]
82 %scevgep = getelementptr [128 x %struct.ii]* %iarr, i64 0, i64 %indvar
83 %a80 = bitcast %struct.ii* %scevgep to i32*
84 %b75 = getelementptr [128 x %struct.ii]* %iarr, i64 0, i64 %indvar, i32 1
85 %b89 = getelementptr [128 x %struct.ii]* %ires, i64 0, i64 %indvar, i32 1
86 %scevgep4 = getelementptr [128 x %struct.ii]* %ires, i64 0, i64 %indvar
87 %a70 = bitcast %struct.ii* %scevgep4 to i32*
88 %arrayidx62 = getelementptr [128 x i16]* %arr, i64 0, i64 %indvar
89 %arrayidx57 = getelementptr [128 x i16]* %res, i64 0, i64 %indvar
90 %i.2 = trunc i64 %indvar to i32
91 %cmp52 = icmp slt i32 %i.2, 128
92 br i1 %cmp52, label %for.body54, label %for.end107
; Check 1: res[i] must equal arr[i]; otherwise go to if.then.
94 for.body54: ; preds = %for.cond50
95 %tmp58 = load i16* %arrayidx57, align 2
96 %tmp63 = load i16* %arrayidx62, align 2
97 %cmp65 = icmp eq i16 %tmp58, %tmp63
98 br i1 %cmp65, label %lor.lhs.false, label %if.then
; Check 2: ires[i].field0 must equal iarr[i].field1 - iarr[i].field0.
100 lor.lhs.false: ; preds = %for.body54
101 %tmp71 = load i32* %a70, align 8
102 %tmp76 = load i32* %b75, align 4
103 %tmp81 = load i32* %a80, align 8
104 %sub82 = sub i32 %tmp76, %tmp81
105 %cmp83 = icmp eq i32 %tmp71, %sub82
106 br i1 %cmp83, label %lor.lhs.false85, label %if.then
; Check 3: ires[i].field1 must equal iarr[i].field1 + iarr[i].field0.
108 lor.lhs.false85: ; preds = %lor.lhs.false
109 %tmp90 = load i32* %b89, align 4
110 %tmp95 = load i32* %b75, align 4
111 %tmp100 = load i32* %a80, align 8
112 %add101 = add i32 %tmp95, %tmp100
113 %cmp102 = icmp eq i32 %tmp90, %add101
114 br i1 %cmp102, label %if.end, label %if.then
; Failure path shared by all three checks: call the noreturn @abort.
116 if.then: ; preds = %lor.lhs.false85, %lor.lhs.false, %for.body54
117 call void @abort() noreturn nounwind
120 if.end: ; preds = %lor.lhs.false85
123 for.inc104: ; preds = %if.end
124 %indvar.next = add i64 %indvar, 1
127 for.end107: ; preds = %for.cond50
; External noreturn abort(); @main1 calls it from its if.then block when a check fails.
131 declare void @abort() noreturn
; main: calls @check_vect first, then runs the kernel in @main1 and captures
; its i32 result in %call.
133 define i32 @main() nounwind uwtable {
135 call void @check_vect()
136 %call = call i32 @main1()
; check_vect: CPU capability gate. Calls exit(0) when @__get_cpuid reports
; failure for leaf 1 or when the tested feature bit is clear.
140 define internal void @check_vect() nounwind uwtable noinline {
; Out-slots for the four values written by @__get_cpuid.
142 %a = alloca i32, align 4
143 %b = alloca i32, align 4
144 %c = alloca i32, align 4
145 %d = alloca i32, align 4
; Install @sig_ill_handler for signal number 4.
; NOTE(review): 4 is presumably SIGILL on this target, as the handler name suggests — confirm.
146 %call = call void (i32)* (i32, void (i32)*)* @signal(i32 4, void (i32)* @sig_ill_handler) nounwind
; Query leaf 1; a zero result goes straight to the exit path.
147 %call1 = call i32 @__get_cpuid(i32 1, i32* %a, i32* %b, i32* %c, i32* %d)
148 %tobool = icmp eq i32 %call1, 0
149 br i1 %tobool, label %if.then, label %lor.lhs.false
; Test bit 26 (67108864 == 1 << 26) of the value stored in %d, the fourth out-slot.
; NOTE(review): presumably the SSE2 feature flag in EDX of CPUID leaf 1 — confirm.
151 lor.lhs.false: ; preds = %entry
152 %tmp4 = load i32* %d, align 4
153 %and6 = and i32 %tmp4, 67108864
154 %cmp = icmp eq i32 %and6, 0
155 br i1 %cmp, label %if.then, label %if.end
; Query failed or feature bit clear: call exit with status 0.
157 if.then: ; preds = %entry, %lor.lhs.false
158 call void @exit(i32 0) noreturn nounwind
; Feature bit set: call signal again for signal 4, this time with a null handler pointer.
161 if.end: ; preds = %lor.lhs.false
162 %call7 = call void (i32)* (i32, void (i32)*)* @signal(i32 4, void (i32)* null) nounwind
; External signal(): takes a signal number and a handler pointer and returns a handler pointer.
; @check_vect uses it to install a handler for signal 4 and later pass null for it.
166 declare void (i32)* @signal(i32, void (i32)*) nounwind
; sig_ill_handler: signal handler registered by @check_vect. It ignores %sig
; and calls exit with status 0.
168 define internal void @sig_ill_handler(i32 %sig) nounwind uwtable {
170 call void @exit(i32 0) noreturn nounwind
; Block with no incoming edges (see the annotation on the label).
173 return: ; No predecessors!
; __get_cpuid: executes the cpuid instruction for leaf %__level and writes the
; four results through %__eax, %__ebx, %__ecx and %__edx.
; Result value (%retval.0): 0 when the highest supported leaf is below %__level
; (nothing is stored in that case), 1 after the four stores.
177 define internal i32 @__get_cpuid(i32 %__level, i32* %__eax, i32* %__ebx, i32* %__ecx, i32* %__edx) nounwind uwtable inlinehint {
; Keep only the top bit of the leaf number (-2147483648 == 0x80000000) and pass
; it to @__get_cpuid_max with a null %__sig pointer.
179 %and = and i32 %__level, -2147483648
180 %call = call i32 @__get_cpuid_max(i32 %and, i32* null)
; Unsigned compare: take if.then when the reported maximum is below the requested leaf.
181 %cmp = icmp ult i32 %call, %__level
182 br i1 %cmp, label %if.then, label %if.end
184 if.then: ; preds = %entry
; Supported leaf: run cpuid. The "0" constraint ties the %__level input to the
; first output ({ax}); the four struct members map to ax, bx, cx, dx in order.
187 if.end: ; preds = %entry
188 %tmp = call { i32, i32, i32, i32 } asm "cpuid\0A\09", "={ax},={bx},={cx},={dx},0,~{dirflag},~{fpsr},~{flags}"(i32 %__level) nounwind, !srcloc !1
189 %asmresult = extractvalue { i32, i32, i32, i32 } %tmp, 0
190 %asmresult8 = extractvalue { i32, i32, i32, i32 } %tmp, 1
191 %asmresult9 = extractvalue { i32, i32, i32, i32 } %tmp, 2
192 %asmresult10 = extractvalue { i32, i32, i32, i32 } %tmp, 3
193 store i32 %asmresult, i32* %__eax, align 4
194 store i32 %asmresult8, i32* %__ebx, align 4
195 store i32 %asmresult9, i32* %__ecx, align 4
196 store i32 %asmresult10, i32* %__edx, align 4
; Merge point: 0 arriving from if.then, 1 arriving from if.end.
199 return: ; preds = %if.end, %if.then
200 %retval.0 = phi i32 [ 0, %if.then ], [ 1, %if.end ]
; External noreturn exit(); called with status 0 by @check_vect and @sig_ill_handler.
204 declare void @exit(i32) noreturn
; __get_cpuid_max: executes cpuid with %__ext as the input leaf and extracts
; the first ({ax}) result as %asmresult. When %__sig is non-null, the second
; ({bx}) result is also stored through it.
206 define internal i32 @__get_cpuid_max(i32 %__ext, i32* %__sig) nounwind uwtable inlinehint {
; The "0" constraint ties the %__ext input to the first output ({ax}).
208 %tmp = call { i32, i32, i32, i32 } asm "cpuid\0A\09", "={ax},={bx},={cx},={dx},0,~{dirflag},~{fpsr},~{flags}"(i32 %__ext) nounwind, !srcloc !2
209 %asmresult = extractvalue { i32, i32, i32, i32 } %tmp, 0
; Skip the optional store when the caller passed a null %__sig.
210 %tobool = icmp eq i32* %__sig, null
211 br i1 %tobool, label %if.end, label %if.then
213 if.then: ; preds = %entry
214 %asmresult1 = extractvalue { i32, i32, i32, i32 } %tmp, 1
215 store i32 %asmresult1, i32* %__sig, align 4
218 if.end: ; preds = %entry, %if.then
; Metadata nodes referenced as !srcloc by the inline asm calls:
; !0 by the empty asm in @main1, !1 by cpuid in @__get_cpuid, !2 by cpuid in @__get_cpuid_max.
222 !0 = metadata !{i32 469}
223 !1 = metadata !{i32 -2147343238, i32 -2147343230}
224 !2 = metadata !{i32 -2147343361, i32 -2147343353}