1 ; RUN: opt %loadPolly %defaultOpts -polly-codegen -enable-polly-vector -dce -S %s | FileCheck %s
2 ; Obtained from C source as:
3 ; clang -S -emit-llvm -O0 vect-nest-cycle-1.c
4 ; opt -correlated-propagation -mem2reg -instcombine -loop-simplify -indvars -instnamer vect-nest-cycle-1.s > vect-nest-cycle-1.ll
6 ; ModuleID = 'vect-nest-cycle-1.s'
; Target description for the module: the data layout string starts with "e"
; (little-endian) and "p:64:64:64" (64-bit pointers); the triple selects
; x86_64 Linux.
7 target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64"
8 target triple = "x86_64-unknown-linux-gnu"
; Test data used by @foo.
; @in: 16 input floats; @foo loads in[i] as the starting value for out[i].
10 @in = global [16 x float] [float 2.320000e+02, float 1.320000e+02, float 3.200000e+01, float 4.320000e+02, float 5.320000e+02, float 3.210000e+02, float 3.270000e+02, float 3.230000e+02, float 3.210000e+02, float 3.240000e+02, float 3.220000e+02, float 3.290000e+02, float 4.320000e+02, float 8.320000e+02, float 9.320000e+02, float 2.320000e+02], align 16
; @check_res: 16 expected results that @foo compares against @out.
; Each entry equals in[i] minus the sum of a[i] .. a[i+15]
; (e.g. 232 - (0 + 1 + ... + 15) = 112 for i = 0).
11 @check_res = global [16 x float] [float 1.120000e+02, float -4.000000e+00, float -1.200000e+02, float 2.640000e+02, float 3.480000e+02, float 1.210000e+02, float 1.110000e+02, float 9.100000e+01, float 7.300000e+01, float 6.000000e+01, float 4.200000e+01, float 3.300000e+01, float 1.200000e+02, float 5.040000e+02, float 5.880000e+02, float -1.280000e+02], align 16
; @a: 32 floats holding 0.0 .. 31.0; @foo indexes it with i + j.
12 @a = global [32 x float] [float 0.000000e+00, float 1.000000e+00, float 2.000000e+00, float 3.000000e+00, float 4.000000e+00, float 5.000000e+00, float 6.000000e+00, float 7.000000e+00, float 8.000000e+00, float 9.000000e+00, float 1.000000e+01, float 1.100000e+01, float 1.200000e+01, float 1.300000e+01, float 1.400000e+01, float 1.500000e+01, float 1.600000e+01, float 1.700000e+01, float 1.800000e+01, float 1.900000e+01, float 2.000000e+01, float 2.100000e+01, float 2.200000e+01, float 2.300000e+01, float 2.400000e+01, float 2.500000e+01, float 2.600000e+01, float 2.700000e+01, float 2.800000e+01, float 2.900000e+01, float 3.000000e+01, float 3.100000e+01], align 16
; @out: zero-initialized 16-float result buffer; written by @foo's first loop
; nest and read back by its checking loop.
13 @out = common global [16 x float] zeroinitializer, align 16
; @foo: for each i in [0, 16), starts from in[i], subtracts a[i + j] for every
; j in [0, 16), and stores the result to out[i]. A second loop then compares
; out[] with check_res[] element by element and calls @abort on a mismatch.
; NOTE(review): in this listing several basic blocks show no terminator and the
; function has no visible `entry:` label or closing brace; the control-flow
; edges described below are taken from the phi operands and `preds` notes.
15 define void @foo() nounwind uwtable noinline {
; Outer loop header. %indvar3 is the outer index i: 0 on entry, then
; %indvar.next4 from the latch %for.inc18.
19 for.cond: ; preds = %for.inc18, %entry
20 %indvar3 = phi i64 [ %indvar.next4, %for.inc18 ], [ 0, %entry ]
; Addresses of out[i] and in[i].
21 %arrayidx17 = getelementptr [16 x float]* @out, i64 0, i64 %indvar3
22 %arrayidx = getelementptr [16 x float]* @in, i64 0, i64 %indvar3
; Stay in the loop while i != 16; otherwise go on to the checking loop.
23 %exitcond6 = icmp ne i64 %indvar3, 16
24 br i1 %exitcond6, label %for.body, label %for.end21
; Outer loop body: load in[i], the starting value of the running result.
26 for.body: ; preds = %for.cond
27 %tmp2 = load float* %arrayidx, align 4
; Inner loop header. %indvar1 is the inner index j; %res.0 is the running
; result, seeded with in[i] and updated with %sub on each iteration.
30 for.cond3: ; preds = %for.inc, %for.body
31 %indvar1 = phi i64 [ %indvar.next2, %for.inc ], [ 0, %for.body ]
32 %res.0 = phi float [ %tmp2, %for.body ], [ %sub, %for.inc ]
; Address of a[i + j].
33 %tmp7 = add i64 %indvar3, %indvar1
34 %arrayidx11 = getelementptr [32 x float]* @a, i64 0, i64 %tmp7
; Stay in the inner loop while j != 16.
35 %exitcond = icmp ne i64 %indvar1, 16
36 br i1 %exitcond, label %for.body6, label %for.end
; Inner loop body; no instructions are visible for it in this listing.
38 for.body6: ; preds = %for.cond3
; Inner loop latch: res = res - a[i + j], then j = j + 1.
41 for.inc: ; preds = %for.body6
42 %tmp12 = load float* %arrayidx11, align 4
43 %sub = fsub float %res.0, %tmp12
44 %indvar.next2 = add i64 %indvar1, 1
; Inner loop exit: take the final running result through a single-entry phi
; and store it to out[i].
47 for.end: ; preds = %for.cond3
48 %res.0.lcssa = phi float [ %res.0, %for.cond3 ]
49 store float %res.0.lcssa, float* %arrayidx17, align 4
; Outer loop latch: i = i + 1.
52 for.inc18: ; preds = %for.end
53 %indvar.next4 = add i64 %indvar3, 1
; Outer loop exit; leads into the checking loop (it is the non-latch
; predecessor of %for.cond22).
56 for.end21: ; preds = %for.cond
; Checking loop header. %indvar is the index k: 0 on entry, then %indvar.next.
59 for.cond22: ; preds = %for.inc35, %for.end21
60 %indvar = phi i64 [ %indvar.next, %for.inc35 ], [ 0, %for.end21 ]
; Addresses of check_res[k] and out[k].
61 %arrayidx32 = getelementptr [16 x float]* @check_res, i64 0, i64 %indvar
62 %arrayidx28 = getelementptr [16 x float]* @out, i64 0, i64 %indvar
; The bound test is done on a 32-bit truncation of k with a signed compare
; (k < 16), unlike the `icmp ne` exit tests of the loops above.
63 %i.1 = trunc i64 %indvar to i32
64 %cmp24 = icmp slt i32 %i.1, 16
65 br i1 %cmp24, label %for.body25, label %for.end38
; Checking loop body: load out[k] and check_res[k]. `fcmp une` is true when
; the operands are unordered or not equal, so a NaN also counts as a mismatch.
67 for.body25: ; preds = %for.cond22
68 %tmp29 = load float* %arrayidx28, align 4
69 %tmp33 = load float* %arrayidx32, align 4
70 %cmp34 = fcmp une float %tmp29, %tmp33
71 br i1 %cmp34, label %if.then, label %if.end
; Mismatch: call @abort (marked noreturn).
73 if.then: ; preds = %for.body25
74 call void @abort() noreturn nounwind
; Match: continue to the latch.
77 if.end: ; preds = %for.body25
; Checking loop latch: k = k + 1.
80 for.inc35: ; preds = %if.end
81 %indvar.next = add i64 %indvar, 1
; Checking loop exit; nothing further is visible for this block.
84 for.end38: ; preds = %for.cond22
; External @abort, declared noreturn; @foo calls it when an element of @out
; differs from the corresponding element of @check_res.
88 declare void @abort() noreturn
; @main: calls @check_vect.
; NOTE(review): only this call is visible in the listing; any later
; instructions, the return and the closing brace are not shown here.
90 define i32 @main() nounwind uwtable {
92 call void @check_vect()
; @check_vect: installs @sig_ill_handler for signal 4, queries CPUID leaf 1
; through @__get_cpuid, and calls exit(0) if the query fails or a specific
; bit of the value stored through the fifth argument is clear. Otherwise it
; calls signal(4, null) before finishing.
; NOTE(review): signal number 4 is presumably SIGILL on this target (the
; handler is named sig_ill_handler) - confirm.
97 define internal void @check_vect() nounwind uwtable noinline {
; Four i32 stack slots that receive the values @__get_cpuid stores through
; its %__eax, %__ebx, %__ecx and %__edx pointer parameters, in that order.
99 %a = alloca i32, align 4
100 %b = alloca i32, align 4
101 %c = alloca i32, align 4
102 %d = alloca i32, align 4
; Register @sig_ill_handler for signal 4; the returned previous handler
; (%call) is not used in the visible code.
103 %call = call void (i32)* (i32, void (i32)*)* @signal(i32 4, void (i32)* @sig_ill_handler) nounwind
; Query leaf 1. A zero result goes to %if.then (exit).
104 %call1 = call i32 @__get_cpuid(i32 1, i32* %a, i32* %b, i32* %c, i32* %d)
105 %tobool = icmp eq i32 %call1, 0
106 br i1 %tobool, label %if.then, label %lor.lhs.false
; Test bit 26 (67108864 == 1 << 26) of the value stored through %d, i.e. the
; "dx" output of the cpuid asm in @__get_cpuid.
; NOTE(review): presumably the SSE2 feature flag of CPUID leaf 1 EDX - confirm.
108 lor.lhs.false: ; preds = %entry
109 %tmp4 = load i32* %d, align 4
110 %and6 = and i32 %tmp4, 67108864
111 %cmp = icmp eq i32 %and6, 0
112 br i1 %cmp, label %if.then, label %if.end
; Query failed or the bit is clear: exit with status 0.
114 if.then: ; preds = %entry, %lor.lhs.false
115 call void @exit(i32 0) noreturn nounwind
; Bit is set: call signal(4, null).
; NOTE(review): a null handler presumably means the default disposition
; (SIG_DFL) on this target - confirm.
118 if.end: ; preds = %lor.lhs.false
119 %call7 = call void (i32)* (i32, void (i32)*)* @signal(i32 4, void (i32)* null) nounwind
; External @signal: takes a signal number and a handler pointer and returns a
; handler pointer; @check_vect calls it twice with signal number 4.
123 declare void (i32)* @signal(i32, void (i32)*) nounwind
; @sig_ill_handler: handler that @check_vect registers for signal 4. It does
; not use %sig and calls exit(0), which is marked noreturn.
125 define internal void @sig_ill_handler(i32 %sig) nounwind uwtable {
127 call void @exit(i32 0) noreturn nounwind
; Block with no predecessors, as its own annotation states.
130 return: ; No predecessors!
; @__get_cpuid: runs the cpuid instruction for leaf %__level and stores the
; four result registers through %__eax, %__ebx, %__ecx and %__edx, but only if
; the maximum leaf reported by @__get_cpuid_max is at least %__level.
; %retval.0 is 0 when the leaf is out of range and 1 after a successful query.
; NOTE(review): no `ret` is visible in this listing; %retval.0 is presumably
; the returned value - confirm.
134 define internal i32 @__get_cpuid(i32 %__level, i32* %__eax, i32* %__ebx, i32* %__ecx, i32* %__edx) nounwind uwtable inlinehint {
; Keep only the top bit of the leaf number (-2147483648 is 0x80000000 as i32)
; and pass that to @__get_cpuid_max, with a null %__sig so nothing is stored.
136 %and = and i32 %__level, -2147483648
137 %call = call i32 @__get_cpuid_max(i32 %and, i32* null)
; Unsigned compare: if the reported maximum is below the requested leaf, take
; the failure path.
138 %cmp = icmp ult i32 %call, %__level
139 br i1 %cmp, label %if.then, label %if.end
; Failure path; contributes 0 to %retval.0.
141 if.then: ; preds = %entry
; Success path: execute cpuid. The constraint string declares outputs in
; ax, bx, cx and dx, and the "0" constraint ties the %__level input to the
; first output register.
144 if.end: ; preds = %entry
145 %tmp = call { i32, i32, i32, i32 } asm "cpuid\0A\09", "={ax},={bx},={cx},={dx},0,~{dirflag},~{fpsr},~{flags}"(i32 %__level) nounwind, !srcloc !0
; Unpack the four outputs in constraint order (ax, bx, cx, dx).
146 %asmresult = extractvalue { i32, i32, i32, i32 } %tmp, 0
147 %asmresult8 = extractvalue { i32, i32, i32, i32 } %tmp, 1
148 %asmresult9 = extractvalue { i32, i32, i32, i32 } %tmp, 2
149 %asmresult10 = extractvalue { i32, i32, i32, i32 } %tmp, 3
; Write each output through the matching pointer parameter.
150 store i32 %asmresult, i32* %__eax, align 4
151 store i32 %asmresult8, i32* %__ebx, align 4
152 store i32 %asmresult9, i32* %__ecx, align 4
153 store i32 %asmresult10, i32* %__edx, align 4
; Join point: 0 when coming from %if.then, 1 when coming from %if.end.
156 return: ; preds = %if.end, %if.then
157 %retval.0 = phi i32 [ 0, %if.then ], [ 1, %if.end ]
; External @exit, declared noreturn; called with status 0 from @check_vect
; and @sig_ill_handler.
161 declare void @exit(i32) noreturn
; @__get_cpuid_max: executes cpuid with %__ext as the input leaf and, when
; %__sig is non-null, stores the second output (bx) through it.
; NOTE(review): no `ret` is visible in this listing; the returned value is
; presumably %asmresult (the ax output), given how @__get_cpuid compares the
; result against a leaf number - confirm.
163 define internal i32 @__get_cpuid_max(i32 %__ext, i32* %__sig) nounwind uwtable inlinehint {
; The constraint string declares outputs in ax, bx, cx and dx; the "0"
; constraint ties the %__ext input to the first output register.
165 %tmp = call { i32, i32, i32, i32 } asm "cpuid\0A\09", "={ax},={bx},={cx},={dx},0,~{dirflag},~{fpsr},~{flags}"(i32 %__ext) nounwind, !srcloc !1
166 %asmresult = extractvalue { i32, i32, i32, i32 } %tmp, 0
; Skip the store when the caller passed a null %__sig.
167 %tobool = icmp eq i32* %__sig, null
168 br i1 %tobool, label %if.end, label %if.then
; Non-null %__sig: store the bx output through it.
170 if.then: ; preds = %entry
171 %asmresult1 = extractvalue { i32, i32, i32, i32 } %tmp, 1
172 store i32 %asmresult1, i32* %__sig, align 4
; Join point for both paths.
175 if.end: ; preds = %entry, %if.then
; Metadata nodes attached as !srcloc to the inline asm calls: !0 on the cpuid
; call in @__get_cpuid, !1 on the cpuid call in @__get_cpuid_max.
179 !0 = metadata !{i32 -2147343393, i32 -2147343385}
180 !1 = metadata !{i32 -2147343516, i32 -2147343508}