1 ; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu -asm-verbose=false | FileCheck %s
3 ; These tests check for loop branching structure, and that the loop align
4 ; directive is placed in the expected place.
6 ; CodeGen should insert a branch into the middle of the loop in
7 ; order to avoid a branch within the loop.
12 ; CHECK-NEXT: .LBB0_2:
13 ; CHECK-NEXT: callq loop_latch
14 ; CHECK-NEXT: .LBB0_1:
15 ; CHECK-NEXT: callq loop_header
17 define void @simple() nounwind {
22 call void @loop_header()
23 %t0 = tail call i32 @get()
24 %t1 = icmp slt i32 %t0, 0
25 br i1 %t1, label %done, label %bb
28 call void @loop_latch()
36 ; CodeGen should move block_a to the top of the loop so that it
37 ; falls through into the loop, avoiding a branch within the loop.
39 ; CHECK-LABEL: slightly_more_involved:
42 ; CHECK-NEXT: .LBB1_4:
43 ; CHECK-NEXT: callq bar99
44 ; CHECK-NEXT: .LBB1_1:
45 ; CHECK-NEXT: callq body
47 define void @slightly_more_involved() nounwind {
54 %t1 = icmp slt i32 %t0, 2
55 br i1 %t1, label %block_a, label %bb
59 %t3 = icmp slt i32 %t2, 99
60 br i1 %t3, label %exit, label %loop
71 ; Same as slightly_more_involved, but block_a is now a CFG diamond with
72 ; fallthrough edges which should be preserved.
73 ; "callq block_a_merge_func" is tail duped.
75 ; CHECK-LABEL: yet_more_involved:
78 ; CHECK-NEXT: .LBB2_5:
79 ; CHECK-NEXT: callq block_a_true_func
80 ; CHECK-NEXT: callq block_a_merge_func
81 ; CHECK-NEXT: .LBB2_1:
82 ; CHECK-NEXT: callq body
86 ; CHECK-NEXT: callq get
87 ; CHECK-NEXT: cmpl $2999, %eax
88 ; CHECK-NEXT: jle .LBB2_5
89 ; CHECK-NEXT: callq block_a_false_func
90 ; CHECK-NEXT: callq block_a_merge_func
91 ; CHECK-NEXT: jmp .LBB2_1
93 define void @yet_more_involved() nounwind {
100 %t1 = icmp slt i32 %t0, 2
101 br i1 %t1, label %block_a, label %bb
104 %t2 = call i32 @get()
105 %t3 = icmp slt i32 %t2, 99
106 br i1 %t3, label %exit, label %loop
110 %z0 = call i32 @get()
111 %z1 = icmp slt i32 %z0, 3000
112 br i1 %z1, label %block_a_true, label %block_a_false
115 call void @block_a_true_func()
116 br label %block_a_merge
119 call void @block_a_false_func()
120 br label %block_a_merge
123 call void @block_a_merge_func()
131 ; CodeGen should move the CFG islands that are part of the loop but don't
132 ; conveniently fit anywhere so that they are at least contiguous with the
135 ; CHECK-LABEL: cfg_islands:
138 ; CHECK-NEXT: .LBB3_7:
139 ; CHECK-NEXT: callq bar100
140 ; CHECK-NEXT: .LBB3_1:
141 ; CHECK-NEXT: callq loop_header
144 ; CHECK-NEXT: callq bar101
145 ; CHECK-NEXT: jmp .LBB3_1
147 ; CHECK-NEXT: .LBB3_3:
149 ; CHECK-NEXT: callq bar102
150 ; CHECK-NEXT: jmp .LBB3_1
151 ; CHECK-NEXT: .LBB3_4:
153 ; CHECK-NEXT: callq loop_latch
154 ; CHECK-NEXT: jmp .LBB3_1
155 ; CHECK-NEXT: .LBB3_6:
157 define void @cfg_islands() nounwind {
162 call void @loop_header()
163 %t0 = call i32 @get()
164 %t1 = icmp slt i32 %t0, 100
165 br i1 %t1, label %block100, label %bb
168 %t2 = call i32 @get()
169 %t3 = icmp slt i32 %t2, 101
170 br i1 %t3, label %block101, label %bb1
173 %t4 = call i32 @get()
174 %t5 = icmp slt i32 %t4, 102
175 br i1 %t5, label %block102, label %bb2
178 %t6 = call i32 @get()
179 %t7 = icmp slt i32 %t6, 103
180 br i1 %t7, label %exit, label %bb3
183 call void @loop_latch()
203 ; CHECK-LABEL: check_minsize:
206 ; CHECK-NEXT: .LBB4_2:
207 ; CHECK-NEXT: callq loop_latch
208 ; CHECK-NEXT: .LBB4_1:
209 ; CHECK-NEXT: callq loop_header
212 define void @check_minsize() minsize nounwind {
217 call void @loop_header()
218 %t0 = tail call i32 @get()
219 %t1 = icmp slt i32 %t0, 0
220 br i1 %t1, label %done, label %bb
223 call void @loop_latch()
231 ; This is exactly the same function as slightly_more_involved.
232 ; The difference is that when optimising for size, we do not want
233 ; to see this reordering.
235 ; CHECK-LABEL: slightly_more_involved_2:
236 ; CHECK-NOT: jmp .LBB5_1
238 ; CHECK-NEXT: callq body
240 define void @slightly_more_involved_2() #0 {
246 %t0 = call i32 @get()
247 %t1 = icmp slt i32 %t0, 2
248 br i1 %t1, label %block_a, label %bb
251 %t2 = call i32 @get()
252 %t3 = icmp slt i32 %t2, 99
253 br i1 %t3, label %exit, label %loop
264 attributes #0 = { minsize norecurse nounwind optsize readnone uwtable }
266 declare void @bar99() nounwind
267 declare void @bar100() nounwind
268 declare void @bar101() nounwind
269 declare void @bar102() nounwind
270 declare void @body() nounwind
271 declare void @exit() nounwind
272 declare void @loop_header() nounwind
273 declare void @loop_latch() nounwind
274 declare i32 @get() nounwind
275 declare void @block_a_true_func() nounwind
276 declare void @block_a_false_func() nounwind
277 declare void @block_a_merge_func() nounwind