1 ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
2 ; RUN: llc -mtriple=thumbv8.1m.main-none-none-eabi -verify-machineinstrs -mattr=+mve %s -o - | FileCheck %s
4 @var_36 = hidden local_unnamed_addr global i8 0, align 1
5 @arr_61 = hidden local_unnamed_addr global [1 x i32] zeroinitializer, align 4
7 define i32 @test(i8 zeroext %var_2, i16 signext %var_15, ptr %arr_60) {
9 ; CHECK: @ %bb.0: @ %entry
10 ; CHECK-NEXT: .save {r4, r5, r6, r7, r8, r9, r10, r11, lr}
11 ; CHECK-NEXT: push.w {r4, r5, r6, r7, r8, r9, r10, r11, lr}
12 ; CHECK-NEXT: .pad #16
13 ; CHECK-NEXT: sub sp, #16
14 ; CHECK-NEXT: cmp r0, #0
15 ; CHECK-NEXT: beq.w .LBB0_11
16 ; CHECK-NEXT: @ %bb.1: @ %for.cond1.preheader
17 ; CHECK-NEXT: cmp r2, #0
18 ; CHECK-NEXT: beq.w .LBB0_12
19 ; CHECK-NEXT: @ %bb.2: @ %for.cond1.preheader1
20 ; CHECK-NEXT: addw r0, r2, #441
21 ; CHECK-NEXT: str r0, [sp, #8] @ 4-byte Spill
22 ; CHECK-NEXT: addw r0, r2, #419
23 ; CHECK-NEXT: str r0, [sp, #4] @ 4-byte Spill
24 ; CHECK-NEXT: addw r0, r2, #397
25 ; CHECK-NEXT: movw r5, :lower16:var_36
26 ; CHECK-NEXT: str r0, [sp] @ 4-byte Spill
27 ; CHECK-NEXT: movw r0, #27476
28 ; CHECK-NEXT: movt r5, :upper16:var_36
29 ; CHECK-NEXT: sdiv r1, r0, r1
30 ; CHECK-NEXT: str r2, [sp, #12] @ 4-byte Spill
31 ; CHECK-NEXT: .LBB0_3: @ %for.cond1
32 ; CHECK-NEXT: @ =>This Loop Header: Depth=1
33 ; CHECK-NEXT: @ Child Loop BB0_4 Depth 2
34 ; CHECK-NEXT: @ Child Loop BB0_5 Depth 3
35 ; CHECK-NEXT: @ Child Loop BB0_7 Depth 3
36 ; CHECK-NEXT: @ Child Loop BB0_9 Depth 3
37 ; CHECK-NEXT: ldr.w r12, [sp, #8] @ 4-byte Reload
38 ; CHECK-NEXT: mov.w r10, #0
39 ; CHECK-NEXT: ldrd r8, r0, [sp] @ 8-byte Folded Reload
40 ; CHECK-NEXT: .LBB0_4: @ %for.cond6.preheader
41 ; CHECK-NEXT: @ Parent Loop BB0_3 Depth=1
42 ; CHECK-NEXT: @ => This Loop Header: Depth=2
43 ; CHECK-NEXT: @ Child Loop BB0_5 Depth 3
44 ; CHECK-NEXT: @ Child Loop BB0_7 Depth 3
45 ; CHECK-NEXT: @ Child Loop BB0_9 Depth 3
46 ; CHECK-NEXT: movw r3, :lower16:arr_61
47 ; CHECK-NEXT: movt r3, :upper16:arr_61
48 ; CHECK-NEXT: add.w r11, r3, #4
49 ; CHECK-NEXT: movs r3, #11
50 ; CHECK-NEXT: dls lr, r3
51 ; CHECK-NEXT: mov r4, r11
52 ; CHECK-NEXT: mov r3, r8
53 ; CHECK-NEXT: .LBB0_5: @ %for.body10
54 ; CHECK-NEXT: @ Parent Loop BB0_3 Depth=1
55 ; CHECK-NEXT: @ Parent Loop BB0_4 Depth=2
56 ; CHECK-NEXT: @ => This Inner Loop Header: Depth=3
57 ; CHECK-NEXT: str r2, [r4, #-4]
58 ; CHECK-NEXT: ldrb r6, [r3, #-1]
59 ; CHECK-NEXT: cmp r6, #0
61 ; CHECK-NEXT: sxthne.w r9, r1
62 ; CHECK-NEXT: moveq.w r9, #0
63 ; CHECK-NEXT: add.w r6, r2, #396
64 ; CHECK-NEXT: cmp.w r9, #0
65 ; CHECK-NEXT: str r6, [r4]
66 ; CHECK-NEXT: cset r6, ne
67 ; CHECK-NEXT: strb r6, [r5]
68 ; CHECK-NEXT: add.w r2, r2, #792
69 ; CHECK-NEXT: ldrb r6, [r3]
70 ; CHECK-NEXT: adds r4, #8
71 ; CHECK-NEXT: adds r3, #2
72 ; CHECK-NEXT: cmp r6, #0
74 ; CHECK-NEXT: sxthne r6, r1
75 ; CHECK-NEXT: moveq r6, #0
76 ; CHECK-NEXT: cmp r6, #0
77 ; CHECK-NEXT: cset r6, ne
78 ; CHECK-NEXT: strb r6, [r5]
79 ; CHECK-NEXT: le lr, .LBB0_5
80 ; CHECK-NEXT: @ %bb.6: @ %for.cond.cleanup9
81 ; CHECK-NEXT: @ in Loop: Header=BB0_4 Depth=2
82 ; CHECK-NEXT: movs r2, #11
83 ; CHECK-NEXT: mov r4, r11
84 ; CHECK-NEXT: dls lr, r2
85 ; CHECK-NEXT: mov r3, r0
86 ; CHECK-NEXT: ldr r2, [sp, #12] @ 4-byte Reload
87 ; CHECK-NEXT: .LBB0_7: @ %for.body10.1
88 ; CHECK-NEXT: @ Parent Loop BB0_3 Depth=1
89 ; CHECK-NEXT: @ Parent Loop BB0_4 Depth=2
90 ; CHECK-NEXT: @ => This Inner Loop Header: Depth=3
91 ; CHECK-NEXT: str r2, [r4, #-4]
92 ; CHECK-NEXT: add.w r7, r2, #396
93 ; CHECK-NEXT: ldrb r6, [r3, #-1]
94 ; CHECK-NEXT: add.w r2, r2, #792
95 ; CHECK-NEXT: cmp r6, #0
97 ; CHECK-NEXT: sxthne r6, r1
98 ; CHECK-NEXT: moveq r6, #0
99 ; CHECK-NEXT: cmp r6, #0
100 ; CHECK-NEXT: str r7, [r4]
101 ; CHECK-NEXT: cset r6, ne
102 ; CHECK-NEXT: adds r4, #8
103 ; CHECK-NEXT: strb r6, [r5]
104 ; CHECK-NEXT: ldrb r6, [r3]
105 ; CHECK-NEXT: adds r3, #2
106 ; CHECK-NEXT: cmp r6, #0
108 ; CHECK-NEXT: sxthne r6, r1
109 ; CHECK-NEXT: moveq r6, #0
110 ; CHECK-NEXT: cmp r6, #0
111 ; CHECK-NEXT: cset r6, ne
112 ; CHECK-NEXT: strb r6, [r5]
113 ; CHECK-NEXT: le lr, .LBB0_7
114 ; CHECK-NEXT: @ %bb.8: @ %for.cond.cleanup9.1
115 ; CHECK-NEXT: @ in Loop: Header=BB0_4 Depth=2
116 ; CHECK-NEXT: movs r2, #11
117 ; CHECK-NEXT: mov r3, r12
118 ; CHECK-NEXT: dls lr, r2
119 ; CHECK-NEXT: ldr r2, [sp, #12] @ 4-byte Reload
120 ; CHECK-NEXT: .LBB0_9: @ %for.body10.2
121 ; CHECK-NEXT: @ Parent Loop BB0_3 Depth=1
122 ; CHECK-NEXT: @ Parent Loop BB0_4 Depth=2
123 ; CHECK-NEXT: @ => This Inner Loop Header: Depth=3
124 ; CHECK-NEXT: str r2, [r11, #-4]
125 ; CHECK-NEXT: add.w r6, r2, #396
126 ; CHECK-NEXT: ldrb r4, [r3, #-1]
127 ; CHECK-NEXT: add.w r2, r2, #792
128 ; CHECK-NEXT: cmp r4, #0
130 ; CHECK-NEXT: sxthne r4, r1
131 ; CHECK-NEXT: moveq r4, #0
132 ; CHECK-NEXT: cmp r4, #0
133 ; CHECK-NEXT: str.w r6, [r11]
134 ; CHECK-NEXT: cset r4, ne
135 ; CHECK-NEXT: add.w r11, r11, #8
136 ; CHECK-NEXT: strb r4, [r5]
137 ; CHECK-NEXT: ldrb r4, [r3]
138 ; CHECK-NEXT: adds r3, #2
139 ; CHECK-NEXT: cmp r4, #0
141 ; CHECK-NEXT: sxthne r4, r1
142 ; CHECK-NEXT: moveq r4, #0
143 ; CHECK-NEXT: cmp r4, #0
144 ; CHECK-NEXT: cset r4, ne
145 ; CHECK-NEXT: strb r4, [r5]
146 ; CHECK-NEXT: le lr, .LBB0_9
147 ; CHECK-NEXT: @ %bb.10: @ %for.cond.cleanup9.2
148 ; CHECK-NEXT: @ in Loop: Header=BB0_4 Depth=2
149 ; CHECK-NEXT: add.w r2, r10, #3
150 ; CHECK-NEXT: add.w r12, r12, #66
151 ; CHECK-NEXT: adds r0, #66
152 ; CHECK-NEXT: add.w r8, r8, #66
153 ; CHECK-NEXT: uxtb.w r10, r2
154 ; CHECK-NEXT: ldr r2, [sp, #12] @ 4-byte Reload
155 ; CHECK-NEXT: cmp.w r10, #18
156 ; CHECK-NEXT: blo.w .LBB0_4
157 ; CHECK-NEXT: b .LBB0_3
158 ; CHECK-NEXT: .LBB0_11: @ %for.cond.cleanup
159 ; CHECK-NEXT: add sp, #16
160 ; CHECK-NEXT: pop.w {r4, r5, r6, r7, r8, r9, r10, r11, pc}
161 ; CHECK-NEXT: .LBB0_12: @ %for.cond1.us.preheader
162 ; CHECK-NEXT: movw r0, :lower16:arr_61
163 ; CHECK-NEXT: movs r1, #0
164 ; CHECK-NEXT: movt r0, :upper16:arr_61
165 ; CHECK-NEXT: str r1, [r0, #84]
166 ; CHECK-NEXT: .inst.n 0xdefe
168 %tobool.not = icmp eq i8 %var_2, 0
169 br i1 %tobool.not, label %for.cond.cleanup, label %for.cond1.preheader
171 for.cond1.preheader: ; preds = %entry
172 %cmp11.not = icmp eq ptr %arr_60, null
173 br i1 %cmp11.not, label %for.cond1.us.preheader, label %for.cond1
175 for.cond1.us.preheader: ; preds = %for.cond1.preheader
176 store i32 0, ptr getelementptr ([1 x i32], ptr @arr_61, i32 21, i32 0), align 4
177 call void @llvm.trap()
180 for.cond.cleanup: ; preds = %entry
183 for.cond1: ; preds = %for.cond.cleanup9.2, %for.cond1.preheader
184 br label %for.cond6.preheader
186 for.cond6.preheader: ; preds = %for.cond.cleanup9.2, %for.cond1
187 %conv45 = phi i32 [ 0, %for.cond1 ], [ %conv.2, %for.cond.cleanup9.2 ]
190 for.cond.cleanup9: ; preds = %cond.end22.1
191 %add27 = add nuw nsw i32 %conv45, 1
192 %conv = and i32 %add27, 255
193 br label %for.body10.1
195 for.body10: ; preds = %cond.end22.1, %for.cond6.preheader
196 %i_15.044 = phi i32 [ 0, %for.cond6.preheader ], [ %add.1, %cond.end22.1 ]
197 %arraydecay = getelementptr inbounds [18 x [22 x i8]], ptr %arr_60, i32 %i_15.044, i32 0
198 %0 = ptrtoint ptr %arraydecay to i32
199 %arrayidx13 = getelementptr inbounds [1 x i32], ptr @arr_61, i32 0, i32 %i_15.044
200 store i32 %0, ptr %arrayidx13, align 4
201 %arrayidx16 = getelementptr inbounds [18 x [22 x i8]], ptr %arr_60, i32 1, i32 %conv45, i32 %i_15.044
202 %1 = load i8, ptr %arrayidx16, align 1
203 %tobool18.not = icmp eq i8 %1, 0
204 br i1 %tobool18.not, label %cond.end22, label %cond.true19
206 cond.true19: ; preds = %for.body10
207 %div43 = sdiv i16 27476, %var_15
208 %div.sext = sext i16 %div43 to i32
211 cond.end22: ; preds = %for.body10, %cond.true19
212 %cond23 = phi i32 [ %div.sext, %cond.true19 ], [ 0, %for.body10 ]
213 %tobool24 = icmp ne i32 %cond23, 0
214 %frombool = zext i1 %tobool24 to i8
215 store i8 %frombool, ptr @var_36, align 1
216 %add = or i32 %i_15.044, 1
217 %arraydecay.1 = getelementptr inbounds [18 x [22 x i8]], ptr %arr_60, i32 %add, i32 0
218 %2 = ptrtoint ptr %arraydecay.1 to i32
219 %arrayidx13.1 = getelementptr inbounds [1 x i32], ptr @arr_61, i32 0, i32 %add
220 store i32 %2, ptr %arrayidx13.1, align 4
221 %arrayidx16.1 = getelementptr inbounds [18 x [22 x i8]], ptr %arr_60, i32 1, i32 %conv45, i32 %add
222 %3 = load i8, ptr %arrayidx16.1, align 1
223 %tobool18.not.1 = icmp eq i8 %3, 0
224 br i1 %tobool18.not.1, label %cond.end22.1, label %cond.true19.1
226 cond.true19.1: ; preds = %cond.end22
227 %div43.1 = sdiv i16 27476, %var_15
228 %div.sext.1 = sext i16 %div43.1 to i32
229 br label %cond.end22.1
231 cond.end22.1: ; preds = %cond.true19.1, %cond.end22
232 %cond23.1 = phi i32 [ %div.sext.1, %cond.true19.1 ], [ 0, %cond.end22 ]
233 %tobool24.1 = icmp ne i32 %cond23.1, 0
234 %frombool.1 = zext i1 %tobool24.1 to i8
235 store i8 %frombool.1, ptr @var_36, align 1
236 %add.1 = add nuw nsw i32 %i_15.044, 2
237 %exitcond105.not.1 = icmp eq i32 %add.1, 22
238 br i1 %exitcond105.not.1, label %for.cond.cleanup9, label %for.body10
240 for.body10.1: ; preds = %cond.end22.1.1, %for.cond.cleanup9
241 %i_15.044.1 = phi i32 [ 0, %for.cond.cleanup9 ], [ %add.1.1, %cond.end22.1.1 ]
242 %arraydecay.1108 = getelementptr inbounds [18 x [22 x i8]], ptr %arr_60, i32 %i_15.044.1, i32 0
243 %4 = ptrtoint ptr %arraydecay.1108 to i32
244 %arrayidx13.1109 = getelementptr inbounds [1 x i32], ptr @arr_61, i32 0, i32 %i_15.044.1
245 store i32 %4, ptr %arrayidx13.1109, align 4
246 %arrayidx16.1110 = getelementptr inbounds [18 x [22 x i8]], ptr %arr_60, i32 1, i32 %conv, i32 %i_15.044.1
247 %5 = load i8, ptr %arrayidx16.1110, align 1
248 %tobool18.not.1111 = icmp eq i8 %5, 0
249 br i1 %tobool18.not.1111, label %cond.end22.1119, label %cond.true19.1114
251 cond.true19.1114: ; preds = %for.body10.1
252 %div43.1112 = sdiv i16 27476, %var_15
253 %div.sext.1113 = sext i16 %div43.1112 to i32
254 br label %cond.end22.1119
256 cond.end22.1119: ; preds = %cond.true19.1114, %for.body10.1
257 %cond23.1115 = phi i32 [ %div.sext.1113, %cond.true19.1114 ], [ 0, %for.body10.1 ]
258 %tobool24.1116 = icmp ne i32 %cond23.1115, 0
259 %frombool.1117 = zext i1 %tobool24.1116 to i8
260 store i8 %frombool.1117, ptr @var_36, align 1
261 %add.1118 = or i32 %i_15.044.1, 1
262 %arraydecay.1.1 = getelementptr inbounds [18 x [22 x i8]], ptr %arr_60, i32 %add.1118, i32 0
263 %6 = ptrtoint ptr %arraydecay.1.1 to i32
264 %arrayidx13.1.1 = getelementptr inbounds [1 x i32], ptr @arr_61, i32 0, i32 %add.1118
265 store i32 %6, ptr %arrayidx13.1.1, align 4
266 %arrayidx16.1.1 = getelementptr inbounds [18 x [22 x i8]], ptr %arr_60, i32 1, i32 %conv, i32 %add.1118
267 %7 = load i8, ptr %arrayidx16.1.1, align 1
268 %tobool18.not.1.1 = icmp eq i8 %7, 0
269 br i1 %tobool18.not.1.1, label %cond.end22.1.1, label %cond.true19.1.1
271 cond.true19.1.1: ; preds = %cond.end22.1119
272 %div43.1.1 = sdiv i16 27476, %var_15
273 %div.sext.1.1 = sext i16 %div43.1.1 to i32
274 br label %cond.end22.1.1
276 cond.end22.1.1: ; preds = %cond.true19.1.1, %cond.end22.1119
277 %cond23.1.1 = phi i32 [ %div.sext.1.1, %cond.true19.1.1 ], [ 0, %cond.end22.1119 ]
278 %tobool24.1.1 = icmp ne i32 %cond23.1.1, 0
279 %frombool.1.1 = zext i1 %tobool24.1.1 to i8
280 store i8 %frombool.1.1, ptr @var_36, align 1
281 %add.1.1 = add nuw nsw i32 %i_15.044.1, 2
282 %exitcond105.not.1.1 = icmp eq i32 %add.1.1, 22
283 br i1 %exitcond105.not.1.1, label %for.cond.cleanup9.1, label %for.body10.1
285 for.cond.cleanup9.1: ; preds = %cond.end22.1.1
286 %add27.1 = add nuw nsw i32 %conv45, 2
287 %conv.1 = and i32 %add27.1, 255
288 br label %for.body10.2
290 for.body10.2: ; preds = %cond.end22.1.2, %for.cond.cleanup9.1
291 %i_15.044.2 = phi i32 [ 0, %for.cond.cleanup9.1 ], [ %add.1.2, %cond.end22.1.2 ]
292 %arraydecay.2 = getelementptr inbounds [18 x [22 x i8]], ptr %arr_60, i32 %i_15.044.2, i32 0
293 %8 = ptrtoint ptr %arraydecay.2 to i32
294 %arrayidx13.2 = getelementptr inbounds [1 x i32], ptr @arr_61, i32 0, i32 %i_15.044.2
295 store i32 %8, ptr %arrayidx13.2, align 4
296 %arrayidx16.2 = getelementptr inbounds [18 x [22 x i8]], ptr %arr_60, i32 1, i32 %conv.1, i32 %i_15.044.2
297 %9 = load i8, ptr %arrayidx16.2, align 1
298 %tobool18.not.2 = icmp eq i8 %9, 0
299 br i1 %tobool18.not.2, label %cond.end22.2, label %cond.true19.2
301 cond.true19.2: ; preds = %for.body10.2
302 %div43.2 = sdiv i16 27476, %var_15
303 %div.sext.2 = sext i16 %div43.2 to i32
304 br label %cond.end22.2
306 cond.end22.2: ; preds = %cond.true19.2, %for.body10.2
307 %cond23.2 = phi i32 [ %div.sext.2, %cond.true19.2 ], [ 0, %for.body10.2 ]
308 %tobool24.2 = icmp ne i32 %cond23.2, 0
309 %frombool.2 = zext i1 %tobool24.2 to i8
310 store i8 %frombool.2, ptr @var_36, align 1
311 %add.2 = or i32 %i_15.044.2, 1
312 %arraydecay.1.2 = getelementptr inbounds [18 x [22 x i8]], ptr %arr_60, i32 %add.2, i32 0
313 %10 = ptrtoint ptr %arraydecay.1.2 to i32
314 %arrayidx13.1.2 = getelementptr inbounds [1 x i32], ptr @arr_61, i32 0, i32 %add.2
315 store i32 %10, ptr %arrayidx13.1.2, align 4
316 %arrayidx16.1.2 = getelementptr inbounds [18 x [22 x i8]], ptr %arr_60, i32 1, i32 %conv.1, i32 %add.2
317 %11 = load i8, ptr %arrayidx16.1.2, align 1
318 %tobool18.not.1.2 = icmp eq i8 %11, 0
319 br i1 %tobool18.not.1.2, label %cond.end22.1.2, label %cond.true19.1.2
321 cond.true19.1.2: ; preds = %cond.end22.2
322 %div43.1.2 = sdiv i16 27476, %var_15
323 %div.sext.1.2 = sext i16 %div43.1.2 to i32
324 br label %cond.end22.1.2
326 cond.end22.1.2: ; preds = %cond.true19.1.2, %cond.end22.2
327 %cond23.1.2 = phi i32 [ %div.sext.1.2, %cond.true19.1.2 ], [ 0, %cond.end22.2 ]
328 %tobool24.1.2 = icmp ne i32 %cond23.1.2, 0
329 %frombool.1.2 = zext i1 %tobool24.1.2 to i8
330 store i8 %frombool.1.2, ptr @var_36, align 1
331 %add.1.2 = add nuw nsw i32 %i_15.044.2, 2
332 %exitcond105.not.1.2 = icmp eq i32 %add.1.2, 22
333 br i1 %exitcond105.not.1.2, label %for.cond.cleanup9.2, label %for.body10.2
335 for.cond.cleanup9.2: ; preds = %cond.end22.1.2
336 %add27.2 = add nuw nsw i32 %conv45, 3
337 %conv.2 = and i32 %add27.2, 255
338 %cmp.2 = icmp ult i32 %conv.2, 18
339 br i1 %cmp.2, label %for.cond6.preheader, label %for.cond1
342 declare void @llvm.trap() #1
345 @b = hidden local_unnamed_addr global i32 0, align 4
346 @a = hidden local_unnamed_addr global i32 0, align 4
347 @c = hidden local_unnamed_addr global [1 x i32] zeroinitializer, align 4
349 define i32 @d(i64 %e, i32 %f, i64 %g, i32 %h) {
351 ; CHECK: @ %bb.0: @ %entry
352 ; CHECK-NEXT: .save {r4, r5, r6, r7, r8, r9, r10, r11, lr}
353 ; CHECK-NEXT: push.w {r4, r5, r6, r7, r8, r9, r10, r11, lr}
354 ; CHECK-NEXT: .pad #4
355 ; CHECK-NEXT: sub sp, #4
356 ; CHECK-NEXT: .vsave {d8, d9, d10, d11, d12, d13, d14, d15}
357 ; CHECK-NEXT: vpush {d8, d9, d10, d11, d12, d13, d14, d15}
358 ; CHECK-NEXT: .pad #16
359 ; CHECK-NEXT: sub sp, #16
360 ; CHECK-NEXT: mov lr, r0
361 ; CHECK-NEXT: subs r0, #1
362 ; CHECK-NEXT: sbcs r0, r1, #0
363 ; CHECK-NEXT: blt.w .LBB1_28
364 ; CHECK-NEXT: @ %bb.1: @ %for.cond2.preheader.lr.ph
365 ; CHECK-NEXT: movs r0, #1
366 ; CHECK-NEXT: cmp r2, #1
367 ; CHECK-NEXT: csel r7, r2, r0, lt
368 ; CHECK-NEXT: mov r12, r1
369 ; CHECK-NEXT: mov r1, r7
370 ; CHECK-NEXT: cmp r7, #3
372 ; CHECK-NEXT: movls r1, #3
373 ; CHECK-NEXT: mov r4, r2
374 ; CHECK-NEXT: subs r1, r1, r7
375 ; CHECK-NEXT: movw r2, #43691
376 ; CHECK-NEXT: adds r1, #2
377 ; CHECK-NEXT: movt r2, #43690
378 ; CHECK-NEXT: ldr r6, [sp, #128]
379 ; CHECK-NEXT: movw r8, :lower16:c
380 ; CHECK-NEXT: umull r1, r2, r1, r2
381 ; CHECK-NEXT: movt r8, :upper16:c
382 ; CHECK-NEXT: movs r1, #4
383 ; CHECK-NEXT: @ implicit-def: $r10
384 ; CHECK-NEXT: @ implicit-def: $r5
385 ; CHECK-NEXT: @ implicit-def: $r11
386 ; CHECK-NEXT: mov.w r9, #12
387 ; CHECK-NEXT: str r4, [sp, #12] @ 4-byte Spill
388 ; CHECK-NEXT: add.w r0, r0, r2, lsr #1
389 ; CHECK-NEXT: add.w r1, r1, r2, lsr #1
390 ; CHECK-NEXT: movw r2, #65532
391 ; CHECK-NEXT: vdup.32 q6, r0
392 ; CHECK-NEXT: movt r2, #32767
393 ; CHECK-NEXT: and.w r3, r1, r2
394 ; CHECK-NEXT: adr r1, .LCPI1_0
395 ; CHECK-NEXT: vdup.32 q7, r0
396 ; CHECK-NEXT: vldrw.u32 q0, [r1]
397 ; CHECK-NEXT: adr r1, .LCPI1_1
398 ; CHECK-NEXT: vldrw.u32 q5, [r1]
399 ; CHECK-NEXT: strd r3, r7, [sp, #4] @ 8-byte Folded Spill
400 ; CHECK-NEXT: vadd.i32 q4, q0, r7
401 ; CHECK-NEXT: b .LBB1_6
402 ; CHECK-NEXT: .LBB1_2: @ %for.body6.preheader
403 ; CHECK-NEXT: @ in Loop: Header=BB1_6 Depth=1
404 ; CHECK-NEXT: mov r0, r11
405 ; CHECK-NEXT: cmn.w r11, #4
407 ; CHECK-NEXT: mvnle r0, #3
408 ; CHECK-NEXT: movw r2, #18725
409 ; CHECK-NEXT: adds r0, #6
410 ; CHECK-NEXT: movt r2, #9362
411 ; CHECK-NEXT: sub.w r1, r0, r11
412 ; CHECK-NEXT: mov r10, r3
413 ; CHECK-NEXT: umull r2, r3, r1, r2
414 ; CHECK-NEXT: subs r2, r1, r3
415 ; CHECK-NEXT: add.w r2, r3, r2, lsr #1
416 ; CHECK-NEXT: lsrs r3, r2, #2
417 ; CHECK-NEXT: lsls r3, r3, #3
418 ; CHECK-NEXT: sub.w r2, r3, r2, lsr #2
419 ; CHECK-NEXT: subs r1, r2, r1
420 ; CHECK-NEXT: mov r3, r10
421 ; CHECK-NEXT: add r0, r1
422 ; CHECK-NEXT: .LBB1_3: @ %for.cond.cleanup5.loopexit134.split.loop.exit139
423 ; CHECK-NEXT: @ in Loop: Header=BB1_6 Depth=1
424 ; CHECK-NEXT: add.w r11, r0, #7
425 ; CHECK-NEXT: .LBB1_4: @ %for.cond.cleanup5
426 ; CHECK-NEXT: @ in Loop: Header=BB1_6 Depth=1
427 ; CHECK-NEXT: mov.w r10, #0
428 ; CHECK-NEXT: .LBB1_5: @ %for.cond.cleanup5
429 ; CHECK-NEXT: @ in Loop: Header=BB1_6 Depth=1
430 ; CHECK-NEXT: adds r5, #2
431 ; CHECK-NEXT: subs.w r1, r5, lr
432 ; CHECK-NEXT: asr.w r0, r5, #31
433 ; CHECK-NEXT: sbcs.w r0, r0, r12
434 ; CHECK-NEXT: bge.w .LBB1_28
435 ; CHECK-NEXT: .LBB1_6: @ %for.cond2.preheader
436 ; CHECK-NEXT: @ =>This Loop Header: Depth=1
437 ; CHECK-NEXT: @ Child Loop BB1_19 Depth 2
438 ; CHECK-NEXT: @ Child Loop BB1_10 Depth 2
439 ; CHECK-NEXT: @ Child Loop BB1_12 Depth 3
440 ; CHECK-NEXT: @ Child Loop BB1_14 Depth 3
441 ; CHECK-NEXT: cmp.w r11, #2
442 ; CHECK-NEXT: bgt .LBB1_5
443 ; CHECK-NEXT: @ %bb.7: @ %for.body6.lr.ph
444 ; CHECK-NEXT: @ in Loop: Header=BB1_6 Depth=1
445 ; CHECK-NEXT: cmp r7, #5
446 ; CHECK-NEXT: bhi .LBB1_17
447 ; CHECK-NEXT: @ %bb.8: @ %for.body6.us.preheader
448 ; CHECK-NEXT: @ in Loop: Header=BB1_6 Depth=1
449 ; CHECK-NEXT: ldrd r2, r3, [sp, #120]
450 ; CHECK-NEXT: movs r0, #32
451 ; CHECK-NEXT: movs r1, #0
452 ; CHECK-NEXT: mov r4, r6
453 ; CHECK-NEXT: mov r7, r12
454 ; CHECK-NEXT: mov r6, lr
455 ; CHECK-NEXT: bl __aeabi_ldivmod
456 ; CHECK-NEXT: mov lr, r6
457 ; CHECK-NEXT: mov r6, r4
458 ; CHECK-NEXT: mov r12, r7
459 ; CHECK-NEXT: ldr r3, [sp, #4] @ 4-byte Reload
460 ; CHECK-NEXT: ldr r4, [sp, #12] @ 4-byte Reload
461 ; CHECK-NEXT: vdup.32 q0, r2
462 ; CHECK-NEXT: ldr r7, [sp, #8] @ 4-byte Reload
463 ; CHECK-NEXT: mov r0, r11
464 ; CHECK-NEXT: b .LBB1_10
465 ; CHECK-NEXT: .LBB1_9: @ %for.cond.cleanup17.us
466 ; CHECK-NEXT: @ in Loop: Header=BB1_10 Depth=2
467 ; CHECK-NEXT: add.w r11, r0, #7
468 ; CHECK-NEXT: cmn.w r0, #4
469 ; CHECK-NEXT: mov.w r10, #0
470 ; CHECK-NEXT: mov r0, r11
471 ; CHECK-NEXT: bge .LBB1_5
472 ; CHECK-NEXT: .LBB1_10: @ %for.body6.us
473 ; CHECK-NEXT: @ Parent Loop BB1_6 Depth=1
474 ; CHECK-NEXT: @ => This Loop Header: Depth=2
475 ; CHECK-NEXT: @ Child Loop BB1_12 Depth 3
476 ; CHECK-NEXT: @ Child Loop BB1_14 Depth 3
477 ; CHECK-NEXT: movs r1, #0
478 ; CHECK-NEXT: cbz r4, .LBB1_13
479 ; CHECK-NEXT: @ %bb.11: @ %for.body13.us51.preheader
480 ; CHECK-NEXT: @ in Loop: Header=BB1_10 Depth=2
481 ; CHECK-NEXT: movw r2, :lower16:a
482 ; CHECK-NEXT: vmov q1, q4
483 ; CHECK-NEXT: movt r2, :upper16:a
484 ; CHECK-NEXT: str r1, [r2]
485 ; CHECK-NEXT: movw r2, :lower16:b
486 ; CHECK-NEXT: movt r2, :upper16:b
487 ; CHECK-NEXT: str r1, [r2]
488 ; CHECK-NEXT: mov r2, r3
489 ; CHECK-NEXT: .LBB1_12: @ %vector.body111
490 ; CHECK-NEXT: @ Parent Loop BB1_6 Depth=1
491 ; CHECK-NEXT: @ Parent Loop BB1_10 Depth=2
492 ; CHECK-NEXT: @ => This Inner Loop Header: Depth=3
493 ; CHECK-NEXT: vqadd.u32 q2, q5, r1
494 ; CHECK-NEXT: subs r2, #4
495 ; CHECK-NEXT: vcmp.u32 hi, q7, q2
496 ; CHECK-NEXT: vshl.i32 q2, q1, #2
497 ; CHECK-NEXT: add.w r1, r1, #4
498 ; CHECK-NEXT: vadd.i32 q2, q2, r8
499 ; CHECK-NEXT: vadd.i32 q1, q1, r9
501 ; CHECK-NEXT: vstrwt.32 q0, [q2]
502 ; CHECK-NEXT: bne .LBB1_12
503 ; CHECK-NEXT: b .LBB1_15
504 ; CHECK-NEXT: .LBB1_13: @ %vector.body.preheader
505 ; CHECK-NEXT: @ in Loop: Header=BB1_10 Depth=2
506 ; CHECK-NEXT: mov r2, r3
507 ; CHECK-NEXT: vmov q1, q4
508 ; CHECK-NEXT: .LBB1_14: @ %vector.body
509 ; CHECK-NEXT: @ Parent Loop BB1_6 Depth=1
510 ; CHECK-NEXT: @ Parent Loop BB1_10 Depth=2
511 ; CHECK-NEXT: @ => This Inner Loop Header: Depth=3
512 ; CHECK-NEXT: vqadd.u32 q2, q5, r1
513 ; CHECK-NEXT: subs r2, #4
514 ; CHECK-NEXT: vcmp.u32 hi, q6, q2
515 ; CHECK-NEXT: vshl.i32 q2, q1, #2
516 ; CHECK-NEXT: add.w r1, r1, #4
517 ; CHECK-NEXT: vadd.i32 q2, q2, r8
518 ; CHECK-NEXT: vadd.i32 q1, q1, r9
520 ; CHECK-NEXT: vstrwt.32 q0, [q2]
521 ; CHECK-NEXT: bne .LBB1_14
522 ; CHECK-NEXT: .LBB1_15: @ %for.cond9.for.cond15.preheader_crit_edge.us
523 ; CHECK-NEXT: @ in Loop: Header=BB1_10 Depth=2
524 ; CHECK-NEXT: cmp r6, #0
525 ; CHECK-NEXT: beq .LBB1_9
526 ; CHECK-NEXT: @ %bb.16: @ %for.cond9.for.cond15.preheader_crit_edge.us
527 ; CHECK-NEXT: @ in Loop: Header=BB1_10 Depth=2
528 ; CHECK-NEXT: eor r1, r10, #1
529 ; CHECK-NEXT: lsls r1, r1, #31
530 ; CHECK-NEXT: bne .LBB1_9
531 ; CHECK-NEXT: b .LBB1_26
532 ; CHECK-NEXT: .LBB1_17: @ %for.body6.lr.ph.split
533 ; CHECK-NEXT: @ in Loop: Header=BB1_6 Depth=1
534 ; CHECK-NEXT: cmp r6, #0
535 ; CHECK-NEXT: beq.w .LBB1_2
536 ; CHECK-NEXT: @ %bb.18: @ in Loop: Header=BB1_6 Depth=1
537 ; CHECK-NEXT: mov r0, r11
538 ; CHECK-NEXT: .LBB1_19: @ %for.body6.us60
539 ; CHECK-NEXT: @ Parent Loop BB1_6 Depth=1
540 ; CHECK-NEXT: @ => This Inner Loop Header: Depth=2
541 ; CHECK-NEXT: lsls.w r1, r10, #31
542 ; CHECK-NEXT: bne .LBB1_27
543 ; CHECK-NEXT: @ %bb.20: @ %for.cond.cleanup17.us63
544 ; CHECK-NEXT: @ in Loop: Header=BB1_19 Depth=2
545 ; CHECK-NEXT: cmn.w r0, #4
546 ; CHECK-NEXT: bge.w .LBB1_3
547 ; CHECK-NEXT: @ %bb.21: @ %for.cond.cleanup17.us63.1
548 ; CHECK-NEXT: @ in Loop: Header=BB1_19 Depth=2
549 ; CHECK-NEXT: cmn.w r0, #12
550 ; CHECK-NEXT: bgt .LBB1_24
551 ; CHECK-NEXT: @ %bb.22: @ %for.cond.cleanup17.us63.2
552 ; CHECK-NEXT: @ in Loop: Header=BB1_19 Depth=2
553 ; CHECK-NEXT: cmn.w r0, #19
554 ; CHECK-NEXT: bgt .LBB1_25
555 ; CHECK-NEXT: @ %bb.23: @ %for.cond.cleanup17.us63.3
556 ; CHECK-NEXT: @ in Loop: Header=BB1_19 Depth=2
557 ; CHECK-NEXT: add.w r11, r0, #28
558 ; CHECK-NEXT: cmn.w r0, #25
559 ; CHECK-NEXT: mov.w r10, #0
560 ; CHECK-NEXT: mov r0, r11
561 ; CHECK-NEXT: blt .LBB1_19
562 ; CHECK-NEXT: b .LBB1_5
563 ; CHECK-NEXT: .LBB1_24: @ %for.cond.cleanup5.loopexit134.split.loop.exit137
564 ; CHECK-NEXT: @ in Loop: Header=BB1_6 Depth=1
565 ; CHECK-NEXT: add.w r11, r0, #14
566 ; CHECK-NEXT: b .LBB1_4
567 ; CHECK-NEXT: .LBB1_25: @ %for.cond.cleanup5.loopexit134.split.loop.exit135
568 ; CHECK-NEXT: @ in Loop: Header=BB1_6 Depth=1
569 ; CHECK-NEXT: add.w r11, r0, #21
570 ; CHECK-NEXT: b .LBB1_4
571 ; CHECK-NEXT: .LBB1_26: @ %for.inc19.us
572 ; CHECK-NEXT: @ =>This Inner Loop Header: Depth=1
573 ; CHECK-NEXT: b .LBB1_26
574 ; CHECK-NEXT: .LBB1_27: @ %for.inc19.us66
575 ; CHECK-NEXT: @ =>This Inner Loop Header: Depth=1
576 ; CHECK-NEXT: b .LBB1_27
577 ; CHECK-NEXT: .LBB1_28: @ %for.cond.cleanup
578 ; CHECK-NEXT: add sp, #16
579 ; CHECK-NEXT: vpop {d8, d9, d10, d11, d12, d13, d14, d15}
580 ; CHECK-NEXT: add sp, #4
581 ; CHECK-NEXT: pop.w {r4, r5, r6, r7, r8, r9, r10, r11, pc}
582 ; CHECK-NEXT: .p2align 4
583 ; CHECK-NEXT: @ %bb.29:
584 ; CHECK-NEXT: .LCPI1_0:
585 ; CHECK-NEXT: .long 0 @ 0x0
586 ; CHECK-NEXT: .long 3 @ 0x3
587 ; CHECK-NEXT: .long 6 @ 0x6
588 ; CHECK-NEXT: .long 9 @ 0x9
589 ; CHECK-NEXT: .LCPI1_1:
590 ; CHECK-NEXT: .long 0 @ 0x0
591 ; CHECK-NEXT: .long 1 @ 0x1
592 ; CHECK-NEXT: .long 2 @ 0x2
593 ; CHECK-NEXT: .long 3 @ 0x3
595 %cmp47 = icmp sgt i64 %e, 0
596 br i1 %cmp47, label %for.cond2.preheader.lr.ph, label %for.cond.cleanup
598 for.cond2.preheader.lr.ph: ; preds = %entry
599 %cmp7.inv = icmp slt i32 %f, 1
600 %spec.select = select i1 %cmp7.inv, i32 %f, i32 1
601 %cmp1041 = icmp ult i32 %spec.select, 6
602 %tobool.not = icmp eq i32 %f, 0
603 %tobool20.not97 = icmp eq i32 %h, 0
604 %0 = icmp ugt i32 %spec.select, 3
605 %umax = select i1 %0, i32 %spec.select, i32 3
606 %1 = add i32 %umax, 2
607 %2 = sub i32 %1, %spec.select
609 %4 = add nuw nsw i32 %3, 1
610 %5 = icmp ugt i32 %spec.select, 3
611 %umax112 = select i1 %5, i32 %spec.select, i32 3
612 %6 = add i32 %umax112, 2
613 %7 = sub i32 %6, %spec.select
615 %9 = add nuw nsw i32 %8, 1
616 %n.rnd.up114 = add nuw nsw i32 %8, 4
617 %n.vec116 = and i32 %n.rnd.up114, 2147483644
618 %.splatinsert121 = insertelement <4 x i32> poison, i32 %spec.select, i32 0
619 %.splat122 = shufflevector <4 x i32> %.splatinsert121, <4 x i32> poison, <4 x i32> zeroinitializer
620 %induction123 = add <4 x i32> %.splat122, <i32 0, i32 3, i32 6, i32 9>
621 %n.rnd.up = add nuw nsw i32 %3, 4
622 %n.vec = and i32 %n.rnd.up, 2147483644
623 %.splatinsert = insertelement <4 x i32> poison, i32 %spec.select, i32 0
624 %.splat = shufflevector <4 x i32> %.splatinsert, <4 x i32> poison, <4 x i32> zeroinitializer
625 %induction = add <4 x i32> %.splat, <i32 0, i32 3, i32 6, i32 9>
626 br label %for.cond2.preheader
628 for.cond2.preheader: ; preds = %for.cond2.preheader.lr.ph, %for.cond.cleanup5
629 %l.0.off050 = phi i1 [ undef, %for.cond2.preheader.lr.ph ], [ %l.1.off0.lcssa, %for.cond.cleanup5 ]
630 %i.049 = phi i32 [ undef, %for.cond2.preheader.lr.ph ], [ %add26, %for.cond.cleanup5 ]
631 %j.048 = phi i32 [ undef, %for.cond2.preheader.lr.ph ], [ %j.1.lcssa, %for.cond.cleanup5 ]
632 %cmp343 = icmp slt i32 %j.048, 3
633 br i1 %cmp343, label %for.body6.lr.ph, label %for.cond.cleanup5
635 for.body6.lr.ph: ; preds = %for.cond2.preheader
636 br i1 %cmp1041, label %for.body6.us.preheader, label %for.body6.lr.ph.split
638 for.body6.us.preheader: ; preds = %for.body6.lr.ph
639 %rem.us = srem i64 32, %g
640 %conv14.us = trunc i64 %rem.us to i32
641 %broadcast.splatinsert131 = insertelement <4 x i32> poison, i32 %conv14.us, i32 0
642 %broadcast.splat132 = shufflevector <4 x i32> %broadcast.splatinsert131, <4 x i32> poison, <4 x i32> zeroinitializer
643 %broadcast.splatinsert107 = insertelement <4 x i32> poison, i32 %conv14.us, i32 0
644 %broadcast.splat108 = shufflevector <4 x i32> %broadcast.splatinsert107, <4 x i32> poison, <4 x i32> zeroinitializer
645 br label %for.body6.us
647 for.body6.us: ; preds = %for.body6.us.preheader, %for.cond.cleanup17.us
648 %l.1.off045.us = phi i1 [ false, %for.cond.cleanup17.us ], [ %l.0.off050, %for.body6.us.preheader ]
649 %j.144.us = phi i32 [ %add23.us, %for.cond.cleanup17.us ], [ %j.048, %for.body6.us.preheader ]
650 br i1 %tobool.not, label %vector.body, label %for.body13.us51.preheader
652 vector.body: ; preds = %for.body6.us, %vector.body
653 %index = phi i32 [ %index.next, %vector.body ], [ 0, %for.body6.us ]
654 %vec.ind = phi <4 x i32> [ %vec.ind.next, %vector.body ], [ %induction, %for.body6.us ]
655 %active.lane.mask = call <4 x i1> @llvm.get.active.lane.mask.v4i1.i32(i32 %index, i32 %4)
656 %10 = getelementptr inbounds [1 x i32], ptr @c, i32 0, <4 x i32> %vec.ind
657 call void @llvm.masked.scatter.v4i32.v4p0(<4 x i32> %broadcast.splat108, <4 x ptr> %10, i32 4, <4 x i1> %active.lane.mask)
658 %index.next = add i32 %index, 4
659 %vec.ind.next = add <4 x i32> %vec.ind, <i32 12, i32 12, i32 12, i32 12>
660 %11 = icmp eq i32 %index.next, %n.vec
661 br i1 %11, label %for.cond9.for.cond15.preheader_crit_edge.us, label %vector.body
663 for.body13.us51.preheader: ; preds = %for.body6.us
664 store i32 0, ptr @b, align 4
665 store i32 0, ptr @a, align 4
666 br label %vector.body111
668 vector.body111: ; preds = %vector.body111, %for.body13.us51.preheader
669 %index117 = phi i32 [ 0, %for.body13.us51.preheader ], [ %index.next118, %vector.body111 ]
670 %vec.ind124 = phi <4 x i32> [ %induction123, %for.body13.us51.preheader ], [ %vec.ind.next125, %vector.body111 ]
671 %active.lane.mask130 = call <4 x i1> @llvm.get.active.lane.mask.v4i1.i32(i32 %index117, i32 %9)
672 %12 = getelementptr inbounds [1 x i32], ptr @c, i32 0, <4 x i32> %vec.ind124
673 call void @llvm.masked.scatter.v4i32.v4p0(<4 x i32> %broadcast.splat132, <4 x ptr> %12, i32 4, <4 x i1> %active.lane.mask130)
674 %index.next118 = add i32 %index117, 4
675 %vec.ind.next125 = add <4 x i32> %vec.ind124, <i32 12, i32 12, i32 12, i32 12>
676 %13 = icmp eq i32 %index.next118, %n.vec116
677 br i1 %13, label %for.cond9.for.cond15.preheader_crit_edge.us, label %vector.body111
679 for.cond.cleanup17.us: ; preds = %for.cond9.for.cond15.preheader_crit_edge.us
680 %add23.us = add nsw i32 %j.144.us, 7
681 %cmp3.us = icmp slt i32 %j.144.us, -4
682 br i1 %cmp3.us, label %for.body6.us, label %for.cond.cleanup5
684 for.inc19.us: ; preds = %for.cond9.for.cond15.preheader_crit_edge.us, %for.inc19.us
685 br label %for.inc19.us
687 for.cond9.for.cond15.preheader_crit_edge.us: ; preds = %vector.body111, %vector.body
688 %l.1.off045.us.not = xor i1 %l.1.off045.us, true
689 %brmerge = or i1 %tobool20.not97, %l.1.off045.us.not
690 br i1 %brmerge, label %for.cond.cleanup17.us, label %for.inc19.us
692 for.body6.lr.ph.split: ; preds = %for.body6.lr.ph
693 br i1 %tobool20.not97, label %for.body6.preheader, label %for.body6.us60
695 for.body6.preheader: ; preds = %for.body6.lr.ph.split
696 %14 = icmp sgt i32 %j.048, -4
697 %smax = select i1 %14, i32 %j.048, i32 -4
698 %15 = add nsw i32 %smax, 6
699 %16 = sub i32 %15, %j.048
700 %17 = urem i32 %16, 7
701 %18 = sub i32 %16, %17
702 %19 = add nsw i32 %j.048, 7
703 %20 = add i32 %19, %18
704 br label %for.cond.cleanup5
706 for.body6.us60: ; preds = %for.body6.lr.ph.split, %for.cond.cleanup17.us63.3
707 %l.1.off045.us61 = phi i1 [ false, %for.cond.cleanup17.us63.3 ], [ %l.0.off050, %for.body6.lr.ph.split ]
708 %j.144.us62 = phi i32 [ %add23.us64.3, %for.cond.cleanup17.us63.3 ], [ %j.048, %for.body6.lr.ph.split ]
709 br i1 %l.1.off045.us61, label %for.inc19.us66, label %for.cond.cleanup17.us63
711 for.cond.cleanup17.us63: ; preds = %for.body6.us60
712 %cmp3.us65 = icmp slt i32 %j.144.us62, -4
713 br i1 %cmp3.us65, label %for.cond.cleanup17.us63.1, label %for.cond.cleanup5.loopexit134.split.loop.exit139
715 for.inc19.us66: ; preds = %for.body6.us60, %for.inc19.us66
716 br label %for.inc19.us66
718 for.cond.cleanup: ; preds = %for.cond.cleanup5, %entry
721 for.cond.cleanup5.loopexit134.split.loop.exit135: ; preds = %for.cond.cleanup17.us63.2
722 %add23.us64.2.le = add nsw i32 %j.144.us62, 21
723 br label %for.cond.cleanup5
725 for.cond.cleanup5.loopexit134.split.loop.exit137: ; preds = %for.cond.cleanup17.us63.1
726 %add23.us64.1.le = add nsw i32 %j.144.us62, 14
727 br label %for.cond.cleanup5
729 for.cond.cleanup5.loopexit134.split.loop.exit139: ; preds = %for.cond.cleanup17.us63
730 %add23.us64.le = add nsw i32 %j.144.us62, 7
731 br label %for.cond.cleanup5
733 for.cond.cleanup5: ; preds = %for.cond.cleanup5.loopexit134.split.loop.exit135, %for.cond.cleanup5.loopexit134.split.loop.exit137, %for.cond.cleanup5.loopexit134.split.loop.exit139, %for.cond.cleanup17.us63.3, %for.cond.cleanup17.us, %for.body6.preheader, %for.cond2.preheader
734 %j.1.lcssa = phi i32 [ %j.048, %for.cond2.preheader ], [ %20, %for.body6.preheader ], [ %add23.us, %for.cond.cleanup17.us ], [ %add23.us64.2.le, %for.cond.cleanup5.loopexit134.split.loop.exit135 ], [ %add23.us64.1.le, %for.cond.cleanup5.loopexit134.split.loop.exit137 ], [ %add23.us64.le, %for.cond.cleanup5.loopexit134.split.loop.exit139 ], [ %add23.us64.3, %for.cond.cleanup17.us63.3 ]
735 %l.1.off0.lcssa = phi i1 [ %l.0.off050, %for.cond2.preheader ], [ false, %for.body6.preheader ], [ false, %for.cond.cleanup17.us ], [ false, %for.cond.cleanup17.us63.3 ], [ false, %for.cond.cleanup5.loopexit134.split.loop.exit139 ], [ false, %for.cond.cleanup5.loopexit134.split.loop.exit137 ], [ false, %for.cond.cleanup5.loopexit134.split.loop.exit135 ]
736 %add26 = add nsw i32 %i.049, 2
737 %conv = sext i32 %add26 to i64
738 %cmp = icmp slt i64 %conv, %e
739 br i1 %cmp, label %for.cond2.preheader, label %for.cond.cleanup
741 for.cond.cleanup17.us63.1: ; preds = %for.cond.cleanup17.us63
742 %cmp3.us65.1 = icmp slt i32 %j.144.us62, -11
743 br i1 %cmp3.us65.1, label %for.cond.cleanup17.us63.2, label %for.cond.cleanup5.loopexit134.split.loop.exit137
745 for.cond.cleanup17.us63.2: ; preds = %for.cond.cleanup17.us63.1
746 %cmp3.us65.2 = icmp slt i32 %j.144.us62, -18
747 br i1 %cmp3.us65.2, label %for.cond.cleanup17.us63.3, label %for.cond.cleanup5.loopexit134.split.loop.exit135
749 for.cond.cleanup17.us63.3: ; preds = %for.cond.cleanup17.us63.2
750 %add23.us64.3 = add nsw i32 %j.144.us62, 28
751 %cmp3.us65.3 = icmp slt i32 %j.144.us62, -25
752 br i1 %cmp3.us65.3, label %for.body6.us60, label %for.cond.cleanup5
755 declare <4 x i1> @llvm.get.active.lane.mask.v4i1.i32(i32, i32) #1
756 declare void @llvm.masked.scatter.v4i32.v4p0(<4 x i32>, <4 x ptr>, i32 immarg, <4 x i1>) #2