1 # NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
2 # RUN: llc -mtriple=aarch64 -run-pass=aarch64-postlegalizer-lowering -verify-machineinstrs %s -o - | FileCheck %s
# Splat of a GPR scalar into <4 x s32>: the scalar is inserted into lane 0 of
# an undef vector and shuffled with an all-zero mask. The expected output
# replaces the insert + shuffle with one G_DUP of the value copied from $w0.
8 tracksRegLiveness: true
13 ; CHECK-LABEL: name: splat_4xi32
15 ; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $w0
16 ; CHECK: [[DUP:%[0-9]+]]:_(<4 x s32>) = G_DUP [[COPY]](s32)
17 ; CHECK: $q0 = COPY [[DUP]](<4 x s32>)
18 ; CHECK: RET_ReallyLR implicit $q0
20 %2:_(<4 x s32>) = G_IMPLICIT_DEF
21 %3:_(s32) = G_CONSTANT i32 0
22 %1:_(<4 x s32>) = G_INSERT_VECTOR_ELT %2, %0(s32), %3(s32)
23 %4:_(<4 x s32>) = G_SHUFFLE_VECTOR %1(<4 x s32>), %2, shufflemask(0, 0, 0, 0)
24 $q0 = COPY %4(<4 x s32>)
25 RET_ReallyLR implicit $q0
# Same lane-0 insert + all-zero shuffle pattern, for <2 x s64>. The expected
# output is one G_DUP of the s64 value copied from $x0, returned in $q0.
32 tracksRegLiveness: true
37 ; CHECK-LABEL: name: splat_2xi64
39 ; CHECK: [[COPY:%[0-9]+]]:_(s64) = COPY $x0
40 ; CHECK: [[DUP:%[0-9]+]]:_(<2 x s64>) = G_DUP [[COPY]](s64)
41 ; CHECK: $q0 = COPY [[DUP]](<2 x s64>)
42 ; CHECK: RET_ReallyLR implicit $q0
44 %2:_(<2 x s64>) = G_IMPLICIT_DEF
45 %3:_(s32) = G_CONSTANT i32 0
46 %1:_(<2 x s64>) = G_INSERT_VECTOR_ELT %2, %0(s64), %3(s32)
47 %4:_(<2 x s64>) = G_SHUFFLE_VECTOR %1(<2 x s64>), %2, shufflemask(0, 0)
48 $q0 = COPY %4(<2 x s64>)
49 RET_ReallyLR implicit $q0
# Same lane-0 insert + all-zero shuffle pattern, for the 64-bit vector type
# <2 x s32>. The expected output is one G_DUP of the value copied from $w0,
# returned in $d0.
56 tracksRegLiveness: true
61 ; CHECK-LABEL: name: splat_2xi32
63 ; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $w0
64 ; CHECK: [[DUP:%[0-9]+]]:_(<2 x s32>) = G_DUP [[COPY]](s32)
65 ; CHECK: $d0 = COPY [[DUP]](<2 x s32>)
66 ; CHECK: RET_ReallyLR implicit $d0
68 %2:_(<2 x s32>) = G_IMPLICIT_DEF
69 %3:_(s32) = G_CONSTANT i32 0
70 %1:_(<2 x s32>) = G_INSERT_VECTOR_ELT %2, %0(s32), %3(s32)
71 %4:_(<2 x s32>) = G_SHUFFLE_VECTOR %1(<2 x s32>), %2, shufflemask(0, 0)
72 $d0 = COPY %4(<2 x s32>)
73 RET_ReallyLR implicit $d0
# <4 x s32> splat whose scalar comes from the FP register $s0 instead of a
# GPR. The expected output is still one G_DUP of the copied s32 value.
80 tracksRegLiveness: true
85 ; CHECK-LABEL: name: splat_4xf32
87 ; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $s0
88 ; CHECK: [[DUP:%[0-9]+]]:_(<4 x s32>) = G_DUP [[COPY]](s32)
89 ; CHECK: $q0 = COPY [[DUP]](<4 x s32>)
90 ; CHECK: RET_ReallyLR implicit $q0
92 %2:_(<4 x s32>) = G_IMPLICIT_DEF
93 %3:_(s32) = G_CONSTANT i32 0
94 %1:_(<4 x s32>) = G_INSERT_VECTOR_ELT %2, %0(s32), %3(s32)
95 %4:_(<4 x s32>) = G_SHUFFLE_VECTOR %1(<4 x s32>), %2, shufflemask(0, 0, 0, 0)
96 $q0 = COPY %4(<4 x s32>)
97 RET_ReallyLR implicit $q0
# <2 x s64> splat whose scalar comes from the FP register $d0. The expected
# output is one G_DUP of the copied s64 value, returned in $q0.
104 tracksRegLiveness: true
109 ; CHECK-LABEL: name: splat_2xf64
110 ; CHECK: liveins: $d0
111 ; CHECK: [[COPY:%[0-9]+]]:_(s64) = COPY $d0
112 ; CHECK: [[DUP:%[0-9]+]]:_(<2 x s64>) = G_DUP [[COPY]](s64)
113 ; CHECK: $q0 = COPY [[DUP]](<2 x s64>)
114 ; CHECK: RET_ReallyLR implicit $q0
116 %2:_(<2 x s64>) = G_IMPLICIT_DEF
117 %3:_(s32) = G_CONSTANT i32 0
118 %1:_(<2 x s64>) = G_INSERT_VECTOR_ELT %2, %0(s64), %3(s32)
119 %4:_(<2 x s64>) = G_SHUFFLE_VECTOR %1(<2 x s64>), %2, shufflemask(0, 0)
120 $q0 = COPY %4(<2 x s64>)
121 RET_ReallyLR implicit $q0
# <2 x s32> splat whose scalar comes from the FP register $s0. The expected
# output is one G_DUP of the copied s32 value, returned in $d0.
128 tracksRegLiveness: true
133 ; CHECK-LABEL: name: splat_2xf32
134 ; CHECK: liveins: $s0
135 ; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $s0
136 ; CHECK: [[DUP:%[0-9]+]]:_(<2 x s32>) = G_DUP [[COPY]](s32)
137 ; CHECK: $d0 = COPY [[DUP]](<2 x s32>)
138 ; CHECK: RET_ReallyLR implicit $d0
140 %2:_(<2 x s32>) = G_IMPLICIT_DEF
141 %3:_(s32) = G_CONSTANT i32 0
142 %1:_(<2 x s32>) = G_INSERT_VECTOR_ELT %2, %0(s32), %3(s32)
143 %4:_(<2 x s32>) = G_SHUFFLE_VECTOR %1(<2 x s32>), %2, shufflemask(0, 0)
144 $d0 = COPY %4(<2 x s32>)
145 RET_ReallyLR implicit $d0
# Variant of the <2 x s64> splat with generic COPYs placed between the undef
# vector and the insert (%6) and between the insert and the shuffle (%7).
# The expected output contains no trace of those copies: only the G_DUP.
149 name: splat_2xf64_copies
152 tracksRegLiveness: true
157 ; This test is exactly the same as splat_2xf64, except it adds two copies.
158 ; These copies shouldn't get in the way of matching the dup pattern.
159 ; CHECK-LABEL: name: splat_2xf64_copies
160 ; CHECK: liveins: $d0
161 ; CHECK: [[COPY:%[0-9]+]]:_(s64) = COPY $d0
162 ; CHECK: [[DUP:%[0-9]+]]:_(<2 x s64>) = G_DUP [[COPY]](s64)
163 ; CHECK: $q0 = COPY [[DUP]](<2 x s64>)
164 ; CHECK: RET_ReallyLR implicit $q0
166 %2:_(<2 x s64>) = G_IMPLICIT_DEF
167 %6:_(<2 x s64>) = COPY %2
168 %3:_(s32) = G_CONSTANT i32 0
169 %1:_(<2 x s64>) = G_INSERT_VECTOR_ELT %6, %0(s64), %3(s32)
170 %7:_(<2 x s64>) = COPY %1
171 %4:_(<2 x s64>) = G_SHUFFLE_VECTOR %7(<2 x s64>), %2, shufflemask(0, 0)
172 $q0 = COPY %4(<2 x s64>)
173 RET_ReallyLR implicit $q0
# Negative test: the shuffle mask is (0, 1), so the shuffle is not a splat of
# lane 0. The expected output keeps the G_INSERT_VECTOR_ELT and contains a
# G_EXT (with a zero constant operand) in place of the shuffle, not a G_DUP.
180 tracksRegLiveness: true
184 ; Make sure that we don't form a G_DUP when the shuffle mask is not all zeros.
185 ; CHECK-LABEL: name: not_all_zeros
186 ; CHECK: liveins: $x0
187 ; CHECK: [[COPY:%[0-9]+]]:_(s64) = COPY $x0
188 ; CHECK: [[DEF:%[0-9]+]]:_(<2 x s64>) = G_IMPLICIT_DEF
189 ; CHECK: [[C:%[0-9]+]]:_(s32) = G_CONSTANT i32 0
190 ; CHECK: [[IVEC:%[0-9]+]]:_(<2 x s64>) = G_INSERT_VECTOR_ELT [[DEF]], [[COPY]](s64), [[C]](s32)
191 ; CHECK: [[C1:%[0-9]+]]:_(s32) = G_CONSTANT i32 0
192 ; CHECK: [[EXT:%[0-9]+]]:_(<2 x s64>) = G_EXT [[IVEC]], [[DEF]], [[C1]](s32)
193 ; CHECK: $q0 = COPY [[EXT]](<2 x s64>)
194 ; CHECK: RET_ReallyLR implicit $q0
196 %2:_(<2 x s64>) = G_IMPLICIT_DEF
197 %3:_(s32) = G_CONSTANT i32 0
198 %1:_(<2 x s64>) = G_INSERT_VECTOR_ELT %2, %0(s64), %3(s32)
199 %4:_(<2 x s64>) = G_SHUFFLE_VECTOR %1(<2 x s64>), %2, shufflemask(0, 1)
200 $q0 = COPY %4(<2 x s64>)
201 RET_ReallyLR implicit $q0
# Every shuffle-mask entry is -1 (undef). The expected output is still a
# G_DUP of the scalar that was inserted at lane 0.
208 tracksRegLiveness: true
212 ; If all the elements are undefined, we consider it a splat. In this case,
213 ; we can choose 0 as our index.
215 ; We should get a G_DUP here.
217 ; CHECK-LABEL: name: all_undef
218 ; CHECK: liveins: $x0
219 ; CHECK: [[COPY:%[0-9]+]]:_(s64) = COPY $x0
220 ; CHECK: [[DUP:%[0-9]+]]:_(<2 x s64>) = G_DUP [[COPY]](s64)
221 ; CHECK: $q0 = COPY [[DUP]](<2 x s64>)
222 ; CHECK: RET_ReallyLR implicit $q0
224 %2:_(<2 x s64>) = G_IMPLICIT_DEF
225 %3:_(s32) = G_CONSTANT i32 0
226 %1:_(<2 x s64>) = G_INSERT_VECTOR_ELT %2, %0(s64), %3(s32)
227 %4:_(<2 x s64>) = G_SHUFFLE_VECTOR %1(<2 x s64>), %2, shufflemask(-1, -1)
228 $q0 = COPY %4(<2 x s64>)
229 RET_ReallyLR implicit $q0
# The mask (0, -1, 0, 0) has one undef entry; every defined entry selects
# lane 0. The expected output treats this as a splat and emits a G_DUP.
236 tracksRegLiveness: true
240 ; Make sure we can skip past undef values.
242 ; We should get a G_DUP here.
244 ; CHECK-LABEL: name: one_undef
245 ; CHECK: liveins: $s0
246 ; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $s0
247 ; CHECK: [[DUP:%[0-9]+]]:_(<4 x s32>) = G_DUP [[COPY]](s32)
248 ; CHECK: $q0 = COPY [[DUP]](<4 x s32>)
249 ; CHECK: RET_ReallyLR implicit $q0
251 %2:_(<4 x s32>) = G_IMPLICIT_DEF
252 %3:_(s32) = G_CONSTANT i32 0
253 %1:_(<4 x s32>) = G_INSERT_VECTOR_ELT %2, %0(s32), %3(s32)
254 %4:_(<4 x s32>) = G_SHUFFLE_VECTOR %1(<4 x s32>), %2, shufflemask(0, -1, 0, 0)
255 $q0 = COPY %4(<4 x s32>)
256 RET_ReallyLR implicit $q0
# Negative test: the mask (-1, 0, 0, 3) mixes an undef entry with two
# different defined lanes (0 and 3), so it is not a splat. The expected output
# leaves the G_SHUFFLE_VECTOR in place, with -1 printed as `undef`.
260 name: not_all_zeros_with_undefs
263 tracksRegLiveness: true
267 ; Check a non-splat mask with an undef value. We shouldn't get a G_DUP here.
269 ; CHECK-LABEL: name: not_all_zeros_with_undefs
270 ; CHECK: liveins: $s0
271 ; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $s0
272 ; CHECK: [[DEF:%[0-9]+]]:_(<4 x s32>) = G_IMPLICIT_DEF
273 ; CHECK: [[C:%[0-9]+]]:_(s32) = G_CONSTANT i32 0
274 ; CHECK: [[IVEC:%[0-9]+]]:_(<4 x s32>) = G_INSERT_VECTOR_ELT [[DEF]], [[COPY]](s32), [[C]](s32)
275 ; CHECK: [[SHUF:%[0-9]+]]:_(<4 x s32>) = G_SHUFFLE_VECTOR [[IVEC]](<4 x s32>), [[DEF]], shufflemask(undef, 0, 0, 3)
276 ; CHECK: $q0 = COPY [[SHUF]](<4 x s32>)
277 ; CHECK: RET_ReallyLR implicit $q0
279 %2:_(<4 x s32>) = G_IMPLICIT_DEF
280 %3:_(s32) = G_CONSTANT i32 0
281 %1:_(<4 x s32>) = G_INSERT_VECTOR_ELT %2, %0(s32), %3(s32)
282 %4:_(<4 x s32>) = G_SHUFFLE_VECTOR %1(<4 x s32>), %2, shufflemask(-1, 0, 0, 3)
283 $q0 = COPY %4(<4 x s32>)
284 RET_ReallyLR implicit $q0
# <4 x s16> splat of an s16 scalar copied from $h0. This test uses named
# virtual registers, so the expected output refers to %copy and %splat
# directly: %splat becomes a G_DUP of %copy.
291 tracksRegLiveness: true
295 ; CHECK-LABEL: name: splat_4xi16
296 ; CHECK: liveins: $h0
297 ; CHECK: %copy:_(s16) = COPY $h0
298 ; CHECK: %splat:_(<4 x s16>) = G_DUP %copy(s16)
299 ; CHECK: $d0 = COPY %splat(<4 x s16>)
300 ; CHECK: RET_ReallyLR implicit $d0
301 %copy:_(s16) = COPY $h0
302 %undef:_(<4 x s16>) = G_IMPLICIT_DEF
303 %cst:_(s32) = G_CONSTANT i32 0
304 %ins:_(<4 x s16>) = G_INSERT_VECTOR_ELT %undef, %copy(s16), %cst(s32)
305 %splat:_(<4 x s16>) = G_SHUFFLE_VECTOR %ins(<4 x s16>), %undef, shufflemask(0, 0, 0, 0)
306 $d0 = COPY %splat(<4 x s16>)
307 RET_ReallyLR implicit $d0
# <8 x s8> splat where the inserted scalar is an s32 copied from $w0, i.e.
# wider than the s8 element type. The expected G_DUP takes the s32 %copy
# directly as its operand.
314 tracksRegLiveness: true
318 ; CHECK-LABEL: name: splat_8xi8
319 ; CHECK: liveins: $w0
320 ; CHECK: %copy:_(s32) = COPY $w0
321 ; CHECK: %splat:_(<8 x s8>) = G_DUP %copy(s32)
322 ; CHECK: $d0 = COPY %splat(<8 x s8>)
323 ; CHECK: RET_ReallyLR implicit $d0
324 %copy:_(s32) = COPY $w0
325 %undef:_(<8 x s8>) = G_IMPLICIT_DEF
326 %cst:_(s32) = G_CONSTANT i32 0
327 %ins:_(<8 x s8>) = G_INSERT_VECTOR_ELT %undef, %copy(s32), %cst(s32)
328 %splat:_(<8 x s8>) = G_SHUFFLE_VECTOR %ins(<8 x s8>), %undef, shufflemask(0, 0, 0, 0, 0, 0, 0, 0)
329 $d0 = COPY %splat(<8 x s8>)
330 RET_ReallyLR implicit $d0
# Splat whose source vector is a G_BUILD_VECTOR rather than an insert into
# undef. The all-zero mask selects only the first build-vector operand
# (%lane), so the expected output is a G_DUP of %lane; the other operands
# (%b, %c, %d) do not appear in the expected output.
337 tracksRegLiveness: true
340 liveins: $w0, $w1, $w2, $w3
341 ; The G_SHUFFLE_VECTOR is fed by a G_BUILD_VECTOR, and the 0th input
342 ; operand is not a constant. We should get a G_DUP.
344 ; CHECK-LABEL: name: build_vector
345 ; CHECK: liveins: $w0, $w1, $w2, $w3
346 ; CHECK: %lane:_(s32) = COPY $w0
347 ; CHECK: %shuf:_(<4 x s32>) = G_DUP %lane(s32)
348 ; CHECK: $q0 = COPY %shuf(<4 x s32>)
349 ; CHECK: RET_ReallyLR implicit $q0
350 %lane:_(s32) = COPY $w0
354 %undef:_(<4 x s32>) = G_IMPLICIT_DEF
355 %buildvec:_(<4 x s32>) = G_BUILD_VECTOR %lane, %b, %c, %d
356 %shuf:_(<4 x s32>) = G_SHUFFLE_VECTOR %buildvec(<4 x s32>), %undef, shufflemask(0, 0, 0, 0)
357 $q0 = COPY %shuf(<4 x s32>)
358 RET_ReallyLR implicit $q0