1 ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 2
2 ; RUN: llc -mtriple=aarch64 -mattr=+sve < %s | FileCheck %s
4 ; Test that llc does not end up in an infinite loop while compiling this function (https://github.com/llvm/llvm-project/issues/63322)
; Masked scatter intrinsic used by the test below, instantiated for
; <vscale x 16 x i8> data and a <vscale x 16 x ptr> address vector.
; Operands, in order: values to store, destination pointers, an i32 immarg
; (the alignment operand, per the LangRef description of llvm.masked.scatter),
; and the per-lane <vscale x 16 x i1> mask.
6 declare void @llvm.masked.scatter.nxv16i8.nxv16p0(<vscale x 16 x i8>, <vscale x 16 x ptr>, i32 immarg, <vscale x 16 x i1>)
; Regression input: a masked scatter of zero bytes through an all-null
; <vscale x 16 x ptr>, guarded by a mask computed from constant operands.
; The CHECK lines are autogenerated (see the NOTE at the top of the file);
; regenerate them with utils/update_llc_test_checks.py instead of editing them
; by hand.
; Expected code shape, as pinned by the CHECK lines: the 16-lane scatter is
; emitted as eight st1b stores with .d-sized lanes (data z0-z7, predicates
; p0-p7) that all use z16.d as the address vector, followed by an
; unconditional branch back to .LBB0_1.
8 define fastcc i8 @allocno_reload_assign() {
9 ; CHECK-LABEL: allocno_reload_assign:
11 ; CHECK-NEXT: fmov d0, xzr
12 ; CHECK-NEXT: ptrue p0.d
13 ; CHECK-NEXT: mov z16.d, #0 // =0x0
14 ; CHECK-NEXT: cmpeq p0.d, p0/z, z0.d, #0
15 ; CHECK-NEXT: uzp1 p0.s, p0.s, p0.s
16 ; CHECK-NEXT: uzp1 p0.h, p0.h, p0.h
17 ; CHECK-NEXT: uzp1 p0.b, p0.b, p0.b
18 ; CHECK-NEXT: mov z0.b, p0/z, #1 // =0x1
19 ; CHECK-NEXT: fmov w8, s0
20 ; CHECK-NEXT: mov z0.b, #0 // =0x0
21 ; CHECK-NEXT: uunpklo z1.h, z0.b
22 ; CHECK-NEXT: uunpkhi z0.h, z0.b
23 ; CHECK-NEXT: mvn w8, w8
24 ; CHECK-NEXT: sbfx x8, x8, #0, #1
25 ; CHECK-NEXT: whilelo p0.b, xzr, x8
26 ; CHECK-NEXT: uunpklo z2.s, z1.h
27 ; CHECK-NEXT: uunpkhi z3.s, z1.h
28 ; CHECK-NEXT: uunpklo z5.s, z0.h
29 ; CHECK-NEXT: uunpkhi z7.s, z0.h
30 ; CHECK-NEXT: punpklo p1.h, p0.b
31 ; CHECK-NEXT: punpkhi p0.h, p0.b
32 ; CHECK-NEXT: punpklo p2.h, p1.b
33 ; CHECK-NEXT: punpkhi p3.h, p1.b
34 ; CHECK-NEXT: uunpklo z0.d, z2.s
35 ; CHECK-NEXT: uunpkhi z1.d, z2.s
36 ; CHECK-NEXT: punpklo p5.h, p0.b
37 ; CHECK-NEXT: uunpklo z2.d, z3.s
38 ; CHECK-NEXT: uunpkhi z3.d, z3.s
39 ; CHECK-NEXT: punpkhi p7.h, p0.b
40 ; CHECK-NEXT: uunpklo z4.d, z5.s
41 ; CHECK-NEXT: uunpkhi z5.d, z5.s
42 ; CHECK-NEXT: uunpklo z6.d, z7.s
43 ; CHECK-NEXT: uunpkhi z7.d, z7.s
44 ; CHECK-NEXT: punpklo p0.h, p2.b
45 ; CHECK-NEXT: punpkhi p1.h, p2.b
46 ; CHECK-NEXT: punpklo p2.h, p3.b
47 ; CHECK-NEXT: punpkhi p3.h, p3.b
48 ; CHECK-NEXT: punpklo p4.h, p5.b
49 ; CHECK-NEXT: punpkhi p5.h, p5.b
50 ; CHECK-NEXT: punpklo p6.h, p7.b
51 ; CHECK-NEXT: punpkhi p7.h, p7.b
52 ; CHECK-NEXT: .LBB0_1: // =>This Inner Loop Header: Depth=1
53 ; CHECK-NEXT: st1b { z0.d }, p0, [z16.d]
54 ; CHECK-NEXT: st1b { z1.d }, p1, [z16.d]
55 ; CHECK-NEXT: st1b { z2.d }, p2, [z16.d]
56 ; CHECK-NEXT: st1b { z3.d }, p3, [z16.d]
57 ; CHECK-NEXT: st1b { z4.d }, p4, [z16.d]
58 ; CHECK-NEXT: st1b { z5.d }, p5, [z16.d]
59 ; CHECK-NEXT: st1b { z6.d }, p6, [z16.d]
60 ; CHECK-NEXT: st1b { z7.d }, p7, [z16.d]
61 ; CHECK-NEXT: b .LBB0_1
; Mask construction, step by step:
;   %constexpr  - compares a pointer vector whose lane 0 is null (remaining
;                 lanes poison) for equality against zeroinitializer.
;   %constexpr1 - broadcasts lane 0 of that comparison to every lane (the
;                 shuffle mask is zeroinitializer).
;   %constexpr2 - xor with an all-true splat, i.e. the lane-wise negation of
;                 %constexpr1.
; The scatter then stores zeroinitializer bytes through zeroinitializer (null)
; pointers under %constexpr2, passing 0 for the i32 immarg operand.
65 %constexpr = icmp eq <vscale x 16 x ptr> insertelement (<vscale x 16 x ptr> poison, ptr null, i64 0), zeroinitializer
66 %constexpr1 = shufflevector <vscale x 16 x i1> %constexpr, <vscale x 16 x i1> poison, <vscale x 16 x i32> zeroinitializer
67 %constexpr2 = xor <vscale x 16 x i1> %constexpr1, shufflevector (<vscale x 16 x i1> insertelement (<vscale x 16 x i1> poison, i1 true, i64 0), <vscale x 16 x i1> poison, <vscale x 16 x i32> zeroinitializer)
68 call void @llvm.masked.scatter.nxv16i8.nxv16p0(<vscale x 16 x i8> zeroinitializer, <vscale x 16 x ptr> zeroinitializer, i32 0, <vscale x 16 x i1> %constexpr2)
; Use-list order directive for the <vscale x 16 x i1> poison constant: it
; reorders that value's use-list according to the index list { 1, 2, 0 }.
; NOTE(review): presumably carried over from the reduced reproducer so the
; uses are visited in the order that triggered the original hang - confirm
; before removing.
72 uselistorder <vscale x 16 x i1> poison, { 1, 2, 0 }