1 ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
2 ; RUN: llc -mtriple=aarch64-unknown-linux-gnu --aarch64-enable-sink-fold=true < %s | FileCheck %s
5 ; Fold:  ptr - (ptr & (alignment-1))
7 ; To:    ptr & (0 - alignment)
9 ; This needs to be a backend-level fold because only at this stage are pointers
10 ; just registers; in middle-end IR this can only be expressed via the
11 ; @llvm.ptrmask() intrinsic, which is not yet sufficiently widely used.
13 ; https://bugs.llvm.org/show_bug.cgi?id=44448
15 ; The basic positive tests
; Basic positive case on i32: %r = %ptr - (%ptr & (%alignment - 1)).
; The CHECK lines expect the two-instruction neg + and form.
17 define i32 @t0_32(i32 %ptr, i32 %alignment) nounwind {
20 ; CHECK-NEXT: neg w8, w1
21 ; CHECK-NEXT: and w0, w0, w8
23 %mask = add i32 %alignment, -1 ; mask = alignment - 1
24 %bias = and i32 %ptr, %mask ; bias = ptr & mask
25 %r = sub i32 %ptr, %bias ; r = ptr - bias
; Same pattern as the i32 case but on i64 operands.
; The CHECK lines expect neg + and on the 64-bit x registers.
28 define i64 @t1_64(i64 %ptr, i64 %alignment) nounwind {
31 ; CHECK-NEXT: neg x8, x1
32 ; CHECK-NEXT: and x0, x0, x8
34 %mask = add i64 %alignment, -1 ; mask = alignment - 1
35 %bias = and i64 %ptr, %mask ; bias = ptr & mask
36 %r = sub i64 %ptr, %bias ; r = ptr - bias
; Positive case with the operands of the 'and' swapped (%mask first).
; The CHECK lines expect the same neg + and output as the unswapped form.
40 define i32 @t2_commutative(i32 %ptr, i32 %alignment) nounwind {
41 ; CHECK-LABEL: t2_commutative:
43 ; CHECK-NEXT: neg w8, w1
44 ; CHECK-NEXT: and w0, w0, w8
46 %mask = add i32 %alignment, -1 ; mask = alignment - 1
47 %bias = and i32 %mask, %ptr ; swapped
48 %r = sub i32 %ptr, %bias ; r = ptr - bias
; %mask has an extra use: it is also stored to %mask_storage.
; The CHECK lines still expect neg + and for the result; alignment - 1 is
; computed separately (sub w9, w1, #1) only to feed the store.
54 define i32 @t3_extrause0(i32 %ptr, i32 %alignment, i32* %mask_storage) nounwind {
55 ; CHECK-LABEL: t3_extrause0:
57 ; CHECK-NEXT: neg w8, w1
58 ; CHECK-NEXT: sub w9, w1, #1
59 ; CHECK-NEXT: and w0, w0, w8
60 ; CHECK-NEXT: str w9, [x2]
62 %mask = add i32 %alignment, -1 ; mask = alignment - 1
63 store i32 %mask, i32* %mask_storage ; extra use of %mask
64 %bias = and i32 %ptr, %mask ; bias = ptr & mask
65 %r = sub i32 %ptr, %bias ; r = ptr - bias
; Negative case: %bias has an extra use (it is stored to %bias_storage).
; The CHECK lines expect the original sub / and / sub sequence to remain,
; with the 'and' result reused for the store.
68 define i32 @n4_extrause1(i32 %ptr, i32 %alignment, i32* %bias_storage) nounwind {
69 ; CHECK-LABEL: n4_extrause1:
71 ; CHECK-NEXT: sub w8, w1, #1
72 ; CHECK-NEXT: and w8, w0, w8
73 ; CHECK-NEXT: sub w0, w0, w8
74 ; CHECK-NEXT: str w8, [x2]
76 %mask = add i32 %alignment, -1 ; mask = alignment - 1
77 %bias = and i32 %ptr, %mask ; has extra uses, can't fold
78 store i32 %bias, i32* %bias_storage ; extra use of %bias
79 %r = sub i32 %ptr, %bias ; r = ptr - bias
; Negative case: both %mask and %bias have extra uses (each is stored).
; The CHECK lines expect sub / and / sub to remain, with both intermediate
; values kept in registers for their respective stores.
82 define i32 @n5_extrause2(i32 %ptr, i32 %alignment, i32* %mask_storage, i32* %bias_storage) nounwind {
83 ; CHECK-LABEL: n5_extrause2:
85 ; CHECK-NEXT: sub w8, w1, #1
86 ; CHECK-NEXT: and w9, w0, w8
87 ; CHECK-NEXT: str w8, [x2]
88 ; CHECK-NEXT: sub w0, w0, w9
89 ; CHECK-NEXT: str w9, [x3]
91 %mask = add i32 %alignment, -1 ; mask = alignment - 1
92 store i32 %mask, i32* %mask_storage ; extra use of %mask
93 %bias = and i32 %ptr, %mask ; has extra uses, can't fold
94 store i32 %bias, i32* %bias_storage ; extra use of %bias
95 %r = sub i32 %ptr, %bias ; r = ptr - bias
; Negative case: the 'and' masks %ptr1 while the 'sub' subtracts from %ptr0,
; so the value being masked is not the value being subtracted from.
; The CHECK lines expect sub / and / sub to remain.
101 define i32 @n6_different_ptrs(i32 %ptr0, i32 %ptr1, i32 %alignment) nounwind {
102 ; CHECK-LABEL: n6_different_ptrs:
104 ; CHECK-NEXT: sub w8, w2, #1
105 ; CHECK-NEXT: and w8, w1, w8
106 ; CHECK-NEXT: sub w0, w0, w8
108 %mask = add i32 %alignment, -1 ; mask = alignment - 1
109 %bias = and i32 %ptr1, %mask ; not %ptr0
110 %r = sub i32 %ptr0, %bias ; not %ptr1
; Negative case: as with mismatched pointers above, but with the 'and'
; operands swapped (%mask first). %ptr1 is masked, %ptr0 is subtracted from.
; The CHECK lines expect sub / and / sub to remain.
113 define i32 @n7_different_ptrs_commutative(i32 %ptr0, i32 %ptr1, i32 %alignment) nounwind {
114 ; CHECK-LABEL: n7_different_ptrs_commutative:
116 ; CHECK-NEXT: sub w8, w2, #1
117 ; CHECK-NEXT: and w8, w8, w1
118 ; CHECK-NEXT: sub w0, w0, w8
120 %mask = add i32 %alignment, -1 ; mask = alignment - 1
121 %bias = and i32 %mask, %ptr1 ; swapped, not %ptr0
122 %r = sub i32 %ptr0, %bias ; not %ptr1
; Negative case: the mask is %alignment + 1 rather than %alignment - 1.
; The CHECK lines expect add + bic (ptr & ~mask) instead of the neg + and form.
126 define i32 @n8_not_lowbit_mask(i32 %ptr, i32 %alignment) nounwind {
127 ; CHECK-LABEL: n8_not_lowbit_mask:
129 ; CHECK-NEXT: add w8, w1, #1
130 ; CHECK-NEXT: bic w0, w0, w8
132 %mask = add i32 %alignment, 1 ; not -1
133 %bias = and i32 %ptr, %mask ; bias = ptr & mask
134 %r = sub i32 %ptr, %bias ; r = ptr - bias
; Negative case: the subtraction operands are reversed (%bias - %ptr).
; The CHECK lines expect sub / and / sub to remain, with the final
; sub taking the 'and' result as its first source operand.
138 define i32 @n9_sub_is_not_commutative(i32 %ptr, i32 %alignment) nounwind {
139 ; CHECK-LABEL: n9_sub_is_not_commutative:
141 ; CHECK-NEXT: sub w8, w1, #1
142 ; CHECK-NEXT: and w8, w0, w8
143 ; CHECK-NEXT: sub w0, w8, w0
145 %mask = add i32 %alignment, -1 ; mask = alignment - 1
146 %bias = and i32 %ptr, %mask ; bias = ptr & mask
147 %r = sub i32 %bias, %ptr ; wrong order