1 ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
2 ; RUN: llc -mtriple=arm64-apple-iphoneos -aarch64-enable-sink-fold=true -o - %s | FileCheck %s
4 define i3 @sign_i3(i3 %a) {
5 ; CHECK-LABEL: sign_i3:
7 ; CHECK-NEXT: sbfx w8, w0, #2, #1
8 ; CHECK-NEXT: orr w0, w8, #0x1
10 %c = icmp sgt i3 %a, -1
11 %res = select i1 %c, i3 1, i3 -1
15 define i4 @sign_i4(i4 %a) {
16 ; CHECK-LABEL: sign_i4:
18 ; CHECK-NEXT: sbfx w8, w0, #3, #1
19 ; CHECK-NEXT: orr w0, w8, #0x1
21 %c = icmp sgt i4 %a, -1
22 %res = select i1 %c, i4 1, i4 -1
26 define i8 @sign_i8(i8 %a) {
27 ; CHECK-LABEL: sign_i8:
29 ; CHECK-NEXT: sbfx w8, w0, #7, #1
30 ; CHECK-NEXT: orr w0, w8, #0x1
32 %c = icmp sgt i8 %a, -1
33 %res = select i1 %c, i8 1, i8 -1
37 define i16 @sign_i16(i16 %a) {
38 ; CHECK-LABEL: sign_i16:
40 ; CHECK-NEXT: sbfx w8, w0, #15, #1
41 ; CHECK-NEXT: orr w0, w8, #0x1
43 %c = icmp sgt i16 %a, -1
44 %res = select i1 %c, i16 1, i16 -1
48 define i32 @sign_i32(i32 %a) {
49 ; CHECK-LABEL: sign_i32:
51 ; CHECK-NEXT: asr w8, w0, #31
52 ; CHECK-NEXT: orr w0, w8, #0x1
54 %c = icmp sgt i32 %a, -1
55 %res = select i1 %c, i32 1, i32 -1
59 define i64 @sign_i64(i64 %a) {
60 ; CHECK-LABEL: sign_i64:
62 ; CHECK-NEXT: asr x8, x0, #63
63 ; CHECK-NEXT: orr x0, x8, #0x1
65 %c = icmp sgt i64 %a, -1
66 %res = select i1 %c, i64 1, i64 -1
71 define i64 @not_sign_i64(i64 %a) {
72 ; CHECK-LABEL: not_sign_i64:
74 ; CHECK-NEXT: mov w8, #1 // =0x1
75 ; CHECK-NEXT: cmp x0, #0
76 ; CHECK-NEXT: cneg x0, x8, le
78 %c = icmp sgt i64 %a, 0
79 %res = select i1 %c, i64 1, i64 -1
83 define i64 @not_sign_i64_2(i64 %a) {
84 ; CHECK-LABEL: not_sign_i64_2:
86 ; CHECK-NEXT: asr x0, x0, #63
88 %c = icmp sgt i64 %a, -1
89 %res = select i1 %c, i64 0, i64 -1
93 define i64 @not_sign_i64_3(i64 %a) {
94 ; CHECK-LABEL: not_sign_i64_3:
96 ; CHECK-NEXT: mvn x8, x0
97 ; CHECK-NEXT: lsr x0, x8, #63
99 %c = icmp sgt i64 %a, -1
100 %res = select i1 %c, i64 1, i64 0
104 define i64 @not_sign_i64_4(i64 %a) {
105 ; CHECK-LABEL: not_sign_i64_4:
107 ; CHECK-NEXT: mov x0, #-1 // =0xffffffffffffffff
109 %c = icmp ugt i64 %a, -1
110 %res = select i1 %c, i64 1, i64 -1
114 define <7 x i8> @sign_7xi8(<7 x i8> %a) {
115 ; CHECK-LABEL: sign_7xi8:
117 ; CHECK-NEXT: movi v1.8b, #1
118 ; CHECK-NEXT: cmlt v0.8b, v0.8b, #0
119 ; CHECK-NEXT: orr v0.8b, v0.8b, v1.8b
121 %c = icmp sgt <7 x i8> %a, <i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1>
122 %res = select <7 x i1> %c, <7 x i8> <i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1>, <7 x i8> <i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1>
126 define <8 x i8> @sign_8xi8(<8 x i8> %a) {
127 ; CHECK-LABEL: sign_8xi8:
129 ; CHECK-NEXT: movi v1.8b, #1
130 ; CHECK-NEXT: cmlt v0.8b, v0.8b, #0
131 ; CHECK-NEXT: orr v0.8b, v0.8b, v1.8b
133 %c = icmp sgt <8 x i8> %a, <i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1>
134 %res = select <8 x i1> %c, <8 x i8> <i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1>, <8 x i8> <i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1>
138 define <16 x i8> @sign_16xi8(<16 x i8> %a) {
139 ; CHECK-LABEL: sign_16xi8:
141 ; CHECK-NEXT: movi v1.16b, #1
142 ; CHECK-NEXT: cmlt v0.16b, v0.16b, #0
143 ; CHECK-NEXT: orr v0.16b, v0.16b, v1.16b
145 %c = icmp sgt <16 x i8> %a, <i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1>
146 %res = select <16 x i1> %c, <16 x i8> <i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1>, <16 x i8> <i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1>
150 define <3 x i32> @sign_3xi32(<3 x i32> %a) {
151 ; CHECK-LABEL: sign_3xi32:
153 ; CHECK-NEXT: cmlt v0.4s, v0.4s, #0
154 ; CHECK-NEXT: orr v0.4s, #1
156 %c = icmp sgt <3 x i32> %a, <i32 -1, i32 -1, i32 -1>
157 %res = select <3 x i1> %c, <3 x i32> <i32 1, i32 1, i32 1>, <3 x i32> <i32 -1, i32 -1, i32 -1>
161 define <4 x i32> @sign_4xi32(<4 x i32> %a) {
162 ; CHECK-LABEL: sign_4xi32:
164 ; CHECK-NEXT: cmlt v0.4s, v0.4s, #0
165 ; CHECK-NEXT: orr v0.4s, #1
167 %c = icmp sgt <4 x i32> %a, <i32 -1, i32 -1, i32 -1, i32 -1>
168 %res = select <4 x i1> %c, <4 x i32> <i32 1, i32 1, i32 1, i32 1>, <4 x i32> <i32 -1, i32 -1, i32 -1, i32 -1>
172 define <4 x i32> @sign_4xi32_multi_use(<4 x i32> %a) {
173 ; CHECK-LABEL: sign_4xi32_multi_use:
175 ; CHECK-NEXT: sub sp, sp, #32
176 ; CHECK-NEXT: str x30, [sp, #16] // 8-byte Folded Spill
177 ; CHECK-NEXT: .cfi_def_cfa_offset 32
178 ; CHECK-NEXT: .cfi_offset w30, -16
179 ; CHECK-NEXT: movi v1.2d, #0xffffffffffffffff
180 ; CHECK-NEXT: cmlt v2.4s, v0.4s, #0
181 ; CHECK-NEXT: orr v2.4s, #1
182 ; CHECK-NEXT: cmgt v1.4s, v0.4s, v1.4s
183 ; CHECK-NEXT: str q2, [sp] // 16-byte Folded Spill
184 ; CHECK-NEXT: xtn v0.4h, v1.4s
185 ; CHECK-NEXT: bl use_4xi1
186 ; CHECK-NEXT: ldr q0, [sp] // 16-byte Folded Reload
187 ; CHECK-NEXT: ldr x30, [sp, #16] // 8-byte Folded Reload
188 ; CHECK-NEXT: add sp, sp, #32
190 %c = icmp sgt <4 x i32> %a, <i32 -1, i32 -1, i32 -1, i32 -1>
191 %res = select <4 x i1> %c, <4 x i32> <i32 1, i32 1, i32 1, i32 1>, <4 x i32> <i32 -1, i32 -1, i32 -1, i32 -1>
192 call void @use_4xi1(<4 x i1> %c)
196 ; Second icmp operand breaks sign pattern.
197 define <4 x i32> @not_sign_4xi32(<4 x i32> %a) {
198 ; CHECK-LABEL: not_sign_4xi32:
200 ; CHECK-NEXT: adrp x8, .LCPI16_0
201 ; CHECK-NEXT: movi v2.4s, #1
202 ; CHECK-NEXT: ldr q1, [x8, :lo12:.LCPI16_0]
203 ; CHECK-NEXT: cmgt v0.4s, v0.4s, v1.4s
204 ; CHECK-NEXT: and v1.16b, v0.16b, v2.16b
205 ; CHECK-NEXT: orn v0.16b, v1.16b, v0.16b
207 %c = icmp sgt <4 x i32> %a, <i32 1, i32 -1, i32 -1, i32 -1>
208 %res = select <4 x i1> %c, <4 x i32> <i32 1, i32 1, i32 1, i32 1>, <4 x i32> <i32 -1, i32 -1, i32 -1, i32 -1>
212 ; First select operand breaks sign pattern.
213 define <4 x i32> @not_sign_4xi32_2(<4 x i32> %a) {
214 ; CHECK-LABEL: not_sign_4xi32_2:
216 ; CHECK-NEXT: adrp x8, .LCPI17_0
217 ; CHECK-NEXT: cmlt v0.4s, v0.4s, #0
218 ; CHECK-NEXT: ldr q1, [x8, :lo12:.LCPI17_0]
219 ; CHECK-NEXT: orr v0.16b, v0.16b, v1.16b
221 %c = icmp sgt <4 x i32> %a, <i32 -1, i32 -1, i32 -1, i32 -1>
222 %res = select <4 x i1> %c, <4 x i32> <i32 1, i32 1, i32 -1, i32 1>, <4 x i32> <i32 -1, i32 -1, i32 -1, i32 -1>
226 ; Second select operand breaks sign pattern.
227 define <4 x i32> @not_sign_4xi32_3(<4 x i32> %a) {
228 ; CHECK-LABEL: not_sign_4xi32_3:
230 ; CHECK-NEXT: movi v1.2d, #0xffffffffffffffff
231 ; CHECK-NEXT: adrp x8, .LCPI18_0
232 ; CHECK-NEXT: cmgt v0.4s, v0.4s, v1.4s
233 ; CHECK-NEXT: ldr q1, [x8, :lo12:.LCPI18_0]
234 ; CHECK-NEXT: bic v1.16b, v1.16b, v0.16b
235 ; CHECK-NEXT: sub v0.4s, v1.4s, v0.4s
237 %c = icmp sgt <4 x i32> %a, <i32 -1, i32 -1, i32 -1, i32 -1>
238 %res = select <4 x i1> %c, <4 x i32> <i32 1, i32 1, i32 1, i32 1>, <4 x i32> <i32 -1, i32 -1, i32 -1, i32 1>
243 define <4 x i65> @sign_4xi65(<4 x i65> %a) {
244 ; CHECK-LABEL: sign_4xi65:
246 ; CHECK-NEXT: sbfx x8, x1, #0, #1
247 ; CHECK-NEXT: sbfx x9, x5, #0, #1
248 ; CHECK-NEXT: sbfx x10, x3, #0, #1
249 ; CHECK-NEXT: lsr x1, x8, #63
250 ; CHECK-NEXT: orr x8, x8, #0x1
251 ; CHECK-NEXT: lsr x3, x10, #63
252 ; CHECK-NEXT: fmov d0, x8
253 ; CHECK-NEXT: sbfx x8, x7, #0, #1
254 ; CHECK-NEXT: lsr x5, x9, #63
255 ; CHECK-NEXT: orr x2, x10, #0x1
256 ; CHECK-NEXT: orr x4, x9, #0x1
257 ; CHECK-NEXT: lsr x7, x8, #63
258 ; CHECK-NEXT: orr x6, x8, #0x1
259 ; CHECK-NEXT: mov v0.d[1], x1
260 ; CHECK-NEXT: fmov x0, d0
262 %c = icmp sgt <4 x i65> %a, <i65 -1, i65 -1, i65 -1, i65 -1>
263 %res = select <4 x i1> %c, <4 x i65> <i65 1, i65 1, i65 1, i65 1>, <4 x i65 > <i65 -1, i65 -1, i65 -1, i65 -1>
267 declare void @use_4xi1(<4 x i1>)