1 ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 2
2 ; RUN: llc -mtriple=thumbv7-unknown-linux < %s | FileCheck -check-prefixes=CHECK %s
; Declarations of the llvm.exp10 intrinsic overloads used by the functions in
; this file: the scalar form plus 1-, 2-, 3- and 4-element vector forms for
; each of half, float and double.
4 declare half @llvm.exp10.f16(half)
5 declare <1 x half> @llvm.exp10.v1f16(<1 x half>)
6 declare <2 x half> @llvm.exp10.v2f16(<2 x half>)
7 declare <3 x half> @llvm.exp10.v3f16(<3 x half>)
8 declare <4 x half> @llvm.exp10.v4f16(<4 x half>)
9 declare float @llvm.exp10.f32(float)
10 declare <1 x float> @llvm.exp10.v1f32(<1 x float>)
11 declare <2 x float> @llvm.exp10.v2f32(<2 x float>)
12 declare <3 x float> @llvm.exp10.v3f32(<3 x float>)
13 declare <4 x float> @llvm.exp10.v4f32(<4 x float>)
14 declare double @llvm.exp10.f64(double)
15 declare <1 x double> @llvm.exp10.v1f64(<1 x double>)
16 declare <2 x double> @llvm.exp10.v2f64(<2 x double>)
17 declare <3 x double> @llvm.exp10.v3f64(<3 x double>)
18 declare <4 x double> @llvm.exp10.v4f64(<4 x double>)
; Scalar half. The expected output is three library calls in sequence:
; __gnu_h2f_ieee (half -> float), exp10f, then __gnu_f2h_ieee (float -> half),
; wrapped in a push/pop of {r7, lr}.
20 define half @exp10_f16(half %x) {
21 ; CHECK-LABEL: exp10_f16:
23 ; CHECK-NEXT: push {r7, lr}
24 ; CHECK-NEXT: bl __gnu_h2f_ieee
25 ; CHECK-NEXT: bl exp10f
26 ; CHECK-NEXT: bl __gnu_f2h_ieee
27 ; CHECK-NEXT: pop {r7, pc}
28 %r = call half @llvm.exp10.f16(half %x)
; <1 x half>. Unlike the scalar half case, the expected output calls
; __gnu_f2h_ieee first, then __gnu_h2f_ieee, then exp10f, and performs no
; conversion after the exp10f call.
; NOTE(review): presumably the single-element half vector is passed and
; returned as a float under this ABI, which would explain the ordering --
; confirm against the ARM lowering before relying on it.
32 define <1 x half> @exp10_v1f16(<1 x half> %x) {
33 ; CHECK-LABEL: exp10_v1f16:
35 ; CHECK-NEXT: push {r7, lr}
36 ; CHECK-NEXT: bl __gnu_f2h_ieee
37 ; CHECK-NEXT: bl __gnu_h2f_ieee
38 ; CHECK-NEXT: bl exp10f
39 ; CHECK-NEXT: pop {r7, pc}
40 %r = call <1 x half> @llvm.exp10.v1f16(<1 x half> %x)
; <2 x half>. The expected output handles the two elements one after the
; other, each through the __gnu_h2f_ieee / exp10f / __gnu_f2h_ieee sequence.
; The element arriving in r1 is parked in r4 while the r0 element is processed;
; the first result is kept in r5 and the results are returned in r0 and r1.
44 define <2 x half> @exp10_v2f16(<2 x half> %x) {
45 ; CHECK-LABEL: exp10_v2f16:
47 ; CHECK-NEXT: push {r4, r5, r7, lr}
48 ; CHECK-NEXT: mov r4, r1
49 ; CHECK-NEXT: bl __gnu_h2f_ieee
50 ; CHECK-NEXT: bl exp10f
51 ; CHECK-NEXT: bl __gnu_f2h_ieee
52 ; CHECK-NEXT: mov r5, r0
53 ; CHECK-NEXT: mov r0, r4
54 ; CHECK-NEXT: bl __gnu_h2f_ieee
55 ; CHECK-NEXT: bl exp10f
56 ; CHECK-NEXT: bl __gnu_f2h_ieee
57 ; CHECK-NEXT: mov r1, r0
58 ; CHECK-NEXT: mov r0, r5
59 ; CHECK-NEXT: pop {r4, r5, r7, pc}
60 %r = call <2 x half> @llvm.exp10.v2f16(<2 x half> %x)
; <3 x half>. The expected output runs the __gnu_h2f_ieee / exp10f /
; __gnu_f2h_ieee sequence three times, on the elements arriving in r0, r1 and
; r2 in that order. r4 and r6 hold the not-yet-processed inputs, r5 keeps the
; first result, and r6 is reused for the second result. The three results are
; returned in r0, r1 and r2.
64 define <3 x half> @exp10_v3f16(<3 x half> %x) {
65 ; CHECK-LABEL: exp10_v3f16:
67 ; CHECK-NEXT: push {r4, r5, r6, lr}
68 ; CHECK-NEXT: mov r4, r2
69 ; CHECK-NEXT: mov r6, r1
70 ; CHECK-NEXT: bl __gnu_h2f_ieee
71 ; CHECK-NEXT: bl exp10f
72 ; CHECK-NEXT: bl __gnu_f2h_ieee
73 ; CHECK-NEXT: mov r5, r0
74 ; CHECK-NEXT: mov r0, r6
75 ; CHECK-NEXT: bl __gnu_h2f_ieee
76 ; CHECK-NEXT: bl exp10f
77 ; CHECK-NEXT: bl __gnu_f2h_ieee
78 ; CHECK-NEXT: mov r6, r0
79 ; CHECK-NEXT: mov r0, r4
80 ; CHECK-NEXT: bl __gnu_h2f_ieee
81 ; CHECK-NEXT: bl exp10f
82 ; CHECK-NEXT: bl __gnu_f2h_ieee
83 ; CHECK-NEXT: mov r2, r0
84 ; CHECK-NEXT: mov r0, r5
85 ; CHECK-NEXT: mov r1, r6
86 ; CHECK-NEXT: pop {r4, r5, r6, pc}
87 %r = call <3 x half> @llvm.exp10.v3f16(<3 x half> %x)
; <4 x half>. The expected output runs the __gnu_h2f_ieee / exp10f /
; __gnu_f2h_ieee sequence four times, on the elements arriving in r0..r3 in
; that order. Pending inputs are parked in r7, r6 and r4; completed results are
; kept in r5, r7 and r6 until all four are returned in r0..r3.
; NOTE(review): the 4-byte "sub sp" / "add sp" pair presumably keeps sp 8-byte
; aligned after the five-register push -- confirm.
91 define <4 x half> @exp10_v4f16(<4 x half> %x) {
92 ; CHECK-LABEL: exp10_v4f16:
94 ; CHECK-NEXT: push {r4, r5, r6, r7, lr}
95 ; CHECK-NEXT: sub sp, #4
96 ; CHECK-NEXT: mov r4, r3
97 ; CHECK-NEXT: mov r6, r2
98 ; CHECK-NEXT: mov r7, r1
99 ; CHECK-NEXT: bl __gnu_h2f_ieee
100 ; CHECK-NEXT: bl exp10f
101 ; CHECK-NEXT: bl __gnu_f2h_ieee
102 ; CHECK-NEXT: mov r5, r0
103 ; CHECK-NEXT: mov r0, r7
104 ; CHECK-NEXT: bl __gnu_h2f_ieee
105 ; CHECK-NEXT: bl exp10f
106 ; CHECK-NEXT: bl __gnu_f2h_ieee
107 ; CHECK-NEXT: mov r7, r0
108 ; CHECK-NEXT: mov r0, r6
109 ; CHECK-NEXT: bl __gnu_h2f_ieee
110 ; CHECK-NEXT: bl exp10f
111 ; CHECK-NEXT: bl __gnu_f2h_ieee
112 ; CHECK-NEXT: mov r6, r0
113 ; CHECK-NEXT: mov r0, r4
114 ; CHECK-NEXT: bl __gnu_h2f_ieee
115 ; CHECK-NEXT: bl exp10f
116 ; CHECK-NEXT: bl __gnu_f2h_ieee
117 ; CHECK-NEXT: mov r3, r0
118 ; CHECK-NEXT: mov r0, r5
119 ; CHECK-NEXT: mov r1, r7
120 ; CHECK-NEXT: mov r2, r6
121 ; CHECK-NEXT: add sp, #4
122 ; CHECK-NEXT: pop {r4, r5, r6, r7, pc}
123 %r = call <4 x half> @llvm.exp10.v4f16(<4 x half> %x)
; Scalar float. The expected output is a single direct branch ("b", not "bl")
; to exp10f, i.e. a tail call with no register saves.
127 define float @exp10_f32(float %x) {
128 ; CHECK-LABEL: exp10_f32:
130 ; CHECK-NEXT: b exp10f
131 %r = call float @llvm.exp10.f32(float %x)
; <1 x float>. The expected output is a regular call ("bl") to exp10f wrapped
; in a push/pop of {r7, lr}, rather than the direct branch expected for the
; scalar float case.
135 define <1 x float> @exp10_v1f32(<1 x float> %x) {
136 ; CHECK-LABEL: exp10_v1f32:
138 ; CHECK-NEXT: push {r7, lr}
139 ; CHECK-NEXT: bl exp10f
140 ; CHECK-NEXT: pop {r7, pc}
141 %r = call <1 x float> @llvm.exp10.v1f32(<1 x float> %x)
; <2 x float>. The expected output moves the incoming r0:r1 pair into d8 and
; calls exp10f twice: first on s17 (the high lane of d8), keeping that result
; in r4, then on s16 (the low lane). The low-lane result is returned in r0 and
; the high-lane result in r1.
145 define <2 x float> @exp10_v2f32(<2 x float> %x) {
146 ; CHECK-LABEL: exp10_v2f32:
148 ; CHECK-NEXT: push {r4, lr}
149 ; CHECK-NEXT: vpush {d8}
150 ; CHECK-NEXT: vmov d8, r0, r1
151 ; CHECK-NEXT: vmov r0, s17
152 ; CHECK-NEXT: bl exp10f
153 ; CHECK-NEXT: mov r4, r0
154 ; CHECK-NEXT: vmov r0, s16
155 ; CHECK-NEXT: bl exp10f
156 ; CHECK-NEXT: mov r1, r4
157 ; CHECK-NEXT: vpop {d8}
158 ; CHECK-NEXT: pop {r4, pc}
159 %r = call <2 x float> @llvm.exp10.v2f32(<2 x float> %x)
; <3 x float>. The expected output calls exp10f three times: first on the
; element read back from s2 (the r2 input), then on the r1 input (saved in r4),
; then on the r0 input (saved in r5). The results are assembled into s16, s17
; and s18 (d8/d9) and returned through r0..r3.
163 define <3 x float> @exp10_v3f32(<3 x float> %x) {
164 ; CHECK-LABEL: exp10_v3f32:
166 ; CHECK-NEXT: push {r4, r5, r6, lr}
167 ; CHECK-NEXT: vpush {d8, d9}
168 ; CHECK-NEXT: vmov d1, r2, r3
169 ; CHECK-NEXT: mov r5, r0
170 ; CHECK-NEXT: vmov d0, r0, r1
171 ; CHECK-NEXT: mov r4, r1
172 ; CHECK-NEXT: vmov r0, s2
173 ; CHECK-NEXT: bl exp10f
174 ; CHECK-NEXT: mov r6, r0
175 ; CHECK-NEXT: mov r0, r4
176 ; CHECK-NEXT: bl exp10f
177 ; CHECK-NEXT: vmov s17, r0
178 ; CHECK-NEXT: mov r0, r5
179 ; CHECK-NEXT: bl exp10f
180 ; CHECK-NEXT: vmov s16, r0
181 ; CHECK-NEXT: vmov s18, r6
182 ; CHECK-NEXT: vmov r0, r1, d8
183 ; CHECK-NEXT: vmov r2, r3, d9
184 ; CHECK-NEXT: vpop {d8, d9}
185 ; CHECK-NEXT: pop {r4, r5, r6, pc}
186 %r = call <3 x float> @llvm.exp10.v3f32(<3 x float> %x)
; <4 x float>. The expected output calls exp10f four times, on the inputs from
; r1, r3, r2 and r0 in that order (the latter three are saved in r4, r5 and r6
; across the calls). The results are placed in s17, s19, s18 and s16
; respectively, then returned through d8/d9 into r0..r3.
; NOTE(review): the 4-byte "sub sp" / "add sp" pair presumably keeps sp 8-byte
; aligned after the five-register push -- confirm.
190 define <4 x float> @exp10_v4f32(<4 x float> %x) {
191 ; CHECK-LABEL: exp10_v4f32:
193 ; CHECK-NEXT: push {r4, r5, r6, r7, lr}
194 ; CHECK-NEXT: sub sp, #4
195 ; CHECK-NEXT: vpush {d8, d9}
196 ; CHECK-NEXT: mov r6, r0
197 ; CHECK-NEXT: mov r0, r1
198 ; CHECK-NEXT: mov r4, r3
199 ; CHECK-NEXT: mov r5, r2
200 ; CHECK-NEXT: bl exp10f
201 ; CHECK-NEXT: mov r7, r0
202 ; CHECK-NEXT: mov r0, r4
203 ; CHECK-NEXT: bl exp10f
204 ; CHECK-NEXT: vmov s19, r0
205 ; CHECK-NEXT: mov r0, r5
206 ; CHECK-NEXT: bl exp10f
207 ; CHECK-NEXT: vmov s18, r0
208 ; CHECK-NEXT: mov r0, r6
209 ; CHECK-NEXT: vmov s17, r7
210 ; CHECK-NEXT: bl exp10f
211 ; CHECK-NEXT: vmov s16, r0
212 ; CHECK-NEXT: vmov r2, r3, d9
213 ; CHECK-NEXT: vmov r0, r1, d8
214 ; CHECK-NEXT: vpop {d8, d9}
215 ; CHECK-NEXT: add sp, #4
216 ; CHECK-NEXT: pop {r4, r5, r6, r7, pc}
217 %r = call <4 x float> @llvm.exp10.v4f32(<4 x float> %x)
; Scalar double. The expected output is a single direct branch ("b", not "bl")
; to exp10, i.e. a tail call with no register saves.
221 define double @exp10_f64(double %x) {
222 ; CHECK-LABEL: exp10_f64:
224 ; CHECK-NEXT: b exp10
225 %r = call double @llvm.exp10.f64(double %x)
230 ; define <1 x double> @exp10_v1f64(<1 x double> %x) {
231 ; %r = call <1 x double> @llvm.exp10.v1f64(<1 x double> %x)
232 ; ret <1 x double> %r
; <2 x double>. The expected output calls exp10 twice: first on the element in
; r0:r1, keeping that result in r6:r7, then on the element that arrived in
; r2:r3 (saved in r5:r4). The first result is returned in r0:r1 and the second
; in r2:r3.
235 define <2 x double> @exp10_v2f64(<2 x double> %x) {
236 ; CHECK-LABEL: exp10_v2f64:
238 ; CHECK-NEXT: push {r4, r5, r6, r7, lr}
239 ; CHECK-NEXT: sub sp, #4
240 ; CHECK-NEXT: mov r4, r3
241 ; CHECK-NEXT: mov r5, r2
242 ; CHECK-NEXT: bl exp10
243 ; CHECK-NEXT: mov r6, r0
244 ; CHECK-NEXT: mov r7, r1
245 ; CHECK-NEXT: mov r0, r5
246 ; CHECK-NEXT: mov r1, r4
247 ; CHECK-NEXT: bl exp10
248 ; CHECK-NEXT: mov r2, r0
249 ; CHECK-NEXT: mov r3, r1
250 ; CHECK-NEXT: mov r0, r6
251 ; CHECK-NEXT: mov r1, r7
252 ; CHECK-NEXT: add sp, #4
253 ; CHECK-NEXT: pop {r4, r5, r6, r7, pc}
254 %r = call <2 x double> @llvm.exp10.v2f64(<2 x double> %x)
; <3 x double>. In the expected output the incoming r0 is saved in r4 and used
; as the address the results are stored to. The first element is taken from
; r2:r3 and the other two are loaded from the stack ([sp, #24] and
; [sp, #32]). exp10 is called three times; the first two results are packed
; into d8/d9 and written with vst1.64 (post-incrementing r4), and the third is
; written with strd.
258 define <3 x double> @exp10_v3f64(<3 x double> %x) {
259 ; CHECK-LABEL: exp10_v3f64:
261 ; CHECK-NEXT: push {r4, lr}
262 ; CHECK-NEXT: vpush {d8, d9}
263 ; CHECK-NEXT: mov r4, r0
264 ; CHECK-NEXT: mov r1, r3
265 ; CHECK-NEXT: mov r0, r2
266 ; CHECK-NEXT: bl exp10
267 ; CHECK-NEXT: ldrd r2, r3, [sp, #24]
268 ; CHECK-NEXT: vmov d8, r0, r1
269 ; CHECK-NEXT: mov r1, r3
270 ; CHECK-NEXT: mov r0, r2
271 ; CHECK-NEXT: bl exp10
272 ; CHECK-NEXT: ldrd r2, r3, [sp, #32]
273 ; CHECK-NEXT: vmov d9, r0, r1
274 ; CHECK-NEXT: mov r1, r3
275 ; CHECK-NEXT: vst1.64 {d8, d9}, [r4:128]!
276 ; CHECK-NEXT: mov r0, r2
277 ; CHECK-NEXT: bl exp10
278 ; CHECK-NEXT: strd r0, r1, [r4]
279 ; CHECK-NEXT: vpop {d8, d9}
280 ; CHECK-NEXT: pop {r4, pc}
281 %r = call <3 x double> @llvm.exp10.v3f64(<3 x double> %x)
; <4 x double>. In the expected output the incoming r0 is saved in r4 and used
; as the address the results are stored to. The first element is taken from
; r2:r3; the others are loaded from the stack (ldrd from [sp, #56], and a
; vld1.64 of two doubles from sp + 64). exp10 is called four times and the
; results are collected in d8..d11 (d8 first, then d11, d9, d10) before being
; written out with two vst1.64 stores.
285 define <4 x double> @exp10_v4f64(<4 x double> %x) {
286 ; CHECK-LABEL: exp10_v4f64:
288 ; CHECK-NEXT: push.w {r4, r5, r6, r7, r8, lr}
289 ; CHECK-NEXT: vpush {d8, d9, d10, d11}
290 ; CHECK-NEXT: mov r4, r0
291 ; CHECK-NEXT: mov r1, r3
292 ; CHECK-NEXT: mov r0, r2
293 ; CHECK-NEXT: bl exp10
294 ; CHECK-NEXT: add r2, sp, #64
295 ; CHECK-NEXT: vmov d8, r0, r1
296 ; CHECK-NEXT: vld1.64 {d16, d17}, [r2]
297 ; CHECK-NEXT: vmov r2, r3, d17
298 ; CHECK-NEXT: vmov r5, r8, d16
299 ; CHECK-NEXT: mov r0, r2
300 ; CHECK-NEXT: mov r1, r3
301 ; CHECK-NEXT: bl exp10
302 ; CHECK-NEXT: mov r7, r0
303 ; CHECK-NEXT: mov r6, r1
304 ; CHECK-NEXT: ldrd r0, r1, [sp, #56]
305 ; CHECK-NEXT: bl exp10
306 ; CHECK-NEXT: vmov d9, r0, r1
307 ; CHECK-NEXT: mov r0, r5
308 ; CHECK-NEXT: mov r1, r8
309 ; CHECK-NEXT: vmov d11, r7, r6
310 ; CHECK-NEXT: bl exp10
311 ; CHECK-NEXT: vmov d10, r0, r1
312 ; CHECK-NEXT: vst1.64 {d8, d9}, [r4:128]!
313 ; CHECK-NEXT: vst1.64 {d10, d11}, [r4:128]
314 ; CHECK-NEXT: vpop {d8, d9, d10, d11}
315 ; CHECK-NEXT: pop.w {r4, r5, r6, r7, r8, pc}
316 %r = call <4 x double> @llvm.exp10.v4f64(<4 x double> %x)