1 ; RUN: llc < %s -mtriple=thumbv7-none-eabi -mcpu=cortex-m3 | FileCheck %s -check-prefix=CHECK -check-prefix=SOFT -check-prefix=NONE
2 ; RUN: llc < %s -mtriple=thumbv7-none-eabihf -mcpu=cortex-m4 | FileCheck %s -check-prefix=CHECK -check-prefix=SOFT -check-prefix=SP
3 ; RUN: llc < %s -mtriple=thumbv7-none-eabihf -mcpu=cortex-m7 | FileCheck %s -check-prefix=CHECK -check-prefix=HARD -check-prefix=DP -check-prefix=VFP -check-prefix=FP-ARMv8
4 ; RUN: llc < %s -mtriple=thumbv7-none-eabihf -mcpu=cortex-m7 -mattr=-fp64 | FileCheck %s -check-prefix=CHECK -check-prefix=SOFT -check-prefix=SP
5 ; RUN: llc < %s -mtriple=thumbv7-none-eabihf -mcpu=cortex-a7 | FileCheck %s -check-prefix=CHECK -check-prefix=HARD -check-prefix=DP -check-prefix=NEON -check-prefix=VFP4
6 ; RUN: llc < %s -mtriple=thumbv7-none-eabihf -mcpu=cortex-a57 | FileCheck %s -check-prefix=CHECK -check-prefix=HARD -check-prefix=DP -check-prefix=NEON -check-prefix=FP-ARMv8
8 declare double @llvm.sqrt.f64(double %Val)
9 define double @sqrt_d(double %a) {
10 ; CHECK-LABEL: sqrt_d:
11 ; SOFT: {{(bl|b)}} sqrt
12 ; HARD: vsqrt.f64 d0, d0
13 %1 = call double @llvm.sqrt.f64(double %a)
17 declare double @llvm.powi.f64.i32(double %Val, i32 %power)
18 define double @powi_d(double %a, i32 %b) {
19 ; CHECK-LABEL: powi_d:
20 ; SOFT: {{(bl|b)}} __powidf2
22 %1 = call double @llvm.powi.f64.i32(double %a, i32 %b)
26 declare double @llvm.sin.f64(double %Val)
27 define double @sin_d(double %a) {
29 ; SOFT: {{(bl|b)}} sin
31 %1 = call double @llvm.sin.f64(double %a)
35 declare double @llvm.cos.f64(double %Val)
36 define double @cos_d(double %a) {
38 ; SOFT: {{(bl|b)}} cos
40 %1 = call double @llvm.cos.f64(double %a)
44 declare double @llvm.pow.f64(double %Val, double %power)
45 define double @pow_d(double %a, double %b) {
47 ; SOFT: {{(bl|b)}} pow
49 %1 = call double @llvm.pow.f64(double %a, double %b)
53 declare double @llvm.exp.f64(double %Val)
54 define double @exp_d(double %a) {
56 ; SOFT: {{(bl|b)}} exp
58 %1 = call double @llvm.exp.f64(double %a)
62 declare double @llvm.exp2.f64(double %Val)
63 define double @exp2_d(double %a) {
64 ; CHECK-LABEL: exp2_d:
65 ; SOFT: {{(bl|b)}} exp2
67 %1 = call double @llvm.exp2.f64(double %a)
71 declare double @llvm.log.f64(double %Val)
72 define double @log_d(double %a) {
74 ; SOFT: {{(bl|b)}} log
76 %1 = call double @llvm.log.f64(double %a)
80 declare double @llvm.log10.f64(double %Val)
81 define double @log10_d(double %a) {
82 ; CHECK-LABEL: log10_d:
83 ; SOFT: {{(bl|b)}} log10
85 %1 = call double @llvm.log10.f64(double %a)
89 declare double @llvm.log2.f64(double %Val)
90 define double @log2_d(double %a) {
91 ; CHECK-LABEL: log2_d:
92 ; SOFT: {{(bl|b)}} log2
94 %1 = call double @llvm.log2.f64(double %a)
98 declare double @llvm.fma.f64(double %a, double %b, double %c)
99 define double @fma_d(double %a, double %b, double %c) {
100 ; CHECK-LABEL: fma_d:
101 ; SOFT: {{(bl|b)}} fma
103 %1 = call double @llvm.fma.f64(double %a, double %b, double %c)
107 ; FIXME: the FPv4-SP version is less efficient than the no-FPU version
108 declare double @llvm.fabs.f64(double %Val)
109 define double @abs_d(double %a) {
110 ; CHECK-LABEL: abs_d:
111 ; NONE: bic r1, r1, #-2147483648
112 ; SP: vldr [[D1:d[0-9]+]], .LCPI{{.*}}
113 ; SP-DAG: vmov [[R2:r[0-9]+]], [[R3:r[0-9]+]], [[D1]]
114 ; SP-DAG: vmov [[R0:r[0-9]+]], [[R1:r[0-9]+]], [[D0:d[0-9]+]]
115 ; SP: lsrs [[R4:r[0-9]+]], [[R3]], #31
116 ; SP: bfi [[R5:r[0-9]+]], [[R4]], #31, #1
117 ; SP: vmov [[D0]], [[R0]], [[R5]]
118 ; DP: vabs.f64 d0, d0
119 %1 = call double @llvm.fabs.f64(double %a)
123 declare double @llvm.copysign.f64(double %Mag, double %Sgn)
124 define double @copysign_d(double %a, double %b) {
125 ; CHECK-LABEL: copysign_d:
126 ; SOFT: lsrs [[REG:r[0-9]+]], {{r[0-9]+}}, #31
127 ; SOFT: bfi {{r[0-9]+}}, [[REG]], #31, #1
128 ; VFP: lsrs [[REG:r[0-9]+]], {{r[0-9]+}}, #31
129 ; VFP: bfi {{r[0-9]+}}, [[REG]], #31, #1
130 ; NEON: vmov.i32 d16, #0x80000000
131 ; NEON-NEXT: vshl.i64 d16, d16, #32
132 ; NEON-NEXT: vbit d0, d1, d16
134 %1 = call double @llvm.copysign.f64(double %a, double %b)
138 declare double @llvm.floor.f64(double %Val)
139 define double @floor_d(double %a) {
140 ; CHECK-LABEL: floor_d:
141 ; SOFT: {{(bl|b)}} floor
143 ; FP-ARMv8: vrintm.f64
144 %1 = call double @llvm.floor.f64(double %a)
148 declare double @llvm.ceil.f64(double %Val)
149 define double @ceil_d(double %a) {
150 ; CHECK-LABEL: ceil_d:
151 ; SOFT: {{(bl|b)}} ceil
153 ; FP-ARMv8: vrintp.f64
154 %1 = call double @llvm.ceil.f64(double %a)
158 declare double @llvm.trunc.f64(double %Val)
159 define double @trunc_d(double %a) {
160 ; CHECK-LABEL: trunc_d:
161 ; SOFT: {{(bl|b)}} trunc
163 ; FP-ARMv8: vrintz.f64
164 %1 = call double @llvm.trunc.f64(double %a)
168 declare double @llvm.rint.f64(double %Val)
169 define double @rint_d(double %a) {
170 ; CHECK-LABEL: rint_d:
171 ; SOFT: {{(bl|b)}} rint
173 ; FP-ARMv8: vrintx.f64
174 %1 = call double @llvm.rint.f64(double %a)
178 declare double @llvm.nearbyint.f64(double %Val)
179 define double @nearbyint_d(double %a) {
180 ; CHECK-LABEL: nearbyint_d:
181 ; SOFT: {{(bl|b)}} nearbyint
183 ; FP-ARMv8: vrintr.f64
184 %1 = call double @llvm.nearbyint.f64(double %a)
188 declare double @llvm.round.f64(double %Val)
189 define double @round_d(double %a) {
190 ; CHECK-LABEL: round_d:
191 ; SOFT: {{(bl|b)}} round
193 ; FP-ARMv8: vrinta.f64
194 %1 = call double @llvm.round.f64(double %a)
198 declare double @llvm.fmuladd.f64(double %a, double %b, double %c)
199 define double @fmuladd_d(double %a, double %b, double %c) {
200 ; CHECK-LABEL: fmuladd_d:
201 ; SOFT: bl __aeabi_dmul
202 ; SOFT: bl __aeabi_dadd
206 %1 = call double @llvm.fmuladd.f64(double %a, double %b, double %c)
210 declare i16 @llvm.convert.to.fp16.f64(double %a)
211 define i16 @d_to_h(double %a) {
212 ; CHECK-LABEL: d_to_h:
213 ; SOFT: bl __aeabi_d2h
214 ; VFP4: bl __aeabi_d2h
215 ; FP-ARMv8: vcvt{{[bt]}}.f16.f64
216 %1 = call i16 @llvm.convert.to.fp16.f64(double %a)
220 declare double @llvm.convert.from.fp16.f64(i16 %a)
221 define double @h_to_d(i16 %a) {
222 ; CHECK-LABEL: h_to_d:
223 ; NONE: bl __aeabi_h2f
224 ; NONE: bl __aeabi_f2d
225 ; SP: vcvt{{[bt]}}.f32.f16
227 ; VFPv4: vcvt{{[bt]}}.f32.f16
228 ; VFPv4: vcvt.f64.f32
229 ; FP-ARMv8: vcvt{{[bt]}}.f64.f16
230 %1 = call double @llvm.convert.from.fp16.f64(i16 %a)