1 //===-- Single-precision atan function ------------------------------------===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
9 #include "src/math/atanf.h"
10 #include "inv_trigf_utils.h"
11 #include "src/__support/FPUtil/FPBits.h"
12 #include "src/__support/FPUtil/PolyEval.h"
13 #include "src/__support/FPUtil/except_value_utils.h"
14 #include "src/__support/FPUtil/multiply_add.h"
15 #include "src/__support/FPUtil/nearest_integer.h"
16 #include "src/__support/FPUtil/rounding_mode.h"
17 #include "src/__support/macros/config.h"
18 #include "src/__support/macros/optimization.h" // LIBC_UNLIKELY
20 namespace LIBC_NAMESPACE_DECL
{
22 LLVM_LIBC_FUNCTION(float, atanf
, (float x
)) {
23 using FPBits
= typename
fputil::FPBits
<float>;
25 constexpr double FINAL_SIGN
[2] = {1.0, -1.0};
26 constexpr double SIGNED_PI_OVER_2
[2] = {0x1.921fb54442d18p0
,
27 -0x1.921fb54442d18p0
};
30 Sign sign
= x_bits
.sign();
31 x_bits
.set_sign(Sign::POS
);
32 uint32_t x_abs
= x_bits
.uintval();
34 // x is inf or nan, |x| < 2^-4 or |x|= > 16.
35 if (LIBC_UNLIKELY(x_abs
<= 0x3d80'0000U
|| x_abs
>= 0x4180'0000U
)) {
36 double x_d
= static_cast<double>(x
);
37 double const_term
= 0.0;
38 if (LIBC_UNLIKELY(x_abs
>= 0x4180'0000)) {
39 // atan(+-Inf) = +-pi/2.
40 if (x_bits
.is_inf()) {
41 volatile double sign_pi_over_2
= SIGNED_PI_OVER_2
[sign
.is_neg()];
42 return static_cast<float>(sign_pi_over_2
);
48 const_term
= SIGNED_PI_OVER_2
[sign
.is_neg()];
51 if (LIBC_UNLIKELY(x_bits
.is_zero()))
54 if (LIBC_UNLIKELY(x_abs
< 0x3980'0000)) {
55 #if defined(LIBC_TARGET_CPU_HAS_FMA)
56 return fputil::multiply_add(x
, -0x1.0p
-25f
, x
);
58 double x_d
= static_cast<double>(x
);
59 return static_cast<float>(fputil::multiply_add(x_d
, -0x1.0p
-25, x_d
));
60 #endif // LIBC_TARGET_CPU_HAS_FMA
62 // Use Taylor polynomial:
63 // atan(x) ~ x * (1 - x^2 / 3 + x^4 / 5 - x^6 / 7 + x^8 / 9 - x^10 / 11).
64 constexpr double ATAN_TAYLOR
[6] = {
65 0x1.0000000000000p
+0, -0x1.5555555555555p
-2, 0x1.999999999999ap
-3,
66 -0x1.2492492492492p
-3, 0x1.c71c71c71c71cp
-4, -0x1.745d1745d1746p
-4,
68 double x2
= x_d
* x_d
;
70 double c0
= fputil::multiply_add(x2
, ATAN_TAYLOR
[1], ATAN_TAYLOR
[0]);
71 double c1
= fputil::multiply_add(x2
, ATAN_TAYLOR
[3], ATAN_TAYLOR
[2]);
72 double c2
= fputil::multiply_add(x2
, ATAN_TAYLOR
[5], ATAN_TAYLOR
[4]);
73 double p
= fputil::polyeval(x4
, c0
, c1
, c2
);
74 double r
= fputil::multiply_add(x_d
, p
, const_term
);
75 return static_cast<float>(r
);
78 // Range reduction steps:
79 // 1) atan(x) = sign(x) * atan(|x|)
80 // 2) If |x| > 1, atan(|x|) = pi/2 - atan(1/|x|)
81 // 3) For 1/16 < x <= 1, we find k such that: |x - k/16| <= 1/32.
82 // 4) Then we use polynomial approximation:
83 // atan(x) ~ atan((k/16) + (x - (k/16)) * Q(x - k/16)
85 double x_d
, const_term
, final_sign
;
88 if (x_abs
> 0x3f80'0000U
) {
89 // |x| > 1, we need to invert x, so we will perform range reduction in
91 x_d
= 1.0 / static_cast<double>(x_bits
.get_val());
92 double k_d
= fputil::nearest_integer(x_d
* 0x1.0p4
);
93 x_d
= fputil::multiply_add(k_d
, -0x1.0p
-4, x_d
);
94 idx
= static_cast<int>(k_d
);
95 final_sign
= FINAL_SIGN
[sign
.is_pos()];
96 // Adjust constant term of the polynomial by +- pi/2.
97 const_term
= fputil::multiply_add(final_sign
, ATAN_COEFFS
[idx
][0],
98 SIGNED_PI_OVER_2
[sign
.is_neg()]);
100 // Exceptional value:
101 if (LIBC_UNLIKELY(x_abs
== 0x3d8d'6b23U
)) { // |x| = 0x1.1ad646p-4
102 return sign
.is_pos() ? fputil::round_result_slightly_down(0x1.1a6386p
-4f
)
103 : fputil::round_result_slightly_up(-0x1.1a6386p
-4f
);
105 // Perform range reduction in single precision.
106 float x_f
= x_bits
.get_val();
107 float k_f
= fputil::nearest_integer(x_f
* 0x1.0p4f
);
108 x_f
= fputil::multiply_add(k_f
, -0x1.0p
-4f
, x_f
);
109 x_d
= static_cast<double>(x_f
);
110 idx
= static_cast<int>(k_f
);
111 final_sign
= FINAL_SIGN
[sign
.is_neg()];
112 const_term
= final_sign
* ATAN_COEFFS
[idx
][0];
115 double p
= atan_eval(x_d
, idx
);
116 double r
= fputil::multiply_add(final_sign
* x_d
, p
, const_term
);
118 return static_cast<float>(r
);
121 } // namespace LIBC_NAMESPACE_DECL