/*
 * Copyright (c) 2014, 2015 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
30 #pragma OPENCL EXTENSION cl_khr_fp64
: enable
32 _CLC_DEF double __clc_exp_helper
(double x
, double x_min
, double x_max
, double r
, int n
) {
37 // 6 term tail of Taylor expansion of e^r
38 double z2
= r
* fma
(r,
42 fma
(r, 0x1.6c16c16c16c17p-10
, 0x1.1111111111111p-7
),
43 0x1.5555555555555p-5
),
44 0x1.5555555555555p-3
),
45 0x1.0000000000000p-1
),
48 double2 tv
= USE_TABLE
(two_to_jby64_ep_tbl, j
);
49 z2
= fma
(tv.s0
+ tv.s1
, z2
, tv.s1
) + tv.s0
;
51 int small_value
= (m < -
1022) ||
((m == -
1022) && (z2 < 1.0));
55 double z3
= z2
* as_double
(((long)n1
+ 1023) << 52);
56 z3
*= as_double
(((long)n2
+ 1023) << 52);
59 z2
= small_value ? z3
: z2
;
61 z2
= isnan
(x) ? x
: z2
;
63 z2
= x
> x_max ? as_double
(PINFBITPATT_DP64) : z2
;
64 z2
= x
< x_min ?
0.0 : z2
;