/*
 * Copyright (c) 2014 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
#include <clc/clcmacro.h>

#include "sincos_helpers.h"
/*
 * Single-precision cosine.
 *
 * The sign bit of x is masked off and the computation runs on the resulting
 * magnitude. __clc_argReductionS() writes a reduced argument into (r0, r1)
 * and returns a region index; the negated sine kernel and the cosine kernel
 * are both evaluated on that reduced argument, one of them is selected by
 * the low bit of the region index, and its sign bit is flipped when the
 * region index is greater than 1.
 *
 * Inputs whose magnitude bits compare >= PINFBITPATT_SP32 return
 * as_float(QNANBITPATT_SP32).
 *
 * NOTE(review): the region index is presumably a quadrant number in 0..3 and
 * (r0, r1) a head/tail pair -- confirm against sincos_helpers.h.
 */
_CLC_OVERLOAD _CLC_DEF float cos(float x)
{
    /* Work on the magnitude only: clear the sign bit of the raw encoding. */
    int ix = as_int(x);
    int ax = ix & 0x7fffffff;
    float dx = as_float(ax);

    /* Reduced argument (outputs of the reduction) and its region index. */
    float r0, r1;
    int regn = __clc_argReductionS(&r0, &r1, dx);

    /* Candidate results on the reduced argument; the sine term is negated. */
    float ss = -__clc_sinf_piby4(r0, r1);
    float cc = __clc_cosf_piby4(r0, r1);

    /* Odd regions take the (negated) sine, even regions the cosine. */
    float c = (regn & 1) != 0 ? ss : cc;

    /* Flip the sign bit of the result for regions above 1. */
    c = as_float(as_int(c) ^ ((regn > 1) << 31));

    /* Magnitude bits at or above PINFBITPATT_SP32 produce the quiet-NaN pattern. */
    c = ax >= PINFBITPATT_SP32 ? as_float(QNANBITPATT_SP32) : c;

    return c;
}
/* Instantiate _CLC_UNARY_VECTORIZE for cos with float return and argument types. */
_CLC_UNARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, float, cos, float);
/* Only build the double-precision overloads when the device exposes fp64. */
#ifdef cl_khr_fp64

#pragma OPENCL EXTENSION cl_khr_fp64 : enable

/*
 * Double-precision cosine.
 *
 * The argument is reduced by one of the __clc_remainder_piby2_* helpers,
 * which write the reduced value into (r, rr) and a region index into regn.
 * __clc_sincos_piby4() is evaluated on the reduced value; its .lo component
 * is negated and used for odd regions, its .hi component for even regions.
 * The sign bit of the selected value is flipped when regn > 1.
 *
 * NaN and infinite inputs return as_double(QNANBITPATT_DP64).
 *
 * NOTE(review): presumably .lo carries the sine and .hi the cosine of the
 * reduced argument (this mirrors the float overload, which negates its sine
 * term) -- confirm against sincos_helpers.h.
 */
_CLC_OVERLOAD _CLC_DEF double cos(double x) {
    /* cos is even, so reduce the magnitude only. */
    x = fabs(x);

    /* Outputs of the argument reduction. */
    double r, rr;
    int regn;

    /*
     * NOTE(review): the cut-over between the medium and large reduction
     * helpers (2^47) is reconstructed, not visible in the damaged listing --
     * confirm the valid input range of __clc_remainder_piby2_medium.
     */
    if (x < 0x1.0p+47) {
        __clc_remainder_piby2_medium(x, &r, &rr, &regn);
    } else {
        __clc_remainder_piby2_large(x, &r, &rr, &regn);
    }

    double2 sc = __clc_sincos_piby4(r, rr);
    /* Odd regions need the negated .lo term, as in the float overload. */
    sc.lo = -sc.lo;

    /* Select by region parity, then flip the sign bit (top bit of the high
     * 32-bit word) for regions above 1. */
    int2 c = as_int2(regn & 1 ? sc.lo : sc.hi);
    c.hi ^= (regn > 1) << 31;

    return isnan(x) | isinf(x) ? as_double(QNANBITPATT_DP64) : as_double(c);
}

/* Instantiate _CLC_UNARY_VECTORIZE for cos with double return and argument types. */
_CLC_UNARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, double, cos, double);

#endif
/*
 * Instantiate _CLC_DEFINE_UNARY_BUILTIN_FP16 for cos.
 * NOTE(review): presumably this emits the half-precision overloads -- confirm
 * against the macro definition.
 */
_CLC_DEFINE_UNARY_BUILTIN_FP16(cos)