8354 sync regcomp(3C) with upstream (fix make catalog)
[unleashed/tickless.git] / usr / src / lib / libmvec / common / __vcosbig.c
blobbd4a2412154288ab2a06389dfb0b0e89961ca4bc
1 /*
2 * CDDL HEADER START
4 * The contents of this file are subject to the terms of the
5 * Common Development and Distribution License (the "License").
6 * You may not use this file except in compliance with the License.
8 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9 * or http://www.opensolaris.org/os/licensing.
10 * See the License for the specific language governing permissions
11 * and limitations under the License.
13 * When distributing Covered Code, include this CDDL HEADER in each
14 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15 * If applicable, add the following below this CDDL HEADER, with the
16 * fields enclosed by brackets "[]" replaced with your own identifying
17 * information: Portions Copyright [yyyy] [name of copyright owner]
19 * CDDL HEADER END
23 * Copyright 2011 Nexenta Systems, Inc. All rights reserved.
26 * Copyright 2006 Sun Microsystems, Inc. All rights reserved.
27 * Use is subject to license terms.
30 #include <sys/isa_defs.h>
32 #ifdef _LITTLE_ENDIAN
33 #define HI(x) *(1+(int*)x)
34 #define LO(x) *(unsigned*)x
35 #else
36 #define HI(x) *(int*)x
37 #define LO(x) *(1+(unsigned*)x)
38 #endif
40 #ifdef __RESTRICT
41 #define restrict _Restrict
42 #else
43 #define restrict
44 #endif
46 extern const double __vlibm_TBL_sincos_hi[], __vlibm_TBL_sincos_lo[];
47 extern int __vlibm_rem_pio2m(double *, double *, int, int, int);
49 static const double
50 zero = 0.0,
51 one = 1.0,
52 two24 = 16777216.0,
53 pp1 = -1.666666666605760465276263943134982554676e-0001,
54 pp2 = 8.333261209690963126718376566146180944442e-0003,
55 p1 = -1.666666666666629669805215138920301589656e-0001,
56 p2 = 8.333333332390951295683993455280336376663e-0003,
57 p3 = -1.984126237997976692791551778230098403960e-0004,
58 p4 = 2.753403624854277237649987622848330351110e-0006,
59 qq1 = -4.999999999977710986407023955908711557870e-0001,
60 qq2 = 4.166654863857219350645055881018842089580e-0002,
61 q1 = -4.999999999999931701464060878888294524481e-0001,
62 q2 = 4.166666666394861917535640593963708222319e-0002,
63 q3 = -1.388888552656142867832756687736851681462e-0003,
64 q4 = 2.478519423681460796618128289454530524759e-0005;
66 void
67 __vlibm_vcos_big(int n, double * restrict x, int stridex, double * restrict y,
68 int stridey, int thresh)
70 for (; n--; x += stridex, y += stridey)
72 double tx, tt[3], ty[2], t, w, z, a;
73 unsigned hx, xsb;
74 int e0, nx, j;
76 hx = HI(x);
77 xsb = hx & 0x80000000;
78 hx &= ~0x80000000;
79 if (hx <= thresh || hx >= 0x7ff00000)
80 continue;
81 e0 = (hx >> 20) - 1046;
82 HI(&tx) = 0x41600000 | (hx & 0xfffff);
83 LO(&tx) = LO(x);
84 tt[0] = (double)((int) tx);
85 tx = (tx - tt[0]) * two24;
86 if (tx != zero)
88 nx = 2;
89 tt[1] = (double)((int) tx);
90 tt[2] = (tx - tt[1]) * two24;
91 if (tt[2] != zero)
92 nx = 3;
94 else
96 nx = 1;
97 tt[1] = tt[2] = zero;
99 nx = __vlibm_rem_pio2m(tt, ty, e0, nx, 2);
100 if (xsb)
102 nx = -nx;
103 ty[0] = -ty[0];
104 ty[1] = -ty[1];
106 nx = (nx + 1) & 3; /* Add 1 to turn sin into cos */
108 /* now nx and ty[*] are the quadrant and reduced arg */
109 xsb = (nx & 2) << 30;
110 hx = HI(&ty[0]);
111 if (nx & 1)
113 if (hx & 0x80000000)
115 ty[0] = -ty[0];
116 ty[1] = -ty[1];
117 hx &= ~0x80000000;
119 if (hx < 0x3fc40000)
121 z = ty[0] * ty[0];
122 t = z * (q1 + z * (q2 + z * (q3 + z * q4)));
123 a = one + t;
125 else
127 j = (hx + 0x4000) & 0x7fff8000;
128 HI(&t) = j;
129 LO(&t) = 0;
130 ty[0] = (ty[0] - t) + ty[1];
131 z = ty[0] * ty[0];
132 t = z * (qq1 + z * qq2);
133 w = ty[0] * (one + z * (pp1 + z * pp2));
134 j = ((j - 0x3fc40000) >> 13) & ~3;
135 a = __vlibm_TBL_sincos_hi[j+1];
136 t = __vlibm_TBL_sincos_lo[j+1] - (__vlibm_TBL_sincos_hi[j] * w - a * t);
137 a += t;
140 else
142 if (hx & 0x80000000)
144 ty[0] = -ty[0];
145 ty[1] = -ty[1];
146 hx &= ~0x80000000;
147 xsb ^= 0x80000000;
149 if (hx < 0x3fc90000)
151 z = ty[0] * ty[0];
152 t = z * (p1 + z * (p2 + z * (p3 + z * p4)));
153 a = ty[0] + (ty[1] + ty[0] * t);
155 else
157 j = (hx + 0x4000) & 0x7fff8000;
158 HI(&t) = j;
159 LO(&t) = 0;
160 ty[0] = (ty[0] - t) + ty[1];
161 z = ty[0] * ty[0];
162 t = z * (qq1 + z * qq2);
163 w = ty[0] * (one + z * (pp1 + z * pp2));
164 j = ((j - 0x3fc40000) >> 13) & ~3;
165 a = __vlibm_TBL_sincos_hi[j];
166 t = (__vlibm_TBL_sincos_hi[j+1] * w + a * t) + __vlibm_TBL_sincos_lo[j];
167 a += t;
170 if (xsb) a = -a;
171 *y = a;