2 * Linux/PA-RISC Project (http://www.parisc-linux.org/)
4 * Floating-point emulation code
5 * Copyright (C) 2001 Hewlett-Packard (Paul Bame) <bame@debian.org>
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation; either version 2, or (at your option)
12 * This program is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU General Public License for more details.
17 * You should have received a copy of the GNU General Public License
18 * along with this program; if not, write to the Free Software
19 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
25 * @(#) pa/spmath/dfsqrt.c $Revision: 1.1 $
28 * Double Floating-point Square Root
30 * External Interfaces:
31 * dbl_fsqrt(srcptr,nullptr,dstptr,status)
33 * Internal Interfaces:
36 * <<please update with a overview of the operation of this file>>
43 #include "dbl_float.h"
46 * Double Floating-point Square Root
52 dbl_floating_point
*srcptr
,
53 unsigned int *nullptr,
54 dbl_floating_point
*dstptr
,
57 register unsigned int srcp1
, srcp2
, resultp1
, resultp2
;
58 register unsigned int newbitp1
, newbitp2
, sump1
, sump2
;
59 register int src_exponent
;
60 register boolean guardbit
= FALSE
, even_exponent
;
62 Dbl_copyfromptr(srcptr
,srcp1
,srcp2
);
64 * check source operand for NaN or infinity
66 if ((src_exponent
= Dbl_exponent(srcp1
)) == DBL_INFINITY_EXPONENT
) {
70 if (Dbl_isone_signaling(srcp1
)) {
71 /* trap if INVALIDTRAP enabled */
72 if (Is_invalidtrap_enabled()) return(INVALIDEXCEPTION
);
78 * Return quiet NaN or positive infinity.
79 * Fall thru to negative test if negative infinity.
81 if (Dbl_iszero_sign(srcp1
) ||
82 Dbl_isnotzero_mantissa(srcp1
,srcp2
)) {
83 Dbl_copytoptr(srcp1
,srcp2
,dstptr
);
89 * check for zero source operand
91 if (Dbl_iszero_exponentmantissa(srcp1
,srcp2
)) {
92 Dbl_copytoptr(srcp1
,srcp2
,dstptr
);
97 * check for negative source operand
99 if (Dbl_isone_sign(srcp1
)) {
100 /* trap if INVALIDTRAP enabled */
101 if (Is_invalidtrap_enabled()) return(INVALIDEXCEPTION
);
104 Dbl_makequietnan(srcp1
,srcp2
);
105 Dbl_copytoptr(srcp1
,srcp2
,dstptr
);
112 if (src_exponent
> 0) {
113 even_exponent
= Dbl_hidden(srcp1
);
114 Dbl_clear_signexponent_set_hidden(srcp1
);
117 /* normalize operand */
118 Dbl_clear_signexponent(srcp1
);
120 Dbl_normalize(srcp1
,srcp2
,src_exponent
);
121 even_exponent
= src_exponent
& 1;
124 /* exponent is even */
125 /* Add comment here. Explain why odd exponent needs correction */
126 Dbl_leftshiftby1(srcp1
,srcp2
);
129 * Add comment here. Explain following algorithm.
131 * Trust me, it works.
134 Dbl_setzero(resultp1
,resultp2
);
135 Dbl_allp1(newbitp1
) = 1 << (DBL_P
- 32);
136 Dbl_setzero_mantissap2(newbitp2
);
137 while (Dbl_isnotzero(newbitp1
,newbitp2
) && Dbl_isnotzero(srcp1
,srcp2
)) {
138 Dbl_addition(resultp1
,resultp2
,newbitp1
,newbitp2
,sump1
,sump2
);
139 if(Dbl_isnotgreaterthan(sump1
,sump2
,srcp1
,srcp2
)) {
140 Dbl_leftshiftby1(newbitp1
,newbitp2
);
142 Dbl_addition(resultp1
,resultp2
,newbitp1
,newbitp2
,
144 Dbl_subtract(srcp1
,srcp2
,sump1
,sump2
,srcp1
,srcp2
);
145 Dbl_rightshiftby2(newbitp1
,newbitp2
);
148 Dbl_rightshiftby1(newbitp1
,newbitp2
);
150 Dbl_leftshiftby1(srcp1
,srcp2
);
152 /* correct exponent for pre-shift */
154 Dbl_rightshiftby1(resultp1
,resultp2
);
157 /* check for inexact */
158 if (Dbl_isnotzero(srcp1
,srcp2
)) {
159 if (!even_exponent
&& Dbl_islessthan(resultp1
,resultp2
,srcp1
,srcp2
)) {
160 Dbl_increment(resultp1
,resultp2
);
162 guardbit
= Dbl_lowmantissap2(resultp2
);
163 Dbl_rightshiftby1(resultp1
,resultp2
);
165 /* now round result */
166 switch (Rounding_mode()) {
168 Dbl_increment(resultp1
,resultp2
);
171 /* stickybit is always true, so guardbit
172 * is enough to determine rounding */
174 Dbl_increment(resultp1
,resultp2
);
178 /* increment result exponent by 1 if mantissa overflowed */
179 if (Dbl_isone_hiddenoverflow(resultp1
)) src_exponent
+=2;
181 if (Is_inexacttrap_enabled()) {
182 Dbl_set_exponent(resultp1
,
183 ((src_exponent
-DBL_BIAS
)>>1)+DBL_BIAS
);
184 Dbl_copytoptr(resultp1
,resultp2
,dstptr
);
185 return(INEXACTEXCEPTION
);
187 else Set_inexactflag();
190 Dbl_rightshiftby1(resultp1
,resultp2
);
192 Dbl_set_exponent(resultp1
,((src_exponent
-DBL_BIAS
)>>1)+DBL_BIAS
);
193 Dbl_copytoptr(resultp1
,resultp2
,dstptr
);