arch/parisc/math-emu/dfmpy.c

   1 // SPDX-License-Identifier: GPL-2.0-or-later
   2 /*
   3  * Linux/PA-RISC Project (http://www.parisc-linux.org/)
   4  *
   5  * Floating-point emulation code
   6  *  Copyright (C) 2001 Hewlett-Packard (Paul Bame) <bame@debian.org>
   7  */
   8 /*
   9  * BEGIN_DESC
  10  *
  11  *  File:
  12  *      @(#)    pa/spmath/dfmpy.c               $Revision: 1.1 $
  13  *
  14  *  Purpose:
  15  *      Double Precision Floating-point Multiply
  16  *
  17  *  External Interfaces:
  18  *      dbl_fmpy(srcptr1,srcptr2,dstptr,status)
  19  *
  20  *  Internal Interfaces:
  21  *
  22  *  Theory:
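   23  *      Operands that are NaN, infinity or zero are special-cased before
       *      the multiply.  Otherwise the two exponents are summed (less the
       *      bias), denormalized inputs are normalized, and the mantissas are
       *      multiplied with a shift-and-add loop that consumes four
       *      multiplier bits per pass.  The product is then rounded according
       *      to the current rounding mode and checked for overflow and
       *      underflow.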
  24  *
  25  * END_DESC
  26 */
  27
  28
  29 #include "float.h"
  30 #include "dbl_float.h"
  31
   32 /*
   33  *  Double Precision Floating-point Multiply
       *
       *  Multiplies the double-precision values at srcptr1 and srcptr2 and
       *  stores the product through dstptr.
       *
       *  srcptr1, srcptr2 - source operands (read with Dbl_copyfromptr)
       *  dstptr           - destination (written with Dbl_copytoptr)
       *  status           - never referenced by name in this body; presumably
       *                     consumed by the flag / trap-enable / rounding-mode
       *                     macros (Set_*flag, Is_*trap_enabled,
       *                     Rounding_mode) - TODO confirm in float.h
       *
       *  Returns NOEXCEPTION, or - when the corresponding trap is enabled -
       *  INVALIDEXCEPTION, OVERFLOWEXCEPTION, UNDERFLOWEXCEPTION or
       *  INEXACTEXCEPTION (the overflow/underflow codes may be OR'ed with
       *  INEXACTEXCEPTION).  On INVALIDEXCEPTION the destination is left
       *  unwritten; on every other exception return the result has already
       *  been stored through dstptr.
   34  */
   35
   36 int
   37 dbl_fmpy(
   38             dbl_floating_point *srcptr1,
   39             dbl_floating_point *srcptr2,
   40             dbl_floating_point *dstptr,
   41             unsigned int *status)
   42 {
   43         register unsigned int opnd1p1, opnd1p2, opnd2p1, opnd2p2;
   44         register unsigned int opnd3p1, opnd3p2, resultp1, resultp2;
   45         register int dest_exponent, count;
   46         register boolean inexact = FALSE, guardbit = FALSE, stickybit = FALSE;
   47         boolean is_tiny;
   48
              /*
               * Each double is held as a pair of unsigned words; the p1 word
               * is the one queried for sign and exponent below.
               */
   49         Dbl_copyfromptr(srcptr1,opnd1p1,opnd1p2);
   50         Dbl_copyfromptr(srcptr2,opnd2p1,opnd2p2);
   51
   52         /*
   53          * set sign bit of result
   54          */
              /* result sign is the XOR of the operand signs; rest of p1 is zero */
   55         if (Dbl_sign(opnd1p1) ^ Dbl_sign(opnd2p1))
   56                 Dbl_setnegativezerop1(resultp1);
   57         else Dbl_setzerop1(resultp1);
   58         /*
   59          * check first operand for NaN's or infinity
   60          */
   61         if (Dbl_isinfinity_exponent(opnd1p1)) {
   62                 if (Dbl_iszero_mantissa(opnd1p1,opnd1p2)) {
   63                         if (Dbl_isnotnan(opnd2p1,opnd2p2)) {
   64                                 if (Dbl_iszero_exponentmantissa(opnd2p1,opnd2p2)) {
   65                                         /*
   66                                          * invalid since operands are infinity
   67                                          * and zero
   68                                          */
   69                                         if (Is_invalidtrap_enabled())
   70                                                 return(INVALIDEXCEPTION);
   71                                         Set_invalidflag();
   72                                         Dbl_makequietnan(resultp1,resultp2);
   73                                         Dbl_copytoptr(resultp1,resultp2,dstptr);
   74                                         return(NOEXCEPTION);
   75                                 }
   76                                 /*
   77                                  * return infinity
   78                                  */
   79                                 Dbl_setinfinity_exponentmantissa(resultp1,resultp2);
   80                                 Dbl_copytoptr(resultp1,resultp2,dstptr);
   81                                 return(NOEXCEPTION);
   82                         }
                              /*
                               * opnd1 is infinity but opnd2 is a NaN: nothing
                               * returns here, so control falls through to the
                               * second-operand check below.
                               */
   83                 }
   84                 else {
   85                         /*
   86                          * is NaN; signaling or quiet?
   87                          */
   88                         if (Dbl_isone_signaling(opnd1p1)) {
   89                                 /* trap if INVALIDTRAP enabled */
   90                                 if (Is_invalidtrap_enabled())
   91                                         return(INVALIDEXCEPTION);
   92                                 /* make NaN quiet */
   93                                 Set_invalidflag();
   94                                 Dbl_set_quiet(opnd1p1);
   95                         }
   96                         /*
   97                          * is second operand a signaling NaN?
   98                          */
                              /*
                               * only reached when opnd1 is a quiet NaN; in that
                               * case a signaling opnd2 (quieted) is returned
                               * instead of opnd1
                               */
   99                         else if (Dbl_is_signalingnan(opnd2p1)) {
  100                                 /* trap if INVALIDTRAP enabled */
  101                                 if (Is_invalidtrap_enabled())
  102                                         return(INVALIDEXCEPTION);
  103                                 /* make NaN quiet */
  104                                 Set_invalidflag();
  105                                 Dbl_set_quiet(opnd2p1);
  106                                 Dbl_copytoptr(opnd2p1,opnd2p2,dstptr);
  107                                 return(NOEXCEPTION);
  108                         }
  109                         /*
  110                          * return quiet NaN
  111                          */
  112                         Dbl_copytoptr(opnd1p1,opnd1p2,dstptr);
  113                         return(NOEXCEPTION);
  114                 }
  115         }
  116         /*
  117          * check second operand for NaN's or infinity
  118          */
  119         if (Dbl_isinfinity_exponent(opnd2p1)) {
  120                 if (Dbl_iszero_mantissa(opnd2p1,opnd2p2)) {
  121                         if (Dbl_iszero_exponentmantissa(opnd1p1,opnd1p2)) {
  122                                 /* invalid since operands are zero & infinity */
  123                                 if (Is_invalidtrap_enabled())
  124                                         return(INVALIDEXCEPTION);
  125                                 Set_invalidflag();
  126                                 Dbl_makequietnan(opnd2p1,opnd2p2);
  127                                 Dbl_copytoptr(opnd2p1,opnd2p2,dstptr);
  128                                 return(NOEXCEPTION);
  129                         }
  130                         /*
  131                          * return infinity
  132                          */
  133                         Dbl_setinfinity_exponentmantissa(resultp1,resultp2);
  134                         Dbl_copytoptr(resultp1,resultp2,dstptr);
  135                         return(NOEXCEPTION);
  136                 }
  137                 /*
  138                  * is NaN; signaling or quiet?
  139                  */
  140                 if (Dbl_isone_signaling(opnd2p1)) {
  141                         /* trap if INVALIDTRAP enabled */
  142                         if (Is_invalidtrap_enabled()) return(INVALIDEXCEPTION);
  143                         /* make NaN quiet */
  144                         Set_invalidflag();
  145                         Dbl_set_quiet(opnd2p1);
  146                 }
  147                 /*
  148                  * return quiet NaN
  149                  */
  150                 Dbl_copytoptr(opnd2p1,opnd2p2,dstptr);
  151                 return(NOEXCEPTION);
  152         }
  153         /*
  154          * Generate exponent
  155          */
              /*
               * Sum of the two exponent fields less one bias.  dest_exponent is
               * also handed to Dbl_normalize below for denormalized inputs,
               * which presumably adjusts it - confirm in dbl_float.h.
               */
  156         dest_exponent = Dbl_exponent(opnd1p1) + Dbl_exponent(opnd2p1) -DBL_BIAS;
  157
  158         /*
  159          * Generate mantissa
  160          */
  161         if (Dbl_isnotzero_exponent(opnd1p1)) {
  162                 /* set hidden bit */
  163                 Dbl_clear_signexponent_set_hidden(opnd1p1);
  164         }
  165         else {
  166                 /* check for zero */
                      /* zero operand: result is a zero carrying the sign set above */
  167                 if (Dbl_iszero_mantissa(opnd1p1,opnd1p2)) {
  168                         Dbl_setzero_exponentmantissa(resultp1,resultp2);
  169                         Dbl_copytoptr(resultp1,resultp2,dstptr);
  170                         return(NOEXCEPTION);
  171                 }
  172                 /* is denormalized, adjust exponent */
  173                 Dbl_clear_signexponent(opnd1p1);
  174                 Dbl_leftshiftby1(opnd1p1,opnd1p2);
  175                 Dbl_normalize(opnd1p1,opnd1p2,dest_exponent);
  176         }
  177         /* opnd2 needs to have hidden bit set with msb in hidden bit */
  178         if (Dbl_isnotzero_exponent(opnd2p1)) {
  179                 Dbl_clear_signexponent_set_hidden(opnd2p1);
  180         }
  181         else {
  182                 /* check for zero */
  183                 if (Dbl_iszero_mantissa(opnd2p1,opnd2p2)) {
  184                         Dbl_setzero_exponentmantissa(resultp1,resultp2);
  185                         Dbl_copytoptr(resultp1,resultp2,dstptr);
  186                         return(NOEXCEPTION);
  187                 }
  188                 /* is denormalized; want to normalize */
  189                 Dbl_clear_signexponent(opnd2p1);
  190                 Dbl_leftshiftby1(opnd2p1,opnd2p2);
  191                 Dbl_normalize(opnd2p1,opnd2p2,dest_exponent);
  192         }
  193
  194         /* Multiply two source mantissas together */
  195
  196         /* make room for guard bits */
  197         Dbl_leftshiftby7(opnd2p1,opnd2p2);
              /* opnd3 is the running product accumulator, started at zero */
  198         Dbl_setzero(opnd3p1,opnd3p2);
  199         /*
  200          * Four bits at a time are inspected in each loop, and a
  201          * simple shift and add multiply algorithm is used.
  202          */
              /*
               * Per pass: the four accumulator bits about to be shifted out are
               * OR'ed into stickybit, the accumulator moves right by four, and
               * opnd2 shifted left by 3, 2, 1 and 0 is added for each set bit
               * among Dbit28p2..Dbit31p2 of opnd1 (presumably the four
               * least-significant bits of opnd1p2 - confirm bit numbering in
               * dbl_float.h).  opnd1 is then shifted right by four so the next
               * group of multiplier bits is in position.
               */
  203         for (count=1;count<=DBL_P;count+=4) {
  204                 stickybit |= Dlow4p2(opnd3p2);
  205                 Dbl_rightshiftby4(opnd3p1,opnd3p2);
  206                 if (Dbit28p2(opnd1p2)) {
  207                         /* Twoword_add should be an ADDC followed by an ADD. */
  208                         Twoword_add(opnd3p1, opnd3p2, opnd2p1<<3 | opnd2p2>>29,
  209                                     opnd2p2<<3);
  210                 }
  211                 if (Dbit29p2(opnd1p2)) {
  212                         Twoword_add(opnd3p1, opnd3p2, opnd2p1<<2 | opnd2p2>>30,
  213                                     opnd2p2<<2);
  214                 }
  215                 if (Dbit30p2(opnd1p2)) {
  216                         Twoword_add(opnd3p1, opnd3p2, opnd2p1<<1 | opnd2p2>>31,
  217                                     opnd2p2<<1);
  218                 }
  219                 if (Dbit31p2(opnd1p2)) {
  220                         Twoword_add(opnd3p1, opnd3p2, opnd2p1, opnd2p2);
  221                 }
  222                 Dbl_rightshiftby4(opnd1p1,opnd1p2);
  223         }
              /*
               * Put the product's leading one where Dbit3p1 tests for it: if it
               * is not there yet shift left once, otherwise the product needed
               * one more integer bit and the exponent is bumped instead.
               */
  224         if (Dbit3p1(opnd3p1)==0) {
  225                 Dbl_leftshiftby1(opnd3p1,opnd3p2);
  226         }
  227         else {
  228                 /* result mantissa >= 2. */
  229                 dest_exponent++;
  230         }
  231         /* check for denormalized result */
  232         while (Dbit3p1(opnd3p1)==0) {
  233                 Dbl_leftshiftby1(opnd3p1,opnd3p2);
  234                 dest_exponent--;
  235         }
  236         /*
  237          * check for guard, sticky and inexact bits
  238          */
              /*
               * The low eight bits of opnd3p2 are discarded by the right shift
               * by eight below.  Assuming Dallp2 yields the whole 32-bit word:
               * "<< 25" is non-zero when any of the lowest seven bits is set
               * (sticky), and "(<< 24) >> 31" isolates the eighth bit (guard).
               */
  239         stickybit |= Dallp2(opnd3p2) << 25;
  240         guardbit = (Dallp2(opnd3p2) << 24) >> 31;
  241         inexact = guardbit | stickybit;
  242
  243         /* align result mantissa */
  244         Dbl_rightshiftby8(opnd3p1,opnd3p2);
  245
  246         /*
  247          * round result
  248          */
              /*
               * Rounding is skipped here when the result is going to underflow
               * with the underflow trap disabled (dest_exponent <= 0); that
               * path rounds after denormalizing, further down.
               */
  249         if (inexact && (dest_exponent>0 || Is_underflowtrap_enabled())) {
  250                 Dbl_clear_signexponent(opnd3p1);
  251                 switch (Rounding_mode()) {
  252                         case ROUNDPLUS:
  253                                 if (Dbl_iszero_sign(resultp1))
  254                                         Dbl_increment(opnd3p1,opnd3p2);
  255                                 break;
  256                         case ROUNDMINUS:
  257                                 if (Dbl_isone_sign(resultp1))
  258                                         Dbl_increment(opnd3p1,opnd3p2);
  259                                 break;
  260                         case ROUNDNEAREST:
  261                                 if (guardbit) {
  262                                 if (stickybit || Dbl_isone_lowmantissap2(opnd3p2))
  263                                 Dbl_increment(opnd3p1,opnd3p2);
  264                                 }
                              /* any other rounding mode: no increment (truncate) */
  265                 }
                      /*
                       * the hidden bit was cleared above, so finding it set now
                       * presumably means the increment carried out of the
                       * mantissa - bump the exponent
                       */
  266                 if (Dbl_isone_hidden(opnd3p1)) dest_exponent++;
  267         }
  268         Dbl_set_mantissa(resultp1,resultp2,opnd3p1,opnd3p2);
  269
  270         /*
  271          * Test for overflow
  272          */
  273         if (dest_exponent >= DBL_INFINITY_EXPONENT) {
  274                 /* trap if OVERFLOWTRAP enabled */
  275                 if (Is_overflowtrap_enabled()) {
  276                         /*
  277                          * Adjust bias of result
  278                          */
  279                         Dbl_setwrapped_exponent(resultp1,dest_exponent,ovfl);
  280                         Dbl_copytoptr(resultp1,resultp2,dstptr);
                              /*
                               * NOTE: the "else" below pairs with the inner
                               * "if (Is_inexacttrap_enabled())", i.e. the
                               * inexact flag is set only when the result is
                               * inexact and the inexact trap is disabled.
                               */
  281                         if (inexact)
  282                             if (Is_inexacttrap_enabled())
  283                                 return (OVERFLOWEXCEPTION | INEXACTEXCEPTION);
  284                             else Set_inexactflag();
  285                         return (OVERFLOWEXCEPTION);
  286                 }
                      /* untrapped overflow is always reported as inexact too */
  287                 inexact = TRUE;
  288                 Set_overflowflag();
  289                 /* set result to infinity or largest number */
  290                 Dbl_setoverflow(resultp1,resultp2);
  291         }
  292         /*
  293          * Test for underflow
  294          */
  295         else if (dest_exponent <= 0) {
  296                 /* trap if UNDERFLOWTRAP enabled */
  297                 if (Is_underflowtrap_enabled()) {
  298                         /*
  299                          * Adjust bias of result
  300                          */
  301                         Dbl_setwrapped_exponent(resultp1,dest_exponent,unfl);
  302                         Dbl_copytoptr(resultp1,resultp2,dstptr);
                              /* same dangling-else pairing as the overflow case */
  303                         if (inexact)
  304                             if (Is_inexacttrap_enabled())
  305                                 return (UNDERFLOWEXCEPTION | INEXACTEXCEPTION);
  306                             else Set_inexactflag();
  307                         return (UNDERFLOWEXCEPTION);
  308                 }
  309
  310                 /* Determine if should set underflow flag */
                      /*
                       * Trial rounding for the dest_exponent == 0 case: apply
                       * the increment the rounding mode would apply, test
                       * Dbl_isone_hiddenoverflow, then decrement again so opnd3
                       * is unchanged.  If the test fires the result is not
                       * treated as tiny and the underflow flag is not set.
                       */
  311                 is_tiny = TRUE;
  312                 if (dest_exponent == 0 && inexact) {
  313                         switch (Rounding_mode()) {
  314                         case ROUNDPLUS:
  315                                 if (Dbl_iszero_sign(resultp1)) {
  316                                         Dbl_increment(opnd3p1,opnd3p2);
  317                                         if (Dbl_isone_hiddenoverflow(opnd3p1))
  318                                             is_tiny = FALSE;
  319                                         Dbl_decrement(opnd3p1,opnd3p2);
  320                                 }
  321                                 break;
  322                         case ROUNDMINUS:
  323                                 if (Dbl_isone_sign(resultp1)) {
  324                                         Dbl_increment(opnd3p1,opnd3p2);
  325                                         if (Dbl_isone_hiddenoverflow(opnd3p1))
  326                                             is_tiny = FALSE;
  327                                         Dbl_decrement(opnd3p1,opnd3p2);
  328                                 }
  329                                 break;
  330                         case ROUNDNEAREST:
  331                                 if (guardbit && (stickybit ||
  332                                     Dbl_isone_lowmantissap2(opnd3p2))) {
  333                                         Dbl_increment(opnd3p1,opnd3p2);
  334                                         if (Dbl_isone_hiddenoverflow(opnd3p1))
  335                                             is_tiny = FALSE;
  336                                         Dbl_decrement(opnd3p1,opnd3p2);
  337                                 }
  338                                 break;
  339                         }
  340                 }
  341
  342                 /*
  343                  * denormalize result or set to signed zero
  344                  */
                      /*
                       * stickybit takes the value of inexact (guard | sticky)
                       * before the call; Dbl_denormalize receives guardbit,
                       * stickybit and inexact and presumably recomputes them
                       * for the shifted mantissa - confirm in dbl_float.h.
                       */
  345                 stickybit = inexact;
  346                 Dbl_denormalize(opnd3p1,opnd3p2,dest_exponent,guardbit,
  347                  stickybit,inexact);
  348
  349                 /* return zero or smallest number */
                      /* this is the rounding step deferred from "round result" */
  350                 if (inexact) {
  351                         switch (Rounding_mode()) {
  352                         case ROUNDPLUS:
  353                                 if (Dbl_iszero_sign(resultp1)) {
  354                                         Dbl_increment(opnd3p1,opnd3p2);
  355                                 }
  356                                 break;
  357                         case ROUNDMINUS:
  358                                 if (Dbl_isone_sign(resultp1)) {
  359                                         Dbl_increment(opnd3p1,opnd3p2);
  360                                 }
  361                                 break;
  362                         case ROUNDNEAREST:
  363                                 if (guardbit && (stickybit ||
  364                                     Dbl_isone_lowmantissap2(opnd3p2))) {
  365                                         Dbl_increment(opnd3p1,opnd3p2);
  366                                 }
  367                                 break;
  368                         }
                              /* underflow is flagged only when tiny and inexact */
  369                         if (is_tiny) Set_underflowflag();
  370                 }
  371                 Dbl_set_exponentmantissa(resultp1,resultp2,opnd3p1,opnd3p2);
  372         }
              /* normal range: just insert the computed exponent */
  373         else Dbl_set_exponent(resultp1,dest_exponent);
  374         /* check for inexact */
              /* the result is stored before a possible inexact trap is reported */
  375         Dbl_copytoptr(resultp1,resultp2,dstptr);
  376         if (inexact) {
  377                 if (Is_inexacttrap_enabled()) return(INEXACTEXCEPTION);
  378                 else Set_inexactflag();
  379         }
  380         return(NOEXCEPTION);
  381 }