none/tests/ppc64/ppc64_helpers.h

   1 /*
   2  * ppc64_helpers.h
   3  * Copyright (C) 2016-2017 Will Schmidt <will_schmidt@vnet.ibm.com>
   4  *
   5  * This file contains helper functions for the ISA 3.0 test suite.
   6  */
   7
   8 /*
   9  *   This program is free software; you can redistribute it and/or
  10  *   modify it under the terms of the GNU General Public License V2
  11  *   as published by the Free Software Foundation
  12  *
  13  *   This program is distributed in the hope that it will be useful,
  14  *   but WITHOUT ANY WARRANTY; without even the implied warranty of
  15  *   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  16  *   GNU General Public License for more details.
  17  *
  18  *   You should have received a copy of the GNU General Public License
  19  *   along with this program; if not, see <http://www.gnu.org/licenses/>.
  20  */
  21
  22 #include "tests/malloc.h"       // memalign32
  23
  24 typedef uint64_t  HWord_t;
  25
  26 #if defined (DEBUG_ARGS_BUILD)
  27 #define AB_DPRINTF(fmt, args...) do { fprintf(stderr, fmt , ##args); } while (0)
  28 #else
  29 #define AB_DPRINTF(fmt, args...) do { } while (0)
  30 #endif
  31
  32 /* Exhaustive tests?
  33  * Due to the excessive size of the test results, allow a #ifdef to
  34  * enable/disable most of the input values.
  35  * Off by default.
  36  */
  37 // #define EXHAUSTIVE_TESTS 1
  38
  39
  40 #define ALLCR "cr0","cr1","cr2","cr3","cr4","cr5","cr6","cr7"
  41
  42 #define SET_CR(_arg) \
  43       __asm__ __volatile__ ("mtcr  %0" : : "b"(_arg) : ALLCR );
  44
  45 #define SET_CR0_FIELD(_arg) __asm__ __volatile__ ("mtocrf 0x80,%0 " : : "b" (_arg):"cr0");
  46 #define SET_CR1_FIELD(_arg) __asm__ __volatile__ ("mtocrf 0x40,%0 " : : "b" (_arg):"cr1");
  47 #define SET_CR2_FIELD(_arg) __asm__ __volatile__ ("mtocrf 0x20,%0 " : : "b" (_arg):"cr2");
  48 #define SET_CR3_FIELD(_arg) __asm__ __volatile__ ("mtocrf 0x10,%0 " : : "b" (_arg):"cr3");
  49 #define SET_CR4_FIELD(_arg) __asm__ __volatile__ ("mtocrf 0x08,%0 " : : "r" (_arg):"cr4");
  50 #define SET_CR5_FIELD(_arg) __asm__ __volatile__ ("mtocrf 0x04,%0 " : : "r" (_arg):"cr5");
  51 #define SET_CR6_FIELD(_arg) __asm__ __volatile__ ("mtocrf 0x02,%0 " : : "r" (_arg):"cr6");
  52 #define SET_CR7_FIELD(_arg) __asm__ __volatile__ ("mtocrf 0x01,%0 " : : "r" (_arg):"cr7");
  53
  54 #define SET_XER(_arg) \
  55       __asm__ __volatile__ ("mtxer %0" : : "b"(_arg) : "xer" );
  56
  57 #define GET_CR(_lval) \
  58       __asm__ __volatile__ ("mfcr %0"  : "=b"(_lval) )
  59
  60 #define GET_XER(_lval) \
  61       __asm__ __volatile__ ("mfxer %0" : "=b"(_lval) )
  62
  63 #define SET_CR_ZERO \
  64       SET_CR(0)
  65
  66 #define SET_FPSCR_ZERO                                        \
  67    do {                                                       \
  68       double _d = 0.0;                                        \
  69       __asm__ __volatile__ ("mtfsf 0xFF, %0" : : "f"(_d) );   \
  70    } while (0);
  71
  72 #define GET_FPSCR(_arg) \
  73   __asm__ __volatile__ ("mffs %0"  : "=f"(_arg) );
  74
  75 /*  The bit definitions for the FPSCR are as follows.
  76 Bit(s) Description
  77 0:31 Reserved
  78 32 Floating-Point Exception Summary (FX)
  79 33 Floating-Point Enabled Exception Summary (FEX)
  80 34 Floating-Point Invalid Operation Exception Summary (VX)
  81 35 Floating-Point Overflow Exception (OX)
  82 36 Floating-Point Underflow Exception (UX)
  83 37 Floating-Point Zero Divide Exception (ZX)
  84 38 Floating-Point Inexact Exception (XX)
  85 39 Floating-Point Invalid Operation Exception (SNaN) (VXSNAN)
  86 40 Floating-Point Invalid Operation Exception (∞ - ∞) (VXISI)
  87 41 Floating-Point Invalid Operation Exception (∞ ÷ ∞) (VXIDI)
  88 42 Floating-Point Invalid Operation Exception (0 ÷ 0) (VXZDZ)
  89 43 Floating-Point Invalid Operation Exception (∞ × 0) (VXIMZ)
  90 44 Floating-Point Invalid Operation Exception (Invalid Compare) (VXVC)
  91 45 Floating-Point Fraction Rounded (FR)
  92 46 Floating-Point Fraction Inexact (FI)
  93 47:51 Floating-Point Result Flags (FPRF)
  94 47 Floating-Point Result Class Descriptor (C)
  95 48:51 Floating-Point Condition Code (FPCC)
  96       48 Floating-Point Less Than or Negative (FL or <)
  97       49 Floating-Point Greater Than or Positive (FG or >)
  98       50 Floating-Point Equal or Zero (FE or =)
  99       51 Floating-Point Unordered or NaN (FU or ?)
 100 52 Reserved
 101 53 Floating-Point Invalid Operation Exception (Software-Defined Condition) (VXSOFT)
 102 54 Floating-Point Invalid Operation Exception (Invalid Square Root) (VXSQRT)
 103 55 Floating-Point Invalid Operation Exception (Invalid Integer Convert) (VXCVI)
 104 56 Floating-Point Invalid Operation Exception Enable (VE)
 105 57 Floating-Point Overflow Exception Enable (OE)
 106 58 Floating-Point Underflow Exception Enable (UE)
 107 59 Floating-Point Zero Divide Exception Enable (ZE)
 108 60 Floating-Point Inexact Exception Enable (XE)
 109 61 Floating-Point Non-IEEE Mode (NI)
 110 62:63 Floating-Point Rounding Control (RN)
 111    00 Round to Nearest
 112    01 Round toward Zero
 113    10 Round toward +Infinity
 114    11 Round toward -Infinity
 115 */
 116 /* NOTE, currently Valgrind only tracks the rounding mode, C and FPCC fields in the
 117  *       FPSCR register.
 118  */
 119
 120 static char * fpscr_strings[] = {
 121 " 0-RSVD", " 1-RSVD", " 2-RSVD", " 3-RSVD", " 4-RSVD", " 5-RSVD", " 6-RSVD",
 122 " 7-RSVD", " 8-RSVD", " 9-RSVD", "10-RSVD", "11-RSVD", "12-RSVD", "13-RSVD",
 123 "14-RSVD", "15-RSVD", "16-RSVD", "17-RSVD", "18-RSVD", "19-RSVD", "20-RSVD",
 124 "21-RSVD", "22-RSVD", "23-RSVD", "24-RSVD", "25-RSVD", "26-RSVD", "27-RSVD",
 125 "28-RSVD", "29-DRN0", "30-DRN1", "31-DRN2",
 126 /* 32 */ "FX", "FEX", "VX",
 127 /* 35 */ "OX", "UX", "ZX", "XX", "VXSNAN",
 128 /* 40 */ "VXISI (inf-inf)", "VXIDI (inf/inf)", "VXZDZ (0/0)",
 129 /* 43 */ "VXIMZ (inf*0)", "VXVC",
 130 /* 45 */ "FR", "FI",
 131 /* 47 */ "FPRF-C", "FPCC-FL", "FPCC-FG",
 132 /* 50 */ "FPCC-FE", "FPCC-FU",
 133 /* 52 */ "52-RSVD", "FXSOFT", "VXSQRT",
 134 /* 55 */ "VXCVI", "VE", "OE", "UE", "ZE",
 135 /* 60 */ "XE", "NI", "RN-bit62", "RN-bit63"
 136 };
 137
 138 #define FPCC_C_BIT    (0x1 << (63-47))
 139 #define FPCC_FL_BIT   (0x1 << (63-48))
 140 #define FPCC_FG_BIT   (0x1 << (63-49))
 141 #define FPCC_FE_BIT   (0x1 << (63-50))
 142 #define FPCC_FU_BIT   (0x1 << (63-51))
 143 #define FPCC_FPRF_MASK  FPCC_C_BIT|FPCC_FL_BIT|FPCC_FG_BIT|FPCC_FE_BIT|FPCC_FU_BIT
 144
 145 #define FPSCR_RN_BIT62   (0x1 << (63-62))
 146 #define FPSCR_RN_BIT63   (0x1 << (63-63))
 147
 148 #define CRFIELD_BIT0 0x8
 149 #define CRFIELD_BIT1 0x4
 150 #define CRFIELD_BIT2 0x2
 151 #define CRFIELD_BIT3 0x1
 152
 153 /* dissect_cr*:
 154  * display the condition register bits in a
 155  * human readable format.
 156  */
 157
 158 static inline int cr_overflow_set(unsigned this_cr) {
 159    return (this_cr & CRFIELD_BIT3);
 160 }
 161
 162 static inline int cr_zero_set(unsigned this_cr) {
 163    return (this_cr & CRFIELD_BIT2);
 164 }
 165
 166 static inline int cr_positive_set(unsigned this_cr) {
 167    return (this_cr & CRFIELD_BIT1);
 168 }
 169
 170 static inline int cr_negative_set(unsigned this_cr) {
 171    return (this_cr & CRFIELD_BIT0);
 172 }
 173
 174 /* __dissect_cr takes a bitfield directly, not the full condition register.
 175  * This is a helper for dissect_cr_rn.
 176  */
 177 inline static void __dissect_cr(unsigned this_cr) {
 178 if (cr_negative_set(this_cr))
 179    printf("%s(LT)", verbose ? " 0x1=Negative" : "");
 180
 181 if (cr_positive_set(this_cr))
 182    printf("%s(GT)", verbose ? " 0x2=Positive" : "");
 183
 184 if (cr_zero_set(this_cr))
 185    printf("%s(EQ)", verbose ? " 0x4=Zero" : "");
 186
 187 if (cr_overflow_set(this_cr))
 188    printf("%s(SO)", verbose ? " 0x8=Overflow" : "");
 189 }
 190
 191 /* Extract one CR field */
 192 static int extract_cr_rn(unsigned long local_cr,unsigned long rn) {
 193    unsigned int masked_cr;
 194    unsigned long shifted_value;
 195
 196    shifted_value = local_cr >> ( ( (7 - rn) * 4 ) );
 197    masked_cr = shifted_value & 0xf;
 198    return masked_cr;
 199 }
 200
 201 /* Display one CR field */
 202 static void dissect_cr_rn(unsigned long local_cr, unsigned long rn) {
 203    unsigned int masked_cr;
 204
 205    masked_cr = extract_cr_rn(local_cr, rn);
 206    __dissect_cr(masked_cr);
 207 }
 208
 209 /* Display all of the CR fields... */
 210 static void dissect_cr(unsigned long local_cr) {
 211    unsigned int crn;
 212
 213    for (crn = 0; crn < 8; crn++) {
 214       dissect_cr_rn(local_cr, crn);
 215    }
 216 }
 217
 218 /* dissect the fpscr bits that are valid under valgrind.
 219  * Valgrind tracks the C (FPSCR[47]), FPCC (FPSCR[48:51)
 220  * DRN (FPSCR[29:31]) and RN (FPSCR[62:63]).
 221  */
 222 static void dissect_fpscr_valgrind(unsigned long local_fpscr) {
 223    int i;
 224    long mybit;
 225
 226    /* Print DRN fields */
 227    for (i = 29; i < 32; i++) {
 228       mybit = 1LL << (63 - i);
 229       if (mybit & local_fpscr) {
 230          printf(" %s",fpscr_strings[i]);
 231       }
 232    }
 233
 234    /* Print C and FPCC fields */
 235    for (i = 47; i < 52; i++) {
 236       mybit = 1LL << (63 - i);
 237       if (mybit & local_fpscr) {
 238          printf(" %s",fpscr_strings[i]);
 239       }
 240    }
 241
 242    /* Print RN field */
 243    for (i = 62; i < 64; i++) {
 244       mybit = 1LL << (63 - i);
 245       if (mybit & local_fpscr) {
 246          printf(" %s",fpscr_strings[i]);
 247       }
 248    }
 249 }
 250
 251 /* dissect the fpscr bits.
 252  * This prints the entire FPSCR field.  This is only called under higher
 253  * verbosities, as valgrind does not track most of these bits.
 254  */
 255 static void dissect_fpscr_raw(unsigned long local_fpscr) {
 256 /* Due to the additional involved logic, the rounding mode (RN) bits 61-62
 257  * are handled within dissect_fpscr_rounding_mode(). */
 258    int i;
 259    long mybit;
 260
 261    for (i = 0; i < 61; i++) {
 262       /* also note that the bit numbering is backwards. */
 263       mybit = 1LL << (63 - i);
 264       if (mybit & local_fpscr) {
 265          printf(" %s", fpscr_strings[i]);
 266       }
 267    }
 268 }
 269
 270 static void dissect_fpscr(unsigned long local_fpscr) {
 271    if (verbose > 1) {
 272       printf(" [[ fpscr:%lx ]] ", local_fpscr);
 273       dissect_fpscr_raw(local_fpscr);
 274    } else {
 275       dissect_fpscr_valgrind(local_fpscr);
 276    }
 277 }
 278
 279 /* Display the rounding mode */
 280 static void dissect_fpscr_rounding_mode(unsigned long local_fpscr) {
 281    /* special case handing for the rounding mode round-nearest (RN) bits. 62:63 */
 282    printf("Rounding Mode: ");
 283
 284    if (local_fpscr & FPSCR_RN_BIT62)
 285       if (local_fpscr & FPSCR_RN_BIT63)
 286          /* 0b11 */ printf("RN-to--INF");
 287       else
 288          /* 0b10 */ printf("RN-to-+INF");
 289    else
 290       if (local_fpscr & FPSCR_RN_BIT63)
 291          /* 0b01 */ printf("RN-to-Nearest");
 292       else
 293          /* 0b00 */ printf("RN-to-Zero");
 294 }
 295
 296 /*
 297  * Arithmetic, rounding, and Convert From Integer instructions will set
 298  * bits in the FPCC field to indicate the class of the result.
 299  * The table is described as follows;
 300      flags / Result value class
 301   C < > = ?
 302   1 0 0 0 1 Quiet NaN
 303   0 1 0 0 1 -Infinity
 304   0 1 0 0 0 -Normalized Number
 305   1 1 0 0 0 -Denormalized Number
 306   1 0 0 1 0 -Zero
 307   0 0 0 1 0 +Zero
 308   1 0 1 0 0 +Denormalized Number
 309   0 0 1 0 0 +Normalized Number
 310   0 0 1 0 1 +Infinity
 311 */
 312
 313 static void dissect_fpscr_result_value_class(unsigned long local_fpscr) {
 314    if (local_fpscr & FPCC_C_BIT) {
 315       if (local_fpscr & FPCC_FL_BIT)
 316             printf("-Denormalized");
 317
 318       else if (local_fpscr & FPCC_FG_BIT)
 319             printf("+Denormalized");
 320
 321       else if (local_fpscr & FPCC_FE_BIT)
 322             printf("-Zero        ");
 323
 324       else if (local_fpscr & FPCC_FU_BIT)
 325             printf("Quiet NaN    ");
 326
 327    } else {
 328       if (local_fpscr & FPCC_FL_BIT) {
 329          if (local_fpscr & FPCC_FU_BIT)
 330             printf("-Infinity    ");
 331
 332          else
 333             printf("-Normalized  ");
 334
 335       } else if (local_fpscr & FPCC_FG_BIT) {
 336          if (local_fpscr & FPCC_FU_BIT)
 337             printf("+Infinity    ");
 338
 339          else
 340             printf("+Normalized  ");
 341
 342          if (local_fpscr & FPCC_FE_BIT)
 343             printf("+Zero        ");
 344       }
 345    }
 346 }
 347
 348 /* Interpret the fields in the FPCC as they apply to the DCMX checks.
 349  * The 'Match' indicator will typically be evaluated by the caller.
 350  *
 351  *  DMCX:
 352     * DCMX bit / 0x value / Data Class
 353     *        0       0x01  NaN
 354     *        1       0x02  +Infinity
 355     *        2       0x04  -Infinity
 356     *        3       0x08  +Zero
 357     *        4       0x10  -Zero
 358     *        5       0x20  +Denormal
 359     *        6       0x40  -Denormal
 360     *        7       0x7f  ALL bits set.
 361 */
 362
 363 static void dissect_fpscr_dcmx_indicator(unsigned long local_fpscr) {
 364    if (verbose > 2) printf("fpscr_cc:%lx ", local_fpscr & (FPCC_FPRF_MASK) );
 365
 366    // See if the data class of the src value matches the set DCMX bits.
 367    if (verbose > 1) printf("%s ", (local_fpscr&FPCC_FE_BIT) ? "Match":"");
 368
 369    // Display the sign bit of the src value.
 370    if (verbose > 1) printf("SRC sign:%s ", (local_fpscr&FPCC_FL_BIT) ? "-" : "+");
 371
 372    // The src value can be either a SP or DP value, this indicates
 373    // if it is a valid SP value.
 374    if (verbose > 1) printf("%s ", (local_fpscr&FPCC_FE_BIT) ? "SP" : "");
 375 }
 376
 377 /* dissect_xer helpers*/
 378 static char * xer_strings[] = {
 379 " 0-RSVD", " 1-RSVD", " 2-RSVD", " 3-RSVD", " 4-RSVD", " 5-RSVD", " 6-RSVD",
 380 " 7-RSVD", " 8-RSVD", " 9-RSVD", "10-RSVD", "11-RSVD", "12-RSVD", "13-RSVD",
 381 "14-RSVD", "15-RSVD", "16-RSVD", "17-RSVD", "18-RSVD", "19-RSVD",
 382 "20-RSVD", "21-RSVD", "22-RSVD", "23-RSVD", "24-RSVD", "25-RSVD",
 383 "26-RSVD", "27-RSVD", "28-RSVD", "29-RSVD", "30-RSVD", "31-RSVD",
 384 /* 32 */ "SO", "OV", "CA",
 385 /* 35 */ "35-RSVD", "36-RSVD", "37-RSVD", "38-RSVD", "39-RSVD",
 386 /* 40 */ "40-RSVD", "41-RSVD", "42-RSVD", "43-RSVD",
 387 /* 44 */ "OV32", "CA32",
 388 /* 46 */ "46-RSVD", "47-RSVD", "48-RSVD", "49-RSVD", "50-RSVD", "51-RSVD",
 389          "52-RSVD", "53-RSVD", "54-RSVD", "55-RSVD", "56-RSVD",
 390 /* 57:63 # bytes transferred by a Load/Store String Indexed instruction. */
 391          "LSI/SSI-0", "LSI/SSI-1", "LSI/SSI-2", "LSI/SSI-3",
 392          "LSI/SSI-4", "LSI/SSI-5", "LSI/SSI-6",
 393 };
 394
 395 /* Dissect the XER register contents.
 396  */
 397 static void dissect_xer_raw(unsigned long local_xer) {
 398    int i;
 399    long mybit;
 400
 401    for (i = 0; i <= 63; i++) {
 402       mybit = 1ULL << (63 - i); /* compensate for reversed bit numbering. */
 403       if (mybit & local_xer)
 404          printf(" %s", xer_strings[i]);
 405    }
 406 }
 407 /* Display only the XER contents that are relevant for our tests.
 408  * this is currently the OV and OV32 bits.  */
 409 static void dissect_xer_valgrind(unsigned long local_xer) {
 410    int i;
 411    long mybit;
 412       i = 33;  // OV
 413       mybit = 1ULL << (63 - i);
 414       if (mybit & local_xer) printf(" %s", xer_strings[i]);
 415       i = 44;  // OV32
 416       mybit = 1ULL << (63 - i);
 417       if (mybit & local_xer) printf(" %s", xer_strings[i]);
 418 }
 419
 420
 421 /* */
 422 static void dissect_xer(unsigned long local_xer) {
 423    if (verbose > 1)
 424       printf(" [[ xer:%lx ]]", local_xer);
 425    if (verbose > 2 )
 426       dissect_xer_raw(local_xer);
 427    else
 428       dissect_xer_valgrind(local_xer);
 429 }
 430
 431
 432 /* DFP helpers for bcd-to-dpd, dpd-to-bcd, misc.
 433  * pulled from vex/.../host_generic_simd64.c
 434  */
 435 /*------------------------------------------------------------------*/
 436 /* Decimal Floating Point (DFP) helper functions */
 437 /*------------------------------------------------------------------*/
 438 #define NOT( x )    ( ( ( x ) == 0) ? 1 : 0)
 439 #define GET( x, y ) ( ( ( x ) & ( 0x1UL << ( y ) ) ) >> ( y ) )
 440 #define PUT( x, y ) ( ( x )<< ( y ) )
 441
 442 static unsigned long dpb_to_bcd( unsigned long chunk )
 443 {
 444    int a, b, c, d, e, f, g, h, i, j, k, m;
 445    int p, q, r, s, t, u, v, w, x, y;
 446    unsigned long value;
 447
 448    /* convert 10 bit densely packed BCD to BCD */
 449    p = GET( chunk, 9 );
 450    q = GET( chunk, 8 );
 451    r = GET( chunk, 7 );
 452    s = GET( chunk, 6 );
 453    t = GET( chunk, 5 );
 454    u = GET( chunk, 4 );
 455    v = GET( chunk, 3 );
 456    w = GET( chunk, 2 );
 457    x = GET( chunk, 1 );
 458    y = GET( chunk, 0 );
 459
 460    /* The BCD bit values are given by the following boolean equations.*/
 461    a = ( NOT(s) & v & w ) | ( t & v & w & s ) | ( v & w & NOT(x) );
 462    b = ( p & s & x & NOT(t) ) | ( p & NOT(w) ) | ( p & NOT(v) );
 463    c = ( q & s & x & NOT(t) ) | ( q & NOT(w) ) | ( q & NOT(v) );
 464    d = r;
 465    e = ( v & NOT(w) & x ) | ( s & v & w & x ) | ( NOT(t) & v & x & w );
 466    f = ( p & t & v & w & x & NOT(s) ) | ( s & NOT(x) & v ) | ( s & NOT(v) );
 467    g = ( q & t & w & v & x & NOT(s) ) | ( t & NOT(x) & v ) | ( t & NOT(v) );
 468    h = u;
 469    i = ( t & v & w & x ) | ( s & v & w & x ) | ( v & NOT(w) & NOT(x) );
 470    j = ( p & NOT(s) & NOT(t) & w & v ) | ( s & v & NOT(w) & x )
 471       | ( p & w & NOT(x) & v ) | ( w & NOT(v) );
 472    k = ( q & NOT(s) & NOT(t) & v & w ) | ( t & v & NOT(w) & x )
 473       | ( q & v & w & NOT(x) ) | ( x & NOT(v) );
 474    m = y;
 475
 476    value = PUT(a, 11) | PUT(b, 10) | PUT(c, 9) | PUT(d, 8) | PUT(e, 7)
 477                | PUT(f, 6) | PUT(g, 5) | PUT(h, 4) | PUT(i, 3) | PUT(j, 2)
 478                | PUT(k, 1) | PUT(m, 0);
 479     return value;
 480 }
 481 #undef NOT
 482 #undef GET
 483 #undef PUT
 484
 485
 486 typedef union dfp_union {
 487    _Decimal128  dec_val128;
 488    struct {
 489 #if defined(VGP_ppc64le_linux)
 490    unsigned long vall;
 491    unsigned long valu;
 492 #else
 493    unsigned long valu;
 494    unsigned long vall;
 495 #endif
 496    } u128;
 497 } dfp_val_t;
 498
 499 /* Based on and enhanced from the dfp128_vals table in test_dfp5.c.
 500  * Todo: Refine/refactor and turn into a build_table function.
 501  */
 502
 503 static unsigned long dfp128_vals[] = {
 504 #ifdef EXHAUSTIVE_TESTS
 505    // Some finite numbers
 506    0x2208000000000000ULL, 0x0000000000000001ULL, //  1 *10^0
 507    0xa208800000000000ULL, 0x0000000000000001ULL, // -1 *10^1
 508    0x0000000000000000ULL, 0x0000000000000001ULL, //  1 *10^-6176. (smallest exp)
 509    0x43ffc00000000000ULL, 0x0000000000000001ULL, //  1 *10^6111
 510    0x6fffc00000000000ULL, 0x0000000000000001ULL, // foo *10^2015.
 511    0x67ffc00000000000ULL, 0x0000000000000001ULL, // foo *10^-2081.
 512    0x77ffc00000000000ULL, 0x0000000000000001ULL, //  1 *10^6111 (largest exp)
 513    0x77ffffffffffffffULL, 0xffffffffffffffffULL, // max possible value *10^6111 (largest exp)
 514    0x0000000000000000ULL, 0x0000000000000001ULL, // min possible value 1 *10^-6176. (smallest exp)
 515    0x8000000000000000ULL, 0x0000000000000001ULL, // -1 *10^-6176. (smallest exp)
 516
 517    /* data bits sprinkled across the significand field. */
 518    0xa208800001000000ULL, 0x0000000000010000ULL, //-foo *10^1
 519    0xa208800000000100ULL, 0x0000000000000100ULL, //-foo *10^1
 520    0xa208800000000000ULL, 0x0000100000000000ULL, //-foo *10^1
 521    0xa208800000000000ULL, 0x0000000001000000ULL, //-foo *10^1
 522    0xa208800000000000ULL, 0x0000000000000001ULL, //-foo *10^1
 523
 524    // pre-existing dfp128 values:
 525    0x2207c00000000000ULL, 0x0000000000000e50ULL, // foo * 10^-1
 526    0x2207c00000000000ULL, 0x000000000014c000ULL, // foo * 10^-1
 527    0xa207c00000000000ULL, 0x00000000000000e0ULL, // foo * 10^-1
 528    0x2206c00000000000ULL, 0x00000000000000cfULL, // foo * 10^-5
 529    0xa205c00000000000ULL, 0x000000010a395bcfULL, // foo * 10^-9
 530    0x6209400000fd0000ULL, 0x00253f1f534acdd4ULL, // foo * 10^-4091
 531    0x000400000089b000ULL, 0x0a6000d000000049ULL, // very small number // foo * 10^-6160
 532
 533    // flavors of zero
 534    0x2208000000000000ULL, 0x0000000000000000ULL, // 0*10^256
 535    0xa208000000000000ULL, 0x0000000000000000ULL, // -0*10^0
 536    0xa248000000000000ULL, 0x0000000000000000ULL, // 0*10^256
 537
 538    // flavors of NAN
 539    0x7c00000000000000ULL, 0x0000000000000000ULL, // quiet
 540    0xfc00000000000000ULL, 0xc00100035b007700ULL, // NAN
 541    0x7e00000000000000ULL, 0xfe000000d0e0a0d0ULL, // signaling NAN
 542
 543    // flavors of Infinity
 544    0x7800000000000000ULL, 0x0000000000000000ULL, // +inf
 545    0xf800000000000000ULL, 0x0000000000000000ULL, // -inf
 546    0xf900000000000000ULL, 0x0000000000000000ULL  // -inf
 547 #else
 548    0x2208000000000000ULL, 0x0000000000000001ULL, //  1 *10^0
 549    0x77ffffffffffffffULL, 0xffffffffffffffffULL, // max possible value *10^6111 (largest exp)
 550    0xa208000000000000ULL, 0x0000000000000000ULL, // -0*10^0
 551    0xfc00000000000000ULL, 0xc00100035b007700ULL, // NAN
 552    0x7e00000000000000ULL, 0xfe000000d0e0a0d0ULL, // signaling NAN
 553    0xf800000000000000ULL, 0x0000000000000000ULL, // -inf
 554 #endif
 555 };
 556
 557 #define NUM_DFP128_VALS (sizeof(dfp128_vals) / sizeof(unsigned long))
 558 unsigned long nb_dfp128_vals = NUM_DFP128_VALS;
 559
 560 /* Todo: update dfp64_vals to match dfp128_vals content. */
 561
 562 static unsigned long dfp64_vals[] = {
 563 #ifdef EXHAUSTIVE_TESTS
 564    0x77fcffffffffffffULL, // max possible value 9..9 *10^369 (largest exp)
 565    0x0000000000000001ULL, // min possible nonzero value 1 *10^-398. (smallest exp)
 566    0x4248000000000001ULL, // 1*10^260
 567    0x2234000000000e50ULL, // foo*10^-1
 568    0x223400000014c000ULL, //
 569    0xa2340000000000e0ULL, //
 570    0x22240000000000cfULL, // foo*10^-5
 571    0xa21400010a395bcfULL, // negative -foo*10^-9
 572    0x6e4d3f1f534acdd4ULL, // huge number foo*10^5
 573    0x000400000089b000ULL, // very small number foo*10^-397
 574
 575    // flavors of zero
 576    0x2238000000000000ULL,
 577    0xa238000000000000ULL, // 0 * 10 ^0
 578    0x4248000000000000ULL, // 0 * 10 ^260
 579
 580    // flavors of NAN
 581    0x7e34000000000111ULL, //signaling NaN
 582    0xfe000000d0e0a0d0ULL, //signaling NaN
 583    0xfc00000000000000ULL, //quiet NaN
 584
 585    // flavors of Infinity
 586    0x7800000000000000ULL, //+Inf
 587    0xf800000000000000ULL, //-Inf
 588    0x7a34000000000000ULL, //+Inf
 589 #else
 590    0x77fcffffffffffffULL, // max possible value 9..9 *10^369 (largest exp)
 591    0x4248000000000000ULL, // 0 * 10 ^260
 592    0xfe000000d0e0a0d0ULL, //signaling NaN
 593    0xf800000000000000ULL, //-Inf
 594 #endif
 595 };
 596
 597 #define NUM_DFP64_VALS (sizeof(dfp64_vals) / sizeof(unsigned long))
 598 unsigned long nb_dfp64_vals = NUM_DFP64_VALS;
 599
 600 /* shift helpers */
 601 #define SH_0  0
 602 #define SH_1  1
 603 #define SH_2  15
 604 #define SH_3  63
 605
 606 static uint64_t shift_amounts[] = {
 607    SH_0,
 608    SH_1,
 609    SH_2,
 610    SH_3,
 611 #define SHIFT_ARRAY_SIZE 4
 612 };
 613
 614 /* vector splat helpers */
 615 #define SPLAT0 0
 616 #define SPLAT1 1
 617 #define SPLAT2 0xaa
 618 #define SPLAT3 0x55
 619 #define SPLAT4 0xff
 620
 621 static uint64_t splat_values[] = {
 622    SPLAT0,
 623    SPLAT1,
 624    SPLAT2,
 625    SPLAT3,
 626    SPLAT4,
 627 #define SPLAT_ARRAY_SIZE 5
 628 };
 629
 630 /* a small memory range used to test load-from and store-to vsx */
 631 #define BUFFER_SIZE 4
 632 #define MAX_BUFFER_PATTERNS 6
 633 unsigned long buffer[BUFFER_SIZE];
 634
 635 static void initialize_buffer(int t)
 636 {
 637    int x;
 638
 639    for (x = 0; x < BUFFER_SIZE; x++)
 640       /* Don't want each of the 32-bit chunks to be identical. Loads of a
 641        * byte from the wrong 32-bit chuck are not detectable if the chunks
 642        * are identical.
 643        */
 644       switch((t+x)%BUFFER_SIZE) {
 645       case 0:
 646          buffer[x] = 0xffffffffffffffff;
 647          break;
 648       case 1:
 649          buffer[x] = 0x0001020304050607;
 650          break;
 651       case 2:
 652          buffer[x] = 0x5555555555555555;
 653          break;
 654       case 3:
 655          buffer[x] = 0x0000000000000000;
 656          break;
 657       case 4:
 658          buffer[x] = 0x5a05a05a05a05a05;
 659          break;
 660       case 5:
 661          buffer[x] = 0x0102030405060708;
 662          break;
 663       default:
 664          buffer[x] = 0x1010101010101010;
 665          break;
 666    }
 667 }
 668
 669 #define PATTERN_SIZE 5
 670 unsigned long pattern[PATTERN_SIZE] = {
 671         0xffffffffffffffff,
 672         0xaaaaaaaaaaaaaaaa,
 673         0x5152535455565758,
 674         0x0000000000000000,
 675         0xffaa5599113377cc,
 676 };
 677
 678
 679 static void dump_small_buffer(void) {
 680    int x;
 681
 682    printf("[ ");
 683
 684    for (x = 0; x < BUFFER_SIZE; x++)
 685       printf("%016lx ", buffer[x] );
 686
 687    printf("]");
 688 }
 689
 690 /* value to be shifted */
 691 static uint64_t values_to_shift[] = {
 692                   0x0,
 693                   0x1,
 694                  0x10,
 695                 0x100,
 696                0x1000,
 697               0x10000,
 698              0x100000,
 699             0x1000000,
 700            0x10000000,
 701           0x100000000,
 702          0x1000000000,
 703         0x10000000000,
 704        0x100000000000,
 705       0x1000000000000,
 706      0x10000000000000,
 707     0x100000000000000,
 708    0x1000000000000000,
 709                   0xf,
 710                  0x1f,
 711                 0x10f,
 712                0x100f,
 713               0x1000f,
 714              0x10000f,
 715             0x100000f,
 716            0x1000000f,
 717           0x10000000f,
 718          0x100000000f,
 719         0x1000000000f,
 720        0x10000000000f,
 721       0x100000000000f,
 722      0x1000000000000f,
 723     0x10000000000000f,
 724    0x100000000000000f,
 725                   0x7,
 726                  0x70,
 727                 0x700,
 728                0x7000,
 729               0x70000,
 730              0x700000,
 731             0x7000000,
 732            0x70000000,
 733           0x700000000,
 734          0x7000000000,
 735         0x70000000000,
 736        0x700000000000,
 737       0x7000000000000,
 738      0x70000000000000,
 739     0x700000000000000,
 740    0x7000000000000000,
 741                   0x8,
 742                  0x80,
 743                 0x800,
 744                0x8000,
 745               0x80000,
 746              0x800000,
 747             0x8000000,
 748            0x80000000,
 749           0x800000000,
 750          0x8000000000,
 751         0x80000000000,
 752        0x800000000000,
 753       0x8000000000000,
 754      0x80000000000000,
 755     0x800000000000000,
 756    0x8000000000000000,
 757    0xffffffffffffffff,
 758    0
 759 #define SHIFT_VALUES_SIZE 66
 760 };
 761
 762 /* DFP related helper functions: */
 763
 764 /* For DFP finite numbers, the combination field (G field) is a
 765  * combination of the exponent and the LMD (Left Most Digit) of the
 766  * significand.  The fields are encoded/decoded as described in the
 767  * table here.
 768  *       00       01      10   -< Exponent bits.
 769  * 0:   00000   01000   10000
 770  * ...
 771  * 7:   00111   01111   10111
 772  * 8:   11000   11010   11100
 773  * 9:   11001   11011   11101  (encoded special field).
 774  * |
 775  * ^ LMD value.
 776 */
 777 #define DFP_GFIELD_MASK  0x7c00000000000000UL
 778 #define DFP_GFIELD_SHIFT 58
 779
 780 static unsigned int special_field_LMD(uint64_t dword1) {
 781    unsigned long g_field_specials;
 782    int left_two_bits;
 783    int right_three_bits;
 784
 785    g_field_specials = (dword1 & DFP_GFIELD_MASK) >> DFP_GFIELD_SHIFT;
 786    left_two_bits = (g_field_specials & 0x18) >> 3;
 787    right_three_bits = g_field_specials & 0x07;
 788
 789    /* The LMD result maps directly to the right_three_bits value as
 790     * long as the left two bits are 0b00,0b01,0b10.  So a compare
 791     * against 3 is sufficient to determine if we can return the right
 792     * three bits directly.  (LMD values 0..7).
 793     */
 794    if (left_two_bits < 3) {
 795       return (right_three_bits);
 796    }
 797
 798    /* LMD values of 8 or 9 require a bit of swizzle, but a check of
 799     * the right-most bit is sufficient to determine whether LMD value
 800     * is 8 or 9.
 801     */
 802    if (right_three_bits & 0x1)
 803       return 9;
 804    else
 805       return 8;
 806 }
 807
 808 /* Returns the exponent bits, as decoded from the G field. */
 809 static inline int special_field_exponent_bits(unsigned long dword1) {
 810    unsigned long g_field_specials;
 811    int left_two_bits;
 812    int right_three_bits;
 813
 814    g_field_specials = (dword1 & DFP_GFIELD_MASK) >> DFP_GFIELD_SHIFT;
 815    left_two_bits = (g_field_specials & 0x18) >> 3;
 816    right_three_bits = g_field_specials & 0x07;
 817
 818    /* The special field exponent bits maps directly to the left_two_bits
 819     * value as long as the left two bits are 0b00,0b01,0b10.  So a compare
 820     * against 3 is sufficient for those values.
 821     */
 822    if (left_two_bits < 3) {
 823       return (left_two_bits);
 824    }
 825
 826    switch(right_three_bits) {
 827       case 0:
 828       case 1: return 0x0;
 829       case 2:
 830       case 3: return 0x1;
 831       case 4:
 832       case 5: return 0x2;
 833       case 6: /* Infinity */ return 0x0;
 834       case 7: /* NaN */  return 0x0;
 835    }
 836    return -1;  /* should never hit this */
 837 }
 838
 839 /* get_declet().  Return a 10-bit declet, beginning at the 'start'
 840  * offset.
 841  *
 842  * | dword1 | dword0 |
 843  * | 0    63|64   127|
 844  */
 845 #define TEN_BITS 0x03ffULL
 846
 847 static inline int get_declet(int start, uint64_t dword1, uint64_t dword0) {
 848    unsigned long local_declet;
 849    unsigned int dword0_shift;
 850    unsigned int dword1_shift;
 851
 852    dword1_shift = 63 - (start + 9);
 853    dword0_shift = 127 - (start + 9);
 854
 855    if (verbose>5) printf("\n%s (%d) %016lx %016lx",
 856                          __FUNCTION__, start, dword1, dword0);
 857
 858    if ((start + 9) < 63) { /* fully within dword1 */
 859       local_declet = (dword1 >> dword1_shift) & TEN_BITS;
 860
 861    } else if (start >= 65) {/* fully within dword0 */
 862       local_declet = (dword0 >> dword0_shift) & TEN_BITS;
 863
 864    } else { /* straddling the two dwords*/
 865       unsigned long mask_dword0;
 866       unsigned long mask_dword1;
 867
 868       mask_dword1 = TEN_BITS >> (64 - dword0_shift);
 869       mask_dword0 = TEN_BITS << (dword0_shift);
 870       local_declet =
 871          ((dword1 & mask_dword1) << (64-dword0_shift)) +
 872          ((dword0 & mask_dword0) >> dword0_shift);
 873    }
 874    return local_declet;
 875 }
 876
 877 static int get_bcd_digit_from_dpd(int start, uint64_t dword1,
 878                                   uint64_t dword0) {
 879    long bcd_digit;
 880    long declet;
 881
 882    declet = get_declet(start, dword1, dword0);
 883    bcd_digit = dpb_to_bcd(declet);
 884    return bcd_digit;
 885 }
 886
 887
 888 /* The 'exponent left' shift is for moving the leftmost two bits
 889  * of the exponent down to where they can be easily merged with the
 890  * rest of the exponent.
 891  */
 892 #define DFP128_EXPONENT_RIGHT_MASK       0x03ffc00000000000
 893 #define DFP64_EXPONENT_RIGHT_MASK        0x03fc000000000000
 894 #define DFP128_EXPONENT_RIGHT_MASK_SHIFT 46
 895 #define DFP64_EXPONENT_RIGHT_MASK_SHIFT  50
 896 #define DFP128_EXPONENT_LEFT_SHIFT       12
 897 #define DFP64_EXPONENT_LEFT_SHIFT         8
 898
 899 #define DFP_NAN                          0x1f
 900 #define DFP_INF                          0x1e
 901 #define DFP_SIGNALING_NAN_BIT            0x0200000000000000
 902
 903 /* Start of the Trailing Significand field is at bit # .. */
 904 #define DFP128_T_START         18
 905 #define DFP64_T_START          14
 906
 907 //The exponent bias value is 101 for DFP Short, 398
 908 //for DFP Long, and 6176 for DFP Extended.
 909 #define DFP128_EXPONENT_BIAS 6176
 910 #define DFP64_EXPONENT_BIAS   398
 911
 912 /* return the dfp exponent from the leading dword. */
 913 static inline signed long dfp128_exponent(unsigned long dword1) {
 914    unsigned long exponent_left;
 915    unsigned long exponent_right;
 916    unsigned long biased_exponent;
 917    signed long exponent;
 918
 919    exponent_left = special_field_exponent_bits(dword1);
 920    exponent_right = (dword1 & DFP128_EXPONENT_RIGHT_MASK);
 921    biased_exponent = (exponent_left << DFP128_EXPONENT_LEFT_SHIFT) +
 922                      (exponent_right >> DFP128_EXPONENT_RIGHT_MASK_SHIFT);
 923
 924    /* Unbias the exponent. */
 925    exponent = biased_exponent - DFP128_EXPONENT_BIAS;
 926
 927    return exponent;
 928 }
 929
 930 /* Interpret the paired 64-bit values as a extended (quad) 128 bit DFP.
 931  *
 932  * | Significand | Combination Field/    |                          |
 933  * | sign bit    | Encoded Exponent      | remainder of significand |
 934  * |0            |1                    17|18                     127|
 935  *  ^ (bit0) Significand sign bit.
 936  *                ^ (bit 1:17) Combination field. Contains high bits of
 937  *                  exponent (encoded), LMD of significand (encoded),
 938  *                  and the remainder of the exponent.  First five bits
 939  *                  will indicate special cases NAN or INF.
 940  *                                   ^ (bit 18:127) Remainder of the
 941  *                                     significand.
 942  */
 943
 944 #define DFP128_COMBINATION_MASK      0x7fffc
 945 #define DFP64_COMBINATION_MASK       0x7ffc
 946 #define DFP128_COMBINATION_SHIFT     46
 947 #define DFP64_COMBINATION_SHIFT      50
 948 #define DFP_SPECIAL_SYMBOLS_MASK     0x1f
 949 #define DFP_SPECIAL_SYMBOLS_SHIFT    58
 950
 951 static inline void dissect_dfp128_float(uint64_t dword1, uint64_t dword0) {
 952    long signbit;
 953    signed long exponent;
 954    unsigned long gfield_special_symbols;
 955    unsigned long lmd_digit;
 956    unsigned long bcd_digits[13];
 957    int i;
 958    int silent=0; // suppress leading zeros from the output.
 959
 960    if (verbose > 5) printf("RAW128: %016lx %016lx ", dword1, dword0);
 961
 962    signbit = (dword1 >> 63);
 963
 964    if (signbit) printf("-");
 965    else         printf("+");
 966
 967    gfield_special_symbols =
 968       ((dword1 >> DFP_SPECIAL_SYMBOLS_SHIFT) & DFP_SPECIAL_SYMBOLS_MASK);
 969
 970    switch (gfield_special_symbols) {
 971       case DFP_INF:
 972          printf(   "inf      ");
 973          break;
 974
 975       case DFP_NAN:
 976          if (dword1 & DFP_SIGNALING_NAN_BIT)
 977             printf("SNaN     ");
 978          else
 979             printf("QNaN     ");
 980          break;
 981
 982       default:
 983          printf(   "Finite   ");
 984          exponent  = dfp128_exponent(dword1);
 985          lmd_digit = special_field_LMD(dword1);
 986
 987          for (i = 0; i < 11; i++) {
 988             bcd_digits[i] = get_bcd_digit_from_dpd((DFP128_T_START
 989                                                     + 10 * i), dword1, dword0);
 990          }
 991
 992          if (lmd_digit) {
 993             silent++;
 994             printf("%01lx", lmd_digit);
 995
 996          } else {
 997             printf(" ");
 998          }
 999
1000          for (i = 0; i < 11; i++) {
1001             if (bcd_digits[i] || silent ) {
1002                silent++;
1003                printf("%03lx", bcd_digits[i]);
1004
1005             } else {
1006                /* always print at least the last zero */
1007                if (i == 10)
1008                   printf("  0");
1009
1010                else
1011                   printf("   ");
1012             }
1013          }
1014          printf(" * 10 ^ ");
1015          printf("%ld ", exponent);
1016    }
1017 }
1018
1019 /* Interpret the 64-bit values as a 64 bit DFP.
1020 *
1021 * | Significand | Combination Field/    |                          |
1022 * | sign bit    | Encoded Exponent      | remainder of significand |
1023 * |0            |1                    13|14                      63|
1024 *  ^ (bit0) Significand sign bit.
1025 *                ^ (bit 1:13) Combination field. Contains high bits of
1026 *                  exponent (encoded), LMD of significand (encoded),
1027 *                  and the remainder of the exponent.  First five bits
1028 *                  will indicate special cases NAN or INF.
1029 *                                        ^ (bit 14:63) Remainder of the
1030 *                                          significand.
1031 */
1032
1033 /* return the dfp exponent from the leading dword. */
1034 static inline signed long dfp64_exponent(unsigned long dword1) {
1035    unsigned long exponent_left;
1036    unsigned long exponent_right;
1037    unsigned long biased_exponent;
1038    signed long exponent;
1039
1040    exponent_left = special_field_exponent_bits(dword1);
1041    exponent_right = (dword1 & DFP64_EXPONENT_RIGHT_MASK);
1042    biased_exponent = (exponent_left << DFP64_EXPONENT_LEFT_SHIFT) +
1043                      (exponent_right >> DFP64_EXPONENT_RIGHT_MASK_SHIFT);
1044
1045    /* Unbias the exponent. */
1046    exponent = biased_exponent - DFP64_EXPONENT_BIAS;
1047    return exponent;
1048 }
1049
1050 static inline void dissect_dfp64_float(uint64_t dword1) {
1051    long signbit;
1052    signed long exponent;
1053    unsigned long gfield_special_symbols;
1054    unsigned long lmd_digit;
1055    unsigned long bcd_digits[13];
1056    int i;
1057    int silent=0; // suppress leading zeros from the output.
1058
1059    if (verbose > 5) printf("RAW64: %016lx ", dword1);
1060
1061    signbit = (dword1 >> 63);
1062
1063    if (signbit) printf("-");
1064    else         printf("+");
1065
1066    gfield_special_symbols =
1067       ((dword1 >> DFP_SPECIAL_SYMBOLS_SHIFT) & DFP_SPECIAL_SYMBOLS_MASK);
1068
1069    switch (gfield_special_symbols) {
1070       case DFP_INF:
1071          printf(   "inf      ");
1072          break;
1073
1074       case DFP_NAN:
1075          if (dword1 & DFP_SIGNALING_NAN_BIT)
1076             printf("SNaN     ");
1077          else
1078             printf("QNaN     ");
1079          break;
1080
1081       default:
1082          printf(   "Finite   ");
1083          exponent  = dfp64_exponent(dword1);
1084          lmd_digit = special_field_LMD(dword1);
1085
1086          for (i = 0; i < 5; i++)
1087             bcd_digits[i] = get_bcd_digit_from_dpd((DFP64_T_START + 10 * i),
1088                                                    dword1, 0);
1089
1090          if (lmd_digit) {
1091             silent++;
1092             printf("%01lx", lmd_digit);
1093
1094          } else {
1095             printf(" ");
1096          }
1097
1098          for (i = 0; i < 5; i++) {
1099             if (bcd_digits[i] || silent) {
1100                silent++;
1101                printf("%03lx", bcd_digits[i]);
1102
1103             } else { // suppress leading zeros.
1104                /* always print at least the last zero */
1105                if (i == 4)
1106                   printf("  0");
1107
1108                else
1109                   printf("   ");
1110             }
1111          }
1112          printf(" * 10 ^ ");
1113          printf("%ld ", exponent);
1114    }
1115 }
1116
1117 static void dump_dfp128_table(void) {
1118    int i;
1119
1120    printf("DFP 128 table:\n");
1121
1122    for (i = 0; i < nb_dfp128_vals; i += 2) {
1123       printf("i=:%2d ", i);
1124       dissect_dfp128_float(dfp128_vals[i], dfp128_vals[i+1]);
1125       printf("\n");
1126    }
1127 }
1128
1129 static void dump_dfp64_table(void) {
1130    int i;
1131
1132    printf("DFP 64 table:\n");
1133
1134    for (i = 0; i<nb_dfp64_vals; i++) {
1135       printf("i=:%2d ", i);
1136       dissect_dfp64_float(dfp64_vals[i]);
1137       printf("\n");
1138    }
1139 }
1140
1141
1142 /* Data Formats for floating point.
1143  * Floating point values include the following:
1144  *  -INF -NOR -DEN -0 +0 +DEN +NOR +INF
1145  *  INFinite: When the biased exponent is the MAX possible value, and
1146  *   the fraction field is 0.
1147  *  ZERo.    biased exponent is zero, fraction is 0.
1148  *  DENormalized.   biased exponent is 0, and fraction is non-zero.
1149  *  NORmalized. All other values that are neither Zero, Denormalized,
1150  *   or Infinite.  Biased exponent=1..MAX-1.
1151  */
1152
1153 /* Quad (128bit):
1154  * | Sign | EXPonent+Bias  | FRACTION/Mantissa |
1155  *  0      1             15 16              127
1156  *  exponent is 15 bits. ranging from:  0x0000 .. 0x7fff
1157  *     0 = (zero if fraction==0, DeNormal if fraction !=0 )
1158  *     1...0x7ffe = normalized
1159  *     7fff  =  (infinite if fraction==0, NaN if fraction !=0)
1160  */
1161 #define QUAD_EXP_MASK 0x7fff
1162
1163 /* This assumes we are working on the top half of a quad stored in a 64-bit
1164  *  register.
1165  */
1166 #define QUAD_EXP_SHIFT 48
1167 #define QUAD_MANTISSA_MASK 0x0000ffffffffffff
1168 static inline unsigned long build_binary128_float(unsigned long signbit,
1169                                                   unsigned long exponent,
1170                                                   unsigned long mantissa) {
1171    unsigned long thevalue;
1172
1173    thevalue = (unsigned long) (signbit << 63) |
1174       ((exponent & QUAD_EXP_MASK) << QUAD_EXP_SHIFT) |
1175       (mantissa & QUAD_MANTISSA_MASK);
1176
1177    if (verbose > 3)
1178       printf("%s %lx \n", __FUNCTION__, (unsigned long)thevalue);
1179
1180    return thevalue;
1181 }
1182
1183  /* double (64bit):
1184  * | Sign | EXPonent+Bias  | FRACTION/Mantissa |
1185  *  0      1             11 12              63
1186  * exponent is 11 bits. ranging from:  0x000 .. 0x7ff
1187  *    0 = (zero if fraction==0, DeNormal if fraction !=0 )
1188  *    1...0x7fe = normalized
1189  *    7ff  =  (infinite if fraction==0, NaN if fraction !=0)
1190 */
1191 #define DOUBLE_EXP_MASK 0x7ff
1192 #define DOUBLE_EXP_SHIFT 52
1193 #define DOUBLE_MANTISSA_MASK 0x000fffffffffffff
1194
1195 static inline unsigned long build_binary64_float(unsigned long signbit,
1196                                                  unsigned long exponent,
1197                                                  unsigned long mantissa) {
1198    unsigned long  thevalue;
1199
1200    thevalue = (unsigned long ) (signbit << 63) |
1201       ((exponent & DOUBLE_EXP_MASK) << DOUBLE_EXP_SHIFT) |
1202       (mantissa & DOUBLE_MANTISSA_MASK );
1203
1204    if (verbose > 3)
1205       printf("%s %lx \n", __FUNCTION__, (unsigned long)thevalue);
1206
1207    return thevalue;
1208 }
1209
1210  /* floating point single (32bit):
1211  * | Sign | EXPonent+Bias  | FRACTION/Mantissa |
1212  *  0      1              8 9                31
1213  * exponent is 8 bits. ranging from:  0x00 .. 0xff
1214  *    0 = (zero if fraction==0, DeNormal if fraction !=0 )
1215  *    1...0x7e = normalized
1216  *    7f = (infinite if fraction==0, NaN if fraction !=0) */
1217 #define SINGLE_EXP_MASK 0xff
1218 #define SINGLE_EXP_SHIFT 23
1219 #define SINGLE_MANTISSA_MASK 0x007fffff
1220
1221 /* This is building the 32-bit float. */
1222 static inline unsigned long build_binary32_float(unsigned long signbit,
1223                                                  unsigned long exponent,
1224                                                  unsigned long mantissa) {
1225    unsigned long thevalue;
1226    unsigned long local_signbit;
1227    unsigned long local_exponent;
1228    unsigned long local_mantissa;
1229
1230    local_signbit  = (signbit != 0) << 31;
1231    local_exponent = ((exponent & SINGLE_EXP_MASK) << SINGLE_EXP_SHIFT);
1232    local_mantissa = (mantissa & SINGLE_MANTISSA_MASK);
1233
1234    thevalue = (unsigned long) (local_signbit) |
1235       (local_exponent) |
1236       (local_mantissa);
1237
1238    if (verbose > 3)
1239       printf("%s %lx \n", __FUNCTION__, (unsigned long)thevalue);
1240
1241    return thevalue;
1242 }
1243
1244 /* floating point half (16bit):
1245  * | Sign | EXPonent+Bias  | FRACTION/Mantissa |
1246  *  0      1              6 7               15
1247  * exponent is 6 bits.  0x00 .. 0x7e masked with EXP_MASK
1248  *    0 = (zero if fraction==0, DeNormal if fraction !=0 )
1249  *    1...0x7d = normalized
1250  *    7e = (infinite if fraction==0, NaN if fraction !=0) */
1251 /* when extracting the exponent from the 16-bit half-word, use this mask. */
1252 #define HALF_EXP_MASK 0x7e00
1253
1254 /* when building the 16-bit half-word, mask against this,
1255  * then shift into place
1256  */
1257 #define HALF_EXP_MASK_NORMALIZED 0x3f
1258 #define HALF_EXP_SHIFT 9
1259 #define HALF_MANTISSA_MASK 0x01ff
1260
1261 /* This is building the 16-bit float. */
1262 static inline unsigned long build_binary16_float(unsigned long in_signbit,
1263                                                  unsigned long exponent,
1264                                                  unsigned mantissa) {
1265    unsigned long thevalue;
1266    unsigned long local_signbit;
1267    unsigned long local_exponent;
1268    unsigned long local_mantissa;
1269
1270    local_signbit = (in_signbit != 0) << 15;
1271
1272    local_exponent= ((exponent & HALF_EXP_MASK_NORMALIZED) << HALF_EXP_SHIFT);
1273    local_mantissa = (mantissa & HALF_MANTISSA_MASK);
1274
1275    thevalue = (unsigned long) (local_signbit) | (local_exponent)
1276       | (local_mantissa);
1277
1278    if (verbose > 3)
1279       printf("%s %lx \n", __FUNCTION__, (unsigned long)thevalue);
1280
1281    return thevalue;
1282 }
1283
1284 /* dissect_binary128_float:
1285  * Interpret the (high half) 64-bit value as normal/denormal/inf/NaN.
1286  * This is as it would be interpreted as the MSB portion of
1287  *  a 128-bit wide QUAD.
1288  */
1289 static inline void dissect_binary128_float(uint64_t value) {
1290    unsigned long signbit;
1291    unsigned long exponent;
1292    unsigned long  mantissa;
1293
1294    signbit  = (value >> 63);
1295    exponent = ( QUAD_EXP_MASK & (value >> QUAD_EXP_SHIFT));
1296    mantissa = ( QUAD_MANTISSA_MASK & value);
1297
1298    if (verbose > 4) printf("128 bit:");
1299
1300    if (signbit) printf("-");
1301    else         printf("+");
1302
1303    switch (exponent) {
1304       case 0x0:
1305          if (mantissa == 0) printf("zero     ");
1306          else               printf("denormal ");
1307          break;
1308
1309       case QUAD_EXP_MASK:
1310          if (mantissa == 0) printf("inf      ");
1311          else               printf("NaN      ");
1312          break;
1313
1314       default:              printf("Normal   ");
1315    }
1316
1317    if (verbose > 4)
1318       printf("%lx %4lx %16lx %16lx \n", signbit, exponent, mantissa, value);
1319 }
1320
1321 /* Interpret the 64-bit value as normal/denormal/inf/NaN
1322  * this is as interpreted as the 64-bit float
1323  */
1324 static inline void dissect_binary64_float(uint64_t value) {
1325    unsigned long signbit;
1326    unsigned long exponent;
1327    unsigned long mantissa;
1328
1329    signbit  = (value >> 63); // bit0
1330    exponent = ( DOUBLE_EXP_MASK & (value >> DOUBLE_EXP_SHIFT));
1331    mantissa = ( DOUBLE_MANTISSA_MASK & value);
1332
1333    if (verbose > 4) printf(" 64 bit:");
1334
1335    if (signbit) printf("-");
1336    else         printf("+");
1337
1338    switch (exponent) {
1339       case 0x0:
1340          if (mantissa == 0) printf("zero     ");
1341          else               printf("denormal ");
1342          break;
1343
1344       case DOUBLE_EXP_MASK:
1345          if (mantissa == 0) printf("inf      ");
1346          else               printf("NaN      ");
1347          break;
1348
1349       default:              printf("Normal   ");
1350    }
1351
1352    if (verbose>4)
1353       printf("%lx %4lx %16lx %16lx\n", signbit, exponent, mantissa, value);
1354 }
1355
1356 /* interpret the 32-bit value as normal/denormal/inf/NaN.
1357  * Note that the value is stored in the upper half of a
1358  * 64-bit, which is itself in the upper half of a quad.
1359  */
1360 static inline void dissect_binary32_float(uint64_t value) {
1361    unsigned long signbit;
1362    unsigned long exponent;
1363    unsigned long mantissa;
1364    unsigned long adj_value;
1365
1366    /* shift down to where the offsets make more sense.*/
1367    adj_value = value;   //>>32;
1368    signbit  = (adj_value >> 31);
1369    exponent = ( SINGLE_EXP_MASK & (adj_value >> SINGLE_EXP_SHIFT));
1370    mantissa = ( SINGLE_MANTISSA_MASK & adj_value);
1371
1372    if (verbose > 4) printf(" 32 bit:");
1373
1374    if (signbit) printf("-");
1375    else         printf("+");
1376
1377    switch (exponent) {
1378       case 0x0:
1379          if (mantissa == 0) printf("zero     ");
1380          else               printf("denormal ");
1381          break;
1382
1383       case SINGLE_EXP_MASK:
1384          if (mantissa == 0) printf("inf      ");
1385          else               printf("NaN      ");
1386          break;
1387
1388       default:              printf("Normal   ");
1389    }
1390
1391    if (verbose>4)
1392       printf("%lx %4lx %16lx %16lx \n", signbit, exponent, mantissa, adj_value);
1393 }
1394
1395 /* Interpret the 16-bit value as normal/denormal/inf/NaN. */
1396 static inline void dissect_binary16_float(uint64_t value) {
1397    unsigned long signbit;
1398    unsigned long exponent;
1399    unsigned long mantissa;
1400    unsigned long adj_value;
1401
1402    adj_value = (value & 0xffff);
1403    signbit  = ((adj_value & 0x8000) > 1);
1404    exponent = ((adj_value & HALF_EXP_MASK ) >> HALF_EXP_SHIFT) ;
1405    mantissa = (adj_value & HALF_MANTISSA_MASK);
1406
1407    if (verbose > 4) printf(" 16 bit:");
1408
1409    if (signbit) printf("-");
1410    else         printf("+");
1411
1412    switch (exponent) {
1413       case 0x0:
1414          if (mantissa == 0) printf("zero     ");
1415          else               printf("denormal ");
1416          break;
1417
1418       case HALF_EXP_MASK:
1419          if (mantissa == 0) printf("inf      ");
1420          else               printf("NaN      ");
1421          break;
1422
1423       default:              printf("Normal   ");
1424    }
1425
1426    if (verbose > 4)
1427       printf("%lx %4lx %16lx %16lx \n",
1428              signbit, exponent>>HALF_EXP_SHIFT, mantissa, adj_value);
1429 }
1430
1431 #define dissect_double_as_32s(vec_foo) \
1432   printf(" "); \
1433   dissect_binary16_float((vec_foo & 0xffffffff)); \
1434   printf(" "); \
1435   dissect_binary16_float((vec_foo >> 32) & 0xffffffff);
1436
1437 #define dissect_double_as_16s(vec_foo) \
1438   printf(" "); \
1439   dissect_binary16_float((vec_foo&0xffff)); \
1440   printf(" "); \
1441   dissect_binary16_float((vec_foo>>16)&0xffff); \
1442   printf(" "); \
1443   dissect_binary16_float((vec_foo>>32)&0xffff); \
1444   printf(" "); \
1445   dissect_binary16_float((vec_foo>>48)&0xffff);
1446
1447 /* a table of exponent values for use in the float precision tests. */
1448 unsigned long exponent_table[] = {
1449 #ifdef EXHAUSTIVE_TESTS
1450   0x0000,   /* +/-0 or +/-DENormalized, depending on associated mantissa. */
1451   0x1a,     /* within NORmalized for 16,32,64,128-bit.                    */
1452   0x1f,     /* +/-INF or +/-NaN for 16bit, NORmalized for 32,64,128       */
1453   0xff,     /* +/-INF or +/-NaN for 32bit, NORmalized for 64,128          */
1454   0x7ff,    /* +/-INF or +/-NaN for 32 and 64bit, NORmalized for 128      */
1455   0x7fff,   /* +/-INF or +/-NaN for 128bit.                               */
1456 #else
1457   0x0000,   /* +/-0 or +/-DENormalized, depending on associated mantissa. */
1458   0xff,     /* +/-INF or +/-NaN for 32bit, NORmalized for 64,128          */
1459   0x7ff,    /* +/-INF or +/-NaN for 32 and 64bit, NORmalized for 128      */
1460   0x7fff,   /* +/-INF or +/-NaN for 128bit.                               */
1461 #endif
1462 };
1463 #define MAX_EXPONENTS  (sizeof(exponent_table) / sizeof(unsigned long))
1464
1465 unsigned long mantissa_table[] = {
1466 #ifdef EXHAUSTIVE_TESTS
1467   0xbeefbeefbeef, /* NOR or DEN or NaN */
1468   0x000000000000, /* ZERO or INF */
1469   0x7fffffffffff, /* NOR or DEN or NaN */
1470 #else
1471   0x000000000000, /* ZERO or INF */
1472   0x7fffffffffff, /* NOR or DEN or NaN */
1473 #endif
1474 };
1475 #define MAX_MANTISSAS (sizeof(mantissa_table) / sizeof(unsigned long))
1476
1477 /* build in 64-bit chunks, low doubleword is zero. */
1478 static unsigned long * float_vsxargs;
1479 static unsigned long * binary128_float_vsxargs = NULL;
1480 static unsigned long * binary64_float_vsxargs = NULL;
1481 static unsigned long * binary32_float_vsxargs = NULL;
1482 static unsigned long * binary16_float_vsxargs = NULL;
1483
1484 unsigned long nb_float_vsxargs;
1485
1486 #define MAX_FLOAT_VSX_ARRAY_SIZE (((MAX_EXPONENTS * MAX_MANTISSAS) * 2 + 1) * 2)
1487
1488 void build_float_vsx_tables (void)
1489 {
1490    long i = 0;
1491    unsigned long signbit;
1492    unsigned long exponent;
1493    unsigned long mantissa;/* also referred to as FRACTION in the ISA.*/
1494    unsigned long exponent_index;
1495    unsigned long mantissa_index;
1496
1497    if (verbose > 2) printf("%s\n", __FUNCTION__);
1498
1499    binary128_float_vsxargs = malloc(MAX_FLOAT_VSX_ARRAY_SIZE
1500                                     * sizeof(unsigned long));
1501
1502    float_vsxargs = binary128_float_vsxargs;
1503
1504    binary64_float_vsxargs = malloc(MAX_FLOAT_VSX_ARRAY_SIZE
1505                                    * sizeof(unsigned long));
1506
1507    binary32_float_vsxargs = malloc(MAX_FLOAT_VSX_ARRAY_SIZE
1508                                    * sizeof(unsigned long));
1509    binary16_float_vsxargs = malloc(MAX_FLOAT_VSX_ARRAY_SIZE
1510                                    * sizeof(unsigned long));
1511
1512    for (signbit = 0; signbit < 2; signbit++) {
1513       for (exponent_index = 0; exponent_index < MAX_EXPONENTS;
1514            exponent_index++) {
1515
1516          for (mantissa_index = 0; mantissa_index < MAX_MANTISSAS;
1517               mantissa_index++) {
1518
1519             exponent = exponent_table[exponent_index];
1520             mantissa = mantissa_table[mantissa_index];
1521
1522          if (verbose > 2) {
1523             printf("signbit:%lx ", signbit);
1524             printf("exponent:%4lx ", exponent);
1525             printf("mantissa:%lx ", mantissa);
1526             printf("\n");
1527          }
1528
1529          binary128_float_vsxargs[i] = build_binary128_float(signbit, exponent,
1530                                                             mantissa);
1531
1532          binary128_float_vsxargs[i+1] = 0;
1533
1534          binary64_float_vsxargs[i] = build_binary64_float(signbit, exponent,
1535                                                           mantissa);
1536
1537          binary64_float_vsxargs[i+1] = build_binary64_float(signbit, exponent,
1538                                                             mantissa);
1539
1540          binary32_float_vsxargs[i] = build_binary32_float(signbit, exponent,
1541                                                           mantissa);
1542
1543          binary32_float_vsxargs[i+1] = build_binary32_float(signbit, exponent,
1544                                                             mantissa);
1545
1546          binary16_float_vsxargs[i] = build_binary16_float(signbit, exponent,
1547                                                           mantissa);
1548
1549          binary16_float_vsxargs[i+1] = build_binary16_float(signbit, exponent,
1550                                                             mantissa);
1551          i += 2;
1552          }
1553       }
1554    }
1555    nb_float_vsxargs = i;
1556 }
1557
1558 /* Display entries stored in the float_vsx table.  These are used as
1559  * quad/double/singles, stored as quads. */
1560 void dump_float_vsx_table (void) {
1561    int i;
1562
1563    printf("Float VSX Table:");
1564    printf("128-bit (quad):\n");
1565
1566    for (i = 0; i < nb_float_vsxargs; i += 2) {
1567       printf("i =: %2d ", i);
1568       dissect_binary128_float(binary128_float_vsxargs[i]);
1569    }
1570
1571    printf("64-bit (double):\n");
1572
1573    for (i = 0; i< nb_float_vsxargs; i += 2) {
1574       printf("i = %2d ", i);
1575       dissect_binary64_float(binary64_float_vsxargs[i]);
1576    }
1577
1578    printf("32-bit (single):\n");
1579
1580    for (i = 0; i < nb_float_vsxargs; i += 2) {
1581       printf("i = %2d ", i);
1582       dissect_binary32_float(binary32_float_vsxargs[i]);
1583    }
1584
1585    printf("16-bit (half):\n");
1586
1587    for (i = 0; i < nb_float_vsxargs; i += 2) {
1588       printf("i =% 2d ", i);
1589       dissect_binary16_float(binary16_float_vsxargs[i]);
1590    }
1591
1592    printf("\n");
1593 }
1594
1595 static void print_dcmx_field(unsigned long local_dcmx) {
1596    /* Note - this splats out the local_dxmc field from the form used to
1597     * globally pass it, with a single set bit, into the functions that use
1598     * it.  The actual DCMX field is a bit-field from 0x00 to 0x3f. If
1599     * multiple bits are ever set, this function and the way it is passed
1600     * into the users will need to be updated.  This does not handle
1601     * multiple bits being set.
1602     */
1603
1604    printf(" DCMX=[");
1605
1606    switch(local_dcmx) {
1607       case 0: printf("ALL"); break;
1608       case 1: printf("NaN"); break;
1609       case 2: printf("+inf"); break;
1610       case 3: printf("-inf"); break;
1611       case 4: printf("+zero"); break;
1612       case 5: printf("-zero"); break;
1613       case 6: printf("+denormal"); break;
1614       case 7: printf("-denormal"); break;
1615       default: printf("other"); break;
1616    }
1617
1618    if (verbose > 3)
1619       printf(" %lx", local_dcmx);
1620
1621    printf("] ");
1622 }
1623
1624 #define MAX_CHAR_ARGS_ARRAY_SIZE 128
1625
1626 static unsigned char * char_args;
1627 unsigned long nb_char_args;
1628
1629 static void build_char_table(void) {
1630    long i = 0;
1631    char ichar;
1632
1633    char_args = memalign(32, MAX_CHAR_ARGS_ARRAY_SIZE * sizeof(char));
1634
1635 #ifdef EXHAUSTIVE_TESTS
1636    for (ichar = 'a'; ichar <= 'z'; ichar++) { char_args[i++] = ichar; }
1637    for (ichar = '0'; ichar <= '9'; ichar++) { char_args[i++] = ichar; }
1638    for (ichar = 'A'; ichar <= 'Z'; ichar++) { char_args[i++] = ichar; }
1639 #else
1640    for (ichar = 'a'; ichar <= 'z'; ichar+=6) { char_args[i++] = ichar; }
1641    for (ichar = '0'; ichar <= '9'; ichar+=6) { char_args[i++] = ichar; }
1642    for (ichar = 'A'; ichar <= 'Z'; ichar+=6) { char_args[i++] = ichar; }
1643 #endif
1644
1645    char_args[i++] = ' ';
1646    char_args[i++] = '+';
1647    char_args[i++] = '-';
1648    char_args[i++] = '/';
1649    char_args[i++] = '[';
1650    char_args[i++] = ']';
1651    char_args[i++] = '`';
1652    char_args[i++] = '_';
1653    nb_char_args = i;
1654 }
1655
1656 static void dump_char_table() {
1657    int i;
1658
1659    printf("Char Table:");
1660
1661    for (i = 0; i<nb_char_args; i++)
1662       printf("%c ", char_args[i]);
1663
1664    printf("\n");
1665 }
1666
1667 #define MAX_CHAR_RANGES_SIZE 128
1668
1669 static unsigned char * char_ranges;
1670 unsigned long nb_char_ranges;
1671
1672 static void build_char_range_table(void) {
1673 /* ... in groups of four. */
1674
1675    long i = 0;
1676    char char_start, char_end;
1677
1678    char_ranges = memalign(32, MAX_CHAR_RANGES_SIZE * sizeof(char));
1679    char_start = 'a';
1680    char_end   = 'z';
1681    char_ranges[i++] = char_start;
1682    char_ranges[i++] = char_end;
1683
1684    char_start = 'A';
1685    char_end   = 'Z';
1686    char_ranges[i++] = char_start;
1687    char_ranges[i++] = char_end;
1688
1689    char_start = '0';
1690    char_end   = '9';
1691    char_ranges[i++] = char_start;
1692    char_ranges[i++] = char_end;
1693
1694    char_start = 'f';
1695    char_end   = 'z';
1696    char_ranges[i++] = char_start;
1697    char_ranges[i++] = char_end;
1698
1699    char_start = 'a';
1700    char_end   = 'e';
1701    char_ranges[i++] = char_start;
1702    char_ranges[i++] = char_end;
1703
1704    char_start = 'A';
1705    char_end   = 'E';
1706    char_ranges[i++] = char_start;
1707    char_ranges[i++] = char_end;
1708
1709    nb_char_ranges = i;
1710 }
1711
1712 static void dump_char_range_table()
1713 {
1714    int i;
1715
1716    printf("Char Range Table:");
1717
1718    for (i = 0; i < nb_char_ranges; i += 4) {
1719        printf(" [ %c-%c %c-%c ] ",
1720                 char_ranges[i], char_ranges[i+1],
1721                 char_ranges[i+2], char_ranges[i+3] );
1722    }
1723
1724    printf("\n");
1725 }
1726
1727 static HWord_t *iargs = NULL;
1728 static int nb_iargs = 0;
1729
1730 static void build_iargs_table (void) {
1731    uint64_t tmp;
1732    int i = 0;
1733
1734    iargs = malloc(20 * sizeof(HWord_t));
1735
1736    for (tmp = 0; ; tmp = 123456789*tmp + 123456789999) {
1737       if ((long)tmp < 0 )
1738          tmp = 0xFFFFFFFFFFFFFFFFULL;
1739
1740       iargs[i++] = tmp;
1741       AB_DPRINTF("val %016lx\n", tmp);
1742
1743       if (tmp == 0xFFFFFFFFFFFFFFFFULL)
1744          break;
1745    }
1746
1747    AB_DPRINTF("Registered %d iargs values\n", i);
1748    nb_iargs = i;
1749 }
1750
1751 static unsigned long * vsxargs = NULL;
1752 unsigned long nb_vargs;
1753
1754 #define MAX_VSX_ARRAY_SIZE 42
1755
1756 static void build_vsx_table (void)
1757 {
1758    long i = 0;
1759    // A VSX register is 128-bits wide.
1760    // We build contents here using pairs of 64-bit longs.
1761    // Permutes work against two (non-paired) VSX regs, so these are
1762    //  also grouped by twos.
1763    vsxargs = memalign(16, MAX_VSX_ARRAY_SIZE * sizeof(unsigned long));
1764 #ifdef EXHAUSTIVE_TESTS
1765    vsxargs[i++] = 0x0000000000000000UL; vsxargs[i++] = 0x0000000000000000UL;
1766    vsxargs[i++] = 0x0102030405060708UL; vsxargs[i++] = 0x0102010201020102UL;
1767
1768    vsxargs[i++] = 0xaaaaaaaaaaaaaaaaUL; vsxargs[i++] = 0xaaaaaaaaaaaaaaaaUL;
1769    vsxargs[i++] = 0x5555555555555555UL; vsxargs[i++] = 0x5555555555555555UL;
1770
1771    vsxargs[i++] = 0x08090a0b0c0d0e0fUL; vsxargs[i++] = 0x0102010201020102UL;
1772    vsxargs[i++] = 0xf0f1f2f3f4f5f6f7UL; vsxargs[i++] = 0xf8f9fafbfcfdfeffUL;
1773
1774    vsxargs[i++] = 0x7ea1a5a7abadb0baUL; vsxargs[i++] = 0x070d111d1e555e70UL;
1775    vsxargs[i++] = 0xe5e7ecedeff0f1faUL; vsxargs[i++] = 0xbeb1c0caced0dbdeUL;
1776
1777    vsxargs[i++] = 0x00115e7eadbabec0UL; vsxargs[i++] = 0xced0deede5ecef00UL;
1778    vsxargs[i++] = 0x00111e7ea5abadb1UL; vsxargs[i++] = 0xbecad0deedeffe00UL;
1779
1780    vsxargs[i++] = 0x0011223344556677UL; vsxargs[i++] = 0x8899aabbccddeeffUL;
1781    vsxargs[i++] = 0xf0e0d0c0b0a09080UL; vsxargs[i++] = 0x7060504030201000UL;
1782 #else
1783    vsxargs[i++] = 0x0000000000000000UL; vsxargs[i++] = 0x0000000000000000UL;
1784    vsxargs[i++] = 0x0102030405060708UL; vsxargs[i++] = 0x0102010201020102UL;
1785
1786    vsxargs[i++] = 0x0011223344556677UL; vsxargs[i++] = 0x8899aabbccddeeffUL;
1787    vsxargs[i++] = 0xf0e0d0c0b0a09080UL; vsxargs[i++] = 0x7060504030201000UL;
1788 #endif
1789
1790    // these next three groups are specific for vector rotate tests.
1791    //  bits 11:15,19:23,27:31 of each 32-bit word contain mb,me,sh values.
1792    vsxargs[i++] = 0x0000100000001002ULL; vsxargs[i++] = 0x0000100800001010ULL;
1793    vsxargs[i++] = 0x0010100000101002ULL; vsxargs[i++] = 0x0010100800101010ULL;
1794
1795    // vector rotate special...
1796    vsxargs[i++] = 0x00001c0000001c02ULL; vsxargs[i++] = 0x00001c0800001c10ULL;
1797    vsxargs[i++] = 0x00101c0000101c02ULL; vsxargs[i++] = 0x00101c0800101c10ULL;
1798
1799    // vector rotate special...
1800    vsxargs[i++] = 0x00001f0000001f02ULL; vsxargs[i++] = 0x00001f0800001f10ULL;
1801    vsxargs[i++] = 0x00101f0000101f02ULL; vsxargs[i++] = 0x00101f0800101f10ULL;
1802
1803    AB_DPRINTF("Registered %d vargs values\n", i/2);
1804    nb_vargs = i;
1805 }
1806
1807 /* VPCV = Vector Permute Control Vector */
1808 unsigned long nb_vpcv;
1809 static unsigned long * vpcv = NULL;
1810
1811 #define MAX_VPCV_SIZE 20
1812
1813 static void build_vector_permute_table(void)
1814 {
1815    int i=0;
1816
1817    vpcv = memalign(16, MAX_VPCV_SIZE * sizeof(unsigned long));
1818
1819 #ifdef EXHAUSTIVE_TESTS
1820    /* These two lines are complementary pairs of each other. */
1821    vpcv[i++]=0x12021a0817141317ULL; vpcv[i++]=0x100d1b05070f0205ULL;
1822    vpcv[i++]=0x0d1d0517080b0c08ULL; vpcv[i++]=0x0f12041a18101d1cULL;
1823    vpcv[i++]=0x100d1b070f020505ULL; vpcv[i++]=0x0e201f1400130105ULL;
1824    vpcv[i++]=0x0705030a0b01ea0cULL; vpcv[i++]=0x0e0c09010602080dULL;
1825 #else
1826    vpcv[i++]=0x12021a0817141317ULL; vpcv[i++]=0x100d1b05070f0205ULL;
1827    vpcv[i++]=0x0705030a0b01ea0cULL; vpcv[i++]=0x0e0c09010602080dULL;
1828 #endif
1829    nb_vpcv=i;
1830    AB_DPRINTF("Registered %d permute control vectors \n", nb_vpcv);
1831
1832    if (i >= MAX_VPCV_SIZE)
1833       printf("Warning! Exceeded size of table building the vector permute control . \n");
1834 }
1835
1836 /* Decimal Encodings...
1837  * Packed, National, Zoned decimal content follows.
1838  * Note: Watch the conversions in and out of the
1839  *       dwords / vectors for reverses with respect to
1840  *       top/bottom low/high
1841  */
1842
1843 /* Packed Decimals:
1844  * A valid encoding of a packed decimal integer value requires the following
1845  * properties:
1846  *   – Each of the 31 4-bit digits of the operand’s magnitude (bits 0:123)
1847  *     must be in the range 0-9.
1848  *   – The sign code (bits 124:127) must be in the range 10-15. (0xa-0xf).
1849  * Source operands with sign codes of 0b1010, 0b1100, 0b1110, and 0b1111 are
1850  * interpreted as positive values.  Source operands with sign codes of
1851  * 0b1011 and 0b1101 are interpreted as negative values.
1852  * Positive and zero results are encoded with a either sign code of
1853  * 0b1100 or 0b1111, depending on the preferred sign (indicated as an
1854  * immediate operand).  Negative results are encoded with a sign code
1855  * of 0b1101.
1856  * PS - This is the 'preferred sign' bit encoded in some BCD associated
1857  * instructions.
1858  */
1859
1860 // Note: table content is limited to values encoded, not interpreted.
1861 unsigned int packed_decimal_sign_codes[] = {
1862    /* positive operands */
1863    0xc, 0xf,  // 0b1100, 0b1111
1864
1865    /* negative operands */
1866    0xd  // 0b1101
1867 };
1868
1869 #define NR_PACKED_DECIMAL_SIGNS 3
1870 #define MAX_PACKED_DECIMAL_TABLE_SIZE 8 * 16 * 2 + 20
1871
1872 static unsigned long * packed_decimal_table;
1873
1874 /* build into a pair of doubles */
1875 unsigned long nb_packed_decimal_entries;
1876
1877 static void dissect_packed_decimal_sign(unsigned long local_sign) {
1878   switch(local_sign) {
1879      case 0xa: /*0b1010:*/ printf("[ + ]"); break;
1880      case 0xb: /*0b1011:*/ printf("[ - ]"); break;
1881      case 0xc: /*0b1100:*/ printf("(+|0)"); break;
1882      case 0xd: /*0b1101:*/ printf("( - )"); break;
1883      case 0xe: /*0b1110:*/ printf("[ + ]"); break;
1884      case 0xf: /*0b1111:*/ printf("(+|0)"); break;
1885      default: printf("(?%02lx)", local_sign);
1886   }
1887 }
1888
1889 int extract_packed_decimal_sign(unsigned long dword1, unsigned long dword0) {
1890    return  (dword1 & 0xf);
1891 }
1892
1893 static void dissect_packed_decimal(unsigned long dword1,unsigned long dword0)
1894 {
1895    int i;
1896    int local_sign;
1897    int nibble;
1898
1899    local_sign = extract_packed_decimal_sign(dword1, dword0);
1900    printf("packed_decimal: [");
1901
1902    for (i = 60; i >= 0; i -= 4) {
1903       nibble=(dword1 >> (i)) & 0xf;
1904       printf(" %x", nibble);
1905    }
1906
1907    for (i = 60; i >= 0; i -= 4) {
1908       nibble=(dword0 >> (i)) & 0xf;
1909       printf(" %x", nibble);
1910    }
1911
1912    printf(" ");
1913    dissect_packed_decimal_sign(local_sign);
1914    printf(" ] ");
1915 }
1916
1917 static void build_packed_decimal_table(void)
1918 {
1919    long sign_index;
1920    long sign_value;
1921    unsigned long i = 0;
1922    unsigned long value;
1923  #ifdef EXHAUSTIVE_TESTS
1924    int scramble;
1925 #endif
1926
1927    if (verbose) printf("%s\n", __FUNCTION__);
1928
1929    packed_decimal_table = malloc((MAX_PACKED_DECIMAL_TABLE_SIZE + 2)
1930                                  * sizeof (unsigned long));
1931
1932    for (sign_index = 0; sign_index < NR_PACKED_DECIMAL_SIGNS; sign_index++) {
1933       sign_value = packed_decimal_sign_codes[sign_index];
1934
1935       for (value = 0; value <= 9; value++) {
1936         packed_decimal_table[i]    = 0x1111111111111111 * value;
1937         packed_decimal_table[i+1]  = sign_value;
1938         packed_decimal_table[i+1] += 0x1111111111111110 * value;
1939
1940         if (verbose>3) dissect_packed_decimal(packed_decimal_table[i+1],
1941                                               packed_decimal_table[i]);
1942         if (verbose>3) printf("\n");
1943         i+=2;
1944       }
1945
1946 #ifdef EXHAUSTIVE_TESTS
1947       for (scramble = 1; scramble <= 4; scramble++) {
1948         packed_decimal_table[i]    = 0x3210321032103210 * scramble;
1949         packed_decimal_table[i+1]  = sign_value;
1950         packed_decimal_table[i+1] += 0x0123012301230120 * scramble;
1951
1952         if (verbose>3) dissect_packed_decimal(packed_decimal_table[i+1],
1953                                               packed_decimal_table[i]);
1954         if (verbose>3) printf("\n");
1955         i+=2;
1956       }
1957 #endif
1958
1959       /* Add some entries that will provide interesting output from
1960        * the convert TO tests.
1961        */
1962       packed_decimal_table[i]    = 0x0000000000000000;
1963       packed_decimal_table[i+1]  = sign_value;
1964       packed_decimal_table[i+1] += 0x0000000012345670;
1965
1966       if (verbose > 3) dissect_packed_decimal(packed_decimal_table[i+1],
1967                                               packed_decimal_table[i]);
1968
1969       if (verbose>3) printf("\n");
1970
1971       i += 2;
1972
1973 #ifdef EXHAUSTIVE_TESTS
1974       packed_decimal_table[i]    = 0x0000000000000000;
1975       packed_decimal_table[i+1]  = sign_value;
1976       packed_decimal_table[i+1] += 0x0000000098765430;
1977
1978       if (verbose > 3) dissect_packed_decimal(packed_decimal_table[i+1],
1979                                               packed_decimal_table[i]);
1980
1981       if (verbose > 3) printf("\n");
1982
1983       i += 2;
1984
1985       packed_decimal_table[i]    = 0x000000000000000b;
1986       packed_decimal_table[i+1]  = sign_value;
1987       packed_decimal_table[i+1] += 0x0000000000000000;
1988
1989       if (verbose > 3) dissect_packed_decimal(packed_decimal_table[i+1],
1990                                               packed_decimal_table[i]);
1991
1992       if (verbose>3) printf("\n");
1993
1994       i += 2;
1995 #endif
1996
1997       packed_decimal_table[i]    = 0x0030000000000000;
1998       packed_decimal_table[i+1]  = sign_value;
1999       packed_decimal_table[i+1] += 0x0000000000000000;
2000
2001       if (verbose > 3) dissect_packed_decimal(packed_decimal_table[i+1],
2002                                             packed_decimal_table[i]);
2003
2004       if (verbose > 3) printf("\n");
2005
2006       i += 2;
2007    }
2008
2009    if (verbose>2) printf("\n");
2010
2011    nb_packed_decimal_entries = i;
2012 }
2013
2014 static void dump_packed_decimal_table(void) {
2015    int i;
2016
2017    printf("packed_decimal_table:\n");
2018
2019    for (i = 0; i < nb_packed_decimal_entries; i += 2) {
2020       printf("i =: %2d ", i);
2021       dissect_packed_decimal(packed_decimal_table[i+1],
2022                              packed_decimal_table[i]);
2023       printf("\n");
2024    }
2025 }
2026
2027 /* National decimals:
2028  * A valid encoding of a national decimal value requires the following.
2029  * – The contents of halfword 7 (sign code) must be
2030  *   either 0x002B or 0x002D.
2031  * – The contents of halfwords 0 to 6 must be in the
2032  *   range 0x0030 to 0x0039.
2033  * National decimal values having a sign code of 0x002B
2034  * are interpreted as positive values.
2035  * National decimal values having a sign code of 0x002D
2036  * are interpreted as negative values.
2037  */
2038 unsigned int national_decimal_sign_codes[] = {
2039    /* positive */  0x002b,
2040    /* negative */  0x002d
2041 };
2042
2043 #define NR_NATIONAL_DECIMAL_SIGNS 2
2044
2045 unsigned int national_decimal_values[] = {
2046 #ifdef EXHAUSTIVE_TESTS
2047    0x0030, 0x0031, 0x0032, 0x0033, 0x0034,
2048    0x0035, 0x0036, 0x0037, 0x0038, 0x0039
2049 #else
2050    0x0030, 0x0031,
2051    0x0035, 0x0039
2052 #endif
2053 };
2054
2055 #define NR_NATIONAL_DECIMAL_VALUES (sizeof(national_decimal_values) / sizeof(unsigned int))
2056
2057 static unsigned long * national_decimal_table;
2058
2059 #define MAX_NATIONAL_DECIMAL_TABLE_SIZE 10 * NR_NATIONAL_DECIMAL_VALUES * NR_NATIONAL_DECIMAL_SIGNS
2060
2061 unsigned long nb_national_decimal_entries;
2062
2063 static void dissect_national_decimal_sign(unsigned long local_sign) {
2064    switch(local_sign) {
2065       case 0x002b:
2066             printf("( + )");
2067             break;
2068
2069       case 0x002d:
2070             printf("( - )");
2071             break;
2072
2073      default: printf("unhandled sign value: %lx", local_sign);
2074    }
2075 }
2076
2077 int extract_national_decimal_sign(unsigned long dword1, unsigned long dword0) {
2078    return (dword1 & 0x0ff);
2079 }
2080
2081 static void dissect_national_decimal(unsigned long dword1,
2082                                      unsigned long dword0)
2083 {
2084    int i;
2085    int local_sign;
2086    long hword;
2087
2088    printf("national_decimal: [");
2089
2090    if (verbose>4) printf("raw: [%016lx %016lx] ", dword1, dword0);
2091
2092    for (i = 48;i >= 0; i -= 16) {
2093       hword = dword1 >> (i) & 0x00ff;
2094
2095       /* validity of national decimal value */
2096       /* the i>0 clause skips the validity check against the sign value. */
2097       if (((i > 0) && (hword < 0x30)) || (hword > 0x39)) printf("!");
2098
2099       printf("%04lx ", hword);
2100    }
2101
2102    for (i = 48; i >= 0; i -= 16) {
2103       hword = dword0 >> (i) & 0x00ff;
2104
2105       if ((hword < 0x30) || (hword > 0x39)) printf("!");
2106
2107       printf("%04lx ", hword);
2108    }
2109
2110    local_sign = extract_national_decimal_sign(dword1, dword0);
2111    dissect_national_decimal_sign(local_sign);
2112    printf(" ] ");
2113 }
2114
2115 static void build_national_decimal_table(void)
2116 {
2117    long sign_index;
2118    long sign_value;
2119    unsigned long i = 0;
2120    int index;
2121    unsigned long value;
2122
2123    if (verbose) printf("%s\n",__FUNCTION__);
2124    national_decimal_table = malloc(MAX_NATIONAL_DECIMAL_TABLE_SIZE
2125                                    * sizeof (unsigned long));
2126
2127    for (sign_index = 0; sign_index < NR_NATIONAL_DECIMAL_SIGNS; sign_index++) {
2128       sign_value = national_decimal_sign_codes[sign_index];
2129
2130       for (index = 0; index < NR_NATIONAL_DECIMAL_VALUES; index++) {
2131          value = national_decimal_values[index];
2132
2133          national_decimal_table[i]    = 0x0001000100010001 * value;
2134          national_decimal_table[i+1]  = 0x0001000100010000 * value;
2135          national_decimal_table[i+1] += sign_value ;
2136
2137          if (verbose > 3) {
2138             dissect_national_decimal(national_decimal_table[i+1],
2139                                      national_decimal_table[i]);
2140             printf("\n");
2141          }
2142          i += 2;
2143       }
2144 #ifdef EXHAUSTIVE_TESTS
2145       { /* a few more for fun */
2146          national_decimal_table[i]    = 0x0031003200330034;
2147          national_decimal_table[i+1]  = 0x0035003600370000;
2148          national_decimal_table[i+1] += sign_value ;
2149
2150          if (verbose > 3) {
2151             dissect_national_decimal(national_decimal_table[i+1],
2152                                      national_decimal_table[i]);
2153             printf("\n");
2154          }
2155
2156          i += 2;
2157          national_decimal_table[i]    = 0x0031003200330034;
2158          national_decimal_table[i+1]  = 0x0035003600370000;
2159          national_decimal_table[i+1] += sign_value ;
2160
2161          if (verbose > 3) {
2162             dissect_national_decimal(national_decimal_table[i+1],
2163                                      national_decimal_table[i]);
2164             printf("\n");
2165          }
2166          i += 2;
2167       }
2168 #endif
2169    }
2170
2171    if (verbose > 2) printf("\n");
2172
2173    nb_national_decimal_entries = i;
2174 }
2175
2176 static void dump_national_decimal_table(void) {
2177    int i;
2178
2179    printf("national_decimal_table:\n");
2180
2181    for (i = 0; i < nb_national_decimal_entries; i += 2) {
2182       printf("#%2d ", i);
2183       dissect_national_decimal(national_decimal_table[i+1],
2184                                national_decimal_table[i]);
2185       printf("\n");
2186    }
2187 }
2188
2189
2190 /* Zoned Decimals:
2191  *
2192  * When PS=0, do the following.
2193  *  A valid encoding of a zoned decimal value requires the following.
2194  *  – The contents of bits 0:3 of byte 15 (sign code) can be any
2195  *    value in the range 0x0 to 0xF.
2196  *  – The contents of bits 0:3 of bytes 0 to 14 (zone) must
2197  *    be the value 0x3.
2198  *  – The contents of bits 4:7 of bytes 0 to 15 must
2199  *    be a value in the range 0x0 to 0x9.
2200  *  Zoned decimal values having a sign code of 0x0, 0x1, 0x2, 0x3,
2201  *  0x8, 0x9, 0xA, or 0xB are interpreted as positive values.
2202  *  Zoned decimal values having a sign code of 0x4, 0x5, 0x6, 0x7,
2203  *  0xC, 0xD, 0xE, or 0xF are interpreted as negative values.
2204     :: 0,1,2,3,        8,9,a,b,         are interpreted as positive.
2205     ::         4,5,6,7,        c,d,e,f  are interpreted as negative.
2206  * When PS=1, do the following.
2207  *  A valid encoding of a zoned decimal source operand requires the following.
2208  *  – The contents of bits 0:3 of byte 15 (sign code) must be a value in the
2209  *    range 0xA to 0xF.
2210  *  – The contents of bits 0:3 of bytes 0 to 14 (zone) must be the value 0xF.
2211  *  – The contents of bits 4:7 of bytes 0 to 15 must be a value in the
2212  *    range 0x0 to 0x9.
2213  *  Zoned decimal source operands having a sign code of 0xA, 0xC, 0xE,
2214  *  or 0xF are interpreted as positive values.
2215  *  Zoned decimal source operands having a sign code of 0xB or 0xD are
2216  *  interpreted as negative values.
2217     ::                     a,  c,  e,f  are interpreted as positive.
2218     ::                       b,  d,     are interpreted as negative.
2219  */
2220
2221 /* a valid sign is anything in range 0-9,a-f,
2222  * For coverage that does not overwhelm, we have chosen to use  0,1,4,a,b,f. */
2223 #define NM_ZONED_DECIMAL_SIGNS 6
2224 #define NM_ZONED_VALUES 5   /* 0,2,4,6,9 */
2225 #define NM_PS_VALUES 2      /* 0,1 */
2226 #define NM_ZONED_ADDITIONAL_PATTERNS 4
2227 #define MAX_ZONED_DECIMAL_TABLE_SIZE  NM_ZONED_DECIMAL_SIGNS * NM_ZONED_VALUES * NM_ZONED_ADDITIONAL_PATTERNS * NM_PS_VALUES + 10
2228
2229 static unsigned long zoned_decimal_table_[MAX_ZONED_DECIMAL_TABLE_SIZE];
2230 static unsigned long * zoned_decimal_table;
2231 unsigned long nb_zoned_decimal_entries;
2232
2233 static void dissect_zoned_decimal_sign(unsigned long local_sign, int ps) {
2234    if (ps == 0) {
2235       switch(local_sign) {
2236          case 0x0: case 0x1: case 0x2: case 0x3:
2237          case 0x8: case 0x9: case 0xa: case 0xb:
2238             printf("( + )");
2239             break;
2240
2241          case 0x4: case 0x5: case 0x6: case 0x7:
2242          case 0xc: case 0xd: case 0xe: case 0xf:
2243             printf("( - )");
2244             break;
2245          default: printf("zoned decimal (ps=%d). Unhandled sign value: %lx",
2246                          ps, local_sign);
2247       }
2248    }
2249
2250    if (ps == 1) {
2251       switch(local_sign) {
2252          case 0xa: case 0xc: case 0xe: case 0xf:
2253             printf("( + )");
2254             break;
2255
2256          case 0xb: case 0xd:
2257             printf("( - )");
2258             break;
2259
2260          default: printf("zoned decimal (ps=%d). Unhandled sign value: %lx",
2261                          ps, local_sign);
2262       }
2263    }
2264 }
2265
2266 /* Valid byte values within a zoned decimal are in the ranges of
2267  * 0x30..0x39 when PS==0, or 0xf0..0xff when PS==1.
2268  */
2269 static void check_zoned_byte_validity(int byte, int ps) {
2270    if (ps == 0) {
2271       /* check the zone */
2272       if (((byte & 0x30) != 0x30))
2273          printf("!=30");
2274
2275    } else { /* ps==1 */
2276       if (((byte & 0xf0) != 0xf0))
2277          printf("%x !=f0 ", byte );
2278    }
2279
2280    /* check the numeric value */
2281    if ((byte & 0x0f) > 0x9)
2282       printf("!(0..9)");
2283 }
2284
2285 int extract_zoned_decimal_sign(unsigned long dword1, unsigned long dword0) {
2286    return ((dword1 & 0xf0) >> 4);
2287 }
2288
2289 static void dissect_zoned_decimal(unsigned long dword1, unsigned long dword0,
2290                                   int ps)
2291 {
2292    int i;
2293    int local_sign;
2294    int byte;
2295
2296    printf("zoned_decimal: [");
2297
2298    for (i = 56; i >= 0; i -= 8) {
2299       byte = (dword1 >> (i)) & 0xff;
2300       check_zoned_byte_validity(byte, ps);
2301       printf(" %02x", byte);
2302    }
2303
2304    for (i = 56; i >= 0; i -= 8) {
2305       byte = (dword0 >> (i)) & 0x00ff;
2306       check_zoned_byte_validity(byte, ps);
2307
2308       if ((byte & 0xf) > 0x9) printf(" !(>9)");
2309       printf(" %02x", byte);
2310    }
2311
2312    local_sign = extract_zoned_decimal_sign(dword1, dword0);
2313    dissect_zoned_decimal_sign(local_sign, ps);
2314    printf(" ]");
2315 }
2316
2317 #ifdef EXHAUSTIVE_TESTS
2318 // Randomly chosen exhaustive coverage for k includes values: 0,2,4,7,9
2319 # define SELECTIVE_INCREMENT_ZONED(k) \
2320    if (k == 7) k = 9;                    \
2321       else if (k == 4) k = 7;            \
2322          else if (k == 2) k = 4;         \
2323             else if (k == 0) k = 2;      \
2324                else k++;
2325 // Randomly chosen exhaustive coverage for signs includes values: 0,1,4,a,b,f
2326 # define SELECTIVE_INCREMENT_SIGNS(signs)              \
2327          if (signs == 0x0) signs = 0x1;                   \
2328          else if (signs == 0x1) signs = 0x4;              \
2329             else if (signs == 0x4) signs = 0xa;           \
2330                else if (signs == 0xa) signs = 0xb;        \
2331                   else if (signs == 0xb) signs = 0xf;     \
2332                      else signs++;
2333 #else
2334 // Randomly chosen coverage for k includes values: 0,7,9
2335 # define SELECTIVE_INCREMENT_ZONED(k) \
2336    if (k == 7) k = 9;                 \
2337       else if (k == 0) k = 7;      \
2338          else k++;
2339 // Randomly chosen coverage for signs includes values: 0,4,b,f
2340 # define SELECTIVE_INCREMENT_SIGNS(signs)                  \
2341       if (signs == 0x0) signs = 0x4;                      \
2342             else if (signs == 0x4) signs = 0xb;           \
2343                   else if (signs == 0xb) signs = 0xf;     \
2344                      else signs++;
2345 #endif
2346
2347
2348 static void build_zoned_decimal_table(void)
2349 {
2350    unsigned long signs;
2351    unsigned long i;
2352    int k;
2353    int ps;
2354    int signs_start,signs_end;
2355
2356    if (verbose) printf("%s\n", __FUNCTION__);
2357
2358    zoned_decimal_table = zoned_decimal_table_;
2359    i = 0;
2360
2361    for (ps = 0; ps <= 1; ps++) {
2362       if (ps == 0) {
2363          signs_start = 0;
2364          signs_end   = 0xf;
2365
2366       } else {
2367          signs_start = 0xa;
2368          signs_end   = 0xf;
2369       }
2370
2371       for (signs = signs_start;
2372            signs <= signs_end;  /* signs selectively updated below */) {
2373
2374          if (verbose > 2) printf("ps=%d sign:%lx\n", ps, signs);
2375
2376          for (k = 0 ; k < 9;  /* k selectively updated below */) {
2377             if (ps == 0) {
2378                zoned_decimal_table[i]   = 0x3030303030303030;  // set bits 0:3 of bytes 0..7.
2379                zoned_decimal_table[i+1] = 0x3030303030303000;  // bits 0:3 of bytes 8..14 must be 0x3
2380
2381             } else {
2382                zoned_decimal_table[i]   = 0xf0f0f0f0f0f0f0f0;  // set bits 0:3 of bytes 0..7.
2383                zoned_decimal_table[i+1] = 0xf0f0f0f0f0f0f000;  // bits 0:3 of bytes 8..14 must be 0x3
2384             }
2385
2386             zoned_decimal_table[i]   += 0x010101010101010 * k; // set bits 4..7 of bytes 0..7.
2387             zoned_decimal_table[i+1] += 0x010101010101000 * k; // bits 4:7 of bytes 8..15 must be 0..9.
2388             zoned_decimal_table[i+1] += (signs << 4); // bits 0:3 of byte 15 is the sign.
2389             if (verbose > 3) {
2390                dissect_zoned_decimal(zoned_decimal_table[i+1],
2391                                      zoned_decimal_table[i], ps);
2392                printf("\n");
2393             }
2394             i += 2;
2395             SELECTIVE_INCREMENT_ZONED(k)
2396          }
2397
2398          /* add a few more patterns outside of the k patterns. */
2399          if (ps == 0) {
2400             zoned_decimal_table[i]   = 0x3030303030303030;
2401             zoned_decimal_table[i+1] = 0x3030303030303000;
2402
2403          } else  {
2404             zoned_decimal_table[i]   = 0xf0f0f0f0f0f0f0f0;
2405             zoned_decimal_table[i+1] = 0xf0f0f0f0f0f0f000;
2406          }
2407
2408          zoned_decimal_table[i]      += 0x0908070605040302;
2409          zoned_decimal_table[i+1]    += 0x0102030405060700;
2410          zoned_decimal_table[i+1]    += (signs<<4); // bits 0:3 of byte 15.
2411
2412          if (verbose > 3) {
2413             dissect_zoned_decimal(zoned_decimal_table[i+1],
2414                                   zoned_decimal_table[i], ps);
2415             printf("\n");
2416          }
2417
2418          i += 2;
2419          SELECTIVE_INCREMENT_SIGNS(signs)
2420       } /* signs loop */
2421    } /* ps loop */
2422
2423    nb_zoned_decimal_entries = i;
2424 }
2425
2426 static void dump_zoned_decimal_table(void) {
2427    int i;
2428    int ps;
2429
2430    for (ps = 0; ps <= 1; ps++) {
2431       printf("zoned_decimal_table ps=%d:\n", ps);
2432
2433       for (i = 0; i < nb_zoned_decimal_entries; i += 2) {
2434          printf("#%2d ", i);
2435          dissect_zoned_decimal(zoned_decimal_table[i+1],
2436                                zoned_decimal_table[i], ps);
2437          printf("\n");
2438       }
2439    }
2440 }
2441
2442 /* Build table containing shift and truncate values */
2443 #define MAX_DECIMAL_SHIFT_TABLE_SIZE 64
2444
2445 static unsigned long * decimal_shift_table;
2446 unsigned long nb_decimal_shift_entries;
2447
2448 static void build_decimal_shift_table(void) {
2449    unsigned long i = 0;
2450    unsigned long value;
2451
2452    if (verbose) printf("%s\n",__FUNCTION__);
2453
2454    decimal_shift_table = malloc(MAX_DECIMAL_SHIFT_TABLE_SIZE
2455                                 * sizeof (unsigned long));
2456
2457    for (value = 0; value <= 31; value++) {
2458         decimal_shift_table[i]   = value;
2459         decimal_shift_table[i+1] = 0;
2460         i += 2;
2461    }
2462
2463    if (verbose>2) printf("\n");
2464
2465    nb_decimal_shift_entries = i;
2466 }
2467
2468 static void dump_decimal_shift_table(void) {
2469    int i;
2470
2471    printf("decimal_shift_table:\n");
2472
2473    for (i = 0; i < nb_decimal_shift_entries; i += 2) {
2474       printf("i=:%2d ", i);
2475       printf(" 0x%2lx 0x%2lx ", decimal_shift_table[i],
2476              decimal_shift_table[i+1]);
2477       printf("\n");
2478    }
2479 }