2 /*---------------------------------------------------------------*/
3 /*--- begin host_ppc_defs.c ---*/
4 /*---------------------------------------------------------------*/
7 This file is part of Valgrind, a dynamic binary instrumentation
10 Copyright (C) 2004-2017 OpenWorks LLP
13 This program is free software; you can redistribute it and/or
14 modify it under the terms of the GNU General Public License as
15 published by the Free Software Foundation; either version 2 of the
16 License, or (at your option) any later version.
18 This program is distributed in the hope that it will be useful, but
19 WITHOUT ANY WARRANTY; without even the implied warranty of
20 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
21 General Public License for more details.
23 You should have received a copy of the GNU General Public License
24 along with this program; if not, see <http://www.gnu.org/licenses/>.
26 The GNU General Public License is contained in the file COPYING.
28 Neither the names of the U.S. Department of Energy nor the
29 University of California nor the names of its contributors may be
30 used to endorse or promote products derived from this software
31 without prior written permission.
34 #include "libvex_basictypes.h"
36 #include "libvex_trc_values.h"
38 #include "main_util.h"
39 #include "host_generic_regs.h"
40 #include "host_ppc_defs.h"
43 /* --------- Registers. --------- */
45 const RRegUniverse
* getRRegUniverse_PPC ( Bool mode64
)
47 /* The real-register universe is a big constant, so we just want to
48 initialise it once. rRegUniverse_PPC_initted values: 0=not initted,
49 1=initted for 32-bit-mode, 2=initted for 64-bit-mode */
50 static RRegUniverse rRegUniverse_PPC
;
51 static UInt rRegUniverse_PPC_initted
= 0;
53 /* Handy shorthand, nothing more */
54 RRegUniverse
* ru
= &rRegUniverse_PPC
;
56 /* This isn't thread-safe. Sigh. */
57 UInt howNeeded
= mode64
? 2 : 1;
58 if (LIKELY(rRegUniverse_PPC_initted
== howNeeded
))
61 RRegUniverse__init(ru
);
63 /* Add the registers. The initial segment of this array must be
64 those available for allocation by reg-alloc, and those that
65 follow are not available for allocation. */
66 // GPR0 = scratch reg where poss. - some ops interpret as value zero
67 // GPR1 = stack pointer
69 ru
->allocable_start
[(mode64
) ? HRcInt64
: HRcInt32
] = ru
->size
;
70 // GPR14 and above are callee save. List them first.
71 ru
->regs
[ru
->size
++] = hregPPC_GPR14(mode64
);
72 ru
->regs
[ru
->size
++] = hregPPC_GPR15(mode64
);
73 ru
->regs
[ru
->size
++] = hregPPC_GPR16(mode64
);
74 ru
->regs
[ru
->size
++] = hregPPC_GPR17(mode64
);
75 ru
->regs
[ru
->size
++] = hregPPC_GPR18(mode64
);
76 ru
->regs
[ru
->size
++] = hregPPC_GPR19(mode64
);
77 ru
->regs
[ru
->size
++] = hregPPC_GPR20(mode64
);
78 ru
->regs
[ru
->size
++] = hregPPC_GPR21(mode64
);
79 ru
->regs
[ru
->size
++] = hregPPC_GPR22(mode64
);
80 ru
->regs
[ru
->size
++] = hregPPC_GPR23(mode64
);
81 ru
->regs
[ru
->size
++] = hregPPC_GPR24(mode64
);
82 ru
->regs
[ru
->size
++] = hregPPC_GPR25(mode64
);
83 ru
->regs
[ru
->size
++] = hregPPC_GPR26(mode64
);
84 ru
->regs
[ru
->size
++] = hregPPC_GPR27(mode64
);
85 ru
->regs
[ru
->size
++] = hregPPC_GPR28(mode64
);
87 // Caller save registers now.
88 ru
->regs
[ru
->size
++] = hregPPC_GPR3(mode64
);
89 ru
->regs
[ru
->size
++] = hregPPC_GPR4(mode64
);
90 ru
->regs
[ru
->size
++] = hregPPC_GPR5(mode64
);
91 ru
->regs
[ru
->size
++] = hregPPC_GPR6(mode64
);
92 ru
->regs
[ru
->size
++] = hregPPC_GPR7(mode64
);
93 ru
->regs
[ru
->size
++] = hregPPC_GPR8(mode64
);
94 ru
->regs
[ru
->size
++] = hregPPC_GPR9(mode64
);
95 ru
->regs
[ru
->size
++] = hregPPC_GPR10(mode64
);
98 r11 used for calls by ptr / env ptr for some langs
99 r12 used for exception handling and global linkage code */
100 ru
->regs
[ru
->size
++] = hregPPC_GPR11(mode64
);
101 ru
->regs
[ru
->size
++] = hregPPC_GPR12(mode64
);
103 // GPR13 = thread specific pointer
104 ru
->allocable_end
[(mode64
) ? HRcInt64
: HRcInt32
] = ru
->size
- 1;
105 // GPR29 is reserved for the dispatcher
106 // GPR30 is reserved as AltiVec spill reg temporary
107 // GPR31 is reserved for the GuestStatePtr
109 /* Don't waste the reg-allocs's time trawling through zillions of
110 FP registers - they mostly will never be used. We'll tolerate
111 the occasional extra spill instead. */
112 /* For both ppc32-linux and ppc64-linux, f14-f31 are callee save.
114 ru
->allocable_start
[HRcFlt64
] = ru
->size
;
115 ru
->regs
[ru
->size
++] = hregPPC_FPR14(mode64
);
116 ru
->regs
[ru
->size
++] = hregPPC_FPR15(mode64
);
117 ru
->regs
[ru
->size
++] = hregPPC_FPR16(mode64
);
118 ru
->regs
[ru
->size
++] = hregPPC_FPR17(mode64
);
119 ru
->regs
[ru
->size
++] = hregPPC_FPR18(mode64
);
120 ru
->regs
[ru
->size
++] = hregPPC_FPR19(mode64
);
121 ru
->regs
[ru
->size
++] = hregPPC_FPR20(mode64
);
122 ru
->regs
[ru
->size
++] = hregPPC_FPR21(mode64
);
123 ru
->allocable_end
[HRcFlt64
] = ru
->size
- 1;
125 /* Same deal re Altivec */
126 /* For both ppc32-linux and ppc64-linux, v20-v31 are callee save.
128 /* NB, vr29 is used as a scratch temporary -- do not allocate */
129 ru
->allocable_start
[HRcVec128
] = ru
->size
;
130 ru
->regs
[ru
->size
++] = hregPPC_VR20(mode64
);
131 ru
->regs
[ru
->size
++] = hregPPC_VR21(mode64
);
132 ru
->regs
[ru
->size
++] = hregPPC_VR22(mode64
);
133 ru
->regs
[ru
->size
++] = hregPPC_VR23(mode64
);
134 ru
->regs
[ru
->size
++] = hregPPC_VR24(mode64
);
135 ru
->regs
[ru
->size
++] = hregPPC_VR25(mode64
);
136 ru
->regs
[ru
->size
++] = hregPPC_VR26(mode64
);
137 ru
->regs
[ru
->size
++] = hregPPC_VR27(mode64
);
138 ru
->allocable_end
[HRcVec128
] = ru
->size
- 1;
139 ru
->allocable
= ru
->size
;
141 /* And other regs, not available to the allocator. */
142 ru
->regs
[ru
->size
++] = hregPPC_GPR1(mode64
);
143 ru
->regs
[ru
->size
++] = hregPPC_GPR29(mode64
);
144 ru
->regs
[ru
->size
++] = hregPPC_GPR30(mode64
);
145 ru
->regs
[ru
->size
++] = hregPPC_GPR31(mode64
);
146 ru
->regs
[ru
->size
++] = hregPPC_VR29(mode64
);
148 rRegUniverse_PPC_initted
= howNeeded
;
150 RRegUniverse__check_is_sane(ru
);
155 UInt
ppHRegPPC ( HReg reg
)
158 static const HChar
* ireg32_names
[32]
159 = { "%r0", "%r1", "%r2", "%r3",
160 "%r4", "%r5", "%r6", "%r7",
161 "%r8", "%r9", "%r10", "%r11",
162 "%r12", "%r13", "%r14", "%r15",
163 "%r16", "%r17", "%r18", "%r19",
164 "%r20", "%r21", "%r22", "%r23",
165 "%r24", "%r25", "%r26", "%r27",
166 "%r28", "%r29", "%r30", "%r31" };
167 /* Be generic for all virtual regs. */
168 if (hregIsVirtual(reg
)) {
171 /* But specific for real regs. */
172 switch (hregClass(reg
)) {
174 r
= hregEncoding(reg
);
175 vassert(r
>= 0 && r
< 32);
176 return vex_printf("%s", ireg32_names
[r
]);
178 r
= hregEncoding(reg
);
179 vassert(r
>= 0 && r
< 32);
180 return vex_printf("%s", ireg32_names
[r
]);
182 r
= hregEncoding(reg
);
183 vassert(r
>= 0 && r
< 32);
184 return vex_printf("%%fr%d", r
);
186 r
= hregEncoding(reg
);
187 vassert(r
>= 0 && r
< 32);
188 return vex_printf("%%v%d", r
);
195 /* --------- Condition codes, Intel encoding. --------- */
197 const HChar
* showPPCCondCode ( PPCCondCode cond
)
199 if (cond
.test
== Pct_ALWAYS
) return "always";
203 return (cond
.test
== Pct_TRUE
) ? "cr7.so=1" : "cr7.so=0";
205 return (cond
.test
== Pct_TRUE
) ? "cr7.eq=1" : "cr7.eq=0";
207 return (cond
.test
== Pct_TRUE
) ? "cr7.gt=1" : "cr7.gt=0";
209 return (cond
.test
== Pct_TRUE
) ? "cr7.lt=1" : "cr7.lt=0";
212 default: vpanic("ppPPCCondCode");
216 /* construct condition code */
217 PPCCondCode
mk_PPCCondCode ( PPCCondTest test
, PPCCondFlag flag
)
222 if (test
== Pct_ALWAYS
) {
223 vassert(flag
== Pcf_NONE
);
225 vassert(flag
!= Pcf_NONE
);
230 /* false->true, true->false */
231 PPCCondTest
invertCondTest ( PPCCondTest ct
)
233 vassert(ct
!= Pct_ALWAYS
);
234 return (ct
== Pct_TRUE
) ? Pct_FALSE
: Pct_TRUE
;
238 /* --------- PPCAMode: memory address expressions. --------- */
240 PPCAMode
* PPCAMode_IR ( Int idx
, HReg base
) {
241 PPCAMode
* am
= LibVEX_Alloc_inline(sizeof(PPCAMode
));
242 vassert(idx
>= -0x8000 && idx
< 0x8000);
244 am
->Pam
.IR
.base
= base
;
245 am
->Pam
.IR
.index
= idx
;
248 PPCAMode
* PPCAMode_RR ( HReg idx
, HReg base
) {
249 PPCAMode
* am
= LibVEX_Alloc_inline(sizeof(PPCAMode
));
251 am
->Pam
.RR
.base
= base
;
252 am
->Pam
.RR
.index
= idx
;
256 PPCAMode
* dopyPPCAMode ( PPCAMode
* am
) {
259 return PPCAMode_IR( am
->Pam
.IR
.index
, am
->Pam
.IR
.base
);
261 return PPCAMode_RR( am
->Pam
.RR
.index
, am
->Pam
.RR
.base
);
263 vpanic("dopyPPCAMode");
267 void ppPPCAMode ( PPCAMode
* am
) {
270 if (am
->Pam
.IR
.index
== 0)
273 vex_printf("%d(", (Int
)am
->Pam
.IR
.index
);
274 ppHRegPPC(am
->Pam
.IR
.base
);
278 ppHRegPPC(am
->Pam
.RR
.base
);
280 ppHRegPPC(am
->Pam
.RR
.index
);
283 vpanic("ppPPCAMode");
287 static void addRegUsage_PPCAMode ( HRegUsage
* u
, PPCAMode
* am
) {
290 addHRegUse(u
, HRmRead
, am
->Pam
.IR
.base
);
293 addHRegUse(u
, HRmRead
, am
->Pam
.RR
.base
);
294 addHRegUse(u
, HRmRead
, am
->Pam
.RR
.index
);
297 vpanic("addRegUsage_PPCAMode");
301 static void mapRegs_PPCAMode ( HRegRemap
* m
, PPCAMode
* am
) {
304 am
->Pam
.IR
.base
= lookupHRegRemap(m
, am
->Pam
.IR
.base
);
307 am
->Pam
.RR
.base
= lookupHRegRemap(m
, am
->Pam
.RR
.base
);
308 am
->Pam
.RR
.index
= lookupHRegRemap(m
, am
->Pam
.RR
.index
);
311 vpanic("mapRegs_PPCAMode");
315 /* --------- Operand, which can be a reg or a u16/s16. --------- */
317 PPCRH
* PPCRH_Imm ( Bool syned
, UShort imm16
) {
318 PPCRH
* op
= LibVEX_Alloc_inline(sizeof(PPCRH
));
320 op
->Prh
.Imm
.syned
= syned
;
321 op
->Prh
.Imm
.imm16
= imm16
;
322 /* If this is a signed value, ensure it's not -32768, so that we
323 are guaranteed always to be able to negate if needed. */
325 vassert(imm16
!= 0x8000);
326 vassert(syned
== True
|| syned
== False
);
329 PPCRH
* PPCRH_Reg ( HReg reg
) {
330 PPCRH
* op
= LibVEX_Alloc_inline(sizeof(PPCRH
));
332 op
->Prh
.Reg
.reg
= reg
;
336 void ppPPCRH ( PPCRH
* op
) {
339 if (op
->Prh
.Imm
.syned
)
340 vex_printf("%d", (Int
)(Short
)op
->Prh
.Imm
.imm16
);
342 vex_printf("%u", (UInt
)(UShort
)op
->Prh
.Imm
.imm16
);
345 ppHRegPPC(op
->Prh
.Reg
.reg
);
352 /* An PPCRH can only be used in a "read" context (what would it mean
353 to write or modify a literal?) and so we enumerate its registers
355 static void addRegUsage_PPCRH ( HRegUsage
* u
, PPCRH
* op
) {
360 addHRegUse(u
, HRmRead
, op
->Prh
.Reg
.reg
);
363 vpanic("addRegUsage_PPCRH");
367 static void mapRegs_PPCRH ( HRegRemap
* m
, PPCRH
* op
) {
372 op
->Prh
.Reg
.reg
= lookupHRegRemap(m
, op
->Prh
.Reg
.reg
);
375 vpanic("mapRegs_PPCRH");
380 /* --------- Operand, which can be a reg or a u32/64. --------- */
382 PPCRI
* PPCRI_Imm ( ULong imm64
) {
383 PPCRI
* op
= LibVEX_Alloc_inline(sizeof(PPCRI
));
388 PPCRI
* PPCRI_Reg ( HReg reg
) {
389 PPCRI
* op
= LibVEX_Alloc_inline(sizeof(PPCRI
));
395 void ppPPCRI ( PPCRI
* dst
) {
398 vex_printf("0x%llx", dst
->Pri
.Imm
);
401 ppHRegPPC(dst
->Pri
.Reg
);
408 /* An PPCRI can only be used in a "read" context (what would it
409 mean to write or modify a literal?) and so we enumerate its
410 registers accordingly. */
411 static void addRegUsage_PPCRI ( HRegUsage
* u
, PPCRI
* dst
) {
416 addHRegUse(u
, HRmRead
, dst
->Pri
.Reg
);
419 vpanic("addRegUsage_PPCRI");
423 static void mapRegs_PPCRI ( HRegRemap
* m
, PPCRI
* dst
) {
428 dst
->Pri
.Reg
= lookupHRegRemap(m
, dst
->Pri
.Reg
);
431 vpanic("mapRegs_PPCRI");
436 /* --------- Operand, which can be a vector reg or a simm5. --------- */
438 PPCVI5s
* PPCVI5s_Imm ( Char simm5
) {
439 PPCVI5s
* op
= LibVEX_Alloc_inline(sizeof(PPCVI5s
));
441 op
->Pvi
.Imm5s
= simm5
;
442 vassert(simm5
>= -16 && simm5
<= 15);
445 PPCVI5s
* PPCVI5s_Reg ( HReg reg
) {
446 PPCVI5s
* op
= LibVEX_Alloc_inline(sizeof(PPCVI5s
));
449 vassert(hregClass(reg
) == HRcVec128
);
453 void ppPPCVI5s ( PPCVI5s
* src
) {
456 vex_printf("%d", (Int
)src
->Pvi
.Imm5s
);
459 ppHRegPPC(src
->Pvi
.Reg
);
466 /* An PPCVI5s can only be used in a "read" context (what would it
467 mean to write or modify a literal?) and so we enumerate its
468 registers accordingly. */
469 static void addRegUsage_PPCVI5s ( HRegUsage
* u
, PPCVI5s
* dst
) {
474 addHRegUse(u
, HRmRead
, dst
->Pvi
.Reg
);
477 vpanic("addRegUsage_PPCVI5s");
481 static void mapRegs_PPCVI5s ( HRegRemap
* m
, PPCVI5s
* dst
) {
486 dst
->Pvi
.Reg
= lookupHRegRemap(m
, dst
->Pvi
.Reg
);
489 vpanic("mapRegs_PPCVI5s");
494 /* --------- Instructions. --------- */
496 const HChar
* showPPCUnaryOp ( PPCUnaryOp op
) {
498 case Pun_NOT
: return "not";
499 case Pun_NEG
: return "neg";
500 case Pun_CLZ32
: return "cntlzw";
501 case Pun_CLZ64
: return "cntlzd";
502 case Pun_EXTSW
: return "extsw";
503 case Pun_POP32
: return "popcntw";
504 case Pun_POP64
: return "popcntd";
505 default: vpanic("showPPCUnaryOp");
509 const HChar
* showPPCAluOp ( PPCAluOp op
, Bool immR
) {
511 case Palu_ADD
: return immR
? "addi" : "add";
512 case Palu_SUB
: return immR
? "subi" : "sub";
513 case Palu_AND
: return immR
? "andi." : "and";
514 case Palu_OR
: return immR
? "ori" : "or";
515 case Palu_XOR
: return immR
? "xori" : "xor";
516 default: vpanic("showPPCAluOp");
520 const HChar
* showPPCShftOp ( PPCShftOp op
, Bool immR
, Bool sz32
) {
522 case Pshft_SHL
: return sz32
? (immR
? "slwi" : "slw") :
523 (immR
? "sldi" : "sld");
524 case Pshft_SHR
: return sz32
? (immR
? "srwi" : "srw") :
525 (immR
? "srdi" : "srd");
526 case Pshft_SAR
: return sz32
? (immR
? "srawi" : "sraw") :
527 (immR
? "sradi" : "srad");
528 default: vpanic("showPPCShftOp");
532 const HChar
* showPPCFpOp ( PPCFpOp op
) {
534 case Pfp_ADDD
: return "fadd";
535 case Pfp_SUBD
: return "fsub";
536 case Pfp_MULD
: return "fmul";
537 case Pfp_DIVD
: return "fdiv";
538 case Pfp_MADDD
: return "fmadd";
539 case Pfp_MSUBD
: return "fmsub";
540 case Pfp_MADDS
: return "fmadds";
541 case Pfp_MSUBS
: return "fmsubs";
542 case Pfp_ADDS
: return "fadds";
543 case Pfp_SUBS
: return "fsubs";
544 case Pfp_MULS
: return "fmuls";
545 case Pfp_DIVS
: return "fdivs";
546 case Pfp_SQRT
: return "fsqrt";
547 case Pfp_ABS
: return "fabs";
548 case Pfp_NEG
: return "fneg";
549 case Pfp_MOV
: return "fmr";
550 case Pfp_RES
: return "fres";
551 case Pfp_RSQRTE
: return "frsqrte";
552 case Pfp_FRIM
: return "frim";
553 case Pfp_FRIN
: return "frin";
554 case Pfp_FRIP
: return "frip";
555 case Pfp_FRIZ
: return "friz";
556 case Pfp_FPADDQ
: return "xsaddqp";
557 case Pfp_FPSUBQ
: return "xsubqp";
558 case Pfp_FPMULQ
: return "xsmulqp";
559 case Pfp_FPDIVQ
: return "xsdivqp";
560 case Pfp_FPMULADDQ
: return "xsmaddqp";
561 case Pfp_FPMULSUBQ
: return "xsmsubqp";
562 case Pfp_FPNEGMULADDQ
: return "xsnmaddqp";
563 case Pfp_FPNEGMULSUBQ
: return "xsnmsubqp";
564 case Pfp_FPADDQRNDODD
: return "xsaddqpo";
565 case Pfp_FPSUBQRNDODD
: return "xsubqpo";
566 case Pfp_FPMULQRNDODD
: return "xsmulqpo";
567 case Pfp_FPDIVQRNDODD
: return "xsaddqpo";
568 case Pfp_FPMULADDQRNDODD
: return "xsmaddqpo";
569 case Pfp_FPMULSUBQRNDODD
: return "xsmsubqpo";
570 case Pfp_FPNEGMULADDQRNDODD
: return "xsnmaddqpo";
571 case Pfp_FPNEGMULSUBQRNDODD
: return "xsnmsubqpo";
572 case Pfp_FPQTOD
: return "xscvqpdp";
573 case Pfp_FPQTODRNDODD
: return "xscvqpdpo";
574 case Pfp_FPDTOQ
: return "xscvdpqp";
575 case Pfp_IDSTOQ
: return "xscvsdqp";
576 case Pfp_IDUTOQ
: return "xscvudqp";
577 case Pfp_IQSTOQ
: return "xscvsqqp";
578 case Pfp_IQUTOQ
: return "xscvuqqp";
579 case Pfp_TRUNCFPQTOISD
: return "xscvqpsdz";
580 case Pfp_TRUNCFPQTOISW
: return "xscvqpswz";
581 case Pfp_TRUNCFPQTOIUD
: return "xscvqpudz";
582 case Pfp_TRUNCFPQTOIUW
: return "xscvqpuwz";
583 case Pfp_DFPADD
: return "dadd";
584 case Pfp_DFPADDQ
: return "daddq";
585 case Pfp_DFPSUB
: return "dsub";
586 case Pfp_DFPSUBQ
: return "dsubq";
587 case Pfp_DFPMUL
: return "dmul";
588 case Pfp_DFPMULQ
: return "dmulq";
589 case Pfp_DFPDIV
: return "ddivd";
590 case Pfp_DFPDIVQ
: return "ddivq";
591 case Pfp_DFPTOIQ
: return "dctfixqq";
592 case Pfp_IQUTODFP
: return "dcffixqq";
593 case Pfp_DCTDP
: return "dctdp";
594 case Pfp_DRSP
: return "drsp";
595 case Pfp_DCTFIX
: return "dctfix";
596 case Pfp_DCFFIX
: return "dcffix";
597 case Pfp_DCTQPQ
: return "dctqpq";
598 case Pfp_DCFFIXQ
: return "dcffixq";
599 case Pfp_DQUA
: return "dqua";
600 case Pfp_DQUAQ
: return "dquaq";
601 case Pfp_DXEX
: return "dxex";
602 case Pfp_DXEXQ
: return "dxexq";
603 case Pfp_DIEX
: return "diex";
604 case Pfp_DIEXQ
: return "diexq";
605 case Pfp_RRDTR
: return "rrdtr";
606 default: vpanic("showPPCFpOp");
610 const HChar
* showPPCAvOp ( PPCAvOp op
) {
614 case Pav_MOV
: return "vmr"; /* Mov */
616 case Pav_AND
: return "vand"; /* Bitwise */
617 case Pav_OR
: return "vor";
618 case Pav_XOR
: return "vxor";
619 case Pav_NOT
: return "vnot";
621 case Pav_UNPCKH8S
: return "vupkhsb"; /* Unpack */
622 case Pav_UNPCKH16S
: return "vupkhsh";
623 case Pav_UNPCKL8S
: return "vupklsb";
624 case Pav_UNPCKL16S
: return "vupklsh";
625 case Pav_UNPCKHPIX
: return "vupkhpx";
626 case Pav_UNPCKLPIX
: return "vupklpx";
629 case Pav_ADDU
: return "vaddu_m"; // b,h,w,dw
630 case Pav_QADDU
: return "vaddu_s"; // b,h,w,dw
631 case Pav_QADDS
: return "vadds_s"; // b,h,w,dw
633 case Pav_SUBU
: return "vsubu_m"; // b,h,w,dw
634 case Pav_QSUBU
: return "vsubu_s"; // b,h,w,dw
635 case Pav_QSUBS
: return "vsubs_s"; // b,h,w,dw
637 case Pav_MULU
: return "vmulu"; // w
638 case Pav_OMULU
: return "vmulou"; // b,h,w
639 case Pav_OMULS
: return "vmulos"; // b,h,w
640 case Pav_EMULU
: return "vmuleu"; // b,h,w
641 case Pav_EMULS
: return "vmules"; // b,h,w
643 case Pav_AVGU
: return "vavgu"; // b,h,w
644 case Pav_AVGS
: return "vavgs"; // b,h,w
646 case Pav_MAXU
: return "vmaxu"; // b,h,w
647 case Pav_MAXS
: return "vmaxs"; // b,h,w
649 case Pav_MINU
: return "vminu"; // b,h,w
650 case Pav_MINS
: return "vmins"; // b,h,w
652 /* Compare (always affects CR field 6) */
653 case Pav_CMPEQU
: return "vcmpequ"; // b,h,w
654 case Pav_CMPGTU
: return "vcmpgtu"; // b,h,w
655 case Pav_CMPGTS
: return "vcmpgts"; // b,h,w
658 case Pav_SHL
: return "vsl"; // ' ',b,h,w,dw
659 case Pav_SHR
: return "vsr"; // ' ',b,h,w,dw
660 case Pav_SAR
: return "vsra"; // b,h,w,dw
661 case Pav_ROTL
: return "vrl"; // b,h,w,dw
664 case Pav_PACKUU
: return "vpku_um"; // h,w,dw
665 case Pav_QPACKUU
: return "vpku_us"; // h,w
666 case Pav_QPACKSU
: return "vpks_us"; // h,w
667 case Pav_QPACKSS
: return "vpks_ss"; // h,w
668 case Pav_PACKPXL
: return "vpkpx";
671 case Pav_MRGHI
: return "vmrgh"; // b,h,w
672 case Pav_MRGLO
: return "vmrgl"; // b,h,w
675 case Pav_CATODD
: return "vmrgow"; // w
676 case Pav_CATEVEN
: return "vmrgew"; // w
679 case Pav_SHA256
: return "vshasigmaw"; // w
680 case Pav_SHA512
: return "vshasigmaw"; // dw
683 case Pav_BCDAdd
: return "bcdadd."; // qw
684 case Pav_BCDSub
: return "bcdsub."; // qw
685 case Pav_I128StoBCD128
: return "bcdcfsq."; //qw
686 case Pav_BCD128toI128S
: return "bcdctsq."; //qw
688 /* I128 mult by 10 */
689 case Pav_MulI128by10
: return "vmul10uq"; //qw
690 case Pav_MulI128by10Carry
: return "vmul10cuq"; //qw
691 case Pav_MulI128by10E
: return "vmul10euq"; //qw
692 case Pav_MulI128by10ECarry
: return "vmul10ecuq"; //qw
694 /* F128 to I128 signed */
695 case Pav_F128toI128S
: return "xsrqpi|x"; //qw
697 /* F128 round to F128 */
698 case Pav_ROUNDFPQ
: return "xsrqpxp";
700 /* Polynomial arith */
701 case Pav_POLYMULADD
: return "vpmsum"; // b, h, w, d
704 case Pav_CIPHERV128
: case Pav_CIPHERLV128
:
705 case Pav_NCIPHERV128
: case Pav_NCIPHERLV128
:
706 case Pav_CIPHERSUBV128
: return "v_cipher_"; // qw
709 case Pav_ZEROCNTBYTE
: case Pav_ZEROCNTWORD
:
710 case Pav_ZEROCNTHALF
: case Pav_ZEROCNTDBL
:
711 return "vclz_"; // b, h, w, d
713 /* trailing zero count */
714 case Pav_TRAILINGZEROCNTBYTE
: case Pav_TRAILINGZEROCNTWORD
:
715 case Pav_TRAILINGZEROCNTHALF
: case Pav_TRAILINGZEROCNTDBL
:
716 return "vctz_"; // b, h, w, d
718 /* vector gather (byte-by-byte bit matrix transpose) */
719 case Pav_BITMTXXPOSE
:
722 /* Vector Half-precision format to single precision conversion */
726 /* Vector Single-precision format to Half-precision conversion */
730 /* Vector Half-precision format to Double precision conversion */
734 /* Vector Half-precision format to Double precision conversion */
738 default: vpanic("showPPCAvOp");
/* Map a PPCAvOpBin128 (128-bit vector binary op) to its assembler
   mnemonic, for debug printing.
   NOTE(review): this extract is missing original lines 743-765 (the
   individual op cases); only the fragments below survive.  Restore
   the full switch body from upstream before compiling. */
742 const HChar
* showPPCAvOpBin128 ( PPCAvOpBin128 op
) {
747 /* Vector Divide Signed Quadword VX-form */
766 default: vpanic("showPPCAvOpBin128");
/* Map a PPCAvOpTri128 (128-bit vector ternary op) to its assembler
   mnemonic, for debug printing.
   NOTE(review): this extract is missing several original lines (771,
   773, 775-776 — the case bodies); only fragments survive.  Restore
   the full switch body from upstream before compiling. */
770 const HChar
* showPPCAvOpTri128 ( PPCAvOpTri128 op
) {
772 /* Vector Quadword VX-form */
774 case Pav_2xMultU64Add128CarryOut
:
777 default: vpanic("showPPCAvOpTri128");
781 const HChar
* showPPCAvFpOp ( PPCAvFpOp op
) {
783 /* Floating Point Binary */
784 case Pavfp_ADDF
: return "vaddfp";
785 case Pavfp_SUBF
: return "vsubfp";
786 case Pavfp_MULF
: return "vmaddfp";
787 case Pavfp_MAXF
: return "vmaxfp";
788 case Pavfp_MINF
: return "vminfp";
789 case Pavfp_CMPEQF
: return "vcmpeqfp";
790 case Pavfp_CMPGTF
: return "vcmpgtfp";
791 case Pavfp_CMPGEF
: return "vcmpgefp";
793 /* Floating Point Unary */
794 case Pavfp_RCPF
: return "vrefp";
795 case Pavfp_RSQRTF
: return "vrsqrtefp";
796 case Pavfp_Log2
: return "vlogefp";
797 case Pavfp_Exp2
: return "vexptefp";
798 case Pavfp_CVTU2F
: return "vcfux";
799 case Pavfp_CVTS2F
: return "vcfsx";
800 case Pavfp_QCVTF2U
: return "vctuxs";
801 case Pavfp_QCVTF2S
: return "vctsxs";
802 case Pavfp_ROUNDM
: return "vrfim";
803 case Pavfp_ROUNDP
: return "vrfip";
804 case Pavfp_ROUNDN
: return "vrfin";
805 case Pavfp_ROUNDZ
: return "vrfiz";
807 default: vpanic("showPPCAvFpOp");
/* Map a PPCXFormUnary994 op to its assembler mnemonic, for debug
   printing.
   NOTE(review): this extract is missing original lines 812, 814-819
   (the op cases); only fragments survive.  Restore the full switch
   body from upstream before compiling. */
811 const HChar
* showXFormUnary994 ( PPCXFormUnary994 op
) {
813 /* Vector Quadword VX-form */
820 default: vpanic("showXFormUnary994");
824 PPCInstr
* PPCInstr_LI ( HReg dst
, ULong imm64
, Bool mode64
)
826 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
829 i
->Pin
.LI
.imm64
= imm64
;
831 vassert( (Long
)imm64
== (Long
)(Int
)(UInt
)imm64
);
834 PPCInstr
* PPCInstr_Alu ( PPCAluOp op
, HReg dst
,
835 HReg srcL
, PPCRH
* srcR
) {
836 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
839 i
->Pin
.Alu
.dst
= dst
;
840 i
->Pin
.Alu
.srcL
= srcL
;
841 i
->Pin
.Alu
.srcR
= srcR
;
844 PPCInstr
* PPCInstr_Shft ( PPCShftOp op
, Bool sz32
,
845 HReg dst
, HReg srcL
, PPCRH
* srcR
) {
846 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
849 i
->Pin
.Shft
.sz32
= sz32
;
850 i
->Pin
.Shft
.dst
= dst
;
851 i
->Pin
.Shft
.srcL
= srcL
;
852 i
->Pin
.Shft
.srcR
= srcR
;
855 PPCInstr
* PPCInstr_AddSubC ( Bool isAdd
, Bool setC
,
856 HReg dst
, HReg srcL
, HReg srcR
) {
857 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
858 i
->tag
= Pin_AddSubC
;
859 i
->Pin
.AddSubC
.isAdd
= isAdd
;
860 i
->Pin
.AddSubC
.setC
= setC
;
861 i
->Pin
.AddSubC
.dst
= dst
;
862 i
->Pin
.AddSubC
.srcL
= srcL
;
863 i
->Pin
.AddSubC
.srcR
= srcR
;
866 PPCInstr
* PPCInstr_Cmp ( Bool syned
, Bool sz32
,
867 UInt crfD
, HReg srcL
, PPCRH
* srcR
) {
868 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
870 i
->Pin
.Cmp
.syned
= syned
;
871 i
->Pin
.Cmp
.sz32
= sz32
;
872 i
->Pin
.Cmp
.crfD
= crfD
;
873 i
->Pin
.Cmp
.srcL
= srcL
;
874 i
->Pin
.Cmp
.srcR
= srcR
;
877 PPCInstr
* PPCInstr_Unary ( PPCUnaryOp op
, HReg dst
, HReg src
) {
878 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
880 i
->Pin
.Unary
.op
= op
;
881 i
->Pin
.Unary
.dst
= dst
;
882 i
->Pin
.Unary
.src
= src
;
885 PPCInstr
* PPCInstr_MulL ( Bool syned
, Bool hi
, Bool sz32
,
886 HReg dst
, HReg srcL
, HReg srcR
) {
887 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
889 i
->Pin
.MulL
.syned
= syned
;
891 i
->Pin
.MulL
.sz32
= sz32
;
892 i
->Pin
.MulL
.dst
= dst
;
893 i
->Pin
.MulL
.srcL
= srcL
;
894 i
->Pin
.MulL
.srcR
= srcR
;
895 /* if doing the low word, the signedness is irrelevant, but tie it
897 if (!hi
) vassert(!syned
);
900 PPCInstr
* PPCInstr_Div ( Bool extended
, Bool syned
, Bool sz32
,
901 HReg dst
, HReg srcL
, HReg srcR
) {
902 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
904 i
->Pin
.Div
.extended
= extended
;
905 i
->Pin
.Div
.syned
= syned
;
906 i
->Pin
.Div
.sz32
= sz32
;
907 i
->Pin
.Div
.dst
= dst
;
908 i
->Pin
.Div
.srcL
= srcL
;
909 i
->Pin
.Div
.srcR
= srcR
;
912 PPCInstr
* PPCInstr_Call ( PPCCondCode cond
,
913 Addr64 target
, UInt argiregs
, RetLoc rloc
) {
915 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
917 i
->Pin
.Call
.cond
= cond
;
918 i
->Pin
.Call
.target
= target
;
919 i
->Pin
.Call
.argiregs
= argiregs
;
920 i
->Pin
.Call
.rloc
= rloc
;
921 /* Only r3 .. r10 inclusive may be used as arg regs. Hence: */
922 mask
= (1<<3)|(1<<4)|(1<<5)|(1<<6)|(1<<7)|(1<<8)|(1<<9)|(1<<10);
923 vassert(0 == (argiregs
& ~mask
));
924 vassert(is_sane_RetLoc(rloc
));
927 PPCInstr
* PPCInstr_XDirect ( Addr64 dstGA
, PPCAMode
* amCIA
,
928 PPCCondCode cond
, Bool toFastEP
) {
929 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
930 i
->tag
= Pin_XDirect
;
931 i
->Pin
.XDirect
.dstGA
= dstGA
;
932 i
->Pin
.XDirect
.amCIA
= amCIA
;
933 i
->Pin
.XDirect
.cond
= cond
;
934 i
->Pin
.XDirect
.toFastEP
= toFastEP
;
937 PPCInstr
* PPCInstr_XIndir ( HReg dstGA
, PPCAMode
* amCIA
,
939 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
941 i
->Pin
.XIndir
.dstGA
= dstGA
;
942 i
->Pin
.XIndir
.amCIA
= amCIA
;
943 i
->Pin
.XIndir
.cond
= cond
;
946 PPCInstr
* PPCInstr_XAssisted ( HReg dstGA
, PPCAMode
* amCIA
,
947 PPCCondCode cond
, IRJumpKind jk
) {
948 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
949 i
->tag
= Pin_XAssisted
;
950 i
->Pin
.XAssisted
.dstGA
= dstGA
;
951 i
->Pin
.XAssisted
.amCIA
= amCIA
;
952 i
->Pin
.XAssisted
.cond
= cond
;
953 i
->Pin
.XAssisted
.jk
= jk
;
956 PPCInstr
* PPCInstr_CMov ( PPCCondCode cond
,
957 HReg dst
, PPCRI
* src
) {
958 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
960 i
->Pin
.CMov
.cond
= cond
;
961 i
->Pin
.CMov
.src
= src
;
962 i
->Pin
.CMov
.dst
= dst
;
963 vassert(cond
.test
!= Pct_ALWAYS
);
966 PPCInstr
* PPCInstr_Load ( UChar sz
,
967 HReg dst
, PPCAMode
* src
, Bool mode64
) {
968 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
971 i
->Pin
.Load
.src
= src
;
972 i
->Pin
.Load
.dst
= dst
;
973 vassert(sz
== 1 || sz
== 2 || sz
== 4 || sz
== 8);
974 if (sz
== 8) vassert(mode64
);
977 PPCInstr
* PPCInstr_LoadL ( UChar sz
,
978 HReg dst
, HReg src
, Bool mode64
)
980 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
982 i
->Pin
.LoadL
.sz
= sz
;
983 i
->Pin
.LoadL
.src
= src
;
984 i
->Pin
.LoadL
.dst
= dst
;
985 vassert(sz
== 1 || sz
== 2 || sz
== 4 || sz
== 8);
986 if (sz
== 8) vassert(mode64
);
989 PPCInstr
* PPCInstr_Store ( UChar sz
, PPCAMode
* dst
, HReg src
,
991 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
993 i
->Pin
.Store
.sz
= sz
;
994 i
->Pin
.Store
.src
= src
;
995 i
->Pin
.Store
.dst
= dst
;
996 vassert(sz
== 1 || sz
== 2 || sz
== 4 || sz
== 8);
997 if (sz
== 8) vassert(mode64
);
1000 PPCInstr
* PPCInstr_StoreC ( UChar sz
, HReg dst
, HReg src
, Bool mode64
) {
1001 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1002 i
->tag
= Pin_StoreC
;
1003 i
->Pin
.StoreC
.sz
= sz
;
1004 i
->Pin
.StoreC
.src
= src
;
1005 i
->Pin
.StoreC
.dst
= dst
;
1006 vassert(sz
== 1 || sz
== 2 || sz
== 4 || sz
== 8);
1007 if (sz
== 8) vassert(mode64
);
1010 PPCInstr
* PPCInstr_Set ( PPCCondCode cond
, HReg dst
) {
1011 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1013 i
->Pin
.Set
.cond
= cond
;
1014 i
->Pin
.Set
.dst
= dst
;
1017 PPCInstr
* PPCInstr_MfCR ( HReg dst
)
1019 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1021 i
->Pin
.MfCR
.dst
= dst
;
1024 PPCInstr
* PPCInstr_MFence ( void )
1026 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1027 i
->tag
= Pin_MFence
;
1031 PPCInstr
* PPCInstr_FpUnary ( PPCFpOp op
, HReg dst
, HReg src
) {
1032 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1033 i
->tag
= Pin_FpUnary
;
1034 i
->Pin
.FpUnary
.op
= op
;
1035 i
->Pin
.FpUnary
.dst
= dst
;
1036 i
->Pin
.FpUnary
.src
= src
;
1039 PPCInstr
* PPCInstr_FpBinary ( PPCFpOp op
, HReg dst
,
1040 HReg srcL
, HReg srcR
) {
1041 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1042 i
->tag
= Pin_FpBinary
;
1043 i
->Pin
.FpBinary
.op
= op
;
1044 i
->Pin
.FpBinary
.dst
= dst
;
1045 i
->Pin
.FpBinary
.srcL
= srcL
;
1046 i
->Pin
.FpBinary
.srcR
= srcR
;
1049 PPCInstr
* PPCInstr_Fp128Unary(PPCFpOp op
, HReg dst
, HReg src
) {
1050 PPCInstr
* i
= LibVEX_Alloc_inline( sizeof(PPCInstr
) );
1051 i
->tag
= Pin_Fp128Unary
;
1052 i
->Pin
.Fp128Unary
.op
= op
;
1053 i
->Pin
.Fp128Unary
.dst
= dst
;
1054 i
->Pin
.Fp128Unary
.src
= src
;
1057 PPCInstr
* PPCInstr_Fp128Binary(PPCFpOp op
, HReg dst
, HReg srcL
, HReg srcR
) {
1058 PPCInstr
* i
= LibVEX_Alloc_inline( sizeof(PPCInstr
) );
1059 i
->tag
= Pin_Fp128Binary
;
1060 i
->Pin
.Fp128Binary
.op
= op
;
1061 i
->Pin
.Fp128Binary
.dst
= dst
;
1062 i
->Pin
.Fp128Binary
.srcL
= srcL
;
1063 i
->Pin
.Fp128Binary
.srcR
= srcR
;
1066 PPCInstr
* PPCInstr_Fp128Ternary(PPCFpOp op
, HReg dst
, HReg srcL
, HReg srcR
) {
1067 PPCInstr
* i
= LibVEX_Alloc_inline( sizeof(PPCInstr
) );
1068 i
->tag
= Pin_Fp128Ternary
;
1069 i
->Pin
.Fp128Ternary
.op
= op
;
1070 i
->Pin
.Fp128Ternary
.dst
= dst
;
1071 i
->Pin
.Fp128Ternary
.srcL
= srcL
;
1072 i
->Pin
.Fp128Ternary
.srcR
= srcR
;
1075 PPCInstr
* PPCInstr_FpMulAcc ( PPCFpOp op
, HReg dst
, HReg srcML
,
1076 HReg srcMR
, HReg srcAcc
)
1078 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1079 i
->tag
= Pin_FpMulAcc
;
1080 i
->Pin
.FpMulAcc
.op
= op
;
1081 i
->Pin
.FpMulAcc
.dst
= dst
;
1082 i
->Pin
.FpMulAcc
.srcML
= srcML
;
1083 i
->Pin
.FpMulAcc
.srcMR
= srcMR
;
1084 i
->Pin
.FpMulAcc
.srcAcc
= srcAcc
;
1087 PPCInstr
* PPCInstr_FpLdSt ( Bool isLoad
, UChar sz
,
1088 HReg reg
, PPCAMode
* addr
) {
1089 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1090 i
->tag
= Pin_FpLdSt
;
1091 i
->Pin
.FpLdSt
.isLoad
= isLoad
;
1092 i
->Pin
.FpLdSt
.sz
= sz
;
1093 i
->Pin
.FpLdSt
.reg
= reg
;
1094 i
->Pin
.FpLdSt
.addr
= addr
;
1095 vassert(sz
== 4 || sz
== 8);
1098 PPCInstr
* PPCInstr_FpSTFIW ( HReg addr
, HReg data
)
1100 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1101 i
->tag
= Pin_FpSTFIW
;
1102 i
->Pin
.FpSTFIW
.addr
= addr
;
1103 i
->Pin
.FpSTFIW
.data
= data
;
1106 PPCInstr
* PPCInstr_FpRSP ( HReg dst
, HReg src
) {
1107 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1109 i
->Pin
.FpRSP
.dst
= dst
;
1110 i
->Pin
.FpRSP
.src
= src
;
1113 PPCInstr
* PPCInstr_Dfp64Unary(PPCFpOp op
, HReg dst
, HReg src
) {
1114 PPCInstr
* i
= LibVEX_Alloc_inline( sizeof(PPCInstr
) );
1115 i
->tag
= Pin_Dfp64Unary
;
1116 i
->Pin
.Dfp64Unary
.op
= op
;
1117 i
->Pin
.Dfp64Unary
.dst
= dst
;
1118 i
->Pin
.Dfp64Unary
.src
= src
;
1121 PPCInstr
* PPCInstr_Dfp64Binary(PPCFpOp op
, HReg dst
, HReg srcL
, HReg srcR
) {
1122 PPCInstr
* i
= LibVEX_Alloc_inline( sizeof(PPCInstr
) );
1123 i
->tag
= Pin_Dfp64Binary
;
1124 i
->Pin
.Dfp64Binary
.op
= op
;
1125 i
->Pin
.Dfp64Binary
.dst
= dst
;
1126 i
->Pin
.Dfp64Binary
.srcL
= srcL
;
1127 i
->Pin
.Dfp64Binary
.srcR
= srcR
;
1130 PPCInstr
* PPCInstr_DfpShift ( PPCFpOp op
, HReg dst
, HReg src
, PPCRI
* shift
) {
1131 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1132 i
->tag
= Pin_DfpShift
;
1133 i
->Pin
.DfpShift
.op
= op
;
1134 i
->Pin
.DfpShift
.shift
= shift
;
1135 i
->Pin
.DfpShift
.src
= src
;
1136 i
->Pin
.DfpShift
.dst
= dst
;
1139 PPCInstr
* PPCInstr_Dfp128Unary(PPCFpOp op
, HReg dst_hi
, HReg dst_lo
,
1140 HReg src_hi
, HReg src_lo
) {
1141 PPCInstr
* i
= LibVEX_Alloc_inline( sizeof(PPCInstr
) );
1142 i
->tag
= Pin_Dfp128Unary
;
1143 i
->Pin
.Dfp128Unary
.op
= op
;
1144 i
->Pin
.Dfp128Unary
.dst_hi
= dst_hi
;
1145 i
->Pin
.Dfp128Unary
.dst_lo
= dst_lo
;
1146 i
->Pin
.Dfp128Unary
.src_hi
= src_hi
;
1147 i
->Pin
.Dfp128Unary
.src_lo
= src_lo
;
1150 PPCInstr
* PPCInstr_Dfp128Binary(PPCFpOp op
, HReg dst_hi
, HReg dst_lo
,
1151 HReg srcR_hi
, HReg srcR_lo
) {
1152 /* dst is used to pass the srcL argument and return the result */
1153 PPCInstr
* i
= LibVEX_Alloc_inline( sizeof(PPCInstr
) );
1154 i
->tag
= Pin_Dfp128Binary
;
1155 i
->Pin
.Dfp128Binary
.op
= op
;
1156 i
->Pin
.Dfp128Binary
.dst_hi
= dst_hi
;
1157 i
->Pin
.Dfp128Binary
.dst_lo
= dst_lo
;
1158 i
->Pin
.Dfp128Binary
.srcR_hi
= srcR_hi
;
1159 i
->Pin
.Dfp128Binary
.srcR_lo
= srcR_lo
;
1162 PPCInstr
* PPCInstr_DfpShift128 ( PPCFpOp op
, HReg dst_hi
, HReg dst_lo
,
1163 HReg src_hi
, HReg src_lo
,
1165 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1166 i
->tag
= Pin_DfpShift128
;
1167 i
->Pin
.DfpShift128
.op
= op
;
1168 i
->Pin
.DfpShift128
.shift
= shift
;
1169 i
->Pin
.DfpShift128
.src_hi
= src_hi
;
1170 i
->Pin
.DfpShift128
.src_lo
= src_lo
;
1171 i
->Pin
.DfpShift128
.dst_hi
= dst_hi
;
1172 i
->Pin
.DfpShift128
.dst_lo
= dst_lo
;
1175 PPCInstr
* PPCInstr_DfpRound ( HReg dst
, HReg src
, PPCRI
* r_rmc
) {
1176 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1177 i
->tag
= Pin_DfpRound
;
1178 i
->Pin
.DfpRound
.dst
= dst
;
1179 i
->Pin
.DfpRound
.src
= src
;
1180 i
->Pin
.DfpRound
.r_rmc
= r_rmc
;
1183 PPCInstr
* PPCInstr_DfpRound128 ( HReg dst_hi
, HReg dst_lo
, HReg src_hi
,
1184 HReg src_lo
, PPCRI
* r_rmc
) {
1185 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1186 i
->tag
= Pin_DfpRound128
;
1187 i
->Pin
.DfpRound128
.dst_hi
= dst_hi
;
1188 i
->Pin
.DfpRound128
.dst_lo
= dst_lo
;
1189 i
->Pin
.DfpRound128
.src_hi
= src_hi
;
1190 i
->Pin
.DfpRound128
.src_lo
= src_lo
;
1191 i
->Pin
.DfpRound128
.r_rmc
= r_rmc
;
1194 PPCInstr
* PPCInstr_DfpQuantize ( PPCFpOp op
, HReg dst
, HReg srcL
, HReg srcR
,
1196 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1197 i
->tag
= Pin_DfpQuantize
;
1198 i
->Pin
.DfpQuantize
.op
= op
;
1199 i
->Pin
.DfpQuantize
.dst
= dst
;
1200 i
->Pin
.DfpQuantize
.srcL
= srcL
;
1201 i
->Pin
.DfpQuantize
.srcR
= srcR
;
1202 i
->Pin
.DfpQuantize
.rmc
= rmc
;
1205 PPCInstr
* PPCInstr_DfpQuantize128 ( PPCFpOp op
, HReg dst_hi
, HReg dst_lo
,
1206 HReg src_hi
, HReg src_lo
, PPCRI
* rmc
) {
1207 /* dst is used to pass left operand in and return result */
1208 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1209 i
->tag
= Pin_DfpQuantize128
;
1210 i
->Pin
.DfpQuantize128
.op
= op
;
1211 i
->Pin
.DfpQuantize128
.dst_hi
= dst_hi
;
1212 i
->Pin
.DfpQuantize128
.dst_lo
= dst_lo
;
1213 i
->Pin
.DfpQuantize128
.src_hi
= src_hi
;
1214 i
->Pin
.DfpQuantize128
.src_lo
= src_lo
;
1215 i
->Pin
.DfpQuantize128
.rmc
= rmc
;
1218 PPCInstr
* PPCInstr_DfpD128toD64 ( PPCFpOp op
, HReg dst
,
1219 HReg src_hi
, HReg src_lo
) {
1220 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1221 i
->tag
= Pin_DfpD128toD64
;
1222 i
->Pin
.DfpD128toD64
.op
= op
;
1223 i
->Pin
.DfpD128toD64
.src_hi
= src_hi
;
1224 i
->Pin
.DfpD128toD64
.src_lo
= src_lo
;
1225 i
->Pin
.DfpD128toD64
.dst
= dst
;
1228 PPCInstr
* PPCInstr_DfpI64StoD128 ( PPCFpOp op
, HReg dst_hi
,
1229 HReg dst_lo
, HReg src
) {
1230 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1231 i
->tag
= Pin_DfpI64StoD128
;
1232 i
->Pin
.DfpI64StoD128
.op
= op
;
1233 i
->Pin
.DfpI64StoD128
.src
= src
;
1234 i
->Pin
.DfpI64StoD128
.dst_hi
= dst_hi
;
1235 i
->Pin
.DfpI64StoD128
.dst_lo
= dst_lo
;
1238 PPCInstr
* PPCInstr_ExtractExpD128 ( PPCFpOp op
, HReg dst
,
1239 HReg src_hi
, HReg src_lo
) {
1240 /* dst is used to pass the srcL argument */
1241 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1242 i
->tag
= Pin_ExtractExpD128
;
1243 i
->Pin
.ExtractExpD128
.op
= op
;
1244 i
->Pin
.ExtractExpD128
.dst
= dst
;
1245 i
->Pin
.ExtractExpD128
.src_hi
= src_hi
;
1246 i
->Pin
.ExtractExpD128
.src_lo
= src_lo
;
1249 PPCInstr
* PPCInstr_InsertExpD128 ( PPCFpOp op
, HReg dst_hi
, HReg dst_lo
,
1250 HReg srcL
, HReg srcR_hi
, HReg srcR_lo
) {
1251 /* dst is used to pass the srcL argument */
1252 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1253 i
->tag
= Pin_InsertExpD128
;
1254 i
->Pin
.InsertExpD128
.op
= op
;
1255 i
->Pin
.InsertExpD128
.dst_hi
= dst_hi
;
1256 i
->Pin
.InsertExpD128
.dst_lo
= dst_lo
;
1257 i
->Pin
.InsertExpD128
.srcL
= srcL
;
1258 i
->Pin
.InsertExpD128
.srcR_hi
= srcR_hi
;
1259 i
->Pin
.InsertExpD128
.srcR_lo
= srcR_lo
;
1262 PPCInstr
* PPCInstr_Dfp64Cmp (/* UInt crfD,*/ HReg dst
, HReg srcL
, HReg srcR
) {
1263 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1264 i
->tag
= Pin_Dfp64Cmp
;
1265 i
->Pin
.Dfp64Cmp
.dst
= dst
;
1266 i
->Pin
.Dfp64Cmp
.srcL
= srcL
;
1267 i
->Pin
.Dfp64Cmp
.srcR
= srcR
;
1270 PPCInstr
* PPCInstr_Dfp128Cmp ( HReg dst
, HReg srcL_hi
, HReg srcL_lo
,
1271 HReg srcR_hi
, HReg srcR_lo
) {
1272 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1273 i
->tag
= Pin_Dfp128Cmp
;
1274 i
->Pin
.Dfp128Cmp
.dst
= dst
;
1275 i
->Pin
.Dfp128Cmp
.srcL_hi
= srcL_hi
;
1276 i
->Pin
.Dfp128Cmp
.srcL_lo
= srcL_lo
;
1277 i
->Pin
.Dfp128Cmp
.srcR_hi
= srcR_hi
;
1278 i
->Pin
.Dfp128Cmp
.srcR_lo
= srcR_lo
;
1281 PPCInstr
* PPCInstr_EvCheck ( PPCAMode
* amCounter
,
1282 PPCAMode
* amFailAddr
) {
1283 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1284 i
->tag
= Pin_EvCheck
;
1285 i
->Pin
.EvCheck
.amCounter
= amCounter
;
1286 i
->Pin
.EvCheck
.amFailAddr
= amFailAddr
;
1289 PPCInstr
* PPCInstr_ProfInc ( void ) {
1290 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1291 i
->tag
= Pin_ProfInc
;
1296 Valid combo | fromI | int32 | syned | flt64 |
1297 --------------------------------------------
1299 --------------------------------------------
1300 F64->I64U | n n n y |
1301 --------------------------------------------
1303 --------------------------------------------
1304 F64->I64S | n n y y |
1305 --------------------------------------------
1307 --------------------------------------------
1308 F64->I32U | n y n y |
1309 --------------------------------------------
1311 --------------------------------------------
1312 F64->I32S | n y y y |
1313 --------------------------------------------
1314 I64U->F32 | y n n n |
1315 --------------------------------------------
1316 I64U->F64 | y n n y |
1317 --------------------------------------------
1319 --------------------------------------------
1320 I64S->F64 | y n y y |
1321 --------------------------------------------
1323 --------------------------------------------
1325 --------------------------------------------
1327 --------------------------------------------
1329 --------------------------------------------
1331 PPCInstr
* PPCInstr_FpCftI ( Bool fromI
, Bool int32
, Bool syned
,
1332 Bool flt64
, HReg dst
, HReg src
) {
1333 Bool tmp
= fromI
| int32
| syned
| flt64
;
1334 vassert(tmp
== True
|| tmp
== False
); // iow, no high bits set
1335 UShort conversion
= 0;
1336 conversion
= (fromI
<< 3) | (int32
<< 2) | (syned
<< 1) | flt64
;
1337 switch (conversion
) {
1338 // Supported conversion operations
1339 case 1: case 3: case 5: case 7:
1340 case 8: case 9: case 11:
1343 vpanic("PPCInstr_FpCftI(ppc_host)");
1345 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1346 i
->tag
= Pin_FpCftI
;
1347 i
->Pin
.FpCftI
.fromI
= fromI
;
1348 i
->Pin
.FpCftI
.int32
= int32
;
1349 i
->Pin
.FpCftI
.syned
= syned
;
1350 i
->Pin
.FpCftI
.flt64
= flt64
;
1351 i
->Pin
.FpCftI
.dst
= dst
;
1352 i
->Pin
.FpCftI
.src
= src
;
1355 PPCInstr
* PPCInstr_FpCMov ( PPCCondCode cond
, HReg dst
, HReg src
) {
1356 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1357 i
->tag
= Pin_FpCMov
;
1358 i
->Pin
.FpCMov
.cond
= cond
;
1359 i
->Pin
.FpCMov
.dst
= dst
;
1360 i
->Pin
.FpCMov
.src
= src
;
1361 vassert(cond
.test
!= Pct_ALWAYS
);
1364 PPCInstr
* PPCInstr_FpLdFPSCR ( HReg src
, Bool dfp_rm
) {
1365 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1366 i
->tag
= Pin_FpLdFPSCR
;
1367 i
->Pin
.FpLdFPSCR
.src
= src
;
1368 i
->Pin
.FpLdFPSCR
.dfp_rm
= dfp_rm
? 1 : 0;
1371 PPCInstr
* PPCInstr_FpCmp ( HReg dst
, HReg srcL
, HReg srcR
) {
1372 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1374 i
->Pin
.FpCmp
.dst
= dst
;
1375 i
->Pin
.FpCmp
.srcL
= srcL
;
1376 i
->Pin
.FpCmp
.srcR
= srcR
;
1380 /* Read/Write Link Register */
1381 PPCInstr
* PPCInstr_RdWrLR ( Bool wrLR
, HReg gpr
) {
1382 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1383 i
->tag
= Pin_RdWrLR
;
1384 i
->Pin
.RdWrLR
.wrLR
= wrLR
;
1385 i
->Pin
.RdWrLR
.gpr
= gpr
;
1390 PPCInstr
* PPCInstr_AvLdSt ( Bool isLoad
, UChar sz
,
1391 HReg reg
, PPCAMode
* addr
) {
1392 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1393 i
->tag
= Pin_AvLdSt
;
1394 i
->Pin
.AvLdSt
.isLoad
= isLoad
;
1395 i
->Pin
.AvLdSt
.sz
= sz
;
1396 i
->Pin
.AvLdSt
.reg
= reg
;
1397 i
->Pin
.AvLdSt
.addr
= addr
;
1400 PPCInstr
* PPCInstr_AvUnary ( PPCAvOp op
, HReg dst
, HReg src
) {
1401 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1402 i
->tag
= Pin_AvUnary
;
1403 i
->Pin
.AvUnary
.op
= op
;
1404 i
->Pin
.AvUnary
.dst
= dst
;
1405 i
->Pin
.AvUnary
.src
= src
;
1408 PPCInstr
* PPCInstr_AvBinary ( PPCAvOp op
, HReg dst
,
1409 HReg srcL
, HReg srcR
) {
1410 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1411 i
->tag
= Pin_AvBinary
;
1412 i
->Pin
.AvBinary
.op
= op
;
1413 i
->Pin
.AvBinary
.dst
= dst
;
1414 i
->Pin
.AvBinary
.srcL
= srcL
;
1415 i
->Pin
.AvBinary
.srcR
= srcR
;
1418 PPCInstr
* PPCInstr_AvBinaryInt ( PPCAvOp op
, HReg dst
,
1419 HReg src
, PPCRI
* val
) {
1420 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1421 i
->tag
= Pin_AvBinaryInt
;
1422 i
->Pin
.AvBinaryInt
.op
= op
;
1423 i
->Pin
.AvBinaryInt
.dst
= dst
;
1424 i
->Pin
.AvBinaryInt
.src
= src
;
1425 i
->Pin
.AvBinaryInt
.val
= val
;
1428 PPCInstr
* PPCInstr_AvBinaryInt128 ( PPCAvOpBin128 op
, HReg dst
,
1429 HReg src1
, HReg src2
) {
1430 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1431 i
->tag
= Pin_AvBinaryInt128
;
1432 i
->Pin
.AvBinaryInt128
.op
= op
;
1433 i
->Pin
.AvBinaryInt128
.dst
= dst
;
1434 i
->Pin
.AvBinaryInt128
.src1
= src1
;
1435 i
->Pin
.AvBinaryInt128
.src2
= src2
;
1438 PPCInstr
* PPCInstr_AvTernaryInt128 ( PPCAvOpTri128 op
, HReg dst
,
1439 HReg src1
, HReg src2
, HReg src3
) {
1440 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1441 i
->tag
= Pin_AvTernaryInt128
;
1442 i
->Pin
.AvTernaryInt128
.op
= op
;
1443 i
->Pin
.AvTernaryInt128
.dst
= dst
;
1444 i
->Pin
.AvTernaryInt128
.src1
= src1
;
1445 i
->Pin
.AvTernaryInt128
.src2
= src2
;
1446 i
->Pin
.AvTernaryInt128
.src3
= src3
;
1449 PPCInstr
* PPCInstr_AvBin8x16 ( PPCAvOp op
, HReg dst
,
1450 HReg srcL
, HReg srcR
) {
1451 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1452 i
->tag
= Pin_AvBin8x16
;
1453 i
->Pin
.AvBin8x16
.op
= op
;
1454 i
->Pin
.AvBin8x16
.dst
= dst
;
1455 i
->Pin
.AvBin8x16
.srcL
= srcL
;
1456 i
->Pin
.AvBin8x16
.srcR
= srcR
;
1459 PPCInstr
* PPCInstr_AvBin16x8 ( PPCAvOp op
, HReg dst
,
1460 HReg srcL
, HReg srcR
) {
1461 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1462 i
->tag
= Pin_AvBin16x8
;
1463 i
->Pin
.AvBin16x8
.op
= op
;
1464 i
->Pin
.AvBin16x8
.dst
= dst
;
1465 i
->Pin
.AvBin16x8
.srcL
= srcL
;
1466 i
->Pin
.AvBin16x8
.srcR
= srcR
;
1469 PPCInstr
* PPCInstr_AvBin32x4 ( PPCAvOp op
, HReg dst
,
1470 HReg srcL
, HReg srcR
) {
1471 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1472 i
->tag
= Pin_AvBin32x4
;
1473 i
->Pin
.AvBin32x4
.op
= op
;
1474 i
->Pin
.AvBin32x4
.dst
= dst
;
1475 i
->Pin
.AvBin32x4
.srcL
= srcL
;
1476 i
->Pin
.AvBin32x4
.srcR
= srcR
;
1479 PPCInstr
* PPCInstr_AvBin64x2 ( PPCAvOp op
, HReg dst
,
1480 HReg srcL
, HReg srcR
) {
1481 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1482 i
->tag
= Pin_AvBin64x2
;
1483 i
->Pin
.AvBin64x2
.op
= op
;
1484 i
->Pin
.AvBin64x2
.dst
= dst
;
1485 i
->Pin
.AvBin64x2
.srcL
= srcL
;
1486 i
->Pin
.AvBin64x2
.srcR
= srcR
;
1490 PPCInstr
* PPCInstr_AvBin32Fx4 ( PPCAvFpOp op
, HReg dst
,
1491 HReg srcL
, HReg srcR
) {
1492 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1493 i
->tag
= Pin_AvBin32Fx4
;
1494 i
->Pin
.AvBin32Fx4
.op
= op
;
1495 i
->Pin
.AvBin32Fx4
.dst
= dst
;
1496 i
->Pin
.AvBin32Fx4
.srcL
= srcL
;
1497 i
->Pin
.AvBin32Fx4
.srcR
= srcR
;
1500 PPCInstr
* PPCInstr_AvUn32Fx4 ( PPCAvFpOp op
, HReg dst
, HReg src
) {
1501 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1502 i
->tag
= Pin_AvUn32Fx4
;
1503 i
->Pin
.AvUn32Fx4
.op
= op
;
1504 i
->Pin
.AvUn32Fx4
.dst
= dst
;
1505 i
->Pin
.AvUn32Fx4
.src
= src
;
1508 PPCInstr
* PPCInstr_AvPerm ( HReg dst
, HReg srcL
, HReg srcR
, HReg ctl
) {
1509 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1510 i
->tag
= Pin_AvPerm
;
1511 i
->Pin
.AvPerm
.dst
= dst
;
1512 i
->Pin
.AvPerm
.srcL
= srcL
;
1513 i
->Pin
.AvPerm
.srcR
= srcR
;
1514 i
->Pin
.AvPerm
.ctl
= ctl
;
1518 PPCInstr
* PPCInstr_AvSel ( HReg ctl
, HReg dst
, HReg srcL
, HReg srcR
) {
1519 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1521 i
->Pin
.AvSel
.ctl
= ctl
;
1522 i
->Pin
.AvSel
.dst
= dst
;
1523 i
->Pin
.AvSel
.srcL
= srcL
;
1524 i
->Pin
.AvSel
.srcR
= srcR
;
1527 PPCInstr
* PPCInstr_AvSh ( Bool shLeft
, HReg dst
, PPCAMode
* addr
) {
1528 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1530 i
->Pin
.AvSh
.shLeft
= shLeft
;
1531 i
->Pin
.AvSh
.dst
= dst
;
1532 i
->Pin
.AvSh
.addr
= addr
;
1535 PPCInstr
* PPCInstr_AvShlDbl ( UChar shift
, HReg dst
,
1536 HReg srcL
, HReg srcR
) {
1537 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1538 i
->tag
= Pin_AvShlDbl
;
1539 i
->Pin
.AvShlDbl
.shift
= shift
;
1540 i
->Pin
.AvShlDbl
.dst
= dst
;
1541 i
->Pin
.AvShlDbl
.srcL
= srcL
;
1542 i
->Pin
.AvShlDbl
.srcR
= srcR
;
1545 PPCInstr
* PPCInstr_AvSplat ( UChar sz
, HReg dst
, PPCVI5s
* src
) {
1546 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1547 i
->tag
= Pin_AvSplat
;
1548 i
->Pin
.AvSplat
.sz
= sz
;
1549 i
->Pin
.AvSplat
.dst
= dst
;
1550 i
->Pin
.AvSplat
.src
= src
;
1553 PPCInstr
* PPCInstr_AvCMov ( PPCCondCode cond
, HReg dst
, HReg src
) {
1554 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1555 i
->tag
= Pin_AvCMov
;
1556 i
->Pin
.AvCMov
.cond
= cond
;
1557 i
->Pin
.AvCMov
.dst
= dst
;
1558 i
->Pin
.AvCMov
.src
= src
;
1559 vassert(cond
.test
!= Pct_ALWAYS
);
1562 PPCInstr
* PPCInstr_AvLdVSCR ( HReg src
) {
1563 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1564 i
->tag
= Pin_AvLdVSCR
;
1565 i
->Pin
.AvLdVSCR
.src
= src
;
1568 PPCInstr
* PPCInstr_AvCipherV128Unary ( PPCAvOp op
, HReg dst
, HReg src
) {
1569 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1570 i
->tag
= Pin_AvCipherV128Unary
;
1571 i
->Pin
.AvCipherV128Unary
.op
= op
;
1572 i
->Pin
.AvCipherV128Unary
.dst
= dst
;
1573 i
->Pin
.AvCipherV128Unary
.src
= src
;
1576 PPCInstr
* PPCInstr_AvCipherV128Binary ( PPCAvOp op
, HReg dst
,
1577 HReg srcL
, HReg srcR
) {
1578 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1579 i
->tag
= Pin_AvCipherV128Binary
;
1580 i
->Pin
.AvCipherV128Binary
.op
= op
;
1581 i
->Pin
.AvCipherV128Binary
.dst
= dst
;
1582 i
->Pin
.AvCipherV128Binary
.srcL
= srcL
;
1583 i
->Pin
.AvCipherV128Binary
.srcR
= srcR
;
1586 PPCInstr
* PPCInstr_AvHashV128Binary ( PPCAvOp op
, HReg dst
,
1587 HReg src
, PPCRI
* s_field
) {
1588 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1589 i
->tag
= Pin_AvHashV128Binary
;
1590 i
->Pin
.AvHashV128Binary
.op
= op
;
1591 i
->Pin
.AvHashV128Binary
.dst
= dst
;
1592 i
->Pin
.AvHashV128Binary
.src
= src
;
1593 i
->Pin
.AvHashV128Binary
.s_field
= s_field
;
1596 PPCInstr
* PPCInstr_AvBCDV128Binary ( PPCAvOp op
, HReg dst
,
1597 HReg src1
, HReg src2
) {
1598 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1599 i
->tag
= Pin_AvBCDV128Binary
;
1600 i
->Pin
.AvBCDV128Binary
.op
= op
;
1601 i
->Pin
.AvBCDV128Binary
.dst
= dst
;
1602 i
->Pin
.AvBCDV128Binary
.src1
= src1
;
1603 i
->Pin
.AvBCDV128Binary
.src2
= src2
;
1606 PPCInstr
* PPCInstr_XFormUnary994 ( PPCXFormUnary994 op
, HReg reg0
, HReg reg1
,
1608 /* This is used to issue istructions with opc1=63, opc2=994. The specific
1609 instruction is given in bits[11:15], the VRA field, of the instruction.
1610 Currently only used for dcffixqq and dctfixqq instructions. */
1611 PPCInstr
* i
= LibVEX_Alloc_inline(sizeof(PPCInstr
));
1612 i
->tag
= Pin_XFormUnary994
;
1613 i
->Pin
.XFormUnary994
.op
= op
;
1614 i
->Pin
.XFormUnary994
.reg0
= reg0
;
1615 i
->Pin
.XFormUnary994
.reg1
= reg1
;
1616 i
->Pin
.XFormUnary994
.reg2
= reg2
;
1620 /* Pretty Print instructions */
1621 static void ppLoadImm ( HReg dst
, ULong imm
, Bool mode64
) {
1622 vex_printf("li_word ");
1625 vex_printf(",0x%08x", (UInt
)imm
);
1627 vex_printf(",0x%016llx", imm
);
1631 static void ppMovReg ( HReg dst
, HReg src
) {
1632 if (!sameHReg(dst
, src
)) {
1640 void ppPPCInstr ( const PPCInstr
* i
, Bool mode64
)
1644 ppLoadImm(i
->Pin
.LI
.dst
, i
->Pin
.LI
.imm64
, mode64
);
1647 HReg r_srcL
= i
->Pin
.Alu
.srcL
;
1648 PPCRH
* rh_srcR
= i
->Pin
.Alu
.srcR
;
1649 /* special-case "mr" */
1650 if (i
->Pin
.Alu
.op
== Palu_OR
&& // or Rd,Rs,Rs == mr Rd,Rs
1651 rh_srcR
->tag
== Prh_Reg
&&
1652 sameHReg(rh_srcR
->Prh
.Reg
.reg
, r_srcL
)) {
1654 ppHRegPPC(i
->Pin
.Alu
.dst
);
1659 /* special-case "li" */
1660 if (i
->Pin
.Alu
.op
== Palu_ADD
&& // addi Rd,0,imm == li Rd,imm
1661 rh_srcR
->tag
== Prh_Imm
&&
1662 hregEncoding(r_srcL
) == 0) {
1664 ppHRegPPC(i
->Pin
.Alu
.dst
);
1670 vex_printf("%s ", showPPCAluOp(i
->Pin
.Alu
.op
,
1671 toBool(rh_srcR
->tag
== Prh_Imm
)));
1672 ppHRegPPC(i
->Pin
.Alu
.dst
);
1680 HReg r_srcL
= i
->Pin
.Shft
.srcL
;
1681 PPCRH
* rh_srcR
= i
->Pin
.Shft
.srcR
;
1682 vex_printf("%s ", showPPCShftOp(i
->Pin
.Shft
.op
,
1683 toBool(rh_srcR
->tag
== Prh_Imm
),
1685 ppHRegPPC(i
->Pin
.Shft
.dst
);
1694 i
->Pin
.AddSubC
.isAdd
? "add" : "sub",
1695 i
->Pin
.AddSubC
.setC
? "c" : "e");
1696 ppHRegPPC(i
->Pin
.AddSubC
.dst
);
1698 ppHRegPPC(i
->Pin
.AddSubC
.srcL
);
1700 ppHRegPPC(i
->Pin
.AddSubC
.srcR
);
1703 vex_printf("%s%c%s %%cr%u,",
1704 i
->Pin
.Cmp
.syned
? "cmp" : "cmpl",
1705 i
->Pin
.Cmp
.sz32
? 'w' : 'd',
1706 i
->Pin
.Cmp
.srcR
->tag
== Prh_Imm
? "i" : "",
1708 ppHRegPPC(i
->Pin
.Cmp
.srcL
);
1710 ppPPCRH(i
->Pin
.Cmp
.srcR
);
1713 vex_printf("%s ", showPPCUnaryOp(i
->Pin
.Unary
.op
));
1714 ppHRegPPC(i
->Pin
.Unary
.dst
);
1716 ppHRegPPC(i
->Pin
.Unary
.src
);
1719 vex_printf("mul%c%c%s ",
1720 i
->Pin
.MulL
.hi
? 'h' : 'l',
1721 i
->Pin
.MulL
.sz32
? 'w' : 'd',
1722 i
->Pin
.MulL
.hi
? (i
->Pin
.MulL
.syned
? "s" : "u") : "");
1723 ppHRegPPC(i
->Pin
.MulL
.dst
);
1725 ppHRegPPC(i
->Pin
.MulL
.srcL
);
1727 ppHRegPPC(i
->Pin
.MulL
.srcR
);
1730 vex_printf("div%c%s%s ",
1731 i
->Pin
.Div
.sz32
? 'w' : 'd',
1732 i
->Pin
.Div
.extended
? "e" : "",
1733 i
->Pin
.Div
.syned
? "" : "u");
1734 ppHRegPPC(i
->Pin
.Div
.dst
);
1736 ppHRegPPC(i
->Pin
.Div
.srcL
);
1738 ppHRegPPC(i
->Pin
.Div
.srcR
);
1742 vex_printf("call: ");
1743 if (i
->Pin
.Call
.cond
.test
!= Pct_ALWAYS
) {
1744 vex_printf("if (%s) ", showPPCCondCode(i
->Pin
.Call
.cond
));
1747 ppLoadImm(hregPPC_GPR10(mode64
), i
->Pin
.Call
.target
, mode64
);
1748 vex_printf(" ; mtctr r10 ; bctrl [");
1749 for (n
= 0; n
< 32; n
++) {
1750 if (i
->Pin
.Call
.argiregs
& (1<<n
)) {
1751 vex_printf("r%d", n
);
1752 if ((i
->Pin
.Call
.argiregs
>> n
) > 1)
1757 ppRetLoc(i
->Pin
.Call
.rloc
);
1762 vex_printf("(xDirect) ");
1763 vex_printf("if (%s) { ",
1764 showPPCCondCode(i
->Pin
.XDirect
.cond
));
1766 vex_printf("imm64 r30,0x%llx; ", i
->Pin
.XDirect
.dstGA
);
1767 vex_printf("std r30,");
1769 vex_printf("imm32 r30,0x%llx; ", i
->Pin
.XDirect
.dstGA
);
1770 vex_printf("stw r30,");
1772 ppPPCAMode(i
->Pin
.XDirect
.amCIA
);
1775 vex_printf("imm64-fixed5 r30,$disp_cp_chain_me_to_%sEP; ",
1776 i
->Pin
.XDirect
.toFastEP
? "fast" : "slow");
1778 vex_printf("imm32-fixed2 r30,$disp_cp_chain_me_to_%sEP; ",
1779 i
->Pin
.XDirect
.toFastEP
? "fast" : "slow");
1781 vex_printf("mtctr r30; bctrl }");
1784 vex_printf("(xIndir) ");
1785 vex_printf("if (%s) { ",
1786 showPPCCondCode(i
->Pin
.XIndir
.cond
));
1787 vex_printf("%s ", mode64
? "std" : "stw");
1788 ppHRegPPC(i
->Pin
.XIndir
.dstGA
);
1790 ppPPCAMode(i
->Pin
.XIndir
.amCIA
);
1792 vex_printf("imm%s r30,$disp_cp_xindir; ", mode64
? "64" : "32");
1793 vex_printf("mtctr r30; bctr }");
1796 vex_printf("(xAssisted) ");
1797 vex_printf("if (%s) { ",
1798 showPPCCondCode(i
->Pin
.XAssisted
.cond
));
1799 vex_printf("%s ", mode64
? "std" : "stw");
1800 ppHRegPPC(i
->Pin
.XAssisted
.dstGA
);
1802 ppPPCAMode(i
->Pin
.XAssisted
.amCIA
);
1804 vex_printf("li r31,$IRJumpKind_to_TRCVAL(%d); ",
1805 (Int
)i
->Pin
.XAssisted
.jk
);
1806 vex_printf("imm%s r30,$disp_cp_xindir; ", mode64
? "64" : "32");
1807 vex_printf("mtctr r30; bctr }");
1810 vex_printf("cmov (%s) ", showPPCCondCode(i
->Pin
.CMov
.cond
));
1811 ppHRegPPC(i
->Pin
.CMov
.dst
);
1813 ppPPCRI(i
->Pin
.CMov
.src
);
1815 if (i
->Pin
.CMov
.cond
.test
!= Pct_ALWAYS
) {
1816 vex_printf("if (%s) ", showPPCCondCode(i
->Pin
.CMov
.cond
));
1819 if (i
->Pin
.CMov
.src
->tag
== Pri_Imm
) {
1820 ppLoadImm(i
->Pin
.CMov
.dst
, i
->Pin
.CMov
.src
->Pri
.Imm
, mode64
);
1822 ppMovReg(i
->Pin
.CMov
.dst
, i
->Pin
.CMov
.src
->Pri
.Reg
);
1827 Bool idxd
= toBool(i
->Pin
.Load
.src
->tag
== Pam_RR
);
1828 UChar sz
= i
->Pin
.Load
.sz
;
1829 HChar c_sz
= sz
==1 ? 'b' : sz
==2 ? 'h' : sz
==4 ? 'w' : 'd';
1830 vex_printf("l%c%s%s ", c_sz
, sz
==8 ? "" : "z", idxd
? "x" : "" );
1831 ppHRegPPC(i
->Pin
.Load
.dst
);
1833 ppPPCAMode(i
->Pin
.Load
.src
);
1837 UChar sz
= i
->Pin
.LoadL
.sz
;
1838 HChar c_sz
= sz
==1 ? 'b' : sz
==2 ? 'h' : sz
==4 ? 'w' : 'd';
1839 vex_printf("l%carx ", c_sz
);
1840 ppHRegPPC(i
->Pin
.LoadL
.dst
);
1841 vex_printf(",%%r0,");
1842 ppHRegPPC(i
->Pin
.LoadL
.src
);
1846 UChar sz
= i
->Pin
.Store
.sz
;
1847 Bool idxd
= toBool(i
->Pin
.Store
.dst
->tag
== Pam_RR
);
1848 HChar c_sz
= sz
==1 ? 'b' : sz
==2 ? 'h' : sz
==4 ? 'w' : /*8*/ 'd';
1849 vex_printf("st%c%s ", c_sz
, idxd
? "x" : "" );
1850 ppHRegPPC(i
->Pin
.Store
.src
);
1852 ppPPCAMode(i
->Pin
.Store
.dst
);
1856 UChar sz
= i
->Pin
.StoreC
.sz
;
1857 HChar c_sz
= sz
==1 ? 'b' : sz
==2 ? 'h' : sz
==4 ? 'w' : 'd';
1858 vex_printf("st%ccx. ", c_sz
);
1859 ppHRegPPC(i
->Pin
.StoreC
.src
);
1860 vex_printf(",%%r0,");
1861 ppHRegPPC(i
->Pin
.StoreC
.dst
);
1865 PPCCondCode cc
= i
->Pin
.Set
.cond
;
1866 vex_printf("set (%s),", showPPCCondCode(cc
));
1867 ppHRegPPC(i
->Pin
.Set
.dst
);
1868 if (cc
.test
== Pct_ALWAYS
) {
1869 vex_printf(": { li ");
1870 ppHRegPPC(i
->Pin
.Set
.dst
);
1873 vex_printf(": { mfcr r0 ; rlwinm ");
1874 ppHRegPPC(i
->Pin
.Set
.dst
);
1875 vex_printf(",r0,%u,31,31", cc
.flag
+1);
1876 if (cc
.test
== Pct_FALSE
) {
1877 vex_printf("; xori ");
1878 ppHRegPPC(i
->Pin
.Set
.dst
);
1880 ppHRegPPC(i
->Pin
.Set
.dst
);
1888 vex_printf("mfcr ");
1889 ppHRegPPC(i
->Pin
.MfCR
.dst
);
1892 vex_printf("mfence (=sync)");
1896 vex_printf("%s ", showPPCFpOp(i
->Pin
.FpUnary
.op
));
1897 ppHRegPPC(i
->Pin
.FpUnary
.dst
);
1899 ppHRegPPC(i
->Pin
.FpUnary
.src
);
1902 vex_printf("%s ", showPPCFpOp(i
->Pin
.FpBinary
.op
));
1903 ppHRegPPC(i
->Pin
.FpBinary
.dst
);
1905 ppHRegPPC(i
->Pin
.FpBinary
.srcL
);
1907 ppHRegPPC(i
->Pin
.FpBinary
.srcR
);
1909 case Pin_Fp128Unary
:
1910 vex_printf("%s ", showPPCFpOp(i
->Pin
.Fp128Unary
.op
));
1911 ppHRegPPC(i
->Pin
.Fp128Unary
.dst
);
1913 ppHRegPPC(i
->Pin
.Fp128Unary
.src
);
1915 case Pin_Fp128Binary
:
1916 vex_printf("%s ", showPPCFpOp(i
->Pin
.Fp128Binary
.op
));
1917 ppHRegPPC(i
->Pin
.Fp128Binary
.dst
);
1919 ppHRegPPC(i
->Pin
.Fp128Binary
.srcL
);
1921 ppHRegPPC(i
->Pin
.Fp128Binary
.srcR
);
1923 case Pin_Fp128Ternary
:
1924 vex_printf("%s ", showPPCFpOp(i
->Pin
.Fp128Ternary
.op
));
1925 ppHRegPPC(i
->Pin
.Fp128Ternary
.dst
);
1927 ppHRegPPC(i
->Pin
.Fp128Ternary
.srcL
);
1929 ppHRegPPC(i
->Pin
.Fp128Ternary
.srcR
);
1932 vex_printf("%s ", showPPCFpOp(i
->Pin
.FpMulAcc
.op
));
1933 ppHRegPPC(i
->Pin
.FpMulAcc
.dst
);
1935 ppHRegPPC(i
->Pin
.FpMulAcc
.srcML
);
1937 ppHRegPPC(i
->Pin
.FpMulAcc
.srcMR
);
1939 ppHRegPPC(i
->Pin
.FpMulAcc
.srcAcc
);
1942 UChar sz
= i
->Pin
.FpLdSt
.sz
;
1943 Bool idxd
= toBool(i
->Pin
.FpLdSt
.addr
->tag
== Pam_RR
);
1944 if (i
->Pin
.FpLdSt
.isLoad
) {
1945 vex_printf("lf%c%s ",
1946 (sz
==4 ? 's' : 'd'),
1948 ppHRegPPC(i
->Pin
.FpLdSt
.reg
);
1950 ppPPCAMode(i
->Pin
.FpLdSt
.addr
);
1952 vex_printf("stf%c%s ",
1953 (sz
==4 ? 's' : 'd'),
1955 ppHRegPPC(i
->Pin
.FpLdSt
.reg
);
1957 ppPPCAMode(i
->Pin
.FpLdSt
.addr
);
1962 vex_printf("stfiwz ");
1963 ppHRegPPC(i
->Pin
.FpSTFIW
.data
);
1965 ppHRegPPC(i
->Pin
.FpSTFIW
.addr
);
1969 vex_printf("frsp ");
1970 ppHRegPPC(i
->Pin
.FpRSP
.dst
);
1972 ppHRegPPC(i
->Pin
.FpRSP
.src
);
1975 const HChar
* str
= "fc?????";
1976 /* Note that "fcfids" is missing from below. That instruction would
1977 * satisfy the predicate:
1978 * (i->Pin.FpCftI.fromI == True && i->Pin.FpCftI.int32 == False)
1979 * which would go into a final "else" clause to make this if-else
1980 * block balanced. But we're able to implement fcfids by leveraging
1981 * the fcfid implementation, so it wasn't necessary to include it here.
1983 if (i
->Pin
.FpCftI
.fromI
== False
&& i
->Pin
.FpCftI
.int32
== False
)
1984 if (i
->Pin
.FpCftI
.syned
== True
)
1988 else if (i
->Pin
.FpCftI
.fromI
== False
&& i
->Pin
.FpCftI
.int32
== True
)
1989 if (i
->Pin
.FpCftI
.syned
== True
)
1993 else if (i
->Pin
.FpCftI
.fromI
== True
&& i
->Pin
.FpCftI
.int32
== False
) {
1994 if (i
->Pin
.FpCftI
.syned
== True
) {
1997 if (i
->Pin
.FpCftI
.flt64
== True
)
2003 vex_printf("%s ", str
);
2004 ppHRegPPC(i
->Pin
.FpCftI
.dst
);
2006 ppHRegPPC(i
->Pin
.FpCftI
.src
);
2010 vex_printf("fpcmov (%s) ", showPPCCondCode(i
->Pin
.FpCMov
.cond
));
2011 ppHRegPPC(i
->Pin
.FpCMov
.dst
);
2013 ppHRegPPC(i
->Pin
.FpCMov
.src
);
2015 vex_printf("if (fr_dst != fr_src) { ");
2016 if (i
->Pin
.FpCMov
.cond
.test
!= Pct_ALWAYS
) {
2017 vex_printf("if (%s) { ", showPPCCondCode(i
->Pin
.FpCMov
.cond
));
2020 ppHRegPPC(i
->Pin
.FpCMov
.dst
);
2022 ppHRegPPC(i
->Pin
.FpCMov
.src
);
2023 if (i
->Pin
.FpCMov
.cond
.test
!= Pct_ALWAYS
)
2028 vex_printf("mtfsf 0xFF,");
2029 ppHRegPPC(i
->Pin
.FpLdFPSCR
.src
);
2030 vex_printf(",0, %s", i
->Pin
.FpLdFPSCR
.dfp_rm
? "1" : "0");
2033 vex_printf("fcmpo %%cr1,");
2034 ppHRegPPC(i
->Pin
.FpCmp
.srcL
);
2036 ppHRegPPC(i
->Pin
.FpCmp
.srcR
);
2037 vex_printf("; mfcr ");
2038 ppHRegPPC(i
->Pin
.FpCmp
.dst
);
2039 vex_printf("; rlwinm ");
2040 ppHRegPPC(i
->Pin
.FpCmp
.dst
);
2042 ppHRegPPC(i
->Pin
.FpCmp
.dst
);
2043 vex_printf(",8,28,31");
2047 vex_printf("%s ", i
->Pin
.RdWrLR
.wrLR
? "mtlr" : "mflr");
2048 ppHRegPPC(i
->Pin
.RdWrLR
.gpr
);
2052 UChar sz
= i
->Pin
.AvLdSt
.sz
;
2053 const HChar
* str_size
;
2054 if (i
->Pin
.AvLdSt
.addr
->tag
== Pam_IR
) {
2055 ppLoadImm(hregPPC_GPR30(mode64
),
2056 i
->Pin
.AvLdSt
.addr
->Pam
.IR
.index
, mode64
);
2059 str_size
= sz
==1 ? "eb" : sz
==2 ? "eh" : sz
==4 ? "ew" : "";
2060 if (i
->Pin
.AvLdSt
.isLoad
)
2061 vex_printf("lv%sx ", str_size
);
2063 vex_printf("stv%sx ", str_size
);
2064 ppHRegPPC(i
->Pin
.AvLdSt
.reg
);
2066 if (i
->Pin
.AvLdSt
.addr
->tag
== Pam_IR
)
2067 vex_printf("%%r30");
2069 ppHRegPPC(i
->Pin
.AvLdSt
.addr
->Pam
.RR
.index
);
2071 ppHRegPPC(i
->Pin
.AvLdSt
.addr
->Pam
.RR
.base
);
2075 vex_printf("%s ", showPPCAvOp(i
->Pin
.AvUnary
.op
));
2076 ppHRegPPC(i
->Pin
.AvUnary
.dst
);
2078 ppHRegPPC(i
->Pin
.AvUnary
.src
);
2081 vex_printf("%s ", showPPCAvOp(i
->Pin
.AvBinary
.op
));
2082 ppHRegPPC(i
->Pin
.AvBinary
.dst
);
2084 ppHRegPPC(i
->Pin
.AvBinary
.srcL
);
2086 ppHRegPPC(i
->Pin
.AvBinary
.srcR
);
2088 case Pin_AvBinaryInt
:
2089 vex_printf("%s ", showPPCAvOp(i
->Pin
.AvBinaryInt
.op
));
2090 ppHRegPPC(i
->Pin
.AvBinaryInt
.dst
);
2092 ppHRegPPC(i
->Pin
.AvBinaryInt
.src
);
2094 ppPPCRI(i
->Pin
.AvBinaryInt
.val
);
2096 case Pin_AvBinaryInt128
:
2097 vex_printf("%s ", showPPCAvOpBin128(i
->Pin
.AvBinaryInt128
.op
));
2098 ppHRegPPC(i
->Pin
.AvBinaryInt128
.dst
);
2100 ppHRegPPC(i
->Pin
.AvBinaryInt128
.src1
);
2102 ppHRegPPC(i
->Pin
.AvBinaryInt128
.src2
);
2104 case Pin_AvTernaryInt128
:
2105 vex_printf("%s ", showPPCAvOpTri128(i
->Pin
.AvTernaryInt128
.op
));
2106 ppHRegPPC(i
->Pin
.AvTernaryInt128
.dst
);
2108 ppHRegPPC(i
->Pin
.AvTernaryInt128
.src1
);
2110 ppHRegPPC(i
->Pin
.AvTernaryInt128
.src2
);
2112 ppHRegPPC(i
->Pin
.AvTernaryInt128
.src3
);
2115 vex_printf("%s(b) ", showPPCAvOp(i
->Pin
.AvBin8x16
.op
));
2116 ppHRegPPC(i
->Pin
.AvBin8x16
.dst
);
2118 ppHRegPPC(i
->Pin
.AvBin8x16
.srcL
);
2120 ppHRegPPC(i
->Pin
.AvBin8x16
.srcR
);
2123 vex_printf("%s(h) ", showPPCAvOp(i
->Pin
.AvBin16x8
.op
));
2124 ppHRegPPC(i
->Pin
.AvBin16x8
.dst
);
2126 ppHRegPPC(i
->Pin
.AvBin16x8
.srcL
);
2128 ppHRegPPC(i
->Pin
.AvBin16x8
.srcR
);
2131 vex_printf("%s(w) ", showPPCAvOp(i
->Pin
.AvBin32x4
.op
));
2132 ppHRegPPC(i
->Pin
.AvBin32x4
.dst
);
2134 ppHRegPPC(i
->Pin
.AvBin32x4
.srcL
);
2136 ppHRegPPC(i
->Pin
.AvBin32x4
.srcR
);
2139 vex_printf("%s(w) ", showPPCAvOp(i
->Pin
.AvBin64x2
.op
));
2140 ppHRegPPC(i
->Pin
.AvBin64x2
.dst
);
2142 ppHRegPPC(i
->Pin
.AvBin64x2
.srcL
);
2144 ppHRegPPC(i
->Pin
.AvBin64x2
.srcR
);
2146 case Pin_AvBin32Fx4
:
2147 vex_printf("%s ", showPPCAvFpOp(i
->Pin
.AvBin32Fx4
.op
));
2148 ppHRegPPC(i
->Pin
.AvBin32Fx4
.dst
);
2150 ppHRegPPC(i
->Pin
.AvBin32Fx4
.srcL
);
2152 ppHRegPPC(i
->Pin
.AvBin32Fx4
.srcR
);
2155 vex_printf("%s ", showPPCAvFpOp(i
->Pin
.AvUn32Fx4
.op
));
2156 ppHRegPPC(i
->Pin
.AvUn32Fx4
.dst
);
2158 ppHRegPPC(i
->Pin
.AvUn32Fx4
.src
);
2161 vex_printf("vperm ");
2162 ppHRegPPC(i
->Pin
.AvPerm
.dst
);
2164 ppHRegPPC(i
->Pin
.AvPerm
.srcL
);
2166 ppHRegPPC(i
->Pin
.AvPerm
.srcR
);
2168 ppHRegPPC(i
->Pin
.AvPerm
.ctl
);
2172 vex_printf("vsel ");
2173 ppHRegPPC(i
->Pin
.AvSel
.dst
);
2175 ppHRegPPC(i
->Pin
.AvSel
.srcL
);
2177 ppHRegPPC(i
->Pin
.AvSel
.srcR
);
2179 ppHRegPPC(i
->Pin
.AvSel
.ctl
);
2183 /* This only generates the following instructions with RA
2184 * register number set to 0.
2186 if (i
->Pin
.AvSh
.addr
->tag
== Pam_IR
) {
2187 ppLoadImm(hregPPC_GPR30(mode64
),
2188 i
->Pin
.AvSh
.addr
->Pam
.IR
.index
, mode64
);
2192 if (i
->Pin
.AvSh
.shLeft
)
2193 vex_printf("lvsl ");
2195 vex_printf("lvsr ");
2197 ppHRegPPC(i
->Pin
.AvSh
.dst
);
2198 if (i
->Pin
.AvSh
.addr
->tag
== Pam_IR
)
2199 vex_printf("%%r30");
2201 ppHRegPPC(i
->Pin
.AvSh
.addr
->Pam
.RR
.index
);
2203 ppHRegPPC(i
->Pin
.AvSh
.addr
->Pam
.RR
.base
);
2207 vex_printf("vsldoi ");
2208 ppHRegPPC(i
->Pin
.AvShlDbl
.dst
);
2210 ppHRegPPC(i
->Pin
.AvShlDbl
.srcL
);
2212 ppHRegPPC(i
->Pin
.AvShlDbl
.srcR
);
2213 vex_printf(",%d", i
->Pin
.AvShlDbl
.shift
);
2217 UChar sz
= i
->Pin
.AvSplat
.sz
;
2218 HChar ch_sz
= toUChar( (sz
== 8) ? 'b' : (sz
== 16) ? 'h' : 'w' );
2219 vex_printf("vsplt%s%c ",
2220 i
->Pin
.AvSplat
.src
->tag
== Pvi_Imm
? "is" : "", ch_sz
);
2221 ppHRegPPC(i
->Pin
.AvSplat
.dst
);
2223 ppPPCVI5s(i
->Pin
.AvSplat
.src
);
2224 if (i
->Pin
.AvSplat
.src
->tag
== Pvi_Reg
)
2225 vex_printf(", %d", (128/sz
)-1); /* louis lane */
2230 vex_printf("avcmov (%s) ", showPPCCondCode(i
->Pin
.AvCMov
.cond
));
2231 ppHRegPPC(i
->Pin
.AvCMov
.dst
);
2233 ppHRegPPC(i
->Pin
.AvCMov
.src
);
2235 vex_printf("if (v_dst != v_src) { ");
2236 if (i
->Pin
.AvCMov
.cond
.test
!= Pct_ALWAYS
) {
2237 vex_printf("if (%s) { ", showPPCCondCode(i
->Pin
.AvCMov
.cond
));
2240 ppHRegPPC(i
->Pin
.AvCMov
.dst
);
2242 ppHRegPPC(i
->Pin
.AvCMov
.src
);
2243 if (i
->Pin
.FpCMov
.cond
.test
!= Pct_ALWAYS
)
2249 vex_printf("mtvscr ");
2250 ppHRegPPC(i
->Pin
.AvLdVSCR
.src
);
2253 case Pin_AvCipherV128Unary
:
2254 vex_printf("%s(w) ", showPPCAvOp(i
->Pin
.AvCipherV128Unary
.op
));
2255 ppHRegPPC(i
->Pin
.AvCipherV128Unary
.dst
);
2257 ppHRegPPC(i
->Pin
.AvCipherV128Unary
.src
);
2260 case Pin_AvCipherV128Binary
:
2261 vex_printf("%s(w) ", showPPCAvOp(i
->Pin
.AvCipherV128Binary
.op
));
2262 ppHRegPPC(i
->Pin
.AvCipherV128Binary
.dst
);
2264 ppHRegPPC(i
->Pin
.AvCipherV128Binary
.srcL
);
2266 ppHRegPPC(i
->Pin
.AvCipherV128Binary
.srcR
);
2269 case Pin_AvHashV128Binary
:
2270 vex_printf("%s(w) ", showPPCAvOp(i
->Pin
.AvHashV128Binary
.op
));
2271 ppHRegPPC(i
->Pin
.AvHashV128Binary
.dst
);
2273 ppHRegPPC(i
->Pin
.AvHashV128Binary
.src
);
2275 ppPPCRI(i
->Pin
.AvHashV128Binary
.s_field
);
2278 case Pin_AvBCDV128Binary
:
2279 vex_printf("%s(w) ", showPPCAvOp(i
->Pin
.AvBCDV128Binary
.op
));
2280 ppHRegPPC(i
->Pin
.AvBCDV128Binary
.dst
);
2282 ppHRegPPC(i
->Pin
.AvBCDV128Binary
.src1
);
2284 ppHRegPPC(i
->Pin
.AvBCDV128Binary
.src2
);
2287 case Pin_Dfp64Unary
:
2288 vex_printf("%s ", showPPCFpOp(i
->Pin
.Dfp64Unary
.op
));
2289 ppHRegPPC(i
->Pin
.Dfp64Unary
.dst
);
2291 ppHRegPPC(i
->Pin
.Dfp64Unary
.src
);
2294 case Pin_Dfp64Binary
:
2295 vex_printf("%s ", showPPCFpOp(i
->Pin
.Dfp64Binary
.op
));
2296 ppHRegPPC(i
->Pin
.Dfp64Binary
.dst
);
2298 ppHRegPPC(i
->Pin
.Dfp64Binary
.srcL
);
2300 ppHRegPPC(i
->Pin
.Dfp64Binary
.srcR
);
2304 vex_printf("%s ", showPPCFpOp(i
->Pin
.DfpShift
.op
));
2305 ppHRegPPC(i
->Pin
.DfpShift
.dst
);
2307 ppHRegPPC(i
->Pin
.DfpShift
.src
);
2309 ppPPCRI(i
->Pin
.DfpShift
.shift
);
2312 case Pin_Dfp128Unary
:
2313 vex_printf("%s ", showPPCFpOp(i
->Pin
.Dfp128Unary
.op
));
2314 ppHRegPPC(i
->Pin
.Dfp128Unary
.dst_hi
);
2316 ppHRegPPC(i
->Pin
.Dfp128Unary
.src_hi
);
2319 case Pin_Dfp128Binary
:
2320 vex_printf("%s ", showPPCFpOp(i
->Pin
.Dfp128Binary
.op
));
2321 ppHRegPPC(i
->Pin
.Dfp128Binary
.dst_hi
);
2323 ppHRegPPC(i
->Pin
.Dfp128Binary
.srcR_hi
);
2326 case Pin_DfpShift128
:
2327 vex_printf("%s ", showPPCFpOp(i
->Pin
.DfpShift128
.op
));
2328 ppHRegPPC(i
->Pin
.DfpShift128
.dst_hi
);
2330 ppHRegPPC(i
->Pin
.DfpShift128
.src_hi
);
2332 ppPPCRI(i
->Pin
.DfpShift128
.shift
);
2336 vex_printf("drintx ");
2337 ppHRegPPC(i
->Pin
.DfpRound
.dst
);
2339 ppHRegPPC(i
->Pin
.DfpRound
.src
);
2341 ppPPCRI(i
->Pin
.DfpRound
.r_rmc
); /* R in bit 3 and RMC in bits 2:0 */
2344 case Pin_DfpRound128
:
2345 vex_printf("drintxq ");
2346 ppHRegPPC(i
->Pin
.DfpRound128
.dst_hi
);
2348 ppHRegPPC(i
->Pin
.DfpRound128
.src_hi
);
2350 ppPPCRI(i
->Pin
.DfpRound128
.r_rmc
); /* R in bit 3 and RMC in bits 2:0 */
2353 case Pin_DfpQuantize
:
2354 vex_printf("%s ", showPPCFpOp(i
->Pin
.DfpQuantize
.op
));
2355 ppHRegPPC(i
->Pin
.DfpQuantize
.dst
);
2357 ppHRegPPC(i
->Pin
.DfpQuantize
.srcL
);
2359 ppHRegPPC(i
->Pin
.DfpQuantize
.srcR
);
2361 ppPPCRI(i
->Pin
.DfpQuantize
.rmc
);
2364 case Pin_DfpQuantize128
:
2365 /* Dst is used to pass in left source and return result */
2366 vex_printf("dquaq ");
2367 ppHRegPPC(i
->Pin
.DfpQuantize128
.dst_hi
);
2369 ppHRegPPC(i
->Pin
.DfpQuantize128
.dst_hi
);
2371 ppHRegPPC(i
->Pin
.DfpQuantize128
.src_hi
);
2373 ppPPCRI(i
->Pin
.DfpQuantize128
.rmc
);
2376 case Pin_DfpD128toD64
:
2377 vex_printf("%s ", showPPCFpOp(i
->Pin
.DfpD128toD64
.op
));
2378 ppHRegPPC(i
->Pin
.DfpD128toD64
.dst
);
2380 ppHRegPPC(i
->Pin
.DfpD128toD64
.src_hi
);
2384 case Pin_DfpI64StoD128
:
2385 vex_printf("%s ", showPPCFpOp(i
->Pin
.DfpI64StoD128
.op
));
2386 ppHRegPPC(i
->Pin
.DfpI64StoD128
.dst_hi
);
2388 ppHRegPPC(i
->Pin
.DfpI64StoD128
.src
);
2391 case Pin_ExtractExpD128
:
2392 vex_printf("dxexq ");
2393 ppHRegPPC(i
->Pin
.ExtractExpD128
.dst
);
2395 ppHRegPPC(i
->Pin
.ExtractExpD128
.src_hi
);
2397 case Pin_InsertExpD128
:
2398 vex_printf("diexq ");
2399 ppHRegPPC(i
->Pin
.InsertExpD128
.dst_hi
);
2401 ppHRegPPC(i
->Pin
.InsertExpD128
.srcL
);
2403 ppHRegPPC(i
->Pin
.InsertExpD128
.srcR_hi
);
2406 vex_printf("dcmpo %%cr1,");
2407 ppHRegPPC(i
->Pin
.Dfp64Cmp
.srcL
);
2409 ppHRegPPC(i
->Pin
.Dfp64Cmp
.srcR
);
2410 vex_printf("; mfcr ");
2411 ppHRegPPC(i
->Pin
.Dfp64Cmp
.dst
);
2412 vex_printf("; rlwinm ");
2413 ppHRegPPC(i
->Pin
.Dfp64Cmp
.dst
);
2415 ppHRegPPC(i
->Pin
.Dfp64Cmp
.dst
);
2416 vex_printf(",8,28,31");
2419 vex_printf("dcmpoq %%cr1,");
2420 ppHRegPPC(i
->Pin
.Dfp128Cmp
.srcL_hi
);
2422 ppHRegPPC(i
->Pin
.Dfp128Cmp
.srcR_hi
);
2423 vex_printf("; mfcr ");
2424 ppHRegPPC(i
->Pin
.Dfp128Cmp
.dst
);
2425 vex_printf("; rlwinm ");
2426 ppHRegPPC(i
->Pin
.Dfp128Cmp
.dst
);
2428 ppHRegPPC(i
->Pin
.Dfp128Cmp
.dst
);
2429 vex_printf(",8,28,31");
2432 case Pin_XFormUnary994
:
2433 if (i
->Pin
.XFormUnary994
.op
== Px_DFPTOIQS
) {
2434 vex_printf("%s(w) ", showXFormUnary994(i
->Pin
.XFormUnary994
.op
));
2435 ppHRegPPC(i
->Pin
.XFormUnary994
.reg0
);
2437 ppHRegPPC(i
->Pin
.XFormUnary994
.reg1
);
2439 vex_printf("%s(w) ", showXFormUnary994(i
->Pin
.XFormUnary994
.op
));
2440 ppHRegPPC(i
->Pin
.XFormUnary994
.reg0
);
2442 ppHRegPPC(i
->Pin
.XFormUnary994
.reg2
);
2447 /* Note that the counter dec is 32 bit even in 64-bit mode. */
2448 vex_printf("(evCheck) ");
2449 vex_printf("lwz r30,");
2450 ppPPCAMode(i
->Pin
.EvCheck
.amCounter
);
2451 vex_printf("; addic. r30,r30,-1; ");
2452 vex_printf("stw r30,");
2453 ppPPCAMode(i
->Pin
.EvCheck
.amCounter
);
2454 vex_printf("; bge nofail; lwz r30,");
2455 ppPPCAMode(i
->Pin
.EvCheck
.amFailAddr
);
2456 vex_printf("; mtctr r30; bctr; nofail:");
2460 vex_printf("(profInc) imm64-fixed5 r30,$NotKnownYet; ");
2461 vex_printf("ld r29,(r30); addi r29,r29,1; std r29,(r30)");
2463 vex_printf("(profInc) imm32-fixed2 r30,$NotKnownYet; ");
2464 vex_printf("lwz r29,4(r30); addic. r29,r29,1; stw r29,4(r30)");
2465 vex_printf("lwz r29,0(r30); addze r29,r29; stw r29,0(r30)");
2469 vex_printf("\nppPPCInstr: No such tag(%d)\n", (Int
)i
->tag
);
2470 vpanic("ppPPCInstr");
2474 /* --------- Helpers for register allocation. --------- */
2476 void getRegUsage_PPCInstr ( HRegUsage
* u
, const PPCInstr
* i
, Bool mode64
)
2481 addHRegUse(u
, HRmWrite
, i
->Pin
.LI
.dst
);
2484 addHRegUse(u
, HRmRead
, i
->Pin
.Alu
.srcL
);
2485 addRegUsage_PPCRH(u
, i
->Pin
.Alu
.srcR
);
2486 addHRegUse(u
, HRmWrite
, i
->Pin
.Alu
.dst
);
2488 // or Rd,Rs,Rs == mr Rd,Rs
2489 if ((i
->Pin
.Alu
.op
== Palu_OR
)
2490 && (i
->Pin
.Alu
.srcR
->tag
== Prh_Reg
)
2491 && sameHReg(i
->Pin
.Alu
.srcR
->Prh
.Reg
.reg
, i
->Pin
.Alu
.srcL
)) {
2492 u
->isRegRegMove
= True
;
2493 u
->regMoveSrc
= i
->Pin
.Alu
.srcL
;
2494 u
->regMoveDst
= i
->Pin
.Alu
.dst
;
2498 addHRegUse(u
, HRmRead
, i
->Pin
.Shft
.srcL
);
2499 addRegUsage_PPCRH(u
, i
->Pin
.Shft
.srcR
);
2500 addHRegUse(u
, HRmWrite
, i
->Pin
.Shft
.dst
);
2503 addHRegUse(u
, HRmWrite
, i
->Pin
.AddSubC
.dst
);
2504 addHRegUse(u
, HRmRead
, i
->Pin
.AddSubC
.srcL
);
2505 addHRegUse(u
, HRmRead
, i
->Pin
.AddSubC
.srcR
);
2508 addHRegUse(u
, HRmRead
, i
->Pin
.Cmp
.srcL
);
2509 addRegUsage_PPCRH(u
, i
->Pin
.Cmp
.srcR
);
2512 addHRegUse(u
, HRmWrite
, i
->Pin
.Unary
.dst
);
2513 addHRegUse(u
, HRmRead
, i
->Pin
.Unary
.src
);
2516 addHRegUse(u
, HRmWrite
, i
->Pin
.MulL
.dst
);
2517 addHRegUse(u
, HRmRead
, i
->Pin
.MulL
.srcL
);
2518 addHRegUse(u
, HRmRead
, i
->Pin
.MulL
.srcR
);
2521 addHRegUse(u
, HRmWrite
, i
->Pin
.Div
.dst
);
2522 addHRegUse(u
, HRmRead
, i
->Pin
.Div
.srcL
);
2523 addHRegUse(u
, HRmRead
, i
->Pin
.Div
.srcR
);
2527 /* This is a bit subtle. */
2528 /* First off, claim it trashes all the caller-saved regs
2529 which fall within the register allocator's jurisdiction.
2530 These I believe to be:
2534 /* XXXXXXXXXXXXXXXXX BUG! This doesn't say anything about the FP
2535 or Altivec registers. We get away with this ONLY because
2536 getAllocatableRegs_PPC gives the allocator callee-saved fp
2537 and Altivec regs, and no caller-save ones. */
2538 addHRegUse(u
, HRmWrite
, hregPPC_GPR3(mode64
));
2539 addHRegUse(u
, HRmWrite
, hregPPC_GPR4(mode64
));
2540 addHRegUse(u
, HRmWrite
, hregPPC_GPR5(mode64
));
2541 addHRegUse(u
, HRmWrite
, hregPPC_GPR6(mode64
));
2542 addHRegUse(u
, HRmWrite
, hregPPC_GPR7(mode64
));
2543 addHRegUse(u
, HRmWrite
, hregPPC_GPR8(mode64
));
2544 addHRegUse(u
, HRmWrite
, hregPPC_GPR9(mode64
));
2545 addHRegUse(u
, HRmWrite
, hregPPC_GPR10(mode64
));
2547 addHRegUse(u
, HRmWrite
, hregPPC_GPR11(mode64
));
2548 addHRegUse(u
, HRmWrite
, hregPPC_GPR12(mode64
));
2551 /* Now we have to state any parameter-carrying registers
2552 which might be read. This depends on the argiregs field. */
2553 argir
= i
->Pin
.Call
.argiregs
;
2554 if (argir
&(1<<10)) addHRegUse(u
, HRmRead
, hregPPC_GPR10(mode64
));
2555 if (argir
& (1<<9)) addHRegUse(u
, HRmRead
, hregPPC_GPR9(mode64
));
2556 if (argir
& (1<<8)) addHRegUse(u
, HRmRead
, hregPPC_GPR8(mode64
));
2557 if (argir
& (1<<7)) addHRegUse(u
, HRmRead
, hregPPC_GPR7(mode64
));
2558 if (argir
& (1<<6)) addHRegUse(u
, HRmRead
, hregPPC_GPR6(mode64
));
2559 if (argir
& (1<<5)) addHRegUse(u
, HRmRead
, hregPPC_GPR5(mode64
));
2560 if (argir
& (1<<4)) addHRegUse(u
, HRmRead
, hregPPC_GPR4(mode64
));
2561 if (argir
& (1<<3)) addHRegUse(u
, HRmRead
, hregPPC_GPR3(mode64
));
2563 vassert(0 == (argir
& ~((1<<3)|(1<<4)|(1<<5)|(1<<6)
2564 |(1<<7)|(1<<8)|(1<<9)|(1<<10))));
2566 /* Finally, there is the issue that the insn trashes a
2567 register because the literal target address has to be
2568 loaded into a register. %r10 seems a suitable victim.
2569 (Can't use %r0, as some insns interpret it as value zero). */
2570 addHRegUse(u
, HRmWrite
, hregPPC_GPR10(mode64
));
2571 /* Upshot of this is that the assembler really must use %r10,
2572 and no other, as a destination temporary. */
2575 /* XDirect/XIndir/XAssisted are also a bit subtle. They
2576 conditionally exit the block. Hence we only need to list (1)
2577 the registers that they read, and (2) the registers that they
2578 write in the case where the block is not exited. (2) is empty,
2579 hence only (1) is relevant here. */
2581 addRegUsage_PPCAMode(u
, i
->Pin
.XDirect
.amCIA
);
2584 addHRegUse(u
, HRmRead
, i
->Pin
.XIndir
.dstGA
);
2585 addRegUsage_PPCAMode(u
, i
->Pin
.XIndir
.amCIA
);
2588 addHRegUse(u
, HRmRead
, i
->Pin
.XAssisted
.dstGA
);
2589 addRegUsage_PPCAMode(u
, i
->Pin
.XAssisted
.amCIA
);
2592 addRegUsage_PPCRI(u
, i
->Pin
.CMov
.src
);
2593 addHRegUse(u
, HRmModify
, i
->Pin
.CMov
.dst
);
2596 addRegUsage_PPCAMode(u
, i
->Pin
.Load
.src
);
2597 addHRegUse(u
, HRmWrite
, i
->Pin
.Load
.dst
);
2600 addHRegUse(u
, HRmRead
, i
->Pin
.LoadL
.src
);
2601 addHRegUse(u
, HRmWrite
, i
->Pin
.LoadL
.dst
);
2604 addHRegUse(u
, HRmRead
, i
->Pin
.Store
.src
);
2605 addRegUsage_PPCAMode(u
, i
->Pin
.Store
.dst
);
2608 addHRegUse(u
, HRmRead
, i
->Pin
.StoreC
.src
);
2609 addHRegUse(u
, HRmRead
, i
->Pin
.StoreC
.dst
);
2612 addHRegUse(u
, HRmWrite
, i
->Pin
.Set
.dst
);
2615 addHRegUse(u
, HRmWrite
, i
->Pin
.MfCR
.dst
);
2621 addHRegUse(u
, HRmWrite
, i
->Pin
.FpUnary
.dst
);
2622 addHRegUse(u
, HRmRead
, i
->Pin
.FpUnary
.src
);
2624 if (i
->Pin
.FpUnary
.op
== Pfp_MOV
) {
2625 u
->isRegRegMove
= True
;
2626 u
->regMoveSrc
= i
->Pin
.FpUnary
.src
;
2627 u
->regMoveDst
= i
->Pin
.FpUnary
.dst
;
2631 addHRegUse(u
, HRmWrite
, i
->Pin
.FpBinary
.dst
);
2632 addHRegUse(u
, HRmRead
, i
->Pin
.FpBinary
.srcL
);
2633 addHRegUse(u
, HRmRead
, i
->Pin
.FpBinary
.srcR
);
2636 case Pin_Fp128Unary
:
2637 addHRegUse(u
, HRmWrite
, i
->Pin
.Fp128Unary
.dst
);
2638 addHRegUse(u
, HRmRead
, i
->Pin
.Fp128Unary
.src
);
2640 case Pin_Fp128Binary
:
2641 addHRegUse(u
, HRmWrite
, i
->Pin
.Fp128Binary
.dst
);
2642 addHRegUse(u
, HRmRead
, i
->Pin
.Fp128Binary
.srcL
);
2643 addHRegUse(u
, HRmRead
, i
->Pin
.Fp128Binary
.srcR
);
2645 case Pin_Fp128Ternary
:
2646 addHRegUse(u
, HRmModify
, i
->Pin
.Fp128Ternary
.dst
);
2647 addHRegUse(u
, HRmRead
, i
->Pin
.Fp128Ternary
.srcL
);
2648 addHRegUse(u
, HRmRead
, i
->Pin
.Fp128Ternary
.srcR
);
2651 addHRegUse(u
, HRmWrite
, i
->Pin
.FpMulAcc
.dst
);
2652 addHRegUse(u
, HRmRead
, i
->Pin
.FpMulAcc
.srcML
);
2653 addHRegUse(u
, HRmRead
, i
->Pin
.FpMulAcc
.srcMR
);
2654 addHRegUse(u
, HRmRead
, i
->Pin
.FpMulAcc
.srcAcc
);
2657 addHRegUse(u
, (i
->Pin
.FpLdSt
.isLoad
? HRmWrite
: HRmRead
),
2659 addRegUsage_PPCAMode(u
, i
->Pin
.FpLdSt
.addr
);
2662 addHRegUse(u
, HRmRead
, i
->Pin
.FpSTFIW
.addr
);
2663 addHRegUse(u
, HRmRead
, i
->Pin
.FpSTFIW
.data
);
2666 addHRegUse(u
, HRmWrite
, i
->Pin
.FpRSP
.dst
);
2667 addHRegUse(u
, HRmRead
, i
->Pin
.FpRSP
.src
);
2670 addHRegUse(u
, HRmWrite
, i
->Pin
.FpCftI
.dst
);
2671 addHRegUse(u
, HRmRead
, i
->Pin
.FpCftI
.src
);
2674 addHRegUse(u
, HRmModify
, i
->Pin
.FpCMov
.dst
);
2675 addHRegUse(u
, HRmRead
, i
->Pin
.FpCMov
.src
);
2678 addHRegUse(u
, HRmRead
, i
->Pin
.FpLdFPSCR
.src
);
2681 addHRegUse(u
, HRmWrite
, i
->Pin
.FpCmp
.dst
);
2682 addHRegUse(u
, HRmRead
, i
->Pin
.FpCmp
.srcL
);
2683 addHRegUse(u
, HRmRead
, i
->Pin
.FpCmp
.srcR
);
2687 addHRegUse(u
, (i
->Pin
.RdWrLR
.wrLR
? HRmRead
: HRmWrite
),
2692 addHRegUse(u
, (i
->Pin
.AvLdSt
.isLoad
? HRmWrite
: HRmRead
),
2694 if (i
->Pin
.AvLdSt
.addr
->tag
== Pam_IR
)
2695 addHRegUse(u
, HRmWrite
, hregPPC_GPR30(mode64
));
2696 addRegUsage_PPCAMode(u
, i
->Pin
.AvLdSt
.addr
);
2699 addHRegUse(u
, HRmWrite
, i
->Pin
.AvUnary
.dst
);
2700 addHRegUse(u
, HRmRead
, i
->Pin
.AvUnary
.src
);
2703 if (i
->Pin
.AvBinary
.op
== Pav_XOR
2704 && sameHReg(i
->Pin
.AvBinary
.dst
, i
->Pin
.AvBinary
.srcL
)
2705 && sameHReg(i
->Pin
.AvBinary
.dst
, i
->Pin
.AvBinary
.srcR
)) {
2706 /* reg-alloc needs to understand 'xor r,r,r' as a write of r */
2707 /* (as opposed to a rite of passage :-) */
2708 addHRegUse(u
, HRmWrite
, i
->Pin
.AvBinary
.dst
);
2710 addHRegUse(u
, HRmWrite
, i
->Pin
.AvBinary
.dst
);
2711 addHRegUse(u
, HRmRead
, i
->Pin
.AvBinary
.srcL
);
2712 addHRegUse(u
, HRmRead
, i
->Pin
.AvBinary
.srcR
);
2715 case Pin_AvBinaryInt
:
2716 addHRegUse(u
, HRmWrite
, i
->Pin
.AvBinaryInt
.dst
);
2717 addHRegUse(u
, HRmRead
, i
->Pin
.AvBinaryInt
.src
);
2719 case Pin_AvBinaryInt128
:
2720 addHRegUse(u
, HRmWrite
, i
->Pin
.AvBinaryInt128
.dst
);
2721 addHRegUse(u
, HRmRead
, i
->Pin
.AvBinaryInt128
.src1
);
2722 addHRegUse(u
, HRmRead
, i
->Pin
.AvBinaryInt128
.src2
);
2724 case Pin_AvTernaryInt128
:
2725 addHRegUse(u
, HRmWrite
, i
->Pin
.AvTernaryInt128
.dst
);
2726 addHRegUse(u
, HRmRead
, i
->Pin
.AvTernaryInt128
.src1
);
2727 addHRegUse(u
, HRmRead
, i
->Pin
.AvTernaryInt128
.src2
);
2728 addHRegUse(u
, HRmRead
, i
->Pin
.AvTernaryInt128
.src3
);
2731 addHRegUse(u
, HRmWrite
, i
->Pin
.AvBin8x16
.dst
);
2732 addHRegUse(u
, HRmRead
, i
->Pin
.AvBin8x16
.srcL
);
2733 addHRegUse(u
, HRmRead
, i
->Pin
.AvBin8x16
.srcR
);
2736 addHRegUse(u
, HRmWrite
, i
->Pin
.AvBin16x8
.dst
);
2737 addHRegUse(u
, HRmRead
, i
->Pin
.AvBin16x8
.srcL
);
2738 addHRegUse(u
, HRmRead
, i
->Pin
.AvBin16x8
.srcR
);
2741 addHRegUse(u
, HRmWrite
, i
->Pin
.AvBin32x4
.dst
);
2742 addHRegUse(u
, HRmRead
, i
->Pin
.AvBin32x4
.srcL
);
2743 addHRegUse(u
, HRmRead
, i
->Pin
.AvBin32x4
.srcR
);
2746 addHRegUse(u
, HRmWrite
, i
->Pin
.AvBin64x2
.dst
);
2747 addHRegUse(u
, HRmRead
, i
->Pin
.AvBin64x2
.srcL
);
2748 addHRegUse(u
, HRmRead
, i
->Pin
.AvBin64x2
.srcR
);
2750 case Pin_AvBin32Fx4
:
2751 addHRegUse(u
, HRmWrite
, i
->Pin
.AvBin32Fx4
.dst
);
2752 addHRegUse(u
, HRmRead
, i
->Pin
.AvBin32Fx4
.srcL
);
2753 addHRegUse(u
, HRmRead
, i
->Pin
.AvBin32Fx4
.srcR
);
2754 if (i
->Pin
.AvBin32Fx4
.op
== Pavfp_MULF
)
2755 addHRegUse(u
, HRmWrite
, hregPPC_VR29(mode64
));
2758 addHRegUse(u
, HRmWrite
, i
->Pin
.AvUn32Fx4
.dst
);
2759 addHRegUse(u
, HRmRead
, i
->Pin
.AvUn32Fx4
.src
);
2762 addHRegUse(u
, HRmWrite
, i
->Pin
.AvPerm
.dst
);
2763 addHRegUse(u
, HRmRead
, i
->Pin
.AvPerm
.srcL
);
2764 addHRegUse(u
, HRmRead
, i
->Pin
.AvPerm
.srcR
);
2765 addHRegUse(u
, HRmRead
, i
->Pin
.AvPerm
.ctl
);
2768 addHRegUse(u
, HRmWrite
, i
->Pin
.AvSel
.dst
);
2769 addHRegUse(u
, HRmRead
, i
->Pin
.AvSel
.ctl
);
2770 addHRegUse(u
, HRmRead
, i
->Pin
.AvSel
.srcL
);
2771 addHRegUse(u
, HRmRead
, i
->Pin
.AvSel
.srcR
);
2774 addHRegUse(u
, HRmWrite
, i
->Pin
.AvSh
.dst
);
2775 if (i
->Pin
.AvSh
.addr
->tag
== Pam_IR
)
2776 addHRegUse(u
, HRmWrite
, hregPPC_GPR30(mode64
));
2777 addRegUsage_PPCAMode(u
, i
->Pin
.AvSh
.addr
);
2780 addHRegUse(u
, HRmWrite
, i
->Pin
.AvShlDbl
.dst
);
2781 addHRegUse(u
, HRmRead
, i
->Pin
.AvShlDbl
.srcL
);
2782 addHRegUse(u
, HRmRead
, i
->Pin
.AvShlDbl
.srcR
);
2785 addHRegUse(u
, HRmWrite
, i
->Pin
.AvSplat
.dst
);
2786 addRegUsage_PPCVI5s(u
, i
->Pin
.AvSplat
.src
);
2789 addHRegUse(u
, HRmModify
, i
->Pin
.AvCMov
.dst
);
2790 addHRegUse(u
, HRmRead
, i
->Pin
.AvCMov
.src
);
2793 addHRegUse(u
, HRmRead
, i
->Pin
.AvLdVSCR
.src
);
2795 case Pin_AvCipherV128Unary
:
2796 addHRegUse(u
, HRmWrite
, i
->Pin
.AvCipherV128Unary
.dst
);
2797 addHRegUse(u
, HRmRead
, i
->Pin
.AvCipherV128Unary
.src
);
2799 case Pin_AvCipherV128Binary
:
2800 addHRegUse(u
, HRmWrite
, i
->Pin
.AvCipherV128Binary
.dst
);
2801 addHRegUse(u
, HRmRead
, i
->Pin
.AvCipherV128Binary
.srcL
);
2802 addHRegUse(u
, HRmRead
, i
->Pin
.AvCipherV128Binary
.srcR
);
2804 case Pin_AvHashV128Binary
:
2805 addHRegUse(u
, HRmWrite
, i
->Pin
.AvHashV128Binary
.dst
);
2806 addHRegUse(u
, HRmRead
, i
->Pin
.AvHashV128Binary
.src
);
2807 addRegUsage_PPCRI(u
, i
->Pin
.AvHashV128Binary
.s_field
);
2809 case Pin_AvBCDV128Binary
:
2810 addHRegUse(u
, HRmWrite
, i
->Pin
.AvBCDV128Binary
.dst
);
2811 addHRegUse(u
, HRmRead
, i
->Pin
.AvBCDV128Binary
.src1
);
2812 addHRegUse(u
, HRmRead
, i
->Pin
.AvBCDV128Binary
.src2
);
2814 case Pin_Dfp64Unary
:
2815 addHRegUse(u
, HRmWrite
, i
->Pin
.Dfp64Unary
.dst
);
2816 addHRegUse(u
, HRmRead
, i
->Pin
.Dfp64Unary
.src
);
2818 case Pin_Dfp64Binary
:
2819 addHRegUse(u
, HRmWrite
, i
->Pin
.Dfp64Binary
.dst
);
2820 addHRegUse(u
, HRmRead
, i
->Pin
.Dfp64Binary
.srcL
);
2821 addHRegUse(u
, HRmRead
, i
->Pin
.Dfp64Binary
.srcR
);
2824 addRegUsage_PPCRI(u
, i
->Pin
.DfpShift
.shift
);
2825 addHRegUse(u
, HRmWrite
, i
->Pin
.DfpShift
.src
);
2826 addHRegUse(u
, HRmWrite
, i
->Pin
.DfpShift
.dst
);
2828 case Pin_Dfp128Unary
:
2829 addHRegUse(u
, HRmWrite
, i
->Pin
.Dfp128Unary
.dst_hi
);
2830 addHRegUse(u
, HRmWrite
, i
->Pin
.Dfp128Unary
.dst_lo
);
2831 addHRegUse(u
, HRmRead
, i
->Pin
.Dfp128Unary
.src_hi
);
2832 addHRegUse(u
, HRmRead
, i
->Pin
.Dfp128Unary
.src_lo
);
2834 case Pin_Dfp128Binary
:
2835 addHRegUse(u
, HRmWrite
, i
->Pin
.Dfp128Binary
.dst_hi
);
2836 addHRegUse(u
, HRmWrite
, i
->Pin
.Dfp128Binary
.dst_lo
);
2837 addHRegUse(u
, HRmRead
, i
->Pin
.Dfp128Binary
.srcR_hi
);
2838 addHRegUse(u
, HRmRead
, i
->Pin
.Dfp128Binary
.srcR_lo
);
2841 addHRegUse(u
, HRmWrite
, i
->Pin
.DfpRound
.dst
);
2842 addHRegUse(u
, HRmRead
, i
->Pin
.DfpRound
.src
);
2844 case Pin_DfpRound128
:
2845 addHRegUse(u
, HRmWrite
, i
->Pin
.DfpRound128
.dst_hi
);
2846 addHRegUse(u
, HRmWrite
, i
->Pin
.DfpRound128
.dst_lo
);
2847 addHRegUse(u
, HRmRead
, i
->Pin
.DfpRound128
.src_hi
);
2848 addHRegUse(u
, HRmRead
, i
->Pin
.DfpRound128
.src_lo
);
2850 case Pin_DfpQuantize
:
2851 addRegUsage_PPCRI(u
, i
->Pin
.DfpQuantize
.rmc
);
2852 addHRegUse(u
, HRmWrite
, i
->Pin
.DfpQuantize
.dst
);
2853 addHRegUse(u
, HRmRead
, i
->Pin
.DfpQuantize
.srcL
);
2854 addHRegUse(u
, HRmRead
, i
->Pin
.DfpQuantize
.srcR
);
2856 case Pin_DfpQuantize128
:
2857 addHRegUse(u
, HRmWrite
, i
->Pin
.DfpQuantize128
.dst_hi
);
2858 addHRegUse(u
, HRmWrite
, i
->Pin
.DfpQuantize128
.dst_lo
);
2859 addHRegUse(u
, HRmRead
, i
->Pin
.DfpQuantize128
.src_hi
);
2860 addHRegUse(u
, HRmRead
, i
->Pin
.DfpQuantize128
.src_lo
);
2862 case Pin_DfpShift128
:
2863 addRegUsage_PPCRI(u
, i
->Pin
.DfpShift128
.shift
);
2864 addHRegUse(u
, HRmWrite
, i
->Pin
.DfpShift128
.src_hi
);
2865 addHRegUse(u
, HRmWrite
, i
->Pin
.DfpShift128
.src_lo
);
2866 addHRegUse(u
, HRmWrite
, i
->Pin
.DfpShift128
.dst_hi
);
2867 addHRegUse(u
, HRmWrite
, i
->Pin
.DfpShift128
.dst_lo
);
2869 case Pin_DfpD128toD64
:
2870 addHRegUse(u
, HRmWrite
, i
->Pin
.DfpD128toD64
.src_hi
);
2871 addHRegUse(u
, HRmWrite
, i
->Pin
.DfpD128toD64
.src_lo
);
2872 addHRegUse(u
, HRmWrite
, i
->Pin
.DfpD128toD64
.dst
);
2874 case Pin_DfpI64StoD128
:
2875 addHRegUse(u
, HRmWrite
, i
->Pin
.DfpI64StoD128
.src
);
2876 addHRegUse(u
, HRmWrite
, i
->Pin
.DfpI64StoD128
.dst_hi
);
2877 addHRegUse(u
, HRmWrite
, i
->Pin
.DfpI64StoD128
.dst_lo
);
2879 case Pin_ExtractExpD128
:
2880 addHRegUse(u
, HRmWrite
, i
->Pin
.ExtractExpD128
.dst
);
2881 addHRegUse(u
, HRmRead
, i
->Pin
.ExtractExpD128
.src_hi
);
2882 addHRegUse(u
, HRmRead
, i
->Pin
.ExtractExpD128
.src_lo
);
2884 case Pin_InsertExpD128
:
2885 addHRegUse(u
, HRmWrite
, i
->Pin
.InsertExpD128
.dst_hi
);
2886 addHRegUse(u
, HRmWrite
, i
->Pin
.InsertExpD128
.dst_lo
);
2887 addHRegUse(u
, HRmRead
, i
->Pin
.InsertExpD128
.srcL
);
2888 addHRegUse(u
, HRmRead
, i
->Pin
.InsertExpD128
.srcR_hi
);
2889 addHRegUse(u
, HRmRead
, i
->Pin
.InsertExpD128
.srcR_lo
);
2892 addHRegUse(u
, HRmWrite
, i
->Pin
.Dfp64Cmp
.dst
);
2893 addHRegUse(u
, HRmRead
, i
->Pin
.Dfp64Cmp
.srcL
);
2894 addHRegUse(u
, HRmRead
, i
->Pin
.Dfp64Cmp
.srcR
);
2897 addHRegUse(u
, HRmWrite
, i
->Pin
.Dfp128Cmp
.dst
);
2898 addHRegUse(u
, HRmRead
, i
->Pin
.Dfp128Cmp
.srcL_hi
);
2899 addHRegUse(u
, HRmRead
, i
->Pin
.Dfp128Cmp
.srcL_lo
);
2900 addHRegUse(u
, HRmRead
, i
->Pin
.Dfp128Cmp
.srcR_hi
);
2901 addHRegUse(u
, HRmRead
, i
->Pin
.Dfp128Cmp
.srcR_lo
);
2903 case Pin_XFormUnary994
:
2904 if (i
->Pin
.XFormUnary994
.op
== Px_DFPTOIQS
) {
2905 addHRegUse(u
, HRmWrite
, i
->Pin
.XFormUnary994
.reg0
);
2906 addHRegUse(u
, HRmRead
, i
->Pin
.XFormUnary994
.reg1
);
2907 addHRegUse(u
, HRmRead
, i
->Pin
.XFormUnary994
.reg2
);
2909 addHRegUse(u
, HRmWrite
, i
->Pin
.XFormUnary994
.reg0
);
2910 addHRegUse(u
, HRmWrite
, i
->Pin
.XFormUnary994
.reg1
);
2911 addHRegUse(u
, HRmRead
, i
->Pin
.XFormUnary994
.reg2
);
2915 /* We expect both amodes only to mention the GSP (r31), so this
2916 is in fact pointless, since GSP isn't allocatable, but
2918 addRegUsage_PPCAMode(u
, i
->Pin
.EvCheck
.amCounter
);
2919 addRegUsage_PPCAMode(u
, i
->Pin
.EvCheck
.amFailAddr
);
2920 addHRegUse(u
, HRmWrite
, hregPPC_GPR30(mode64
)); /* also unavail to RA */
2923 addHRegUse(u
, HRmWrite
, hregPPC_GPR29(mode64
));
2924 addHRegUse(u
, HRmWrite
, hregPPC_GPR30(mode64
));
2927 ppPPCInstr(i
, mode64
);
2928 vpanic("getRegUsage_PPCInstr");
2933 static void mapReg( HRegRemap
* m
, HReg
* r
)
2935 *r
= lookupHRegRemap(m
, *r
);
2938 void mapRegs_PPCInstr ( HRegRemap
* m
, PPCInstr
* i
, Bool mode64
)
2942 mapReg(m
, &i
->Pin
.LI
.dst
);
2945 mapReg(m
, &i
->Pin
.Alu
.dst
);
2946 mapReg(m
, &i
->Pin
.Alu
.srcL
);
2947 mapRegs_PPCRH(m
, i
->Pin
.Alu
.srcR
);
2950 mapReg(m
, &i
->Pin
.Shft
.dst
);
2951 mapReg(m
, &i
->Pin
.Shft
.srcL
);
2952 mapRegs_PPCRH(m
, i
->Pin
.Shft
.srcR
);
2955 mapReg(m
, &i
->Pin
.AddSubC
.dst
);
2956 mapReg(m
, &i
->Pin
.AddSubC
.srcL
);
2957 mapReg(m
, &i
->Pin
.AddSubC
.srcR
);
2960 mapReg(m
, &i
->Pin
.Cmp
.srcL
);
2961 mapRegs_PPCRH(m
, i
->Pin
.Cmp
.srcR
);
2964 mapReg(m
, &i
->Pin
.Unary
.dst
);
2965 mapReg(m
, &i
->Pin
.Unary
.src
);
2968 mapReg(m
, &i
->Pin
.MulL
.dst
);
2969 mapReg(m
, &i
->Pin
.MulL
.srcL
);
2970 mapReg(m
, &i
->Pin
.MulL
.srcR
);
2973 mapReg(m
, &i
->Pin
.Div
.dst
);
2974 mapReg(m
, &i
->Pin
.Div
.srcL
);
2975 mapReg(m
, &i
->Pin
.Div
.srcR
);
2980 mapRegs_PPCAMode(m
, i
->Pin
.XDirect
.amCIA
);
2983 mapReg(m
, &i
->Pin
.XIndir
.dstGA
);
2984 mapRegs_PPCAMode(m
, i
->Pin
.XIndir
.amCIA
);
2987 mapReg(m
, &i
->Pin
.XAssisted
.dstGA
);
2988 mapRegs_PPCAMode(m
, i
->Pin
.XAssisted
.amCIA
);
2991 mapRegs_PPCRI(m
, i
->Pin
.CMov
.src
);
2992 mapReg(m
, &i
->Pin
.CMov
.dst
);
2995 mapRegs_PPCAMode(m
, i
->Pin
.Load
.src
);
2996 mapReg(m
, &i
->Pin
.Load
.dst
);
2999 mapReg(m
, &i
->Pin
.LoadL
.src
);
3000 mapReg(m
, &i
->Pin
.LoadL
.dst
);
3003 mapReg(m
, &i
->Pin
.Store
.src
);
3004 mapRegs_PPCAMode(m
, i
->Pin
.Store
.dst
);
3007 mapReg(m
, &i
->Pin
.StoreC
.src
);
3008 mapReg(m
, &i
->Pin
.StoreC
.dst
);
3011 mapReg(m
, &i
->Pin
.Set
.dst
);
3014 mapReg(m
, &i
->Pin
.MfCR
.dst
);
3019 mapReg(m
, &i
->Pin
.FpUnary
.dst
);
3020 mapReg(m
, &i
->Pin
.FpUnary
.src
);
3023 mapReg(m
, &i
->Pin
.FpBinary
.dst
);
3024 mapReg(m
, &i
->Pin
.FpBinary
.srcL
);
3025 mapReg(m
, &i
->Pin
.FpBinary
.srcR
);
3027 case Pin_Fp128Unary
:
3028 mapReg(m
, &i
->Pin
.Fp128Unary
.dst
);
3029 mapReg(m
, &i
->Pin
.Fp128Unary
.src
);
3031 case Pin_Fp128Binary
:
3032 mapReg(m
, &i
->Pin
.Fp128Binary
.dst
);
3033 mapReg(m
, &i
->Pin
.Fp128Binary
.srcL
);
3034 mapReg(m
, &i
->Pin
.Fp128Binary
.srcR
);
3036 case Pin_Fp128Ternary
:
3037 mapReg(m
, &i
->Pin
.Fp128Ternary
.dst
);
3038 mapReg(m
, &i
->Pin
.Fp128Ternary
.srcL
);
3039 mapReg(m
, &i
->Pin
.Fp128Ternary
.srcR
);
3042 mapReg(m
, &i
->Pin
.FpMulAcc
.dst
);
3043 mapReg(m
, &i
->Pin
.FpMulAcc
.srcML
);
3044 mapReg(m
, &i
->Pin
.FpMulAcc
.srcMR
);
3045 mapReg(m
, &i
->Pin
.FpMulAcc
.srcAcc
);
3048 mapReg(m
, &i
->Pin
.FpLdSt
.reg
);
3049 mapRegs_PPCAMode(m
, i
->Pin
.FpLdSt
.addr
);
3052 mapReg(m
, &i
->Pin
.FpSTFIW
.addr
);
3053 mapReg(m
, &i
->Pin
.FpSTFIW
.data
);
3056 mapReg(m
, &i
->Pin
.FpRSP
.dst
);
3057 mapReg(m
, &i
->Pin
.FpRSP
.src
);
3060 mapReg(m
, &i
->Pin
.FpCftI
.dst
);
3061 mapReg(m
, &i
->Pin
.FpCftI
.src
);
3064 mapReg(m
, &i
->Pin
.FpCMov
.dst
);
3065 mapReg(m
, &i
->Pin
.FpCMov
.src
);
3068 mapReg(m
, &i
->Pin
.FpLdFPSCR
.src
);
3071 mapReg(m
, &i
->Pin
.FpCmp
.dst
);
3072 mapReg(m
, &i
->Pin
.FpCmp
.srcL
);
3073 mapReg(m
, &i
->Pin
.FpCmp
.srcR
);
3076 mapReg(m
, &i
->Pin
.RdWrLR
.gpr
);
3079 mapReg(m
, &i
->Pin
.AvLdSt
.reg
);
3080 mapRegs_PPCAMode(m
, i
->Pin
.AvLdSt
.addr
);
3083 mapReg(m
, &i
->Pin
.AvUnary
.dst
);
3084 mapReg(m
, &i
->Pin
.AvUnary
.src
);
3087 mapReg(m
, &i
->Pin
.AvBinary
.dst
);
3088 mapReg(m
, &i
->Pin
.AvBinary
.srcL
);
3089 mapReg(m
, &i
->Pin
.AvBinary
.srcR
);
3091 case Pin_AvBinaryInt
:
3092 mapReg(m
, &i
->Pin
.AvBinaryInt
.dst
);
3093 mapReg(m
, &i
->Pin
.AvBinaryInt
.src
);
3095 case Pin_AvBinaryInt128
:
3096 mapReg(m
, &i
->Pin
.AvBinaryInt128
.dst
);
3097 mapReg(m
, &i
->Pin
.AvBinaryInt128
.src1
);
3098 mapReg(m
, &i
->Pin
.AvBinaryInt128
.src2
);
3100 case Pin_AvTernaryInt128
:
3101 mapReg(m
, &i
->Pin
.AvTernaryInt128
.dst
);
3102 mapReg(m
, &i
->Pin
.AvTernaryInt128
.src1
);
3103 mapReg(m
, &i
->Pin
.AvTernaryInt128
.src2
);
3104 mapReg(m
, &i
->Pin
.AvTernaryInt128
.src3
);
3107 mapReg(m
, &i
->Pin
.AvBin8x16
.dst
);
3108 mapReg(m
, &i
->Pin
.AvBin8x16
.srcL
);
3109 mapReg(m
, &i
->Pin
.AvBin8x16
.srcR
);
3112 mapReg(m
, &i
->Pin
.AvBin16x8
.dst
);
3113 mapReg(m
, &i
->Pin
.AvBin16x8
.srcL
);
3114 mapReg(m
, &i
->Pin
.AvBin16x8
.srcR
);
3117 mapReg(m
, &i
->Pin
.AvBin32x4
.dst
);
3118 mapReg(m
, &i
->Pin
.AvBin32x4
.srcL
);
3119 mapReg(m
, &i
->Pin
.AvBin32x4
.srcR
);
3122 mapReg(m
, &i
->Pin
.AvBin64x2
.dst
);
3123 mapReg(m
, &i
->Pin
.AvBin64x2
.srcL
);
3124 mapReg(m
, &i
->Pin
.AvBin64x2
.srcR
);
3126 case Pin_AvBin32Fx4
:
3127 mapReg(m
, &i
->Pin
.AvBin32Fx4
.dst
);
3128 mapReg(m
, &i
->Pin
.AvBin32Fx4
.srcL
);
3129 mapReg(m
, &i
->Pin
.AvBin32Fx4
.srcR
);
3132 mapReg(m
, &i
->Pin
.AvUn32Fx4
.dst
);
3133 mapReg(m
, &i
->Pin
.AvUn32Fx4
.src
);
3136 mapReg(m
, &i
->Pin
.AvPerm
.dst
);
3137 mapReg(m
, &i
->Pin
.AvPerm
.srcL
);
3138 mapReg(m
, &i
->Pin
.AvPerm
.srcR
);
3139 mapReg(m
, &i
->Pin
.AvPerm
.ctl
);
3142 mapReg(m
, &i
->Pin
.AvSel
.dst
);
3143 mapReg(m
, &i
->Pin
.AvSel
.srcL
);
3144 mapReg(m
, &i
->Pin
.AvSel
.srcR
);
3145 mapReg(m
, &i
->Pin
.AvSel
.ctl
);
3148 mapReg(m
, &i
->Pin
.AvSh
.dst
);
3149 mapRegs_PPCAMode(m
, i
->Pin
.AvSh
.addr
);
3152 mapReg(m
, &i
->Pin
.AvShlDbl
.dst
);
3153 mapReg(m
, &i
->Pin
.AvShlDbl
.srcL
);
3154 mapReg(m
, &i
->Pin
.AvShlDbl
.srcR
);
3157 mapReg(m
, &i
->Pin
.AvSplat
.dst
);
3158 mapRegs_PPCVI5s(m
, i
->Pin
.AvSplat
.src
);
3161 mapReg(m
, &i
->Pin
.AvCMov
.dst
);
3162 mapReg(m
, &i
->Pin
.AvCMov
.src
);
3165 mapReg(m
, &i
->Pin
.AvLdVSCR
.src
);
3167 case Pin_AvCipherV128Unary
:
3168 mapReg(m
, &i
->Pin
.AvCipherV128Unary
.dst
);
3169 mapReg(m
, &i
->Pin
.AvCipherV128Unary
.src
);
3171 case Pin_AvCipherV128Binary
:
3172 mapReg(m
, &i
->Pin
.AvCipherV128Binary
.dst
);
3173 mapReg(m
, &i
->Pin
.AvCipherV128Binary
.srcL
);
3174 mapReg(m
, &i
->Pin
.AvCipherV128Binary
.srcR
);
3176 case Pin_AvHashV128Binary
:
3177 mapRegs_PPCRI(m
, i
->Pin
.AvHashV128Binary
.s_field
);
3178 mapReg(m
, &i
->Pin
.AvHashV128Binary
.dst
);
3179 mapReg(m
, &i
->Pin
.AvHashV128Binary
.src
);
3181 case Pin_AvBCDV128Binary
:
3182 mapReg(m
, &i
->Pin
.AvBCDV128Binary
.dst
);
3183 mapReg(m
, &i
->Pin
.AvBCDV128Binary
.src1
);
3184 mapReg(m
, &i
->Pin
.AvBCDV128Binary
.src2
);
3186 case Pin_Dfp64Unary
:
3187 mapReg(m
, &i
->Pin
.Dfp64Unary
.dst
);
3188 mapReg(m
, &i
->Pin
.Dfp64Unary
.src
);
3190 case Pin_Dfp64Binary
:
3191 mapReg(m
, &i
->Pin
.Dfp64Binary
.dst
);
3192 mapReg(m
, &i
->Pin
.Dfp64Binary
.srcL
);
3193 mapReg(m
, &i
->Pin
.Dfp64Binary
.srcR
);
3196 mapRegs_PPCRI(m
, i
->Pin
.DfpShift
.shift
);
3197 mapReg(m
, &i
->Pin
.DfpShift
.src
);
3198 mapReg(m
, &i
->Pin
.DfpShift
.dst
);
3200 case Pin_Dfp128Unary
:
3201 mapReg(m
, &i
->Pin
.Dfp128Unary
.dst_hi
);
3202 mapReg(m
, &i
->Pin
.Dfp128Unary
.dst_lo
);
3203 mapReg(m
, &i
->Pin
.Dfp128Unary
.src_hi
);
3204 mapReg(m
, &i
->Pin
.Dfp128Unary
.src_lo
);
3206 case Pin_Dfp128Binary
:
3207 mapReg(m
, &i
->Pin
.Dfp128Binary
.dst_hi
);
3208 mapReg(m
, &i
->Pin
.Dfp128Binary
.dst_lo
);
3209 mapReg(m
, &i
->Pin
.Dfp128Binary
.srcR_hi
);
3210 mapReg(m
, &i
->Pin
.Dfp128Binary
.srcR_lo
);
3212 case Pin_DfpShift128
:
3213 mapRegs_PPCRI(m
, i
->Pin
.DfpShift128
.shift
);
3214 mapReg(m
, &i
->Pin
.DfpShift128
.src_hi
);
3215 mapReg(m
, &i
->Pin
.DfpShift128
.src_lo
);
3216 mapReg(m
, &i
->Pin
.DfpShift128
.dst_hi
);
3217 mapReg(m
, &i
->Pin
.DfpShift128
.dst_lo
);
3220 mapReg(m
, &i
->Pin
.DfpRound
.dst
);
3221 mapReg(m
, &i
->Pin
.DfpRound
.src
);
3223 case Pin_DfpRound128
:
3224 mapReg(m
, &i
->Pin
.DfpRound128
.dst_hi
);
3225 mapReg(m
, &i
->Pin
.DfpRound128
.dst_lo
);
3226 mapReg(m
, &i
->Pin
.DfpRound128
.src_hi
);
3227 mapReg(m
, &i
->Pin
.DfpRound128
.src_lo
);
3229 case Pin_DfpQuantize
:
3230 mapRegs_PPCRI(m
, i
->Pin
.DfpQuantize
.rmc
);
3231 mapReg(m
, &i
->Pin
.DfpQuantize
.dst
);
3232 mapReg(m
, &i
->Pin
.DfpQuantize
.srcL
);
3233 mapReg(m
, &i
->Pin
.DfpQuantize
.srcR
);
3235 case Pin_DfpQuantize128
:
3236 mapRegs_PPCRI(m
, i
->Pin
.DfpQuantize128
.rmc
);
3237 mapReg(m
, &i
->Pin
.DfpQuantize128
.dst_hi
);
3238 mapReg(m
, &i
->Pin
.DfpQuantize128
.dst_lo
);
3239 mapReg(m
, &i
->Pin
.DfpQuantize128
.src_hi
);
3240 mapReg(m
, &i
->Pin
.DfpQuantize128
.src_lo
);
3242 case Pin_DfpD128toD64
:
3243 mapReg(m
, &i
->Pin
.DfpD128toD64
.src_hi
);
3244 mapReg(m
, &i
->Pin
.DfpD128toD64
.src_lo
);
3245 mapReg(m
, &i
->Pin
.DfpD128toD64
.dst
);
3247 case Pin_DfpI64StoD128
:
3248 mapReg(m
, &i
->Pin
.DfpI64StoD128
.src
);
3249 mapReg(m
, &i
->Pin
.DfpI64StoD128
.dst_hi
);
3250 mapReg(m
, &i
->Pin
.DfpI64StoD128
.dst_lo
);
3252 case Pin_ExtractExpD128
:
3253 mapReg(m
, &i
->Pin
.ExtractExpD128
.dst
);
3254 mapReg(m
, &i
->Pin
.ExtractExpD128
.src_hi
);
3255 mapReg(m
, &i
->Pin
.ExtractExpD128
.src_lo
);
3257 case Pin_InsertExpD128
:
3258 mapReg(m
, &i
->Pin
.InsertExpD128
.dst_hi
);
3259 mapReg(m
, &i
->Pin
.InsertExpD128
.dst_lo
);
3260 mapReg(m
, &i
->Pin
.InsertExpD128
.srcL
);
3261 mapReg(m
, &i
->Pin
.InsertExpD128
.srcR_hi
);
3262 mapReg(m
, &i
->Pin
.InsertExpD128
.srcR_lo
);
3265 mapReg(m
, &i
->Pin
.Dfp64Cmp
.dst
);
3266 mapReg(m
, &i
->Pin
.Dfp64Cmp
.srcL
);
3267 mapReg(m
, &i
->Pin
.Dfp64Cmp
.srcR
);
3270 mapReg(m
, &i
->Pin
.Dfp128Cmp
.dst
);
3271 mapReg(m
, &i
->Pin
.Dfp128Cmp
.srcL_hi
);
3272 mapReg(m
, &i
->Pin
.Dfp128Cmp
.srcL_lo
);
3273 mapReg(m
, &i
->Pin
.Dfp128Cmp
.srcR_hi
);
3274 mapReg(m
, &i
->Pin
.Dfp128Cmp
.srcR_lo
);
3276 case Pin_XFormUnary994
:
3277 mapReg(m
, &i
->Pin
.XFormUnary994
.reg0
);
3278 mapReg(m
, &i
->Pin
.XFormUnary994
.reg1
);
3279 mapReg(m
, &i
->Pin
.XFormUnary994
.reg2
);
3282 /* We expect both amodes only to mention the GSP (r31), so this
3283 is in fact pointless, since GSP isn't allocatable, but
3285 mapRegs_PPCAMode(m
, i
->Pin
.EvCheck
.amCounter
);
3286 mapRegs_PPCAMode(m
, i
->Pin
.EvCheck
.amFailAddr
);
3289 /* hardwires r29 and r30 -- nothing to modify. */
3292 ppPPCInstr(i
, mode64
);
3293 vpanic("mapRegs_PPCInstr");
3297 /* Generate ppc spill/reload instructions under the direction of the
3298 register allocator. Note it's critical these don't write the
3301 void genSpill_PPC ( /*OUT*/HInstr
** i1
, /*OUT*/HInstr
** i2
,
3302 HReg rreg
, Int offsetB
, Bool mode64
)
3305 vassert(!hregIsVirtual(rreg
));
3307 am
= PPCAMode_IR( offsetB
, GuestStatePtr(mode64
) );
3308 switch (hregClass(rreg
)) {
3311 *i1
= PPCInstr_Store( 8, am
, rreg
, mode64
);
3315 *i1
= PPCInstr_Store( 4, am
, rreg
, mode64
);
3318 *i1
= PPCInstr_FpLdSt ( False
/*store*/, 8, rreg
, am
);
3321 // XXX: GPR30 used as spill register to kludge AltiVec
3323 *i1
= PPCInstr_AvLdSt ( False
/*store*/, 16, rreg
, am
);
3326 ppHRegClass(hregClass(rreg
));
3327 vpanic("genSpill_PPC: unimplemented regclass");
3331 void genReload_PPC ( /*OUT*/HInstr
** i1
, /*OUT*/HInstr
** i2
,
3332 HReg rreg
, Int offsetB
, Bool mode64
)
3335 vassert(!hregIsVirtual(rreg
));
3337 am
= PPCAMode_IR( offsetB
, GuestStatePtr(mode64
) );
3338 switch (hregClass(rreg
)) {
3341 *i1
= PPCInstr_Load( 8, rreg
, am
, mode64
);
3345 *i1
= PPCInstr_Load( 4, rreg
, am
, mode64
);
3348 *i1
= PPCInstr_FpLdSt ( True
/*load*/, 8, rreg
, am
);
3351 // XXX: GPR30 used as spill register to kludge AltiVec AMode_IR
3352 *i1
= PPCInstr_AvLdSt ( True
/*load*/, 16, rreg
, am
);
3355 ppHRegClass(hregClass(rreg
));
3356 vpanic("genReload_PPC: unimplemented regclass");
3360 PPCInstr
* genMove_PPC(HReg from
, HReg to
, Bool mode64
)
3362 switch (hregClass(from
)) {
3365 return PPCInstr_Alu(Palu_OR
, to
, from
, PPCRH_Reg(from
));
3367 return PPCInstr_FpUnary(Pfp_MOV
, to
, from
);
3369 ppHRegClass(hregClass(from
));
3370 vpanic("genMove_PPC: unimplemented regclass");
3375 /* --------- The ppc assembler (bleh.) --------- */
3377 inline static UInt
iregEnc ( HReg r
, Bool mode64
)
3380 vassert(hregClass(r
) == (mode64
? HRcInt64
: HRcInt32
));
3381 vassert(!hregIsVirtual(r
));
3382 n
= hregEncoding(r
);
3387 inline static UInt
fregEnc ( HReg fr
)
3390 vassert(hregClass(fr
) == HRcFlt64
);
3391 vassert(!hregIsVirtual(fr
));
3392 n
= hregEncoding(fr
);
3397 inline static UInt
vregEnc ( HReg v
)
3400 vassert(hregClass(v
) == HRcVec128
);
3401 vassert(!hregIsVirtual(v
));
3402 n
= hregEncoding(v
);
3407 /* Emit an instruction ppc-endianly */
3408 static UChar
* emit32 ( UChar
* p
, UInt w32
, VexEndness endness_host
)
3410 if (endness_host
== VexEndnessBE
) {
3411 *p
++ = toUChar((w32
>> 24) & 0x000000FF);
3412 *p
++ = toUChar((w32
>> 16) & 0x000000FF);
3413 *p
++ = toUChar((w32
>> 8) & 0x000000FF);
3414 *p
++ = toUChar((w32
) & 0x000000FF);
3416 *p
++ = toUChar((w32
) & 0x000000FF);
3417 *p
++ = toUChar((w32
>> 8) & 0x000000FF);
3418 *p
++ = toUChar((w32
>> 16) & 0x000000FF);
3419 *p
++ = toUChar((w32
>> 24) & 0x000000FF);
3424 /* Fetch an instruction ppc-endianly */
3425 static UInt
fetch32 ( UChar
* p
, VexEndness endness_host
)
3428 if (endness_host
== VexEndnessBE
) {
3429 w32
|= ((0xFF & (UInt
)p
[0]) << 24);
3430 w32
|= ((0xFF & (UInt
)p
[1]) << 16);
3431 w32
|= ((0xFF & (UInt
)p
[2]) << 8);
3432 w32
|= ((0xFF & (UInt
)p
[3]) << 0);
3434 w32
|= ((0xFF & (UInt
)p
[3]) << 24);
3435 w32
|= ((0xFF & (UInt
)p
[2]) << 16);
3436 w32
|= ((0xFF & (UInt
)p
[1]) << 8);
3437 w32
|= ((0xFF & (UInt
)p
[0]) << 0);
3442 /* The following mkForm[...] functions refer to ppc instruction forms
3446 static UChar
* mkFormD ( UChar
* p
, UInt opc1
,
3447 UInt r1
, UInt r2
, UInt imm
, VexEndness endness_host
)
3450 vassert(opc1
< 0x40);
3454 theInstr
= ((opc1
<<26) | (r1
<<21) | (r2
<<16) | (imm
));
3455 return emit32(p
, theInstr
, endness_host
);
3458 static UChar
* mkFormMD ( UChar
* p
, UInt opc1
, UInt r1
, UInt r2
,
3459 UInt imm1
, UInt imm2
, UInt opc2
,
3460 VexEndness endness_host
)
3463 vassert(opc1
< 0x40);
3466 vassert(imm1
< 0x40);
3467 vassert(imm2
< 0x40);
3468 vassert(opc2
< 0x08);
3469 imm2
= ((imm2
& 0x1F) << 1) | (imm2
>> 5);
3470 theInstr
= ((opc1
<<26) | (r1
<<21) | (r2
<<16) |
3471 ((imm1
& 0x1F)<<11) | (imm2
<<5) |
3472 (opc2
<<2) | ((imm1
>> 5)<<1));
3473 return emit32(p
, theInstr
, endness_host
);
3476 static UChar
* mkFormX ( UChar
* p
, UInt opc1
, UInt r1
, UInt r2
,
3477 UInt r3
, UInt opc2
, UInt b0
, VexEndness endness_host
)
3480 vassert(opc1
< 0x40);
3484 vassert(opc2
< 0x400);
3486 theInstr
= ((opc1
<<26) | (r1
<<21) | (r2
<<16) |
3487 (r3
<<11) | (opc2
<<1) | (b0
));
3488 return emit32(p
, theInstr
, endness_host
);
3491 static UChar
* mkFormXO ( UChar
* p
, UInt opc1
, UInt r1
, UInt r2
,
3492 UInt r3
, UInt b10
, UInt opc2
, UInt b0
,
3493 VexEndness endness_host
)
3496 vassert(opc1
< 0x40);
3501 vassert(opc2
< 0x200);
3503 theInstr
= ((opc1
<<26) | (r1
<<21) | (r2
<<16) |
3504 (r3
<<11) | (b10
<< 10) | (opc2
<<1) | (b0
));
3505 return emit32(p
, theInstr
, endness_host
);
3508 static UChar
* mkFormX994 ( UChar
* p
, UInt inst_sel
,
3509 UInt rdst
, UInt rsrc
, VexEndness endness_host
)
3511 /* This issues an X-Form instruction with opc1 = 63 and opc2 = 994. The
3512 specific instruction is given in bits[11:15]. */
3514 vassert(inst_sel
< 0x2);
3515 vassert(rdst
< 0x20);
3516 vassert(rsrc
< 0x20);
3517 theInstr
= ((63<<26) | (rdst
<<21) | (inst_sel
<<16) | (rsrc
<<11) | (994 << 1));
3518 return emit32(p
, theInstr
, endness_host
);
3521 static UChar
* mkFormXL ( UChar
* p
, UInt opc1
, UInt f1
, UInt f2
,
3522 UInt f3
, UInt opc2
, UInt b0
, VexEndness endness_host
)
3525 vassert(opc1
< 0x40);
3529 vassert(opc2
< 0x400);
3531 theInstr
= ((opc1
<<26) | (f1
<<21) | (f2
<<16) |
3532 (f3
<<11) | (opc2
<<1) | (b0
));
3533 return emit32(p
, theInstr
, endness_host
);
3536 // Note: for split field ops, give mnemonic arg
3537 static UChar
* mkFormXFX ( UChar
* p
, UInt r1
, UInt f2
, UInt opc2
,
3538 VexEndness endness_host
)
3543 vassert(opc2
< 0x400);
3546 vassert(f2
< 0x100);
3552 vassert(f2
< 0x400);
3553 // re-arrange split field
3554 f2
= ((f2
>>5) & 0x1F) | ((f2
& 0x1F)<<5);
3556 default: vpanic("mkFormXFX(ppch)");
3558 theInstr
= ((31<<26) | (r1
<<21) | (f2
<<11) | (opc2
<<1));
3559 return emit32(p
, theInstr
, endness_host
);
3562 // Only used by mtfsf
3563 static UChar
* mkFormXFL ( UChar
* p
, UInt FM
, UInt freg
, UInt dfp_rm
,
3564 VexEndness endness_host
)
3567 vassert(FM
< 0x100);
3568 vassert(freg
< 0x20);
3569 theInstr
= ((63<<26) | (FM
<<17) | (dfp_rm
<<16) | (freg
<<11) | (711<<1));
3570 return emit32(p
, theInstr
, endness_host
);
3573 static UChar
* mkFormXS ( UChar
* p
, UInt opc1
, UInt r1
, UInt r2
,
3574 UInt imm
, UInt opc2
, UInt b0
,
3575 VexEndness endness_host
)
3578 vassert(opc1
< 0x40);
3581 vassert(imm
< 0x40);
3582 vassert(opc2
< 0x400);
3584 theInstr
= ((opc1
<<26) | (r1
<<21) | (r2
<<16) |
3585 ((imm
& 0x1F)<<11) | (opc2
<<2) | ((imm
>>5)<<1) | (b0
));
3586 return emit32(p
, theInstr
, endness_host
);
3592 static UChar
* mkFormI ( UChar
* p
, UInt LI
, UInt AA
, UInt LK
,
3593 VexEndness endness_host
)
3596 vassert(LI
< 0x1000000);
3599 theInstr
= ((18<<26) | (LI
<<2) | (AA
<<1) | (LK
));
3600 return emit32(p
, theInstr
, endness_host
);
3605 static UChar
* mkFormB ( UChar
* p
, UInt BO
, UInt BI
,
3606 UInt BD
, UInt AA
, UInt LK
, VexEndness endness_host
)
3611 vassert(BD
< 0x4000);
3614 theInstr
= ((16<<26) | (BO
<<21) | (BI
<<16) |
3615 (BD
<<2) | (AA
<<1) | (LK
));
3616 return emit32(p
, theInstr
, endness_host
);
3620 static UChar
* mkFormM ( UChar
* p
, UInt opc1
, UInt r1
, UInt r2
,
3621 UInt f3
, UInt MB
, UInt ME
, UInt Rc
,
3622 VexEndness endness_host
)
3625 vassert(opc1
< 0x40);
3632 theInstr
= ((opc1
<<26) | (r1
<<21) | (r2
<<16) |
3633 (f3
<<11) | (MB
<<6) | (ME
<<1) | (Rc
));
3634 return emit32(p
, theInstr
, endness_host
);
3637 static UChar
* mkFormA ( UChar
* p
, UInt opc1
, UInt r1
, UInt r2
,
3638 UInt r3
, UInt r4
, UInt opc2
, UInt b0
,
3639 VexEndness endness_host
)
3642 vassert(opc1
< 0x40);
3647 vassert(opc2
< 0x20);
3649 theInstr
= ((opc1
<<26) | (r1
<<21) | (r2
<<16) | (r3
<<11) |
3650 (r4
<<6) | (opc2
<<1) | (b0
));
3651 return emit32(p
, theInstr
, endness_host
);
3654 static UChar
* mkFormZ22 ( UChar
* p
, UInt opc1
, UInt r1
, UInt r2
,
3655 UInt constant
, UInt opc2
, UInt b0
,
3656 VexEndness endness_host
)
3659 vassert(opc1
< 0x40);
3662 vassert(constant
< 0x40); /* 6 bit constant */
3663 vassert(opc2
< 0x200); /* 9 bit field */
3665 theInstr
= ((opc1
<<26) | (r1
<<21) | (r2
<<16) |
3666 (constant
<<10) | (opc2
<<1) | (b0
));
3667 return emit32(p
, theInstr
, endness_host
);
3670 static UChar
* mkFormZ23 ( UChar
* p
, UInt opc1
, UInt r1
, UInt r2
,
3671 UInt r3
, UInt rmc
, UInt opc2
, UInt b0
,
3672 VexEndness endness_host
)
3675 vassert(opc1
< 0x40);
3680 vassert(opc2
< 0x100);
3682 theInstr
= ((opc1
<<26) | (r1
<<21) | (r2
<<16) |
3683 (r3
<<11) | (rmc
<<9) | (opc2
<<1) | (b0
));
3684 return emit32(p
, theInstr
, endness_host
);
3687 static UChar
* doAMode_IR ( UChar
* p
, UInt opc1
, UInt rSD
,
3688 PPCAMode
* am
, Bool mode64
, VexEndness endness_host
)
3691 vassert(am
->tag
== Pam_IR
);
3692 vassert(am
->Pam
.IR
.index
< 0x10000);
3694 rA
= iregEnc(am
->Pam
.IR
.base
, mode64
);
3695 idx
= am
->Pam
.IR
.index
;
3697 if (opc1
== 58 || opc1
== 62) { // ld/std: mode64 only
3699 /* stay sane with DS form: lowest 2 bits must be 00. This
3700 should be guaranteed to us by iselWordExpr_AMode. */
3701 vassert(0 == (idx
& 3));
3703 p
= mkFormD(p
, opc1
, rSD
, rA
, idx
, endness_host
);
3707 static UChar
* doAMode_RR ( UChar
* p
, UInt opc1
, UInt opc2
,
3708 UInt rSD
, PPCAMode
* am
, Bool mode64
,
3709 VexEndness endness_host
)
3712 vassert(am
->tag
== Pam_RR
);
3714 rA
= iregEnc(am
->Pam
.RR
.base
, mode64
);
3715 rB
= iregEnc(am
->Pam
.RR
.index
, mode64
);
3717 p
= mkFormX(p
, opc1
, rSD
, rA
, rB
, opc2
, 0, endness_host
);
3722 /* Load imm to r_dst */
3723 static UChar
* mkLoadImm ( UChar
* p
, UInt r_dst
, ULong imm
, Bool mode64
,
3724 VexEndness endness_host
)
3726 vassert(r_dst
< 0x20);
3729 /* In 32-bit mode, make sure the top 32 bits of imm are a sign
3730 extension of the bottom 32 bits, so that the range tests
3731 below work correctly. */
3732 UInt u32
= (UInt
)imm
;
3734 Long s64
= (Long
)s32
;
3738 if (imm
>= 0xFFFFFFFFFFFF8000ULL
|| imm
< 0x8000) {
3739 // sign-extendable from 16 bits
3741 // addi r_dst,0,imm => li r_dst,imm
3742 p
= mkFormD(p
, 14, r_dst
, 0, imm
& 0xFFFF, endness_host
);
3744 if (imm
>= 0xFFFFFFFF80000000ULL
|| imm
< 0x80000000ULL
) {
3745 // sign-extendable from 32 bits
3747 // addis r_dst,r0,(imm>>16) => lis r_dst, (imm>>16)
3748 p
= mkFormD(p
, 15, r_dst
, 0, (imm
>>16) & 0xFFFF, endness_host
);
3749 // ori r_dst, r_dst, (imm & 0xFFFF)
3750 p
= mkFormD(p
, 24, r_dst
, r_dst
, imm
& 0xFFFF, endness_host
);
3752 // full 64bit immediate load: 5 (five!) insns.
3757 // lis r_dst, (imm>>48) & 0xFFFF
3758 p
= mkFormD(p
, 15, r_dst
, 0, (imm
>>48) & 0xFFFF, endness_host
);
3760 // ori r_dst, r_dst, (imm>>32) & 0xFFFF
3761 if ((imm
>>32) & 0xFFFF)
3762 p
= mkFormD(p
, 24, r_dst
, r_dst
, (imm
>>32) & 0xFFFF, endness_host
);
3764 // shift r_dst low word to high word => rldicr
3765 p
= mkFormMD(p
, 30, r_dst
, r_dst
, 32, 31, 1, endness_host
);
3769 // oris r_dst, r_dst, (imm>>16) & 0xFFFF
3770 if ((imm
>>16) & 0xFFFF)
3771 p
= mkFormD(p
, 25, r_dst
, r_dst
, (imm
>>16) & 0xFFFF, endness_host
);
3773 // ori r_dst, r_dst, (imm) & 0xFFFF
3775 p
= mkFormD(p
, 24, r_dst
, r_dst
, imm
& 0xFFFF, endness_host
);
3781 /* A simplified version of mkLoadImm that always generates 2 or 5
3782 instructions (32 or 64 bits respectively) even if it could generate
3783 fewer. This is needed for generating fixed sized patchable
3785 static UChar
* mkLoadImm_EXACTLY2or5 ( UChar
* p
,
3786 UInt r_dst
, ULong imm
, Bool mode64
,
3787 VexEndness endness_host
)
3789 vassert(r_dst
< 0x20);
3792 /* In 32-bit mode, make sure the top 32 bits of imm are a sign
3793 extension of the bottom 32 bits. (Probably unnecessary.) */
3794 UInt u32
= (UInt
)imm
;
3796 Long s64
= (Long
)s32
;
3801 // addis r_dst,r0,(imm>>16) => lis r_dst, (imm>>16)
3802 p
= mkFormD(p
, 15, r_dst
, 0, (imm
>>16) & 0xFFFF, endness_host
);
3803 // ori r_dst, r_dst, (imm & 0xFFFF)
3804 p
= mkFormD(p
, 24, r_dst
, r_dst
, imm
& 0xFFFF, endness_host
);
3807 // full 64bit immediate load: 5 (five!) insns.
3810 // lis r_dst, (imm>>48) & 0xFFFF
3811 p
= mkFormD(p
, 15, r_dst
, 0, (imm
>>48) & 0xFFFF, endness_host
);
3813 // ori r_dst, r_dst, (imm>>32) & 0xFFFF
3814 p
= mkFormD(p
, 24, r_dst
, r_dst
, (imm
>>32) & 0xFFFF, endness_host
);
3816 // shift r_dst low word to high word => rldicr
3817 p
= mkFormMD(p
, 30, r_dst
, r_dst
, 32, 31, 1, endness_host
);
3820 // oris r_dst, r_dst, (imm>>16) & 0xFFFF
3821 p
= mkFormD(p
, 25, r_dst
, r_dst
, (imm
>>16) & 0xFFFF, endness_host
);
3823 // ori r_dst, r_dst, (imm) & 0xFFFF
3824 p
= mkFormD(p
, 24, r_dst
, r_dst
, imm
& 0xFFFF, endness_host
);
3829 /* Checks whether the sequence of bytes at p was indeed created
3830 by mkLoadImm_EXACTLY2or5 with the given parameters. */
3831 static Bool
isLoadImm_EXACTLY2or5 ( UChar
* p_to_check
,
3832 UInt r_dst
, ULong imm
, Bool mode64
,
3833 VexEndness endness_host
)
3835 vassert(r_dst
< 0x20);
3838 /* In 32-bit mode, make sure the top 32 bits of imm are a sign
3839 extension of the bottom 32 bits. (Probably unnecessary.) */
3840 UInt u32
= (UInt
)imm
;
3842 Long s64
= (Long
)s32
;
3847 UInt expect
[2] = { 0, 0 };
3848 UChar
* p
= (UChar
*)&expect
[0];
3849 // addis r_dst,r0,(imm>>16) => lis r_dst, (imm>>16)
3850 p
= mkFormD(p
, 15, r_dst
, 0, (imm
>>16) & 0xFFFF, endness_host
);
3851 // ori r_dst, r_dst, (imm & 0xFFFF)
3852 p
= mkFormD(p
, 24, r_dst
, r_dst
, imm
& 0xFFFF, endness_host
);
3853 vassert(p
== (UChar
*)&expect
[2]);
3855 return fetch32(p_to_check
+ 0, endness_host
) == expect
[0]
3856 && fetch32(p_to_check
+ 4, endness_host
) == expect
[1];
3859 UInt expect
[5] = { 0, 0, 0, 0, 0 };
3860 UChar
* p
= (UChar
*)&expect
[0];
3861 // full 64bit immediate load: 5 (five!) insns.
3864 // lis r_dst, (imm>>48) & 0xFFFF
3865 p
= mkFormD(p
, 15, r_dst
, 0, (imm
>>48) & 0xFFFF, endness_host
);
3867 // ori r_dst, r_dst, (imm>>32) & 0xFFFF
3868 p
= mkFormD(p
, 24, r_dst
, r_dst
, (imm
>>32) & 0xFFFF, endness_host
);
3870 // shift r_dst low word to high word => rldicr
3871 p
= mkFormMD(p
, 30, r_dst
, r_dst
, 32, 31, 1, endness_host
);
3874 // oris r_dst, r_dst, (imm>>16) & 0xFFFF
3875 p
= mkFormD(p
, 25, r_dst
, r_dst
, (imm
>>16) & 0xFFFF, endness_host
);
3877 // ori r_dst, r_dst, (imm) & 0xFFFF
3878 p
= mkFormD(p
, 24, r_dst
, r_dst
, imm
& 0xFFFF, endness_host
);
3880 vassert(p
== (UChar
*)&expect
[5]);
3882 return fetch32(p_to_check
+ 0, endness_host
) == expect
[0]
3883 && fetch32(p_to_check
+ 4, endness_host
) == expect
[1]
3884 && fetch32(p_to_check
+ 8, endness_host
) == expect
[2]
3885 && fetch32(p_to_check
+ 12, endness_host
) == expect
[3]
3886 && fetch32(p_to_check
+ 16, endness_host
) == expect
[4];
3891 /* Generate a machine-word sized load or store. Simplified version of
3892 the Pin_Load and Pin_Store cases below. */
3893 static UChar
* do_load_or_store_machine_word (
3894 UChar
* p
, Bool isLoad
,
3895 UInt reg
, PPCAMode
* am
, Bool mode64
, VexEndness endness_host
)
3898 UInt opc1
, sz
= mode64
? 8 : 4;
3902 vassert(0 == (am
->Pam
.IR
.index
& 3));
3905 case 4: opc1
= 32; vassert(!mode64
); break;
3906 case 8: opc1
= 58; vassert(mode64
); break;
3907 default: vassert(0);
3909 p
= doAMode_IR(p
, opc1
, reg
, am
, mode64
, endness_host
);
3912 /* we could handle this case, but we don't expect to ever
3919 UInt opc1
, sz
= mode64
? 8 : 4;
3923 vassert(0 == (am
->Pam
.IR
.index
& 3));
3926 case 4: opc1
= 36; vassert(!mode64
); break;
3927 case 8: opc1
= 62; vassert(mode64
); break;
3928 default: vassert(0);
3930 p
= doAMode_IR(p
, opc1
, reg
, am
, mode64
, endness_host
);
3933 /* we could handle this case, but we don't expect to ever
3943 /* Generate a 32-bit sized load or store. Simplified version of
3944 do_load_or_store_machine_word above. */
3945 static UChar
* do_load_or_store_word32 (
3946 UChar
* p
, Bool isLoad
,
3947 UInt reg
, PPCAMode
* am
, Bool mode64
, VexEndness endness_host
)
3954 vassert(0 == (am
->Pam
.IR
.index
& 3));
3957 p
= doAMode_IR(p
, opc1
, reg
, am
, mode64
, endness_host
);
3960 /* we could handle this case, but we don't expect to ever
3971 vassert(0 == (am
->Pam
.IR
.index
& 3));
3974 p
= doAMode_IR(p
, opc1
, reg
, am
, mode64
, endness_host
);
3977 /* we could handle this case, but we don't expect to ever
3987 /* Move r_dst to r_src */
3988 static UChar
* mkMoveReg ( UChar
* p
, UInt r_dst
, UInt r_src
,
3989 VexEndness endness_host
)
3991 vassert(r_dst
< 0x20);
3992 vassert(r_src
< 0x20);
3994 if (r_dst
!= r_src
) {
3995 /* or r_dst, r_src, r_src */
3996 p
= mkFormX(p
, 31, r_src
, r_dst
, r_src
, 444, 0, endness_host
);
4001 static UChar
* mkFormVX ( UChar
* p
, UInt opc1
, UInt r1
, UInt r2
,
4002 UInt r3
, UInt opc2
, VexEndness endness_host
)
4005 vassert(opc1
< 0x40);
4009 vassert(opc2
< 0x800);
4010 theInstr
= ((opc1
<<26) | (r1
<<21) | (r2
<<16) | (r3
<<11) | opc2
);
4011 return emit32(p
, theInstr
, endness_host
);
4014 static UChar
* mkFormVSXRND ( UChar
* p
, UInt opc1
, UInt R
, UInt r1
,
4015 UInt r2
, UInt RMC
, UInt opc2
, UChar EX
,
4016 VexEndness endness_host
)
4018 /* The register mapping is all done using VR register numbers for the
4019 * V128 support. This means that the operands for this instruction have
4020 * been loaded into a VR register. The 32 VR registers map to VSR registers
4021 * 32 to 63. For these instructions, the hardware adds 32 to the source
4022 * and destination register numbers. Do not need to adjust the register
4023 * numbers for these instructions.
4028 vassert(opc1
< 0x40);
4031 vassert(opc2
< 0x100);
4036 theInstr
= ((opc1
<<26) | (r1
<<21) | (R
<<16) | (r2
<<11) | (RMC
<<9) |
4038 return emit32(p
, theInstr
, endness_host
);
4041 static UChar
* mkFormVX_BX_TX ( UChar
* p
, UInt opc1
, UInt r1
, UInt r2
,
4042 UInt r3
, UInt opc2
, VexEndness endness_host
)
4044 /* The register mapping is all done using VR register numbers for the
4045 * V128 support. This means that the operands for this instruction have
4046 * been loaded into a VR register. The 32 VR registers map to VSR registers
4047 * 32 to 63. So to make the issued instruction reference the
4048 * corresponding VR register we have to add 32 to the source and
4049 * destination operand numbers, then load the new operand number into the
4050 * correct bit fields.
4052 * r1 = 32xTX + T; r3 = 32xBX + B;
4053 * TX is bit 0, BX is bit 1, T is in bits [25:21], B is in bit [14:11]
4054 * opc2 is in bits [10:2]
4060 r1
+= 32; // adjust the VSR register number to map to the VR number
4063 vassert(opc1
< 0x40);
4067 vassert(opc2
< 0x800);
4073 theInstr
= ((opc1
<<26) | (T
<<21) | (r2
<<16) | (B
<<11) | (opc2
<<2)
4075 return emit32(p
, theInstr
, endness_host
);
4078 static UChar
* mkFormVXR0 ( UChar
* p
, UInt opc1
, UInt r1
, UInt r2
,
4079 UInt r3
, UInt opc2
, UChar R0
,
4080 VexEndness endness_host
)
4082 /* The register mapping is all done using VR register numbers for the
4083 * V128 support. This means that the operands for this instruction have
4084 * been loaded into a VR register. The 32 VR registers map to VSR registers
4085 * 32 to 63. For these instructions, the hardware adds 32 to the source
4086 * and destination register numbers. Do not need to adjust the register
4087 * numbers for these instructions.
4092 vassert(opc1
< 0x40);
4093 vassert(r1
< 0x20); // register numbers are between 0 and 31 (5-bits)
4096 vassert(opc2
< 0x800);
4099 theInstr
= ((opc1
<<26) | (r1
<<21) | (r2
<<16) | (r3
<<11) | (opc2
<<1) | R0
);
4100 return emit32(p
, theInstr
, endness_host
);
4103 static UChar
* mkFormVXI ( UChar
* p
, UInt opc1
, UInt r1
, UInt r2
,
4104 UInt r3
, UInt opc2
, VexEndness endness_host
)
4107 vassert(opc1
< 0x40);
4111 vassert(opc2
< 0x27);
4112 theInstr
= ((opc1
<<26) | (r1
<<21) | (r2
<<16) | (r3
<<11) | opc2
<<1);
4113 return emit32(p
, theInstr
, endness_host
);
4116 static UChar
* mkFormVXR ( UChar
* p
, UInt opc1
, UInt r1
, UInt r2
,
4117 UInt r3
, UInt Rc
, UInt opc2
,
4118 VexEndness endness_host
)
4121 vassert(opc1
< 0x40);
4126 vassert(opc2
< 0x400);
4127 theInstr
= ((opc1
<<26) | (r1
<<21) | (r2
<<16) |
4128 (r3
<<11) | (Rc
<<10) | opc2
);
4129 return emit32(p
, theInstr
, endness_host
);
4132 static UChar
* mkFormVA ( UChar
* p
, UInt opc1
, UInt r1
, UInt r2
,
4133 UInt r3
, UInt r4
, UInt opc2
, VexEndness endness_host
)
4136 vassert(opc1
< 0x40);
4141 vassert(opc2
< 0x40);
4142 theInstr
= ((opc1
<<26) | (r1
<<21) | (r2
<<16) |
4143 (r3
<<11) | (r4
<<6) | opc2
);
4144 return emit32(p
, theInstr
, endness_host
);
4149 /* Emit an instruction into buf and return the number of bytes used.
4150 Note that buf is not the insn's final place, and therefore it is
4151 imperative to emit position-independent code. If the emitted
4152 instruction was a profiler inc, set *is_profInc to True, else leave
4155 Int
emit_PPCInstr ( /*MB_MOD*/Bool
* is_profInc
,
4156 UChar
* buf
, Int nbuf
, const PPCInstr
* i
,
4157 Bool mode64
, VexEndness endness_host
,
4158 const void* disp_cp_chain_me_to_slowEP
,
4159 const void* disp_cp_chain_me_to_fastEP
,
4160 const void* disp_cp_xindir
,
4161 const void* disp_cp_xassisted
)
4164 vassert(nbuf
>= 32);
4167 vex_printf("asm ");ppPPCInstr(i
, mode64
); vex_printf("\n");
4173 p
= mkLoadImm(p
, iregEnc(i
->Pin
.LI
.dst
, mode64
),
4174 i
->Pin
.LI
.imm64
, mode64
, endness_host
);
4178 PPCRH
* srcR
= i
->Pin
.Alu
.srcR
;
4179 Bool immR
= toBool(srcR
->tag
== Prh_Imm
);
4180 UInt r_dst
= iregEnc(i
->Pin
.Alu
.dst
, mode64
);
4181 UInt r_srcL
= iregEnc(i
->Pin
.Alu
.srcL
, mode64
);
4182 UInt r_srcR
= immR
? (-1)/*bogus*/ :
4183 iregEnc(srcR
->Prh
.Reg
.reg
, mode64
);
4185 switch (i
->Pin
.Alu
.op
) {
4188 /* addi (PPC32 p350) */
4189 vassert(srcR
->Prh
.Imm
.syned
);
4190 vassert(srcR
->Prh
.Imm
.imm16
!= 0x8000);
4191 p
= mkFormD(p
, 14, r_dst
, r_srcL
, srcR
->Prh
.Imm
.imm16
, endness_host
);
4193 /* add (PPC32 p347) */
4194 p
= mkFormXO(p
, 31, r_dst
, r_srcL
, r_srcR
, 0, 266, 0, endness_host
);
4200 /* addi (PPC32 p350), but with negated imm */
4201 vassert(srcR
->Prh
.Imm
.syned
);
4202 vassert(srcR
->Prh
.Imm
.imm16
!= 0x8000);
4203 p
= mkFormD(p
, 14, r_dst
, r_srcL
, (- srcR
->Prh
.Imm
.imm16
),
4206 /* subf (PPC32 p537), with args the "wrong" way round */
4207 p
= mkFormXO(p
, 31, r_dst
, r_srcR
, r_srcL
, 0, 40, 0, endness_host
);
4213 /* andi. (PPC32 p358) */
4214 vassert(!srcR
->Prh
.Imm
.syned
);
4215 p
= mkFormD(p
, 28, r_srcL
, r_dst
, srcR
->Prh
.Imm
.imm16
, endness_host
);
4217 /* and (PPC32 p356) */
4218 p
= mkFormX(p
, 31, r_srcL
, r_dst
, r_srcR
, 28, 0, endness_host
);
4224 /* ori (PPC32 p497) */
4225 vassert(!srcR
->Prh
.Imm
.syned
);
4226 p
= mkFormD(p
, 24, r_srcL
, r_dst
, srcR
->Prh
.Imm
.imm16
, endness_host
);
4228 /* or (PPC32 p495) */
4229 p
= mkFormX(p
, 31, r_srcL
, r_dst
, r_srcR
, 444, 0, endness_host
);
4235 /* xori (PPC32 p550) */
4236 vassert(!srcR
->Prh
.Imm
.syned
);
4237 p
= mkFormD(p
, 26, r_srcL
, r_dst
, srcR
->Prh
.Imm
.imm16
, endness_host
);
4239 /* xor (PPC32 p549) */
4240 p
= mkFormX(p
, 31, r_srcL
, r_dst
, r_srcR
, 316, 0, endness_host
);
4251 PPCRH
* srcR
= i
->Pin
.Shft
.srcR
;
4252 Bool sz32
= i
->Pin
.Shft
.sz32
;
4253 Bool immR
= toBool(srcR
->tag
== Prh_Imm
);
4254 UInt r_dst
= iregEnc(i
->Pin
.Shft
.dst
, mode64
);
4255 UInt r_srcL
= iregEnc(i
->Pin
.Shft
.srcL
, mode64
);
4256 UInt r_srcR
= immR
? (-1)/*bogus*/ :
4257 iregEnc(srcR
->Prh
.Reg
.reg
, mode64
);
4261 switch (i
->Pin
.Shft
.op
) {
4265 /* rd = rs << n, 1 <= n <= 31
4267 rlwinm rd,rs,n,0,31-n (PPC32 p501)
4269 UInt n
= srcR
->Prh
.Imm
.imm16
;
4270 vassert(!srcR
->Prh
.Imm
.syned
);
4271 vassert(n
> 0 && n
< 32);
4272 p
= mkFormM(p
, 21, r_srcL
, r_dst
, n
, 0, 31-n
, 0, endness_host
);
4274 /* slw (PPC32 p505) */
4275 p
= mkFormX(p
, 31, r_srcL
, r_dst
, r_srcR
, 24, 0, endness_host
);
4279 /* rd = rs << n, 1 <= n <= 63
4281 rldicr rd,rs,n,63-n (PPC64 p559)
4283 UInt n
= srcR
->Prh
.Imm
.imm16
;
4284 vassert(!srcR
->Prh
.Imm
.syned
);
4285 vassert(n
> 0 && n
< 64);
4286 p
= mkFormMD(p
, 30, r_srcL
, r_dst
, n
, 63-n
, 1, endness_host
);
4288 /* sld (PPC64 p568) */
4289 p
= mkFormX(p
, 31, r_srcL
, r_dst
, r_srcR
, 27, 0, endness_host
);
4297 /* rd = rs >>u n, 1 <= n <= 31
4299 rlwinm rd,rs,32-n,n,31 (PPC32 p501)
4301 UInt n
= srcR
->Prh
.Imm
.imm16
;
4302 vassert(!srcR
->Prh
.Imm
.syned
);
4303 vassert(n
> 0 && n
< 32);
4304 p
= mkFormM(p
, 21, r_srcL
, r_dst
, 32-n
, n
, 31, 0, endness_host
);
4306 /* srw (PPC32 p508) */
4307 p
= mkFormX(p
, 31, r_srcL
, r_dst
, r_srcR
, 536, 0, endness_host
);
4311 /* rd = rs >>u n, 1 <= n <= 63
4313 rldicl rd,rs,64-n,n (PPC64 p558)
4315 UInt n
= srcR
->Prh
.Imm
.imm16
;
4316 vassert(!srcR
->Prh
.Imm
.syned
);
4317 vassert(n
> 0 && n
< 64);
4318 p
= mkFormMD(p
, 30, r_srcL
, r_dst
, 64-n
, n
, 0, endness_host
);
4320 /* srd (PPC64 p574) */
4321 p
= mkFormX(p
, 31, r_srcL
, r_dst
, r_srcR
, 539, 0, endness_host
);
4329 /* srawi (PPC32 p507) */
4330 UInt n
= srcR
->Prh
.Imm
.imm16
;
4331 vassert(!srcR
->Prh
.Imm
.syned
);
4332 /* In 64-bit mode, we allow right shifts by zero bits
4333 as that is a handy way to sign extend the lower 32
4334 bits into the upper 32 bits. */
4338 vassert(n
> 0 && n
< 32);
4339 p
= mkFormX(p
, 31, r_srcL
, r_dst
, n
, 824, 0, endness_host
);
4341 /* sraw (PPC32 p506) */
4342 p
= mkFormX(p
, 31, r_srcL
, r_dst
, r_srcR
, 792, 0, endness_host
);
4346 /* sradi (PPC64 p571) */
4347 UInt n
= srcR
->Prh
.Imm
.imm16
;
4348 vassert(!srcR
->Prh
.Imm
.syned
);
4349 vassert(n
> 0 && n
< 64);
4350 p
= mkFormXS(p
, 31, r_srcL
, r_dst
, n
, 413, 0, endness_host
);
4352 /* srad (PPC32 p570) */
4353 p
= mkFormX(p
, 31, r_srcL
, r_dst
, r_srcR
, 794, 0, endness_host
);
4365 Bool isAdd
= i
->Pin
.AddSubC
.isAdd
;
4366 Bool setC
= i
->Pin
.AddSubC
.setC
;
4367 UInt r_srcL
= iregEnc(i
->Pin
.AddSubC
.srcL
, mode64
);
4368 UInt r_srcR
= iregEnc(i
->Pin
.AddSubC
.srcR
, mode64
);
4369 UInt r_dst
= iregEnc(i
->Pin
.AddSubC
.dst
, mode64
);
4372 if (setC
) /* addc (PPC32 p348) */
4373 p
= mkFormXO(p
, 31, r_dst
, r_srcL
, r_srcR
, 0, 10, 0, endness_host
);
4374 else /* adde (PPC32 p349) */
4375 p
= mkFormXO(p
, 31, r_dst
, r_srcL
, r_srcR
, 0, 138, 0, endness_host
);
4377 /* subfX, with args the "wrong" way round */
4378 if (setC
) /* subfc (PPC32 p538) */
4379 p
= mkFormXO(p
, 31, r_dst
, r_srcR
, r_srcL
, 0, 8, 0, endness_host
);
4380 else /* subfe (PPC32 p539) */
4381 p
= mkFormXO(p
, 31, r_dst
, r_srcR
, r_srcL
, 0, 136, 0, endness_host
);
4387 Bool syned
= i
->Pin
.Cmp
.syned
;
4388 Bool sz32
= i
->Pin
.Cmp
.sz32
;
4389 UInt fld1
= i
->Pin
.Cmp
.crfD
<< 2;
4390 UInt r_srcL
= iregEnc(i
->Pin
.Cmp
.srcL
, mode64
);
4391 UInt r_srcR
, imm_srcR
;
4392 PPCRH
* srcR
= i
->Pin
.Cmp
.srcR
;
4394 if (!mode64
) // cmp double word invalid for mode32
4396 else if (!sz32
) // mode64 && cmp64: set L=1
4399 switch (srcR
->tag
) {
4401 vassert(syned
== srcR
->Prh
.Imm
.syned
);
4402 imm_srcR
= srcR
->Prh
.Imm
.imm16
;
4403 if (syned
) { // cmpw/di (signed) (PPC32 p368)
4404 vassert(imm_srcR
!= 0x8000);
4405 p
= mkFormD(p
, 11, fld1
, r_srcL
, imm_srcR
, endness_host
);
4406 } else { // cmplw/di (unsigned) (PPC32 p370)
4407 p
= mkFormD(p
, 10, fld1
, r_srcL
, imm_srcR
, endness_host
);
4411 r_srcR
= iregEnc(srcR
->Prh
.Reg
.reg
, mode64
);
4412 if (syned
) // cmpwi (signed) (PPC32 p367)
4413 p
= mkFormX(p
, 31, fld1
, r_srcL
, r_srcR
, 0, 0, endness_host
);
4414 else // cmplwi (unsigned) (PPC32 p379)
4415 p
= mkFormX(p
, 31, fld1
, r_srcL
, r_srcR
, 32, 0, endness_host
);
4424 UInt r_dst
= iregEnc(i
->Pin
.Unary
.dst
, mode64
);
4425 UInt r_src
= iregEnc(i
->Pin
.Unary
.src
, mode64
);
4427 switch (i
->Pin
.Unary
.op
) {
4428 case Pun_NOT
: // nor r_dst,r_src,r_src
4429 p
= mkFormX(p
, 31, r_src
, r_dst
, r_src
, 124, 0, endness_host
);
4431 case Pun_NEG
: // neg r_dst,r_src
4432 p
= mkFormXO(p
, 31, r_dst
, r_src
, 0, 0, 104, 0, endness_host
);
4434 case Pun_CLZ32
: // cntlzw r_dst, r_src
4435 p
= mkFormX(p
, 31, r_src
, r_dst
, 0, 26, 0, endness_host
);
4437 case Pun_CLZ64
: // cntlzd r_dst, r_src
4439 p
= mkFormX(p
, 31, r_src
, r_dst
, 0, 58, 0, endness_host
);
4441 case Pun_EXTSW
: // extsw r_dst, r_src
4443 p
= mkFormX(p
, 31, r_src
, r_dst
, 0, 986, 0, endness_host
);
4445 case Pun_POP32
: // popcntw r_dst, r_src
4446 p
= mkFormX(p
, 31, r_src
, r_dst
, 0, 378, 0, endness_host
);
4448 case Pun_POP64
: // popcntd r_dst, r_src
4450 p
= mkFormX(p
, 31, r_src
, r_dst
, 0, 506, 0, endness_host
);
4459 Bool syned
= i
->Pin
.MulL
.syned
;
4460 Bool sz32
= i
->Pin
.MulL
.sz32
;
4461 UInt r_dst
= iregEnc(i
->Pin
.MulL
.dst
, mode64
);
4462 UInt r_srcL
= iregEnc(i
->Pin
.MulL
.srcL
, mode64
);
4463 UInt r_srcR
= iregEnc(i
->Pin
.MulL
.srcR
, mode64
);
4468 if (i
->Pin
.MulL
.hi
) {
4469 // mul hi words, must consider sign
4471 if (syned
) // mulhw r_dst,r_srcL,r_srcR
4472 p
= mkFormXO(p
, 31, r_dst
, r_srcL
, r_srcR
, 0, 75, 0,
4474 else // mulhwu r_dst,r_srcL,r_srcR
4475 p
= mkFormXO(p
, 31, r_dst
, r_srcL
, r_srcR
, 0, 11, 0,
4478 if (syned
) // mulhd r_dst,r_srcL,r_srcR
4479 p
= mkFormXO(p
, 31, r_dst
, r_srcL
, r_srcR
, 0, 73, 0,
4481 else // mulhdu r_dst,r_srcL,r_srcR
4482 p
= mkFormXO(p
, 31, r_dst
, r_srcL
, r_srcR
, 0, 9, 0, endness_host
);
4485 // mul low word, sign is irrelevant
4486 vassert(!i
->Pin
.MulL
.syned
);
4487 if (sz32
) // mullw r_dst,r_srcL,r_srcR
4488 p
= mkFormXO(p
, 31, r_dst
, r_srcL
, r_srcR
, 0, 235, 0, endness_host
);
4489 else // mulld r_dst,r_srcL,r_srcR
4490 p
= mkFormXO(p
, 31, r_dst
, r_srcL
, r_srcR
, 0, 233, 0, endness_host
);
4496 Bool syned
= i
->Pin
.Div
.syned
;
4497 Bool sz32
= i
->Pin
.Div
.sz32
;
4498 UInt r_dst
= iregEnc(i
->Pin
.Div
.dst
, mode64
);
4499 UInt r_srcL
= iregEnc(i
->Pin
.Div
.srcL
, mode64
);
4500 UInt r_srcR
= iregEnc(i
->Pin
.Div
.srcR
, mode64
);
4505 if (i
->Pin
.Div
.extended
) {
4508 // divwe r_dst,r_srcL,r_srcR
4509 p
= mkFormXO(p
, 31, r_dst
, r_srcL
, r_srcR
, 0, 427, 0,
4512 // divweu r_dst,r_srcL,r_srcR
4513 p
= mkFormXO(p
, 31, r_dst
, r_srcL
, r_srcR
, 0, 395, 0,
4517 // divde r_dst,r_srcL,r_srcR
4518 p
= mkFormXO(p
, 31, r_dst
, r_srcL
, r_srcR
, 0, 425, 0,
4521 // divdeu r_dst,r_srcL,r_srcR
4522 p
= mkFormXO(p
, 31, r_dst
, r_srcL
, r_srcR
, 0, 393, 0,
4526 if (syned
) // divw r_dst,r_srcL,r_srcR
4527 p
= mkFormXO(p
, 31, r_dst
, r_srcL
, r_srcR
, 0, 491, 0, endness_host
);
4528 else // divwu r_dst,r_srcL,r_srcR
4529 p
= mkFormXO(p
, 31, r_dst
, r_srcL
, r_srcR
, 0, 459, 0, endness_host
);
4531 if (syned
) // divd r_dst,r_srcL,r_srcR
4532 p
= mkFormXO(p
, 31, r_dst
, r_srcL
, r_srcR
, 0, 489, 0, endness_host
);
4533 else // divdu r_dst,r_srcL,r_srcR
4534 p
= mkFormXO(p
, 31, r_dst
, r_srcL
, r_srcR
, 0, 457, 0, endness_host
);
4540 if (i
->Pin
.Call
.cond
.test
!= Pct_ALWAYS
4541 && i
->Pin
.Call
.rloc
.pri
!= RLPri_None
) {
4542 /* The call might not happen (it isn't unconditional) and it
4543 returns a result. In this case we will need to generate a
4544 control flow diamond to put 0x555..555 in the return
4545 register(s) in the case where the call doesn't happen. If
4546 this ever becomes necessary, maybe copy code from the ARM
4547 equivalent. Until that day, just give up. */
4550 PPCCondCode cond
= i
->Pin
.Call
.cond
;
4552 /* As per detailed comment for Pin_Call in
4553 getRegUsage_PPCInstr above, %r10 is used as an address temp */
4555 /* jump over the following insns if condition does not hold */
4557 if (cond
.test
!= Pct_ALWAYS
) {
4558 /* jmp fwds if !condition */
4559 /* don't know how many bytes to jump over yet...
4560 make space for a jump instruction and fill in later. */
4561 ptmp
= p
; /* fill in this bit later */
4565 /* load target to r_dst */ // p += 4|8|20
4566 p
= mkLoadImm(p
, r_dst
, i
->Pin
.Call
.target
, mode64
, endness_host
);
4568 /* mtspr 9,r_dst => move r_dst to count register */
4569 p
= mkFormXFX(p
, r_dst
, 9, 467, endness_host
); // p += 4
4571 /* bctrl => branch to count register (and save to lr) */
4572 p
= mkFormXL(p
, 19, Pct_ALWAYS
, 0, 0, 528, 1, endness_host
); // p += 4
4574 /* Fix up the conditional jump, if there was one. */
4575 if (cond
.test
!= Pct_ALWAYS
) {
4576 Int delta
= p
- ptmp
;
4577 vassert(delta
>= 16 && delta
<= 32);
4578 /* bc !ct,cf,delta */
4579 mkFormB(ptmp
, invertCondTest(cond
.test
),
4580 cond
.flag
, (delta
>>2), 0, 0, endness_host
);
4586 /* NB: what goes on here has to be very closely coordinated
4587 with the chainXDirect_PPC and unchainXDirect_PPC below. */
4588 /* We're generating chain-me requests here, so we need to be
4589 sure this is actually allowed -- no-redir translations
4590 can't use chain-me's. Hence: */
4591 vassert(disp_cp_chain_me_to_slowEP
!= NULL
);
4592 vassert(disp_cp_chain_me_to_fastEP
!= NULL
);
4594 /* First off, if this is conditional, create a conditional jump
4595 over the rest of it. Or at least, leave a space for it that
4596 we will shortly fill in. */
4598 if (i
->Pin
.XDirect
.cond
.test
!= Pct_ALWAYS
) {
4599 vassert(i
->Pin
.XDirect
.cond
.flag
!= Pcf_NONE
);
4603 vassert(i
->Pin
.XDirect
.cond
.flag
== Pcf_NONE
);
4606 /* Update the guest CIA. */
4607 /* imm32/64 r30, dstGA */
4608 if (!mode64
) vassert(0 == (((ULong
)i
->Pin
.XDirect
.dstGA
) >> 32));
4609 p
= mkLoadImm(p
, /*r*/30, (ULong
)i
->Pin
.XDirect
.dstGA
, mode64
,
4611 /* stw/std r30, amCIA */
4612 p
= do_load_or_store_machine_word(
4613 p
, False
/*!isLoad*/,
4614 /*r*/30, i
->Pin
.XDirect
.amCIA
, mode64
, endness_host
4617 /* --- FIRST PATCHABLE BYTE follows --- */
4618 /* VG_(disp_cp_chain_me_to_{slowEP,fastEP}) (where we're calling
4619 to) backs up the return address, so as to find the address of
4620 the first patchable byte. So: don't change the number of
4621 instructions (32-bit: 4, 64-bit: 7) below. */
4622 /* imm32/64-fixed r30, VG_(disp_cp_chain_me_to_{slowEP,fastEP} */
4623 const void* disp_cp_chain_me
4624 = i
->Pin
.XDirect
.toFastEP
? disp_cp_chain_me_to_fastEP
4625 : disp_cp_chain_me_to_slowEP
;
4626 p
= mkLoadImm_EXACTLY2or5(
4627 p
, /*r*/30, (Addr
)disp_cp_chain_me
, mode64
, endness_host
);
4629 p
= mkFormXFX(p
, /*r*/30, 9, 467, endness_host
);
4631 p
= mkFormXL(p
, 19, Pct_ALWAYS
, 0, 0, 528, 1, endness_host
);
4632 /* --- END of PATCHABLE BYTES --- */
4634 /* Fix up the conditional jump, if there was one. */
4635 if (i
->Pin
.XDirect
.cond
.test
!= Pct_ALWAYS
) {
4636 Int delta
= p
- ptmp
;
4637 vassert(delta
>= 16 && delta
<= 64 && 0 == (delta
& 3));
4638 /* bc !ct,cf,delta */
4639 mkFormB(ptmp
, invertCondTest(i
->Pin
.XDirect
.cond
.test
),
4640 i
->Pin
.XDirect
.cond
.flag
, (delta
>>2), 0, 0, endness_host
);
4646 /* We're generating transfers that could lead indirectly to a
4647 chain-me, so we need to be sure this is actually allowed --
4648 no-redir translations are not allowed to reach normal
4649 translations without going through the scheduler. That means
4650 no XDirects or XIndirs out from no-redir translations.
4652 vassert(disp_cp_xindir
!= NULL
);
4654 /* First off, if this is conditional, create a conditional jump
4655 over the rest of it. Or at least, leave a space for it that
4656 we will shortly fill in. */
4658 if (i
->Pin
.XIndir
.cond
.test
!= Pct_ALWAYS
) {
4659 vassert(i
->Pin
.XIndir
.cond
.flag
!= Pcf_NONE
);
4663 vassert(i
->Pin
.XIndir
.cond
.flag
== Pcf_NONE
);
4666 /* Update the guest CIA. */
4667 /* stw/std r-dstGA, amCIA */
4668 p
= do_load_or_store_machine_word(
4669 p
, False
/*!isLoad*/,
4670 iregEnc(i
->Pin
.XIndir
.dstGA
, mode64
),
4671 i
->Pin
.XIndir
.amCIA
, mode64
, endness_host
4674 /* imm32/64 r30, VG_(disp_cp_xindir) */
4675 p
= mkLoadImm(p
, /*r*/30, (ULong
)(Addr
)disp_cp_xindir
, mode64
,
4678 p
= mkFormXFX(p
, /*r*/30, 9, 467, endness_host
);
4680 p
= mkFormXL(p
, 19, Pct_ALWAYS
, 0, 0, 528, 0, endness_host
);
4682 /* Fix up the conditional jump, if there was one. */
4683 if (i
->Pin
.XIndir
.cond
.test
!= Pct_ALWAYS
) {
4684 Int delta
= p
- ptmp
;
4685 vassert(delta
>= 16 && delta
<= 32 && 0 == (delta
& 3));
4686 /* bc !ct,cf,delta */
4687 mkFormB(ptmp
, invertCondTest(i
->Pin
.XIndir
.cond
.test
),
4688 i
->Pin
.XIndir
.cond
.flag
, (delta
>>2), 0, 0, endness_host
);
4693 case Pin_XAssisted
: {
4694 /* First off, if this is conditional, create a conditional jump
4695 over the rest of it. Or at least, leave a space for it that
4696 we will shortly fill in. */
4698 if (i
->Pin
.XAssisted
.cond
.test
!= Pct_ALWAYS
) {
4699 vassert(i
->Pin
.XAssisted
.cond
.flag
!= Pcf_NONE
);
4703 vassert(i
->Pin
.XAssisted
.cond
.flag
== Pcf_NONE
);
4706 /* Update the guest CIA. */
4707 /* stw/std r-dstGA, amCIA */
4708 p
= do_load_or_store_machine_word(
4709 p
, False
/*!isLoad*/,
4710 iregEnc(i
->Pin
.XIndir
.dstGA
, mode64
),
4711 i
->Pin
.XIndir
.amCIA
, mode64
, endness_host
4714 /* imm32/64 r31, $magic_number */
4716 switch (i
->Pin
.XAssisted
.jk
) {
4717 case Ijk_ClientReq
: trcval
= VEX_TRC_JMP_CLIENTREQ
; break;
4718 case Ijk_Sys_syscall
: trcval
= VEX_TRC_JMP_SYS_SYSCALL
; break;
4719 //case Ijk_Sys_int128: trcval = VEX_TRC_JMP_SYS_INT128; break;
4720 //case Ijk_Yield: trcval = VEX_TRC_JMP_YIELD; break;
4721 case Ijk_EmWarn
: trcval
= VEX_TRC_JMP_EMWARN
; break;
4722 case Ijk_EmFail
: trcval
= VEX_TRC_JMP_EMFAIL
; break;
4723 //case Ijk_MapFail: trcval = VEX_TRC_JMP_MAPFAIL; break;
4724 case Ijk_NoDecode
: trcval
= VEX_TRC_JMP_NODECODE
; break;
4725 case Ijk_InvalICache
: trcval
= VEX_TRC_JMP_INVALICACHE
; break;
4726 case Ijk_NoRedir
: trcval
= VEX_TRC_JMP_NOREDIR
; break;
4727 case Ijk_SigTRAP
: trcval
= VEX_TRC_JMP_SIGTRAP
; break;
4728 //case Ijk_SigSEGV: trcval = VEX_TRC_JMP_SIGSEGV; break;
4729 case Ijk_SigBUS
: trcval
= VEX_TRC_JMP_SIGBUS
; break;
4730 case Ijk_Boring
: trcval
= VEX_TRC_JMP_BORING
; break;
4731 /* We don't expect to see the following being assisted. */
4736 ppIRJumpKind(i
->Pin
.XAssisted
.jk
);
4737 vpanic("emit_ARMInstr.Pin_XAssisted: unexpected jump kind");
4739 vassert(trcval
!= 0);
4740 p
= mkLoadImm(p
, /*r*/31, trcval
, mode64
, endness_host
);
4742 /* imm32/64 r30, VG_(disp_cp_xassisted) */
4743 p
= mkLoadImm(p
, /*r*/30,
4744 (ULong
)(Addr
)disp_cp_xassisted
, mode64
,
4747 p
= mkFormXFX(p
, /*r*/30, 9, 467, endness_host
);
4749 p
= mkFormXL(p
, 19, Pct_ALWAYS
, 0, 0, 528, 0, endness_host
);
4751 /* Fix up the conditional jump, if there was one. */
4752 if (i
->Pin
.XAssisted
.cond
.test
!= Pct_ALWAYS
) {
4753 Int delta
= p
- ptmp
;
4754 vassert(delta
>= 16 && delta
<= 32 && 0 == (delta
& 3));
4755 /* bc !ct,cf,delta */
4756 mkFormB(ptmp
, invertCondTest(i
->Pin
.XAssisted
.cond
.test
),
4757 i
->Pin
.XAssisted
.cond
.flag
, (delta
>>2), 0, 0, endness_host
);
4766 vassert(i
->Pin
.CMov
.cond
.test
!= Pct_ALWAYS
);
4768 r_dst
= iregEnc(i
->Pin
.CMov
.dst
, mode64
);
4769 cond
= i
->Pin
.CMov
.cond
;
4771 /* branch (if cond fails) over move instrs */
4773 if (cond
.test
!= Pct_ALWAYS
) {
4774 /* don't know how many bytes to jump over yet...
4775 make space for a jump instruction and fill in later. */
4776 ptmp
= p
; /* fill in this bit later */
4780 // cond true: move src => dst
4781 switch (i
->Pin
.CMov
.src
->tag
) {
4783 imm_src
= i
->Pin
.CMov
.src
->Pri
.Imm
;
4784 p
= mkLoadImm(p
, r_dst
, imm_src
, mode64
, endness_host
); // p += 4|8|20
4787 r_src
= iregEnc(i
->Pin
.CMov
.src
->Pri
.Reg
, mode64
);
4788 p
= mkMoveReg(p
, r_dst
, r_src
, endness_host
); // p += 4
4793 /* Fix up the conditional jump, if there was one. */
4794 if (cond
.test
!= Pct_ALWAYS
) {
4795 Int delta
= p
- ptmp
;
4796 vassert(delta
>= 8 && delta
<= 24);
4797 /* bc !ct,cf,delta */
4798 mkFormB(ptmp
, invertCondTest(cond
.test
),
4799 cond
.flag
, (delta
>>2), 0, 0, endness_host
);
4805 PPCAMode
* am_addr
= i
->Pin
.Load
.src
;
4806 UInt r_dst
= iregEnc(i
->Pin
.Load
.dst
, mode64
);
4807 UInt opc1
, opc2
, sz
= i
->Pin
.Load
.sz
;
4808 switch (am_addr
->tag
) {
4810 if (mode64
&& (sz
== 4 || sz
== 8)) {
4811 /* should be guaranteed to us by iselWordExpr_AMode */
4812 vassert(0 == (am_addr
->Pam
.IR
.index
& 3));
4815 case 1: opc1
= 34; break;
4816 case 2: opc1
= 40; break;
4817 case 4: opc1
= 32; break;
4818 case 8: opc1
= 58; vassert(mode64
); break;
4821 p
= doAMode_IR(p
, opc1
, r_dst
, am_addr
, mode64
, endness_host
);
4825 case 1: opc2
= 87; break;
4826 case 2: opc2
= 279; break;
4827 case 4: opc2
= 23; break;
4828 case 8: opc2
= 21; vassert(mode64
); break;
4831 p
= doAMode_RR(p
, 31, opc2
, r_dst
, am_addr
, mode64
, endness_host
);
4839 if (i
->Pin
.LoadL
.sz
== 1) {
4840 p
= mkFormX(p
, 31, iregEnc(i
->Pin
.LoadL
.dst
, mode64
),
4841 0, iregEnc(i
->Pin
.LoadL
.src
, mode64
), 52, 0, endness_host
);
4844 if (i
->Pin
.LoadL
.sz
== 2) {
4845 p
= mkFormX(p
, 31, iregEnc(i
->Pin
.LoadL
.dst
, mode64
),
4846 0, iregEnc(i
->Pin
.LoadL
.src
, mode64
), 116, 0, endness_host
);
4849 if (i
->Pin
.LoadL
.sz
== 4) {
4850 p
= mkFormX(p
, 31, iregEnc(i
->Pin
.LoadL
.dst
, mode64
),
4851 0, iregEnc(i
->Pin
.LoadL
.src
, mode64
), 20, 0, endness_host
);
4854 if (i
->Pin
.LoadL
.sz
== 8 && mode64
) {
4855 p
= mkFormX(p
, 31, iregEnc(i
->Pin
.LoadL
.dst
, mode64
),
4856 0, iregEnc(i
->Pin
.LoadL
.src
, mode64
), 84, 0, endness_host
);
4863 /* Make the destination register be 1 or 0, depending on whether
4864 the relevant condition holds. */
4865 UInt r_dst
= iregEnc(i
->Pin
.Set
.dst
, mode64
);
4866 PPCCondCode cond
= i
->Pin
.Set
.cond
;
4867 UInt rot_imm
, r_tmp
;
4869 if (cond
.test
== Pct_ALWAYS
) {
4870 // Just load 1 to dst => li dst,1
4871 p
= mkFormD(p
, 14, r_dst
, 0, 1, endness_host
);
4873 vassert(cond
.flag
!= Pcf_NONE
);
4874 rot_imm
= 1 + cond
.flag
;
4875 r_tmp
= 0; // Not set in getAllocable, so no need to declare.
4877 // r_tmp = CR => mfcr r_tmp
4878 p
= mkFormX(p
, 31, r_tmp
, 0, 0, 19, 0, endness_host
);
4880 // r_dst = flag (rotate left and mask)
4881 // => rlwinm r_dst,r_tmp,rot_imm,31,31
4882 p
= mkFormM(p
, 21, r_tmp
, r_dst
, rot_imm
, 31, 31, 0, endness_host
);
4884 if (cond
.test
== Pct_FALSE
) {
4885 // flip bit => xori r_dst,r_dst,1
4886 p
= mkFormD(p
, 26, r_dst
, r_dst
, 1, endness_host
);
4894 p
= mkFormX(p
, 31, iregEnc(i
->Pin
.MfCR
.dst
, mode64
), 0, 0, 19, 0,
4899 p
= mkFormX(p
, 31, 0, 0, 0, 598, 0, endness_host
); // sync, PPC32 p616
4900 // CAB: Should this be isync?
4901 // p = mkFormXL(p, 19, 0, 0, 0, 150, 0); // isync, PPC32 p467
4906 PPCAMode
* am_addr
= i
->Pin
.Store
.dst
;
4907 UInt r_src
= iregEnc(i
->Pin
.Store
.src
, mode64
);
4908 UInt opc1
, opc2
, sz
= i
->Pin
.Store
.sz
;
4909 switch (i
->Pin
.Store
.dst
->tag
) {
4911 if (mode64
&& (sz
== 4 || sz
== 8)) {
4912 /* should be guaranteed to us by iselWordExpr_AMode */
4913 vassert(0 == (am_addr
->Pam
.IR
.index
& 3));
4916 case 1: opc1
= 38; break;
4917 case 2: opc1
= 44; break;
4918 case 4: opc1
= 36; break;
4919 case 8: vassert(mode64
);
4924 p
= doAMode_IR(p
, opc1
, r_src
, am_addr
, mode64
, endness_host
);
4928 case 1: opc2
= 215; break;
4929 case 2: opc2
= 407; break;
4930 case 4: opc2
= 151; break;
4931 case 8: vassert(mode64
);
4936 p
= doAMode_RR(p
, 31, opc2
, r_src
, am_addr
, mode64
, endness_host
);
4941 // PJF Coverity may be right but I'd reather keep the unreachable code
4942 // "just in case" that conditions above ever change
4943 // coverity[UNREACHABLE:FALSE]
4948 if (i
->Pin
.StoreC
.sz
== 1) {
4949 p
= mkFormX(p
, 31, iregEnc(i
->Pin
.StoreC
.src
, mode64
),
4950 0, iregEnc(i
->Pin
.StoreC
.dst
, mode64
), 694, 1, endness_host
);
4953 if (i
->Pin
.StoreC
.sz
== 2) {
4954 p
= mkFormX(p
, 31, iregEnc(i
->Pin
.StoreC
.src
, mode64
),
4955 0, iregEnc(i
->Pin
.StoreC
.dst
, mode64
), 726, 1, endness_host
);
4959 if (i
->Pin
.StoreC
.sz
== 4) {
4960 p
= mkFormX(p
, 31, iregEnc(i
->Pin
.StoreC
.src
, mode64
),
4961 0, iregEnc(i
->Pin
.StoreC
.dst
, mode64
), 150, 1, endness_host
);
4964 if (i
->Pin
.StoreC
.sz
== 8 && mode64
) {
4965 p
= mkFormX(p
, 31, iregEnc(i
->Pin
.StoreC
.src
, mode64
),
4966 0, iregEnc(i
->Pin
.StoreC
.dst
, mode64
), 214, 1, endness_host
);
4973 UInt fr_dst
= fregEnc(i
->Pin
.FpUnary
.dst
);
4974 UInt fr_src
= fregEnc(i
->Pin
.FpUnary
.src
);
4975 switch (i
->Pin
.FpUnary
.op
) {
4976 case Pfp_RSQRTE
: // frsqrtre, PPC32 p424
4977 p
= mkFormA( p
, 63, fr_dst
, 0, fr_src
, 0, 26, 0, endness_host
);
4979 case Pfp_RES
: // fres, PPC32 p421
4980 p
= mkFormA( p
, 59, fr_dst
, 0, fr_src
, 0, 24, 0, endness_host
);
4982 case Pfp_SQRT
: // fsqrt, PPC32 p427
4983 p
= mkFormA( p
, 63, fr_dst
, 0, fr_src
, 0, 22, 0, endness_host
);
4985 case Pfp_ABS
: // fabs, PPC32 p399
4986 p
= mkFormX(p
, 63, fr_dst
, 0, fr_src
, 264, 0, endness_host
);
4988 case Pfp_NEG
: // fneg, PPC32 p416
4989 p
= mkFormX(p
, 63, fr_dst
, 0, fr_src
, 40, 0, endness_host
);
4991 case Pfp_MOV
: // fmr, PPC32 p410
4992 p
= mkFormX(p
, 63, fr_dst
, 0, fr_src
, 72, 0, endness_host
);
4994 case Pfp_FRIM
: // frim, PPC ISA 2.05 p137
4995 p
= mkFormX(p
, 63, fr_dst
, 0, fr_src
, 488, 0, endness_host
);
4997 case Pfp_FRIP
: // frip, PPC ISA 2.05 p137
4998 p
= mkFormX(p
, 63, fr_dst
, 0, fr_src
, 456, 0, endness_host
);
5000 case Pfp_FRIN
: // frin, PPC ISA 2.05 p137
5001 p
= mkFormX(p
, 63, fr_dst
, 0, fr_src
, 392, 0, endness_host
);
5003 case Pfp_FRIZ
: // friz, PPC ISA 2.05 p137
5004 p
= mkFormX(p
, 63, fr_dst
, 0, fr_src
, 424, 0, endness_host
);
5012 case Pin_FpBinary
: {
5013 UInt fr_dst
= fregEnc(i
->Pin
.FpBinary
.dst
);
5014 UInt fr_srcL
= fregEnc(i
->Pin
.FpBinary
.srcL
);
5015 UInt fr_srcR
= fregEnc(i
->Pin
.FpBinary
.srcR
);
5016 switch (i
->Pin
.FpBinary
.op
) {
5017 case Pfp_ADDD
: // fadd, PPC32 p400
5018 p
= mkFormA( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 0, 21, 0, endness_host
);
5020 case Pfp_ADDS
: // fadds, PPC32 p401
5021 p
= mkFormA( p
, 59, fr_dst
, fr_srcL
, fr_srcR
, 0, 21, 0, endness_host
);
5023 case Pfp_SUBD
: // fsub, PPC32 p429
5024 p
= mkFormA( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 0, 20, 0, endness_host
);
5026 case Pfp_SUBS
: // fsubs, PPC32 p430
5027 p
= mkFormA( p
, 59, fr_dst
, fr_srcL
, fr_srcR
, 0, 20, 0, endness_host
);
5029 case Pfp_MULD
: // fmul, PPC32 p413
5030 p
= mkFormA( p
, 63, fr_dst
, fr_srcL
, 0, fr_srcR
, 25, 0, endness_host
);
5032 case Pfp_MULS
: // fmuls, PPC32 p414
5033 p
= mkFormA( p
, 59, fr_dst
, fr_srcL
, 0, fr_srcR
, 25, 0, endness_host
);
5035 case Pfp_DIVD
: // fdiv, PPC32 p406
5036 p
= mkFormA( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 0, 18, 0, endness_host
);
5038 case Pfp_DIVS
: // fdivs, PPC32 p407
5039 p
= mkFormA( p
, 59, fr_dst
, fr_srcL
, fr_srcR
, 0, 18, 0, endness_host
);
5047 case Pin_Fp128Unary
: {
5048 /* Note Fp128 instructions use the vector scalar registers. The register
5049 * mapping for the V128 type assumes the a vector instruction. The
5050 * PPC hardware has a single register file that the vector scalar
5051 * registers and the vector registers map to. The 32 vector
5052 * registers instructions map to the same registers as the vector
5053 * scalar registers 32 to 63. mkFormVXR0 does the needed
5056 UInt fr_dst
= vregEnc(i
->Pin
.Fp128Unary
.dst
);
5057 UInt fr_src
= vregEnc(i
->Pin
.Fp128Unary
.src
);
5059 switch (i
->Pin
.Fp128Unary
.op
) {
5060 case Pfp_FPSQRTQ
: // xssqrtqp, use rounding specified by RN
5061 p
= mkFormVXR0( p
, 63, fr_dst
, 27, fr_src
, 804, 0, endness_host
);
5063 case Pfp_FPSQRTQRNDODD
: // xssqrtqpo, use rounding specified by RN
5064 p
= mkFormVXR0( p
, 63, fr_dst
, 27, fr_src
, 804, 1, endness_host
);
5066 case Pfp_FPQTOD
: // xscvqpdp, use rounding specified by RN
5067 p
= mkFormVXR0( p
, 63, fr_dst
, 20, fr_src
, 836, 0, endness_host
);
5069 case Pfp_FPQTODRNDODD
: // xscvqpdpo, use rounding specified by RN
5070 p
= mkFormVXR0( p
, 63, fr_dst
, 20, fr_src
, 836, 1, endness_host
);
5072 case Pfp_FPDTOQ
: // xscvdpqp
5073 p
= mkFormVXR0( p
, 63, fr_dst
, 22, fr_src
, 836, 0, endness_host
);
5075 case Pfp_IDSTOQ
: // xscvsdqp
5076 p
= mkFormVXR0( p
, 63, fr_dst
, 10, fr_src
, 836, 0, endness_host
);
5078 case Pfp_IDUTOQ
: // xscvudqp
5079 p
= mkFormVXR0( p
, 63, fr_dst
, 2, fr_src
, 836, 0, endness_host
);
5081 case Pfp_IQSTOQ
: // xscvsqqp
5082 p
= mkFormVXR0( p
, 63, fr_dst
, 11, fr_src
, 836, 0, endness_host
);
5084 case Pfp_IQUTOQ
: // xscvuqqp
5085 p
= mkFormVXR0( p
, 63, fr_dst
, 3, fr_src
, 836, 0, endness_host
);
5087 case Pfp_TRUNCFPQTOISQ
: // xscvqpsqz
5088 p
= mkFormVXR0( p
, 63, fr_dst
, 8, fr_src
, 836, 0, endness_host
);
5090 case Pfp_TRUNCFPQTOISD
: // xscvqpsdz
5091 p
= mkFormVXR0( p
, 63, fr_dst
, 25, fr_src
, 836, 0, endness_host
);
5093 case Pfp_TRUNCFPQTOISW
: // xscvqpswz
5094 p
= mkFormVXR0( p
, 63, fr_dst
, 9, fr_src
, 836, 0, endness_host
);
5096 case Pfp_TRUNCFPQTOIUQ
: // xscvqpuqz
5097 p
= mkFormVXR0( p
, 63, fr_dst
, 0, fr_src
, 836, 0, endness_host
);
5099 case Pfp_TRUNCFPQTOIUD
: // xscvqpudz
5100 p
= mkFormVXR0( p
, 63, fr_dst
, 17, fr_src
, 836, 0, endness_host
);
5102 case Pfp_TRUNCFPQTOIUW
: // xscvqpuwz
5103 p
= mkFormVXR0( p
, 63, fr_dst
, 1, fr_src
, 836, 0, endness_host
);
5111 case Pin_Fp128Binary
: {
5112 /* Note Fp128 instructions use the vector registers */
5113 UInt fr_dst
= vregEnc(i
->Pin
.Fp128Binary
.dst
);
5114 UInt fr_srcL
= vregEnc(i
->Pin
.Fp128Binary
.srcL
);
5115 UInt fr_srcR
= vregEnc(i
->Pin
.Fp128Binary
.srcR
);
5117 /* Note this issues a Vector scalar instruction. The register
5118 * mapping for the V128 type assumes the a vector instruction. The
5119 * PPC hardware has a single register file that the vector scalar
5120 * registers and the vector registers map to. The 32 vector
5121 * registers instructions map to the same registers as the vector
5122 * scalar registers 32 to 63. For these instructions the HW adds
5123 * 32 to the register numbers to access the VSRR register. No need
5124 * to adjust the numbers to map to the VR register that contians the
5128 switch (i
->Pin
.Fp128Binary
.op
) {
5129 case Pfp_FPADDQ
: // xsaddqp, use rounding specified by RN
5130 p
= mkFormVXR0( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 4, 0, endness_host
);
5132 case Pfp_FPADDQRNDODD
: // xsaddqpo, round to odd
5133 p
= mkFormVXR0( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 4, 1, endness_host
);
5135 case Pfp_FPSUBQ
: // xssubqp, use rounding specified by RN
5136 p
= mkFormVXR0( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 516, 0, endness_host
);
5138 case Pfp_FPSUBQRNDODD
: // xssubqpo, round to odd
5139 p
= mkFormVXR0( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 516, 1, endness_host
);
5141 case Pfp_FPMULQ
: // xsmulqp, use rounding specified by RN
5142 p
= mkFormVXR0( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 36, 0, endness_host
);
5144 case Pfp_FPMULQRNDODD
: // xsmulqpo, round to odd
5145 p
= mkFormVXR0( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 36, 1, endness_host
);
5147 case Pfp_FPDIVQ
: // xsdivqp, use rounding specified by RN
5148 p
= mkFormVXR0( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 548, 0, endness_host
);
5150 case Pfp_FPDIVQRNDODD
: // xsdivqpo, round to odd
5151 p
= mkFormVXR0( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 548, 1, endness_host
);
5153 case Pfp_FPMULADDQ
: // xsmaddqp, use rounding specified by RN
5154 p
= mkFormVXR0( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 388, 0, endness_host
);
5156 case Pfp_FPMULADDQRNDODD
: // xsmaddqpo, round to odd
5157 p
= mkFormVXR0( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 388, 1, endness_host
);
5159 case Pfp_FPMULSUBQ
: // xsmsubqp, use rounding specified by RN
5160 p
= mkFormVXR0( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 420, 0, endness_host
);
5162 case Pfp_FPMULSUBQRNDODD
: // xsmsubsqpo, round to odd
5163 p
= mkFormVXR0( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 420, 1, endness_host
);
5165 case Pfp_FPNEGMULADDQ
: // xsnmaddqp, use rounding specified by RN
5166 p
= mkFormVXR0( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 452, 0, endness_host
);
5168 case Pfp_FPNEGMULADDQRNDODD
: // xsnmaddqpo, round to odd
5169 p
= mkFormVXR0( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 452, 1, endness_host
);
5171 case Pfp_FPNEGMULSUBQ
: // xsnmsubqp, use rounding specified by RN
5172 p
= mkFormVXR0( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 484, 0, endness_host
);
5174 case Pfp_FPNEGMULSUBQRNDODD
: // xsnmsubsqpo, round to odd
5175 p
= mkFormVXR0( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 484, 1, endness_host
);
5183 case Pin_Fp128Ternary
: {
5184 /* Note Fp128 instructions use the vector registers */
5185 UInt fr_dst
= vregEnc(i
->Pin
.Fp128Binary
.dst
);
5186 UInt fr_srcL
= vregEnc(i
->Pin
.Fp128Binary
.srcL
);
5187 UInt fr_srcR
= vregEnc(i
->Pin
.Fp128Binary
.srcR
);
5189 /* Note this issues a Vector scalar instruction. The register
5190 * mapping for the V128 type assumes the a vector instruction. The
5191 * PPC hardware has a single register file that the vector scalar
5192 * registers and the vector registers map to. The 32 vector
5193 * registers instructions map to the same registers as the vector
5194 * scalar registers 32 to 63. For these instructions the HW adds
5195 * 32 to the register numbers to access the VSRR register. No need
5196 * to adjust the numbers to map to the VR register that contians the
5200 switch (i
->Pin
.Fp128Binary
.op
) {
5201 case Pfp_FPMULADDQ
: // xsmaddqp, use rounding specified by RN
5202 p
= mkFormVXR0( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 388, 0, endness_host
);
5204 case Pfp_FPMULADDQRNDODD
: // xsmaddqpo, round to odd
5205 p
= mkFormVXR0( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 388, 1, endness_host
);
5207 case Pfp_FPMULSUBQ
: // xsmsubqp, use rounding specified by RN
5208 p
= mkFormVXR0( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 420, 0, endness_host
);
5210 case Pfp_FPMULSUBQRNDODD
: // xsmsubsqpo, round to odd
5211 p
= mkFormVXR0( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 420, 1, endness_host
);
5213 case Pfp_FPNEGMULADDQ
: // xsnmaddqp, use rounding specified by RN
5214 p
= mkFormVXR0( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 452, 0, endness_host
);
5216 case Pfp_FPNEGMULADDQRNDODD
: // xsnmaddqpo, round to odd
5217 p
= mkFormVXR0( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 452, 1, endness_host
);
5219 case Pfp_FPNEGMULSUBQ
: // xsnmsubqp, use rounding specified by RN
5220 p
= mkFormVXR0( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 484, 0, endness_host
);
5222 case Pfp_FPNEGMULSUBQRNDODD
: // xsnmsubsqpo, round to odd
5223 p
= mkFormVXR0( p
, 63, fr_dst
, fr_srcL
, fr_srcR
, 484, 1, endness_host
);
5231 case Pin_FpMulAcc
: {
5232 UInt fr_dst
= fregEnc(i
->Pin
.FpMulAcc
.dst
);
5233 UInt fr_srcML
= fregEnc(i
->Pin
.FpMulAcc
.srcML
);
5234 UInt fr_srcMR
= fregEnc(i
->Pin
.FpMulAcc
.srcMR
);
5235 UInt fr_srcAcc
= fregEnc(i
->Pin
.FpMulAcc
.srcAcc
);
5236 switch (i
->Pin
.FpMulAcc
.op
) {
5237 case Pfp_MADDD
: // fmadd, PPC32 p408
5238 p
= mkFormA( p
, 63, fr_dst
, fr_srcML
, fr_srcAcc
, fr_srcMR
, 29, 0,
5241 case Pfp_MADDS
: // fmadds, PPC32 p409
5242 p
= mkFormA( p
, 59, fr_dst
, fr_srcML
, fr_srcAcc
, fr_srcMR
, 29, 0,
5245 case Pfp_MSUBD
: // fmsub, PPC32 p411
5246 p
= mkFormA( p
, 63, fr_dst
, fr_srcML
, fr_srcAcc
, fr_srcMR
, 28, 0,
5249 case Pfp_MSUBS
: // fmsubs, PPC32 p412
5250 p
= mkFormA( p
, 59, fr_dst
, fr_srcML
, fr_srcAcc
, fr_srcMR
, 28, 0,
5260 PPCAMode
* am_addr
= i
->Pin
.FpLdSt
.addr
;
5261 UInt f_reg
= fregEnc(i
->Pin
.FpLdSt
.reg
);
5262 Bool idxd
= toBool(i
->Pin
.FpLdSt
.addr
->tag
== Pam_RR
);
5263 UChar sz
= i
->Pin
.FpLdSt
.sz
;
5265 vassert(sz
== 4 || sz
== 8);
5267 if (i
->Pin
.FpLdSt
.isLoad
) { // Load from memory
5268 if (idxd
) { // lf[s|d]x, PPC32 p444|440
5269 opc
= (sz
== 4) ? 535 : 599;
5270 p
= doAMode_RR(p
, 31, opc
, f_reg
, am_addr
, mode64
, endness_host
);
5271 } else { // lf[s|d], PPC32 p441|437
5272 opc
= (sz
== 4) ? 48 : 50;
5273 p
= doAMode_IR(p
, opc
, f_reg
, am_addr
, mode64
, endness_host
);
5275 } else { // Store to memory
5276 if (idxd
) { // stf[s|d]x, PPC32 p521|516
5277 opc
= (sz
== 4) ? 663 : 727;
5278 p
= doAMode_RR(p
, 31, opc
, f_reg
, am_addr
, mode64
, endness_host
);
5279 } else { // stf[s|d], PPC32 p518|513
5280 opc
= (sz
== 4) ? 52 : 54;
5281 p
= doAMode_IR(p
, opc
, f_reg
, am_addr
, mode64
, endness_host
);
5288 UInt ir_addr
= iregEnc(i
->Pin
.FpSTFIW
.addr
, mode64
);
5289 UInt fr_data
= fregEnc(i
->Pin
.FpSTFIW
.data
);
5290 // stfiwx (store fp64[lo32] as int32), PPC32 p517
5291 // Use rA==0, so that EA == rB == ir_addr
5292 p
= mkFormX(p
, 31, fr_data
, 0/*rA=0*/, ir_addr
, 983, 0, endness_host
);
5297 UInt fr_dst
= fregEnc(i
->Pin
.FpRSP
.dst
);
5298 UInt fr_src
= fregEnc(i
->Pin
.FpRSP
.src
);
5300 p
= mkFormX(p
, 63, fr_dst
, 0, fr_src
, 12, 0, endness_host
);
5305 UInt fr_dst
= fregEnc(i
->Pin
.FpCftI
.dst
);
5306 UInt fr_src
= fregEnc(i
->Pin
.FpCftI
.src
);
5307 if (i
->Pin
.FpCftI
.fromI
== False
&& i
->Pin
.FpCftI
.int32
== True
) {
5308 if (i
->Pin
.FpCftI
.syned
== True
) {
5309 // fctiw (conv f64 to i32), PPC32 p404
5310 p
= mkFormX(p
, 63, fr_dst
, 0, fr_src
, 14, 0, endness_host
);
5313 // fctiwu (conv f64 to u32)
5314 p
= mkFormX(p
, 63, fr_dst
, 0, fr_src
, 142, 0, endness_host
);
5318 if (i
->Pin
.FpCftI
.fromI
== False
&& i
->Pin
.FpCftI
.int32
== False
) {
5319 if (i
->Pin
.FpCftI
.syned
== True
) {
5320 // fctid (conv f64 to i64), PPC64 p437
5321 p
= mkFormX(p
, 63, fr_dst
, 0, fr_src
, 814, 0, endness_host
);
5324 // fctidu (conv f64 to u64)
5325 p
= mkFormX(p
, 63, fr_dst
, 0, fr_src
, 942, 0, endness_host
);
5329 if (i
->Pin
.FpCftI
.fromI
== True
&& i
->Pin
.FpCftI
.int32
== False
) {
5330 if (i
->Pin
.FpCftI
.syned
== True
) {
5331 // fcfid (conv i64 to f64), PPC64 p434
5332 p
= mkFormX(p
, 63, fr_dst
, 0, fr_src
, 846, 0, endness_host
);
5334 } else if (i
->Pin
.FpCftI
.flt64
== True
) {
5335 // fcfidu (conv u64 to f64)
5336 p
= mkFormX(p
, 63, fr_dst
, 0, fr_src
, 974, 0, endness_host
);
5339 // fcfidus (conv u64 to f32)
5340 p
= mkFormX(p
, 59, fr_dst
, 0, fr_src
, 974, 0, endness_host
);
5348 UInt fr_dst
= fregEnc(i
->Pin
.FpCMov
.dst
);
5349 UInt fr_src
= fregEnc(i
->Pin
.FpCMov
.src
);
5350 PPCCondCode cc
= i
->Pin
.FpCMov
.cond
;
5352 if (fr_dst
== fr_src
) goto done
;
5354 vassert(cc
.test
!= Pct_ALWAYS
);
5356 /* jmp fwds if !condition */
5357 if (cc
.test
!= Pct_ALWAYS
) {
5358 /* bc !ct,cf,n_bytes>>2 */
5359 p
= mkFormB(p
, invertCondTest(cc
.test
), cc
.flag
, 8>>2, 0, 0,
5364 p
= mkFormX(p
, 63, fr_dst
, 0, fr_src
, 72, 0, endness_host
);
5368 case Pin_FpLdFPSCR
: {
5369 UInt fr_src
= fregEnc(i
->Pin
.FpLdFPSCR
.src
);
5370 p
= mkFormXFL(p
, 0xFF, fr_src
, i
->Pin
.FpLdFPSCR
.dfp_rm
, endness_host
); // mtfsf, PPC32 p480
5376 UInt r_dst
= iregEnc(i
->Pin
.FpCmp
.dst
, mode64
);
5377 UInt fr_srcL
= fregEnc(i
->Pin
.FpCmp
.srcL
);
5378 UInt fr_srcR
= fregEnc(i
->Pin
.FpCmp
.srcR
);
5380 // fcmpo, PPC32 p402
5381 p
= mkFormX(p
, 63, crfD
<<2, fr_srcL
, fr_srcR
, 32, 0, endness_host
);
5383 // mfcr (mv CR to r_dst), PPC32 p467
5384 p
= mkFormX(p
, 31, r_dst
, 0, 0, 19, 0, endness_host
);
5386 // rlwinm r_dst,r_dst,8,28,31, PPC32 p501
5387 // => rotate field 1 to bottomw of word, masking out upper 28
5388 p
= mkFormM(p
, 21, r_dst
, r_dst
, 8, 28, 31, 0, endness_host
);
5393 UInt reg
= iregEnc(i
->Pin
.RdWrLR
.gpr
, mode64
);
5394 /* wrLR==True ? mtlr r4 : mflr r4 */
5395 p
= mkFormXFX(p
, reg
, 8, (i
->Pin
.RdWrLR
.wrLR
==True
) ? 467 : 339,
5403 UInt opc2
, v_reg
, r_idx
, r_base
;
5404 UChar sz
= i
->Pin
.AvLdSt
.sz
;
5405 Bool idxd
= toBool(i
->Pin
.AvLdSt
.addr
->tag
== Pam_RR
);
5406 vassert(sz
== 1 || sz
== 2 || sz
== 4 || sz
== 16);
5408 v_reg
= vregEnc(i
->Pin
.AvLdSt
.reg
);
5409 r_base
= iregEnc(i
->Pin
.AvLdSt
.addr
->Pam
.RR
.base
, mode64
);
5411 // Only have AltiVec AMode_RR: kludge AMode_IR
5413 r_idx
= 30; // XXX: Using r30 as temp
5414 p
= mkLoadImm(p
, r_idx
,
5415 i
->Pin
.AvLdSt
.addr
->Pam
.IR
.index
, mode64
, endness_host
);
5417 r_idx
= iregEnc(i
->Pin
.AvLdSt
.addr
->Pam
.RR
.index
, mode64
);
5420 if (i
->Pin
.FpLdSt
.isLoad
) { // Load from memory (1,2,4,16)
5421 opc2
= (sz
==1) ? 7 : (sz
==2) ? 39 : (sz
==4) ? 71 : 103;
5422 p
= mkFormX(p
, 31, v_reg
, r_idx
, r_base
, opc2
, 0, endness_host
);
5423 } else { // Store to memory (1,2,4,16)
5424 opc2
= (sz
==1) ? 135 : (sz
==2) ? 167 : (sz
==4) ? 199 : 231;
5425 p
= mkFormX(p
, 31, v_reg
, r_idx
, r_base
, opc2
, 0, endness_host
);
5431 UInt v_dst
= vregEnc(i
->Pin
.AvUnary
.dst
);
5432 UInt v_src
= vregEnc(i
->Pin
.AvUnary
.src
);
5433 UInt opc2
= 0xFFFFFFFF, opc3
= 0xFFFFFFFF; /* invalid */
5435 switch (i
->Pin
.AvUnary
.op
) {
5436 case Pav_MOV
: opc2
= 1156; break; // vor vD,vS,vS
5437 case Pav_NOT
: opc2
= 1284; break; // vnor vD,vS,vS
5438 case Pav_UNPCKH8S
: opc2
= 526; break; // vupkhsb
5439 case Pav_UNPCKH16S
: opc2
= 590; break; // vupkhsh
5440 case Pav_UNPCKL8S
: opc2
= 654; break; // vupklsb
5441 case Pav_UNPCKL16S
: opc2
= 718; break; // vupklsh
5442 case Pav_UNPCKHPIX
: opc2
= 846; break; // vupkhpx
5443 case Pav_UNPCKLPIX
: opc2
= 974; break; // vupklpx
5445 case Pav_ZEROCNTBYTE
: opc2
= 1794; break; // vclzb
5446 case Pav_ZEROCNTHALF
: opc2
= 1858; break; // vclzh
5447 case Pav_ZEROCNTWORD
: opc2
= 1922; break; // vclzw
5448 case Pav_ZEROCNTDBL
: opc2
= 1986; break; // vclzd
5449 case Pav_TRAILINGZEROCNTBYTE
: opc2
= 1538; break; // vctzb
5450 case Pav_TRAILINGZEROCNTHALF
: opc2
= 1538; break; // vctzh
5451 case Pav_TRAILINGZEROCNTWORD
: opc2
= 1538; break; // vctzw
5452 case Pav_TRAILINGZEROCNTDBL
: opc2
= 1538; break; // vctzd
5453 case Pav_BITMTXXPOSE
: opc2
= 1292; break; // vgbbd
5454 case Pav_BCD128toI128S
: opc2
= 385; break; //bcdctsq.
5455 case Pav_MulI128by10
: opc2
= 513; break; // vmul10uq
5456 case Pav_MulI128by10Carry
: opc2
= 1; break; // vmul10cuq
5457 case Pav_F16toF64x2
: opc2
= 347; opc3
= 16; break; // xvcvhpdp
5458 case Pav_F64toF16x2
: opc2
= 347; opc3
= 17; break; // xvcvdphp
5459 case Pav_F16toF32x4
: opc2
= 475; opc3
= 24; break; // xvcvhpsp
5460 case Pav_F32toF16x4
: opc2
= 475; opc3
= 25; break; // xvcvsphp
5465 switch (i
->Pin
.AvUnary
.op
) {
5468 p
= mkFormVX( p
, 4, v_dst
, v_src
, v_src
, opc2
, endness_host
);
5470 case Pav_F16toF32x4
:
5472 /* I64 source has four 16-bit float values in the upper 64-bit
5473 * of the source vector register, lower 64-bits are undefined.
5475 /* Scatter the four F16 values in the Vector register */
5476 p
= mkFormVX( p
, 4, v_dst
, 0, v_src
, 590, endness_host
);// vupkhsh
5478 /* The layout of the vector register is now: S0F0 S1F1 S2F2 S3F3
5479 * where S is the sign extension of the 16-bit F value. We don't
5480 * care about the extended signs.
5483 /* Input, in v_dst, is now correct for the xvcvhpsp instruction */
5484 p
= mkFormVX_BX_TX( p
, 60, v_dst
, opc3
, v_dst
, opc2
,
5488 case Pav_F64toF16x2
:
5489 case Pav_F16toF64x2
:
5490 case Pav_F32toF16x4
:
5491 /* Note this issues a Vector scalar instruction. The register
5492 * mapping for the V128 type assumes the a vector instruction. The
5493 * PPC hardware has a single register file that the vector scalar
5494 * registers and the vector registers map to. The 32 vector registers
5495 * instructions map to the same registers as the vector scalar
5496 * registers 32 to 63. mkFormVX_BX_TX does the needed adjustment.
5498 p
= mkFormVX_BX_TX( p
, 60, v_dst
, opc3
, v_src
, opc2
, endness_host
);
5500 case Pav_BCD128toI128S
: // bcdctsq
5501 p
= mkFormVX( p
, 4, v_dst
, 0, v_src
, (1<<10 | 385), endness_host
);
5503 case Pav_MulI128by10
:
5504 case Pav_MulI128by10Carry
:
5505 p
= mkFormVX( p
, 4, v_dst
, v_src
, 0, opc2
, endness_host
);
5507 case Pav_TRAILINGZEROCNTBYTE
:
5508 p
= mkFormVX( p
, 4, v_dst
, 28, v_src
, opc2
, endness_host
);
5510 case Pav_TRAILINGZEROCNTHALF
:
5511 p
= mkFormVX( p
, 4, v_dst
, 29, v_src
, opc2
, endness_host
);
5513 case Pav_TRAILINGZEROCNTWORD
:
5514 p
= mkFormVX( p
, 4, v_dst
, 30, v_src
, opc2
, endness_host
);
5516 case Pav_TRAILINGZEROCNTDBL
:
5517 p
= mkFormVX( p
, 4, v_dst
, 31, v_src
, opc2
, endness_host
);
5520 p
= mkFormVX( p
, 4, v_dst
, 0, v_src
, opc2
, endness_host
);
5526 case Pin_AvBinary
: {
5527 UInt v_dst
= vregEnc(i
->Pin
.AvBinary
.dst
);
5528 UInt v_srcL
= vregEnc(i
->Pin
.AvBinary
.srcL
);
5529 UInt v_srcR
= vregEnc(i
->Pin
.AvBinary
.srcR
);
5531 if (i
->Pin
.AvBinary
.op
== Pav_SHL
) {
5532 p
= mkFormVX( p
, 4, v_dst
, v_srcL
, v_srcR
, 1036, endness_host
); // vslo
5533 p
= mkFormVX( p
, 4, v_dst
, v_dst
, v_srcR
, 452, endness_host
); // vsl
5536 if (i
->Pin
.AvBinary
.op
== Pav_SHR
) {
5537 p
= mkFormVX( p
, 4, v_dst
, v_srcL
, v_srcR
, 1100, endness_host
); // vsro
5538 p
= mkFormVX( p
, 4, v_dst
, v_dst
, v_srcR
, 708, endness_host
); // vsr
5541 switch (i
->Pin
.AvBinary
.op
) {
5543 case Pav_AND
: opc2
= 1028; break; // vand
5544 case Pav_OR
: opc2
= 1156; break; // vor
5545 case Pav_XOR
: opc2
= 1220; break; // vxor
5547 case Pav_MulI128by10E
: opc2
= 577; break; // vmul10euq
5548 case Pav_MulI128by10ECarry
: opc2
= 65; break; // vmul10ecuq
5552 p
= mkFormVX( p
, 4, v_dst
, v_srcL
, v_srcR
, opc2
, endness_host
);
5556 case Pin_AvBinaryInt
: {
5557 UInt ps
= i
->Pin
.AvBinaryInt
.val
->Pri
.Imm
;
5558 UInt dst
= vregEnc(i
->Pin
.AvBinaryInt
.dst
);
5559 UInt src
= vregEnc(i
->Pin
.AvBinaryInt
.src
);
5561 switch (i
->Pin
.AvBinaryInt
.op
) {
5563 case Pav_I128StoBCD128
: // bcdcfsq
5565 /* v_srcR actually contains the value of the one-bit ps field */
5567 p
= mkFormVX( p
, 4, dst
, 2, src
,
5568 (1 << 10 | (ps
<< 9) | opc2
), endness_host
);
5572 case Pav_F128toI128S
: // xsrqpi, xsrqpix
5576 UInt R
= (ps
>> 3) & 0x1;
5577 UInt RMC
= (ps
>> 1) & 0x3;
5578 /* Note this issues a Vector scalar instruction. The register
5579 * mapping for the V128 type assumes the a vector instruction. The
5580 * PPC hardware has a single register file that the vector scalar
5581 * registers and the vector registers map to. The 32 vector
5582 * registers instructions map to the same registers as the vector
5583 * scalar registers 32 to 63. For these instructions the HW adds
5584 * 32 to the register numbers to access the VSRR register. No need
5585 * to adjust the numbers to map to the VR register that contians
5588 p
= mkFormVSXRND( p
, 63, R
, dst
, src
, RMC
, opc2
, EX
,
5593 case Pav_ROUNDFPQ
: // xsrqpxp
5597 UInt RMC
= (ps
>> 1) & 0x3;
5598 UInt R
= (ps
>> 3) & 0x1;
5599 p
= mkFormVSXRND( p
, 63, R
, dst
, src
, RMC
, opc2
, EX
,
5611 case Pin_AvBinaryInt128
: {
5612 UInt dst
= vregEnc(i
->Pin
.AvBinaryInt128
.dst
);
5613 UInt src1
= vregEnc(i
->Pin
.AvBinaryInt128
.src1
);
5614 UInt src2
= vregEnc(i
->Pin
.AvBinaryInt128
.src2
);
5617 switch (i
->Pin
.AvBinaryInt128
.op
) {
5618 case Pav_DivS128
: opc2
= 267; break; //vdivsq
5619 case Pav_DivU128
: opc2
= 11; break; //vdivuq
5620 case Pav_DivU128E
: opc2
= 523; break; //vdiveuq
5621 case Pav_DivS128E
: opc2
= 779; break; //vdivesq
5622 case Pav_ModS128
: opc2
= 1803; break; //vmodsq
5623 case Pav_ModU128
: opc2
= 1547; break; //vmoduq
5628 p
= mkFormVX( p
, 4, dst
, src1
, src2
, opc2
, endness_host
);
5632 case Pin_AvTernaryInt128
: {
5633 UInt dst
= vregEnc(i
->Pin
.AvTernaryInt128
.dst
);
5634 UInt src1
= vregEnc(i
->Pin
.AvTernaryInt128
.src1
);
5635 UInt src2
= vregEnc(i
->Pin
.AvTernaryInt128
.src2
);
5636 UInt src3
= vregEnc(i
->Pin
.AvTernaryInt128
.src3
);
5639 switch (i
->Pin
.AvTernaryInt128
.op
) {
5640 case Pav_2xMultU64Add128CarryOut
: opc2
= 23; break; //vsumcud
5645 p
= mkFormVA( p
, 4, dst
, src1
, src2
, src3
, opc2
, endness_host
);
5649 case Pin_AvBin8x16
: {
5650 UInt v_dst
= vregEnc(i
->Pin
.AvBin8x16
.dst
);
5651 UInt v_srcL
= vregEnc(i
->Pin
.AvBin8x16
.srcL
);
5652 UInt v_srcR
= vregEnc(i
->Pin
.AvBin8x16
.srcR
);
5654 switch (i
->Pin
.AvBin8x16
.op
) {
5656 case Pav_ADDU
: opc2
= 0; break; // vaddubm
5657 case Pav_QADDU
: opc2
= 512; break; // vaddubs
5658 case Pav_QADDS
: opc2
= 768; break; // vaddsbs
5660 case Pav_SUBU
: opc2
= 1024; break; // vsububm
5661 case Pav_QSUBU
: opc2
= 1536; break; // vsububs
5662 case Pav_QSUBS
: opc2
= 1792; break; // vsubsbs
5664 case Pav_OMULU
: opc2
= 8; break; // vmuloub
5665 case Pav_OMULS
: opc2
= 264; break; // vmulosb
5666 case Pav_EMULU
: opc2
= 520; break; // vmuleub
5667 case Pav_EMULS
: opc2
= 776; break; // vmulesb
5669 case Pav_AVGU
: opc2
= 1026; break; // vavgub
5670 case Pav_AVGS
: opc2
= 1282; break; // vavgsb
5671 case Pav_MAXU
: opc2
= 2; break; // vmaxub
5672 case Pav_MAXS
: opc2
= 258; break; // vmaxsb
5673 case Pav_MINU
: opc2
= 514; break; // vminub
5674 case Pav_MINS
: opc2
= 770; break; // vminsb
5676 case Pav_CMPEQU
: opc2
= 6; break; // vcmpequb
5677 case Pav_CMPGTU
: opc2
= 518; break; // vcmpgtub
5678 case Pav_CMPGTS
: opc2
= 774; break; // vcmpgtsb
5680 case Pav_SHL
: opc2
= 260; break; // vslb
5681 case Pav_SHR
: opc2
= 516; break; // vsrb
5682 case Pav_SAR
: opc2
= 772; break; // vsrab
5683 case Pav_ROTL
: opc2
= 4; break; // vrlb
5685 case Pav_MRGHI
: opc2
= 12; break; // vmrghb
5686 case Pav_MRGLO
: opc2
= 268; break; // vmrglb
5688 case Pav_POLYMULADD
: opc2
= 1032; break; // vpmsumb
5693 p
= mkFormVX( p
, 4, v_dst
, v_srcL
, v_srcR
, opc2
, endness_host
);
5697 case Pin_AvBin16x8
: {
5698 UInt v_dst
= vregEnc(i
->Pin
.AvBin16x8
.dst
);
5699 UInt v_srcL
= vregEnc(i
->Pin
.AvBin16x8
.srcL
);
5700 UInt v_srcR
= vregEnc(i
->Pin
.AvBin16x8
.srcR
);
5702 switch (i
->Pin
.AvBin16x8
.op
) {
5704 case Pav_ADDU
: opc2
= 64; break; // vadduhm
5705 case Pav_QADDU
: opc2
= 576; break; // vadduhs
5706 case Pav_QADDS
: opc2
= 832; break; // vaddshs
5708 case Pav_SUBU
: opc2
= 1088; break; // vsubuhm
5709 case Pav_QSUBU
: opc2
= 1600; break; // vsubuhs
5710 case Pav_QSUBS
: opc2
= 1856; break; // vsubshs
5712 case Pav_OMULU
: opc2
= 72; break; // vmulouh
5713 case Pav_OMULS
: opc2
= 328; break; // vmulosh
5714 case Pav_EMULU
: opc2
= 584; break; // vmuleuh
5715 case Pav_EMULS
: opc2
= 840; break; // vmulesh
5717 case Pav_AVGU
: opc2
= 1090; break; // vavguh
5718 case Pav_AVGS
: opc2
= 1346; break; // vavgsh
5719 case Pav_MAXU
: opc2
= 66; break; // vmaxuh
5720 case Pav_MAXS
: opc2
= 322; break; // vmaxsh
5721 case Pav_MINS
: opc2
= 834; break; // vminsh
5722 case Pav_MINU
: opc2
= 578; break; // vminuh
5724 case Pav_CMPEQU
: opc2
= 70; break; // vcmpequh
5725 case Pav_CMPGTU
: opc2
= 582; break; // vcmpgtuh
5726 case Pav_CMPGTS
: opc2
= 838; break; // vcmpgtsh
5728 case Pav_SHL
: opc2
= 324; break; // vslh
5729 case Pav_SHR
: opc2
= 580; break; // vsrh
5730 case Pav_SAR
: opc2
= 836; break; // vsrah
5731 case Pav_ROTL
: opc2
= 68; break; // vrlh
5733 case Pav_PACKUU
: opc2
= 14; break; // vpkuhum
5734 case Pav_QPACKUU
: opc2
= 142; break; // vpkuhus
5735 case Pav_QPACKSU
: opc2
= 270; break; // vpkshus
5736 case Pav_QPACKSS
: opc2
= 398; break; // vpkshss
5737 case Pav_PACKPXL
: opc2
= 782; break; // vpkpx
5739 case Pav_MRGHI
: opc2
= 76; break; // vmrghh
5740 case Pav_MRGLO
: opc2
= 332; break; // vmrglh
5742 case Pav_POLYMULADD
: opc2
= 1224; break; // vpmsumh
5747 p
= mkFormVX( p
, 4, v_dst
, v_srcL
, v_srcR
, opc2
, endness_host
);
5751 case Pin_AvBin32x4
: {
5752 UInt v_dst
= vregEnc(i
->Pin
.AvBin32x4
.dst
);
5753 UInt v_srcL
= vregEnc(i
->Pin
.AvBin32x4
.srcL
);
5754 UInt v_srcR
= vregEnc(i
->Pin
.AvBin32x4
.srcR
);
5756 switch (i
->Pin
.AvBin32x4
.op
) {
5758 case Pav_ADDU
: opc2
= 128; break; // vadduwm
5759 case Pav_QADDU
: opc2
= 640; break; // vadduws
5760 case Pav_QADDS
: opc2
= 896; break; // vaddsws
5762 case Pav_SUBU
: opc2
= 1152; break; // vsubuwm
5763 case Pav_QSUBU
: opc2
= 1664; break; // vsubuws
5764 case Pav_QSUBS
: opc2
= 1920; break; // vsubsws
5766 case Pav_MULU
: opc2
= 137; break; // vmuluwm
5767 case Pav_OMULU
: opc2
= 136; break; // vmulouw
5768 case Pav_OMULS
: opc2
= 392; break; // vmulosw
5769 case Pav_EMULU
: opc2
= 648; break; // vmuleuw
5770 case Pav_EMULS
: opc2
= 904; break; // vmulesw
5772 case Pav_AVGU
: opc2
= 1154; break; // vavguw
5773 case Pav_AVGS
: opc2
= 1410; break; // vavgsw
5775 case Pav_MAXU
: opc2
= 130; break; // vmaxuw
5776 case Pav_MAXS
: opc2
= 386; break; // vmaxsw
5778 case Pav_MINS
: opc2
= 898; break; // vminsw
5779 case Pav_MINU
: opc2
= 642; break; // vminuw
5781 case Pav_CMPEQU
: opc2
= 134; break; // vcmpequw
5782 case Pav_CMPGTS
: opc2
= 902; break; // vcmpgtsw
5783 case Pav_CMPGTU
: opc2
= 646; break; // vcmpgtuw
5785 case Pav_SHL
: opc2
= 388; break; // vslw
5786 case Pav_SHR
: opc2
= 644; break; // vsrw
5787 case Pav_SAR
: opc2
= 900; break; // vsraw
5788 case Pav_ROTL
: opc2
= 132; break; // vrlw
5790 case Pav_PACKUU
: opc2
= 78; break; // vpkuwum
5791 case Pav_QPACKUU
: opc2
= 206; break; // vpkuwus
5792 case Pav_QPACKSU
: opc2
= 334; break; // vpkswus
5793 case Pav_QPACKSS
: opc2
= 462; break; // vpkswss
5795 case Pav_MRGHI
: opc2
= 140; break; // vmrghw
5796 case Pav_MRGLO
: opc2
= 396; break; // vmrglw
5798 case Pav_CATODD
: opc2
= 1676; break; // vmrgow
5799 case Pav_CATEVEN
: opc2
= 1932; break; // vmrgew
5801 case Pav_POLYMULADD
: opc2
= 1160; break; // vpmsumw
5806 p
= mkFormVX( p
, 4, v_dst
, v_srcL
, v_srcR
, opc2
, endness_host
);
5810 case Pin_AvBin64x2
: {
5811 UInt v_dst
= vregEnc(i
->Pin
.AvBin64x2
.dst
);
5812 UInt v_srcL
= vregEnc(i
->Pin
.AvBin64x2
.srcL
);
5813 UInt v_srcR
= vregEnc(i
->Pin
.AvBin64x2
.srcR
);
5815 switch (i
->Pin
.AvBin64x2
.op
) {
5816 case Pav_ADDU
: opc2
= 192; break; // vaddudm vector double add
5817 case Pav_SUBU
: opc2
= 1216; break; // vsubudm vector double add
5818 case Pav_MAXU
: opc2
= 194; break; // vmaxud vector double max
5819 case Pav_MAXS
: opc2
= 450; break; // vmaxsd vector double max
5820 case Pav_MINU
: opc2
= 706; break; // vminud vector double min
5821 case Pav_MINS
: opc2
= 962; break; // vminsd vector double min
5822 case Pav_CMPEQU
: opc2
= 199; break; // vcmpequd vector double compare
5823 case Pav_CMPGTU
: opc2
= 711; break; // vcmpgtud vector double compare
5824 case Pav_CMPGTS
: opc2
= 967; break; // vcmpgtsd vector double compare
5825 case Pav_SHL
: opc2
= 1476; break; // vsld
5826 case Pav_SHR
: opc2
= 1732; break; // vsrd
5827 case Pav_SAR
: opc2
= 964; break; // vsrad
5828 case Pav_ROTL
: opc2
= 196; break; // vrld
5829 case Pav_PACKUU
: opc2
= 1102; break; // vpkudum
5830 case Pav_QPACKUU
: opc2
= 1230; break; // vpkudus, vpksdus (emulated)
5831 case Pav_QPACKSS
: opc2
= 1486; break; // vpksdsm
5832 case Pav_MRGHI
: opc2
= 1614; break; // vmrghw
5833 case Pav_MRGLO
: opc2
= 1742; break; // vmrglw
5834 case Pav_POLYMULADD
: opc2
= 1096; break; // vpmsumd
5838 p
= mkFormVX( p
, 4, v_dst
, v_srcL
, v_srcR
, opc2
, endness_host
);
5841 case Pin_AvCipherV128Unary
: {
5842 UInt v_dst
= vregEnc(i
->Pin
.AvCipherV128Unary
.dst
);
5843 UInt v_src
= vregEnc(i
->Pin
.AvCipherV128Unary
.src
);
5845 switch (i
->Pin
.AvCipherV128Unary
.op
) {
5846 case Pav_CIPHERSUBV128
: opc2
= 1480; break; // vsbox
5850 p
= mkFormVX( p
, 4, v_dst
, v_src
, 0, opc2
, endness_host
);
5853 case Pin_AvCipherV128Binary
: {
5854 UInt v_dst
= vregEnc(i
->Pin
.AvCipherV128Binary
.dst
);
5855 UInt v_srcL
= vregEnc(i
->Pin
.AvCipherV128Binary
.srcL
);
5856 UInt v_srcR
= vregEnc(i
->Pin
.AvCipherV128Binary
.srcR
);
5858 switch (i
->Pin
.AvCipherV128Binary
.op
) {
5859 case Pav_CIPHERV128
: opc2
= 1288; break; // vcipher
5860 case Pav_CIPHERLV128
: opc2
= 1289; break; // vcipherlast
5861 case Pav_NCIPHERV128
: opc2
= 1352; break; // vncipher
5862 case Pav_NCIPHERLV128
: opc2
= 1353; break; // vncipherlast
5866 p
= mkFormVX( p
, 4, v_dst
, v_srcL
, v_srcR
, opc2
, endness_host
);
5869 case Pin_AvHashV128Binary
: {
5870 UInt v_dst
= vregEnc(i
->Pin
.AvHashV128Binary
.dst
);
5871 UInt v_src
= vregEnc(i
->Pin
.AvHashV128Binary
.src
);
5872 PPCRI
* s_field
= i
->Pin
.AvHashV128Binary
.s_field
;
5874 switch (i
->Pin
.AvHashV128Binary
.op
) {
5875 case Pav_SHA256
: opc2
= 1666; break; // vshasigmaw
5876 case Pav_SHA512
: opc2
= 1730; break; // vshasigmad
5880 p
= mkFormVX( p
, 4, v_dst
, v_src
, s_field
->Pri
.Imm
, opc2
, endness_host
);
5883 case Pin_AvBCDV128Binary
: {
5884 UInt v_dst
= vregEnc(i
->Pin
.AvBCDV128Binary
.dst
);
5885 UInt v_src1
= vregEnc(i
->Pin
.AvBCDV128Binary
.src1
);
5886 UInt v_src2
= vregEnc(i
->Pin
.AvBCDV128Binary
.src2
);
5887 UInt ps
= 0; /* Issue the instruction with ps=0. The IR code will
5888 * fix up the result if ps=1.
5891 switch (i
->Pin
.AvBCDV128Binary
.op
) {
5892 case Pav_BCDAdd
: opc2
= 1; break; // bcdadd
5893 case Pav_BCDSub
: opc2
= 65; break; // bcdsub
5897 p
= mkFormVXR( p
, 4, v_dst
, v_src1
, v_src2
,
5898 0x1, ps
| opc2
, endness_host
);
5901 case Pin_AvBin32Fx4
: {
5902 UInt v_dst
= vregEnc(i
->Pin
.AvBin32Fx4
.dst
);
5903 UInt v_srcL
= vregEnc(i
->Pin
.AvBin32Fx4
.srcL
);
5904 UInt v_srcR
= vregEnc(i
->Pin
.AvBin32Fx4
.srcR
);
5905 switch (i
->Pin
.AvBin32Fx4
.op
) {
5908 p
= mkFormVX( p
, 4, v_dst
, v_srcL
, v_srcR
, 10, endness_host
); // vaddfp
5911 p
= mkFormVX( p
, 4, v_dst
, v_srcL
, v_srcR
, 74, endness_host
); // vsubfp
5914 p
= mkFormVX( p
, 4, v_dst
, v_srcL
, v_srcR
, 1034, endness_host
); // vmaxfp
5917 p
= mkFormVX( p
, 4, v_dst
, v_srcL
, v_srcR
, 1098, endness_host
); // vminfp
5921 /* Make a vmulfp from a vmaddfp:
5922 load -0.0 (0x8000_0000) to each 32-bit word of vB
5923 this makes the add a noop.
5925 UInt vB
= 29; // XXX: Using v29 for temp do not change
5926 // without also changing
5927 // getRegUsage_PPCInstr
5930 // Better way to load -0.0 (0x80000000) ?
5931 // vspltisw vB,0x1F (0x1F => each word of vB)
5932 p
= mkFormVX( p
, 4, vB
, konst
, 0, 908, endness_host
);
5934 // vslw vB,vB,vB (each word of vB = (0x1F << 0x1F) = 0x80000000
5935 p
= mkFormVX( p
, 4, vB
, vB
, vB
, 388, endness_host
);
5937 // Finally, do the multiply:
5938 p
= mkFormVA( p
, 4, v_dst
, v_srcL
, vB
, v_srcR
, 46, endness_host
);
5941 case Pavfp_CMPEQF
: // vcmpeqfp
5942 p
= mkFormVXR( p
, 4, v_dst
, v_srcL
, v_srcR
, 0, 198, endness_host
);
5944 case Pavfp_CMPGTF
: // vcmpgtfp
5945 p
= mkFormVXR( p
, 4, v_dst
, v_srcL
, v_srcR
, 0, 710, endness_host
);
5947 case Pavfp_CMPGEF
: // vcmpgefp
5948 p
= mkFormVXR( p
, 4, v_dst
, v_srcL
, v_srcR
, 0, 454, endness_host
);
5957 case Pin_AvUn32Fx4
: {
5958 UInt v_dst
= vregEnc(i
->Pin
.AvUn32Fx4
.dst
);
5959 UInt v_src
= vregEnc(i
->Pin
.AvUn32Fx4
.src
);
5961 switch (i
->Pin
.AvUn32Fx4
.op
) {
5962 case Pavfp_RCPF
: opc2
= 266; break; // vrefp
5963 case Pavfp_RSQRTF
: opc2
= 330; break; // vrsqrtefp
5964 case Pavfp_Log2
: opc2
= 458; break; // vlogefp
5965 case Pavfp_Exp2
: opc2
= 394; break; // vexptefp
5966 case Pavfp_CVTU2F
: opc2
= 778; break; // vcfux
5967 case Pavfp_CVTS2F
: opc2
= 842; break; // vcfsx
5968 case Pavfp_QCVTF2U
: opc2
= 906; break; // vctuxs
5969 case Pavfp_QCVTF2S
: opc2
= 970; break; // vctsxs
5970 case Pavfp_ROUNDM
: opc2
= 714; break; // vrfim
5971 case Pavfp_ROUNDP
: opc2
= 650; break; // vrfip
5972 case Pavfp_ROUNDN
: opc2
= 522; break; // vrfin
5973 case Pavfp_ROUNDZ
: opc2
= 586; break; // vrfiz
5977 p
= mkFormVX( p
, 4, v_dst
, 0, v_src
, opc2
, endness_host
);
5981 case Pin_AvPerm
: { // vperm
5982 UInt v_dst
= vregEnc(i
->Pin
.AvPerm
.dst
);
5983 UInt v_srcL
= vregEnc(i
->Pin
.AvPerm
.srcL
);
5984 UInt v_srcR
= vregEnc(i
->Pin
.AvPerm
.srcR
);
5985 UInt v_ctl
= vregEnc(i
->Pin
.AvPerm
.ctl
);
5986 p
= mkFormVA( p
, 4, v_dst
, v_srcL
, v_srcR
, v_ctl
, 43, endness_host
);
5990 case Pin_AvSel
: { // vsel
5991 UInt v_ctl
= vregEnc(i
->Pin
.AvSel
.ctl
);
5992 UInt v_dst
= vregEnc(i
->Pin
.AvSel
.dst
);
5993 UInt v_srcL
= vregEnc(i
->Pin
.AvSel
.srcL
);
5994 UInt v_srcR
= vregEnc(i
->Pin
.AvSel
.srcR
);
5995 p
= mkFormVA( p
, 4, v_dst
, v_srcL
, v_srcR
, v_ctl
, 42, endness_host
);
5999 case Pin_AvSh
: { // vsl or vsr
6000 UInt v_dst
= vregEnc(i
->Pin
.AvSh
.dst
);
6001 Bool idxd
= toBool(i
->Pin
.AvSh
.addr
->tag
== Pam_RR
);
6004 r_base
= iregEnc(i
->Pin
.AvSh
.addr
->Pam
.RR
.base
, mode64
);
6007 r_idx
= 30; // XXX: Using r30 as temp
6008 p
= mkLoadImm(p
, r_idx
,
6009 i
->Pin
.AvSh
.addr
->Pam
.IR
.index
, mode64
, endness_host
);
6011 r_idx
= iregEnc(i
->Pin
.AvSh
.addr
->Pam
.RR
.index
, mode64
);
6014 if (i
->Pin
.AvSh
.shLeft
)
6016 p
= mkFormVXI( p
, 31, v_dst
, r_idx
, r_base
, 6, endness_host
);
6019 p
= mkFormVXI( p
, 31, v_dst
, r_idx
, r_base
, 38, endness_host
);
6023 case Pin_AvShlDbl
: { // vsldoi
6024 UInt shift
= i
->Pin
.AvShlDbl
.shift
;
6025 UInt v_dst
= vregEnc(i
->Pin
.AvShlDbl
.dst
);
6026 UInt v_srcL
= vregEnc(i
->Pin
.AvShlDbl
.srcL
);
6027 UInt v_srcR
= vregEnc(i
->Pin
.AvShlDbl
.srcR
);
6028 vassert(shift
<= 0xF);
6029 p
= mkFormVA( p
, 4, v_dst
, v_srcL
, v_srcR
, shift
, 44, endness_host
);
6033 case Pin_AvSplat
: { // vsplt(is)(b,h,w)
6034 UInt v_dst
= vregEnc(i
->Pin
.AvShlDbl
.dst
);
6035 UChar sz
= i
->Pin
.AvSplat
.sz
;
6037 vassert(sz
== 8 || sz
== 16 || sz
== 32);
6039 if (i
->Pin
.AvSplat
.src
->tag
== Pvi_Imm
) {
6041 opc2
= (sz
== 8) ? 780 : (sz
== 16) ? 844 : 908; // 8,16,32
6042 /* expects 5-bit-signed-imm */
6043 simm5
= i
->Pin
.AvSplat
.src
->Pvi
.Imm5s
;
6044 vassert(simm5
>= -16 && simm5
<= 15);
6045 simm5
= simm5
& 0x1F;
6046 p
= mkFormVX( p
, 4, v_dst
, (UInt
)simm5
, 0, opc2
, endness_host
);
6050 opc2
= (sz
== 8) ? 524 : (sz
== 16) ? 588 : 652; // 8,16,32
6051 vassert(hregClass(i
->Pin
.AvSplat
.src
->Pvi
.Reg
) == HRcVec128
);
6052 v_src
= vregEnc(i
->Pin
.AvSplat
.src
->Pvi
.Reg
);
6053 lowest_lane
= (128/sz
)-1;
6054 p
= mkFormVX( p
, 4, v_dst
, lowest_lane
, v_src
, opc2
, endness_host
);
6060 UInt v_dst
= vregEnc(i
->Pin
.AvCMov
.dst
);
6061 UInt v_src
= vregEnc(i
->Pin
.AvCMov
.src
);
6062 PPCCondCode cc
= i
->Pin
.AvCMov
.cond
;
6064 if (v_dst
== v_src
) goto done
;
6066 vassert(cc
.test
!= Pct_ALWAYS
);
6068 /* jmp fwds 2 insns if !condition */
6069 if (cc
.test
!= Pct_ALWAYS
) {
6070 /* bc !ct,cf,n_bytes>>2 */
6071 p
= mkFormB(p
, invertCondTest(cc
.test
), cc
.flag
, 8>>2, 0, 0,
6075 p
= mkFormVX( p
, 4, v_dst
, v_src
, v_src
, 1156, endness_host
);
6079 case Pin_AvLdVSCR
: { // mtvscr
6080 UInt v_src
= vregEnc(i
->Pin
.AvLdVSCR
.src
);
6081 p
= mkFormVX( p
, 4, 0, 0, v_src
, 1604, endness_host
);
6085 case Pin_Dfp64Unary
: {
6086 UInt fr_dst
= fregEnc( i
->Pin
.FpUnary
.dst
);
6087 UInt fr_src
= fregEnc( i
->Pin
.FpUnary
.src
);
6089 switch (i
->Pin
.Dfp64Unary
.op
) {
6090 case Pfp_MOV
: // fmr, PPC32 p410
6091 p
= mkFormX( p
, 63, fr_dst
, 0, fr_src
, 72, 0, endness_host
);
6093 case Pfp_DCTDP
: // D32 to D64
6094 p
= mkFormX( p
, 59, fr_dst
, 0, fr_src
, 258, 0, endness_host
);
6096 case Pfp_DRSP
: // D64 to D32
6097 p
= mkFormX( p
, 59, fr_dst
, 0, fr_src
, 770, 0, endness_host
);
6099 case Pfp_DCFFIX
: // I64 to D64 conversion
6100 /* ONLY WORKS ON POWER7 */
6101 p
= mkFormX( p
, 59, fr_dst
, 0, fr_src
, 802, 0, endness_host
);
6103 case Pfp_DCTFIX
: // D64 to I64 conversion
6104 p
= mkFormX( p
, 59, fr_dst
, 0, fr_src
, 290, 0, endness_host
);
6106 case Pfp_DXEX
: // Extract exponent
6107 p
= mkFormX( p
, 59, fr_dst
, 0, fr_src
, 354, 0, endness_host
);
6115 case Pin_Dfp64Binary
: {
6116 UInt fr_dst
= fregEnc( i
->Pin
.Dfp64Binary
.dst
);
6117 UInt fr_srcL
= fregEnc( i
->Pin
.Dfp64Binary
.srcL
);
6118 UInt fr_srcR
= fregEnc( i
->Pin
.Dfp64Binary
.srcR
);
6119 switch (i
->Pin
.Dfp64Binary
.op
) {
6120 case Pfp_DFPADD
: /* dadd, dfp add, use default RM from reg ignore mode
6121 * from the Iop instruction. */
6122 p
= mkFormX( p
, 59, fr_dst
, fr_srcL
, fr_srcR
, 2, 0, endness_host
);
6124 case Pfp_DFPSUB
: /* dsub, dfp subtract, use default RM from reg ignore
6125 * mode from the Iop instruction. */
6126 p
= mkFormX( p
, 59, fr_dst
, fr_srcL
, fr_srcR
, 514, 0, endness_host
);
6128 case Pfp_DFPMUL
: /* dmul, dfp multipy, use default RM from reg ignore
6129 * mode from the Iop instruction. */
6130 p
= mkFormX( p
, 59, fr_dst
, fr_srcL
, fr_srcR
, 34, 0, endness_host
);
6132 case Pfp_DFPDIV
: /* ddiv, dfp divide, use default RM from reg ignore
6133 * mode from the Iop instruction. */
6134 p
= mkFormX( p
, 59, fr_dst
, fr_srcL
, fr_srcR
, 546, 0, endness_host
);
6136 case Pfp_DIEX
: /* diex, insert exponent */
6137 p
= mkFormX( p
, 59, fr_dst
, fr_srcL
, fr_srcR
, 866, 0, endness_host
);
6145 case Pin_DfpShift
: {
6146 UInt fr_src
= fregEnc(i
->Pin
.DfpShift
.src
);
6147 UInt fr_dst
= fregEnc(i
->Pin
.DfpShift
.dst
);
6150 shift
= i
->Pin
.DfpShift
.shift
->Pri
.Imm
;
6152 switch (i
->Pin
.DfpShift
.op
) {
6153 case Pfp_DSCLI
: /* dscli, DFP shift left by fr_srcR */
6154 p
= mkFormZ22( p
, 59, fr_dst
, fr_src
, shift
, 66, 0, endness_host
);
6156 case Pfp_DSCRI
: /* dscri, DFP shift right by fr_srcR */
6157 p
= mkFormZ22( p
, 59, fr_dst
, fr_src
, shift
, 98, 0, endness_host
);
6160 vex_printf("ERROR: emit_PPCInstr default case\n");
6166 case Pin_ExtractExpD128
: {
6167 UInt fr_dst
= fregEnc(i
->Pin
.ExtractExpD128
.dst
);
6168 UInt fr_srcHi
= fregEnc(i
->Pin
.ExtractExpD128
.src_hi
);
6169 UInt fr_srcLo
= fregEnc(i
->Pin
.ExtractExpD128
.src_lo
);
6171 switch (i
->Pin
.ExtractExpD128
.op
) {
6173 /* Setup the upper and lower registers of the source operand
6176 p
= mkFormX( p
, 63, 12, 0, fr_srcHi
, 72, 0, endness_host
);
6177 p
= mkFormX( p
, 63, 13, 0, fr_srcLo
, 72, 0, endness_host
);
6178 p
= mkFormX( p
, 63, 10, 0, 12, 354, 0, endness_host
);
6180 /* The instruction will put the 64-bit result in
6183 p
= mkFormX(p
, 63, fr_dst
, 0, 10, 72, 0, endness_host
);
6186 vex_printf("Error: emit_PPCInstr case Pin_DfpExtractExp, case inst Default\n");
6191 case Pin_Dfp128Unary
: {
6192 UInt fr_dstHi
= fregEnc(i
->Pin
.Dfp128Unary
.dst_hi
);
6193 UInt fr_dstLo
= fregEnc(i
->Pin
.Dfp128Unary
.dst_lo
);
6194 UInt fr_srcLo
= fregEnc(i
->Pin
.Dfp128Unary
.src_lo
);
6196 /* Do instruction with 128-bit source operands in registers (10,11)
6199 switch (i
->Pin
.Dfp128Unary
.op
) {
6200 case Pfp_DCTQPQ
: // D64 to D128, srcLo holds 64 bit operand
6201 p
= mkFormX( p
, 63, 12, 0, fr_srcLo
, 72, 0, endness_host
);
6203 p
= mkFormX( p
, 63, 10, 0, 12, 258, 0, endness_host
);
6205 /* The instruction will put the 128-bit result in
6206 * registers (10,11). Note, the operand in the instruction only
6207 * reference the first of the two registers in the pair.
6209 p
= mkFormX(p
, 63, fr_dstHi
, 0, 10, 72, 0, endness_host
);
6210 p
= mkFormX(p
, 63, fr_dstLo
, 0, 11, 72, 0, endness_host
);
6213 vex_printf("Error: emit_PPCInstr case Pin_Dfp128Unary, case inst Default\
6220 case Pin_Dfp128Binary
: {
6221 /* dst is used to supply the left source operand and return
6224 UInt fr_dstHi
= fregEnc( i
->Pin
.Dfp128Binary
.dst_hi
);
6225 UInt fr_dstLo
= fregEnc( i
->Pin
.Dfp128Binary
.dst_lo
);
6226 UInt fr_srcRHi
= fregEnc( i
->Pin
.Dfp128Binary
.srcR_hi
);
6227 UInt fr_srcRLo
= fregEnc( i
->Pin
.Dfp128Binary
.srcR_lo
);
6229 /* Setup the upper and lower registers of the source operand
6232 p
= mkFormX( p
, 63, 10, 0, fr_dstHi
, 72, 0, endness_host
);
6233 p
= mkFormX( p
, 63, 11, 0, fr_dstLo
, 72, 0, endness_host
);
6234 p
= mkFormX( p
, 63, 12, 0, fr_srcRHi
, 72, 0, endness_host
);
6235 p
= mkFormX( p
, 63, 13, 0, fr_srcRLo
, 72, 0, endness_host
);
6237 /* Do instruction with 128-bit source operands in registers (10,11)
6240 switch (i
->Pin
.Dfp128Binary
.op
) {
6242 p
= mkFormX( p
, 63, 10, 10, 12, 2, 0, endness_host
);
6245 p
= mkFormX( p
, 63, 10, 10, 12, 514, 0, endness_host
);
6248 p
= mkFormX( p
, 63, 10, 10, 12, 34, 0, endness_host
);
6251 p
= mkFormX( p
, 63, 10, 10, 12, 546, 0, endness_host
);
6257 /* The instruction will put the 128-bit result in
6258 * registers (10,11). Note, the operand in the instruction only
6259 * reference the first of the two registers in the pair.
6261 p
= mkFormX(p
, 63, fr_dstHi
, 0, 10, 72, 0, endness_host
);
6262 p
= mkFormX(p
, 63, fr_dstLo
, 0, 11, 72, 0, endness_host
);
6266 case Pin_DfpShift128
: {
6267 UInt fr_src_hi
= fregEnc(i
->Pin
.DfpShift128
.src_hi
);
6268 UInt fr_src_lo
= fregEnc(i
->Pin
.DfpShift128
.src_lo
);
6269 UInt fr_dst_hi
= fregEnc(i
->Pin
.DfpShift128
.dst_hi
);
6270 UInt fr_dst_lo
= fregEnc(i
->Pin
.DfpShift128
.dst_lo
);
6273 shift
= i
->Pin
.DfpShift128
.shift
->Pri
.Imm
;
6275 /* setup source operand in register 12, 13 pair */
6276 p
= mkFormX(p
, 63, 12, 0, fr_src_hi
, 72, 0, endness_host
);
6277 p
= mkFormX(p
, 63, 13, 0, fr_src_lo
, 72, 0, endness_host
);
6279 /* execute instruction putting result in register 10, 11 pair */
6280 switch (i
->Pin
.DfpShift128
.op
) {
6281 case Pfp_DSCLIQ
: /* dscliq, DFP shift left, fr_srcR is the integer
6284 p
= mkFormZ22( p
, 63, 10, 12, shift
, 66, 0, endness_host
);
6286 case Pfp_DSCRIQ
: /* dscriq, DFP shift right, fr_srcR is the integer
6289 p
= mkFormZ22( p
, 63, 10, 12, shift
, 98, 0, endness_host
);
6292 vex_printf("ERROR: emit_PPCInstr quad default case %d \n",
6293 (Int
)i
->Pin
.DfpShift128
.op
);
6297 /* The instruction put the 128-bit result in registers (10,11).
6298 * Note, the operand in the instruction only reference the first of
6299 * the two registers in the pair.
6301 p
= mkFormX(p
, 63, fr_dst_hi
, 0, 10, 72, 0, endness_host
);
6302 p
= mkFormX(p
, 63, fr_dst_lo
, 0, 11, 72, 0, endness_host
);
6306 case Pin_DfpRound
: {
6307 UInt fr_dst
= fregEnc(i
->Pin
.DfpRound
.dst
);
6308 UInt fr_src
= fregEnc(i
->Pin
.DfpRound
.src
);
6311 r_rmc
= i
->Pin
.DfpRound
.r_rmc
->Pri
.Imm
;
6312 r
= (r_rmc
& 0x8) >> 3;
6316 p
= mkFormZ23(p
, 59, fr_dst
, r
, fr_src
, rmc
, 99, 0, endness_host
);
6320 case Pin_DfpRound128
: {
6321 UInt fr_dstHi
= fregEnc(i
->Pin
.DfpRound128
.dst_hi
);
6322 UInt fr_dstLo
= fregEnc(i
->Pin
.DfpRound128
.dst_lo
);
6323 UInt fr_srcHi
= fregEnc(i
->Pin
.DfpRound128
.src_hi
);
6324 UInt fr_srcLo
= fregEnc(i
->Pin
.DfpRound128
.src_lo
);
6327 r_rmc
= i
->Pin
.DfpRound128
.r_rmc
->Pri
.Imm
;
6328 r
= (r_rmc
& 0x8) >> 3;
6331 /* Setup the upper and lower registers of the source operand
6334 p
= mkFormX(p
, 63, 12, 0, fr_srcHi
, 72, 0, endness_host
);
6335 p
= mkFormX(p
, 63, 13, 0, fr_srcLo
, 72, 0, endness_host
);
6337 /* Do drintx instruction with 128-bit source operands in
6338 * registers (12,13).
6340 p
= mkFormZ23(p
, 63, 10, r
, 12, rmc
, 99, 0, endness_host
);
6342 /* The instruction will put the 128-bit result in
6343 * registers (10,11). Note, the operand in the instruction only
6344 * reference the first of the two registers in the pair.
6346 p
= mkFormX(p
, 63, fr_dstHi
, 0, 10, 72, 0, endness_host
);
6347 p
= mkFormX(p
, 63, fr_dstLo
, 0, 11, 72, 0, endness_host
);
6351 case Pin_DfpQuantize
: {
6352 UInt fr_dst
= fregEnc(i
->Pin
.DfpQuantize
.dst
);
6353 UInt fr_srcL
= fregEnc(i
->Pin
.DfpQuantize
.srcL
);
6354 UInt fr_srcR
= fregEnc(i
->Pin
.DfpQuantize
.srcR
);
6357 rmc
= i
->Pin
.DfpQuantize
.rmc
->Pri
.Imm
;
6359 switch (i
->Pin
.DfpQuantize
.op
) {
6361 p
= mkFormZ23(p
, 59, fr_dst
, fr_srcL
, fr_srcR
, rmc
, 3, 0, endness_host
);
6364 p
= mkFormZ23(p
, 59, fr_dst
, fr_srcL
, fr_srcR
, rmc
, 35, 0, endness_host
);
6372 case Pin_DfpQuantize128
: {
6373 UInt fr_dst_hi
= fregEnc(i
->Pin
.DfpQuantize128
.dst_hi
);
6374 UInt fr_dst_lo
= fregEnc(i
->Pin
.DfpQuantize128
.dst_lo
);
6375 UInt fr_src_hi
= fregEnc(i
->Pin
.DfpQuantize128
.src_hi
);
6376 UInt fr_src_lo
= fregEnc(i
->Pin
.DfpQuantize128
.src_lo
);
6379 rmc
= i
->Pin
.DfpQuantize128
.rmc
->Pri
.Imm
;
6380 /* Setup the upper and lower registers of the source operand
6381 * register pairs. Note, left source operand passed in via the
6382 * dst register pair.
6384 p
= mkFormX(p
, 63, 10, 0, fr_dst_hi
, 72, 0, endness_host
);
6385 p
= mkFormX(p
, 63, 11, 0, fr_dst_lo
, 72, 0, endness_host
);
6386 p
= mkFormX(p
, 63, 12, 0, fr_src_hi
, 72, 0, endness_host
);
6387 p
= mkFormX(p
, 63, 13, 0, fr_src_lo
, 72, 0, endness_host
);
6389 /* Do dquaq instruction with 128-bit source operands in
6390 * registers (12,13).
6392 switch (i
->Pin
.DfpQuantize128
.op
) {
6394 p
= mkFormZ23(p
, 63, 10, 10, 12, rmc
, 3, 0, endness_host
);
6397 p
= mkFormZ23(p
, 63, 10, 10, 12, rmc
, 35, 0, endness_host
);
6400 vpanic("Pin_DfpQuantize128: default case, couldn't find inst to issue \n");
6404 /* The instruction will put the 128-bit result in
6405 * registers (10,11). Note, the operand in the instruction only
6406 * reference the first of the two registers in the pair.
6408 p
= mkFormX(p
, 63, fr_dst_hi
, 0, 10, 72, 0, endness_host
);
6409 p
= mkFormX(p
, 63, fr_dst_lo
, 0, 11, 72, 0, endness_host
);
6413 case Pin_DfpD128toD64
: {
6414 UInt fr_dst
= fregEnc( i
->Pin
.DfpD128toD64
.dst
);
6415 UInt fr_srcHi
= fregEnc( i
->Pin
.DfpD128toD64
.src_hi
);
6416 UInt fr_srcLo
= fregEnc( i
->Pin
.DfpD128toD64
.src_lo
);
6418 /* Setup the upper and lower registers of the source operand
6421 p
= mkFormX( p
, 63, 10, 0, fr_dst
, 72, 0, endness_host
);
6422 p
= mkFormX( p
, 63, 12, 0, fr_srcHi
, 72, 0, endness_host
);
6423 p
= mkFormX( p
, 63, 13, 0, fr_srcLo
, 72, 0, endness_host
);
6425 /* Do instruction with 128-bit source operands in registers (10,11) */
6426 switch (i
->Pin
.Dfp128Binary
.op
) {
6428 p
= mkFormX( p
, 63, 10, 0, 12, 770, 0, endness_host
);
6431 p
= mkFormX( p
, 63, 10, 0, 12, 290, 0, endness_host
);
6437 /* The instruction will put the 64-bit result in registers 10. */
6438 p
= mkFormX(p
, 63, fr_dst
, 0, 10, 72, 0, endness_host
);
6442 case Pin_DfpI64StoD128
: {
6443 UInt fr_dstHi
= fregEnc( i
->Pin
.DfpI64StoD128
.dst_hi
);
6444 UInt fr_dstLo
= fregEnc( i
->Pin
.DfpI64StoD128
.dst_lo
);
6445 UInt fr_src
= fregEnc( i
->Pin
.DfpI64StoD128
.src
);
6447 switch (i
->Pin
.Dfp128Binary
.op
) {
6449 p
= mkFormX( p
, 63, 10, 11, fr_src
, 802, 0, endness_host
);
6455 /* The instruction will put the 64-bit result in registers 10, 11. */
6456 p
= mkFormX(p
, 63, fr_dstHi
, 0, 10, 72, 0, endness_host
);
6457 p
= mkFormX(p
, 63, fr_dstLo
, 0, 11, 72, 0, endness_host
);
6461 case Pin_InsertExpD128
: {
6462 UInt fr_dstHi
= fregEnc(i
->Pin
.InsertExpD128
.dst_hi
);
6463 UInt fr_dstLo
= fregEnc(i
->Pin
.InsertExpD128
.dst_lo
);
6464 UInt fr_srcL
= fregEnc(i
->Pin
.InsertExpD128
.srcL
);
6465 UInt fr_srcRHi
= fregEnc(i
->Pin
.InsertExpD128
.srcR_hi
);
6466 UInt fr_srcRLo
= fregEnc(i
->Pin
.InsertExpD128
.srcR_lo
);
6468 /* The left operand is a single F64 value, the right is an F128
6471 p
= mkFormX(p
, 63, 10, 0, fr_srcL
, 72, 0, endness_host
);
6472 p
= mkFormX(p
, 63, 12, 0, fr_srcRHi
, 72, 0, endness_host
);
6473 p
= mkFormX(p
, 63, 13, 0, fr_srcRLo
, 72, 0, endness_host
);
6474 p
= mkFormX(p
, 63, 10, 10, 12, 866, 0, endness_host
);
6476 /* The instruction will put the 128-bit result into
6477 * registers (10,11). Note, the operand in the instruction only
6478 * reference the first of the two registers in the pair.
6480 p
= mkFormX(p
, 63, fr_dstHi
, 0, 10, 72, 0, endness_host
);
6481 p
= mkFormX(p
, 63, fr_dstLo
, 0, 11, 72, 0, endness_host
);
6487 UInt r_dst
= iregEnc(i
->Pin
.Dfp64Cmp
.dst
, mode64
);
6488 UInt fr_srcL
= fregEnc(i
->Pin
.Dfp64Cmp
.srcL
);
6489 UInt fr_srcR
= fregEnc(i
->Pin
.Dfp64Cmp
.srcR
);
6492 p
= mkFormX(p
, 59, crfD
<<2, fr_srcL
, fr_srcR
, 130, 0, endness_host
);
6494 // mfcr (mv CR to r_dst)
6495 p
= mkFormX(p
, 31, r_dst
, 0, 0, 19, 0, endness_host
);
6497 // rlwinm r_dst,r_dst,8,28,31
6498 // => rotate field 1 to bottomw of word, masking out upper 28
6499 p
= mkFormM(p
, 21, r_dst
, r_dst
, 8, 28, 31, 0, endness_host
);
6503 case Pin_Dfp128Cmp
: {
6505 UInt r_dst
= iregEnc(i
->Pin
.Dfp128Cmp
.dst
, mode64
);
6506 UInt fr_srcL_hi
= fregEnc(i
->Pin
.Dfp128Cmp
.srcL_hi
);
6507 UInt fr_srcL_lo
= fregEnc(i
->Pin
.Dfp128Cmp
.srcL_lo
);
6508 UInt fr_srcR_hi
= fregEnc(i
->Pin
.Dfp128Cmp
.srcR_hi
);
6509 UInt fr_srcR_lo
= fregEnc(i
->Pin
.Dfp128Cmp
.srcR_lo
);
6512 /* Setup the upper and lower registers of the source operand
6515 p
= mkFormX(p
, 63, 10, 0, fr_srcL_hi
, 72, 0, endness_host
);
6516 p
= mkFormX(p
, 63, 11, 0, fr_srcL_lo
, 72, 0, endness_host
);
6517 p
= mkFormX(p
, 63, 12, 0, fr_srcR_hi
, 72, 0, endness_host
);
6518 p
= mkFormX(p
, 63, 13, 0, fr_srcR_lo
, 72, 0, endness_host
);
6520 p
= mkFormX(p
, 63, crfD
<<2, 10, 12, 130, 0, endness_host
);
6522 // mfcr (mv CR to r_dst)
6523 p
= mkFormX(p
, 31, r_dst
, 0, 0, 19, 0, endness_host
);
6525 // rlwinm r_dst,r_dst,8,28,31
6526 // => rotate field 1 to bottomw of word, masking out upper 28
6527 p
= mkFormM(p
, 21, r_dst
, r_dst
, 8, 28, 31, 0, endness_host
);
6531 case Pin_XFormUnary994
: {
6533 switch (i
->Pin
.XFormUnary994
.op
) {
6535 case Px_IQSTODFP
: // dcffixqq
6537 UInt dstHi
= fregEnc(i
->Pin
.XFormUnary994
.reg0
);
6538 UInt dstLo
= fregEnc(i
->Pin
.XFormUnary994
.reg1
);
6539 UInt src
= vregEnc(i
->Pin
.XFormUnary994
.reg2
);
6542 /* Do instruction, 128-bit integer source operand, result in two
6543 floating point registers VSR(10,11) */
6544 /* dcffixqq put result in VSR[10], VSR[11] dword 0 */
6545 p
= mkFormX994( p
, inst_sel
, 10, src
, endness_host
);
6547 /* Move results to destination floating point register pair.
6548 Floating point regs are VSR[0] to VSR[31] */
6549 p
= mkFormX( p
, 63, dstHi
, 0, 10, 72, 0, endness_host
);
6550 p
= mkFormX( p
, 63, dstLo
, 0, 11, 72, 0, endness_host
);
6554 case Px_DFPTOIQS
: // dctfixqq
6556 UInt dstVSR
= vregEnc(i
->Pin
.XFormUnary994
.reg0
);
6557 UInt srcHi
= fregEnc(i
->Pin
.XFormUnary994
.reg1
);
6558 UInt srcLo
= fregEnc(i
->Pin
.XFormUnary994
.reg2
);
6561 /* Setup the upper and lower registers of the source operand
6564 p
= mkFormX( p
, 63, 10, 0, srcHi
, 72, 0, endness_host
);
6565 p
= mkFormX( p
, 63, 11, 0, srcLo
, 72, 0, endness_host
);
6567 /* Do instruction, two 64-bit source operands in registers floating
6568 point registers VSR(10,11) */
6569 p
= mkFormX994( p
, inst_sel
, dstVSR
, 10, endness_host
);
6579 /* This requires a 32-bit dec/test in both 32- and 64-bit
6586 lwz/ld r30, amFailAddr
6592 /* lwz r30, amCounter */
6593 p
= do_load_or_store_word32(p
, True
/*isLoad*/, /*r*/30,
6594 i
->Pin
.EvCheck
.amCounter
, mode64
,
6596 /* addic. r30,r30,-1 */
6597 p
= emit32(p
, 0x37DEFFFF, endness_host
);
6598 /* stw r30, amCounter */
6599 p
= do_load_or_store_word32(p
, False
/*!isLoad*/, /*r*/30,
6600 i
->Pin
.EvCheck
.amCounter
, mode64
,
6603 p
= emit32(p
, 0x40800010, endness_host
);
6604 /* lwz/ld r30, amFailAddr */
6605 p
= do_load_or_store_machine_word(p
, True
/*isLoad*/, /*r*/30,
6606 i
->Pin
.EvCheck
.amFailAddr
, mode64
,
6609 p
= mkFormXFX(p
, /*r*/30, 9, 467, endness_host
);
6611 p
= mkFormXL(p
, 19, Pct_ALWAYS
, 0, 0, 528, 0, endness_host
);
6615 vassert(evCheckSzB_PPC() == (UChar
*)p
- (UChar
*)p0
);
6621 (ctrP is unknown now, so use 0x65556555(65556555) in the
6622 expectation that a later call to LibVEX_patchProfCtr
6623 will be used to fill in the immediate fields once the
6624 right value is known.)
6626 imm32-exactly r30, 0x65556555
6634 imm64-exactly r30, 0x6555655565556555
6640 p
= mkLoadImm_EXACTLY2or5(
6641 p
, /*r*/30, 0x6555655565556555ULL
, True
/*mode64*/, endness_host
);
6642 p
= emit32(p
, 0xEBBE0000, endness_host
);
6643 p
= emit32(p
, 0x3BBD0001, endness_host
);
6644 p
= emit32(p
, 0xFBBE0000, endness_host
);
6646 p
= mkLoadImm_EXACTLY2or5(
6647 p
, /*r*/30, 0x65556555ULL
, False
/*!mode64*/, endness_host
);
6648 p
= emit32(p
, 0x83BE0004, endness_host
);
6649 p
= emit32(p
, 0x37BD0001, endness_host
);
6650 p
= emit32(p
, 0x93BE0004, endness_host
);
6651 p
= emit32(p
, 0x83BE0000, endness_host
);
6652 p
= emit32(p
, 0x7FBD0194, endness_host
);
6653 p
= emit32(p
, 0x93BE0000, endness_host
);
6655 /* Tell the caller .. */
6656 vassert(!(*is_profInc
));
6666 vex_printf("\n=> ");
6667 ppPPCInstr(i
, mode64
);
6668 vpanic("emit_PPCInstr");
6672 vassert(p
- &buf
[0] <= 64);
6677 /* How big is an event check? See case for Pin_EvCheck in
6678 emit_PPCInstr just above. That crosschecks what this returns, so
6679 we can tell if we're inconsistent. */
6680 Int
evCheckSzB_PPC (void)
6686 /* NB: what goes on here has to be very closely coordinated with the
6687 emitInstr case for XDirect, above. */
6688 VexInvalRange
chainXDirect_PPC ( VexEndness endness_host
,
6689 void* place_to_chain
,
6690 const void* disp_cp_chain_me_EXPECTED
,
6691 const void* place_to_jump_to
,
6695 vassert((endness_host
== VexEndnessBE
) ||
6696 (endness_host
== VexEndnessLE
));
6698 vassert(endness_host
== VexEndnessBE
);
6701 /* What we're expecting to see is:
6702 imm32/64-fixed r30, disp_cp_chain_me_to_EXPECTED
6706 <8 or 20 bytes generated by mkLoadImm_EXACTLY2or5>
6710 UChar
* p
= (UChar
*)place_to_chain
;
6711 vassert(0 == (3 & (HWord
)p
));
6712 vassert(isLoadImm_EXACTLY2or5(p
, /*r*/30,
6713 (Addr
)disp_cp_chain_me_EXPECTED
,
6714 mode64
, endness_host
));
6715 vassert(fetch32(p
+ (mode64
? 20 : 8) + 0, endness_host
) == 0x7FC903A6);
6716 vassert(fetch32(p
+ (mode64
? 20 : 8) + 4, endness_host
) == 0x4E800421);
6717 /* And what we want to change it to is:
6718 imm32/64-fixed r30, place_to_jump_to
6722 <8 or 20 bytes generated by mkLoadImm_EXACTLY2or5>
6725 The replacement has the same length as the original.
6727 p
= mkLoadImm_EXACTLY2or5(p
, /*r*/30,
6728 (Addr
)place_to_jump_to
, mode64
,
6730 p
= emit32(p
, 0x7FC903A6, endness_host
);
6731 p
= emit32(p
, 0x4E800420, endness_host
);
6733 Int len
= p
- (UChar
*)place_to_chain
;
6734 vassert(len
== (mode64
? 28 : 16)); /* stay sane */
6735 VexInvalRange vir
= {(HWord
)place_to_chain
, len
};
6740 /* NB: what goes on here has to be very closely coordinated with the
6741 emitInstr case for XDirect, above. */
6742 VexInvalRange
unchainXDirect_PPC ( VexEndness endness_host
,
6743 void* place_to_unchain
,
6744 const void* place_to_jump_to_EXPECTED
,
6745 const void* disp_cp_chain_me
,
6749 vassert((endness_host
== VexEndnessBE
) ||
6750 (endness_host
== VexEndnessLE
));
6752 vassert(endness_host
== VexEndnessBE
);
6755 /* What we're expecting to see is:
6756 imm32/64-fixed r30, place_to_jump_to_EXPECTED
6760 <8 or 20 bytes generated by mkLoadImm_EXACTLY2or5>
6764 UChar
* p
= (UChar
*)place_to_unchain
;
6765 vassert(0 == (3 & (HWord
)p
));
6766 vassert(isLoadImm_EXACTLY2or5(p
, /*r*/30,
6767 (Addr
)place_to_jump_to_EXPECTED
,
6768 mode64
, endness_host
));
6769 vassert(fetch32(p
+ (mode64
? 20 : 8) + 0, endness_host
) == 0x7FC903A6);
6770 vassert(fetch32(p
+ (mode64
? 20 : 8) + 4, endness_host
) == 0x4E800420);
6771 /* And what we want to change it to is:
6772 imm32/64-fixed r30, disp_cp_chain_me
6776 <8 or 20 bytes generated by mkLoadImm_EXACTLY2or5>
6779 The replacement has the same length as the original.
6781 p
= mkLoadImm_EXACTLY2or5(p
, /*r*/30,
6782 (Addr
)disp_cp_chain_me
, mode64
,
6784 p
= emit32(p
, 0x7FC903A6, endness_host
);
6785 p
= emit32(p
, 0x4E800421, endness_host
);
6787 Int len
= p
- (UChar
*)place_to_unchain
;
6788 vassert(len
== (mode64
? 28 : 16)); /* stay sane */
6789 VexInvalRange vir
= {(HWord
)place_to_unchain
, len
};
6794 /* Patch the counter address into a profile inc point, as previously
6795 created by the Pin_ProfInc case for emit_PPCInstr. */
6796 VexInvalRange
patchProfInc_PPC ( VexEndness endness_host
,
6797 void* place_to_patch
,
6798 const ULong
* location_of_counter
,
6802 vassert((endness_host
== VexEndnessBE
) ||
6803 (endness_host
== VexEndnessLE
));
6805 vassert(endness_host
== VexEndnessBE
);
6808 UChar
* p
= (UChar
*)place_to_patch
;
6809 vassert(0 == (3 & (HWord
)p
));
6813 vassert(isLoadImm_EXACTLY2or5(p
, /*r*/30,
6814 0x6555655565556555ULL
, True
/*mode64*/,
6816 vassert(fetch32(p
+ 20, endness_host
) == 0xEBBE0000);
6817 vassert(fetch32(p
+ 24, endness_host
) == 0x3BBD0001);
6818 vassert(fetch32(p
+ 28, endness_host
) == 0xFBBE0000);
6819 p
= mkLoadImm_EXACTLY2or5(p
, /*r*/30,
6820 (Addr
)location_of_counter
,
6821 True
/*mode64*/, endness_host
);
6822 len
= p
- (UChar
*)place_to_patch
;
6825 vassert(isLoadImm_EXACTLY2or5(p
, /*r*/30,
6826 0x65556555ULL
, False
/*!mode64*/,
6828 vassert(fetch32(p
+ 8, endness_host
) == 0x83BE0004);
6829 vassert(fetch32(p
+ 12, endness_host
) == 0x37BD0001);
6830 vassert(fetch32(p
+ 16, endness_host
) == 0x93BE0004);
6831 vassert(fetch32(p
+ 20, endness_host
) == 0x83BE0000);
6832 vassert(fetch32(p
+ 24, endness_host
) == 0x7FBD0194);
6833 vassert(fetch32(p
+ 28, endness_host
) == 0x93BE0000);
6834 p
= mkLoadImm_EXACTLY2or5(p
, /*r*/30,
6835 (Addr
)location_of_counter
,
6836 False
/*!mode64*/, endness_host
);
6837 len
= p
- (UChar
*)place_to_patch
;
6840 VexInvalRange vir
= {(HWord
)place_to_patch
, len
};
6845 /*---------------------------------------------------------------*/
6846 /*--- end host_ppc_defs.c ---*/
6847 /*---------------------------------------------------------------*/