3 # This is (mostly) based on the following documentation.
4 # - Intel(R) 64 and IA-32 Architectures Software Developer's Manual Vol.2C
5 # (#326018-047US, June 2013)
9 # Referrer: escaped-name
11 # opcode: mnemonic|GrpXXX [operand1[,operand2...]] [(extra1)[,(extra2)...]] [| 2nd-mnemonic ...]
13 # opcode: escape # escaped-name
16 # mnemonics that begin with lowercase 'v' accept a VEX or EVEX prefix
17 # mnemonics that begin with lowercase 'k' accept a VEX prefix
21 # reg: mnemonic [operand1[,operand2...]] [(extra1)[,(extra2)...]] [| 2nd-mnemonic ...]
25 # (ev): this opcode requires EVEX prefix.
26 # (evo): this opcode is changed by EVEX prefix (EVEX opcode)
27 # (v): this opcode requires VEX prefix.
28 # (v1): this opcode only supports 128bit VEX.
30 # Last Prefix Superscripts
31 # - (66): the last prefix is 0x66
32 # - (F3): the last prefix is 0xF3
33 # - (F2): the last prefix is 0xF2
34 # - (!F3) : the last prefix is not 0xF3 (including non-last prefix case)
35 # - (66&F2): Both 0x66 and 0xF2 prefixes are specified.
37 Table: one byte opcode
56 0f: escape # 2-byte escape
109 40: INC eAX (i64) | REX (o64)
110 41: INC eCX (i64) | REX.B (o64)
111 42: INC eDX (i64) | REX.X (o64)
112 43: INC eBX (i64) | REX.XB (o64)
113 44: INC eSP (i64) | REX.R (o64)
114 45: INC eBP (i64) | REX.RB (o64)
115 46: INC eSI (i64) | REX.RX (o64)
116 47: INC eDI (i64) | REX.RXB (o64)
117 48: DEC eAX (i64) | REX.W (o64)
118 49: DEC eCX (i64) | REX.WB (o64)
119 4a: DEC eDX (i64) | REX.WX (o64)
120 4b: DEC eBX (i64) | REX.WXB (o64)
121 4c: DEC eSP (i64) | REX.WR (o64)
122 4d: DEC eBP (i64) | REX.WRB (o64)
123 4e: DEC eSI (i64) | REX.WRX (o64)
124 4f: DEC eDI (i64) | REX.WRXB (o64)
126 50: PUSH rAX/r8 (d64)
127 51: PUSH rCX/r9 (d64)
128 52: PUSH rDX/r10 (d64)
129 53: PUSH rBX/r11 (d64)
130 54: PUSH rSP/r12 (d64)
131 55: PUSH rBP/r13 (d64)
132 56: PUSH rSI/r14 (d64)
133 57: PUSH rDI/r15 (d64)
136 5a: POP rDX/r10 (d64)
137 5b: POP rBX/r11 (d64)
138 5c: POP rSP/r12 (d64)
139 5d: POP rBP/r13 (d64)
140 5e: POP rSI/r14 (d64)
141 5f: POP rDI/r15 (d64)
143 60: PUSHA/PUSHAD (i64)
145 62: BOUND Gv,Ma (i64) | EVEX (Prefix)
146 63: ARPL Ew,Gw (i64) | MOVSXD Gv,Ev (o64)
149 66: Operand-Size (Prefix)
150 67: Address-Size (Prefix)
156 6d: INS/INSW/INSD Yz,DX
158 6f: OUTS/OUTSW/OUTSD DX,Xz
179 82: Grp1 Eb,Ib (1A),(i64)
192 8f: Grp1A (1A) | POP Ev (d64)
194 90: NOP | PAUSE (F3) | XCHG r8,rAX
206 9c: PUSHF/D/Q Fv (d64)
207 9d: POPF/D/Q Fv (d64)
222 ab: STOS/W/D/Q Yv,rAX
224 ad: LODS/W/D/Q rAX,Xv
226 # Note: The May 2011 Intel manual shows Xv for the second parameter of the
227 # next instruction but Yv is correct
228 af: SCAS/W/D/Q rAX,Yv
251 c4: LES Gz,Mp (i64) | VEX+2byte (Prefix)
252 c5: LDS Gz,Mp (i64) | VEX+1byte (Prefix)
253 c6: Grp11A Eb,Ib (1A)
254 c7: Grp11B Ev,Iz (1A)
281 # Note: "forced64" is Intel CPU behavior: Intel CPUs ignore the 0x66 prefix
282 # in 64-bit mode. AMD CPUs accept the 0x66 prefix, which causes RIP truncation
283 # to 16 bits. In 32-bit mode, 0x66 is accepted by both Intel and AMD.
284 e0: LOOPNE/LOOPNZ Jb (f64)
285 e1: LOOPE/LOOPZ Jb (f64)
292 # With the 0x66 prefix in 64-bit mode, on AMD CPUs the immediate offset
293 # in "near" jumps and calls is 16-bit. For CALL, the
294 # push of the return address is 16 bits wide; RSP is decremented by 2
295 # but is not truncated to 16 bits, unlike RIP.
297 e9: JMP-near Jz (f64)
299 eb: JMP-short Jb (f64)
307 f2: REPNE (Prefix) | XACQUIRE (Prefix)
308 f3: REP/REPE (Prefix) | XRELEASE (Prefix)
323 Table: 2-byte opcode (0x0f)
324 Referrer: 2-byte escape
340 # AMD's prefetch group. Intel supports prefetchw(/1) only.
343 # 3DNow! uses the last imm byte as opcode extension.
346 # NOTE: According to the Intel SDM opcode map, vmovups and vmovupd have no
347 # operands, but they actually do. Also, vmovss and vmovsd only accept 128bit.
348 # MOVSS/MOVSD have too many forms (3) in the SDM. This map just shows a typical form.
349 # Many AVX instructions lack the v1 superscript, according to Intel AVX-Programming
351 10: vmovups Vps,Wps | vmovupd Vpd,Wpd (66) | vmovss Vx,Hx,Wss (F3),(v1) | vmovsd Vx,Hx,Wsd (F2),(v1)
352 11: vmovups Wps,Vps | vmovupd Wpd,Vpd (66) | vmovss Wss,Hx,Vss (F3),(v1) | vmovsd Wsd,Hx,Vsd (F2),(v1)
353 12: vmovlps Vq,Hq,Mq (v1) | vmovhlps Vq,Hq,Uq (v1) | vmovlpd Vq,Hq,Mq (66),(v1) | vmovsldup Vx,Wx (F3) | vmovddup Vx,Wx (F2)
354 13: vmovlps Mq,Vq (v1) | vmovlpd Mq,Vq (66),(v1)
355 14: vunpcklps Vx,Hx,Wx | vunpcklpd Vx,Hx,Wx (66)
356 15: vunpckhps Vx,Hx,Wx | vunpckhpd Vx,Hx,Wx (66)
357 16: vmovhps Vdq,Hq,Mq (v1) | vmovlhps Vdq,Hq,Uq (v1) | vmovhpd Vdq,Hq,Mq (66),(v1) | vmovshdup Vx,Wx (F3)
358 17: vmovhps Mq,Vq (v1) | vmovhpd Mq,Vq (66),(v1)
361 # Intel SDM opcode map does not list MPX instructions. For now using Gv for
362 # bnd registers and Ev for everything else is OK because the instruction
363 # decoder does not use the information except as an indication that there is
365 1a: BNDCL Gv,Ev (F3) | BNDCU Gv,Ev (F2) | BNDMOV Gv,Ev (66) | BNDLDX Gv,Ev
366 1b: BNDCN Gv,Ev (F2) | BNDMOV Ev,Gv (66) | BNDMK Gv,Ev (F3) | BNDSTX Ev,Gv
380 28: vmovaps Vps,Wps | vmovapd Vpd,Wpd (66)
381 29: vmovaps Wps,Vps | vmovapd Wpd,Vpd (66)
382 2a: cvtpi2ps Vps,Qpi | cvtpi2pd Vpd,Qpi (66) | vcvtsi2ss Vss,Hss,Ey (F3),(v1) | vcvtsi2sd Vsd,Hsd,Ey (F2),(v1)
383 2b: vmovntps Mps,Vps | vmovntpd Mpd,Vpd (66)
384 2c: cvttps2pi Ppi,Wps | cvttpd2pi Ppi,Wpd (66) | vcvttss2si Gy,Wss (F3),(v1) | vcvttsd2si Gy,Wsd (F2),(v1)
385 2d: cvtps2pi Ppi,Wps | cvtpd2pi Qpi,Wpd (66) | vcvtss2si Gy,Wss (F3),(v1) | vcvtsd2si Gy,Wsd (F2),(v1)
386 2e: vucomiss Vss,Wss (v1) | vucomisd Vsd,Wsd (66),(v1)
387 2f: vcomiss Vss,Wss (v1) | vcomisd Vsd,Wsd (66),(v1)
397 38: escape # 3-byte escape 1
399 3a: escape # 3-byte escape 2
407 41: CMOVNO Gv,Ev | kandw/q Vk,Hk,Uk | kandb/d Vk,Hk,Uk (66)
408 42: CMOVB/C/NAE Gv,Ev | kandnw/q Vk,Hk,Uk | kandnb/d Vk,Hk,Uk (66)
409 43: CMOVAE/NB/NC Gv,Ev
410 44: CMOVE/Z Gv,Ev | knotw/q Vk,Uk | knotb/d Vk,Uk (66)
411 45: CMOVNE/NZ Gv,Ev | korw/q Vk,Hk,Uk | korb/d Vk,Hk,Uk (66)
412 46: CMOVBE/NA Gv,Ev | kxnorw/q Vk,Hk,Uk | kxnorb/d Vk,Hk,Uk (66)
413 47: CMOVA/NBE Gv,Ev | kxorw/q Vk,Hk,Uk | kxorb/d Vk,Hk,Uk (66)
416 4a: CMOVP/PE Gv,Ev | kaddw/q Vk,Hk,Uk | kaddb/d Vk,Hk,Uk (66)
417 4b: CMOVNP/PO Gv,Ev | kunpckbw Vk,Hk,Uk (66) | kunpckwd/dq Vk,Hk,Uk
423 50: vmovmskps Gy,Ups | vmovmskpd Gy,Upd (66)
424 51: vsqrtps Vps,Wps | vsqrtpd Vpd,Wpd (66) | vsqrtss Vss,Hss,Wss (F3),(v1) | vsqrtsd Vsd,Hsd,Wsd (F2),(v1)
425 52: vrsqrtps Vps,Wps | vrsqrtss Vss,Hss,Wss (F3),(v1)
426 53: vrcpps Vps,Wps | vrcpss Vss,Hss,Wss (F3),(v1)
427 54: vandps Vps,Hps,Wps | vandpd Vpd,Hpd,Wpd (66)
428 55: vandnps Vps,Hps,Wps | vandnpd Vpd,Hpd,Wpd (66)
429 56: vorps Vps,Hps,Wps | vorpd Vpd,Hpd,Wpd (66)
430 57: vxorps Vps,Hps,Wps | vxorpd Vpd,Hpd,Wpd (66)
431 58: vaddps Vps,Hps,Wps | vaddpd Vpd,Hpd,Wpd (66) | vaddss Vss,Hss,Wss (F3),(v1) | vaddsd Vsd,Hsd,Wsd (F2),(v1)
432 59: vmulps Vps,Hps,Wps | vmulpd Vpd,Hpd,Wpd (66) | vmulss Vss,Hss,Wss (F3),(v1) | vmulsd Vsd,Hsd,Wsd (F2),(v1)
433 5a: vcvtps2pd Vpd,Wps | vcvtpd2ps Vps,Wpd (66) | vcvtss2sd Vsd,Hx,Wss (F3),(v1) | vcvtsd2ss Vss,Hx,Wsd (F2),(v1)
434 5b: vcvtdq2ps Vps,Wdq | vcvtqq2ps Vps,Wqq (evo) | vcvtps2dq Vdq,Wps (66) | vcvttps2dq Vdq,Wps (F3)
435 5c: vsubps Vps,Hps,Wps | vsubpd Vpd,Hpd,Wpd (66) | vsubss Vss,Hss,Wss (F3),(v1) | vsubsd Vsd,Hsd,Wsd (F2),(v1)
436 5d: vminps Vps,Hps,Wps | vminpd Vpd,Hpd,Wpd (66) | vminss Vss,Hss,Wss (F3),(v1) | vminsd Vsd,Hsd,Wsd (F2),(v1)
437 5e: vdivps Vps,Hps,Wps | vdivpd Vpd,Hpd,Wpd (66) | vdivss Vss,Hss,Wss (F3),(v1) | vdivsd Vsd,Hsd,Wsd (F2),(v1)
438 5f: vmaxps Vps,Hps,Wps | vmaxpd Vpd,Hpd,Wpd (66) | vmaxss Vss,Hss,Wss (F3),(v1) | vmaxsd Vsd,Hsd,Wsd (F2),(v1)
440 60: punpcklbw Pq,Qd | vpunpcklbw Vx,Hx,Wx (66),(v1)
441 61: punpcklwd Pq,Qd | vpunpcklwd Vx,Hx,Wx (66),(v1)
442 62: punpckldq Pq,Qd | vpunpckldq Vx,Hx,Wx (66),(v1)
443 63: packsswb Pq,Qq | vpacksswb Vx,Hx,Wx (66),(v1)
444 64: pcmpgtb Pq,Qq | vpcmpgtb Vx,Hx,Wx (66),(v1)
445 65: pcmpgtw Pq,Qq | vpcmpgtw Vx,Hx,Wx (66),(v1)
446 66: pcmpgtd Pq,Qq | vpcmpgtd Vx,Hx,Wx (66),(v1)
447 67: packuswb Pq,Qq | vpackuswb Vx,Hx,Wx (66),(v1)
448 68: punpckhbw Pq,Qd | vpunpckhbw Vx,Hx,Wx (66),(v1)
449 69: punpckhwd Pq,Qd | vpunpckhwd Vx,Hx,Wx (66),(v1)
450 6a: punpckhdq Pq,Qd | vpunpckhdq Vx,Hx,Wx (66),(v1)
451 6b: packssdw Pq,Qd | vpackssdw Vx,Hx,Wx (66),(v1)
452 6c: vpunpcklqdq Vx,Hx,Wx (66),(v1)
453 6d: vpunpckhqdq Vx,Hx,Wx (66),(v1)
454 6e: movd/q Pd,Ey | vmovd/q Vy,Ey (66),(v1)
455 6f: movq Pq,Qq | vmovdqa Vx,Wx (66) | vmovdqa32/64 Vx,Wx (66),(evo) | vmovdqu Vx,Wx (F3) | vmovdqu32/64 Vx,Wx (F3),(evo) | vmovdqu8/16 Vx,Wx (F2),(ev)
457 70: pshufw Pq,Qq,Ib | vpshufd Vx,Wx,Ib (66),(v1) | vpshufhw Vx,Wx,Ib (F3),(v1) | vpshuflw Vx,Wx,Ib (F2),(v1)
461 74: pcmpeqb Pq,Qq | vpcmpeqb Vx,Hx,Wx (66),(v1)
462 75: pcmpeqw Pq,Qq | vpcmpeqw Vx,Hx,Wx (66),(v1)
463 76: pcmpeqd Pq,Qq | vpcmpeqd Vx,Hx,Wx (66),(v1)
464 # Note: (v) is removed, because vzeroall and vzeroupper become emms without VEX.
465 77: emms | vzeroupper | vzeroall
466 78: VMREAD Ey,Gy | vcvttps2udq/pd2udq Vx,Wpd (evo) | vcvttsd2usi Gv,Wx (F2),(ev) | vcvttss2usi Gv,Wx (F3),(ev) | vcvttps2uqq/pd2uqq Vx,Wx (66),(ev)
467 79: VMWRITE Gy,Ey | vcvtps2udq/pd2udq Vx,Wpd (evo) | vcvtsd2usi Gv,Wx (F2),(ev) | vcvtss2usi Gv,Wx (F3),(ev) | vcvtps2uqq/pd2uqq Vx,Wx (66),(ev)
468 7a: vcvtudq2pd/uqq2pd Vpd,Wx (F3),(ev) | vcvtudq2ps/uqq2ps Vpd,Wx (F2),(ev) | vcvttps2qq/pd2qq Vx,Wx (66),(ev)
469 7b: vcvtusi2sd Vpd,Hpd,Ev (F2),(ev) | vcvtusi2ss Vps,Hps,Ev (F3),(ev) | vcvtps2qq/pd2qq Vx,Wx (66),(ev)
470 7c: vhaddpd Vpd,Hpd,Wpd (66) | vhaddps Vps,Hps,Wps (F2)
471 7d: vhsubpd Vpd,Hpd,Wpd (66) | vhsubps Vps,Hps,Wps (F2)
472 7e: movd/q Ey,Pd | vmovd/q Ey,Vy (66),(v1) | vmovq Vq,Wq (F3),(v1)
473 7f: movq Qq,Pq | vmovdqa Wx,Vx (66) | vmovdqa32/64 Wx,Vx (66),(evo) | vmovdqu Wx,Vx (F3) | vmovdqu32/64 Wx,Vx (F3),(evo) | vmovdqu8/16 Wx,Vx (F2),(ev)
475 # Note: "forced64" is Intel CPU behavior (see comment about CALL insn).
478 82: JB/JC/JNAE Jz (f64)
479 83: JAE/JNB/JNC Jz (f64)
493 90: SETO Eb | kmovw/q Vk,Wk | kmovb/d Vk,Wk (66)
494 91: SETNO Eb | kmovw/q Mv,Vk | kmovb/d Mv,Vk (66)
495 92: SETB/C/NAE Eb | kmovw Vk,Rv | kmovb Vk,Rv (66) | kmovq/d Vk,Rv (F2)
496 93: SETAE/NB/NC Eb | kmovw Gv,Uk | kmovb Gv,Uk (66) | kmovq/d Gv,Uk (F2)
501 98: SETS Eb | kortestw/q Vk,Uk | kortestb/d Vk,Uk (66)
502 99: SETNS Eb | ktestw/q Vk,Uk | ktestb/d Vk,Uk (66)
535 b8: JMPE (!F3) | POPCNT Gv,Ev (F3)
539 bc: BSF Gv,Ev (!F3) | TZCNT Gv,Ev (F3)
540 bd: BSR Gv,Ev (!F3) | LZCNT Gv,Ev (F3)
546 c2: vcmpps Vps,Hps,Wps,Ib | vcmppd Vpd,Hpd,Wpd,Ib (66) | vcmpss Vss,Hss,Wss,Ib (F3),(v1) | vcmpsd Vsd,Hsd,Wsd,Ib (F2),(v1)
548 c4: pinsrw Pq,Ry/Mw,Ib | vpinsrw Vdq,Hdq,Ry/Mw,Ib (66),(v1)
549 c5: pextrw Gd,Nq,Ib | vpextrw Gd,Udq,Ib (66),(v1)
550 c6: vshufps Vps,Hps,Wps,Ib | vshufpd Vpd,Hpd,Wpd,Ib (66)
552 c8: BSWAP RAX/EAX/R8/R8D
553 c9: BSWAP RCX/ECX/R9/R9D
554 ca: BSWAP RDX/EDX/R10/R10D
555 cb: BSWAP RBX/EBX/R11/R11D
556 cc: BSWAP RSP/ESP/R12/R12D
557 cd: BSWAP RBP/EBP/R13/R13D
558 ce: BSWAP RSI/ESI/R14/R14D
559 cf: BSWAP RDI/EDI/R15/R15D
561 d0: vaddsubpd Vpd,Hpd,Wpd (66) | vaddsubps Vps,Hps,Wps (F2)
562 d1: psrlw Pq,Qq | vpsrlw Vx,Hx,Wx (66),(v1)
563 d2: psrld Pq,Qq | vpsrld Vx,Hx,Wx (66),(v1)
564 d3: psrlq Pq,Qq | vpsrlq Vx,Hx,Wx (66),(v1)
565 d4: paddq Pq,Qq | vpaddq Vx,Hx,Wx (66),(v1)
566 d5: pmullw Pq,Qq | vpmullw Vx,Hx,Wx (66),(v1)
567 d6: vmovq Wq,Vq (66),(v1) | movq2dq Vdq,Nq (F3) | movdq2q Pq,Uq (F2)
568 d7: pmovmskb Gd,Nq | vpmovmskb Gd,Ux (66),(v1)
569 d8: psubusb Pq,Qq | vpsubusb Vx,Hx,Wx (66),(v1)
570 d9: psubusw Pq,Qq | vpsubusw Vx,Hx,Wx (66),(v1)
571 da: pminub Pq,Qq | vpminub Vx,Hx,Wx (66),(v1)
572 db: pand Pq,Qq | vpand Vx,Hx,Wx (66),(v1) | vpandd/q Vx,Hx,Wx (66),(evo)
573 dc: paddusb Pq,Qq | vpaddusb Vx,Hx,Wx (66),(v1)
574 dd: paddusw Pq,Qq | vpaddusw Vx,Hx,Wx (66),(v1)
575 de: pmaxub Pq,Qq | vpmaxub Vx,Hx,Wx (66),(v1)
576 df: pandn Pq,Qq | vpandn Vx,Hx,Wx (66),(v1) | vpandnd/q Vx,Hx,Wx (66),(evo)
578 e0: pavgb Pq,Qq | vpavgb Vx,Hx,Wx (66),(v1)
579 e1: psraw Pq,Qq | vpsraw Vx,Hx,Wx (66),(v1)
580 e2: psrad Pq,Qq | vpsrad Vx,Hx,Wx (66),(v1)
581 e3: pavgw Pq,Qq | vpavgw Vx,Hx,Wx (66),(v1)
582 e4: pmulhuw Pq,Qq | vpmulhuw Vx,Hx,Wx (66),(v1)
583 e5: pmulhw Pq,Qq | vpmulhw Vx,Hx,Wx (66),(v1)
584 e6: vcvttpd2dq Vx,Wpd (66) | vcvtdq2pd Vx,Wdq (F3) | vcvtdq2pd/qq2pd Vx,Wdq (F3),(evo) | vcvtpd2dq Vx,Wpd (F2)
585 e7: movntq Mq,Pq | vmovntdq Mx,Vx (66)
586 e8: psubsb Pq,Qq | vpsubsb Vx,Hx,Wx (66),(v1)
587 e9: psubsw Pq,Qq | vpsubsw Vx,Hx,Wx (66),(v1)
588 ea: pminsw Pq,Qq | vpminsw Vx,Hx,Wx (66),(v1)
589 eb: por Pq,Qq | vpor Vx,Hx,Wx (66),(v1) | vpord/q Vx,Hx,Wx (66),(evo)
590 ec: paddsb Pq,Qq | vpaddsb Vx,Hx,Wx (66),(v1)
591 ed: paddsw Pq,Qq | vpaddsw Vx,Hx,Wx (66),(v1)
592 ee: pmaxsw Pq,Qq | vpmaxsw Vx,Hx,Wx (66),(v1)
593 ef: pxor Pq,Qq | vpxor Vx,Hx,Wx (66),(v1) | vpxord/q Vx,Hx,Wx (66),(evo)
595 f0: vlddqu Vx,Mx (F2)
596 f1: psllw Pq,Qq | vpsllw Vx,Hx,Wx (66),(v1)
597 f2: pslld Pq,Qq | vpslld Vx,Hx,Wx (66),(v1)
598 f3: psllq Pq,Qq | vpsllq Vx,Hx,Wx (66),(v1)
599 f4: pmuludq Pq,Qq | vpmuludq Vx,Hx,Wx (66),(v1)
600 f5: pmaddwd Pq,Qq | vpmaddwd Vx,Hx,Wx (66),(v1)
601 f6: psadbw Pq,Qq | vpsadbw Vx,Hx,Wx (66),(v1)
602 f7: maskmovq Pq,Nq | vmaskmovdqu Vx,Ux (66),(v1)
603 f8: psubb Pq,Qq | vpsubb Vx,Hx,Wx (66),(v1)
604 f9: psubw Pq,Qq | vpsubw Vx,Hx,Wx (66),(v1)
605 fa: psubd Pq,Qq | vpsubd Vx,Hx,Wx (66),(v1)
606 fb: psubq Pq,Qq | vpsubq Vx,Hx,Wx (66),(v1)
607 fc: paddb Pq,Qq | vpaddb Vx,Hx,Wx (66),(v1)
608 fd: paddw Pq,Qq | vpaddw Vx,Hx,Wx (66),(v1)
609 fe: paddd Pq,Qq | vpaddd Vx,Hx,Wx (66),(v1)
613 Table: 3-byte opcode 1 (0x0f 0x38)
614 Referrer: 3-byte escape 1
616 # 0x0f 0x38 0x00-0x0f
617 00: pshufb Pq,Qq | vpshufb Vx,Hx,Wx (66),(v1)
618 01: phaddw Pq,Qq | vphaddw Vx,Hx,Wx (66),(v1)
619 02: phaddd Pq,Qq | vphaddd Vx,Hx,Wx (66),(v1)
620 03: phaddsw Pq,Qq | vphaddsw Vx,Hx,Wx (66),(v1)
621 04: pmaddubsw Pq,Qq | vpmaddubsw Vx,Hx,Wx (66),(v1)
622 05: phsubw Pq,Qq | vphsubw Vx,Hx,Wx (66),(v1)
623 06: phsubd Pq,Qq | vphsubd Vx,Hx,Wx (66),(v1)
624 07: phsubsw Pq,Qq | vphsubsw Vx,Hx,Wx (66),(v1)
625 08: psignb Pq,Qq | vpsignb Vx,Hx,Wx (66),(v1)
626 09: psignw Pq,Qq | vpsignw Vx,Hx,Wx (66),(v1)
627 0a: psignd Pq,Qq | vpsignd Vx,Hx,Wx (66),(v1)
628 0b: pmulhrsw Pq,Qq | vpmulhrsw Vx,Hx,Wx (66),(v1)
629 0c: vpermilps Vx,Hx,Wx (66),(v)
630 0d: vpermilpd Vx,Hx,Wx (66),(v)
631 0e: vtestps Vx,Wx (66),(v)
632 0f: vtestpd Vx,Wx (66),(v)
633 # 0x0f 0x38 0x10-0x1f
634 10: pblendvb Vdq,Wdq (66) | vpsrlvw Vx,Hx,Wx (66),(evo) | vpmovuswb Wx,Vx (F3),(ev)
635 11: vpmovusdb Wx,Vd (F3),(ev) | vpsravw Vx,Hx,Wx (66),(ev)
636 12: vpmovusqb Wx,Vq (F3),(ev) | vpsllvw Vx,Hx,Wx (66),(ev)
637 13: vcvtph2ps Vx,Wx (66),(v) | vpmovusdw Wx,Vd (F3),(ev)
638 14: blendvps Vdq,Wdq (66) | vpmovusqw Wx,Vq (F3),(ev) | vprorvd/q Vx,Hx,Wx (66),(evo)
639 15: blendvpd Vdq,Wdq (66) | vpmovusqd Wx,Vq (F3),(ev) | vprolvd/q Vx,Hx,Wx (66),(evo)
640 16: vpermps Vqq,Hqq,Wqq (66),(v) | vpermps/d Vqq,Hqq,Wqq (66),(evo)
641 17: vptest Vx,Wx (66)
642 18: vbroadcastss Vx,Wd (66),(v)
643 19: vbroadcastsd Vqq,Wq (66),(v) | vbroadcastf32x2 Vqq,Wq (66),(evo)
644 1a: vbroadcastf128 Vqq,Mdq (66),(v) | vbroadcastf32x4/64x2 Vqq,Wq (66),(evo)
645 1b: vbroadcastf32x8/64x4 Vqq,Mdq (66),(ev)
646 1c: pabsb Pq,Qq | vpabsb Vx,Wx (66),(v1)
647 1d: pabsw Pq,Qq | vpabsw Vx,Wx (66),(v1)
648 1e: pabsd Pq,Qq | vpabsd Vx,Wx (66),(v1)
649 1f: vpabsq Vx,Wx (66),(ev)
650 # 0x0f 0x38 0x20-0x2f
651 20: vpmovsxbw Vx,Ux/Mq (66),(v1) | vpmovswb Wx,Vx (F3),(ev)
652 21: vpmovsxbd Vx,Ux/Md (66),(v1) | vpmovsdb Wx,Vd (F3),(ev)
653 22: vpmovsxbq Vx,Ux/Mw (66),(v1) | vpmovsqb Wx,Vq (F3),(ev)
654 23: vpmovsxwd Vx,Ux/Mq (66),(v1) | vpmovsdw Wx,Vd (F3),(ev)
655 24: vpmovsxwq Vx,Ux/Md (66),(v1) | vpmovsqw Wx,Vq (F3),(ev)
656 25: vpmovsxdq Vx,Ux/Mq (66),(v1) | vpmovsqd Wx,Vq (F3),(ev)
657 26: vptestmb/w Vk,Hx,Wx (66),(ev) | vptestnmb/w Vk,Hx,Wx (F3),(ev)
658 27: vptestmd/q Vk,Hx,Wx (66),(ev) | vptestnmd/q Vk,Hx,Wx (F3),(ev)
659 28: vpmuldq Vx,Hx,Wx (66),(v1) | vpmovm2b/w Vx,Uk (F3),(ev)
660 29: vpcmpeqq Vx,Hx,Wx (66),(v1) | vpmovb2m/w2m Vk,Ux (F3),(ev)
661 2a: vmovntdqa Vx,Mx (66),(v1) | vpbroadcastmb2q Vx,Uk (F3),(ev)
662 2b: vpackusdw Vx,Hx,Wx (66),(v1)
663 2c: vmaskmovps Vx,Hx,Mx (66),(v) | vscalefps/d Vx,Hx,Wx (66),(evo)
664 2d: vmaskmovpd Vx,Hx,Mx (66),(v) | vscalefss/d Vx,Hx,Wx (66),(evo)
665 2e: vmaskmovps Mx,Hx,Vx (66),(v)
666 2f: vmaskmovpd Mx,Hx,Vx (66),(v)
667 # 0x0f 0x38 0x30-0x3f
668 30: vpmovzxbw Vx,Ux/Mq (66),(v1) | vpmovwb Wx,Vx (F3),(ev)
669 31: vpmovzxbd Vx,Ux/Md (66),(v1) | vpmovdb Wx,Vd (F3),(ev)
670 32: vpmovzxbq Vx,Ux/Mw (66),(v1) | vpmovqb Wx,Vq (F3),(ev)
671 33: vpmovzxwd Vx,Ux/Mq (66),(v1) | vpmovdw Wx,Vd (F3),(ev)
672 34: vpmovzxwq Vx,Ux/Md (66),(v1) | vpmovqw Wx,Vq (F3),(ev)
673 35: vpmovzxdq Vx,Ux/Mq (66),(v1) | vpmovqd Wx,Vq (F3),(ev)
674 36: vpermd Vqq,Hqq,Wqq (66),(v) | vpermd/q Vqq,Hqq,Wqq (66),(evo)
675 37: vpcmpgtq Vx,Hx,Wx (66),(v1)
676 38: vpminsb Vx,Hx,Wx (66),(v1) | vpmovm2d/q Vx,Uk (F3),(ev)
677 39: vpminsd Vx,Hx,Wx (66),(v1) | vpminsd/q Vx,Hx,Wx (66),(evo) | vpmovd2m/q2m Vk,Ux (F3),(ev)
678 3a: vpminuw Vx,Hx,Wx (66),(v1) | vpbroadcastmw2d Vx,Uk (F3),(ev)
679 3b: vpminud Vx,Hx,Wx (66),(v1) | vpminud/q Vx,Hx,Wx (66),(evo)
680 3c: vpmaxsb Vx,Hx,Wx (66),(v1)
681 3d: vpmaxsd Vx,Hx,Wx (66),(v1) | vpmaxsd/q Vx,Hx,Wx (66),(evo)
682 3e: vpmaxuw Vx,Hx,Wx (66),(v1)
683 3f: vpmaxud Vx,Hx,Wx (66),(v1) | vpmaxud/q Vx,Hx,Wx (66),(evo)
684 # 0x0f 0x38 0x40-0x8f
685 40: vpmulld Vx,Hx,Wx (66),(v1) | vpmulld/q Vx,Hx,Wx (66),(evo)
686 41: vphminposuw Vdq,Wdq (66),(v1)
687 42: vgetexpps/d Vx,Wx (66),(ev)
688 43: vgetexpss/d Vx,Hx,Wx (66),(ev)
689 44: vplzcntd/q Vx,Wx (66),(ev)
690 45: vpsrlvd/q Vx,Hx,Wx (66),(v)
691 46: vpsravd Vx,Hx,Wx (66),(v) | vpsravd/q Vx,Hx,Wx (66),(evo)
692 47: vpsllvd/q Vx,Hx,Wx (66),(v)
694 4c: vrcp14ps/d Vpd,Wpd (66),(ev)
695 4d: vrcp14ss/d Vsd,Hpd,Wsd (66),(ev)
696 4e: vrsqrt14ps/d Vpd,Wpd (66),(ev)
697 4f: vrsqrt14ss/d Vsd,Hsd,Wsd (66),(ev)
699 58: vpbroadcastd Vx,Wx (66),(v)
700 59: vpbroadcastq Vx,Wx (66),(v) | vbroadcasti32x2 Vx,Wx (66),(evo)
701 5a: vbroadcasti128 Vqq,Mdq (66),(v) | vbroadcasti32x4/64x2 Vx,Wx (66),(evo)
702 5b: vbroadcasti32x8/64x4 Vqq,Mdq (66),(ev)
704 64: vpblendmd/q Vx,Hx,Wx (66),(ev)
705 65: vblendmps/d Vx,Hx,Wx (66),(ev)
706 66: vpblendmb/w Vx,Hx,Wx (66),(ev)
708 75: vpermi2b/w Vx,Hx,Wx (66),(ev)
709 76: vpermi2d/q Vx,Hx,Wx (66),(ev)
710 77: vpermi2ps/d Vx,Hx,Wx (66),(ev)
711 78: vpbroadcastb Vx,Wx (66),(v)
712 79: vpbroadcastw Vx,Wx (66),(v)
713 7a: vpbroadcastb Vx,Rv (66),(ev)
714 7b: vpbroadcastw Vx,Rv (66),(ev)
715 7c: vpbroadcastd/q Vx,Rv (66),(ev)
716 7d: vpermt2b/w Vx,Hx,Wx (66),(ev)
717 7e: vpermt2d/q Vx,Hx,Wx (66),(ev)
718 7f: vpermt2ps/d Vx,Hx,Wx (66),(ev)
719 80: INVEPT Gy,Mdq (66)
720 81: INVVPID Gy,Mdq (66)
721 82: INVPCID Gy,Mdq (66)
722 83: vpmultishiftqb Vx,Hx,Wx (66),(ev)
723 88: vexpandps/d Vpd,Wpd (66),(ev)
724 89: vpexpandd/q Vx,Wx (66),(ev)
725 8a: vcompressps/d Wx,Vx (66),(ev)
726 8b: vpcompressd/q Wx,Vx (66),(ev)
727 8c: vpmaskmovd/q Vx,Hx,Mx (66),(v)
728 8d: vpermb/w Vx,Hx,Wx (66),(ev)
729 8e: vpmaskmovd/q Mx,Vx,Hx (66),(v)
730 # 0x0f 0x38 0x90-0xbf (FMA)
731 90: vgatherdd/q Vx,Hx,Wx (66),(v) | vpgatherdd/q Vx,Wx (66),(evo)
732 91: vgatherqd/q Vx,Hx,Wx (66),(v) | vpgatherqd/q Vx,Wx (66),(evo)
733 92: vgatherdps/d Vx,Hx,Wx (66),(v)
734 93: vgatherqps/d Vx,Hx,Wx (66),(v)
737 96: vfmaddsub132ps/d Vx,Hx,Wx (66),(v)
738 97: vfmsubadd132ps/d Vx,Hx,Wx (66),(v)
739 98: vfmadd132ps/d Vx,Hx,Wx (66),(v)
740 99: vfmadd132ss/d Vx,Hx,Wx (66),(v),(v1)
741 9a: vfmsub132ps/d Vx,Hx,Wx (66),(v)
742 9b: vfmsub132ss/d Vx,Hx,Wx (66),(v),(v1)
743 9c: vfnmadd132ps/d Vx,Hx,Wx (66),(v)
744 9d: vfnmadd132ss/d Vx,Hx,Wx (66),(v),(v1)
745 9e: vfnmsub132ps/d Vx,Hx,Wx (66),(v)
746 9f: vfnmsub132ss/d Vx,Hx,Wx (66),(v),(v1)
747 a0: vpscatterdd/q Wx,Vx (66),(ev)
748 a1: vpscatterqd/q Wx,Vx (66),(ev)
749 a2: vscatterdps/d Wx,Vx (66),(ev)
750 a3: vscatterqps/d Wx,Vx (66),(ev)
751 a6: vfmaddsub213ps/d Vx,Hx,Wx (66),(v)
752 a7: vfmsubadd213ps/d Vx,Hx,Wx (66),(v)
753 a8: vfmadd213ps/d Vx,Hx,Wx (66),(v)
754 a9: vfmadd213ss/d Vx,Hx,Wx (66),(v),(v1)
755 aa: vfmsub213ps/d Vx,Hx,Wx (66),(v)
756 ab: vfmsub213ss/d Vx,Hx,Wx (66),(v),(v1)
757 ac: vfnmadd213ps/d Vx,Hx,Wx (66),(v)
758 ad: vfnmadd213ss/d Vx,Hx,Wx (66),(v),(v1)
759 ae: vfnmsub213ps/d Vx,Hx,Wx (66),(v)
760 af: vfnmsub213ss/d Vx,Hx,Wx (66),(v),(v1)
761 b4: vpmadd52luq Vx,Hx,Wx (66),(ev)
762 b5: vpmadd52huq Vx,Hx,Wx (66),(ev)
763 b6: vfmaddsub231ps/d Vx,Hx,Wx (66),(v)
764 b7: vfmsubadd231ps/d Vx,Hx,Wx (66),(v)
765 b8: vfmadd231ps/d Vx,Hx,Wx (66),(v)
766 b9: vfmadd231ss/d Vx,Hx,Wx (66),(v),(v1)
767 ba: vfmsub231ps/d Vx,Hx,Wx (66),(v)
768 bb: vfmsub231ss/d Vx,Hx,Wx (66),(v),(v1)
769 bc: vfnmadd231ps/d Vx,Hx,Wx (66),(v)
770 bd: vfnmadd231ss/d Vx,Hx,Wx (66),(v),(v1)
771 be: vfnmsub231ps/d Vx,Hx,Wx (66),(v)
772 bf: vfnmsub231ss/d Vx,Hx,Wx (66),(v),(v1)
773 # 0x0f 0x38 0xc0-0xff
774 c4: vpconflictd/q Vx,Wx (66),(ev)
777 c8: sha1nexte Vdq,Wdq | vexp2ps/d Vx,Wx (66),(ev)
779 ca: sha1msg2 Vdq,Wdq | vrcp28ps/d Vx,Wx (66),(ev)
780 cb: sha256rnds2 Vdq,Wdq | vrcp28ss/d Vx,Hx,Wx (66),(ev)
781 cc: sha256msg1 Vdq,Wdq | vrsqrt28ps/d Vx,Wx (66),(ev)
782 cd: sha256msg2 Vdq,Wdq | vrsqrt28ss/d Vx,Hx,Wx (66),(ev)
783 db: VAESIMC Vdq,Wdq (66),(v1)
784 dc: VAESENC Vdq,Hdq,Wdq (66),(v1)
785 dd: VAESENCLAST Vdq,Hdq,Wdq (66),(v1)
786 de: VAESDEC Vdq,Hdq,Wdq (66),(v1)
787 df: VAESDECLAST Vdq,Hdq,Wdq (66),(v1)
788 f0: MOVBE Gy,My | MOVBE Gw,Mw (66) | CRC32 Gd,Eb (F2) | CRC32 Gd,Eb (66&F2)
789 f1: MOVBE My,Gy | MOVBE Mw,Gw (66) | CRC32 Gd,Ey (F2) | CRC32 Gd,Ew (66&F2)
790 f2: ANDN Gy,By,Ey (v)
792 f5: BZHI Gy,Ey,By (v) | PEXT Gy,By,Ey (F3),(v) | PDEP Gy,By,Ey (F2),(v)
793 f6: ADCX Gy,Ey (66) | ADOX Gy,Ey (F3) | MULX By,Gy,rDX,Ey (F2),(v)
794 f7: BEXTR Gy,Ey,By (v) | SHLX Gy,Ey,By (66),(v) | SARX Gy,Ey,By (F3),(v) | SHRX Gy,Ey,By (F2),(v)
797 Table: 3-byte opcode 2 (0x0f 0x3a)
798 Referrer: 3-byte escape 2
800 # 0x0f 0x3a 0x00-0xff
801 00: vpermq Vqq,Wqq,Ib (66),(v)
802 01: vpermpd Vqq,Wqq,Ib (66),(v)
803 02: vpblendd Vx,Hx,Wx,Ib (66),(v)
804 03: valignd/q Vx,Hx,Wx,Ib (66),(ev)
805 04: vpermilps Vx,Wx,Ib (66),(v)
806 05: vpermilpd Vx,Wx,Ib (66),(v)
807 06: vperm2f128 Vqq,Hqq,Wqq,Ib (66),(v)
809 08: vroundps Vx,Wx,Ib (66) | vrndscaleps Vx,Wx,Ib (66),(evo)
810 09: vroundpd Vx,Wx,Ib (66) | vrndscalepd Vx,Wx,Ib (66),(evo)
811 0a: vroundss Vss,Wss,Ib (66),(v1) | vrndscaless Vx,Hx,Wx,Ib (66),(evo)
812 0b: vroundsd Vsd,Wsd,Ib (66),(v1) | vrndscalesd Vx,Hx,Wx,Ib (66),(evo)
813 0c: vblendps Vx,Hx,Wx,Ib (66)
814 0d: vblendpd Vx,Hx,Wx,Ib (66)
815 0e: vpblendw Vx,Hx,Wx,Ib (66),(v1)
816 0f: palignr Pq,Qq,Ib | vpalignr Vx,Hx,Wx,Ib (66),(v1)
817 14: vpextrb Rd/Mb,Vdq,Ib (66),(v1)
818 15: vpextrw Rd/Mw,Vdq,Ib (66),(v1)
819 16: vpextrd/q Ey,Vdq,Ib (66),(v1)
820 17: vextractps Ed,Vdq,Ib (66),(v1)
821 18: vinsertf128 Vqq,Hqq,Wqq,Ib (66),(v) | vinsertf32x4/64x2 Vqq,Hqq,Wqq,Ib (66),(evo)
822 19: vextractf128 Wdq,Vqq,Ib (66),(v) | vextractf32x4/64x2 Wdq,Vqq,Ib (66),(evo)
823 1a: vinsertf32x8/64x4 Vqq,Hqq,Wqq,Ib (66),(ev)
824 1b: vextractf32x8/64x4 Wdq,Vqq,Ib (66),(ev)
825 1d: vcvtps2ph Wx,Vx,Ib (66),(v)
826 1e: vpcmpud/q Vk,Hd,Wd,Ib (66),(ev)
827 1f: vpcmpd/q Vk,Hd,Wd,Ib (66),(ev)
828 20: vpinsrb Vdq,Hdq,Ry/Mb,Ib (66),(v1)
829 21: vinsertps Vdq,Hdq,Udq/Md,Ib (66),(v1)
830 22: vpinsrd/q Vdq,Hdq,Ey,Ib (66),(v1)
831 23: vshuff32x4/64x2 Vx,Hx,Wx,Ib (66),(ev)
832 25: vpternlogd/q Vx,Hx,Wx,Ib (66),(ev)
833 26: vgetmantps/d Vx,Wx,Ib (66),(ev)
834 27: vgetmantss/d Vx,Hx,Wx,Ib (66),(ev)
835 30: kshiftrb/w Vk,Uk,Ib (66),(v)
836 31: kshiftrd/q Vk,Uk,Ib (66),(v)
837 32: kshiftlb/w Vk,Uk,Ib (66),(v)
838 33: kshiftld/q Vk,Uk,Ib (66),(v)
839 38: vinserti128 Vqq,Hqq,Wqq,Ib (66),(v) | vinserti32x4/64x2 Vqq,Hqq,Wqq,Ib (66),(evo)
840 39: vextracti128 Wdq,Vqq,Ib (66),(v) | vextracti32x4/64x2 Wdq,Vqq,Ib (66),(evo)
841 3a: vinserti32x8/64x4 Vqq,Hqq,Wqq,Ib (66),(ev)
842 3b: vextracti32x8/64x4 Wdq,Vqq,Ib (66),(ev)
843 3e: vpcmpub/w Vk,Hk,Wx,Ib (66),(ev)
844 3f: vpcmpb/w Vk,Hk,Wx,Ib (66),(ev)
845 40: vdpps Vx,Hx,Wx,Ib (66)
846 41: vdppd Vdq,Hdq,Wdq,Ib (66),(v1)
847 42: vmpsadbw Vx,Hx,Wx,Ib (66),(v1) | vdbpsadbw Vx,Hx,Wx,Ib (66),(evo)
848 43: vshufi32x4/64x2 Vx,Hx,Wx,Ib (66),(ev)
849 44: vpclmulqdq Vdq,Hdq,Wdq,Ib (66),(v1)
850 46: vperm2i128 Vqq,Hqq,Wqq,Ib (66),(v)
851 4a: vblendvps Vx,Hx,Wx,Lx (66),(v)
852 4b: vblendvpd Vx,Hx,Wx,Lx (66),(v)
853 4c: vpblendvb Vx,Hx,Wx,Lx (66),(v1)
854 50: vrangeps/d Vx,Hx,Wx,Ib (66),(ev)
855 51: vrangess/d Vx,Hx,Wx,Ib (66),(ev)
856 54: vfixupimmps/d Vx,Hx,Wx,Ib (66),(ev)
857 55: vfixupimmss/d Vx,Hx,Wx,Ib (66),(ev)
858 56: vreduceps/d Vx,Wx,Ib (66),(ev)
859 57: vreducess/d Vx,Hx,Wx,Ib (66),(ev)
860 60: vpcmpestrm Vdq,Wdq,Ib (66),(v1)
861 61: vpcmpestri Vdq,Wdq,Ib (66),(v1)
862 62: vpcmpistrm Vdq,Wdq,Ib (66),(v1)
863 63: vpcmpistri Vdq,Wdq,Ib (66),(v1)
864 66: vfpclassps/d Vk,Wx,Ib (66),(ev)
865 67: vfpclassss/d Vk,Wx,Ib (66),(ev)
866 cc: sha1rnds4 Vdq,Wdq,Ib
867 df: VAESKEYGEN Vdq,Wdq,Ib (66),(v1)
868 f0: RORX Gy,Ey,Ib (F2),(v)
927 # Note: "forced64" is Intel CPU behavior (see comment about CALL insn).
946 0: SGDT Ms | VMCALL (001),(11B) | VMLAUNCH (010),(11B) | VMRESUME (011),(11B) | VMXOFF (100),(11B)
947 1: SIDT Ms | MONITOR (000),(11B) | MWAIT (001),(11B) | CLAC (010),(11B) | STAC (011),(11B)
948 2: LGDT Ms | XGETBV (000),(11B) | XSETBV (001),(11B) | VMFUNC (100),(11B) | XEND (101),(11B) | XTEST (110),(11B)
951 5: rdpkru (110),(11B) | wrpkru (111),(11B)
953 7: INVLPG Mb | SWAPGS (o64),(000),(11B) | RDTSCP (001),(11B)
964 1: CMPXCHG8B/16B Mq/Mdq
968 6: VMPTRLD Mq | VMCLEAR Mq (66) | VMXON Mq (F3) | RDRAND Rv (11B)
969 7: VMPTRST Mq | VMPTRST Mq (F3) | RDSEED Rv (11B)
984 # Grp11A and Grp11B are expressed as Grp11 in Intel SDM
987 7: XABORT Ib (000),(11B)
992 7: XBEGIN Jz (000),(11B)
996 2: psrlw Nq,Ib (11B) | vpsrlw Hx,Ux,Ib (66),(11B),(v1)
997 4: psraw Nq,Ib (11B) | vpsraw Hx,Ux,Ib (66),(11B),(v1)
998 6: psllw Nq,Ib (11B) | vpsllw Hx,Ux,Ib (66),(11B),(v1)
1002 0: vprord/q Hx,Wx,Ib (66),(ev)
1003 1: vprold/q Hx,Wx,Ib (66),(ev)
1004 2: psrld Nq,Ib (11B) | vpsrld Hx,Ux,Ib (66),(11B),(v1)
1005 4: psrad Nq,Ib (11B) | vpsrad Hx,Ux,Ib (66),(11B),(v1) | vpsrad/q Hx,Ux,Ib (66),(evo)
1006 6: pslld Nq,Ib (11B) | vpslld Hx,Ux,Ib (66),(11B),(v1)
1010 2: psrlq Nq,Ib (11B) | vpsrlq Hx,Ux,Ib (66),(11B),(v1)
1011 3: vpsrldq Hx,Ux,Ib (66),(11B),(v1)
1012 6: psllq Nq,Ib (11B) | vpsllq Hx,Ux,Ib (66),(11B),(v1)
1013 7: vpslldq Hx,Ux,Ib (66),(11B),(v1)
1017 0: fxsave | RDFSBASE Ry (F3),(11B)
1018 1: fxrstor | RDGSBASE Ry (F3),(11B)
1019 2: vldmxcsr Md (v1) | WRFSBASE Ry (F3),(11B)
1020 3: vstmxcsr Md (v1) | WRGSBASE Ry (F3),(11B)
1021 4: XSAVE | ptwrite Ey (F3),(11B)
1022 5: XRSTOR | lfence (11B)
1023 6: XSAVEOPT | clwb (66) | mfence (11B)
1024 7: clflush | clflushopt (66) | sfence (11B)
1041 1: vgatherpf0dps/d Wx (66),(ev)
1042 2: vgatherpf1dps/d Wx (66),(ev)
1043 5: vscatterpf0dps/d Wx (66),(ev)
1044 6: vscatterpf1dps/d Wx (66),(ev)
1048 1: vgatherpf0qps/d Wx (66),(ev)
1049 2: vgatherpf1qps/d Wx (66),(ev)
1050 5: vscatterpf0qps/d Wx (66),(ev)
1051 6: vscatterpf1qps/d Wx (66),(ev)
1054 # AMD's Prefetch Group