1 //===-- BUFInstructions.td - Buffer Instruction Defintions ----------------===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
9 def MUBUFAddr32 : ComplexPattern<i64, 9, "SelectMUBUFAddr32">;
10 def MUBUFAddr64 : ComplexPattern<i64, 8, "SelectMUBUFAddr64">;
11 def MUBUFAddr64Atomic : ComplexPattern<i64, 5, "SelectMUBUFAddr64">;
13 def MUBUFScratchOffen : ComplexPattern<i64, 4, "SelectMUBUFScratchOffen", [], [SDNPWantParent]>;
14 def MUBUFScratchOffset : ComplexPattern<i64, 3, "SelectMUBUFScratchOffset", [], [SDNPWantParent], 20>;
16 def MUBUFOffset : ComplexPattern<i64, 7, "SelectMUBUFOffset">;
17 def MUBUFOffsetNoGLC : ComplexPattern<i64, 3, "SelectMUBUFOffset">;
18 def MUBUFOffsetAtomic : ComplexPattern<i64, 4, "SelectMUBUFOffset">;
28 class getAddrName<int addrKind> {
30 !if(!eq(addrKind, BUFAddrKind.Offset), "offset",
31 !if(!eq(addrKind, BUFAddrKind.OffEn), "offen",
32 !if(!eq(addrKind, BUFAddrKind.IdxEn), "idxen",
33 !if(!eq(addrKind, BUFAddrKind.BothEn), "bothen",
34 !if(!eq(addrKind, BUFAddrKind.Addr64), "addr64",
38 class MUBUFAddr64Table <bit is_addr64, string Name> {
39 bit IsAddr64 = is_addr64;
43 class MUBUFLdsTable <bit is_lds, string Name> {
48 class MTBUFAddr64Table <bit is_addr64, string Name> {
49 bit IsAddr64 = is_addr64;
53 //===----------------------------------------------------------------------===//
55 //===----------------------------------------------------------------------===//
57 class MTBUF_Pseudo <string opName, dag outs, dag ins,
58 string asmOps, list<dag> pattern=[]> :
59 InstSI<outs, ins, "", pattern>,
60 SIMCInstr<opName, SIEncodingFamily.NONE> {
63 let isCodeGenOnly = 1;
65 let UseNamedOperandTable = 1;
67 string Mnemonic = opName;
68 string AsmOperands = asmOps;
74 let hasSideEffects = 0;
75 let SchedRW = [WriteVMEM];
77 let AsmMatchConverter = "cvtMtbuf";
82 bits<1> has_vdata = 1;
83 bits<1> has_vaddr = 1;
86 bits<1> glc_value = 0; // the value for glc if no such operand
87 bits<1> dlc_value = 0; // the value for dlc if no such operand
88 bits<1> has_srsrc = 1;
89 bits<1> has_soffset = 1;
90 bits<1> has_offset = 1;
95 class MTBUF_Real <MTBUF_Pseudo ps> :
96 InstSI <ps.OutOperandList, ps.InOperandList, ps.Mnemonic # ps.AsmOperands, []> {
99 let isCodeGenOnly = 0;
101 // copy relevant pseudo op flags
102 let SubtargetPredicate = ps.SubtargetPredicate;
103 let AsmMatchConverter = ps.AsmMatchConverter;
104 let Constraints = ps.Constraints;
105 let DisableEncoding = ps.DisableEncoding;
106 let TSFlags = ps.TSFlags;
119 bits<4> dfmt = format{3-0};
120 bits<3> nfmt = format{6-4};
123 class getMTBUFInsDA<list<RegisterClass> vdataList,
124 list<RegisterClass> vaddrList=[]> {
125 RegisterClass vdataClass = !if(!empty(vdataList), ?, !head(vdataList));
126 RegisterClass vaddrClass = !if(!empty(vaddrList), ?, !head(vaddrList));
127 dag InsNoData = !if(!empty(vaddrList),
128 (ins SReg_128:$srsrc, SCSrc_b32:$soffset,
129 offset:$offset, FORMAT:$format, GLC:$glc, SLC:$slc, TFE:$tfe, DLC:$dlc),
130 (ins vaddrClass:$vaddr, SReg_128:$srsrc, SCSrc_b32:$soffset,
131 offset:$offset, FORMAT:$format, GLC:$glc, SLC:$slc, TFE:$tfe, DLC:$dlc)
133 dag InsData = !if(!empty(vaddrList),
134 (ins vdataClass:$vdata, SReg_128:$srsrc,
135 SCSrc_b32:$soffset, offset:$offset, FORMAT:$format, GLC:$glc,
136 SLC:$slc, TFE:$tfe, DLC:$dlc),
137 (ins vdataClass:$vdata, vaddrClass:$vaddr, SReg_128:$srsrc,
138 SCSrc_b32:$soffset, offset:$offset, FORMAT:$format, GLC:$glc,
139 SLC:$slc, TFE:$tfe, DLC:$dlc)
141 dag ret = !if(!empty(vdataList), InsNoData, InsData);
144 class getMTBUFIns<int addrKind, list<RegisterClass> vdataList=[]> {
146 !if(!eq(addrKind, BUFAddrKind.Offset), getMTBUFInsDA<vdataList>.ret,
147 !if(!eq(addrKind, BUFAddrKind.OffEn), getMTBUFInsDA<vdataList, [VGPR_32]>.ret,
148 !if(!eq(addrKind, BUFAddrKind.IdxEn), getMTBUFInsDA<vdataList, [VGPR_32]>.ret,
149 !if(!eq(addrKind, BUFAddrKind.BothEn), getMTBUFInsDA<vdataList, [VReg_64]>.ret,
150 !if(!eq(addrKind, BUFAddrKind.Addr64), getMTBUFInsDA<vdataList, [VReg_64]>.ret,
154 class getMTBUFAsmOps<int addrKind> {
156 !if(!eq(addrKind, BUFAddrKind.Offset), "off, $srsrc, $format, $soffset",
157 !if(!eq(addrKind, BUFAddrKind.OffEn),
158 "$vaddr, $srsrc, $format, $soffset offen",
159 !if(!eq(addrKind, BUFAddrKind.IdxEn),
160 "$vaddr, $srsrc, $format, $soffset idxen",
161 !if(!eq(addrKind, BUFAddrKind.BothEn),
162 "$vaddr, $srsrc, $format, $soffset idxen offen",
163 !if(!eq(addrKind, BUFAddrKind.Addr64),
164 "$vaddr, $srsrc, $format, $soffset addr64",
166 string ret = Pfx # "$offset";
169 class MTBUF_SetupAddr<int addrKind> {
170 bits<1> offen = !if(!eq(addrKind, BUFAddrKind.OffEn), 1,
171 !if(!eq(addrKind, BUFAddrKind.BothEn), 1 , 0));
173 bits<1> idxen = !if(!eq(addrKind, BUFAddrKind.IdxEn), 1,
174 !if(!eq(addrKind, BUFAddrKind.BothEn), 1 , 0));
176 bits<1> addr64 = !if(!eq(addrKind, BUFAddrKind.Addr64), 1, 0);
178 bits<1> has_vaddr = !if(!eq(addrKind, BUFAddrKind.Offset), 0, 1);
181 class MTBUF_Load_Pseudo <string opName,
183 RegisterClass vdataClass,
184 list<dag> pattern=[],
185 // Workaround bug bz30254
186 int addrKindCopy = addrKind>
187 : MTBUF_Pseudo<opName,
188 (outs vdataClass:$vdata),
189 getMTBUFIns<addrKindCopy>.ret,
190 " $vdata, " # getMTBUFAsmOps<addrKindCopy>.ret # "$glc$slc$tfe$dlc",
192 MTBUF_SetupAddr<addrKindCopy> {
193 let PseudoInstr = opName # "_" # getAddrName<addrKindCopy>.ret;
198 multiclass MTBUF_Pseudo_Loads<string opName, RegisterClass vdataClass,
199 ValueType load_vt = i32,
200 SDPatternOperator ld = null_frag> {
202 def _OFFSET : MTBUF_Load_Pseudo <opName, BUFAddrKind.Offset, vdataClass,
203 [(set load_vt:$vdata,
204 (ld (MUBUFOffset v4i32:$srsrc, i32:$soffset, i16:$offset, i8:$format,
205 i1:$glc, i1:$slc, i1:$tfe, i1:$dlc)))]>,
206 MTBUFAddr64Table<0, NAME>;
208 def _ADDR64 : MTBUF_Load_Pseudo <opName, BUFAddrKind.Addr64, vdataClass,
209 [(set load_vt:$vdata,
210 (ld (MUBUFAddr64 v4i32:$srsrc, i64:$vaddr, i32:$soffset, i16:$offset,
211 i8:$format, i1:$glc, i1:$slc, i1:$tfe, i1:$dlc)))]>,
212 MTBUFAddr64Table<1, NAME>;
214 def _OFFEN : MTBUF_Load_Pseudo <opName, BUFAddrKind.OffEn, vdataClass>;
215 def _IDXEN : MTBUF_Load_Pseudo <opName, BUFAddrKind.IdxEn, vdataClass>;
216 def _BOTHEN : MTBUF_Load_Pseudo <opName, BUFAddrKind.BothEn, vdataClass>;
218 let DisableWQM = 1 in {
219 def _OFFSET_exact : MTBUF_Load_Pseudo <opName, BUFAddrKind.Offset, vdataClass>;
220 def _OFFEN_exact : MTBUF_Load_Pseudo <opName, BUFAddrKind.OffEn, vdataClass>;
221 def _IDXEN_exact : MTBUF_Load_Pseudo <opName, BUFAddrKind.IdxEn, vdataClass>;
222 def _BOTHEN_exact : MTBUF_Load_Pseudo <opName, BUFAddrKind.BothEn, vdataClass>;
226 class MTBUF_Store_Pseudo <string opName,
228 RegisterClass vdataClass,
229 list<dag> pattern=[],
230 // Workaround bug bz30254
231 int addrKindCopy = addrKind,
232 RegisterClass vdataClassCopy = vdataClass>
233 : MTBUF_Pseudo<opName,
235 getMTBUFIns<addrKindCopy, [vdataClassCopy]>.ret,
236 " $vdata, " # getMTBUFAsmOps<addrKindCopy>.ret # "$glc$slc$tfe$dlc",
238 MTBUF_SetupAddr<addrKindCopy> {
239 let PseudoInstr = opName # "_" # getAddrName<addrKindCopy>.ret;
244 multiclass MTBUF_Pseudo_Stores<string opName, RegisterClass vdataClass,
245 ValueType store_vt = i32,
246 SDPatternOperator st = null_frag> {
248 def _OFFSET : MTBUF_Store_Pseudo <opName, BUFAddrKind.Offset, vdataClass,
249 [(st store_vt:$vdata, (MUBUFOffset v4i32:$srsrc, i32:$soffset,
250 i16:$offset, i8:$format, i1:$glc,
251 i1:$slc, i1:$tfe, i1:$dlc))]>,
252 MTBUFAddr64Table<0, NAME>;
254 def _ADDR64 : MTBUF_Store_Pseudo <opName, BUFAddrKind.Addr64, vdataClass,
255 [(st store_vt:$vdata, (MUBUFAddr64 v4i32:$srsrc, i64:$vaddr, i32:$soffset,
256 i16:$offset, i8:$format, i1:$glc,
257 i1:$slc, i1:$tfe, i1:$dlc))]>,
258 MTBUFAddr64Table<1, NAME>;
260 def _OFFEN : MTBUF_Store_Pseudo <opName, BUFAddrKind.OffEn, vdataClass>;
261 def _IDXEN : MTBUF_Store_Pseudo <opName, BUFAddrKind.IdxEn, vdataClass>;
262 def _BOTHEN : MTBUF_Store_Pseudo <opName, BUFAddrKind.BothEn, vdataClass>;
264 let DisableWQM = 1 in {
265 def _OFFSET_exact : MTBUF_Store_Pseudo <opName, BUFAddrKind.Offset, vdataClass>;
266 def _OFFEN_exact : MTBUF_Store_Pseudo <opName, BUFAddrKind.OffEn, vdataClass>;
267 def _IDXEN_exact : MTBUF_Store_Pseudo <opName, BUFAddrKind.IdxEn, vdataClass>;
268 def _BOTHEN_exact : MTBUF_Store_Pseudo <opName, BUFAddrKind.BothEn, vdataClass>;
273 //===----------------------------------------------------------------------===//
275 //===----------------------------------------------------------------------===//
277 class MUBUFGetBaseOpcode<string Op> {
278 string ret = !subst("DWORDX2", "DWORD",
279 !subst("DWORDX3", "DWORD",
280 !subst("DWORDX4", "DWORD", Op)));
283 class MUBUF_Pseudo <string opName, dag outs, dag ins,
284 string asmOps, list<dag> pattern=[]> :
285 InstSI<outs, ins, "", pattern>,
286 SIMCInstr<opName, SIEncodingFamily.NONE> {
289 let isCodeGenOnly = 1;
291 let UseNamedOperandTable = 1;
293 string Mnemonic = opName;
294 string AsmOperands = asmOps;
296 Instruction Opcode = !cast<Instruction>(NAME);
297 Instruction BaseOpcode = !cast<Instruction>(MUBUFGetBaseOpcode<NAME>.ret);
303 let hasSideEffects = 0;
304 let SchedRW = [WriteVMEM];
306 let AsmMatchConverter = "cvtMubuf";
312 bits<1> has_vdata = 1;
313 bits<1> has_vaddr = 1;
316 bits<1> glc_value = 0; // the value for glc if no such operand
317 bits<1> dlc_value = 0; // the value for dlc if no such operand
318 bits<1> has_srsrc = 1;
319 bits<1> has_soffset = 1;
320 bits<1> has_offset = 1;
323 bits<4> elements = 0;
326 class MUBUF_Real <MUBUF_Pseudo ps> :
327 InstSI <ps.OutOperandList, ps.InOperandList, ps.Mnemonic # ps.AsmOperands, []> {
330 let isCodeGenOnly = 0;
332 // copy relevant pseudo op flags
333 let SubtargetPredicate = ps.SubtargetPredicate;
334 let AsmMatchConverter = ps.AsmMatchConverter;
335 let Constraints = ps.Constraints;
336 let DisableEncoding = ps.DisableEncoding;
337 let TSFlags = ps.TSFlags;
351 // For cache invalidation instructions.
352 class MUBUF_Invalidate <string opName, SDPatternOperator node = null_frag> :
353 MUBUF_Pseudo<opName, (outs), (ins), "", [(node)]> {
355 let AsmMatchConverter = "";
357 let hasSideEffects = 1;
360 // Set everything to 0.
377 class getMUBUFInsDA<list<RegisterClass> vdataList,
378 list<RegisterClass> vaddrList=[],
380 RegisterClass vdataClass = !if(!empty(vdataList), ?, !head(vdataList));
381 RegisterClass vaddrClass = !if(!empty(vaddrList), ?, !head(vaddrList));
382 dag InsNoData = !if(!empty(vaddrList),
383 (ins SReg_128:$srsrc, SCSrc_b32:$soffset,
384 offset:$offset, GLC:$glc, SLC:$slc),
385 (ins vaddrClass:$vaddr, SReg_128:$srsrc, SCSrc_b32:$soffset,
386 offset:$offset, GLC:$glc, SLC:$slc)
388 dag InsData = !if(!empty(vaddrList),
389 (ins vdataClass:$vdata, SReg_128:$srsrc,
390 SCSrc_b32:$soffset, offset:$offset, GLC:$glc, SLC:$slc),
391 (ins vdataClass:$vdata, vaddrClass:$vaddr, SReg_128:$srsrc,
392 SCSrc_b32:$soffset, offset:$offset, GLC:$glc, SLC:$slc)
395 !if(!empty(vdataList), InsNoData, InsData),
396 !if(isLds, (ins DLC:$dlc), (ins TFE:$tfe, DLC:$dlc))
400 class getMUBUFElements<ValueType vt> {
401 // eq does not support ValueType for some reason.
402 string vtAsStr = !cast<string>(vt);
405 !if(!eq(vtAsStr, "f16"), 1,
406 !if(!eq(vtAsStr, "v2f16"), 2,
407 !if(!eq(vtAsStr, "v3f16"), 3,
408 !if(!eq(vtAsStr, "v4f16"), 4,
409 !if(!eq(vt.Size, 32), 1,
410 !if(!eq(vt.Size, 64), 2,
411 !if(!eq(vt.Size, 96), 3,
412 !if(!eq(vt.Size, 128), 4, 0)
422 class getMUBUFIns<int addrKind, list<RegisterClass> vdataList=[], bit isLds = 0> {
424 !if(!eq(addrKind, BUFAddrKind.Offset), getMUBUFInsDA<vdataList, [], isLds>.ret,
425 !if(!eq(addrKind, BUFAddrKind.OffEn), getMUBUFInsDA<vdataList, [VGPR_32], isLds>.ret,
426 !if(!eq(addrKind, BUFAddrKind.IdxEn), getMUBUFInsDA<vdataList, [VGPR_32], isLds>.ret,
427 !if(!eq(addrKind, BUFAddrKind.BothEn), getMUBUFInsDA<vdataList, [VReg_64], isLds>.ret,
428 !if(!eq(addrKind, BUFAddrKind.Addr64), getMUBUFInsDA<vdataList, [VReg_64], isLds>.ret,
432 class getMUBUFAsmOps<int addrKind> {
434 !if(!eq(addrKind, BUFAddrKind.Offset), "off, $srsrc, $soffset",
435 !if(!eq(addrKind, BUFAddrKind.OffEn), "$vaddr, $srsrc, $soffset offen",
436 !if(!eq(addrKind, BUFAddrKind.IdxEn), "$vaddr, $srsrc, $soffset idxen",
437 !if(!eq(addrKind, BUFAddrKind.BothEn), "$vaddr, $srsrc, $soffset idxen offen",
438 !if(!eq(addrKind, BUFAddrKind.Addr64), "$vaddr, $srsrc, $soffset addr64",
440 string ret = Pfx # "$offset";
443 class MUBUF_SetupAddr<int addrKind> {
444 bits<1> offen = !if(!eq(addrKind, BUFAddrKind.OffEn), 1,
445 !if(!eq(addrKind, BUFAddrKind.BothEn), 1 , 0));
447 bits<1> idxen = !if(!eq(addrKind, BUFAddrKind.IdxEn), 1,
448 !if(!eq(addrKind, BUFAddrKind.BothEn), 1 , 0));
450 bits<1> addr64 = !if(!eq(addrKind, BUFAddrKind.Addr64), 1, 0);
452 bits<1> has_vaddr = !if(!eq(addrKind, BUFAddrKind.Offset), 0, 1);
455 class MUBUF_Load_Pseudo <string opName,
460 list<dag> pattern=[],
461 // Workaround bug bz30254
462 int addrKindCopy = addrKind>
463 : MUBUF_Pseudo<opName,
464 (outs getVregSrcForVT<vdata_vt>.ret:$vdata),
465 !con(getMUBUFIns<addrKindCopy, [], isLds>.ret,
466 !if(HasTiedDest, (ins getVregSrcForVT<vdata_vt>.ret:$vdata_in), (ins))),
467 " $vdata, " # getMUBUFAsmOps<addrKindCopy>.ret # "$glc$slc" #
468 !if(isLds, " lds", "$tfe") # "$dlc",
470 MUBUF_SetupAddr<addrKindCopy> {
471 let PseudoInstr = opName # !if(isLds, "_lds", "") #
472 "_" # getAddrName<addrKindCopy>.ret;
473 let AsmMatchConverter = !if(isLds, "cvtMubufLds", "cvtMubuf");
475 let Constraints = !if(HasTiedDest, "$vdata = $vdata_in", "");
479 let Uses = !if(isLds, [EXEC, M0], [EXEC]);
480 let has_tfe = !if(isLds, 0, 1);
482 let elements = getMUBUFElements<vdata_vt>.ret;
485 class MUBUF_Offset_Load_Pat <Instruction inst, ValueType load_vt = i32, SDPatternOperator ld = null_frag> : Pat <
486 (load_vt (ld (MUBUFOffset v4i32:$srsrc, i32:$soffset, i16:$offset, i1:$glc, i1:$slc, i1:$tfe, i1:$dlc))),
487 (load_vt (inst v4i32:$srsrc, i32:$soffset, i16:$offset, i1:$glc, i1:$slc, i1:$tfe, i1:$dlc))
490 class MUBUF_Addr64_Load_Pat <Instruction inst,
491 ValueType load_vt = i32,
492 SDPatternOperator ld = null_frag> : Pat <
493 (load_vt (ld (MUBUFAddr64 v4i32:$srsrc, i64:$vaddr, i32:$soffset, i16:$offset, i1:$glc, i1:$slc, i1:$tfe, i1:$dlc))),
494 (load_vt (inst i64:$vaddr, v4i32:$srsrc, i32:$soffset, i16:$offset, i1:$glc, i1:$slc, i1:$tfe, i1:$dlc))
497 multiclass MUBUF_Pseudo_Load_Pats<string BaseInst, ValueType load_vt = i32, SDPatternOperator ld = null_frag> {
498 def : MUBUF_Offset_Load_Pat<!cast<Instruction>(BaseInst#"_OFFSET"), load_vt, ld>;
499 def : MUBUF_Addr64_Load_Pat<!cast<Instruction>(BaseInst#"_ADDR64"), load_vt, ld>;
503 // FIXME: tfe can't be an operand because it requires a separate
504 // opcode because it needs an N+1 register class dest register.
505 multiclass MUBUF_Pseudo_Loads<string opName,
506 ValueType load_vt = i32,
507 SDPatternOperator ld = null_frag,
511 def _OFFSET : MUBUF_Load_Pseudo <opName, BUFAddrKind.Offset, load_vt, TiedDest, isLds>,
512 MUBUFAddr64Table<0, NAME # !if(isLds, "_LDS", "")>;
514 def _ADDR64 : MUBUF_Load_Pseudo <opName, BUFAddrKind.Addr64, load_vt, TiedDest, isLds>,
515 MUBUFAddr64Table<1, NAME # !if(isLds, "_LDS", "")>;
517 def _OFFEN : MUBUF_Load_Pseudo <opName, BUFAddrKind.OffEn, load_vt, TiedDest, isLds>;
518 def _IDXEN : MUBUF_Load_Pseudo <opName, BUFAddrKind.IdxEn, load_vt, TiedDest, isLds>;
519 def _BOTHEN : MUBUF_Load_Pseudo <opName, BUFAddrKind.BothEn, load_vt, TiedDest, isLds>;
521 let DisableWQM = 1 in {
522 def _OFFSET_exact : MUBUF_Load_Pseudo <opName, BUFAddrKind.Offset, load_vt, TiedDest, isLds>;
523 def _OFFEN_exact : MUBUF_Load_Pseudo <opName, BUFAddrKind.OffEn, load_vt, TiedDest, isLds>;
524 def _IDXEN_exact : MUBUF_Load_Pseudo <opName, BUFAddrKind.IdxEn, load_vt, TiedDest, isLds>;
525 def _BOTHEN_exact : MUBUF_Load_Pseudo <opName, BUFAddrKind.BothEn, load_vt, TiedDest, isLds>;
529 multiclass MUBUF_Pseudo_Loads_Lds<string opName, ValueType load_vt = i32,
530 SDPatternOperator ld_nolds = null_frag,
531 SDPatternOperator ld_lds = null_frag> {
532 defm NAME : MUBUF_Pseudo_Loads<opName, load_vt, ld_nolds>;
533 defm _LDS : MUBUF_Pseudo_Loads<opName, load_vt, ld_lds, 0, 1>;
536 class MUBUF_Store_Pseudo <string opName,
539 list<dag> pattern=[],
540 // Workaround bug bz30254
541 int addrKindCopy = addrKind>
542 : MUBUF_Pseudo<opName,
544 getMUBUFIns<addrKindCopy, [getVregSrcForVT<store_vt>.ret]>.ret,
545 " $vdata, " # getMUBUFAsmOps<addrKindCopy>.ret # "$glc$slc$tfe$dlc",
547 MUBUF_SetupAddr<addrKindCopy> {
548 let PseudoInstr = opName # "_" # getAddrName<addrKindCopy>.ret;
552 let elements = getMUBUFElements<store_vt>.ret;
555 multiclass MUBUF_Pseudo_Stores<string opName,
556 ValueType store_vt = i32,
557 SDPatternOperator st = null_frag> {
559 def _OFFSET : MUBUF_Store_Pseudo <opName, BUFAddrKind.Offset, store_vt,
560 [(st store_vt:$vdata, (MUBUFOffset v4i32:$srsrc, i32:$soffset,
561 i16:$offset, i1:$glc, i1:$slc, i1:$tfe, i1:$dlc))]>,
562 MUBUFAddr64Table<0, NAME>;
564 def _ADDR64 : MUBUF_Store_Pseudo <opName, BUFAddrKind.Addr64, store_vt,
565 [(st store_vt:$vdata, (MUBUFAddr64 v4i32:$srsrc, i64:$vaddr, i32:$soffset,
566 i16:$offset, i1:$glc, i1:$slc, i1:$tfe, i1:$dlc))]>,
567 MUBUFAddr64Table<1, NAME>;
569 def _OFFEN : MUBUF_Store_Pseudo <opName, BUFAddrKind.OffEn, store_vt>;
570 def _IDXEN : MUBUF_Store_Pseudo <opName, BUFAddrKind.IdxEn, store_vt>;
571 def _BOTHEN : MUBUF_Store_Pseudo <opName, BUFAddrKind.BothEn, store_vt>;
573 let DisableWQM = 1 in {
574 def _OFFSET_exact : MUBUF_Store_Pseudo <opName, BUFAddrKind.Offset, store_vt>;
575 def _OFFEN_exact : MUBUF_Store_Pseudo <opName, BUFAddrKind.OffEn, store_vt>;
576 def _IDXEN_exact : MUBUF_Store_Pseudo <opName, BUFAddrKind.IdxEn, store_vt>;
577 def _BOTHEN_exact : MUBUF_Store_Pseudo <opName, BUFAddrKind.BothEn, store_vt>;
581 class MUBUF_Pseudo_Store_Lds<string opName>
582 : MUBUF_Pseudo<opName,
584 (ins SReg_128:$srsrc, SCSrc_b32:$soffset, offset:$offset, GLC:$glc, SLC:$slc),
585 " $srsrc, $soffset$offset lds$glc$slc"> {
595 let Uses = [EXEC, M0];
596 let AsmMatchConverter = "cvtMubufLds";
599 class getMUBUFAtomicInsDA<RegisterClass vdataClass, bit vdata_in,
600 list<RegisterClass> vaddrList=[]> {
601 RegisterClass vaddrClass = !if(!empty(vaddrList), ?, !head(vaddrList));
602 dag ret = !if(vdata_in,
603 !if(!empty(vaddrList),
604 (ins vdataClass:$vdata_in,
605 SReg_128:$srsrc, SCSrc_b32:$soffset, offset:$offset, SLC:$slc),
606 (ins vdataClass:$vdata_in, vaddrClass:$vaddr,
607 SReg_128:$srsrc, SCSrc_b32:$soffset, offset:$offset, SLC:$slc)
609 !if(!empty(vaddrList),
610 (ins vdataClass:$vdata,
611 SReg_128:$srsrc, SCSrc_b32:$soffset, offset:$offset, SLC:$slc),
612 (ins vdataClass:$vdata, vaddrClass:$vaddr,
613 SReg_128:$srsrc, SCSrc_b32:$soffset, offset:$offset, SLC:$slc)
617 class getMUBUFAtomicIns<int addrKind,
618 RegisterClass vdataClass,
620 // Workaround bug bz30254
621 RegisterClass vdataClassCopy=vdataClass> {
623 !if(!eq(addrKind, BUFAddrKind.Offset),
624 getMUBUFAtomicInsDA<vdataClassCopy, vdata_in>.ret,
625 !if(!eq(addrKind, BUFAddrKind.OffEn),
626 getMUBUFAtomicInsDA<vdataClassCopy, vdata_in, [VGPR_32]>.ret,
627 !if(!eq(addrKind, BUFAddrKind.IdxEn),
628 getMUBUFAtomicInsDA<vdataClassCopy, vdata_in, [VGPR_32]>.ret,
629 !if(!eq(addrKind, BUFAddrKind.BothEn),
630 getMUBUFAtomicInsDA<vdataClassCopy, vdata_in, [VReg_64]>.ret,
631 !if(!eq(addrKind, BUFAddrKind.Addr64),
632 getMUBUFAtomicInsDA<vdataClassCopy, vdata_in, [VReg_64]>.ret,
636 class MUBUF_Atomic_Pseudo<string opName,
641 list<dag> pattern=[],
642 // Workaround bug bz30254
643 int addrKindCopy = addrKind>
644 : MUBUF_Pseudo<opName, outs, ins, asmOps, pattern>,
645 MUBUF_SetupAddr<addrKindCopy> {
648 let hasPostISelHook = 1;
649 let hasSideEffects = 1;
657 class MUBUF_AtomicNoRet_Pseudo<string opName, int addrKind,
658 RegisterClass vdataClass,
659 list<dag> pattern=[],
660 // Workaround bug bz30254
661 int addrKindCopy = addrKind,
662 RegisterClass vdataClassCopy = vdataClass>
663 : MUBUF_Atomic_Pseudo<opName, addrKindCopy,
665 getMUBUFAtomicIns<addrKindCopy, vdataClassCopy, 0>.ret,
666 " $vdata, " # getMUBUFAsmOps<addrKindCopy>.ret # "$slc",
668 AtomicNoRet<opName # "_" # getAddrName<addrKindCopy>.ret, 0> {
669 let PseudoInstr = opName # "_" # getAddrName<addrKindCopy>.ret;
672 let AsmMatchConverter = "cvtMubufAtomic";
675 class MUBUF_AtomicRet_Pseudo<string opName, int addrKind,
676 RegisterClass vdataClass,
677 list<dag> pattern=[],
678 // Workaround bug bz30254
679 int addrKindCopy = addrKind,
680 RegisterClass vdataClassCopy = vdataClass>
681 : MUBUF_Atomic_Pseudo<opName, addrKindCopy,
682 (outs vdataClassCopy:$vdata),
683 getMUBUFAtomicIns<addrKindCopy, vdataClassCopy, 1>.ret,
684 " $vdata, " # getMUBUFAsmOps<addrKindCopy>.ret # " glc$slc",
686 AtomicNoRet<opName # "_" # getAddrName<addrKindCopy>.ret, 1> {
687 let PseudoInstr = opName # "_rtn_" # getAddrName<addrKindCopy>.ret;
690 let Constraints = "$vdata = $vdata_in";
691 let DisableEncoding = "$vdata_in";
692 let AsmMatchConverter = "cvtMubufAtomicReturn";
695 multiclass MUBUF_Pseudo_Atomics_NO_RTN <string opName,
696 RegisterClass vdataClass,
698 SDPatternOperator atomic,
699 bit isFP = getIsFP<vdataType>.ret> {
700 let FPAtomic = isFP in
701 def _OFFSET : MUBUF_AtomicNoRet_Pseudo <opName, BUFAddrKind.Offset, vdataClass>,
702 MUBUFAddr64Table <0, NAME>;
704 let FPAtomic = isFP in
705 def _ADDR64 : MUBUF_AtomicNoRet_Pseudo <opName, BUFAddrKind.Addr64, vdataClass>,
706 MUBUFAddr64Table <1, NAME>;
708 let FPAtomic = isFP in
709 def _OFFEN : MUBUF_AtomicNoRet_Pseudo <opName, BUFAddrKind.OffEn, vdataClass>;
711 let FPAtomic = isFP in
713 def _IDXEN : MUBUF_AtomicNoRet_Pseudo <opName, BUFAddrKind.IdxEn, vdataClass>;
715 let FPAtomic = isFP in
716 def _BOTHEN : MUBUF_AtomicNoRet_Pseudo <opName, BUFAddrKind.BothEn, vdataClass>;
719 multiclass MUBUF_Pseudo_Atomics_RTN <string opName,
720 RegisterClass vdataClass,
722 SDPatternOperator atomic,
723 bit isFP = getIsFP<vdataType>.ret> {
724 let FPAtomic = isFP in
725 def _OFFSET_RTN : MUBUF_AtomicRet_Pseudo <opName, BUFAddrKind.Offset, vdataClass,
726 [(set vdataType:$vdata,
727 (atomic (MUBUFOffsetAtomic v4i32:$srsrc, i32:$soffset, i16:$offset, i1:$slc),
728 vdataType:$vdata_in))]>,
729 MUBUFAddr64Table <0, NAME # "_RTN">;
731 let FPAtomic = isFP in
732 def _ADDR64_RTN : MUBUF_AtomicRet_Pseudo <opName, BUFAddrKind.Addr64, vdataClass,
733 [(set vdataType:$vdata,
734 (atomic (MUBUFAddr64Atomic v4i32:$srsrc, i64:$vaddr, i32:$soffset, i16:$offset, i1:$slc),
735 vdataType:$vdata_in))]>,
736 MUBUFAddr64Table <1, NAME # "_RTN">;
738 let FPAtomic = isFP in
739 def _OFFEN_RTN : MUBUF_AtomicRet_Pseudo <opName, BUFAddrKind.OffEn, vdataClass>;
741 let FPAtomic = isFP in
742 def _IDXEN_RTN : MUBUF_AtomicRet_Pseudo <opName, BUFAddrKind.IdxEn, vdataClass>;
744 let FPAtomic = isFP in
745 def _BOTHEN_RTN : MUBUF_AtomicRet_Pseudo <opName, BUFAddrKind.BothEn, vdataClass>;
748 multiclass MUBUF_Pseudo_Atomics <string opName,
749 RegisterClass vdataClass,
751 SDPatternOperator atomic> :
752 MUBUF_Pseudo_Atomics_NO_RTN<opName, vdataClass, vdataType, atomic>,
753 MUBUF_Pseudo_Atomics_RTN<opName, vdataClass, vdataType, atomic>;
756 //===----------------------------------------------------------------------===//
757 // MUBUF Instructions
758 //===----------------------------------------------------------------------===//
760 defm BUFFER_LOAD_FORMAT_X : MUBUF_Pseudo_Loads_Lds <
761 "buffer_load_format_x", f32
763 defm BUFFER_LOAD_FORMAT_XY : MUBUF_Pseudo_Loads <
764 "buffer_load_format_xy", v2f32
766 defm BUFFER_LOAD_FORMAT_XYZ : MUBUF_Pseudo_Loads <
767 "buffer_load_format_xyz", v3f32
769 defm BUFFER_LOAD_FORMAT_XYZW : MUBUF_Pseudo_Loads <
770 "buffer_load_format_xyzw", v4f32
772 defm BUFFER_STORE_FORMAT_X : MUBUF_Pseudo_Stores <
773 "buffer_store_format_x", f32
775 defm BUFFER_STORE_FORMAT_XY : MUBUF_Pseudo_Stores <
776 "buffer_store_format_xy", v2f32
778 defm BUFFER_STORE_FORMAT_XYZ : MUBUF_Pseudo_Stores <
779 "buffer_store_format_xyz", v3f32
781 defm BUFFER_STORE_FORMAT_XYZW : MUBUF_Pseudo_Stores <
782 "buffer_store_format_xyzw", v4f32
785 let SubtargetPredicate = HasUnpackedD16VMem, D16Buf = 1 in {
786 defm BUFFER_LOAD_FORMAT_D16_X_gfx80 : MUBUF_Pseudo_Loads <
787 "buffer_load_format_d16_x", i32
789 defm BUFFER_LOAD_FORMAT_D16_XY_gfx80 : MUBUF_Pseudo_Loads <
790 "buffer_load_format_d16_xy", v2i32
792 defm BUFFER_LOAD_FORMAT_D16_XYZ_gfx80 : MUBUF_Pseudo_Loads <
793 "buffer_load_format_d16_xyz", v3i32
795 defm BUFFER_LOAD_FORMAT_D16_XYZW_gfx80 : MUBUF_Pseudo_Loads <
796 "buffer_load_format_d16_xyzw", v4i32
798 defm BUFFER_STORE_FORMAT_D16_X_gfx80 : MUBUF_Pseudo_Stores <
799 "buffer_store_format_d16_x", i32
801 defm BUFFER_STORE_FORMAT_D16_XY_gfx80 : MUBUF_Pseudo_Stores <
802 "buffer_store_format_d16_xy", v2i32
804 defm BUFFER_STORE_FORMAT_D16_XYZ_gfx80 : MUBUF_Pseudo_Stores <
805 "buffer_store_format_d16_xyz", v3i32
807 defm BUFFER_STORE_FORMAT_D16_XYZW_gfx80 : MUBUF_Pseudo_Stores <
808 "buffer_store_format_d16_xyzw", v4i32
810 } // End HasUnpackedD16VMem.
812 let SubtargetPredicate = HasPackedD16VMem, D16Buf = 1 in {
813 defm BUFFER_LOAD_FORMAT_D16_X : MUBUF_Pseudo_Loads <
814 "buffer_load_format_d16_x", f16
816 defm BUFFER_LOAD_FORMAT_D16_XY : MUBUF_Pseudo_Loads <
817 "buffer_load_format_d16_xy", v2f16
819 defm BUFFER_LOAD_FORMAT_D16_XYZ : MUBUF_Pseudo_Loads <
820 "buffer_load_format_d16_xyz", v3f16
822 defm BUFFER_LOAD_FORMAT_D16_XYZW : MUBUF_Pseudo_Loads <
823 "buffer_load_format_d16_xyzw", v4f16
825 defm BUFFER_STORE_FORMAT_D16_X : MUBUF_Pseudo_Stores <
826 "buffer_store_format_d16_x", f16
828 defm BUFFER_STORE_FORMAT_D16_XY : MUBUF_Pseudo_Stores <
829 "buffer_store_format_d16_xy", v2f16
831 defm BUFFER_STORE_FORMAT_D16_XYZ : MUBUF_Pseudo_Stores <
832 "buffer_store_format_d16_xyz", v3f16
834 defm BUFFER_STORE_FORMAT_D16_XYZW : MUBUF_Pseudo_Stores <
835 "buffer_store_format_d16_xyzw", v4f16
837 } // End HasPackedD16VMem.
839 defm BUFFER_LOAD_UBYTE : MUBUF_Pseudo_Loads_Lds <
840 "buffer_load_ubyte", i32
842 defm BUFFER_LOAD_SBYTE : MUBUF_Pseudo_Loads_Lds <
843 "buffer_load_sbyte", i32
845 defm BUFFER_LOAD_USHORT : MUBUF_Pseudo_Loads_Lds <
846 "buffer_load_ushort", i32
848 defm BUFFER_LOAD_SSHORT : MUBUF_Pseudo_Loads_Lds <
849 "buffer_load_sshort", i32
851 defm BUFFER_LOAD_DWORD : MUBUF_Pseudo_Loads_Lds <
852 "buffer_load_dword", i32
854 defm BUFFER_LOAD_DWORDX2 : MUBUF_Pseudo_Loads <
855 "buffer_load_dwordx2", v2i32
857 defm BUFFER_LOAD_DWORDX3 : MUBUF_Pseudo_Loads <
858 "buffer_load_dwordx3", v3i32
860 defm BUFFER_LOAD_DWORDX4 : MUBUF_Pseudo_Loads <
861 "buffer_load_dwordx4", v4i32
864 defm : MUBUF_Pseudo_Load_Pats<"BUFFER_LOAD_UBYTE", i32, extloadi8_global>;
865 defm : MUBUF_Pseudo_Load_Pats<"BUFFER_LOAD_UBYTE", i32, zextloadi8_global>;
866 defm : MUBUF_Pseudo_Load_Pats<"BUFFER_LOAD_SBYTE", i32, sextloadi8_global>;
867 defm : MUBUF_Pseudo_Load_Pats<"BUFFER_LOAD_USHORT", i32, extloadi16_global>;
868 defm : MUBUF_Pseudo_Load_Pats<"BUFFER_LOAD_USHORT", i32, zextloadi16_global>;
869 defm : MUBUF_Pseudo_Load_Pats<"BUFFER_LOAD_SSHORT", i32, sextloadi16_global>;
870 defm : MUBUF_Pseudo_Load_Pats<"BUFFER_LOAD_DWORD", i32, load_global>;
871 defm : MUBUF_Pseudo_Load_Pats<"BUFFER_LOAD_DWORDX2", v2i32, load_global>;
872 defm : MUBUF_Pseudo_Load_Pats<"BUFFER_LOAD_DWORDX3", v3i32, load_global>;
873 defm : MUBUF_Pseudo_Load_Pats<"BUFFER_LOAD_DWORDX4", v4i32, load_global>;
875 // This is not described in AMD documentation,
876 // but 'lds' versions of these opcodes are available
877 // in at least GFX8+ chips. See Bug 37653.
878 let SubtargetPredicate = isGFX8GFX9 in {
879 defm BUFFER_LOAD_DWORDX2_LDS : MUBUF_Pseudo_Loads <
880 "buffer_load_dwordx2", v2i32, null_frag, 0, 1
882 defm BUFFER_LOAD_DWORDX3_LDS : MUBUF_Pseudo_Loads <
883 "buffer_load_dwordx3", v3i32, null_frag, 0, 1
885 defm BUFFER_LOAD_DWORDX4_LDS : MUBUF_Pseudo_Loads <
886 "buffer_load_dwordx4", v4i32, null_frag, 0, 1
890 defm BUFFER_STORE_BYTE : MUBUF_Pseudo_Stores <
891 "buffer_store_byte", i32, truncstorei8_global
893 defm BUFFER_STORE_SHORT : MUBUF_Pseudo_Stores <
894 "buffer_store_short", i32, truncstorei16_global
896 defm BUFFER_STORE_DWORD : MUBUF_Pseudo_Stores <
897 "buffer_store_dword", i32, store_global
899 defm BUFFER_STORE_DWORDX2 : MUBUF_Pseudo_Stores <
900 "buffer_store_dwordx2", v2i32, store_global
902 defm BUFFER_STORE_DWORDX3 : MUBUF_Pseudo_Stores <
903 "buffer_store_dwordx3", v3i32, store_global
905 defm BUFFER_STORE_DWORDX4 : MUBUF_Pseudo_Stores <
906 "buffer_store_dwordx4", v4i32, store_global
908 defm BUFFER_ATOMIC_SWAP : MUBUF_Pseudo_Atomics <
909 "buffer_atomic_swap", VGPR_32, i32, atomic_swap_global_32
911 defm BUFFER_ATOMIC_CMPSWAP : MUBUF_Pseudo_Atomics <
912 "buffer_atomic_cmpswap", VReg_64, v2i32, null_frag
914 defm BUFFER_ATOMIC_ADD : MUBUF_Pseudo_Atomics <
915 "buffer_atomic_add", VGPR_32, i32, atomic_load_add_global_32
917 defm BUFFER_ATOMIC_SUB : MUBUF_Pseudo_Atomics <
918 "buffer_atomic_sub", VGPR_32, i32, atomic_load_sub_global_32
920 defm BUFFER_ATOMIC_SMIN : MUBUF_Pseudo_Atomics <
921 "buffer_atomic_smin", VGPR_32, i32, atomic_load_min_global_32
923 defm BUFFER_ATOMIC_UMIN : MUBUF_Pseudo_Atomics <
924 "buffer_atomic_umin", VGPR_32, i32, atomic_load_umin_global_32
926 defm BUFFER_ATOMIC_SMAX : MUBUF_Pseudo_Atomics <
927 "buffer_atomic_smax", VGPR_32, i32, atomic_load_max_global_32
929 defm BUFFER_ATOMIC_UMAX : MUBUF_Pseudo_Atomics <
930 "buffer_atomic_umax", VGPR_32, i32, atomic_load_umax_global_32
932 defm BUFFER_ATOMIC_AND : MUBUF_Pseudo_Atomics <
933 "buffer_atomic_and", VGPR_32, i32, atomic_load_and_global_32
935 defm BUFFER_ATOMIC_OR : MUBUF_Pseudo_Atomics <
936 "buffer_atomic_or", VGPR_32, i32, atomic_load_or_global_32
938 defm BUFFER_ATOMIC_XOR : MUBUF_Pseudo_Atomics <
939 "buffer_atomic_xor", VGPR_32, i32, atomic_load_xor_global_32
941 defm BUFFER_ATOMIC_INC : MUBUF_Pseudo_Atomics <
942 "buffer_atomic_inc", VGPR_32, i32, atomic_inc_global_32
944 defm BUFFER_ATOMIC_DEC : MUBUF_Pseudo_Atomics <
945 "buffer_atomic_dec", VGPR_32, i32, atomic_dec_global_32
947 defm BUFFER_ATOMIC_SWAP_X2 : MUBUF_Pseudo_Atomics <
948 "buffer_atomic_swap_x2", VReg_64, i64, atomic_swap_global_64
950 defm BUFFER_ATOMIC_CMPSWAP_X2 : MUBUF_Pseudo_Atomics <
951 "buffer_atomic_cmpswap_x2", VReg_128, v2i64, null_frag
953 defm BUFFER_ATOMIC_ADD_X2 : MUBUF_Pseudo_Atomics <
954 "buffer_atomic_add_x2", VReg_64, i64, atomic_load_add_global_64
956 defm BUFFER_ATOMIC_SUB_X2 : MUBUF_Pseudo_Atomics <
957 "buffer_atomic_sub_x2", VReg_64, i64, atomic_load_sub_global_64
959 defm BUFFER_ATOMIC_SMIN_X2 : MUBUF_Pseudo_Atomics <
960 "buffer_atomic_smin_x2", VReg_64, i64, atomic_load_min_global_64
962 defm BUFFER_ATOMIC_UMIN_X2 : MUBUF_Pseudo_Atomics <
963 "buffer_atomic_umin_x2", VReg_64, i64, atomic_load_umin_global_64
965 defm BUFFER_ATOMIC_SMAX_X2 : MUBUF_Pseudo_Atomics <
966 "buffer_atomic_smax_x2", VReg_64, i64, atomic_load_max_global_64
968 defm BUFFER_ATOMIC_UMAX_X2 : MUBUF_Pseudo_Atomics <
969 "buffer_atomic_umax_x2", VReg_64, i64, atomic_load_umax_global_64
971 defm BUFFER_ATOMIC_AND_X2 : MUBUF_Pseudo_Atomics <
972 "buffer_atomic_and_x2", VReg_64, i64, atomic_load_and_global_64
974 defm BUFFER_ATOMIC_OR_X2 : MUBUF_Pseudo_Atomics <
975 "buffer_atomic_or_x2", VReg_64, i64, atomic_load_or_global_64
977 defm BUFFER_ATOMIC_XOR_X2 : MUBUF_Pseudo_Atomics <
978 "buffer_atomic_xor_x2", VReg_64, i64, atomic_load_xor_global_64
980 defm BUFFER_ATOMIC_INC_X2 : MUBUF_Pseudo_Atomics <
981 "buffer_atomic_inc_x2", VReg_64, i64, atomic_inc_global_64
983 defm BUFFER_ATOMIC_DEC_X2 : MUBUF_Pseudo_Atomics <
984 "buffer_atomic_dec_x2", VReg_64, i64, atomic_dec_global_64
987 let SubtargetPredicate = isGFX8GFX9 in {
988 def BUFFER_STORE_LDS_DWORD : MUBUF_Pseudo_Store_Lds <"buffer_store_lds_dword">;
991 let SubtargetPredicate = isGFX6 in { // isn't on CI & VI
993 defm BUFFER_ATOMIC_RSUB : MUBUF_Pseudo_Atomics <"buffer_atomic_rsub">;
994 defm BUFFER_ATOMIC_FCMPSWAP : MUBUF_Pseudo_Atomics <"buffer_atomic_fcmpswap">;
995 defm BUFFER_ATOMIC_FMIN : MUBUF_Pseudo_Atomics <"buffer_atomic_fmin">;
996 defm BUFFER_ATOMIC_FMAX : MUBUF_Pseudo_Atomics <"buffer_atomic_fmax">;
997 defm BUFFER_ATOMIC_RSUB_X2 : MUBUF_Pseudo_Atomics <"buffer_atomic_rsub_x2">;
998 defm BUFFER_ATOMIC_FCMPSWAP_X2 : MUBUF_Pseudo_Atomics <"buffer_atomic_fcmpswap_x2">;
999 defm BUFFER_ATOMIC_FMIN_X2 : MUBUF_Pseudo_Atomics <"buffer_atomic_fmin_x2">;
1000 defm BUFFER_ATOMIC_FMAX_X2 : MUBUF_Pseudo_Atomics <"buffer_atomic_fmax_x2">;
1003 def BUFFER_WBINVL1_SC : MUBUF_Invalidate <"buffer_wbinvl1_sc",
1004 int_amdgcn_buffer_wbinvl1_sc>;
1007 let SubtargetPredicate = HasD16LoadStore in {
1009 defm BUFFER_LOAD_UBYTE_D16 : MUBUF_Pseudo_Loads <
1010 "buffer_load_ubyte_d16", i32, null_frag, 1
1013 defm BUFFER_LOAD_UBYTE_D16_HI : MUBUF_Pseudo_Loads <
1014 "buffer_load_ubyte_d16_hi", i32, null_frag, 1
1017 defm BUFFER_LOAD_SBYTE_D16 : MUBUF_Pseudo_Loads <
1018 "buffer_load_sbyte_d16", i32, null_frag, 1
1021 defm BUFFER_LOAD_SBYTE_D16_HI : MUBUF_Pseudo_Loads <
1022 "buffer_load_sbyte_d16_hi", i32, null_frag, 1
1025 defm BUFFER_LOAD_SHORT_D16 : MUBUF_Pseudo_Loads <
1026 "buffer_load_short_d16", i32, null_frag, 1
1029 defm BUFFER_LOAD_SHORT_D16_HI : MUBUF_Pseudo_Loads <
1030 "buffer_load_short_d16_hi", i32, null_frag, 1
1033 defm BUFFER_STORE_BYTE_D16_HI : MUBUF_Pseudo_Stores <
1034 "buffer_store_byte_d16_hi", i32
1037 defm BUFFER_STORE_SHORT_D16_HI : MUBUF_Pseudo_Stores <
1038 "buffer_store_short_d16_hi", i32
1041 defm BUFFER_LOAD_FORMAT_D16_HI_X : MUBUF_Pseudo_Loads <
1042 "buffer_load_format_d16_hi_x", i32
1044 defm BUFFER_STORE_FORMAT_D16_HI_X : MUBUF_Pseudo_Stores <
1045 "buffer_store_format_d16_hi_x", i32
1048 } // End HasD16LoadStore
1050 def BUFFER_WBINVL1 : MUBUF_Invalidate <"buffer_wbinvl1",
1051 int_amdgcn_buffer_wbinvl1>;
1053 let SubtargetPredicate = HasAtomicFaddInsts in {
1055 defm BUFFER_ATOMIC_ADD_F32 : MUBUF_Pseudo_Atomics_NO_RTN <
1056 "buffer_atomic_add_f32", VGPR_32, f32, atomic_fadd_global_noret
1058 defm BUFFER_ATOMIC_PK_ADD_F16 : MUBUF_Pseudo_Atomics_NO_RTN <
1059 "buffer_atomic_pk_add_f16", VGPR_32, v2f16, atomic_pk_fadd_global_noret
1062 } // End SubtargetPredicate = HasAtomicFaddInsts
1064 //===----------------------------------------------------------------------===//
1065 // MTBUF Instructions
1066 //===----------------------------------------------------------------------===//
1068 defm TBUFFER_LOAD_FORMAT_X : MTBUF_Pseudo_Loads <"tbuffer_load_format_x", VGPR_32>;
1069 defm TBUFFER_LOAD_FORMAT_XY : MTBUF_Pseudo_Loads <"tbuffer_load_format_xy", VReg_64>;
1070 defm TBUFFER_LOAD_FORMAT_XYZ : MTBUF_Pseudo_Loads <"tbuffer_load_format_xyz", VReg_96>;
1071 defm TBUFFER_LOAD_FORMAT_XYZW : MTBUF_Pseudo_Loads <"tbuffer_load_format_xyzw", VReg_128>;
1072 defm TBUFFER_STORE_FORMAT_X : MTBUF_Pseudo_Stores <"tbuffer_store_format_x", VGPR_32>;
1073 defm TBUFFER_STORE_FORMAT_XY : MTBUF_Pseudo_Stores <"tbuffer_store_format_xy", VReg_64>;
1074 defm TBUFFER_STORE_FORMAT_XYZ : MTBUF_Pseudo_Stores <"tbuffer_store_format_xyz", VReg_96>;
1075 defm TBUFFER_STORE_FORMAT_XYZW : MTBUF_Pseudo_Stores <"tbuffer_store_format_xyzw", VReg_128>;
1077 let SubtargetPredicate = HasUnpackedD16VMem, D16Buf = 1 in {
1078 defm TBUFFER_LOAD_FORMAT_D16_X_gfx80 : MTBUF_Pseudo_Loads <"tbuffer_load_format_d16_x", VGPR_32>;
1079 defm TBUFFER_LOAD_FORMAT_D16_XY_gfx80 : MTBUF_Pseudo_Loads <"tbuffer_load_format_d16_xy", VReg_64>;
1080 defm TBUFFER_LOAD_FORMAT_D16_XYZ_gfx80 : MTBUF_Pseudo_Loads <"tbuffer_load_format_d16_xyz", VReg_96>;
1081 defm TBUFFER_LOAD_FORMAT_D16_XYZW_gfx80 : MTBUF_Pseudo_Loads <"tbuffer_load_format_d16_xyzw", VReg_128>;
1082 defm TBUFFER_STORE_FORMAT_D16_X_gfx80 : MTBUF_Pseudo_Stores <"tbuffer_store_format_d16_x", VGPR_32>;
1083 defm TBUFFER_STORE_FORMAT_D16_XY_gfx80 : MTBUF_Pseudo_Stores <"tbuffer_store_format_d16_xy", VReg_64>;
1084 defm TBUFFER_STORE_FORMAT_D16_XYZ_gfx80 : MTBUF_Pseudo_Stores <"tbuffer_store_format_d16_xyz", VReg_96>;
1085 defm TBUFFER_STORE_FORMAT_D16_XYZW_gfx80 : MTBUF_Pseudo_Stores <"tbuffer_store_format_d16_xyzw", VReg_128>;
1086 } // End HasUnpackedD16VMem.
1088 let SubtargetPredicate = HasPackedD16VMem, D16Buf = 1 in {
1089 defm TBUFFER_LOAD_FORMAT_D16_X : MTBUF_Pseudo_Loads <"tbuffer_load_format_d16_x", VGPR_32>;
1090 defm TBUFFER_LOAD_FORMAT_D16_XY : MTBUF_Pseudo_Loads <"tbuffer_load_format_d16_xy", VGPR_32>;
1091 defm TBUFFER_LOAD_FORMAT_D16_XYZ : MTBUF_Pseudo_Loads <"tbuffer_load_format_d16_xyz", VReg_64>;
1092 defm TBUFFER_LOAD_FORMAT_D16_XYZW : MTBUF_Pseudo_Loads <"tbuffer_load_format_d16_xyzw", VReg_64>;
1093 defm TBUFFER_STORE_FORMAT_D16_X : MTBUF_Pseudo_Stores <"tbuffer_store_format_d16_x", VGPR_32>;
1094 defm TBUFFER_STORE_FORMAT_D16_XY : MTBUF_Pseudo_Stores <"tbuffer_store_format_d16_xy", VGPR_32>;
1095 defm TBUFFER_STORE_FORMAT_D16_XYZ : MTBUF_Pseudo_Stores <"tbuffer_store_format_d16_xyz", VReg_64>;
1096 defm TBUFFER_STORE_FORMAT_D16_XYZW : MTBUF_Pseudo_Stores <"tbuffer_store_format_d16_xyzw", VReg_64>;
1097 } // End HasPackedD16VMem.
1099 let SubtargetPredicate = isGFX7Plus in {
1101 //===----------------------------------------------------------------------===//
1102 // Instruction definitions for CI and newer.
1103 //===----------------------------------------------------------------------===//
1105 def BUFFER_WBINVL1_VOL : MUBUF_Invalidate <"buffer_wbinvl1_vol",
1106 int_amdgcn_buffer_wbinvl1_vol>;
1108 } // End let SubtargetPredicate = isGFX7Plus
1110 let SubtargetPredicate = isGFX10Plus in {
1111 def BUFFER_GL0_INV : MUBUF_Invalidate<"buffer_gl0_inv">;
1112 def BUFFER_GL1_INV : MUBUF_Invalidate<"buffer_gl1_inv">;
1113 } // End SubtargetPredicate = isGFX10Plus
1115 //===----------------------------------------------------------------------===//
1117 //===----------------------------------------------------------------------===//
1119 def extract_glc : SDNodeXForm<imm, [{
1120 return CurDAG->getTargetConstant(N->getZExtValue() & 1, SDLoc(N), MVT::i8);
1123 def extract_slc : SDNodeXForm<imm, [{
1124 return CurDAG->getTargetConstant((N->getZExtValue() >> 1) & 1, SDLoc(N), MVT::i8);
1127 def extract_dlc : SDNodeXForm<imm, [{
1128 return CurDAG->getTargetConstant((N->getZExtValue() >> 2) & 1, SDLoc(N), MVT::i8);
1131 //===----------------------------------------------------------------------===//
1132 // buffer_load/store_format patterns
1133 //===----------------------------------------------------------------------===//
1135 multiclass MUBUF_LoadIntrinsicPat<SDPatternOperator name, ValueType vt,
1138 (vt (name v4i32:$rsrc, 0, 0, i32:$soffset, imm:$offset,
1139 imm:$cachepolicy, 0)),
1140 (!cast<MUBUF_Pseudo>(opcode # _OFFSET) $rsrc, $soffset, (as_i16imm $offset),
1141 (extract_glc $cachepolicy), (extract_slc $cachepolicy), 0, (extract_dlc $cachepolicy))
1145 (vt (name v4i32:$rsrc, 0, i32:$voffset, i32:$soffset, imm:$offset,
1146 imm:$cachepolicy, 0)),
1147 (!cast<MUBUF_Pseudo>(opcode # _OFFEN) $voffset, $rsrc, $soffset, (as_i16imm $offset),
1148 (extract_glc $cachepolicy), (extract_slc $cachepolicy), 0, (extract_dlc $cachepolicy))
1152 (vt (name v4i32:$rsrc, i32:$vindex, 0, i32:$soffset, imm:$offset,
1153 imm:$cachepolicy, imm)),
1154 (!cast<MUBUF_Pseudo>(opcode # _IDXEN) $vindex, $rsrc, $soffset, (as_i16imm $offset),
1155 (extract_glc $cachepolicy), (extract_slc $cachepolicy), 0, (extract_dlc $cachepolicy))
1159 (vt (name v4i32:$rsrc, i32:$vindex, i32:$voffset, i32:$soffset, imm:$offset,
1160 imm:$cachepolicy, imm)),
1161 (!cast<MUBUF_Pseudo>(opcode # _BOTHEN)
1162 (REG_SEQUENCE VReg_64, $vindex, sub0, $voffset, sub1),
1163 $rsrc, $soffset, (as_i16imm $offset),
1164 (extract_glc $cachepolicy), (extract_slc $cachepolicy), 0, (extract_dlc $cachepolicy))
1168 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load_format, f32, "BUFFER_LOAD_FORMAT_X">;
1169 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load_format, i32, "BUFFER_LOAD_FORMAT_X">;
1170 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load_format, v2f32, "BUFFER_LOAD_FORMAT_XY">;
1171 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load_format, v2i32, "BUFFER_LOAD_FORMAT_XY">;
1172 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load_format, v3f32, "BUFFER_LOAD_FORMAT_XYZ">;
1173 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load_format, v3i32, "BUFFER_LOAD_FORMAT_XYZ">;
1174 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load_format, v4f32, "BUFFER_LOAD_FORMAT_XYZW">;
1175 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load_format, v4i32, "BUFFER_LOAD_FORMAT_XYZW">;
1177 let SubtargetPredicate = HasUnpackedD16VMem in {
1178 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load_format_d16, f16, "BUFFER_LOAD_FORMAT_D16_X_gfx80">;
1179 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load_format_d16, i16, "BUFFER_LOAD_FORMAT_D16_X_gfx80">;
1180 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load_format_d16, v2i32, "BUFFER_LOAD_FORMAT_D16_XY_gfx80">;
1181 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load_format_d16, v4i32, "BUFFER_LOAD_FORMAT_D16_XYZW_gfx80">;
1182 } // End HasUnpackedD16VMem.
1184 let SubtargetPredicate = HasPackedD16VMem in {
1185 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load_format_d16, f16, "BUFFER_LOAD_FORMAT_D16_X">;
1186 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load_format_d16, i16, "BUFFER_LOAD_FORMAT_D16_X">;
1187 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load_format_d16, v2f16, "BUFFER_LOAD_FORMAT_D16_XY">;
1188 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load_format_d16, v2i16, "BUFFER_LOAD_FORMAT_D16_XY">;
1189 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load_format_d16, v4f16, "BUFFER_LOAD_FORMAT_D16_XYZW">;
1190 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load_format_d16, v4i16, "BUFFER_LOAD_FORMAT_D16_XYZW">;
1191 } // End HasPackedD16VMem.
1193 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load, f32, "BUFFER_LOAD_DWORD">;
1194 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load, i32, "BUFFER_LOAD_DWORD">;
1195 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load, v2i16, "BUFFER_LOAD_DWORD">;
1196 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load, v2f16, "BUFFER_LOAD_DWORD">;
1197 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load, v2f32, "BUFFER_LOAD_DWORDX2">;
1198 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load, v2i32, "BUFFER_LOAD_DWORDX2">;
1199 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load, v4i16, "BUFFER_LOAD_DWORDX2">;
1200 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load, v4f16, "BUFFER_LOAD_DWORDX2">;
1201 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load, v3f32, "BUFFER_LOAD_DWORDX3">;
1202 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load, v3i32, "BUFFER_LOAD_DWORDX3">;
1203 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load, v4f32, "BUFFER_LOAD_DWORDX4">;
1204 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load, v4i32, "BUFFER_LOAD_DWORDX4">;
1205 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load_byte, i32, "BUFFER_LOAD_SBYTE">;
1206 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load_short, i32, "BUFFER_LOAD_SSHORT">;
1207 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load_ubyte, i32, "BUFFER_LOAD_UBYTE">;
1208 defm : MUBUF_LoadIntrinsicPat<SIbuffer_load_ushort, i32, "BUFFER_LOAD_USHORT">;
1210 multiclass MUBUF_StoreIntrinsicPat<SDPatternOperator name, ValueType vt,
1213 (name vt:$vdata, v4i32:$rsrc, 0, 0, i32:$soffset, imm:$offset,
1214 imm:$cachepolicy, 0),
1215 (!cast<MUBUF_Pseudo>(opcode # _OFFSET_exact) $vdata, $rsrc, $soffset, (as_i16imm $offset),
1216 (extract_glc $cachepolicy), (extract_slc $cachepolicy), 0, (extract_dlc $cachepolicy))
1220 (name vt:$vdata, v4i32:$rsrc, 0, i32:$voffset, i32:$soffset, imm:$offset,
1221 imm:$cachepolicy, 0),
1222 (!cast<MUBUF_Pseudo>(opcode # _OFFEN_exact) $vdata, $voffset, $rsrc, $soffset,
1223 (as_i16imm $offset), (extract_glc $cachepolicy),
1224 (extract_slc $cachepolicy), 0, (extract_dlc $cachepolicy))
1228 (name vt:$vdata, v4i32:$rsrc, i32:$vindex, 0, i32:$soffset, imm:$offset,
1229 imm:$cachepolicy, imm),
1230 (!cast<MUBUF_Pseudo>(opcode # _IDXEN_exact) $vdata, $vindex, $rsrc, $soffset,
1231 (as_i16imm $offset), (extract_glc $cachepolicy),
1232 (extract_slc $cachepolicy), 0, (extract_dlc $cachepolicy))
1236 (name vt:$vdata, v4i32:$rsrc, i32:$vindex, i32:$voffset, i32:$soffset, imm:$offset,
1237 imm:$cachepolicy, imm),
1238 (!cast<MUBUF_Pseudo>(opcode # _BOTHEN_exact)
1240 (REG_SEQUENCE VReg_64, $vindex, sub0, $voffset, sub1),
1241 $rsrc, $soffset, (as_i16imm $offset), (extract_glc $cachepolicy),
1242 (extract_slc $cachepolicy), 0, (extract_dlc $cachepolicy))
1246 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store_format, f32, "BUFFER_STORE_FORMAT_X">;
1247 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store_format, i32, "BUFFER_STORE_FORMAT_X">;
1248 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store_format, v2f32, "BUFFER_STORE_FORMAT_XY">;
1249 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store_format, v2i32, "BUFFER_STORE_FORMAT_XY">;
1250 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store_format, v3f32, "BUFFER_STORE_FORMAT_XYZ">;
1251 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store_format, v3i32, "BUFFER_STORE_FORMAT_XYZ">;
1252 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store_format, v4f32, "BUFFER_STORE_FORMAT_XYZW">;
1253 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store_format, v4i32, "BUFFER_STORE_FORMAT_XYZW">;
1255 let SubtargetPredicate = HasUnpackedD16VMem in {
1256 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store_format_d16, f16, "BUFFER_STORE_FORMAT_D16_X_gfx80">;
1257 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store_format_d16, i16, "BUFFER_STORE_FORMAT_D16_X_gfx80">;
1258 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store_format_d16, v2i32, "BUFFER_STORE_FORMAT_D16_XY_gfx80">;
1259 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store_format_d16, v4i32, "BUFFER_STORE_FORMAT_D16_XYZW_gfx80">;
1260 } // End HasUnpackedD16VMem.
1262 let SubtargetPredicate = HasPackedD16VMem in {
1263 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store_format_d16, f16, "BUFFER_STORE_FORMAT_D16_X">;
1264 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store_format_d16, i16, "BUFFER_STORE_FORMAT_D16_X">;
1265 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store_format_d16, v2f16, "BUFFER_STORE_FORMAT_D16_XY">;
1266 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store_format_d16, v2i16, "BUFFER_STORE_FORMAT_D16_XY">;
1267 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store_format_d16, v4f16, "BUFFER_STORE_FORMAT_D16_XYZW">;
1268 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store_format_d16, v4i16, "BUFFER_STORE_FORMAT_D16_XYZW">;
1269 } // End HasPackedD16VMem.
1271 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store, f32, "BUFFER_STORE_DWORD">;
1272 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store, i32, "BUFFER_STORE_DWORD">;
1273 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store, v2i16, "BUFFER_STORE_DWORD">;
1274 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store, v2f16, "BUFFER_STORE_DWORD">;
1275 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store, v2f32, "BUFFER_STORE_DWORDX2">;
1276 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store, v2i32, "BUFFER_STORE_DWORDX2">;
1277 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store, v4i16, "BUFFER_STORE_DWORDX2">;
1278 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store, v4f16, "BUFFER_STORE_DWORDX2">;
1279 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store, v3f32, "BUFFER_STORE_DWORDX3">;
1280 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store, v3i32, "BUFFER_STORE_DWORDX3">;
1281 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store, v4f32, "BUFFER_STORE_DWORDX4">;
1282 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store, v4i32, "BUFFER_STORE_DWORDX4">;
1283 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store_byte, i32, "BUFFER_STORE_BYTE">;
1284 defm : MUBUF_StoreIntrinsicPat<SIbuffer_store_short, i32, "BUFFER_STORE_SHORT">;
1286 //===----------------------------------------------------------------------===//
1287 // buffer_atomic patterns
1288 //===----------------------------------------------------------------------===//
1290 multiclass BufferAtomicPatterns<SDPatternOperator name, ValueType vt,
1293 (vt (name vt:$vdata_in, v4i32:$rsrc, 0,
1294 0, i32:$soffset, imm:$offset,
1295 imm:$cachepolicy, 0)),
1296 (!cast<MUBUF_Pseudo>(opcode # _OFFSET_RTN) $vdata_in, $rsrc, $soffset,
1297 (as_i16imm $offset), (extract_slc $cachepolicy))
1301 (vt (name vt:$vdata_in, v4i32:$rsrc, i32:$vindex,
1302 0, i32:$soffset, imm:$offset,
1303 imm:$cachepolicy, imm)),
1304 (!cast<MUBUF_Pseudo>(opcode # _IDXEN_RTN) $vdata_in, $vindex, $rsrc, $soffset,
1305 (as_i16imm $offset), (extract_slc $cachepolicy))
1309 (vt (name vt:$vdata_in, v4i32:$rsrc, 0,
1310 i32:$voffset, i32:$soffset, imm:$offset,
1311 imm:$cachepolicy, 0)),
1312 (!cast<MUBUF_Pseudo>(opcode # _OFFEN_RTN) $vdata_in, $voffset, $rsrc, $soffset,
1313 (as_i16imm $offset), (extract_slc $cachepolicy))
1317 (vt (name vt:$vdata_in, v4i32:$rsrc, i32:$vindex,
1318 i32:$voffset, i32:$soffset, imm:$offset,
1319 imm:$cachepolicy, imm)),
1320 (!cast<MUBUF_Pseudo>(opcode # _BOTHEN_RTN)
1322 (REG_SEQUENCE VReg_64, $vindex, sub0, $voffset, sub1),
1323 $rsrc, $soffset, (as_i16imm $offset), (extract_slc $cachepolicy))
1327 defm : BufferAtomicPatterns<SIbuffer_atomic_swap, i32, "BUFFER_ATOMIC_SWAP">;
1328 defm : BufferAtomicPatterns<SIbuffer_atomic_add, i32, "BUFFER_ATOMIC_ADD">;
1329 defm : BufferAtomicPatterns<SIbuffer_atomic_sub, i32, "BUFFER_ATOMIC_SUB">;
1330 defm : BufferAtomicPatterns<SIbuffer_atomic_smin, i32, "BUFFER_ATOMIC_SMIN">;
1331 defm : BufferAtomicPatterns<SIbuffer_atomic_umin, i32, "BUFFER_ATOMIC_UMIN">;
1332 defm : BufferAtomicPatterns<SIbuffer_atomic_smax, i32, "BUFFER_ATOMIC_SMAX">;
1333 defm : BufferAtomicPatterns<SIbuffer_atomic_umax, i32, "BUFFER_ATOMIC_UMAX">;
1334 defm : BufferAtomicPatterns<SIbuffer_atomic_and, i32, "BUFFER_ATOMIC_AND">;
1335 defm : BufferAtomicPatterns<SIbuffer_atomic_or, i32, "BUFFER_ATOMIC_OR">;
1336 defm : BufferAtomicPatterns<SIbuffer_atomic_xor, i32, "BUFFER_ATOMIC_XOR">;
1337 defm : BufferAtomicPatterns<SIbuffer_atomic_inc, i32, "BUFFER_ATOMIC_INC">;
1338 defm : BufferAtomicPatterns<SIbuffer_atomic_dec, i32, "BUFFER_ATOMIC_DEC">;
1339 defm : BufferAtomicPatterns<SIbuffer_atomic_swap, i64, "BUFFER_ATOMIC_SWAP_X2">;
1340 defm : BufferAtomicPatterns<SIbuffer_atomic_add, i64, "BUFFER_ATOMIC_ADD_X2">;
1341 defm : BufferAtomicPatterns<SIbuffer_atomic_sub, i64, "BUFFER_ATOMIC_SUB_X2">;
1342 defm : BufferAtomicPatterns<SIbuffer_atomic_smin, i64, "BUFFER_ATOMIC_SMIN_X2">;
1343 defm : BufferAtomicPatterns<SIbuffer_atomic_umin, i64, "BUFFER_ATOMIC_UMIN_X2">;
1344 defm : BufferAtomicPatterns<SIbuffer_atomic_smax, i64, "BUFFER_ATOMIC_SMAX_X2">;
1345 defm : BufferAtomicPatterns<SIbuffer_atomic_umax, i64, "BUFFER_ATOMIC_UMAX_X2">;
1346 defm : BufferAtomicPatterns<SIbuffer_atomic_and, i64, "BUFFER_ATOMIC_AND_X2">;
1347 defm : BufferAtomicPatterns<SIbuffer_atomic_or, i64, "BUFFER_ATOMIC_OR_X2">;
1348 defm : BufferAtomicPatterns<SIbuffer_atomic_xor, i64, "BUFFER_ATOMIC_XOR_X2">;
1349 defm : BufferAtomicPatterns<SIbuffer_atomic_inc, i64, "BUFFER_ATOMIC_INC_X2">;
1350 defm : BufferAtomicPatterns<SIbuffer_atomic_dec, i64, "BUFFER_ATOMIC_DEC_X2">;
1352 multiclass BufferAtomicPatterns_NO_RTN<SDPatternOperator name, ValueType vt,
1355 (name vt:$vdata_in, v4i32:$rsrc, 0,
1356 0, i32:$soffset, imm:$offset,
1357 imm:$cachepolicy, 0),
1358 (!cast<MUBUF_Pseudo>(opcode # _OFFSET) $vdata_in, $rsrc, $soffset,
1359 (as_i16imm $offset), (extract_slc $cachepolicy))
1363 (name vt:$vdata_in, v4i32:$rsrc, i32:$vindex,
1364 0, i32:$soffset, imm:$offset,
1365 imm:$cachepolicy, imm),
1366 (!cast<MUBUF_Pseudo>(opcode # _IDXEN) $vdata_in, $vindex, $rsrc, $soffset,
1367 (as_i16imm $offset), (extract_slc $cachepolicy))
1371 (name vt:$vdata_in, v4i32:$rsrc, 0,
1372 i32:$voffset, i32:$soffset, imm:$offset,
1373 imm:$cachepolicy, 0),
1374 (!cast<MUBUF_Pseudo>(opcode # _OFFEN) $vdata_in, $voffset, $rsrc, $soffset,
1375 (as_i16imm $offset), (extract_slc $cachepolicy))
1379 (name vt:$vdata_in, v4i32:$rsrc, i32:$vindex,
1380 i32:$voffset, i32:$soffset, imm:$offset,
1381 imm:$cachepolicy, imm),
1382 (!cast<MUBUF_Pseudo>(opcode # _BOTHEN)
1384 (REG_SEQUENCE VReg_64, $vindex, sub0, $voffset, sub1),
1385 $rsrc, $soffset, (as_i16imm $offset), (extract_slc $cachepolicy))
1389 defm : BufferAtomicPatterns_NO_RTN<SIbuffer_atomic_fadd, f32, "BUFFER_ATOMIC_ADD_F32">;
1390 defm : BufferAtomicPatterns_NO_RTN<SIbuffer_atomic_pk_fadd, v2f16, "BUFFER_ATOMIC_PK_ADD_F16">;
1393 (SIbuffer_atomic_cmpswap
1394 i32:$data, i32:$cmp, v4i32:$rsrc, 0,
1395 0, i32:$soffset, imm:$offset,
1396 imm:$cachepolicy, 0),
1398 (BUFFER_ATOMIC_CMPSWAP_OFFSET_RTN
1399 (REG_SEQUENCE VReg_64, $data, sub0, $cmp, sub1),
1400 $rsrc, $soffset, (as_i16imm $offset), (extract_slc $cachepolicy)),
1405 (SIbuffer_atomic_cmpswap
1406 i32:$data, i32:$cmp, v4i32:$rsrc, i32:$vindex,
1407 0, i32:$soffset, imm:$offset,
1408 imm:$cachepolicy, imm),
1410 (BUFFER_ATOMIC_CMPSWAP_IDXEN_RTN
1411 (REG_SEQUENCE VReg_64, $data, sub0, $cmp, sub1),
1412 $vindex, $rsrc, $soffset, (as_i16imm $offset), (extract_slc $cachepolicy)),
1417 (SIbuffer_atomic_cmpswap
1418 i32:$data, i32:$cmp, v4i32:$rsrc, 0,
1419 i32:$voffset, i32:$soffset, imm:$offset,
1420 imm:$cachepolicy, 0),
1422 (BUFFER_ATOMIC_CMPSWAP_OFFEN_RTN
1423 (REG_SEQUENCE VReg_64, $data, sub0, $cmp, sub1),
1424 $voffset, $rsrc, $soffset, (as_i16imm $offset), (extract_slc $cachepolicy)),
1429 (SIbuffer_atomic_cmpswap
1430 i32:$data, i32:$cmp, v4i32:$rsrc, i32:$vindex,
1431 i32:$voffset, i32:$soffset, imm:$offset,
1432 imm:$cachepolicy, imm),
1434 (BUFFER_ATOMIC_CMPSWAP_BOTHEN_RTN
1435 (REG_SEQUENCE VReg_64, $data, sub0, $cmp, sub1),
1436 (REG_SEQUENCE VReg_64, $vindex, sub0, $voffset, sub1),
1437 $rsrc, $soffset, (as_i16imm $offset), (extract_slc $cachepolicy)),
1441 class MUBUFLoad_PatternADDR64 <MUBUF_Pseudo Instr_ADDR64, ValueType vt,
1442 PatFrag constant_ld> : GCNPat <
1443 (vt (constant_ld (MUBUFAddr64 v4i32:$srsrc, i64:$vaddr, i32:$soffset,
1444 i16:$offset, i1:$glc, i1:$slc, i1:$tfe, i1:$dlc))),
1445 (Instr_ADDR64 $vaddr, $srsrc, $soffset, $offset, $glc, $slc, $tfe, $dlc)
1448 multiclass MUBUFLoad_Atomic_Pattern <MUBUF_Pseudo Instr_ADDR64, MUBUF_Pseudo Instr_OFFSET,
1449 ValueType vt, PatFrag atomic_ld> {
1451 (vt (atomic_ld (MUBUFAddr64 v4i32:$srsrc, i64:$vaddr, i32:$soffset,
1452 i16:$offset, i1:$slc))),
1453 (Instr_ADDR64 $vaddr, $srsrc, $soffset, $offset, 0, $slc, 0, 0)
1457 (vt (atomic_ld (MUBUFOffsetNoGLC v4i32:$rsrc, i32:$soffset, i16:$offset))),
1458 (Instr_OFFSET $rsrc, $soffset, (as_i16imm $offset), 0, 0, 0, 0)
1462 let SubtargetPredicate = isGFX6GFX7 in {
1463 def : MUBUFLoad_PatternADDR64 <BUFFER_LOAD_SBYTE_ADDR64, i32, sextloadi8_constant>;
1464 def : MUBUFLoad_PatternADDR64 <BUFFER_LOAD_UBYTE_ADDR64, i32, extloadi8_constant>;
1465 def : MUBUFLoad_PatternADDR64 <BUFFER_LOAD_UBYTE_ADDR64, i32, zextloadi8_constant>;
1466 def : MUBUFLoad_PatternADDR64 <BUFFER_LOAD_SSHORT_ADDR64, i32, sextloadi16_constant>;
1467 def : MUBUFLoad_PatternADDR64 <BUFFER_LOAD_USHORT_ADDR64, i32, extloadi16_constant>;
1468 def : MUBUFLoad_PatternADDR64 <BUFFER_LOAD_USHORT_ADDR64, i32, zextloadi16_constant>;
1470 defm : MUBUFLoad_Atomic_Pattern <BUFFER_LOAD_DWORD_ADDR64, BUFFER_LOAD_DWORD_OFFSET, i32, atomic_load_32_global>;
1471 defm : MUBUFLoad_Atomic_Pattern <BUFFER_LOAD_DWORDX2_ADDR64, BUFFER_LOAD_DWORDX2_OFFSET, i64, atomic_load_64_global>;
1472 } // End SubtargetPredicate = isGFX6GFX7
1474 multiclass MUBUFLoad_Pattern <MUBUF_Pseudo Instr_OFFSET, ValueType vt,
1478 (vt (ld (MUBUFOffset v4i32:$srsrc, i32:$soffset,
1479 i16:$offset, i1:$glc, i1:$slc, i1:$tfe, i1:$dlc))),
1480 (Instr_OFFSET $srsrc, $soffset, $offset, $glc, $slc, $tfe, $dlc)
1484 let OtherPredicates = [Has16BitInsts] in {
1486 defm : MUBUFLoad_Pattern <BUFFER_LOAD_SBYTE_OFFSET, i16, sextloadi8_constant>;
1487 defm : MUBUFLoad_Pattern <BUFFER_LOAD_UBYTE_OFFSET, i16, extloadi8_constant>;
1488 defm : MUBUFLoad_Pattern <BUFFER_LOAD_UBYTE_OFFSET, i16, zextloadi8_constant>;
1489 defm : MUBUFLoad_Pattern <BUFFER_LOAD_SBYTE_OFFSET, i16, sextloadi8_global>;
1490 defm : MUBUFLoad_Pattern <BUFFER_LOAD_UBYTE_OFFSET, i16, extloadi8_global>;
1491 defm : MUBUFLoad_Pattern <BUFFER_LOAD_UBYTE_OFFSET, i16, zextloadi8_global>;
1493 defm : MUBUFLoad_Pattern <BUFFER_LOAD_USHORT_OFFSET, i16, load_global>;
1495 } // End OtherPredicates = [Has16BitInsts]
1497 multiclass MUBUFScratchLoadPat <MUBUF_Pseudo InstrOffen,
1498 MUBUF_Pseudo InstrOffset,
1499 ValueType vt, PatFrag ld> {
1501 (vt (ld (MUBUFScratchOffen v4i32:$srsrc, i32:$vaddr,
1502 i32:$soffset, u16imm:$offset))),
1503 (InstrOffen $vaddr, $srsrc, $soffset, $offset, 0, 0, 0, 0)
1507 (vt (ld (MUBUFScratchOffset v4i32:$srsrc, i32:$soffset, u16imm:$offset))),
1508 (InstrOffset $srsrc, $soffset, $offset, 0, 0, 0, 0)
1512 // XXX - Is it possible to have a complex pattern in a PatFrag?
1513 multiclass MUBUFScratchLoadPat_D16 <MUBUF_Pseudo InstrOffen,
1514 MUBUF_Pseudo InstrOffset,
1515 ValueType vt, PatFrag ld_frag> {
1517 (ld_frag (MUBUFScratchOffen v4i32:$srsrc, i32:$vaddr, i32:$soffset, u16imm:$offset), vt:$in),
1518 (InstrOffen $vaddr, $srsrc, $soffset, $offset, 0, 0, 0, 0, $in)
1522 (ld_frag (MUBUFScratchOffset v4i32:$srsrc, i32:$soffset, u16imm:$offset), vt:$in),
1523 (InstrOffset $srsrc, $soffset, $offset, 0, 0, 0, 0, $in)
1527 defm : MUBUFScratchLoadPat <BUFFER_LOAD_SBYTE_OFFEN, BUFFER_LOAD_SBYTE_OFFSET, i32, sextloadi8_private>;
1528 defm : MUBUFScratchLoadPat <BUFFER_LOAD_UBYTE_OFFEN, BUFFER_LOAD_UBYTE_OFFSET, i32, extloadi8_private>;
1529 defm : MUBUFScratchLoadPat <BUFFER_LOAD_UBYTE_OFFEN, BUFFER_LOAD_UBYTE_OFFSET, i32, zextloadi8_private>;
1530 defm : MUBUFScratchLoadPat <BUFFER_LOAD_SBYTE_OFFEN, BUFFER_LOAD_SBYTE_OFFSET, i16, sextloadi8_private>;
1531 defm : MUBUFScratchLoadPat <BUFFER_LOAD_UBYTE_OFFEN, BUFFER_LOAD_UBYTE_OFFSET, i16, extloadi8_private>;
1532 defm : MUBUFScratchLoadPat <BUFFER_LOAD_UBYTE_OFFEN, BUFFER_LOAD_UBYTE_OFFSET, i16, zextloadi8_private>;
1533 defm : MUBUFScratchLoadPat <BUFFER_LOAD_SSHORT_OFFEN, BUFFER_LOAD_SSHORT_OFFSET, i32, sextloadi16_private>;
1534 defm : MUBUFScratchLoadPat <BUFFER_LOAD_USHORT_OFFEN, BUFFER_LOAD_USHORT_OFFSET, i32, extloadi16_private>;
1535 defm : MUBUFScratchLoadPat <BUFFER_LOAD_USHORT_OFFEN, BUFFER_LOAD_USHORT_OFFSET, i32, zextloadi16_private>;
1536 defm : MUBUFScratchLoadPat <BUFFER_LOAD_USHORT_OFFEN, BUFFER_LOAD_USHORT_OFFSET, i16, load_private>;
1538 foreach vt = Reg32Types.types in {
1539 defm : MUBUFScratchLoadPat <BUFFER_LOAD_DWORD_OFFEN, BUFFER_LOAD_DWORD_OFFSET, i32, load_private>;
1541 defm : MUBUFScratchLoadPat <BUFFER_LOAD_DWORDX2_OFFEN, BUFFER_LOAD_DWORDX2_OFFSET, v2i32, load_private>;
1542 defm : MUBUFScratchLoadPat <BUFFER_LOAD_DWORDX3_OFFEN, BUFFER_LOAD_DWORDX3_OFFSET, v3i32, load_private>;
1543 defm : MUBUFScratchLoadPat <BUFFER_LOAD_DWORDX4_OFFEN, BUFFER_LOAD_DWORDX4_OFFSET, v4i32, load_private>;
1545 let OtherPredicates = [D16PreservesUnusedBits] in {
1546 defm : MUBUFScratchLoadPat_D16<BUFFER_LOAD_SHORT_D16_HI_OFFEN, BUFFER_LOAD_SHORT_D16_HI_OFFSET, v2i16, load_d16_hi_private>;
1547 defm : MUBUFScratchLoadPat_D16<BUFFER_LOAD_UBYTE_D16_HI_OFFEN, BUFFER_LOAD_UBYTE_D16_HI_OFFSET, v2i16, az_extloadi8_d16_hi_private>;
1548 defm : MUBUFScratchLoadPat_D16<BUFFER_LOAD_SBYTE_D16_HI_OFFEN, BUFFER_LOAD_SBYTE_D16_HI_OFFSET, v2i16, sextloadi8_d16_hi_private>;
1549 defm : MUBUFScratchLoadPat_D16<BUFFER_LOAD_SHORT_D16_HI_OFFEN, BUFFER_LOAD_SHORT_D16_HI_OFFSET, v2f16, load_d16_hi_private>;
1550 defm : MUBUFScratchLoadPat_D16<BUFFER_LOAD_UBYTE_D16_HI_OFFEN, BUFFER_LOAD_UBYTE_D16_HI_OFFSET, v2f16, az_extloadi8_d16_hi_private>;
1551 defm : MUBUFScratchLoadPat_D16<BUFFER_LOAD_SBYTE_D16_HI_OFFEN, BUFFER_LOAD_SBYTE_D16_HI_OFFSET, v2f16, sextloadi8_d16_hi_private>;
1553 defm : MUBUFScratchLoadPat_D16<BUFFER_LOAD_SHORT_D16_OFFEN, BUFFER_LOAD_SHORT_D16_OFFSET, v2i16, load_d16_lo_private>;
1554 defm : MUBUFScratchLoadPat_D16<BUFFER_LOAD_UBYTE_D16_OFFEN, BUFFER_LOAD_UBYTE_D16_OFFSET, v2i16, az_extloadi8_d16_lo_private>;
1555 defm : MUBUFScratchLoadPat_D16<BUFFER_LOAD_SBYTE_D16_OFFEN, BUFFER_LOAD_SBYTE_D16_OFFSET, v2i16, sextloadi8_d16_lo_private>;
1556 defm : MUBUFScratchLoadPat_D16<BUFFER_LOAD_SHORT_D16_OFFEN, BUFFER_LOAD_SHORT_D16_OFFSET, v2f16, load_d16_lo_private>;
1557 defm : MUBUFScratchLoadPat_D16<BUFFER_LOAD_UBYTE_D16_OFFEN, BUFFER_LOAD_UBYTE_D16_OFFSET, v2f16, az_extloadi8_d16_lo_private>;
1558 defm : MUBUFScratchLoadPat_D16<BUFFER_LOAD_SBYTE_D16_OFFEN, BUFFER_LOAD_SBYTE_D16_OFFSET, v2f16, sextloadi8_d16_lo_private>;
1561 multiclass MUBUFStore_Atomic_Pattern <MUBUF_Pseudo Instr_ADDR64, MUBUF_Pseudo Instr_OFFSET,
1562 ValueType vt, PatFrag atomic_st> {
1563 // Store follows atomic op convention so address is forst
1565 (atomic_st (MUBUFAddr64 v4i32:$srsrc, i64:$vaddr, i32:$soffset,
1566 i16:$offset, i1:$slc), vt:$val),
1567 (Instr_ADDR64 $val, $vaddr, $srsrc, $soffset, $offset, 0, $slc, 0, 0)
1571 (atomic_st (MUBUFOffsetNoGLC v4i32:$rsrc, i32:$soffset, i16:$offset), vt:$val),
1572 (Instr_OFFSET $val, $rsrc, $soffset, (as_i16imm $offset), 0, 0, 0, 0)
1575 let SubtargetPredicate = isGFX6GFX7 in {
1576 defm : MUBUFStore_Atomic_Pattern <BUFFER_STORE_DWORD_ADDR64, BUFFER_STORE_DWORD_OFFSET, i32, store_atomic_global>;
1577 defm : MUBUFStore_Atomic_Pattern <BUFFER_STORE_DWORDX2_ADDR64, BUFFER_STORE_DWORDX2_OFFSET, i64, store_atomic_global>;
1578 } // End Predicates = isGFX6GFX7
1581 multiclass MUBUFStore_Pattern <MUBUF_Pseudo Instr_OFFSET, ValueType vt,
1585 (st vt:$vdata, (MUBUFOffset v4i32:$srsrc, i32:$soffset,
1586 i16:$offset, i1:$glc, i1:$slc, i1:$tfe, i1:$dlc)),
1587 (Instr_OFFSET $vdata, $srsrc, $soffset, $offset, $glc, $slc, $tfe, $dlc)
1591 defm : MUBUFStore_Pattern <BUFFER_STORE_BYTE_OFFSET, i16, truncstorei8_global>;
1592 defm : MUBUFStore_Pattern <BUFFER_STORE_SHORT_OFFSET, i16, store_global>;
1594 multiclass MUBUFScratchStorePat <MUBUF_Pseudo InstrOffen,
1595 MUBUF_Pseudo InstrOffset,
1596 ValueType vt, PatFrag st,
1597 RegisterClass rc = VGPR_32> {
1599 (st vt:$value, (MUBUFScratchOffen v4i32:$srsrc, i32:$vaddr,
1600 i32:$soffset, u16imm:$offset)),
1601 (InstrOffen rc:$value, $vaddr, $srsrc, $soffset, $offset, 0, 0, 0, 0)
1605 (st vt:$value, (MUBUFScratchOffset v4i32:$srsrc, i32:$soffset,
1607 (InstrOffset rc:$value, $srsrc, $soffset, $offset, 0, 0, 0, 0)
1611 defm : MUBUFScratchStorePat <BUFFER_STORE_BYTE_OFFEN, BUFFER_STORE_BYTE_OFFSET, i32, truncstorei8_private>;
1612 defm : MUBUFScratchStorePat <BUFFER_STORE_SHORT_OFFEN, BUFFER_STORE_SHORT_OFFSET, i32, truncstorei16_private>;
1613 defm : MUBUFScratchStorePat <BUFFER_STORE_BYTE_OFFEN, BUFFER_STORE_BYTE_OFFSET, i16, truncstorei8_private>;
1614 defm : MUBUFScratchStorePat <BUFFER_STORE_SHORT_OFFEN, BUFFER_STORE_SHORT_OFFSET, i16, store_private>;
1616 foreach vt = Reg32Types.types in {
1617 defm : MUBUFScratchStorePat <BUFFER_STORE_DWORD_OFFEN, BUFFER_STORE_DWORD_OFFSET, vt, store_private>;
1620 defm : MUBUFScratchStorePat <BUFFER_STORE_DWORDX2_OFFEN, BUFFER_STORE_DWORDX2_OFFSET, v2i32, store_private, VReg_64>;
1621 defm : MUBUFScratchStorePat <BUFFER_STORE_DWORDX3_OFFEN, BUFFER_STORE_DWORDX3_OFFSET, v3i32, store_private, VReg_96>;
1622 defm : MUBUFScratchStorePat <BUFFER_STORE_DWORDX4_OFFEN, BUFFER_STORE_DWORDX4_OFFSET, v4i32, store_private, VReg_128>;
1625 let OtherPredicates = [D16PreservesUnusedBits] in {
1626 // Hiding the extract high pattern in the PatFrag seems to not
1627 // automatically increase the complexity.
1628 let AddedComplexity = 1 in {
1629 defm : MUBUFScratchStorePat <BUFFER_STORE_SHORT_D16_HI_OFFEN, BUFFER_STORE_SHORT_D16_HI_OFFSET, i32, store_hi16_private>;
1630 defm : MUBUFScratchStorePat <BUFFER_STORE_BYTE_D16_HI_OFFEN, BUFFER_STORE_BYTE_D16_HI_OFFSET, i32, truncstorei8_hi16_private>;
1634 //===----------------------------------------------------------------------===//
1636 //===----------------------------------------------------------------------===//
1638 //===----------------------------------------------------------------------===//
1639 // tbuffer_load/store_format patterns
1640 //===----------------------------------------------------------------------===//
1642 multiclass MTBUF_LoadIntrinsicPat<SDPatternOperator name, ValueType vt,
1645 (vt (name v4i32:$rsrc, 0, 0, i32:$soffset, imm:$offset,
1646 imm:$format, imm:$cachepolicy, 0)),
1647 (!cast<MTBUF_Pseudo>(opcode # _OFFSET) $rsrc, $soffset, (as_i16imm $offset),
1649 (extract_glc $cachepolicy), (extract_slc $cachepolicy), 0, (extract_dlc $cachepolicy))
1653 (vt (name v4i32:$rsrc, i32:$vindex, 0, i32:$soffset, imm:$offset,
1654 imm:$format, imm:$cachepolicy, imm)),
1655 (!cast<MTBUF_Pseudo>(opcode # _IDXEN) $vindex, $rsrc, $soffset, (as_i16imm $offset),
1657 (extract_glc $cachepolicy), (extract_slc $cachepolicy), 0, (extract_dlc $cachepolicy))
1661 (vt (name v4i32:$rsrc, 0, i32:$voffset, i32:$soffset, imm:$offset,
1662 imm:$format, imm:$cachepolicy, 0)),
1663 (!cast<MTBUF_Pseudo>(opcode # _OFFEN) $voffset, $rsrc, $soffset, (as_i16imm $offset),
1665 (extract_glc $cachepolicy), (extract_slc $cachepolicy), 0, (extract_dlc $cachepolicy))
1669 (vt (name v4i32:$rsrc, i32:$vindex, i32:$voffset, i32:$soffset, imm:$offset,
1670 imm:$format, imm:$cachepolicy, imm)),
1671 (!cast<MTBUF_Pseudo>(opcode # _BOTHEN)
1672 (REG_SEQUENCE VReg_64, $vindex, sub0, $voffset, sub1),
1673 $rsrc, $soffset, (as_i16imm $offset),
1675 (extract_glc $cachepolicy), (extract_slc $cachepolicy), 0, (extract_dlc $cachepolicy))
1679 defm : MTBUF_LoadIntrinsicPat<SItbuffer_load, i32, "TBUFFER_LOAD_FORMAT_X">;
1680 defm : MTBUF_LoadIntrinsicPat<SItbuffer_load, v2i32, "TBUFFER_LOAD_FORMAT_XY">;
1681 defm : MTBUF_LoadIntrinsicPat<SItbuffer_load, v3i32, "TBUFFER_LOAD_FORMAT_XYZ">;
1682 defm : MTBUF_LoadIntrinsicPat<SItbuffer_load, v4i32, "TBUFFER_LOAD_FORMAT_XYZW">;
1683 defm : MTBUF_LoadIntrinsicPat<SItbuffer_load, f32, "TBUFFER_LOAD_FORMAT_X">;
1684 defm : MTBUF_LoadIntrinsicPat<SItbuffer_load, v2f32, "TBUFFER_LOAD_FORMAT_XY">;
1685 defm : MTBUF_LoadIntrinsicPat<SItbuffer_load, v3f32, "TBUFFER_LOAD_FORMAT_XYZ">;
1686 defm : MTBUF_LoadIntrinsicPat<SItbuffer_load, v4f32, "TBUFFER_LOAD_FORMAT_XYZW">;
1688 let SubtargetPredicate = HasUnpackedD16VMem in {
1689 defm : MTBUF_LoadIntrinsicPat<SItbuffer_load_d16, f16, "TBUFFER_LOAD_FORMAT_D16_X_gfx80">;
1690 defm : MTBUF_LoadIntrinsicPat<SItbuffer_load_d16, v2i32, "TBUFFER_LOAD_FORMAT_D16_XY_gfx80">;
1691 defm : MTBUF_LoadIntrinsicPat<SItbuffer_load_d16, v4i32, "TBUFFER_LOAD_FORMAT_D16_XYZW_gfx80">;
1692 } // End HasUnpackedD16VMem.
1694 let SubtargetPredicate = HasPackedD16VMem in {
1695 defm : MTBUF_LoadIntrinsicPat<SItbuffer_load_d16, f16, "TBUFFER_LOAD_FORMAT_D16_X">;
1696 defm : MTBUF_LoadIntrinsicPat<SItbuffer_load_d16, v2f16, "TBUFFER_LOAD_FORMAT_D16_XY">;
1697 defm : MTBUF_LoadIntrinsicPat<SItbuffer_load_d16, v4f16, "TBUFFER_LOAD_FORMAT_D16_XYZW">;
1698 } // End HasPackedD16VMem.
1700 multiclass MTBUF_StoreIntrinsicPat<SDPatternOperator name, ValueType vt,
1703 (name vt:$vdata, v4i32:$rsrc, 0, 0, i32:$soffset, imm:$offset,
1704 imm:$format, imm:$cachepolicy, 0),
1705 (!cast<MTBUF_Pseudo>(opcode # _OFFSET_exact) $vdata, $rsrc, $soffset,
1706 (as_i16imm $offset), (as_i8imm $format),
1707 (extract_glc $cachepolicy), (extract_slc $cachepolicy), 0, (extract_dlc $cachepolicy))
1711 (name vt:$vdata, v4i32:$rsrc, i32:$vindex, 0, i32:$soffset, imm:$offset,
1712 imm:$format, imm:$cachepolicy, imm),
1713 (!cast<MTBUF_Pseudo>(opcode # _IDXEN_exact) $vdata, $vindex, $rsrc, $soffset,
1714 (as_i16imm $offset), (as_i8imm $format),
1715 (extract_glc $cachepolicy), (extract_slc $cachepolicy), 0, (extract_dlc $cachepolicy))
1719 (name vt:$vdata, v4i32:$rsrc, 0, i32:$voffset, i32:$soffset, imm:$offset,
1720 imm:$format, imm:$cachepolicy, 0),
1721 (!cast<MTBUF_Pseudo>(opcode # _OFFEN_exact) $vdata, $voffset, $rsrc, $soffset,
1722 (as_i16imm $offset), (as_i8imm $format),
1723 (extract_glc $cachepolicy), (extract_slc $cachepolicy), 0, (extract_dlc $cachepolicy))
1727 (name vt:$vdata, v4i32:$rsrc, i32:$vindex, i32:$voffset, i32:$soffset,
1728 imm:$offset, imm:$format, imm:$cachepolicy, imm),
1729 (!cast<MTBUF_Pseudo>(opcode # _BOTHEN_exact)
1731 (REG_SEQUENCE VReg_64, $vindex, sub0, $voffset, sub1),
1732 $rsrc, $soffset, (as_i16imm $offset), (as_i8imm $format),
1733 (extract_glc $cachepolicy), (extract_slc $cachepolicy), 0, (extract_dlc $cachepolicy))
1737 defm : MTBUF_StoreIntrinsicPat<SItbuffer_store, i32, "TBUFFER_STORE_FORMAT_X">;
1738 defm : MTBUF_StoreIntrinsicPat<SItbuffer_store, v2i32, "TBUFFER_STORE_FORMAT_XY">;
1739 defm : MTBUF_StoreIntrinsicPat<SItbuffer_store, v3i32, "TBUFFER_STORE_FORMAT_XYZ">;
1740 defm : MTBUF_StoreIntrinsicPat<SItbuffer_store, v4i32, "TBUFFER_STORE_FORMAT_XYZW">;
1741 defm : MTBUF_StoreIntrinsicPat<SItbuffer_store, f32, "TBUFFER_STORE_FORMAT_X">;
1742 defm : MTBUF_StoreIntrinsicPat<SItbuffer_store, v2f32, "TBUFFER_STORE_FORMAT_XY">;
1743 defm : MTBUF_StoreIntrinsicPat<SItbuffer_store, v3f32, "TBUFFER_STORE_FORMAT_XYZ">;
1744 defm : MTBUF_StoreIntrinsicPat<SItbuffer_store, v4f32, "TBUFFER_STORE_FORMAT_XYZW">;
1746 let SubtargetPredicate = HasUnpackedD16VMem in {
1747 defm : MTBUF_StoreIntrinsicPat<SItbuffer_store_d16, f16, "TBUFFER_STORE_FORMAT_D16_X_gfx80">;
1748 defm : MTBUF_StoreIntrinsicPat<SItbuffer_store_d16, v2i32, "TBUFFER_STORE_FORMAT_D16_XY_gfx80">;
1749 defm : MTBUF_StoreIntrinsicPat<SItbuffer_store_d16, v4i32, "TBUFFER_STORE_FORMAT_D16_XYZW_gfx80">;
1750 } // End HasUnpackedD16VMem.
1752 let SubtargetPredicate = HasPackedD16VMem in {
1753 defm : MTBUF_StoreIntrinsicPat<SItbuffer_store_d16, f16, "TBUFFER_STORE_FORMAT_D16_X">;
1754 defm : MTBUF_StoreIntrinsicPat<SItbuffer_store_d16, v2f16, "TBUFFER_STORE_FORMAT_D16_XY">;
1755 defm : MTBUF_StoreIntrinsicPat<SItbuffer_store_d16, v4f16, "TBUFFER_STORE_FORMAT_D16_XYZW">;
1756 } // End HasPackedD16VMem.
1758 //===----------------------------------------------------------------------===//
1759 // Target-specific instruction encodings.
1760 //===----------------------------------------------------------------------===//
1762 //===----------------------------------------------------------------------===//
1763 // Base ENC_MUBUF for GFX6, GFX7, GFX10.
1764 //===----------------------------------------------------------------------===//
1766 class Base_MUBUF_Real_gfx6_gfx7_gfx10<bits<7> op, MUBUF_Pseudo ps, int ef> :
1767 MUBUF_Real<ps>, Enc64, SIMCInstr<ps.PseudoInstr, ef> {
1768 let Inst{11-0} = !if(ps.has_offset, offset, ?);
1769 let Inst{12} = ps.offen;
1770 let Inst{13} = ps.idxen;
1771 let Inst{14} = !if(ps.has_glc, glc, ps.glc_value);
1772 let Inst{16} = !if(ps.lds, 1, 0);
1773 let Inst{24-18} = op;
1774 let Inst{31-26} = 0x38;
1775 let Inst{39-32} = !if(ps.has_vaddr, vaddr, ?);
1776 let Inst{47-40} = !if(ps.has_vdata, vdata, ?);
1777 let Inst{52-48} = !if(ps.has_srsrc, srsrc{6-2}, ?);
1778 let Inst{54} = !if(ps.has_slc, slc, ?);
1779 let Inst{55} = !if(ps.has_tfe, tfe, ?);
1780 let Inst{63-56} = !if(ps.has_soffset, soffset, ?);
1783 class MUBUF_Real_gfx10<bits<8> op, MUBUF_Pseudo ps> :
1784 Base_MUBUF_Real_gfx6_gfx7_gfx10<op{6-0}, ps, SIEncodingFamily.GFX10> {
1785 let Inst{15} = !if(ps.has_dlc, dlc, ps.dlc_value);
1786 let Inst{25} = op{7};
1789 class MUBUF_Real_gfx6_gfx7<bits<8> op, MUBUF_Pseudo ps> :
1790 Base_MUBUF_Real_gfx6_gfx7_gfx10<op{6-0}, ps, SIEncodingFamily.SI> {
1791 let Inst{15} = ps.addr64;
1794 //===----------------------------------------------------------------------===//
1796 //===----------------------------------------------------------------------===//
1798 let AssemblerPredicate = isGFX10Plus, DecoderNamespace = "GFX10" in {
1799 multiclass MUBUF_Real_gfx10_with_name<bits<8> op, string opName,
1801 def _gfx10 : MUBUF_Real_gfx10<op, !cast<MUBUF_Pseudo>(opName)> {
1802 MUBUF_Pseudo ps = !cast<MUBUF_Pseudo>(opName);
1803 let AsmString = asmName # ps.AsmOperands;
1806 multiclass MUBUF_Real_AllAddr_gfx10<bits<8> op> {
1808 MUBUF_Real_gfx10<op, !cast<MUBUF_Pseudo>(NAME#"_BOTHEN")>;
1810 MUBUF_Real_gfx10<op, !cast<MUBUF_Pseudo>(NAME#"_IDXEN")>;
1812 MUBUF_Real_gfx10<op, !cast<MUBUF_Pseudo>(NAME#"_OFFEN")>;
1814 MUBUF_Real_gfx10<op, !cast<MUBUF_Pseudo>(NAME#"_OFFSET")>;
1816 multiclass MUBUF_Real_AllAddr_Lds_gfx10<bits<8> op> {
1817 def _OFFSET_gfx10 : MUBUF_Real_gfx10<op, !cast<MUBUF_Pseudo>(NAME#"_OFFSET")>,
1818 MUBUFLdsTable<0, NAME # "_OFFSET_gfx10">;
1819 def _OFFEN_gfx10 : MUBUF_Real_gfx10<op, !cast<MUBUF_Pseudo>(NAME#"_OFFEN")>,
1820 MUBUFLdsTable<0, NAME # "_OFFEN_gfx10">;
1821 def _IDXEN_gfx10 : MUBUF_Real_gfx10<op, !cast<MUBUF_Pseudo>(NAME#"_IDXEN")>,
1822 MUBUFLdsTable<0, NAME # "_IDXEN_gfx10">;
1823 def _BOTHEN_gfx10 : MUBUF_Real_gfx10<op, !cast<MUBUF_Pseudo>(NAME#"_BOTHEN")>,
1824 MUBUFLdsTable<0, NAME # "_BOTHEN_gfx10">;
1826 def _LDS_OFFSET_gfx10 : MUBUF_Real_gfx10<op, !cast<MUBUF_Pseudo>(NAME#"_LDS_OFFSET")>,
1827 MUBUFLdsTable<1, NAME # "_OFFSET_gfx10">;
1828 def _LDS_OFFEN_gfx10 : MUBUF_Real_gfx10<op, !cast<MUBUF_Pseudo>(NAME#"_LDS_OFFEN")>,
1829 MUBUFLdsTable<1, NAME # "_OFFEN_gfx10">;
1830 def _LDS_IDXEN_gfx10 : MUBUF_Real_gfx10<op, !cast<MUBUF_Pseudo>(NAME#"_LDS_IDXEN")>,
1831 MUBUFLdsTable<1, NAME # "_IDXEN_gfx10">;
1832 def _LDS_BOTHEN_gfx10 : MUBUF_Real_gfx10<op, !cast<MUBUF_Pseudo>(NAME#"_LDS_BOTHEN")>,
1833 MUBUFLdsTable<1, NAME # "_BOTHEN_gfx10">;
1835 multiclass MUBUF_Real_Atomics_gfx10<bits<8> op> :
1836 MUBUF_Real_AllAddr_gfx10<op> {
1837 def _BOTHEN_RTN_gfx10 :
1838 MUBUF_Real_gfx10<op, !cast<MUBUF_Pseudo>(NAME#"_BOTHEN_RTN")>;
1839 def _IDXEN_RTN_gfx10 :
1840 MUBUF_Real_gfx10<op, !cast<MUBUF_Pseudo>(NAME#"_IDXEN_RTN")>;
1841 def _OFFEN_RTN_gfx10 :
1842 MUBUF_Real_gfx10<op, !cast<MUBUF_Pseudo>(NAME#"_OFFEN_RTN")>;
1843 def _OFFSET_RTN_gfx10 :
1844 MUBUF_Real_gfx10<op, !cast<MUBUF_Pseudo>(NAME#"_OFFSET_RTN")>;
1846 } // End AssemblerPredicate = isGFX10Plus, DecoderNamespace = "GFX10"
1848 defm BUFFER_STORE_BYTE_D16_HI : MUBUF_Real_AllAddr_gfx10<0x019>;
1849 defm BUFFER_STORE_SHORT_D16_HI : MUBUF_Real_AllAddr_gfx10<0x01b>;
1850 defm BUFFER_LOAD_UBYTE_D16 : MUBUF_Real_AllAddr_gfx10<0x020>;
1851 defm BUFFER_LOAD_UBYTE_D16_HI : MUBUF_Real_AllAddr_gfx10<0x021>;
1852 defm BUFFER_LOAD_SBYTE_D16 : MUBUF_Real_AllAddr_gfx10<0x022>;
1853 defm BUFFER_LOAD_SBYTE_D16_HI : MUBUF_Real_AllAddr_gfx10<0x023>;
1854 defm BUFFER_LOAD_SHORT_D16 : MUBUF_Real_AllAddr_gfx10<0x024>;
1855 defm BUFFER_LOAD_SHORT_D16_HI : MUBUF_Real_AllAddr_gfx10<0x025>;
1856 // FIXME-GFX10: Add following instructions:
1857 //defm BUFFER_LOAD_FORMAT_D16_HI_X : MUBUF_Real_AllAddr_gfx10<0x026>;
1858 //defm BUFFER_STORE_FORMAT_D16_HI_X : MUBUF_Real_AllAddr_gfx10<0x027>;
1859 defm BUFFER_LOAD_FORMAT_D16_X : MUBUF_Real_AllAddr_gfx10<0x080>;
1860 defm BUFFER_LOAD_FORMAT_D16_XY : MUBUF_Real_AllAddr_gfx10<0x081>;
1861 defm BUFFER_LOAD_FORMAT_D16_XYZ : MUBUF_Real_AllAddr_gfx10<0x082>;
1862 defm BUFFER_LOAD_FORMAT_D16_XYZW : MUBUF_Real_AllAddr_gfx10<0x083>;
1863 defm BUFFER_STORE_FORMAT_D16_X : MUBUF_Real_AllAddr_gfx10<0x084>;
1864 defm BUFFER_STORE_FORMAT_D16_XY : MUBUF_Real_AllAddr_gfx10<0x085>;
1865 defm BUFFER_STORE_FORMAT_D16_XYZ : MUBUF_Real_AllAddr_gfx10<0x086>;
1866 defm BUFFER_STORE_FORMAT_D16_XYZW : MUBUF_Real_AllAddr_gfx10<0x087>;
1868 def BUFFER_GL0_INV_gfx10 :
1869 MUBUF_Real_gfx10<0x071, BUFFER_GL0_INV>;
1870 def BUFFER_GL1_INV_gfx10 :
1871 MUBUF_Real_gfx10<0x072, BUFFER_GL1_INV>;
1873 //===----------------------------------------------------------------------===//
1874 // MUBUF - GFX6, GFX7, GFX10.
1875 //===----------------------------------------------------------------------===//
1877 let AssemblerPredicate = isGFX6, DecoderNamespace = "GFX6" in {
1878 multiclass MUBUF_Real_gfx6<bits<8> op> {
1879 def _gfx6 : MUBUF_Real_gfx6_gfx7<op, !cast<MUBUF_Pseudo>(NAME)>;
1881 } // End AssemblerPredicate = isGFX6, DecoderNamespace = "GFX6"
1883 let AssemblerPredicate = isGFX7Only, DecoderNamespace = "GFX7" in {
1884 multiclass MUBUF_Real_gfx7<bits<8> op> {
1885 def _gfx7 : MUBUF_Real_gfx6_gfx7<op, !cast<MUBUF_Pseudo>(NAME)>;
1887 } // End AssemblerPredicate = isGFX7Only, DecoderNamespace = "GFX7"
1889 let AssemblerPredicate = isGFX6GFX7, DecoderNamespace = "GFX6GFX7" in {
1890 multiclass MUBUF_Real_AllAddr_gfx6_gfx7<bits<8> op> {
1891 def _ADDR64_gfx6_gfx7 :
1892 MUBUF_Real_gfx6_gfx7<op, !cast<MUBUF_Pseudo>(NAME#"_ADDR64")>;
1893 def _BOTHEN_gfx6_gfx7 :
1894 MUBUF_Real_gfx6_gfx7<op, !cast<MUBUF_Pseudo>(NAME#"_BOTHEN")>;
1895 def _IDXEN_gfx6_gfx7 :
1896 MUBUF_Real_gfx6_gfx7<op, !cast<MUBUF_Pseudo>(NAME#"_IDXEN")>;
1897 def _OFFEN_gfx6_gfx7 :
1898 MUBUF_Real_gfx6_gfx7<op, !cast<MUBUF_Pseudo>(NAME#"_OFFEN")>;
1899 def _OFFSET_gfx6_gfx7 :
1900 MUBUF_Real_gfx6_gfx7<op, !cast<MUBUF_Pseudo>(NAME#"_OFFSET")>;
1902 multiclass MUBUF_Real_AllAddr_Lds_gfx6_gfx7<bits<8> op> {
1903 def _OFFSET_gfx6_gfx7 : MUBUF_Real_gfx6_gfx7<op, !cast<MUBUF_Pseudo>(NAME#"_OFFSET")>,
1904 MUBUFLdsTable<0, NAME # "_OFFSET_gfx6_gfx7">;
1905 def _ADDR64_gfx6_gfx7 : MUBUF_Real_gfx6_gfx7<op, !cast<MUBUF_Pseudo>(NAME#"_ADDR64")>,
1906 MUBUFLdsTable<0, NAME # "_ADDR64_gfx6_gfx7">;
1907 def _OFFEN_gfx6_gfx7 : MUBUF_Real_gfx6_gfx7<op, !cast<MUBUF_Pseudo>(NAME#"_OFFEN")>,
1908 MUBUFLdsTable<0, NAME # "_OFFEN_gfx6_gfx7">;
1909 def _IDXEN_gfx6_gfx7 : MUBUF_Real_gfx6_gfx7<op, !cast<MUBUF_Pseudo>(NAME#"_IDXEN")>,
1910 MUBUFLdsTable<0, NAME # "_IDXEN_gfx6_gfx7">;
1911 def _BOTHEN_gfx6_gfx7 : MUBUF_Real_gfx6_gfx7<op, !cast<MUBUF_Pseudo>(NAME#"_BOTHEN")>,
1912 MUBUFLdsTable<0, NAME # "_BOTHEN_gfx6_gfx7">;
1914 def _LDS_OFFSET_gfx6_gfx7 : MUBUF_Real_gfx6_gfx7<op, !cast<MUBUF_Pseudo>(NAME#"_LDS_OFFSET")>,
1915 MUBUFLdsTable<1, NAME # "_OFFSET_gfx6_gfx7">;
1916 def _LDS_ADDR64_gfx6_gfx7 : MUBUF_Real_gfx6_gfx7<op, !cast<MUBUF_Pseudo>(NAME#"_LDS_ADDR64")>,
1917 MUBUFLdsTable<1, NAME # "_ADDR64_gfx6_gfx7">;
1918 def _LDS_OFFEN_gfx6_gfx7 : MUBUF_Real_gfx6_gfx7<op, !cast<MUBUF_Pseudo>(NAME#"_LDS_OFFEN")>,
1919 MUBUFLdsTable<1, NAME # "_OFFEN_gfx6_gfx7">;
1920 def _LDS_IDXEN_gfx6_gfx7 : MUBUF_Real_gfx6_gfx7<op, !cast<MUBUF_Pseudo>(NAME#"_LDS_IDXEN")>,
1921 MUBUFLdsTable<1, NAME # "_IDXEN_gfx6_gfx7">;
1922 def _LDS_BOTHEN_gfx6_gfx7 : MUBUF_Real_gfx6_gfx7<op, !cast<MUBUF_Pseudo>(NAME#"_LDS_BOTHEN")>,
1923 MUBUFLdsTable<1, NAME # "_BOTHEN_gfx6_gfx7">;
1925 multiclass MUBUF_Real_Atomics_gfx6_gfx7<bits<8> op> :
1926 MUBUF_Real_AllAddr_gfx6_gfx7<op> {
1927 def _ADDR64_RTN_gfx6_gfx7 :
1928 MUBUF_Real_gfx6_gfx7<op, !cast<MUBUF_Pseudo>(NAME#"_ADDR64_RTN")>;
1929 def _BOTHEN_RTN_gfx6_gfx7 :
1930 MUBUF_Real_gfx6_gfx7<op, !cast<MUBUF_Pseudo>(NAME#"_BOTHEN_RTN")>;
1931 def _IDXEN_RTN_gfx6_gfx7 :
1932 MUBUF_Real_gfx6_gfx7<op, !cast<MUBUF_Pseudo>(NAME#"_IDXEN_RTN")>;
1933 def _OFFEN_RTN_gfx6_gfx7 :
1934 MUBUF_Real_gfx6_gfx7<op, !cast<MUBUF_Pseudo>(NAME#"_OFFEN_RTN")>;
1935 def _OFFSET_RTN_gfx6_gfx7 :
1936 MUBUF_Real_gfx6_gfx7<op, !cast<MUBUF_Pseudo>(NAME#"_OFFSET_RTN")>;
1938 } // End AssemblerPredicate = isGFX6GFX7, DecoderNamespace = "GFX6GFX7"
1940 multiclass MUBUF_Real_AllAddr_gfx6_gfx7_gfx10<bits<8> op> :
1941 MUBUF_Real_AllAddr_gfx6_gfx7<op>, MUBUF_Real_AllAddr_gfx10<op>;
1943 multiclass MUBUF_Real_AllAddr_Lds_gfx6_gfx7_gfx10<bits<8> op> :
1944 MUBUF_Real_AllAddr_Lds_gfx6_gfx7<op>, MUBUF_Real_AllAddr_Lds_gfx10<op>;
1946 multiclass MUBUF_Real_Atomics_gfx6_gfx7_gfx10<bits<8> op> :
1947 MUBUF_Real_Atomics_gfx6_gfx7<op>, MUBUF_Real_Atomics_gfx10<op>;
1949 // FIXME-GFX6: Following instructions are available only on GFX6.
1950 //defm BUFFER_ATOMIC_RSUB : MUBUF_Real_Atomics_gfx6 <0x034>;
1951 //defm BUFFER_ATOMIC_RSUB_X2 : MUBUF_Real_Atomics_gfx6 <0x054>;
1953 defm BUFFER_LOAD_FORMAT_X : MUBUF_Real_AllAddr_Lds_gfx6_gfx7_gfx10<0x000>;
1954 defm BUFFER_LOAD_FORMAT_XY : MUBUF_Real_AllAddr_gfx6_gfx7_gfx10<0x001>;
1955 defm BUFFER_LOAD_FORMAT_XYZ : MUBUF_Real_AllAddr_gfx6_gfx7_gfx10<0x002>;
1956 defm BUFFER_LOAD_FORMAT_XYZW : MUBUF_Real_AllAddr_gfx6_gfx7_gfx10<0x003>;
1957 defm BUFFER_STORE_FORMAT_X : MUBUF_Real_AllAddr_gfx6_gfx7_gfx10<0x004>;
1958 defm BUFFER_STORE_FORMAT_XY : MUBUF_Real_AllAddr_gfx6_gfx7_gfx10<0x005>;
1959 defm BUFFER_STORE_FORMAT_XYZ : MUBUF_Real_AllAddr_gfx6_gfx7_gfx10<0x006>;
1960 defm BUFFER_STORE_FORMAT_XYZW : MUBUF_Real_AllAddr_gfx6_gfx7_gfx10<0x007>;
1961 defm BUFFER_LOAD_UBYTE : MUBUF_Real_AllAddr_Lds_gfx6_gfx7_gfx10<0x008>;
1962 defm BUFFER_LOAD_SBYTE : MUBUF_Real_AllAddr_Lds_gfx6_gfx7_gfx10<0x009>;
1963 defm BUFFER_LOAD_USHORT : MUBUF_Real_AllAddr_Lds_gfx6_gfx7_gfx10<0x00a>;
1964 defm BUFFER_LOAD_SSHORT : MUBUF_Real_AllAddr_Lds_gfx6_gfx7_gfx10<0x00b>;
1965 defm BUFFER_LOAD_DWORD : MUBUF_Real_AllAddr_Lds_gfx6_gfx7_gfx10<0x00c>;
1966 defm BUFFER_LOAD_DWORDX2 : MUBUF_Real_AllAddr_gfx6_gfx7_gfx10<0x00d>;
1967 defm BUFFER_LOAD_DWORDX4 : MUBUF_Real_AllAddr_gfx6_gfx7_gfx10<0x00e>;
1968 defm BUFFER_LOAD_DWORDX3 : MUBUF_Real_AllAddr_gfx6_gfx7_gfx10<0x00f>;
1969 defm BUFFER_STORE_BYTE : MUBUF_Real_AllAddr_gfx6_gfx7_gfx10<0x018>;
1970 defm BUFFER_STORE_SHORT : MUBUF_Real_AllAddr_gfx6_gfx7_gfx10<0x01a>;
1971 defm BUFFER_STORE_DWORD : MUBUF_Real_AllAddr_gfx6_gfx7_gfx10<0x01c>;
1972 defm BUFFER_STORE_DWORDX2 : MUBUF_Real_AllAddr_gfx6_gfx7_gfx10<0x01d>;
1973 defm BUFFER_STORE_DWORDX4 : MUBUF_Real_AllAddr_gfx6_gfx7_gfx10<0x01e>;
1974 defm BUFFER_STORE_DWORDX3 : MUBUF_Real_AllAddr_gfx6_gfx7_gfx10<0x01f>;
1976 defm BUFFER_ATOMIC_SWAP : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x030>;
1977 defm BUFFER_ATOMIC_CMPSWAP : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x031>;
1978 defm BUFFER_ATOMIC_ADD : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x032>;
1979 defm BUFFER_ATOMIC_SUB : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x033>;
1980 defm BUFFER_ATOMIC_SMIN : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x035>;
1981 defm BUFFER_ATOMIC_UMIN : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x036>;
1982 defm BUFFER_ATOMIC_SMAX : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x037>;
1983 defm BUFFER_ATOMIC_UMAX : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x038>;
1984 defm BUFFER_ATOMIC_AND : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x039>;
1985 defm BUFFER_ATOMIC_OR : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x03a>;
1986 defm BUFFER_ATOMIC_XOR : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x03b>;
1987 defm BUFFER_ATOMIC_INC : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x03c>;
1988 defm BUFFER_ATOMIC_DEC : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x03d>;
1989 // FIXME-GFX6-GFX7-GFX10: Add following instructions:
1990 //defm BUFFER_ATOMIC_FCMPSWAP : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x03e>;
1991 //defm BUFFER_ATOMIC_FMIN : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x03f>;
1992 //defm BUFFER_ATOMIC_FMAX : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x040>;
1993 defm BUFFER_ATOMIC_SWAP_X2 : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x050>;
1994 defm BUFFER_ATOMIC_CMPSWAP_X2 : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x051>;
1995 defm BUFFER_ATOMIC_ADD_X2 : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x052>;
1996 defm BUFFER_ATOMIC_SUB_X2 : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x053>;
1997 defm BUFFER_ATOMIC_SMIN_X2 : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x055>;
1998 defm BUFFER_ATOMIC_UMIN_X2 : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x056>;
1999 defm BUFFER_ATOMIC_SMAX_X2 : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x057>;
2000 defm BUFFER_ATOMIC_UMAX_X2 : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x058>;
2001 defm BUFFER_ATOMIC_AND_X2 : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x059>;
2002 defm BUFFER_ATOMIC_OR_X2 : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x05a>;
2003 defm BUFFER_ATOMIC_XOR_X2 : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x05b>;
2004 defm BUFFER_ATOMIC_INC_X2 : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x05c>;
2005 defm BUFFER_ATOMIC_DEC_X2 : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x05d>;
2006 // FIXME-GFX7: Need to handle hazard for BUFFER_ATOMIC_FCMPSWAP_X2 on GFX7.
2007 // FIXME-GFX6-GFX7-GFX10: Add following instructions:
2008 //defm BUFFER_ATOMIC_FCMPSWAP_X2 : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x05e>;
2009 //defm BUFFER_ATOMIC_FMIN_X2 : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x05f>;
2010 //defm BUFFER_ATOMIC_FMAX_X2 : MUBUF_Real_Atomics_gfx6_gfx7_gfx10<0x060>;
2012 defm BUFFER_WBINVL1_SC : MUBUF_Real_gfx6<0x070>;
2013 defm BUFFER_WBINVL1_VOL : MUBUF_Real_gfx7<0x070>;
2014 def BUFFER_WBINVL1_gfx6_gfx7 : MUBUF_Real_gfx6_gfx7<0x071, BUFFER_WBINVL1>;
2016 //===----------------------------------------------------------------------===//
2017 // Base ENC_MTBUF for GFX6, GFX7, GFX10.
2018 //===----------------------------------------------------------------------===//
2020 class Base_MTBUF_Real_gfx6_gfx7_gfx10<bits<3> op, MTBUF_Pseudo ps, int ef> :
2021 MTBUF_Real<ps>, Enc64, SIMCInstr<ps.PseudoInstr, ef> {
2022 let Inst{11-0} = !if(ps.has_offset, offset, ?);
2023 let Inst{12} = ps.offen;
2024 let Inst{13} = ps.idxen;
2025 let Inst{14} = !if(ps.has_glc, glc, ps.glc_value);
2026 let Inst{18-16} = op;
2027 let Inst{31-26} = 0x3a; //encoding
2028 let Inst{39-32} = !if(ps.has_vaddr, vaddr, ?);
2029 let Inst{47-40} = !if(ps.has_vdata, vdata, ?);
2030 let Inst{52-48} = !if(ps.has_srsrc, srsrc{6-2}, ?);
2031 let Inst{54} = !if(ps.has_slc, slc, ?);
2032 let Inst{55} = !if(ps.has_tfe, tfe, ?);
2033 let Inst{63-56} = !if(ps.has_soffset, soffset, ?);
2036 //===----------------------------------------------------------------------===//
2038 //===----------------------------------------------------------------------===//
2040 class MTBUF_Real_gfx10<bits<4> op, MTBUF_Pseudo ps> :
2041 Base_MTBUF_Real_gfx6_gfx7_gfx10<op{2-0}, ps, SIEncodingFamily.GFX10> {
2042 let Inst{15} = !if(ps.has_dlc, dlc, ps.dlc_value);
2043 let Inst{25-19} = format;
2044 let Inst{53} = op{3};
2047 let AssemblerPredicate = isGFX10Plus, DecoderNamespace = "GFX10" in {
2048 multiclass MTBUF_Real_AllAddr_gfx10<bits<4> op> {
2050 MTBUF_Real_gfx10<op, !cast<MTBUF_Pseudo>(NAME#"_BOTHEN")>;
2052 MTBUF_Real_gfx10<op, !cast<MTBUF_Pseudo>(NAME#"_IDXEN")>;
2054 MTBUF_Real_gfx10<op, !cast<MTBUF_Pseudo>(NAME#"_OFFEN")>;
2056 MTBUF_Real_gfx10<op, !cast<MTBUF_Pseudo>(NAME#"_OFFSET")>;
2058 } // End AssemblerPredicate = isGFX10Plus, DecoderNamespace = "GFX10"
2060 defm TBUFFER_LOAD_FORMAT_D16_X : MTBUF_Real_AllAddr_gfx10<0x008>;
2061 defm TBUFFER_LOAD_FORMAT_D16_XY : MTBUF_Real_AllAddr_gfx10<0x009>;
2062 defm TBUFFER_LOAD_FORMAT_D16_XYZ : MTBUF_Real_AllAddr_gfx10<0x00a>;
2063 defm TBUFFER_LOAD_FORMAT_D16_XYZW : MTBUF_Real_AllAddr_gfx10<0x00b>;
2064 defm TBUFFER_STORE_FORMAT_D16_X : MTBUF_Real_AllAddr_gfx10<0x00c>;
2065 defm TBUFFER_STORE_FORMAT_D16_XY : MTBUF_Real_AllAddr_gfx10<0x00d>;
2066 defm TBUFFER_STORE_FORMAT_D16_XYZ : MTBUF_Real_AllAddr_gfx10<0x00e>;
2067 defm TBUFFER_STORE_FORMAT_D16_XYZW : MTBUF_Real_AllAddr_gfx10<0x00f>;
2069 //===----------------------------------------------------------------------===//
2070 // MTBUF - GFX6, GFX7, GFX10.
2071 //===----------------------------------------------------------------------===//
2073 class MTBUF_Real_gfx6_gfx7<bits<4> op, MTBUF_Pseudo ps> :
2074 Base_MTBUF_Real_gfx6_gfx7_gfx10<op{2-0}, ps, SIEncodingFamily.SI> {
2075 let Inst{15} = ps.addr64;
2076 let Inst{22-19} = dfmt;
2077 let Inst{25-23} = nfmt;
2080 let AssemblerPredicate = isGFX6GFX7, DecoderNamespace = "GFX6GFX7" in {
2081 multiclass MTBUF_Real_AllAddr_gfx6_gfx7<bits<4> op> {
2082 def _ADDR64_gfx6_gfx7 :
2083 MTBUF_Real_gfx6_gfx7<op, !cast<MTBUF_Pseudo>(NAME#"_ADDR64")>;
2084 def _BOTHEN_gfx6_gfx7 :
2085 MTBUF_Real_gfx6_gfx7<op, !cast<MTBUF_Pseudo>(NAME#"_BOTHEN")>;
2086 def _IDXEN_gfx6_gfx7 :
2087 MTBUF_Real_gfx6_gfx7<op, !cast<MTBUF_Pseudo>(NAME#"_IDXEN")>;
2088 def _OFFEN_gfx6_gfx7 :
2089 MTBUF_Real_gfx6_gfx7<op, !cast<MTBUF_Pseudo>(NAME#"_OFFEN")>;
2090 def _OFFSET_gfx6_gfx7 :
2091 MTBUF_Real_gfx6_gfx7<op, !cast<MTBUF_Pseudo>(NAME#"_OFFSET")>;
2093 } // End AssemblerPredicate = isGFX6GFX7, DecoderNamespace = "GFX6GFX7"
2095 multiclass MTBUF_Real_AllAddr_gfx6_gfx7_gfx10<bits<4> op> :
2096 MTBUF_Real_AllAddr_gfx6_gfx7<op>, MTBUF_Real_AllAddr_gfx10<op>;
2098 defm TBUFFER_LOAD_FORMAT_X : MTBUF_Real_AllAddr_gfx6_gfx7_gfx10<0x000>;
2099 defm TBUFFER_LOAD_FORMAT_XY : MTBUF_Real_AllAddr_gfx6_gfx7_gfx10<0x001>;
2100 defm TBUFFER_LOAD_FORMAT_XYZ : MTBUF_Real_AllAddr_gfx6_gfx7_gfx10<0x002>;
2101 defm TBUFFER_LOAD_FORMAT_XYZW : MTBUF_Real_AllAddr_gfx6_gfx7_gfx10<0x003>;
2102 defm TBUFFER_STORE_FORMAT_X : MTBUF_Real_AllAddr_gfx6_gfx7_gfx10<0x004>;
2103 defm TBUFFER_STORE_FORMAT_XY : MTBUF_Real_AllAddr_gfx6_gfx7_gfx10<0x005>;
2104 defm TBUFFER_STORE_FORMAT_XYZ : MTBUF_Real_AllAddr_gfx6_gfx7_gfx10<0x006>;
2105 defm TBUFFER_STORE_FORMAT_XYZW : MTBUF_Real_AllAddr_gfx6_gfx7_gfx10<0x007>;
2107 //===----------------------------------------------------------------------===//
2109 //===----------------------------------------------------------------------===//
2111 class MUBUF_Real_vi <bits<7> op, MUBUF_Pseudo ps> :
2114 SIMCInstr<ps.PseudoInstr, SIEncodingFamily.VI> {
2115 let AssemblerPredicate = isGFX8GFX9;
2116 let DecoderNamespace = "GFX8";
2118 let Inst{11-0} = !if(ps.has_offset, offset, ?);
2119 let Inst{12} = ps.offen;
2120 let Inst{13} = ps.idxen;
2121 let Inst{14} = !if(ps.has_glc, glc, ps.glc_value);
2122 let Inst{16} = !if(ps.lds, 1, 0);
2123 let Inst{17} = !if(ps.has_slc, slc, ?);
2124 let Inst{24-18} = op;
2125 let Inst{31-26} = 0x38; //encoding
2126 let Inst{39-32} = !if(ps.has_vaddr, vaddr, ?);
2127 let Inst{47-40} = !if(ps.has_vdata, vdata, ?);
2128 let Inst{52-48} = !if(ps.has_srsrc, srsrc{6-2}, ?);
2129 let Inst{55} = !if(ps.has_tfe, tfe, ?);
2130 let Inst{63-56} = !if(ps.has_soffset, soffset, ?);
2133 multiclass MUBUF_Real_AllAddr_vi<bits<7> op> {
2134 def _OFFSET_vi : MUBUF_Real_vi <op, !cast<MUBUF_Pseudo>(NAME#"_OFFSET")>;
2135 def _OFFEN_vi : MUBUF_Real_vi <op, !cast<MUBUF_Pseudo>(NAME#"_OFFEN")>;
2136 def _IDXEN_vi : MUBUF_Real_vi <op, !cast<MUBUF_Pseudo>(NAME#"_IDXEN")>;
2137 def _BOTHEN_vi : MUBUF_Real_vi <op, !cast<MUBUF_Pseudo>(NAME#"_BOTHEN")>;
2140 multiclass MUBUF_Real_AllAddr_Lds_vi<bits<7> op> {
2142 def _OFFSET_vi : MUBUF_Real_vi <op, !cast<MUBUF_Pseudo>(NAME#"_OFFSET")>,
2143 MUBUFLdsTable<0, NAME # "_OFFSET_vi">;
2144 def _OFFEN_vi : MUBUF_Real_vi <op, !cast<MUBUF_Pseudo>(NAME#"_OFFEN")>,
2145 MUBUFLdsTable<0, NAME # "_OFFEN_vi">;
2146 def _IDXEN_vi : MUBUF_Real_vi <op, !cast<MUBUF_Pseudo>(NAME#"_IDXEN")>,
2147 MUBUFLdsTable<0, NAME # "_IDXEN_vi">;
2148 def _BOTHEN_vi : MUBUF_Real_vi <op, !cast<MUBUF_Pseudo>(NAME#"_BOTHEN")>,
2149 MUBUFLdsTable<0, NAME # "_BOTHEN_vi">;
2151 def _LDS_OFFSET_vi : MUBUF_Real_vi <op, !cast<MUBUF_Pseudo>(NAME#"_LDS_OFFSET")>,
2152 MUBUFLdsTable<1, NAME # "_OFFSET_vi">;
2153 def _LDS_OFFEN_vi : MUBUF_Real_vi <op, !cast<MUBUF_Pseudo>(NAME#"_LDS_OFFEN")>,
2154 MUBUFLdsTable<1, NAME # "_OFFEN_vi">;
2155 def _LDS_IDXEN_vi : MUBUF_Real_vi <op, !cast<MUBUF_Pseudo>(NAME#"_LDS_IDXEN")>,
2156 MUBUFLdsTable<1, NAME # "_IDXEN_vi">;
2157 def _LDS_BOTHEN_vi : MUBUF_Real_vi <op, !cast<MUBUF_Pseudo>(NAME#"_LDS_BOTHEN")>,
2158 MUBUFLdsTable<1, NAME # "_BOTHEN_vi">;
2161 class MUBUF_Real_gfx80 <bits<7> op, MUBUF_Pseudo ps> :
2164 SIMCInstr<ps.PseudoInstr, SIEncodingFamily.GFX80> {
2165 let AssemblerPredicate=HasUnpackedD16VMem;
2166 let DecoderNamespace="GFX80_UNPACKED";
2168 let Inst{11-0} = !if(ps.has_offset, offset, ?);
2169 let Inst{12} = ps.offen;
2170 let Inst{13} = ps.idxen;
2171 let Inst{14} = !if(ps.has_glc, glc, ps.glc_value);
2172 let Inst{16} = !if(ps.lds, 1, 0);
2173 let Inst{17} = !if(ps.has_slc, slc, ?);
2174 let Inst{24-18} = op;
2175 let Inst{31-26} = 0x38; //encoding
2176 let Inst{39-32} = !if(ps.has_vaddr, vaddr, ?);
2177 let Inst{47-40} = !if(ps.has_vdata, vdata, ?);
2178 let Inst{52-48} = !if(ps.has_srsrc, srsrc{6-2}, ?);
2179 let Inst{55} = !if(ps.has_tfe, tfe, ?);
2180 let Inst{63-56} = !if(ps.has_soffset, soffset, ?);
2183 multiclass MUBUF_Real_AllAddr_gfx80<bits<7> op> {
2184 def _OFFSET_gfx80 : MUBUF_Real_gfx80 <op, !cast<MUBUF_Pseudo>(NAME#"_OFFSET")>;
2185 def _OFFEN_gfx80 : MUBUF_Real_gfx80 <op, !cast<MUBUF_Pseudo>(NAME#"_OFFEN")>;
2186 def _IDXEN_gfx80 : MUBUF_Real_gfx80 <op, !cast<MUBUF_Pseudo>(NAME#"_IDXEN")>;
2187 def _BOTHEN_gfx80 : MUBUF_Real_gfx80 <op, !cast<MUBUF_Pseudo>(NAME#"_BOTHEN")>;
2190 multiclass MUBUF_Real_Atomic_vi<bits<7> op> :
2191 MUBUF_Real_AllAddr_vi<op> {
2192 def _OFFSET_RTN_vi : MUBUF_Real_vi <op, !cast<MUBUF_Pseudo>(NAME#"_OFFSET_RTN")>;
2193 def _OFFEN_RTN_vi : MUBUF_Real_vi <op, !cast<MUBUF_Pseudo>(NAME#"_OFFEN_RTN")>;
2194 def _IDXEN_RTN_vi : MUBUF_Real_vi <op, !cast<MUBUF_Pseudo>(NAME#"_IDXEN_RTN")>;
2195 def _BOTHEN_RTN_vi : MUBUF_Real_vi <op, !cast<MUBUF_Pseudo>(NAME#"_BOTHEN_RTN")>;
2198 defm BUFFER_LOAD_FORMAT_X : MUBUF_Real_AllAddr_Lds_vi <0x00>;
2199 defm BUFFER_LOAD_FORMAT_XY : MUBUF_Real_AllAddr_vi <0x01>;
2200 defm BUFFER_LOAD_FORMAT_XYZ : MUBUF_Real_AllAddr_vi <0x02>;
2201 defm BUFFER_LOAD_FORMAT_XYZW : MUBUF_Real_AllAddr_vi <0x03>;
2202 defm BUFFER_STORE_FORMAT_X : MUBUF_Real_AllAddr_vi <0x04>;
2203 defm BUFFER_STORE_FORMAT_XY : MUBUF_Real_AllAddr_vi <0x05>;
2204 defm BUFFER_STORE_FORMAT_XYZ : MUBUF_Real_AllAddr_vi <0x06>;
2205 defm BUFFER_STORE_FORMAT_XYZW : MUBUF_Real_AllAddr_vi <0x07>;
2206 let SubtargetPredicate = HasUnpackedD16VMem in {
2207 defm BUFFER_LOAD_FORMAT_D16_X_gfx80 : MUBUF_Real_AllAddr_gfx80 <0x08>;
2208 defm BUFFER_LOAD_FORMAT_D16_XY_gfx80 : MUBUF_Real_AllAddr_gfx80 <0x09>;
2209 defm BUFFER_LOAD_FORMAT_D16_XYZ_gfx80 : MUBUF_Real_AllAddr_gfx80 <0x0a>;
2210 defm BUFFER_LOAD_FORMAT_D16_XYZW_gfx80 : MUBUF_Real_AllAddr_gfx80 <0x0b>;
2211 defm BUFFER_STORE_FORMAT_D16_X_gfx80 : MUBUF_Real_AllAddr_gfx80 <0x0c>;
2212 defm BUFFER_STORE_FORMAT_D16_XY_gfx80 : MUBUF_Real_AllAddr_gfx80 <0x0d>;
2213 defm BUFFER_STORE_FORMAT_D16_XYZ_gfx80 : MUBUF_Real_AllAddr_gfx80 <0x0e>;
2214 defm BUFFER_STORE_FORMAT_D16_XYZW_gfx80 : MUBUF_Real_AllAddr_gfx80 <0x0f>;
2215 } // End HasUnpackedD16VMem.
2216 let SubtargetPredicate = HasPackedD16VMem in {
2217 defm BUFFER_LOAD_FORMAT_D16_X : MUBUF_Real_AllAddr_vi <0x08>;
2218 defm BUFFER_LOAD_FORMAT_D16_XY : MUBUF_Real_AllAddr_vi <0x09>;
2219 defm BUFFER_LOAD_FORMAT_D16_XYZ : MUBUF_Real_AllAddr_vi <0x0a>;
2220 defm BUFFER_LOAD_FORMAT_D16_XYZW : MUBUF_Real_AllAddr_vi <0x0b>;
2221 defm BUFFER_STORE_FORMAT_D16_X : MUBUF_Real_AllAddr_vi <0x0c>;
2222 defm BUFFER_STORE_FORMAT_D16_XY : MUBUF_Real_AllAddr_vi <0x0d>;
2223 defm BUFFER_STORE_FORMAT_D16_XYZ : MUBUF_Real_AllAddr_vi <0x0e>;
2224 defm BUFFER_STORE_FORMAT_D16_XYZW : MUBUF_Real_AllAddr_vi <0x0f>;
2225 } // End HasPackedD16VMem.
2226 defm BUFFER_LOAD_UBYTE : MUBUF_Real_AllAddr_Lds_vi <0x10>;
2227 defm BUFFER_LOAD_SBYTE : MUBUF_Real_AllAddr_Lds_vi <0x11>;
2228 defm BUFFER_LOAD_USHORT : MUBUF_Real_AllAddr_Lds_vi <0x12>;
2229 defm BUFFER_LOAD_SSHORT : MUBUF_Real_AllAddr_Lds_vi <0x13>;
2230 defm BUFFER_LOAD_DWORD : MUBUF_Real_AllAddr_Lds_vi <0x14>;
2231 defm BUFFER_LOAD_DWORDX2 : MUBUF_Real_AllAddr_Lds_vi <0x15>;
2232 defm BUFFER_LOAD_DWORDX3 : MUBUF_Real_AllAddr_Lds_vi <0x16>;
2233 defm BUFFER_LOAD_DWORDX4 : MUBUF_Real_AllAddr_Lds_vi <0x17>;
2234 defm BUFFER_STORE_BYTE : MUBUF_Real_AllAddr_vi <0x18>;
2235 defm BUFFER_STORE_BYTE_D16_HI : MUBUF_Real_AllAddr_vi <0x19>;
2236 defm BUFFER_STORE_SHORT : MUBUF_Real_AllAddr_vi <0x1a>;
2237 defm BUFFER_STORE_SHORT_D16_HI : MUBUF_Real_AllAddr_vi <0x1b>;
2238 defm BUFFER_STORE_DWORD : MUBUF_Real_AllAddr_vi <0x1c>;
2239 defm BUFFER_STORE_DWORDX2 : MUBUF_Real_AllAddr_vi <0x1d>;
2240 defm BUFFER_STORE_DWORDX3 : MUBUF_Real_AllAddr_vi <0x1e>;
2241 defm BUFFER_STORE_DWORDX4 : MUBUF_Real_AllAddr_vi <0x1f>;
2243 defm BUFFER_LOAD_UBYTE_D16 : MUBUF_Real_AllAddr_vi <0x20>;
2244 defm BUFFER_LOAD_UBYTE_D16_HI : MUBUF_Real_AllAddr_vi <0x21>;
2245 defm BUFFER_LOAD_SBYTE_D16 : MUBUF_Real_AllAddr_vi <0x22>;
2246 defm BUFFER_LOAD_SBYTE_D16_HI : MUBUF_Real_AllAddr_vi <0x23>;
2247 defm BUFFER_LOAD_SHORT_D16 : MUBUF_Real_AllAddr_vi <0x24>;
2248 defm BUFFER_LOAD_SHORT_D16_HI : MUBUF_Real_AllAddr_vi <0x25>;
2250 defm BUFFER_LOAD_FORMAT_D16_HI_X : MUBUF_Real_AllAddr_vi <0x26>;
2251 defm BUFFER_STORE_FORMAT_D16_HI_X : MUBUF_Real_AllAddr_vi <0x27>;
2253 defm BUFFER_ATOMIC_SWAP : MUBUF_Real_Atomic_vi <0x40>;
2254 defm BUFFER_ATOMIC_CMPSWAP : MUBUF_Real_Atomic_vi <0x41>;
2255 defm BUFFER_ATOMIC_ADD : MUBUF_Real_Atomic_vi <0x42>;
2256 defm BUFFER_ATOMIC_SUB : MUBUF_Real_Atomic_vi <0x43>;
2257 defm BUFFER_ATOMIC_SMIN : MUBUF_Real_Atomic_vi <0x44>;
2258 defm BUFFER_ATOMIC_UMIN : MUBUF_Real_Atomic_vi <0x45>;
2259 defm BUFFER_ATOMIC_SMAX : MUBUF_Real_Atomic_vi <0x46>;
2260 defm BUFFER_ATOMIC_UMAX : MUBUF_Real_Atomic_vi <0x47>;
2261 defm BUFFER_ATOMIC_AND : MUBUF_Real_Atomic_vi <0x48>;
2262 defm BUFFER_ATOMIC_OR : MUBUF_Real_Atomic_vi <0x49>;
2263 defm BUFFER_ATOMIC_XOR : MUBUF_Real_Atomic_vi <0x4a>;
2264 defm BUFFER_ATOMIC_INC : MUBUF_Real_Atomic_vi <0x4b>;
2265 defm BUFFER_ATOMIC_DEC : MUBUF_Real_Atomic_vi <0x4c>;
2267 defm BUFFER_ATOMIC_SWAP_X2 : MUBUF_Real_Atomic_vi <0x60>;
2268 defm BUFFER_ATOMIC_CMPSWAP_X2 : MUBUF_Real_Atomic_vi <0x61>;
2269 defm BUFFER_ATOMIC_ADD_X2 : MUBUF_Real_Atomic_vi <0x62>;
2270 defm BUFFER_ATOMIC_SUB_X2 : MUBUF_Real_Atomic_vi <0x63>;
2271 defm BUFFER_ATOMIC_SMIN_X2 : MUBUF_Real_Atomic_vi <0x64>;
2272 defm BUFFER_ATOMIC_UMIN_X2 : MUBUF_Real_Atomic_vi <0x65>;
2273 defm BUFFER_ATOMIC_SMAX_X2 : MUBUF_Real_Atomic_vi <0x66>;
2274 defm BUFFER_ATOMIC_UMAX_X2 : MUBUF_Real_Atomic_vi <0x67>;
2275 defm BUFFER_ATOMIC_AND_X2 : MUBUF_Real_Atomic_vi <0x68>;
2276 defm BUFFER_ATOMIC_OR_X2 : MUBUF_Real_Atomic_vi <0x69>;
2277 defm BUFFER_ATOMIC_XOR_X2 : MUBUF_Real_Atomic_vi <0x6a>;
2278 defm BUFFER_ATOMIC_INC_X2 : MUBUF_Real_Atomic_vi <0x6b>;
2279 defm BUFFER_ATOMIC_DEC_X2 : MUBUF_Real_Atomic_vi <0x6c>;
2281 def BUFFER_STORE_LDS_DWORD_vi : MUBUF_Real_vi <0x3d, BUFFER_STORE_LDS_DWORD>;
2283 def BUFFER_WBINVL1_vi : MUBUF_Real_vi <0x3e, BUFFER_WBINVL1>;
2284 def BUFFER_WBINVL1_VOL_vi : MUBUF_Real_vi <0x3f, BUFFER_WBINVL1_VOL>;
2286 let SubtargetPredicate = HasAtomicFaddInsts in {
2288 defm BUFFER_ATOMIC_ADD_F32 : MUBUF_Real_AllAddr_vi <0x4d>;
2289 defm BUFFER_ATOMIC_PK_ADD_F16 : MUBUF_Real_AllAddr_vi <0x4e>;
2291 } // End SubtargetPredicate = HasAtomicFaddInsts
2293 class MTBUF_Real_vi <bits<4> op, MTBUF_Pseudo ps> :
2296 SIMCInstr<ps.PseudoInstr, SIEncodingFamily.VI> {
2297 let AssemblerPredicate = isGFX8GFX9;
2298 let DecoderNamespace = "GFX8";
2300 let Inst{11-0} = !if(ps.has_offset, offset, ?);
2301 let Inst{12} = ps.offen;
2302 let Inst{13} = ps.idxen;
2303 let Inst{14} = !if(ps.has_glc, glc, ps.glc_value);
2304 let Inst{18-15} = op;
2305 let Inst{22-19} = dfmt;
2306 let Inst{25-23} = nfmt;
2307 let Inst{31-26} = 0x3a; //encoding
2308 let Inst{39-32} = !if(ps.has_vaddr, vaddr, ?);
2309 let Inst{47-40} = !if(ps.has_vdata, vdata, ?);
2310 let Inst{52-48} = !if(ps.has_srsrc, srsrc{6-2}, ?);
2311 let Inst{54} = !if(ps.has_slc, slc, ?);
2312 let Inst{55} = !if(ps.has_tfe, tfe, ?);
2313 let Inst{63-56} = !if(ps.has_soffset, soffset, ?);
2316 multiclass MTBUF_Real_AllAddr_vi<bits<4> op> {
2317 def _OFFSET_vi : MTBUF_Real_vi <op, !cast<MTBUF_Pseudo>(NAME#"_OFFSET")>;
2318 def _OFFEN_vi : MTBUF_Real_vi <op, !cast<MTBUF_Pseudo>(NAME#"_OFFEN")>;
2319 def _IDXEN_vi : MTBUF_Real_vi <op, !cast<MTBUF_Pseudo>(NAME#"_IDXEN")>;
2320 def _BOTHEN_vi : MTBUF_Real_vi <op, !cast<MTBUF_Pseudo>(NAME#"_BOTHEN")>;
2323 class MTBUF_Real_gfx80 <bits<4> op, MTBUF_Pseudo ps> :
2326 SIMCInstr<ps.PseudoInstr, SIEncodingFamily.GFX80> {
2327 let AssemblerPredicate=HasUnpackedD16VMem;
2328 let DecoderNamespace="GFX80_UNPACKED";
2330 let Inst{11-0} = !if(ps.has_offset, offset, ?);
2331 let Inst{12} = ps.offen;
2332 let Inst{13} = ps.idxen;
2333 let Inst{14} = !if(ps.has_glc, glc, ps.glc_value);
2334 let Inst{18-15} = op;
2335 let Inst{22-19} = dfmt;
2336 let Inst{25-23} = nfmt;
2337 let Inst{31-26} = 0x3a; //encoding
2338 let Inst{39-32} = !if(ps.has_vaddr, vaddr, ?);
2339 let Inst{47-40} = !if(ps.has_vdata, vdata, ?);
2340 let Inst{52-48} = !if(ps.has_srsrc, srsrc{6-2}, ?);
2341 let Inst{54} = !if(ps.has_slc, slc, ?);
2342 let Inst{55} = !if(ps.has_tfe, tfe, ?);
2343 let Inst{63-56} = !if(ps.has_soffset, soffset, ?);
2346 multiclass MTBUF_Real_AllAddr_gfx80<bits<4> op> {
2347 def _OFFSET_gfx80 : MTBUF_Real_gfx80 <op, !cast<MTBUF_Pseudo>(NAME#"_OFFSET")>;
2348 def _OFFEN_gfx80 : MTBUF_Real_gfx80 <op, !cast<MTBUF_Pseudo>(NAME#"_OFFEN")>;
2349 def _IDXEN_gfx80 : MTBUF_Real_gfx80 <op, !cast<MTBUF_Pseudo>(NAME#"_IDXEN")>;
2350 def _BOTHEN_gfx80 : MTBUF_Real_gfx80 <op, !cast<MTBUF_Pseudo>(NAME#"_BOTHEN")>;
2353 defm TBUFFER_LOAD_FORMAT_X : MTBUF_Real_AllAddr_vi <0x00>;
2354 defm TBUFFER_LOAD_FORMAT_XY : MTBUF_Real_AllAddr_vi <0x01>;
2355 defm TBUFFER_LOAD_FORMAT_XYZ : MTBUF_Real_AllAddr_vi <0x02>;
2356 defm TBUFFER_LOAD_FORMAT_XYZW : MTBUF_Real_AllAddr_vi <0x03>;
2357 defm TBUFFER_STORE_FORMAT_X : MTBUF_Real_AllAddr_vi <0x04>;
2358 defm TBUFFER_STORE_FORMAT_XY : MTBUF_Real_AllAddr_vi <0x05>;
2359 defm TBUFFER_STORE_FORMAT_XYZ : MTBUF_Real_AllAddr_vi <0x06>;
2360 defm TBUFFER_STORE_FORMAT_XYZW : MTBUF_Real_AllAddr_vi <0x07>;
2361 let SubtargetPredicate = HasUnpackedD16VMem in {
2362 defm TBUFFER_LOAD_FORMAT_D16_X_gfx80 : MTBUF_Real_AllAddr_gfx80 <0x08>;
2363 defm TBUFFER_LOAD_FORMAT_D16_XY_gfx80 : MTBUF_Real_AllAddr_gfx80 <0x09>;
2364 defm TBUFFER_LOAD_FORMAT_D16_XYZ_gfx80 : MTBUF_Real_AllAddr_gfx80 <0x0a>;
2365 defm TBUFFER_LOAD_FORMAT_D16_XYZW_gfx80 : MTBUF_Real_AllAddr_gfx80 <0x0b>;
2366 defm TBUFFER_STORE_FORMAT_D16_X_gfx80 : MTBUF_Real_AllAddr_gfx80 <0x0c>;
2367 defm TBUFFER_STORE_FORMAT_D16_XY_gfx80 : MTBUF_Real_AllAddr_gfx80 <0x0d>;
2368 defm TBUFFER_STORE_FORMAT_D16_XYZ_gfx80 : MTBUF_Real_AllAddr_gfx80 <0x0e>;
2369 defm TBUFFER_STORE_FORMAT_D16_XYZW_gfx80 : MTBUF_Real_AllAddr_gfx80 <0x0f>;
2370 } // End HasUnpackedD16VMem.
2371 let SubtargetPredicate = HasPackedD16VMem in {
2372 defm TBUFFER_LOAD_FORMAT_D16_X : MTBUF_Real_AllAddr_vi <0x08>;
2373 defm TBUFFER_LOAD_FORMAT_D16_XY : MTBUF_Real_AllAddr_vi <0x09>;
2374 defm TBUFFER_LOAD_FORMAT_D16_XYZ : MTBUF_Real_AllAddr_vi <0x0a>;
2375 defm TBUFFER_LOAD_FORMAT_D16_XYZW : MTBUF_Real_AllAddr_vi <0x0b>;
2376 defm TBUFFER_STORE_FORMAT_D16_X : MTBUF_Real_AllAddr_vi <0x0c>;
2377 defm TBUFFER_STORE_FORMAT_D16_XY : MTBUF_Real_AllAddr_vi <0x0d>;
2378 defm TBUFFER_STORE_FORMAT_D16_XYZ : MTBUF_Real_AllAddr_vi <0x0e>;
2379 defm TBUFFER_STORE_FORMAT_D16_XYZW : MTBUF_Real_AllAddr_vi <0x0f>;
2380 } // End HasUnpackedD16VMem.
2382 def MUBUFInfoTable : GenericTable {
2383 let FilterClass = "MUBUF_Pseudo";
2384 let CppTypeName = "MUBUFInfo";
2385 let Fields = ["Opcode", "BaseOpcode", "elements", "has_vaddr", "has_srsrc", "has_soffset"];
2387 let PrimaryKey = ["Opcode"];
2388 let PrimaryKeyName = "getMUBUFOpcodeHelper";
2391 def getMUBUFInfoFromOpcode : SearchIndex {
2392 let Table = MUBUFInfoTable;
2393 let Key = ["Opcode"];
2396 def getMUBUFInfoFromBaseOpcodeAndElements : SearchIndex {
2397 let Table = MUBUFInfoTable;
2398 let Key = ["BaseOpcode", "elements"];