1 //===-- R600InstrFormats.td - R600 Instruction Encodings ------------------===//
3 // The LLVM Compiler Infrastructure
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
8 //===----------------------------------------------------------------------===//
10 // R600 Instruction format definitions.
12 //===----------------------------------------------------------------------===//
14 def isR600 : Predicate<"Subtarget->getGeneration() <= AMDGPUSubtarget::R700">;
16 def isR600toCayman : Predicate<
17 "Subtarget->getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS">;
19 class R600Pat<dag pattern, dag result> : AMDGPUPat<pattern, result> {
20 let SubtargetPredicate = isR600toCayman;
23 class InstR600 <dag outs, dag ins, string asm, list<dag> pattern,
24 InstrItinClass itin = NoItinerary>
25 : AMDGPUInst <outs, ins, asm, pattern>, PredicateControl {
31 bits<2> FlagOperandIdx = 0;
36 bit HasNativeOperands = 0;
43 let SubtargetPredicate = isR600toCayman;
44 let Namespace = "R600";
45 let OutOperandList = outs;
46 let InOperandList = ins;
48 let Pattern = pattern;
51 // No AsmMatcher support.
52 let isCodeGenOnly = 1;
54 let TSFlags{4} = Trig;
57 // Vector instructions are instructions that must fill all slots in an
59 let TSFlags{6} = isVector;
60 let TSFlags{8-7} = FlagOperandIdx;
61 let TSFlags{9} = HasNativeOperands;
62 let TSFlags{10} = Op1;
63 let TSFlags{11} = Op2;
64 let TSFlags{12} = VTXInst;
65 let TSFlags{13} = TEXInst;
66 let TSFlags{14} = ALUInst;
67 let TSFlags{15} = LDS_1A;
68 let TSFlags{16} = LDS_1A1D;
69 let TSFlags{17} = IsExport;
70 let TSFlags{18} = LDS_1A2D;
73 //===----------------------------------------------------------------------===//
75 //===----------------------------------------------------------------------===//
77 class R600_ALU_LDS_Word0 {
84 bits<3> index_mode = 0;
88 bits<9> src0_sel = src0{8-0};
89 bits<2> src0_chan = src0{10-9};
90 bits<9> src1_sel = src1{8-0};
91 bits<2> src1_chan = src1{10-9};
93 let Word0{8-0} = src0_sel;
94 let Word0{9} = src0_rel;
95 let Word0{11-10} = src0_chan;
96 let Word0{21-13} = src1_sel;
97 let Word0{22} = src1_rel;
98 let Word0{24-23} = src1_chan;
99 let Word0{28-26} = index_mode;
100 let Word0{30-29} = pred_sel;
101 let Word0{31} = last;
104 class R600ALU_Word0 : R600_ALU_LDS_Word0 {
109 let Word0{12} = src0_neg;
110 let Word0{25} = src1_neg;
113 class R600ALU_Word1 {
114 field bits<32> Word1;
117 bits<3> bank_swizzle;
121 bits<7> dst_sel = dst{6-0};
122 bits<2> dst_chan = dst{10-9};
124 let Word1{20-18} = bank_swizzle;
125 let Word1{27-21} = dst_sel;
126 let Word1{28} = dst_rel;
127 let Word1{30-29} = dst_chan;
128 let Word1{31} = clamp;
131 class R600ALU_Word1_OP2 <bits<11> alu_inst> : R600ALU_Word1{
135 bits<1> update_exec_mask;
140 let Word1{0} = src0_abs;
141 let Word1{1} = src1_abs;
142 let Word1{2} = update_exec_mask;
143 let Word1{3} = update_pred;
144 let Word1{4} = write;
145 let Word1{6-5} = omod;
146 let Word1{17-7} = alu_inst;
149 class R600ALU_Word1_OP3 <bits<5> alu_inst> : R600ALU_Word1{
155 bits<9> src2_sel = src2{8-0};
156 bits<2> src2_chan = src2{10-9};
158 let Word1{8-0} = src2_sel;
159 let Word1{9} = src2_rel;
160 let Word1{11-10} = src2_chan;
161 let Word1{12} = src2_neg;
162 let Word1{17-13} = alu_inst;
165 class R600LDS_Word1 {
166 field bits<32> Word1;
169 bits<9> src2_sel = src2{8-0};
170 bits<2> src2_chan = src2{10-9};
172 // offset specifies the stride offset to the second set of data to be read
173 // from. This is a dword offset.
174 bits<5> alu_inst = 17; // OP3_INST_LDS_IDX_OP
175 bits<3> bank_swizzle;
177 bits<2> dst_chan = 0;
179 let Word1{8-0} = src2_sel;
180 let Word1{9} = src2_rel;
181 let Word1{11-10} = src2_chan;
182 let Word1{17-13} = alu_inst;
183 let Word1{20-18} = bank_swizzle;
184 let Word1{26-21} = lds_op;
185 let Word1{30-29} = dst_chan;
190 XXX: R600 subtarget uses a slightly different encoding than the other
191 subtargets. We currently handle this in R600MCCodeEmitter, but we may
192 want to use these instruction classes in the future.
194 class R600ALU_Word1_OP2_r600 : R600ALU_Word1_OP2 {
199 let Inst{37} = fog_merge;
200 let Inst{39-38} = omod;
201 let Inst{49-40} = alu_inst;
204 class R600ALU_Word1_OP2_r700 : R600ALU_Word1_OP2 {
208 let Inst{38-37} = omod;
209 let Inst{49-39} = alu_inst;
213 //===----------------------------------------------------------------------===//
214 // Vertex Fetch instructions
215 //===----------------------------------------------------------------------===//
218 field bits<32> Word0;
222 bits<1> FETCH_WHOLE_QUAD;
227 let Word0{4-0} = VC_INST;
228 let Word0{6-5} = FETCH_TYPE;
229 let Word0{7} = FETCH_WHOLE_QUAD;
230 let Word0{15-8} = buffer_id;
231 let Word0{22-16} = src_gpr;
232 let Word0{23} = SRC_REL;
233 let Word0{25-24} = SRC_SEL_X;
236 class VTX_WORD0_eg : VTX_WORD0 {
238 bits<6> MEGA_FETCH_COUNT;
240 let Word0{31-26} = MEGA_FETCH_COUNT;
243 class VTX_WORD0_cm : VTX_WORD0 {
246 bits<2> STRUCTURED_READ;
248 bits<1> COALESCED_READ;
250 let Word0{27-26} = SRC_SEL_Y;
251 let Word0{29-28} = STRUCTURED_READ;
252 let Word0{30} = LDS_REQ;
253 let Word0{31} = COALESCED_READ;
256 class VTX_WORD1_GPR {
257 field bits<32> Word1;
264 bits<1> USE_CONST_FIELDS;
266 bits<2> NUM_FORMAT_ALL;
267 bits<1> FORMAT_COMP_ALL;
268 bits<1> SRF_MODE_ALL;
270 let Word1{6-0} = dst_gpr;
271 let Word1{7} = DST_REL;
272 let Word1{8} = 0; // Reserved
273 let Word1{11-9} = DST_SEL_X;
274 let Word1{14-12} = DST_SEL_Y;
275 let Word1{17-15} = DST_SEL_Z;
276 let Word1{20-18} = DST_SEL_W;
277 let Word1{21} = USE_CONST_FIELDS;
278 let Word1{27-22} = DATA_FORMAT;
279 let Word1{29-28} = NUM_FORMAT_ALL;
280 let Word1{30} = FORMAT_COMP_ALL;
281 let Word1{31} = SRF_MODE_ALL;
284 //===----------------------------------------------------------------------===//
285 // Texture fetch instructions
286 //===----------------------------------------------------------------------===//
289 field bits<32> Word0;
293 bits<1> FETCH_WHOLE_QUAD;
298 bits<2> RESOURCE_INDEX_MODE;
299 bits<2> SAMPLER_INDEX_MODE;
301 let Word0{4-0} = TEX_INST;
302 let Word0{6-5} = INST_MOD;
303 let Word0{7} = FETCH_WHOLE_QUAD;
304 let Word0{15-8} = RESOURCE_ID;
305 let Word0{22-16} = SRC_GPR;
306 let Word0{23} = SRC_REL;
307 let Word0{24} = ALT_CONST;
308 let Word0{26-25} = RESOURCE_INDEX_MODE;
309 let Word0{28-27} = SAMPLER_INDEX_MODE;
313 field bits<32> Word1;
322 bits<1> COORD_TYPE_X;
323 bits<1> COORD_TYPE_Y;
324 bits<1> COORD_TYPE_Z;
325 bits<1> COORD_TYPE_W;
327 let Word1{6-0} = DST_GPR;
328 let Word1{7} = DST_REL;
329 let Word1{11-9} = DST_SEL_X;
330 let Word1{14-12} = DST_SEL_Y;
331 let Word1{17-15} = DST_SEL_Z;
332 let Word1{20-18} = DST_SEL_W;
333 let Word1{27-21} = LOD_BIAS;
334 let Word1{28} = COORD_TYPE_X;
335 let Word1{29} = COORD_TYPE_Y;
336 let Word1{30} = COORD_TYPE_Z;
337 let Word1{31} = COORD_TYPE_W;
341 field bits<32> Word2;
352 let Word2{4-0} = OFFSET_X;
353 let Word2{9-5} = OFFSET_Y;
354 let Word2{14-10} = OFFSET_Z;
355 let Word2{19-15} = SAMPLER_ID;
356 let Word2{22-20} = SRC_SEL_X;
357 let Word2{25-23} = SRC_SEL_Y;
358 let Word2{28-26} = SRC_SEL_Z;
359 let Word2{31-29} = SRC_SEL_W;
362 //===----------------------------------------------------------------------===//
363 // Control Flow Instructions
364 //===----------------------------------------------------------------------===//
366 class CF_WORD1_R600 {
367 field bits<32> Word1;
375 bits<1> END_OF_PROGRAM;
376 bits<1> VALID_PIXEL_MODE;
378 bits<1> WHOLE_QUAD_MODE;
381 let Word1{2-0} = POP_COUNT;
382 let Word1{7-3} = CF_CONST;
383 let Word1{9-8} = COND;
384 let Word1{12-10} = COUNT;
385 let Word1{18-13} = CALL_COUNT;
386 let Word1{19} = COUNT_3;
387 let Word1{21} = END_OF_PROGRAM;
388 let Word1{22} = VALID_PIXEL_MODE;
389 let Word1{29-23} = CF_INST;
390 let Word1{30} = WHOLE_QUAD_MODE;
391 let Word1{31} = BARRIER;
395 field bits<32> Word0;
398 bits<3> JUMPTABLE_SEL;
400 let Word0{23-0} = ADDR;
401 let Word0{26-24} = JUMPTABLE_SEL;
405 field bits<32> Word1;
411 bits<1> VALID_PIXEL_MODE;
412 bits<1> END_OF_PROGRAM;
416 let Word1{2-0} = POP_COUNT;
417 let Word1{7-3} = CF_CONST;
418 let Word1{9-8} = COND;
419 let Word1{15-10} = COUNT;
420 let Word1{20} = VALID_PIXEL_MODE;
421 let Word1{21} = END_OF_PROGRAM;
422 let Word1{29-22} = CF_INST;
423 let Word1{31} = BARRIER;
427 field bits<32> Word0;
430 bits<4> KCACHE_BANK0;
431 bits<4> KCACHE_BANK1;
432 bits<2> KCACHE_MODE0;
434 let Word0{21-0} = ADDR;
435 let Word0{25-22} = KCACHE_BANK0;
436 let Word0{29-26} = KCACHE_BANK1;
437 let Word0{31-30} = KCACHE_MODE0;
441 field bits<32> Word1;
443 bits<2> KCACHE_MODE1;
444 bits<8> KCACHE_ADDR0;
445 bits<8> KCACHE_ADDR1;
449 bits<1> WHOLE_QUAD_MODE;
452 let Word1{1-0} = KCACHE_MODE1;
453 let Word1{9-2} = KCACHE_ADDR0;
454 let Word1{17-10} = KCACHE_ADDR1;
455 let Word1{24-18} = COUNT;
456 let Word1{25} = ALT_CONST;
457 let Word1{29-26} = CF_INST;
458 let Word1{30} = WHOLE_QUAD_MODE;
459 let Word1{31} = BARRIER;
462 class CF_ALLOC_EXPORT_WORD0_RAT {
463 field bits<32> Word0;
474 let Word0{3-0} = rat_id;
475 let Word0{9-4} = rat_inst;
476 let Word0{10} = 0; // Reserved
477 let Word0{12-11} = rim;
478 let Word0{14-13} = type;
479 let Word0{21-15} = rw_gpr;
480 let Word0{22} = rw_rel;
481 let Word0{29-23} = index_gpr;
482 let Word0{31-30} = elem_size;
485 class CF_ALLOC_EXPORT_WORD1_BUF {
486 field bits<32> Word1;
497 let Word1{11-0} = array_size;
498 let Word1{15-12} = comp_mask;
499 let Word1{19-16} = burst_count;
502 let Word1{29-22} = cf_inst;
503 let Word1{30} = mark;
504 let Word1{31} = barrier;