2 * Copyright 2014 Advanced Micro Devices, Inc.
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20 * OTHER DEALINGS IN THE SOFTWARE.
26 #define GFX9_NUM_GFX_RINGS 1
27 #define GFX9_NUM_COMPUTE_RINGS 8
32 #define PACKET_TYPE0 0
33 #define PACKET_TYPE1 1
34 #define PACKET_TYPE2 2
35 #define PACKET_TYPE3 3
37 #define CP_PACKET_GET_TYPE(h) (((h) >> 30) & 3)
38 #define CP_PACKET_GET_COUNT(h) (((h) >> 16) & 0x3FFF)
39 #define CP_PACKET0_GET_REG(h) ((h) & 0xFFFF)
40 #define CP_PACKET3_GET_OPCODE(h) (((h) >> 8) & 0xFF)
41 #define PACKET0(reg, n) ((PACKET_TYPE0 << 30) | \
44 #define CP_PACKET2 0x80000000
45 #define PACKET2_PAD_SHIFT 0
46 #define PACKET2_PAD_MASK (0x3fffffff << 0)
48 #define PACKET2(v) (CP_PACKET2 | REG_SET(PACKET2_PAD, (v)))
50 #define PACKET3(op, n) ((PACKET_TYPE3 << 30) | \
51 (((op) & 0xFF) << 8) | \
54 #define PACKET3_COMPUTE(op, n) (PACKET3(op, n) | 1 << 1)
56 #define PACKETJ_CONDITION_CHECK0 0
57 #define PACKETJ_CONDITION_CHECK1 1
58 #define PACKETJ_CONDITION_CHECK2 2
59 #define PACKETJ_CONDITION_CHECK3 3
60 #define PACKETJ_CONDITION_CHECK4 4
61 #define PACKETJ_CONDITION_CHECK5 5
62 #define PACKETJ_CONDITION_CHECK6 6
63 #define PACKETJ_CONDITION_CHECK7 7
65 #define PACKETJ_TYPE0 0
66 #define PACKETJ_TYPE1 1
67 #define PACKETJ_TYPE2 2
68 #define PACKETJ_TYPE3 3
69 #define PACKETJ_TYPE4 4
70 #define PACKETJ_TYPE5 5
71 #define PACKETJ_TYPE6 6
72 #define PACKETJ_TYPE7 7
74 #define PACKETJ(reg, r, cond, type) ((reg & 0x3FFFF) | \
75 ((r & 0x3F) << 18) | \
76 ((cond & 0xF) << 24) | \
80 #define PACKET3_NOP 0x10
81 #define PACKET3_SET_BASE 0x11
82 #define PACKET3_BASE_INDEX(x) ((x) << 0)
83 #define CE_PARTITION_BASE 3
84 #define PACKET3_CLEAR_STATE 0x12
85 #define PACKET3_INDEX_BUFFER_SIZE 0x13
86 #define PACKET3_DISPATCH_DIRECT 0x15
87 #define PACKET3_DISPATCH_INDIRECT 0x16
88 #define PACKET3_ATOMIC_GDS 0x1D
89 #define PACKET3_ATOMIC_MEM 0x1E
90 #define PACKET3_OCCLUSION_QUERY 0x1F
91 #define PACKET3_SET_PREDICATION 0x20
92 #define PACKET3_REG_RMW 0x21
93 #define PACKET3_COND_EXEC 0x22
94 #define PACKET3_PRED_EXEC 0x23
95 #define PACKET3_DRAW_INDIRECT 0x24
96 #define PACKET3_DRAW_INDEX_INDIRECT 0x25
97 #define PACKET3_INDEX_BASE 0x26
98 #define PACKET3_DRAW_INDEX_2 0x27
99 #define PACKET3_CONTEXT_CONTROL 0x28
100 #define PACKET3_INDEX_TYPE 0x2A
101 #define PACKET3_DRAW_INDIRECT_MULTI 0x2C
102 #define PACKET3_DRAW_INDEX_AUTO 0x2D
103 #define PACKET3_NUM_INSTANCES 0x2F
104 #define PACKET3_DRAW_INDEX_MULTI_AUTO 0x30
105 #define PACKET3_INDIRECT_BUFFER_CONST 0x33
106 #define PACKET3_STRMOUT_BUFFER_UPDATE 0x34
107 #define PACKET3_DRAW_INDEX_OFFSET_2 0x35
108 #define PACKET3_DRAW_PREAMBLE 0x36
109 #define PACKET3_WRITE_DATA 0x37
110 #define WRITE_DATA_DST_SEL(x) ((x) << 8)
112 * 1 - memory (sync - via GRBM)
116 * 5 - memory (async - direct)
118 #define WR_ONE_ADDR (1 << 16)
119 #define WR_CONFIRM (1 << 20)
120 #define WRITE_DATA_CACHE_POLICY(x) ((x) << 25)
124 #define WRITE_DATA_ENGINE_SEL(x) ((x) << 30)
129 #define PACKET3_DRAW_INDEX_INDIRECT_MULTI 0x38
130 #define PACKET3_MEM_SEMAPHORE 0x39
131 # define PACKET3_SEM_USE_MAILBOX (0x1 << 16)
132 # define PACKET3_SEM_SEL_SIGNAL_TYPE (0x1 << 20) /* 0 = increment, 1 = write 1 */
133 # define PACKET3_SEM_SEL_SIGNAL (0x6 << 29)
134 # define PACKET3_SEM_SEL_WAIT (0x7 << 29)
135 #define PACKET3_WAIT_REG_MEM 0x3C
136 #define WAIT_REG_MEM_FUNCTION(x) ((x) << 0)
145 #define WAIT_REG_MEM_MEM_SPACE(x) ((x) << 4)
149 #define WAIT_REG_MEM_OPERATION(x) ((x) << 6)
153 #define WAIT_REG_MEM_ENGINE(x) ((x) << 8)
157 #define PACKET3_INDIRECT_BUFFER 0x3F
158 #define INDIRECT_BUFFER_VALID (1 << 23)
159 #define INDIRECT_BUFFER_CACHE_POLICY(x) ((x) << 28)
164 #define INDIRECT_BUFFER_PRE_ENB(x) ((x) << 21)
165 #define PACKET3_COPY_DATA 0x40
166 #define PACKET3_PFP_SYNC_ME 0x42
167 #define PACKET3_COND_WRITE 0x45
168 #define PACKET3_EVENT_WRITE 0x46
169 #define EVENT_TYPE(x) ((x) << 0)
170 #define EVENT_INDEX(x) ((x) << 8)
171 /* 0 - any non-TS event
172 * 1 - ZPASS_DONE, PIXEL_PIPE_STAT_*
173 * 2 - SAMPLE_PIPELINESTAT
174 * 3 - SAMPLE_STREAMOUTSTAT*
175 * 4 - *S_PARTIAL_FLUSH
177 #define PACKET3_RELEASE_MEM 0x49
178 #define EVENT_TYPE(x) ((x) << 0)
179 #define EVENT_INDEX(x) ((x) << 8)
180 #define EOP_TCL1_VOL_ACTION_EN (1 << 12)
181 #define EOP_TC_VOL_ACTION_EN (1 << 13) /* L2 */
182 #define EOP_TC_WB_ACTION_EN (1 << 15) /* L2 */
183 #define EOP_TCL1_ACTION_EN (1 << 16)
184 #define EOP_TC_ACTION_EN (1 << 17) /* L2 */
185 #define EOP_TC_NC_ACTION_EN (1 << 19)
186 #define EOP_TC_MD_ACTION_EN (1 << 21) /* L2 metadata */
188 #define DATA_SEL(x) ((x) << 29)
190 * 1 - send low 32bit data
191 * 2 - send 64bit data
192 * 3 - send 64bit GPU counter value
193 * 4 - send 64bit sys counter value
195 #define INT_SEL(x) ((x) << 24)
197 * 1 - interrupt only (DATA_SEL = 0)
198 * 2 - interrupt when data write is confirmed
200 #define DST_SEL(x) ((x) << 16)
207 #define PACKET3_PREAMBLE_CNTL 0x4A
208 # define PACKET3_PREAMBLE_BEGIN_CLEAR_STATE (2 << 28)
209 # define PACKET3_PREAMBLE_END_CLEAR_STATE (3 << 28)
210 #define PACKET3_DMA_DATA 0x50
213 * 3. SRC_ADDR_LO or DATA [31:0]
214 * 4. SRC_ADDR_HI [31:0]
215 * 5. DST_ADDR_LO [31:0]
216 * 6. DST_ADDR_HI [7:0]
217 * 7. COMMAND [30:21] | BYTE_COUNT [20:0]
220 # define PACKET3_DMA_DATA_ENGINE(x) ((x) << 0)
224 # define PACKET3_DMA_DATA_SRC_CACHE_POLICY(x) ((x) << 13)
228 # define PACKET3_DMA_DATA_DST_SEL(x) ((x) << 20)
229 /* 0 - DST_ADDR using DAS
231 * 3 - DST_ADDR using L2
233 # define PACKET3_DMA_DATA_DST_CACHE_POLICY(x) ((x) << 25)
237 # define PACKET3_DMA_DATA_SRC_SEL(x) ((x) << 29)
238 /* 0 - SRC_ADDR using SAS
241 * 3 - SRC_ADDR using L2
243 # define PACKET3_DMA_DATA_CP_SYNC (1 << 31)
245 # define PACKET3_DMA_DATA_CMD_SAS (1 << 26)
249 # define PACKET3_DMA_DATA_CMD_DAS (1 << 27)
253 # define PACKET3_DMA_DATA_CMD_SAIC (1 << 28)
254 # define PACKET3_DMA_DATA_CMD_DAIC (1 << 29)
255 # define PACKET3_DMA_DATA_CMD_RAW_WAIT (1 << 30)
256 #define PACKET3_AQUIRE_MEM 0x58
257 #define PACKET3_REWIND 0x59
258 #define PACKET3_LOAD_UCONFIG_REG 0x5E
259 #define PACKET3_LOAD_SH_REG 0x5F
260 #define PACKET3_LOAD_CONFIG_REG 0x60
261 #define PACKET3_LOAD_CONTEXT_REG 0x61
262 #define PACKET3_SET_CONFIG_REG 0x68
263 #define PACKET3_SET_CONFIG_REG_START 0x00002000
264 #define PACKET3_SET_CONFIG_REG_END 0x00002c00
265 #define PACKET3_SET_CONTEXT_REG 0x69
266 #define PACKET3_SET_CONTEXT_REG_START 0x0000a000
267 #define PACKET3_SET_CONTEXT_REG_END 0x0000a400
268 #define PACKET3_SET_CONTEXT_REG_INDIRECT 0x73
269 #define PACKET3_SET_SH_REG 0x76
270 #define PACKET3_SET_SH_REG_START 0x00002c00
271 #define PACKET3_SET_SH_REG_END 0x00003000
272 #define PACKET3_SET_SH_REG_OFFSET 0x77
273 #define PACKET3_SET_QUEUE_REG 0x78
274 #define PACKET3_SET_UCONFIG_REG 0x79
275 #define PACKET3_SET_UCONFIG_REG_START 0x0000c000
276 #define PACKET3_SET_UCONFIG_REG_END 0x0000c400
277 #define PACKET3_SET_UCONFIG_REG_INDEX_TYPE (2 << 28)
278 #define PACKET3_SCRATCH_RAM_WRITE 0x7D
279 #define PACKET3_SCRATCH_RAM_READ 0x7E
280 #define PACKET3_LOAD_CONST_RAM 0x80
281 #define PACKET3_WRITE_CONST_RAM 0x81
282 #define PACKET3_DUMP_CONST_RAM 0x83
283 #define PACKET3_INCREMENT_CE_COUNTER 0x84
284 #define PACKET3_INCREMENT_DE_COUNTER 0x85
285 #define PACKET3_WAIT_ON_CE_COUNTER 0x86
286 #define PACKET3_WAIT_ON_DE_COUNTER_DIFF 0x88
287 #define PACKET3_SWITCH_BUFFER 0x8B
288 #define PACKET3_FRAME_CONTROL 0x90
289 # define FRAME_CMD(x) ((x) << 28)
295 #define PACKET3_INVALIDATE_TLBS 0x98
296 # define PACKET3_INVALIDATE_TLBS_DST_SEL(x) ((x) << 0)
297 # define PACKET3_INVALIDATE_TLBS_ALL_HUB(x) ((x) << 4)
298 # define PACKET3_INVALIDATE_TLBS_PASID(x) ((x) << 5)
299 # define PACKET3_INVALIDATE_TLBS_FLUSH_TYPE(x) ((x) << 29)
300 #define PACKET3_SET_RESOURCES 0xA0
303 * 3. QUEUE_MASK_LO [31:0]
304 * 4. QUEUE_MASK_HI [31:0]
305 * 5. GWS_MASK_LO [31:0]
306 * 6. GWS_MASK_HI [31:0]
308 * 8. GDS_HEAP_SIZE [16:11] | GDS_HEAP_BASE [5:0]
310 # define PACKET3_SET_RESOURCES_VMID_MASK(x) ((x) << 0)
311 # define PACKET3_SET_RESOURCES_UNMAP_LATENTY(x) ((x) << 16)
312 # define PACKET3_SET_RESOURCES_QUEUE_TYPE(x) ((x) << 29)
313 #define PACKET3_MAP_QUEUES 0xA2
317 * 4. MQD_ADDR_LO [31:0]
318 * 5. MQD_ADDR_HI [31:0]
319 * 6. WPTR_ADDR_LO [31:0]
320 * 7. WPTR_ADDR_HI [31:0]
323 # define PACKET3_MAP_QUEUES_QUEUE_SEL(x) ((x) << 4)
324 # define PACKET3_MAP_QUEUES_VMID(x) ((x) << 8)
325 # define PACKET3_MAP_QUEUES_QUEUE(x) ((x) << 13)
326 # define PACKET3_MAP_QUEUES_PIPE(x) ((x) << 16)
327 # define PACKET3_MAP_QUEUES_ME(x) ((x) << 18)
328 # define PACKET3_MAP_QUEUES_QUEUE_TYPE(x) ((x) << 21)
329 # define PACKET3_MAP_QUEUES_ALLOC_FORMAT(x) ((x) << 24)
330 # define PACKET3_MAP_QUEUES_ENGINE_SEL(x) ((x) << 26)
331 # define PACKET3_MAP_QUEUES_NUM_QUEUES(x) ((x) << 29)
333 # define PACKET3_MAP_QUEUES_CHECK_DISABLE(x) ((x) << 1)
334 # define PACKET3_MAP_QUEUES_DOORBELL_OFFSET(x) ((x) << 2)
335 #define PACKET3_UNMAP_QUEUES 0xA3
344 # define PACKET3_UNMAP_QUEUES_ACTION(x) ((x) << 0)
345 /* 0 - PREEMPT_QUEUES
347 * 2 - DISABLE_PROCESS_QUEUES
348 * 3 - PREEMPT_QUEUES_NO_UNMAP
350 # define PACKET3_UNMAP_QUEUES_QUEUE_SEL(x) ((x) << 4)
351 # define PACKET3_UNMAP_QUEUES_ENGINE_SEL(x) ((x) << 26)
352 # define PACKET3_UNMAP_QUEUES_NUM_QUEUES(x) ((x) << 29)
354 # define PACKET3_UNMAP_QUEUES_PASID(x) ((x) << 0)
356 # define PACKET3_UNMAP_QUEUES_DOORBELL_OFFSET0(x) ((x) << 2)
358 # define PACKET3_UNMAP_QUEUES_DOORBELL_OFFSET1(x) ((x) << 2)
360 # define PACKET3_UNMAP_QUEUES_RB_WPTR(x) ((x) << 0)
362 # define PACKET3_UNMAP_QUEUES_DOORBELL_OFFSET2(x) ((x) << 2)
364 # define PACKET3_UNMAP_QUEUES_DOORBELL_OFFSET3(x) ((x) << 2)
365 #define PACKET3_QUERY_STATUS 0xA4
375 # define PACKET3_QUERY_STATUS_CONTEXT_ID(x) ((x) << 0)
376 # define PACKET3_QUERY_STATUS_INTERRUPT_SEL(x) ((x) << 28)
377 # define PACKET3_QUERY_STATUS_COMMAND(x) ((x) << 30)
379 # define PACKET3_QUERY_STATUS_PASID(x) ((x) << 0)
381 # define PACKET3_QUERY_STATUS_DOORBELL_OFFSET(x) ((x) << 2)
382 # define PACKET3_QUERY_STATUS_ENG_SEL(x) ((x) << 25)
385 #define VCE_CMD_NO_OP 0x00000000
386 #define VCE_CMD_END 0x00000001
387 #define VCE_CMD_IB 0x00000002
388 #define VCE_CMD_FENCE 0x00000003
389 #define VCE_CMD_TRAP 0x00000004
390 #define VCE_CMD_IB_AUTO 0x00000005
391 #define VCE_CMD_SEMAPHORE 0x00000006
393 #define VCE_CMD_IB_VM 0x00000102
394 #define VCE_CMD_WAIT_GE 0x00000106
395 #define VCE_CMD_UPDATE_PTB 0x00000107
396 #define VCE_CMD_FLUSH_TLB 0x00000108
397 #define VCE_CMD_REG_WRITE 0x00000109
398 #define VCE_CMD_REG_WAIT 0x0000010a
400 #define HEVC_ENC_CMD_NO_OP 0x00000000
401 #define HEVC_ENC_CMD_END 0x00000001
402 #define HEVC_ENC_CMD_FENCE 0x00000003
403 #define HEVC_ENC_CMD_TRAP 0x00000004
404 #define HEVC_ENC_CMD_IB_VM 0x00000102
405 #define HEVC_ENC_CMD_REG_WRITE 0x00000109
406 #define HEVC_ENC_CMD_REG_WAIT 0x0000010a