2 * Copyright 2013 Advanced Micro Devices, Inc.
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20 * OTHER DEALINGS IN THE SOFTWARE.
22 * Authors: Christian König <christian.koenig@amd.com>
25 #include <linux/firmware.h>
28 #include "radeon_asic.h"
32 * uvd_v1_0_get_rptr - get read pointer
34 * @rdev: radeon_device pointer
35 * @ring: radeon_ring pointer
37 * Returns the current hardware read pointer
39 uint32_t uvd_v1_0_get_rptr(struct radeon_device
*rdev
,
40 struct radeon_ring
*ring
)
42 return RREG32(UVD_RBC_RB_RPTR
);
46 * uvd_v1_0_get_wptr - get write pointer
48 * @rdev: radeon_device pointer
49 * @ring: radeon_ring pointer
51 * Returns the current hardware write pointer
53 uint32_t uvd_v1_0_get_wptr(struct radeon_device
*rdev
,
54 struct radeon_ring
*ring
)
56 return RREG32(UVD_RBC_RB_WPTR
);
60 * uvd_v1_0_set_wptr - set write pointer
62 * @rdev: radeon_device pointer
63 * @ring: radeon_ring pointer
65 * Commits the write pointer to the hardware
67 void uvd_v1_0_set_wptr(struct radeon_device
*rdev
,
68 struct radeon_ring
*ring
)
70 WREG32(UVD_RBC_RB_WPTR
, ring
->wptr
);
74 * uvd_v1_0_fence_emit - emit an fence & trap command
76 * @rdev: radeon_device pointer
77 * @fence: fence to emit
79 * Write a fence and a trap command to the ring.
81 void uvd_v1_0_fence_emit(struct radeon_device
*rdev
,
82 struct radeon_fence
*fence
)
84 struct radeon_ring
*ring
= &rdev
->ring
[fence
->ring
];
85 uint64_t addr
= rdev
->fence_drv
[fence
->ring
].gpu_addr
;
87 radeon_ring_write(ring
, PACKET0(UVD_GPCOM_VCPU_DATA0
, 0));
88 radeon_ring_write(ring
, addr
& 0xffffffff);
89 radeon_ring_write(ring
, PACKET0(UVD_GPCOM_VCPU_DATA1
, 0));
90 radeon_ring_write(ring
, fence
->seq
);
91 radeon_ring_write(ring
, PACKET0(UVD_GPCOM_VCPU_CMD
, 0));
92 radeon_ring_write(ring
, 0);
94 radeon_ring_write(ring
, PACKET0(UVD_GPCOM_VCPU_DATA0
, 0));
95 radeon_ring_write(ring
, 0);
96 radeon_ring_write(ring
, PACKET0(UVD_GPCOM_VCPU_DATA1
, 0));
97 radeon_ring_write(ring
, 0);
98 radeon_ring_write(ring
, PACKET0(UVD_GPCOM_VCPU_CMD
, 0));
99 radeon_ring_write(ring
, 2);
104 * uvd_v1_0_resume - memory controller programming
106 * @rdev: radeon_device pointer
108 * Let the UVD memory controller know it's offsets
110 int uvd_v1_0_resume(struct radeon_device
*rdev
)
116 r
= radeon_uvd_resume(rdev
);
120 /* program the VCPU memory controller bits 0-27 */
121 addr
= (rdev
->uvd
.gpu_addr
>> 3) + 16;
122 size
= RADEON_GPU_PAGE_ALIGN(rdev
->uvd_fw
->size
) >> 3;
123 WREG32(UVD_VCPU_CACHE_OFFSET0
, addr
);
124 WREG32(UVD_VCPU_CACHE_SIZE0
, size
);
127 size
= RADEON_UVD_HEAP_SIZE
>> 3;
128 WREG32(UVD_VCPU_CACHE_OFFSET1
, addr
);
129 WREG32(UVD_VCPU_CACHE_SIZE1
, size
);
132 size
= (RADEON_UVD_STACK_SIZE
+
133 (RADEON_UVD_SESSION_SIZE
* rdev
->uvd
.max_handles
)) >> 3;
134 WREG32(UVD_VCPU_CACHE_OFFSET2
, addr
);
135 WREG32(UVD_VCPU_CACHE_SIZE2
, size
);
138 addr
= (rdev
->uvd
.gpu_addr
>> 28) & 0xF;
139 WREG32(UVD_LMI_ADDR_EXT
, (addr
<< 12) | (addr
<< 0));
142 addr
= (rdev
->uvd
.gpu_addr
>> 32) & 0xFF;
143 WREG32(UVD_LMI_EXT40_ADDR
, addr
| (0x9 << 16) | (0x1 << 31));
145 WREG32(UVD_FW_START
, *((uint32_t*)rdev
->uvd
.cpu_addr
));
151 * uvd_v1_0_init - start and test UVD block
153 * @rdev: radeon_device pointer
155 * Initialize the hardware, boot up the VCPU and do some testing
157 int uvd_v1_0_init(struct radeon_device
*rdev
)
159 struct radeon_ring
*ring
= &rdev
->ring
[R600_RING_TYPE_UVD_INDEX
];
163 /* raise clocks while booting up the VCPU */
164 if (rdev
->family
< CHIP_RV740
)
165 radeon_set_uvd_clocks(rdev
, 10000, 10000);
167 radeon_set_uvd_clocks(rdev
, 53300, 40000);
169 r
= uvd_v1_0_start(rdev
);
174 r
= radeon_ring_test(rdev
, R600_RING_TYPE_UVD_INDEX
, ring
);
180 r
= radeon_ring_lock(rdev
, ring
, 10);
182 DRM_ERROR("radeon: ring failed to lock UVD ring (%d).\n", r
);
186 tmp
= PACKET0(UVD_SEMA_WAIT_FAULT_TIMEOUT_CNTL
, 0);
187 radeon_ring_write(ring
, tmp
);
188 radeon_ring_write(ring
, 0xFFFFF);
190 tmp
= PACKET0(UVD_SEMA_WAIT_INCOMPLETE_TIMEOUT_CNTL
, 0);
191 radeon_ring_write(ring
, tmp
);
192 radeon_ring_write(ring
, 0xFFFFF);
194 tmp
= PACKET0(UVD_SEMA_SIGNAL_INCOMPLETE_TIMEOUT_CNTL
, 0);
195 radeon_ring_write(ring
, tmp
);
196 radeon_ring_write(ring
, 0xFFFFF);
198 /* Clear timeout status bits */
199 radeon_ring_write(ring
, PACKET0(UVD_SEMA_TIMEOUT_STATUS
, 0));
200 radeon_ring_write(ring
, 0x8);
202 radeon_ring_write(ring
, PACKET0(UVD_SEMA_CNTL
, 0));
203 radeon_ring_write(ring
, 3);
205 radeon_ring_unlock_commit(rdev
, ring
, false);
208 /* lower clocks again */
209 radeon_set_uvd_clocks(rdev
, 0, 0);
212 switch (rdev
->family
) {
216 /* 64byte granularity workaround */
217 WREG32(MC_CONFIG
, 0);
218 WREG32(MC_CONFIG
, 1 << 4);
219 WREG32(RS_DQ_RD_RET_CONF
, 0x3f);
220 WREG32(MC_CONFIG
, 0x1f);
226 /* write clean workaround */
227 WREG32_P(UVD_VCPU_CNTL
, 0x10, ~0x10);
231 /* TODO: Do we need more? */
235 DRM_INFO("UVD initialized successfully.\n");
242 * uvd_v1_0_fini - stop the hardware block
244 * @rdev: radeon_device pointer
246 * Stop the UVD block, mark ring as not ready any more
248 void uvd_v1_0_fini(struct radeon_device
*rdev
)
250 struct radeon_ring
*ring
= &rdev
->ring
[R600_RING_TYPE_UVD_INDEX
];
257 * uvd_v1_0_start - start UVD block
259 * @rdev: radeon_device pointer
261 * Setup and start the UVD block
263 int uvd_v1_0_start(struct radeon_device
*rdev
)
265 struct radeon_ring
*ring
= &rdev
->ring
[R600_RING_TYPE_UVD_INDEX
];
269 /* disable byte swapping */
270 u32 lmi_swap_cntl
= 0;
271 u32 mp_swap_cntl
= 0;
273 /* disable clock gating */
274 WREG32(UVD_CGC_GATE
, 0);
276 /* disable interupt */
277 WREG32_P(UVD_MASTINT_EN
, 0, ~(1 << 1));
279 /* Stall UMC and register bus before resetting VCPU */
280 WREG32_P(UVD_LMI_CTRL2
, 1 << 8, ~(1 << 8));
281 WREG32_P(UVD_RB_ARB_CTRL
, 1 << 3, ~(1 << 3));
284 /* put LMI, VCPU, RBC etc... into reset */
285 WREG32(UVD_SOFT_RESET
, LMI_SOFT_RESET
| VCPU_SOFT_RESET
|
286 LBSI_SOFT_RESET
| RBC_SOFT_RESET
| CSM_SOFT_RESET
|
287 CXW_SOFT_RESET
| TAP_SOFT_RESET
| LMI_UMC_SOFT_RESET
);
290 /* take UVD block out of reset */
291 WREG32_P(SRBM_SOFT_RESET
, 0, ~SOFT_RESET_UVD
);
294 /* initialize UVD memory controller */
295 WREG32(UVD_LMI_CTRL
, 0x40 | (1 << 8) | (1 << 13) |
296 (1 << 21) | (1 << 9) | (1 << 20));
299 /* swap (8 in 32) RB and IB */
303 WREG32(UVD_LMI_SWAP_CNTL
, lmi_swap_cntl
);
304 WREG32(UVD_MP_SWAP_CNTL
, mp_swap_cntl
);
306 WREG32(UVD_MPC_SET_MUXA0
, 0x40c2040);
307 WREG32(UVD_MPC_SET_MUXA1
, 0x0);
308 WREG32(UVD_MPC_SET_MUXB0
, 0x40c2040);
309 WREG32(UVD_MPC_SET_MUXB1
, 0x0);
310 WREG32(UVD_MPC_SET_ALU
, 0);
311 WREG32(UVD_MPC_SET_MUX
, 0x88);
313 /* take all subblocks out of reset, except VCPU */
314 WREG32(UVD_SOFT_RESET
, VCPU_SOFT_RESET
);
317 /* enable VCPU clock */
318 WREG32(UVD_VCPU_CNTL
, 1 << 9);
321 WREG32_P(UVD_LMI_CTRL2
, 0, ~(1 << 8));
323 WREG32_P(UVD_RB_ARB_CTRL
, 0, ~(1 << 3));
325 /* boot up the VCPU */
326 WREG32(UVD_SOFT_RESET
, 0);
329 for (i
= 0; i
< 10; ++i
) {
331 for (j
= 0; j
< 100; ++j
) {
332 status
= RREG32(UVD_STATUS
);
341 DRM_ERROR("UVD not responding, trying to reset the VCPU!!!\n");
342 WREG32_P(UVD_SOFT_RESET
, VCPU_SOFT_RESET
, ~VCPU_SOFT_RESET
);
344 WREG32_P(UVD_SOFT_RESET
, 0, ~VCPU_SOFT_RESET
);
350 DRM_ERROR("UVD not responding, giving up!!!\n");
354 /* enable interupt */
355 WREG32_P(UVD_MASTINT_EN
, 3<<1, ~(3 << 1));
357 /* force RBC into idle state */
358 WREG32(UVD_RBC_RB_CNTL
, 0x11010101);
360 /* Set the write pointer delay */
361 WREG32(UVD_RBC_RB_WPTR_CNTL
, 0);
363 /* program the 4GB memory segment for rptr and ring buffer */
364 WREG32(UVD_LMI_EXT40_ADDR
, upper_32_bits(ring
->gpu_addr
) |
365 (0x7 << 16) | (0x1 << 31));
367 /* Initialize the ring buffer's read and write pointers */
368 WREG32(UVD_RBC_RB_RPTR
, 0x0);
370 ring
->wptr
= RREG32(UVD_RBC_RB_RPTR
);
371 WREG32(UVD_RBC_RB_WPTR
, ring
->wptr
);
373 /* set the ring address */
374 WREG32(UVD_RBC_RB_BASE
, ring
->gpu_addr
);
376 /* Set ring buffer size */
377 rb_bufsz
= order_base_2(ring
->ring_size
);
378 rb_bufsz
= (0x1 << 8) | rb_bufsz
;
379 WREG32_P(UVD_RBC_RB_CNTL
, rb_bufsz
, ~0x11f1f);
385 * uvd_v1_0_stop - stop UVD block
387 * @rdev: radeon_device pointer
391 void uvd_v1_0_stop(struct radeon_device
*rdev
)
393 /* force RBC into idle state */
394 WREG32(UVD_RBC_RB_CNTL
, 0x11010101);
396 /* Stall UMC and register bus before resetting VCPU */
397 WREG32_P(UVD_LMI_CTRL2
, 1 << 8, ~(1 << 8));
398 WREG32_P(UVD_RB_ARB_CTRL
, 1 << 3, ~(1 << 3));
401 /* put VCPU into reset */
402 WREG32(UVD_SOFT_RESET
, VCPU_SOFT_RESET
);
405 /* disable VCPU clock */
406 WREG32(UVD_VCPU_CNTL
, 0x0);
408 /* Unstall UMC and register bus */
409 WREG32_P(UVD_LMI_CTRL2
, 0, ~(1 << 8));
410 WREG32_P(UVD_RB_ARB_CTRL
, 0, ~(1 << 3));
414 * uvd_v1_0_ring_test - register write test
416 * @rdev: radeon_device pointer
417 * @ring: radeon_ring pointer
419 * Test if we can successfully write to the context register
421 int uvd_v1_0_ring_test(struct radeon_device
*rdev
, struct radeon_ring
*ring
)
427 WREG32(UVD_CONTEXT_ID
, 0xCAFEDEAD);
428 r
= radeon_ring_lock(rdev
, ring
, 3);
430 DRM_ERROR("radeon: cp failed to lock ring %d (%d).\n",
434 radeon_ring_write(ring
, PACKET0(UVD_CONTEXT_ID
, 0));
435 radeon_ring_write(ring
, 0xDEADBEEF);
436 radeon_ring_unlock_commit(rdev
, ring
, false);
437 for (i
= 0; i
< rdev
->usec_timeout
; i
++) {
438 tmp
= RREG32(UVD_CONTEXT_ID
);
439 if (tmp
== 0xDEADBEEF)
444 if (i
< rdev
->usec_timeout
) {
445 DRM_INFO("ring test on %d succeeded in %d usecs\n",
448 DRM_ERROR("radeon: ring %d test failed (0x%08X)\n",
456 * uvd_v1_0_semaphore_emit - emit semaphore command
458 * @rdev: radeon_device pointer
459 * @ring: radeon_ring pointer
460 * @semaphore: semaphore to emit commands for
461 * @emit_wait: true if we should emit a wait command
463 * Emit a semaphore command (either wait or signal) to the UVD ring.
465 bool uvd_v1_0_semaphore_emit(struct radeon_device
*rdev
,
466 struct radeon_ring
*ring
,
467 struct radeon_semaphore
*semaphore
,
470 /* disable semaphores for UVD V1 hardware */
475 * uvd_v1_0_ib_execute - execute indirect buffer
477 * @rdev: radeon_device pointer
478 * @ib: indirect buffer to execute
480 * Write ring commands to execute the indirect buffer
482 void uvd_v1_0_ib_execute(struct radeon_device
*rdev
, struct radeon_ib
*ib
)
484 struct radeon_ring
*ring
= &rdev
->ring
[ib
->ring
];
486 radeon_ring_write(ring
, PACKET0(UVD_RBC_IB_BASE
, 0));
487 radeon_ring_write(ring
, ib
->gpu_addr
);
488 radeon_ring_write(ring
, PACKET0(UVD_RBC_IB_SIZE
, 0));
489 radeon_ring_write(ring
, ib
->length_dw
);
493 * uvd_v1_0_ib_test - test ib execution
495 * @rdev: radeon_device pointer
496 * @ring: radeon_ring pointer
498 * Test if we can successfully execute an IB
500 int uvd_v1_0_ib_test(struct radeon_device
*rdev
, struct radeon_ring
*ring
)
502 struct radeon_fence
*fence
= NULL
;
505 if (rdev
->family
< CHIP_RV740
)
506 r
= radeon_set_uvd_clocks(rdev
, 10000, 10000);
508 r
= radeon_set_uvd_clocks(rdev
, 53300, 40000);
510 DRM_ERROR("radeon: failed to raise UVD clocks (%d).\n", r
);
514 r
= radeon_uvd_get_create_msg(rdev
, ring
->idx
, 1, NULL
);
516 DRM_ERROR("radeon: failed to get create msg (%d).\n", r
);
520 r
= radeon_uvd_get_destroy_msg(rdev
, ring
->idx
, 1, &fence
);
522 DRM_ERROR("radeon: failed to get destroy ib (%d).\n", r
);
526 r
= radeon_fence_wait_timeout(fence
, false, usecs_to_jiffies(
527 RADEON_USEC_IB_TEST_TIMEOUT
));
529 DRM_ERROR("radeon: fence wait failed (%d).\n", r
);
532 DRM_ERROR("radeon: fence wait timed out.\n");
537 DRM_INFO("ib test on ring %d succeeded\n", ring
->idx
);
539 radeon_fence_unref(&fence
);
540 radeon_set_uvd_clocks(rdev
, 0, 0);