2 * Copyright 2009 Jerome Glisse.
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the
7 * "Software"), to deal in the Software without restriction, including
8 * without limitation the rights to use, copy, modify, merge, publish,
9 * distribute, sub license, and/or sell copies of the Software, and to
10 * permit persons to whom the Software is furnished to do so, subject to
11 * the following conditions:
13 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
14 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
15 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
16 * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
17 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
18 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
19 * USE OR OTHER DEALINGS IN THE SOFTWARE.
21 * The above copyright notice and this permission notice (including the
22 * next paragraph) shall be included in all copies or substantial portions
28 * Jerome Glisse <glisse@freedesktop.org>
31 #include <linux/seq_file.h>
32 #include <linux/atomic.h>
33 #include <linux/wait.h>
34 #include <linux/kref.h>
35 #include <linux/slab.h>
36 #include <linux/firmware.h>
38 #include "radeon_reg.h"
40 #include "radeon_trace.h"
44 * Fences mark an event in the GPUs pipeline and are used
45 * for GPU/CPU synchronization. When the fence is written,
46 * it is expected that all buffers associated with that fence
47 * are no longer in use by the associated ring on the GPU and
48 * that the the relevant GPU caches have been flushed. Whether
49 * we use a scratch register or memory location depends on the asic
50 * and whether writeback is enabled.
54 * radeon_fence_write - write a fence value
56 * @rdev: radeon_device pointer
57 * @seq: sequence number to write
58 * @ring: ring index the fence is associated with
60 * Writes a fence value to memory or a scratch register (all asics).
62 static void radeon_fence_write(struct radeon_device
*rdev
, u32 seq
, int ring
)
64 struct radeon_fence_driver
*drv
= &rdev
->fence_drv
[ring
];
65 if (likely(rdev
->wb
.enabled
|| !drv
->scratch_reg
)) {
67 *drv
->cpu_addr
= cpu_to_le32(seq
);
70 WREG32(drv
->scratch_reg
, seq
);
75 * radeon_fence_read - read a fence value
77 * @rdev: radeon_device pointer
78 * @ring: ring index the fence is associated with
80 * Reads a fence value from memory or a scratch register (all asics).
81 * Returns the value of the fence read from memory or register.
83 static u32
radeon_fence_read(struct radeon_device
*rdev
, int ring
)
85 struct radeon_fence_driver
*drv
= &rdev
->fence_drv
[ring
];
88 if (likely(rdev
->wb
.enabled
|| !drv
->scratch_reg
)) {
90 seq
= le32_to_cpu(*drv
->cpu_addr
);
92 seq
= lower_32_bits(atomic64_read(&drv
->last_seq
));
95 seq
= RREG32(drv
->scratch_reg
);
101 * radeon_fence_emit - emit a fence on the requested ring
103 * @rdev: radeon_device pointer
104 * @fence: radeon fence object
105 * @ring: ring index the fence is associated with
107 * Emits a fence command on the requested ring (all asics).
108 * Returns 0 on success, -ENOMEM on failure.
110 int radeon_fence_emit(struct radeon_device
*rdev
,
111 struct radeon_fence
**fence
,
114 /* we are protected by the ring emission mutex */
115 *fence
= kmalloc(sizeof(struct radeon_fence
), GFP_KERNEL
);
116 if ((*fence
) == NULL
) {
119 kref_init(&((*fence
)->kref
));
120 (*fence
)->rdev
= rdev
;
121 (*fence
)->seq
= ++rdev
->fence_drv
[ring
].sync_seq
[ring
];
122 (*fence
)->ring
= ring
;
123 radeon_fence_ring_emit(rdev
, ring
, *fence
);
124 trace_radeon_fence_emit(rdev
->ddev
, (*fence
)->seq
);
129 * radeon_fence_process - process a fence
131 * @rdev: radeon_device pointer
132 * @ring: ring index the fence is associated with
134 * Checks the current fence value and wakes the fence queue
135 * if the sequence number has increased (all asics).
137 void radeon_fence_process(struct radeon_device
*rdev
, int ring
)
139 uint64_t seq
, last_seq
, last_emitted
;
140 unsigned count_loop
= 0;
143 /* Note there is a scenario here for an infinite loop but it's
144 * very unlikely to happen. For it to happen, the current polling
145 * process need to be interrupted by another process and another
146 * process needs to update the last_seq btw the atomic read and
147 * xchg of the current process.
149 * More over for this to go in infinite loop there need to be
150 * continuously new fence signaled ie radeon_fence_read needs
151 * to return a different value each time for both the currently
152 * polling process and the other process that xchg the last_seq
153 * btw atomic read and xchg of the current process. And the
154 * value the other process set as last seq must be higher than
155 * the seq value we just read. Which means that current process
156 * need to be interrupted after radeon_fence_read and before
159 * To be even more safe we count the number of time we loop and
160 * we bail after 10 loop just accepting the fact that we might
161 * have temporarly set the last_seq not to the true real last
162 * seq but to an older one.
164 last_seq
= atomic64_read(&rdev
->fence_drv
[ring
].last_seq
);
166 last_emitted
= rdev
->fence_drv
[ring
].sync_seq
[ring
];
167 seq
= radeon_fence_read(rdev
, ring
);
168 seq
|= last_seq
& 0xffffffff00000000LL
;
169 if (seq
< last_seq
) {
171 seq
|= last_emitted
& 0xffffffff00000000LL
;
174 if (seq
<= last_seq
|| seq
> last_emitted
) {
177 /* If we loop over we don't want to return without
178 * checking if a fence is signaled as it means that the
179 * seq we just read is different from the previous on.
183 if ((count_loop
++) > 10) {
184 /* We looped over too many time leave with the
185 * fact that we might have set an older fence
186 * seq then the current real last seq as signaled
191 } while (atomic64_xchg(&rdev
->fence_drv
[ring
].last_seq
, seq
) > seq
);
194 rdev
->fence_drv
[ring
].last_activity
= jiffies
;
195 wake_up_all(&rdev
->fence_queue
);
200 * radeon_fence_destroy - destroy a fence
204 * Frees the fence object (all asics).
206 static void radeon_fence_destroy(struct kref
*kref
)
208 struct radeon_fence
*fence
;
210 fence
= container_of(kref
, struct radeon_fence
, kref
);
215 * radeon_fence_seq_signaled - check if a fence sequeuce number has signaled
217 * @rdev: radeon device pointer
218 * @seq: sequence number
219 * @ring: ring index the fence is associated with
221 * Check if the last singled fence sequnce number is >= the requested
222 * sequence number (all asics).
223 * Returns true if the fence has signaled (current fence value
224 * is >= requested value) or false if it has not (current fence
225 * value is < the requested value. Helper function for
226 * radeon_fence_signaled().
228 static bool radeon_fence_seq_signaled(struct radeon_device
*rdev
,
229 u64 seq
, unsigned ring
)
231 if (atomic64_read(&rdev
->fence_drv
[ring
].last_seq
) >= seq
) {
234 /* poll new last sequence at least once */
235 radeon_fence_process(rdev
, ring
);
236 if (atomic64_read(&rdev
->fence_drv
[ring
].last_seq
) >= seq
) {
243 * radeon_fence_signaled - check if a fence has signaled
245 * @fence: radeon fence object
247 * Check if the requested fence has signaled (all asics).
248 * Returns true if the fence has signaled or false if it has not.
250 bool radeon_fence_signaled(struct radeon_fence
*fence
)
255 if (fence
->seq
== RADEON_FENCE_SIGNALED_SEQ
) {
258 if (radeon_fence_seq_signaled(fence
->rdev
, fence
->seq
, fence
->ring
)) {
259 fence
->seq
= RADEON_FENCE_SIGNALED_SEQ
;
266 * radeon_fence_wait_seq - wait for a specific sequence number
268 * @rdev: radeon device pointer
269 * @target_seq: sequence number we want to wait for
270 * @ring: ring index the fence is associated with
271 * @intr: use interruptable sleep
272 * @lock_ring: whether the ring should be locked or not
274 * Wait for the requested sequence number to be written (all asics).
275 * @intr selects whether to use interruptable (true) or non-interruptable
276 * (false) sleep when waiting for the sequence number. Helper function
277 * for radeon_fence_wait(), et al.
278 * Returns 0 if the sequence number has passed, error for all other cases.
279 * -EDEADLK is returned when a GPU lockup has been detected and the ring is
280 * marked as not ready so no further jobs get scheduled until a successful
283 static int radeon_fence_wait_seq(struct radeon_device
*rdev
, u64 target_seq
,
284 unsigned ring
, bool intr
, bool lock_ring
)
286 unsigned long timeout
, last_activity
;
292 while (target_seq
> atomic64_read(&rdev
->fence_drv
[ring
].last_seq
)) {
293 if (!rdev
->ring
[ring
].ready
) {
297 timeout
= jiffies
- RADEON_FENCE_JIFFIES_TIMEOUT
;
298 if (time_after(rdev
->fence_drv
[ring
].last_activity
, timeout
)) {
299 /* the normal case, timeout is somewhere before last_activity */
300 timeout
= rdev
->fence_drv
[ring
].last_activity
- timeout
;
302 /* either jiffies wrapped around, or no fence was signaled in the last 500ms
303 * anyway we will just wait for the minimum amount and then check for a lockup
307 seq
= atomic64_read(&rdev
->fence_drv
[ring
].last_seq
);
308 /* Save current last activity valuee, used to check for GPU lockups */
309 last_activity
= rdev
->fence_drv
[ring
].last_activity
;
311 trace_radeon_fence_wait_begin(rdev
->ddev
, seq
);
312 radeon_irq_kms_sw_irq_get(rdev
, ring
);
314 r
= wait_event_interruptible_timeout(rdev
->fence_queue
,
315 (signaled
= radeon_fence_seq_signaled(rdev
, target_seq
, ring
)),
318 r
= wait_event_timeout(rdev
->fence_queue
,
319 (signaled
= radeon_fence_seq_signaled(rdev
, target_seq
, ring
)),
322 radeon_irq_kms_sw_irq_put(rdev
, ring
);
323 if (unlikely(r
< 0)) {
326 trace_radeon_fence_wait_end(rdev
->ddev
, seq
);
328 if (unlikely(!signaled
)) {
329 /* we were interrupted for some reason and fence
330 * isn't signaled yet, resume waiting */
335 /* check if sequence value has changed since last_activity */
336 if (seq
!= atomic64_read(&rdev
->fence_drv
[ring
].last_seq
)) {
341 mutex_lock(&rdev
->ring_lock
);
344 /* test if somebody else has already decided that this is a lockup */
345 if (last_activity
!= rdev
->fence_drv
[ring
].last_activity
) {
347 mutex_unlock(&rdev
->ring_lock
);
352 if (radeon_ring_is_lockup(rdev
, ring
, &rdev
->ring
[ring
])) {
353 /* good news we believe it's a lockup */
354 dev_warn(rdev
->dev
, "GPU lockup (waiting for 0x%016llx last fence id 0x%016llx)\n",
357 /* change last activity so nobody else think there is a lockup */
358 for (i
= 0; i
< RADEON_NUM_RINGS
; ++i
) {
359 rdev
->fence_drv
[i
].last_activity
= jiffies
;
362 /* mark the ring as not ready any more */
363 rdev
->ring
[ring
].ready
= false;
365 mutex_unlock(&rdev
->ring_lock
);
371 mutex_unlock(&rdev
->ring_lock
);
379 * radeon_fence_wait - wait for a fence to signal
381 * @fence: radeon fence object
382 * @intr: use interruptable sleep
384 * Wait for the requested fence to signal (all asics).
385 * @intr selects whether to use interruptable (true) or non-interruptable
386 * (false) sleep when waiting for the fence.
387 * Returns 0 if the fence has passed, error for all other cases.
389 int radeon_fence_wait(struct radeon_fence
*fence
, bool intr
)
394 WARN(1, "Querying an invalid fence : %p !\n", fence
);
398 r
= radeon_fence_wait_seq(fence
->rdev
, fence
->seq
,
399 fence
->ring
, intr
, true);
403 fence
->seq
= RADEON_FENCE_SIGNALED_SEQ
;
407 static bool radeon_fence_any_seq_signaled(struct radeon_device
*rdev
, u64
*seq
)
411 for (i
= 0; i
< RADEON_NUM_RINGS
; ++i
) {
412 if (seq
[i
] && radeon_fence_seq_signaled(rdev
, seq
[i
], i
)) {
420 * radeon_fence_wait_any_seq - wait for a sequence number on any ring
422 * @rdev: radeon device pointer
423 * @target_seq: sequence number(s) we want to wait for
424 * @intr: use interruptable sleep
426 * Wait for the requested sequence number(s) to be written by any ring
427 * (all asics). Sequnce number array is indexed by ring id.
428 * @intr selects whether to use interruptable (true) or non-interruptable
429 * (false) sleep when waiting for the sequence number. Helper function
430 * for radeon_fence_wait_any(), et al.
431 * Returns 0 if the sequence number has passed, error for all other cases.
433 static int radeon_fence_wait_any_seq(struct radeon_device
*rdev
,
434 u64
*target_seq
, bool intr
)
436 unsigned long timeout
, last_activity
, tmp
;
437 unsigned i
, ring
= RADEON_NUM_RINGS
;
441 for (i
= 0, last_activity
= 0; i
< RADEON_NUM_RINGS
; ++i
) {
442 if (!target_seq
[i
]) {
446 /* use the most recent one as indicator */
447 if (time_after(rdev
->fence_drv
[i
].last_activity
, last_activity
)) {
448 last_activity
= rdev
->fence_drv
[i
].last_activity
;
451 /* For lockup detection just pick the lowest ring we are
452 * actively waiting for
459 /* nothing to wait for ? */
460 if (ring
== RADEON_NUM_RINGS
) {
464 while (!radeon_fence_any_seq_signaled(rdev
, target_seq
)) {
465 timeout
= jiffies
- RADEON_FENCE_JIFFIES_TIMEOUT
;
466 if (time_after(last_activity
, timeout
)) {
467 /* the normal case, timeout is somewhere before last_activity */
468 timeout
= last_activity
- timeout
;
470 /* either jiffies wrapped around, or no fence was signaled in the last 500ms
471 * anyway we will just wait for the minimum amount and then check for a lockup
476 trace_radeon_fence_wait_begin(rdev
->ddev
, target_seq
[ring
]);
477 for (i
= 0; i
< RADEON_NUM_RINGS
; ++i
) {
479 radeon_irq_kms_sw_irq_get(rdev
, i
);
483 r
= wait_event_interruptible_timeout(rdev
->fence_queue
,
484 (signaled
= radeon_fence_any_seq_signaled(rdev
, target_seq
)),
487 r
= wait_event_timeout(rdev
->fence_queue
,
488 (signaled
= radeon_fence_any_seq_signaled(rdev
, target_seq
)),
491 for (i
= 0; i
< RADEON_NUM_RINGS
; ++i
) {
493 radeon_irq_kms_sw_irq_put(rdev
, i
);
496 if (unlikely(r
< 0)) {
499 trace_radeon_fence_wait_end(rdev
->ddev
, target_seq
[ring
]);
501 if (unlikely(!signaled
)) {
502 /* we were interrupted for some reason and fence
503 * isn't signaled yet, resume waiting */
508 mutex_lock(&rdev
->ring_lock
);
509 for (i
= 0, tmp
= 0; i
< RADEON_NUM_RINGS
; ++i
) {
510 if (time_after(rdev
->fence_drv
[i
].last_activity
, tmp
)) {
511 tmp
= rdev
->fence_drv
[i
].last_activity
;
514 /* test if somebody else has already decided that this is a lockup */
515 if (last_activity
!= tmp
) {
517 mutex_unlock(&rdev
->ring_lock
);
521 if (radeon_ring_is_lockup(rdev
, ring
, &rdev
->ring
[ring
])) {
522 /* good news we believe it's a lockup */
523 dev_warn(rdev
->dev
, "GPU lockup (waiting for 0x%016llx)\n",
526 /* change last activity so nobody else think there is a lockup */
527 for (i
= 0; i
< RADEON_NUM_RINGS
; ++i
) {
528 rdev
->fence_drv
[i
].last_activity
= jiffies
;
531 /* mark the ring as not ready any more */
532 rdev
->ring
[ring
].ready
= false;
533 mutex_unlock(&rdev
->ring_lock
);
536 mutex_unlock(&rdev
->ring_lock
);
543 * radeon_fence_wait_any - wait for a fence to signal on any ring
545 * @rdev: radeon device pointer
546 * @fences: radeon fence object(s)
547 * @intr: use interruptable sleep
549 * Wait for any requested fence to signal (all asics). Fence
550 * array is indexed by ring id. @intr selects whether to use
551 * interruptable (true) or non-interruptable (false) sleep when
552 * waiting for the fences. Used by the suballocator.
553 * Returns 0 if any fence has passed, error for all other cases.
555 int radeon_fence_wait_any(struct radeon_device
*rdev
,
556 struct radeon_fence
**fences
,
559 uint64_t seq
[RADEON_NUM_RINGS
];
563 for (i
= 0; i
< RADEON_NUM_RINGS
; ++i
) {
570 if (fences
[i
]->seq
== RADEON_FENCE_SIGNALED_SEQ
) {
571 /* something was allready signaled */
575 seq
[i
] = fences
[i
]->seq
;
578 r
= radeon_fence_wait_any_seq(rdev
, seq
, intr
);
586 * radeon_fence_wait_next_locked - wait for the next fence to signal
588 * @rdev: radeon device pointer
589 * @ring: ring index the fence is associated with
591 * Wait for the next fence on the requested ring to signal (all asics).
592 * Returns 0 if the next fence has passed, error for all other cases.
593 * Caller must hold ring lock.
595 int radeon_fence_wait_next_locked(struct radeon_device
*rdev
, int ring
)
599 seq
= atomic64_read(&rdev
->fence_drv
[ring
].last_seq
) + 1ULL;
600 if (seq
>= rdev
->fence_drv
[ring
].sync_seq
[ring
]) {
601 /* nothing to wait for, last_seq is
602 already the last emited fence */
605 return radeon_fence_wait_seq(rdev
, seq
, ring
, false, false);
609 * radeon_fence_wait_empty_locked - wait for all fences to signal
611 * @rdev: radeon device pointer
612 * @ring: ring index the fence is associated with
614 * Wait for all fences on the requested ring to signal (all asics).
615 * Returns 0 if the fences have passed, error for all other cases.
616 * Caller must hold ring lock.
618 int radeon_fence_wait_empty_locked(struct radeon_device
*rdev
, int ring
)
620 uint64_t seq
= rdev
->fence_drv
[ring
].sync_seq
[ring
];
623 r
= radeon_fence_wait_seq(rdev
, seq
, ring
, false, false);
628 dev_err(rdev
->dev
, "error waiting for ring[%d] to become idle (%d)\n",
635 * radeon_fence_ref - take a ref on a fence
637 * @fence: radeon fence object
639 * Take a reference on a fence (all asics).
642 struct radeon_fence
*radeon_fence_ref(struct radeon_fence
*fence
)
644 kref_get(&fence
->kref
);
649 * radeon_fence_unref - remove a ref on a fence
651 * @fence: radeon fence object
653 * Remove a reference on a fence (all asics).
655 void radeon_fence_unref(struct radeon_fence
**fence
)
657 struct radeon_fence
*tmp
= *fence
;
661 kref_put(&tmp
->kref
, radeon_fence_destroy
);
666 * radeon_fence_count_emitted - get the count of emitted fences
668 * @rdev: radeon device pointer
669 * @ring: ring index the fence is associated with
671 * Get the number of fences emitted on the requested ring (all asics).
672 * Returns the number of emitted fences on the ring. Used by the
673 * dynpm code to ring track activity.
675 unsigned radeon_fence_count_emitted(struct radeon_device
*rdev
, int ring
)
679 /* We are not protected by ring lock when reading the last sequence
680 * but it's ok to report slightly wrong fence count here.
682 radeon_fence_process(rdev
, ring
);
683 emitted
= rdev
->fence_drv
[ring
].sync_seq
[ring
]
684 - atomic64_read(&rdev
->fence_drv
[ring
].last_seq
);
685 /* to avoid 32bits warp around */
686 if (emitted
> 0x10000000) {
687 emitted
= 0x10000000;
689 return (unsigned)emitted
;
693 * radeon_fence_need_sync - do we need a semaphore
695 * @fence: radeon fence object
696 * @dst_ring: which ring to check against
698 * Check if the fence needs to be synced against another ring
699 * (all asics). If so, we need to emit a semaphore.
700 * Returns true if we need to sync with another ring, false if
703 bool radeon_fence_need_sync(struct radeon_fence
*fence
, int dst_ring
)
705 struct radeon_fence_driver
*fdrv
;
711 if (fence
->ring
== dst_ring
) {
715 /* we are protected by the ring mutex */
716 fdrv
= &fence
->rdev
->fence_drv
[dst_ring
];
717 if (fence
->seq
<= fdrv
->sync_seq
[fence
->ring
]) {
725 * radeon_fence_note_sync - record the sync point
727 * @fence: radeon fence object
728 * @dst_ring: which ring to check against
730 * Note the sequence number at which point the fence will
731 * be synced with the requested ring (all asics).
733 void radeon_fence_note_sync(struct radeon_fence
*fence
, int dst_ring
)
735 struct radeon_fence_driver
*dst
, *src
;
742 if (fence
->ring
== dst_ring
) {
746 /* we are protected by the ring mutex */
747 src
= &fence
->rdev
->fence_drv
[fence
->ring
];
748 dst
= &fence
->rdev
->fence_drv
[dst_ring
];
749 for (i
= 0; i
< RADEON_NUM_RINGS
; ++i
) {
753 dst
->sync_seq
[i
] = max(dst
->sync_seq
[i
], src
->sync_seq
[i
]);
758 * radeon_fence_driver_start_ring - make the fence driver
759 * ready for use on the requested ring.
761 * @rdev: radeon device pointer
762 * @ring: ring index to start the fence driver on
764 * Make the fence driver ready for processing (all asics).
765 * Not all asics have all rings, so each asic will only
766 * start the fence driver on the rings it has.
767 * Returns 0 for success, errors for failure.
769 int radeon_fence_driver_start_ring(struct radeon_device
*rdev
, int ring
)
774 radeon_scratch_free(rdev
, rdev
->fence_drv
[ring
].scratch_reg
);
775 if (rdev
->wb
.use_event
|| !radeon_ring_supports_scratch_reg(rdev
, &rdev
->ring
[ring
])) {
776 rdev
->fence_drv
[ring
].scratch_reg
= 0;
777 if (ring
!= R600_RING_TYPE_UVD_INDEX
) {
778 index
= R600_WB_EVENT_OFFSET
+ ring
* 4;
779 rdev
->fence_drv
[ring
].cpu_addr
= &rdev
->wb
.wb
[index
/4];
780 rdev
->fence_drv
[ring
].gpu_addr
= rdev
->wb
.gpu_addr
+
784 /* put fence directly behind firmware */
785 index
= ALIGN(rdev
->uvd_fw
->size
, 8);
786 rdev
->fence_drv
[ring
].cpu_addr
= rdev
->uvd
.cpu_addr
+ index
;
787 rdev
->fence_drv
[ring
].gpu_addr
= rdev
->uvd
.gpu_addr
+ index
;
791 r
= radeon_scratch_get(rdev
, &rdev
->fence_drv
[ring
].scratch_reg
);
793 dev_err(rdev
->dev
, "fence failed to get scratch register\n");
796 index
= RADEON_WB_SCRATCH_OFFSET
+
797 rdev
->fence_drv
[ring
].scratch_reg
-
798 rdev
->scratch
.reg_base
;
799 rdev
->fence_drv
[ring
].cpu_addr
= &rdev
->wb
.wb
[index
/4];
800 rdev
->fence_drv
[ring
].gpu_addr
= rdev
->wb
.gpu_addr
+ index
;
802 radeon_fence_write(rdev
, atomic64_read(&rdev
->fence_drv
[ring
].last_seq
), ring
);
803 rdev
->fence_drv
[ring
].initialized
= true;
804 dev_info(rdev
->dev
, "fence driver on ring %d use gpu addr 0x%016llx and cpu addr 0x%p\n",
805 ring
, rdev
->fence_drv
[ring
].gpu_addr
, rdev
->fence_drv
[ring
].cpu_addr
);
810 * radeon_fence_driver_init_ring - init the fence driver
811 * for the requested ring.
813 * @rdev: radeon device pointer
814 * @ring: ring index to start the fence driver on
816 * Init the fence driver for the requested ring (all asics).
817 * Helper function for radeon_fence_driver_init().
819 static void radeon_fence_driver_init_ring(struct radeon_device
*rdev
, int ring
)
823 rdev
->fence_drv
[ring
].scratch_reg
= -1;
824 rdev
->fence_drv
[ring
].cpu_addr
= NULL
;
825 rdev
->fence_drv
[ring
].gpu_addr
= 0;
826 for (i
= 0; i
< RADEON_NUM_RINGS
; ++i
)
827 rdev
->fence_drv
[ring
].sync_seq
[i
] = 0;
828 atomic64_set(&rdev
->fence_drv
[ring
].last_seq
, 0);
829 rdev
->fence_drv
[ring
].last_activity
= jiffies
;
830 rdev
->fence_drv
[ring
].initialized
= false;
834 * radeon_fence_driver_init - init the fence driver
835 * for all possible rings.
837 * @rdev: radeon device pointer
839 * Init the fence driver for all possible rings (all asics).
840 * Not all asics have all rings, so each asic will only
841 * start the fence driver on the rings it has using
842 * radeon_fence_driver_start_ring().
843 * Returns 0 for success.
845 int radeon_fence_driver_init(struct radeon_device
*rdev
)
849 init_waitqueue_head(&rdev
->fence_queue
);
850 for (ring
= 0; ring
< RADEON_NUM_RINGS
; ring
++) {
851 radeon_fence_driver_init_ring(rdev
, ring
);
853 if (radeon_debugfs_fence_init(rdev
)) {
854 dev_err(rdev
->dev
, "fence debugfs file creation failed\n");
860 * radeon_fence_driver_fini - tear down the fence driver
861 * for all possible rings.
863 * @rdev: radeon device pointer
865 * Tear down the fence driver for all possible rings (all asics).
867 void radeon_fence_driver_fini(struct radeon_device
*rdev
)
871 mutex_lock(&rdev
->ring_lock
);
872 for (ring
= 0; ring
< RADEON_NUM_RINGS
; ring
++) {
873 if (!rdev
->fence_drv
[ring
].initialized
)
875 r
= radeon_fence_wait_empty_locked(rdev
, ring
);
877 /* no need to trigger GPU reset as we are unloading */
878 radeon_fence_driver_force_completion(rdev
);
880 wake_up_all(&rdev
->fence_queue
);
881 radeon_scratch_free(rdev
, rdev
->fence_drv
[ring
].scratch_reg
);
882 rdev
->fence_drv
[ring
].initialized
= false;
884 mutex_unlock(&rdev
->ring_lock
);
888 * radeon_fence_driver_force_completion - force all fence waiter to complete
890 * @rdev: radeon device pointer
892 * In case of GPU reset failure make sure no process keep waiting on fence
893 * that will never complete.
895 void radeon_fence_driver_force_completion(struct radeon_device
*rdev
)
899 for (ring
= 0; ring
< RADEON_NUM_RINGS
; ring
++) {
900 if (!rdev
->fence_drv
[ring
].initialized
)
902 radeon_fence_write(rdev
, rdev
->fence_drv
[ring
].sync_seq
[ring
], ring
);
910 #if defined(CONFIG_DEBUG_FS)
911 static int radeon_debugfs_fence_info(struct seq_file
*m
, void *data
)
913 struct drm_info_node
*node
= (struct drm_info_node
*)m
->private;
914 struct drm_device
*dev
= node
->minor
->dev
;
915 struct radeon_device
*rdev
= dev
->dev_private
;
918 for (i
= 0; i
< RADEON_NUM_RINGS
; ++i
) {
919 if (!rdev
->fence_drv
[i
].initialized
)
922 seq_printf(m
, "--- ring %d ---\n", i
);
923 seq_printf(m
, "Last signaled fence 0x%016llx\n",
924 (unsigned long long)atomic64_read(&rdev
->fence_drv
[i
].last_seq
));
925 seq_printf(m
, "Last emitted 0x%016llx\n",
926 rdev
->fence_drv
[i
].sync_seq
[i
]);
928 for (j
= 0; j
< RADEON_NUM_RINGS
; ++j
) {
929 if (i
!= j
&& rdev
->fence_drv
[j
].initialized
)
930 seq_printf(m
, "Last sync to ring %d 0x%016llx\n",
931 j
, rdev
->fence_drv
[i
].sync_seq
[j
]);
937 static struct drm_info_list radeon_debugfs_fence_list
[] = {
938 {"radeon_fence_info", &radeon_debugfs_fence_info
, 0, NULL
},
942 int radeon_debugfs_fence_init(struct radeon_device
*rdev
)
944 #if defined(CONFIG_DEBUG_FS)
945 return radeon_debugfs_add_files(rdev
, radeon_debugfs_fence_list
, 1);