/*
 * Copyright 2015 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 * Authors: monk liu <monk.liu@amd.com>
 */

#include <drm/drmP.h>
#include <drm/drm_auth.h>
#include "amdgpu.h"
#include "amdgpu_sched.h"

static int amdgpu_ctx_priority_permit(struct drm_file *filp,
                                      enum drm_sched_priority priority)
{
        /* NORMAL and below are accessible by everyone */
        if (priority <= DRM_SCHED_PRIORITY_NORMAL)
                return 0;

        if (capable(CAP_SYS_NICE))
                return 0;

        if (drm_is_current_master(filp))
                return 0;

        return -EACCES;
}

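/*
 * Initialize a newly allocated context: validate the requested priority,
 * set up the per-ring fence slots, snapshot the reset and VRAM-lost
 * counters and create a scheduler entity for every ring except the KIQ.
 */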
static int amdgpu_ctx_init(struct amdgpu_device *adev,
                           enum drm_sched_priority priority,
                           struct drm_file *filp,
                           struct amdgpu_ctx *ctx)
{
        unsigned i, j;
        int r;

        if (priority < 0 || priority >= DRM_SCHED_PRIORITY_MAX)
                return -EINVAL;

        r = amdgpu_ctx_priority_permit(filp, priority);
        if (r)
                return r;

        memset(ctx, 0, sizeof(*ctx));
        ctx->adev = adev;
        kref_init(&ctx->refcount);
        spin_lock_init(&ctx->ring_lock);
        ctx->fences = kcalloc(amdgpu_sched_jobs * AMDGPU_MAX_RINGS,
                              sizeof(struct dma_fence *), GFP_KERNEL);
        if (!ctx->fences)
                return -ENOMEM;

        mutex_init(&ctx->lock);

        for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
                ctx->rings[i].sequence = 1;
                ctx->rings[i].fences = &ctx->fences[amdgpu_sched_jobs * i];
        }

        ctx->reset_counter = atomic_read(&adev->gpu_reset_counter);
        ctx->reset_counter_query = ctx->reset_counter;
        ctx->vram_lost_counter = atomic_read(&adev->vram_lost_counter);
        ctx->init_priority = priority;
        ctx->override_priority = DRM_SCHED_PRIORITY_UNSET;

        /* create context entity for each ring */
        for (i = 0; i < adev->num_rings; i++) {
                struct amdgpu_ring *ring = adev->rings[i];
                struct drm_sched_rq *rq;

                rq = &ring->sched.sched_rq[priority];

                if (ring == &adev->gfx.kiq.ring)
                        continue;

                r = drm_sched_entity_init(&ctx->rings[i].entity,
                                          &rq, 1, &ctx->guilty);
                if (r)
                        goto failed;
        }

        r = amdgpu_queue_mgr_init(adev, &ctx->queue_mgr);
        if (r)
                goto failed;

        return 0;

failed:
        for (j = 0; j < i; j++)
                drm_sched_entity_destroy(&ctx->rings[j].entity);
        kfree(ctx->fences);
        ctx->fences = NULL;
        return r;
}

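/*
 * Final kref release callback: drop all cached fences, free the fence
 * array and tear down the queue manager before freeing the context.
 */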
static void amdgpu_ctx_fini(struct kref *ref)
{
        struct amdgpu_ctx *ctx = container_of(ref, struct amdgpu_ctx, refcount);
        struct amdgpu_device *adev = ctx->adev;
        unsigned i, j;

        if (!adev)
                return;

        for (i = 0; i < AMDGPU_MAX_RINGS; ++i)
                for (j = 0; j < amdgpu_sched_jobs; ++j)
                        dma_fence_put(ctx->rings[i].fences[j]);
        kfree(ctx->fences);
        ctx->fences = NULL;

        amdgpu_queue_mgr_fini(adev, &ctx->queue_mgr);

        mutex_destroy(&ctx->lock);

        kfree(ctx);
}

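/*
 * Allocate and initialize a context on behalf of userspace and publish
 * it in the file-private IDR; the new handle is returned through @id.
 */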
static int amdgpu_ctx_alloc(struct amdgpu_device *adev,
                            struct amdgpu_fpriv *fpriv,
                            struct drm_file *filp,
                            enum drm_sched_priority priority,
                            uint32_t *id)
{
        struct amdgpu_ctx_mgr *mgr = &fpriv->ctx_mgr;
        struct amdgpu_ctx *ctx;
        int r;

        ctx = kmalloc(sizeof(*ctx), GFP_KERNEL);
        if (!ctx)
                return -ENOMEM;

        mutex_lock(&mgr->lock);
        r = idr_alloc(&mgr->ctx_handles, ctx, 1, 0, GFP_KERNEL);
        if (r < 0) {
                mutex_unlock(&mgr->lock);
                kfree(ctx);
                return r;
        }

        *id = (uint32_t)r;
        r = amdgpu_ctx_init(adev, priority, filp, ctx);
        if (r) {
                idr_remove(&mgr->ctx_handles, *id);
                *id = 0;
                kfree(ctx);
        }
        mutex_unlock(&mgr->lock);

        return r;
}

static void amdgpu_ctx_do_release(struct kref *ref)
{
        struct amdgpu_ctx *ctx;
        u32 i;

        ctx = container_of(ref, struct amdgpu_ctx, refcount);

        for (i = 0; i < ctx->adev->num_rings; i++) {

                if (ctx->adev->rings[i] == &ctx->adev->gfx.kiq.ring)
                        continue;

                drm_sched_entity_destroy(&ctx->rings[i].entity);
        }

        amdgpu_ctx_fini(ref);
}

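/*
 * Remove a context handle from the file-private IDR and drop the
 * reference held by the IDR.
 */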
static int amdgpu_ctx_free(struct amdgpu_fpriv *fpriv, uint32_t id)
{
        struct amdgpu_ctx_mgr *mgr = &fpriv->ctx_mgr;
        struct amdgpu_ctx *ctx;

        mutex_lock(&mgr->lock);
        ctx = idr_remove(&mgr->ctx_handles, id);
        if (ctx)
                kref_put(&ctx->refcount, amdgpu_ctx_do_release);
        mutex_unlock(&mgr->lock);
        return ctx ? 0 : -EINVAL;
}

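/*
 * Legacy reset-status query: reports only whether any GPU reset has
 * happened since the previous query on this context.
 */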
static int amdgpu_ctx_query(struct amdgpu_device *adev,
                            struct amdgpu_fpriv *fpriv, uint32_t id,
                            union drm_amdgpu_ctx_out *out)
{
        struct amdgpu_ctx *ctx;
        struct amdgpu_ctx_mgr *mgr;
        unsigned reset_counter;

        if (!fpriv)
                return -EINVAL;

        mgr = &fpriv->ctx_mgr;
        mutex_lock(&mgr->lock);
        ctx = idr_find(&mgr->ctx_handles, id);
        if (!ctx) {
                mutex_unlock(&mgr->lock);
                return -EINVAL;
        }

        /* TODO: these two are always zero */
        out->state.flags = 0x0;
        out->state.hangs = 0x0;

        /* determine if a GPU reset has occurred since the last call */
        reset_counter = atomic_read(&adev->gpu_reset_counter);
        /* TODO: this should ideally return NO, GUILTY, or INNOCENT. */
        if (ctx->reset_counter_query == reset_counter)
                out->state.reset_status = AMDGPU_CTX_NO_RESET;
        else
                out->state.reset_status = AMDGPU_CTX_UNKNOWN_RESET;
        ctx->reset_counter_query = reset_counter;

        mutex_unlock(&mgr->lock);
        return 0;
}

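/*
 * Extended reset-status query: additionally reports VRAM loss and
 * whether this context was found guilty of a hang.
 */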
static int amdgpu_ctx_query2(struct amdgpu_device *adev,
                             struct amdgpu_fpriv *fpriv, uint32_t id,
                             union drm_amdgpu_ctx_out *out)
{
        struct amdgpu_ctx *ctx;
        struct amdgpu_ctx_mgr *mgr;

        if (!fpriv)
                return -EINVAL;

        mgr = &fpriv->ctx_mgr;
        mutex_lock(&mgr->lock);
        ctx = idr_find(&mgr->ctx_handles, id);
        if (!ctx) {
                mutex_unlock(&mgr->lock);
                return -EINVAL;
        }

        out->state.flags = 0x0;
        out->state.hangs = 0x0;

        if (ctx->reset_counter != atomic_read(&adev->gpu_reset_counter))
                out->state.flags |= AMDGPU_CTX_QUERY2_FLAGS_RESET;

        if (ctx->vram_lost_counter != atomic_read(&adev->vram_lost_counter))
                out->state.flags |= AMDGPU_CTX_QUERY2_FLAGS_VRAMLOST;

        if (atomic_read(&ctx->guilty))
                out->state.flags |= AMDGPU_CTX_QUERY2_FLAGS_GUILTY;

        mutex_unlock(&mgr->lock);
        return 0;
}

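/*
 * Userspace entry point for the context ioctl: dispatches allocation,
 * free and reset-status queries based on the requested operation.
 */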
int amdgpu_ctx_ioctl(struct drm_device *dev, void *data,
                     struct drm_file *filp)
{
        int r;
        uint32_t id;
        enum drm_sched_priority priority;

        union drm_amdgpu_ctx *args = data;
        struct amdgpu_device *adev = dev->dev_private;
        struct amdgpu_fpriv *fpriv = filp->driver_priv;

        r = 0;
        id = args->in.ctx_id;
        priority = amdgpu_to_sched_priority(args->in.priority);

        /* For backwards compatibility reasons, we need to accept
         * ioctls with garbage in the priority field */
        if (priority == DRM_SCHED_PRIORITY_INVALID)
                priority = DRM_SCHED_PRIORITY_NORMAL;

        switch (args->in.op) {
        case AMDGPU_CTX_OP_ALLOC_CTX:
                r = amdgpu_ctx_alloc(adev, fpriv, filp, priority, &id);
                args->out.alloc.ctx_id = id;
                break;
        case AMDGPU_CTX_OP_FREE_CTX:
                r = amdgpu_ctx_free(fpriv, id);
                break;
        case AMDGPU_CTX_OP_QUERY_STATE:
                r = amdgpu_ctx_query(adev, fpriv, id, &args->out);
                break;
        case AMDGPU_CTX_OP_QUERY_STATE2:
                r = amdgpu_ctx_query2(adev, fpriv, id, &args->out);
                break;
        default:
                return -EINVAL;
        }

        return r;
}

struct amdgpu_ctx *amdgpu_ctx_get(struct amdgpu_fpriv *fpriv, uint32_t id)
{
        struct amdgpu_ctx *ctx;
        struct amdgpu_ctx_mgr *mgr;

        if (!fpriv)
                return NULL;

        mgr = &fpriv->ctx_mgr;

        mutex_lock(&mgr->lock);
        ctx = idr_find(&mgr->ctx_handles, id);
        if (ctx)
                kref_get(&ctx->refcount);
        mutex_unlock(&mgr->lock);
        return ctx;
}

int amdgpu_ctx_put(struct amdgpu_ctx *ctx)
{
        if (ctx == NULL)
                return -EINVAL;

        kref_put(&ctx->refcount, amdgpu_ctx_do_release);
        return 0;
}

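/*
 * Store a submitted fence in the per-ring fence ring buffer of this
 * context and return its sequence number through @handler.
 */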
int amdgpu_ctx_add_fence(struct amdgpu_ctx *ctx, struct amdgpu_ring *ring,
                         struct dma_fence *fence, uint64_t *handler)
{
        struct amdgpu_ctx_ring *cring = &ctx->rings[ring->idx];
        uint64_t seq = cring->sequence;
        unsigned idx = 0;
        struct dma_fence *other = NULL;

        idx = seq & (amdgpu_sched_jobs - 1);
        other = cring->fences[idx];
        if (other)
                BUG_ON(!dma_fence_is_signaled(other));

        dma_fence_get(fence);

        spin_lock(&ctx->ring_lock);
        cring->fences[idx] = fence;
        cring->sequence++;
        spin_unlock(&ctx->ring_lock);

        dma_fence_put(other);
        if (handler)
                *handler = seq;

        return 0;
}

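/*
 * Look up a previously added fence by sequence number; returns NULL if
 * the fence has already left the ring buffer (and is therefore known to
 * be signaled) and an ERR_PTR for sequence numbers not yet emitted.
 */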
struct dma_fence *amdgpu_ctx_get_fence(struct amdgpu_ctx *ctx,
                                       struct amdgpu_ring *ring, uint64_t seq)
{
        struct amdgpu_ctx_ring *cring = &ctx->rings[ring->idx];
        struct dma_fence *fence;

        spin_lock(&ctx->ring_lock);

        if (seq == ~0ull)
                seq = ctx->rings[ring->idx].sequence - 1;

        if (seq >= cring->sequence) {
                spin_unlock(&ctx->ring_lock);
                return ERR_PTR(-EINVAL);
        }

        if (seq + amdgpu_sched_jobs < cring->sequence) {
                spin_unlock(&ctx->ring_lock);
                return NULL;
        }

        fence = dma_fence_get(cring->fences[seq & (amdgpu_sched_jobs - 1)]);
        spin_unlock(&ctx->ring_lock);

        return fence;
}

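/*
 * Apply a priority override to the context by moving each scheduler
 * entity (except the KIQ's) to the run queue of the effective priority.
 */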
void amdgpu_ctx_priority_override(struct amdgpu_ctx *ctx,
                                  enum drm_sched_priority priority)
{
        int i;
        struct amdgpu_device *adev = ctx->adev;
        struct drm_sched_rq *rq;
        struct drm_sched_entity *entity;
        struct amdgpu_ring *ring;
        enum drm_sched_priority ctx_prio;

        ctx->override_priority = priority;

        ctx_prio = (ctx->override_priority == DRM_SCHED_PRIORITY_UNSET) ?
                        ctx->init_priority : ctx->override_priority;

        for (i = 0; i < adev->num_rings; i++) {
                ring = adev->rings[i];
                entity = &ctx->rings[i].entity;
                rq = &ring->sched.sched_rq[ctx_prio];

                if (ring->funcs->type == AMDGPU_RING_TYPE_KIQ)
                        continue;

                drm_sched_entity_set_rq(entity, rq);
        }
}

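/*
 * Wait for the fence occupying the ring-buffer slot that the next
 * submission on @ring_id would overwrite.
 */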
int amdgpu_ctx_wait_prev_fence(struct amdgpu_ctx *ctx, unsigned ring_id)
{
        struct amdgpu_ctx_ring *cring = &ctx->rings[ring_id];
        unsigned idx = cring->sequence & (amdgpu_sched_jobs - 1);
        struct dma_fence *other = cring->fences[idx];

        if (other) {
                signed long r;

                r = dma_fence_wait(other, true);
                if (r < 0) {
                        if (r != -ERESTARTSYS)
                                DRM_ERROR("Error (%ld) waiting for fence!\n", r);

                        return r;
                }
        }

        return 0;
}

void amdgpu_ctx_mgr_init(struct amdgpu_ctx_mgr *mgr)
{
        mutex_init(&mgr->lock);
        idr_init(&mgr->ctx_handles);
}

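/*
 * Flush all scheduler entities of all contexts in this manager, giving
 * queued jobs a bounded amount of time to drain.
 */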
void amdgpu_ctx_mgr_entity_flush(struct amdgpu_ctx_mgr *mgr)
{
        struct amdgpu_ctx *ctx;
        struct idr *idp;
        uint32_t id, i;
        long max_wait = MAX_WAIT_SCHED_ENTITY_Q_EMPTY;

        idp = &mgr->ctx_handles;

        mutex_lock(&mgr->lock);
        idr_for_each_entry(idp, ctx, id) {

                if (!ctx->adev) {
                        mutex_unlock(&mgr->lock);
                        return;
                }

                for (i = 0; i < ctx->adev->num_rings; i++) {

                        if (ctx->adev->rings[i] == &ctx->adev->gfx.kiq.ring)
                                continue;

                        max_wait = drm_sched_entity_flush(&ctx->rings[i].entity,
                                                          max_wait);
                }
        }
        mutex_unlock(&mgr->lock);
}

void amdgpu_ctx_mgr_entity_fini(struct amdgpu_ctx_mgr *mgr)
{
        struct amdgpu_ctx *ctx;
        struct idr *idp;
        uint32_t id, i;

        idp = &mgr->ctx_handles;

        idr_for_each_entry(idp, ctx, id) {

                if (!ctx->adev)
                        return;

                for (i = 0; i < ctx->adev->num_rings; i++) {

                        if (ctx->adev->rings[i] == &ctx->adev->gfx.kiq.ring)
                                continue;

                        if (kref_read(&ctx->refcount) == 1)
                                drm_sched_entity_fini(&ctx->rings[i].entity);
                        else
                                DRM_ERROR("ctx %p is still alive\n", ctx);
                }
        }
}

void amdgpu_ctx_mgr_fini(struct amdgpu_ctx_mgr *mgr)
{
        struct amdgpu_ctx *ctx;
        struct idr *idp;
        uint32_t id;

        amdgpu_ctx_mgr_entity_fini(mgr);

        idp = &mgr->ctx_handles;

        idr_for_each_entry(idp, ctx, id) {
                if (kref_put(&ctx->refcount, amdgpu_ctx_fini) != 1)
                        DRM_ERROR("ctx %p is still alive\n", ctx);
        }

        idr_destroy(&mgr->ctx_handles);
        mutex_destroy(&mgr->lock);
}