2 * Copyright © 2008-2015 Intel Corporation
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
25 #ifndef I915_GEM_REQUEST_H
26 #define I915_GEM_REQUEST_H
28 #include <linux/fence.h>
33 * Request queue structure.
35 * The request queue allows us to note sequence numbers that have been emitted
36 * and may be associated with active buffers to be retired.
38 * By keeping this list, we can avoid having to do questionable sequence
39 * number comparisons on buffer last_read|write_seqno. It also allows an
40 * emission time to be associated with the request for tracking how far ahead
41 * of the GPU the submission is.
43 * The requests are reference counted.
45 struct drm_i915_gem_request
{
49 /** The i915 device on which this request was generated */
50 struct drm_i915_private
*i915
;
53 * Context and ring buffer related to this request
54 * Contexts are refcounted, so when this request is associated with a
55 * context, we must increment the context's refcount, to guarantee that
56 * it persists while any request is linked to it. Requests themselves
57 * are also refcounted, so the request will only be freed when the last
58 * reference to it is dismissed, and the code in
59 * i915_gem_request_free() will then decrement the refcount on the
62 struct i915_gem_context
*ctx
;
63 struct intel_engine_cs
*engine
;
64 struct intel_ring
*ring
;
65 struct intel_signal_node signaling
;
67 /** GEM sequence number associated with the previous request,
68 * when the HWS breadcrumb is equal to this the GPU is processing
73 /** Position in the ringbuffer of the start of the request */
77 * Position in the ringbuffer of the start of the postfix.
78 * This is required to calculate the maximum available ringbuffer
79 * space without overwriting the postfix.
83 /** Position in the ringbuffer of the end of the whole request */
86 /** Preallocate space in the ringbuffer for emitting the request */
90 * Context related to the previous request.
91 * As the contexts are accessed by the hardware until the switch is
92 * completed to a new context, the hardware may still be writing
93 * to the context object after the breadcrumb is visible. We must
94 * not unpin/unbind/prune that object whilst still active and so
95 * we keep the previous context pinned until the following (this)
98 struct i915_gem_context
*previous_context
;
100 /** Batch buffer related to this request if any (used for
101 * error state dump only).
103 struct drm_i915_gem_object
*batch_obj
;
104 struct list_head active_list
;
106 /** Time at which this request was emitted, in jiffies. */
107 unsigned long emitted_jiffies
;
109 /** engine->request_list entry for this request */
110 struct list_head link
;
112 /** ring->request_list entry for this request */
113 struct list_head ring_link
;
115 struct drm_i915_file_private
*file_priv
;
116 /** file_priv list entry for this request */
117 struct list_head client_list
;
119 /** process identifier submitting this request */
123 * The ELSP only accepts two elements at a time, so we queue
124 * context/tail pairs on a given queue (ring->execlist_queue) until the
125 * hardware is available. The queue serves a double purpose: we also use
126 * it to keep track of the up to 2 contexts currently in the hardware
127 * (usually one in execution and the other queued up by the GPU): We
128 * only remove elements from the head of the queue when the hardware
129 * informs us that an element has been completed.
131 * All accesses to the queue are mediated by a spinlock
132 * (ring->execlist_lock).
135 /** Execlist link in the submission queue.*/
136 struct list_head execlist_link
;
138 /** Execlists no. of times this request has been sent to the ELSP */
141 /** Execlists context hardware id. */
142 unsigned int ctx_hw_id
;
145 extern const struct fence_ops i915_fence_ops
;
147 static inline bool fence_is_i915(struct fence
*fence
)
149 return fence
->ops
== &i915_fence_ops
;
152 struct drm_i915_gem_request
* __must_check
153 i915_gem_request_alloc(struct intel_engine_cs
*engine
,
154 struct i915_gem_context
*ctx
);
155 int i915_gem_request_add_to_client(struct drm_i915_gem_request
*req
,
156 struct drm_file
*file
);
157 void i915_gem_request_retire_upto(struct drm_i915_gem_request
*req
);
160 i915_gem_request_get_seqno(struct drm_i915_gem_request
*req
)
162 return req
? req
->fence
.seqno
: 0;
165 static inline struct intel_engine_cs
*
166 i915_gem_request_get_engine(struct drm_i915_gem_request
*req
)
168 return req
? req
->engine
: NULL
;
171 static inline struct drm_i915_gem_request
*
172 to_request(struct fence
*fence
)
174 /* We assume that NULL fence/request are interoperable */
175 BUILD_BUG_ON(offsetof(struct drm_i915_gem_request
, fence
) != 0);
176 GEM_BUG_ON(fence
&& !fence_is_i915(fence
));
177 return container_of(fence
, struct drm_i915_gem_request
, fence
);
180 static inline struct drm_i915_gem_request
*
181 i915_gem_request_get(struct drm_i915_gem_request
*req
)
183 return to_request(fence_get(&req
->fence
));
187 i915_gem_request_put(struct drm_i915_gem_request
*req
)
189 fence_put(&req
->fence
);
192 static inline void i915_gem_request_assign(struct drm_i915_gem_request
**pdst
,
193 struct drm_i915_gem_request
*src
)
196 i915_gem_request_get(src
);
199 i915_gem_request_put(*pdst
);
204 void __i915_add_request(struct drm_i915_gem_request
*req
,
205 struct drm_i915_gem_object
*batch_obj
,
/*
 * Shorthands for __i915_add_request() that pass NULL as the batch object.
 * i915_add_request() passes true as the third argument, the _no_flush
 * variant passes false.
 */
#define i915_add_request(req) \
	__i915_add_request(req, NULL, true)
#define i915_add_request_no_flush(req) \
	__i915_add_request(req, NULL, false)
struct intel_rps_client;

/*
 * Helpers for classifying a struct intel_rps_client pointer:
 *  - NO_WAITBOOST is the error pointer ERR_PTR(-1);
 *  - IS_RPS_CLIENT() is true for anything that is not an error pointer,
 *    NULL included;
 *  - IS_RPS_USER() is true only for a non-NULL, non-error pointer.
 */
#define NO_WAITBOOST ERR_PTR(-1)
#define IS_RPS_CLIENT(p) (!IS_ERR(p))
#define IS_RPS_USER(p) (!IS_ERR_OR_NULL(p))
217 int i915_wait_request(struct drm_i915_gem_request
*req
,
220 struct intel_rps_client
*rps
)
221 __attribute__((nonnull(1)));
223 static inline u32
intel_engine_get_seqno(struct intel_engine_cs
*engine
);
226 * Returns true if seq1 is later than seq2.
228 static inline bool i915_seqno_passed(u32 seq1
, u32 seq2
)
230 return (s32
)(seq1
- seq2
) >= 0;
234 i915_gem_request_started(const struct drm_i915_gem_request
*req
)
236 return i915_seqno_passed(intel_engine_get_seqno(req
->engine
),
237 req
->previous_seqno
);
241 i915_gem_request_completed(const struct drm_i915_gem_request
*req
)
243 return i915_seqno_passed(intel_engine_get_seqno(req
->engine
),
247 bool __i915_spin_request(const struct drm_i915_gem_request
*request
,
248 int state
, unsigned long timeout_us
);
249 static inline bool i915_spin_request(const struct drm_i915_gem_request
*request
,
250 int state
, unsigned long timeout_us
)
252 return (i915_gem_request_started(request
) &&
253 __i915_spin_request(request
, state
, timeout_us
));
256 /* We treat requests as fences. This is not to be confused with our
257 * "fence registers" but pipeline synchronisation objects ala GL_ARB_sync.
258 * We use the fences to synchronize access from the CPU with activity on the
259 * GPU, for example, we should not rewrite an object's PTE whilst the GPU
260 * is reading them. We also track fences at a higher level to provide
261 * implicit synchronisation around GEM objects, e.g. set-domain will wait
262 * for outstanding GPU rendering before marking the object ready for CPU
263 * access, or a pageflip will wait until the GPU is complete before showing
264 * the frame on the scanout.
266 * In order to use a fence, the object must track the fence it needs to
267 * serialise with. For example, GEM objects want to track both read and
268 * write access so that we can perform concurrent read operations between
269 * the CPU and GPU engines, as well as waiting for all rendering to
270 * complete, or waiting for the last GPU user of a "fence register". The
271 * object then embeds a #i915_gem_active to track the most recent (in
272 * retirement order) request relevant for the desired mode of access.
273 * The #i915_gem_active is updated with i915_gem_active_set() to track the
274 * most recent fence request, typically this is done as part of
275 * i915_vma_move_to_active().
277 * When the #i915_gem_active completes (is retired), it will
278 * signal its completion to the owner through a callback as well as mark
279 * itself as idle (i915_gem_active.request == NULL). The owner
280 * can then perform any action, such as delayed freeing of an active
281 * resource including itself.
283 struct i915_gem_active
;
285 typedef void (*i915_gem_retire_fn
)(struct i915_gem_active
*,
286 struct drm_i915_gem_request
*);
288 struct i915_gem_active
{
289 struct drm_i915_gem_request
*request
;
290 struct list_head link
;
291 i915_gem_retire_fn retire
;
294 void i915_gem_retire_noop(struct i915_gem_active
*,
295 struct drm_i915_gem_request
*request
);
298 * init_request_active - prepares the activity tracker for use
299 * @active - the active tracker
300 * @retire - a callback when the tracker is retired (becomes idle),
303 * init_request_active() prepares the embedded @active struct for use as
304 * an activity tracker, that is for tracking the last known active request
305 * associated with it. When the last request becomes idle, when it is retired
306 * after completion, the optional callback @retire is invoked.
309 init_request_active(struct i915_gem_active
*active
,
310 i915_gem_retire_fn retire
)
312 INIT_LIST_HEAD(&active
->link
);
313 active
->retire
= retire
?: i915_gem_retire_noop
;
317 * i915_gem_active_set - updates the tracker to watch the current request
318 * @active - the active tracker
319 * @request - the request to watch
321 * i915_gem_active_set() watches the given @request for completion. Whilst
322 * that @request is busy, the @active reports busy. When that @request is
323 * retired, the @active tracker is updated to report idle.
326 i915_gem_active_set(struct i915_gem_active
*active
,
327 struct drm_i915_gem_request
*request
)
329 list_move(&active
->link
, &request
->active_list
);
330 active
->request
= request
;
333 static inline struct drm_i915_gem_request
*
334 __i915_gem_active_peek(const struct i915_gem_active
*active
)
336 return active
->request
;
340 * i915_gem_active_peek - report the active request being monitored
341 * @active - the active tracker
343 * i915_gem_active_peek() returns the current request being tracked if
344 * still active, or NULL. It does not obtain a reference on the request
345 * for the caller, so the caller must hold struct_mutex.
347 static inline struct drm_i915_gem_request
*
348 i915_gem_active_peek(const struct i915_gem_active
*active
, struct mutex
*mutex
)
350 struct drm_i915_gem_request
*request
;
352 request
= active
->request
;
353 if (!request
|| i915_gem_request_completed(request
))
/**
 * i915_gem_active_get - return a reference to the active request
 * @active: the active tracker
 * @mutex: forwarded unchanged to i915_gem_active_peek()
 *
 * Looks up the tracked request with i915_gem_active_peek() and passes it
 * through i915_gem_request_get(). The result is the active request, or NULL
 * if the active tracker is idle. The caller must hold struct_mutex.
 */
static inline struct drm_i915_gem_request *
i915_gem_active_get(const struct i915_gem_active *active, struct mutex *mutex)
{
	struct drm_i915_gem_request *request;

	request = i915_gem_active_peek(active, mutex);
	return i915_gem_request_get(request);
}
373 * i915_gem_active_isset - report whether the active tracker is assigned
374 * @active - the active tracker
376 * i915_gem_active_isset() returns true if the active tracker is currently
377 * assigned to a request. Due to the lazy retiring, that request may be idle
378 * and this may report stale information.
381 i915_gem_active_isset(const struct i915_gem_active
*active
)
383 return active
->request
;
387 * i915_gem_active_is_idle - report whether the active tracker is idle
388 * @active - the active tracker
390 * i915_gem_active_is_idle() returns true if the active tracker is currently
391 * unassigned or if the request is complete (but not yet retired). Requires
392 * the caller to hold struct_mutex (but that can be relaxed if desired).
395 i915_gem_active_is_idle(const struct i915_gem_active
*active
,
398 return !i915_gem_active_peek(active
, mutex
);
402 * i915_gem_active_wait - waits until the request is completed
403 * @active - the active request on which to wait
405 * i915_gem_active_wait() waits until the request is completed before
406 * returning. Note that it does not guarantee that the request is
407 * retired first, see i915_gem_active_retire().
409 * i915_gem_active_wait() returns immediately if the active
410 * request is already complete.
412 static inline int __must_check
413 i915_gem_active_wait(const struct i915_gem_active
*active
, struct mutex
*mutex
)
415 struct drm_i915_gem_request
*request
;
417 request
= i915_gem_active_peek(active
, mutex
);
421 return i915_wait_request(request
, true, NULL
, NULL
);
425 * i915_gem_active_retire - waits until the request is retired
426 * @active - the active request on which to wait
428 * i915_gem_active_retire() waits until the request is completed,
429 * and then ensures that at least the retirement handler for this
430 * @active tracker is called before returning. If the @active
431 * tracker is idle, the function returns immediately.
433 static inline int __must_check
434 i915_gem_active_retire(struct i915_gem_active
*active
,
437 struct drm_i915_gem_request
*request
;
440 request
= active
->request
;
444 ret
= i915_wait_request(request
, true, NULL
, NULL
);
448 list_del_init(&active
->link
);
449 active
->request
= NULL
;
450 active
->retire(active
, request
);
455 /* Convenience functions for peeking at state inside active's request whilst
456 * guarded by the struct_mutex.
459 static inline uint32_t
460 i915_gem_active_get_seqno(const struct i915_gem_active
*active
,
463 return i915_gem_request_get_seqno(i915_gem_active_peek(active
, mutex
));
466 static inline struct intel_engine_cs
*
467 i915_gem_active_get_engine(const struct i915_gem_active
*active
,
470 return i915_gem_request_get_engine(i915_gem_active_peek(active
, mutex
));
/*
 * for_each_active - visit every set bit of @mask, lowest bit first
 * @mask: modifiable bitmask; each visited bit is cleared after its
 *        iteration, so @mask is 0 once the loop has run to completion
 * @idx: modifiable variable that receives the zero-based index of the bit
 *       handled by the current iteration
 *
 * Both arguments are expanded more than once, so they must be plain lvalues
 * without side effects. Every expansion is parenthesised and the comma
 * expression is grouped explicitly, so operator precedence inside an
 * argument cannot change how the loop condition is parsed.
 */
#define for_each_active(mask, idx) \
	for (; (mask) ? ((idx) = ffs(mask) - 1, 1) : 0; (mask) &= ~BIT(idx))
476 #endif /* I915_GEM_REQUEST_H */