...
 #define I915_REQUEST_H
 
 #include <linux/dma-fence.h>
+#include <linux/irq_work.h>
+#include <linux/lockdep.h>
+
+#include "gem/i915_gem_context_types.h"
+#include "gt/intel_context_types.h"
+#include "gt/intel_engine_types.h"
+#include "gt/intel_timeline_types.h"
 
 #include "i915_gem.h"
 #include "i915_scheduler.h"
+#include "i915_selftest.h"
 #include "i915_sw_fence.h"
-#include "i915_scheduler.h"
 
 #include <uapi/drm/i915_drm.h>
 
 struct drm_file;
 struct drm_i915_gem_object;
 struct i915_request;
-struct i915_timeline;
-
-struct intel_wait {
-        struct rb_node node;
-        struct task_struct *tsk;
-        struct i915_request *request;
-        u32 seqno;
-};
-
-struct intel_signal_node {
-        struct intel_wait wait;
-        struct list_head link;
-};
 
 struct i915_capture_list {
         struct i915_capture_list *next;
         struct i915_vma *vma;
+};
+
+#define RQ_TRACE(rq, fmt, ...) do { \
+        const struct i915_request *rq__ = (rq); \
+        ENGINE_TRACE(rq__->engine, "fence %llx:%lld, current %d " fmt, \
+                     rq__->fence.context, rq__->fence.seqno, \
+                     hwsp_seqno(rq__), ##__VA_ARGS__); \
+} while (0)
+
+enum {
+        /*
+         * I915_FENCE_FLAG_ACTIVE - this request is currently submitted to HW.
+         *
+         * Set by __i915_request_submit() on handing over to HW, and cleared
+         * by __i915_request_unsubmit() if we preempt this request.
+         *
+         * Finally cleared for consistency on retiring the request, when
+         * we know the HW is no longer running this request.
+         *
+         * See i915_request_is_active()
+         */
+        I915_FENCE_FLAG_ACTIVE = DMA_FENCE_FLAG_USER_BITS,
+
+        /*
+         * I915_FENCE_FLAG_PQUEUE - this request is ready for execution
+         *
+         * Using the scheduler, when a request is ready for execution it is put
+         * into the priority queue, and removed from that queue when transferred
+         * to the HW runlists. We want to track its membership within the
+         * priority queue so that we can easily check before rescheduling.
+         *
+         * See i915_request_in_priority_queue()
+         */
+        I915_FENCE_FLAG_PQUEUE,
+
+        /*
+         * I915_FENCE_FLAG_HOLD - this request is currently on hold
+         *
+         * This request has been suspended, pending an ongoing investigation.
+         */
+        I915_FENCE_FLAG_HOLD,
+
+        /*
+         * I915_FENCE_FLAG_INITIAL_BREADCRUMB - this request has the initial
+         * breadcrumb that marks the end of semaphore waits and the start of
+         * the user payload.
+         */
+        I915_FENCE_FLAG_INITIAL_BREADCRUMB,
+
+        /*
+         * I915_FENCE_FLAG_SIGNAL - this request is currently on signal_list
+         *
+         * Internal bookkeeping used by the breadcrumb code to track when
+         * a request is on the various signal_list.
+         */
+        I915_FENCE_FLAG_SIGNAL,
+
+        /*
+         * I915_FENCE_FLAG_NOPREEMPT - this request should not be preempted
+         *
+         * The execution of some requests should not be interrupted. This is
+         * a sensitive operation as it makes the request super important,
+         * blocking other higher priority work. Abuse of this flag will
+         * lead to quality of service issues.
+         */
+        I915_FENCE_FLAG_NOPREEMPT,
+
+        /*
+         * I915_FENCE_FLAG_SENTINEL - this request should be last in the queue
+         *
+         * A high priority sentinel request may be submitted to clear the
+         * submission queue. As it will be the only request in-flight, upon
+         * execution all other active requests will have been preempted and
+         * unsubmitted. This preemptive pulse is used to re-evaluate the
+         * in-flight requests, particularly in cases where an active context
+         * is banned and those active requests need to be cancelled.
+         */
+        I915_FENCE_FLAG_SENTINEL,
+
+        /*
+         * I915_FENCE_FLAG_BOOST - upclock the GPU for this request
+         *
+         * Some requests are more important than others! In particular, a
+         * request that the user is waiting on is typically required for
+         * interactive latency, which we want to minimise by upclocking
+         * the GPU. Here we track such boost requests on a per-request basis.
+         */
+        I915_FENCE_FLAG_BOOST,
 };
 
 /**
...
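
Note: RQ_TRACE(), added above, prefixes every trace message with the
request's fence id (context:seqno) and the breadcrumb currently visible to
the CPU via hwsp_seqno(). A minimal sketch of a call site follows;
ENGINE_TRACE() comes from the engine headers pulled in above, and the
function shown here is purely illustrative, not part of this patch:

static void example_trace_submit(struct i915_request *rq)
{
        /* emits "fence %llx:%lld, current %d submitting" for this rq */
        RQ_TRACE(rq, "submitting\n");
}
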
---|
         struct dma_fence fence;
         spinlock_t lock;
 
-        /** On Which ring this request was generated */
-        struct drm_i915_private *i915;
-
         /**
          * Context and ring buffer related to this request
          * Contexts are refcounted, so when this request is associated with a
...
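
Note: the request embeds a struct dma_fence, so the generic dma-fence API
operates directly on &rq->fence. A hedged sketch of a synchronous wait
(hypothetical helper, error handling trimmed):

static int example_wait_on_request(struct i915_request *rq)
{
        struct dma_fence *fence = dma_fence_get(&rq->fence);
        long ret;

        ret = dma_fence_wait(fence, true /* interruptible */);
        dma_fence_put(fence);

        return ret < 0 ? ret : 0;
}
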
---|
          * i915_request_free() will then decrement the refcount on the
          * context.
          */
-        struct i915_gem_context *gem_context;
         struct intel_engine_cs *engine;
-        struct intel_context *hw_context;
+        struct intel_context *context;
         struct intel_ring *ring;
-        struct i915_timeline *timeline;
-        struct intel_signal_node signaling;
+        struct intel_timeline __rcu *timeline;
+
+        struct list_head signal_link;
+        struct llist_node signal_node;
+
+        /*
+         * The RCU epoch in which this request was allocated. Used to
+         * judiciously apply backpressure on future allocations to ensure
+         * that under memory pressure there are sufficient RCU ticks for
+         * us to reclaim our RCU protected slabs.
+         */
+        unsigned long rcustate;
+
+        /*
+         * We pin the timeline->mutex while constructing the request to
+         * ensure that no caller accidentally drops it during construction.
+         * The timeline->mutex must be held to ensure that only this caller
+         * can use the ring and manipulate the associated timeline during
+         * construction.
+         */
+        struct pin_cookie cookie;
 
         /*
...
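
Note: the pin_cookie above uses lockdep's lock pinning. Once a held lock is
pinned, releasing it before the matching unpin triggers a lockdep warning,
which is how an accidental unlock of timeline->mutex mid-construction gets
caught. A minimal sketch of the idiom, using an illustrative mutex rather
than driver code:

static void example_pinned_section(struct mutex *lock)
{
        struct pin_cookie cookie;

        mutex_lock(lock);
        cookie = lockdep_pin_lock(lock);

        /* ... dropping `lock` in here would splat under lockdep ... */

        lockdep_unpin_lock(lock, cookie);
        mutex_unlock(lock);
}
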
---|
          * It is used by the driver to then queue the request for execution.
          */
         struct i915_sw_fence submit;
-        wait_queue_entry_t submitq;
-        wait_queue_head_t execute;
+        union {
+                wait_queue_entry_t submitq;
+                struct i915_sw_dma_fence_cb dmaq;
+                struct i915_request_duration_cb {
+                        struct dma_fence_cb cb;
+                        ktime_t emitted;
+                } duration;
+        };
+        struct llist_head execute_cb;
+        struct i915_sw_fence semaphore;
 
         /*
          * A list of everyone we wait upon, and everyone who waits upon us.
...
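
Note: the union members are live in mutually exclusive phases of the
request's life, which is why they may share storage; `duration` in
particular is an ordinary dma_fence_cb plus a timestamp. A hedged sketch of
how such a callback could be armed with the generic
dma_fence_add_callback() (the function names are illustrative):

static void example_duration_cb(struct dma_fence *fence, struct dma_fence_cb *cb)
{
        struct i915_request_duration_cb *dur =
                container_of(cb, typeof(*dur), cb);

        /* signaled: ktime_get() - dur->emitted is the elapsed duration */
}

static void example_arm_duration(struct i915_request *rq)
{
        rq->duration.emitted = ktime_get();
        if (dma_fence_add_callback(&rq->fence, &rq->duration.cb,
                                   example_duration_cb))
                ; /* fence already signaled; callback will not run */
}
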
---|
          */
         struct i915_sched_node sched;
         struct i915_dependency dep;
+        intel_engine_mask_t execution_mask;
 
-        /**
-         * GEM sequence number associated with this request on the
-         * global execution timeline. It is zero when the request is not
-         * on the HW queue (i.e. not on the engine timeline list).
-         * Its value is guarded by the timeline spinlock.
+        /*
+         * A convenience pointer to the current breadcrumb value stored in
+         * the HW status page (or our timeline's local equivalent). The full
+         * path would be rq->context->ring->timeline->hwsp_seqno.
          */
-        u32 global_seqno;
+        const u32 *hwsp_seqno;
+
+        /*
+         * If we need to access the timeline's seqno for this request in
+         * another request, we need to keep a read reference to this associated
+         * cacheline, so that we do not free and recycle it before the foreign
+         * observers have completed. Hence, we keep a pointer to the cacheline
+         * inside the timeline's HWSP vma, but it is only valid while this
+         * request has not completed and is guarded by the timeline mutex.
+         */
+        struct intel_timeline_cacheline __rcu *hwsp_cacheline;
 
         /** Position in the ring of the start of the request */
         u32 head;
...
---|
          * on the active_list (of their final request).
          */
         struct i915_capture_list *capture_list;
-        struct list_head active_list;
 
         /** Time at which this request was emitted, in jiffies. */
         unsigned long emitted_jiffies;
 
-        bool waitboost;
-
-        /** engine->request_list entry for this request */
+        /** timeline->requests entry for this request */
         struct list_head link;
 
-        /** ring->request_list entry for this request */
-        struct list_head ring_link;
-
-        struct drm_i915_file_private *file_priv;
-        /** file_priv list entry for this request */
-        struct list_head client_link;
+        I915_SELFTEST_DECLARE(struct {
+                struct list_head link;
+                unsigned long delay;
+        } mock;)
 };
 
 #define I915_FENCE_GFP (GFP_KERNEL | __GFP_RETRY_MAYFAIL | __GFP_NOWARN)
...
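
Note: I915_FENCE_GFP opts request allocation out of the OOM killer:
__GFP_RETRY_MAYFAIL means the allocator tries hard but returns NULL rather
than killing anything, and __GFP_NOWARN suppresses the failure splat. A
hedged sketch using the slab-cache accessor declared just below (the
wrapper itself is hypothetical):

static struct i915_request *example_alloc_request(void)
{
        /* may return NULL under memory pressure; the caller must cope */
        return kmem_cache_alloc(i915_request_slab_cache(), I915_FENCE_GFP);
}
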
---|
         return fence->ops == &i915_fence_ops;
 }
 
+struct kmem_cache *i915_request_slab_cache(void);
+
 struct i915_request * __must_check
-i915_request_alloc(struct intel_engine_cs *engine,
-                   struct i915_gem_context *ctx);
+__i915_request_create(struct intel_context *ce, gfp_t gfp);
+struct i915_request * __must_check
+i915_request_create(struct intel_context *ce);
+
+void i915_request_set_error_once(struct i915_request *rq, int error);
+void __i915_request_skip(struct i915_request *rq);
+
+struct i915_request *__i915_request_commit(struct i915_request *request);
+void __i915_request_queue(struct i915_request *rq,
+                          const struct i915_sched_attr *attr);
+
+bool i915_request_retire(struct i915_request *rq);
 void i915_request_retire_upto(struct i915_request *rq);
 
 static inline struct i915_request *
...
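
Note: with i915_request_alloc(engine, ctx) gone, requests are created
directly on an intel_context. The canonical pattern, as far as this header
shows it, is create -> await -> emit -> add; a hedged sketch (ring emission
elided, error handling abbreviated, and i915_request_await_dma_fence() is
declared in the next hunk):

static int example_emit(struct intel_context *ce, struct dma_fence *wait_on)
{
        struct i915_request *rq;
        int err = 0;

        rq = i915_request_create(ce); /* ce must already be pinned */
        if (IS_ERR(rq))
                return PTR_ERR(rq);

        if (wait_on)
                err = i915_request_await_dma_fence(rq, wait_on);

        /* ... emit commands into rq->ring here ... */

        i915_request_add(rq); /* always add, even after an error */
        return err;
}
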
---|
         dma_fence_put(&rq->fence);
 }
 
-/**
- * i915_request_global_seqno - report the current global seqno
- * @request - the request
- *
- * A request is assigned a global seqno only when it is on the hardware
- * execution queue. The global seqno can be used to maintain a list of
- * requests on the same engine in retirement order, for example for
- * constructing a priority queue for waiting. Prior to its execution, or
- * if it is subsequently removed in the event of preemption, its global
- * seqno is zero. As both insertion and removal from the execution queue
- * may operate in IRQ context, it is not guarded by the usual struct_mutex
- * BKL. Instead those relying on the global seqno must be prepared for its
- * value to change between reads. Only when the request is complete can
- * the global seqno be stable (due to the memory barriers on submitting
- * the commands to the hardware to write the breadcrumb, if the HWS shows
- * that it has passed the global seqno and the global seqno is unchanged
- * after the read, it is indeed complete).
- */
-static u32
-i915_request_global_seqno(const struct i915_request *request)
-{
-        return READ_ONCE(request->global_seqno);
-}
-
 int i915_request_await_object(struct i915_request *to,
                               struct drm_i915_gem_object *obj,
                               bool write);
 int i915_request_await_dma_fence(struct i915_request *rq,
                                  struct dma_fence *fence);
+int i915_request_await_execution(struct i915_request *rq,
+                                 struct dma_fence *fence,
+                                 void (*hook)(struct i915_request *rq,
+                                              struct dma_fence *signal));
 
 void i915_request_add(struct i915_request *rq);
 
-void __i915_request_submit(struct i915_request *request);
+bool __i915_request_submit(struct i915_request *request);
 void i915_request_submit(struct i915_request *request);
-
-void i915_request_skip(struct i915_request *request, int error);
 
 void __i915_request_unsubmit(struct i915_request *request);
 void i915_request_unsubmit(struct i915_request *request);
...
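
Note: going the other way, a generic struct dma_fence * is identified with
dma_fence_is_i915() (earlier hunk) and converted back to its containing
request; the full header provides a to_request() helper to this effect in
an elided hunk. A hedged reconstruction, for illustration only:

static inline struct i915_request *example_to_request(struct dma_fence *fence)
{
        if (!fence || !dma_fence_is_i915(fence))
                return NULL;

        return container_of(fence, struct i915_request, fence);
}
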
---|
                            long timeout)
         __attribute__((nonnull(1)));
 #define I915_WAIT_INTERRUPTIBLE BIT(0)
-#define I915_WAIT_LOCKED BIT(1) /* struct_mutex held, handle GPU reset */
+#define I915_WAIT_PRIORITY BIT(1) /* small priority bump for the request */
 #define I915_WAIT_ALL BIT(2) /* used by i915_gem_object_wait() */
-#define I915_WAIT_FOR_IDLE_BOOST BIT(3)
 
-static inline u32 intel_engine_get_seqno(struct intel_engine_cs *engine);
+static inline bool i915_request_signaled(const struct i915_request *rq)
+{
+        /* The request may live longer than its HWSP, so check flags first! */
+        return test_bit(DMA_FENCE_FLAG_SIGNALED_BIT, &rq->fence.flags);
+}
+
+static inline bool i915_request_is_active(const struct i915_request *rq)
+{
+        return test_bit(I915_FENCE_FLAG_ACTIVE, &rq->fence.flags);
+}
+
+static inline bool i915_request_in_priority_queue(const struct i915_request *rq)
+{
+        return test_bit(I915_FENCE_FLAG_PQUEUE, &rq->fence.flags);
+}
+
+static inline bool
+i915_request_has_initial_breadcrumb(const struct i915_request *rq)
+{
+        return test_bit(I915_FENCE_FLAG_INITIAL_BREADCRUMB, &rq->fence.flags);
+}
 
 /**
  * Returns true if seq1 is later than seq2.
...
---|
         return (s32)(seq1 - seq2) >= 0;
 }
 
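
Note: i915_seqno_passed() relies on wrapping unsigned subtraction, so the
ordering stays correct across the u32 wrap as long as the two seqnos are
within 2^31 of each other. A standalone userspace demo of the same trick:

#include <stdint.h>
#include <stdio.h>

static int seqno_passed(uint32_t seq1, uint32_t seq2)
{
        return (int32_t)(seq1 - seq2) >= 0; /* same test as above */
}

int main(void)
{
        printf("%d\n", seqno_passed(2, 0xfffffffeu)); /* 1: later across the wrap */
        printf("%d\n", seqno_passed(0xfffffffeu, 2)); /* 0 */
        return 0;
}
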
---|
-static inline bool
-__i915_request_completed(const struct i915_request *rq, u32 seqno)
+static inline u32 __hwsp_seqno(const struct i915_request *rq)
 {
-        GEM_BUG_ON(!seqno);
-        return i915_seqno_passed(intel_engine_get_seqno(rq->engine), seqno) &&
-                seqno == i915_request_global_seqno(rq);
+        const u32 *hwsp = READ_ONCE(rq->hwsp_seqno);
+
+        return READ_ONCE(*hwsp);
+}
+
+/**
+ * hwsp_seqno - the current breadcrumb value in the HW status page
+ * @rq: the request, to chase the relevant HW status page
+ *
+ * The emphasis in naming here is that hwsp_seqno() is not a property of the
+ * request, but an indication of the current HW state (associated with this
+ * request). Its value will change as the GPU executes more requests.
+ *
+ * Returns the current breadcrumb value in the associated HW status page (or
+ * the local timeline's equivalent) for this request. The request itself
+ * has the associated breadcrumb value of rq->fence.seqno; when the HW
+ * status page has that breadcrumb or later, this request is complete.
+ */
+static inline u32 hwsp_seqno(const struct i915_request *rq)
+{
+        u32 seqno;
+
+        rcu_read_lock(); /* the HWSP may be freed at runtime */
+        seqno = __hwsp_seqno(rq);
+        rcu_read_unlock();
+
+        return seqno;
+}
+
+static inline bool __i915_request_has_started(const struct i915_request *rq)
+{
+        return i915_seqno_passed(__hwsp_seqno(rq), rq->fence.seqno - 1);
+}
+
+/**
+ * i915_request_started - check if the request has begun being executed
+ * @rq: the request
+ *
+ * If the timeline is not using initial breadcrumbs, a request is
+ * considered started if the previous request on its timeline (i.e.
+ * context) has been signaled.
+ *
+ * If the timeline is using semaphores, it will also be emitting an
+ * "initial breadcrumb" after the semaphores are complete and just before
+ * it begins executing the user payload. A request can therefore be active
+ * on the HW and not yet started, as it is still busywaiting on its
+ * dependencies (via HW semaphores).
+ *
+ * If the request has started, its dependencies will have been signaled
+ * (either by fences or by semaphores) and it will have begun processing
+ * the user payload.
+ *
+ * However, even if a request has started, it may have been preempted and
+ * so no longer be active, or it may have already completed.
+ *
+ * See also i915_request_is_active().
+ *
+ * Returns true if the request has begun executing the user payload, or
+ * has completed.
+ */
+static inline bool i915_request_started(const struct i915_request *rq)
+{
+        bool result;
+
+        if (i915_request_signaled(rq))
+                return true;
+
+        result = true;
+        rcu_read_lock(); /* the HWSP may be freed at runtime */
+        if (likely(!i915_request_signaled(rq)))
+                /* Remember: started but may have since been preempted! */
+                result = __i915_request_has_started(rq);
+        rcu_read_unlock();
+
+        return result;
+}
+
+/**
+ * i915_request_is_running - check if the request may actually be executing
+ * @rq: the request
+ *
+ * Returns true if the request is currently submitted to hardware and has
+ * passed its start point (i.e. the context is set up and it is not
+ * busywaiting). Note that it may no longer be running by the time the
+ * function returns!
+ */
+static inline bool i915_request_is_running(const struct i915_request *rq)
+{
+        bool result;
+
+        if (!i915_request_is_active(rq))
+                return false;
+
+        rcu_read_lock();
+        result = __i915_request_has_started(rq) && i915_request_is_active(rq);
+        rcu_read_unlock();
+
+        return result;
+}
+
+/**
+ * i915_request_is_ready - check if the request is ready for execution
+ * @rq: the request
+ *
+ * Upon construction, the request is instructed to wait upon various
+ * signals before it is ready to be executed by the HW. That is, we do
+ * not want to start execution and read data before it is written. In practice,
+ * this is controlled with a mixture of interrupts and semaphores. Once
+ * the submit fence is completed, the backend scheduler will place the
+ * request into its queue and from there submit it for execution. So we
+ * can detect when a request is eligible for execution (and is under control
+ * of the scheduler) by querying where it is in any of the scheduler's lists.
+ *
+ * Returns true if the request is ready for execution (it may be inflight),
+ * false otherwise.
+ */
+static inline bool i915_request_is_ready(const struct i915_request *rq)
+{
+        return !list_empty(&rq->sched.link);
+}
+
+static inline bool __i915_request_is_complete(const struct i915_request *rq)
+{
+        return i915_seqno_passed(__hwsp_seqno(rq), rq->fence.seqno);
 }
 
 static inline bool i915_request_completed(const struct i915_request *rq)
 {
-        u32 seqno;
+        bool result;
 
-        seqno = i915_request_global_seqno(rq);
-        if (!seqno)
-                return false;
+        if (i915_request_signaled(rq))
+                return true;
 
-        return __i915_request_completed(rq, seqno);
-}
-
-static inline bool i915_request_started(const struct i915_request *rq)
-{
-        u32 seqno;
-
-        seqno = i915_request_global_seqno(rq);
-        if (!seqno)
-                return false;
-
-        return i915_seqno_passed(intel_engine_get_seqno(rq->engine),
-                                 seqno - 1);
-}
-
-static inline bool i915_sched_node_signaled(const struct i915_sched_node *node)
-{
-        const struct i915_request *rq =
-                container_of(node, const struct i915_request, sched);
-
-        return i915_request_completed(rq);
-}
-
-void i915_retire_requests(struct drm_i915_private *i915);
-
-/*
- * We treat requests as fences. This is not be to confused with our
- * "fence registers" but pipeline synchronisation objects ala GL_ARB_sync.
- * We use the fences to synchronize access from the CPU with activity on the
- * GPU, for example, we should not rewrite an object's PTE whilst the GPU
- * is reading them. We also track fences at a higher level to provide
- * implicit synchronisation around GEM objects, e.g. set-domain will wait
- * for outstanding GPU rendering before marking the object ready for CPU
- * access, or a pageflip will wait until the GPU is complete before showing
- * the frame on the scanout.
- *
- * In order to use a fence, the object must track the fence it needs to
- * serialise with. For example, GEM objects want to track both read and
- * write access so that we can perform concurrent read operations between
- * the CPU and GPU engines, as well as waiting for all rendering to
- * complete, or waiting for the last GPU user of a "fence register". The
- * object then embeds a #i915_gem_active to track the most recent (in
- * retirement order) request relevant for the desired mode of access.
- * The #i915_gem_active is updated with i915_gem_active_set() to track the
- * most recent fence request, typically this is done as part of
- * i915_vma_move_to_active().
- *
- * When the #i915_gem_active completes (is retired), it will
- * signal its completion to the owner through a callback as well as mark
- * itself as idle (i915_gem_active.request == NULL). The owner
- * can then perform any action, such as delayed freeing of an active
- * resource including itself.
- */
-struct i915_gem_active;
-
-typedef void (*i915_gem_retire_fn)(struct i915_gem_active *,
-                                   struct i915_request *);
-
-struct i915_gem_active {
-        struct i915_request __rcu *request;
-        struct list_head link;
-        i915_gem_retire_fn retire;
-};
-
-void i915_gem_retire_noop(struct i915_gem_active *,
-                          struct i915_request *request);
-
-/**
- * init_request_active - prepares the activity tracker for use
- * @active - the active tracker
- * @func - a callback when then the tracker is retired (becomes idle),
- * can be NULL
- *
- * init_request_active() prepares the embedded @active struct for use as
- * an activity tracker, that is for tracking the last known active request
- * associated with it. When the last request becomes idle, when it is retired
- * after completion, the optional callback @func is invoked.
- */
-static inline void
-init_request_active(struct i915_gem_active *active,
-                    i915_gem_retire_fn retire)
-{
-        RCU_INIT_POINTER(active->request, NULL);
-        INIT_LIST_HEAD(&active->link);
-        active->retire = retire ?: i915_gem_retire_noop;
-}
-
-/**
- * i915_gem_active_set - updates the tracker to watch the current request
- * @active - the active tracker
- * @request - the request to watch
- *
- * i915_gem_active_set() watches the given @request for completion. Whilst
- * that @request is busy, the @active reports busy. When that @request is
- * retired, the @active tracker is updated to report idle.
- */
-static inline void
-i915_gem_active_set(struct i915_gem_active *active,
-                    struct i915_request *request)
-{
-        list_move(&active->link, &request->active_list);
-        rcu_assign_pointer(active->request, request);
-}
-
-/**
- * i915_gem_active_set_retire_fn - updates the retirement callback
- * @active - the active tracker
- * @fn - the routine called when the request is retired
- * @mutex - struct_mutex used to guard retirements
- *
- * i915_gem_active_set_retire_fn() updates the function pointer that
- * is called when the final request associated with the @active tracker
- * is retired.
- */
-static inline void
-i915_gem_active_set_retire_fn(struct i915_gem_active *active,
-                              i915_gem_retire_fn fn,
-                              struct mutex *mutex)
-{
-        lockdep_assert_held(mutex);
-        active->retire = fn ?: i915_gem_retire_noop;
-}
-
-static inline struct i915_request *
-__i915_gem_active_peek(const struct i915_gem_active *active)
-{
-        /*
-         * Inside the error capture (running with the driver in an unknown
-         * state), we want to bend the rules slightly (a lot).
-         *
-         * Work is in progress to make it safer, in the meantime this keeps
-         * the known issue from spamming the logs.
-         */
-        return rcu_dereference_protected(active->request, 1);
-}
-
-/**
- * i915_gem_active_raw - return the active request
- * @active - the active tracker
- *
- * i915_gem_active_raw() returns the current request being tracked, or NULL.
- * It does not obtain a reference on the request for the caller, so the caller
- * must hold struct_mutex.
- */
-static inline struct i915_request *
-i915_gem_active_raw(const struct i915_gem_active *active, struct mutex *mutex)
-{
-        return rcu_dereference_protected(active->request,
-                                         lockdep_is_held(mutex));
-}
-
-/**
- * i915_gem_active_peek - report the active request being monitored
- * @active - the active tracker
- *
- * i915_gem_active_peek() returns the current request being tracked if
- * still active, or NULL. It does not obtain a reference on the request
- * for the caller, so the caller must hold struct_mutex.
- */
-static inline struct i915_request *
-i915_gem_active_peek(const struct i915_gem_active *active, struct mutex *mutex)
-{
-        struct i915_request *request;
-
-        request = i915_gem_active_raw(active, mutex);
-        if (!request || i915_request_completed(request))
-                return NULL;
-
-        return request;
-}
-
-/**
- * i915_gem_active_get - return a reference to the active request
- * @active - the active tracker
- *
- * i915_gem_active_get() returns a reference to the active request, or NULL
- * if the active tracker is idle. The caller must hold struct_mutex.
- */
-static inline struct i915_request *
-i915_gem_active_get(const struct i915_gem_active *active, struct mutex *mutex)
-{
-        return i915_request_get(i915_gem_active_peek(active, mutex));
-}
-
-/**
- * __i915_gem_active_get_rcu - return a reference to the active request
- * @active - the active tracker
- *
- * __i915_gem_active_get() returns a reference to the active request, or NULL
- * if the active tracker is idle. The caller must hold the RCU read lock, but
- * the returned pointer is safe to use outside of RCU.
- */
-static inline struct i915_request *
-__i915_gem_active_get_rcu(const struct i915_gem_active *active)
-{
-        /*
-         * Performing a lockless retrieval of the active request is super
-         * tricky. SLAB_TYPESAFE_BY_RCU merely guarantees that the backing
-         * slab of request objects will not be freed whilst we hold the
-         * RCU read lock. It does not guarantee that the request itself
-         * will not be freed and then *reused*. Viz,
-         *
-         * Thread A                     Thread B
-         *
-         * rq = active.request
-         *                              retire(rq) -> free(rq);
-         *                              (rq is now first on the slab freelist)
-         *                              active.request = NULL
-         *
-         *                              rq = new submission on a new object
-         * ref(rq)
-         *
-         * To prevent the request from being reused whilst the caller
-         * uses it, we take a reference like normal. Whilst acquiring
-         * the reference we check that it is not in a destroyed state
-         * (refcnt == 0). That prevents the request being reallocated
-         * whilst the caller holds on to it. To check that the request
-         * was not reallocated as we acquired the reference we have to
-         * check that our request remains the active request across
-         * the lookup, in the same manner as a seqlock. The visibility
-         * of the pointer versus the reference counting is controlled
-         * by using RCU barriers (rcu_dereference and rcu_assign_pointer).
-         *
-         * In the middle of all that, we inspect whether the request is
-         * complete. Retiring is lazy so the request may be completed long
-         * before the active tracker is updated. Querying whether the
-         * request is complete is far cheaper (as it involves no locked
-         * instructions setting cachelines to exclusive) than acquiring
-         * the reference, so we do it first. The RCU read lock ensures the
-         * pointer dereference is valid, but does not ensure that the
-         * seqno nor HWS is the right one! However, if the request was
-         * reallocated, that means the active tracker's request was complete.
-         * If the new request is also complete, then both are and we can
-         * just report the active tracker is idle. If the new request is
-         * incomplete, then we acquire a reference on it and check that
-         * it remained the active request.
-         *
-         * It is then imperative that we do not zero the request on
-         * reallocation, so that we can chase the dangling pointers!
-         * See i915_request_alloc().
-         */
-        do {
-                struct i915_request *request;
-
-                request = rcu_dereference(active->request);
-                if (!request || i915_request_completed(request))
-                        return NULL;
-
-                /*
-                 * An especially silly compiler could decide to recompute the
-                 * result of i915_request_completed, more specifically
-                 * re-emit the load for request->fence.seqno. A race would catch
-                 * a later seqno value, which could flip the result from true to
-                 * false. Which means part of the instructions below might not
-                 * be executed, while later on instructions are executed. Due to
-                 * barriers within the refcounting the inconsistency can't reach
-                 * past the call to i915_request_get_rcu, but not executing
-                 * that while still executing i915_request_put() creates
-                 * havoc enough. Prevent this with a compiler barrier.
-                 */
-                barrier();
-
-                request = i915_request_get_rcu(request);
-
-                /*
-                 * What stops the following rcu_access_pointer() from occurring
-                 * before the above i915_request_get_rcu()? If we were
-                 * to read the value before pausing to get the reference to
-                 * the request, we may not notice a change in the active
-                 * tracker.
-                 *
-                 * The rcu_access_pointer() is a mere compiler barrier, which
-                 * means both the CPU and compiler are free to perform the
-                 * memory read without constraint. The compiler only has to
-                 * ensure that any operations after the rcu_access_pointer()
-                 * occur afterwards in program order. This means the read may
-                 * be performed earlier by an out-of-order CPU, or adventurous
-                 * compiler.
-                 *
-                 * The atomic operation at the heart of
-                 * i915_request_get_rcu(), see dma_fence_get_rcu(), is
-                 * atomic_inc_not_zero() which is only a full memory barrier
-                 * when successful. That is, if i915_request_get_rcu()
-                 * returns the request (and so with the reference counted
-                 * incremented) then the following read for rcu_access_pointer()
-                 * must occur after the atomic operation and so confirm
-                 * that this request is the one currently being tracked.
-                 *
-                 * The corresponding write barrier is part of
-                 * rcu_assign_pointer().
-                 */
-                if (!request || request == rcu_access_pointer(active->request))
-                        return rcu_pointer_handoff(request);
-
-                i915_request_put(request);
-        } while (1);
-}
-
-/**
- * i915_gem_active_get_unlocked - return a reference to the active request
- * @active - the active tracker
- *
- * i915_gem_active_get_unlocked() returns a reference to the active request,
- * or NULL if the active tracker is idle. The reference is obtained under RCU,
- * so no locking is required by the caller.
- *
- * The reference should be freed with i915_request_put().
- */
-static inline struct i915_request *
-i915_gem_active_get_unlocked(const struct i915_gem_active *active)
-{
-        struct i915_request *request;
-
-        rcu_read_lock();
-        request = __i915_gem_active_get_rcu(active);
+        result = true;
+        rcu_read_lock(); /* the HWSP may be freed at runtime */
+        if (likely(!i915_request_signaled(rq)))
+                result = __i915_request_is_complete(rq);
         rcu_read_unlock();
 
-        return request;
+        return result;
 }
 
-/**
- * i915_gem_active_isset - report whether the active tracker is assigned
- * @active - the active tracker
- *
- * i915_gem_active_isset() returns true if the active tracker is currently
- * assigned to a request. Due to the lazy retiring, that request may be idle
- * and this may report stale information.
- */
-static inline bool
-i915_gem_active_isset(const struct i915_gem_active *active)
+static inline void i915_request_mark_complete(struct i915_request *rq)
 {
-        return rcu_access_pointer(active->request);
+        WRITE_ONCE(rq->hwsp_seqno, /* decouple from HWSP */
+                   (u32 *)&rq->fence.seqno);
 }
 
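Note: i915_request_mark_complete() retargets rq->hwsp_seqno at the
request's own fence.seqno, so every subsequent completion check succeeds by
construction and never dereferences a HWSP that may have been reused.
Illustration of the effect (the caller shown is hypothetical):

static void example_force_complete(struct i915_request *rq)
{
        i915_request_mark_complete(rq);

        /*
         * __hwsp_seqno(rq) now reads rq->fence.seqno itself, so
         * i915_seqno_passed(__hwsp_seqno(rq), rq->fence.seqno) is true
         * and i915_request_completed(rq) reports completion.
         */
}
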
---|
635 | | -/** |
---|
636 | | - * i915_gem_active_wait - waits until the request is completed |
---|
637 | | - * @active - the active request on which to wait |
---|
638 | | - * @flags - how to wait |
---|
639 | | - * @timeout - how long to wait at most |
---|
640 | | - * @rps - userspace client to charge for a waitboost |
---|
641 | | - * |
---|
642 | | - * i915_gem_active_wait() waits until the request is completed before |
---|
643 | | - * returning, without requiring any locks to be held. Note that it does not |
---|
644 | | - * retire any requests before returning. |
---|
645 | | - * |
---|
646 | | - * This function relies on RCU in order to acquire the reference to the active |
---|
647 | | - * request without holding any locks. See __i915_gem_active_get_rcu() for the |
---|
648 | | - * glory details on how that is managed. Once the reference is acquired, we |
---|
649 | | - * can then wait upon the request, and afterwards release our reference, |
---|
650 | | - * free of any locking. |
---|
651 | | - * |
---|
652 | | - * This function wraps i915_request_wait(), see it for the full details on |
---|
653 | | - * the arguments. |
---|
654 | | - * |
---|
655 | | - * Returns 0 if successful, or a negative error code. |
---|
656 | | - */ |
---|
657 | | -static inline int |
---|
658 | | -i915_gem_active_wait(const struct i915_gem_active *active, unsigned int flags) |
---|
| 553 | +static inline bool i915_request_has_waitboost(const struct i915_request *rq) |
---|
659 | 554 | { |
---|
660 | | - struct i915_request *request; |
---|
661 | | - long ret = 0; |
---|
662 | | - |
---|
663 | | - request = i915_gem_active_get_unlocked(active); |
---|
664 | | - if (request) { |
---|
665 | | - ret = i915_request_wait(request, flags, MAX_SCHEDULE_TIMEOUT); |
---|
666 | | - i915_request_put(request); |
---|
667 | | - } |
---|
668 | | - |
---|
669 | | - return ret < 0 ? ret : 0; |
---|
| 555 | + return test_bit(I915_FENCE_FLAG_BOOST, &rq->fence.flags); |
---|
670 | 556 | } |
---|
671 | 557 | |
---|
672 | | -/** |
---|
673 | | - * i915_gem_active_retire - waits until the request is retired |
---|
674 | | - * @active - the active request on which to wait |
---|
675 | | - * |
---|
676 | | - * i915_gem_active_retire() waits until the request is completed, |
---|
677 | | - * and then ensures that at least the retirement handler for this |
---|
678 | | - * @active tracker is called before returning. If the @active |
---|
679 | | - * tracker is idle, the function returns immediately. |
---|
680 | | - */ |
---|
681 | | -static inline int __must_check |
---|
682 | | -i915_gem_active_retire(struct i915_gem_active *active, |
---|
683 | | - struct mutex *mutex) |
---|
| 558 | +static inline bool i915_request_has_nopreempt(const struct i915_request *rq) |
---|
684 | 559 | { |
---|
685 | | - struct i915_request *request; |
---|
686 | | - long ret; |
---|
687 | | - |
---|
688 | | - request = i915_gem_active_raw(active, mutex); |
---|
689 | | - if (!request) |
---|
690 | | - return 0; |
---|
691 | | - |
---|
692 | | - ret = i915_request_wait(request, |
---|
693 | | - I915_WAIT_INTERRUPTIBLE | I915_WAIT_LOCKED, |
---|
694 | | - MAX_SCHEDULE_TIMEOUT); |
---|
695 | | - if (ret < 0) |
---|
696 | | - return ret; |
---|
697 | | - |
---|
698 | | - list_del_init(&active->link); |
---|
699 | | - RCU_INIT_POINTER(active->request, NULL); |
---|
700 | | - |
---|
701 | | - active->retire(active, request); |
---|
702 | | - |
---|
703 | | - return 0; |
---|
| 560 | + /* Preemption should only be disabled very rarely */ |
---|
| 561 | + return unlikely(test_bit(I915_FENCE_FLAG_NOPREEMPT, &rq->fence.flags)); |
---|
704 | 562 | } |
---|
705 | 563 | |
---|
706 | | -#define for_each_active(mask, idx) \ |
---|
707 | | - for (; mask ? idx = ffs(mask) - 1, 1 : 0; mask &= ~BIT(idx)) |
---|
| 564 | +static inline bool i915_request_has_sentinel(const struct i915_request *rq) |
---|
| 565 | +{ |
---|
| 566 | + return unlikely(test_bit(I915_FENCE_FLAG_SENTINEL, &rq->fence.flags)); |
---|
| 567 | +} |
---|
| 568 | + |
---|
| 569 | +static inline bool i915_request_on_hold(const struct i915_request *rq) |
---|
| 570 | +{ |
---|
| 571 | + return unlikely(test_bit(I915_FENCE_FLAG_HOLD, &rq->fence.flags)); |
---|
| 572 | +} |
---|
| 573 | + |
---|
| 574 | +static inline void i915_request_set_hold(struct i915_request *rq) |
---|
| 575 | +{ |
---|
| 576 | + set_bit(I915_FENCE_FLAG_HOLD, &rq->fence.flags); |
---|
| 577 | +} |
---|
| 578 | + |
---|
| 579 | +static inline void i915_request_clear_hold(struct i915_request *rq) |
---|
| 580 | +{ |
---|
| 581 | + clear_bit(I915_FENCE_FLAG_HOLD, &rq->fence.flags); |
---|
| 582 | +} |
---|
| 583 | + |
---|
| 584 | +static inline struct intel_timeline * |
---|
| 585 | +i915_request_timeline(const struct i915_request *rq) |
---|
| 586 | +{ |
---|
| 587 | + /* Valid only while the request is being constructed (or retired). */ |
---|
| 588 | + return rcu_dereference_protected(rq->timeline, |
---|
| 589 | + lockdep_is_held(&rcu_access_pointer(rq->timeline)->mutex)); |
---|
| 590 | +} |
---|
| 591 | + |
---|
| 592 | +static inline struct i915_gem_context * |
---|
| 593 | +i915_request_gem_context(const struct i915_request *rq) |
---|
| 594 | +{ |
---|
| 595 | + /* Valid only while the request is being constructed (or retired). */ |
---|
| 596 | + return rcu_dereference_protected(rq->context->gem_context, true); |
---|
| 597 | +} |
---|
| 598 | + |
---|
| 599 | +static inline struct intel_timeline * |
---|
| 600 | +i915_request_active_timeline(const struct i915_request *rq) |
---|
| 601 | +{ |
---|
| 602 | + /* |
---|
| 603 | + * When in use during submission, we are protected by a guarantee that |
---|
| 604 | + * the context/timeline is pinned and must remain pinned until after |
---|
| 605 | + * this submission. |
---|
| 606 | + */ |
---|
| 607 | + return rcu_dereference_protected(rq->timeline, |
---|
| 608 | + lockdep_is_held(&rq->engine->active.lock)); |
---|
| 609 | +} |
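
Note: each accessor above documents which lock keeps the RCU-protected
rq->timeline pointer stable: the timeline mutex during construction and
retirement, or the engine's active.lock during submission. A hedged,
simplified usage sketch of the first case (hypothetical caller; real
retirement does considerably more than this):

static void example_retire_unlink(struct i915_request *rq)
{
        struct intel_timeline *tl = i915_request_timeline(rq);

        lockdep_assert_held(&tl->mutex);
        list_del(&rq->link); /* rq->link sits on the timeline's requests list */
}
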
---|
 
 #endif /* I915_REQUEST_H */