blob: d215dcdf0b1eac2a3a0ee5920b76b69611307594 [file] [log] [blame]
/*
 * SPDX-License-Identifier: MIT
 *
 * Copyright © 2018 Intel Corporation
 */
6
7#include <linux/mutex.h>
8
9#include "i915_drv.h"
Chris Wilson103b76ee2019-03-05 21:38:30 +000010#include "i915_globals.h"
Chris Wilsone2f34962018-10-01 15:47:54 +010011#include "i915_request.h"
12#include "i915_scheduler.h"
13
Chris Wilson32eb6bc2019-02-28 10:20:33 +000014static struct i915_global_scheduler {
Chris Wilson103b76ee2019-03-05 21:38:30 +000015 struct i915_global base;
Chris Wilson32eb6bc2019-02-28 10:20:33 +000016 struct kmem_cache *slab_dependencies;
17 struct kmem_cache *slab_priorities;
18} global;
19
/*
 * Serialises updates to the dependency lists (signalers/waiters) and guards
 * the temporary dfs_link used while propagating priorities.
 */
static DEFINE_SPINLOCK(schedule_lock);
21
22static const struct i915_request *
23node_to_request(const struct i915_sched_node *node)
24{
25 return container_of(node, const struct i915_request, sched);
26}
27
/* Report whether the request owning @node has started, per i915_request_started(). */
static inline bool node_started(const struct i915_sched_node *node)
{
	const struct i915_request *rq = node_to_request(node);

	return i915_request_started(rq);
}
32
/* Report whether the request owning @node has completed, per i915_request_completed(). */
static inline bool node_signaled(const struct i915_sched_node *node)
{
	const struct i915_request *rq = node_to_request(node);

	return i915_request_completed(rq);
}
37
Chris Wilsone2f34962018-10-01 15:47:54 +010038static inline struct i915_priolist *to_priolist(struct rb_node *rb)
39{
40 return rb_entry(rb, struct i915_priolist, node);
41}
42
Chris Wilson4d97cbe02019-01-29 18:54:51 +000043static void assert_priolists(struct intel_engine_execlists * const execlists)
Chris Wilsone2f34962018-10-01 15:47:54 +010044{
45 struct rb_node *rb;
46 long last_prio, i;
47
48 if (!IS_ENABLED(CONFIG_DRM_I915_DEBUG_GEM))
49 return;
50
51 GEM_BUG_ON(rb_first_cached(&execlists->queue) !=
52 rb_first(&execlists->queue.rb_root));
53
Chris Wilson4d97cbe02019-01-29 18:54:51 +000054 last_prio = (INT_MAX >> I915_USER_PRIORITY_SHIFT) + 1;
Chris Wilsone2f34962018-10-01 15:47:54 +010055 for (rb = rb_first_cached(&execlists->queue); rb; rb = rb_next(rb)) {
56 const struct i915_priolist *p = to_priolist(rb);
57
58 GEM_BUG_ON(p->priority >= last_prio);
59 last_prio = p->priority;
60
61 GEM_BUG_ON(!p->used);
62 for (i = 0; i < ARRAY_SIZE(p->requests); i++) {
63 if (list_empty(&p->requests[i]))
64 continue;
65
66 GEM_BUG_ON(!(p->used & BIT(i)));
67 }
68 }
69}
70
71struct list_head *
72i915_sched_lookup_priolist(struct intel_engine_cs *engine, int prio)
73{
74 struct intel_engine_execlists * const execlists = &engine->execlists;
75 struct i915_priolist *p;
76 struct rb_node **parent, *rb;
77 bool first = true;
78 int idx, i;
79
80 lockdep_assert_held(&engine->timeline.lock);
Chris Wilson4d97cbe02019-01-29 18:54:51 +000081 assert_priolists(execlists);
Chris Wilsone2f34962018-10-01 15:47:54 +010082
83 /* buckets sorted from highest [in slot 0] to lowest priority */
84 idx = I915_PRIORITY_COUNT - (prio & I915_PRIORITY_MASK) - 1;
85 prio >>= I915_USER_PRIORITY_SHIFT;
86 if (unlikely(execlists->no_priolist))
87 prio = I915_PRIORITY_NORMAL;
88
89find_priolist:
90 /* most positive priority is scheduled first, equal priorities fifo */
91 rb = NULL;
92 parent = &execlists->queue.rb_root.rb_node;
93 while (*parent) {
94 rb = *parent;
95 p = to_priolist(rb);
96 if (prio > p->priority) {
97 parent = &rb->rb_left;
98 } else if (prio < p->priority) {
99 parent = &rb->rb_right;
100 first = false;
101 } else {
102 goto out;
103 }
104 }
105
106 if (prio == I915_PRIORITY_NORMAL) {
107 p = &execlists->default_priolist;
108 } else {
Chris Wilson32eb6bc2019-02-28 10:20:33 +0000109 p = kmem_cache_alloc(global.slab_priorities, GFP_ATOMIC);
Chris Wilsone2f34962018-10-01 15:47:54 +0100110 /* Convert an allocation failure to a priority bump */
111 if (unlikely(!p)) {
112 prio = I915_PRIORITY_NORMAL; /* recurses just once */
113
114 /* To maintain ordering with all rendering, after an
115 * allocation failure we have to disable all scheduling.
116 * Requests will then be executed in fifo, and schedule
117 * will ensure that dependencies are emitted in fifo.
118 * There will be still some reordering with existing
119 * requests, so if userspace lied about their
120 * dependencies that reordering may be visible.
121 */
122 execlists->no_priolist = true;
123 goto find_priolist;
124 }
125 }
126
127 p->priority = prio;
128 for (i = 0; i < ARRAY_SIZE(p->requests); i++)
129 INIT_LIST_HEAD(&p->requests[i]);
130 rb_link_node(&p->node, rb, parent);
131 rb_insert_color_cached(&p->node, &execlists->queue, first);
132 p->used = 0;
133
134out:
135 p->used |= BIT(idx);
136 return &p->requests[idx];
137}
138
Chris Wilson5ae87062019-05-13 13:01:00 +0100139void __i915_priolist_free(struct i915_priolist *p)
140{
141 kmem_cache_free(global.slab_priorities, p);
142}
143
/*
 * Per-engine lookup cache used while rescheduling; it is zeroed whenever
 * the locked engine changes.
 */
struct sched_cache {
	/* last result of i915_sched_lookup_priolist(), or NULL if not yet looked up */
	struct list_head *priolist;
};
147
Chris Wilsone2f34962018-10-01 15:47:54 +0100148static struct intel_engine_cs *
Chris Wilsoned7dc672019-02-11 20:46:47 +0000149sched_lock_engine(const struct i915_sched_node *node,
150 struct intel_engine_cs *locked,
151 struct sched_cache *cache)
Chris Wilsone2f34962018-10-01 15:47:54 +0100152{
153 struct intel_engine_cs *engine = node_to_request(node)->engine;
154
155 GEM_BUG_ON(!locked);
156
157 if (engine != locked) {
158 spin_unlock(&locked->timeline.lock);
Chris Wilsoned7dc672019-02-11 20:46:47 +0000159 memset(cache, 0, sizeof(*cache));
Chris Wilsone2f34962018-10-01 15:47:54 +0100160 spin_lock(&engine->timeline.lock);
161 }
162
163 return engine;
164}
165
Chris Wilson25d851a2019-05-07 13:25:44 +0100166static inline int rq_prio(const struct i915_request *rq)
Chris Wilsonc9a64622019-01-29 18:54:52 +0000167{
Chris Wilson25d851a2019-05-07 13:25:44 +0100168 return rq->sched.attr.priority | __NO_PREEMPTION;
169}
Chris Wilsonc9a64622019-01-29 18:54:52 +0000170
Chris Wilson25d851a2019-05-07 13:25:44 +0100171static void kick_submission(struct intel_engine_cs *engine, int prio)
172{
173 const struct i915_request *inflight =
174 port_request(engine->execlists.port);
Chris Wilsonc9a64622019-01-29 18:54:52 +0000175
Chris Wilson25d851a2019-05-07 13:25:44 +0100176 /*
177 * If we are already the currently executing context, don't
178 * bother evaluating if we should preempt ourselves, or if
179 * we expect nothing to change as a result of running the
180 * tasklet, i.e. we have not change the priority queue
181 * sufficiently to oust the running context.
182 */
183 if (inflight && !i915_scheduler_need_preempt(prio, rq_prio(inflight)))
184 return;
185
186 tasklet_hi_schedule(&engine->execlists.tasklet);
Chris Wilsonc9a64622019-01-29 18:54:52 +0000187}
188
Chris Wilson52c76fb2019-05-13 13:01:01 +0100189static void __i915_schedule(struct i915_sched_node *node,
Chris Wilsone9eaf822018-10-01 15:47:55 +0100190 const struct i915_sched_attr *attr)
Chris Wilsone2f34962018-10-01 15:47:54 +0100191{
Chris Wilsoned7dc672019-02-11 20:46:47 +0000192 struct intel_engine_cs *engine;
Chris Wilsone2f34962018-10-01 15:47:54 +0100193 struct i915_dependency *dep, *p;
194 struct i915_dependency stack;
195 const int prio = attr->priority;
Chris Wilsoned7dc672019-02-11 20:46:47 +0000196 struct sched_cache cache;
Chris Wilsone2f34962018-10-01 15:47:54 +0100197 LIST_HEAD(dfs);
198
Chris Wilsone9eaf822018-10-01 15:47:55 +0100199 /* Needed in order to use the temporary link inside i915_dependency */
200 lockdep_assert_held(&schedule_lock);
Chris Wilsone2f34962018-10-01 15:47:54 +0100201 GEM_BUG_ON(prio == I915_PRIORITY_INVALID);
202
Chris Wilson19098012019-05-13 13:01:02 +0100203 if (prio <= READ_ONCE(node->attr.priority))
Chris Wilsone2f34962018-10-01 15:47:54 +0100204 return;
205
Chris Wilson19098012019-05-13 13:01:02 +0100206 if (node_signaled(node))
Chris Wilsone2f34962018-10-01 15:47:54 +0100207 return;
208
Chris Wilson52c76fb2019-05-13 13:01:01 +0100209 stack.signaler = node;
Chris Wilsone2f34962018-10-01 15:47:54 +0100210 list_add(&stack.dfs_link, &dfs);
211
212 /*
213 * Recursively bump all dependent priorities to match the new request.
214 *
215 * A naive approach would be to use recursion:
216 * static void update_priorities(struct i915_sched_node *node, prio) {
217 * list_for_each_entry(dep, &node->signalers_list, signal_link)
218 * update_priorities(dep->signal, prio)
219 * queue_request(node);
220 * }
221 * but that may have unlimited recursion depth and so runs a very
222 * real risk of overunning the kernel stack. Instead, we build
223 * a flat list of all dependencies starting with the current request.
224 * As we walk the list of dependencies, we add all of its dependencies
225 * to the end of the list (this may include an already visited
226 * request) and continue to walk onwards onto the new dependencies. The
227 * end result is a topological list of requests in reverse order, the
228 * last element in the list is the request we must execute first.
229 */
230 list_for_each_entry(dep, &dfs, dfs_link) {
231 struct i915_sched_node *node = dep->signaler;
232
Chris Wilsonbabfb1b2019-02-26 10:23:54 +0000233 /* If we are already flying, we know we have no signalers */
234 if (node_started(node))
235 continue;
236
Chris Wilsone2f34962018-10-01 15:47:54 +0100237 /*
238 * Within an engine, there can be no cycle, but we may
239 * refer to the same dependency chain multiple times
240 * (redundant dependencies are not eliminated) and across
241 * engines.
242 */
243 list_for_each_entry(p, &node->signalers_list, signal_link) {
244 GEM_BUG_ON(p == dep); /* no cycles! */
245
246 if (node_signaled(p->signaler))
247 continue;
248
Chris Wilsone2f34962018-10-01 15:47:54 +0100249 if (prio > READ_ONCE(p->signaler->attr.priority))
250 list_move_tail(&p->dfs_link, &dfs);
251 }
252 }
253
254 /*
255 * If we didn't need to bump any existing priorities, and we haven't
256 * yet submitted this request (i.e. there is no potential race with
257 * execlists_submit_request()), we can set our own priority and skip
258 * acquiring the engine locks.
259 */
Chris Wilson52c76fb2019-05-13 13:01:01 +0100260 if (node->attr.priority == I915_PRIORITY_INVALID) {
261 GEM_BUG_ON(!list_empty(&node->link));
262 node->attr = *attr;
Chris Wilsone2f34962018-10-01 15:47:54 +0100263
264 if (stack.dfs_link.next == stack.dfs_link.prev)
Chris Wilsone9eaf822018-10-01 15:47:55 +0100265 return;
Chris Wilsone2f34962018-10-01 15:47:54 +0100266
267 __list_del_entry(&stack.dfs_link);
268 }
269
Chris Wilsoned7dc672019-02-11 20:46:47 +0000270 memset(&cache, 0, sizeof(cache));
Chris Wilson52c76fb2019-05-13 13:01:01 +0100271 engine = node_to_request(node)->engine;
Chris Wilsonb7404c72019-04-09 16:29:22 +0100272 spin_lock(&engine->timeline.lock);
Chris Wilsone2f34962018-10-01 15:47:54 +0100273
274 /* Fifo and depth-first replacement ensure our deps execute before us */
275 list_for_each_entry_safe_reverse(dep, p, &dfs, dfs_link) {
Chris Wilsone2f34962018-10-01 15:47:54 +0100276 INIT_LIST_HEAD(&dep->dfs_link);
277
Chris Wilson52c76fb2019-05-13 13:01:01 +0100278 node = dep->signaler;
Chris Wilsoned7dc672019-02-11 20:46:47 +0000279 engine = sched_lock_engine(node, engine, &cache);
Chris Wilsonc9a64622019-01-29 18:54:52 +0000280 lockdep_assert_held(&engine->timeline.lock);
Chris Wilsone2f34962018-10-01 15:47:54 +0100281
282 /* Recheck after acquiring the engine->timeline.lock */
283 if (prio <= node->attr.priority || node_signaled(node))
284 continue;
285
286 node->attr.priority = prio;
287 if (!list_empty(&node->link)) {
Chris Wilsoned7dc672019-02-11 20:46:47 +0000288 if (!cache.priolist)
289 cache.priolist =
290 i915_sched_lookup_priolist(engine,
291 prio);
292 list_move_tail(&node->link, cache.priolist);
Chris Wilsone2f34962018-10-01 15:47:54 +0100293 } else {
294 /*
295 * If the request is not in the priolist queue because
296 * it is not yet runnable, then it doesn't contribute
297 * to our preemption decisions. On the other hand,
298 * if the request is on the HW, it too is not in the
299 * queue; but in that case we may still need to reorder
300 * the inflight requests.
301 */
302 if (!i915_sw_fence_done(&node_to_request(node)->submit))
303 continue;
304 }
305
Chris Wilson4d97cbe02019-01-29 18:54:51 +0000306 if (prio <= engine->execlists.queue_priority_hint)
Chris Wilsone2f34962018-10-01 15:47:54 +0100307 continue;
308
Chris Wilsonc9a64622019-01-29 18:54:52 +0000309 engine->execlists.queue_priority_hint = prio;
310
Chris Wilsone2f34962018-10-01 15:47:54 +0100311 /* Defer (tasklet) submission until after all of our updates. */
Chris Wilson25d851a2019-05-07 13:25:44 +0100312 kick_submission(engine, prio);
Chris Wilsone2f34962018-10-01 15:47:54 +0100313 }
314
Chris Wilsonb7404c72019-04-09 16:29:22 +0100315 spin_unlock(&engine->timeline.lock);
Chris Wilsone9eaf822018-10-01 15:47:55 +0100316}
Chris Wilsone2f34962018-10-01 15:47:54 +0100317
Chris Wilsone9eaf822018-10-01 15:47:55 +0100318void i915_schedule(struct i915_request *rq, const struct i915_sched_attr *attr)
319{
Chris Wilsonb7404c72019-04-09 16:29:22 +0100320 spin_lock_irq(&schedule_lock);
Chris Wilson52c76fb2019-05-13 13:01:01 +0100321 __i915_schedule(&rq->sched, attr);
Chris Wilsonb7404c72019-04-09 16:29:22 +0100322 spin_unlock_irq(&schedule_lock);
Chris Wilsone2f34962018-10-01 15:47:54 +0100323}
Chris Wilsone9eaf822018-10-01 15:47:55 +0100324
Chris Wilson52c76fb2019-05-13 13:01:01 +0100325static void __bump_priority(struct i915_sched_node *node, unsigned int bump)
326{
327 struct i915_sched_attr attr = node->attr;
328
329 attr.priority |= bump;
330 __i915_schedule(node, &attr);
331}
332
Chris Wilsone9eaf822018-10-01 15:47:55 +0100333void i915_schedule_bump_priority(struct i915_request *rq, unsigned int bump)
334{
Chris Wilsonb7404c72019-04-09 16:29:22 +0100335 unsigned long flags;
Chris Wilsone9eaf822018-10-01 15:47:55 +0100336
337 GEM_BUG_ON(bump & ~I915_PRIORITY_MASK);
338
339 if (READ_ONCE(rq->sched.attr.priority) == I915_PRIORITY_INVALID)
340 return;
341
Chris Wilsonb7404c72019-04-09 16:29:22 +0100342 spin_lock_irqsave(&schedule_lock, flags);
Chris Wilson52c76fb2019-05-13 13:01:01 +0100343 __bump_priority(&rq->sched, bump);
Chris Wilsonb7404c72019-04-09 16:29:22 +0100344 spin_unlock_irqrestore(&schedule_lock, flags);
Chris Wilsone9eaf822018-10-01 15:47:55 +0100345}
Chris Wilson32eb6bc2019-02-28 10:20:33 +0000346
Chris Wilson5ae87062019-05-13 13:01:00 +0100347void i915_sched_node_init(struct i915_sched_node *node)
Chris Wilson32eb6bc2019-02-28 10:20:33 +0000348{
Chris Wilson5ae87062019-05-13 13:01:00 +0100349 INIT_LIST_HEAD(&node->signalers_list);
350 INIT_LIST_HEAD(&node->waiters_list);
351 INIT_LIST_HEAD(&node->link);
352 node->attr.priority = I915_PRIORITY_INVALID;
353 node->semaphores = 0;
354 node->flags = 0;
355}
356
357static struct i915_dependency *
358i915_dependency_alloc(void)
359{
360 return kmem_cache_alloc(global.slab_dependencies, GFP_KERNEL);
361}
362
363static void
364i915_dependency_free(struct i915_dependency *dep)
365{
366 kmem_cache_free(global.slab_dependencies, dep);
367}
368
369bool __i915_sched_node_add_dependency(struct i915_sched_node *node,
370 struct i915_sched_node *signal,
371 struct i915_dependency *dep,
372 unsigned long flags)
373{
374 bool ret = false;
375
376 spin_lock_irq(&schedule_lock);
377
378 if (!node_signaled(signal)) {
379 INIT_LIST_HEAD(&dep->dfs_link);
380 list_add(&dep->wait_link, &signal->waiters_list);
381 list_add(&dep->signal_link, &node->signalers_list);
382 dep->signaler = signal;
383 dep->flags = flags;
384
385 /* Keep track of whether anyone on this chain has a semaphore */
386 if (signal->flags & I915_SCHED_HAS_SEMAPHORE_CHAIN &&
387 !node_started(signal))
388 node->flags |= I915_SCHED_HAS_SEMAPHORE_CHAIN;
389
Chris Wilson6e7eb7a2019-05-15 14:00:50 +0100390 /*
391 * As we do not allow WAIT to preempt inflight requests,
392 * once we have executed a request, along with triggering
393 * any execution callbacks, we must preserve its ordering
394 * within the non-preemptible FIFO.
395 */
396 BUILD_BUG_ON(__NO_PREEMPTION & ~I915_PRIORITY_MASK);
397 if (flags & I915_DEPENDENCY_EXTERNAL)
398 __bump_priority(signal, __NO_PREEMPTION);
399
Chris Wilson5ae87062019-05-13 13:01:00 +0100400 ret = true;
401 }
402
403 spin_unlock_irq(&schedule_lock);
404
405 return ret;
406}
407
408int i915_sched_node_add_dependency(struct i915_sched_node *node,
409 struct i915_sched_node *signal)
410{
411 struct i915_dependency *dep;
412
413 dep = i915_dependency_alloc();
414 if (!dep)
415 return -ENOMEM;
416
417 if (!__i915_sched_node_add_dependency(node, signal, dep,
Chris Wilson6e7eb7a2019-05-15 14:00:50 +0100418 I915_DEPENDENCY_EXTERNAL |
Chris Wilson5ae87062019-05-13 13:01:00 +0100419 I915_DEPENDENCY_ALLOC))
420 i915_dependency_free(dep);
421
422 return 0;
423}
424
425void i915_sched_node_fini(struct i915_sched_node *node)
426{
427 struct i915_dependency *dep, *tmp;
428
429 GEM_BUG_ON(!list_empty(&node->link));
430
431 spin_lock_irq(&schedule_lock);
432
433 /*
434 * Everyone we depended upon (the fences we wait to be signaled)
435 * should retire before us and remove themselves from our list.
436 * However, retirement is run independently on each timeline and
437 * so we may be called out-of-order.
438 */
439 list_for_each_entry_safe(dep, tmp, &node->signalers_list, signal_link) {
440 GEM_BUG_ON(!node_signaled(dep->signaler));
441 GEM_BUG_ON(!list_empty(&dep->dfs_link));
442
443 list_del(&dep->wait_link);
444 if (dep->flags & I915_DEPENDENCY_ALLOC)
445 i915_dependency_free(dep);
446 }
447
448 /* Remove ourselves from everyone who depends upon us */
449 list_for_each_entry_safe(dep, tmp, &node->waiters_list, wait_link) {
450 GEM_BUG_ON(dep->signaler != node);
451 GEM_BUG_ON(!list_empty(&dep->dfs_link));
452
453 list_del(&dep->signal_link);
454 if (dep->flags & I915_DEPENDENCY_ALLOC)
455 i915_dependency_free(dep);
456 }
457
458 spin_unlock_irq(&schedule_lock);
Chris Wilson32eb6bc2019-02-28 10:20:33 +0000459}
460
Chris Wilson103b76ee2019-03-05 21:38:30 +0000461static void i915_global_scheduler_shrink(void)
462{
463 kmem_cache_shrink(global.slab_dependencies);
464 kmem_cache_shrink(global.slab_priorities);
465}
466
467static void i915_global_scheduler_exit(void)
468{
469 kmem_cache_destroy(global.slab_dependencies);
470 kmem_cache_destroy(global.slab_priorities);
471}
472
473static struct i915_global_scheduler global = { {
474 .shrink = i915_global_scheduler_shrink,
475 .exit = i915_global_scheduler_exit,
476} };
477
Chris Wilson32eb6bc2019-02-28 10:20:33 +0000478int __init i915_global_scheduler_init(void)
479{
480 global.slab_dependencies = KMEM_CACHE(i915_dependency,
481 SLAB_HWCACHE_ALIGN);
482 if (!global.slab_dependencies)
483 return -ENOMEM;
484
485 global.slab_priorities = KMEM_CACHE(i915_priolist,
486 SLAB_HWCACHE_ALIGN);
487 if (!global.slab_priorities)
488 goto err_priorities;
489
Chris Wilson103b76ee2019-03-05 21:38:30 +0000490 i915_global_register(&global.base);
Chris Wilson32eb6bc2019-02-28 10:20:33 +0000491 return 0;
492
493err_priorities:
494 kmem_cache_destroy(global.slab_priorities);
495 return -ENOMEM;
496}