1 /*
2 * SPDX-License-Identifier: MIT
3 *
4 * Copyright © 2019 Intel Corporation
5 */
6
7 #include <linux/slab.h>
8 #include <linux/workqueue.h>
9
10 #include "i915_active.h"
11 #include "gem/i915_gem_context.h"
12 #include "gem/i915_gem_object.h"
13 #include "i915_globals.h"
14 #include "i915_request.h"
15 #include "i915_scheduler.h"
16 #include "i915_vma.h"
17
18 static LIST_HEAD(globals);
19
20 static atomic_t active;
21 static atomic_t epoch;
22 static struct park_work {
23 struct delayed_work work;
24 struct rcu_head rcu;
25 unsigned long flags;
26 #define PENDING 0
27 int epoch;
28 } park;
29
i915_globals_shrink(void)30 static void i915_globals_shrink(void)
31 {
32 struct i915_global *global;
33
34 /*
35 * kmem_cache_shrink() discards empty slabs and reorders partially
36 * filled slabs to prioritise allocating from the mostly full slabs,
37 * with the aim of reducing fragmentation.
38 */
39 list_for_each_entry(global, &globals, link)
40 global->shrink();
41 }
42
__i915_globals_grace(struct rcu_head * rcu)43 static void __i915_globals_grace(struct rcu_head *rcu)
44 {
45 /* Ratelimit parking as shrinking is quite slow */
46 schedule_delayed_work(&park.work, round_jiffies_up_relative(2 * HZ));
47 }
48
__i915_globals_queue_rcu(void)49 static void __i915_globals_queue_rcu(void)
50 {
51 park.epoch = atomic_inc_return(&epoch);
52 if (!atomic_read(&active)) {
53 init_rcu_head(&park.rcu);
54 call_rcu(&park.rcu, __i915_globals_grace);
55 }
56 }
57
__i915_globals_park(struct work_struct * work)58 static void __i915_globals_park(struct work_struct *work)
59 {
60 destroy_rcu_head(&park.rcu);
61
62 /* Confirm nothing woke up in the last grace period */
63 if (park.epoch != atomic_read(&epoch)) {
64 __i915_globals_queue_rcu();
65 return;
66 }
67
68 clear_bit(PENDING, &park.flags);
69 i915_globals_shrink();
70 }
71
i915_global_register(struct i915_global * global)72 void __init i915_global_register(struct i915_global *global)
73 {
74 GEM_BUG_ON(!global->shrink);
75 GEM_BUG_ON(!global->exit);
76
77 list_add_tail(&global->link, &globals);
78 }
79
__i915_globals_cleanup(void)80 static void __i915_globals_cleanup(void)
81 {
82 struct i915_global *global, *next;
83
84 list_for_each_entry_safe_reverse(global, next, &globals, link)
85 global->exit();
86 }
87
88 static __initconst int (* const initfn[])(void) = {
89 i915_global_active_init,
90 i915_global_buddy_init,
91 i915_global_context_init,
92 i915_global_gem_context_init,
93 i915_global_objects_init,
94 i915_global_request_init,
95 i915_global_scheduler_init,
96 i915_global_vma_init,
97 };
98
i915_globals_init(void)99 int __init i915_globals_init(void)
100 {
101 int i;
102
103 for (i = 0; i < ARRAY_SIZE(initfn); i++) {
104 int err;
105
106 err = initfn[i]();
107 if (err) {
108 __i915_globals_cleanup();
109 return err;
110 }
111 }
112
113 INIT_DELAYED_WORK(&park.work, __i915_globals_park);
114 return 0;
115 }
116
i915_globals_park(void)117 void i915_globals_park(void)
118 {
119 /*
120 * Defer shrinking the global slab caches (and other work) until
121 * after a RCU grace period has completed with no activity. This
122 * is to try and reduce the latency impact on the consumers caused
123 * by us shrinking the caches the same time as they are trying to
124 * allocate, with the assumption being that if we idle long enough
125 * for an RCU grace period to elapse since the last use, it is likely
126 * to be longer until we need the caches again.
127 */
128 if (!atomic_dec_and_test(&active))
129 return;
130
131 /* Queue cleanup after the next RCU grace period has freed slabs */
132 if (!test_and_set_bit(PENDING, &park.flags))
133 __i915_globals_queue_rcu();
134 }
135
i915_globals_unpark(void)136 void i915_globals_unpark(void)
137 {
138 atomic_inc(&epoch);
139 atomic_inc(&active);
140 }
141
__i915_globals_flush(void)142 static void __exit __i915_globals_flush(void)
143 {
144 atomic_inc(&active); /* skip shrinking */
145
146 rcu_barrier(); /* wait for the work to be queued */
147 flush_delayed_work(&park.work);
148
149 atomic_dec(&active);
150 }
151
i915_globals_exit(void)152 void __exit i915_globals_exit(void)
153 {
154 GEM_BUG_ON(atomic_read(&active));
155
156 __i915_globals_flush();
157 __i915_globals_cleanup();
158
159 /* And ensure that our DESTROY_BY_RCU slabs are truly destroyed */
160 rcu_barrier();
161 }
162