1 // SPDX-License-Identifier: MIT
2 /*
3  * Copyright © 2014-2018 Intel Corporation
4  */
5 
6 #include "gem/i915_gem_object.h"
7 
8 #include "i915_drv.h"
9 #include "intel_engine_pm.h"
10 #include "intel_gt_buffer_pool.h"
11 
to_gt(struct intel_gt_buffer_pool * pool)12 static struct intel_gt *to_gt(struct intel_gt_buffer_pool *pool)
13 {
14 	return container_of(pool, struct intel_gt, buffer_pool);
15 }
16 
17 static struct list_head *
bucket_for_size(struct intel_gt_buffer_pool * pool,size_t sz)18 bucket_for_size(struct intel_gt_buffer_pool *pool, size_t sz)
19 {
20 	int n;
21 
22 	/*
23 	 * Compute a power-of-two bucket, but throw everything greater than
24 	 * 16KiB into the same bucket: i.e. the buckets hold objects of
25 	 * (1 page, 2 pages, 4 pages, 8+ pages).
26 	 */
27 	n = fls(sz >> PAGE_SHIFT) - 1;
28 	if (n >= ARRAY_SIZE(pool->cache_list))
29 		n = ARRAY_SIZE(pool->cache_list) - 1;
30 
31 	return &pool->cache_list[n];
32 }
33 
node_free(struct intel_gt_buffer_pool_node * node)34 static void node_free(struct intel_gt_buffer_pool_node *node)
35 {
36 	i915_gem_object_put(node->obj);
37 	i915_active_fini(&node->active);
38 	kfree_rcu(node, rcu);
39 }
40 
/*
 * pool_free_older_than - reap idle nodes from every bucket of the pool
 * @pool: buffer pool whose cache lists are scanned
 * @keep: minimum idle time, in jiffies, before a node is reaped; with 0
 *        every node that carries a non-zero age is reaped
 *
 * Stale nodes are claimed and unlinked while holding pool->lock, chained
 * together through node->free, and only released with node_free() once the
 * lock has been dropped.
 *
 * Returns true if any bucket is still non-empty afterwards (this includes a
 * bucket that was skipped because the lock could not be taken), false when
 * every bucket is empty.
 */
static bool pool_free_older_than(struct intel_gt_buffer_pool *pool, long keep)
{
	struct intel_gt_buffer_pool_node *node, *stale = NULL;
	bool active = false;
	int n;

	/* Free buffers that have been idle for at least @keep jiffies */
	for (n = 0; n < ARRAY_SIZE(pool->cache_list); n++) {
		struct list_head *list = &pool->cache_list[n];

		if (list_empty(list))
			continue;

		/*
		 * Only try the lock: on contention this bucket is left for a
		 * later pass, and is still reported as active below.
		 */
		if (spin_trylock_irq(&pool->lock)) {
			struct list_head *pos;

			/* Most recent at head; oldest at tail */
			list_for_each_prev(pos, list) {
				unsigned long age;

				node = list_entry(pos, typeof(*node), link);

				/*
				 * An age of 0 is reserved for nodes that are in
				 * use or already claimed. Nodes nearer the head
				 * are more recent, so stop at the first node
				 * that is claimed or still too young.
				 */
				age = READ_ONCE(node->age);
				if (!age || jiffies - age < keep)
					break;

				/* Check we are the first to claim this node */
				if (!xchg(&node->age, 0))
					break;

				/* Push onto the private chain of stale nodes */
				node->free = stale;
				stale = node;
			}
			/*
			 * pos is where the walk stopped (the list head itself
			 * if every node was claimed). If pos is not the tail,
			 * at least one node was claimed and must be cut off.
			 * NOTE(review): __list_del_many() is defined outside
			 * this file; presumably it links pos and the list head
			 * directly, dropping the claimed tail - confirm.
			 */
			if (!list_is_last(pos, list))
				__list_del_many(pos, list);

			spin_unlock_irq(&pool->lock);
		}

		active |= !list_empty(list);
	}

	/* Release the claimed nodes now that the lock is no longer held */
	while ((node = stale)) {
		stale = stale->free;
		node_free(node);
	}

	return active;
}
90 
pool_free_work(struct work_struct * wrk)91 static void pool_free_work(struct work_struct *wrk)
92 {
93 	struct intel_gt_buffer_pool *pool =
94 		container_of(wrk, typeof(*pool), work.work);
95 
96 	if (pool_free_older_than(pool, HZ))
97 		schedule_delayed_work(&pool->work,
98 				      round_jiffies_up_relative(HZ));
99 }
100 
pool_active(struct i915_active * ref)101 static int pool_active(struct i915_active *ref)
102 {
103 	struct intel_gt_buffer_pool_node *node =
104 		container_of(ref, typeof(*node), active);
105 	struct dma_resv *resv = node->obj->base.resv;
106 	int err;
107 
108 	if (dma_resv_trylock(resv)) {
109 		dma_resv_add_excl_fence(resv, NULL);
110 		dma_resv_unlock(resv);
111 	}
112 
113 	err = i915_gem_object_pin_pages(node->obj);
114 	if (err)
115 		return err;
116 
117 	/* Hide this pinned object from the shrinker until retired */
118 	i915_gem_object_make_unshrinkable(node->obj);
119 
120 	return 0;
121 }
122 
123 __i915_active_call
pool_retire(struct i915_active * ref)124 static void pool_retire(struct i915_active *ref)
125 {
126 	struct intel_gt_buffer_pool_node *node =
127 		container_of(ref, typeof(*node), active);
128 	struct intel_gt_buffer_pool *pool = node->pool;
129 	struct list_head *list = bucket_for_size(pool, node->obj->base.size);
130 	unsigned long flags;
131 
132 	i915_gem_object_unpin_pages(node->obj);
133 
134 	/* Return this object to the shrinker pool */
135 	i915_gem_object_make_purgeable(node->obj);
136 
137 	GEM_BUG_ON(node->age);
138 	spin_lock_irqsave(&pool->lock, flags);
139 	list_add_rcu(&node->link, list);
140 	WRITE_ONCE(node->age, jiffies ?: 1); /* 0 reserved for active nodes */
141 	spin_unlock_irqrestore(&pool->lock, flags);
142 
143 	schedule_delayed_work(&pool->work,
144 			      round_jiffies_up_relative(HZ));
145 }
146 
147 static struct intel_gt_buffer_pool_node *
node_create(struct intel_gt_buffer_pool * pool,size_t sz)148 node_create(struct intel_gt_buffer_pool *pool, size_t sz)
149 {
150 	struct intel_gt *gt = to_gt(pool);
151 	struct intel_gt_buffer_pool_node *node;
152 	struct drm_i915_gem_object *obj;
153 
154 	node = kmalloc(sizeof(*node),
155 		       GFP_KERNEL | __GFP_RETRY_MAYFAIL | __GFP_NOWARN);
156 	if (!node)
157 		return ERR_PTR(-ENOMEM);
158 
159 	node->age = 0;
160 	node->pool = pool;
161 	i915_active_init(&node->active, pool_active, pool_retire);
162 
163 	obj = i915_gem_object_create_internal(gt->i915, sz);
164 	if (IS_ERR(obj)) {
165 		i915_active_fini(&node->active);
166 		kfree(node);
167 		return ERR_CAST(obj);
168 	}
169 
170 	i915_gem_object_set_readonly(obj);
171 
172 	node->obj = obj;
173 	return node;
174 }
175 
176 struct intel_gt_buffer_pool_node *
intel_gt_get_buffer_pool(struct intel_gt * gt,size_t size)177 intel_gt_get_buffer_pool(struct intel_gt *gt, size_t size)
178 {
179 	struct intel_gt_buffer_pool *pool = &gt->buffer_pool;
180 	struct intel_gt_buffer_pool_node *node;
181 	struct list_head *list;
182 	int ret;
183 
184 	size = PAGE_ALIGN(size);
185 	list = bucket_for_size(pool, size);
186 
187 	rcu_read_lock();
188 	list_for_each_entry_rcu(node, list, link) {
189 		unsigned long age;
190 
191 		if (node->obj->base.size < size)
192 			continue;
193 
194 		age = READ_ONCE(node->age);
195 		if (!age)
196 			continue;
197 
198 		if (cmpxchg(&node->age, age, 0) == age) {
199 			spin_lock_irq(&pool->lock);
200 			list_del_rcu(&node->link);
201 			spin_unlock_irq(&pool->lock);
202 			break;
203 		}
204 	}
205 	rcu_read_unlock();
206 
207 	if (&node->link == list) {
208 		node = node_create(pool, size);
209 		if (IS_ERR(node))
210 			return node;
211 	}
212 
213 	ret = i915_active_acquire(&node->active);
214 	if (ret) {
215 		node_free(node);
216 		return ERR_PTR(ret);
217 	}
218 
219 	return node;
220 }
221 
intel_gt_init_buffer_pool(struct intel_gt * gt)222 void intel_gt_init_buffer_pool(struct intel_gt *gt)
223 {
224 	struct intel_gt_buffer_pool *pool = &gt->buffer_pool;
225 	int n;
226 
227 	spin_lock_init(&pool->lock);
228 	for (n = 0; n < ARRAY_SIZE(pool->cache_list); n++)
229 		INIT_LIST_HEAD(&pool->cache_list[n]);
230 	INIT_DELAYED_WORK(&pool->work, pool_free_work);
231 }
232 
intel_gt_flush_buffer_pool(struct intel_gt * gt)233 void intel_gt_flush_buffer_pool(struct intel_gt *gt)
234 {
235 	struct intel_gt_buffer_pool *pool = &gt->buffer_pool;
236 
237 	do {
238 		while (pool_free_older_than(pool, 0))
239 			;
240 	} while (cancel_delayed_work_sync(&pool->work));
241 }
242 
intel_gt_fini_buffer_pool(struct intel_gt * gt)243 void intel_gt_fini_buffer_pool(struct intel_gt *gt)
244 {
245 	struct intel_gt_buffer_pool *pool = &gt->buffer_pool;
246 	int n;
247 
248 	intel_gt_flush_buffer_pool(gt);
249 
250 	for (n = 0; n < ARRAY_SIZE(pool->cache_list); n++)
251 		GEM_BUG_ON(!list_empty(&pool->cache_list[n]));
252 }
253