// SPDX-License-Identifier: MIT
/*
 * Copyright © 2021 Intel Corporation
 */
#include <linux/kmemleak.h>
#include <linux/sizes.h>

#include "i915_buddy.h"

#include "i915_gem.h"
#include "i915_utils.h"
/* Slab cache that every struct i915_buddy_block in this file is allocated from. */
static struct kmem_cache *slab_blocks;
16 static struct i915_buddy_block *i915_block_alloc(struct i915_buddy_mm *mm,
17 struct i915_buddy_block *parent,
21 struct i915_buddy_block *block;
23 GEM_BUG_ON(order > I915_BUDDY_MAX_ORDER);
25 block = kmem_cache_zalloc(slab_blocks, GFP_KERNEL);
29 block->header = offset;
30 block->header |= order;
31 block->parent = parent;
33 GEM_BUG_ON(block->header & I915_BUDDY_HEADER_UNUSED);
37 static void i915_block_free(struct i915_buddy_mm *mm,
38 struct i915_buddy_block *block)
40 kmem_cache_free(slab_blocks, block);
43 static void mark_allocated(struct i915_buddy_block *block)
45 block->header &= ~I915_BUDDY_HEADER_STATE;
46 block->header |= I915_BUDDY_ALLOCATED;
48 list_del(&block->link);
51 static void mark_free(struct i915_buddy_mm *mm,
52 struct i915_buddy_block *block)
54 block->header &= ~I915_BUDDY_HEADER_STATE;
55 block->header |= I915_BUDDY_FREE;
57 list_add(&block->link,
58 &mm->free_list[i915_buddy_block_order(block)]);
61 static void mark_split(struct i915_buddy_block *block)
63 block->header &= ~I915_BUDDY_HEADER_STATE;
64 block->header |= I915_BUDDY_SPLIT;
66 list_del(&block->link);
69 int i915_buddy_init(struct i915_buddy_mm *mm, u64 size, u64 chunk_size)
74 if (size < chunk_size)
77 if (chunk_size < PAGE_SIZE)
80 if (!is_power_of_2(chunk_size))
83 size = round_down(size, chunk_size);
87 mm->chunk_size = chunk_size;
88 mm->max_order = ilog2(size) - ilog2(chunk_size);
90 GEM_BUG_ON(mm->max_order > I915_BUDDY_MAX_ORDER);
92 mm->free_list = kmalloc_array(mm->max_order + 1,
93 sizeof(struct list_head),
98 for (i = 0; i <= mm->max_order; ++i)
99 INIT_LIST_HEAD(&mm->free_list[i]);
101 mm->n_roots = hweight64(size);
103 mm->roots = kmalloc_array(mm->n_roots,
104 sizeof(struct i915_buddy_block *),
113 * Split into power-of-two blocks, in case we are given a size that is
114 * not itself a power-of-two.
117 struct i915_buddy_block *root;
121 root_size = rounddown_pow_of_two(size);
122 order = ilog2(root_size) - ilog2(chunk_size);
124 root = i915_block_alloc(mm, NULL, order, offset);
130 GEM_BUG_ON(i > mm->max_order);
131 GEM_BUG_ON(i915_buddy_block_size(mm, root) < chunk_size);
144 i915_block_free(mm, mm->roots[i]);
147 kfree(mm->free_list);
151 void i915_buddy_fini(struct i915_buddy_mm *mm)
155 for (i = 0; i < mm->n_roots; ++i) {
156 GEM_WARN_ON(!i915_buddy_block_is_free(mm->roots[i]));
157 i915_block_free(mm, mm->roots[i]);
160 GEM_WARN_ON(mm->avail != mm->size);
163 kfree(mm->free_list);
166 static int split_block(struct i915_buddy_mm *mm,
167 struct i915_buddy_block *block)
169 unsigned int block_order = i915_buddy_block_order(block) - 1;
170 u64 offset = i915_buddy_block_offset(block);
172 GEM_BUG_ON(!i915_buddy_block_is_free(block));
173 GEM_BUG_ON(!i915_buddy_block_order(block));
175 block->left = i915_block_alloc(mm, block, block_order, offset);
179 block->right = i915_block_alloc(mm, block, block_order,
180 offset + (mm->chunk_size << block_order));
182 i915_block_free(mm, block->left);
186 mark_free(mm, block->left);
187 mark_free(mm, block->right);
194 static struct i915_buddy_block *
195 get_buddy(struct i915_buddy_block *block)
197 struct i915_buddy_block *parent;
199 parent = block->parent;
203 if (parent->left == block)
204 return parent->right;
209 static void __i915_buddy_free(struct i915_buddy_mm *mm,
210 struct i915_buddy_block *block)
212 struct i915_buddy_block *parent;
214 while ((parent = block->parent)) {
215 struct i915_buddy_block *buddy;
217 buddy = get_buddy(block);
219 if (!i915_buddy_block_is_free(buddy))
222 list_del(&buddy->link);
224 i915_block_free(mm, block);
225 i915_block_free(mm, buddy);
230 mark_free(mm, block);
233 void i915_buddy_free(struct i915_buddy_mm *mm,
234 struct i915_buddy_block *block)
236 GEM_BUG_ON(!i915_buddy_block_is_allocated(block));
237 mm->avail += i915_buddy_block_size(mm, block);
238 __i915_buddy_free(mm, block);
241 void i915_buddy_free_list(struct i915_buddy_mm *mm, struct list_head *objects)
243 struct i915_buddy_block *block, *on;
245 list_for_each_entry_safe(block, on, objects, link) {
246 i915_buddy_free(mm, block);
249 INIT_LIST_HEAD(objects);
253 * Allocate power-of-two block. The order value here translates to:
255 * 0 = 2^0 * mm->chunk_size
256 * 1 = 2^1 * mm->chunk_size
257 * 2 = 2^2 * mm->chunk_size
260 struct i915_buddy_block *
261 i915_buddy_alloc(struct i915_buddy_mm *mm, unsigned int order)
263 struct i915_buddy_block *block = NULL;
267 for (i = order; i <= mm->max_order; ++i) {
268 block = list_first_entry_or_null(&mm->free_list[i],
269 struct i915_buddy_block,
276 return ERR_PTR(-ENOSPC);
278 GEM_BUG_ON(!i915_buddy_block_is_free(block));
281 err = split_block(mm, block);
290 mark_allocated(block);
291 mm->avail -= i915_buddy_block_size(mm, block);
292 kmemleak_update_trace(block);
297 __i915_buddy_free(mm, block);
/*
 * Return true if the inclusive ranges [s1, e1] and [s2, e2] share at least
 * one value.
 */
static inline bool overlaps(u64 s1, u64 e1, u64 s2, u64 e2)
{
	return s1 <= e2 && e1 >= s2;
}
/*
 * Return true if the inclusive range [s1, e1] fully covers the inclusive
 * range [s2, e2].
 */
static inline bool contains(u64 s1, u64 e1, u64 s2, u64 e2)
{
	return s1 <= s2 && e1 >= e2;
}
312 * Allocate range. Note that it's safe to chain together multiple alloc_ranges
313 * with the same blocks list.
315 * Intended for pre-allocating portions of the address space, for example to
316 * reserve a block for the initial framebuffer or similar, hence the expectation
317 * here is that i915_buddy_alloc() is still the main vehicle for
318 * allocations, so if that's not the case then the drm_mm range allocator is
319 * probably a much better fit, and so you should probably go use that instead.
321 int i915_buddy_alloc_range(struct i915_buddy_mm *mm,
322 struct list_head *blocks,
325 struct i915_buddy_block *block;
326 struct i915_buddy_block *buddy;
327 LIST_HEAD(allocated);
333 if (size < mm->chunk_size)
336 if (!IS_ALIGNED(size | start, mm->chunk_size))
339 if (range_overflows(start, size, mm->size))
342 for (i = 0; i < mm->n_roots; ++i)
343 list_add_tail(&mm->roots[i]->tmp_link, &dfs);
345 end = start + size - 1;
351 block = list_first_entry_or_null(&dfs,
352 struct i915_buddy_block,
357 list_del(&block->tmp_link);
359 block_start = i915_buddy_block_offset(block);
360 block_end = block_start + i915_buddy_block_size(mm, block) - 1;
362 if (!overlaps(start, end, block_start, block_end))
365 if (i915_buddy_block_is_allocated(block)) {
370 if (contains(start, end, block_start, block_end)) {
371 if (!i915_buddy_block_is_free(block)) {
376 mark_allocated(block);
377 mm->avail -= i915_buddy_block_size(mm, block);
378 list_add_tail(&block->link, &allocated);
382 if (!i915_buddy_block_is_split(block)) {
383 err = split_block(mm, block);
388 list_add(&block->right->tmp_link, &dfs);
389 list_add(&block->left->tmp_link, &dfs);
392 list_splice_tail(&allocated, blocks);
397 * We really don't want to leave around a bunch of split blocks, since
398 * bigger is better, so make sure we merge everything back before we
399 * free the allocated blocks.
401 buddy = get_buddy(block);
403 (i915_buddy_block_is_free(block) &&
404 i915_buddy_block_is_free(buddy)))
405 __i915_buddy_free(mm, block);
408 i915_buddy_free_list(mm, &allocated);
412 void i915_buddy_block_print(struct i915_buddy_mm *mm,
413 struct i915_buddy_block *block,
414 struct drm_printer *p)
416 u64 start = i915_buddy_block_offset(block);
417 u64 size = i915_buddy_block_size(mm, block);
419 drm_printf(p, "%#018llx-%#018llx: %llu\n", start, start + size, size);
422 void i915_buddy_print(struct i915_buddy_mm *mm, struct drm_printer *p)
426 drm_printf(p, "chunk_size: %lluKiB, total: %lluMiB, free: %lluMiB\n",
427 mm->chunk_size >> 10, mm->size >> 20, mm->avail >> 20);
429 for (order = mm->max_order; order >= 0; order--) {
430 struct i915_buddy_block *block;
433 list_for_each_entry(block, &mm->free_list[order], link) {
434 GEM_BUG_ON(!i915_buddy_block_is_free(block));
438 drm_printf(p, "order-%d ", order);
440 free = count * (mm->chunk_size << order);
442 drm_printf(p, "free: %lluKiB", free >> 10);
444 drm_printf(p, "free: %lluMiB", free >> 20);
446 drm_printf(p, ", pages: %llu\n", count);
450 #if IS_ENABLED(CONFIG_DRM_I915_SELFTEST)
451 #include "selftests/i915_buddy.c"
454 void i915_buddy_module_exit(void)
456 kmem_cache_destroy(slab_blocks);
459 int __init i915_buddy_module_init(void)
461 slab_blocks = KMEM_CACHE(i915_buddy_block, 0);