1 // SPDX-License-Identifier: GPL-2.0 OR MIT
5 #include <linux/sync_file.h>
6 #include <linux/pagemap.h>
7 #include <linux/shmem_fs.h>
8 #include <linux/dma-mapping.h>
10 #include <drm/drm_file.h>
11 #include <drm/drm_syncobj.h>
12 #include <drm/drm_utils.h>
14 #include <drm/lima_drm.h>
/*
 * lima_heap_alloc() - grow the backed part of a heap BO and refresh its
 * scatter-gather table and DMA mapping.
 * @bo: heap buffer object; bo->heap_size is the size backed so far and
 *      bo->base.base.size is the upper bound the heap is clamped to.
 * @vm: VM handed to lima_vm_map_bo(); lima_gem_create_handle() passes NULL
 *      (presumably a NULL check guards the map call on a line not shown).
 *
 * NOTE(review): this listing omits several original lines (braces, local
 * declarations, conditions and return statements), so the comments below
 * describe only the statements that are visible.
 *
 * Return: the visible lines store results of sg_alloc_table_from_pages()
 * and lima_vm_map_bo() in ret; the return statements themselves are not
 * shown -- presumably 0 on success and a negative errno otherwise.
 */
20 int lima_heap_alloc(struct lima_bo *bo, struct lima_vm *vm)
23 struct address_space *mapping = bo->base.base.filp->f_mapping;
24 struct device *dev = bo->base.base.dev->dev;
25 size_t old_size = bo->heap_size;
/*
 * Target size: twice the current heap size, or lima_heap_init_nr_pages
 * pages when nothing has been backed yet (heap_size == 0).
 */
26 size_t new_size = bo->heap_size ? bo->heap_size * 2 :
27 (lima_heap_init_nr_pages << PAGE_SHIFT);
/*
 * The heap already covers the whole object; the branch body is not shown
 * (presumably an error return because the heap cannot grow further).
 */
31 if (bo->heap_size >= bo->base.base.size)
/* Never grow past the size of the GEM object. */
34 new_size = min(new_size, bo->base.base.size);
36 mutex_lock(&bo->base.pages_lock);
/*
 * Either reuse the existing page array or allocate a zeroed one with a
 * slot for every page of the full object size; the condition selecting
 * between the two is on lines omitted from this listing.
 */
39 pages = bo->base.pages;
41 pages = kvmalloc_array(bo->base.base.size >> PAGE_SHIFT,
42 sizeof(*pages), GFP_KERNEL | __GFP_ZERO);
/* Unlock that appears to belong to the allocation-failure path (condition not shown). */
44 mutex_unlock(&bo->base.pages_lock);
/* Publish the array on the shmem object with a use count of 1. */
48 bo->base.pages = pages;
49 bo->base.pages_use_count = 1;
51 mapping_set_unevictable(mapping);
/* Only the newly added range is populated: page indices [old_size, new_size). */
54 for (i = old_size >> PAGE_SHIFT; i < new_size >> PAGE_SHIFT; i++) {
55 struct page *page = shmem_read_mapping_page(mapping, i);
/* Unlock that appears to belong to the page-read error path (condition not shown). */
58 mutex_unlock(&bo->base.pages_lock);
64 mutex_unlock(&bo->base.pages_lock);
/*
 * Build a fresh table over the first i pages (new_size bytes); when the
 * loop above runs to completion i equals new_size >> PAGE_SHIFT.
 */
66 ret = sg_alloc_table_from_pages(&sgt, pages, i, 0,
67 new_size, GFP_KERNEL);
/*
 * Tear down the DMA mapping and table of the previous, smaller heap
 * (presumably only when bo->base.sgt already exists -- condition not shown).
 */
72 dma_unmap_sg(dev, bo->base.sgt->sgl,
73 bo->base.sgt->nents, DMA_BIDIRECTIONAL);
74 sg_free_table(bo->base.sgt);
/* Allocate the sg_table container itself (presumably the first-allocation case). */
76 bo->base.sgt = kmalloc(sizeof(*bo->base.sgt), GFP_KERNEL);
/*
 * NOTE(review): the result of dma_map_sg() is not used on this line, so a
 * failed mapping (return value 0) would go unnoticed here -- confirm
 * against the full source.
 */
83 dma_map_sg(dev, sgt.sgl, sgt.nents, DMA_BIDIRECTIONAL);
/* Third argument is the old size in pages (presumably the page offset to start mapping from). */
88 ret = lima_vm_map_bo(vm, bo, old_size >> PAGE_SHIFT);
/* Record the new backed size. */
93 bo->heap_size = new_size;
/*
 * lima_gem_create_handle() - create a shmem-backed GEM object and a handle
 * for it.
 * @dev: DRM device the object is created on.
 * @file: DRM file the handle is created for.
 * @size: size passed to drm_gem_shmem_create().
 * @flags: creation flags; LIMA_BO_FLAG_HEAP is the only one read here.
 * @handle: receives the handle from drm_gem_handle_create().
 *
 * NOTE(review): this listing omits several original lines (conditions,
 * braces, error checks), so only the visible statements are described.
 *
 * Return: PTR_ERR() of the create call on one path; err from
 * lima_heap_alloc() / drm_gem_handle_create() is presumably returned on
 * lines not shown.
 */
97 int lima_gem_create_handle(struct drm_device *dev, struct drm_file *file,
98 u32 size, u32 flags, u32 *handle)
102 struct drm_gem_shmem_object *shmem;
103 struct drm_gem_object *obj;
105 bool is_heap = flags & LIMA_BO_FLAG_HEAP;
107 shmem = drm_gem_shmem_create(dev, size);
/* Error return for a failed create (the check itself is on an omitted line). */
109 return PTR_ERR(shmem);
113 /* Mali Utgard GPU can only support 32bit address space */
/* Clear __GFP_HIGHMEM from the mapping's allocation mask before writing it back. */
114 mask = mapping_gfp_mask(obj->filp->f_mapping);
115 mask &= ~__GFP_HIGHMEM;
117 mapping_set_gfp_mask(obj->filp->f_mapping, mask);
/*
 * Backing storage: lima_heap_alloc() with a NULL vm, or
 * drm_gem_shmem_get_pages_sgt(); presumably selected by is_heap
 * (the condition is not shown).
 */
120 bo = to_lima_bo(obj);
121 err = lima_heap_alloc(bo, NULL);
125 struct sg_table *sgt = drm_gem_shmem_get_pages_sgt(obj);
133 err = drm_gem_handle_create(file, obj, handle);
136 /* drop reference from allocate - handle holds it now */
137 drm_gem_object_put_unlocked(obj);
/*
 * lima_gem_free_object() - .free callback of lima_gem_funcs.
 * @obj: GEM object being freed.
 *
 * Logs an error if the BO's va list is not empty, then frees the object
 * through drm_gem_shmem_free_object(). (Braces are omitted from this listing.)
 */
142 static void lima_gem_free_object(struct drm_gem_object *obj)
144 struct lima_bo *bo = to_lima_bo(obj);
/* A non-empty va list at free time is only reported; freeing still proceeds. */
146 if (!list_empty(&bo->va))
147 dev_err(obj->dev->dev, "lima gem free bo still has va\n");
149 drm_gem_shmem_free_object(obj);
/*
 * lima_gem_object_open() - .open callback of lima_gem_funcs.
 * @obj: GEM object being opened.
 * @file: DRM file opening it; its private data supplies the VM.
 *
 * Adds the BO to the file's VM via lima_vm_bo_add() with the third argument
 * set to true (presumably "create the mapping" -- the parameter's meaning is
 * not visible in this file; lima_gem_submit() passes false).
 *
 * Return: the result of lima_vm_bo_add().
 */
152 static int lima_gem_object_open(struct drm_gem_object *obj, struct drm_file *file)
154 struct lima_bo *bo = to_lima_bo(obj);
155 struct lima_drm_priv *priv = to_lima_drm_priv(file);
156 struct lima_vm *vm = priv->vm;
158 return lima_vm_bo_add(vm, bo, true);
/*
 * lima_gem_object_close() - .close callback of lima_gem_funcs.
 * @obj: GEM object being closed.
 * @file: DRM file closing it; its private data supplies the VM.
 *
 * Calls lima_vm_bo_del() for the BO on the file's VM, the counterpart of the
 * lima_vm_bo_add() call made in lima_gem_object_open().
 */
161 static void lima_gem_object_close(struct drm_gem_object *obj, struct drm_file *file)
163 struct lima_bo *bo = to_lima_bo(obj);
164 struct lima_drm_priv *priv = to_lima_drm_priv(file);
165 struct lima_vm *vm = priv->vm;
167 lima_vm_bo_del(vm, bo);
/*
 * lima_gem_pin() - pin wrapper around drm_gem_shmem_pin().
 * @obj: GEM object to pin.
 *
 * NOTE(review): bo is looked up but not used on any visible line; a check on
 * it is presumably on lines omitted from this listing (compare the
 * ERR_PTR(-EINVAL) path visible in lima_gem_vmap()).
 *
 * Return: the result of drm_gem_shmem_pin() on the visible path.
 */
170 static int lima_gem_pin(struct drm_gem_object *obj)
172 struct lima_bo *bo = to_lima_bo(obj);
177 return drm_gem_shmem_pin(obj);
/*
 * lima_gem_vmap() - .vmap callback of lima_gem_funcs.
 * @obj: GEM object to map into kernel address space.
 *
 * Return: ERR_PTR(-EINVAL) on a rejection path whose condition is not shown
 * in this listing (presumably a check on bo), otherwise the result of
 * drm_gem_shmem_vmap().
 */
180 static void *lima_gem_vmap(struct drm_gem_object *obj)
182 struct lima_bo *bo = to_lima_bo(obj);
185 return ERR_PTR(-EINVAL);
187 return drm_gem_shmem_vmap(obj);
/*
 * lima_gem_mmap() - .mmap callback of lima_gem_funcs.
 * @obj: GEM object to map.
 * @vma: user VMA describing the requested mapping.
 *
 * NOTE(review): bo is looked up but not used on any visible line; a check on
 * it is presumably on lines omitted from this listing.
 *
 * Return: the result of drm_gem_shmem_mmap() on the visible path.
 */
190 static int lima_gem_mmap(struct drm_gem_object *obj, struct vm_area_struct *vma)
192 struct lima_bo *bo = to_lima_bo(obj);
197 return drm_gem_shmem_mmap(obj, vma);
/*
 * GEM object callbacks for lima BOs; installed on each object by
 * lima_gem_create_object().
 *
 * free/open/close/vmap/mmap use the lima wrappers defined in this file, the
 * remaining visible entries point straight at the drm_gem_shmem helpers.
 * NOTE(review): no .pin entry is visible although lima_gem_pin() is defined
 * in this file -- it is presumably on the line omitted between .print_info
 * and .unpin; the closing brace is omitted from this listing as well.
 */
200 static const struct drm_gem_object_funcs lima_gem_funcs = {
201 .free = lima_gem_free_object,
202 .open = lima_gem_object_open,
203 .close = lima_gem_object_close,
204 .print_info = drm_gem_shmem_print_info,
206 .unpin = drm_gem_shmem_unpin,
207 .get_sg_table = drm_gem_shmem_get_sg_table,
208 .vmap = lima_gem_vmap,
209 .vunmap = drm_gem_shmem_vunmap,
210 .mmap = lima_gem_mmap,
/*
 * lima_gem_create_object() - allocate and initialise a lima BO.
 * @dev: DRM device (not referenced on the visible lines).
 * @size: requested size (not referenced on the visible lines).
 *
 * Allocates a zeroed struct lima_bo, initialises its lock and va list and
 * installs lima_gem_funcs on the embedded GEM object.
 *
 * Return: pointer to the embedded struct drm_gem_object. The handling of a
 * failed kzalloc() is not visible in this listing (presumably a NULL return
 * on an omitted line).
 */
213 struct drm_gem_object *lima_gem_create_object(struct drm_device *dev, size_t size)
217 bo = kzalloc(sizeof(*bo), GFP_KERNEL);
221 mutex_init(&bo->lock);
222 INIT_LIST_HEAD(&bo->va);
224 bo->base.base.funcs = &lima_gem_funcs;
226 return &bo->base.base;
/*
 * lima_gem_get_info() - report the GPU VA and the mmap offset of a BO.
 * @file: DRM file owning the handle; its private data supplies the VM.
 * @handle: GEM handle to look up.
 * @va: receives lima_vm_get_va() for the BO in the file's VM.
 * @offset: receives drm_vma_node_offset_addr() of the object's vma_node.
 *
 * The reference taken by drm_gem_object_lookup() is dropped before returning.
 *
 * Return: not visible in this listing; presumably a negative errno when the
 * lookup fails and 0 otherwise.
 */
229 int lima_gem_get_info(struct drm_file *file, u32 handle, u32 *va, u64 *offset)
231 struct drm_gem_object *obj;
233 struct lima_drm_priv *priv = to_lima_drm_priv(file);
234 struct lima_vm *vm = priv->vm;
236 obj = drm_gem_object_lookup(file, handle);
240 bo = to_lima_bo(obj);
242 *va = lima_vm_get_va(vm, bo);
244 *offset = drm_vma_node_offset_addr(&obj->vma_node);
/* Drop the lookup reference. */
246 drm_gem_object_put_unlocked(obj);
/*
 * lima_gem_sync_bo() - prepare one BO's reservation object for a task and
 * collect its implicit dependencies.
 * @task: task whose deps array receives the implicit fences.
 * @bo: buffer object used by the task.
 * @write: passed through to drm_gem_fence_array_add_implicit().
 * @explicit: explicit-sync flag; per the existing comment, explicit sync
 *            relies on the user-passed dependency fence (the branch that
 *            tests this flag is not shown in this listing).
 *
 * Return: the result of drm_gem_fence_array_add_implicit() on the visible
 * path; other return statements are omitted from this listing.
 */
250 static int lima_gem_sync_bo(struct lima_sched_task *task, struct lima_bo *bo,
251 bool write, bool explicit)
/* Reserve one shared fence slot on the BO's reservation object. */
256 err = dma_resv_reserve_shared(lima_bo_resv(bo), 1);
261 /* explicit sync use user passed dep fence */
265 return drm_gem_fence_array_add_implicit(&task->deps, &bo->base.base, write);
/*
 * lima_gem_add_deps() - turn the submit's in_sync syncobj handles into task
 * dependencies.
 * @file: DRM file used to resolve the syncobj handles.
 * @submit: submission; in_sync[] is read and task->deps is extended.
 *
 * NOTE(review): this listing omits some lines (loop-body braces, the
 * remaining arguments of drm_syncobj_find_fence(), error checks and
 * returns), so only the visible statements are described.
 */
268 static int lima_gem_add_deps(struct drm_file *file, struct lima_submit *submit)
/* Walk every slot of the fixed-size in_sync array. */
272 for (i = 0; i < ARRAY_SIZE(submit->in_sync); i++) {
273 struct dma_fence *fence = NULL;
/* Zero handle: the branch body is not shown (presumably the slot is skipped). */
275 if (!submit->in_sync[i])
278 err = drm_syncobj_find_fence(file, submit->in_sync[i],
283 err = drm_gem_fence_array_add(&submit->task->deps, fence);
/* Fence reference dropped here (presumably only when the add above failed -- condition not shown). */
285 dma_fence_put(fence);
/*
 * lima_gem_submit() - validate and queue one task submission.
 * @file: DRM file issuing the submit; its private data supplies the VM.
 * @submit: submission descriptor (BO list, in/out syncobjs, task, ctx, pipe).
 *
 * Visible sequence of the success path:
 *   1. look up the optional out_sync syncobj;
 *   2. for each BO: look up the handle and call lima_vm_bo_add() with false;
 *   3. lock all reservations (bos is cast to struct drm_gem_object pointers
 *      for drm_gem_lock_reservations());
 *   4. initialise the scheduler task and add the syncobj dependencies;
 *   5. run lima_gem_sync_bo() on each BO;
 *   6. queue the task and attach the returned fence to each BO, as the
 *      exclusive fence for LIMA_SUBMIT_BO_WRITE BOs and as a shared fence
 *      on the other visible branch;
 *   7. unlock reservations, drop the BO references, install the fence in
 *      out_sync and drop the local references.
 *
 * The trailing statements (lima_sched_task_fini(), unlock, lima_vm_bo_del()
 * plus put per BO, drm_syncobj_put()) appear to be the error unwind.
 *
 * NOTE(review): labels, gotos, conditions, braces and return statements are
 * omitted from this listing, as is the terminator of the block comment that
 * precedes the lima_vm_bo_add() call; only visible statements are described.
 */
293 int lima_gem_submit(struct drm_file *file, struct lima_submit *submit)
296 struct ww_acquire_ctx ctx;
297 struct lima_drm_priv *priv = to_lima_drm_priv(file);
298 struct lima_vm *vm = priv->vm;
299 struct drm_syncobj *out_sync = NULL;
300 struct dma_fence *fence;
301 struct lima_bo **bos = submit->lbos;
/* out_sync is optional: it is only looked up for a non-zero handle. */
303 if (submit->out_sync) {
304 out_sync = drm_syncobj_find(file, submit->out_sync);
/* Resolve every BO handle of the submission. */
309 for (i = 0; i < submit->nr_bos; i++) {
310 struct drm_gem_object *obj;
313 obj = drm_gem_object_lookup(file, submit->bos[i].handle);
319 bo = to_lima_bo(obj);
321 /* increase refcnt of gpu va map to prevent unmapped when executing,
322 * will be decreased when task done
324 err = lima_vm_bo_add(vm, bo, false);
326 drm_gem_object_put_unlocked(obj);
333 err = drm_gem_lock_reservations((struct drm_gem_object **)bos,
334 submit->nr_bos, &ctx);
338 err = lima_sched_task_init(
339 submit->task, submit->ctx->context + submit->pipe,
340 bos, submit->nr_bos, vm);
344 err = lima_gem_add_deps(file, submit);
348 for (i = 0; i < submit->nr_bos; i++) {
349 err = lima_gem_sync_bo(
350 submit->task, bos[i],
351 submit->bos[i].flags & LIMA_SUBMIT_BO_WRITE,
352 submit->flags & LIMA_SUBMIT_FLAG_EXPLICIT_FENCE);
357 fence = lima_sched_context_queue_task(
358 submit->ctx->context + submit->pipe, submit->task);
360 for (i = 0; i < submit->nr_bos; i++) {
361 if (submit->bos[i].flags & LIMA_SUBMIT_BO_WRITE)
362 dma_resv_add_excl_fence(lima_bo_resv(bos[i]), fence);
364 dma_resv_add_shared_fence(lima_bo_resv(bos[i]), fence);
367 drm_gem_unlock_reservations((struct drm_gem_object **)bos,
368 submit->nr_bos, &ctx);
370 for (i = 0; i < submit->nr_bos; i++)
371 drm_gem_object_put_unlocked(&bos[i]->base.base);
374 drm_syncobj_replace_fence(out_sync, fence);
375 drm_syncobj_put(out_sync);
378 dma_fence_put(fence);
383 lima_sched_task_fini(submit->task);
385 drm_gem_unlock_reservations((struct drm_gem_object **)bos,
386 submit->nr_bos, &ctx);
388 for (i = 0; i < submit->nr_bos; i++) {
391 lima_vm_bo_del(vm, bos[i]);
392 drm_gem_object_put_unlocked(&bos[i]->base.base);
395 drm_syncobj_put(out_sync);
/*
 * lima_gem_wait() - wait for the fences on a BO's reservation object.
 * @file: DRM file owning the handle.
 * @handle: GEM handle of the BO to wait on.
 * @op: wait flags; LIMA_GEM_WAIT_WRITE selects the write variant of the wait.
 * @timeout_ns: timeout handed to drm_timeout_abs_to_jiffies(), i.e. treated
 *              as an absolute time in nanoseconds.
 *
 * Return: the result of drm_gem_dma_resv_wait(), except on one path (its
 * condition is omitted from this listing) where it is rewritten to
 * -ETIMEDOUT when a non-zero timeout was given and to -EBUSY for a zero
 * timeout.
 */
399 int lima_gem_wait(struct drm_file *file, u32 handle, u32 op, s64 timeout_ns)
401 bool write = op & LIMA_GEM_WAIT_WRITE;
407 timeout = drm_timeout_abs_to_jiffies(timeout_ns);
409 ret = drm_gem_dma_resv_wait(file, handle, write, timeout);
/* A zero timeout is reported as "busy" rather than "timed out". */
411 ret = timeout ? -ETIMEDOUT : -EBUSY;