1 // SPDX-License-Identifier: GPL-2.0 OR MIT
5 #include <linux/iosys-map.h>
6 #include <linux/sync_file.h>
7 #include <linux/pagemap.h>
8 #include <linux/shmem_fs.h>
9 #include <linux/dma-mapping.h>
11 #include <drm/drm_file.h>
12 #include <drm/drm_syncobj.h>
13 #include <drm/drm_utils.h>
15 #include <drm/lima_drm.h>
/*
 * lima_heap_alloc - extend the populated part of a heap buffer object.
 * @bo: buffer object whose heap_size, pages and sgt fields are updated here
 * @vm: handed to lima_vm_map_bo(); lima_gem_create_handle() passes NULL
 *
 * The target size is twice the current bo->heap_size, or
 * lima_heap_init_nr_pages pages when heap_size is zero, clamped to
 * bo->base.base.size.  Pages for the newly covered range are read from the
 * object's shmem mapping, a scatter/gather table is built over the page
 * array and DMA-mapped, and bo->heap_size is set to the new size.
 */
21 int lima_heap_alloc(struct lima_bo *bo, struct lima_vm *vm)
24 struct address_space *mapping = bo->base.base.filp->f_mapping;
25 struct device *dev = bo->base.base.dev->dev;
26 size_t old_size = bo->heap_size;
/* Double the heap on each call; an empty heap starts at the initial page count. */
27 size_t new_size = bo->heap_size ? bo->heap_size * 2 :
28 (lima_heap_init_nr_pages << PAGE_SHIFT);
/* True when the heap already spans the whole GEM object. */
32 if (bo->heap_size >= bo->base.base.size)
/* Never grow past the size of the GEM object. */
35 new_size = min(new_size, bo->base.base.size);
/* Take the object's reservation lock; it is released again further down. */
37 dma_resv_lock(bo->base.base.resv, NULL);
/*
 * Either pick up the page array already attached to the object or allocate
 * a zeroed one with a slot for every page of the full object size.
 * NOTE(review): presumably selected by whether bo->base.pages is set - confirm.
 */
40 pages = bo->base.pages;
42 pages = kvmalloc_array(bo->base.base.size >> PAGE_SHIFT,
43 sizeof(*pages), GFP_KERNEL | __GFP_ZERO);
45 dma_resv_unlock(bo->base.base.resv);
/* Attach the new array to the object with a use count of one. */
49 bo->base.pages = pages;
50 bo->base.pages_use_count = 1;
52 mapping_set_unevictable(mapping);
/* Only the page indices in [old_size, new_size) are read from shmem. */
55 for (i = old_size >> PAGE_SHIFT; i < new_size >> PAGE_SHIFT; i++) {
56 struct page *page = shmem_read_mapping_page(mapping, i);
59 dma_resv_unlock(bo->base.base.resv);
65 dma_resv_unlock(bo->base.base.resv);
/* Build a table over the first i pages: new_size bytes starting at offset 0. */
67 ret = sg_alloc_table_from_pages(&sgt, pages, i, 0,
68 new_size, GFP_KERNEL);
/* Tear down the DMA mapping and table currently held in bo->base.sgt. */
73 dma_unmap_sgtable(dev, bo->base.sgt, DMA_BIDIRECTIONAL, 0);
74 sg_free_table(bo->base.sgt);
/* Allocate storage for bo->base.sgt. */
76 bo->base.sgt = kmalloc(sizeof(*bo->base.sgt), GFP_KERNEL);
/* DMA-map the freshly built local table. */
83 ret = dma_map_sgtable(dev, &sgt, DMA_BIDIRECTIONAL, 0);
/*
 * NOTE(review): the third argument is presumably the page offset of the
 * first newly added page - confirm against lima_vm_map_bo().
 */
90 ret = lima_vm_map_bo(vm, bo, old_size >> PAGE_SHIFT);
/* Record the grown heap size. */
95 bo->heap_size = new_size;
/* NOTE(review): looks like error unwinding of the dma_map_sgtable() above - confirm. */
99 dma_unmap_sgtable(dev, &sgt, DMA_BIDIRECTIONAL, 0);
/*
 * lima_gem_create_handle - create a shmem GEM object and a handle for it.
 * @dev: DRM device the object is created on
 * @file: DRM file the handle is created in
 * @size: size passed to drm_gem_shmem_create()
 * @flags: LIMA_BO_FLAG_HEAP is tested to derive is_heap
 * @handle: output, filled in by drm_gem_handle_create()
 *
 * The local reference obtained at creation is dropped before returning, as
 * the handle holds its own reference.
 */
108 int lima_gem_create_handle(struct drm_device *dev, struct drm_file *file,
109 u32 size, u32 flags, u32 *handle)
113 struct drm_gem_shmem_object *shmem;
114 struct drm_gem_object *obj;
116 bool is_heap = flags & LIMA_BO_FLAG_HEAP;
118 shmem = drm_gem_shmem_create(dev, size);
/* Propagate the error encoded in the returned pointer. */
120 return PTR_ERR(shmem);
124 /* Mali Utgard GPU can only support 32bit address space */
/* Adjust the allocation mask of the backing mapping: highmem is cleared. */
125 mask = mapping_gfp_mask(obj->filp->f_mapping);
126 mask &= ~__GFP_HIGHMEM;
128 mapping_set_gfp_mask(obj->filp->f_mapping, mask);
/*
 * Initial heap allocation, with no VM supplied.
 * NOTE(review): presumably only done when is_heap is set - confirm.
 */
131 bo = to_lima_bo(obj);
132 err = lima_heap_alloc(bo, NULL);
/* NOTE(review): presumably the non-heap path, backing pages obtained up front - confirm. */
136 struct sg_table *sgt = drm_gem_shmem_get_pages_sgt(shmem);
144 err = drm_gem_handle_create(file, obj, handle);
147 /* drop reference from allocate - handle holds it now */
148 drm_gem_object_put(obj);
/*
 * .free callback of lima_gem_funcs.  Logs an error if the object's va list
 * is not empty, then releases the object through drm_gem_shmem_free().
 */
153 static void lima_gem_free_object(struct drm_gem_object *obj)
155 struct lima_bo *bo = to_lima_bo(obj);
/* A non-empty va list at free time is reported but does not stop the free. */
157 if (!list_empty(&bo->va))
158 dev_err(obj->dev->dev, "lima gem free bo still has va\n");
160 drm_gem_shmem_free(&bo->base);
/*
 * .open callback of lima_gem_funcs.  Adds the object to the VM of the DRM
 * file given in @file via lima_vm_bo_add() and returns its result.
 */
163 static int lima_gem_object_open(struct drm_gem_object *obj, struct drm_file *file)
165 struct lima_bo *bo = to_lima_bo(obj);
166 struct lima_drm_priv *priv = to_lima_drm_priv(file);
167 struct lima_vm *vm = priv->vm;
/* Note the last argument is true here, whereas lima_gem_submit() passes false. */
169 return lima_vm_bo_add(vm, bo, true);
/*
 * .close callback of lima_gem_funcs.  Counterpart of lima_gem_object_open():
 * calls lima_vm_bo_del() for the object on the VM of the DRM file in @file.
 */
172 static void lima_gem_object_close(struct drm_gem_object *obj, struct drm_file *file)
174 struct lima_bo *bo = to_lima_bo(obj);
175 struct lima_drm_priv *priv = to_lima_drm_priv(file);
176 struct lima_vm *vm = priv->vm;
178 lima_vm_bo_del(vm, bo);
/*
 * Pin handler for lima buffer objects; delegates to the shmem helper
 * drm_gem_shmem_pin_locked() and returns its result.
 * NOTE(review): lines between the declaration and the return are not shown
 * here - confirm whether an extra check precedes the delegation.
 */
181 static int lima_gem_pin(struct drm_gem_object *obj)
183 struct lima_bo *bo = to_lima_bo(obj);
188 return drm_gem_shmem_pin_locked(&bo->base);
/*
 * .vmap callback of lima_gem_funcs; delegates to drm_gem_shmem_vmap() with
 * the caller's @map and returns its result.
 * NOTE(review): lines between the declaration and the return are not shown
 * here - confirm whether an extra check precedes the delegation.
 */
191 static int lima_gem_vmap(struct drm_gem_object *obj, struct iosys_map *map)
193 struct lima_bo *bo = to_lima_bo(obj);
198 return drm_gem_shmem_vmap(&bo->base, map);
/*
 * .mmap callback of lima_gem_funcs; delegates to drm_gem_shmem_mmap() with
 * the caller's @vma and returns its result.
 * NOTE(review): lines between the declaration and the return are not shown
 * here - confirm whether an extra check precedes the delegation.
 */
201 static int lima_gem_mmap(struct drm_gem_object *obj, struct vm_area_struct *vma)
203 struct lima_bo *bo = to_lima_bo(obj);
208 return drm_gem_shmem_mmap(&bo->base, vma);
/*
 * GEM object operations installed on every lima buffer object by
 * lima_gem_create_object().  Entries named lima_gem_* are defined in this
 * file; the drm_gem_shmem_* entries are the shmem helper implementations.
 */
211 static const struct drm_gem_object_funcs lima_gem_funcs = {
212 .free = lima_gem_free_object,
213 .open = lima_gem_object_open,
214 .close = lima_gem_object_close,
215 .print_info = drm_gem_shmem_object_print_info,
217 .unpin = drm_gem_shmem_object_unpin,
218 .get_sg_table = drm_gem_shmem_object_get_sg_table,
219 .vmap = lima_gem_vmap,
220 .vunmap = drm_gem_shmem_object_vunmap,
221 .mmap = lima_gem_mmap,
222 .vm_ops = &drm_gem_shmem_vm_ops,
/*
 * lima_gem_create_object - allocate and initialise a lima buffer object.
 * @dev: DRM device (not referenced by the visible statements)
 * @size: requested size (not referenced by the visible statements)
 *
 * Returns a pointer to the drm_gem_object embedded in the new lima_bo, or
 * ERR_PTR(-ENOMEM).
 */
225 struct drm_gem_object *lima_gem_create_object(struct drm_device *dev, size_t size)
/* Zero-initialised allocation of the driver's BO wrapper. */
229 bo = kzalloc(sizeof(*bo), GFP_KERNEL);
231 return ERR_PTR(-ENOMEM);
/* Set up the BO's lock and its (initially empty) va list. */
233 mutex_init(&bo->lock);
234 INIT_LIST_HEAD(&bo->va);
/* Request write-combined mappings and install the lima GEM callbacks. */
235 bo->base.map_wc = true;
236 bo->base.base.funcs = &lima_gem_funcs;
238 return &bo->base.base;
/*
 * lima_gem_get_info - report the GPU VA and mmap offset of a buffer object.
 * @file: DRM file used for the handle lookup and to select the VM
 * @handle: GEM handle of the object
 * @va: output, set from lima_vm_get_va() for the file's VM
 * @offset: output, set from drm_vma_node_offset_addr() on the object's vma_node
 */
241 int lima_gem_get_info(struct drm_file *file, u32 handle, u32 *va, u64 *offset)
243 struct drm_gem_object *obj;
245 struct lima_drm_priv *priv = to_lima_drm_priv(file);
246 struct lima_vm *vm = priv->vm;
/* Resolve the handle to its GEM object; the reference is put again below. */
248 obj = drm_gem_object_lookup(file, handle);
252 bo = to_lima_bo(obj);
254 *va = lima_vm_get_va(vm, bo);
256 *offset = drm_vma_node_offset_addr(&obj->vma_node);
258 drm_gem_object_put(obj);
/*
 * Prepare one buffer object for a task: reserve a fence slot on the BO's
 * reservation object and add the BO's implicit dependencies to the task's
 * scheduler job.
 * NOTE(review): how @write and @explicit steer this is not visible in the
 * shown lines - confirm against the full function.
 */
262 static int lima_gem_sync_bo(struct lima_sched_task *task, struct lima_bo *bo,
263 bool write, bool explicit)
/* Reserve room for exactly one fence. */
267 err = dma_resv_reserve_fences(lima_bo_resv(bo), 1);
271 /* explicit sync use user passed dep fence */
275 return drm_sched_job_add_implicit_dependencies(&task->base,
/*
 * Add the syncobjs listed in submit->in_sync[] as dependencies of the
 * submit's scheduler job.  Handles are looked up through @file.
 */
280 static int lima_gem_add_deps(struct drm_file *file, struct lima_submit *submit)
/* Walk every slot of the fixed-size in_sync array. */
284 for (i = 0; i < ARRAY_SIZE(submit->in_sync); i++) {
/* A zero entry gets special treatment. NOTE(review): presumably skipped - confirm. */
285 if (!submit->in_sync[i])
288 err = drm_sched_job_add_syncobj_dependency(&submit->task->base, file,
289 submit->in_sync[i], 0);
/*
 * lima_gem_submit - queue the task described by @submit.
 * @file: DRM file used for handle and syncobj lookups and to select the VM
 * @submit: submit description; its lbos array receives the looked-up BOs
 *
 * Visible steps, in order:
 *  - look up the out syncobj when submit->out_sync is non-zero;
 *  - look up every handle in submit->bos[] and call lima_vm_bo_add() on it;
 *  - lock the reservations of all BOs with drm_gem_lock_reservations();
 *  - initialise the scheduler task and add the in_sync dependencies;
 *  - call lima_gem_sync_bo() per BO with the LIMA_SUBMIT_BO_WRITE bit of the
 *    BO and the LIMA_SUBMIT_FLAG_EXPLICIT_FENCE bit of the submit;
 *  - queue the task and add the returned fence to each BO's reservation
 *    object, as WRITE usage when LIMA_SUBMIT_BO_WRITE is set, else READ;
 *  - unlock the reservations, put the looked-up objects, hand the fence to
 *    the out syncobj and put the local fence reference.
 *
 * The statements from lima_sched_task_fini() onward unlock the reservations,
 * call lima_vm_bo_del() and put the objects and the syncobj.
 * NOTE(review): these look like the error-unwind path - confirm.
 */
297 int lima_gem_submit(struct drm_file *file, struct lima_submit *submit)
300 struct ww_acquire_ctx ctx;
301 struct lima_drm_priv *priv = to_lima_drm_priv(file);
302 struct lima_vm *vm = priv->vm;
303 struct drm_syncobj *out_sync = NULL;
304 struct dma_fence *fence;
305 struct lima_bo **bos = submit->lbos;
/* An out syncobj is optional; out_sync stays NULL when none is requested. */
307 if (submit->out_sync) {
308 out_sync = drm_syncobj_find(file, submit->out_sync);
/* Resolve each user-supplied handle to its buffer object. */
313 for (i = 0; i < submit->nr_bos; i++) {
314 struct drm_gem_object *obj;
317 obj = drm_gem_object_lookup(file, submit->bos[i].handle);
323 bo = to_lima_bo(obj);
325 /* increase refcnt of gpu va map to prevent unmapped when executing,
326 * will be decreased when task done
328 err = lima_vm_bo_add(vm, bo, false);
330 drm_gem_object_put(obj);
337 err = drm_gem_lock_reservations((struct drm_gem_object **)bos,
338 submit->nr_bos, &ctx);
342 err = lima_sched_task_init(
343 submit->task, submit->ctx->context + submit->pipe,
344 bos, submit->nr_bos, vm);
348 err = lima_gem_add_deps(file, submit);
352 for (i = 0; i < submit->nr_bos; i++) {
353 err = lima_gem_sync_bo(
354 submit->task, bos[i],
355 submit->bos[i].flags & LIMA_SUBMIT_BO_WRITE,
356 submit->flags & LIMA_SUBMIT_FLAG_EXPLICIT_FENCE);
361 fence = lima_sched_context_queue_task(submit->task);
363 for (i = 0; i < submit->nr_bos; i++) {
364 dma_resv_add_fence(lima_bo_resv(bos[i]), fence,
365 submit->bos[i].flags & LIMA_SUBMIT_BO_WRITE ?
366 DMA_RESV_USAGE_WRITE : DMA_RESV_USAGE_READ);
369 drm_gem_unlock_reservations((struct drm_gem_object **)bos,
370 submit->nr_bos, &ctx);
372 for (i = 0; i < submit->nr_bos; i++)
373 drm_gem_object_put(&bos[i]->base.base);
376 drm_syncobj_replace_fence(out_sync, fence);
377 drm_syncobj_put(out_sync);
380 dma_fence_put(fence);
385 lima_sched_task_fini(submit->task);
387 drm_gem_unlock_reservations((struct drm_gem_object **)bos,
388 submit->nr_bos, &ctx);
390 for (i = 0; i < submit->nr_bos; i++) {
393 lima_vm_bo_del(vm, bos[i]);
394 drm_gem_object_put(&bos[i]->base.base);
397 drm_syncobj_put(out_sync);
/*
 * lima_gem_wait - wait on the reservation object of a buffer object.
 * @file: DRM file used to resolve @handle
 * @handle: GEM handle of the object to wait on
 * @op: wait flags; LIMA_GEM_WAIT_WRITE selects the write variant of the wait
 * @timeout_ns: absolute timeout, converted with drm_timeout_abs_to_jiffies()
 */
401 int lima_gem_wait(struct drm_file *file, u32 handle, u32 op, s64 timeout_ns)
403 bool write = op & LIMA_GEM_WAIT_WRITE;
409 timeout = drm_timeout_abs_to_jiffies(timeout_ns);
411 ret = drm_gem_dma_resv_wait(file, handle, write, timeout);
/*
 * Report -ETIMEDOUT when a non-zero timeout was given and -EBUSY for a zero
 * timeout.
 * NOTE(review): presumably applied only when the wait itself timed out - confirm.
 */
413 ret = timeout ? -ETIMEDOUT : -EBUSY;