2 * Copyright 2015 Advanced Micro Devices, Inc.
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the
7 * "Software"), to deal in the Software without restriction, including
8 * without limitation the rights to use, copy, modify, merge, publish,
9 * distribute, sub license, and/or sell copies of the Software, and to
10 * permit persons to whom the Software is furnished to do so, subject to
11 * the following conditions:
13 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
14 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
15 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
16 * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
17 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
18 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
19 * USE OR OTHER DEALINGS IN THE SOFTWARE.
21 * The above copyright notice and this permission notice (including the
22 * next paragraph) shall be included in all copies or substantial portions
33 #include "amdgpu_trace.h"
/*
 * Upper bound applied to each entry's priority: amdgpu_bo_list_set() stores
 * min(bo_priority, AMDGPU_BO_LIST_MAX_PRIORITY) in the entry.
 */
35 #define AMDGPU_BO_LIST_MAX_PRIORITY 32u
/*
 * Size of the bucket array declared in amdgpu_bo_list_get_list(): one more
 * than the maximum priority, i.e. one slot per value 0..MAX_PRIORITY.
 */
36 #define AMDGPU_BO_LIST_NUM_BUCKETS (AMDGPU_BO_LIST_MAX_PRIORITY + 1)
/*
 * amdgpu_bo_list_create - allocate an empty BO list and register it in the
 * per-file handle table.
 *
 * @fpriv:  per-file private data; supplies bo_list_lock and bo_list_handles
 * @result: receives the zero-initialised list obtained from kzalloc()
 *
 * The ioctl caller also passes &handle as a third argument, presumably to
 * receive the id returned by idr_alloc() - confirm against the full
 * parameter list.
 *
 * The idr insertion and the list initialisation both run under
 * fpriv->bo_list_lock.  The list's own mutex is acquired before
 * bo_list_lock is released and no release of it appears in this function;
 * the CREATE path of amdgpu_bo_list_ioctl() later calls
 * amdgpu_bo_list_put(), which unlocks it.
 */
38 static int amdgpu_bo_list_create(struct amdgpu_fpriv *fpriv,
39 struct amdgpu_bo_list **result,
44 *result = kzalloc(sizeof(struct amdgpu_bo_list), GFP_KERNEL);
/* Handle-table updates are serialised by the per-file bo_list_lock. */
48 mutex_lock(&fpriv->bo_list_lock);
49 r = idr_alloc(&fpriv->bo_list_handles, *result,
/* NOTE(review): presumably the idr_alloc() failure path - confirm. */
52 mutex_unlock(&fpriv->bo_list_lock);
/* Start out empty: no entries and no backing array. */
58 mutex_init(&(*result)->lock);
59 (*result)->num_entries = 0;
60 (*result)->array = NULL;
/* Take the list lock first, then let go of the handle-table lock. */
62 mutex_lock(&(*result)->lock);
63 mutex_unlock(&fpriv->bo_list_lock);
/*
 * amdgpu_bo_list_destroy - remove a BO list from the handle table and free
 * it.
 *
 * @fpriv: per-file private data holding bo_list_lock and bo_list_handles
 * @id:    handle of the list to destroy
 *
 * The whole sequence runs under fpriv->bo_list_lock.
 * NOTE(review): idr_find() returns NULL for an unknown id; the check that
 * should guard the list accesses below is not visible here - confirm.
 */
68 static void amdgpu_bo_list_destroy(struct amdgpu_fpriv *fpriv, int id)
70 struct amdgpu_bo_list *list;
72 mutex_lock(&fpriv->bo_list_lock);
73 list = idr_find(&fpriv->bo_list_handles, id);
/*
 * amdgpu_bo_list_get() hands out lists with list->lock held, so acquiring
 * that lock here waits until any such holder has called
 * amdgpu_bo_list_put() before the handle is removed and the list freed.
 */
75 mutex_lock(&list->lock);
76 idr_remove(&fpriv->bo_list_handles, id);
77 mutex_unlock(&list->lock);
78 amdgpu_bo_list_free(list);
80 mutex_unlock(&fpriv->bo_list_lock);
/*
 * amdgpu_bo_list_set - replace the contents of a BO list with the buffers
 * named by an array of userspace-provided entries.
 *
 * @adev: device; its gds.gds_gfx_bo, gds.gws_gfx_bo and gds.oa_gfx_bo are the
 *        default GDS/GWS/OA objects recorded in the list
 * @filp: DRM file used to resolve each info[i].bo_handle to a GEM object
 * @list: list whose array and bookkeeping fields are replaced
 * @info: kernel copy of the entries; bo_handle and bo_priority are read
 *
 * The number of entries is used below as num_entries (the ioctl passes the
 * entry count after @info).
 *
 * A new entry array is populated first; the references held by the old
 * list->array are dropped and the old array is freed only after that.
 */
83 static int amdgpu_bo_list_set(struct amdgpu_device *adev,
84 struct drm_file *filp,
85 struct amdgpu_bo_list *list,
86 struct drm_amdgpu_bo_list_entry *info,
89 struct amdgpu_bo_list_entry *array;
90 struct amdgpu_bo *gds_obj = adev->gds.gds_gfx_bo;
91 struct amdgpu_bo *gws_obj = adev->gds.gws_gfx_bo;
92 struct amdgpu_bo *oa_obj = adev->gds.oa_gfx_bo;
/*
 * The array is filled from both ends: last_entry advances from the front
 * while first_userptr moves down from num_entries.
 */
94 unsigned last_entry = 0, first_userptr = num_entries;
97 unsigned long total_size = 0;
/* Allocate the replacement array and clear it so every entry starts zeroed. */
99 array = drm_malloc_ab(num_entries, sizeof(struct amdgpu_bo_list_entry));
102 memset(array, 0, num_entries * sizeof(struct amdgpu_bo_list_entry));
104 for (i = 0; i < num_entries; ++i) {
105 struct amdgpu_bo_list_entry *entry;
106 struct drm_gem_object *gobj;
107 struct amdgpu_bo *bo;
108 struct mm_struct *usermm;
110 gobj = drm_gem_object_lookup(filp, info[i].bo_handle);
/*
 * Keep an amdgpu_bo reference for the list, then drop the GEM object
 * reference (presumably the one taken by the lookup above).
 */
116 bo = amdgpu_bo_ref(gem_to_amdgpu_bo(gobj));
117 drm_gem_object_unreference_unlocked(gobj);
119 usermm = amdgpu_ttm_tt_get_usermm(bo->tbo.ttm);
/*
 * A BO whose user mm is not the calling task's mm is released again.
 * NOTE(review): the enclosing condition and what follows the unref are not
 * visible - presumably this only applies to userptr BOs and ends in an
 * error exit; confirm.
 */
121 if (usermm != current->mm) {
122 amdgpu_bo_unref(&bo);
/*
 * Two alternative slots: one taken from the tail (first_userptr) and one
 * from the front (last_entry).  NOTE(review): the selecting condition is
 * not visible - presumably userptr BOs use the tail slot; confirm.
 */
126 entry = &array[--first_userptr];
128 entry = &array[last_entry++];
/* Clamp the requested priority to AMDGPU_BO_LIST_MAX_PRIORITY. */
132 entry->priority = min(info[i].bo_priority,
133 AMDGPU_BO_LIST_MAX_PRIORITY);
134 entry->tv.bo = &entry->robj->tbo;
135 entry->tv.shared = true;
/*
 * An entry whose preferred domain is exactly GDS, GWS or OA replaces the
 * corresponding device default captured at the top of the function.
 */
137 if (entry->robj->prefered_domains == AMDGPU_GEM_DOMAIN_GDS)
138 gds_obj = entry->robj;
139 if (entry->robj->prefered_domains == AMDGPU_GEM_DOMAIN_GWS)
140 gws_obj = entry->robj;
141 if (entry->robj->prefered_domains == AMDGPU_GEM_DOMAIN_OA)
142 oa_obj = entry->robj;
/* Accumulate the total size for the status trace emitted at the end. */
144 total_size += amdgpu_bo_size(entry->robj);
145 trace_amdgpu_bo_list_set(list, entry->robj);
/* Release the references and storage of the list's previous contents. */
148 for (i = 0; i < list->num_entries; ++i)
149 amdgpu_bo_unref(&list->array[i].robj);
151 drm_free_large(list->array);
/* Publish the new bookkeeping values in the list. */
153 list->gds_obj = gds_obj;
154 list->gws_obj = gws_obj;
155 list->oa_obj = oa_obj;
156 list->first_userptr = first_userptr;
158 list->num_entries = num_entries;
160 trace_amdgpu_cs_bo_status(list->num_entries, total_size);
/*
 * NOTE(review): presumably the error exit - drops references already stored
 * in the new array and frees it; the label and loop header are not visible.
 */
165 amdgpu_bo_unref(&array[i].robj);
166 drm_free_large(array);
/*
 * amdgpu_bo_list_get - look up a BO list by handle and lock it.
 *
 * @fpriv: per-file private data holding the handle table
 * @id:    handle to look up in fpriv->bo_list_handles
 *
 * The lookup runs under fpriv->bo_list_lock, and the list's own lock is
 * taken before that lock is dropped.  amdgpu_bo_list_put() releases the
 * list lock again.
 * NOTE(review): idr_find() returns NULL for an unknown id; the check that
 * should guard mutex_lock(&result->lock) is not visible here - confirm.
 */
170 struct amdgpu_bo_list *
171 amdgpu_bo_list_get(struct amdgpu_fpriv *fpriv, int id)
173 struct amdgpu_bo_list *result;
175 mutex_lock(&fpriv->bo_list_lock);
176 result = idr_find(&fpriv->bo_list_handles, id);
178 mutex_lock(&result->lock);
179 mutex_unlock(&fpriv->bo_list_lock);
/*
 * amdgpu_bo_list_get_list - move the list's entries onto a validation list,
 * grouped by priority.
 *
 * @list:      BO list whose array is walked for num_entries elements
 * @validated: list head that receives the entries' tv.head nodes
 *
 * Each entry is queued with list_add_tail(), so entries sharing a bucket
 * keep their array order, and its user_pages pointer is reset to NULL.  The
 * buckets are then joined onto @validated with list_splice(), walking the
 * bucket index upwards.
 * NOTE(review): the list_add_tail() destination is not visible - presumably
 * &bucket[priority]; the priority is clamped to AMDGPU_BO_LIST_MAX_PRIORITY
 * in amdgpu_bo_list_set(), which would keep it inside the bucket array.
 */
183 void amdgpu_bo_list_get_list(struct amdgpu_bo_list *list,
184 struct list_head *validated)
186 /* This is based on the bucket sort with O(n) time complexity.
187 * An item with priority "i" is added to bucket[i]. The lists are then
188 * concatenated in descending order.
190 struct list_head bucket[AMDGPU_BO_LIST_NUM_BUCKETS];
193 for (i = 0; i < AMDGPU_BO_LIST_NUM_BUCKETS; i++)
194 INIT_LIST_HEAD(&bucket[i]);
196 /* Since buffers which appear sooner in the relocation list are
197 * likely to be used more often than buffers which appear later
198 * in the list, the sort mustn't change the ordering of buffers
199 * with the same priority, i.e. it must be stable.
201 for (i = 0; i < list->num_entries; i++) {
202 unsigned priority = list->array[i].priority;
204 list_add_tail(&list->array[i].tv.head,
206 list->array[i].user_pages = NULL;
209 /* Connect the sorted buckets in the output list. */
210 for (i = 0; i < AMDGPU_BO_LIST_NUM_BUCKETS; i++)
211 list_splice(&bucket[i], validated);
/*
 * amdgpu_bo_list_put - release a BO list obtained with its lock held.
 *
 * @list: list whose lock is released
 *
 * Counterpart of amdgpu_bo_list_get() and amdgpu_bo_list_create(), both of
 * which leave list->lock held.
 */
214 void amdgpu_bo_list_put(struct amdgpu_bo_list *list)
216 mutex_unlock(&list->lock);
/*
 * amdgpu_bo_list_free - release the resources owned by a BO list.
 *
 * @list: list to tear down
 *
 * Drops the reference held on every entry's robj, destroys the list mutex
 * and frees the entry array.
 */
219 void amdgpu_bo_list_free(struct amdgpu_bo_list *list)
223 for (i = 0; i < list->num_entries; ++i)
224 amdgpu_bo_unref(&list->array[i].robj);
226 mutex_destroy(&list->lock);
227 drm_free_large(list->array);
/*
 * amdgpu_bo_list_ioctl - create, destroy or update a BO list on behalf of
 * userspace.
 *
 * @dev:  DRM device; dev->dev_private is the amdgpu_device
 * @data: union drm_amdgpu_bo_list; the in.* fields are read and
 *        out.list_handle is written
 * @filp: DRM file; filp->driver_priv is the amdgpu_fpriv owning the handles
 *
 * The entry array at in.bo_info_ptr is copied into a kernel buffer of
 * in.bo_number elements before in.operation is dispatched.
 */
231 int amdgpu_bo_list_ioctl(struct drm_device *dev, void *data,
232 struct drm_file *filp)
/* Size of one entry as this kernel defines it. */
234 const uint32_t info_size = sizeof(struct drm_amdgpu_bo_list_entry);
236 struct amdgpu_device *adev = dev->dev_private;
237 struct amdgpu_fpriv *fpriv = filp->driver_priv;
238 union drm_amdgpu_bo_list *args = data;
/* Captured up front because the argument union is cleared before output. */
239 uint32_t handle = args->in.list_handle;
240 const void __user *uptr = (const void*)(long)args->in.bo_info_ptr;
242 struct drm_amdgpu_bo_list_entry *info;
243 struct amdgpu_bo_list *list;
/* Kernel-side buffer holding in.bo_number entries of the kernel's size. */
247 info = drm_malloc_ab(args->in.bo_number,
248 sizeof(struct drm_amdgpu_bo_list_entry));
252 /* copy the handle array from userspace to a kernel buffer */
/*
 * Fast path: userspace uses the same entry size as the kernel, so the whole
 * array is copied with one copy_from_user().
 * NOTE(review): if bo_number and bo_info_size are both 32-bit, the product
 * below is evaluated in 32 bits before being widened to unsigned long -
 * confirm it cannot wrap for large bo_number.
 */
254 if (likely(info_size == args->in.bo_info_size)) {
255 unsigned long bytes = args->in.bo_number *
256 args->in.bo_info_size;
258 if (copy_from_user(info, uptr, bytes))
/*
 * Presumably the size-mismatch branch: the buffer is zeroed, then each
 * entry is copied separately using the smaller of the two entry sizes,
 * while uptr advances by the userspace entry size.
 */
262 unsigned long bytes = min(args->in.bo_info_size, info_size);
265 memset(info, 0, args->in.bo_number * info_size);
266 for (i = 0; i < args->in.bo_number; ++i) {
267 if (copy_from_user(&info[i], uptr, bytes))
270 uptr += args->in.bo_info_size;
274 switch (args->in.operation) {
/*
 * CREATE: amdgpu_bo_list_create() leaves the new list locked; it is filled
 * by amdgpu_bo_list_set() and unlocked by amdgpu_bo_list_put().
 */
275 case AMDGPU_BO_LIST_OP_CREATE:
276 r = amdgpu_bo_list_create(fpriv, &list, &handle);
280 r = amdgpu_bo_list_set(adev, filp, list, info,
282 amdgpu_bo_list_put(list);
288 case AMDGPU_BO_LIST_OP_DESTROY:
289 amdgpu_bo_list_destroy(fpriv, handle);
/*
 * UPDATE: look up and lock the existing list, replace its contents, then
 * unlock it.
 */
293 case AMDGPU_BO_LIST_OP_UPDATE:
295 list = amdgpu_bo_list_get(fpriv, handle);
299 r = amdgpu_bo_list_set(adev, filp, list, info,
301 amdgpu_bo_list_put(list);
/* Clear the whole argument union, then store the handle in the out view. */
312 memset(args, 0, sizeof(*args));
313 args->out.list_handle = handle;
314 drm_free_large(info);
/* NOTE(review): second free of info - presumably the error exit; confirm. */
319 drm_free_large(info);