/*
 * Copyright 2015 Advanced Micro Devices, Inc.
 * All Rights Reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sub license, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
 * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
 * USE OR OTHER DEALINGS IN THE SOFTWARE.
 *
 * The above copyright notice and this permission notice (including the
 * next paragraph) shall be included in all copies or substantial portions
 * of the Software.
 *
 */
/*
 * Authors:
 *    Christian König <deathsimple@vodafone.de>
 */
30d38ceaf9SAlex Deucher 
31fdf2f6c5SSam Ravnborg #include <linux/uaccess.h>
32fdf2f6c5SSam Ravnborg 
33d38ceaf9SAlex Deucher #include "amdgpu.h"
34ec74407aSChristian König #include "amdgpu_trace.h"
35d38ceaf9SAlex Deucher 
/* Largest priority kept for a list entry; bigger user values are clamped. */
#define AMDGPU_BO_LIST_MAX_PRIORITY	32u
/* One sort bucket for each priority in 0..AMDGPU_BO_LIST_MAX_PRIORITY. */
#define AMDGPU_BO_LIST_NUM_BUCKETS	(1u + AMDGPU_BO_LIST_MAX_PRIORITY)
38636ce25cSChristian König 
39920990cbSChristian König static void amdgpu_bo_list_free_rcu(struct rcu_head *rcu)
40920990cbSChristian König {
41920990cbSChristian König 	struct amdgpu_bo_list *list = container_of(rcu, struct amdgpu_bo_list,
42920990cbSChristian König 						   rhead);
4399eea4dfSAlex Xie 
44920990cbSChristian König 	kvfree(list);
45920990cbSChristian König }
46920990cbSChristian König 
47920990cbSChristian König static void amdgpu_bo_list_free(struct kref *ref)
485ac55629SAlex Xie {
495ac55629SAlex Xie 	struct amdgpu_bo_list *list = container_of(ref, struct amdgpu_bo_list,
505ac55629SAlex Xie 						   refcount);
5139f7f69aSChristian König 	struct amdgpu_bo_list_entry *e;
525ac55629SAlex Xie 
53e83dfe4dSChristian König 	amdgpu_bo_list_for_each_entry(e, list) {
54e83dfe4dSChristian König 		struct amdgpu_bo *bo = ttm_to_amdgpu_bo(e->tv.bo);
55e83dfe4dSChristian König 
56e83dfe4dSChristian König 		amdgpu_bo_unref(&bo);
57e83dfe4dSChristian König 	}
585ac55629SAlex Xie 
59920990cbSChristian König 	call_rcu(&list->rhead, amdgpu_bo_list_free_rcu);
605ac55629SAlex Xie }
615ac55629SAlex Xie 
62920990cbSChristian König int amdgpu_bo_list_create(struct amdgpu_device *adev, struct drm_file *filp,
6399eea4dfSAlex Xie 			  struct drm_amdgpu_bo_list_entry *info,
64920990cbSChristian König 			  unsigned num_entries, struct amdgpu_bo_list **result)
65d38ceaf9SAlex Deucher {
66211dff55SChristian König 	unsigned last_entry = 0, first_userptr = num_entries;
67920990cbSChristian König 	struct amdgpu_bo_list_entry *array;
68920990cbSChristian König 	struct amdgpu_bo_list *list;
69275105ceSChristian König 	uint64_t total_size = 0;
70920990cbSChristian König 	size_t size;
71d38ceaf9SAlex Deucher 	unsigned i;
72cc325d19SChristian König 	int r;
73d38ceaf9SAlex Deucher 
74ff30e9e8SDan Carpenter 	if (num_entries > (SIZE_MAX - sizeof(struct amdgpu_bo_list))
75ff30e9e8SDan Carpenter 				/ sizeof(struct amdgpu_bo_list_entry))
76920990cbSChristian König 		return -EINVAL;
77920990cbSChristian König 
78920990cbSChristian König 	size = sizeof(struct amdgpu_bo_list);
79920990cbSChristian König 	size += num_entries * sizeof(struct amdgpu_bo_list_entry);
80920990cbSChristian König 	list = kvmalloc(size, GFP_KERNEL);
81920990cbSChristian König 	if (!list)
82d38ceaf9SAlex Deucher 		return -ENOMEM;
83920990cbSChristian König 
84920990cbSChristian König 	kref_init(&list->refcount);
85dca29491SChristian König 	list->gds_obj = NULL;
86dca29491SChristian König 	list->gws_obj = NULL;
87dca29491SChristian König 	list->oa_obj = NULL;
88920990cbSChristian König 
89920990cbSChristian König 	array = amdgpu_bo_list_array_entry(list, 0);
90d38ceaf9SAlex Deucher 	memset(array, 0, num_entries * sizeof(struct amdgpu_bo_list_entry));
91d38ceaf9SAlex Deucher 
92d38ceaf9SAlex Deucher 	for (i = 0; i < num_entries; ++i) {
93211dff55SChristian König 		struct amdgpu_bo_list_entry *entry;
94d38ceaf9SAlex Deucher 		struct drm_gem_object *gobj;
95211dff55SChristian König 		struct amdgpu_bo *bo;
96cc325d19SChristian König 		struct mm_struct *usermm;
97d38ceaf9SAlex Deucher 
98a8ad0bd8SChris Wilson 		gobj = drm_gem_object_lookup(filp, info[i].bo_handle);
99cc325d19SChristian König 		if (!gobj) {
100cc325d19SChristian König 			r = -ENOENT;
101d38ceaf9SAlex Deucher 			goto error_free;
102cc325d19SChristian König 		}
103d38ceaf9SAlex Deucher 
104211dff55SChristian König 		bo = amdgpu_bo_ref(gem_to_amdgpu_bo(gobj));
105f62facc2SCihangir Akturk 		drm_gem_object_put_unlocked(gobj);
106211dff55SChristian König 
107211dff55SChristian König 		usermm = amdgpu_ttm_tt_get_usermm(bo->tbo.ttm);
108cc325d19SChristian König 		if (usermm) {
109cc325d19SChristian König 			if (usermm != current->mm) {
110211dff55SChristian König 				amdgpu_bo_unref(&bo);
111cc325d19SChristian König 				r = -EPERM;
112cc325d19SChristian König 				goto error_free;
113cc325d19SChristian König 			}
114211dff55SChristian König 			entry = &array[--first_userptr];
115211dff55SChristian König 		} else {
116211dff55SChristian König 			entry = &array[last_entry++];
117cc325d19SChristian König 		}
118211dff55SChristian König 
119211dff55SChristian König 		entry->priority = min(info[i].bo_priority,
120211dff55SChristian König 				      AMDGPU_BO_LIST_MAX_PRIORITY);
121e83dfe4dSChristian König 		entry->tv.bo = &bo->tbo;
122d38ceaf9SAlex Deucher 
123e83dfe4dSChristian König 		if (bo->preferred_domains == AMDGPU_GEM_DOMAIN_GDS)
124e83dfe4dSChristian König 			list->gds_obj = bo;
125e83dfe4dSChristian König 		if (bo->preferred_domains == AMDGPU_GEM_DOMAIN_GWS)
126e83dfe4dSChristian König 			list->gws_obj = bo;
127e83dfe4dSChristian König 		if (bo->preferred_domains == AMDGPU_GEM_DOMAIN_OA)
128e83dfe4dSChristian König 			list->oa_obj = bo;
129ec74407aSChristian König 
130e83dfe4dSChristian König 		total_size += amdgpu_bo_size(bo);
131e83dfe4dSChristian König 		trace_amdgpu_bo_list_set(list, bo);
132d38ceaf9SAlex Deucher 	}
133d38ceaf9SAlex Deucher 
134211dff55SChristian König 	list->first_userptr = first_userptr;
135d38ceaf9SAlex Deucher 	list->num_entries = num_entries;
136d38ceaf9SAlex Deucher 
13715da301dSDavid Mao 	trace_amdgpu_cs_bo_status(list->num_entries, total_size);
138920990cbSChristian König 
139920990cbSChristian König 	*result = list;
140d38ceaf9SAlex Deucher 	return 0;
141d38ceaf9SAlex Deucher 
142d38ceaf9SAlex Deucher error_free:
143e83dfe4dSChristian König 	while (i--) {
144e83dfe4dSChristian König 		struct amdgpu_bo *bo = ttm_to_amdgpu_bo(array[i].tv.bo);
145e83dfe4dSChristian König 
146e83dfe4dSChristian König 		amdgpu_bo_unref(&bo);
147e83dfe4dSChristian König 	}
148920990cbSChristian König 	kvfree(list);
149cc325d19SChristian König 	return r;
150920990cbSChristian König 
151920990cbSChristian König }
152920990cbSChristian König 
153920990cbSChristian König static void amdgpu_bo_list_destroy(struct amdgpu_fpriv *fpriv, int id)
154920990cbSChristian König {
155920990cbSChristian König 	struct amdgpu_bo_list *list;
156920990cbSChristian König 
157920990cbSChristian König 	mutex_lock(&fpriv->bo_list_lock);
158920990cbSChristian König 	list = idr_remove(&fpriv->bo_list_handles, id);
159920990cbSChristian König 	mutex_unlock(&fpriv->bo_list_lock);
160920990cbSChristian König 	if (list)
161920990cbSChristian König 		kref_put(&list->refcount, amdgpu_bo_list_free);
162d38ceaf9SAlex Deucher }
163d38ceaf9SAlex Deucher 
16452c054caSChristian König int amdgpu_bo_list_get(struct amdgpu_fpriv *fpriv, int id,
16552c054caSChristian König 		       struct amdgpu_bo_list **result)
166d38ceaf9SAlex Deucher {
1675ac55629SAlex Xie 	rcu_read_lock();
16852c054caSChristian König 	*result = idr_find(&fpriv->bo_list_handles, id);
1695ac55629SAlex Xie 
17052c054caSChristian König 	if (*result && kref_get_unless_zero(&(*result)->refcount)) {
171564f0458SAlex Xie 		rcu_read_unlock();
17252c054caSChristian König 		return 0;
173564f0458SAlex Xie 	}
1745ac55629SAlex Xie 
17552c054caSChristian König 	rcu_read_unlock();
17652c054caSChristian König 	return -ENOENT;
177d38ceaf9SAlex Deucher }
178d38ceaf9SAlex Deucher 
179636ce25cSChristian König void amdgpu_bo_list_get_list(struct amdgpu_bo_list *list,
180636ce25cSChristian König 			     struct list_head *validated)
181636ce25cSChristian König {
182636ce25cSChristian König 	/* This is based on the bucket sort with O(n) time complexity.
183636ce25cSChristian König 	 * An item with priority "i" is added to bucket[i]. The lists are then
184636ce25cSChristian König 	 * concatenated in descending order.
185636ce25cSChristian König 	 */
186636ce25cSChristian König 	struct list_head bucket[AMDGPU_BO_LIST_NUM_BUCKETS];
18739f7f69aSChristian König 	struct amdgpu_bo_list_entry *e;
188636ce25cSChristian König 	unsigned i;
189636ce25cSChristian König 
190636ce25cSChristian König 	for (i = 0; i < AMDGPU_BO_LIST_NUM_BUCKETS; i++)
191636ce25cSChristian König 		INIT_LIST_HEAD(&bucket[i]);
192636ce25cSChristian König 
193636ce25cSChristian König 	/* Since buffers which appear sooner in the relocation list are
194636ce25cSChristian König 	 * likely to be used more often than buffers which appear later
195636ce25cSChristian König 	 * in the list, the sort mustn't change the ordering of buffers
196636ce25cSChristian König 	 * with the same priority, i.e. it must be stable.
197636ce25cSChristian König 	 */
19839f7f69aSChristian König 	amdgpu_bo_list_for_each_entry(e, list) {
199e83dfe4dSChristian König 		struct amdgpu_bo *bo = ttm_to_amdgpu_bo(e->tv.bo);
20039f7f69aSChristian König 		unsigned priority = e->priority;
201636ce25cSChristian König 
202e83dfe4dSChristian König 		if (!bo->parent)
20339f7f69aSChristian König 			list_add_tail(&e->tv.head, &bucket[priority]);
204a20ee0b1SBas Nieuwenhuizen 
20539f7f69aSChristian König 		e->user_pages = NULL;
206636ce25cSChristian König 	}
207636ce25cSChristian König 
208636ce25cSChristian König 	/* Connect the sorted buckets in the output list. */
209636ce25cSChristian König 	for (i = 0; i < AMDGPU_BO_LIST_NUM_BUCKETS; i++)
210636ce25cSChristian König 		list_splice(&bucket[i], validated);
211636ce25cSChristian König }
212636ce25cSChristian König 
213d38ceaf9SAlex Deucher void amdgpu_bo_list_put(struct amdgpu_bo_list *list)
214d38ceaf9SAlex Deucher {
215920990cbSChristian König 	kref_put(&list->refcount, amdgpu_bo_list_free);
216d38ceaf9SAlex Deucher }
217d38ceaf9SAlex Deucher 
218964d0fbfSAndrey Grodzovsky int amdgpu_bo_create_list_entry_array(struct drm_amdgpu_bo_list_in *in,
219964d0fbfSAndrey Grodzovsky 				      struct drm_amdgpu_bo_list_entry **info_param)
220d38ceaf9SAlex Deucher {
221964d0fbfSAndrey Grodzovsky 	const void __user *uptr = u64_to_user_ptr(in->bo_info_ptr);
222d38ceaf9SAlex Deucher 	const uint32_t info_size = sizeof(struct drm_amdgpu_bo_list_entry);
223d38ceaf9SAlex Deucher 	struct drm_amdgpu_bo_list_entry *info;
224d38ceaf9SAlex Deucher 	int r;
225d38ceaf9SAlex Deucher 
226964d0fbfSAndrey Grodzovsky 	info = kvmalloc_array(in->bo_number, info_size, GFP_KERNEL);
227d38ceaf9SAlex Deucher 	if (!info)
228d38ceaf9SAlex Deucher 		return -ENOMEM;
229d38ceaf9SAlex Deucher 
230d38ceaf9SAlex Deucher 	/* copy the handle array from userspace to a kernel buffer */
231d38ceaf9SAlex Deucher 	r = -EFAULT;
232964d0fbfSAndrey Grodzovsky 	if (likely(info_size == in->bo_info_size)) {
233964d0fbfSAndrey Grodzovsky 		unsigned long bytes = in->bo_number *
234964d0fbfSAndrey Grodzovsky 			in->bo_info_size;
235d38ceaf9SAlex Deucher 
236d38ceaf9SAlex Deucher 		if (copy_from_user(info, uptr, bytes))
237d38ceaf9SAlex Deucher 			goto error_free;
238d38ceaf9SAlex Deucher 
239d38ceaf9SAlex Deucher 	} else {
240964d0fbfSAndrey Grodzovsky 		unsigned long bytes = min(in->bo_info_size, info_size);
241d38ceaf9SAlex Deucher 		unsigned i;
242d38ceaf9SAlex Deucher 
243964d0fbfSAndrey Grodzovsky 		memset(info, 0, in->bo_number * info_size);
244964d0fbfSAndrey Grodzovsky 		for (i = 0; i < in->bo_number; ++i) {
245d38ceaf9SAlex Deucher 			if (copy_from_user(&info[i], uptr, bytes))
246d38ceaf9SAlex Deucher 				goto error_free;
247d38ceaf9SAlex Deucher 
248964d0fbfSAndrey Grodzovsky 			uptr += in->bo_info_size;
249d38ceaf9SAlex Deucher 		}
250d38ceaf9SAlex Deucher 	}
251d38ceaf9SAlex Deucher 
252964d0fbfSAndrey Grodzovsky 	*info_param = info;
253964d0fbfSAndrey Grodzovsky 	return 0;
254964d0fbfSAndrey Grodzovsky 
255964d0fbfSAndrey Grodzovsky error_free:
256964d0fbfSAndrey Grodzovsky 	kvfree(info);
257964d0fbfSAndrey Grodzovsky 	return r;
258964d0fbfSAndrey Grodzovsky }
259964d0fbfSAndrey Grodzovsky 
260964d0fbfSAndrey Grodzovsky int amdgpu_bo_list_ioctl(struct drm_device *dev, void *data,
261964d0fbfSAndrey Grodzovsky 				struct drm_file *filp)
262964d0fbfSAndrey Grodzovsky {
263964d0fbfSAndrey Grodzovsky 	struct amdgpu_device *adev = dev->dev_private;
264964d0fbfSAndrey Grodzovsky 	struct amdgpu_fpriv *fpriv = filp->driver_priv;
265964d0fbfSAndrey Grodzovsky 	union drm_amdgpu_bo_list *args = data;
266964d0fbfSAndrey Grodzovsky 	uint32_t handle = args->in.list_handle;
267964d0fbfSAndrey Grodzovsky 	struct drm_amdgpu_bo_list_entry *info = NULL;
26881c6dabcSChristian König 	struct amdgpu_bo_list *list, *old;
269964d0fbfSAndrey Grodzovsky 	int r;
270964d0fbfSAndrey Grodzovsky 
271964d0fbfSAndrey Grodzovsky 	r = amdgpu_bo_create_list_entry_array(&args->in, &info);
272964d0fbfSAndrey Grodzovsky 	if (r)
273083164dbSNirmoy Das 		return r;
274964d0fbfSAndrey Grodzovsky 
275d38ceaf9SAlex Deucher 	switch (args->in.operation) {
276d38ceaf9SAlex Deucher 	case AMDGPU_BO_LIST_OP_CREATE:
27799eea4dfSAlex Xie 		r = amdgpu_bo_list_create(adev, filp, info, args->in.bo_number,
278964d0fbfSAndrey Grodzovsky 					  &list);
279d38ceaf9SAlex Deucher 		if (r)
280d38ceaf9SAlex Deucher 			goto error_free;
281964d0fbfSAndrey Grodzovsky 
282964d0fbfSAndrey Grodzovsky 		mutex_lock(&fpriv->bo_list_lock);
283964d0fbfSAndrey Grodzovsky 		r = idr_alloc(&fpriv->bo_list_handles, list, 1, 0, GFP_KERNEL);
284964d0fbfSAndrey Grodzovsky 		mutex_unlock(&fpriv->bo_list_lock);
285964d0fbfSAndrey Grodzovsky 		if (r < 0) {
286083164dbSNirmoy Das 			goto error_put_list;
287964d0fbfSAndrey Grodzovsky 		}
288964d0fbfSAndrey Grodzovsky 
289964d0fbfSAndrey Grodzovsky 		handle = r;
290d38ceaf9SAlex Deucher 		break;
291d38ceaf9SAlex Deucher 
292d38ceaf9SAlex Deucher 	case AMDGPU_BO_LIST_OP_DESTROY:
293d38ceaf9SAlex Deucher 		amdgpu_bo_list_destroy(fpriv, handle);
294d38ceaf9SAlex Deucher 		handle = 0;
295d38ceaf9SAlex Deucher 		break;
296d38ceaf9SAlex Deucher 
297d38ceaf9SAlex Deucher 	case AMDGPU_BO_LIST_OP_UPDATE:
29881c6dabcSChristian König 		r = amdgpu_bo_list_create(adev, filp, info, args->in.bo_number,
29981c6dabcSChristian König 					  &list);
30052c054caSChristian König 		if (r)
301d38ceaf9SAlex Deucher 			goto error_free;
302d38ceaf9SAlex Deucher 
30381c6dabcSChristian König 		mutex_lock(&fpriv->bo_list_lock);
30481c6dabcSChristian König 		old = idr_replace(&fpriv->bo_list_handles, list, handle);
30581c6dabcSChristian König 		mutex_unlock(&fpriv->bo_list_lock);
30681c6dabcSChristian König 
30781c6dabcSChristian König 		if (IS_ERR(old)) {
30881c6dabcSChristian König 			r = PTR_ERR(old);
309083164dbSNirmoy Das 			goto error_put_list;
31081c6dabcSChristian König 		}
311d38ceaf9SAlex Deucher 
31281c6dabcSChristian König 		amdgpu_bo_list_put(old);
313d38ceaf9SAlex Deucher 		break;
314d38ceaf9SAlex Deucher 
315d38ceaf9SAlex Deucher 	default:
316d38ceaf9SAlex Deucher 		r = -EINVAL;
317d38ceaf9SAlex Deucher 		goto error_free;
318d38ceaf9SAlex Deucher 	}
319d38ceaf9SAlex Deucher 
320d38ceaf9SAlex Deucher 	memset(args, 0, sizeof(*args));
321d38ceaf9SAlex Deucher 	args->out.list_handle = handle;
3222098105eSMichal Hocko 	kvfree(info);
323d38ceaf9SAlex Deucher 
324d38ceaf9SAlex Deucher 	return 0;
325d38ceaf9SAlex Deucher 
326083164dbSNirmoy Das error_put_list:
327083164dbSNirmoy Das 	amdgpu_bo_list_put(list);
328083164dbSNirmoy Das 
329d38ceaf9SAlex Deucher error_free:
3302098105eSMichal Hocko 	kvfree(info);
331d38ceaf9SAlex Deucher 	return r;
332d38ceaf9SAlex Deucher }
333