1d38ceaf9SAlex Deucher /* 2d38ceaf9SAlex Deucher * Copyright 2015 Advanced Micro Devices, Inc. 3d38ceaf9SAlex Deucher * All Rights Reserved. 4d38ceaf9SAlex Deucher * 5d38ceaf9SAlex Deucher * Permission is hereby granted, free of charge, to any person obtaining a 6d38ceaf9SAlex Deucher * copy of this software and associated documentation files (the 7d38ceaf9SAlex Deucher * "Software"), to deal in the Software without restriction, including 8d38ceaf9SAlex Deucher * without limitation the rights to use, copy, modify, merge, publish, 9d38ceaf9SAlex Deucher * distribute, sub license, and/or sell copies of the Software, and to 10d38ceaf9SAlex Deucher * permit persons to whom the Software is furnished to do so, subject to 11d38ceaf9SAlex Deucher * the following conditions: 12d38ceaf9SAlex Deucher * 13d38ceaf9SAlex Deucher * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 14d38ceaf9SAlex Deucher * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 15d38ceaf9SAlex Deucher * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL 16d38ceaf9SAlex Deucher * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, 17d38ceaf9SAlex Deucher * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR 18d38ceaf9SAlex Deucher * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE 19d38ceaf9SAlex Deucher * USE OR OTHER DEALINGS IN THE SOFTWARE. 20d38ceaf9SAlex Deucher * 21d38ceaf9SAlex Deucher * The above copyright notice and this permission notice (including the 22d38ceaf9SAlex Deucher * next paragraph) shall be included in all copies or substantial portions 23d38ceaf9SAlex Deucher * of the Software. 24d38ceaf9SAlex Deucher * 25d38ceaf9SAlex Deucher */ 26d38ceaf9SAlex Deucher /* 27d38ceaf9SAlex Deucher * Authors: 28d38ceaf9SAlex Deucher * Christian König <deathsimple@vodafone.de> 29d38ceaf9SAlex Deucher */ 30d38ceaf9SAlex Deucher 31fdf2f6c5SSam Ravnborg #include <linux/uaccess.h> 32fdf2f6c5SSam Ravnborg 33d38ceaf9SAlex Deucher #include "amdgpu.h" 34ec74407aSChristian König #include "amdgpu_trace.h" 35d38ceaf9SAlex Deucher 36636ce25cSChristian König #define AMDGPU_BO_LIST_MAX_PRIORITY 32u 37636ce25cSChristian König #define AMDGPU_BO_LIST_NUM_BUCKETS (AMDGPU_BO_LIST_MAX_PRIORITY + 1) 38636ce25cSChristian König 39920990cbSChristian König static void amdgpu_bo_list_free_rcu(struct rcu_head *rcu) 40920990cbSChristian König { 41920990cbSChristian König struct amdgpu_bo_list *list = container_of(rcu, struct amdgpu_bo_list, 42920990cbSChristian König rhead); 4399eea4dfSAlex Xie 44920990cbSChristian König kvfree(list); 45920990cbSChristian König } 46920990cbSChristian König 47920990cbSChristian König static void amdgpu_bo_list_free(struct kref *ref) 485ac55629SAlex Xie { 495ac55629SAlex Xie struct amdgpu_bo_list *list = container_of(ref, struct amdgpu_bo_list, 505ac55629SAlex Xie refcount); 5139f7f69aSChristian König struct amdgpu_bo_list_entry *e; 525ac55629SAlex Xie 53e83dfe4dSChristian König amdgpu_bo_list_for_each_entry(e, list) { 54e83dfe4dSChristian König struct amdgpu_bo *bo = ttm_to_amdgpu_bo(e->tv.bo); 55e83dfe4dSChristian König 56e83dfe4dSChristian König amdgpu_bo_unref(&bo); 57e83dfe4dSChristian König } 585ac55629SAlex Xie 59920990cbSChristian König call_rcu(&list->rhead, amdgpu_bo_list_free_rcu); 605ac55629SAlex Xie } 615ac55629SAlex Xie 62920990cbSChristian König int amdgpu_bo_list_create(struct amdgpu_device *adev, struct drm_file *filp, 6399eea4dfSAlex Xie struct drm_amdgpu_bo_list_entry *info, 64920990cbSChristian König unsigned num_entries, struct amdgpu_bo_list **result) 65d38ceaf9SAlex Deucher { 66211dff55SChristian König unsigned last_entry = 0, first_userptr = num_entries; 67920990cbSChristian König struct amdgpu_bo_list_entry *array; 68920990cbSChristian König struct amdgpu_bo_list *list; 69275105ceSChristian König uint64_t total_size = 0; 70920990cbSChristian König size_t size; 71d38ceaf9SAlex Deucher unsigned i; 72cc325d19SChristian König int r; 73d38ceaf9SAlex Deucher 74ff30e9e8SDan Carpenter if (num_entries > (SIZE_MAX - sizeof(struct amdgpu_bo_list)) 75ff30e9e8SDan Carpenter / sizeof(struct amdgpu_bo_list_entry)) 76920990cbSChristian König return -EINVAL; 77920990cbSChristian König 78920990cbSChristian König size = sizeof(struct amdgpu_bo_list); 79920990cbSChristian König size += num_entries * sizeof(struct amdgpu_bo_list_entry); 80920990cbSChristian König list = kvmalloc(size, GFP_KERNEL); 81920990cbSChristian König if (!list) 82d38ceaf9SAlex Deucher return -ENOMEM; 83920990cbSChristian König 84920990cbSChristian König kref_init(&list->refcount); 85dca29491SChristian König list->gds_obj = NULL; 86dca29491SChristian König list->gws_obj = NULL; 87dca29491SChristian König list->oa_obj = NULL; 88920990cbSChristian König 89920990cbSChristian König array = amdgpu_bo_list_array_entry(list, 0); 90d38ceaf9SAlex Deucher memset(array, 0, num_entries * sizeof(struct amdgpu_bo_list_entry)); 91d38ceaf9SAlex Deucher 92d38ceaf9SAlex Deucher for (i = 0; i < num_entries; ++i) { 93211dff55SChristian König struct amdgpu_bo_list_entry *entry; 94d38ceaf9SAlex Deucher struct drm_gem_object *gobj; 95211dff55SChristian König struct amdgpu_bo *bo; 96cc325d19SChristian König struct mm_struct *usermm; 97d38ceaf9SAlex Deucher 98a8ad0bd8SChris Wilson gobj = drm_gem_object_lookup(filp, info[i].bo_handle); 99cc325d19SChristian König if (!gobj) { 100cc325d19SChristian König r = -ENOENT; 101d38ceaf9SAlex Deucher goto error_free; 102cc325d19SChristian König } 103d38ceaf9SAlex Deucher 104211dff55SChristian König bo = amdgpu_bo_ref(gem_to_amdgpu_bo(gobj)); 105f62facc2SCihangir Akturk drm_gem_object_put_unlocked(gobj); 106211dff55SChristian König 107211dff55SChristian König usermm = amdgpu_ttm_tt_get_usermm(bo->tbo.ttm); 108cc325d19SChristian König if (usermm) { 109cc325d19SChristian König if (usermm != current->mm) { 110211dff55SChristian König amdgpu_bo_unref(&bo); 111cc325d19SChristian König r = -EPERM; 112cc325d19SChristian König goto error_free; 113cc325d19SChristian König } 114211dff55SChristian König entry = &array[--first_userptr]; 115211dff55SChristian König } else { 116211dff55SChristian König entry = &array[last_entry++]; 117cc325d19SChristian König } 118211dff55SChristian König 119211dff55SChristian König entry->priority = min(info[i].bo_priority, 120211dff55SChristian König AMDGPU_BO_LIST_MAX_PRIORITY); 121e83dfe4dSChristian König entry->tv.bo = &bo->tbo; 122d38ceaf9SAlex Deucher 123e83dfe4dSChristian König if (bo->preferred_domains == AMDGPU_GEM_DOMAIN_GDS) 124e83dfe4dSChristian König list->gds_obj = bo; 125e83dfe4dSChristian König if (bo->preferred_domains == AMDGPU_GEM_DOMAIN_GWS) 126e83dfe4dSChristian König list->gws_obj = bo; 127e83dfe4dSChristian König if (bo->preferred_domains == AMDGPU_GEM_DOMAIN_OA) 128e83dfe4dSChristian König list->oa_obj = bo; 129ec74407aSChristian König 130e83dfe4dSChristian König total_size += amdgpu_bo_size(bo); 131e83dfe4dSChristian König trace_amdgpu_bo_list_set(list, bo); 132d38ceaf9SAlex Deucher } 133d38ceaf9SAlex Deucher 134211dff55SChristian König list->first_userptr = first_userptr; 135d38ceaf9SAlex Deucher list->num_entries = num_entries; 136d38ceaf9SAlex Deucher 13715da301dSDavid Mao trace_amdgpu_cs_bo_status(list->num_entries, total_size); 138920990cbSChristian König 139920990cbSChristian König *result = list; 140d38ceaf9SAlex Deucher return 0; 141d38ceaf9SAlex Deucher 142d38ceaf9SAlex Deucher error_free: 143e83dfe4dSChristian König while (i--) { 144e83dfe4dSChristian König struct amdgpu_bo *bo = ttm_to_amdgpu_bo(array[i].tv.bo); 145e83dfe4dSChristian König 146e83dfe4dSChristian König amdgpu_bo_unref(&bo); 147e83dfe4dSChristian König } 148920990cbSChristian König kvfree(list); 149cc325d19SChristian König return r; 150920990cbSChristian König 151920990cbSChristian König } 152920990cbSChristian König 153920990cbSChristian König static void amdgpu_bo_list_destroy(struct amdgpu_fpriv *fpriv, int id) 154920990cbSChristian König { 155920990cbSChristian König struct amdgpu_bo_list *list; 156920990cbSChristian König 157920990cbSChristian König mutex_lock(&fpriv->bo_list_lock); 158920990cbSChristian König list = idr_remove(&fpriv->bo_list_handles, id); 159920990cbSChristian König mutex_unlock(&fpriv->bo_list_lock); 160920990cbSChristian König if (list) 161920990cbSChristian König kref_put(&list->refcount, amdgpu_bo_list_free); 162d38ceaf9SAlex Deucher } 163d38ceaf9SAlex Deucher 16452c054caSChristian König int amdgpu_bo_list_get(struct amdgpu_fpriv *fpriv, int id, 16552c054caSChristian König struct amdgpu_bo_list **result) 166d38ceaf9SAlex Deucher { 1675ac55629SAlex Xie rcu_read_lock(); 16852c054caSChristian König *result = idr_find(&fpriv->bo_list_handles, id); 1695ac55629SAlex Xie 17052c054caSChristian König if (*result && kref_get_unless_zero(&(*result)->refcount)) { 171564f0458SAlex Xie rcu_read_unlock(); 17252c054caSChristian König return 0; 173564f0458SAlex Xie } 1745ac55629SAlex Xie 17552c054caSChristian König rcu_read_unlock(); 17652c054caSChristian König return -ENOENT; 177d38ceaf9SAlex Deucher } 178d38ceaf9SAlex Deucher 179636ce25cSChristian König void amdgpu_bo_list_get_list(struct amdgpu_bo_list *list, 180636ce25cSChristian König struct list_head *validated) 181636ce25cSChristian König { 182636ce25cSChristian König /* This is based on the bucket sort with O(n) time complexity. 183636ce25cSChristian König * An item with priority "i" is added to bucket[i]. The lists are then 184636ce25cSChristian König * concatenated in descending order. 185636ce25cSChristian König */ 186636ce25cSChristian König struct list_head bucket[AMDGPU_BO_LIST_NUM_BUCKETS]; 18739f7f69aSChristian König struct amdgpu_bo_list_entry *e; 188636ce25cSChristian König unsigned i; 189636ce25cSChristian König 190636ce25cSChristian König for (i = 0; i < AMDGPU_BO_LIST_NUM_BUCKETS; i++) 191636ce25cSChristian König INIT_LIST_HEAD(&bucket[i]); 192636ce25cSChristian König 193636ce25cSChristian König /* Since buffers which appear sooner in the relocation list are 194636ce25cSChristian König * likely to be used more often than buffers which appear later 195636ce25cSChristian König * in the list, the sort mustn't change the ordering of buffers 196636ce25cSChristian König * with the same priority, i.e. it must be stable. 197636ce25cSChristian König */ 19839f7f69aSChristian König amdgpu_bo_list_for_each_entry(e, list) { 199e83dfe4dSChristian König struct amdgpu_bo *bo = ttm_to_amdgpu_bo(e->tv.bo); 20039f7f69aSChristian König unsigned priority = e->priority; 201636ce25cSChristian König 202e83dfe4dSChristian König if (!bo->parent) 20339f7f69aSChristian König list_add_tail(&e->tv.head, &bucket[priority]); 204a20ee0b1SBas Nieuwenhuizen 20539f7f69aSChristian König e->user_pages = NULL; 206636ce25cSChristian König } 207636ce25cSChristian König 208636ce25cSChristian König /* Connect the sorted buckets in the output list. */ 209636ce25cSChristian König for (i = 0; i < AMDGPU_BO_LIST_NUM_BUCKETS; i++) 210636ce25cSChristian König list_splice(&bucket[i], validated); 211636ce25cSChristian König } 212636ce25cSChristian König 213d38ceaf9SAlex Deucher void amdgpu_bo_list_put(struct amdgpu_bo_list *list) 214d38ceaf9SAlex Deucher { 215920990cbSChristian König kref_put(&list->refcount, amdgpu_bo_list_free); 216d38ceaf9SAlex Deucher } 217d38ceaf9SAlex Deucher 218964d0fbfSAndrey Grodzovsky int amdgpu_bo_create_list_entry_array(struct drm_amdgpu_bo_list_in *in, 219964d0fbfSAndrey Grodzovsky struct drm_amdgpu_bo_list_entry **info_param) 220d38ceaf9SAlex Deucher { 221964d0fbfSAndrey Grodzovsky const void __user *uptr = u64_to_user_ptr(in->bo_info_ptr); 222d38ceaf9SAlex Deucher const uint32_t info_size = sizeof(struct drm_amdgpu_bo_list_entry); 223d38ceaf9SAlex Deucher struct drm_amdgpu_bo_list_entry *info; 224d38ceaf9SAlex Deucher int r; 225d38ceaf9SAlex Deucher 226964d0fbfSAndrey Grodzovsky info = kvmalloc_array(in->bo_number, info_size, GFP_KERNEL); 227d38ceaf9SAlex Deucher if (!info) 228d38ceaf9SAlex Deucher return -ENOMEM; 229d38ceaf9SAlex Deucher 230d38ceaf9SAlex Deucher /* copy the handle array from userspace to a kernel buffer */ 231d38ceaf9SAlex Deucher r = -EFAULT; 232964d0fbfSAndrey Grodzovsky if (likely(info_size == in->bo_info_size)) { 233964d0fbfSAndrey Grodzovsky unsigned long bytes = in->bo_number * 234964d0fbfSAndrey Grodzovsky in->bo_info_size; 235d38ceaf9SAlex Deucher 236d38ceaf9SAlex Deucher if (copy_from_user(info, uptr, bytes)) 237d38ceaf9SAlex Deucher goto error_free; 238d38ceaf9SAlex Deucher 239d38ceaf9SAlex Deucher } else { 240964d0fbfSAndrey Grodzovsky unsigned long bytes = min(in->bo_info_size, info_size); 241d38ceaf9SAlex Deucher unsigned i; 242d38ceaf9SAlex Deucher 243964d0fbfSAndrey Grodzovsky memset(info, 0, in->bo_number * info_size); 244964d0fbfSAndrey Grodzovsky for (i = 0; i < in->bo_number; ++i) { 245d38ceaf9SAlex Deucher if (copy_from_user(&info[i], uptr, bytes)) 246d38ceaf9SAlex Deucher goto error_free; 247d38ceaf9SAlex Deucher 248964d0fbfSAndrey Grodzovsky uptr += in->bo_info_size; 249d38ceaf9SAlex Deucher } 250d38ceaf9SAlex Deucher } 251d38ceaf9SAlex Deucher 252964d0fbfSAndrey Grodzovsky *info_param = info; 253964d0fbfSAndrey Grodzovsky return 0; 254964d0fbfSAndrey Grodzovsky 255964d0fbfSAndrey Grodzovsky error_free: 256964d0fbfSAndrey Grodzovsky kvfree(info); 257964d0fbfSAndrey Grodzovsky return r; 258964d0fbfSAndrey Grodzovsky } 259964d0fbfSAndrey Grodzovsky 260964d0fbfSAndrey Grodzovsky int amdgpu_bo_list_ioctl(struct drm_device *dev, void *data, 261964d0fbfSAndrey Grodzovsky struct drm_file *filp) 262964d0fbfSAndrey Grodzovsky { 263964d0fbfSAndrey Grodzovsky struct amdgpu_device *adev = dev->dev_private; 264964d0fbfSAndrey Grodzovsky struct amdgpu_fpriv *fpriv = filp->driver_priv; 265964d0fbfSAndrey Grodzovsky union drm_amdgpu_bo_list *args = data; 266964d0fbfSAndrey Grodzovsky uint32_t handle = args->in.list_handle; 267964d0fbfSAndrey Grodzovsky struct drm_amdgpu_bo_list_entry *info = NULL; 26881c6dabcSChristian König struct amdgpu_bo_list *list, *old; 269964d0fbfSAndrey Grodzovsky int r; 270964d0fbfSAndrey Grodzovsky 271964d0fbfSAndrey Grodzovsky r = amdgpu_bo_create_list_entry_array(&args->in, &info); 272964d0fbfSAndrey Grodzovsky if (r) 273083164dbSNirmoy Das return r; 274964d0fbfSAndrey Grodzovsky 275d38ceaf9SAlex Deucher switch (args->in.operation) { 276d38ceaf9SAlex Deucher case AMDGPU_BO_LIST_OP_CREATE: 27799eea4dfSAlex Xie r = amdgpu_bo_list_create(adev, filp, info, args->in.bo_number, 278964d0fbfSAndrey Grodzovsky &list); 279d38ceaf9SAlex Deucher if (r) 280d38ceaf9SAlex Deucher goto error_free; 281964d0fbfSAndrey Grodzovsky 282964d0fbfSAndrey Grodzovsky mutex_lock(&fpriv->bo_list_lock); 283964d0fbfSAndrey Grodzovsky r = idr_alloc(&fpriv->bo_list_handles, list, 1, 0, GFP_KERNEL); 284964d0fbfSAndrey Grodzovsky mutex_unlock(&fpriv->bo_list_lock); 285964d0fbfSAndrey Grodzovsky if (r < 0) { 286083164dbSNirmoy Das goto error_put_list; 287964d0fbfSAndrey Grodzovsky } 288964d0fbfSAndrey Grodzovsky 289964d0fbfSAndrey Grodzovsky handle = r; 290d38ceaf9SAlex Deucher break; 291d38ceaf9SAlex Deucher 292d38ceaf9SAlex Deucher case AMDGPU_BO_LIST_OP_DESTROY: 293d38ceaf9SAlex Deucher amdgpu_bo_list_destroy(fpriv, handle); 294d38ceaf9SAlex Deucher handle = 0; 295d38ceaf9SAlex Deucher break; 296d38ceaf9SAlex Deucher 297d38ceaf9SAlex Deucher case AMDGPU_BO_LIST_OP_UPDATE: 29881c6dabcSChristian König r = amdgpu_bo_list_create(adev, filp, info, args->in.bo_number, 29981c6dabcSChristian König &list); 30052c054caSChristian König if (r) 301d38ceaf9SAlex Deucher goto error_free; 302d38ceaf9SAlex Deucher 30381c6dabcSChristian König mutex_lock(&fpriv->bo_list_lock); 30481c6dabcSChristian König old = idr_replace(&fpriv->bo_list_handles, list, handle); 30581c6dabcSChristian König mutex_unlock(&fpriv->bo_list_lock); 30681c6dabcSChristian König 30781c6dabcSChristian König if (IS_ERR(old)) { 30881c6dabcSChristian König r = PTR_ERR(old); 309083164dbSNirmoy Das goto error_put_list; 31081c6dabcSChristian König } 311d38ceaf9SAlex Deucher 31281c6dabcSChristian König amdgpu_bo_list_put(old); 313d38ceaf9SAlex Deucher break; 314d38ceaf9SAlex Deucher 315d38ceaf9SAlex Deucher default: 316d38ceaf9SAlex Deucher r = -EINVAL; 317d38ceaf9SAlex Deucher goto error_free; 318d38ceaf9SAlex Deucher } 319d38ceaf9SAlex Deucher 320d38ceaf9SAlex Deucher memset(args, 0, sizeof(*args)); 321d38ceaf9SAlex Deucher args->out.list_handle = handle; 3222098105eSMichal Hocko kvfree(info); 323d38ceaf9SAlex Deucher 324d38ceaf9SAlex Deucher return 0; 325d38ceaf9SAlex Deucher 326083164dbSNirmoy Das error_put_list: 327083164dbSNirmoy Das amdgpu_bo_list_put(list); 328083164dbSNirmoy Das 329d38ceaf9SAlex Deucher error_free: 3302098105eSMichal Hocko kvfree(info); 331d38ceaf9SAlex Deucher return r; 332d38ceaf9SAlex Deucher } 333