/*
 * Copyright 2015 Advanced Micro Devices, Inc.
 * All Rights Reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sub license, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
 * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
 * USE OR OTHER DEALINGS IN THE SOFTWARE.
 *
 * The above copyright notice and this permission notice (including the
 * next paragraph) shall be included in all copies or substantial portions
 * of the Software.
 */
/*
 * Authors:
 *    Christian König <deathsimple@vodafone.de>
 */

#include <drm/drmP.h>
#include "amdgpu.h"
#include "amdgpu_trace.h"

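/* BO priorities handed in by userspace are clamped to
 * AMDGPU_BO_LIST_MAX_PRIORITY, giving AMDGPU_BO_LIST_NUM_BUCKETS
 * buckets for the stable sort in amdgpu_bo_list_get_list().
 */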
#define AMDGPU_BO_LIST_MAX_PRIORITY	32u
#define AMDGPU_BO_LIST_NUM_BUCKETS	(AMDGPU_BO_LIST_MAX_PRIORITY + 1)

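/* Allocate a new amdgpu_bo_list and publish it in the per-file IDR.
 * The new handle is returned through @id and the list is returned with
 * its mutex already held, so the caller can fill it before anyone else
 * can look it up; amdgpu_bo_list_put() releases the mutex.
 */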
static int amdgpu_bo_list_create(struct amdgpu_fpriv *fpriv,
				 struct amdgpu_bo_list **result,
				 int *id)
{
	int r;

	*result = kzalloc(sizeof(struct amdgpu_bo_list), GFP_KERNEL);
	if (!*result)
		return -ENOMEM;

	mutex_lock(&fpriv->bo_list_lock);
	r = idr_alloc(&fpriv->bo_list_handles, *result,
		      1, 0, GFP_KERNEL);
	if (r < 0) {
		mutex_unlock(&fpriv->bo_list_lock);
		kfree(*result);
		return r;
	}
	*id = r;

	mutex_init(&(*result)->lock);
	(*result)->num_entries = 0;
	(*result)->array = NULL;

	mutex_lock(&(*result)->lock);
	mutex_unlock(&fpriv->bo_list_lock);

	return 0;
}

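/* Remove the list identified by @id from the IDR and free it.  The
 * list mutex is taken and dropped again first, which makes sure that a
 * concurrent user returned by amdgpu_bo_list_get() has finished.
 */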
static void amdgpu_bo_list_destroy(struct amdgpu_fpriv *fpriv, int id)
{
	struct amdgpu_bo_list *list;

	mutex_lock(&fpriv->bo_list_lock);
	list = idr_find(&fpriv->bo_list_handles, id);
	if (list) {
		mutex_lock(&list->lock);
		idr_remove(&fpriv->bo_list_handles, id);
		mutex_unlock(&list->lock);
		amdgpu_bo_list_free(list);
	}
	mutex_unlock(&fpriv->bo_list_lock);
}

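/* Replace the contents of @list with the @num_entries buffers described
 * in @info: resolve each GEM handle, clamp the priority, and sort
 * userptr BOs to the end of the array (first_userptr marks where they
 * start).  GDS, GWS and OA buffers are remembered separately.  On error
 * every reference taken so far is dropped again.
 */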
static int amdgpu_bo_list_set(struct amdgpu_device *adev,
			      struct drm_file *filp,
			      struct amdgpu_bo_list *list,
			      struct drm_amdgpu_bo_list_entry *info,
			      unsigned num_entries)
{
	struct amdgpu_bo_list_entry *array;
	struct amdgpu_bo *gds_obj = adev->gds.gds_gfx_bo;
	struct amdgpu_bo *gws_obj = adev->gds.gws_gfx_bo;
	struct amdgpu_bo *oa_obj = adev->gds.oa_gfx_bo;

	unsigned last_entry = 0, first_userptr = num_entries;
	unsigned i;
	int r;
	unsigned long total_size = 0;

	array = drm_malloc_ab(num_entries, sizeof(struct amdgpu_bo_list_entry));
	if (!array)
		return -ENOMEM;
	memset(array, 0, num_entries * sizeof(struct amdgpu_bo_list_entry));

	for (i = 0; i < num_entries; ++i) {
		struct amdgpu_bo_list_entry *entry;
		struct drm_gem_object *gobj;
		struct amdgpu_bo *bo;
		struct mm_struct *usermm;

		gobj = drm_gem_object_lookup(filp, info[i].bo_handle);
		if (!gobj) {
			r = -ENOENT;
			goto error_free;
		}

		bo = amdgpu_bo_ref(gem_to_amdgpu_bo(gobj));
		drm_gem_object_unreference_unlocked(gobj);

		usermm = amdgpu_ttm_tt_get_usermm(bo->tbo.ttm);
		if (usermm) {
			if (usermm != current->mm) {
				amdgpu_bo_unref(&bo);
				r = -EPERM;
				goto error_free;
			}
			entry = &array[--first_userptr];
		} else {
			entry = &array[last_entry++];
		}

		entry->robj = bo;
		entry->priority = min(info[i].bo_priority,
				      AMDGPU_BO_LIST_MAX_PRIORITY);
		entry->tv.bo = &entry->robj->tbo;
		entry->tv.shared = !entry->robj->prime_shared_count;

		if (entry->robj->prefered_domains == AMDGPU_GEM_DOMAIN_GDS)
			gds_obj = entry->robj;
		if (entry->robj->prefered_domains == AMDGPU_GEM_DOMAIN_GWS)
			gws_obj = entry->robj;
		if (entry->robj->prefered_domains == AMDGPU_GEM_DOMAIN_OA)
			oa_obj = entry->robj;

		total_size += amdgpu_bo_size(entry->robj);
		trace_amdgpu_bo_list_set(list, entry->robj);
	}

	for (i = 0; i < list->num_entries; ++i)
		amdgpu_bo_unref(&list->array[i].robj);

	drm_free_large(list->array);

	list->gds_obj = gds_obj;
	list->gws_obj = gws_obj;
	list->oa_obj = oa_obj;
	list->first_userptr = first_userptr;
	list->array = array;
	list->num_entries = num_entries;

	trace_amdgpu_cs_bo_status(list->num_entries, total_size);
	return 0;

error_free:
	while (i--)
		amdgpu_bo_unref(&array[i].robj);
	drm_free_large(array);
	return r;
}

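/* Look up a list by handle and return it with its mutex held, or NULL
 * if the handle is unknown.
 */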
struct amdgpu_bo_list *
amdgpu_bo_list_get(struct amdgpu_fpriv *fpriv, int id)
{
	struct amdgpu_bo_list *result;

	mutex_lock(&fpriv->bo_list_lock);
	result = idr_find(&fpriv->bo_list_handles, id);
	if (result)
		mutex_lock(&result->lock);
	mutex_unlock(&fpriv->bo_list_lock);
	return result;
}

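/* Fill @validated with the entries of @list, bucket-sorted by priority.
 * Entries whose BO has a parent are left off the validation list, and
 * the user_pages pointers are reset as a side effect.
 */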
void amdgpu_bo_list_get_list(struct amdgpu_bo_list *list,
			     struct list_head *validated)
{
	/* This is based on bucket sort with O(n) time complexity.
	 * An item with priority "i" is added to bucket[i]. The lists are then
	 * concatenated in descending order.
	 */
	struct list_head bucket[AMDGPU_BO_LIST_NUM_BUCKETS];
	unsigned i;

	for (i = 0; i < AMDGPU_BO_LIST_NUM_BUCKETS; i++)
		INIT_LIST_HEAD(&bucket[i]);

	/* Since buffers which appear sooner in the relocation list are
	 * likely to be used more often than buffers which appear later
	 * in the list, the sort mustn't change the ordering of buffers
	 * with the same priority, i.e. it must be stable.
	 */
	for (i = 0; i < list->num_entries; i++) {
		unsigned priority = list->array[i].priority;

		if (!list->array[i].robj->parent)
			list_add_tail(&list->array[i].tv.head,
				      &bucket[priority]);

		list->array[i].user_pages = NULL;
	}

	/* Connect the sorted buckets in the output list. */
	for (i = 0; i < AMDGPU_BO_LIST_NUM_BUCKETS; i++)
		list_splice(&bucket[i], validated);
}

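/* Release a list obtained with amdgpu_bo_list_get() or
 * amdgpu_bo_list_create().
 */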
void amdgpu_bo_list_put(struct amdgpu_bo_list *list)
{
	mutex_unlock(&list->lock);
}

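/* Drop all BO references held by @list and free the list itself.  Must
 * only be called once no one can look the list up anymore.
 */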
void amdgpu_bo_list_free(struct amdgpu_bo_list *list)
{
	unsigned i;

	for (i = 0; i < list->num_entries; ++i)
		amdgpu_bo_unref(&list->array[i].robj);

	mutex_destroy(&list->lock);
	drm_free_large(list->array);
	kfree(list);
}

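/* Handler for the AMDGPU_BO_LIST ioctl: copy the bo_info array from
 * userspace, coping with a bo_info_size that differs from the kernel's
 * struct size, then dispatch the CREATE, DESTROY or UPDATE operation
 * and return the list handle in args->out.list_handle.
 */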
int amdgpu_bo_list_ioctl(struct drm_device *dev, void *data,
			 struct drm_file *filp)
{
	const uint32_t info_size = sizeof(struct drm_amdgpu_bo_list_entry);

	struct amdgpu_device *adev = dev->dev_private;
	struct amdgpu_fpriv *fpriv = filp->driver_priv;
	union drm_amdgpu_bo_list *args = data;
	uint32_t handle = args->in.list_handle;
	const void __user *uptr = (const void*)(long)args->in.bo_info_ptr;

	struct drm_amdgpu_bo_list_entry *info;
	struct amdgpu_bo_list *list;

	int r;

	info = drm_malloc_ab(args->in.bo_number,
			     sizeof(struct drm_amdgpu_bo_list_entry));
	if (!info)
		return -ENOMEM;

	/* copy the handle array from userspace to a kernel buffer */
	r = -EFAULT;
	if (likely(info_size == args->in.bo_info_size)) {
		unsigned long bytes = args->in.bo_number *
			args->in.bo_info_size;

		if (copy_from_user(info, uptr, bytes))
			goto error_free;

	} else {
		unsigned long bytes = min(args->in.bo_info_size, info_size);
		unsigned i;

		memset(info, 0, args->in.bo_number * info_size);
		for (i = 0; i < args->in.bo_number; ++i) {
			if (copy_from_user(&info[i], uptr, bytes))
				goto error_free;

			uptr += args->in.bo_info_size;
		}
	}

	switch (args->in.operation) {
	case AMDGPU_BO_LIST_OP_CREATE:
		r = amdgpu_bo_list_create(fpriv, &list, &handle);
		if (r)
			goto error_free;

		r = amdgpu_bo_list_set(adev, filp, list, info,
				       args->in.bo_number);
		amdgpu_bo_list_put(list);
		if (r)
			goto error_free;

		break;

	case AMDGPU_BO_LIST_OP_DESTROY:
		amdgpu_bo_list_destroy(fpriv, handle);
		handle = 0;
		break;

	case AMDGPU_BO_LIST_OP_UPDATE:
		r = -ENOENT;
		list = amdgpu_bo_list_get(fpriv, handle);
		if (!list)
			goto error_free;

		r = amdgpu_bo_list_set(adev, filp, list, info,
				       args->in.bo_number);
		amdgpu_bo_list_put(list);
		if (r)
			goto error_free;

		break;

	default:
		r = -EINVAL;
		goto error_free;
	}

	memset(args, 0, sizeof(*args));
	args->out.list_handle = handle;
	drm_free_large(info);

	return 0;

error_free:
	drm_free_large(info);
	return r;
}