drivers/gpu/drm/amd/amdgpu/amdgpu_mn.c

   1 /*
   2  * Copyright 2014 Advanced Micro Devices, Inc.
   3  * All Rights Reserved.
   4  *
   5  * Permission is hereby granted, free of charge, to any person obtaining a
   6  * copy of this software and associated documentation files (the
   7  * "Software"), to deal in the Software without restriction, including
   8  * without limitation the rights to use, copy, modify, merge, publish,
   9  * distribute, sub license, and/or sell copies of the Software, and to
  10  * permit persons to whom the Software is furnished to do so, subject to
  11  * the following conditions:
  12  *
  13  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  14  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  15  * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
  16  * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
  17  * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
  18  * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
  19  * USE OR OTHER DEALINGS IN THE SOFTWARE.
  20  *
  21  * The above copyright notice and this permission notice (including the
  22  * next paragraph) shall be included in all copies or substantial portions
  23  * of the Software.
  24  *
  25  */
  26 /*
  27  * Authors:
  28  *    Christian König <christian.koenig@amd.com>
  29  */
  30
  31 #include <linux/firmware.h>
  32 #include <linux/module.h>
  33 #include <linux/mmu_notifier.h>
  34 #include <linux/interval_tree.h>
  35 #include <drm/drmP.h>
  36 #include <drm/drm.h>
  37
  38 #include "amdgpu.h"
  39
  40 struct amdgpu_mn {
  41         /* constant after initialisation */
  42         struct amdgpu_device    *adev;
  43         struct mm_struct        *mm;
  44         struct mmu_notifier     mn;
  45
  46         /* only used on destruction */
  47         struct work_struct      work;
  48
  49         /* protected by adev->mn_lock */
  50         struct hlist_node       node;
  51
  52         /* objects protected by lock */
  53         struct rw_semaphore     lock;
  54         struct rb_root_cached   objects;
  55         struct mutex            read_lock;
  56         atomic_t                recursion;
  57 };
  58
  59 struct amdgpu_mn_node {
  60         struct interval_tree_node       it;
  61         struct list_head                bos;
  62 };
  63
  64 /**
  65  * amdgpu_mn_destroy - destroy the rmn
  66  *
  67  * @work: previously sheduled work item
  68  *
  69  * Lazy destroys the notifier from a work item
  70  */
  71 static void amdgpu_mn_destroy(struct work_struct *work)
  72 {
  73         struct amdgpu_mn *rmn = container_of(work, struct amdgpu_mn, work);
  74         struct amdgpu_device *adev = rmn->adev;
  75         struct amdgpu_mn_node *node, *next_node;
  76         struct amdgpu_bo *bo, *next_bo;
  77
  78         mutex_lock(&adev->mn_lock);
  79         down_write(&rmn->lock);
  80         hash_del(&rmn->node);
  81         rbtree_postorder_for_each_entry_safe(node, next_node,
  82                                              &rmn->objects.rb_root, it.rb) {
  83                 list_for_each_entry_safe(bo, next_bo, &node->bos, mn_list) {
  84                         bo->mn = NULL;
  85                         list_del_init(&bo->mn_list);
  86                 }
  87                 kfree(node);
  88         }
  89         up_write(&rmn->lock);
  90         mutex_unlock(&adev->mn_lock);
  91         mmu_notifier_unregister_no_release(&rmn->mn, rmn->mm);
  92         kfree(rmn);
  93 }
  94
  95 /**
  96  * amdgpu_mn_release - callback to notify about mm destruction
  97  *
  98  * @mn: our notifier
  99  * @mn: the mm this callback is about
 100  *
 101  * Shedule a work item to lazy destroy our notifier.
 102  */
 103 static void amdgpu_mn_release(struct mmu_notifier *mn,
 104                               struct mm_struct *mm)
 105 {
 106         struct amdgpu_mn *rmn = container_of(mn, struct amdgpu_mn, mn);
 107         INIT_WORK(&rmn->work, amdgpu_mn_destroy);
 108         schedule_work(&rmn->work);
 109 }
 110
 111
 112 /**
 113  * amdgpu_mn_lock - take the write side lock for this mn
 114  */
 115 void amdgpu_mn_lock(struct amdgpu_mn *mn)
 116 {
 117         if (mn)
 118                 down_write(&mn->lock);
 119 }
 120
 121 /**
 122  * amdgpu_mn_unlock - drop the write side lock for this mn
 123  */
 124 void amdgpu_mn_unlock(struct amdgpu_mn *mn)
 125 {
 126         if (mn)
 127                 up_write(&mn->lock);
 128 }
 129
 130 /**
 131  * amdgpu_mn_read_lock - take the rmn read lock
 132  *
 133  * @rmn: our notifier
 134  *
 135  * Take the rmn read side lock.
 136  */
 137 static void amdgpu_mn_read_lock(struct amdgpu_mn *rmn)
 138 {
 139         mutex_lock(&rmn->read_lock);
 140         if (atomic_inc_return(&rmn->recursion) == 1)
 141                 down_read_non_owner(&rmn->lock);
 142         mutex_unlock(&rmn->read_lock);
 143 }
 144
 145 /**
 146  * amdgpu_mn_read_unlock - drop the rmn read lock
 147  *
 148  * @rmn: our notifier
 149  *
 150  * Drop the rmn read side lock.
 151  */
 152 static void amdgpu_mn_read_unlock(struct amdgpu_mn *rmn)
 153 {
 154         if (atomic_dec_return(&rmn->recursion) == 0)
 155                 up_read_non_owner(&rmn->lock);
 156 }
 157
 158 /**
 159  * amdgpu_mn_invalidate_node - unmap all BOs of a node
 160  *
 161  * @node: the node with the BOs to unmap
 162  *
 163  * We block for all BOs and unmap them by move them
 164  * into system domain again.
 165  */
 166 static void amdgpu_mn_invalidate_node(struct amdgpu_mn_node *node,
 167                                       unsigned long start,
 168                                       unsigned long end)
 169 {
 170         struct amdgpu_bo *bo;
 171         long r;
 172
 173         list_for_each_entry(bo, &node->bos, mn_list) {
 174
 175                 if (!amdgpu_ttm_tt_affect_userptr(bo->tbo.ttm, start, end))
 176                         continue;
 177
 178                 r = reservation_object_wait_timeout_rcu(bo->tbo.resv,
 179                         true, false, MAX_SCHEDULE_TIMEOUT);
 180                 if (r <= 0)
 181                         DRM_ERROR("(%ld) failed to wait for user bo\n", r);
 182
 183                 amdgpu_ttm_tt_mark_user_pages(bo->tbo.ttm);
 184         }
 185 }
 186
 187 /**
 188  * amdgpu_mn_invalidate_range_start - callback to notify about mm change
 189  *
 190  * @mn: our notifier
 191  * @mn: the mm this callback is about
 192  * @start: start of updated range
 193  * @end: end of updated range
 194  *
 195  * We block for all BOs between start and end to be idle and
 196  * unmap them by move them into system domain again.
 197  */
 198 static void amdgpu_mn_invalidate_range_start(struct mmu_notifier *mn,
 199                                              struct mm_struct *mm,
 200                                              unsigned long start,
 201                                              unsigned long end)
 202 {
 203         struct amdgpu_mn *rmn = container_of(mn, struct amdgpu_mn, mn);
 204         struct interval_tree_node *it;
 205
 206         /* notification is exclusive, but interval is inclusive */
 207         end -= 1;
 208
 209         amdgpu_mn_read_lock(rmn);
 210
 211         it = interval_tree_iter_first(&rmn->objects, start, end);
 212         while (it) {
 213                 struct amdgpu_mn_node *node;
 214
 215                 node = container_of(it, struct amdgpu_mn_node, it);
 216                 it = interval_tree_iter_next(it, start, end);
 217
 218                 amdgpu_mn_invalidate_node(node, start, end);
 219         }
 220 }
 221
 222 /**
 223  * amdgpu_mn_invalidate_range_end - callback to notify about mm change
 224  *
 225  * @mn: our notifier
 226  * @mn: the mm this callback is about
 227  * @start: start of updated range
 228  * @end: end of updated range
 229  *
 230  * Release the lock again to allow new command submissions.
 231  */
 232 static void amdgpu_mn_invalidate_range_end(struct mmu_notifier *mn,
 233                                            struct mm_struct *mm,
 234                                            unsigned long start,
 235                                            unsigned long end)
 236 {
 237         struct amdgpu_mn *rmn = container_of(mn, struct amdgpu_mn, mn);
 238
 239         amdgpu_mn_read_unlock(rmn);
 240 }
 241
 242 static const struct mmu_notifier_ops amdgpu_mn_ops = {
 243         .release = amdgpu_mn_release,
 244         .invalidate_range_start = amdgpu_mn_invalidate_range_start,
 245         .invalidate_range_end = amdgpu_mn_invalidate_range_end,
 246 };
 247
 248 /**
 249  * amdgpu_mn_get - create notifier context
 250  *
 251  * @adev: amdgpu device pointer
 252  *
 253  * Creates a notifier context for current->mm.
 254  */
 255 struct amdgpu_mn *amdgpu_mn_get(struct amdgpu_device *adev)
 256 {
 257         struct mm_struct *mm = current->mm;
 258         struct amdgpu_mn *rmn;
 259         int r;
 260
 261         mutex_lock(&adev->mn_lock);
 262         if (down_write_killable(&mm->mmap_sem)) {
 263                 mutex_unlock(&adev->mn_lock);
 264                 return ERR_PTR(-EINTR);
 265         }
 266
 267         hash_for_each_possible(adev->mn_hash, rmn, node, (unsigned long)mm)
 268                 if (rmn->mm == mm)
 269                         goto release_locks;
 270
 271         rmn = kzalloc(sizeof(*rmn), GFP_KERNEL);
 272         if (!rmn) {
 273                 rmn = ERR_PTR(-ENOMEM);
 274                 goto release_locks;
 275         }
 276
 277         rmn->adev = adev;
 278         rmn->mm = mm;
 279         rmn->mn.ops = &amdgpu_mn_ops;
 280         init_rwsem(&rmn->lock);
 281         rmn->objects = RB_ROOT_CACHED;
 282         mutex_init(&rmn->read_lock);
 283         atomic_set(&rmn->recursion, 0);
 284
 285         r = __mmu_notifier_register(&rmn->mn, mm);
 286         if (r)
 287                 goto free_rmn;
 288
 289         hash_add(adev->mn_hash, &rmn->node, (unsigned long)mm);
 290
 291 release_locks:
 292         up_write(&mm->mmap_sem);
 293         mutex_unlock(&adev->mn_lock);
 294
 295         return rmn;
 296
 297 free_rmn:
 298         up_write(&mm->mmap_sem);
 299         mutex_unlock(&adev->mn_lock);
 300         kfree(rmn);
 301
 302         return ERR_PTR(r);
 303 }
 304
 305 /**
 306  * amdgpu_mn_register - register a BO for notifier updates
 307  *
 308  * @bo: amdgpu buffer object
 309  * @addr: userptr addr we should monitor
 310  *
 311  * Registers an MMU notifier for the given BO at the specified address.
 312  * Returns 0 on success, -ERRNO if anything goes wrong.
 313  */
 314 int amdgpu_mn_register(struct amdgpu_bo *bo, unsigned long addr)
 315 {
 316         unsigned long end = addr + amdgpu_bo_size(bo) - 1;
 317         struct amdgpu_device *adev = amdgpu_ttm_adev(bo->tbo.bdev);
 318         struct amdgpu_mn *rmn;
 319         struct amdgpu_mn_node *node = NULL;
 320         struct list_head bos;
 321         struct interval_tree_node *it;
 322
 323         rmn = amdgpu_mn_get(adev);
 324         if (IS_ERR(rmn))
 325                 return PTR_ERR(rmn);
 326
 327         INIT_LIST_HEAD(&bos);
 328
 329         down_write(&rmn->lock);
 330
 331         while ((it = interval_tree_iter_first(&rmn->objects, addr, end))) {
 332                 kfree(node);
 333                 node = container_of(it, struct amdgpu_mn_node, it);
 334                 interval_tree_remove(&node->it, &rmn->objects);
 335                 addr = min(it->start, addr);
 336                 end = max(it->last, end);
 337                 list_splice(&node->bos, &bos);
 338         }
 339
 340         if (!node) {
 341                 node = kmalloc(sizeof(struct amdgpu_mn_node), GFP_KERNEL);
 342                 if (!node) {
 343                         up_write(&rmn->lock);
 344                         return -ENOMEM;
 345                 }
 346         }
 347
 348         bo->mn = rmn;
 349
 350         node->it.start = addr;
 351         node->it.last = end;
 352         INIT_LIST_HEAD(&node->bos);
 353         list_splice(&bos, &node->bos);
 354         list_add(&bo->mn_list, &node->bos);
 355
 356         interval_tree_insert(&node->it, &rmn->objects);
 357
 358         up_write(&rmn->lock);
 359
 360         return 0;
 361 }
 362
 363 /**
 364  * amdgpu_mn_unregister - unregister a BO for notifier updates
 365  *
 366  * @bo: amdgpu buffer object
 367  *
 368  * Remove any registration of MMU notifier updates from the buffer object.
 369  */
 370 void amdgpu_mn_unregister(struct amdgpu_bo *bo)
 371 {
 372         struct amdgpu_device *adev = amdgpu_ttm_adev(bo->tbo.bdev);
 373         struct amdgpu_mn *rmn;
 374         struct list_head *head;
 375
 376         mutex_lock(&adev->mn_lock);
 377
 378         rmn = bo->mn;
 379         if (rmn == NULL) {
 380                 mutex_unlock(&adev->mn_lock);
 381                 return;
 382         }
 383
 384         down_write(&rmn->lock);
 385
 386         /* save the next list entry for later */
 387         head = bo->mn_list.next;
 388
 389         bo->mn = NULL;
 390         list_del_init(&bo->mn_list);
 391
 392         if (list_empty(head)) {
 393                 struct amdgpu_mn_node *node;
 394                 node = container_of(head, struct amdgpu_mn_node, bos);
 395                 interval_tree_remove(&node->it, &rmn->objects);
 396                 kfree(node);
 397         }
 398
 399         up_write(&rmn->lock);
 400         mutex_unlock(&adev->mn_lock);
 401 }
 402