1*145eba1aSCai Huoqing // SPDX-License-Identifier: GPL-2.0 or BSD-3-Clause 2f48ad614SDennis Dalessandro /* 33d2a9d64SDennis Dalessandro * Copyright(c) 2020 Cornelis Networks, Inc. 434ab4de7SMichael J. Ruhl * Copyright(c) 2016 - 2017 Intel Corporation. 5f48ad614SDennis Dalessandro */ 6*145eba1aSCai Huoqing 7f48ad614SDennis Dalessandro #include <linux/list.h> 8f48ad614SDennis Dalessandro #include <linux/rculist.h> 9f48ad614SDennis Dalessandro #include <linux/mmu_notifier.h> 10f48ad614SDennis Dalessandro #include <linux/interval_tree_generic.h> 113d2a9d64SDennis Dalessandro #include <linux/sched/mm.h> 12f48ad614SDennis Dalessandro 13f48ad614SDennis Dalessandro #include "mmu_rb.h" 14f48ad614SDennis Dalessandro #include "trace.h" 15f48ad614SDennis Dalessandro 16f48ad614SDennis Dalessandro static unsigned long mmu_node_start(struct mmu_rb_node *); 17f48ad614SDennis Dalessandro static unsigned long mmu_node_last(struct mmu_rb_node *); 1893065ac7SMichal Hocko static int mmu_notifier_range_start(struct mmu_notifier *, 195d6527a7SJérôme Glisse const struct mmu_notifier_range *); 20f48ad614SDennis Dalessandro static struct mmu_rb_node *__mmu_rb_search(struct mmu_rb_handler *, 21f48ad614SDennis Dalessandro unsigned long, unsigned long); 22b85ced91SDean Luick static void do_remove(struct mmu_rb_handler *handler, 23b85ced91SDean Luick struct list_head *del_list); 24b85ced91SDean Luick static void handle_remove(struct work_struct *work); 25f48ad614SDennis Dalessandro 260fc859a6SBhumika Goyal static const struct mmu_notifier_ops mn_opts = { 27f48ad614SDennis Dalessandro .invalidate_range_start = mmu_notifier_range_start, 28f48ad614SDennis Dalessandro }; 29f48ad614SDennis Dalessandro 30f48ad614SDennis Dalessandro INTERVAL_TREE_DEFINE(struct mmu_rb_node, node, unsigned long, __last, 31f48ad614SDennis Dalessandro mmu_node_start, mmu_node_last, static, __mmu_int_rb); 32f48ad614SDennis Dalessandro 33f48ad614SDennis Dalessandro static unsigned long mmu_node_start(struct mmu_rb_node *node) 34f48ad614SDennis Dalessandro { 35f48ad614SDennis Dalessandro return node->addr & PAGE_MASK; 36f48ad614SDennis Dalessandro } 37f48ad614SDennis Dalessandro 38f48ad614SDennis Dalessandro static unsigned long mmu_node_last(struct mmu_rb_node *node) 39f48ad614SDennis Dalessandro { 40f48ad614SDennis Dalessandro return PAGE_ALIGN(node->addr + node->len) - 1; 41f48ad614SDennis Dalessandro } 42f48ad614SDennis Dalessandro 433d2a9d64SDennis Dalessandro int hfi1_mmu_rb_register(void *ops_arg, 44e0b09ac5SDean Luick struct mmu_rb_ops *ops, 45b85ced91SDean Luick struct workqueue_struct *wq, 46e0b09ac5SDean Luick struct mmu_rb_handler **handler) 47f48ad614SDennis Dalessandro { 483d2a9d64SDennis Dalessandro struct mmu_rb_handler *h; 493faa3d9aSIra Weiny int ret; 50f48ad614SDennis Dalessandro 51ca5f7256SMike Marciniszyn h = kzalloc(sizeof(*h), GFP_KERNEL); 523d2a9d64SDennis Dalessandro if (!h) 53f48ad614SDennis Dalessandro return -ENOMEM; 54f48ad614SDennis Dalessandro 553d2a9d64SDennis Dalessandro h->root = RB_ROOT_CACHED; 563d2a9d64SDennis Dalessandro h->ops = ops; 573d2a9d64SDennis Dalessandro h->ops_arg = ops_arg; 583d2a9d64SDennis Dalessandro INIT_HLIST_NODE(&h->mn.hlist); 593d2a9d64SDennis Dalessandro spin_lock_init(&h->lock); 603d2a9d64SDennis Dalessandro h->mn.ops = &mn_opts; 613d2a9d64SDennis Dalessandro INIT_WORK(&h->del_work, handle_remove); 623d2a9d64SDennis Dalessandro INIT_LIST_HEAD(&h->del_list); 633d2a9d64SDennis Dalessandro INIT_LIST_HEAD(&h->lru_list); 643d2a9d64SDennis Dalessandro h->wq = wq; 653faa3d9aSIra Weiny 663d2a9d64SDennis Dalessandro ret = mmu_notifier_register(&h->mn, current->mm); 673faa3d9aSIra Weiny if (ret) { 683d2a9d64SDennis Dalessandro kfree(h); 693faa3d9aSIra Weiny return ret; 703faa3d9aSIra Weiny } 713faa3d9aSIra Weiny 723d2a9d64SDennis Dalessandro *handler = h; 73e0b09ac5SDean Luick return 0; 74f48ad614SDennis Dalessandro } 75f48ad614SDennis Dalessandro 76e0b09ac5SDean Luick void hfi1_mmu_rb_unregister(struct mmu_rb_handler *handler) 77f48ad614SDennis Dalessandro { 7820a42d08SDean Luick struct mmu_rb_node *rbnode; 7920a42d08SDean Luick struct rb_node *node; 80f48ad614SDennis Dalessandro unsigned long flags; 81b85ced91SDean Luick struct list_head del_list; 82f48ad614SDennis Dalessandro 83f48ad614SDennis Dalessandro /* Unregister first so we don't get any more notifications. */ 843d2a9d64SDennis Dalessandro mmu_notifier_unregister(&handler->mn, handler->mn.mm); 85f48ad614SDennis Dalessandro 86b85ced91SDean Luick /* 87b85ced91SDean Luick * Make sure the wq delete handler is finished running. It will not 88b85ced91SDean Luick * be triggered once the mmu notifiers are unregistered above. 89b85ced91SDean Luick */ 90b85ced91SDean Luick flush_work(&handler->del_work); 91b85ced91SDean Luick 92b85ced91SDean Luick INIT_LIST_HEAD(&del_list); 93b85ced91SDean Luick 94f48ad614SDennis Dalessandro spin_lock_irqsave(&handler->lock, flags); 95f808c13fSDavidlohr Bueso while ((node = rb_first_cached(&handler->root))) { 96f48ad614SDennis Dalessandro rbnode = rb_entry(node, struct mmu_rb_node, node); 97f808c13fSDavidlohr Bueso rb_erase_cached(node, &handler->root); 980636e9abSDean Luick /* move from LRU list to delete list */ 990636e9abSDean Luick list_move(&rbnode->list, &del_list); 100f48ad614SDennis Dalessandro } 101f48ad614SDennis Dalessandro spin_unlock_irqrestore(&handler->lock, flags); 102f48ad614SDennis Dalessandro 103b85ced91SDean Luick do_remove(handler, &del_list); 104b85ced91SDean Luick 105f48ad614SDennis Dalessandro kfree(handler); 106f48ad614SDennis Dalessandro } 107f48ad614SDennis Dalessandro 108e0b09ac5SDean Luick int hfi1_mmu_rb_insert(struct mmu_rb_handler *handler, 109e0b09ac5SDean Luick struct mmu_rb_node *mnode) 110f48ad614SDennis Dalessandro { 111f48ad614SDennis Dalessandro struct mmu_rb_node *node; 112f48ad614SDennis Dalessandro unsigned long flags; 113f48ad614SDennis Dalessandro int ret = 0; 114f48ad614SDennis Dalessandro 11534ab4de7SMichael J. Ruhl trace_hfi1_mmu_rb_insert(mnode->addr, mnode->len); 1163d2a9d64SDennis Dalessandro 1173d2a9d64SDennis Dalessandro if (current->mm != handler->mn.mm) 1183d2a9d64SDennis Dalessandro return -EPERM; 1193d2a9d64SDennis Dalessandro 120f48ad614SDennis Dalessandro spin_lock_irqsave(&handler->lock, flags); 121f48ad614SDennis Dalessandro node = __mmu_rb_search(handler, mnode->addr, mnode->len); 122f48ad614SDennis Dalessandro if (node) { 123f48ad614SDennis Dalessandro ret = -EINVAL; 124f48ad614SDennis Dalessandro goto unlock; 125f48ad614SDennis Dalessandro } 126e0b09ac5SDean Luick __mmu_int_rb_insert(mnode, &handler->root); 1270636e9abSDean Luick list_add(&mnode->list, &handler->lru_list); 128f48ad614SDennis Dalessandro 129e0b09ac5SDean Luick ret = handler->ops->insert(handler->ops_arg, mnode); 1300636e9abSDean Luick if (ret) { 131e0b09ac5SDean Luick __mmu_int_rb_remove(mnode, &handler->root); 1320636e9abSDean Luick list_del(&mnode->list); /* remove from LRU list */ 1330636e9abSDean Luick } 1343d2a9d64SDennis Dalessandro mnode->handler = handler; 135f48ad614SDennis Dalessandro unlock: 136f48ad614SDennis Dalessandro spin_unlock_irqrestore(&handler->lock, flags); 137f48ad614SDennis Dalessandro return ret; 138f48ad614SDennis Dalessandro } 139f48ad614SDennis Dalessandro 140f48ad614SDennis Dalessandro /* Caller must hold handler lock */ 141f48ad614SDennis Dalessandro static struct mmu_rb_node *__mmu_rb_search(struct mmu_rb_handler *handler, 142f48ad614SDennis Dalessandro unsigned long addr, 143f48ad614SDennis Dalessandro unsigned long len) 144f48ad614SDennis Dalessandro { 145f48ad614SDennis Dalessandro struct mmu_rb_node *node = NULL; 146f48ad614SDennis Dalessandro 14734ab4de7SMichael J. Ruhl trace_hfi1_mmu_rb_search(addr, len); 148f48ad614SDennis Dalessandro if (!handler->ops->filter) { 149e0b09ac5SDean Luick node = __mmu_int_rb_iter_first(&handler->root, addr, 150f48ad614SDennis Dalessandro (addr + len) - 1); 151f48ad614SDennis Dalessandro } else { 152e0b09ac5SDean Luick for (node = __mmu_int_rb_iter_first(&handler->root, addr, 153f48ad614SDennis Dalessandro (addr + len) - 1); 154f48ad614SDennis Dalessandro node; 155f48ad614SDennis Dalessandro node = __mmu_int_rb_iter_next(node, addr, 156f48ad614SDennis Dalessandro (addr + len) - 1)) { 157f48ad614SDennis Dalessandro if (handler->ops->filter(node, addr, len)) 158f48ad614SDennis Dalessandro return node; 159f48ad614SDennis Dalessandro } 160f48ad614SDennis Dalessandro } 161f48ad614SDennis Dalessandro return node; 162f48ad614SDennis Dalessandro } 163f48ad614SDennis Dalessandro 1647be85676SSebastian Sanchez bool hfi1_mmu_rb_remove_unless_exact(struct mmu_rb_handler *handler, 1657be85676SSebastian Sanchez unsigned long addr, unsigned long len, 1667be85676SSebastian Sanchez struct mmu_rb_node **rb_node) 167f48ad614SDennis Dalessandro { 168f48ad614SDennis Dalessandro struct mmu_rb_node *node; 169f48ad614SDennis Dalessandro unsigned long flags; 1707be85676SSebastian Sanchez bool ret = false; 171f48ad614SDennis Dalessandro 1723d2a9d64SDennis Dalessandro if (current->mm != handler->mn.mm) 1733d2a9d64SDennis Dalessandro return ret; 1743d2a9d64SDennis Dalessandro 175f48ad614SDennis Dalessandro spin_lock_irqsave(&handler->lock, flags); 176f48ad614SDennis Dalessandro node = __mmu_rb_search(handler, addr, len); 1770636e9abSDean Luick if (node) { 1787be85676SSebastian Sanchez if (node->addr == addr && node->len == len) 1797be85676SSebastian Sanchez goto unlock; 180e0b09ac5SDean Luick __mmu_int_rb_remove(node, &handler->root); 1810636e9abSDean Luick list_del(&node->list); /* remove from LRU list */ 1827be85676SSebastian Sanchez ret = true; 1830636e9abSDean Luick } 1847be85676SSebastian Sanchez unlock: 185f48ad614SDennis Dalessandro spin_unlock_irqrestore(&handler->lock, flags); 1867be85676SSebastian Sanchez *rb_node = node; 1877be85676SSebastian Sanchez return ret; 188f48ad614SDennis Dalessandro } 189f48ad614SDennis Dalessandro 19010345998SDean Luick void hfi1_mmu_rb_evict(struct mmu_rb_handler *handler, void *evict_arg) 19110345998SDean Luick { 1920636e9abSDean Luick struct mmu_rb_node *rbnode, *ptr; 19310345998SDean Luick struct list_head del_list; 19410345998SDean Luick unsigned long flags; 19510345998SDean Luick bool stop = false; 19610345998SDean Luick 1973d2a9d64SDennis Dalessandro if (current->mm != handler->mn.mm) 1983d2a9d64SDennis Dalessandro return; 1993d2a9d64SDennis Dalessandro 20010345998SDean Luick INIT_LIST_HEAD(&del_list); 20110345998SDean Luick 20210345998SDean Luick spin_lock_irqsave(&handler->lock, flags); 2030636e9abSDean Luick list_for_each_entry_safe_reverse(rbnode, ptr, &handler->lru_list, 2040636e9abSDean Luick list) { 20510345998SDean Luick if (handler->ops->evict(handler->ops_arg, rbnode, evict_arg, 20610345998SDean Luick &stop)) { 20710345998SDean Luick __mmu_int_rb_remove(rbnode, &handler->root); 2080636e9abSDean Luick /* move from LRU list to delete list */ 2090636e9abSDean Luick list_move(&rbnode->list, &del_list); 21010345998SDean Luick } 21110345998SDean Luick if (stop) 21210345998SDean Luick break; 21310345998SDean Luick } 21410345998SDean Luick spin_unlock_irqrestore(&handler->lock, flags); 21510345998SDean Luick 21610345998SDean Luick while (!list_empty(&del_list)) { 21710345998SDean Luick rbnode = list_first_entry(&del_list, struct mmu_rb_node, list); 21810345998SDean Luick list_del(&rbnode->list); 219082b3532SDean Luick handler->ops->remove(handler->ops_arg, rbnode); 22010345998SDean Luick } 22110345998SDean Luick } 22210345998SDean Luick 223b85ced91SDean Luick /* 224b85ced91SDean Luick * It is up to the caller to ensure that this function does not race with the 225b85ced91SDean Luick * mmu invalidate notifier which may be calling the users remove callback on 226b85ced91SDean Luick * 'node'. 227b85ced91SDean Luick */ 228e0b09ac5SDean Luick void hfi1_mmu_rb_remove(struct mmu_rb_handler *handler, 229e0b09ac5SDean Luick struct mmu_rb_node *node) 230f48ad614SDennis Dalessandro { 2313c1091aaSIra Weiny unsigned long flags; 232f48ad614SDennis Dalessandro 2333d2a9d64SDennis Dalessandro if (current->mm != handler->mn.mm) 2343d2a9d64SDennis Dalessandro return; 2353d2a9d64SDennis Dalessandro 2363c1091aaSIra Weiny /* Validity of handler and node pointers has been checked by caller. */ 23734ab4de7SMichael J. Ruhl trace_hfi1_mmu_rb_remove(node->addr, node->len); 2383c1091aaSIra Weiny spin_lock_irqsave(&handler->lock, flags); 239e0b09ac5SDean Luick __mmu_int_rb_remove(node, &handler->root); 2400636e9abSDean Luick list_del(&node->list); /* remove from LRU list */ 2413c1091aaSIra Weiny spin_unlock_irqrestore(&handler->lock, flags); 2423c1091aaSIra Weiny 243082b3532SDean Luick handler->ops->remove(handler->ops_arg, node); 244f48ad614SDennis Dalessandro } 245f48ad614SDennis Dalessandro 24693065ac7SMichal Hocko static int mmu_notifier_range_start(struct mmu_notifier *mn, 2475d6527a7SJérôme Glisse const struct mmu_notifier_range *range) 248f48ad614SDennis Dalessandro { 249f48ad614SDennis Dalessandro struct mmu_rb_handler *handler = 250f48ad614SDennis Dalessandro container_of(mn, struct mmu_rb_handler, mn); 251f808c13fSDavidlohr Bueso struct rb_root_cached *root = &handler->root; 252f48ad614SDennis Dalessandro struct mmu_rb_node *node, *ptr = NULL; 253f48ad614SDennis Dalessandro unsigned long flags; 254b85ced91SDean Luick bool added = false; 255f48ad614SDennis Dalessandro 256f48ad614SDennis Dalessandro spin_lock_irqsave(&handler->lock, flags); 2575d6527a7SJérôme Glisse for (node = __mmu_int_rb_iter_first(root, range->start, range->end-1); 258f48ad614SDennis Dalessandro node; node = ptr) { 259f48ad614SDennis Dalessandro /* Guard against node removal. */ 2605d6527a7SJérôme Glisse ptr = __mmu_int_rb_iter_next(node, range->start, 2615d6527a7SJérôme Glisse range->end - 1); 26234ab4de7SMichael J. Ruhl trace_hfi1_mmu_mem_invalidate(node->addr, node->len); 263e0b09ac5SDean Luick if (handler->ops->invalidate(handler->ops_arg, node)) { 264f48ad614SDennis Dalessandro __mmu_int_rb_remove(node, root); 2650636e9abSDean Luick /* move from LRU list to delete list */ 2660636e9abSDean Luick list_move(&node->list, &handler->del_list); 267b85ced91SDean Luick added = true; 268f48ad614SDennis Dalessandro } 269f48ad614SDennis Dalessandro } 270f48ad614SDennis Dalessandro spin_unlock_irqrestore(&handler->lock, flags); 271b85ced91SDean Luick 272b85ced91SDean Luick if (added) 273b85ced91SDean Luick queue_work(handler->wq, &handler->del_work); 27493065ac7SMichal Hocko 27593065ac7SMichal Hocko return 0; 276b85ced91SDean Luick } 277b85ced91SDean Luick 278b85ced91SDean Luick /* 279b85ced91SDean Luick * Call the remove function for the given handler and the list. This 280b85ced91SDean Luick * is expected to be called with a delete list extracted from handler. 281b85ced91SDean Luick * The caller should not be holding the handler lock. 282b85ced91SDean Luick */ 283b85ced91SDean Luick static void do_remove(struct mmu_rb_handler *handler, 284b85ced91SDean Luick struct list_head *del_list) 285b85ced91SDean Luick { 286b85ced91SDean Luick struct mmu_rb_node *node; 287b85ced91SDean Luick 288b85ced91SDean Luick while (!list_empty(del_list)) { 289b85ced91SDean Luick node = list_first_entry(del_list, struct mmu_rb_node, list); 290b85ced91SDean Luick list_del(&node->list); 291082b3532SDean Luick handler->ops->remove(handler->ops_arg, node); 292b85ced91SDean Luick } 293b85ced91SDean Luick } 294b85ced91SDean Luick 295b85ced91SDean Luick /* 296b85ced91SDean Luick * Work queue function to remove all nodes that have been queued up to 297c1e8d7c6SMichel Lespinasse * be removed. The key feature is that mm->mmap_lock is not being held 298b85ced91SDean Luick * and the remove callback can sleep while taking it, if needed. 299b85ced91SDean Luick */ 300b85ced91SDean Luick static void handle_remove(struct work_struct *work) 301b85ced91SDean Luick { 302b85ced91SDean Luick struct mmu_rb_handler *handler = container_of(work, 303b85ced91SDean Luick struct mmu_rb_handler, 304b85ced91SDean Luick del_work); 305b85ced91SDean Luick struct list_head del_list; 306b85ced91SDean Luick unsigned long flags; 307b85ced91SDean Luick 308b85ced91SDean Luick /* remove anything that is queued to get removed */ 309b85ced91SDean Luick spin_lock_irqsave(&handler->lock, flags); 310b85ced91SDean Luick list_replace_init(&handler->del_list, &del_list); 311b85ced91SDean Luick spin_unlock_irqrestore(&handler->lock, flags); 312b85ced91SDean Luick 313b85ced91SDean Luick do_remove(handler, &del_list); 314f48ad614SDennis Dalessandro } 315