1f48ad614SDennis Dalessandro /* 234ab4de7SMichael J. Ruhl * Copyright(c) 2016 - 2017 Intel Corporation. 3f48ad614SDennis Dalessandro * 4f48ad614SDennis Dalessandro * This file is provided under a dual BSD/GPLv2 license. When using or 5f48ad614SDennis Dalessandro * redistributing this file, you may do so under either license. 6f48ad614SDennis Dalessandro * 7f48ad614SDennis Dalessandro * GPL LICENSE SUMMARY 8f48ad614SDennis Dalessandro * 9f48ad614SDennis Dalessandro * This program is free software; you can redistribute it and/or modify 10f48ad614SDennis Dalessandro * it under the terms of version 2 of the GNU General Public License as 11f48ad614SDennis Dalessandro * published by the Free Software Foundation. 12f48ad614SDennis Dalessandro * 13f48ad614SDennis Dalessandro * This program is distributed in the hope that it will be useful, but 14f48ad614SDennis Dalessandro * WITHOUT ANY WARRANTY; without even the implied warranty of 15f48ad614SDennis Dalessandro * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 16f48ad614SDennis Dalessandro * General Public License for more details. 17f48ad614SDennis Dalessandro * 18f48ad614SDennis Dalessandro * BSD LICENSE 19f48ad614SDennis Dalessandro * 20f48ad614SDennis Dalessandro * Redistribution and use in source and binary forms, with or without 21f48ad614SDennis Dalessandro * modification, are permitted provided that the following conditions 22f48ad614SDennis Dalessandro * are met: 23f48ad614SDennis Dalessandro * 24f48ad614SDennis Dalessandro * - Redistributions of source code must retain the above copyright 25f48ad614SDennis Dalessandro * notice, this list of conditions and the following disclaimer. 26f48ad614SDennis Dalessandro * - Redistributions in binary form must reproduce the above copyright 27f48ad614SDennis Dalessandro * notice, this list of conditions and the following disclaimer in 28f48ad614SDennis Dalessandro * the documentation and/or other materials provided with the 29f48ad614SDennis Dalessandro * distribution. 30f48ad614SDennis Dalessandro * - Neither the name of Intel Corporation nor the names of its 31f48ad614SDennis Dalessandro * contributors may be used to endorse or promote products derived 32f48ad614SDennis Dalessandro * from this software without specific prior written permission. 33f48ad614SDennis Dalessandro * 34f48ad614SDennis Dalessandro * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 35f48ad614SDennis Dalessandro * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 36f48ad614SDennis Dalessandro * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 37f48ad614SDennis Dalessandro * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT 38f48ad614SDennis Dalessandro * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 39f48ad614SDennis Dalessandro * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 40f48ad614SDennis Dalessandro * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 41f48ad614SDennis Dalessandro * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 42f48ad614SDennis Dalessandro * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 43f48ad614SDennis Dalessandro * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 44f48ad614SDennis Dalessandro * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 45f48ad614SDennis Dalessandro * 46f48ad614SDennis Dalessandro */ 47f48ad614SDennis Dalessandro #include <linux/list.h> 48f48ad614SDennis Dalessandro #include <linux/rculist.h> 49f48ad614SDennis Dalessandro #include <linux/mmu_notifier.h> 50f48ad614SDennis Dalessandro #include <linux/interval_tree_generic.h> 51f48ad614SDennis Dalessandro 52f48ad614SDennis Dalessandro #include "mmu_rb.h" 53f48ad614SDennis Dalessandro #include "trace.h" 54f48ad614SDennis Dalessandro 55f48ad614SDennis Dalessandro struct mmu_rb_handler { 56f48ad614SDennis Dalessandro struct mmu_notifier mn; 57f808c13fSDavidlohr Bueso struct rb_root_cached root; 58e0b09ac5SDean Luick void *ops_arg; 59f48ad614SDennis Dalessandro spinlock_t lock; /* protect the RB tree */ 60f48ad614SDennis Dalessandro struct mmu_rb_ops *ops; 613faa3d9aSIra Weiny struct mm_struct *mm; 620636e9abSDean Luick struct list_head lru_list; 63b85ced91SDean Luick struct work_struct del_work; 64b85ced91SDean Luick struct list_head del_list; 65b85ced91SDean Luick struct workqueue_struct *wq; 66f48ad614SDennis Dalessandro }; 67f48ad614SDennis Dalessandro 68f48ad614SDennis Dalessandro static unsigned long mmu_node_start(struct mmu_rb_node *); 69f48ad614SDennis Dalessandro static unsigned long mmu_node_last(struct mmu_rb_node *); 7093065ac7SMichal Hocko static int mmu_notifier_range_start(struct mmu_notifier *, 715d6527a7SJérôme Glisse const struct mmu_notifier_range *); 72f48ad614SDennis Dalessandro static struct mmu_rb_node *__mmu_rb_search(struct mmu_rb_handler *, 73f48ad614SDennis Dalessandro unsigned long, unsigned long); 74b85ced91SDean Luick static void do_remove(struct mmu_rb_handler *handler, 75b85ced91SDean Luick struct list_head *del_list); 76b85ced91SDean Luick static void handle_remove(struct work_struct *work); 77f48ad614SDennis Dalessandro 780fc859a6SBhumika Goyal static const struct mmu_notifier_ops mn_opts = { 79f48ad614SDennis Dalessandro .invalidate_range_start = mmu_notifier_range_start, 80f48ad614SDennis Dalessandro }; 81f48ad614SDennis Dalessandro 82f48ad614SDennis Dalessandro INTERVAL_TREE_DEFINE(struct mmu_rb_node, node, unsigned long, __last, 83f48ad614SDennis Dalessandro mmu_node_start, mmu_node_last, static, __mmu_int_rb); 84f48ad614SDennis Dalessandro 85f48ad614SDennis Dalessandro static unsigned long mmu_node_start(struct mmu_rb_node *node) 86f48ad614SDennis Dalessandro { 87f48ad614SDennis Dalessandro return node->addr & PAGE_MASK; 88f48ad614SDennis Dalessandro } 89f48ad614SDennis Dalessandro 90f48ad614SDennis Dalessandro static unsigned long mmu_node_last(struct mmu_rb_node *node) 91f48ad614SDennis Dalessandro { 92f48ad614SDennis Dalessandro return PAGE_ALIGN(node->addr + node->len) - 1; 93f48ad614SDennis Dalessandro } 94f48ad614SDennis Dalessandro 95e0b09ac5SDean Luick int hfi1_mmu_rb_register(void *ops_arg, struct mm_struct *mm, 96e0b09ac5SDean Luick struct mmu_rb_ops *ops, 97b85ced91SDean Luick struct workqueue_struct *wq, 98e0b09ac5SDean Luick struct mmu_rb_handler **handler) 99f48ad614SDennis Dalessandro { 100f48ad614SDennis Dalessandro struct mmu_rb_handler *handlr; 1013faa3d9aSIra Weiny int ret; 102f48ad614SDennis Dalessandro 103f48ad614SDennis Dalessandro handlr = kmalloc(sizeof(*handlr), GFP_KERNEL); 104f48ad614SDennis Dalessandro if (!handlr) 105f48ad614SDennis Dalessandro return -ENOMEM; 106f48ad614SDennis Dalessandro 107f808c13fSDavidlohr Bueso handlr->root = RB_ROOT_CACHED; 108f48ad614SDennis Dalessandro handlr->ops = ops; 109e0b09ac5SDean Luick handlr->ops_arg = ops_arg; 110f48ad614SDennis Dalessandro INIT_HLIST_NODE(&handlr->mn.hlist); 111f48ad614SDennis Dalessandro spin_lock_init(&handlr->lock); 112f48ad614SDennis Dalessandro handlr->mn.ops = &mn_opts; 1133faa3d9aSIra Weiny handlr->mm = mm; 114b85ced91SDean Luick INIT_WORK(&handlr->del_work, handle_remove); 115b85ced91SDean Luick INIT_LIST_HEAD(&handlr->del_list); 1160636e9abSDean Luick INIT_LIST_HEAD(&handlr->lru_list); 117b85ced91SDean Luick handlr->wq = wq; 1183faa3d9aSIra Weiny 1193faa3d9aSIra Weiny ret = mmu_notifier_register(&handlr->mn, handlr->mm); 1203faa3d9aSIra Weiny if (ret) { 1213faa3d9aSIra Weiny kfree(handlr); 1223faa3d9aSIra Weiny return ret; 1233faa3d9aSIra Weiny } 1243faa3d9aSIra Weiny 125e0b09ac5SDean Luick *handler = handlr; 126e0b09ac5SDean Luick return 0; 127f48ad614SDennis Dalessandro } 128f48ad614SDennis Dalessandro 129e0b09ac5SDean Luick void hfi1_mmu_rb_unregister(struct mmu_rb_handler *handler) 130f48ad614SDennis Dalessandro { 13120a42d08SDean Luick struct mmu_rb_node *rbnode; 13220a42d08SDean Luick struct rb_node *node; 133f48ad614SDennis Dalessandro unsigned long flags; 134b85ced91SDean Luick struct list_head del_list; 135f48ad614SDennis Dalessandro 136f48ad614SDennis Dalessandro /* Unregister first so we don't get any more notifications. */ 1373faa3d9aSIra Weiny mmu_notifier_unregister(&handler->mn, handler->mm); 138f48ad614SDennis Dalessandro 139b85ced91SDean Luick /* 140b85ced91SDean Luick * Make sure the wq delete handler is finished running. It will not 141b85ced91SDean Luick * be triggered once the mmu notifiers are unregistered above. 142b85ced91SDean Luick */ 143b85ced91SDean Luick flush_work(&handler->del_work); 144b85ced91SDean Luick 145b85ced91SDean Luick INIT_LIST_HEAD(&del_list); 146b85ced91SDean Luick 147f48ad614SDennis Dalessandro spin_lock_irqsave(&handler->lock, flags); 148f808c13fSDavidlohr Bueso while ((node = rb_first_cached(&handler->root))) { 149f48ad614SDennis Dalessandro rbnode = rb_entry(node, struct mmu_rb_node, node); 150f808c13fSDavidlohr Bueso rb_erase_cached(node, &handler->root); 1510636e9abSDean Luick /* move from LRU list to delete list */ 1520636e9abSDean Luick list_move(&rbnode->list, &del_list); 153f48ad614SDennis Dalessandro } 154f48ad614SDennis Dalessandro spin_unlock_irqrestore(&handler->lock, flags); 155f48ad614SDennis Dalessandro 156b85ced91SDean Luick do_remove(handler, &del_list); 157b85ced91SDean Luick 158f48ad614SDennis Dalessandro kfree(handler); 159f48ad614SDennis Dalessandro } 160f48ad614SDennis Dalessandro 161e0b09ac5SDean Luick int hfi1_mmu_rb_insert(struct mmu_rb_handler *handler, 162e0b09ac5SDean Luick struct mmu_rb_node *mnode) 163f48ad614SDennis Dalessandro { 164f48ad614SDennis Dalessandro struct mmu_rb_node *node; 165f48ad614SDennis Dalessandro unsigned long flags; 166f48ad614SDennis Dalessandro int ret = 0; 167f48ad614SDennis Dalessandro 16834ab4de7SMichael J. Ruhl trace_hfi1_mmu_rb_insert(mnode->addr, mnode->len); 169f48ad614SDennis Dalessandro spin_lock_irqsave(&handler->lock, flags); 170f48ad614SDennis Dalessandro node = __mmu_rb_search(handler, mnode->addr, mnode->len); 171f48ad614SDennis Dalessandro if (node) { 172f48ad614SDennis Dalessandro ret = -EINVAL; 173f48ad614SDennis Dalessandro goto unlock; 174f48ad614SDennis Dalessandro } 175e0b09ac5SDean Luick __mmu_int_rb_insert(mnode, &handler->root); 1760636e9abSDean Luick list_add(&mnode->list, &handler->lru_list); 177f48ad614SDennis Dalessandro 178e0b09ac5SDean Luick ret = handler->ops->insert(handler->ops_arg, mnode); 1790636e9abSDean Luick if (ret) { 180e0b09ac5SDean Luick __mmu_int_rb_remove(mnode, &handler->root); 1810636e9abSDean Luick list_del(&mnode->list); /* remove from LRU list */ 1820636e9abSDean Luick } 183f48ad614SDennis Dalessandro unlock: 184f48ad614SDennis Dalessandro spin_unlock_irqrestore(&handler->lock, flags); 185f48ad614SDennis Dalessandro return ret; 186f48ad614SDennis Dalessandro } 187f48ad614SDennis Dalessandro 188f48ad614SDennis Dalessandro /* Caller must hold handler lock */ 189f48ad614SDennis Dalessandro static struct mmu_rb_node *__mmu_rb_search(struct mmu_rb_handler *handler, 190f48ad614SDennis Dalessandro unsigned long addr, 191f48ad614SDennis Dalessandro unsigned long len) 192f48ad614SDennis Dalessandro { 193f48ad614SDennis Dalessandro struct mmu_rb_node *node = NULL; 194f48ad614SDennis Dalessandro 19534ab4de7SMichael J. Ruhl trace_hfi1_mmu_rb_search(addr, len); 196f48ad614SDennis Dalessandro if (!handler->ops->filter) { 197e0b09ac5SDean Luick node = __mmu_int_rb_iter_first(&handler->root, addr, 198f48ad614SDennis Dalessandro (addr + len) - 1); 199f48ad614SDennis Dalessandro } else { 200e0b09ac5SDean Luick for (node = __mmu_int_rb_iter_first(&handler->root, addr, 201f48ad614SDennis Dalessandro (addr + len) - 1); 202f48ad614SDennis Dalessandro node; 203f48ad614SDennis Dalessandro node = __mmu_int_rb_iter_next(node, addr, 204f48ad614SDennis Dalessandro (addr + len) - 1)) { 205f48ad614SDennis Dalessandro if (handler->ops->filter(node, addr, len)) 206f48ad614SDennis Dalessandro return node; 207f48ad614SDennis Dalessandro } 208f48ad614SDennis Dalessandro } 209f48ad614SDennis Dalessandro return node; 210f48ad614SDennis Dalessandro } 211f48ad614SDennis Dalessandro 2127be85676SSebastian Sanchez bool hfi1_mmu_rb_remove_unless_exact(struct mmu_rb_handler *handler, 2137be85676SSebastian Sanchez unsigned long addr, unsigned long len, 2147be85676SSebastian Sanchez struct mmu_rb_node **rb_node) 215f48ad614SDennis Dalessandro { 216f48ad614SDennis Dalessandro struct mmu_rb_node *node; 217f48ad614SDennis Dalessandro unsigned long flags; 2187be85676SSebastian Sanchez bool ret = false; 219f48ad614SDennis Dalessandro 220f48ad614SDennis Dalessandro spin_lock_irqsave(&handler->lock, flags); 221f48ad614SDennis Dalessandro node = __mmu_rb_search(handler, addr, len); 2220636e9abSDean Luick if (node) { 2237be85676SSebastian Sanchez if (node->addr == addr && node->len == len) 2247be85676SSebastian Sanchez goto unlock; 225e0b09ac5SDean Luick __mmu_int_rb_remove(node, &handler->root); 2260636e9abSDean Luick list_del(&node->list); /* remove from LRU list */ 2277be85676SSebastian Sanchez ret = true; 2280636e9abSDean Luick } 2297be85676SSebastian Sanchez unlock: 230f48ad614SDennis Dalessandro spin_unlock_irqrestore(&handler->lock, flags); 2317be85676SSebastian Sanchez *rb_node = node; 2327be85676SSebastian Sanchez return ret; 233f48ad614SDennis Dalessandro } 234f48ad614SDennis Dalessandro 23510345998SDean Luick void hfi1_mmu_rb_evict(struct mmu_rb_handler *handler, void *evict_arg) 23610345998SDean Luick { 2370636e9abSDean Luick struct mmu_rb_node *rbnode, *ptr; 23810345998SDean Luick struct list_head del_list; 23910345998SDean Luick unsigned long flags; 24010345998SDean Luick bool stop = false; 24110345998SDean Luick 24210345998SDean Luick INIT_LIST_HEAD(&del_list); 24310345998SDean Luick 24410345998SDean Luick spin_lock_irqsave(&handler->lock, flags); 2450636e9abSDean Luick list_for_each_entry_safe_reverse(rbnode, ptr, &handler->lru_list, 2460636e9abSDean Luick list) { 24710345998SDean Luick if (handler->ops->evict(handler->ops_arg, rbnode, evict_arg, 24810345998SDean Luick &stop)) { 24910345998SDean Luick __mmu_int_rb_remove(rbnode, &handler->root); 2500636e9abSDean Luick /* move from LRU list to delete list */ 2510636e9abSDean Luick list_move(&rbnode->list, &del_list); 25210345998SDean Luick } 25310345998SDean Luick if (stop) 25410345998SDean Luick break; 25510345998SDean Luick } 25610345998SDean Luick spin_unlock_irqrestore(&handler->lock, flags); 25710345998SDean Luick 25810345998SDean Luick while (!list_empty(&del_list)) { 25910345998SDean Luick rbnode = list_first_entry(&del_list, struct mmu_rb_node, list); 26010345998SDean Luick list_del(&rbnode->list); 261082b3532SDean Luick handler->ops->remove(handler->ops_arg, rbnode); 26210345998SDean Luick } 26310345998SDean Luick } 26410345998SDean Luick 265b85ced91SDean Luick /* 266b85ced91SDean Luick * It is up to the caller to ensure that this function does not race with the 267b85ced91SDean Luick * mmu invalidate notifier which may be calling the users remove callback on 268b85ced91SDean Luick * 'node'. 269b85ced91SDean Luick */ 270e0b09ac5SDean Luick void hfi1_mmu_rb_remove(struct mmu_rb_handler *handler, 271e0b09ac5SDean Luick struct mmu_rb_node *node) 272f48ad614SDennis Dalessandro { 2733c1091aaSIra Weiny unsigned long flags; 274f48ad614SDennis Dalessandro 2753c1091aaSIra Weiny /* Validity of handler and node pointers has been checked by caller. */ 27634ab4de7SMichael J. Ruhl trace_hfi1_mmu_rb_remove(node->addr, node->len); 2773c1091aaSIra Weiny spin_lock_irqsave(&handler->lock, flags); 278e0b09ac5SDean Luick __mmu_int_rb_remove(node, &handler->root); 2790636e9abSDean Luick list_del(&node->list); /* remove from LRU list */ 2803c1091aaSIra Weiny spin_unlock_irqrestore(&handler->lock, flags); 2813c1091aaSIra Weiny 282082b3532SDean Luick handler->ops->remove(handler->ops_arg, node); 283f48ad614SDennis Dalessandro } 284f48ad614SDennis Dalessandro 28593065ac7SMichal Hocko static int mmu_notifier_range_start(struct mmu_notifier *mn, 2865d6527a7SJérôme Glisse const struct mmu_notifier_range *range) 287f48ad614SDennis Dalessandro { 288f48ad614SDennis Dalessandro struct mmu_rb_handler *handler = 289f48ad614SDennis Dalessandro container_of(mn, struct mmu_rb_handler, mn); 290f808c13fSDavidlohr Bueso struct rb_root_cached *root = &handler->root; 291f48ad614SDennis Dalessandro struct mmu_rb_node *node, *ptr = NULL; 292f48ad614SDennis Dalessandro unsigned long flags; 293b85ced91SDean Luick bool added = false; 294f48ad614SDennis Dalessandro 295f48ad614SDennis Dalessandro spin_lock_irqsave(&handler->lock, flags); 2965d6527a7SJérôme Glisse for (node = __mmu_int_rb_iter_first(root, range->start, range->end-1); 297f48ad614SDennis Dalessandro node; node = ptr) { 298f48ad614SDennis Dalessandro /* Guard against node removal. */ 2995d6527a7SJérôme Glisse ptr = __mmu_int_rb_iter_next(node, range->start, 3005d6527a7SJérôme Glisse range->end - 1); 30134ab4de7SMichael J. Ruhl trace_hfi1_mmu_mem_invalidate(node->addr, node->len); 302e0b09ac5SDean Luick if (handler->ops->invalidate(handler->ops_arg, node)) { 303f48ad614SDennis Dalessandro __mmu_int_rb_remove(node, root); 3040636e9abSDean Luick /* move from LRU list to delete list */ 3050636e9abSDean Luick list_move(&node->list, &handler->del_list); 306b85ced91SDean Luick added = true; 307f48ad614SDennis Dalessandro } 308f48ad614SDennis Dalessandro } 309f48ad614SDennis Dalessandro spin_unlock_irqrestore(&handler->lock, flags); 310b85ced91SDean Luick 311b85ced91SDean Luick if (added) 312b85ced91SDean Luick queue_work(handler->wq, &handler->del_work); 31393065ac7SMichal Hocko 31493065ac7SMichal Hocko return 0; 315b85ced91SDean Luick } 316b85ced91SDean Luick 317b85ced91SDean Luick /* 318b85ced91SDean Luick * Call the remove function for the given handler and the list. This 319b85ced91SDean Luick * is expected to be called with a delete list extracted from handler. 320b85ced91SDean Luick * The caller should not be holding the handler lock. 321b85ced91SDean Luick */ 322b85ced91SDean Luick static void do_remove(struct mmu_rb_handler *handler, 323b85ced91SDean Luick struct list_head *del_list) 324b85ced91SDean Luick { 325b85ced91SDean Luick struct mmu_rb_node *node; 326b85ced91SDean Luick 327b85ced91SDean Luick while (!list_empty(del_list)) { 328b85ced91SDean Luick node = list_first_entry(del_list, struct mmu_rb_node, list); 329b85ced91SDean Luick list_del(&node->list); 330082b3532SDean Luick handler->ops->remove(handler->ops_arg, node); 331b85ced91SDean Luick } 332b85ced91SDean Luick } 333b85ced91SDean Luick 334b85ced91SDean Luick /* 335b85ced91SDean Luick * Work queue function to remove all nodes that have been queued up to 336*c1e8d7c6SMichel Lespinasse * be removed. The key feature is that mm->mmap_lock is not being held 337b85ced91SDean Luick * and the remove callback can sleep while taking it, if needed. 338b85ced91SDean Luick */ 339b85ced91SDean Luick static void handle_remove(struct work_struct *work) 340b85ced91SDean Luick { 341b85ced91SDean Luick struct mmu_rb_handler *handler = container_of(work, 342b85ced91SDean Luick struct mmu_rb_handler, 343b85ced91SDean Luick del_work); 344b85ced91SDean Luick struct list_head del_list; 345b85ced91SDean Luick unsigned long flags; 346b85ced91SDean Luick 347b85ced91SDean Luick /* remove anything that is queued to get removed */ 348b85ced91SDean Luick spin_lock_irqsave(&handler->lock, flags); 349b85ced91SDean Luick list_replace_init(&handler->del_list, &del_list); 350b85ced91SDean Luick spin_unlock_irqrestore(&handler->lock, flags); 351b85ced91SDean Luick 352b85ced91SDean Luick do_remove(handler, &del_list); 353f48ad614SDennis Dalessandro } 354