1f48ad614SDennis Dalessandro /* 234ab4de7SMichael J. Ruhl * Copyright(c) 2016 - 2017 Intel Corporation. 3f48ad614SDennis Dalessandro * 4f48ad614SDennis Dalessandro * This file is provided under a dual BSD/GPLv2 license. When using or 5f48ad614SDennis Dalessandro * redistributing this file, you may do so under either license. 6f48ad614SDennis Dalessandro * 7f48ad614SDennis Dalessandro * GPL LICENSE SUMMARY 8f48ad614SDennis Dalessandro * 9f48ad614SDennis Dalessandro * This program is free software; you can redistribute it and/or modify 10f48ad614SDennis Dalessandro * it under the terms of version 2 of the GNU General Public License as 11f48ad614SDennis Dalessandro * published by the Free Software Foundation. 12f48ad614SDennis Dalessandro * 13f48ad614SDennis Dalessandro * This program is distributed in the hope that it will be useful, but 14f48ad614SDennis Dalessandro * WITHOUT ANY WARRANTY; without even the implied warranty of 15f48ad614SDennis Dalessandro * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 16f48ad614SDennis Dalessandro * General Public License for more details. 17f48ad614SDennis Dalessandro * 18f48ad614SDennis Dalessandro * BSD LICENSE 19f48ad614SDennis Dalessandro * 20f48ad614SDennis Dalessandro * Redistribution and use in source and binary forms, with or without 21f48ad614SDennis Dalessandro * modification, are permitted provided that the following conditions 22f48ad614SDennis Dalessandro * are met: 23f48ad614SDennis Dalessandro * 24f48ad614SDennis Dalessandro * - Redistributions of source code must retain the above copyright 25f48ad614SDennis Dalessandro * notice, this list of conditions and the following disclaimer. 26f48ad614SDennis Dalessandro * - Redistributions in binary form must reproduce the above copyright 27f48ad614SDennis Dalessandro * notice, this list of conditions and the following disclaimer in 28f48ad614SDennis Dalessandro * the documentation and/or other materials provided with the 29f48ad614SDennis Dalessandro * distribution. 30f48ad614SDennis Dalessandro * - Neither the name of Intel Corporation nor the names of its 31f48ad614SDennis Dalessandro * contributors may be used to endorse or promote products derived 32f48ad614SDennis Dalessandro * from this software without specific prior written permission. 33f48ad614SDennis Dalessandro * 34f48ad614SDennis Dalessandro * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 35f48ad614SDennis Dalessandro * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 36f48ad614SDennis Dalessandro * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 37f48ad614SDennis Dalessandro * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT 38f48ad614SDennis Dalessandro * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 39f48ad614SDennis Dalessandro * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 40f48ad614SDennis Dalessandro * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 41f48ad614SDennis Dalessandro * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 42f48ad614SDennis Dalessandro * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 43f48ad614SDennis Dalessandro * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 44f48ad614SDennis Dalessandro * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 45f48ad614SDennis Dalessandro * 46f48ad614SDennis Dalessandro */ 47f48ad614SDennis Dalessandro #include <linux/list.h> 48f48ad614SDennis Dalessandro #include <linux/rculist.h> 49f48ad614SDennis Dalessandro #include <linux/mmu_notifier.h> 50f48ad614SDennis Dalessandro #include <linux/interval_tree_generic.h> 51f48ad614SDennis Dalessandro 52f48ad614SDennis Dalessandro #include "mmu_rb.h" 53f48ad614SDennis Dalessandro #include "trace.h" 54f48ad614SDennis Dalessandro 55f48ad614SDennis Dalessandro struct mmu_rb_handler { 56f48ad614SDennis Dalessandro struct mmu_notifier mn; 57f808c13fSDavidlohr Bueso struct rb_root_cached root; 58e0b09ac5SDean Luick void *ops_arg; 59f48ad614SDennis Dalessandro spinlock_t lock; /* protect the RB tree */ 60f48ad614SDennis Dalessandro struct mmu_rb_ops *ops; 613faa3d9aSIra Weiny struct mm_struct *mm; 620636e9abSDean Luick struct list_head lru_list; 63b85ced91SDean Luick struct work_struct del_work; 64b85ced91SDean Luick struct list_head del_list; 65b85ced91SDean Luick struct workqueue_struct *wq; 66f48ad614SDennis Dalessandro }; 67f48ad614SDennis Dalessandro 68f48ad614SDennis Dalessandro static unsigned long mmu_node_start(struct mmu_rb_node *); 69f48ad614SDennis Dalessandro static unsigned long mmu_node_last(struct mmu_rb_node *); 70*93065ac7SMichal Hocko static int mmu_notifier_range_start(struct mmu_notifier *, 71f48ad614SDennis Dalessandro struct mm_struct *, 72*93065ac7SMichal Hocko unsigned long, unsigned long, bool); 73f48ad614SDennis Dalessandro static struct mmu_rb_node *__mmu_rb_search(struct mmu_rb_handler *, 74f48ad614SDennis Dalessandro unsigned long, unsigned long); 75b85ced91SDean Luick static void do_remove(struct mmu_rb_handler *handler, 76b85ced91SDean Luick struct list_head *del_list); 77b85ced91SDean Luick static void handle_remove(struct work_struct *work); 78f48ad614SDennis Dalessandro 790fc859a6SBhumika Goyal static const struct mmu_notifier_ops mn_opts = { 805ff7091fSDavid Rientjes .flags = MMU_INVALIDATE_DOES_NOT_BLOCK, 81f48ad614SDennis Dalessandro .invalidate_range_start = mmu_notifier_range_start, 82f48ad614SDennis Dalessandro }; 83f48ad614SDennis Dalessandro 84f48ad614SDennis Dalessandro INTERVAL_TREE_DEFINE(struct mmu_rb_node, node, unsigned long, __last, 85f48ad614SDennis Dalessandro mmu_node_start, mmu_node_last, static, __mmu_int_rb); 86f48ad614SDennis Dalessandro 87f48ad614SDennis Dalessandro static unsigned long mmu_node_start(struct mmu_rb_node *node) 88f48ad614SDennis Dalessandro { 89f48ad614SDennis Dalessandro return node->addr & PAGE_MASK; 90f48ad614SDennis Dalessandro } 91f48ad614SDennis Dalessandro 92f48ad614SDennis Dalessandro static unsigned long mmu_node_last(struct mmu_rb_node *node) 93f48ad614SDennis Dalessandro { 94f48ad614SDennis Dalessandro return PAGE_ALIGN(node->addr + node->len) - 1; 95f48ad614SDennis Dalessandro } 96f48ad614SDennis Dalessandro 97e0b09ac5SDean Luick int hfi1_mmu_rb_register(void *ops_arg, struct mm_struct *mm, 98e0b09ac5SDean Luick struct mmu_rb_ops *ops, 99b85ced91SDean Luick struct workqueue_struct *wq, 100e0b09ac5SDean Luick struct mmu_rb_handler **handler) 101f48ad614SDennis Dalessandro { 102f48ad614SDennis Dalessandro struct mmu_rb_handler *handlr; 1033faa3d9aSIra Weiny int ret; 104f48ad614SDennis Dalessandro 105f48ad614SDennis Dalessandro handlr = kmalloc(sizeof(*handlr), GFP_KERNEL); 106f48ad614SDennis Dalessandro if (!handlr) 107f48ad614SDennis Dalessandro return -ENOMEM; 108f48ad614SDennis Dalessandro 109f808c13fSDavidlohr Bueso handlr->root = RB_ROOT_CACHED; 110f48ad614SDennis Dalessandro handlr->ops = ops; 111e0b09ac5SDean Luick handlr->ops_arg = ops_arg; 112f48ad614SDennis Dalessandro INIT_HLIST_NODE(&handlr->mn.hlist); 113f48ad614SDennis Dalessandro spin_lock_init(&handlr->lock); 114f48ad614SDennis Dalessandro handlr->mn.ops = &mn_opts; 1153faa3d9aSIra Weiny handlr->mm = mm; 116b85ced91SDean Luick INIT_WORK(&handlr->del_work, handle_remove); 117b85ced91SDean Luick INIT_LIST_HEAD(&handlr->del_list); 1180636e9abSDean Luick INIT_LIST_HEAD(&handlr->lru_list); 119b85ced91SDean Luick handlr->wq = wq; 1203faa3d9aSIra Weiny 1213faa3d9aSIra Weiny ret = mmu_notifier_register(&handlr->mn, handlr->mm); 1223faa3d9aSIra Weiny if (ret) { 1233faa3d9aSIra Weiny kfree(handlr); 1243faa3d9aSIra Weiny return ret; 1253faa3d9aSIra Weiny } 1263faa3d9aSIra Weiny 127e0b09ac5SDean Luick *handler = handlr; 128e0b09ac5SDean Luick return 0; 129f48ad614SDennis Dalessandro } 130f48ad614SDennis Dalessandro 131e0b09ac5SDean Luick void hfi1_mmu_rb_unregister(struct mmu_rb_handler *handler) 132f48ad614SDennis Dalessandro { 13320a42d08SDean Luick struct mmu_rb_node *rbnode; 13420a42d08SDean Luick struct rb_node *node; 135f48ad614SDennis Dalessandro unsigned long flags; 136b85ced91SDean Luick struct list_head del_list; 137f48ad614SDennis Dalessandro 138f48ad614SDennis Dalessandro /* Unregister first so we don't get any more notifications. */ 1393faa3d9aSIra Weiny mmu_notifier_unregister(&handler->mn, handler->mm); 140f48ad614SDennis Dalessandro 141b85ced91SDean Luick /* 142b85ced91SDean Luick * Make sure the wq delete handler is finished running. It will not 143b85ced91SDean Luick * be triggered once the mmu notifiers are unregistered above. 144b85ced91SDean Luick */ 145b85ced91SDean Luick flush_work(&handler->del_work); 146b85ced91SDean Luick 147b85ced91SDean Luick INIT_LIST_HEAD(&del_list); 148b85ced91SDean Luick 149f48ad614SDennis Dalessandro spin_lock_irqsave(&handler->lock, flags); 150f808c13fSDavidlohr Bueso while ((node = rb_first_cached(&handler->root))) { 151f48ad614SDennis Dalessandro rbnode = rb_entry(node, struct mmu_rb_node, node); 152f808c13fSDavidlohr Bueso rb_erase_cached(node, &handler->root); 1530636e9abSDean Luick /* move from LRU list to delete list */ 1540636e9abSDean Luick list_move(&rbnode->list, &del_list); 155f48ad614SDennis Dalessandro } 156f48ad614SDennis Dalessandro spin_unlock_irqrestore(&handler->lock, flags); 157f48ad614SDennis Dalessandro 158b85ced91SDean Luick do_remove(handler, &del_list); 159b85ced91SDean Luick 160f48ad614SDennis Dalessandro kfree(handler); 161f48ad614SDennis Dalessandro } 162f48ad614SDennis Dalessandro 163e0b09ac5SDean Luick int hfi1_mmu_rb_insert(struct mmu_rb_handler *handler, 164e0b09ac5SDean Luick struct mmu_rb_node *mnode) 165f48ad614SDennis Dalessandro { 166f48ad614SDennis Dalessandro struct mmu_rb_node *node; 167f48ad614SDennis Dalessandro unsigned long flags; 168f48ad614SDennis Dalessandro int ret = 0; 169f48ad614SDennis Dalessandro 17034ab4de7SMichael J. Ruhl trace_hfi1_mmu_rb_insert(mnode->addr, mnode->len); 171f48ad614SDennis Dalessandro spin_lock_irqsave(&handler->lock, flags); 172f48ad614SDennis Dalessandro node = __mmu_rb_search(handler, mnode->addr, mnode->len); 173f48ad614SDennis Dalessandro if (node) { 174f48ad614SDennis Dalessandro ret = -EINVAL; 175f48ad614SDennis Dalessandro goto unlock; 176f48ad614SDennis Dalessandro } 177e0b09ac5SDean Luick __mmu_int_rb_insert(mnode, &handler->root); 1780636e9abSDean Luick list_add(&mnode->list, &handler->lru_list); 179f48ad614SDennis Dalessandro 180e0b09ac5SDean Luick ret = handler->ops->insert(handler->ops_arg, mnode); 1810636e9abSDean Luick if (ret) { 182e0b09ac5SDean Luick __mmu_int_rb_remove(mnode, &handler->root); 1830636e9abSDean Luick list_del(&mnode->list); /* remove from LRU list */ 1840636e9abSDean Luick } 185f48ad614SDennis Dalessandro unlock: 186f48ad614SDennis Dalessandro spin_unlock_irqrestore(&handler->lock, flags); 187f48ad614SDennis Dalessandro return ret; 188f48ad614SDennis Dalessandro } 189f48ad614SDennis Dalessandro 190f48ad614SDennis Dalessandro /* Caller must hold handler lock */ 191f48ad614SDennis Dalessandro static struct mmu_rb_node *__mmu_rb_search(struct mmu_rb_handler *handler, 192f48ad614SDennis Dalessandro unsigned long addr, 193f48ad614SDennis Dalessandro unsigned long len) 194f48ad614SDennis Dalessandro { 195f48ad614SDennis Dalessandro struct mmu_rb_node *node = NULL; 196f48ad614SDennis Dalessandro 19734ab4de7SMichael J. Ruhl trace_hfi1_mmu_rb_search(addr, len); 198f48ad614SDennis Dalessandro if (!handler->ops->filter) { 199e0b09ac5SDean Luick node = __mmu_int_rb_iter_first(&handler->root, addr, 200f48ad614SDennis Dalessandro (addr + len) - 1); 201f48ad614SDennis Dalessandro } else { 202e0b09ac5SDean Luick for (node = __mmu_int_rb_iter_first(&handler->root, addr, 203f48ad614SDennis Dalessandro (addr + len) - 1); 204f48ad614SDennis Dalessandro node; 205f48ad614SDennis Dalessandro node = __mmu_int_rb_iter_next(node, addr, 206f48ad614SDennis Dalessandro (addr + len) - 1)) { 207f48ad614SDennis Dalessandro if (handler->ops->filter(node, addr, len)) 208f48ad614SDennis Dalessandro return node; 209f48ad614SDennis Dalessandro } 210f48ad614SDennis Dalessandro } 211f48ad614SDennis Dalessandro return node; 212f48ad614SDennis Dalessandro } 213f48ad614SDennis Dalessandro 2147be85676SSebastian Sanchez bool hfi1_mmu_rb_remove_unless_exact(struct mmu_rb_handler *handler, 2157be85676SSebastian Sanchez unsigned long addr, unsigned long len, 2167be85676SSebastian Sanchez struct mmu_rb_node **rb_node) 217f48ad614SDennis Dalessandro { 218f48ad614SDennis Dalessandro struct mmu_rb_node *node; 219f48ad614SDennis Dalessandro unsigned long flags; 2207be85676SSebastian Sanchez bool ret = false; 221f48ad614SDennis Dalessandro 222f48ad614SDennis Dalessandro spin_lock_irqsave(&handler->lock, flags); 223f48ad614SDennis Dalessandro node = __mmu_rb_search(handler, addr, len); 2240636e9abSDean Luick if (node) { 2257be85676SSebastian Sanchez if (node->addr == addr && node->len == len) 2267be85676SSebastian Sanchez goto unlock; 227e0b09ac5SDean Luick __mmu_int_rb_remove(node, &handler->root); 2280636e9abSDean Luick list_del(&node->list); /* remove from LRU list */ 2297be85676SSebastian Sanchez ret = true; 2300636e9abSDean Luick } 2317be85676SSebastian Sanchez unlock: 232f48ad614SDennis Dalessandro spin_unlock_irqrestore(&handler->lock, flags); 2337be85676SSebastian Sanchez *rb_node = node; 2347be85676SSebastian Sanchez return ret; 235f48ad614SDennis Dalessandro } 236f48ad614SDennis Dalessandro 23710345998SDean Luick void hfi1_mmu_rb_evict(struct mmu_rb_handler *handler, void *evict_arg) 23810345998SDean Luick { 2390636e9abSDean Luick struct mmu_rb_node *rbnode, *ptr; 24010345998SDean Luick struct list_head del_list; 24110345998SDean Luick unsigned long flags; 24210345998SDean Luick bool stop = false; 24310345998SDean Luick 24410345998SDean Luick INIT_LIST_HEAD(&del_list); 24510345998SDean Luick 24610345998SDean Luick spin_lock_irqsave(&handler->lock, flags); 2470636e9abSDean Luick list_for_each_entry_safe_reverse(rbnode, ptr, &handler->lru_list, 2480636e9abSDean Luick list) { 24910345998SDean Luick if (handler->ops->evict(handler->ops_arg, rbnode, evict_arg, 25010345998SDean Luick &stop)) { 25110345998SDean Luick __mmu_int_rb_remove(rbnode, &handler->root); 2520636e9abSDean Luick /* move from LRU list to delete list */ 2530636e9abSDean Luick list_move(&rbnode->list, &del_list); 25410345998SDean Luick } 25510345998SDean Luick if (stop) 25610345998SDean Luick break; 25710345998SDean Luick } 25810345998SDean Luick spin_unlock_irqrestore(&handler->lock, flags); 25910345998SDean Luick 26010345998SDean Luick while (!list_empty(&del_list)) { 26110345998SDean Luick rbnode = list_first_entry(&del_list, struct mmu_rb_node, list); 26210345998SDean Luick list_del(&rbnode->list); 263082b3532SDean Luick handler->ops->remove(handler->ops_arg, rbnode); 26410345998SDean Luick } 26510345998SDean Luick } 26610345998SDean Luick 267b85ced91SDean Luick /* 268b85ced91SDean Luick * It is up to the caller to ensure that this function does not race with the 269b85ced91SDean Luick * mmu invalidate notifier which may be calling the users remove callback on 270b85ced91SDean Luick * 'node'. 271b85ced91SDean Luick */ 272e0b09ac5SDean Luick void hfi1_mmu_rb_remove(struct mmu_rb_handler *handler, 273e0b09ac5SDean Luick struct mmu_rb_node *node) 274f48ad614SDennis Dalessandro { 2753c1091aaSIra Weiny unsigned long flags; 276f48ad614SDennis Dalessandro 2773c1091aaSIra Weiny /* Validity of handler and node pointers has been checked by caller. */ 27834ab4de7SMichael J. Ruhl trace_hfi1_mmu_rb_remove(node->addr, node->len); 2793c1091aaSIra Weiny spin_lock_irqsave(&handler->lock, flags); 280e0b09ac5SDean Luick __mmu_int_rb_remove(node, &handler->root); 2810636e9abSDean Luick list_del(&node->list); /* remove from LRU list */ 2823c1091aaSIra Weiny spin_unlock_irqrestore(&handler->lock, flags); 2833c1091aaSIra Weiny 284082b3532SDean Luick handler->ops->remove(handler->ops_arg, node); 285f48ad614SDennis Dalessandro } 286f48ad614SDennis Dalessandro 287*93065ac7SMichal Hocko static int mmu_notifier_range_start(struct mmu_notifier *mn, 288f48ad614SDennis Dalessandro struct mm_struct *mm, 289f48ad614SDennis Dalessandro unsigned long start, 290*93065ac7SMichal Hocko unsigned long end, 291*93065ac7SMichal Hocko bool blockable) 292f48ad614SDennis Dalessandro { 293f48ad614SDennis Dalessandro struct mmu_rb_handler *handler = 294f48ad614SDennis Dalessandro container_of(mn, struct mmu_rb_handler, mn); 295f808c13fSDavidlohr Bueso struct rb_root_cached *root = &handler->root; 296f48ad614SDennis Dalessandro struct mmu_rb_node *node, *ptr = NULL; 297f48ad614SDennis Dalessandro unsigned long flags; 298b85ced91SDean Luick bool added = false; 299f48ad614SDennis Dalessandro 300f48ad614SDennis Dalessandro spin_lock_irqsave(&handler->lock, flags); 301f48ad614SDennis Dalessandro for (node = __mmu_int_rb_iter_first(root, start, end - 1); 302f48ad614SDennis Dalessandro node; node = ptr) { 303f48ad614SDennis Dalessandro /* Guard against node removal. */ 304f48ad614SDennis Dalessandro ptr = __mmu_int_rb_iter_next(node, start, end - 1); 30534ab4de7SMichael J. Ruhl trace_hfi1_mmu_mem_invalidate(node->addr, node->len); 306e0b09ac5SDean Luick if (handler->ops->invalidate(handler->ops_arg, node)) { 307f48ad614SDennis Dalessandro __mmu_int_rb_remove(node, root); 3080636e9abSDean Luick /* move from LRU list to delete list */ 3090636e9abSDean Luick list_move(&node->list, &handler->del_list); 310b85ced91SDean Luick added = true; 311f48ad614SDennis Dalessandro } 312f48ad614SDennis Dalessandro } 313f48ad614SDennis Dalessandro spin_unlock_irqrestore(&handler->lock, flags); 314b85ced91SDean Luick 315b85ced91SDean Luick if (added) 316b85ced91SDean Luick queue_work(handler->wq, &handler->del_work); 317*93065ac7SMichal Hocko 318*93065ac7SMichal Hocko return 0; 319b85ced91SDean Luick } 320b85ced91SDean Luick 321b85ced91SDean Luick /* 322b85ced91SDean Luick * Call the remove function for the given handler and the list. This 323b85ced91SDean Luick * is expected to be called with a delete list extracted from handler. 324b85ced91SDean Luick * The caller should not be holding the handler lock. 325b85ced91SDean Luick */ 326b85ced91SDean Luick static void do_remove(struct mmu_rb_handler *handler, 327b85ced91SDean Luick struct list_head *del_list) 328b85ced91SDean Luick { 329b85ced91SDean Luick struct mmu_rb_node *node; 330b85ced91SDean Luick 331b85ced91SDean Luick while (!list_empty(del_list)) { 332b85ced91SDean Luick node = list_first_entry(del_list, struct mmu_rb_node, list); 333b85ced91SDean Luick list_del(&node->list); 334082b3532SDean Luick handler->ops->remove(handler->ops_arg, node); 335b85ced91SDean Luick } 336b85ced91SDean Luick } 337b85ced91SDean Luick 338b85ced91SDean Luick /* 339b85ced91SDean Luick * Work queue function to remove all nodes that have been queued up to 340b85ced91SDean Luick * be removed. The key feature is that mm->mmap_sem is not being held 341b85ced91SDean Luick * and the remove callback can sleep while taking it, if needed. 342b85ced91SDean Luick */ 343b85ced91SDean Luick static void handle_remove(struct work_struct *work) 344b85ced91SDean Luick { 345b85ced91SDean Luick struct mmu_rb_handler *handler = container_of(work, 346b85ced91SDean Luick struct mmu_rb_handler, 347b85ced91SDean Luick del_work); 348b85ced91SDean Luick struct list_head del_list; 349b85ced91SDean Luick unsigned long flags; 350b85ced91SDean Luick 351b85ced91SDean Luick /* remove anything that is queued to get removed */ 352b85ced91SDean Luick spin_lock_irqsave(&handler->lock, flags); 353b85ced91SDean Luick list_replace_init(&handler->del_list, &del_list); 354b85ced91SDean Luick spin_unlock_irqrestore(&handler->lock, flags); 355b85ced91SDean Luick 356b85ced91SDean Luick do_remove(handler, &del_list); 357f48ad614SDennis Dalessandro } 358