10b61f8a4SDave Chinner // SPDX-License-Identifier: GPL-2.0 21da177e4SLinus Torvalds /* 37b718769SNathan Scott * Copyright (c) 2000-2002,2005 Silicon Graphics, Inc. 4c7e8f268SDavid Chinner * Copyright (c) 2008 Dave Chinner 57b718769SNathan Scott * All Rights Reserved. 61da177e4SLinus Torvalds */ 71da177e4SLinus Torvalds #include "xfs.h" 8a844f451SNathan Scott #include "xfs_fs.h" 95467b34bSDarrick J. Wong #include "xfs_shared.h" 104fb6e8adSChristoph Hellwig #include "xfs_format.h" 11239880efSDave Chinner #include "xfs_log_format.h" 12239880efSDave Chinner #include "xfs_trans_resv.h" 131da177e4SLinus Torvalds #include "xfs_mount.h" 14239880efSDave Chinner #include "xfs_trans.h" 151da177e4SLinus Torvalds #include "xfs_trans_priv.h" 169e4c109aSChristoph Hellwig #include "xfs_trace.h" 17e9e899a2SDarrick J. Wong #include "xfs_errortag.h" 181da177e4SLinus Torvalds #include "xfs_error.h" 19239880efSDave Chinner #include "xfs_log.h" 20*0020a190SDave Chinner #include "xfs_log_priv.h" 211da177e4SLinus Torvalds 221da177e4SLinus Torvalds #ifdef DEBUG 23cd4a3c50SDave Chinner /* 24cd4a3c50SDave Chinner * Check that the list is sorted as it should be. 25d686d12dSDave Chinner * 26d686d12dSDave Chinner * Called with the ail lock held, but we don't want to assert fail with it 27d686d12dSDave Chinner * held otherwise we'll lock everything up and won't be able to debug the 28d686d12dSDave Chinner * cause. Hence we sample and check the state under the AIL lock and return if 29d686d12dSDave Chinner * everything is fine, otherwise we drop the lock and run the ASSERT checks. 30d686d12dSDave Chinner * Asserts may not be fatal, so pick the lock back up and continue onwards. 31cd4a3c50SDave Chinner */ 32cd4a3c50SDave Chinner STATIC void 33cd4a3c50SDave Chinner xfs_ail_check( 34cd4a3c50SDave Chinner struct xfs_ail *ailp, 35d686d12dSDave Chinner struct xfs_log_item *lip) 36daebba1bSJules Irenge __must_hold(&ailp->ail_lock) 37cd4a3c50SDave Chinner { 38d686d12dSDave Chinner struct xfs_log_item *prev_lip; 39d686d12dSDave Chinner struct xfs_log_item *next_lip; 40d686d12dSDave Chinner xfs_lsn_t prev_lsn = NULLCOMMITLSN; 41d686d12dSDave Chinner xfs_lsn_t next_lsn = NULLCOMMITLSN; 42d686d12dSDave Chinner xfs_lsn_t lsn; 43d686d12dSDave Chinner bool in_ail; 44d686d12dSDave Chinner 45cd4a3c50SDave Chinner 4657e80956SMatthew Wilcox if (list_empty(&ailp->ail_head)) 47cd4a3c50SDave Chinner return; 48cd4a3c50SDave Chinner 49cd4a3c50SDave Chinner /* 50d686d12dSDave Chinner * Sample then check the next and previous entries are valid. 51cd4a3c50SDave Chinner */ 52d686d12dSDave Chinner in_ail = test_bit(XFS_LI_IN_AIL, &lip->li_flags); 53d686d12dSDave Chinner prev_lip = list_entry(lip->li_ail.prev, struct xfs_log_item, li_ail); 5457e80956SMatthew Wilcox if (&prev_lip->li_ail != &ailp->ail_head) 55d686d12dSDave Chinner prev_lsn = prev_lip->li_lsn; 56d686d12dSDave Chinner next_lip = list_entry(lip->li_ail.next, struct xfs_log_item, li_ail); 57d686d12dSDave Chinner if (&next_lip->li_ail != &ailp->ail_head) 58d686d12dSDave Chinner next_lsn = next_lip->li_lsn; 59d686d12dSDave Chinner lsn = lip->li_lsn; 60cd4a3c50SDave Chinner 61d686d12dSDave Chinner if (in_ail && 62d686d12dSDave Chinner (prev_lsn == NULLCOMMITLSN || XFS_LSN_CMP(prev_lsn, lsn) <= 0) && 63d686d12dSDave Chinner (next_lsn == NULLCOMMITLSN || XFS_LSN_CMP(next_lsn, lsn) >= 0)) 64d686d12dSDave Chinner return; 65cd4a3c50SDave Chinner 66d686d12dSDave Chinner spin_unlock(&ailp->ail_lock); 67d686d12dSDave Chinner ASSERT(in_ail); 68d686d12dSDave Chinner ASSERT(prev_lsn == NULLCOMMITLSN || XFS_LSN_CMP(prev_lsn, lsn) <= 0); 69d686d12dSDave Chinner ASSERT(next_lsn == NULLCOMMITLSN || XFS_LSN_CMP(next_lsn, lsn) >= 0); 70d686d12dSDave Chinner spin_lock(&ailp->ail_lock); 71cd4a3c50SDave Chinner } 72cd4a3c50SDave Chinner #else /* !DEBUG */ 73de08dbc1SDavid Chinner #define xfs_ail_check(a,l) 741da177e4SLinus Torvalds #endif /* DEBUG */ 751da177e4SLinus Torvalds 76cd4a3c50SDave Chinner /* 77fd074841SDave Chinner * Return a pointer to the last item in the AIL. If the AIL is empty, then 78fd074841SDave Chinner * return NULL. 79fd074841SDave Chinner */ 80efe2330fSChristoph Hellwig static struct xfs_log_item * 81fd074841SDave Chinner xfs_ail_max( 82fd074841SDave Chinner struct xfs_ail *ailp) 83fd074841SDave Chinner { 8457e80956SMatthew Wilcox if (list_empty(&ailp->ail_head)) 85fd074841SDave Chinner return NULL; 86fd074841SDave Chinner 87efe2330fSChristoph Hellwig return list_entry(ailp->ail_head.prev, struct xfs_log_item, li_ail); 88fd074841SDave Chinner } 89fd074841SDave Chinner 90fd074841SDave Chinner /* 91cd4a3c50SDave Chinner * Return a pointer to the item which follows the given item in the AIL. If 92cd4a3c50SDave Chinner * the given item is the last item in the list, then return NULL. 93cd4a3c50SDave Chinner */ 94efe2330fSChristoph Hellwig static struct xfs_log_item * 95cd4a3c50SDave Chinner xfs_ail_next( 96cd4a3c50SDave Chinner struct xfs_ail *ailp, 97efe2330fSChristoph Hellwig struct xfs_log_item *lip) 98cd4a3c50SDave Chinner { 9957e80956SMatthew Wilcox if (lip->li_ail.next == &ailp->ail_head) 100cd4a3c50SDave Chinner return NULL; 101cd4a3c50SDave Chinner 102efe2330fSChristoph Hellwig return list_first_entry(&lip->li_ail, struct xfs_log_item, li_ail); 103cd4a3c50SDave Chinner } 104cd4a3c50SDave Chinner 105cd4a3c50SDave Chinner /* 106cd4a3c50SDave Chinner * This is called by the log manager code to determine the LSN of the tail of 107cd4a3c50SDave Chinner * the log. This is exactly the LSN of the first item in the AIL. If the AIL 108cd4a3c50SDave Chinner * is empty, then this function returns 0. 1091da177e4SLinus Torvalds * 110cd4a3c50SDave Chinner * We need the AIL lock in order to get a coherent read of the lsn of the last 111cd4a3c50SDave Chinner * item in the AIL. 1121da177e4SLinus Torvalds */ 1138eb807bdSDave Chinner static xfs_lsn_t 1148eb807bdSDave Chinner __xfs_ail_min_lsn( 1158eb807bdSDave Chinner struct xfs_ail *ailp) 1168eb807bdSDave Chinner { 1178eb807bdSDave Chinner struct xfs_log_item *lip = xfs_ail_min(ailp); 1188eb807bdSDave Chinner 1198eb807bdSDave Chinner if (lip) 1208eb807bdSDave Chinner return lip->li_lsn; 1218eb807bdSDave Chinner return 0; 1228eb807bdSDave Chinner } 1238eb807bdSDave Chinner 1241da177e4SLinus Torvalds xfs_lsn_t 125fd074841SDave Chinner xfs_ail_min_lsn( 1265b00f14fSDavid Chinner struct xfs_ail *ailp) 1271da177e4SLinus Torvalds { 1288eb807bdSDave Chinner xfs_lsn_t lsn; 1291da177e4SLinus Torvalds 13057e80956SMatthew Wilcox spin_lock(&ailp->ail_lock); 1318eb807bdSDave Chinner lsn = __xfs_ail_min_lsn(ailp); 13257e80956SMatthew Wilcox spin_unlock(&ailp->ail_lock); 1331da177e4SLinus Torvalds 1341da177e4SLinus Torvalds return lsn; 1351da177e4SLinus Torvalds } 1361da177e4SLinus Torvalds 1371da177e4SLinus Torvalds /* 138fd074841SDave Chinner * Return the maximum lsn held in the AIL, or zero if the AIL is empty. 139fd074841SDave Chinner */ 140fd074841SDave Chinner static xfs_lsn_t 141fd074841SDave Chinner xfs_ail_max_lsn( 142fd074841SDave Chinner struct xfs_ail *ailp) 143fd074841SDave Chinner { 144fd074841SDave Chinner xfs_lsn_t lsn = 0; 145efe2330fSChristoph Hellwig struct xfs_log_item *lip; 146fd074841SDave Chinner 14757e80956SMatthew Wilcox spin_lock(&ailp->ail_lock); 148fd074841SDave Chinner lip = xfs_ail_max(ailp); 149fd074841SDave Chinner if (lip) 150fd074841SDave Chinner lsn = lip->li_lsn; 15157e80956SMatthew Wilcox spin_unlock(&ailp->ail_lock); 152fd074841SDave Chinner 153fd074841SDave Chinner return lsn; 154fd074841SDave Chinner } 155fd074841SDave Chinner 156fd074841SDave Chinner /* 157af3e4022SDave Chinner * The cursor keeps track of where our current traversal is up to by tracking 158af3e4022SDave Chinner * the next item in the list for us. However, for this to be safe, removing an 159af3e4022SDave Chinner * object from the AIL needs to invalidate any cursor that points to it. hence 160af3e4022SDave Chinner * the traversal cursor needs to be linked to the struct xfs_ail so that 161af3e4022SDave Chinner * deletion can search all the active cursors for invalidation. 16227d8d5feSDavid Chinner */ 1635b00f14fSDavid Chinner STATIC void 16427d8d5feSDavid Chinner xfs_trans_ail_cursor_init( 16527d8d5feSDavid Chinner struct xfs_ail *ailp, 16627d8d5feSDavid Chinner struct xfs_ail_cursor *cur) 16727d8d5feSDavid Chinner { 16827d8d5feSDavid Chinner cur->item = NULL; 16957e80956SMatthew Wilcox list_add_tail(&cur->list, &ailp->ail_cursors); 17027d8d5feSDavid Chinner } 17127d8d5feSDavid Chinner 17227d8d5feSDavid Chinner /* 173af3e4022SDave Chinner * Get the next item in the traversal and advance the cursor. If the cursor 174af3e4022SDave Chinner * was invalidated (indicated by a lip of 1), restart the traversal. 17527d8d5feSDavid Chinner */ 1765b00f14fSDavid Chinner struct xfs_log_item * 17727d8d5feSDavid Chinner xfs_trans_ail_cursor_next( 17827d8d5feSDavid Chinner struct xfs_ail *ailp, 17927d8d5feSDavid Chinner struct xfs_ail_cursor *cur) 18027d8d5feSDavid Chinner { 18127d8d5feSDavid Chinner struct xfs_log_item *lip = cur->item; 18227d8d5feSDavid Chinner 183db9d67d6SChristoph Hellwig if ((uintptr_t)lip & 1) 18427d8d5feSDavid Chinner lip = xfs_ail_min(ailp); 18516b59029SDave Chinner if (lip) 18616b59029SDave Chinner cur->item = xfs_ail_next(ailp, lip); 18727d8d5feSDavid Chinner return lip; 18827d8d5feSDavid Chinner } 18927d8d5feSDavid Chinner 19027d8d5feSDavid Chinner /* 191af3e4022SDave Chinner * When the traversal is complete, we need to remove the cursor from the list 192af3e4022SDave Chinner * of traversing cursors. 19327d8d5feSDavid Chinner */ 19427d8d5feSDavid Chinner void 19527d8d5feSDavid Chinner xfs_trans_ail_cursor_done( 196af3e4022SDave Chinner struct xfs_ail_cursor *cur) 19727d8d5feSDavid Chinner { 198af3e4022SDave Chinner cur->item = NULL; 199af3e4022SDave Chinner list_del_init(&cur->list); 20027d8d5feSDavid Chinner } 20127d8d5feSDavid Chinner 20227d8d5feSDavid Chinner /* 203af3e4022SDave Chinner * Invalidate any cursor that is pointing to this item. This is called when an 204af3e4022SDave Chinner * item is removed from the AIL. Any cursor pointing to this object is now 205af3e4022SDave Chinner * invalid and the traversal needs to be terminated so it doesn't reference a 206af3e4022SDave Chinner * freed object. We set the low bit of the cursor item pointer so we can 207af3e4022SDave Chinner * distinguish between an invalidation and the end of the list when getting the 208af3e4022SDave Chinner * next item from the cursor. 2095b00f14fSDavid Chinner */ 2105b00f14fSDavid Chinner STATIC void 2115b00f14fSDavid Chinner xfs_trans_ail_cursor_clear( 2125b00f14fSDavid Chinner struct xfs_ail *ailp, 2135b00f14fSDavid Chinner struct xfs_log_item *lip) 2145b00f14fSDavid Chinner { 2155b00f14fSDavid Chinner struct xfs_ail_cursor *cur; 2165b00f14fSDavid Chinner 21757e80956SMatthew Wilcox list_for_each_entry(cur, &ailp->ail_cursors, list) { 2185b00f14fSDavid Chinner if (cur->item == lip) 2195b00f14fSDavid Chinner cur->item = (struct xfs_log_item *) 220db9d67d6SChristoph Hellwig ((uintptr_t)cur->item | 1); 2215b00f14fSDavid Chinner } 2225b00f14fSDavid Chinner } 2235b00f14fSDavid Chinner 2245b00f14fSDavid Chinner /* 22516b59029SDave Chinner * Find the first item in the AIL with the given @lsn by searching in ascending 22616b59029SDave Chinner * LSN order and initialise the cursor to point to the next item for a 22716b59029SDave Chinner * ascending traversal. Pass a @lsn of zero to initialise the cursor to the 22816b59029SDave Chinner * first item in the AIL. Returns NULL if the list is empty. 229249a8c11SDavid Chinner */ 230efe2330fSChristoph Hellwig struct xfs_log_item * 2315b00f14fSDavid Chinner xfs_trans_ail_cursor_first( 23227d8d5feSDavid Chinner struct xfs_ail *ailp, 23327d8d5feSDavid Chinner struct xfs_ail_cursor *cur, 234249a8c11SDavid Chinner xfs_lsn_t lsn) 235249a8c11SDavid Chinner { 236efe2330fSChristoph Hellwig struct xfs_log_item *lip; 237249a8c11SDavid Chinner 2385b00f14fSDavid Chinner xfs_trans_ail_cursor_init(ailp, cur); 23916b59029SDave Chinner 24016b59029SDave Chinner if (lsn == 0) { 24127d8d5feSDavid Chinner lip = xfs_ail_min(ailp); 2425b00f14fSDavid Chinner goto out; 24316b59029SDave Chinner } 244249a8c11SDavid Chinner 24557e80956SMatthew Wilcox list_for_each_entry(lip, &ailp->ail_head, li_ail) { 2465b00f14fSDavid Chinner if (XFS_LSN_CMP(lip->li_lsn, lsn) >= 0) 2477ee49acfSDavid Chinner goto out; 2485b00f14fSDavid Chinner } 24916b59029SDave Chinner return NULL; 25016b59029SDave Chinner 2515b00f14fSDavid Chinner out: 25216b59029SDave Chinner if (lip) 25316b59029SDave Chinner cur->item = xfs_ail_next(ailp, lip); 254249a8c11SDavid Chinner return lip; 255249a8c11SDavid Chinner } 256535f6b37SJosef 'Jeff' Sipek 2571d8c95a3SDave Chinner static struct xfs_log_item * 2581d8c95a3SDave Chinner __xfs_trans_ail_cursor_last( 2591d8c95a3SDave Chinner struct xfs_ail *ailp, 2601d8c95a3SDave Chinner xfs_lsn_t lsn) 2611d8c95a3SDave Chinner { 262efe2330fSChristoph Hellwig struct xfs_log_item *lip; 2631d8c95a3SDave Chinner 26457e80956SMatthew Wilcox list_for_each_entry_reverse(lip, &ailp->ail_head, li_ail) { 2651d8c95a3SDave Chinner if (XFS_LSN_CMP(lip->li_lsn, lsn) <= 0) 2661d8c95a3SDave Chinner return lip; 2671d8c95a3SDave Chinner } 2681d8c95a3SDave Chinner return NULL; 2691d8c95a3SDave Chinner } 2701d8c95a3SDave Chinner 2711d8c95a3SDave Chinner /* 27216b59029SDave Chinner * Find the last item in the AIL with the given @lsn by searching in descending 27316b59029SDave Chinner * LSN order and initialise the cursor to point to that item. If there is no 27416b59029SDave Chinner * item with the value of @lsn, then it sets the cursor to the last item with an 27516b59029SDave Chinner * LSN lower than @lsn. Returns NULL if the list is empty. 2761d8c95a3SDave Chinner */ 2771d8c95a3SDave Chinner struct xfs_log_item * 2781d8c95a3SDave Chinner xfs_trans_ail_cursor_last( 2791d8c95a3SDave Chinner struct xfs_ail *ailp, 2801d8c95a3SDave Chinner struct xfs_ail_cursor *cur, 2811d8c95a3SDave Chinner xfs_lsn_t lsn) 2821d8c95a3SDave Chinner { 2831d8c95a3SDave Chinner xfs_trans_ail_cursor_init(ailp, cur); 2841d8c95a3SDave Chinner cur->item = __xfs_trans_ail_cursor_last(ailp, lsn); 2851d8c95a3SDave Chinner return cur->item; 2861d8c95a3SDave Chinner } 2871d8c95a3SDave Chinner 2881d8c95a3SDave Chinner /* 28916b59029SDave Chinner * Splice the log item list into the AIL at the given LSN. We splice to the 2901d8c95a3SDave Chinner * tail of the given LSN to maintain insert order for push traversals. The 2911d8c95a3SDave Chinner * cursor is optional, allowing repeated updates to the same LSN to avoid 292e44f4112SAlex Elder * repeated traversals. This should not be called with an empty list. 293cd4a3c50SDave Chinner */ 294cd4a3c50SDave Chinner static void 295cd4a3c50SDave Chinner xfs_ail_splice( 296cd4a3c50SDave Chinner struct xfs_ail *ailp, 2971d8c95a3SDave Chinner struct xfs_ail_cursor *cur, 298cd4a3c50SDave Chinner struct list_head *list, 299cd4a3c50SDave Chinner xfs_lsn_t lsn) 300cd4a3c50SDave Chinner { 301e44f4112SAlex Elder struct xfs_log_item *lip; 302e44f4112SAlex Elder 303e44f4112SAlex Elder ASSERT(!list_empty(list)); 304cd4a3c50SDave Chinner 3051d8c95a3SDave Chinner /* 306e44f4112SAlex Elder * Use the cursor to determine the insertion point if one is 307e44f4112SAlex Elder * provided. If not, or if the one we got is not valid, 308e44f4112SAlex Elder * find the place in the AIL where the items belong. 3091d8c95a3SDave Chinner */ 310e44f4112SAlex Elder lip = cur ? cur->item : NULL; 311db9d67d6SChristoph Hellwig if (!lip || (uintptr_t)lip & 1) 3121d8c95a3SDave Chinner lip = __xfs_trans_ail_cursor_last(ailp, lsn); 3131d8c95a3SDave Chinner 314e44f4112SAlex Elder /* 315e44f4112SAlex Elder * If a cursor is provided, we know we're processing the AIL 316e44f4112SAlex Elder * in lsn order, and future items to be spliced in will 317e44f4112SAlex Elder * follow the last one being inserted now. Update the 318e44f4112SAlex Elder * cursor to point to that last item, now while we have a 319e44f4112SAlex Elder * reliable pointer to it. 320e44f4112SAlex Elder */ 3211d8c95a3SDave Chinner if (cur) 322e44f4112SAlex Elder cur->item = list_entry(list->prev, struct xfs_log_item, li_ail); 323cd4a3c50SDave Chinner 3241d8c95a3SDave Chinner /* 325e44f4112SAlex Elder * Finally perform the splice. Unless the AIL was empty, 326e44f4112SAlex Elder * lip points to the item in the AIL _after_ which the new 327e44f4112SAlex Elder * items should go. If lip is null the AIL was empty, so 328e44f4112SAlex Elder * the new items go at the head of the AIL. 3291d8c95a3SDave Chinner */ 330e44f4112SAlex Elder if (lip) 3311d8c95a3SDave Chinner list_splice(list, &lip->li_ail); 332e44f4112SAlex Elder else 33357e80956SMatthew Wilcox list_splice(list, &ailp->ail_head); 334cd4a3c50SDave Chinner } 335cd4a3c50SDave Chinner 336cd4a3c50SDave Chinner /* 337cd4a3c50SDave Chinner * Delete the given item from the AIL. Return a pointer to the item. 338cd4a3c50SDave Chinner */ 339cd4a3c50SDave Chinner static void 340cd4a3c50SDave Chinner xfs_ail_delete( 341cd4a3c50SDave Chinner struct xfs_ail *ailp, 342efe2330fSChristoph Hellwig struct xfs_log_item *lip) 343cd4a3c50SDave Chinner { 344cd4a3c50SDave Chinner xfs_ail_check(ailp, lip); 345cd4a3c50SDave Chinner list_del(&lip->li_ail); 346cd4a3c50SDave Chinner xfs_trans_ail_cursor_clear(ailp, lip); 347cd4a3c50SDave Chinner } 348cd4a3c50SDave Chinner 349cb6ad099SBrian Foster /* 350cb6ad099SBrian Foster * Requeue a failed buffer for writeback. 351cb6ad099SBrian Foster * 352cb6ad099SBrian Foster * We clear the log item failed state here as well, but we have to be careful 353cb6ad099SBrian Foster * about reference counts because the only active reference counts on the buffer 354cb6ad099SBrian Foster * may be the failed log items. Hence if we clear the log item failed state 355cb6ad099SBrian Foster * before queuing the buffer for IO we can release all active references to 356cb6ad099SBrian Foster * the buffer and free it, leading to use after free problems in 357cb6ad099SBrian Foster * xfs_buf_delwri_queue. It makes no difference to the buffer or log items which 358cb6ad099SBrian Foster * order we process them in - the buffer is locked, and we own the buffer list 359cb6ad099SBrian Foster * so nothing on them is going to change while we are performing this action. 360cb6ad099SBrian Foster * 361cb6ad099SBrian Foster * Hence we can safely queue the buffer for IO before we clear the failed log 362cb6ad099SBrian Foster * item state, therefore always having an active reference to the buffer and 363cb6ad099SBrian Foster * avoiding the transient zero-reference state that leads to use-after-free. 364cb6ad099SBrian Foster */ 365cb6ad099SBrian Foster static inline int 366cb6ad099SBrian Foster xfsaild_resubmit_item( 367cb6ad099SBrian Foster struct xfs_log_item *lip, 368cb6ad099SBrian Foster struct list_head *buffer_list) 369cb6ad099SBrian Foster { 370cb6ad099SBrian Foster struct xfs_buf *bp = lip->li_buf; 371cb6ad099SBrian Foster 372cb6ad099SBrian Foster if (!xfs_buf_trylock(bp)) 373cb6ad099SBrian Foster return XFS_ITEM_LOCKED; 374cb6ad099SBrian Foster 375cb6ad099SBrian Foster if (!xfs_buf_delwri_queue(bp, buffer_list)) { 376cb6ad099SBrian Foster xfs_buf_unlock(bp); 377cb6ad099SBrian Foster return XFS_ITEM_FLUSHING; 378cb6ad099SBrian Foster } 379cb6ad099SBrian Foster 380cb6ad099SBrian Foster /* protected by ail_lock */ 381298f7becSDave Chinner list_for_each_entry(lip, &bp->b_li_list, li_bio_list) { 382298f7becSDave Chinner if (bp->b_flags & _XBF_INODES) 383298f7becSDave Chinner clear_bit(XFS_LI_FAILED, &lip->li_flags); 384298f7becSDave Chinner else 385cb6ad099SBrian Foster xfs_clear_li_failed(lip); 386298f7becSDave Chinner } 387cb6ad099SBrian Foster 388cb6ad099SBrian Foster xfs_buf_unlock(bp); 389cb6ad099SBrian Foster return XFS_ITEM_SUCCESS; 390cb6ad099SBrian Foster } 391cb6ad099SBrian Foster 3927f4d01f3SBrian Foster static inline uint 3937f4d01f3SBrian Foster xfsaild_push_item( 3947f4d01f3SBrian Foster struct xfs_ail *ailp, 3957f4d01f3SBrian Foster struct xfs_log_item *lip) 3967f4d01f3SBrian Foster { 3977f4d01f3SBrian Foster /* 3987f4d01f3SBrian Foster * If log item pinning is enabled, skip the push and track the item as 3997f4d01f3SBrian Foster * pinned. This can help induce head-behind-tail conditions. 4007f4d01f3SBrian Foster */ 40157e80956SMatthew Wilcox if (XFS_TEST_ERROR(false, ailp->ail_mount, XFS_ERRTAG_LOG_ITEM_PIN)) 4027f4d01f3SBrian Foster return XFS_ITEM_PINNED; 4037f4d01f3SBrian Foster 404e8b78db7SChristoph Hellwig /* 405e8b78db7SChristoph Hellwig * Consider the item pinned if a push callback is not defined so the 406e8b78db7SChristoph Hellwig * caller will force the log. This should only happen for intent items 407e8b78db7SChristoph Hellwig * as they are unpinned once the associated done item is committed to 408e8b78db7SChristoph Hellwig * the on-disk log. 409e8b78db7SChristoph Hellwig */ 410e8b78db7SChristoph Hellwig if (!lip->li_ops->iop_push) 411e8b78db7SChristoph Hellwig return XFS_ITEM_PINNED; 412cb6ad099SBrian Foster if (test_bit(XFS_LI_FAILED, &lip->li_flags)) 413cb6ad099SBrian Foster return xfsaild_resubmit_item(lip, &ailp->ail_buf_list); 41457e80956SMatthew Wilcox return lip->li_ops->iop_push(lip, &ailp->ail_buf_list); 4157f4d01f3SBrian Foster } 4167f4d01f3SBrian Foster 4170030807cSChristoph Hellwig static long 4180030807cSChristoph Hellwig xfsaild_push( 4190030807cSChristoph Hellwig struct xfs_ail *ailp) 420249a8c11SDavid Chinner { 42157e80956SMatthew Wilcox xfs_mount_t *mp = ailp->ail_mount; 422af3e4022SDave Chinner struct xfs_ail_cursor cur; 423efe2330fSChristoph Hellwig struct xfs_log_item *lip; 4249e7004e7SDave Chinner xfs_lsn_t lsn; 425fe0da767SDave Chinner xfs_lsn_t target; 42643ff2122SChristoph Hellwig long tout; 4279e7004e7SDave Chinner int stuck = 0; 42843ff2122SChristoph Hellwig int flushing = 0; 4299e7004e7SDave Chinner int count = 0; 4301da177e4SLinus Torvalds 431670ce93fSDave Chinner /* 43243ff2122SChristoph Hellwig * If we encountered pinned items or did not finish writing out all 433*0020a190SDave Chinner * buffers the last time we ran, force a background CIL push to get the 434*0020a190SDave Chinner * items unpinned in the near future. We do not wait on the CIL push as 435*0020a190SDave Chinner * that could stall us for seconds if there is enough background IO 436*0020a190SDave Chinner * load. Stalling for that long when the tail of the log is pinned and 437*0020a190SDave Chinner * needs flushing will hard stop the transaction subsystem when log 438*0020a190SDave Chinner * space runs out. 439670ce93fSDave Chinner */ 44057e80956SMatthew Wilcox if (ailp->ail_log_flush && ailp->ail_last_pushed_lsn == 0 && 44157e80956SMatthew Wilcox (!list_empty_careful(&ailp->ail_buf_list) || 44243ff2122SChristoph Hellwig xfs_ail_min_lsn(ailp))) { 44357e80956SMatthew Wilcox ailp->ail_log_flush = 0; 44443ff2122SChristoph Hellwig 445ff6d6af2SBill O'Donnell XFS_STATS_INC(mp, xs_push_ail_flush); 446*0020a190SDave Chinner xlog_cil_flush(mp->m_log); 447670ce93fSDave Chinner } 448670ce93fSDave Chinner 44957e80956SMatthew Wilcox spin_lock(&ailp->ail_lock); 4508375f922SBrian Foster 45157e80956SMatthew Wilcox /* barrier matches the ail_target update in xfs_ail_push() */ 4528375f922SBrian Foster smp_rmb(); 45357e80956SMatthew Wilcox target = ailp->ail_target; 45457e80956SMatthew Wilcox ailp->ail_target_prev = target; 4558375f922SBrian Foster 456f376b45eSBrian Foster /* we're done if the AIL is empty or our push has reached the end */ 45757e80956SMatthew Wilcox lip = xfs_trans_ail_cursor_first(ailp, &cur, ailp->ail_last_pushed_lsn); 458f376b45eSBrian Foster if (!lip) 4599e7004e7SDave Chinner goto out_done; 4601da177e4SLinus Torvalds 461ff6d6af2SBill O'Donnell XFS_STATS_INC(mp, xs_push_ail); 4621da177e4SLinus Torvalds 463249a8c11SDavid Chinner lsn = lip->li_lsn; 46450e86686SDave Chinner while ((XFS_LSN_CMP(lip->li_lsn, target) <= 0)) { 465249a8c11SDavid Chinner int lock_result; 46643ff2122SChristoph Hellwig 467249a8c11SDavid Chinner /* 468904c17e6SDave Chinner * Note that iop_push may unlock and reacquire the AIL lock. We 46943ff2122SChristoph Hellwig * rely on the AIL cursor implementation to be able to deal with 47043ff2122SChristoph Hellwig * the dropped lock. 4711da177e4SLinus Torvalds */ 4727f4d01f3SBrian Foster lock_result = xfsaild_push_item(ailp, lip); 4731da177e4SLinus Torvalds switch (lock_result) { 4741da177e4SLinus Torvalds case XFS_ITEM_SUCCESS: 475ff6d6af2SBill O'Donnell XFS_STATS_INC(mp, xs_push_ail_success); 4769e4c109aSChristoph Hellwig trace_xfs_ail_push(lip); 4779e4c109aSChristoph Hellwig 47857e80956SMatthew Wilcox ailp->ail_last_pushed_lsn = lsn; 4791da177e4SLinus Torvalds break; 4801da177e4SLinus Torvalds 48143ff2122SChristoph Hellwig case XFS_ITEM_FLUSHING: 48243ff2122SChristoph Hellwig /* 483cf085a1bSJoe Perches * The item or its backing buffer is already being 48443ff2122SChristoph Hellwig * flushed. The typical reason for that is that an 48543ff2122SChristoph Hellwig * inode buffer is locked because we already pushed the 48643ff2122SChristoph Hellwig * updates to it as part of inode clustering. 48743ff2122SChristoph Hellwig * 488b63da6c8SRandy Dunlap * We do not want to stop flushing just because lots 489cf085a1bSJoe Perches * of items are already being flushed, but we need to 49043ff2122SChristoph Hellwig * re-try the flushing relatively soon if most of the 491cf085a1bSJoe Perches * AIL is being flushed. 49243ff2122SChristoph Hellwig */ 493ff6d6af2SBill O'Donnell XFS_STATS_INC(mp, xs_push_ail_flushing); 49443ff2122SChristoph Hellwig trace_xfs_ail_flushing(lip); 49517b38471SChristoph Hellwig 49643ff2122SChristoph Hellwig flushing++; 49757e80956SMatthew Wilcox ailp->ail_last_pushed_lsn = lsn; 4981da177e4SLinus Torvalds break; 4991da177e4SLinus Torvalds 5001da177e4SLinus Torvalds case XFS_ITEM_PINNED: 501ff6d6af2SBill O'Donnell XFS_STATS_INC(mp, xs_push_ail_pinned); 5029e4c109aSChristoph Hellwig trace_xfs_ail_pinned(lip); 5039e4c109aSChristoph Hellwig 504249a8c11SDavid Chinner stuck++; 50557e80956SMatthew Wilcox ailp->ail_log_flush++; 5061da177e4SLinus Torvalds break; 5071da177e4SLinus Torvalds case XFS_ITEM_LOCKED: 508ff6d6af2SBill O'Donnell XFS_STATS_INC(mp, xs_push_ail_locked); 5099e4c109aSChristoph Hellwig trace_xfs_ail_locked(lip); 51043ff2122SChristoph Hellwig 511249a8c11SDavid Chinner stuck++; 5121da177e4SLinus Torvalds break; 5131da177e4SLinus Torvalds default: 5141da177e4SLinus Torvalds ASSERT(0); 5151da177e4SLinus Torvalds break; 5161da177e4SLinus Torvalds } 5171da177e4SLinus Torvalds 518249a8c11SDavid Chinner count++; 519249a8c11SDavid Chinner 520249a8c11SDavid Chinner /* 521249a8c11SDavid Chinner * Are there too many items we can't do anything with? 52243ff2122SChristoph Hellwig * 523b63da6c8SRandy Dunlap * If we are skipping too many items because we can't flush 524249a8c11SDavid Chinner * them or they are already being flushed, we back off and 525249a8c11SDavid Chinner * given them time to complete whatever operation is being 526249a8c11SDavid Chinner * done. i.e. remove pressure from the AIL while we can't make 527249a8c11SDavid Chinner * progress so traversals don't slow down further inserts and 528249a8c11SDavid Chinner * removals to/from the AIL. 529249a8c11SDavid Chinner * 530249a8c11SDavid Chinner * The value of 100 is an arbitrary magic number based on 531249a8c11SDavid Chinner * observation. 532249a8c11SDavid Chinner */ 533249a8c11SDavid Chinner if (stuck > 100) 534249a8c11SDavid Chinner break; 535249a8c11SDavid Chinner 536af3e4022SDave Chinner lip = xfs_trans_ail_cursor_next(ailp, &cur); 537249a8c11SDavid Chinner if (lip == NULL) 538249a8c11SDavid Chinner break; 539249a8c11SDavid Chinner lsn = lip->li_lsn; 5401da177e4SLinus Torvalds } 541f376b45eSBrian Foster 542f376b45eSBrian Foster out_done: 543e4a1e29cSEric Sandeen xfs_trans_ail_cursor_done(&cur); 54457e80956SMatthew Wilcox spin_unlock(&ailp->ail_lock); 5451da177e4SLinus Torvalds 54657e80956SMatthew Wilcox if (xfs_buf_delwri_submit_nowait(&ailp->ail_buf_list)) 54757e80956SMatthew Wilcox ailp->ail_log_flush++; 548d808f617SDave Chinner 54943ff2122SChristoph Hellwig if (!count || XFS_LSN_CMP(lsn, target) >= 0) { 550249a8c11SDavid Chinner /* 55143ff2122SChristoph Hellwig * We reached the target or the AIL is empty, so wait a bit 55243ff2122SChristoph Hellwig * longer for I/O to complete and remove pushed items from the 55343ff2122SChristoph Hellwig * AIL before we start the next scan from the start of the AIL. 554249a8c11SDavid Chinner */ 555453eac8aSDave Chinner tout = 50; 55657e80956SMatthew Wilcox ailp->ail_last_pushed_lsn = 0; 55743ff2122SChristoph Hellwig } else if (((stuck + flushing) * 100) / count > 90) { 558249a8c11SDavid Chinner /* 55943ff2122SChristoph Hellwig * Either there is a lot of contention on the AIL or we are 56043ff2122SChristoph Hellwig * stuck due to operations in progress. "Stuck" in this case 56143ff2122SChristoph Hellwig * is defined as >90% of the items we tried to push were stuck. 562249a8c11SDavid Chinner * 563249a8c11SDavid Chinner * Backoff a bit more to allow some I/O to complete before 56443ff2122SChristoph Hellwig * restarting from the start of the AIL. This prevents us from 56543ff2122SChristoph Hellwig * spinning on the same items, and if they are pinned will all 56643ff2122SChristoph Hellwig * the restart to issue a log force to unpin the stuck items. 567249a8c11SDavid Chinner */ 568453eac8aSDave Chinner tout = 20; 56957e80956SMatthew Wilcox ailp->ail_last_pushed_lsn = 0; 57043ff2122SChristoph Hellwig } else { 57143ff2122SChristoph Hellwig /* 57243ff2122SChristoph Hellwig * Assume we have more work to do in a short while. 57343ff2122SChristoph Hellwig */ 57443ff2122SChristoph Hellwig tout = 10; 575453eac8aSDave Chinner } 5761da177e4SLinus Torvalds 5770030807cSChristoph Hellwig return tout; 5780030807cSChristoph Hellwig } 5790030807cSChristoph Hellwig 5800030807cSChristoph Hellwig static int 5810030807cSChristoph Hellwig xfsaild( 5820030807cSChristoph Hellwig void *data) 5830030807cSChristoph Hellwig { 5840030807cSChristoph Hellwig struct xfs_ail *ailp = data; 5850030807cSChristoph Hellwig long tout = 0; /* milliseconds */ 58610a98cb1SEric Biggers unsigned int noreclaim_flag; 5870030807cSChristoph Hellwig 58810a98cb1SEric Biggers noreclaim_flag = memalloc_noreclaim_save(); 58918f1df4eSMichal Hocko set_freezable(); 59043ff2122SChristoph Hellwig 5910bd89676SHou Tao while (1) { 5920030807cSChristoph Hellwig if (tout && tout <= 20) 5930bd89676SHou Tao set_current_state(TASK_KILLABLE); 5940030807cSChristoph Hellwig else 5950bd89676SHou Tao set_current_state(TASK_INTERRUPTIBLE); 5960bd89676SHou Tao 5970bd89676SHou Tao /* 598efc3289cSBrian Foster * Check kthread_should_stop() after we set the task state to 599efc3289cSBrian Foster * guarantee that we either see the stop bit and exit or the 600efc3289cSBrian Foster * task state is reset to runnable such that it's not scheduled 601efc3289cSBrian Foster * out indefinitely and detects the stop bit at next iteration. 6020bd89676SHou Tao * A memory barrier is included in above task state set to 6030bd89676SHou Tao * serialize again kthread_stop(). 6040bd89676SHou Tao */ 6050bd89676SHou Tao if (kthread_should_stop()) { 6060bd89676SHou Tao __set_current_state(TASK_RUNNING); 607efc3289cSBrian Foster 608efc3289cSBrian Foster /* 609efc3289cSBrian Foster * The caller forces out the AIL before stopping the 610efc3289cSBrian Foster * thread in the common case, which means the delwri 611efc3289cSBrian Foster * queue is drained. In the shutdown case, the queue may 612efc3289cSBrian Foster * still hold relogged buffers that haven't been 613efc3289cSBrian Foster * submitted because they were pinned since added to the 614efc3289cSBrian Foster * queue. 615efc3289cSBrian Foster * 616efc3289cSBrian Foster * Log I/O error processing stales the underlying buffer 617efc3289cSBrian Foster * and clears the delwri state, expecting the buf to be 618efc3289cSBrian Foster * removed on the next submission attempt. That won't 619efc3289cSBrian Foster * happen if we're shutting down, so this is the last 620efc3289cSBrian Foster * opportunity to release such buffers from the queue. 621efc3289cSBrian Foster */ 622efc3289cSBrian Foster ASSERT(list_empty(&ailp->ail_buf_list) || 623efc3289cSBrian Foster XFS_FORCED_SHUTDOWN(ailp->ail_mount)); 624efc3289cSBrian Foster xfs_buf_delwri_cancel(&ailp->ail_buf_list); 6250bd89676SHou Tao break; 6260bd89676SHou Tao } 6278375f922SBrian Foster 62857e80956SMatthew Wilcox spin_lock(&ailp->ail_lock); 6298375f922SBrian Foster 6308375f922SBrian Foster /* 6318375f922SBrian Foster * Idle if the AIL is empty and we are not racing with a target 6328375f922SBrian Foster * update. We check the AIL after we set the task to a sleep 63357e80956SMatthew Wilcox * state to guarantee that we either catch an ail_target update 6348375f922SBrian Foster * or that a wake_up resets the state to TASK_RUNNING. 6358375f922SBrian Foster * Otherwise, we run the risk of sleeping indefinitely. 6368375f922SBrian Foster * 63757e80956SMatthew Wilcox * The barrier matches the ail_target update in xfs_ail_push(). 6388375f922SBrian Foster */ 6398375f922SBrian Foster smp_rmb(); 6408375f922SBrian Foster if (!xfs_ail_min(ailp) && 641f376b45eSBrian Foster ailp->ail_target == ailp->ail_target_prev && 642f376b45eSBrian Foster list_empty(&ailp->ail_buf_list)) { 64357e80956SMatthew Wilcox spin_unlock(&ailp->ail_lock); 64418f1df4eSMichal Hocko freezable_schedule(); 6458375f922SBrian Foster tout = 0; 6468375f922SBrian Foster continue; 6478375f922SBrian Foster } 64857e80956SMatthew Wilcox spin_unlock(&ailp->ail_lock); 6498375f922SBrian Foster 6508375f922SBrian Foster if (tout) 65118f1df4eSMichal Hocko freezable_schedule_timeout(msecs_to_jiffies(tout)); 6528375f922SBrian Foster 6538375f922SBrian Foster __set_current_state(TASK_RUNNING); 6540030807cSChristoph Hellwig 6550030807cSChristoph Hellwig try_to_freeze(); 6560030807cSChristoph Hellwig 6570030807cSChristoph Hellwig tout = xfsaild_push(ailp); 6580030807cSChristoph Hellwig } 6590030807cSChristoph Hellwig 66010a98cb1SEric Biggers memalloc_noreclaim_restore(noreclaim_flag); 6610030807cSChristoph Hellwig return 0; 6620bf6a5bdSDave Chinner } 6630bf6a5bdSDave Chinner 6640bf6a5bdSDave Chinner /* 6650bf6a5bdSDave Chinner * This routine is called to move the tail of the AIL forward. It does this by 6660bf6a5bdSDave Chinner * trying to flush items in the AIL whose lsns are below the given 6670bf6a5bdSDave Chinner * threshold_lsn. 6680bf6a5bdSDave Chinner * 6690bf6a5bdSDave Chinner * The push is run asynchronously in a workqueue, which means the caller needs 6700bf6a5bdSDave Chinner * to handle waiting on the async flush for space to become available. 6710bf6a5bdSDave Chinner * We don't want to interrupt any push that is in progress, hence we only queue 672cf085a1bSJoe Perches * work if we set the pushing bit appropriately. 6730bf6a5bdSDave Chinner * 6740bf6a5bdSDave Chinner * We do this unlocked - we only need to know whether there is anything in the 6750bf6a5bdSDave Chinner * AIL at the time we are called. We don't need to access the contents of 6760bf6a5bdSDave Chinner * any of the objects, so the lock is not needed. 6770bf6a5bdSDave Chinner */ 6780bf6a5bdSDave Chinner void 679fd074841SDave Chinner xfs_ail_push( 6800bf6a5bdSDave Chinner struct xfs_ail *ailp, 6810bf6a5bdSDave Chinner xfs_lsn_t threshold_lsn) 6820bf6a5bdSDave Chinner { 683efe2330fSChristoph Hellwig struct xfs_log_item *lip; 6840bf6a5bdSDave Chinner 6850bf6a5bdSDave Chinner lip = xfs_ail_min(ailp); 68657e80956SMatthew Wilcox if (!lip || XFS_FORCED_SHUTDOWN(ailp->ail_mount) || 68757e80956SMatthew Wilcox XFS_LSN_CMP(threshold_lsn, ailp->ail_target) <= 0) 6880bf6a5bdSDave Chinner return; 6890bf6a5bdSDave Chinner 6900bf6a5bdSDave Chinner /* 6910bf6a5bdSDave Chinner * Ensure that the new target is noticed in push code before it clears 6920bf6a5bdSDave Chinner * the XFS_AIL_PUSHING_BIT. 6930bf6a5bdSDave Chinner */ 6940bf6a5bdSDave Chinner smp_wmb(); 69557e80956SMatthew Wilcox xfs_trans_ail_copy_lsn(ailp, &ailp->ail_target, &threshold_lsn); 6960030807cSChristoph Hellwig smp_wmb(); 6970030807cSChristoph Hellwig 69857e80956SMatthew Wilcox wake_up_process(ailp->ail_task); 6990bf6a5bdSDave Chinner } 7001da177e4SLinus Torvalds 7011da177e4SLinus Torvalds /* 702fd074841SDave Chinner * Push out all items in the AIL immediately 703fd074841SDave Chinner */ 704fd074841SDave Chinner void 705fd074841SDave Chinner xfs_ail_push_all( 706fd074841SDave Chinner struct xfs_ail *ailp) 707fd074841SDave Chinner { 708fd074841SDave Chinner xfs_lsn_t threshold_lsn = xfs_ail_max_lsn(ailp); 709fd074841SDave Chinner 710fd074841SDave Chinner if (threshold_lsn) 711fd074841SDave Chinner xfs_ail_push(ailp, threshold_lsn); 712fd074841SDave Chinner } 713fd074841SDave Chinner 714fd074841SDave Chinner /* 715211e4d43SChristoph Hellwig * Push out all items in the AIL immediately and wait until the AIL is empty. 716211e4d43SChristoph Hellwig */ 717211e4d43SChristoph Hellwig void 718211e4d43SChristoph Hellwig xfs_ail_push_all_sync( 719211e4d43SChristoph Hellwig struct xfs_ail *ailp) 720211e4d43SChristoph Hellwig { 721211e4d43SChristoph Hellwig struct xfs_log_item *lip; 722211e4d43SChristoph Hellwig DEFINE_WAIT(wait); 723211e4d43SChristoph Hellwig 72457e80956SMatthew Wilcox spin_lock(&ailp->ail_lock); 725211e4d43SChristoph Hellwig while ((lip = xfs_ail_max(ailp)) != NULL) { 72657e80956SMatthew Wilcox prepare_to_wait(&ailp->ail_empty, &wait, TASK_UNINTERRUPTIBLE); 72757e80956SMatthew Wilcox ailp->ail_target = lip->li_lsn; 72857e80956SMatthew Wilcox wake_up_process(ailp->ail_task); 72957e80956SMatthew Wilcox spin_unlock(&ailp->ail_lock); 730211e4d43SChristoph Hellwig schedule(); 73157e80956SMatthew Wilcox spin_lock(&ailp->ail_lock); 732211e4d43SChristoph Hellwig } 73357e80956SMatthew Wilcox spin_unlock(&ailp->ail_lock); 734211e4d43SChristoph Hellwig 73557e80956SMatthew Wilcox finish_wait(&ailp->ail_empty, &wait); 736211e4d43SChristoph Hellwig } 737211e4d43SChristoph Hellwig 7384165994aSDave Chinner void 7394165994aSDave Chinner xfs_ail_update_finish( 7404165994aSDave Chinner struct xfs_ail *ailp, 7418eb807bdSDave Chinner xfs_lsn_t old_lsn) __releases(ailp->ail_lock) 7424165994aSDave Chinner { 7434165994aSDave Chinner struct xfs_mount *mp = ailp->ail_mount; 7444165994aSDave Chinner 7458eb807bdSDave Chinner /* if the tail lsn hasn't changed, don't do updates or wakeups. */ 7468eb807bdSDave Chinner if (!old_lsn || old_lsn == __xfs_ail_min_lsn(ailp)) { 7474165994aSDave Chinner spin_unlock(&ailp->ail_lock); 7484165994aSDave Chinner return; 7494165994aSDave Chinner } 7504165994aSDave Chinner 7514165994aSDave Chinner if (!XFS_FORCED_SHUTDOWN(mp)) 7524165994aSDave Chinner xlog_assign_tail_lsn_locked(mp); 7534165994aSDave Chinner 7544165994aSDave Chinner if (list_empty(&ailp->ail_head)) 7554165994aSDave Chinner wake_up_all(&ailp->ail_empty); 7564165994aSDave Chinner spin_unlock(&ailp->ail_lock); 7574165994aSDave Chinner xfs_log_space_wake(mp); 7584165994aSDave Chinner } 7594165994aSDave Chinner 760211e4d43SChristoph Hellwig /* 7610e57f6a3SDave Chinner * xfs_trans_ail_update - bulk AIL insertion operation. 7620e57f6a3SDave Chinner * 7630e57f6a3SDave Chinner * @xfs_trans_ail_update takes an array of log items that all need to be 7640e57f6a3SDave Chinner * positioned at the same LSN in the AIL. If an item is not in the AIL, it will 7650e57f6a3SDave Chinner * be added. Otherwise, it will be repositioned by removing it and re-adding 7660e57f6a3SDave Chinner * it to the AIL. If we move the first item in the AIL, update the log tail to 7670e57f6a3SDave Chinner * match the new minimum LSN in the AIL. 7680e57f6a3SDave Chinner * 7690e57f6a3SDave Chinner * This function takes the AIL lock once to execute the update operations on 7700e57f6a3SDave Chinner * all the items in the array, and as such should not be called with the AIL 7710e57f6a3SDave Chinner * lock held. As a result, once we have the AIL lock, we need to check each log 7720e57f6a3SDave Chinner * item LSN to confirm it needs to be moved forward in the AIL. 7730e57f6a3SDave Chinner * 7740e57f6a3SDave Chinner * To optimise the insert operation, we delete all the items from the AIL in 7750e57f6a3SDave Chinner * the first pass, moving them into a temporary list, then splice the temporary 7760e57f6a3SDave Chinner * list into the correct position in the AIL. This avoids needing to do an 7770e57f6a3SDave Chinner * insert operation on every item. 7780e57f6a3SDave Chinner * 7790e57f6a3SDave Chinner * This function must be called with the AIL lock held. The lock is dropped 7800e57f6a3SDave Chinner * before returning. 7810e57f6a3SDave Chinner */ 7820e57f6a3SDave Chinner void 7830e57f6a3SDave Chinner xfs_trans_ail_update_bulk( 7840e57f6a3SDave Chinner struct xfs_ail *ailp, 7851d8c95a3SDave Chinner struct xfs_ail_cursor *cur, 7860e57f6a3SDave Chinner struct xfs_log_item **log_items, 7870e57f6a3SDave Chinner int nr_items, 78857e80956SMatthew Wilcox xfs_lsn_t lsn) __releases(ailp->ail_lock) 7890e57f6a3SDave Chinner { 790efe2330fSChristoph Hellwig struct xfs_log_item *mlip; 7918eb807bdSDave Chinner xfs_lsn_t tail_lsn = 0; 7920e57f6a3SDave Chinner int i; 7930e57f6a3SDave Chinner LIST_HEAD(tmp); 7940e57f6a3SDave Chinner 795e44f4112SAlex Elder ASSERT(nr_items > 0); /* Not required, but true. */ 7960e57f6a3SDave Chinner mlip = xfs_ail_min(ailp); 7970e57f6a3SDave Chinner 7980e57f6a3SDave Chinner for (i = 0; i < nr_items; i++) { 7990e57f6a3SDave Chinner struct xfs_log_item *lip = log_items[i]; 80022525c17SDave Chinner if (test_and_set_bit(XFS_LI_IN_AIL, &lip->li_flags)) { 8010e57f6a3SDave Chinner /* check if we really need to move the item */ 8020e57f6a3SDave Chinner if (XFS_LSN_CMP(lsn, lip->li_lsn) <= 0) 8030e57f6a3SDave Chinner continue; 8040e57f6a3SDave Chinner 805750b9c90SDave Chinner trace_xfs_ail_move(lip, lip->li_lsn, lsn); 8068eb807bdSDave Chinner if (mlip == lip && !tail_lsn) 8078eb807bdSDave Chinner tail_lsn = lip->li_lsn; 8088eb807bdSDave Chinner 8090e57f6a3SDave Chinner xfs_ail_delete(ailp, lip); 8100e57f6a3SDave Chinner } else { 811750b9c90SDave Chinner trace_xfs_ail_insert(lip, 0, lsn); 8120e57f6a3SDave Chinner } 8130e57f6a3SDave Chinner lip->li_lsn = lsn; 8140e57f6a3SDave Chinner list_add(&lip->li_ail, &tmp); 8150e57f6a3SDave Chinner } 8160e57f6a3SDave Chinner 817e44f4112SAlex Elder if (!list_empty(&tmp)) 8181d8c95a3SDave Chinner xfs_ail_splice(ailp, cur, &tmp, lsn); 8191c304625SChristoph Hellwig 8208eb807bdSDave Chinner xfs_ail_update_finish(ailp, tail_lsn); 8210e57f6a3SDave Chinner } 8220e57f6a3SDave Chinner 82386a37174SDarrick J. Wong /* Insert a log item into the AIL. */ 82486a37174SDarrick J. Wong void 82586a37174SDarrick J. Wong xfs_trans_ail_insert( 82686a37174SDarrick J. Wong struct xfs_ail *ailp, 82786a37174SDarrick J. Wong struct xfs_log_item *lip, 82886a37174SDarrick J. Wong xfs_lsn_t lsn) 82986a37174SDarrick J. Wong { 83086a37174SDarrick J. Wong spin_lock(&ailp->ail_lock); 83186a37174SDarrick J. Wong xfs_trans_ail_update_bulk(ailp, NULL, &lip, 1, lsn); 83286a37174SDarrick J. Wong } 83386a37174SDarrick J. Wong 8348eb807bdSDave Chinner /* 8358eb807bdSDave Chinner * Delete one log item from the AIL. 8368eb807bdSDave Chinner * 8378eb807bdSDave Chinner * If this item was at the tail of the AIL, return the LSN of the log item so 8388eb807bdSDave Chinner * that we can use it to check if the LSN of the tail of the log has moved 8398eb807bdSDave Chinner * when finishing up the AIL delete process in xfs_ail_update_finish(). 8408eb807bdSDave Chinner */ 8418eb807bdSDave Chinner xfs_lsn_t 84227af1bbfSChristoph Hellwig xfs_ail_delete_one( 84327af1bbfSChristoph Hellwig struct xfs_ail *ailp, 84427af1bbfSChristoph Hellwig struct xfs_log_item *lip) 84527af1bbfSChristoph Hellwig { 84627af1bbfSChristoph Hellwig struct xfs_log_item *mlip = xfs_ail_min(ailp); 8478eb807bdSDave Chinner xfs_lsn_t lsn = lip->li_lsn; 84827af1bbfSChristoph Hellwig 84927af1bbfSChristoph Hellwig trace_xfs_ail_delete(lip, mlip->li_lsn, lip->li_lsn); 85027af1bbfSChristoph Hellwig xfs_ail_delete(ailp, lip); 85122525c17SDave Chinner clear_bit(XFS_LI_IN_AIL, &lip->li_flags); 85227af1bbfSChristoph Hellwig lip->li_lsn = 0; 85327af1bbfSChristoph Hellwig 8548eb807bdSDave Chinner if (mlip == lip) 8558eb807bdSDave Chinner return lsn; 8568eb807bdSDave Chinner return 0; 85727af1bbfSChristoph Hellwig } 85827af1bbfSChristoph Hellwig 85930136832SDave Chinner void 86027af1bbfSChristoph Hellwig xfs_trans_ail_delete( 86127af1bbfSChristoph Hellwig struct xfs_log_item *lip, 8624165994aSDave Chinner int shutdown_type) 86330136832SDave Chinner { 864849274c1SBrian Foster struct xfs_ail *ailp = lip->li_ailp; 86557e80956SMatthew Wilcox struct xfs_mount *mp = ailp->ail_mount; 8668eb807bdSDave Chinner xfs_lsn_t tail_lsn; 86730136832SDave Chinner 868849274c1SBrian Foster spin_lock(&ailp->ail_lock); 86922525c17SDave Chinner if (!test_bit(XFS_LI_IN_AIL, &lip->li_flags)) { 87057e80956SMatthew Wilcox spin_unlock(&ailp->ail_lock); 8712b3cf093SBrian Foster if (shutdown_type && !XFS_FORCED_SHUTDOWN(mp)) { 8726a19d939SDave Chinner xfs_alert_tag(mp, XFS_PTAG_AILDELETE, 87330136832SDave Chinner "%s: attempting to delete a log item that is not in the AIL", 87430136832SDave Chinner __func__); 87504913fddSDave Chinner xfs_force_shutdown(mp, shutdown_type); 87630136832SDave Chinner } 87730136832SDave Chinner return; 87830136832SDave Chinner } 87930136832SDave Chinner 8802b3cf093SBrian Foster /* xfs_ail_update_finish() drops the AIL lock */ 881e98084b8SDave Chinner xfs_clear_li_failed(lip); 8828eb807bdSDave Chinner tail_lsn = xfs_ail_delete_one(ailp, lip); 8838eb807bdSDave Chinner xfs_ail_update_finish(ailp, tail_lsn); 88430136832SDave Chinner } 8851da177e4SLinus Torvalds 886249a8c11SDavid Chinner int 8871da177e4SLinus Torvalds xfs_trans_ail_init( 8881da177e4SLinus Torvalds xfs_mount_t *mp) 8891da177e4SLinus Torvalds { 89082fa9012SDavid Chinner struct xfs_ail *ailp; 89182fa9012SDavid Chinner 89282fa9012SDavid Chinner ailp = kmem_zalloc(sizeof(struct xfs_ail), KM_MAYFAIL); 89382fa9012SDavid Chinner if (!ailp) 8942451337dSDave Chinner return -ENOMEM; 89582fa9012SDavid Chinner 89657e80956SMatthew Wilcox ailp->ail_mount = mp; 89757e80956SMatthew Wilcox INIT_LIST_HEAD(&ailp->ail_head); 89857e80956SMatthew Wilcox INIT_LIST_HEAD(&ailp->ail_cursors); 89957e80956SMatthew Wilcox spin_lock_init(&ailp->ail_lock); 90057e80956SMatthew Wilcox INIT_LIST_HEAD(&ailp->ail_buf_list); 90157e80956SMatthew Wilcox init_waitqueue_head(&ailp->ail_empty); 9020030807cSChristoph Hellwig 90357e80956SMatthew Wilcox ailp->ail_task = kthread_run(xfsaild, ailp, "xfsaild/%s", 904e1d3d218SIan Kent ailp->ail_mount->m_super->s_id); 90557e80956SMatthew Wilcox if (IS_ERR(ailp->ail_task)) 9060030807cSChristoph Hellwig goto out_free_ailp; 9070030807cSChristoph Hellwig 90827d8d5feSDavid Chinner mp->m_ail = ailp; 90927d8d5feSDavid Chinner return 0; 9100030807cSChristoph Hellwig 9110030807cSChristoph Hellwig out_free_ailp: 9120030807cSChristoph Hellwig kmem_free(ailp); 9132451337dSDave Chinner return -ENOMEM; 914249a8c11SDavid Chinner } 915249a8c11SDavid Chinner 916249a8c11SDavid Chinner void 917249a8c11SDavid Chinner xfs_trans_ail_destroy( 918249a8c11SDavid Chinner xfs_mount_t *mp) 919249a8c11SDavid Chinner { 92082fa9012SDavid Chinner struct xfs_ail *ailp = mp->m_ail; 92182fa9012SDavid Chinner 92257e80956SMatthew Wilcox kthread_stop(ailp->ail_task); 92382fa9012SDavid Chinner kmem_free(ailp); 9241da177e4SLinus Torvalds } 925