10b61f8a4SDave Chinner // SPDX-License-Identifier: GPL-2.0+ 2bdf28630SDarrick J. Wong /* 3bdf28630SDarrick J. Wong * Copyright (C) 2016 Oracle. All Rights Reserved. 4bdf28630SDarrick J. Wong * Author: Darrick J. Wong <darrick.wong@oracle.com> 5bdf28630SDarrick J. Wong */ 6bdf28630SDarrick J. Wong #include "xfs.h" 7bdf28630SDarrick J. Wong #include "xfs_fs.h" 8bdf28630SDarrick J. Wong #include "xfs_shared.h" 9bdf28630SDarrick J. Wong #include "xfs_format.h" 10bdf28630SDarrick J. Wong #include "xfs_log_format.h" 11bdf28630SDarrick J. Wong #include "xfs_trans_resv.h" 12bdf28630SDarrick J. Wong #include "xfs_mount.h" 13bdf28630SDarrick J. Wong #include "xfs_defer.h" 14bdf28630SDarrick J. Wong #include "xfs_btree.h" 15bdf28630SDarrick J. Wong #include "xfs_bmap.h" 16bdf28630SDarrick J. Wong #include "xfs_refcount_btree.h" 17bdf28630SDarrick J. Wong #include "xfs_alloc.h" 18e9e899a2SDarrick J. Wong #include "xfs_errortag.h" 19bdf28630SDarrick J. Wong #include "xfs_error.h" 20bdf28630SDarrick J. Wong #include "xfs_trace.h" 21bdf28630SDarrick J. Wong #include "xfs_trans.h" 22bdf28630SDarrick J. Wong #include "xfs_bit.h" 23bdf28630SDarrick J. Wong #include "xfs_refcount.h" 24174edb0eSDarrick J. Wong #include "xfs_rmap.h" 25a81a0621SDave Chinner #include "xfs_ag.h" 26bdf28630SDarrick J. Wong 2731727258SDarrick J. Wong /* Allowable refcount adjustment amounts. */ 2831727258SDarrick J. Wong enum xfs_refc_adjust_op { 2931727258SDarrick J. Wong XFS_REFCOUNT_ADJUST_INCREASE = 1, 3031727258SDarrick J. Wong XFS_REFCOUNT_ADJUST_DECREASE = -1, 31174edb0eSDarrick J. Wong XFS_REFCOUNT_ADJUST_COW_ALLOC = 0, 32174edb0eSDarrick J. Wong XFS_REFCOUNT_ADJUST_COW_FREE = -1, 3331727258SDarrick J. Wong }; 3431727258SDarrick J. Wong 35174edb0eSDarrick J. Wong STATIC int __xfs_refcount_cow_alloc(struct xfs_btree_cur *rcur, 360f37d178SBrian Foster xfs_agblock_t agbno, xfs_extlen_t aglen); 37174edb0eSDarrick J. Wong STATIC int __xfs_refcount_cow_free(struct xfs_btree_cur *rcur, 380f37d178SBrian Foster xfs_agblock_t agbno, xfs_extlen_t aglen); 39174edb0eSDarrick J. Wong 40bdf28630SDarrick J. Wong /* 41bdf28630SDarrick J. Wong * Look up the first record less than or equal to [bno, len] in the btree 42bdf28630SDarrick J. Wong * given by cur. 43bdf28630SDarrick J. Wong */ 44bdf28630SDarrick J. Wong int 45bdf28630SDarrick J. Wong xfs_refcount_lookup_le( 46bdf28630SDarrick J. Wong struct xfs_btree_cur *cur, 47bdf28630SDarrick J. Wong xfs_agblock_t bno, 48bdf28630SDarrick J. Wong int *stat) 49bdf28630SDarrick J. Wong { 5050f02fe3SDave Chinner trace_xfs_refcount_lookup(cur->bc_mp, cur->bc_ag.pag->pag_agno, bno, 51bdf28630SDarrick J. Wong XFS_LOOKUP_LE); 52bdf28630SDarrick J. Wong cur->bc_rec.rc.rc_startblock = bno; 53bdf28630SDarrick J. Wong cur->bc_rec.rc.rc_blockcount = 0; 54bdf28630SDarrick J. Wong return xfs_btree_lookup(cur, XFS_LOOKUP_LE, stat); 55bdf28630SDarrick J. Wong } 56bdf28630SDarrick J. Wong 57bdf28630SDarrick J. Wong /* 58bdf28630SDarrick J. Wong * Look up the first record greater than or equal to [bno, len] in the btree 59bdf28630SDarrick J. Wong * given by cur. 60bdf28630SDarrick J. Wong */ 61bdf28630SDarrick J. Wong int 62bdf28630SDarrick J. Wong xfs_refcount_lookup_ge( 63bdf28630SDarrick J. Wong struct xfs_btree_cur *cur, 64bdf28630SDarrick J. Wong xfs_agblock_t bno, 65bdf28630SDarrick J. Wong int *stat) 66bdf28630SDarrick J. Wong { 6750f02fe3SDave Chinner trace_xfs_refcount_lookup(cur->bc_mp, cur->bc_ag.pag->pag_agno, bno, 68bdf28630SDarrick J. Wong XFS_LOOKUP_GE); 69bdf28630SDarrick J. Wong cur->bc_rec.rc.rc_startblock = bno; 70bdf28630SDarrick J. Wong cur->bc_rec.rc.rc_blockcount = 0; 71bdf28630SDarrick J. Wong return xfs_btree_lookup(cur, XFS_LOOKUP_GE, stat); 72bdf28630SDarrick J. Wong } 73bdf28630SDarrick J. Wong 7408daa3ccSDarrick J. Wong /* 7508daa3ccSDarrick J. Wong * Look up the first record equal to [bno, len] in the btree 7608daa3ccSDarrick J. Wong * given by cur. 7708daa3ccSDarrick J. Wong */ 7808daa3ccSDarrick J. Wong int 7908daa3ccSDarrick J. Wong xfs_refcount_lookup_eq( 8008daa3ccSDarrick J. Wong struct xfs_btree_cur *cur, 8108daa3ccSDarrick J. Wong xfs_agblock_t bno, 8208daa3ccSDarrick J. Wong int *stat) 8308daa3ccSDarrick J. Wong { 8450f02fe3SDave Chinner trace_xfs_refcount_lookup(cur->bc_mp, cur->bc_ag.pag->pag_agno, bno, 8508daa3ccSDarrick J. Wong XFS_LOOKUP_LE); 8608daa3ccSDarrick J. Wong cur->bc_rec.rc.rc_startblock = bno; 8708daa3ccSDarrick J. Wong cur->bc_rec.rc.rc_blockcount = 0; 8808daa3ccSDarrick J. Wong return xfs_btree_lookup(cur, XFS_LOOKUP_EQ, stat); 8908daa3ccSDarrick J. Wong } 9008daa3ccSDarrick J. Wong 91174edb0eSDarrick J. Wong /* Convert on-disk record to in-core format. */ 927f8f1313SDarrick J. Wong void 93174edb0eSDarrick J. Wong xfs_refcount_btrec_to_irec( 94*159eb69dSDarrick J. Wong const union xfs_btree_rec *rec, 95174edb0eSDarrick J. Wong struct xfs_refcount_irec *irec) 96174edb0eSDarrick J. Wong { 97174edb0eSDarrick J. Wong irec->rc_startblock = be32_to_cpu(rec->refc.rc_startblock); 98174edb0eSDarrick J. Wong irec->rc_blockcount = be32_to_cpu(rec->refc.rc_blockcount); 99174edb0eSDarrick J. Wong irec->rc_refcount = be32_to_cpu(rec->refc.rc_refcount); 100174edb0eSDarrick J. Wong } 101174edb0eSDarrick J. Wong 102bdf28630SDarrick J. Wong /* 103bdf28630SDarrick J. Wong * Get the data from the pointed-to record. 104bdf28630SDarrick J. Wong */ 105bdf28630SDarrick J. Wong int 106bdf28630SDarrick J. Wong xfs_refcount_get_rec( 107bdf28630SDarrick J. Wong struct xfs_btree_cur *cur, 108bdf28630SDarrick J. Wong struct xfs_refcount_irec *irec, 109bdf28630SDarrick J. Wong int *stat) 110bdf28630SDarrick J. Wong { 1119e6c08d4SDave Chinner struct xfs_mount *mp = cur->bc_mp; 11250f02fe3SDave Chinner xfs_agnumber_t agno = cur->bc_ag.pag->pag_agno; 113bdf28630SDarrick J. Wong union xfs_btree_rec *rec; 114bdf28630SDarrick J. Wong int error; 1159e6c08d4SDave Chinner xfs_agblock_t realstart; 116bdf28630SDarrick J. Wong 117bdf28630SDarrick J. Wong error = xfs_btree_get_rec(cur, &rec, stat); 1189e6c08d4SDave Chinner if (error || !*stat) 119bdf28630SDarrick J. Wong return error; 1209e6c08d4SDave Chinner 1219e6c08d4SDave Chinner xfs_refcount_btrec_to_irec(rec, irec); 1229e6c08d4SDave Chinner 12350f02fe3SDave Chinner agno = cur->bc_ag.pag->pag_agno; 1249e6c08d4SDave Chinner if (irec->rc_blockcount == 0 || irec->rc_blockcount > MAXREFCEXTLEN) 1259e6c08d4SDave Chinner goto out_bad_rec; 1269e6c08d4SDave Chinner 1279e6c08d4SDave Chinner /* handle special COW-staging state */ 1289e6c08d4SDave Chinner realstart = irec->rc_startblock; 1299e6c08d4SDave Chinner if (realstart & XFS_REFC_COW_START) { 1309e6c08d4SDave Chinner if (irec->rc_refcount != 1) 1319e6c08d4SDave Chinner goto out_bad_rec; 1329e6c08d4SDave Chinner realstart &= ~XFS_REFC_COW_START; 1339e6c08d4SDave Chinner } else if (irec->rc_refcount < 2) { 1349e6c08d4SDave Chinner goto out_bad_rec; 1359e6c08d4SDave Chinner } 1369e6c08d4SDave Chinner 1379e6c08d4SDave Chinner /* check for valid extent range, including overflow */ 1389e6c08d4SDave Chinner if (!xfs_verify_agbno(mp, agno, realstart)) 1399e6c08d4SDave Chinner goto out_bad_rec; 1409e6c08d4SDave Chinner if (realstart > realstart + irec->rc_blockcount) 1419e6c08d4SDave Chinner goto out_bad_rec; 1429e6c08d4SDave Chinner if (!xfs_verify_agbno(mp, agno, realstart + irec->rc_blockcount - 1)) 1439e6c08d4SDave Chinner goto out_bad_rec; 1449e6c08d4SDave Chinner 1459e6c08d4SDave Chinner if (irec->rc_refcount == 0 || irec->rc_refcount > MAXREFCOUNT) 1469e6c08d4SDave Chinner goto out_bad_rec; 1479e6c08d4SDave Chinner 14850f02fe3SDave Chinner trace_xfs_refcount_get(cur->bc_mp, cur->bc_ag.pag->pag_agno, irec); 1499e6c08d4SDave Chinner return 0; 1509e6c08d4SDave Chinner 1519e6c08d4SDave Chinner out_bad_rec: 1529e6c08d4SDave Chinner xfs_warn(mp, 1539e6c08d4SDave Chinner "Refcount BTree record corruption in AG %d detected!", agno); 1549e6c08d4SDave Chinner xfs_warn(mp, 1559e6c08d4SDave Chinner "Start block 0x%x, block count 0x%x, references 0x%x", 1569e6c08d4SDave Chinner irec->rc_startblock, irec->rc_blockcount, irec->rc_refcount); 1579e6c08d4SDave Chinner return -EFSCORRUPTED; 158bdf28630SDarrick J. Wong } 159bdf28630SDarrick J. Wong 160bdf28630SDarrick J. Wong /* 161bdf28630SDarrick J. Wong * Update the record referred to by cur to the value given 162bdf28630SDarrick J. Wong * by [bno, len, refcount]. 163bdf28630SDarrick J. Wong * This either works (return 0) or gets an EFSCORRUPTED error. 164bdf28630SDarrick J. Wong */ 165bdf28630SDarrick J. Wong STATIC int 166bdf28630SDarrick J. Wong xfs_refcount_update( 167bdf28630SDarrick J. Wong struct xfs_btree_cur *cur, 168bdf28630SDarrick J. Wong struct xfs_refcount_irec *irec) 169bdf28630SDarrick J. Wong { 170bdf28630SDarrick J. Wong union xfs_btree_rec rec; 171bdf28630SDarrick J. Wong int error; 172bdf28630SDarrick J. Wong 17350f02fe3SDave Chinner trace_xfs_refcount_update(cur->bc_mp, cur->bc_ag.pag->pag_agno, irec); 174bdf28630SDarrick J. Wong rec.refc.rc_startblock = cpu_to_be32(irec->rc_startblock); 175bdf28630SDarrick J. Wong rec.refc.rc_blockcount = cpu_to_be32(irec->rc_blockcount); 176bdf28630SDarrick J. Wong rec.refc.rc_refcount = cpu_to_be32(irec->rc_refcount); 177bdf28630SDarrick J. Wong error = xfs_btree_update(cur, &rec); 178bdf28630SDarrick J. Wong if (error) 179bdf28630SDarrick J. Wong trace_xfs_refcount_update_error(cur->bc_mp, 18050f02fe3SDave Chinner cur->bc_ag.pag->pag_agno, error, _RET_IP_); 181bdf28630SDarrick J. Wong return error; 182bdf28630SDarrick J. Wong } 183bdf28630SDarrick J. Wong 184bdf28630SDarrick J. Wong /* 185bdf28630SDarrick J. Wong * Insert the record referred to by cur to the value given 186bdf28630SDarrick J. Wong * by [bno, len, refcount]. 187bdf28630SDarrick J. Wong * This either works (return 0) or gets an EFSCORRUPTED error. 188bdf28630SDarrick J. Wong */ 1897f8f1313SDarrick J. Wong int 190bdf28630SDarrick J. Wong xfs_refcount_insert( 191bdf28630SDarrick J. Wong struct xfs_btree_cur *cur, 192bdf28630SDarrick J. Wong struct xfs_refcount_irec *irec, 193bdf28630SDarrick J. Wong int *i) 194bdf28630SDarrick J. Wong { 195bdf28630SDarrick J. Wong int error; 196bdf28630SDarrick J. Wong 19750f02fe3SDave Chinner trace_xfs_refcount_insert(cur->bc_mp, cur->bc_ag.pag->pag_agno, irec); 198bdf28630SDarrick J. Wong cur->bc_rec.rc.rc_startblock = irec->rc_startblock; 199bdf28630SDarrick J. Wong cur->bc_rec.rc.rc_blockcount = irec->rc_blockcount; 200bdf28630SDarrick J. Wong cur->bc_rec.rc.rc_refcount = irec->rc_refcount; 201bdf28630SDarrick J. Wong error = xfs_btree_insert(cur, i); 20216858f7cSDave Chinner if (error) 20316858f7cSDave Chinner goto out_error; 204f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, *i != 1)) { 205f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 206f9e03706SDarrick J. Wong goto out_error; 207f9e03706SDarrick J. Wong } 20816858f7cSDave Chinner 209bdf28630SDarrick J. Wong out_error: 210bdf28630SDarrick J. Wong if (error) 211bdf28630SDarrick J. Wong trace_xfs_refcount_insert_error(cur->bc_mp, 21250f02fe3SDave Chinner cur->bc_ag.pag->pag_agno, error, _RET_IP_); 213bdf28630SDarrick J. Wong return error; 214bdf28630SDarrick J. Wong } 215bdf28630SDarrick J. Wong 216bdf28630SDarrick J. Wong /* 217bdf28630SDarrick J. Wong * Remove the record referred to by cur, then set the pointer to the spot 218bdf28630SDarrick J. Wong * where the record could be re-inserted, in case we want to increment or 219bdf28630SDarrick J. Wong * decrement the cursor. 220bdf28630SDarrick J. Wong * This either works (return 0) or gets an EFSCORRUPTED error. 221bdf28630SDarrick J. Wong */ 222bdf28630SDarrick J. Wong STATIC int 223bdf28630SDarrick J. Wong xfs_refcount_delete( 224bdf28630SDarrick J. Wong struct xfs_btree_cur *cur, 225bdf28630SDarrick J. Wong int *i) 226bdf28630SDarrick J. Wong { 227bdf28630SDarrick J. Wong struct xfs_refcount_irec irec; 228bdf28630SDarrick J. Wong int found_rec; 229bdf28630SDarrick J. Wong int error; 230bdf28630SDarrick J. Wong 231bdf28630SDarrick J. Wong error = xfs_refcount_get_rec(cur, &irec, &found_rec); 232bdf28630SDarrick J. Wong if (error) 233bdf28630SDarrick J. Wong goto out_error; 234f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, found_rec != 1)) { 235f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 236f9e03706SDarrick J. Wong goto out_error; 237f9e03706SDarrick J. Wong } 23850f02fe3SDave Chinner trace_xfs_refcount_delete(cur->bc_mp, cur->bc_ag.pag->pag_agno, &irec); 239bdf28630SDarrick J. Wong error = xfs_btree_delete(cur, i); 240f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, *i != 1)) { 241f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 242f9e03706SDarrick J. Wong goto out_error; 243f9e03706SDarrick J. Wong } 244bdf28630SDarrick J. Wong if (error) 245bdf28630SDarrick J. Wong goto out_error; 246bdf28630SDarrick J. Wong error = xfs_refcount_lookup_ge(cur, irec.rc_startblock, &found_rec); 247bdf28630SDarrick J. Wong out_error: 248bdf28630SDarrick J. Wong if (error) 249bdf28630SDarrick J. Wong trace_xfs_refcount_delete_error(cur->bc_mp, 25050f02fe3SDave Chinner cur->bc_ag.pag->pag_agno, error, _RET_IP_); 251bdf28630SDarrick J. Wong return error; 252bdf28630SDarrick J. Wong } 25331727258SDarrick J. Wong 25431727258SDarrick J. Wong /* 25531727258SDarrick J. Wong * Adjusting the Reference Count 25631727258SDarrick J. Wong * 25731727258SDarrick J. Wong * As stated elsewhere, the reference count btree (refcbt) stores 25831727258SDarrick J. Wong * >1 reference counts for extents of physical blocks. In this 25931727258SDarrick J. Wong * operation, we're either raising or lowering the reference count of 26031727258SDarrick J. Wong * some subrange stored in the tree: 26131727258SDarrick J. Wong * 26231727258SDarrick J. Wong * <------ adjustment range ------> 26331727258SDarrick J. Wong * ----+ +---+-----+ +--+--------+--------- 26431727258SDarrick J. Wong * 2 | | 3 | 4 | |17| 55 | 10 26531727258SDarrick J. Wong * ----+ +---+-----+ +--+--------+--------- 26631727258SDarrick J. Wong * X axis is physical blocks number; 26731727258SDarrick J. Wong * reference counts are the numbers inside the rectangles 26831727258SDarrick J. Wong * 26931727258SDarrick J. Wong * The first thing we need to do is to ensure that there are no 27031727258SDarrick J. Wong * refcount extents crossing either boundary of the range to be 27131727258SDarrick J. Wong * adjusted. For any extent that does cross a boundary, split it into 27231727258SDarrick J. Wong * two extents so that we can increment the refcount of one of the 27331727258SDarrick J. Wong * pieces later: 27431727258SDarrick J. Wong * 27531727258SDarrick J. Wong * <------ adjustment range ------> 27631727258SDarrick J. Wong * ----+ +---+-----+ +--+--------+----+---- 27731727258SDarrick J. Wong * 2 | | 3 | 2 | |17| 55 | 10 | 10 27831727258SDarrick J. Wong * ----+ +---+-----+ +--+--------+----+---- 27931727258SDarrick J. Wong * 28031727258SDarrick J. Wong * For this next step, let's assume that all the physical blocks in 28131727258SDarrick J. Wong * the adjustment range are mapped to a file and are therefore in use 28231727258SDarrick J. Wong * at least once. Therefore, we can infer that any gap in the 28331727258SDarrick J. Wong * refcount tree within the adjustment range represents a physical 28431727258SDarrick J. Wong * extent with refcount == 1: 28531727258SDarrick J. Wong * 28631727258SDarrick J. Wong * <------ adjustment range ------> 28731727258SDarrick J. Wong * ----+---+---+-----+-+--+--------+----+---- 28831727258SDarrick J. Wong * 2 |"1"| 3 | 2 |1|17| 55 | 10 | 10 28931727258SDarrick J. Wong * ----+---+---+-----+-+--+--------+----+---- 29031727258SDarrick J. Wong * ^ 29131727258SDarrick J. Wong * 29231727258SDarrick J. Wong * For each extent that falls within the interval range, figure out 29331727258SDarrick J. Wong * which extent is to the left or the right of that extent. Now we 29431727258SDarrick J. Wong * have a left, current, and right extent. If the new reference count 29531727258SDarrick J. Wong * of the center extent enables us to merge left, center, and right 29631727258SDarrick J. Wong * into one record covering all three, do so. If the center extent is 29731727258SDarrick J. Wong * at the left end of the range, abuts the left extent, and its new 29831727258SDarrick J. Wong * reference count matches the left extent's record, then merge them. 29931727258SDarrick J. Wong * If the center extent is at the right end of the range, abuts the 30031727258SDarrick J. Wong * right extent, and the reference counts match, merge those. In the 30131727258SDarrick J. Wong * example, we can left merge (assuming an increment operation): 30231727258SDarrick J. Wong * 30331727258SDarrick J. Wong * <------ adjustment range ------> 30431727258SDarrick J. Wong * --------+---+-----+-+--+--------+----+---- 30531727258SDarrick J. Wong * 2 | 3 | 2 |1|17| 55 | 10 | 10 30631727258SDarrick J. Wong * --------+---+-----+-+--+--------+----+---- 30731727258SDarrick J. Wong * ^ 30831727258SDarrick J. Wong * 30931727258SDarrick J. Wong * For all other extents within the range, adjust the reference count 31031727258SDarrick J. Wong * or delete it if the refcount falls below 2. If we were 31131727258SDarrick J. Wong * incrementing, the end result looks like this: 31231727258SDarrick J. Wong * 31331727258SDarrick J. Wong * <------ adjustment range ------> 31431727258SDarrick J. Wong * --------+---+-----+-+--+--------+----+---- 31531727258SDarrick J. Wong * 2 | 4 | 3 |2|18| 56 | 11 | 10 31631727258SDarrick J. Wong * --------+---+-----+-+--+--------+----+---- 31731727258SDarrick J. Wong * 31831727258SDarrick J. Wong * The result of a decrement operation looks as such: 31931727258SDarrick J. Wong * 32031727258SDarrick J. Wong * <------ adjustment range ------> 32131727258SDarrick J. Wong * ----+ +---+ +--+--------+----+---- 32231727258SDarrick J. Wong * 2 | | 2 | |16| 54 | 9 | 10 32331727258SDarrick J. Wong * ----+ +---+ +--+--------+----+---- 32431727258SDarrick J. Wong * DDDD 111111DD 32531727258SDarrick J. Wong * 32631727258SDarrick J. Wong * The blocks marked "D" are freed; the blocks marked "1" are only 32731727258SDarrick J. Wong * referenced once and therefore the record is removed from the 32831727258SDarrick J. Wong * refcount btree. 32931727258SDarrick J. Wong */ 33031727258SDarrick J. Wong 33131727258SDarrick J. Wong /* Next block after this extent. */ 33231727258SDarrick J. Wong static inline xfs_agblock_t 33331727258SDarrick J. Wong xfs_refc_next( 33431727258SDarrick J. Wong struct xfs_refcount_irec *rc) 33531727258SDarrick J. Wong { 33631727258SDarrick J. Wong return rc->rc_startblock + rc->rc_blockcount; 33731727258SDarrick J. Wong } 33831727258SDarrick J. Wong 33931727258SDarrick J. Wong /* 34031727258SDarrick J. Wong * Split a refcount extent that crosses agbno. 34131727258SDarrick J. Wong */ 34231727258SDarrick J. Wong STATIC int 34331727258SDarrick J. Wong xfs_refcount_split_extent( 34431727258SDarrick J. Wong struct xfs_btree_cur *cur, 34531727258SDarrick J. Wong xfs_agblock_t agbno, 34631727258SDarrick J. Wong bool *shape_changed) 34731727258SDarrick J. Wong { 34831727258SDarrick J. Wong struct xfs_refcount_irec rcext, tmp; 34931727258SDarrick J. Wong int found_rec; 35031727258SDarrick J. Wong int error; 35131727258SDarrick J. Wong 35231727258SDarrick J. Wong *shape_changed = false; 35331727258SDarrick J. Wong error = xfs_refcount_lookup_le(cur, agbno, &found_rec); 35431727258SDarrick J. Wong if (error) 35531727258SDarrick J. Wong goto out_error; 35631727258SDarrick J. Wong if (!found_rec) 35731727258SDarrick J. Wong return 0; 35831727258SDarrick J. Wong 35931727258SDarrick J. Wong error = xfs_refcount_get_rec(cur, &rcext, &found_rec); 36031727258SDarrick J. Wong if (error) 36131727258SDarrick J. Wong goto out_error; 362f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, found_rec != 1)) { 363f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 364f9e03706SDarrick J. Wong goto out_error; 365f9e03706SDarrick J. Wong } 36631727258SDarrick J. Wong if (rcext.rc_startblock == agbno || xfs_refc_next(&rcext) <= agbno) 36731727258SDarrick J. Wong return 0; 36831727258SDarrick J. Wong 36931727258SDarrick J. Wong *shape_changed = true; 37050f02fe3SDave Chinner trace_xfs_refcount_split_extent(cur->bc_mp, cur->bc_ag.pag->pag_agno, 37131727258SDarrick J. Wong &rcext, agbno); 37231727258SDarrick J. Wong 37331727258SDarrick J. Wong /* Establish the right extent. */ 37431727258SDarrick J. Wong tmp = rcext; 37531727258SDarrick J. Wong tmp.rc_startblock = agbno; 37631727258SDarrick J. Wong tmp.rc_blockcount -= (agbno - rcext.rc_startblock); 37731727258SDarrick J. Wong error = xfs_refcount_update(cur, &tmp); 37831727258SDarrick J. Wong if (error) 37931727258SDarrick J. Wong goto out_error; 38031727258SDarrick J. Wong 38131727258SDarrick J. Wong /* Insert the left extent. */ 38231727258SDarrick J. Wong tmp = rcext; 38331727258SDarrick J. Wong tmp.rc_blockcount = agbno - rcext.rc_startblock; 38431727258SDarrick J. Wong error = xfs_refcount_insert(cur, &tmp, &found_rec); 38531727258SDarrick J. Wong if (error) 38631727258SDarrick J. Wong goto out_error; 387f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, found_rec != 1)) { 388f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 389f9e03706SDarrick J. Wong goto out_error; 390f9e03706SDarrick J. Wong } 39131727258SDarrick J. Wong return error; 39231727258SDarrick J. Wong 39331727258SDarrick J. Wong out_error: 39431727258SDarrick J. Wong trace_xfs_refcount_split_extent_error(cur->bc_mp, 39550f02fe3SDave Chinner cur->bc_ag.pag->pag_agno, error, _RET_IP_); 39631727258SDarrick J. Wong return error; 39731727258SDarrick J. Wong } 39831727258SDarrick J. Wong 39931727258SDarrick J. Wong /* 40031727258SDarrick J. Wong * Merge the left, center, and right extents. 40131727258SDarrick J. Wong */ 40231727258SDarrick J. Wong STATIC int 40331727258SDarrick J. Wong xfs_refcount_merge_center_extents( 40431727258SDarrick J. Wong struct xfs_btree_cur *cur, 40531727258SDarrick J. Wong struct xfs_refcount_irec *left, 40631727258SDarrick J. Wong struct xfs_refcount_irec *center, 40731727258SDarrick J. Wong struct xfs_refcount_irec *right, 40831727258SDarrick J. Wong unsigned long long extlen, 40931727258SDarrick J. Wong xfs_extlen_t *aglen) 41031727258SDarrick J. Wong { 41131727258SDarrick J. Wong int error; 41231727258SDarrick J. Wong int found_rec; 41331727258SDarrick J. Wong 41431727258SDarrick J. Wong trace_xfs_refcount_merge_center_extents(cur->bc_mp, 41550f02fe3SDave Chinner cur->bc_ag.pag->pag_agno, left, center, right); 41631727258SDarrick J. Wong 41731727258SDarrick J. Wong /* 41831727258SDarrick J. Wong * Make sure the center and right extents are not in the btree. 41931727258SDarrick J. Wong * If the center extent was synthesized, the first delete call 42031727258SDarrick J. Wong * removes the right extent and we skip the second deletion. 42131727258SDarrick J. Wong * If center and right were in the btree, then the first delete 42231727258SDarrick J. Wong * call removes the center and the second one removes the right 42331727258SDarrick J. Wong * extent. 42431727258SDarrick J. Wong */ 42531727258SDarrick J. Wong error = xfs_refcount_lookup_ge(cur, center->rc_startblock, 42631727258SDarrick J. Wong &found_rec); 42731727258SDarrick J. Wong if (error) 42831727258SDarrick J. Wong goto out_error; 429f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, found_rec != 1)) { 430f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 431f9e03706SDarrick J. Wong goto out_error; 432f9e03706SDarrick J. Wong } 43331727258SDarrick J. Wong 43431727258SDarrick J. Wong error = xfs_refcount_delete(cur, &found_rec); 43531727258SDarrick J. Wong if (error) 43631727258SDarrick J. Wong goto out_error; 437f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, found_rec != 1)) { 438f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 439f9e03706SDarrick J. Wong goto out_error; 440f9e03706SDarrick J. Wong } 44131727258SDarrick J. Wong 44231727258SDarrick J. Wong if (center->rc_refcount > 1) { 44331727258SDarrick J. Wong error = xfs_refcount_delete(cur, &found_rec); 44431727258SDarrick J. Wong if (error) 44531727258SDarrick J. Wong goto out_error; 446f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, found_rec != 1)) { 447f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 448f9e03706SDarrick J. Wong goto out_error; 449f9e03706SDarrick J. Wong } 45031727258SDarrick J. Wong } 45131727258SDarrick J. Wong 45231727258SDarrick J. Wong /* Enlarge the left extent. */ 45331727258SDarrick J. Wong error = xfs_refcount_lookup_le(cur, left->rc_startblock, 45431727258SDarrick J. Wong &found_rec); 45531727258SDarrick J. Wong if (error) 45631727258SDarrick J. Wong goto out_error; 457f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, found_rec != 1)) { 458f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 459f9e03706SDarrick J. Wong goto out_error; 460f9e03706SDarrick J. Wong } 46131727258SDarrick J. Wong 46231727258SDarrick J. Wong left->rc_blockcount = extlen; 46331727258SDarrick J. Wong error = xfs_refcount_update(cur, left); 46431727258SDarrick J. Wong if (error) 46531727258SDarrick J. Wong goto out_error; 46631727258SDarrick J. Wong 46731727258SDarrick J. Wong *aglen = 0; 46831727258SDarrick J. Wong return error; 46931727258SDarrick J. Wong 47031727258SDarrick J. Wong out_error: 47131727258SDarrick J. Wong trace_xfs_refcount_merge_center_extents_error(cur->bc_mp, 47250f02fe3SDave Chinner cur->bc_ag.pag->pag_agno, error, _RET_IP_); 47331727258SDarrick J. Wong return error; 47431727258SDarrick J. Wong } 47531727258SDarrick J. Wong 47631727258SDarrick J. Wong /* 47731727258SDarrick J. Wong * Merge with the left extent. 47831727258SDarrick J. Wong */ 47931727258SDarrick J. Wong STATIC int 48031727258SDarrick J. Wong xfs_refcount_merge_left_extent( 48131727258SDarrick J. Wong struct xfs_btree_cur *cur, 48231727258SDarrick J. Wong struct xfs_refcount_irec *left, 48331727258SDarrick J. Wong struct xfs_refcount_irec *cleft, 48431727258SDarrick J. Wong xfs_agblock_t *agbno, 48531727258SDarrick J. Wong xfs_extlen_t *aglen) 48631727258SDarrick J. Wong { 48731727258SDarrick J. Wong int error; 48831727258SDarrick J. Wong int found_rec; 48931727258SDarrick J. Wong 49031727258SDarrick J. Wong trace_xfs_refcount_merge_left_extent(cur->bc_mp, 49150f02fe3SDave Chinner cur->bc_ag.pag->pag_agno, left, cleft); 49231727258SDarrick J. Wong 49331727258SDarrick J. Wong /* If the extent at agbno (cleft) wasn't synthesized, remove it. */ 49431727258SDarrick J. Wong if (cleft->rc_refcount > 1) { 49531727258SDarrick J. Wong error = xfs_refcount_lookup_le(cur, cleft->rc_startblock, 49631727258SDarrick J. Wong &found_rec); 49731727258SDarrick J. Wong if (error) 49831727258SDarrick J. Wong goto out_error; 499f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, found_rec != 1)) { 500f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 501f9e03706SDarrick J. Wong goto out_error; 502f9e03706SDarrick J. Wong } 50331727258SDarrick J. Wong 50431727258SDarrick J. Wong error = xfs_refcount_delete(cur, &found_rec); 50531727258SDarrick J. Wong if (error) 50631727258SDarrick J. Wong goto out_error; 507f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, found_rec != 1)) { 508f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 509f9e03706SDarrick J. Wong goto out_error; 510f9e03706SDarrick J. Wong } 51131727258SDarrick J. Wong } 51231727258SDarrick J. Wong 51331727258SDarrick J. Wong /* Enlarge the left extent. */ 51431727258SDarrick J. Wong error = xfs_refcount_lookup_le(cur, left->rc_startblock, 51531727258SDarrick J. Wong &found_rec); 51631727258SDarrick J. Wong if (error) 51731727258SDarrick J. Wong goto out_error; 518f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, found_rec != 1)) { 519f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 520f9e03706SDarrick J. Wong goto out_error; 521f9e03706SDarrick J. Wong } 52231727258SDarrick J. Wong 52331727258SDarrick J. Wong left->rc_blockcount += cleft->rc_blockcount; 52431727258SDarrick J. Wong error = xfs_refcount_update(cur, left); 52531727258SDarrick J. Wong if (error) 52631727258SDarrick J. Wong goto out_error; 52731727258SDarrick J. Wong 52831727258SDarrick J. Wong *agbno += cleft->rc_blockcount; 52931727258SDarrick J. Wong *aglen -= cleft->rc_blockcount; 53031727258SDarrick J. Wong return error; 53131727258SDarrick J. Wong 53231727258SDarrick J. Wong out_error: 53331727258SDarrick J. Wong trace_xfs_refcount_merge_left_extent_error(cur->bc_mp, 53450f02fe3SDave Chinner cur->bc_ag.pag->pag_agno, error, _RET_IP_); 53531727258SDarrick J. Wong return error; 53631727258SDarrick J. Wong } 53731727258SDarrick J. Wong 53831727258SDarrick J. Wong /* 53931727258SDarrick J. Wong * Merge with the right extent. 54031727258SDarrick J. Wong */ 54131727258SDarrick J. Wong STATIC int 54231727258SDarrick J. Wong xfs_refcount_merge_right_extent( 54331727258SDarrick J. Wong struct xfs_btree_cur *cur, 54431727258SDarrick J. Wong struct xfs_refcount_irec *right, 54531727258SDarrick J. Wong struct xfs_refcount_irec *cright, 54631727258SDarrick J. Wong xfs_extlen_t *aglen) 54731727258SDarrick J. Wong { 54831727258SDarrick J. Wong int error; 54931727258SDarrick J. Wong int found_rec; 55031727258SDarrick J. Wong 55131727258SDarrick J. Wong trace_xfs_refcount_merge_right_extent(cur->bc_mp, 55250f02fe3SDave Chinner cur->bc_ag.pag->pag_agno, cright, right); 55331727258SDarrick J. Wong 55431727258SDarrick J. Wong /* 55531727258SDarrick J. Wong * If the extent ending at agbno+aglen (cright) wasn't synthesized, 55631727258SDarrick J. Wong * remove it. 55731727258SDarrick J. Wong */ 55831727258SDarrick J. Wong if (cright->rc_refcount > 1) { 55931727258SDarrick J. Wong error = xfs_refcount_lookup_le(cur, cright->rc_startblock, 56031727258SDarrick J. Wong &found_rec); 56131727258SDarrick J. Wong if (error) 56231727258SDarrick J. Wong goto out_error; 563f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, found_rec != 1)) { 564f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 565f9e03706SDarrick J. Wong goto out_error; 566f9e03706SDarrick J. Wong } 56731727258SDarrick J. Wong 56831727258SDarrick J. Wong error = xfs_refcount_delete(cur, &found_rec); 56931727258SDarrick J. Wong if (error) 57031727258SDarrick J. Wong goto out_error; 571f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, found_rec != 1)) { 572f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 573f9e03706SDarrick J. Wong goto out_error; 574f9e03706SDarrick J. Wong } 57531727258SDarrick J. Wong } 57631727258SDarrick J. Wong 57731727258SDarrick J. Wong /* Enlarge the right extent. */ 57831727258SDarrick J. Wong error = xfs_refcount_lookup_le(cur, right->rc_startblock, 57931727258SDarrick J. Wong &found_rec); 58031727258SDarrick J. Wong if (error) 58131727258SDarrick J. Wong goto out_error; 582f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, found_rec != 1)) { 583f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 584f9e03706SDarrick J. Wong goto out_error; 585f9e03706SDarrick J. Wong } 58631727258SDarrick J. Wong 58731727258SDarrick J. Wong right->rc_startblock -= cright->rc_blockcount; 58831727258SDarrick J. Wong right->rc_blockcount += cright->rc_blockcount; 58931727258SDarrick J. Wong error = xfs_refcount_update(cur, right); 59031727258SDarrick J. Wong if (error) 59131727258SDarrick J. Wong goto out_error; 59231727258SDarrick J. Wong 59331727258SDarrick J. Wong *aglen -= cright->rc_blockcount; 59431727258SDarrick J. Wong return error; 59531727258SDarrick J. Wong 59631727258SDarrick J. Wong out_error: 59731727258SDarrick J. Wong trace_xfs_refcount_merge_right_extent_error(cur->bc_mp, 59850f02fe3SDave Chinner cur->bc_ag.pag->pag_agno, error, _RET_IP_); 59931727258SDarrick J. Wong return error; 60031727258SDarrick J. Wong } 60131727258SDarrick J. Wong 602174edb0eSDarrick J. Wong #define XFS_FIND_RCEXT_SHARED 1 603174edb0eSDarrick J. Wong #define XFS_FIND_RCEXT_COW 2 60431727258SDarrick J. Wong /* 60531727258SDarrick J. Wong * Find the left extent and the one after it (cleft). This function assumes 60631727258SDarrick J. Wong * that we've already split any extent crossing agbno. 60731727258SDarrick J. Wong */ 60831727258SDarrick J. Wong STATIC int 60931727258SDarrick J. Wong xfs_refcount_find_left_extents( 61031727258SDarrick J. Wong struct xfs_btree_cur *cur, 61131727258SDarrick J. Wong struct xfs_refcount_irec *left, 61231727258SDarrick J. Wong struct xfs_refcount_irec *cleft, 61331727258SDarrick J. Wong xfs_agblock_t agbno, 614174edb0eSDarrick J. Wong xfs_extlen_t aglen, 615174edb0eSDarrick J. Wong int flags) 61631727258SDarrick J. Wong { 61731727258SDarrick J. Wong struct xfs_refcount_irec tmp; 61831727258SDarrick J. Wong int error; 61931727258SDarrick J. Wong int found_rec; 62031727258SDarrick J. Wong 62131727258SDarrick J. Wong left->rc_startblock = cleft->rc_startblock = NULLAGBLOCK; 62231727258SDarrick J. Wong error = xfs_refcount_lookup_le(cur, agbno - 1, &found_rec); 62331727258SDarrick J. Wong if (error) 62431727258SDarrick J. Wong goto out_error; 62531727258SDarrick J. Wong if (!found_rec) 62631727258SDarrick J. Wong return 0; 62731727258SDarrick J. Wong 62831727258SDarrick J. Wong error = xfs_refcount_get_rec(cur, &tmp, &found_rec); 62931727258SDarrick J. Wong if (error) 63031727258SDarrick J. Wong goto out_error; 631f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, found_rec != 1)) { 632f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 633f9e03706SDarrick J. Wong goto out_error; 634f9e03706SDarrick J. Wong } 63531727258SDarrick J. Wong 63631727258SDarrick J. Wong if (xfs_refc_next(&tmp) != agbno) 63731727258SDarrick J. Wong return 0; 638174edb0eSDarrick J. Wong if ((flags & XFS_FIND_RCEXT_SHARED) && tmp.rc_refcount < 2) 639174edb0eSDarrick J. Wong return 0; 640174edb0eSDarrick J. Wong if ((flags & XFS_FIND_RCEXT_COW) && tmp.rc_refcount > 1) 641174edb0eSDarrick J. Wong return 0; 64231727258SDarrick J. Wong /* We have a left extent; retrieve (or invent) the next right one */ 64331727258SDarrick J. Wong *left = tmp; 64431727258SDarrick J. Wong 64531727258SDarrick J. Wong error = xfs_btree_increment(cur, 0, &found_rec); 64631727258SDarrick J. Wong if (error) 64731727258SDarrick J. Wong goto out_error; 64831727258SDarrick J. Wong if (found_rec) { 64931727258SDarrick J. Wong error = xfs_refcount_get_rec(cur, &tmp, &found_rec); 65031727258SDarrick J. Wong if (error) 65131727258SDarrick J. Wong goto out_error; 652f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, found_rec != 1)) { 653f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 654f9e03706SDarrick J. Wong goto out_error; 655f9e03706SDarrick J. Wong } 65631727258SDarrick J. Wong 65731727258SDarrick J. Wong /* if tmp starts at the end of our range, just use that */ 65831727258SDarrick J. Wong if (tmp.rc_startblock == agbno) 65931727258SDarrick J. Wong *cleft = tmp; 66031727258SDarrick J. Wong else { 66131727258SDarrick J. Wong /* 66231727258SDarrick J. Wong * There's a gap in the refcntbt at the start of the 66331727258SDarrick J. Wong * range we're interested in (refcount == 1) so 66431727258SDarrick J. Wong * synthesize the implied extent and pass it back. 66531727258SDarrick J. Wong * We assume here that the agbno/aglen range was 66631727258SDarrick J. Wong * passed in from a data fork extent mapping and 66731727258SDarrick J. Wong * therefore is allocated to exactly one owner. 66831727258SDarrick J. Wong */ 66931727258SDarrick J. Wong cleft->rc_startblock = agbno; 67031727258SDarrick J. Wong cleft->rc_blockcount = min(aglen, 67131727258SDarrick J. Wong tmp.rc_startblock - agbno); 67231727258SDarrick J. Wong cleft->rc_refcount = 1; 67331727258SDarrick J. Wong } 67431727258SDarrick J. Wong } else { 67531727258SDarrick J. Wong /* 67631727258SDarrick J. Wong * No extents, so pretend that there's one covering the whole 67731727258SDarrick J. Wong * range. 67831727258SDarrick J. Wong */ 67931727258SDarrick J. Wong cleft->rc_startblock = agbno; 68031727258SDarrick J. Wong cleft->rc_blockcount = aglen; 68131727258SDarrick J. Wong cleft->rc_refcount = 1; 68231727258SDarrick J. Wong } 68350f02fe3SDave Chinner trace_xfs_refcount_find_left_extent(cur->bc_mp, cur->bc_ag.pag->pag_agno, 68431727258SDarrick J. Wong left, cleft, agbno); 68531727258SDarrick J. Wong return error; 68631727258SDarrick J. Wong 68731727258SDarrick J. Wong out_error: 68831727258SDarrick J. Wong trace_xfs_refcount_find_left_extent_error(cur->bc_mp, 68950f02fe3SDave Chinner cur->bc_ag.pag->pag_agno, error, _RET_IP_); 69031727258SDarrick J. Wong return error; 69131727258SDarrick J. Wong } 69231727258SDarrick J. Wong 69331727258SDarrick J. Wong /* 69431727258SDarrick J. Wong * Find the right extent and the one before it (cright). This function 69531727258SDarrick J. Wong * assumes that we've already split any extents crossing agbno + aglen. 69631727258SDarrick J. Wong */ 69731727258SDarrick J. Wong STATIC int 69831727258SDarrick J. Wong xfs_refcount_find_right_extents( 69931727258SDarrick J. Wong struct xfs_btree_cur *cur, 70031727258SDarrick J. Wong struct xfs_refcount_irec *right, 70131727258SDarrick J. Wong struct xfs_refcount_irec *cright, 70231727258SDarrick J. Wong xfs_agblock_t agbno, 703174edb0eSDarrick J. Wong xfs_extlen_t aglen, 704174edb0eSDarrick J. Wong int flags) 70531727258SDarrick J. Wong { 70631727258SDarrick J. Wong struct xfs_refcount_irec tmp; 70731727258SDarrick J. Wong int error; 70831727258SDarrick J. Wong int found_rec; 70931727258SDarrick J. Wong 71031727258SDarrick J. Wong right->rc_startblock = cright->rc_startblock = NULLAGBLOCK; 71131727258SDarrick J. Wong error = xfs_refcount_lookup_ge(cur, agbno + aglen, &found_rec); 71231727258SDarrick J. Wong if (error) 71331727258SDarrick J. Wong goto out_error; 71431727258SDarrick J. Wong if (!found_rec) 71531727258SDarrick J. Wong return 0; 71631727258SDarrick J. Wong 71731727258SDarrick J. Wong error = xfs_refcount_get_rec(cur, &tmp, &found_rec); 71831727258SDarrick J. Wong if (error) 71931727258SDarrick J. Wong goto out_error; 720f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, found_rec != 1)) { 721f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 722f9e03706SDarrick J. Wong goto out_error; 723f9e03706SDarrick J. Wong } 72431727258SDarrick J. Wong 72531727258SDarrick J. Wong if (tmp.rc_startblock != agbno + aglen) 72631727258SDarrick J. Wong return 0; 727174edb0eSDarrick J. Wong if ((flags & XFS_FIND_RCEXT_SHARED) && tmp.rc_refcount < 2) 728174edb0eSDarrick J. Wong return 0; 729174edb0eSDarrick J. Wong if ((flags & XFS_FIND_RCEXT_COW) && tmp.rc_refcount > 1) 730174edb0eSDarrick J. Wong return 0; 73131727258SDarrick J. Wong /* We have a right extent; retrieve (or invent) the next left one */ 73231727258SDarrick J. Wong *right = tmp; 73331727258SDarrick J. Wong 73431727258SDarrick J. Wong error = xfs_btree_decrement(cur, 0, &found_rec); 73531727258SDarrick J. Wong if (error) 73631727258SDarrick J. Wong goto out_error; 73731727258SDarrick J. Wong if (found_rec) { 73831727258SDarrick J. Wong error = xfs_refcount_get_rec(cur, &tmp, &found_rec); 73931727258SDarrick J. Wong if (error) 74031727258SDarrick J. Wong goto out_error; 741f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, found_rec != 1)) { 742f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 743f9e03706SDarrick J. Wong goto out_error; 744f9e03706SDarrick J. Wong } 74531727258SDarrick J. Wong 74631727258SDarrick J. Wong /* if tmp ends at the end of our range, just use that */ 74731727258SDarrick J. Wong if (xfs_refc_next(&tmp) == agbno + aglen) 74831727258SDarrick J. Wong *cright = tmp; 74931727258SDarrick J. Wong else { 75031727258SDarrick J. Wong /* 75131727258SDarrick J. Wong * There's a gap in the refcntbt at the end of the 75231727258SDarrick J. Wong * range we're interested in (refcount == 1) so 75331727258SDarrick J. Wong * create the implied extent and pass it back. 75431727258SDarrick J. Wong * We assume here that the agbno/aglen range was 75531727258SDarrick J. Wong * passed in from a data fork extent mapping and 75631727258SDarrick J. Wong * therefore is allocated to exactly one owner. 75731727258SDarrick J. Wong */ 75831727258SDarrick J. Wong cright->rc_startblock = max(agbno, xfs_refc_next(&tmp)); 75931727258SDarrick J. Wong cright->rc_blockcount = right->rc_startblock - 76031727258SDarrick J. Wong cright->rc_startblock; 76131727258SDarrick J. Wong cright->rc_refcount = 1; 76231727258SDarrick J. Wong } 76331727258SDarrick J. Wong } else { 76431727258SDarrick J. Wong /* 76531727258SDarrick J. Wong * No extents, so pretend that there's one covering the whole 76631727258SDarrick J. Wong * range. 76731727258SDarrick J. Wong */ 76831727258SDarrick J. Wong cright->rc_startblock = agbno; 76931727258SDarrick J. Wong cright->rc_blockcount = aglen; 77031727258SDarrick J. Wong cright->rc_refcount = 1; 77131727258SDarrick J. Wong } 77250f02fe3SDave Chinner trace_xfs_refcount_find_right_extent(cur->bc_mp, cur->bc_ag.pag->pag_agno, 77331727258SDarrick J. Wong cright, right, agbno + aglen); 77431727258SDarrick J. Wong return error; 77531727258SDarrick J. Wong 77631727258SDarrick J. Wong out_error: 77731727258SDarrick J. Wong trace_xfs_refcount_find_right_extent_error(cur->bc_mp, 77850f02fe3SDave Chinner cur->bc_ag.pag->pag_agno, error, _RET_IP_); 77931727258SDarrick J. Wong return error; 78031727258SDarrick J. Wong } 78131727258SDarrick J. Wong 78231727258SDarrick J. Wong /* Is this extent valid? */ 78331727258SDarrick J. Wong static inline bool 78431727258SDarrick J. Wong xfs_refc_valid( 78531727258SDarrick J. Wong struct xfs_refcount_irec *rc) 78631727258SDarrick J. Wong { 78731727258SDarrick J. Wong return rc->rc_startblock != NULLAGBLOCK; 78831727258SDarrick J. Wong } 78931727258SDarrick J. Wong 79031727258SDarrick J. Wong /* 79131727258SDarrick J. Wong * Try to merge with any extents on the boundaries of the adjustment range. 79231727258SDarrick J. Wong */ 79331727258SDarrick J. Wong STATIC int 79431727258SDarrick J. Wong xfs_refcount_merge_extents( 79531727258SDarrick J. Wong struct xfs_btree_cur *cur, 79631727258SDarrick J. Wong xfs_agblock_t *agbno, 79731727258SDarrick J. Wong xfs_extlen_t *aglen, 79831727258SDarrick J. Wong enum xfs_refc_adjust_op adjust, 799174edb0eSDarrick J. Wong int flags, 80031727258SDarrick J. Wong bool *shape_changed) 80131727258SDarrick J. Wong { 80231727258SDarrick J. Wong struct xfs_refcount_irec left = {0}, cleft = {0}; 80331727258SDarrick J. Wong struct xfs_refcount_irec cright = {0}, right = {0}; 80431727258SDarrick J. Wong int error; 80531727258SDarrick J. Wong unsigned long long ulen; 80631727258SDarrick J. Wong bool cequal; 80731727258SDarrick J. Wong 80831727258SDarrick J. Wong *shape_changed = false; 80931727258SDarrick J. Wong /* 81031727258SDarrick J. Wong * Find the extent just below agbno [left], just above agbno [cleft], 81131727258SDarrick J. Wong * just below (agbno + aglen) [cright], and just above (agbno + aglen) 81231727258SDarrick J. Wong * [right]. 81331727258SDarrick J. Wong */ 81431727258SDarrick J. Wong error = xfs_refcount_find_left_extents(cur, &left, &cleft, *agbno, 815174edb0eSDarrick J. Wong *aglen, flags); 81631727258SDarrick J. Wong if (error) 81731727258SDarrick J. Wong return error; 81831727258SDarrick J. Wong error = xfs_refcount_find_right_extents(cur, &right, &cright, *agbno, 819174edb0eSDarrick J. Wong *aglen, flags); 82031727258SDarrick J. Wong if (error) 82131727258SDarrick J. Wong return error; 82231727258SDarrick J. Wong 82331727258SDarrick J. Wong /* No left or right extent to merge; exit. */ 82431727258SDarrick J. Wong if (!xfs_refc_valid(&left) && !xfs_refc_valid(&right)) 82531727258SDarrick J. Wong return 0; 82631727258SDarrick J. Wong 82731727258SDarrick J. Wong cequal = (cleft.rc_startblock == cright.rc_startblock) && 82831727258SDarrick J. Wong (cleft.rc_blockcount == cright.rc_blockcount); 82931727258SDarrick J. Wong 83031727258SDarrick J. Wong /* Try to merge left, cleft, and right. cleft must == cright. */ 83131727258SDarrick J. Wong ulen = (unsigned long long)left.rc_blockcount + cleft.rc_blockcount + 83231727258SDarrick J. Wong right.rc_blockcount; 83331727258SDarrick J. Wong if (xfs_refc_valid(&left) && xfs_refc_valid(&right) && 83431727258SDarrick J. Wong xfs_refc_valid(&cleft) && xfs_refc_valid(&cright) && cequal && 83531727258SDarrick J. Wong left.rc_refcount == cleft.rc_refcount + adjust && 83631727258SDarrick J. Wong right.rc_refcount == cleft.rc_refcount + adjust && 83731727258SDarrick J. Wong ulen < MAXREFCEXTLEN) { 83831727258SDarrick J. Wong *shape_changed = true; 83931727258SDarrick J. Wong return xfs_refcount_merge_center_extents(cur, &left, &cleft, 840a1f69417SEric Sandeen &right, ulen, aglen); 84131727258SDarrick J. Wong } 84231727258SDarrick J. Wong 84331727258SDarrick J. Wong /* Try to merge left and cleft. */ 84431727258SDarrick J. Wong ulen = (unsigned long long)left.rc_blockcount + cleft.rc_blockcount; 84531727258SDarrick J. Wong if (xfs_refc_valid(&left) && xfs_refc_valid(&cleft) && 84631727258SDarrick J. Wong left.rc_refcount == cleft.rc_refcount + adjust && 84731727258SDarrick J. Wong ulen < MAXREFCEXTLEN) { 84831727258SDarrick J. Wong *shape_changed = true; 84931727258SDarrick J. Wong error = xfs_refcount_merge_left_extent(cur, &left, &cleft, 85031727258SDarrick J. Wong agbno, aglen); 85131727258SDarrick J. Wong if (error) 85231727258SDarrick J. Wong return error; 85331727258SDarrick J. Wong 85431727258SDarrick J. Wong /* 85531727258SDarrick J. Wong * If we just merged left + cleft and cleft == cright, 85631727258SDarrick J. Wong * we no longer have a cright to merge with right. We're done. 85731727258SDarrick J. Wong */ 85831727258SDarrick J. Wong if (cequal) 85931727258SDarrick J. Wong return 0; 86031727258SDarrick J. Wong } 86131727258SDarrick J. Wong 86231727258SDarrick J. Wong /* Try to merge cright and right. */ 86331727258SDarrick J. Wong ulen = (unsigned long long)right.rc_blockcount + cright.rc_blockcount; 86431727258SDarrick J. Wong if (xfs_refc_valid(&right) && xfs_refc_valid(&cright) && 86531727258SDarrick J. Wong right.rc_refcount == cright.rc_refcount + adjust && 86631727258SDarrick J. Wong ulen < MAXREFCEXTLEN) { 86731727258SDarrick J. Wong *shape_changed = true; 86831727258SDarrick J. Wong return xfs_refcount_merge_right_extent(cur, &right, &cright, 869a1f69417SEric Sandeen aglen); 87031727258SDarrick J. Wong } 87131727258SDarrick J. Wong 87231727258SDarrick J. Wong return error; 87331727258SDarrick J. Wong } 87431727258SDarrick J. Wong 87531727258SDarrick J. Wong /* 87631727258SDarrick J. Wong * XXX: This is a pretty hand-wavy estimate. The penalty for guessing 87731727258SDarrick J. Wong * true incorrectly is a shutdown FS; the penalty for guessing false 87831727258SDarrick J. Wong * incorrectly is more transaction rolls than might be necessary. 87931727258SDarrick J. Wong * Be conservative here. 88031727258SDarrick J. Wong */ 88131727258SDarrick J. Wong static bool 88231727258SDarrick J. Wong xfs_refcount_still_have_space( 88331727258SDarrick J. Wong struct xfs_btree_cur *cur) 88431727258SDarrick J. Wong { 88531727258SDarrick J. Wong unsigned long overhead; 88631727258SDarrick J. Wong 887c4aa10d0SDave Chinner overhead = cur->bc_ag.refc.shape_changes * 88831727258SDarrick J. Wong xfs_allocfree_log_count(cur->bc_mp, 1); 88931727258SDarrick J. Wong overhead *= cur->bc_mp->m_sb.sb_blocksize; 89031727258SDarrick J. Wong 89131727258SDarrick J. Wong /* 89231727258SDarrick J. Wong * Only allow 2 refcount extent updates per transaction if the 89331727258SDarrick J. Wong * refcount continue update "error" has been injected. 89431727258SDarrick J. Wong */ 895c4aa10d0SDave Chinner if (cur->bc_ag.refc.nr_ops > 2 && 89631727258SDarrick J. Wong XFS_TEST_ERROR(false, cur->bc_mp, 8979e24cfd0SDarrick J. Wong XFS_ERRTAG_REFCOUNT_CONTINUE_UPDATE)) 89831727258SDarrick J. Wong return false; 89931727258SDarrick J. Wong 900c4aa10d0SDave Chinner if (cur->bc_ag.refc.nr_ops == 0) 90131727258SDarrick J. Wong return true; 90231727258SDarrick J. Wong else if (overhead > cur->bc_tp->t_log_res) 90331727258SDarrick J. Wong return false; 90431727258SDarrick J. Wong return cur->bc_tp->t_log_res - overhead > 905c4aa10d0SDave Chinner cur->bc_ag.refc.nr_ops * XFS_REFCOUNT_ITEM_OVERHEAD; 90631727258SDarrick J. Wong } 90731727258SDarrick J. Wong 90831727258SDarrick J. Wong /* 90931727258SDarrick J. Wong * Adjust the refcounts of middle extents. At this point we should have 91031727258SDarrick J. Wong * split extents that crossed the adjustment range; merged with adjacent 91131727258SDarrick J. Wong * extents; and updated agbno/aglen to reflect the merges. Therefore, 91231727258SDarrick J. Wong * all we have to do is update the extents inside [agbno, agbno + aglen]. 91331727258SDarrick J. Wong */ 91431727258SDarrick J. Wong STATIC int 91531727258SDarrick J. Wong xfs_refcount_adjust_extents( 91631727258SDarrick J. Wong struct xfs_btree_cur *cur, 91731727258SDarrick J. Wong xfs_agblock_t *agbno, 91831727258SDarrick J. Wong xfs_extlen_t *aglen, 91931727258SDarrick J. Wong enum xfs_refc_adjust_op adj, 92031727258SDarrick J. Wong struct xfs_owner_info *oinfo) 92131727258SDarrick J. Wong { 92231727258SDarrick J. Wong struct xfs_refcount_irec ext, tmp; 92331727258SDarrick J. Wong int error; 92431727258SDarrick J. Wong int found_rec, found_tmp; 92531727258SDarrick J. Wong xfs_fsblock_t fsbno; 92631727258SDarrick J. Wong 92731727258SDarrick J. Wong /* Merging did all the work already. */ 92831727258SDarrick J. Wong if (*aglen == 0) 92931727258SDarrick J. Wong return 0; 93031727258SDarrick J. Wong 93131727258SDarrick J. Wong error = xfs_refcount_lookup_ge(cur, *agbno, &found_rec); 93231727258SDarrick J. Wong if (error) 93331727258SDarrick J. Wong goto out_error; 93431727258SDarrick J. Wong 93531727258SDarrick J. Wong while (*aglen > 0 && xfs_refcount_still_have_space(cur)) { 93631727258SDarrick J. Wong error = xfs_refcount_get_rec(cur, &ext, &found_rec); 93731727258SDarrick J. Wong if (error) 93831727258SDarrick J. Wong goto out_error; 93931727258SDarrick J. Wong if (!found_rec) { 94031727258SDarrick J. Wong ext.rc_startblock = cur->bc_mp->m_sb.sb_agblocks; 94131727258SDarrick J. Wong ext.rc_blockcount = 0; 94231727258SDarrick J. Wong ext.rc_refcount = 0; 94331727258SDarrick J. Wong } 94431727258SDarrick J. Wong 94531727258SDarrick J. Wong /* 94631727258SDarrick J. Wong * Deal with a hole in the refcount tree; if a file maps to 94731727258SDarrick J. Wong * these blocks and there's no refcountbt record, pretend that 94831727258SDarrick J. Wong * there is one with refcount == 1. 94931727258SDarrick J. Wong */ 95031727258SDarrick J. Wong if (ext.rc_startblock != *agbno) { 95131727258SDarrick J. Wong tmp.rc_startblock = *agbno; 95231727258SDarrick J. Wong tmp.rc_blockcount = min(*aglen, 95331727258SDarrick J. Wong ext.rc_startblock - *agbno); 95431727258SDarrick J. Wong tmp.rc_refcount = 1 + adj; 95531727258SDarrick J. Wong trace_xfs_refcount_modify_extent(cur->bc_mp, 95650f02fe3SDave Chinner cur->bc_ag.pag->pag_agno, &tmp); 95731727258SDarrick J. Wong 95831727258SDarrick J. Wong /* 95931727258SDarrick J. Wong * Either cover the hole (increment) or 96031727258SDarrick J. Wong * delete the range (decrement). 96131727258SDarrick J. Wong */ 96231727258SDarrick J. Wong if (tmp.rc_refcount) { 96331727258SDarrick J. Wong error = xfs_refcount_insert(cur, &tmp, 96431727258SDarrick J. Wong &found_tmp); 96531727258SDarrick J. Wong if (error) 96631727258SDarrick J. Wong goto out_error; 967f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, 968f9e03706SDarrick J. Wong found_tmp != 1)) { 969f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 970f9e03706SDarrick J. Wong goto out_error; 971f9e03706SDarrick J. Wong } 972c4aa10d0SDave Chinner cur->bc_ag.refc.nr_ops++; 97331727258SDarrick J. Wong } else { 97431727258SDarrick J. Wong fsbno = XFS_AGB_TO_FSB(cur->bc_mp, 97550f02fe3SDave Chinner cur->bc_ag.pag->pag_agno, 97631727258SDarrick J. Wong tmp.rc_startblock); 9770f37d178SBrian Foster xfs_bmap_add_free(cur->bc_tp, fsbno, 97831727258SDarrick J. Wong tmp.rc_blockcount, oinfo); 97931727258SDarrick J. Wong } 98031727258SDarrick J. Wong 98131727258SDarrick J. Wong (*agbno) += tmp.rc_blockcount; 98231727258SDarrick J. Wong (*aglen) -= tmp.rc_blockcount; 98331727258SDarrick J. Wong 98431727258SDarrick J. Wong error = xfs_refcount_lookup_ge(cur, *agbno, 98531727258SDarrick J. Wong &found_rec); 98631727258SDarrick J. Wong if (error) 98731727258SDarrick J. Wong goto out_error; 98831727258SDarrick J. Wong } 98931727258SDarrick J. Wong 99031727258SDarrick J. Wong /* Stop if there's nothing left to modify */ 99131727258SDarrick J. Wong if (*aglen == 0 || !xfs_refcount_still_have_space(cur)) 99231727258SDarrick J. Wong break; 99331727258SDarrick J. Wong 99431727258SDarrick J. Wong /* 99531727258SDarrick J. Wong * Adjust the reference count and either update the tree 99631727258SDarrick J. Wong * (incr) or free the blocks (decr). 99731727258SDarrick J. Wong */ 99831727258SDarrick J. Wong if (ext.rc_refcount == MAXREFCOUNT) 99931727258SDarrick J. Wong goto skip; 100031727258SDarrick J. Wong ext.rc_refcount += adj; 100131727258SDarrick J. Wong trace_xfs_refcount_modify_extent(cur->bc_mp, 100250f02fe3SDave Chinner cur->bc_ag.pag->pag_agno, &ext); 100331727258SDarrick J. Wong if (ext.rc_refcount > 1) { 100431727258SDarrick J. Wong error = xfs_refcount_update(cur, &ext); 100531727258SDarrick J. Wong if (error) 100631727258SDarrick J. Wong goto out_error; 1007c4aa10d0SDave Chinner cur->bc_ag.refc.nr_ops++; 100831727258SDarrick J. Wong } else if (ext.rc_refcount == 1) { 100931727258SDarrick J. Wong error = xfs_refcount_delete(cur, &found_rec); 101031727258SDarrick J. Wong if (error) 101131727258SDarrick J. Wong goto out_error; 1012f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, found_rec != 1)) { 1013f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 1014f9e03706SDarrick J. Wong goto out_error; 1015f9e03706SDarrick J. Wong } 1016c4aa10d0SDave Chinner cur->bc_ag.refc.nr_ops++; 101731727258SDarrick J. Wong goto advloop; 101831727258SDarrick J. Wong } else { 101931727258SDarrick J. Wong fsbno = XFS_AGB_TO_FSB(cur->bc_mp, 102050f02fe3SDave Chinner cur->bc_ag.pag->pag_agno, 102131727258SDarrick J. Wong ext.rc_startblock); 10220f37d178SBrian Foster xfs_bmap_add_free(cur->bc_tp, fsbno, ext.rc_blockcount, 10230f37d178SBrian Foster oinfo); 102431727258SDarrick J. Wong } 102531727258SDarrick J. Wong 102631727258SDarrick J. Wong skip: 102731727258SDarrick J. Wong error = xfs_btree_increment(cur, 0, &found_rec); 102831727258SDarrick J. Wong if (error) 102931727258SDarrick J. Wong goto out_error; 103031727258SDarrick J. Wong 103131727258SDarrick J. Wong advloop: 103231727258SDarrick J. Wong (*agbno) += ext.rc_blockcount; 103331727258SDarrick J. Wong (*aglen) -= ext.rc_blockcount; 103431727258SDarrick J. Wong } 103531727258SDarrick J. Wong 103631727258SDarrick J. Wong return error; 103731727258SDarrick J. Wong out_error: 103831727258SDarrick J. Wong trace_xfs_refcount_modify_extent_error(cur->bc_mp, 103950f02fe3SDave Chinner cur->bc_ag.pag->pag_agno, error, _RET_IP_); 104031727258SDarrick J. Wong return error; 104131727258SDarrick J. Wong } 104231727258SDarrick J. Wong 104331727258SDarrick J. Wong /* Adjust the reference count of a range of AG blocks. */ 104431727258SDarrick J. Wong STATIC int 104531727258SDarrick J. Wong xfs_refcount_adjust( 104631727258SDarrick J. Wong struct xfs_btree_cur *cur, 104731727258SDarrick J. Wong xfs_agblock_t agbno, 104831727258SDarrick J. Wong xfs_extlen_t aglen, 104931727258SDarrick J. Wong xfs_agblock_t *new_agbno, 105031727258SDarrick J. Wong xfs_extlen_t *new_aglen, 105131727258SDarrick J. Wong enum xfs_refc_adjust_op adj, 105231727258SDarrick J. Wong struct xfs_owner_info *oinfo) 105331727258SDarrick J. Wong { 105431727258SDarrick J. Wong bool shape_changed; 105531727258SDarrick J. Wong int shape_changes = 0; 105631727258SDarrick J. Wong int error; 105731727258SDarrick J. Wong 105831727258SDarrick J. Wong *new_agbno = agbno; 105931727258SDarrick J. Wong *new_aglen = aglen; 106031727258SDarrick J. Wong if (adj == XFS_REFCOUNT_ADJUST_INCREASE) 106150f02fe3SDave Chinner trace_xfs_refcount_increase(cur->bc_mp, cur->bc_ag.pag->pag_agno, 106231727258SDarrick J. Wong agbno, aglen); 106331727258SDarrick J. Wong else 106450f02fe3SDave Chinner trace_xfs_refcount_decrease(cur->bc_mp, cur->bc_ag.pag->pag_agno, 106531727258SDarrick J. Wong agbno, aglen); 106631727258SDarrick J. Wong 106731727258SDarrick J. Wong /* 106831727258SDarrick J. Wong * Ensure that no rcextents cross the boundary of the adjustment range. 106931727258SDarrick J. Wong */ 107031727258SDarrick J. Wong error = xfs_refcount_split_extent(cur, agbno, &shape_changed); 107131727258SDarrick J. Wong if (error) 107231727258SDarrick J. Wong goto out_error; 107331727258SDarrick J. Wong if (shape_changed) 107431727258SDarrick J. Wong shape_changes++; 107531727258SDarrick J. Wong 107631727258SDarrick J. Wong error = xfs_refcount_split_extent(cur, agbno + aglen, &shape_changed); 107731727258SDarrick J. Wong if (error) 107831727258SDarrick J. Wong goto out_error; 107931727258SDarrick J. Wong if (shape_changed) 108031727258SDarrick J. Wong shape_changes++; 108131727258SDarrick J. Wong 108231727258SDarrick J. Wong /* 108331727258SDarrick J. Wong * Try to merge with the left or right extents of the range. 108431727258SDarrick J. Wong */ 108531727258SDarrick J. Wong error = xfs_refcount_merge_extents(cur, new_agbno, new_aglen, adj, 1086174edb0eSDarrick J. Wong XFS_FIND_RCEXT_SHARED, &shape_changed); 108731727258SDarrick J. Wong if (error) 108831727258SDarrick J. Wong goto out_error; 108931727258SDarrick J. Wong if (shape_changed) 109031727258SDarrick J. Wong shape_changes++; 109131727258SDarrick J. Wong if (shape_changes) 1092c4aa10d0SDave Chinner cur->bc_ag.refc.shape_changes++; 109331727258SDarrick J. Wong 109431727258SDarrick J. Wong /* Now that we've taken care of the ends, adjust the middle extents */ 109531727258SDarrick J. Wong error = xfs_refcount_adjust_extents(cur, new_agbno, new_aglen, 10960f37d178SBrian Foster adj, oinfo); 109731727258SDarrick J. Wong if (error) 109831727258SDarrick J. Wong goto out_error; 109931727258SDarrick J. Wong 110031727258SDarrick J. Wong return 0; 110131727258SDarrick J. Wong 110231727258SDarrick J. Wong out_error: 110350f02fe3SDave Chinner trace_xfs_refcount_adjust_error(cur->bc_mp, cur->bc_ag.pag->pag_agno, 110431727258SDarrick J. Wong error, _RET_IP_); 110531727258SDarrick J. Wong return error; 110631727258SDarrick J. Wong } 110733ba6129SDarrick J. Wong 110833ba6129SDarrick J. Wong /* Clean up after calling xfs_refcount_finish_one. */ 110933ba6129SDarrick J. Wong void 111033ba6129SDarrick J. Wong xfs_refcount_finish_one_cleanup( 111133ba6129SDarrick J. Wong struct xfs_trans *tp, 111233ba6129SDarrick J. Wong struct xfs_btree_cur *rcur, 111333ba6129SDarrick J. Wong int error) 111433ba6129SDarrick J. Wong { 111533ba6129SDarrick J. Wong struct xfs_buf *agbp; 111633ba6129SDarrick J. Wong 111733ba6129SDarrick J. Wong if (rcur == NULL) 111833ba6129SDarrick J. Wong return; 1119576af732SDave Chinner agbp = rcur->bc_ag.agbp; 11200b04b6b8SDarrick J. Wong xfs_btree_del_cursor(rcur, error); 112133ba6129SDarrick J. Wong if (error) 112233ba6129SDarrick J. Wong xfs_trans_brelse(tp, agbp); 112333ba6129SDarrick J. Wong } 112433ba6129SDarrick J. Wong 112533ba6129SDarrick J. Wong /* 112633ba6129SDarrick J. Wong * Process one of the deferred refcount operations. We pass back the 112733ba6129SDarrick J. Wong * btree cursor to maintain our lock on the btree between calls. 112833ba6129SDarrick J. Wong * This saves time and eliminates a buffer deadlock between the 112933ba6129SDarrick J. Wong * superblock and the AGF because we'll always grab them in the same 113033ba6129SDarrick J. Wong * order. 113133ba6129SDarrick J. Wong */ 113233ba6129SDarrick J. Wong int 113333ba6129SDarrick J. Wong xfs_refcount_finish_one( 113433ba6129SDarrick J. Wong struct xfs_trans *tp, 113533ba6129SDarrick J. Wong enum xfs_refcount_intent_type type, 113633ba6129SDarrick J. Wong xfs_fsblock_t startblock, 113733ba6129SDarrick J. Wong xfs_extlen_t blockcount, 113833ba6129SDarrick J. Wong xfs_fsblock_t *new_fsb, 113933ba6129SDarrick J. Wong xfs_extlen_t *new_len, 114033ba6129SDarrick J. Wong struct xfs_btree_cur **pcur) 114133ba6129SDarrick J. Wong { 114233ba6129SDarrick J. Wong struct xfs_mount *mp = tp->t_mountp; 114333ba6129SDarrick J. Wong struct xfs_btree_cur *rcur; 114433ba6129SDarrick J. Wong struct xfs_buf *agbp = NULL; 114533ba6129SDarrick J. Wong int error = 0; 114633ba6129SDarrick J. Wong xfs_agblock_t bno; 114733ba6129SDarrick J. Wong xfs_agblock_t new_agbno; 114833ba6129SDarrick J. Wong unsigned long nr_ops = 0; 114933ba6129SDarrick J. Wong int shape_changes = 0; 1150a81a0621SDave Chinner struct xfs_perag *pag; 115133ba6129SDarrick J. Wong 1152a81a0621SDave Chinner pag = xfs_perag_get(mp, XFS_FSB_TO_AGNO(mp, startblock)); 115333ba6129SDarrick J. Wong bno = XFS_FSB_TO_AGBNO(mp, startblock); 115433ba6129SDarrick J. Wong 115533ba6129SDarrick J. Wong trace_xfs_refcount_deferred(mp, XFS_FSB_TO_AGNO(mp, startblock), 115633ba6129SDarrick J. Wong type, XFS_FSB_TO_AGBNO(mp, startblock), 115733ba6129SDarrick J. Wong blockcount); 115833ba6129SDarrick J. Wong 1159a81a0621SDave Chinner if (XFS_TEST_ERROR(false, mp, XFS_ERRTAG_REFCOUNT_FINISH_ONE)) { 1160a81a0621SDave Chinner error = -EIO; 1161a81a0621SDave Chinner goto out_drop; 1162a81a0621SDave Chinner } 116333ba6129SDarrick J. Wong 116433ba6129SDarrick J. Wong /* 116533ba6129SDarrick J. Wong * If we haven't gotten a cursor or the cursor AG doesn't match 116633ba6129SDarrick J. Wong * the startblock, get one now. 116733ba6129SDarrick J. Wong */ 116833ba6129SDarrick J. Wong rcur = *pcur; 1169a81a0621SDave Chinner if (rcur != NULL && rcur->bc_ag.pag != pag) { 1170c4aa10d0SDave Chinner nr_ops = rcur->bc_ag.refc.nr_ops; 1171c4aa10d0SDave Chinner shape_changes = rcur->bc_ag.refc.shape_changes; 117233ba6129SDarrick J. Wong xfs_refcount_finish_one_cleanup(tp, rcur, 0); 117333ba6129SDarrick J. Wong rcur = NULL; 117433ba6129SDarrick J. Wong *pcur = NULL; 117533ba6129SDarrick J. Wong } 117633ba6129SDarrick J. Wong if (rcur == NULL) { 1177a81a0621SDave Chinner error = xfs_alloc_read_agf(tp->t_mountp, tp, pag->pag_agno, 117833ba6129SDarrick J. Wong XFS_ALLOC_FLAG_FREEING, &agbp); 117933ba6129SDarrick J. Wong if (error) 1180a81a0621SDave Chinner goto out_drop; 118133ba6129SDarrick J. Wong 1182a81a0621SDave Chinner rcur = xfs_refcountbt_init_cursor(mp, tp, agbp, pag); 1183c4aa10d0SDave Chinner rcur->bc_ag.refc.nr_ops = nr_ops; 1184c4aa10d0SDave Chinner rcur->bc_ag.refc.shape_changes = shape_changes; 118533ba6129SDarrick J. Wong } 118633ba6129SDarrick J. Wong *pcur = rcur; 118733ba6129SDarrick J. Wong 118833ba6129SDarrick J. Wong switch (type) { 118933ba6129SDarrick J. Wong case XFS_REFCOUNT_INCREASE: 119033ba6129SDarrick J. Wong error = xfs_refcount_adjust(rcur, bno, blockcount, &new_agbno, 11910f37d178SBrian Foster new_len, XFS_REFCOUNT_ADJUST_INCREASE, NULL); 1192a81a0621SDave Chinner *new_fsb = XFS_AGB_TO_FSB(mp, pag->pag_agno, new_agbno); 119333ba6129SDarrick J. Wong break; 119433ba6129SDarrick J. Wong case XFS_REFCOUNT_DECREASE: 119533ba6129SDarrick J. Wong error = xfs_refcount_adjust(rcur, bno, blockcount, &new_agbno, 11960f37d178SBrian Foster new_len, XFS_REFCOUNT_ADJUST_DECREASE, NULL); 1197a81a0621SDave Chinner *new_fsb = XFS_AGB_TO_FSB(mp, pag->pag_agno, new_agbno); 119833ba6129SDarrick J. Wong break; 1199174edb0eSDarrick J. Wong case XFS_REFCOUNT_ALLOC_COW: 1200174edb0eSDarrick J. Wong *new_fsb = startblock + blockcount; 1201174edb0eSDarrick J. Wong *new_len = 0; 12020f37d178SBrian Foster error = __xfs_refcount_cow_alloc(rcur, bno, blockcount); 1203174edb0eSDarrick J. Wong break; 1204174edb0eSDarrick J. Wong case XFS_REFCOUNT_FREE_COW: 1205174edb0eSDarrick J. Wong *new_fsb = startblock + blockcount; 1206174edb0eSDarrick J. Wong *new_len = 0; 12070f37d178SBrian Foster error = __xfs_refcount_cow_free(rcur, bno, blockcount); 1208174edb0eSDarrick J. Wong break; 120933ba6129SDarrick J. Wong default: 121033ba6129SDarrick J. Wong ASSERT(0); 121133ba6129SDarrick J. Wong error = -EFSCORRUPTED; 121233ba6129SDarrick J. Wong } 121333ba6129SDarrick J. Wong if (!error && *new_len > 0) 1214a81a0621SDave Chinner trace_xfs_refcount_finish_one_leftover(mp, pag->pag_agno, type, 121533ba6129SDarrick J. Wong bno, blockcount, new_agbno, *new_len); 1216a81a0621SDave Chinner out_drop: 1217a81a0621SDave Chinner xfs_perag_put(pag); 121833ba6129SDarrick J. Wong return error; 121933ba6129SDarrick J. Wong } 122033ba6129SDarrick J. Wong 122133ba6129SDarrick J. Wong /* 122233ba6129SDarrick J. Wong * Record a refcount intent for later processing. 122333ba6129SDarrick J. Wong */ 122474b4c5d4SDarrick J. Wong static void 122533ba6129SDarrick J. Wong __xfs_refcount_add( 12260f37d178SBrian Foster struct xfs_trans *tp, 122733ba6129SDarrick J. Wong enum xfs_refcount_intent_type type, 122833ba6129SDarrick J. Wong xfs_fsblock_t startblock, 122933ba6129SDarrick J. Wong xfs_extlen_t blockcount) 123033ba6129SDarrick J. Wong { 123133ba6129SDarrick J. Wong struct xfs_refcount_intent *ri; 123233ba6129SDarrick J. Wong 12330f37d178SBrian Foster trace_xfs_refcount_defer(tp->t_mountp, 12340f37d178SBrian Foster XFS_FSB_TO_AGNO(tp->t_mountp, startblock), 12350f37d178SBrian Foster type, XFS_FSB_TO_AGBNO(tp->t_mountp, startblock), 123633ba6129SDarrick J. Wong blockcount); 123733ba6129SDarrick J. Wong 123833ba6129SDarrick J. Wong ri = kmem_alloc(sizeof(struct xfs_refcount_intent), 1239707e0ddaSTetsuo Handa KM_NOFS); 124033ba6129SDarrick J. Wong INIT_LIST_HEAD(&ri->ri_list); 124133ba6129SDarrick J. Wong ri->ri_type = type; 124233ba6129SDarrick J. Wong ri->ri_startblock = startblock; 124333ba6129SDarrick J. Wong ri->ri_blockcount = blockcount; 124433ba6129SDarrick J. Wong 12450f37d178SBrian Foster xfs_defer_add(tp, XFS_DEFER_OPS_TYPE_REFCOUNT, &ri->ri_list); 124633ba6129SDarrick J. Wong } 124733ba6129SDarrick J. Wong 124833ba6129SDarrick J. Wong /* 124933ba6129SDarrick J. Wong * Increase the reference count of the blocks backing a file's extent. 125033ba6129SDarrick J. Wong */ 125174b4c5d4SDarrick J. Wong void 125233ba6129SDarrick J. Wong xfs_refcount_increase_extent( 12530f37d178SBrian Foster struct xfs_trans *tp, 125433ba6129SDarrick J. Wong struct xfs_bmbt_irec *PREV) 125533ba6129SDarrick J. Wong { 12560f37d178SBrian Foster if (!xfs_sb_version_hasreflink(&tp->t_mountp->m_sb)) 125774b4c5d4SDarrick J. Wong return; 125833ba6129SDarrick J. Wong 125974b4c5d4SDarrick J. Wong __xfs_refcount_add(tp, XFS_REFCOUNT_INCREASE, PREV->br_startblock, 126074b4c5d4SDarrick J. Wong PREV->br_blockcount); 126133ba6129SDarrick J. Wong } 126233ba6129SDarrick J. Wong 126333ba6129SDarrick J. Wong /* 126433ba6129SDarrick J. Wong * Decrease the reference count of the blocks backing a file's extent. 126533ba6129SDarrick J. Wong */ 126674b4c5d4SDarrick J. Wong void 126733ba6129SDarrick J. Wong xfs_refcount_decrease_extent( 12680f37d178SBrian Foster struct xfs_trans *tp, 126933ba6129SDarrick J. Wong struct xfs_bmbt_irec *PREV) 127033ba6129SDarrick J. Wong { 12710f37d178SBrian Foster if (!xfs_sb_version_hasreflink(&tp->t_mountp->m_sb)) 127274b4c5d4SDarrick J. Wong return; 127333ba6129SDarrick J. Wong 127474b4c5d4SDarrick J. Wong __xfs_refcount_add(tp, XFS_REFCOUNT_DECREASE, PREV->br_startblock, 127574b4c5d4SDarrick J. Wong PREV->br_blockcount); 127633ba6129SDarrick J. Wong } 1277350a27a6SDarrick J. Wong 1278350a27a6SDarrick J. Wong /* 1279350a27a6SDarrick J. Wong * Given an AG extent, find the lowest-numbered run of shared blocks 1280350a27a6SDarrick J. Wong * within that range and return the range in fbno/flen. If 1281350a27a6SDarrick J. Wong * find_end_of_shared is set, return the longest contiguous extent of 1282350a27a6SDarrick J. Wong * shared blocks; if not, just return the first extent we find. If no 1283350a27a6SDarrick J. Wong * shared blocks are found, fbno and flen will be set to NULLAGBLOCK 1284350a27a6SDarrick J. Wong * and 0, respectively. 1285350a27a6SDarrick J. Wong */ 1286350a27a6SDarrick J. Wong int 1287350a27a6SDarrick J. Wong xfs_refcount_find_shared( 1288350a27a6SDarrick J. Wong struct xfs_btree_cur *cur, 1289350a27a6SDarrick J. Wong xfs_agblock_t agbno, 1290350a27a6SDarrick J. Wong xfs_extlen_t aglen, 1291350a27a6SDarrick J. Wong xfs_agblock_t *fbno, 1292350a27a6SDarrick J. Wong xfs_extlen_t *flen, 1293350a27a6SDarrick J. Wong bool find_end_of_shared) 1294350a27a6SDarrick J. Wong { 1295350a27a6SDarrick J. Wong struct xfs_refcount_irec tmp; 1296350a27a6SDarrick J. Wong int i; 1297350a27a6SDarrick J. Wong int have; 1298350a27a6SDarrick J. Wong int error; 1299350a27a6SDarrick J. Wong 130050f02fe3SDave Chinner trace_xfs_refcount_find_shared(cur->bc_mp, cur->bc_ag.pag->pag_agno, 1301350a27a6SDarrick J. Wong agbno, aglen); 1302350a27a6SDarrick J. Wong 1303350a27a6SDarrick J. Wong /* By default, skip the whole range */ 1304350a27a6SDarrick J. Wong *fbno = NULLAGBLOCK; 1305350a27a6SDarrick J. Wong *flen = 0; 1306350a27a6SDarrick J. Wong 1307350a27a6SDarrick J. Wong /* Try to find a refcount extent that crosses the start */ 1308350a27a6SDarrick J. Wong error = xfs_refcount_lookup_le(cur, agbno, &have); 1309350a27a6SDarrick J. Wong if (error) 1310350a27a6SDarrick J. Wong goto out_error; 1311350a27a6SDarrick J. Wong if (!have) { 1312350a27a6SDarrick J. Wong /* No left extent, look at the next one */ 1313350a27a6SDarrick J. Wong error = xfs_btree_increment(cur, 0, &have); 1314350a27a6SDarrick J. Wong if (error) 1315350a27a6SDarrick J. Wong goto out_error; 1316350a27a6SDarrick J. Wong if (!have) 1317350a27a6SDarrick J. Wong goto done; 1318350a27a6SDarrick J. Wong } 1319350a27a6SDarrick J. Wong error = xfs_refcount_get_rec(cur, &tmp, &i); 1320350a27a6SDarrick J. Wong if (error) 1321350a27a6SDarrick J. Wong goto out_error; 1322f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, i != 1)) { 1323f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 1324f9e03706SDarrick J. Wong goto out_error; 1325f9e03706SDarrick J. Wong } 1326350a27a6SDarrick J. Wong 1327350a27a6SDarrick J. Wong /* If the extent ends before the start, look at the next one */ 1328350a27a6SDarrick J. Wong if (tmp.rc_startblock + tmp.rc_blockcount <= agbno) { 1329350a27a6SDarrick J. Wong error = xfs_btree_increment(cur, 0, &have); 1330350a27a6SDarrick J. Wong if (error) 1331350a27a6SDarrick J. Wong goto out_error; 1332350a27a6SDarrick J. Wong if (!have) 1333350a27a6SDarrick J. Wong goto done; 1334350a27a6SDarrick J. Wong error = xfs_refcount_get_rec(cur, &tmp, &i); 1335350a27a6SDarrick J. Wong if (error) 1336350a27a6SDarrick J. Wong goto out_error; 1337f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, i != 1)) { 1338f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 1339f9e03706SDarrick J. Wong goto out_error; 1340f9e03706SDarrick J. Wong } 1341350a27a6SDarrick J. Wong } 1342350a27a6SDarrick J. Wong 1343350a27a6SDarrick J. Wong /* If the extent starts after the range we want, bail out */ 1344350a27a6SDarrick J. Wong if (tmp.rc_startblock >= agbno + aglen) 1345350a27a6SDarrick J. Wong goto done; 1346350a27a6SDarrick J. Wong 1347350a27a6SDarrick J. Wong /* We found the start of a shared extent! */ 1348350a27a6SDarrick J. Wong if (tmp.rc_startblock < agbno) { 1349350a27a6SDarrick J. Wong tmp.rc_blockcount -= (agbno - tmp.rc_startblock); 1350350a27a6SDarrick J. Wong tmp.rc_startblock = agbno; 1351350a27a6SDarrick J. Wong } 1352350a27a6SDarrick J. Wong 1353350a27a6SDarrick J. Wong *fbno = tmp.rc_startblock; 1354350a27a6SDarrick J. Wong *flen = min(tmp.rc_blockcount, agbno + aglen - *fbno); 1355350a27a6SDarrick J. Wong if (!find_end_of_shared) 1356350a27a6SDarrick J. Wong goto done; 1357350a27a6SDarrick J. Wong 1358350a27a6SDarrick J. Wong /* Otherwise, find the end of this shared extent */ 1359350a27a6SDarrick J. Wong while (*fbno + *flen < agbno + aglen) { 1360350a27a6SDarrick J. Wong error = xfs_btree_increment(cur, 0, &have); 1361350a27a6SDarrick J. Wong if (error) 1362350a27a6SDarrick J. Wong goto out_error; 1363350a27a6SDarrick J. Wong if (!have) 1364350a27a6SDarrick J. Wong break; 1365350a27a6SDarrick J. Wong error = xfs_refcount_get_rec(cur, &tmp, &i); 1366350a27a6SDarrick J. Wong if (error) 1367350a27a6SDarrick J. Wong goto out_error; 1368f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, i != 1)) { 1369f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 1370f9e03706SDarrick J. Wong goto out_error; 1371f9e03706SDarrick J. Wong } 1372350a27a6SDarrick J. Wong if (tmp.rc_startblock >= agbno + aglen || 1373350a27a6SDarrick J. Wong tmp.rc_startblock != *fbno + *flen) 1374350a27a6SDarrick J. Wong break; 1375350a27a6SDarrick J. Wong *flen = min(*flen + tmp.rc_blockcount, agbno + aglen - *fbno); 1376350a27a6SDarrick J. Wong } 1377350a27a6SDarrick J. Wong 1378350a27a6SDarrick J. Wong done: 1379350a27a6SDarrick J. Wong trace_xfs_refcount_find_shared_result(cur->bc_mp, 138050f02fe3SDave Chinner cur->bc_ag.pag->pag_agno, *fbno, *flen); 1381350a27a6SDarrick J. Wong 1382350a27a6SDarrick J. Wong out_error: 1383350a27a6SDarrick J. Wong if (error) 1384350a27a6SDarrick J. Wong trace_xfs_refcount_find_shared_error(cur->bc_mp, 138550f02fe3SDave Chinner cur->bc_ag.pag->pag_agno, error, _RET_IP_); 1386350a27a6SDarrick J. Wong return error; 1387350a27a6SDarrick J. Wong } 1388174edb0eSDarrick J. Wong 1389174edb0eSDarrick J. Wong /* 1390174edb0eSDarrick J. Wong * Recovering CoW Blocks After a Crash 1391174edb0eSDarrick J. Wong * 1392174edb0eSDarrick J. Wong * Due to the way that the copy on write mechanism works, there's a window of 1393174edb0eSDarrick J. Wong * opportunity in which we can lose track of allocated blocks during a crash. 1394174edb0eSDarrick J. Wong * Because CoW uses delayed allocation in the in-core CoW fork, writeback 1395174edb0eSDarrick J. Wong * causes blocks to be allocated and stored in the CoW fork. The blocks are 1396174edb0eSDarrick J. Wong * no longer in the free space btree but are not otherwise recorded anywhere 1397174edb0eSDarrick J. Wong * until the write completes and the blocks are mapped into the file. A crash 1398174edb0eSDarrick J. Wong * in between allocation and remapping results in the replacement blocks being 1399174edb0eSDarrick J. Wong * lost. This situation is exacerbated by the CoW extent size hint because 1400174edb0eSDarrick J. Wong * allocations can hang around for long time. 1401174edb0eSDarrick J. Wong * 1402174edb0eSDarrick J. Wong * However, there is a place where we can record these allocations before they 1403174edb0eSDarrick J. Wong * become mappings -- the reference count btree. The btree does not record 1404174edb0eSDarrick J. Wong * extents with refcount == 1, so we can record allocations with a refcount of 1405174edb0eSDarrick J. Wong * 1. Blocks being used for CoW writeout cannot be shared, so there should be 1406174edb0eSDarrick J. Wong * no conflict with shared block records. These mappings should be created 1407174edb0eSDarrick J. Wong * when we allocate blocks to the CoW fork and deleted when they're removed 1408174edb0eSDarrick J. Wong * from the CoW fork. 1409174edb0eSDarrick J. Wong * 1410174edb0eSDarrick J. Wong * Minor nit: records for in-progress CoW allocations and records for shared 1411174edb0eSDarrick J. Wong * extents must never be merged, to preserve the property that (except for CoW 1412174edb0eSDarrick J. Wong * allocations) there are no refcount btree entries with refcount == 1. The 1413174edb0eSDarrick J. Wong * only time this could potentially happen is when unsharing a block that's 1414174edb0eSDarrick J. Wong * adjacent to CoW allocations, so we must be careful to avoid this. 1415174edb0eSDarrick J. Wong * 1416174edb0eSDarrick J. Wong * At mount time we recover lost CoW allocations by searching the refcount 1417174edb0eSDarrick J. Wong * btree for these refcount == 1 mappings. These represent CoW allocations 1418174edb0eSDarrick J. Wong * that were in progress at the time the filesystem went down, so we can free 1419174edb0eSDarrick J. Wong * them to get the space back. 1420174edb0eSDarrick J. Wong * 1421174edb0eSDarrick J. Wong * This mechanism is superior to creating EFIs for unmapped CoW extents for 1422174edb0eSDarrick J. Wong * several reasons -- first, EFIs pin the tail of the log and would have to be 1423174edb0eSDarrick J. Wong * periodically relogged to avoid filling up the log. Second, CoW completions 1424174edb0eSDarrick J. Wong * will have to file an EFD and create new EFIs for whatever remains in the 1425174edb0eSDarrick J. Wong * CoW fork; this partially takes care of (1) but extent-size reservations 1426174edb0eSDarrick J. Wong * will have to periodically relog even if there's no writeout in progress. 1427174edb0eSDarrick J. Wong * This can happen if the CoW extent size hint is set, which you really want. 1428174edb0eSDarrick J. Wong * Third, EFIs cannot currently be automatically relogged into newer 1429174edb0eSDarrick J. Wong * transactions to advance the log tail. Fourth, stuffing the log full of 1430174edb0eSDarrick J. Wong * EFIs places an upper bound on the number of CoW allocations that can be 1431174edb0eSDarrick J. Wong * held filesystem-wide at any given time. Recording them in the refcount 1432174edb0eSDarrick J. Wong * btree doesn't require us to maintain any state in memory and doesn't pin 1433174edb0eSDarrick J. Wong * the log. 1434174edb0eSDarrick J. Wong */ 1435174edb0eSDarrick J. Wong /* 1436174edb0eSDarrick J. Wong * Adjust the refcounts of CoW allocations. These allocations are "magic" 1437174edb0eSDarrick J. Wong * in that they're not referenced anywhere else in the filesystem, so we 1438174edb0eSDarrick J. Wong * stash them in the refcount btree with a refcount of 1 until either file 1439174edb0eSDarrick J. Wong * remapping (or CoW cancellation) happens. 1440174edb0eSDarrick J. Wong */ 1441174edb0eSDarrick J. Wong STATIC int 1442174edb0eSDarrick J. Wong xfs_refcount_adjust_cow_extents( 1443174edb0eSDarrick J. Wong struct xfs_btree_cur *cur, 1444174edb0eSDarrick J. Wong xfs_agblock_t agbno, 1445174edb0eSDarrick J. Wong xfs_extlen_t aglen, 1446a1f69417SEric Sandeen enum xfs_refc_adjust_op adj) 1447174edb0eSDarrick J. Wong { 1448174edb0eSDarrick J. Wong struct xfs_refcount_irec ext, tmp; 1449174edb0eSDarrick J. Wong int error; 1450174edb0eSDarrick J. Wong int found_rec, found_tmp; 1451174edb0eSDarrick J. Wong 1452174edb0eSDarrick J. Wong if (aglen == 0) 1453174edb0eSDarrick J. Wong return 0; 1454174edb0eSDarrick J. Wong 1455174edb0eSDarrick J. Wong /* Find any overlapping refcount records */ 1456174edb0eSDarrick J. Wong error = xfs_refcount_lookup_ge(cur, agbno, &found_rec); 1457174edb0eSDarrick J. Wong if (error) 1458174edb0eSDarrick J. Wong goto out_error; 1459174edb0eSDarrick J. Wong error = xfs_refcount_get_rec(cur, &ext, &found_rec); 1460174edb0eSDarrick J. Wong if (error) 1461174edb0eSDarrick J. Wong goto out_error; 1462174edb0eSDarrick J. Wong if (!found_rec) { 1463174edb0eSDarrick J. Wong ext.rc_startblock = cur->bc_mp->m_sb.sb_agblocks + 1464174edb0eSDarrick J. Wong XFS_REFC_COW_START; 1465174edb0eSDarrick J. Wong ext.rc_blockcount = 0; 1466174edb0eSDarrick J. Wong ext.rc_refcount = 0; 1467174edb0eSDarrick J. Wong } 1468174edb0eSDarrick J. Wong 1469174edb0eSDarrick J. Wong switch (adj) { 1470174edb0eSDarrick J. Wong case XFS_REFCOUNT_ADJUST_COW_ALLOC: 1471174edb0eSDarrick J. Wong /* Adding a CoW reservation, there should be nothing here. */ 1472f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, 1473f9e03706SDarrick J. Wong agbno + aglen > ext.rc_startblock)) { 1474f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 1475f9e03706SDarrick J. Wong goto out_error; 1476f9e03706SDarrick J. Wong } 1477174edb0eSDarrick J. Wong 1478174edb0eSDarrick J. Wong tmp.rc_startblock = agbno; 1479174edb0eSDarrick J. Wong tmp.rc_blockcount = aglen; 1480174edb0eSDarrick J. Wong tmp.rc_refcount = 1; 1481174edb0eSDarrick J. Wong trace_xfs_refcount_modify_extent(cur->bc_mp, 148250f02fe3SDave Chinner cur->bc_ag.pag->pag_agno, &tmp); 1483174edb0eSDarrick J. Wong 1484174edb0eSDarrick J. Wong error = xfs_refcount_insert(cur, &tmp, 1485174edb0eSDarrick J. Wong &found_tmp); 1486174edb0eSDarrick J. Wong if (error) 1487174edb0eSDarrick J. Wong goto out_error; 1488f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, found_tmp != 1)) { 1489f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 1490f9e03706SDarrick J. Wong goto out_error; 1491f9e03706SDarrick J. Wong } 1492174edb0eSDarrick J. Wong break; 1493174edb0eSDarrick J. Wong case XFS_REFCOUNT_ADJUST_COW_FREE: 1494174edb0eSDarrick J. Wong /* Removing a CoW reservation, there should be one extent. */ 1495f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, ext.rc_startblock != agbno)) { 1496f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 1497f9e03706SDarrick J. Wong goto out_error; 1498f9e03706SDarrick J. Wong } 1499f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, ext.rc_blockcount != aglen)) { 1500f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 1501f9e03706SDarrick J. Wong goto out_error; 1502f9e03706SDarrick J. Wong } 1503f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, ext.rc_refcount != 1)) { 1504f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 1505f9e03706SDarrick J. Wong goto out_error; 1506f9e03706SDarrick J. Wong } 1507174edb0eSDarrick J. Wong 1508174edb0eSDarrick J. Wong ext.rc_refcount = 0; 1509174edb0eSDarrick J. Wong trace_xfs_refcount_modify_extent(cur->bc_mp, 151050f02fe3SDave Chinner cur->bc_ag.pag->pag_agno, &ext); 1511174edb0eSDarrick J. Wong error = xfs_refcount_delete(cur, &found_rec); 1512174edb0eSDarrick J. Wong if (error) 1513174edb0eSDarrick J. Wong goto out_error; 1514f9e03706SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, found_rec != 1)) { 1515f9e03706SDarrick J. Wong error = -EFSCORRUPTED; 1516f9e03706SDarrick J. Wong goto out_error; 1517f9e03706SDarrick J. Wong } 1518174edb0eSDarrick J. Wong break; 1519174edb0eSDarrick J. Wong default: 1520174edb0eSDarrick J. Wong ASSERT(0); 1521174edb0eSDarrick J. Wong } 1522174edb0eSDarrick J. Wong 1523174edb0eSDarrick J. Wong return error; 1524174edb0eSDarrick J. Wong out_error: 1525174edb0eSDarrick J. Wong trace_xfs_refcount_modify_extent_error(cur->bc_mp, 152650f02fe3SDave Chinner cur->bc_ag.pag->pag_agno, error, _RET_IP_); 1527174edb0eSDarrick J. Wong return error; 1528174edb0eSDarrick J. Wong } 1529174edb0eSDarrick J. Wong 1530174edb0eSDarrick J. Wong /* 1531174edb0eSDarrick J. Wong * Add or remove refcount btree entries for CoW reservations. 1532174edb0eSDarrick J. Wong */ 1533174edb0eSDarrick J. Wong STATIC int 1534174edb0eSDarrick J. Wong xfs_refcount_adjust_cow( 1535174edb0eSDarrick J. Wong struct xfs_btree_cur *cur, 1536174edb0eSDarrick J. Wong xfs_agblock_t agbno, 1537174edb0eSDarrick J. Wong xfs_extlen_t aglen, 1538a1f69417SEric Sandeen enum xfs_refc_adjust_op adj) 1539174edb0eSDarrick J. Wong { 1540174edb0eSDarrick J. Wong bool shape_changed; 1541174edb0eSDarrick J. Wong int error; 1542174edb0eSDarrick J. Wong 1543174edb0eSDarrick J. Wong agbno += XFS_REFC_COW_START; 1544174edb0eSDarrick J. Wong 1545174edb0eSDarrick J. Wong /* 1546174edb0eSDarrick J. Wong * Ensure that no rcextents cross the boundary of the adjustment range. 1547174edb0eSDarrick J. Wong */ 1548174edb0eSDarrick J. Wong error = xfs_refcount_split_extent(cur, agbno, &shape_changed); 1549174edb0eSDarrick J. Wong if (error) 1550174edb0eSDarrick J. Wong goto out_error; 1551174edb0eSDarrick J. Wong 1552174edb0eSDarrick J. Wong error = xfs_refcount_split_extent(cur, agbno + aglen, &shape_changed); 1553174edb0eSDarrick J. Wong if (error) 1554174edb0eSDarrick J. Wong goto out_error; 1555174edb0eSDarrick J. Wong 1556174edb0eSDarrick J. Wong /* 1557174edb0eSDarrick J. Wong * Try to merge with the left or right extents of the range. 1558174edb0eSDarrick J. Wong */ 1559174edb0eSDarrick J. Wong error = xfs_refcount_merge_extents(cur, &agbno, &aglen, adj, 1560174edb0eSDarrick J. Wong XFS_FIND_RCEXT_COW, &shape_changed); 1561174edb0eSDarrick J. Wong if (error) 1562174edb0eSDarrick J. Wong goto out_error; 1563174edb0eSDarrick J. Wong 1564174edb0eSDarrick J. Wong /* Now that we've taken care of the ends, adjust the middle extents */ 1565a1f69417SEric Sandeen error = xfs_refcount_adjust_cow_extents(cur, agbno, aglen, adj); 1566174edb0eSDarrick J. Wong if (error) 1567174edb0eSDarrick J. Wong goto out_error; 1568174edb0eSDarrick J. Wong 1569174edb0eSDarrick J. Wong return 0; 1570174edb0eSDarrick J. Wong 1571174edb0eSDarrick J. Wong out_error: 157250f02fe3SDave Chinner trace_xfs_refcount_adjust_cow_error(cur->bc_mp, cur->bc_ag.pag->pag_agno, 1573174edb0eSDarrick J. Wong error, _RET_IP_); 1574174edb0eSDarrick J. Wong return error; 1575174edb0eSDarrick J. Wong } 1576174edb0eSDarrick J. Wong 1577174edb0eSDarrick J. Wong /* 1578174edb0eSDarrick J. Wong * Record a CoW allocation in the refcount btree. 1579174edb0eSDarrick J. Wong */ 1580174edb0eSDarrick J. Wong STATIC int 1581174edb0eSDarrick J. Wong __xfs_refcount_cow_alloc( 1582174edb0eSDarrick J. Wong struct xfs_btree_cur *rcur, 1583174edb0eSDarrick J. Wong xfs_agblock_t agbno, 15840f37d178SBrian Foster xfs_extlen_t aglen) 1585174edb0eSDarrick J. Wong { 158650f02fe3SDave Chinner trace_xfs_refcount_cow_increase(rcur->bc_mp, rcur->bc_ag.pag->pag_agno, 1587174edb0eSDarrick J. Wong agbno, aglen); 1588174edb0eSDarrick J. Wong 1589174edb0eSDarrick J. Wong /* Add refcount btree reservation */ 15900525e952SDarrick J. Wong return xfs_refcount_adjust_cow(rcur, agbno, aglen, 1591a1f69417SEric Sandeen XFS_REFCOUNT_ADJUST_COW_ALLOC); 1592174edb0eSDarrick J. Wong } 1593174edb0eSDarrick J. Wong 1594174edb0eSDarrick J. Wong /* 1595174edb0eSDarrick J. Wong * Remove a CoW allocation from the refcount btree. 1596174edb0eSDarrick J. Wong */ 1597174edb0eSDarrick J. Wong STATIC int 1598174edb0eSDarrick J. Wong __xfs_refcount_cow_free( 1599174edb0eSDarrick J. Wong struct xfs_btree_cur *rcur, 1600174edb0eSDarrick J. Wong xfs_agblock_t agbno, 16010f37d178SBrian Foster xfs_extlen_t aglen) 1602174edb0eSDarrick J. Wong { 160350f02fe3SDave Chinner trace_xfs_refcount_cow_decrease(rcur->bc_mp, rcur->bc_ag.pag->pag_agno, 1604174edb0eSDarrick J. Wong agbno, aglen); 1605174edb0eSDarrick J. Wong 1606174edb0eSDarrick J. Wong /* Remove refcount btree reservation */ 16070525e952SDarrick J. Wong return xfs_refcount_adjust_cow(rcur, agbno, aglen, 1608a1f69417SEric Sandeen XFS_REFCOUNT_ADJUST_COW_FREE); 1609174edb0eSDarrick J. Wong } 1610174edb0eSDarrick J. Wong 1611174edb0eSDarrick J. Wong /* Record a CoW staging extent in the refcount btree. */ 161274b4c5d4SDarrick J. Wong void 1613174edb0eSDarrick J. Wong xfs_refcount_alloc_cow_extent( 16140f37d178SBrian Foster struct xfs_trans *tp, 1615174edb0eSDarrick J. Wong xfs_fsblock_t fsb, 1616174edb0eSDarrick J. Wong xfs_extlen_t len) 1617174edb0eSDarrick J. Wong { 16180f37d178SBrian Foster struct xfs_mount *mp = tp->t_mountp; 16190525e952SDarrick J. Wong 1620174edb0eSDarrick J. Wong if (!xfs_sb_version_hasreflink(&mp->m_sb)) 162174b4c5d4SDarrick J. Wong return; 1622174edb0eSDarrick J. Wong 162374b4c5d4SDarrick J. Wong __xfs_refcount_add(tp, XFS_REFCOUNT_ALLOC_COW, fsb, len); 16240525e952SDarrick J. Wong 16250525e952SDarrick J. Wong /* Add rmap entry */ 1626bc46ac64SDarrick J. Wong xfs_rmap_alloc_extent(tp, XFS_FSB_TO_AGNO(mp, fsb), 16270525e952SDarrick J. Wong XFS_FSB_TO_AGBNO(mp, fsb), len, XFS_RMAP_OWN_COW); 1628174edb0eSDarrick J. Wong } 1629174edb0eSDarrick J. Wong 1630174edb0eSDarrick J. Wong /* Forget a CoW staging event in the refcount btree. */ 163174b4c5d4SDarrick J. Wong void 1632174edb0eSDarrick J. Wong xfs_refcount_free_cow_extent( 16330f37d178SBrian Foster struct xfs_trans *tp, 1634174edb0eSDarrick J. Wong xfs_fsblock_t fsb, 1635174edb0eSDarrick J. Wong xfs_extlen_t len) 1636174edb0eSDarrick J. Wong { 16370f37d178SBrian Foster struct xfs_mount *mp = tp->t_mountp; 16380525e952SDarrick J. Wong 1639174edb0eSDarrick J. Wong if (!xfs_sb_version_hasreflink(&mp->m_sb)) 164074b4c5d4SDarrick J. Wong return; 1641174edb0eSDarrick J. Wong 16420525e952SDarrick J. Wong /* Remove rmap entry */ 1643bc46ac64SDarrick J. Wong xfs_rmap_free_extent(tp, XFS_FSB_TO_AGNO(mp, fsb), 16440525e952SDarrick J. Wong XFS_FSB_TO_AGBNO(mp, fsb), len, XFS_RMAP_OWN_COW); 164574b4c5d4SDarrick J. Wong __xfs_refcount_add(tp, XFS_REFCOUNT_FREE_COW, fsb, len); 1646174edb0eSDarrick J. Wong } 1647174edb0eSDarrick J. Wong 1648174edb0eSDarrick J. Wong struct xfs_refcount_recovery { 1649174edb0eSDarrick J. Wong struct list_head rr_list; 1650174edb0eSDarrick J. Wong struct xfs_refcount_irec rr_rrec; 1651174edb0eSDarrick J. Wong }; 1652174edb0eSDarrick J. Wong 1653174edb0eSDarrick J. Wong /* Stuff an extent on the recovery list. */ 1654174edb0eSDarrick J. Wong STATIC int 1655174edb0eSDarrick J. Wong xfs_refcount_recover_extent( 1656174edb0eSDarrick J. Wong struct xfs_btree_cur *cur, 1657*159eb69dSDarrick J. Wong const union xfs_btree_rec *rec, 1658174edb0eSDarrick J. Wong void *priv) 1659174edb0eSDarrick J. Wong { 1660174edb0eSDarrick J. Wong struct list_head *debris = priv; 1661174edb0eSDarrick J. Wong struct xfs_refcount_recovery *rr; 1662174edb0eSDarrick J. Wong 1663a71895c5SDarrick J. Wong if (XFS_IS_CORRUPT(cur->bc_mp, 1664a71895c5SDarrick J. Wong be32_to_cpu(rec->refc.rc_refcount) != 1)) 1665174edb0eSDarrick J. Wong return -EFSCORRUPTED; 1666174edb0eSDarrick J. Wong 1667707e0ddaSTetsuo Handa rr = kmem_alloc(sizeof(struct xfs_refcount_recovery), 0); 1668174edb0eSDarrick J. Wong xfs_refcount_btrec_to_irec(rec, &rr->rr_rrec); 1669174edb0eSDarrick J. Wong list_add_tail(&rr->rr_list, debris); 1670174edb0eSDarrick J. Wong 1671174edb0eSDarrick J. Wong return 0; 1672174edb0eSDarrick J. Wong } 1673174edb0eSDarrick J. Wong 1674174edb0eSDarrick J. Wong /* Find and remove leftover CoW reservations. */ 1675174edb0eSDarrick J. Wong int 1676174edb0eSDarrick J. Wong xfs_refcount_recover_cow_leftovers( 1677174edb0eSDarrick J. Wong struct xfs_mount *mp, 1678a81a0621SDave Chinner struct xfs_perag *pag) 1679174edb0eSDarrick J. Wong { 1680174edb0eSDarrick J. Wong struct xfs_trans *tp; 1681174edb0eSDarrick J. Wong struct xfs_btree_cur *cur; 1682174edb0eSDarrick J. Wong struct xfs_buf *agbp; 1683174edb0eSDarrick J. Wong struct xfs_refcount_recovery *rr, *n; 1684174edb0eSDarrick J. Wong struct list_head debris; 1685174edb0eSDarrick J. Wong union xfs_btree_irec low; 1686174edb0eSDarrick J. Wong union xfs_btree_irec high; 1687174edb0eSDarrick J. Wong xfs_fsblock_t fsb; 1688174edb0eSDarrick J. Wong xfs_agblock_t agbno; 1689174edb0eSDarrick J. Wong int error; 1690174edb0eSDarrick J. Wong 1691174edb0eSDarrick J. Wong if (mp->m_sb.sb_agblocks >= XFS_REFC_COW_START) 1692174edb0eSDarrick J. Wong return -EOPNOTSUPP; 1693174edb0eSDarrick J. Wong 16943ecb3ac7SDarrick J. Wong INIT_LIST_HEAD(&debris); 16953ecb3ac7SDarrick J. Wong 16963ecb3ac7SDarrick J. Wong /* 16973ecb3ac7SDarrick J. Wong * In this first part, we use an empty transaction to gather up 16983ecb3ac7SDarrick J. Wong * all the leftover CoW extents so that we can subsequently 16993ecb3ac7SDarrick J. Wong * delete them. The empty transaction is used to avoid 17003ecb3ac7SDarrick J. Wong * a buffer lock deadlock if there happens to be a loop in the 17013ecb3ac7SDarrick J. Wong * refcountbt because we're allowed to re-grab a buffer that is 17023ecb3ac7SDarrick J. Wong * already attached to our transaction. When we're done 17033ecb3ac7SDarrick J. Wong * recording the CoW debris we cancel the (empty) transaction 17043ecb3ac7SDarrick J. Wong * and everything goes away cleanly. 17053ecb3ac7SDarrick J. Wong */ 17063ecb3ac7SDarrick J. Wong error = xfs_trans_alloc_empty(mp, &tp); 1707174edb0eSDarrick J. Wong if (error) 1708174edb0eSDarrick J. Wong return error; 17093ecb3ac7SDarrick J. Wong 1710a81a0621SDave Chinner error = xfs_alloc_read_agf(mp, tp, pag->pag_agno, 0, &agbp); 17113ecb3ac7SDarrick J. Wong if (error) 17123ecb3ac7SDarrick J. Wong goto out_trans; 1713a81a0621SDave Chinner cur = xfs_refcountbt_init_cursor(mp, tp, agbp, pag); 1714174edb0eSDarrick J. Wong 1715174edb0eSDarrick J. Wong /* Find all the leftover CoW staging extents. */ 1716174edb0eSDarrick J. Wong memset(&low, 0, sizeof(low)); 1717174edb0eSDarrick J. Wong memset(&high, 0, sizeof(high)); 1718174edb0eSDarrick J. Wong low.rc.rc_startblock = XFS_REFC_COW_START; 1719174edb0eSDarrick J. Wong high.rc.rc_startblock = -1U; 1720174edb0eSDarrick J. Wong error = xfs_btree_query_range(cur, &low, &high, 1721174edb0eSDarrick J. Wong xfs_refcount_recover_extent, &debris); 1722ef97ef26SDarrick J. Wong xfs_btree_del_cursor(cur, error); 17233ecb3ac7SDarrick J. Wong xfs_trans_brelse(tp, agbp); 17243ecb3ac7SDarrick J. Wong xfs_trans_cancel(tp); 1725ef97ef26SDarrick J. Wong if (error) 1726ef97ef26SDarrick J. Wong goto out_free; 1727174edb0eSDarrick J. Wong 1728174edb0eSDarrick J. Wong /* Now iterate the list to free the leftovers */ 17293ecb3ac7SDarrick J. Wong list_for_each_entry_safe(rr, n, &debris, rr_list) { 1730174edb0eSDarrick J. Wong /* Set up transaction. */ 1731174edb0eSDarrick J. Wong error = xfs_trans_alloc(mp, &M_RES(mp)->tr_write, 0, 0, 0, &tp); 1732174edb0eSDarrick J. Wong if (error) 1733174edb0eSDarrick J. Wong goto out_free; 1734174edb0eSDarrick J. Wong 1735a81a0621SDave Chinner trace_xfs_refcount_recover_extent(mp, pag->pag_agno, 1736a81a0621SDave Chinner &rr->rr_rrec); 1737174edb0eSDarrick J. Wong 1738174edb0eSDarrick J. Wong /* Free the orphan record */ 1739174edb0eSDarrick J. Wong agbno = rr->rr_rrec.rc_startblock - XFS_REFC_COW_START; 1740a81a0621SDave Chinner fsb = XFS_AGB_TO_FSB(mp, pag->pag_agno, agbno); 174174b4c5d4SDarrick J. Wong xfs_refcount_free_cow_extent(tp, fsb, 1742174edb0eSDarrick J. Wong rr->rr_rrec.rc_blockcount); 1743174edb0eSDarrick J. Wong 1744174edb0eSDarrick J. Wong /* Free the block. */ 17450f37d178SBrian Foster xfs_bmap_add_free(tp, fsb, rr->rr_rrec.rc_blockcount, NULL); 1746174edb0eSDarrick J. Wong 1747174edb0eSDarrick J. Wong error = xfs_trans_commit(tp); 1748174edb0eSDarrick J. Wong if (error) 1749174edb0eSDarrick J. Wong goto out_free; 17503ecb3ac7SDarrick J. Wong 17513ecb3ac7SDarrick J. Wong list_del(&rr->rr_list); 17523ecb3ac7SDarrick J. Wong kmem_free(rr); 17536f97077fSDarrick J. Wong } 1754174edb0eSDarrick J. Wong 17553ecb3ac7SDarrick J. Wong return error; 17563ecb3ac7SDarrick J. Wong out_trans: 17573ecb3ac7SDarrick J. Wong xfs_trans_cancel(tp); 1758174edb0eSDarrick J. Wong out_free: 1759174edb0eSDarrick J. Wong /* Free the leftover list */ 1760174edb0eSDarrick J. Wong list_for_each_entry_safe(rr, n, &debris, rr_list) { 1761174edb0eSDarrick J. Wong list_del(&rr->rr_list); 1762174edb0eSDarrick J. Wong kmem_free(rr); 1763174edb0eSDarrick J. Wong } 1764174edb0eSDarrick J. Wong return error; 1765174edb0eSDarrick J. Wong } 176649db55ecSDarrick J. Wong 176749db55ecSDarrick J. Wong /* Is there a record covering a given extent? */ 176849db55ecSDarrick J. Wong int 176949db55ecSDarrick J. Wong xfs_refcount_has_record( 177049db55ecSDarrick J. Wong struct xfs_btree_cur *cur, 177149db55ecSDarrick J. Wong xfs_agblock_t bno, 177249db55ecSDarrick J. Wong xfs_extlen_t len, 177349db55ecSDarrick J. Wong bool *exists) 177449db55ecSDarrick J. Wong { 177549db55ecSDarrick J. Wong union xfs_btree_irec low; 177649db55ecSDarrick J. Wong union xfs_btree_irec high; 177749db55ecSDarrick J. Wong 177849db55ecSDarrick J. Wong memset(&low, 0, sizeof(low)); 177949db55ecSDarrick J. Wong low.rc.rc_startblock = bno; 178049db55ecSDarrick J. Wong memset(&high, 0xFF, sizeof(high)); 178149db55ecSDarrick J. Wong high.rc.rc_startblock = bno + len - 1; 178249db55ecSDarrick J. Wong 178349db55ecSDarrick J. Wong return xfs_btree_has_record(cur, &low, &high, exists); 178449db55ecSDarrick J. Wong } 1785