1b16817b6SDave Chinner /* SPDX-License-Identifier: GPL-2.0 */ 2b16817b6SDave Chinner /* 3b16817b6SDave Chinner * Copyright (c) 2000-2005 Silicon Graphics, Inc. 4b16817b6SDave Chinner * Copyright (c) 2018 Red Hat, Inc. 5b16817b6SDave Chinner * All rights reserved. 6b16817b6SDave Chinner */ 7b16817b6SDave Chinner 8b16817b6SDave Chinner #include "xfs.h" 9b16817b6SDave Chinner #include "xfs_fs.h" 10b16817b6SDave Chinner #include "xfs_shared.h" 11b16817b6SDave Chinner #include "xfs_format.h" 12b16817b6SDave Chinner #include "xfs_trans_resv.h" 13f327a007SDarrick J. Wong #include "xfs_bit.h" 14b16817b6SDave Chinner #include "xfs_sb.h" 15b16817b6SDave Chinner #include "xfs_mount.h" 16b16817b6SDave Chinner #include "xfs_btree.h" 17b16817b6SDave Chinner #include "xfs_alloc_btree.h" 18b16817b6SDave Chinner #include "xfs_rmap_btree.h" 19b16817b6SDave Chinner #include "xfs_alloc.h" 2049dd56f2SDave Chinner #include "xfs_ialloc.h" 21b16817b6SDave Chinner #include "xfs_rmap.h" 22b16817b6SDave Chinner #include "xfs_ag.h" 237cd5006bSDarrick J. Wong #include "xfs_ag_resv.h" 241302c6a2SDarrick J. Wong #include "xfs_health.h" 2546141dc8SGao Xiang #include "xfs_error.h" 2646141dc8SGao Xiang #include "xfs_bmap.h" 2746141dc8SGao Xiang #include "xfs_defer.h" 2846141dc8SGao Xiang #include "xfs_log_format.h" 2946141dc8SGao Xiang #include "xfs_trans.h" 309bbafc71SDave Chinner #include "xfs_trace.h" 3107b6403aSDave Chinner #include "xfs_inode.h" 3207b6403aSDave Chinner #include "xfs_icache.h" 3307b6403aSDave Chinner 349bbafc71SDave Chinner 359bbafc71SDave Chinner /* 369bbafc71SDave Chinner * Passive reference counting access wrappers to the perag structures. If the 379bbafc71SDave Chinner * per-ag structure is to be freed, the freeing code is responsible for cleaning 389bbafc71SDave Chinner * up objects with passive references before freeing the structure. This is 399bbafc71SDave Chinner * things like cached buffers. 409bbafc71SDave Chinner */ 419bbafc71SDave Chinner struct xfs_perag * 429bbafc71SDave Chinner xfs_perag_get( 439bbafc71SDave Chinner struct xfs_mount *mp, 449bbafc71SDave Chinner xfs_agnumber_t agno) 459bbafc71SDave Chinner { 469bbafc71SDave Chinner struct xfs_perag *pag; 479bbafc71SDave Chinner 489bbafc71SDave Chinner rcu_read_lock(); 499bbafc71SDave Chinner pag = radix_tree_lookup(&mp->m_perag_tree, agno); 509bbafc71SDave Chinner if (pag) { 51368e2d09SDave Chinner trace_xfs_perag_get(pag, _RET_IP_); 529bbafc71SDave Chinner ASSERT(atomic_read(&pag->pag_ref) >= 0); 53368e2d09SDave Chinner atomic_inc(&pag->pag_ref); 549bbafc71SDave Chinner } 559bbafc71SDave Chinner rcu_read_unlock(); 569bbafc71SDave Chinner return pag; 579bbafc71SDave Chinner } 589bbafc71SDave Chinner 599bbafc71SDave Chinner /* 609bbafc71SDave Chinner * search from @first to find the next perag with the given tag set. 619bbafc71SDave Chinner */ 629bbafc71SDave Chinner struct xfs_perag * 639bbafc71SDave Chinner xfs_perag_get_tag( 649bbafc71SDave Chinner struct xfs_mount *mp, 659bbafc71SDave Chinner xfs_agnumber_t first, 66ffc18582SDarrick J. Wong unsigned int tag) 679bbafc71SDave Chinner { 689bbafc71SDave Chinner struct xfs_perag *pag; 699bbafc71SDave Chinner int found; 709bbafc71SDave Chinner 719bbafc71SDave Chinner rcu_read_lock(); 729bbafc71SDave Chinner found = radix_tree_gang_lookup_tag(&mp->m_perag_tree, 739bbafc71SDave Chinner (void **)&pag, first, 1, tag); 749bbafc71SDave Chinner if (found <= 0) { 759bbafc71SDave Chinner rcu_read_unlock(); 769bbafc71SDave Chinner return NULL; 779bbafc71SDave Chinner } 78368e2d09SDave Chinner trace_xfs_perag_get_tag(pag, _RET_IP_); 79368e2d09SDave Chinner atomic_inc(&pag->pag_ref); 809bbafc71SDave Chinner rcu_read_unlock(); 819bbafc71SDave Chinner return pag; 829bbafc71SDave Chinner } 839bbafc71SDave Chinner 84*9b2e5a23SDarrick J. Wong /* Get a passive reference to the given perag. */ 85*9b2e5a23SDarrick J. Wong struct xfs_perag * 86*9b2e5a23SDarrick J. Wong xfs_perag_hold( 87*9b2e5a23SDarrick J. Wong struct xfs_perag *pag) 88*9b2e5a23SDarrick J. Wong { 89*9b2e5a23SDarrick J. Wong ASSERT(atomic_read(&pag->pag_ref) > 0 || 90*9b2e5a23SDarrick J. Wong atomic_read(&pag->pag_active_ref) > 0); 91*9b2e5a23SDarrick J. Wong 92*9b2e5a23SDarrick J. Wong trace_xfs_perag_hold(pag, _RET_IP_); 93*9b2e5a23SDarrick J. Wong atomic_inc(&pag->pag_ref); 94*9b2e5a23SDarrick J. Wong return pag; 95*9b2e5a23SDarrick J. Wong } 96*9b2e5a23SDarrick J. Wong 979bbafc71SDave Chinner void 989bbafc71SDave Chinner xfs_perag_put( 999bbafc71SDave Chinner struct xfs_perag *pag) 1009bbafc71SDave Chinner { 101368e2d09SDave Chinner trace_xfs_perag_put(pag, _RET_IP_); 1029bbafc71SDave Chinner ASSERT(atomic_read(&pag->pag_ref) > 0); 103368e2d09SDave Chinner atomic_dec(&pag->pag_ref); 1049bbafc71SDave Chinner } 1059bbafc71SDave Chinner 1069bbafc71SDave Chinner /* 107c4d5660aSDave Chinner * Active references for perag structures. This is for short term access to the 108c4d5660aSDave Chinner * per ag structures for walking trees or accessing state. If an AG is being 109c4d5660aSDave Chinner * shrunk or is offline, then this will fail to find that AG and return NULL 110c4d5660aSDave Chinner * instead. 111c4d5660aSDave Chinner */ 112c4d5660aSDave Chinner struct xfs_perag * 113c4d5660aSDave Chinner xfs_perag_grab( 114c4d5660aSDave Chinner struct xfs_mount *mp, 115c4d5660aSDave Chinner xfs_agnumber_t agno) 116c4d5660aSDave Chinner { 117c4d5660aSDave Chinner struct xfs_perag *pag; 118c4d5660aSDave Chinner 119c4d5660aSDave Chinner rcu_read_lock(); 120c4d5660aSDave Chinner pag = radix_tree_lookup(&mp->m_perag_tree, agno); 121c4d5660aSDave Chinner if (pag) { 122368e2d09SDave Chinner trace_xfs_perag_grab(pag, _RET_IP_); 123c4d5660aSDave Chinner if (!atomic_inc_not_zero(&pag->pag_active_ref)) 124c4d5660aSDave Chinner pag = NULL; 125c4d5660aSDave Chinner } 126c4d5660aSDave Chinner rcu_read_unlock(); 127c4d5660aSDave Chinner return pag; 128c4d5660aSDave Chinner } 129c4d5660aSDave Chinner 130c4d5660aSDave Chinner /* 131c4d5660aSDave Chinner * search from @first to find the next perag with the given tag set. 132c4d5660aSDave Chinner */ 133c4d5660aSDave Chinner struct xfs_perag * 134c4d5660aSDave Chinner xfs_perag_grab_tag( 135c4d5660aSDave Chinner struct xfs_mount *mp, 136c4d5660aSDave Chinner xfs_agnumber_t first, 137c4d5660aSDave Chinner int tag) 138c4d5660aSDave Chinner { 139c4d5660aSDave Chinner struct xfs_perag *pag; 140c4d5660aSDave Chinner int found; 141c4d5660aSDave Chinner 142c4d5660aSDave Chinner rcu_read_lock(); 143c4d5660aSDave Chinner found = radix_tree_gang_lookup_tag(&mp->m_perag_tree, 144c4d5660aSDave Chinner (void **)&pag, first, 1, tag); 145c4d5660aSDave Chinner if (found <= 0) { 146c4d5660aSDave Chinner rcu_read_unlock(); 147c4d5660aSDave Chinner return NULL; 148c4d5660aSDave Chinner } 149368e2d09SDave Chinner trace_xfs_perag_grab_tag(pag, _RET_IP_); 150c4d5660aSDave Chinner if (!atomic_inc_not_zero(&pag->pag_active_ref)) 151c4d5660aSDave Chinner pag = NULL; 152c4d5660aSDave Chinner rcu_read_unlock(); 153c4d5660aSDave Chinner return pag; 154c4d5660aSDave Chinner } 155c4d5660aSDave Chinner 156c4d5660aSDave Chinner void 157c4d5660aSDave Chinner xfs_perag_rele( 158c4d5660aSDave Chinner struct xfs_perag *pag) 159c4d5660aSDave Chinner { 160368e2d09SDave Chinner trace_xfs_perag_rele(pag, _RET_IP_); 161c4d5660aSDave Chinner if (atomic_dec_and_test(&pag->pag_active_ref)) 162c4d5660aSDave Chinner wake_up(&pag->pag_active_wq); 163c4d5660aSDave Chinner } 164c4d5660aSDave Chinner 165c4d5660aSDave Chinner /* 1669bbafc71SDave Chinner * xfs_initialize_perag_data 1679bbafc71SDave Chinner * 1689bbafc71SDave Chinner * Read in each per-ag structure so we can count up the number of 1699bbafc71SDave Chinner * allocated inodes, free inodes and used filesystem blocks as this 1709bbafc71SDave Chinner * information is no longer persistent in the superblock. Once we have 1719bbafc71SDave Chinner * this information, write it into the in-core superblock structure. 1729bbafc71SDave Chinner */ 1739bbafc71SDave Chinner int 1749bbafc71SDave Chinner xfs_initialize_perag_data( 1759bbafc71SDave Chinner struct xfs_mount *mp, 1769bbafc71SDave Chinner xfs_agnumber_t agcount) 1779bbafc71SDave Chinner { 1789bbafc71SDave Chinner xfs_agnumber_t index; 17950920116SDave Chinner struct xfs_perag *pag; 18050920116SDave Chinner struct xfs_sb *sbp = &mp->m_sb; 1819bbafc71SDave Chinner uint64_t ifree = 0; 1829bbafc71SDave Chinner uint64_t ialloc = 0; 1839bbafc71SDave Chinner uint64_t bfree = 0; 1849bbafc71SDave Chinner uint64_t bfreelst = 0; 1859bbafc71SDave Chinner uint64_t btree = 0; 1869bbafc71SDave Chinner uint64_t fdblocks; 1879bbafc71SDave Chinner int error = 0; 1889bbafc71SDave Chinner 1899bbafc71SDave Chinner for (index = 0; index < agcount; index++) { 1909bbafc71SDave Chinner /* 19108d3e84fSDave Chinner * Read the AGF and AGI buffers to populate the per-ag 19208d3e84fSDave Chinner * structures for us. 1939bbafc71SDave Chinner */ 1949bbafc71SDave Chinner pag = xfs_perag_get(mp, index); 19508d3e84fSDave Chinner error = xfs_alloc_read_agf(pag, NULL, 0, NULL); 19608d3e84fSDave Chinner if (!error) 19799b13c7fSDave Chinner error = xfs_ialloc_read_agi(pag, NULL, NULL); 19899b13c7fSDave Chinner if (error) { 19999b13c7fSDave Chinner xfs_perag_put(pag); 20099b13c7fSDave Chinner return error; 20199b13c7fSDave Chinner } 20299b13c7fSDave Chinner 2039bbafc71SDave Chinner ifree += pag->pagi_freecount; 2049bbafc71SDave Chinner ialloc += pag->pagi_count; 2059bbafc71SDave Chinner bfree += pag->pagf_freeblks; 2069bbafc71SDave Chinner bfreelst += pag->pagf_flcount; 2079bbafc71SDave Chinner btree += pag->pagf_btreeblks; 2089bbafc71SDave Chinner xfs_perag_put(pag); 2099bbafc71SDave Chinner } 2109bbafc71SDave Chinner fdblocks = bfree + bfreelst + btree; 2119bbafc71SDave Chinner 2129bbafc71SDave Chinner /* 2139bbafc71SDave Chinner * If the new summary counts are obviously incorrect, fail the 2149bbafc71SDave Chinner * mount operation because that implies the AGFs are also corrupt. 2159bbafc71SDave Chinner * Clear FS_COUNTERS so that we don't unmount with a dirty log, which 2169bbafc71SDave Chinner * will prevent xfs_repair from fixing anything. 2179bbafc71SDave Chinner */ 2189bbafc71SDave Chinner if (fdblocks > sbp->sb_dblocks || ifree > ialloc) { 2199bbafc71SDave Chinner xfs_alert(mp, "AGF corruption. Please run xfs_repair."); 2209bbafc71SDave Chinner error = -EFSCORRUPTED; 2219bbafc71SDave Chinner goto out; 2229bbafc71SDave Chinner } 2239bbafc71SDave Chinner 2249bbafc71SDave Chinner /* Overwrite incore superblock counters with just-read data */ 2259bbafc71SDave Chinner spin_lock(&mp->m_sb_lock); 2269bbafc71SDave Chinner sbp->sb_ifree = ifree; 2279bbafc71SDave Chinner sbp->sb_icount = ialloc; 2289bbafc71SDave Chinner sbp->sb_fdblocks = fdblocks; 2299bbafc71SDave Chinner spin_unlock(&mp->m_sb_lock); 2309bbafc71SDave Chinner 2319bbafc71SDave Chinner xfs_reinit_percpu_counters(mp); 2329bbafc71SDave Chinner out: 2339bbafc71SDave Chinner xfs_fs_mark_healthy(mp, XFS_SICK_FS_COUNTERS); 2349bbafc71SDave Chinner return error; 2359bbafc71SDave Chinner } 236b16817b6SDave Chinner 23707b6403aSDave Chinner STATIC void 23807b6403aSDave Chinner __xfs_free_perag( 23907b6403aSDave Chinner struct rcu_head *head) 24007b6403aSDave Chinner { 24107b6403aSDave Chinner struct xfs_perag *pag = container_of(head, struct xfs_perag, rcu_head); 24207b6403aSDave Chinner 24307b6403aSDave Chinner ASSERT(!delayed_work_pending(&pag->pag_blockgc_work)); 24407b6403aSDave Chinner kmem_free(pag); 24507b6403aSDave Chinner } 24607b6403aSDave Chinner 24707b6403aSDave Chinner /* 24807b6403aSDave Chinner * Free up the per-ag resources associated with the mount structure. 24907b6403aSDave Chinner */ 25007b6403aSDave Chinner void 25107b6403aSDave Chinner xfs_free_perag( 25207b6403aSDave Chinner struct xfs_mount *mp) 25307b6403aSDave Chinner { 25407b6403aSDave Chinner struct xfs_perag *pag; 25507b6403aSDave Chinner xfs_agnumber_t agno; 25607b6403aSDave Chinner 25707b6403aSDave Chinner for (agno = 0; agno < mp->m_sb.sb_agcount; agno++) { 25807b6403aSDave Chinner spin_lock(&mp->m_perag_lock); 25907b6403aSDave Chinner pag = radix_tree_delete(&mp->m_perag_tree, agno); 26007b6403aSDave Chinner spin_unlock(&mp->m_perag_lock); 26107b6403aSDave Chinner ASSERT(pag); 2625b55cbc2SDave Chinner XFS_IS_CORRUPT(pag->pag_mount, atomic_read(&pag->pag_ref) != 0); 26307b6403aSDave Chinner 26407b6403aSDave Chinner cancel_delayed_work_sync(&pag->pag_blockgc_work); 26507b6403aSDave Chinner xfs_buf_hash_destroy(pag); 26607b6403aSDave Chinner 267c4d5660aSDave Chinner /* drop the mount's active reference */ 268c4d5660aSDave Chinner xfs_perag_rele(pag); 269c4d5660aSDave Chinner XFS_IS_CORRUPT(pag->pag_mount, 270c4d5660aSDave Chinner atomic_read(&pag->pag_active_ref) != 0); 27107b6403aSDave Chinner call_rcu(&pag->rcu_head, __xfs_free_perag); 27207b6403aSDave Chinner } 27307b6403aSDave Chinner } 27407b6403aSDave Chinner 2750800169eSDave Chinner /* Find the size of the AG, in blocks. */ 2760800169eSDave Chinner static xfs_agblock_t 2770800169eSDave Chinner __xfs_ag_block_count( 2780800169eSDave Chinner struct xfs_mount *mp, 2790800169eSDave Chinner xfs_agnumber_t agno, 2800800169eSDave Chinner xfs_agnumber_t agcount, 2810800169eSDave Chinner xfs_rfsblock_t dblocks) 2820800169eSDave Chinner { 2830800169eSDave Chinner ASSERT(agno < agcount); 2840800169eSDave Chinner 2850800169eSDave Chinner if (agno < agcount - 1) 2860800169eSDave Chinner return mp->m_sb.sb_agblocks; 2870800169eSDave Chinner return dblocks - (agno * mp->m_sb.sb_agblocks); 2880800169eSDave Chinner } 2890800169eSDave Chinner 2900800169eSDave Chinner xfs_agblock_t 2910800169eSDave Chinner xfs_ag_block_count( 2920800169eSDave Chinner struct xfs_mount *mp, 2930800169eSDave Chinner xfs_agnumber_t agno) 2940800169eSDave Chinner { 2950800169eSDave Chinner return __xfs_ag_block_count(mp, agno, mp->m_sb.sb_agcount, 2960800169eSDave Chinner mp->m_sb.sb_dblocks); 2970800169eSDave Chinner } 2980800169eSDave Chinner 2992d6ca832SDave Chinner /* Calculate the first and last possible inode number in an AG. */ 3002d6ca832SDave Chinner static void 3012d6ca832SDave Chinner __xfs_agino_range( 3022d6ca832SDave Chinner struct xfs_mount *mp, 3032d6ca832SDave Chinner xfs_agblock_t eoag, 3042d6ca832SDave Chinner xfs_agino_t *first, 3052d6ca832SDave Chinner xfs_agino_t *last) 3062d6ca832SDave Chinner { 3072d6ca832SDave Chinner xfs_agblock_t bno; 3082d6ca832SDave Chinner 3092d6ca832SDave Chinner /* 3102d6ca832SDave Chinner * Calculate the first inode, which will be in the first 3112d6ca832SDave Chinner * cluster-aligned block after the AGFL. 3122d6ca832SDave Chinner */ 3132d6ca832SDave Chinner bno = round_up(XFS_AGFL_BLOCK(mp) + 1, M_IGEO(mp)->cluster_align); 3142d6ca832SDave Chinner *first = XFS_AGB_TO_AGINO(mp, bno); 3152d6ca832SDave Chinner 3162d6ca832SDave Chinner /* 3172d6ca832SDave Chinner * Calculate the last inode, which will be at the end of the 3182d6ca832SDave Chinner * last (aligned) cluster that can be allocated in the AG. 3192d6ca832SDave Chinner */ 3202d6ca832SDave Chinner bno = round_down(eoag, M_IGEO(mp)->cluster_align); 3212d6ca832SDave Chinner *last = XFS_AGB_TO_AGINO(mp, bno) - 1; 3222d6ca832SDave Chinner } 3232d6ca832SDave Chinner 3242d6ca832SDave Chinner void 3252d6ca832SDave Chinner xfs_agino_range( 3262d6ca832SDave Chinner struct xfs_mount *mp, 3272d6ca832SDave Chinner xfs_agnumber_t agno, 3282d6ca832SDave Chinner xfs_agino_t *first, 3292d6ca832SDave Chinner xfs_agino_t *last) 3302d6ca832SDave Chinner { 3312d6ca832SDave Chinner return __xfs_agino_range(mp, xfs_ag_block_count(mp, agno), first, last); 3322d6ca832SDave Chinner } 3332d6ca832SDave Chinner 33407b6403aSDave Chinner int 33507b6403aSDave Chinner xfs_initialize_perag( 33607b6403aSDave Chinner struct xfs_mount *mp, 33707b6403aSDave Chinner xfs_agnumber_t agcount, 3380800169eSDave Chinner xfs_rfsblock_t dblocks, 33907b6403aSDave Chinner xfs_agnumber_t *maxagi) 34007b6403aSDave Chinner { 34107b6403aSDave Chinner struct xfs_perag *pag; 34207b6403aSDave Chinner xfs_agnumber_t index; 34307b6403aSDave Chinner xfs_agnumber_t first_initialised = NULLAGNUMBER; 34407b6403aSDave Chinner int error; 34507b6403aSDave Chinner 34607b6403aSDave Chinner /* 34707b6403aSDave Chinner * Walk the current per-ag tree so we don't try to initialise AGs 34807b6403aSDave Chinner * that already exist (growfs case). Allocate and insert all the 34907b6403aSDave Chinner * AGs we don't find ready for initialisation. 35007b6403aSDave Chinner */ 35107b6403aSDave Chinner for (index = 0; index < agcount; index++) { 35207b6403aSDave Chinner pag = xfs_perag_get(mp, index); 35307b6403aSDave Chinner if (pag) { 35407b6403aSDave Chinner xfs_perag_put(pag); 35507b6403aSDave Chinner continue; 35607b6403aSDave Chinner } 35707b6403aSDave Chinner 35807b6403aSDave Chinner pag = kmem_zalloc(sizeof(*pag), KM_MAYFAIL); 35907b6403aSDave Chinner if (!pag) { 36007b6403aSDave Chinner error = -ENOMEM; 36107b6403aSDave Chinner goto out_unwind_new_pags; 36207b6403aSDave Chinner } 36307b6403aSDave Chinner pag->pag_agno = index; 36407b6403aSDave Chinner pag->pag_mount = mp; 36507b6403aSDave Chinner 36607b6403aSDave Chinner error = radix_tree_preload(GFP_NOFS); 36707b6403aSDave Chinner if (error) 36807b6403aSDave Chinner goto out_free_pag; 36907b6403aSDave Chinner 37007b6403aSDave Chinner spin_lock(&mp->m_perag_lock); 37107b6403aSDave Chinner if (radix_tree_insert(&mp->m_perag_tree, index, pag)) { 37207b6403aSDave Chinner WARN_ON_ONCE(1); 37307b6403aSDave Chinner spin_unlock(&mp->m_perag_lock); 37407b6403aSDave Chinner radix_tree_preload_end(); 37507b6403aSDave Chinner error = -EEXIST; 37607b6403aSDave Chinner goto out_free_pag; 37707b6403aSDave Chinner } 37807b6403aSDave Chinner spin_unlock(&mp->m_perag_lock); 37907b6403aSDave Chinner radix_tree_preload_end(); 38007b6403aSDave Chinner 38129f11fceSEric Sandeen #ifdef __KERNEL__ 38207b6403aSDave Chinner /* Place kernel structure only init below this point. */ 38307b6403aSDave Chinner spin_lock_init(&pag->pag_ici_lock); 38407b6403aSDave Chinner spin_lock_init(&pag->pagb_lock); 38507b6403aSDave Chinner spin_lock_init(&pag->pag_state_lock); 38607b6403aSDave Chinner INIT_DELAYED_WORK(&pag->pag_blockgc_work, xfs_blockgc_worker); 38707b6403aSDave Chinner INIT_RADIX_TREE(&pag->pag_ici_root, GFP_ATOMIC); 38807b6403aSDave Chinner init_waitqueue_head(&pag->pagb_wait); 389c4d5660aSDave Chinner init_waitqueue_head(&pag->pag_active_wq); 39007b6403aSDave Chinner pag->pagb_count = 0; 39107b6403aSDave Chinner pag->pagb_tree = RB_ROOT; 39229f11fceSEric Sandeen #endif /* __KERNEL__ */ 39307b6403aSDave Chinner 39407b6403aSDave Chinner error = xfs_buf_hash_init(pag); 39507b6403aSDave Chinner if (error) 39607b6403aSDave Chinner goto out_remove_pag; 39707b6403aSDave Chinner 398c4d5660aSDave Chinner /* Active ref owned by mount indicates AG is online. */ 399c4d5660aSDave Chinner atomic_set(&pag->pag_active_ref, 1); 400c4d5660aSDave Chinner 40107b6403aSDave Chinner /* first new pag is fully initialized */ 40207b6403aSDave Chinner if (first_initialised == NULLAGNUMBER) 40307b6403aSDave Chinner first_initialised = index; 4040800169eSDave Chinner 4050800169eSDave Chinner /* 4060800169eSDave Chinner * Pre-calculated geometry 4070800169eSDave Chinner */ 4080800169eSDave Chinner pag->block_count = __xfs_ag_block_count(mp, index, agcount, 4090800169eSDave Chinner dblocks); 4100800169eSDave Chinner pag->min_block = XFS_AGFL_BLOCK(mp); 4112d6ca832SDave Chinner __xfs_agino_range(mp, pag->block_count, &pag->agino_min, 4122d6ca832SDave Chinner &pag->agino_max); 41307b6403aSDave Chinner } 41407b6403aSDave Chinner 41507b6403aSDave Chinner index = xfs_set_inode_alloc(mp, agcount); 41607b6403aSDave Chinner 41707b6403aSDave Chinner if (maxagi) 41807b6403aSDave Chinner *maxagi = index; 41907b6403aSDave Chinner 42007b6403aSDave Chinner mp->m_ag_prealloc_blocks = xfs_prealloc_blocks(mp); 42107b6403aSDave Chinner return 0; 42207b6403aSDave Chinner 42307b6403aSDave Chinner out_remove_pag: 42407b6403aSDave Chinner radix_tree_delete(&mp->m_perag_tree, index); 42507b6403aSDave Chinner out_free_pag: 42607b6403aSDave Chinner kmem_free(pag); 42707b6403aSDave Chinner out_unwind_new_pags: 42807b6403aSDave Chinner /* unwind any prior newly initialized pags */ 42907b6403aSDave Chinner for (index = first_initialised; index < agcount; index++) { 43007b6403aSDave Chinner pag = radix_tree_delete(&mp->m_perag_tree, index); 43107b6403aSDave Chinner if (!pag) 43207b6403aSDave Chinner break; 43307b6403aSDave Chinner xfs_buf_hash_destroy(pag); 43407b6403aSDave Chinner kmem_free(pag); 43507b6403aSDave Chinner } 43607b6403aSDave Chinner return error; 43707b6403aSDave Chinner } 438b16817b6SDave Chinner 4392842b6dbSDarrick J. Wong static int 440b16817b6SDave Chinner xfs_get_aghdr_buf( 441b16817b6SDave Chinner struct xfs_mount *mp, 442b16817b6SDave Chinner xfs_daddr_t blkno, 443b16817b6SDave Chinner size_t numblks, 4442842b6dbSDarrick J. Wong struct xfs_buf **bpp, 445b16817b6SDave Chinner const struct xfs_buf_ops *ops) 446b16817b6SDave Chinner { 447b16817b6SDave Chinner struct xfs_buf *bp; 4482842b6dbSDarrick J. Wong int error; 449b16817b6SDave Chinner 4502842b6dbSDarrick J. Wong error = xfs_buf_get_uncached(mp->m_ddev_targp, numblks, 0, &bp); 4512842b6dbSDarrick J. Wong if (error) 4522842b6dbSDarrick J. Wong return error; 453b16817b6SDave Chinner 454b16817b6SDave Chinner bp->b_maps[0].bm_bn = blkno; 455b16817b6SDave Chinner bp->b_ops = ops; 456b16817b6SDave Chinner 4572842b6dbSDarrick J. Wong *bpp = bp; 4582842b6dbSDarrick J. Wong return 0; 459b16817b6SDave Chinner } 460b16817b6SDave Chinner 461b16817b6SDave Chinner /* 462b16817b6SDave Chinner * Generic btree root block init function 463b16817b6SDave Chinner */ 464b16817b6SDave Chinner static void 465b16817b6SDave Chinner xfs_btroot_init( 466b16817b6SDave Chinner struct xfs_mount *mp, 467b16817b6SDave Chinner struct xfs_buf *bp, 468b16817b6SDave Chinner struct aghdr_init_data *id) 469b16817b6SDave Chinner { 470f5b999c0SEric Sandeen xfs_btree_init_block(mp, bp, id->type, 0, 0, id->agno); 471b16817b6SDave Chinner } 472b16817b6SDave Chinner 4738d90857cSDarrick J. Wong /* Finish initializing a free space btree. */ 4748d90857cSDarrick J. Wong static void 4758d90857cSDarrick J. Wong xfs_freesp_init_recs( 4768d90857cSDarrick J. Wong struct xfs_mount *mp, 4778d90857cSDarrick J. Wong struct xfs_buf *bp, 4788d90857cSDarrick J. Wong struct aghdr_init_data *id) 4798d90857cSDarrick J. Wong { 4808d90857cSDarrick J. Wong struct xfs_alloc_rec *arec; 481f327a007SDarrick J. Wong struct xfs_btree_block *block = XFS_BUF_TO_BLOCK(bp); 4828d90857cSDarrick J. Wong 4838d90857cSDarrick J. Wong arec = XFS_ALLOC_REC_ADDR(mp, XFS_BUF_TO_BLOCK(bp), 1); 4848d90857cSDarrick J. Wong arec->ar_startblock = cpu_to_be32(mp->m_ag_prealloc_blocks); 485f327a007SDarrick J. Wong 48636029deeSDave Chinner if (xfs_ag_contains_log(mp, id->agno)) { 487f327a007SDarrick J. Wong struct xfs_alloc_rec *nrec; 488f327a007SDarrick J. Wong xfs_agblock_t start = XFS_FSB_TO_AGBNO(mp, 489f327a007SDarrick J. Wong mp->m_sb.sb_logstart); 490f327a007SDarrick J. Wong 491f327a007SDarrick J. Wong ASSERT(start >= mp->m_ag_prealloc_blocks); 492f327a007SDarrick J. Wong if (start != mp->m_ag_prealloc_blocks) { 493f327a007SDarrick J. Wong /* 494f327a007SDarrick J. Wong * Modify first record to pad stripe align of log 495f327a007SDarrick J. Wong */ 496f327a007SDarrick J. Wong arec->ar_blockcount = cpu_to_be32(start - 497f327a007SDarrick J. Wong mp->m_ag_prealloc_blocks); 498f327a007SDarrick J. Wong nrec = arec + 1; 499f327a007SDarrick J. Wong 500f327a007SDarrick J. Wong /* 501f327a007SDarrick J. Wong * Insert second record at start of internal log 502f327a007SDarrick J. Wong * which then gets trimmed. 503f327a007SDarrick J. Wong */ 504f327a007SDarrick J. Wong nrec->ar_startblock = cpu_to_be32( 505f327a007SDarrick J. Wong be32_to_cpu(arec->ar_startblock) + 506f327a007SDarrick J. Wong be32_to_cpu(arec->ar_blockcount)); 507f327a007SDarrick J. Wong arec = nrec; 508f327a007SDarrick J. Wong be16_add_cpu(&block->bb_numrecs, 1); 509f327a007SDarrick J. Wong } 510f327a007SDarrick J. Wong /* 511f327a007SDarrick J. Wong * Change record start to after the internal log 512f327a007SDarrick J. Wong */ 513f327a007SDarrick J. Wong be32_add_cpu(&arec->ar_startblock, mp->m_sb.sb_logblocks); 514f327a007SDarrick J. Wong } 515f327a007SDarrick J. Wong 516f327a007SDarrick J. Wong /* 517f327a007SDarrick J. Wong * Calculate the record block count and check for the case where 518f327a007SDarrick J. Wong * the log might have consumed all available space in the AG. If 519f327a007SDarrick J. Wong * so, reset the record count to 0 to avoid exposure of an invalid 520f327a007SDarrick J. Wong * record start block. 521f327a007SDarrick J. Wong */ 5228d90857cSDarrick J. Wong arec->ar_blockcount = cpu_to_be32(id->agsize - 5238d90857cSDarrick J. Wong be32_to_cpu(arec->ar_startblock)); 524f327a007SDarrick J. Wong if (!arec->ar_blockcount) 525f327a007SDarrick J. Wong block->bb_numrecs = 0; 5268d90857cSDarrick J. Wong } 5278d90857cSDarrick J. Wong 528b16817b6SDave Chinner /* 529b16817b6SDave Chinner * Alloc btree root block init functions 530b16817b6SDave Chinner */ 531b16817b6SDave Chinner static void 532b16817b6SDave Chinner xfs_bnoroot_init( 533b16817b6SDave Chinner struct xfs_mount *mp, 534b16817b6SDave Chinner struct xfs_buf *bp, 535b16817b6SDave Chinner struct aghdr_init_data *id) 536b16817b6SDave Chinner { 537f5b999c0SEric Sandeen xfs_btree_init_block(mp, bp, XFS_BTNUM_BNO, 0, 1, id->agno); 5388d90857cSDarrick J. Wong xfs_freesp_init_recs(mp, bp, id); 539b16817b6SDave Chinner } 540b16817b6SDave Chinner 541b16817b6SDave Chinner static void 542b16817b6SDave Chinner xfs_cntroot_init( 543b16817b6SDave Chinner struct xfs_mount *mp, 544b16817b6SDave Chinner struct xfs_buf *bp, 545b16817b6SDave Chinner struct aghdr_init_data *id) 546b16817b6SDave Chinner { 547f5b999c0SEric Sandeen xfs_btree_init_block(mp, bp, XFS_BTNUM_CNT, 0, 1, id->agno); 5488d90857cSDarrick J. Wong xfs_freesp_init_recs(mp, bp, id); 549b16817b6SDave Chinner } 550b16817b6SDave Chinner 551b16817b6SDave Chinner /* 552b16817b6SDave Chinner * Reverse map root block init 553b16817b6SDave Chinner */ 554b16817b6SDave Chinner static void 555b16817b6SDave Chinner xfs_rmaproot_init( 556b16817b6SDave Chinner struct xfs_mount *mp, 557b16817b6SDave Chinner struct xfs_buf *bp, 558b16817b6SDave Chinner struct aghdr_init_data *id) 559b16817b6SDave Chinner { 560b16817b6SDave Chinner struct xfs_btree_block *block = XFS_BUF_TO_BLOCK(bp); 561b16817b6SDave Chinner struct xfs_rmap_rec *rrec; 562b16817b6SDave Chinner 563f5b999c0SEric Sandeen xfs_btree_init_block(mp, bp, XFS_BTNUM_RMAP, 0, 4, id->agno); 564b16817b6SDave Chinner 565b16817b6SDave Chinner /* 566b16817b6SDave Chinner * mark the AG header regions as static metadata The BNO 567b16817b6SDave Chinner * btree block is the first block after the headers, so 568b16817b6SDave Chinner * it's location defines the size of region the static 569b16817b6SDave Chinner * metadata consumes. 570b16817b6SDave Chinner * 571b16817b6SDave Chinner * Note: unlike mkfs, we never have to account for log 572b16817b6SDave Chinner * space when growing the data regions 573b16817b6SDave Chinner */ 574b16817b6SDave Chinner rrec = XFS_RMAP_REC_ADDR(block, 1); 575b16817b6SDave Chinner rrec->rm_startblock = 0; 576b16817b6SDave Chinner rrec->rm_blockcount = cpu_to_be32(XFS_BNO_BLOCK(mp)); 577b16817b6SDave Chinner rrec->rm_owner = cpu_to_be64(XFS_RMAP_OWN_FS); 578b16817b6SDave Chinner rrec->rm_offset = 0; 579b16817b6SDave Chinner 580b16817b6SDave Chinner /* account freespace btree root blocks */ 581b16817b6SDave Chinner rrec = XFS_RMAP_REC_ADDR(block, 2); 582b16817b6SDave Chinner rrec->rm_startblock = cpu_to_be32(XFS_BNO_BLOCK(mp)); 583b16817b6SDave Chinner rrec->rm_blockcount = cpu_to_be32(2); 584b16817b6SDave Chinner rrec->rm_owner = cpu_to_be64(XFS_RMAP_OWN_AG); 585b16817b6SDave Chinner rrec->rm_offset = 0; 586b16817b6SDave Chinner 587b16817b6SDave Chinner /* account inode btree root blocks */ 588b16817b6SDave Chinner rrec = XFS_RMAP_REC_ADDR(block, 3); 589b16817b6SDave Chinner rrec->rm_startblock = cpu_to_be32(XFS_IBT_BLOCK(mp)); 590b16817b6SDave Chinner rrec->rm_blockcount = cpu_to_be32(XFS_RMAP_BLOCK(mp) - 591b16817b6SDave Chinner XFS_IBT_BLOCK(mp)); 592b16817b6SDave Chinner rrec->rm_owner = cpu_to_be64(XFS_RMAP_OWN_INOBT); 593b16817b6SDave Chinner rrec->rm_offset = 0; 594b16817b6SDave Chinner 595b16817b6SDave Chinner /* account for rmap btree root */ 596b16817b6SDave Chinner rrec = XFS_RMAP_REC_ADDR(block, 4); 597b16817b6SDave Chinner rrec->rm_startblock = cpu_to_be32(XFS_RMAP_BLOCK(mp)); 598b16817b6SDave Chinner rrec->rm_blockcount = cpu_to_be32(1); 599b16817b6SDave Chinner rrec->rm_owner = cpu_to_be64(XFS_RMAP_OWN_AG); 600b16817b6SDave Chinner rrec->rm_offset = 0; 601b16817b6SDave Chinner 602b16817b6SDave Chinner /* account for refc btree root */ 60338c26bfdSDave Chinner if (xfs_has_reflink(mp)) { 604b16817b6SDave Chinner rrec = XFS_RMAP_REC_ADDR(block, 5); 605b16817b6SDave Chinner rrec->rm_startblock = cpu_to_be32(xfs_refc_block(mp)); 606b16817b6SDave Chinner rrec->rm_blockcount = cpu_to_be32(1); 607b16817b6SDave Chinner rrec->rm_owner = cpu_to_be64(XFS_RMAP_OWN_REFC); 608b16817b6SDave Chinner rrec->rm_offset = 0; 609b16817b6SDave Chinner be16_add_cpu(&block->bb_numrecs, 1); 610b16817b6SDave Chinner } 611f327a007SDarrick J. Wong 612f327a007SDarrick J. Wong /* account for the log space */ 61336029deeSDave Chinner if (xfs_ag_contains_log(mp, id->agno)) { 614f327a007SDarrick J. Wong rrec = XFS_RMAP_REC_ADDR(block, 615f327a007SDarrick J. Wong be16_to_cpu(block->bb_numrecs) + 1); 616f327a007SDarrick J. Wong rrec->rm_startblock = cpu_to_be32( 617f327a007SDarrick J. Wong XFS_FSB_TO_AGBNO(mp, mp->m_sb.sb_logstart)); 618f327a007SDarrick J. Wong rrec->rm_blockcount = cpu_to_be32(mp->m_sb.sb_logblocks); 619f327a007SDarrick J. Wong rrec->rm_owner = cpu_to_be64(XFS_RMAP_OWN_LOG); 620f327a007SDarrick J. Wong rrec->rm_offset = 0; 621f327a007SDarrick J. Wong be16_add_cpu(&block->bb_numrecs, 1); 622f327a007SDarrick J. Wong } 623b16817b6SDave Chinner } 624b16817b6SDave Chinner 625b16817b6SDave Chinner /* 626b16817b6SDave Chinner * Initialise new secondary superblocks with the pre-grow geometry, but mark 627b16817b6SDave Chinner * them as "in progress" so we know they haven't yet been activated. This will 628b16817b6SDave Chinner * get cleared when the update with the new geometry information is done after 629b16817b6SDave Chinner * changes to the primary are committed. This isn't strictly necessary, but we 630b16817b6SDave Chinner * get it for free with the delayed buffer write lists and it means we can tell 631b16817b6SDave Chinner * if a grow operation didn't complete properly after the fact. 632b16817b6SDave Chinner */ 633b16817b6SDave Chinner static void 634b16817b6SDave Chinner xfs_sbblock_init( 635b16817b6SDave Chinner struct xfs_mount *mp, 636b16817b6SDave Chinner struct xfs_buf *bp, 637b16817b6SDave Chinner struct aghdr_init_data *id) 638b16817b6SDave Chinner { 6393e6e8afdSChristoph Hellwig struct xfs_dsb *dsb = bp->b_addr; 640b16817b6SDave Chinner 641b16817b6SDave Chinner xfs_sb_to_disk(dsb, &mp->m_sb); 642b16817b6SDave Chinner dsb->sb_inprogress = 1; 643b16817b6SDave Chinner } 644b16817b6SDave Chinner 645b16817b6SDave Chinner static void 646b16817b6SDave Chinner xfs_agfblock_init( 647b16817b6SDave Chinner struct xfs_mount *mp, 648b16817b6SDave Chinner struct xfs_buf *bp, 649b16817b6SDave Chinner struct aghdr_init_data *id) 650b16817b6SDave Chinner { 6519798f615SChristoph Hellwig struct xfs_agf *agf = bp->b_addr; 652b16817b6SDave Chinner xfs_extlen_t tmpsize; 653b16817b6SDave Chinner 654b16817b6SDave Chinner agf->agf_magicnum = cpu_to_be32(XFS_AGF_MAGIC); 655b16817b6SDave Chinner agf->agf_versionnum = cpu_to_be32(XFS_AGF_VERSION); 656b16817b6SDave Chinner agf->agf_seqno = cpu_to_be32(id->agno); 657b16817b6SDave Chinner agf->agf_length = cpu_to_be32(id->agsize); 658b16817b6SDave Chinner agf->agf_roots[XFS_BTNUM_BNOi] = cpu_to_be32(XFS_BNO_BLOCK(mp)); 659b16817b6SDave Chinner agf->agf_roots[XFS_BTNUM_CNTi] = cpu_to_be32(XFS_CNT_BLOCK(mp)); 660b16817b6SDave Chinner agf->agf_levels[XFS_BTNUM_BNOi] = cpu_to_be32(1); 661b16817b6SDave Chinner agf->agf_levels[XFS_BTNUM_CNTi] = cpu_to_be32(1); 66238c26bfdSDave Chinner if (xfs_has_rmapbt(mp)) { 663b16817b6SDave Chinner agf->agf_roots[XFS_BTNUM_RMAPi] = 664b16817b6SDave Chinner cpu_to_be32(XFS_RMAP_BLOCK(mp)); 665b16817b6SDave Chinner agf->agf_levels[XFS_BTNUM_RMAPi] = cpu_to_be32(1); 666b16817b6SDave Chinner agf->agf_rmap_blocks = cpu_to_be32(1); 667b16817b6SDave Chinner } 668b16817b6SDave Chinner 669b16817b6SDave Chinner agf->agf_flfirst = cpu_to_be32(1); 670b16817b6SDave Chinner agf->agf_fllast = 0; 671b16817b6SDave Chinner agf->agf_flcount = 0; 672b16817b6SDave Chinner tmpsize = id->agsize - mp->m_ag_prealloc_blocks; 673b16817b6SDave Chinner agf->agf_freeblks = cpu_to_be32(tmpsize); 674b16817b6SDave Chinner agf->agf_longest = cpu_to_be32(tmpsize); 67538c26bfdSDave Chinner if (xfs_has_crc(mp)) 676b16817b6SDave Chinner uuid_copy(&agf->agf_uuid, &mp->m_sb.sb_meta_uuid); 67738c26bfdSDave Chinner if (xfs_has_reflink(mp)) { 678b16817b6SDave Chinner agf->agf_refcount_root = cpu_to_be32( 679b16817b6SDave Chinner xfs_refc_block(mp)); 680b16817b6SDave Chinner agf->agf_refcount_level = cpu_to_be32(1); 681b16817b6SDave Chinner agf->agf_refcount_blocks = cpu_to_be32(1); 682b16817b6SDave Chinner } 683f327a007SDarrick J. Wong 68436029deeSDave Chinner if (xfs_ag_contains_log(mp, id->agno)) { 685f327a007SDarrick J. Wong int64_t logblocks = mp->m_sb.sb_logblocks; 686f327a007SDarrick J. Wong 687f327a007SDarrick J. Wong be32_add_cpu(&agf->agf_freeblks, -logblocks); 688f327a007SDarrick J. Wong agf->agf_longest = cpu_to_be32(id->agsize - 689f327a007SDarrick J. Wong XFS_FSB_TO_AGBNO(mp, mp->m_sb.sb_logstart) - logblocks); 690f327a007SDarrick J. Wong } 691b16817b6SDave Chinner } 692b16817b6SDave Chinner 693b16817b6SDave Chinner static void 694b16817b6SDave Chinner xfs_agflblock_init( 695b16817b6SDave Chinner struct xfs_mount *mp, 696b16817b6SDave Chinner struct xfs_buf *bp, 697b16817b6SDave Chinner struct aghdr_init_data *id) 698b16817b6SDave Chinner { 699b16817b6SDave Chinner struct xfs_agfl *agfl = XFS_BUF_TO_AGFL(bp); 700b16817b6SDave Chinner __be32 *agfl_bno; 701b16817b6SDave Chinner int bucket; 702b16817b6SDave Chinner 70338c26bfdSDave Chinner if (xfs_has_crc(mp)) { 704b16817b6SDave Chinner agfl->agfl_magicnum = cpu_to_be32(XFS_AGFL_MAGIC); 705b16817b6SDave Chinner agfl->agfl_seqno = cpu_to_be32(id->agno); 706b16817b6SDave Chinner uuid_copy(&agfl->agfl_uuid, &mp->m_sb.sb_meta_uuid); 707b16817b6SDave Chinner } 708b16817b6SDave Chinner 709183606d8SChristoph Hellwig agfl_bno = xfs_buf_to_agfl_bno(bp); 710b16817b6SDave Chinner for (bucket = 0; bucket < xfs_agfl_size(mp); bucket++) 711b16817b6SDave Chinner agfl_bno[bucket] = cpu_to_be32(NULLAGBLOCK); 712b16817b6SDave Chinner } 713b16817b6SDave Chinner 714b16817b6SDave Chinner static void 715b16817b6SDave Chinner xfs_agiblock_init( 716b16817b6SDave Chinner struct xfs_mount *mp, 717b16817b6SDave Chinner struct xfs_buf *bp, 718b16817b6SDave Chinner struct aghdr_init_data *id) 719b16817b6SDave Chinner { 720370c782bSChristoph Hellwig struct xfs_agi *agi = bp->b_addr; 721b16817b6SDave Chinner int bucket; 722b16817b6SDave Chinner 723b16817b6SDave Chinner agi->agi_magicnum = cpu_to_be32(XFS_AGI_MAGIC); 724b16817b6SDave Chinner agi->agi_versionnum = cpu_to_be32(XFS_AGI_VERSION); 725b16817b6SDave Chinner agi->agi_seqno = cpu_to_be32(id->agno); 726b16817b6SDave Chinner agi->agi_length = cpu_to_be32(id->agsize); 727b16817b6SDave Chinner agi->agi_count = 0; 728b16817b6SDave Chinner agi->agi_root = cpu_to_be32(XFS_IBT_BLOCK(mp)); 729b16817b6SDave Chinner agi->agi_level = cpu_to_be32(1); 730b16817b6SDave Chinner agi->agi_freecount = 0; 731b16817b6SDave Chinner agi->agi_newino = cpu_to_be32(NULLAGINO); 732b16817b6SDave Chinner agi->agi_dirino = cpu_to_be32(NULLAGINO); 73338c26bfdSDave Chinner if (xfs_has_crc(mp)) 734b16817b6SDave Chinner uuid_copy(&agi->agi_uuid, &mp->m_sb.sb_meta_uuid); 73538c26bfdSDave Chinner if (xfs_has_finobt(mp)) { 736b16817b6SDave Chinner agi->agi_free_root = cpu_to_be32(XFS_FIBT_BLOCK(mp)); 737b16817b6SDave Chinner agi->agi_free_level = cpu_to_be32(1); 738b16817b6SDave Chinner } 739b16817b6SDave Chinner for (bucket = 0; bucket < XFS_AGI_UNLINKED_BUCKETS; bucket++) 740b16817b6SDave Chinner agi->agi_unlinked[bucket] = cpu_to_be32(NULLAGINO); 741ebd9027dSDave Chinner if (xfs_has_inobtcounts(mp)) { 7422a39946cSDarrick J. Wong agi->agi_iblocks = cpu_to_be32(1); 743ebd9027dSDave Chinner if (xfs_has_finobt(mp)) 7442a39946cSDarrick J. Wong agi->agi_fblocks = cpu_to_be32(1); 7452a39946cSDarrick J. Wong } 746b16817b6SDave Chinner } 747b16817b6SDave Chinner 748b16817b6SDave Chinner typedef void (*aghdr_init_work_f)(struct xfs_mount *mp, struct xfs_buf *bp, 749b16817b6SDave Chinner struct aghdr_init_data *id); 750b16817b6SDave Chinner static int 751b16817b6SDave Chinner xfs_ag_init_hdr( 752b16817b6SDave Chinner struct xfs_mount *mp, 753b16817b6SDave Chinner struct aghdr_init_data *id, 754b16817b6SDave Chinner aghdr_init_work_f work, 755b16817b6SDave Chinner const struct xfs_buf_ops *ops) 756b16817b6SDave Chinner { 757b16817b6SDave Chinner struct xfs_buf *bp; 7582842b6dbSDarrick J. Wong int error; 759b16817b6SDave Chinner 7602842b6dbSDarrick J. Wong error = xfs_get_aghdr_buf(mp, id->daddr, id->numblks, &bp, ops); 7612842b6dbSDarrick J. Wong if (error) 7622842b6dbSDarrick J. Wong return error; 763b16817b6SDave Chinner 764b16817b6SDave Chinner (*work)(mp, bp, id); 765b16817b6SDave Chinner 766b16817b6SDave Chinner xfs_buf_delwri_queue(bp, &id->buffer_list); 767b16817b6SDave Chinner xfs_buf_relse(bp); 768b16817b6SDave Chinner return 0; 769b16817b6SDave Chinner } 770b16817b6SDave Chinner 771b16817b6SDave Chinner struct xfs_aghdr_grow_data { 772b16817b6SDave Chinner xfs_daddr_t daddr; 773b16817b6SDave Chinner size_t numblks; 774b16817b6SDave Chinner const struct xfs_buf_ops *ops; 775b16817b6SDave Chinner aghdr_init_work_f work; 776b16817b6SDave Chinner xfs_btnum_t type; 777b16817b6SDave Chinner bool need_init; 778b16817b6SDave Chinner }; 779b16817b6SDave Chinner 780b16817b6SDave Chinner /* 781b16817b6SDave Chinner * Prepare new AG headers to be written to disk. We use uncached buffers here, 782b16817b6SDave Chinner * as it is assumed these new AG headers are currently beyond the currently 783b16817b6SDave Chinner * valid filesystem address space. Using cached buffers would trip over EOFS 784b16817b6SDave Chinner * corruption detection alogrithms in the buffer cache lookup routines. 785b16817b6SDave Chinner * 786b16817b6SDave Chinner * This is a non-transactional function, but the prepared buffers are added to a 787b16817b6SDave Chinner * delayed write buffer list supplied by the caller so they can submit them to 788b16817b6SDave Chinner * disk and wait on them as required. 789b16817b6SDave Chinner */ 790b16817b6SDave Chinner int 791b16817b6SDave Chinner xfs_ag_init_headers( 792b16817b6SDave Chinner struct xfs_mount *mp, 793b16817b6SDave Chinner struct aghdr_init_data *id) 794b16817b6SDave Chinner 795b16817b6SDave Chinner { 796b16817b6SDave Chinner struct xfs_aghdr_grow_data aghdr_data[] = { 797b16817b6SDave Chinner { /* SB */ 798b16817b6SDave Chinner .daddr = XFS_AG_DADDR(mp, id->agno, XFS_SB_DADDR), 799b16817b6SDave Chinner .numblks = XFS_FSS_TO_BB(mp, 1), 800b16817b6SDave Chinner .ops = &xfs_sb_buf_ops, 801b16817b6SDave Chinner .work = &xfs_sbblock_init, 802b16817b6SDave Chinner .need_init = true 803b16817b6SDave Chinner }, 804b16817b6SDave Chinner { /* AGF */ 805b16817b6SDave Chinner .daddr = XFS_AG_DADDR(mp, id->agno, XFS_AGF_DADDR(mp)), 806b16817b6SDave Chinner .numblks = XFS_FSS_TO_BB(mp, 1), 807b16817b6SDave Chinner .ops = &xfs_agf_buf_ops, 808b16817b6SDave Chinner .work = &xfs_agfblock_init, 809b16817b6SDave Chinner .need_init = true 810b16817b6SDave Chinner }, 811b16817b6SDave Chinner { /* AGFL */ 812b16817b6SDave Chinner .daddr = XFS_AG_DADDR(mp, id->agno, XFS_AGFL_DADDR(mp)), 813b16817b6SDave Chinner .numblks = XFS_FSS_TO_BB(mp, 1), 814b16817b6SDave Chinner .ops = &xfs_agfl_buf_ops, 815b16817b6SDave Chinner .work = &xfs_agflblock_init, 816b16817b6SDave Chinner .need_init = true 817b16817b6SDave Chinner }, 818b16817b6SDave Chinner { /* AGI */ 819b16817b6SDave Chinner .daddr = XFS_AG_DADDR(mp, id->agno, XFS_AGI_DADDR(mp)), 820b16817b6SDave Chinner .numblks = XFS_FSS_TO_BB(mp, 1), 821b16817b6SDave Chinner .ops = &xfs_agi_buf_ops, 822b16817b6SDave Chinner .work = &xfs_agiblock_init, 823b16817b6SDave Chinner .need_init = true 824b16817b6SDave Chinner }, 825b16817b6SDave Chinner { /* BNO root block */ 826b16817b6SDave Chinner .daddr = XFS_AGB_TO_DADDR(mp, id->agno, XFS_BNO_BLOCK(mp)), 827b16817b6SDave Chinner .numblks = BTOBB(mp->m_sb.sb_blocksize), 82827df4f50SBrian Foster .ops = &xfs_bnobt_buf_ops, 829b16817b6SDave Chinner .work = &xfs_bnoroot_init, 830b16817b6SDave Chinner .need_init = true 831b16817b6SDave Chinner }, 832b16817b6SDave Chinner { /* CNT root block */ 833b16817b6SDave Chinner .daddr = XFS_AGB_TO_DADDR(mp, id->agno, XFS_CNT_BLOCK(mp)), 834b16817b6SDave Chinner .numblks = BTOBB(mp->m_sb.sb_blocksize), 83527df4f50SBrian Foster .ops = &xfs_cntbt_buf_ops, 836b16817b6SDave Chinner .work = &xfs_cntroot_init, 837b16817b6SDave Chinner .need_init = true 838b16817b6SDave Chinner }, 839b16817b6SDave Chinner { /* INO root block */ 840b16817b6SDave Chinner .daddr = XFS_AGB_TO_DADDR(mp, id->agno, XFS_IBT_BLOCK(mp)), 841b16817b6SDave Chinner .numblks = BTOBB(mp->m_sb.sb_blocksize), 842b16817b6SDave Chinner .ops = &xfs_inobt_buf_ops, 843b16817b6SDave Chinner .work = &xfs_btroot_init, 844b16817b6SDave Chinner .type = XFS_BTNUM_INO, 845b16817b6SDave Chinner .need_init = true 846b16817b6SDave Chinner }, 847b16817b6SDave Chinner { /* FINO root block */ 848b16817b6SDave Chinner .daddr = XFS_AGB_TO_DADDR(mp, id->agno, XFS_FIBT_BLOCK(mp)), 849b16817b6SDave Chinner .numblks = BTOBB(mp->m_sb.sb_blocksize), 85001e68f40SBrian Foster .ops = &xfs_finobt_buf_ops, 851b16817b6SDave Chinner .work = &xfs_btroot_init, 852b16817b6SDave Chinner .type = XFS_BTNUM_FINO, 85338c26bfdSDave Chinner .need_init = xfs_has_finobt(mp) 854b16817b6SDave Chinner }, 855b16817b6SDave Chinner { /* RMAP root block */ 856b16817b6SDave Chinner .daddr = XFS_AGB_TO_DADDR(mp, id->agno, XFS_RMAP_BLOCK(mp)), 857b16817b6SDave Chinner .numblks = BTOBB(mp->m_sb.sb_blocksize), 858b16817b6SDave Chinner .ops = &xfs_rmapbt_buf_ops, 859b16817b6SDave Chinner .work = &xfs_rmaproot_init, 86038c26bfdSDave Chinner .need_init = xfs_has_rmapbt(mp) 861b16817b6SDave Chinner }, 862b16817b6SDave Chinner { /* REFC root block */ 863b16817b6SDave Chinner .daddr = XFS_AGB_TO_DADDR(mp, id->agno, xfs_refc_block(mp)), 864b16817b6SDave Chinner .numblks = BTOBB(mp->m_sb.sb_blocksize), 865b16817b6SDave Chinner .ops = &xfs_refcountbt_buf_ops, 866b16817b6SDave Chinner .work = &xfs_btroot_init, 867b16817b6SDave Chinner .type = XFS_BTNUM_REFC, 86838c26bfdSDave Chinner .need_init = xfs_has_reflink(mp) 869b16817b6SDave Chinner }, 870b16817b6SDave Chinner { /* NULL terminating block */ 871b16817b6SDave Chinner .daddr = XFS_BUF_DADDR_NULL, 872b16817b6SDave Chinner } 873b16817b6SDave Chinner }; 874b16817b6SDave Chinner struct xfs_aghdr_grow_data *dp; 875b16817b6SDave Chinner int error = 0; 876b16817b6SDave Chinner 877b16817b6SDave Chinner /* Account for AG free space in new AG */ 878b16817b6SDave Chinner id->nfree += id->agsize - mp->m_ag_prealloc_blocks; 879b16817b6SDave Chinner for (dp = &aghdr_data[0]; dp->daddr != XFS_BUF_DADDR_NULL; dp++) { 880b16817b6SDave Chinner if (!dp->need_init) 881b16817b6SDave Chinner continue; 882b16817b6SDave Chinner 883b16817b6SDave Chinner id->daddr = dp->daddr; 884b16817b6SDave Chinner id->numblks = dp->numblks; 885b16817b6SDave Chinner id->type = dp->type; 886b16817b6SDave Chinner error = xfs_ag_init_hdr(mp, id, dp->work, dp->ops); 887b16817b6SDave Chinner if (error) 888b16817b6SDave Chinner break; 889b16817b6SDave Chinner } 890b16817b6SDave Chinner return error; 891b16817b6SDave Chinner } 89249dd56f2SDave Chinner 89346141dc8SGao Xiang int 89446141dc8SGao Xiang xfs_ag_shrink_space( 895c6aee248SDave Chinner struct xfs_perag *pag, 89646141dc8SGao Xiang struct xfs_trans **tpp, 89746141dc8SGao Xiang xfs_extlen_t delta) 89846141dc8SGao Xiang { 899c6aee248SDave Chinner struct xfs_mount *mp = pag->pag_mount; 90046141dc8SGao Xiang struct xfs_alloc_arg args = { 90146141dc8SGao Xiang .tp = *tpp, 90246141dc8SGao Xiang .mp = mp, 90374c36a86SDave Chinner .pag = pag, 90446141dc8SGao Xiang .minlen = delta, 90546141dc8SGao Xiang .maxlen = delta, 90646141dc8SGao Xiang .oinfo = XFS_RMAP_OINFO_SKIP_UPDATE, 90746141dc8SGao Xiang .resv = XFS_AG_RESV_NONE, 90846141dc8SGao Xiang .prod = 1 90946141dc8SGao Xiang }; 91046141dc8SGao Xiang struct xfs_buf *agibp, *agfbp; 91146141dc8SGao Xiang struct xfs_agi *agi; 91246141dc8SGao Xiang struct xfs_agf *agf; 913a8f3522cSDarrick J. Wong xfs_agblock_t aglen; 91446141dc8SGao Xiang int error, err2; 91546141dc8SGao Xiang 916c6aee248SDave Chinner ASSERT(pag->pag_agno == mp->m_sb.sb_agcount - 1); 91799b13c7fSDave Chinner error = xfs_ialloc_read_agi(pag, *tpp, &agibp); 91846141dc8SGao Xiang if (error) 91946141dc8SGao Xiang return error; 92046141dc8SGao Xiang 92146141dc8SGao Xiang agi = agibp->b_addr; 92246141dc8SGao Xiang 92308d3e84fSDave Chinner error = xfs_alloc_read_agf(pag, *tpp, 0, &agfbp); 92446141dc8SGao Xiang if (error) 92546141dc8SGao Xiang return error; 92646141dc8SGao Xiang 92746141dc8SGao Xiang agf = agfbp->b_addr; 928a8f3522cSDarrick J. Wong aglen = be32_to_cpu(agi->agi_length); 92946141dc8SGao Xiang /* some extra paranoid checks before we shrink the ag */ 93046141dc8SGao Xiang if (XFS_IS_CORRUPT(mp, agf->agf_length != agi->agi_length)) 93146141dc8SGao Xiang return -EFSCORRUPTED; 932a8f3522cSDarrick J. Wong if (delta >= aglen) 93346141dc8SGao Xiang return -EINVAL; 93446141dc8SGao Xiang 93546141dc8SGao Xiang /* 936da062d16SDarrick J. Wong * Make sure that the last inode cluster cannot overlap with the new 937da062d16SDarrick J. Wong * end of the AG, even if it's sparse. 938da062d16SDarrick J. Wong */ 939dedab3e4SDave Chinner error = xfs_ialloc_check_shrink(pag, *tpp, agibp, aglen - delta); 940da062d16SDarrick J. Wong if (error) 941da062d16SDarrick J. Wong return error; 942da062d16SDarrick J. Wong 943da062d16SDarrick J. Wong /* 94446141dc8SGao Xiang * Disable perag reservations so it doesn't cause the allocation request 94546141dc8SGao Xiang * to fail. We'll reestablish reservation before we return. 94646141dc8SGao Xiang */ 94799b13c7fSDave Chinner error = xfs_ag_resv_free(pag); 94846141dc8SGao Xiang if (error) 94946141dc8SGao Xiang return error; 95046141dc8SGao Xiang 95146141dc8SGao Xiang /* internal log shouldn't also show up in the free space btrees */ 9525f36b2ceSDave Chinner error = xfs_alloc_vextent_exact_bno(&args, 9535f36b2ceSDave Chinner XFS_AGB_TO_FSB(mp, pag->pag_agno, aglen - delta)); 95446141dc8SGao Xiang if (!error && args.agbno == NULLAGBLOCK) 95546141dc8SGao Xiang error = -ENOSPC; 95646141dc8SGao Xiang 95746141dc8SGao Xiang if (error) { 95846141dc8SGao Xiang /* 95946141dc8SGao Xiang * if extent allocation fails, need to roll the transaction to 96046141dc8SGao Xiang * ensure that the AGFL fixup has been committed anyway. 96146141dc8SGao Xiang */ 96246141dc8SGao Xiang xfs_trans_bhold(*tpp, agfbp); 96346141dc8SGao Xiang err2 = xfs_trans_roll(tpp); 96446141dc8SGao Xiang if (err2) 96546141dc8SGao Xiang return err2; 96646141dc8SGao Xiang xfs_trans_bjoin(*tpp, agfbp); 96746141dc8SGao Xiang goto resv_init_out; 96846141dc8SGao Xiang } 96946141dc8SGao Xiang 97046141dc8SGao Xiang /* 97146141dc8SGao Xiang * if successfully deleted from freespace btrees, need to confirm 97246141dc8SGao Xiang * per-AG reservation works as expected. 97346141dc8SGao Xiang */ 97446141dc8SGao Xiang be32_add_cpu(&agi->agi_length, -delta); 97546141dc8SGao Xiang be32_add_cpu(&agf->agf_length, -delta); 97646141dc8SGao Xiang 97799b13c7fSDave Chinner err2 = xfs_ag_resv_init(pag, *tpp); 97846141dc8SGao Xiang if (err2) { 97946141dc8SGao Xiang be32_add_cpu(&agi->agi_length, delta); 98046141dc8SGao Xiang be32_add_cpu(&agf->agf_length, delta); 98146141dc8SGao Xiang if (err2 != -ENOSPC) 98246141dc8SGao Xiang goto resv_err; 98346141dc8SGao Xiang 984c201d9caSDarrick J. Wong __xfs_free_extent_later(*tpp, args.fsbno, delta, NULL, true); 98546141dc8SGao Xiang 98646141dc8SGao Xiang /* 98746141dc8SGao Xiang * Roll the transaction before trying to re-init the per-ag 98846141dc8SGao Xiang * reservation. The new transaction is clean so it will cancel 98946141dc8SGao Xiang * without any side effects. 99046141dc8SGao Xiang */ 99146141dc8SGao Xiang error = xfs_defer_finish(tpp); 99246141dc8SGao Xiang if (error) 99346141dc8SGao Xiang return error; 99446141dc8SGao Xiang 99546141dc8SGao Xiang error = -ENOSPC; 99646141dc8SGao Xiang goto resv_init_out; 99746141dc8SGao Xiang } 99846141dc8SGao Xiang xfs_ialloc_log_agi(*tpp, agibp, XFS_AGI_LENGTH); 99946141dc8SGao Xiang xfs_alloc_log_agf(*tpp, agfbp, XFS_AGF_LENGTH); 100046141dc8SGao Xiang return 0; 100199b13c7fSDave Chinner 100246141dc8SGao Xiang resv_init_out: 100399b13c7fSDave Chinner err2 = xfs_ag_resv_init(pag, *tpp); 100446141dc8SGao Xiang if (!err2) 100546141dc8SGao Xiang return error; 100646141dc8SGao Xiang resv_err: 100746141dc8SGao Xiang xfs_warn(mp, "Error %d reserving per-AG metadata reserve pool.", err2); 100846141dc8SGao Xiang xfs_force_shutdown(mp, SHUTDOWN_CORRUPT_INCORE); 100946141dc8SGao Xiang return err2; 101046141dc8SGao Xiang } 101146141dc8SGao Xiang 101249dd56f2SDave Chinner /* 101349dd56f2SDave Chinner * Extent the AG indicated by the @id by the length passed in 101449dd56f2SDave Chinner */ 101549dd56f2SDave Chinner int 101649dd56f2SDave Chinner xfs_ag_extend_space( 1017c6aee248SDave Chinner struct xfs_perag *pag, 101849dd56f2SDave Chinner struct xfs_trans *tp, 101949dd56f2SDave Chinner xfs_extlen_t len) 102049dd56f2SDave Chinner { 102149dd56f2SDave Chinner struct xfs_buf *bp; 102249dd56f2SDave Chinner struct xfs_agi *agi; 102349dd56f2SDave Chinner struct xfs_agf *agf; 102449dd56f2SDave Chinner int error; 102549dd56f2SDave Chinner 1026c6aee248SDave Chinner ASSERT(pag->pag_agno == pag->pag_mount->m_sb.sb_agcount - 1); 1027c6aee248SDave Chinner 102899b13c7fSDave Chinner error = xfs_ialloc_read_agi(pag, tp, &bp); 102949dd56f2SDave Chinner if (error) 103049dd56f2SDave Chinner return error; 103149dd56f2SDave Chinner 1032370c782bSChristoph Hellwig agi = bp->b_addr; 103349dd56f2SDave Chinner be32_add_cpu(&agi->agi_length, len); 103449dd56f2SDave Chinner xfs_ialloc_log_agi(tp, bp, XFS_AGI_LENGTH); 103549dd56f2SDave Chinner 103649dd56f2SDave Chinner /* 103749dd56f2SDave Chinner * Change agf length. 103849dd56f2SDave Chinner */ 103908d3e84fSDave Chinner error = xfs_alloc_read_agf(pag, tp, 0, &bp); 104049dd56f2SDave Chinner if (error) 104149dd56f2SDave Chinner return error; 104249dd56f2SDave Chinner 10439798f615SChristoph Hellwig agf = bp->b_addr; 104449dd56f2SDave Chinner be32_add_cpu(&agf->agf_length, len); 104549dd56f2SDave Chinner ASSERT(agf->agf_length == agi->agi_length); 104649dd56f2SDave Chinner xfs_alloc_log_agf(tp, bp, XFS_AGF_LENGTH); 104749dd56f2SDave Chinner 104849dd56f2SDave Chinner /* 104949dd56f2SDave Chinner * Free the new space. 105049dd56f2SDave Chinner * 10517280fedaSDarrick J. Wong * XFS_RMAP_OINFO_SKIP_UPDATE is used here to tell the rmap btree that 105249dd56f2SDave Chinner * this doesn't actually exist in the rmap btree. 105349dd56f2SDave Chinner */ 1054c6aee248SDave Chinner error = xfs_rmap_free(tp, bp, pag, be32_to_cpu(agf->agf_length) - len, 10557280fedaSDarrick J. Wong len, &XFS_RMAP_OINFO_SKIP_UPDATE); 105649dd56f2SDave Chinner if (error) 105749dd56f2SDave Chinner return error; 105849dd56f2SDave Chinner 1059b2ccab31SDarrick J. Wong error = xfs_free_extent(tp, pag, be32_to_cpu(agf->agf_length) - len, 1060b2ccab31SDarrick J. Wong len, &XFS_RMAP_OINFO_SKIP_UPDATE, XFS_AG_RESV_NONE); 10610800169eSDave Chinner if (error) 10620800169eSDave Chinner return error; 10630800169eSDave Chinner 10640800169eSDave Chinner /* Update perag geometry */ 10650800169eSDave Chinner pag->block_count = be32_to_cpu(agf->agf_length); 10662d6ca832SDave Chinner __xfs_agino_range(pag->pag_mount, pag->block_count, &pag->agino_min, 10672d6ca832SDave Chinner &pag->agino_max); 10680800169eSDave Chinner return 0; 106949dd56f2SDave Chinner } 10707cd5006bSDarrick J. Wong 10717cd5006bSDarrick J. Wong /* Retrieve AG geometry. */ 10727cd5006bSDarrick J. Wong int 10737cd5006bSDarrick J. Wong xfs_ag_get_geometry( 1074c6aee248SDave Chinner struct xfs_perag *pag, 10757cd5006bSDarrick J. Wong struct xfs_ag_geometry *ageo) 10767cd5006bSDarrick J. Wong { 10777cd5006bSDarrick J. Wong struct xfs_buf *agi_bp; 10787cd5006bSDarrick J. Wong struct xfs_buf *agf_bp; 10797cd5006bSDarrick J. Wong struct xfs_agi *agi; 10807cd5006bSDarrick J. Wong struct xfs_agf *agf; 10817cd5006bSDarrick J. Wong unsigned int freeblks; 10827cd5006bSDarrick J. Wong int error; 10837cd5006bSDarrick J. Wong 10847cd5006bSDarrick J. Wong /* Lock the AG headers. */ 108599b13c7fSDave Chinner error = xfs_ialloc_read_agi(pag, NULL, &agi_bp); 10867cd5006bSDarrick J. Wong if (error) 10877cd5006bSDarrick J. Wong return error; 108808d3e84fSDave Chinner error = xfs_alloc_read_agf(pag, NULL, 0, &agf_bp); 10897cd5006bSDarrick J. Wong if (error) 10907cd5006bSDarrick J. Wong goto out_agi; 109192a00544SGao Xiang 10927cd5006bSDarrick J. Wong /* Fill out form. */ 10937cd5006bSDarrick J. Wong memset(ageo, 0, sizeof(*ageo)); 1094c6aee248SDave Chinner ageo->ag_number = pag->pag_agno; 10957cd5006bSDarrick J. Wong 1096370c782bSChristoph Hellwig agi = agi_bp->b_addr; 10977cd5006bSDarrick J. Wong ageo->ag_icount = be32_to_cpu(agi->agi_count); 10987cd5006bSDarrick J. Wong ageo->ag_ifree = be32_to_cpu(agi->agi_freecount); 10997cd5006bSDarrick J. Wong 11009798f615SChristoph Hellwig agf = agf_bp->b_addr; 11017cd5006bSDarrick J. Wong ageo->ag_length = be32_to_cpu(agf->agf_length); 11027cd5006bSDarrick J. Wong freeblks = pag->pagf_freeblks + 11037cd5006bSDarrick J. Wong pag->pagf_flcount + 11047cd5006bSDarrick J. Wong pag->pagf_btreeblks - 11057cd5006bSDarrick J. Wong xfs_ag_resv_needed(pag, XFS_AG_RESV_NONE); 11067cd5006bSDarrick J. Wong ageo->ag_freeblks = freeblks; 11071302c6a2SDarrick J. Wong xfs_ag_geom_health(pag, ageo); 11087cd5006bSDarrick J. Wong 11097cd5006bSDarrick J. Wong /* Release resources. */ 11107cd5006bSDarrick J. Wong xfs_buf_relse(agf_bp); 11117cd5006bSDarrick J. Wong out_agi: 11127cd5006bSDarrick J. Wong xfs_buf_relse(agi_bp); 11137cd5006bSDarrick J. Wong return error; 11147cd5006bSDarrick J. Wong } 1115