10b61f8a4SDave Chinner // SPDX-License-Identifier: GPL-2.0 230f712c9SDave Chinner /* 330f712c9SDave Chinner * Copyright (c) 2000-2003,2005 Silicon Graphics, Inc. 430f712c9SDave Chinner * All Rights Reserved. 530f712c9SDave Chinner */ 630f712c9SDave Chinner #include "xfs.h" 730f712c9SDave Chinner #include "xfs_fs.h" 830f712c9SDave Chinner #include "xfs_shared.h" 930f712c9SDave Chinner #include "xfs_format.h" 1030f712c9SDave Chinner #include "xfs_log_format.h" 1130f712c9SDave Chinner #include "xfs_trans_resv.h" 1230f712c9SDave Chinner #include "xfs_bit.h" 1330f712c9SDave Chinner #include "xfs_mount.h" 1430f712c9SDave Chinner #include "xfs_inode.h" 1530f712c9SDave Chinner #include "xfs_trans.h" 1630f712c9SDave Chinner #include "xfs_alloc.h" 1730f712c9SDave Chinner #include "xfs_btree.h" 1830f712c9SDave Chinner #include "xfs_bmap_btree.h" 1930f712c9SDave Chinner #include "xfs_bmap.h" 2030f712c9SDave Chinner #include "xfs_error.h" 2130f712c9SDave Chinner #include "xfs_quota.h" 2230f712c9SDave Chinner #include "xfs_trace.h" 23340785ccSDarrick J. Wong #include "xfs_rmap.h" 2474c36a86SDave Chinner #include "xfs_ag.h" 2530f712c9SDave Chinner 26e7720afaSDarrick J. Wong static struct kmem_cache *xfs_bmbt_cur_cache; 279fa47bdcSDarrick J. Wong 2830f712c9SDave Chinner /* 2930f712c9SDave Chinner * Convert on-disk form of btree root to in-memory form. 3030f712c9SDave Chinner */ 3130f712c9SDave Chinner void 3230f712c9SDave Chinner xfs_bmdr_to_bmbt( 3330f712c9SDave Chinner struct xfs_inode *ip, 3430f712c9SDave Chinner xfs_bmdr_block_t *dblock, 3530f712c9SDave Chinner int dblocklen, 3630f712c9SDave Chinner struct xfs_btree_block *rblock, 3730f712c9SDave Chinner int rblocklen) 3830f712c9SDave Chinner { 3930f712c9SDave Chinner struct xfs_mount *mp = ip->i_mount; 4030f712c9SDave Chinner int dmxr; 4130f712c9SDave Chinner xfs_bmbt_key_t *fkp; 4230f712c9SDave Chinner __be64 *fpp; 4330f712c9SDave Chinner xfs_bmbt_key_t *tkp; 4430f712c9SDave Chinner __be64 *tpp; 4530f712c9SDave Chinner 4630f712c9SDave Chinner xfs_btree_init_block_int(mp, rblock, XFS_BUF_DADDR_NULL, 47b6f41e44SEric Sandeen XFS_BTNUM_BMAP, 0, 0, ip->i_ino, 48f88ae46bSEric Sandeen XFS_BTREE_LONG_PTRS); 4930f712c9SDave Chinner rblock->bb_level = dblock->bb_level; 5030f712c9SDave Chinner ASSERT(be16_to_cpu(rblock->bb_level) > 0); 5130f712c9SDave Chinner rblock->bb_numrecs = dblock->bb_numrecs; 5230f712c9SDave Chinner dmxr = xfs_bmdr_maxrecs(dblocklen, 0); 5330f712c9SDave Chinner fkp = XFS_BMDR_KEY_ADDR(dblock, 1); 5430f712c9SDave Chinner tkp = XFS_BMBT_KEY_ADDR(mp, rblock, 1); 5530f712c9SDave Chinner fpp = XFS_BMDR_PTR_ADDR(dblock, 1, dmxr); 5630f712c9SDave Chinner tpp = XFS_BMAP_BROOT_PTR_ADDR(mp, rblock, 1, rblocklen); 5730f712c9SDave Chinner dmxr = be16_to_cpu(dblock->bb_numrecs); 5830f712c9SDave Chinner memcpy(tkp, fkp, sizeof(*fkp) * dmxr); 5930f712c9SDave Chinner memcpy(tpp, fpp, sizeof(*fpp) * dmxr); 6030f712c9SDave Chinner } 6130f712c9SDave Chinner 6230f712c9SDave Chinner void 636bdcf26aSChristoph Hellwig xfs_bmbt_disk_get_all( 6422ece4e8SDarrick J. Wong const struct xfs_bmbt_rec *rec, 656bdcf26aSChristoph Hellwig struct xfs_bmbt_irec *irec) 6630f712c9SDave Chinner { 676bdcf26aSChristoph Hellwig uint64_t l0 = get_unaligned_be64(&rec->l0); 686bdcf26aSChristoph Hellwig uint64_t l1 = get_unaligned_be64(&rec->l1); 6930f712c9SDave Chinner 706bdcf26aSChristoph Hellwig irec->br_startoff = (l0 & xfs_mask64lo(64 - BMBT_EXNTFLAG_BITLEN)) >> 9; 716bdcf26aSChristoph Hellwig irec->br_startblock = ((l0 & xfs_mask64lo(9)) << 43) | (l1 >> 21); 726bdcf26aSChristoph Hellwig irec->br_blockcount = l1 & xfs_mask64lo(21); 736bdcf26aSChristoph Hellwig if (l0 >> (64 - BMBT_EXNTFLAG_BITLEN)) 746bdcf26aSChristoph Hellwig irec->br_state = XFS_EXT_UNWRITTEN; 756bdcf26aSChristoph Hellwig else 766bdcf26aSChristoph Hellwig irec->br_state = XFS_EXT_NORM; 7730f712c9SDave Chinner } 7830f712c9SDave Chinner 7930f712c9SDave Chinner /* 8030f712c9SDave Chinner * Extract the blockcount field from an on disk bmap extent record. 8130f712c9SDave Chinner */ 8230f712c9SDave Chinner xfs_filblks_t 8330f712c9SDave Chinner xfs_bmbt_disk_get_blockcount( 8423825cd1SDarrick J. Wong const struct xfs_bmbt_rec *r) 8530f712c9SDave Chinner { 8630f712c9SDave Chinner return (xfs_filblks_t)(be64_to_cpu(r->l1) & xfs_mask64lo(21)); 8730f712c9SDave Chinner } 8830f712c9SDave Chinner 8930f712c9SDave Chinner /* 9030f712c9SDave Chinner * Extract the startoff field from a disk format bmap extent record. 9130f712c9SDave Chinner */ 9230f712c9SDave Chinner xfs_fileoff_t 9330f712c9SDave Chinner xfs_bmbt_disk_get_startoff( 9423825cd1SDarrick J. Wong const struct xfs_bmbt_rec *r) 9530f712c9SDave Chinner { 9630f712c9SDave Chinner return ((xfs_fileoff_t)be64_to_cpu(r->l0) & 9730f712c9SDave Chinner xfs_mask64lo(64 - BMBT_EXNTFLAG_BITLEN)) >> 9; 9830f712c9SDave Chinner } 9930f712c9SDave Chinner 10030f712c9SDave Chinner /* 10130f712c9SDave Chinner * Set all the fields in a bmap extent record from the uncompressed form. 10230f712c9SDave Chinner */ 10330f712c9SDave Chinner void 10430f712c9SDave Chinner xfs_bmbt_disk_set_all( 105a67d00a5SChristoph Hellwig struct xfs_bmbt_rec *r, 106a67d00a5SChristoph Hellwig struct xfs_bmbt_irec *s) 10730f712c9SDave Chinner { 108a67d00a5SChristoph Hellwig int extent_flag = (s->br_state != XFS_EXT_NORM); 109a67d00a5SChristoph Hellwig 110a67d00a5SChristoph Hellwig ASSERT(s->br_state == XFS_EXT_NORM || s->br_state == XFS_EXT_UNWRITTEN); 111a67d00a5SChristoph Hellwig ASSERT(!(s->br_startoff & xfs_mask64hi(64-BMBT_STARTOFF_BITLEN))); 112a67d00a5SChristoph Hellwig ASSERT(!(s->br_blockcount & xfs_mask64hi(64-BMBT_BLOCKCOUNT_BITLEN))); 113a67d00a5SChristoph Hellwig ASSERT(!(s->br_startblock & xfs_mask64hi(64-BMBT_STARTBLOCK_BITLEN))); 114a67d00a5SChristoph Hellwig 115135dcc10SChristoph Hellwig put_unaligned_be64( 116a67d00a5SChristoph Hellwig ((xfs_bmbt_rec_base_t)extent_flag << 63) | 117a67d00a5SChristoph Hellwig ((xfs_bmbt_rec_base_t)s->br_startoff << 9) | 118135dcc10SChristoph Hellwig ((xfs_bmbt_rec_base_t)s->br_startblock >> 43), &r->l0); 119135dcc10SChristoph Hellwig put_unaligned_be64( 120a67d00a5SChristoph Hellwig ((xfs_bmbt_rec_base_t)s->br_startblock << 21) | 121a67d00a5SChristoph Hellwig ((xfs_bmbt_rec_base_t)s->br_blockcount & 122135dcc10SChristoph Hellwig (xfs_bmbt_rec_base_t)xfs_mask64lo(21)), &r->l1); 12330f712c9SDave Chinner } 12430f712c9SDave Chinner 12530f712c9SDave Chinner /* 12630f712c9SDave Chinner * Convert in-memory form of btree root to on-disk form. 12730f712c9SDave Chinner */ 12830f712c9SDave Chinner void 12930f712c9SDave Chinner xfs_bmbt_to_bmdr( 13030f712c9SDave Chinner struct xfs_mount *mp, 13130f712c9SDave Chinner struct xfs_btree_block *rblock, 13230f712c9SDave Chinner int rblocklen, 13330f712c9SDave Chinner xfs_bmdr_block_t *dblock, 13430f712c9SDave Chinner int dblocklen) 13530f712c9SDave Chinner { 13630f712c9SDave Chinner int dmxr; 13730f712c9SDave Chinner xfs_bmbt_key_t *fkp; 13830f712c9SDave Chinner __be64 *fpp; 13930f712c9SDave Chinner xfs_bmbt_key_t *tkp; 14030f712c9SDave Chinner __be64 *tpp; 14130f712c9SDave Chinner 14238c26bfdSDave Chinner if (xfs_has_crc(mp)) { 14330f712c9SDave Chinner ASSERT(rblock->bb_magic == cpu_to_be32(XFS_BMAP_CRC_MAGIC)); 144ce748eaaSEric Sandeen ASSERT(uuid_equal(&rblock->bb_u.l.bb_uuid, 145ce748eaaSEric Sandeen &mp->m_sb.sb_meta_uuid)); 14630f712c9SDave Chinner ASSERT(rblock->bb_u.l.bb_blkno == 14730f712c9SDave Chinner cpu_to_be64(XFS_BUF_DADDR_NULL)); 14830f712c9SDave Chinner } else 14930f712c9SDave Chinner ASSERT(rblock->bb_magic == cpu_to_be32(XFS_BMAP_MAGIC)); 150d5cf09baSChristoph Hellwig ASSERT(rblock->bb_u.l.bb_leftsib == cpu_to_be64(NULLFSBLOCK)); 151d5cf09baSChristoph Hellwig ASSERT(rblock->bb_u.l.bb_rightsib == cpu_to_be64(NULLFSBLOCK)); 15230f712c9SDave Chinner ASSERT(rblock->bb_level != 0); 15330f712c9SDave Chinner dblock->bb_level = rblock->bb_level; 15430f712c9SDave Chinner dblock->bb_numrecs = rblock->bb_numrecs; 15530f712c9SDave Chinner dmxr = xfs_bmdr_maxrecs(dblocklen, 0); 15630f712c9SDave Chinner fkp = XFS_BMBT_KEY_ADDR(mp, rblock, 1); 15730f712c9SDave Chinner tkp = XFS_BMDR_KEY_ADDR(dblock, 1); 15830f712c9SDave Chinner fpp = XFS_BMAP_BROOT_PTR_ADDR(mp, rblock, 1, rblocklen); 15930f712c9SDave Chinner tpp = XFS_BMDR_PTR_ADDR(dblock, 1, dmxr); 16030f712c9SDave Chinner dmxr = be16_to_cpu(dblock->bb_numrecs); 16130f712c9SDave Chinner memcpy(tkp, fkp, sizeof(*fkp) * dmxr); 16230f712c9SDave Chinner memcpy(tpp, fpp, sizeof(*fpp) * dmxr); 16330f712c9SDave Chinner } 16430f712c9SDave Chinner 16530f712c9SDave Chinner STATIC struct xfs_btree_cur * 16630f712c9SDave Chinner xfs_bmbt_dup_cursor( 16730f712c9SDave Chinner struct xfs_btree_cur *cur) 16830f712c9SDave Chinner { 16930f712c9SDave Chinner struct xfs_btree_cur *new; 17030f712c9SDave Chinner 17130f712c9SDave Chinner new = xfs_bmbt_init_cursor(cur->bc_mp, cur->bc_tp, 17292219c29SDave Chinner cur->bc_ino.ip, cur->bc_ino.whichfork); 17330f712c9SDave Chinner 17430f712c9SDave Chinner /* 1752c3234d1SDarrick J. Wong * Copy the firstblock, dfops, and flags values, 17630f712c9SDave Chinner * since init cursor doesn't get them. 17730f712c9SDave Chinner */ 17892219c29SDave Chinner new->bc_ino.flags = cur->bc_ino.flags; 17930f712c9SDave Chinner 18030f712c9SDave Chinner return new; 18130f712c9SDave Chinner } 18230f712c9SDave Chinner 18330f712c9SDave Chinner STATIC void 18430f712c9SDave Chinner xfs_bmbt_update_cursor( 18530f712c9SDave Chinner struct xfs_btree_cur *src, 18630f712c9SDave Chinner struct xfs_btree_cur *dst) 18730f712c9SDave Chinner { 188692b6cddSDave Chinner ASSERT((dst->bc_tp->t_highest_agno != NULLAGNUMBER) || 189db07349dSChristoph Hellwig (dst->bc_ino.ip->i_diflags & XFS_DIFLAG_REALTIME)); 19030f712c9SDave Chinner 19192219c29SDave Chinner dst->bc_ino.allocated += src->bc_ino.allocated; 192692b6cddSDave Chinner dst->bc_tp->t_highest_agno = src->bc_tp->t_highest_agno; 19330f712c9SDave Chinner 19492219c29SDave Chinner src->bc_ino.allocated = 0; 19530f712c9SDave Chinner } 19630f712c9SDave Chinner 19730f712c9SDave Chinner STATIC int 19830f712c9SDave Chinner xfs_bmbt_alloc_block( 19930f712c9SDave Chinner struct xfs_btree_cur *cur, 200deb06b9aSDarrick J. Wong const union xfs_btree_ptr *start, 20130f712c9SDave Chinner union xfs_btree_ptr *new, 20230f712c9SDave Chinner int *stat) 20330f712c9SDave Chinner { 20474c36a86SDave Chinner struct xfs_alloc_arg args; 20574c36a86SDave Chinner int error; 20630f712c9SDave Chinner 20730f712c9SDave Chinner memset(&args, 0, sizeof(args)); 20830f712c9SDave Chinner args.tp = cur->bc_tp; 20930f712c9SDave Chinner args.mp = cur->bc_mp; 21092219c29SDave Chinner xfs_rmap_ino_bmbt_owner(&args.oinfo, cur->bc_ino.ip->i_ino, 21192219c29SDave Chinner cur->bc_ino.whichfork); 21274c36a86SDave Chinner args.minlen = args.maxlen = args.prod = 1; 21374c36a86SDave Chinner args.wasdel = cur->bc_ino.flags & XFS_BTCUR_BMBT_WASDEL; 21474c36a86SDave Chinner if (!args.wasdel && args.tp->t_blk_res == 0) 21574c36a86SDave Chinner return -ENOSPC; 21630f712c9SDave Chinner 21730f712c9SDave Chinner /* 218d5753847SDave Chinner * If we are coming here from something like unwritten extent 21936b6ad2dSDave Chinner * conversion, there has been no data extent allocation already done, so 22036b6ad2dSDave Chinner * we have to ensure that we attempt to locate the entire set of bmbt 22136b6ad2dSDave Chinner * allocations in the same AG, as xfs_bmapi_write() would have reserved. 22230f712c9SDave Chinner */ 223692b6cddSDave Chinner if (cur->bc_tp->t_highest_agno == NULLAGNUMBER) 224d5753847SDave Chinner args.minleft = xfs_bmapi_minleft(cur->bc_tp, cur->bc_ino.ip, 225d5753847SDave Chinner cur->bc_ino.whichfork); 22630f712c9SDave Chinner 2272a7f6d41SDave Chinner error = xfs_alloc_vextent_start_ag(&args, be64_to_cpu(start->l)); 22830f712c9SDave Chinner if (error) 22974c36a86SDave Chinner return error; 23030f712c9SDave Chinner 23130f712c9SDave Chinner if (args.fsbno == NULLFSBLOCK && args.minleft) { 23230f712c9SDave Chinner /* 23330f712c9SDave Chinner * Could not find an AG with enough free space to satisfy 234255c5162SChristoph Hellwig * a full btree split. Try again and if 23530f712c9SDave Chinner * successful activate the lowspace algorithm. 23630f712c9SDave Chinner */ 237d5753847SDave Chinner args.minleft = 0; 2382a7f6d41SDave Chinner error = xfs_alloc_vextent_start_ag(&args, 0); 23930f712c9SDave Chinner if (error) 24074c36a86SDave Chinner return error; 2411214f1cfSBrian Foster cur->bc_tp->t_flags |= XFS_TRANS_LOWMODE; 24230f712c9SDave Chinner } 2432fcc319dSChristoph Hellwig if (WARN_ON_ONCE(args.fsbno == NULLFSBLOCK)) { 24430f712c9SDave Chinner *stat = 0; 24530f712c9SDave Chinner return 0; 24630f712c9SDave Chinner } 247e157ebdcSCarlos Maiolino 24830f712c9SDave Chinner ASSERT(args.len == 1); 24992219c29SDave Chinner cur->bc_ino.allocated++; 2506e73a545SChristoph Hellwig cur->bc_ino.ip->i_nblocks++; 25192219c29SDave Chinner xfs_trans_log_inode(args.tp, cur->bc_ino.ip, XFS_ILOG_CORE); 25292219c29SDave Chinner xfs_trans_mod_dquot_byino(args.tp, cur->bc_ino.ip, 25330f712c9SDave Chinner XFS_TRANS_DQ_BCOUNT, 1L); 25430f712c9SDave Chinner 25530f712c9SDave Chinner new->l = cpu_to_be64(args.fsbno); 25630f712c9SDave Chinner 25730f712c9SDave Chinner *stat = 1; 25830f712c9SDave Chinner return 0; 25930f712c9SDave Chinner } 26030f712c9SDave Chinner 26130f712c9SDave Chinner STATIC int 26230f712c9SDave Chinner xfs_bmbt_free_block( 26330f712c9SDave Chinner struct xfs_btree_cur *cur, 26430f712c9SDave Chinner struct xfs_buf *bp) 26530f712c9SDave Chinner { 26630f712c9SDave Chinner struct xfs_mount *mp = cur->bc_mp; 26792219c29SDave Chinner struct xfs_inode *ip = cur->bc_ino.ip; 26830f712c9SDave Chinner struct xfs_trans *tp = cur->bc_tp; 26904fcad80SDave Chinner xfs_fsblock_t fsbno = XFS_DADDR_TO_FSB(mp, xfs_buf_daddr(bp)); 270340785ccSDarrick J. Wong struct xfs_owner_info oinfo; 27130f712c9SDave Chinner 27292219c29SDave Chinner xfs_rmap_ino_bmbt_owner(&oinfo, ip->i_ino, cur->bc_ino.whichfork); 273c201d9caSDarrick J. Wong xfs_free_extent_later(cur->bc_tp, fsbno, 1, &oinfo); 2746e73a545SChristoph Hellwig ip->i_nblocks--; 27530f712c9SDave Chinner 27630f712c9SDave Chinner xfs_trans_log_inode(tp, ip, XFS_ILOG_CORE); 27730f712c9SDave Chinner xfs_trans_mod_dquot_byino(tp, ip, XFS_TRANS_DQ_BCOUNT, -1L); 27830f712c9SDave Chinner return 0; 27930f712c9SDave Chinner } 28030f712c9SDave Chinner 28130f712c9SDave Chinner STATIC int 28230f712c9SDave Chinner xfs_bmbt_get_minrecs( 28330f712c9SDave Chinner struct xfs_btree_cur *cur, 28430f712c9SDave Chinner int level) 28530f712c9SDave Chinner { 28630f712c9SDave Chinner if (level == cur->bc_nlevels - 1) { 28730f712c9SDave Chinner struct xfs_ifork *ifp; 28830f712c9SDave Chinner 289732436efSDarrick J. Wong ifp = xfs_ifork_ptr(cur->bc_ino.ip, 29092219c29SDave Chinner cur->bc_ino.whichfork); 29130f712c9SDave Chinner 29230f712c9SDave Chinner return xfs_bmbt_maxrecs(cur->bc_mp, 29330f712c9SDave Chinner ifp->if_broot_bytes, level == 0) / 2; 29430f712c9SDave Chinner } 29530f712c9SDave Chinner 29630f712c9SDave Chinner return cur->bc_mp->m_bmap_dmnr[level != 0]; 29730f712c9SDave Chinner } 29830f712c9SDave Chinner 29930f712c9SDave Chinner int 30030f712c9SDave Chinner xfs_bmbt_get_maxrecs( 30130f712c9SDave Chinner struct xfs_btree_cur *cur, 30230f712c9SDave Chinner int level) 30330f712c9SDave Chinner { 30430f712c9SDave Chinner if (level == cur->bc_nlevels - 1) { 30530f712c9SDave Chinner struct xfs_ifork *ifp; 30630f712c9SDave Chinner 307732436efSDarrick J. Wong ifp = xfs_ifork_ptr(cur->bc_ino.ip, 30892219c29SDave Chinner cur->bc_ino.whichfork); 30930f712c9SDave Chinner 31030f712c9SDave Chinner return xfs_bmbt_maxrecs(cur->bc_mp, 31130f712c9SDave Chinner ifp->if_broot_bytes, level == 0); 31230f712c9SDave Chinner } 31330f712c9SDave Chinner 31430f712c9SDave Chinner return cur->bc_mp->m_bmap_dmxr[level != 0]; 31530f712c9SDave Chinner 31630f712c9SDave Chinner } 31730f712c9SDave Chinner 31830f712c9SDave Chinner /* 31930f712c9SDave Chinner * Get the maximum records we could store in the on-disk format. 32030f712c9SDave Chinner * 32130f712c9SDave Chinner * For non-root nodes this is equivalent to xfs_bmbt_get_maxrecs, but 32230f712c9SDave Chinner * for the root node this checks the available space in the dinode fork 32330f712c9SDave Chinner * so that we can resize the in-memory buffer to match it. After a 32430f712c9SDave Chinner * resize to the maximum size this function returns the same value 32530f712c9SDave Chinner * as xfs_bmbt_get_maxrecs for the root node, too. 32630f712c9SDave Chinner */ 32730f712c9SDave Chinner STATIC int 32830f712c9SDave Chinner xfs_bmbt_get_dmaxrecs( 32930f712c9SDave Chinner struct xfs_btree_cur *cur, 33030f712c9SDave Chinner int level) 33130f712c9SDave Chinner { 33230f712c9SDave Chinner if (level != cur->bc_nlevels - 1) 33330f712c9SDave Chinner return cur->bc_mp->m_bmap_dmxr[level != 0]; 33492219c29SDave Chinner return xfs_bmdr_maxrecs(cur->bc_ino.forksize, level == 0); 33530f712c9SDave Chinner } 33630f712c9SDave Chinner 33730f712c9SDave Chinner STATIC void 33830f712c9SDave Chinner xfs_bmbt_init_key_from_rec( 33930f712c9SDave Chinner union xfs_btree_key *key, 34023825cd1SDarrick J. Wong const union xfs_btree_rec *rec) 34130f712c9SDave Chinner { 34230f712c9SDave Chinner key->bmbt.br_startoff = 34330f712c9SDave Chinner cpu_to_be64(xfs_bmbt_disk_get_startoff(&rec->bmbt)); 34430f712c9SDave Chinner } 34530f712c9SDave Chinner 34630f712c9SDave Chinner STATIC void 347118bb47eSDarrick J. Wong xfs_bmbt_init_high_key_from_rec( 348118bb47eSDarrick J. Wong union xfs_btree_key *key, 34923825cd1SDarrick J. Wong const union xfs_btree_rec *rec) 350118bb47eSDarrick J. Wong { 351118bb47eSDarrick J. Wong key->bmbt.br_startoff = cpu_to_be64( 352118bb47eSDarrick J. Wong xfs_bmbt_disk_get_startoff(&rec->bmbt) + 353118bb47eSDarrick J. Wong xfs_bmbt_disk_get_blockcount(&rec->bmbt) - 1); 354118bb47eSDarrick J. Wong } 355118bb47eSDarrick J. Wong 356118bb47eSDarrick J. Wong STATIC void 35730f712c9SDave Chinner xfs_bmbt_init_rec_from_cur( 35830f712c9SDave Chinner struct xfs_btree_cur *cur, 35930f712c9SDave Chinner union xfs_btree_rec *rec) 36030f712c9SDave Chinner { 36130f712c9SDave Chinner xfs_bmbt_disk_set_all(&rec->bmbt, &cur->bc_rec.b); 36230f712c9SDave Chinner } 36330f712c9SDave Chinner 36430f712c9SDave Chinner STATIC void 36530f712c9SDave Chinner xfs_bmbt_init_ptr_from_cur( 36630f712c9SDave Chinner struct xfs_btree_cur *cur, 36730f712c9SDave Chinner union xfs_btree_ptr *ptr) 36830f712c9SDave Chinner { 36930f712c9SDave Chinner ptr->l = 0; 37030f712c9SDave Chinner } 37130f712c9SDave Chinner 372c8ce540dSDarrick J. Wong STATIC int64_t 37330f712c9SDave Chinner xfs_bmbt_key_diff( 37430f712c9SDave Chinner struct xfs_btree_cur *cur, 375d29d5577SDarrick J. Wong const union xfs_btree_key *key) 37630f712c9SDave Chinner { 377c8ce540dSDarrick J. Wong return (int64_t)be64_to_cpu(key->bmbt.br_startoff) - 37830f712c9SDave Chinner cur->bc_rec.b.br_startoff; 37930f712c9SDave Chinner } 38030f712c9SDave Chinner 381118bb47eSDarrick J. Wong STATIC int64_t 382118bb47eSDarrick J. Wong xfs_bmbt_diff_two_keys( 383118bb47eSDarrick J. Wong struct xfs_btree_cur *cur, 384d29d5577SDarrick J. Wong const union xfs_btree_key *k1, 385d29d5577SDarrick J. Wong const union xfs_btree_key *k2) 386118bb47eSDarrick J. Wong { 387b521c890SDarrick J. Wong uint64_t a = be64_to_cpu(k1->bmbt.br_startoff); 388b521c890SDarrick J. Wong uint64_t b = be64_to_cpu(k2->bmbt.br_startoff); 389b521c890SDarrick J. Wong 390b521c890SDarrick J. Wong /* 391b521c890SDarrick J. Wong * Note: This routine previously casted a and b to int64 and subtracted 392b521c890SDarrick J. Wong * them to generate a result. This lead to problems if b was the 393b521c890SDarrick J. Wong * "maximum" key value (all ones) being signed incorrectly, hence this 394b521c890SDarrick J. Wong * somewhat less efficient version. 395b521c890SDarrick J. Wong */ 396b521c890SDarrick J. Wong if (a > b) 397b521c890SDarrick J. Wong return 1; 398b521c890SDarrick J. Wong if (b > a) 399b521c890SDarrick J. Wong return -1; 400b521c890SDarrick J. Wong return 0; 401118bb47eSDarrick J. Wong } 402118bb47eSDarrick J. Wong 403a6a781a5SDarrick J. Wong static xfs_failaddr_t 40430f712c9SDave Chinner xfs_bmbt_verify( 40530f712c9SDave Chinner struct xfs_buf *bp) 40630f712c9SDave Chinner { 407dbd329f1SChristoph Hellwig struct xfs_mount *mp = bp->b_mount; 40830f712c9SDave Chinner struct xfs_btree_block *block = XFS_BUF_TO_BLOCK(bp); 409a6a781a5SDarrick J. Wong xfs_failaddr_t fa; 41030f712c9SDave Chinner unsigned int level; 41130f712c9SDave Chinner 41239708c20SBrian Foster if (!xfs_verify_magic(bp, block->bb_magic)) 41339708c20SBrian Foster return __this_address; 41439708c20SBrian Foster 415ebd9027dSDave Chinner if (xfs_has_crc(mp)) { 41630f712c9SDave Chinner /* 41730f712c9SDave Chinner * XXX: need a better way of verifying the owner here. Right now 41830f712c9SDave Chinner * just make sure there has been one set. 41930f712c9SDave Chinner */ 420a6a781a5SDarrick J. Wong fa = xfs_btree_lblock_v5hdr_verify(bp, XFS_RMAP_OWN_UNKNOWN); 421a6a781a5SDarrick J. Wong if (fa) 422a6a781a5SDarrick J. Wong return fa; 42330f712c9SDave Chinner } 42430f712c9SDave Chinner 42530f712c9SDave Chinner /* 42630f712c9SDave Chinner * numrecs and level verification. 42730f712c9SDave Chinner * 42830f712c9SDave Chinner * We don't know what fork we belong to, so just verify that the level 42930f712c9SDave Chinner * is less than the maximum of the two. Later checks will be more 43030f712c9SDave Chinner * precise. 43130f712c9SDave Chinner */ 43230f712c9SDave Chinner level = be16_to_cpu(block->bb_level); 43330f712c9SDave Chinner if (level > max(mp->m_bm_maxlevels[0], mp->m_bm_maxlevels[1])) 434a6a781a5SDarrick J. Wong return __this_address; 43530f712c9SDave Chinner 4368368a601SDarrick J. Wong return xfs_btree_lblock_verify(bp, mp->m_bmap_dmxr[level != 0]); 43730f712c9SDave Chinner } 43830f712c9SDave Chinner 43930f712c9SDave Chinner static void 44030f712c9SDave Chinner xfs_bmbt_read_verify( 44130f712c9SDave Chinner struct xfs_buf *bp) 44230f712c9SDave Chinner { 443bc1a09b8SDarrick J. Wong xfs_failaddr_t fa; 444bc1a09b8SDarrick J. Wong 44530f712c9SDave Chinner if (!xfs_btree_lblock_verify_crc(bp)) 446bc1a09b8SDarrick J. Wong xfs_verifier_error(bp, -EFSBADCRC, __this_address); 447bc1a09b8SDarrick J. Wong else { 448bc1a09b8SDarrick J. Wong fa = xfs_bmbt_verify(bp); 449bc1a09b8SDarrick J. Wong if (fa) 450bc1a09b8SDarrick J. Wong xfs_verifier_error(bp, -EFSCORRUPTED, fa); 451bc1a09b8SDarrick J. Wong } 45230f712c9SDave Chinner 45331ca03c9SDarrick J. Wong if (bp->b_error) 45430f712c9SDave Chinner trace_xfs_btree_corrupt(bp, _RET_IP_); 45530f712c9SDave Chinner } 45630f712c9SDave Chinner 45730f712c9SDave Chinner static void 45830f712c9SDave Chinner xfs_bmbt_write_verify( 45930f712c9SDave Chinner struct xfs_buf *bp) 46030f712c9SDave Chinner { 461bc1a09b8SDarrick J. Wong xfs_failaddr_t fa; 462bc1a09b8SDarrick J. Wong 463bc1a09b8SDarrick J. Wong fa = xfs_bmbt_verify(bp); 464bc1a09b8SDarrick J. Wong if (fa) { 46530f712c9SDave Chinner trace_xfs_btree_corrupt(bp, _RET_IP_); 466bc1a09b8SDarrick J. Wong xfs_verifier_error(bp, -EFSCORRUPTED, fa); 46730f712c9SDave Chinner return; 46830f712c9SDave Chinner } 46930f712c9SDave Chinner xfs_btree_lblock_calc_crc(bp); 47030f712c9SDave Chinner } 47130f712c9SDave Chinner 47230f712c9SDave Chinner const struct xfs_buf_ops xfs_bmbt_buf_ops = { 473233135b7SEric Sandeen .name = "xfs_bmbt", 47439708c20SBrian Foster .magic = { cpu_to_be32(XFS_BMAP_MAGIC), 47539708c20SBrian Foster cpu_to_be32(XFS_BMAP_CRC_MAGIC) }, 47630f712c9SDave Chinner .verify_read = xfs_bmbt_read_verify, 47730f712c9SDave Chinner .verify_write = xfs_bmbt_write_verify, 478b5572597SDarrick J. Wong .verify_struct = xfs_bmbt_verify, 47930f712c9SDave Chinner }; 48030f712c9SDave Chinner 48130f712c9SDave Chinner 48230f712c9SDave Chinner STATIC int 48330f712c9SDave Chinner xfs_bmbt_keys_inorder( 48430f712c9SDave Chinner struct xfs_btree_cur *cur, 4858e38dc88SDarrick J. Wong const union xfs_btree_key *k1, 4868e38dc88SDarrick J. Wong const union xfs_btree_key *k2) 48730f712c9SDave Chinner { 48830f712c9SDave Chinner return be64_to_cpu(k1->bmbt.br_startoff) < 48930f712c9SDave Chinner be64_to_cpu(k2->bmbt.br_startoff); 49030f712c9SDave Chinner } 49130f712c9SDave Chinner 49230f712c9SDave Chinner STATIC int 49330f712c9SDave Chinner xfs_bmbt_recs_inorder( 49430f712c9SDave Chinner struct xfs_btree_cur *cur, 4958e38dc88SDarrick J. Wong const union xfs_btree_rec *r1, 4968e38dc88SDarrick J. Wong const union xfs_btree_rec *r2) 49730f712c9SDave Chinner { 49830f712c9SDave Chinner return xfs_bmbt_disk_get_startoff(&r1->bmbt) + 49930f712c9SDave Chinner xfs_bmbt_disk_get_blockcount(&r1->bmbt) <= 50030f712c9SDave Chinner xfs_bmbt_disk_get_startoff(&r2->bmbt); 50130f712c9SDave Chinner } 50230f712c9SDave Chinner 503*6abc7aefSDarrick J. Wong STATIC enum xbtree_key_contig 504*6abc7aefSDarrick J. Wong xfs_bmbt_keys_contiguous( 505*6abc7aefSDarrick J. Wong struct xfs_btree_cur *cur, 506*6abc7aefSDarrick J. Wong const union xfs_btree_key *key1, 507*6abc7aefSDarrick J. Wong const union xfs_btree_key *key2) 508*6abc7aefSDarrick J. Wong { 509*6abc7aefSDarrick J. Wong return xbtree_key_contig(be64_to_cpu(key1->bmbt.br_startoff), 510*6abc7aefSDarrick J. Wong be64_to_cpu(key2->bmbt.br_startoff)); 511*6abc7aefSDarrick J. Wong } 512*6abc7aefSDarrick J. Wong 51330f712c9SDave Chinner static const struct xfs_btree_ops xfs_bmbt_ops = { 51430f712c9SDave Chinner .rec_len = sizeof(xfs_bmbt_rec_t), 51530f712c9SDave Chinner .key_len = sizeof(xfs_bmbt_key_t), 51630f712c9SDave Chinner 51730f712c9SDave Chinner .dup_cursor = xfs_bmbt_dup_cursor, 51830f712c9SDave Chinner .update_cursor = xfs_bmbt_update_cursor, 51930f712c9SDave Chinner .alloc_block = xfs_bmbt_alloc_block, 52030f712c9SDave Chinner .free_block = xfs_bmbt_free_block, 52130f712c9SDave Chinner .get_maxrecs = xfs_bmbt_get_maxrecs, 52230f712c9SDave Chinner .get_minrecs = xfs_bmbt_get_minrecs, 52330f712c9SDave Chinner .get_dmaxrecs = xfs_bmbt_get_dmaxrecs, 52430f712c9SDave Chinner .init_key_from_rec = xfs_bmbt_init_key_from_rec, 525118bb47eSDarrick J. Wong .init_high_key_from_rec = xfs_bmbt_init_high_key_from_rec, 52630f712c9SDave Chinner .init_rec_from_cur = xfs_bmbt_init_rec_from_cur, 52730f712c9SDave Chinner .init_ptr_from_cur = xfs_bmbt_init_ptr_from_cur, 52830f712c9SDave Chinner .key_diff = xfs_bmbt_key_diff, 529118bb47eSDarrick J. Wong .diff_two_keys = xfs_bmbt_diff_two_keys, 53030f712c9SDave Chinner .buf_ops = &xfs_bmbt_buf_ops, 53130f712c9SDave Chinner .keys_inorder = xfs_bmbt_keys_inorder, 53230f712c9SDave Chinner .recs_inorder = xfs_bmbt_recs_inorder, 533*6abc7aefSDarrick J. Wong .keys_contiguous = xfs_bmbt_keys_contiguous, 53430f712c9SDave Chinner }; 53530f712c9SDave Chinner 53630f712c9SDave Chinner /* 53730f712c9SDave Chinner * Allocate a new bmap btree cursor. 53830f712c9SDave Chinner */ 53930f712c9SDave Chinner struct xfs_btree_cur * /* new bmap btree cursor */ 54030f712c9SDave Chinner xfs_bmbt_init_cursor( 54130f712c9SDave Chinner struct xfs_mount *mp, /* file system mount point */ 54230f712c9SDave Chinner struct xfs_trans *tp, /* transaction pointer */ 54330f712c9SDave Chinner struct xfs_inode *ip, /* inode owning the btree */ 54430f712c9SDave Chinner int whichfork) /* data or attr fork */ 54530f712c9SDave Chinner { 546732436efSDarrick J. Wong struct xfs_ifork *ifp = xfs_ifork_ptr(ip, whichfork); 54730f712c9SDave Chinner struct xfs_btree_cur *cur; 5483993baebSDarrick J. Wong ASSERT(whichfork != XFS_COW_FORK); 54930f712c9SDave Chinner 550c940a0c5SDarrick J. Wong cur = xfs_btree_alloc_cursor(mp, tp, XFS_BTNUM_BMAP, 5519fa47bdcSDarrick J. Wong mp->m_bm_maxlevels[whichfork], xfs_bmbt_cur_cache); 55230f712c9SDave Chinner cur->bc_nlevels = be16_to_cpu(ifp->if_broot->bb_level) + 1; 55311ef38afSDave Chinner cur->bc_statoff = XFS_STATS_CALC_INDEX(xs_bmbt_2); 55430f712c9SDave Chinner 55530f712c9SDave Chinner cur->bc_ops = &xfs_bmbt_ops; 55630f712c9SDave Chinner cur->bc_flags = XFS_BTREE_LONG_PTRS | XFS_BTREE_ROOT_IN_INODE; 55738c26bfdSDave Chinner if (xfs_has_crc(mp)) 55830f712c9SDave Chinner cur->bc_flags |= XFS_BTREE_CRC_BLOCKS; 55930f712c9SDave Chinner 560c01147d9SDarrick J. Wong cur->bc_ino.forksize = xfs_inode_fork_size(ip, whichfork); 56192219c29SDave Chinner cur->bc_ino.ip = ip; 56292219c29SDave Chinner cur->bc_ino.allocated = 0; 56392219c29SDave Chinner cur->bc_ino.flags = 0; 56492219c29SDave Chinner cur->bc_ino.whichfork = whichfork; 56530f712c9SDave Chinner 56630f712c9SDave Chinner return cur; 56730f712c9SDave Chinner } 56830f712c9SDave Chinner 5690ed5f735SDarrick J. Wong /* Calculate number of records in a block mapping btree block. */ 5700ed5f735SDarrick J. Wong static inline unsigned int 5710ed5f735SDarrick J. Wong xfs_bmbt_block_maxrecs( 5720ed5f735SDarrick J. Wong unsigned int blocklen, 5730ed5f735SDarrick J. Wong bool leaf) 5740ed5f735SDarrick J. Wong { 5750ed5f735SDarrick J. Wong if (leaf) 5760ed5f735SDarrick J. Wong return blocklen / sizeof(xfs_bmbt_rec_t); 5770ed5f735SDarrick J. Wong return blocklen / (sizeof(xfs_bmbt_key_t) + sizeof(xfs_bmbt_ptr_t)); 5780ed5f735SDarrick J. Wong } 5790ed5f735SDarrick J. Wong 58030f712c9SDave Chinner /* 58130f712c9SDave Chinner * Calculate number of records in a bmap btree block. 58230f712c9SDave Chinner */ 58330f712c9SDave Chinner int 58430f712c9SDave Chinner xfs_bmbt_maxrecs( 58530f712c9SDave Chinner struct xfs_mount *mp, 58630f712c9SDave Chinner int blocklen, 58730f712c9SDave Chinner int leaf) 58830f712c9SDave Chinner { 58930f712c9SDave Chinner blocklen -= XFS_BMBT_BLOCK_LEN(mp); 5900ed5f735SDarrick J. Wong return xfs_bmbt_block_maxrecs(blocklen, leaf); 5910ed5f735SDarrick J. Wong } 59230f712c9SDave Chinner 593df9ad5ccSChandan Babu R /* 594df9ad5ccSChandan Babu R * Calculate the maximum possible height of the btree that the on-disk format 595df9ad5ccSChandan Babu R * supports. This is used for sizing structures large enough to support every 596df9ad5ccSChandan Babu R * possible configuration of a filesystem that might get mounted. 597df9ad5ccSChandan Babu R */ 5980ed5f735SDarrick J. Wong unsigned int 5990ed5f735SDarrick J. Wong xfs_bmbt_maxlevels_ondisk(void) 6000ed5f735SDarrick J. Wong { 6010ed5f735SDarrick J. Wong unsigned int minrecs[2]; 6020ed5f735SDarrick J. Wong unsigned int blocklen; 6030ed5f735SDarrick J. Wong 6040ed5f735SDarrick J. Wong blocklen = min(XFS_MIN_BLOCKSIZE - XFS_BTREE_SBLOCK_LEN, 6050ed5f735SDarrick J. Wong XFS_MIN_CRC_BLOCKSIZE - XFS_BTREE_SBLOCK_CRC_LEN); 6060ed5f735SDarrick J. Wong 6070ed5f735SDarrick J. Wong minrecs[0] = xfs_bmbt_block_maxrecs(blocklen, true) / 2; 6080ed5f735SDarrick J. Wong minrecs[1] = xfs_bmbt_block_maxrecs(blocklen, false) / 2; 6090ed5f735SDarrick J. Wong 6100ed5f735SDarrick J. Wong /* One extra level for the inode root. */ 611df9ad5ccSChandan Babu R return xfs_btree_compute_maxlevels(minrecs, 612df9ad5ccSChandan Babu R XFS_MAX_EXTCNT_DATA_FORK_LARGE) + 1; 61330f712c9SDave Chinner } 61430f712c9SDave Chinner 61530f712c9SDave Chinner /* 61630f712c9SDave Chinner * Calculate number of records in a bmap btree inode root. 61730f712c9SDave Chinner */ 61830f712c9SDave Chinner int 61930f712c9SDave Chinner xfs_bmdr_maxrecs( 62030f712c9SDave Chinner int blocklen, 62130f712c9SDave Chinner int leaf) 62230f712c9SDave Chinner { 62330f712c9SDave Chinner blocklen -= sizeof(xfs_bmdr_block_t); 62430f712c9SDave Chinner 62530f712c9SDave Chinner if (leaf) 62630f712c9SDave Chinner return blocklen / sizeof(xfs_bmdr_rec_t); 62730f712c9SDave Chinner return blocklen / (sizeof(xfs_bmdr_key_t) + sizeof(xfs_bmdr_ptr_t)); 62830f712c9SDave Chinner } 62930f712c9SDave Chinner 63030f712c9SDave Chinner /* 63130f712c9SDave Chinner * Change the owner of a btree format fork fo the inode passed in. Change it to 63230f712c9SDave Chinner * the owner of that is passed in so that we can change owners before or after 63330f712c9SDave Chinner * we switch forks between inodes. The operation that the caller is doing will 63430f712c9SDave Chinner * determine whether is needs to change owner before or after the switch. 63530f712c9SDave Chinner * 63630f712c9SDave Chinner * For demand paged transactional modification, the fork switch should be done 63730f712c9SDave Chinner * after reading in all the blocks, modifying them and pinning them in the 63830f712c9SDave Chinner * transaction. For modification when the buffers are already pinned in memory, 63930f712c9SDave Chinner * the fork switch can be done before changing the owner as we won't need to 64030f712c9SDave Chinner * validate the owner until the btree buffers are unpinned and writes can occur 64130f712c9SDave Chinner * again. 64230f712c9SDave Chinner * 64330f712c9SDave Chinner * For recovery based ownership change, there is no transactional context and 64430f712c9SDave Chinner * so a buffer list must be supplied so that we can record the buffers that we 64530f712c9SDave Chinner * modified for the caller to issue IO on. 64630f712c9SDave Chinner */ 64730f712c9SDave Chinner int 64830f712c9SDave Chinner xfs_bmbt_change_owner( 64930f712c9SDave Chinner struct xfs_trans *tp, 65030f712c9SDave Chinner struct xfs_inode *ip, 65130f712c9SDave Chinner int whichfork, 65230f712c9SDave Chinner xfs_ino_t new_owner, 65330f712c9SDave Chinner struct list_head *buffer_list) 65430f712c9SDave Chinner { 65530f712c9SDave Chinner struct xfs_btree_cur *cur; 65630f712c9SDave Chinner int error; 65730f712c9SDave Chinner 65830f712c9SDave Chinner ASSERT(tp || buffer_list); 65930f712c9SDave Chinner ASSERT(!(tp && buffer_list)); 660732436efSDarrick J. Wong ASSERT(xfs_ifork_ptr(ip, whichfork)->if_format == XFS_DINODE_FMT_BTREE); 66130f712c9SDave Chinner 66230f712c9SDave Chinner cur = xfs_bmbt_init_cursor(ip->i_mount, tp, ip, whichfork); 6638ef54797SDave Chinner cur->bc_ino.flags |= XFS_BTCUR_BMBT_INVALID_OWNER; 66430f712c9SDave Chinner 66530f712c9SDave Chinner error = xfs_btree_change_owner(cur, new_owner, buffer_list); 6660b04b6b8SDarrick J. Wong xfs_btree_del_cursor(cur, error); 66730f712c9SDave Chinner return error; 66830f712c9SDave Chinner } 66914861c47SDarrick J. Wong 67014861c47SDarrick J. Wong /* Calculate the bmap btree size for some records. */ 67114861c47SDarrick J. Wong unsigned long long 67214861c47SDarrick J. Wong xfs_bmbt_calc_size( 67314861c47SDarrick J. Wong struct xfs_mount *mp, 67414861c47SDarrick J. Wong unsigned long long len) 67514861c47SDarrick J. Wong { 67614861c47SDarrick J. Wong return xfs_btree_calc_size(mp->m_bmap_dmnr, len); 67714861c47SDarrick J. Wong } 6789fa47bdcSDarrick J. Wong 6799fa47bdcSDarrick J. Wong int __init 6809fa47bdcSDarrick J. Wong xfs_bmbt_init_cur_cache(void) 6819fa47bdcSDarrick J. Wong { 6829fa47bdcSDarrick J. Wong xfs_bmbt_cur_cache = kmem_cache_create("xfs_bmbt_cur", 6839fa47bdcSDarrick J. Wong xfs_btree_cur_sizeof(xfs_bmbt_maxlevels_ondisk()), 6849fa47bdcSDarrick J. Wong 0, 0, NULL); 6859fa47bdcSDarrick J. Wong 6869fa47bdcSDarrick J. Wong if (!xfs_bmbt_cur_cache) 6879fa47bdcSDarrick J. Wong return -ENOMEM; 6889fa47bdcSDarrick J. Wong return 0; 6899fa47bdcSDarrick J. Wong } 6909fa47bdcSDarrick J. Wong 6919fa47bdcSDarrick J. Wong void 6929fa47bdcSDarrick J. Wong xfs_bmbt_destroy_cur_cache(void) 6939fa47bdcSDarrick J. Wong { 6949fa47bdcSDarrick J. Wong kmem_cache_destroy(xfs_bmbt_cur_cache); 6959fa47bdcSDarrick J. Wong xfs_bmbt_cur_cache = NULL; 6969fa47bdcSDarrick J. Wong } 697