130f712c9SDave Chinner /* 230f712c9SDave Chinner * Copyright (c) 2000-2003,2005 Silicon Graphics, Inc. 330f712c9SDave Chinner * Copyright (c) 2013 Red Hat, Inc. 430f712c9SDave Chinner * All Rights Reserved. 530f712c9SDave Chinner * 630f712c9SDave Chinner * This program is free software; you can redistribute it and/or 730f712c9SDave Chinner * modify it under the terms of the GNU General Public License as 830f712c9SDave Chinner * published by the Free Software Foundation. 930f712c9SDave Chinner * 1030f712c9SDave Chinner * This program is distributed in the hope that it would be useful, 1130f712c9SDave Chinner * but WITHOUT ANY WARRANTY; without even the implied warranty of 1230f712c9SDave Chinner * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 1330f712c9SDave Chinner * GNU General Public License for more details. 1430f712c9SDave Chinner * 1530f712c9SDave Chinner * You should have received a copy of the GNU General Public License 1630f712c9SDave Chinner * along with this program; if not, write the Free Software Foundation, 1730f712c9SDave Chinner * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA 1830f712c9SDave Chinner */ 1930f712c9SDave Chinner #include "xfs.h" 2030f712c9SDave Chinner #include "xfs_fs.h" 2130f712c9SDave Chinner #include "xfs_format.h" 2230f712c9SDave Chinner #include "xfs_log_format.h" 2330f712c9SDave Chinner #include "xfs_trans_resv.h" 2430f712c9SDave Chinner #include "xfs_mount.h" 2530f712c9SDave Chinner #include "xfs_da_format.h" 2630f712c9SDave Chinner #include "xfs_da_btree.h" 2730f712c9SDave Chinner #include "xfs_inode.h" 2830f712c9SDave Chinner #include "xfs_bmap.h" 2930f712c9SDave Chinner #include "xfs_dir2.h" 3030f712c9SDave Chinner #include "xfs_dir2_priv.h" 3130f712c9SDave Chinner #include "xfs_error.h" 3230f712c9SDave Chinner #include "xfs_trace.h" 3330f712c9SDave Chinner #include "xfs_trans.h" 3430f712c9SDave Chinner #include "xfs_buf_item.h" 3530f712c9SDave Chinner #include "xfs_cksum.h" 36a45086e2SBrian Foster #include "xfs_log.h" 3730f712c9SDave Chinner 3830f712c9SDave Chinner /* 3930f712c9SDave Chinner * Local function declarations. 4030f712c9SDave Chinner */ 4130f712c9SDave Chinner static int xfs_dir2_leaf_lookup_int(xfs_da_args_t *args, struct xfs_buf **lbpp, 4230f712c9SDave Chinner int *indexp, struct xfs_buf **dbpp); 4330f712c9SDave Chinner static void xfs_dir3_leaf_log_bests(struct xfs_da_args *args, 4430f712c9SDave Chinner struct xfs_buf *bp, int first, int last); 4530f712c9SDave Chinner static void xfs_dir3_leaf_log_tail(struct xfs_da_args *args, 4630f712c9SDave Chinner struct xfs_buf *bp); 4730f712c9SDave Chinner 4830f712c9SDave Chinner /* 4930f712c9SDave Chinner * Check the internal consistency of a leaf1 block. 5030f712c9SDave Chinner * Pop an assert if something is wrong. 5130f712c9SDave Chinner */ 5230f712c9SDave Chinner #ifdef DEBUG 53a6a781a5SDarrick J. Wong static xfs_failaddr_t 5430f712c9SDave Chinner xfs_dir3_leaf1_check( 5530f712c9SDave Chinner struct xfs_inode *dp, 5630f712c9SDave Chinner struct xfs_buf *bp) 5730f712c9SDave Chinner { 5830f712c9SDave Chinner struct xfs_dir2_leaf *leaf = bp->b_addr; 5930f712c9SDave Chinner struct xfs_dir3_icleaf_hdr leafhdr; 6030f712c9SDave Chinner 6130f712c9SDave Chinner dp->d_ops->leaf_hdr_from_disk(&leafhdr, leaf); 6230f712c9SDave Chinner 6330f712c9SDave Chinner if (leafhdr.magic == XFS_DIR3_LEAF1_MAGIC) { 6430f712c9SDave Chinner struct xfs_dir3_leaf_hdr *leaf3 = bp->b_addr; 6530f712c9SDave Chinner if (be64_to_cpu(leaf3->info.blkno) != bp->b_bn) 66a6a781a5SDarrick J. Wong return __this_address; 6730f712c9SDave Chinner } else if (leafhdr.magic != XFS_DIR2_LEAF1_MAGIC) 68a6a781a5SDarrick J. Wong return __this_address; 6930f712c9SDave Chinner 7030f712c9SDave Chinner return xfs_dir3_leaf_check_int(dp->i_mount, dp, &leafhdr, leaf); 7130f712c9SDave Chinner } 72a6a781a5SDarrick J. Wong 73a6a781a5SDarrick J. Wong static inline void 74a6a781a5SDarrick J. Wong xfs_dir3_leaf_check( 75a6a781a5SDarrick J. Wong struct xfs_inode *dp, 76a6a781a5SDarrick J. Wong struct xfs_buf *bp) 77a6a781a5SDarrick J. Wong { 78a6a781a5SDarrick J. Wong xfs_failaddr_t fa; 79a6a781a5SDarrick J. Wong 80a6a781a5SDarrick J. Wong fa = xfs_dir3_leaf1_check(dp, bp); 81a6a781a5SDarrick J. Wong if (!fa) 82a6a781a5SDarrick J. Wong return; 83a6a781a5SDarrick J. Wong xfs_corruption_error(__func__, XFS_ERRLEVEL_LOW, dp->i_mount, 84a6a781a5SDarrick J. Wong bp->b_addr, __FILE__, __LINE__, fa); 85a6a781a5SDarrick J. Wong ASSERT(0); 86a6a781a5SDarrick J. Wong } 8730f712c9SDave Chinner #else 8830f712c9SDave Chinner #define xfs_dir3_leaf_check(dp, bp) 8930f712c9SDave Chinner #endif 9030f712c9SDave Chinner 91a6a781a5SDarrick J. Wong xfs_failaddr_t 9230f712c9SDave Chinner xfs_dir3_leaf_check_int( 9330f712c9SDave Chinner struct xfs_mount *mp, 9430f712c9SDave Chinner struct xfs_inode *dp, 9530f712c9SDave Chinner struct xfs_dir3_icleaf_hdr *hdr, 9630f712c9SDave Chinner struct xfs_dir2_leaf *leaf) 9730f712c9SDave Chinner { 9830f712c9SDave Chinner struct xfs_dir2_leaf_entry *ents; 9930f712c9SDave Chinner xfs_dir2_leaf_tail_t *ltp; 10030f712c9SDave Chinner int stale; 10130f712c9SDave Chinner int i; 10230f712c9SDave Chinner const struct xfs_dir_ops *ops; 10330f712c9SDave Chinner struct xfs_dir3_icleaf_hdr leafhdr; 10430f712c9SDave Chinner struct xfs_da_geometry *geo = mp->m_dir_geo; 10530f712c9SDave Chinner 10630f712c9SDave Chinner /* 10730f712c9SDave Chinner * we can be passed a null dp here from a verifier, so we need to go the 10830f712c9SDave Chinner * hard way to get them. 10930f712c9SDave Chinner */ 11030f712c9SDave Chinner ops = xfs_dir_get_ops(mp, dp); 11130f712c9SDave Chinner 11230f712c9SDave Chinner if (!hdr) { 11330f712c9SDave Chinner ops->leaf_hdr_from_disk(&leafhdr, leaf); 11430f712c9SDave Chinner hdr = &leafhdr; 11530f712c9SDave Chinner } 11630f712c9SDave Chinner 11730f712c9SDave Chinner ents = ops->leaf_ents_p(leaf); 11830f712c9SDave Chinner ltp = xfs_dir2_leaf_tail_p(geo, leaf); 11930f712c9SDave Chinner 12030f712c9SDave Chinner /* 12130f712c9SDave Chinner * XXX (dgc): This value is not restrictive enough. 12230f712c9SDave Chinner * Should factor in the size of the bests table as well. 12330f712c9SDave Chinner * We can deduce a value for that from di_size. 12430f712c9SDave Chinner */ 12530f712c9SDave Chinner if (hdr->count > ops->leaf_max_ents(geo)) 126a6a781a5SDarrick J. Wong return __this_address; 12730f712c9SDave Chinner 12830f712c9SDave Chinner /* Leaves and bests don't overlap in leaf format. */ 12930f712c9SDave Chinner if ((hdr->magic == XFS_DIR2_LEAF1_MAGIC || 13030f712c9SDave Chinner hdr->magic == XFS_DIR3_LEAF1_MAGIC) && 13130f712c9SDave Chinner (char *)&ents[hdr->count] > (char *)xfs_dir2_leaf_bests_p(ltp)) 132a6a781a5SDarrick J. Wong return __this_address; 13330f712c9SDave Chinner 13430f712c9SDave Chinner /* Check hash value order, count stale entries. */ 13530f712c9SDave Chinner for (i = stale = 0; i < hdr->count; i++) { 13630f712c9SDave Chinner if (i + 1 < hdr->count) { 13730f712c9SDave Chinner if (be32_to_cpu(ents[i].hashval) > 13830f712c9SDave Chinner be32_to_cpu(ents[i + 1].hashval)) 139a6a781a5SDarrick J. Wong return __this_address; 14030f712c9SDave Chinner } 14130f712c9SDave Chinner if (ents[i].address == cpu_to_be32(XFS_DIR2_NULL_DATAPTR)) 14230f712c9SDave Chinner stale++; 14330f712c9SDave Chinner } 14430f712c9SDave Chinner if (hdr->stale != stale) 145a6a781a5SDarrick J. Wong return __this_address; 146a6a781a5SDarrick J. Wong return NULL; 14730f712c9SDave Chinner } 14830f712c9SDave Chinner 14930f712c9SDave Chinner /* 15030f712c9SDave Chinner * We verify the magic numbers before decoding the leaf header so that on debug 15130f712c9SDave Chinner * kernels we don't get assertion failures in xfs_dir3_leaf_hdr_from_disk() due 15230f712c9SDave Chinner * to incorrect magic numbers. 15330f712c9SDave Chinner */ 154a6a781a5SDarrick J. Wong static xfs_failaddr_t 15530f712c9SDave Chinner xfs_dir3_leaf_verify( 15630f712c9SDave Chinner struct xfs_buf *bp, 157c8ce540dSDarrick J. Wong uint16_t magic) 15830f712c9SDave Chinner { 15930f712c9SDave Chinner struct xfs_mount *mp = bp->b_target->bt_mount; 16030f712c9SDave Chinner struct xfs_dir2_leaf *leaf = bp->b_addr; 16130f712c9SDave Chinner 16230f712c9SDave Chinner ASSERT(magic == XFS_DIR2_LEAF1_MAGIC || magic == XFS_DIR2_LEAFN_MAGIC); 16330f712c9SDave Chinner 16430f712c9SDave Chinner if (xfs_sb_version_hascrc(&mp->m_sb)) { 16530f712c9SDave Chinner struct xfs_dir3_leaf_hdr *leaf3 = bp->b_addr; 166c8ce540dSDarrick J. Wong uint16_t magic3; 16730f712c9SDave Chinner 16830f712c9SDave Chinner magic3 = (magic == XFS_DIR2_LEAF1_MAGIC) ? XFS_DIR3_LEAF1_MAGIC 16930f712c9SDave Chinner : XFS_DIR3_LEAFN_MAGIC; 17030f712c9SDave Chinner 17130f712c9SDave Chinner if (leaf3->info.hdr.magic != cpu_to_be16(magic3)) 172a6a781a5SDarrick J. Wong return __this_address; 173ce748eaaSEric Sandeen if (!uuid_equal(&leaf3->info.uuid, &mp->m_sb.sb_meta_uuid)) 174a6a781a5SDarrick J. Wong return __this_address; 17530f712c9SDave Chinner if (be64_to_cpu(leaf3->info.blkno) != bp->b_bn) 176a6a781a5SDarrick J. Wong return __this_address; 177a45086e2SBrian Foster if (!xfs_log_check_lsn(mp, be64_to_cpu(leaf3->info.lsn))) 178a6a781a5SDarrick J. Wong return __this_address; 17930f712c9SDave Chinner } else { 18030f712c9SDave Chinner if (leaf->hdr.info.magic != cpu_to_be16(magic)) 181a6a781a5SDarrick J. Wong return __this_address; 18230f712c9SDave Chinner } 18330f712c9SDave Chinner 18430f712c9SDave Chinner return xfs_dir3_leaf_check_int(mp, NULL, NULL, leaf); 18530f712c9SDave Chinner } 18630f712c9SDave Chinner 18730f712c9SDave Chinner static void 18830f712c9SDave Chinner __read_verify( 18930f712c9SDave Chinner struct xfs_buf *bp, 190c8ce540dSDarrick J. Wong uint16_t magic) 19130f712c9SDave Chinner { 19230f712c9SDave Chinner struct xfs_mount *mp = bp->b_target->bt_mount; 193bc1a09b8SDarrick J. Wong xfs_failaddr_t fa; 19430f712c9SDave Chinner 19530f712c9SDave Chinner if (xfs_sb_version_hascrc(&mp->m_sb) && 19630f712c9SDave Chinner !xfs_buf_verify_cksum(bp, XFS_DIR3_LEAF_CRC_OFF)) 197bc1a09b8SDarrick J. Wong xfs_verifier_error(bp, -EFSBADCRC, __this_address); 198bc1a09b8SDarrick J. Wong else { 199bc1a09b8SDarrick J. Wong fa = xfs_dir3_leaf_verify(bp, magic); 200bc1a09b8SDarrick J. Wong if (fa) 201bc1a09b8SDarrick J. Wong xfs_verifier_error(bp, -EFSCORRUPTED, fa); 202bc1a09b8SDarrick J. Wong } 20330f712c9SDave Chinner } 20430f712c9SDave Chinner 20530f712c9SDave Chinner static void 20630f712c9SDave Chinner __write_verify( 20730f712c9SDave Chinner struct xfs_buf *bp, 208c8ce540dSDarrick J. Wong uint16_t magic) 20930f712c9SDave Chinner { 21030f712c9SDave Chinner struct xfs_mount *mp = bp->b_target->bt_mount; 211fb1755a6SCarlos Maiolino struct xfs_buf_log_item *bip = bp->b_log_item; 21230f712c9SDave Chinner struct xfs_dir3_leaf_hdr *hdr3 = bp->b_addr; 213bc1a09b8SDarrick J. Wong xfs_failaddr_t fa; 21430f712c9SDave Chinner 215bc1a09b8SDarrick J. Wong fa = xfs_dir3_leaf_verify(bp, magic); 216bc1a09b8SDarrick J. Wong if (fa) { 217bc1a09b8SDarrick J. Wong xfs_verifier_error(bp, -EFSCORRUPTED, fa); 21830f712c9SDave Chinner return; 21930f712c9SDave Chinner } 22030f712c9SDave Chinner 22130f712c9SDave Chinner if (!xfs_sb_version_hascrc(&mp->m_sb)) 22230f712c9SDave Chinner return; 22330f712c9SDave Chinner 22430f712c9SDave Chinner if (bip) 22530f712c9SDave Chinner hdr3->info.lsn = cpu_to_be64(bip->bli_item.li_lsn); 22630f712c9SDave Chinner 22730f712c9SDave Chinner xfs_buf_update_cksum(bp, XFS_DIR3_LEAF_CRC_OFF); 22830f712c9SDave Chinner } 22930f712c9SDave Chinner 230b5572597SDarrick J. Wong static xfs_failaddr_t 231b5572597SDarrick J. Wong xfs_dir3_leaf1_verify( 232b5572597SDarrick J. Wong struct xfs_buf *bp) 233b5572597SDarrick J. Wong { 234b5572597SDarrick J. Wong return xfs_dir3_leaf_verify(bp, XFS_DIR2_LEAF1_MAGIC); 235b5572597SDarrick J. Wong } 236b5572597SDarrick J. Wong 23730f712c9SDave Chinner static void 23830f712c9SDave Chinner xfs_dir3_leaf1_read_verify( 23930f712c9SDave Chinner struct xfs_buf *bp) 24030f712c9SDave Chinner { 24130f712c9SDave Chinner __read_verify(bp, XFS_DIR2_LEAF1_MAGIC); 24230f712c9SDave Chinner } 24330f712c9SDave Chinner 24430f712c9SDave Chinner static void 24530f712c9SDave Chinner xfs_dir3_leaf1_write_verify( 24630f712c9SDave Chinner struct xfs_buf *bp) 24730f712c9SDave Chinner { 24830f712c9SDave Chinner __write_verify(bp, XFS_DIR2_LEAF1_MAGIC); 24930f712c9SDave Chinner } 25030f712c9SDave Chinner 251b5572597SDarrick J. Wong static xfs_failaddr_t 252b5572597SDarrick J. Wong xfs_dir3_leafn_verify( 253b5572597SDarrick J. Wong struct xfs_buf *bp) 254b5572597SDarrick J. Wong { 255b5572597SDarrick J. Wong return xfs_dir3_leaf_verify(bp, XFS_DIR2_LEAFN_MAGIC); 256b5572597SDarrick J. Wong } 257b5572597SDarrick J. Wong 25830f712c9SDave Chinner static void 25930f712c9SDave Chinner xfs_dir3_leafn_read_verify( 26030f712c9SDave Chinner struct xfs_buf *bp) 26130f712c9SDave Chinner { 26230f712c9SDave Chinner __read_verify(bp, XFS_DIR2_LEAFN_MAGIC); 26330f712c9SDave Chinner } 26430f712c9SDave Chinner 26530f712c9SDave Chinner static void 26630f712c9SDave Chinner xfs_dir3_leafn_write_verify( 26730f712c9SDave Chinner struct xfs_buf *bp) 26830f712c9SDave Chinner { 26930f712c9SDave Chinner __write_verify(bp, XFS_DIR2_LEAFN_MAGIC); 27030f712c9SDave Chinner } 27130f712c9SDave Chinner 27230f712c9SDave Chinner const struct xfs_buf_ops xfs_dir3_leaf1_buf_ops = { 273233135b7SEric Sandeen .name = "xfs_dir3_leaf1", 27430f712c9SDave Chinner .verify_read = xfs_dir3_leaf1_read_verify, 27530f712c9SDave Chinner .verify_write = xfs_dir3_leaf1_write_verify, 276b5572597SDarrick J. Wong .verify_struct = xfs_dir3_leaf1_verify, 27730f712c9SDave Chinner }; 27830f712c9SDave Chinner 27930f712c9SDave Chinner const struct xfs_buf_ops xfs_dir3_leafn_buf_ops = { 280233135b7SEric Sandeen .name = "xfs_dir3_leafn", 28130f712c9SDave Chinner .verify_read = xfs_dir3_leafn_read_verify, 28230f712c9SDave Chinner .verify_write = xfs_dir3_leafn_write_verify, 283b5572597SDarrick J. Wong .verify_struct = xfs_dir3_leafn_verify, 28430f712c9SDave Chinner }; 28530f712c9SDave Chinner 28626788097SDarrick J. Wong int 28730f712c9SDave Chinner xfs_dir3_leaf_read( 28830f712c9SDave Chinner struct xfs_trans *tp, 28930f712c9SDave Chinner struct xfs_inode *dp, 29030f712c9SDave Chinner xfs_dablk_t fbno, 29130f712c9SDave Chinner xfs_daddr_t mappedbno, 29230f712c9SDave Chinner struct xfs_buf **bpp) 29330f712c9SDave Chinner { 29430f712c9SDave Chinner int err; 29530f712c9SDave Chinner 29630f712c9SDave Chinner err = xfs_da_read_buf(tp, dp, fbno, mappedbno, bpp, 29730f712c9SDave Chinner XFS_DATA_FORK, &xfs_dir3_leaf1_buf_ops); 298cd87d867SDarrick J. Wong if (!err && tp && *bpp) 29930f712c9SDave Chinner xfs_trans_buf_set_type(tp, *bpp, XFS_BLFT_DIR_LEAF1_BUF); 30030f712c9SDave Chinner return err; 30130f712c9SDave Chinner } 30230f712c9SDave Chinner 30330f712c9SDave Chinner int 30430f712c9SDave Chinner xfs_dir3_leafn_read( 30530f712c9SDave Chinner struct xfs_trans *tp, 30630f712c9SDave Chinner struct xfs_inode *dp, 30730f712c9SDave Chinner xfs_dablk_t fbno, 30830f712c9SDave Chinner xfs_daddr_t mappedbno, 30930f712c9SDave Chinner struct xfs_buf **bpp) 31030f712c9SDave Chinner { 31130f712c9SDave Chinner int err; 31230f712c9SDave Chinner 31330f712c9SDave Chinner err = xfs_da_read_buf(tp, dp, fbno, mappedbno, bpp, 31430f712c9SDave Chinner XFS_DATA_FORK, &xfs_dir3_leafn_buf_ops); 315cd87d867SDarrick J. Wong if (!err && tp && *bpp) 31630f712c9SDave Chinner xfs_trans_buf_set_type(tp, *bpp, XFS_BLFT_DIR_LEAFN_BUF); 31730f712c9SDave Chinner return err; 31830f712c9SDave Chinner } 31930f712c9SDave Chinner 32030f712c9SDave Chinner /* 32130f712c9SDave Chinner * Initialize a new leaf block, leaf1 or leafn magic accepted. 32230f712c9SDave Chinner */ 32330f712c9SDave Chinner static void 32430f712c9SDave Chinner xfs_dir3_leaf_init( 32530f712c9SDave Chinner struct xfs_mount *mp, 32630f712c9SDave Chinner struct xfs_trans *tp, 32730f712c9SDave Chinner struct xfs_buf *bp, 32830f712c9SDave Chinner xfs_ino_t owner, 329c8ce540dSDarrick J. Wong uint16_t type) 33030f712c9SDave Chinner { 33130f712c9SDave Chinner struct xfs_dir2_leaf *leaf = bp->b_addr; 33230f712c9SDave Chinner 33330f712c9SDave Chinner ASSERT(type == XFS_DIR2_LEAF1_MAGIC || type == XFS_DIR2_LEAFN_MAGIC); 33430f712c9SDave Chinner 33530f712c9SDave Chinner if (xfs_sb_version_hascrc(&mp->m_sb)) { 33630f712c9SDave Chinner struct xfs_dir3_leaf_hdr *leaf3 = bp->b_addr; 33730f712c9SDave Chinner 33830f712c9SDave Chinner memset(leaf3, 0, sizeof(*leaf3)); 33930f712c9SDave Chinner 34030f712c9SDave Chinner leaf3->info.hdr.magic = (type == XFS_DIR2_LEAF1_MAGIC) 34130f712c9SDave Chinner ? cpu_to_be16(XFS_DIR3_LEAF1_MAGIC) 34230f712c9SDave Chinner : cpu_to_be16(XFS_DIR3_LEAFN_MAGIC); 34330f712c9SDave Chinner leaf3->info.blkno = cpu_to_be64(bp->b_bn); 34430f712c9SDave Chinner leaf3->info.owner = cpu_to_be64(owner); 345ce748eaaSEric Sandeen uuid_copy(&leaf3->info.uuid, &mp->m_sb.sb_meta_uuid); 34630f712c9SDave Chinner } else { 34730f712c9SDave Chinner memset(leaf, 0, sizeof(*leaf)); 34830f712c9SDave Chinner leaf->hdr.info.magic = cpu_to_be16(type); 34930f712c9SDave Chinner } 35030f712c9SDave Chinner 35130f712c9SDave Chinner /* 35230f712c9SDave Chinner * If it's a leaf-format directory initialize the tail. 35330f712c9SDave Chinner * Caller is responsible for initialising the bests table. 35430f712c9SDave Chinner */ 35530f712c9SDave Chinner if (type == XFS_DIR2_LEAF1_MAGIC) { 35630f712c9SDave Chinner struct xfs_dir2_leaf_tail *ltp; 35730f712c9SDave Chinner 35830f712c9SDave Chinner ltp = xfs_dir2_leaf_tail_p(mp->m_dir_geo, leaf); 35930f712c9SDave Chinner ltp->bestcount = 0; 36030f712c9SDave Chinner bp->b_ops = &xfs_dir3_leaf1_buf_ops; 36130f712c9SDave Chinner xfs_trans_buf_set_type(tp, bp, XFS_BLFT_DIR_LEAF1_BUF); 36230f712c9SDave Chinner } else { 36330f712c9SDave Chinner bp->b_ops = &xfs_dir3_leafn_buf_ops; 36430f712c9SDave Chinner xfs_trans_buf_set_type(tp, bp, XFS_BLFT_DIR_LEAFN_BUF); 36530f712c9SDave Chinner } 36630f712c9SDave Chinner } 36730f712c9SDave Chinner 36830f712c9SDave Chinner int 36930f712c9SDave Chinner xfs_dir3_leaf_get_buf( 37030f712c9SDave Chinner xfs_da_args_t *args, 37130f712c9SDave Chinner xfs_dir2_db_t bno, 37230f712c9SDave Chinner struct xfs_buf **bpp, 373c8ce540dSDarrick J. Wong uint16_t magic) 37430f712c9SDave Chinner { 37530f712c9SDave Chinner struct xfs_inode *dp = args->dp; 37630f712c9SDave Chinner struct xfs_trans *tp = args->trans; 37730f712c9SDave Chinner struct xfs_mount *mp = dp->i_mount; 37830f712c9SDave Chinner struct xfs_buf *bp; 37930f712c9SDave Chinner int error; 38030f712c9SDave Chinner 38130f712c9SDave Chinner ASSERT(magic == XFS_DIR2_LEAF1_MAGIC || magic == XFS_DIR2_LEAFN_MAGIC); 38230f712c9SDave Chinner ASSERT(bno >= xfs_dir2_byte_to_db(args->geo, XFS_DIR2_LEAF_OFFSET) && 38330f712c9SDave Chinner bno < xfs_dir2_byte_to_db(args->geo, XFS_DIR2_FREE_OFFSET)); 38430f712c9SDave Chinner 38530f712c9SDave Chinner error = xfs_da_get_buf(tp, dp, xfs_dir2_db_to_da(args->geo, bno), 38630f712c9SDave Chinner -1, &bp, XFS_DATA_FORK); 38730f712c9SDave Chinner if (error) 38830f712c9SDave Chinner return error; 38930f712c9SDave Chinner 39030f712c9SDave Chinner xfs_dir3_leaf_init(mp, tp, bp, dp->i_ino, magic); 39130f712c9SDave Chinner xfs_dir3_leaf_log_header(args, bp); 39230f712c9SDave Chinner if (magic == XFS_DIR2_LEAF1_MAGIC) 39330f712c9SDave Chinner xfs_dir3_leaf_log_tail(args, bp); 39430f712c9SDave Chinner *bpp = bp; 39530f712c9SDave Chinner return 0; 39630f712c9SDave Chinner } 39730f712c9SDave Chinner 39830f712c9SDave Chinner /* 39930f712c9SDave Chinner * Convert a block form directory to a leaf form directory. 40030f712c9SDave Chinner */ 40130f712c9SDave Chinner int /* error */ 40230f712c9SDave Chinner xfs_dir2_block_to_leaf( 40330f712c9SDave Chinner xfs_da_args_t *args, /* operation arguments */ 40430f712c9SDave Chinner struct xfs_buf *dbp) /* input block's buffer */ 40530f712c9SDave Chinner { 40630f712c9SDave Chinner __be16 *bestsp; /* leaf's bestsp entries */ 40730f712c9SDave Chinner xfs_dablk_t blkno; /* leaf block's bno */ 40830f712c9SDave Chinner xfs_dir2_data_hdr_t *hdr; /* block header */ 40930f712c9SDave Chinner xfs_dir2_leaf_entry_t *blp; /* block's leaf entries */ 41030f712c9SDave Chinner xfs_dir2_block_tail_t *btp; /* block's tail */ 41130f712c9SDave Chinner xfs_inode_t *dp; /* incore directory inode */ 41230f712c9SDave Chinner int error; /* error return code */ 41330f712c9SDave Chinner struct xfs_buf *lbp; /* leaf block's buffer */ 41430f712c9SDave Chinner xfs_dir2_db_t ldb; /* leaf block's bno */ 41530f712c9SDave Chinner xfs_dir2_leaf_t *leaf; /* leaf structure */ 41630f712c9SDave Chinner xfs_dir2_leaf_tail_t *ltp; /* leaf's tail */ 41730f712c9SDave Chinner int needlog; /* need to log block header */ 41830f712c9SDave Chinner int needscan; /* need to rescan bestfree */ 41930f712c9SDave Chinner xfs_trans_t *tp; /* transaction pointer */ 42030f712c9SDave Chinner struct xfs_dir2_data_free *bf; 42130f712c9SDave Chinner struct xfs_dir2_leaf_entry *ents; 42230f712c9SDave Chinner struct xfs_dir3_icleaf_hdr leafhdr; 42330f712c9SDave Chinner 42430f712c9SDave Chinner trace_xfs_dir2_block_to_leaf(args); 42530f712c9SDave Chinner 42630f712c9SDave Chinner dp = args->dp; 42730f712c9SDave Chinner tp = args->trans; 42830f712c9SDave Chinner /* 42930f712c9SDave Chinner * Add the leaf block to the inode. 43030f712c9SDave Chinner * This interface will only put blocks in the leaf/node range. 43130f712c9SDave Chinner * Since that's empty now, we'll get the root (block 0 in range). 43230f712c9SDave Chinner */ 43330f712c9SDave Chinner if ((error = xfs_da_grow_inode(args, &blkno))) { 43430f712c9SDave Chinner return error; 43530f712c9SDave Chinner } 43630f712c9SDave Chinner ldb = xfs_dir2_da_to_db(args->geo, blkno); 43730f712c9SDave Chinner ASSERT(ldb == xfs_dir2_byte_to_db(args->geo, XFS_DIR2_LEAF_OFFSET)); 43830f712c9SDave Chinner /* 43930f712c9SDave Chinner * Initialize the leaf block, get a buffer for it. 44030f712c9SDave Chinner */ 44130f712c9SDave Chinner error = xfs_dir3_leaf_get_buf(args, ldb, &lbp, XFS_DIR2_LEAF1_MAGIC); 44230f712c9SDave Chinner if (error) 44330f712c9SDave Chinner return error; 44430f712c9SDave Chinner 44530f712c9SDave Chinner leaf = lbp->b_addr; 44630f712c9SDave Chinner hdr = dbp->b_addr; 44730f712c9SDave Chinner xfs_dir3_data_check(dp, dbp); 44830f712c9SDave Chinner btp = xfs_dir2_block_tail_p(args->geo, hdr); 44930f712c9SDave Chinner blp = xfs_dir2_block_leaf_p(btp); 45030f712c9SDave Chinner bf = dp->d_ops->data_bestfree_p(hdr); 45130f712c9SDave Chinner ents = dp->d_ops->leaf_ents_p(leaf); 45230f712c9SDave Chinner 45330f712c9SDave Chinner /* 45430f712c9SDave Chinner * Set the counts in the leaf header. 45530f712c9SDave Chinner */ 45630f712c9SDave Chinner dp->d_ops->leaf_hdr_from_disk(&leafhdr, leaf); 45730f712c9SDave Chinner leafhdr.count = be32_to_cpu(btp->count); 45830f712c9SDave Chinner leafhdr.stale = be32_to_cpu(btp->stale); 45930f712c9SDave Chinner dp->d_ops->leaf_hdr_to_disk(leaf, &leafhdr); 46030f712c9SDave Chinner xfs_dir3_leaf_log_header(args, lbp); 46130f712c9SDave Chinner 46230f712c9SDave Chinner /* 46330f712c9SDave Chinner * Could compact these but I think we always do the conversion 46430f712c9SDave Chinner * after squeezing out stale entries. 46530f712c9SDave Chinner */ 46630f712c9SDave Chinner memcpy(ents, blp, be32_to_cpu(btp->count) * sizeof(xfs_dir2_leaf_entry_t)); 46730f712c9SDave Chinner xfs_dir3_leaf_log_ents(args, lbp, 0, leafhdr.count - 1); 46830f712c9SDave Chinner needscan = 0; 46930f712c9SDave Chinner needlog = 1; 47030f712c9SDave Chinner /* 47130f712c9SDave Chinner * Make the space formerly occupied by the leaf entries and block 47230f712c9SDave Chinner * tail be free. 47330f712c9SDave Chinner */ 47430f712c9SDave Chinner xfs_dir2_data_make_free(args, dbp, 47530f712c9SDave Chinner (xfs_dir2_data_aoff_t)((char *)blp - (char *)hdr), 47630f712c9SDave Chinner (xfs_dir2_data_aoff_t)((char *)hdr + args->geo->blksize - 47730f712c9SDave Chinner (char *)blp), 47830f712c9SDave Chinner &needlog, &needscan); 47930f712c9SDave Chinner /* 48030f712c9SDave Chinner * Fix up the block header, make it a data block. 48130f712c9SDave Chinner */ 48230f712c9SDave Chinner dbp->b_ops = &xfs_dir3_data_buf_ops; 48330f712c9SDave Chinner xfs_trans_buf_set_type(tp, dbp, XFS_BLFT_DIR_DATA_BUF); 48430f712c9SDave Chinner if (hdr->magic == cpu_to_be32(XFS_DIR2_BLOCK_MAGIC)) 48530f712c9SDave Chinner hdr->magic = cpu_to_be32(XFS_DIR2_DATA_MAGIC); 48630f712c9SDave Chinner else 48730f712c9SDave Chinner hdr->magic = cpu_to_be32(XFS_DIR3_DATA_MAGIC); 48830f712c9SDave Chinner 48930f712c9SDave Chinner if (needscan) 49030f712c9SDave Chinner xfs_dir2_data_freescan(dp, hdr, &needlog); 49130f712c9SDave Chinner /* 49230f712c9SDave Chinner * Set up leaf tail and bests table. 49330f712c9SDave Chinner */ 49430f712c9SDave Chinner ltp = xfs_dir2_leaf_tail_p(args->geo, leaf); 49530f712c9SDave Chinner ltp->bestcount = cpu_to_be32(1); 49630f712c9SDave Chinner bestsp = xfs_dir2_leaf_bests_p(ltp); 49730f712c9SDave Chinner bestsp[0] = bf[0].length; 49830f712c9SDave Chinner /* 49930f712c9SDave Chinner * Log the data header and leaf bests table. 50030f712c9SDave Chinner */ 50130f712c9SDave Chinner if (needlog) 50230f712c9SDave Chinner xfs_dir2_data_log_header(args, dbp); 50330f712c9SDave Chinner xfs_dir3_leaf_check(dp, lbp); 50430f712c9SDave Chinner xfs_dir3_data_check(dp, dbp); 50530f712c9SDave Chinner xfs_dir3_leaf_log_bests(args, lbp, 0, 0); 50630f712c9SDave Chinner return 0; 50730f712c9SDave Chinner } 50830f712c9SDave Chinner 50930f712c9SDave Chinner STATIC void 51030f712c9SDave Chinner xfs_dir3_leaf_find_stale( 51130f712c9SDave Chinner struct xfs_dir3_icleaf_hdr *leafhdr, 51230f712c9SDave Chinner struct xfs_dir2_leaf_entry *ents, 51330f712c9SDave Chinner int index, 51430f712c9SDave Chinner int *lowstale, 51530f712c9SDave Chinner int *highstale) 51630f712c9SDave Chinner { 51730f712c9SDave Chinner /* 51830f712c9SDave Chinner * Find the first stale entry before our index, if any. 51930f712c9SDave Chinner */ 52030f712c9SDave Chinner for (*lowstale = index - 1; *lowstale >= 0; --*lowstale) { 52130f712c9SDave Chinner if (ents[*lowstale].address == 52230f712c9SDave Chinner cpu_to_be32(XFS_DIR2_NULL_DATAPTR)) 52330f712c9SDave Chinner break; 52430f712c9SDave Chinner } 52530f712c9SDave Chinner 52630f712c9SDave Chinner /* 52730f712c9SDave Chinner * Find the first stale entry at or after our index, if any. 52830f712c9SDave Chinner * Stop if the result would require moving more entries than using 52930f712c9SDave Chinner * lowstale. 53030f712c9SDave Chinner */ 53130f712c9SDave Chinner for (*highstale = index; *highstale < leafhdr->count; ++*highstale) { 53230f712c9SDave Chinner if (ents[*highstale].address == 53330f712c9SDave Chinner cpu_to_be32(XFS_DIR2_NULL_DATAPTR)) 53430f712c9SDave Chinner break; 53530f712c9SDave Chinner if (*lowstale >= 0 && index - *lowstale <= *highstale - index) 53630f712c9SDave Chinner break; 53730f712c9SDave Chinner } 53830f712c9SDave Chinner } 53930f712c9SDave Chinner 54030f712c9SDave Chinner struct xfs_dir2_leaf_entry * 54130f712c9SDave Chinner xfs_dir3_leaf_find_entry( 54230f712c9SDave Chinner struct xfs_dir3_icleaf_hdr *leafhdr, 54330f712c9SDave Chinner struct xfs_dir2_leaf_entry *ents, 54430f712c9SDave Chinner int index, /* leaf table position */ 54530f712c9SDave Chinner int compact, /* need to compact leaves */ 54630f712c9SDave Chinner int lowstale, /* index of prev stale leaf */ 54730f712c9SDave Chinner int highstale, /* index of next stale leaf */ 54830f712c9SDave Chinner int *lfloglow, /* low leaf logging index */ 54930f712c9SDave Chinner int *lfloghigh) /* high leaf logging index */ 55030f712c9SDave Chinner { 55130f712c9SDave Chinner if (!leafhdr->stale) { 55230f712c9SDave Chinner xfs_dir2_leaf_entry_t *lep; /* leaf entry table pointer */ 55330f712c9SDave Chinner 55430f712c9SDave Chinner /* 55530f712c9SDave Chinner * Now we need to make room to insert the leaf entry. 55630f712c9SDave Chinner * 55730f712c9SDave Chinner * If there are no stale entries, just insert a hole at index. 55830f712c9SDave Chinner */ 55930f712c9SDave Chinner lep = &ents[index]; 56030f712c9SDave Chinner if (index < leafhdr->count) 56130f712c9SDave Chinner memmove(lep + 1, lep, 56230f712c9SDave Chinner (leafhdr->count - index) * sizeof(*lep)); 56330f712c9SDave Chinner 56430f712c9SDave Chinner /* 56530f712c9SDave Chinner * Record low and high logging indices for the leaf. 56630f712c9SDave Chinner */ 56730f712c9SDave Chinner *lfloglow = index; 56830f712c9SDave Chinner *lfloghigh = leafhdr->count++; 56930f712c9SDave Chinner return lep; 57030f712c9SDave Chinner } 57130f712c9SDave Chinner 57230f712c9SDave Chinner /* 57330f712c9SDave Chinner * There are stale entries. 57430f712c9SDave Chinner * 57530f712c9SDave Chinner * We will use one of them for the new entry. It's probably not at 57630f712c9SDave Chinner * the right location, so we'll have to shift some up or down first. 57730f712c9SDave Chinner * 57830f712c9SDave Chinner * If we didn't compact before, we need to find the nearest stale 57930f712c9SDave Chinner * entries before and after our insertion point. 58030f712c9SDave Chinner */ 58130f712c9SDave Chinner if (compact == 0) 58230f712c9SDave Chinner xfs_dir3_leaf_find_stale(leafhdr, ents, index, 58330f712c9SDave Chinner &lowstale, &highstale); 58430f712c9SDave Chinner 58530f712c9SDave Chinner /* 58630f712c9SDave Chinner * If the low one is better, use it. 58730f712c9SDave Chinner */ 58830f712c9SDave Chinner if (lowstale >= 0 && 58930f712c9SDave Chinner (highstale == leafhdr->count || 59030f712c9SDave Chinner index - lowstale - 1 < highstale - index)) { 59130f712c9SDave Chinner ASSERT(index - lowstale - 1 >= 0); 59230f712c9SDave Chinner ASSERT(ents[lowstale].address == 59330f712c9SDave Chinner cpu_to_be32(XFS_DIR2_NULL_DATAPTR)); 59430f712c9SDave Chinner 59530f712c9SDave Chinner /* 59630f712c9SDave Chinner * Copy entries up to cover the stale entry and make room 59730f712c9SDave Chinner * for the new entry. 59830f712c9SDave Chinner */ 59930f712c9SDave Chinner if (index - lowstale - 1 > 0) { 60030f712c9SDave Chinner memmove(&ents[lowstale], &ents[lowstale + 1], 60130f712c9SDave Chinner (index - lowstale - 1) * 60230f712c9SDave Chinner sizeof(xfs_dir2_leaf_entry_t)); 60330f712c9SDave Chinner } 60430f712c9SDave Chinner *lfloglow = MIN(lowstale, *lfloglow); 60530f712c9SDave Chinner *lfloghigh = MAX(index - 1, *lfloghigh); 60630f712c9SDave Chinner leafhdr->stale--; 60730f712c9SDave Chinner return &ents[index - 1]; 60830f712c9SDave Chinner } 60930f712c9SDave Chinner 61030f712c9SDave Chinner /* 61130f712c9SDave Chinner * The high one is better, so use that one. 61230f712c9SDave Chinner */ 61330f712c9SDave Chinner ASSERT(highstale - index >= 0); 61430f712c9SDave Chinner ASSERT(ents[highstale].address == cpu_to_be32(XFS_DIR2_NULL_DATAPTR)); 61530f712c9SDave Chinner 61630f712c9SDave Chinner /* 61730f712c9SDave Chinner * Copy entries down to cover the stale entry and make room for the 61830f712c9SDave Chinner * new entry. 61930f712c9SDave Chinner */ 62030f712c9SDave Chinner if (highstale - index > 0) { 62130f712c9SDave Chinner memmove(&ents[index + 1], &ents[index], 62230f712c9SDave Chinner (highstale - index) * sizeof(xfs_dir2_leaf_entry_t)); 62330f712c9SDave Chinner } 62430f712c9SDave Chinner *lfloglow = MIN(index, *lfloglow); 62530f712c9SDave Chinner *lfloghigh = MAX(highstale, *lfloghigh); 62630f712c9SDave Chinner leafhdr->stale--; 62730f712c9SDave Chinner return &ents[index]; 62830f712c9SDave Chinner } 62930f712c9SDave Chinner 63030f712c9SDave Chinner /* 63130f712c9SDave Chinner * Add an entry to a leaf form directory. 63230f712c9SDave Chinner */ 63330f712c9SDave Chinner int /* error */ 63430f712c9SDave Chinner xfs_dir2_leaf_addname( 63530f712c9SDave Chinner xfs_da_args_t *args) /* operation arguments */ 63630f712c9SDave Chinner { 63730f712c9SDave Chinner __be16 *bestsp; /* freespace table in leaf */ 63830f712c9SDave Chinner int compact; /* need to compact leaves */ 63930f712c9SDave Chinner xfs_dir2_data_hdr_t *hdr; /* data block header */ 64030f712c9SDave Chinner struct xfs_buf *dbp; /* data block buffer */ 64130f712c9SDave Chinner xfs_dir2_data_entry_t *dep; /* data block entry */ 64230f712c9SDave Chinner xfs_inode_t *dp; /* incore directory inode */ 64330f712c9SDave Chinner xfs_dir2_data_unused_t *dup; /* data unused entry */ 64430f712c9SDave Chinner int error; /* error return value */ 64530f712c9SDave Chinner int grown; /* allocated new data block */ 64630f712c9SDave Chinner int highstale; /* index of next stale leaf */ 64730f712c9SDave Chinner int i; /* temporary, index */ 64830f712c9SDave Chinner int index; /* leaf table position */ 64930f712c9SDave Chinner struct xfs_buf *lbp; /* leaf's buffer */ 65030f712c9SDave Chinner xfs_dir2_leaf_t *leaf; /* leaf structure */ 65130f712c9SDave Chinner int length; /* length of new entry */ 65230f712c9SDave Chinner xfs_dir2_leaf_entry_t *lep; /* leaf entry table pointer */ 65330f712c9SDave Chinner int lfloglow; /* low leaf logging index */ 65430f712c9SDave Chinner int lfloghigh; /* high leaf logging index */ 65530f712c9SDave Chinner int lowstale; /* index of prev stale leaf */ 65630f712c9SDave Chinner xfs_dir2_leaf_tail_t *ltp; /* leaf tail pointer */ 65730f712c9SDave Chinner int needbytes; /* leaf block bytes needed */ 65830f712c9SDave Chinner int needlog; /* need to log data header */ 65930f712c9SDave Chinner int needscan; /* need to rescan data free */ 66030f712c9SDave Chinner __be16 *tagp; /* end of data entry */ 66130f712c9SDave Chinner xfs_trans_t *tp; /* transaction pointer */ 66230f712c9SDave Chinner xfs_dir2_db_t use_block; /* data block number */ 66330f712c9SDave Chinner struct xfs_dir2_data_free *bf; /* bestfree table */ 66430f712c9SDave Chinner struct xfs_dir2_leaf_entry *ents; 66530f712c9SDave Chinner struct xfs_dir3_icleaf_hdr leafhdr; 66630f712c9SDave Chinner 66730f712c9SDave Chinner trace_xfs_dir2_leaf_addname(args); 66830f712c9SDave Chinner 66930f712c9SDave Chinner dp = args->dp; 67030f712c9SDave Chinner tp = args->trans; 67130f712c9SDave Chinner 67230f712c9SDave Chinner error = xfs_dir3_leaf_read(tp, dp, args->geo->leafblk, -1, &lbp); 67330f712c9SDave Chinner if (error) 67430f712c9SDave Chinner return error; 67530f712c9SDave Chinner 67630f712c9SDave Chinner /* 67730f712c9SDave Chinner * Look up the entry by hash value and name. 67830f712c9SDave Chinner * We know it's not there, our caller has already done a lookup. 67930f712c9SDave Chinner * So the index is of the entry to insert in front of. 68030f712c9SDave Chinner * But if there are dup hash values the index is of the first of those. 68130f712c9SDave Chinner */ 68230f712c9SDave Chinner index = xfs_dir2_leaf_search_hash(args, lbp); 68330f712c9SDave Chinner leaf = lbp->b_addr; 68430f712c9SDave Chinner ltp = xfs_dir2_leaf_tail_p(args->geo, leaf); 68530f712c9SDave Chinner ents = dp->d_ops->leaf_ents_p(leaf); 68630f712c9SDave Chinner dp->d_ops->leaf_hdr_from_disk(&leafhdr, leaf); 68730f712c9SDave Chinner bestsp = xfs_dir2_leaf_bests_p(ltp); 68830f712c9SDave Chinner length = dp->d_ops->data_entsize(args->namelen); 68930f712c9SDave Chinner 69030f712c9SDave Chinner /* 69130f712c9SDave Chinner * See if there are any entries with the same hash value 69230f712c9SDave Chinner * and space in their block for the new entry. 69330f712c9SDave Chinner * This is good because it puts multiple same-hash value entries 69430f712c9SDave Chinner * in a data block, improving the lookup of those entries. 69530f712c9SDave Chinner */ 69630f712c9SDave Chinner for (use_block = -1, lep = &ents[index]; 69730f712c9SDave Chinner index < leafhdr.count && be32_to_cpu(lep->hashval) == args->hashval; 69830f712c9SDave Chinner index++, lep++) { 69930f712c9SDave Chinner if (be32_to_cpu(lep->address) == XFS_DIR2_NULL_DATAPTR) 70030f712c9SDave Chinner continue; 70130f712c9SDave Chinner i = xfs_dir2_dataptr_to_db(args->geo, be32_to_cpu(lep->address)); 70230f712c9SDave Chinner ASSERT(i < be32_to_cpu(ltp->bestcount)); 70330f712c9SDave Chinner ASSERT(bestsp[i] != cpu_to_be16(NULLDATAOFF)); 70430f712c9SDave Chinner if (be16_to_cpu(bestsp[i]) >= length) { 70530f712c9SDave Chinner use_block = i; 70630f712c9SDave Chinner break; 70730f712c9SDave Chinner } 70830f712c9SDave Chinner } 70930f712c9SDave Chinner /* 71030f712c9SDave Chinner * Didn't find a block yet, linear search all the data blocks. 71130f712c9SDave Chinner */ 71230f712c9SDave Chinner if (use_block == -1) { 71330f712c9SDave Chinner for (i = 0; i < be32_to_cpu(ltp->bestcount); i++) { 71430f712c9SDave Chinner /* 71530f712c9SDave Chinner * Remember a block we see that's missing. 71630f712c9SDave Chinner */ 71730f712c9SDave Chinner if (bestsp[i] == cpu_to_be16(NULLDATAOFF) && 71830f712c9SDave Chinner use_block == -1) 71930f712c9SDave Chinner use_block = i; 72030f712c9SDave Chinner else if (be16_to_cpu(bestsp[i]) >= length) { 72130f712c9SDave Chinner use_block = i; 72230f712c9SDave Chinner break; 72330f712c9SDave Chinner } 72430f712c9SDave Chinner } 72530f712c9SDave Chinner } 72630f712c9SDave Chinner /* 72730f712c9SDave Chinner * How many bytes do we need in the leaf block? 72830f712c9SDave Chinner */ 72930f712c9SDave Chinner needbytes = 0; 73030f712c9SDave Chinner if (!leafhdr.stale) 73130f712c9SDave Chinner needbytes += sizeof(xfs_dir2_leaf_entry_t); 73230f712c9SDave Chinner if (use_block == -1) 73330f712c9SDave Chinner needbytes += sizeof(xfs_dir2_data_off_t); 73430f712c9SDave Chinner 73530f712c9SDave Chinner /* 73630f712c9SDave Chinner * Now kill use_block if it refers to a missing block, so we 73730f712c9SDave Chinner * can use it as an indication of allocation needed. 73830f712c9SDave Chinner */ 73930f712c9SDave Chinner if (use_block != -1 && bestsp[use_block] == cpu_to_be16(NULLDATAOFF)) 74030f712c9SDave Chinner use_block = -1; 74130f712c9SDave Chinner /* 74230f712c9SDave Chinner * If we don't have enough free bytes but we can make enough 74330f712c9SDave Chinner * by compacting out stale entries, we'll do that. 74430f712c9SDave Chinner */ 74530f712c9SDave Chinner if ((char *)bestsp - (char *)&ents[leafhdr.count] < needbytes && 74630f712c9SDave Chinner leafhdr.stale > 1) 74730f712c9SDave Chinner compact = 1; 74830f712c9SDave Chinner 74930f712c9SDave Chinner /* 75030f712c9SDave Chinner * Otherwise if we don't have enough free bytes we need to 75130f712c9SDave Chinner * convert to node form. 75230f712c9SDave Chinner */ 75330f712c9SDave Chinner else if ((char *)bestsp - (char *)&ents[leafhdr.count] < needbytes) { 75430f712c9SDave Chinner /* 75530f712c9SDave Chinner * Just checking or no space reservation, give up. 75630f712c9SDave Chinner */ 75730f712c9SDave Chinner if ((args->op_flags & XFS_DA_OP_JUSTCHECK) || 75830f712c9SDave Chinner args->total == 0) { 75930f712c9SDave Chinner xfs_trans_brelse(tp, lbp); 7602451337dSDave Chinner return -ENOSPC; 76130f712c9SDave Chinner } 76230f712c9SDave Chinner /* 76330f712c9SDave Chinner * Convert to node form. 76430f712c9SDave Chinner */ 76530f712c9SDave Chinner error = xfs_dir2_leaf_to_node(args, lbp); 76630f712c9SDave Chinner if (error) 76730f712c9SDave Chinner return error; 76830f712c9SDave Chinner /* 76930f712c9SDave Chinner * Then add the new entry. 77030f712c9SDave Chinner */ 77130f712c9SDave Chinner return xfs_dir2_node_addname(args); 77230f712c9SDave Chinner } 77330f712c9SDave Chinner /* 77430f712c9SDave Chinner * Otherwise it will fit without compaction. 77530f712c9SDave Chinner */ 77630f712c9SDave Chinner else 77730f712c9SDave Chinner compact = 0; 77830f712c9SDave Chinner /* 77930f712c9SDave Chinner * If just checking, then it will fit unless we needed to allocate 78030f712c9SDave Chinner * a new data block. 78130f712c9SDave Chinner */ 78230f712c9SDave Chinner if (args->op_flags & XFS_DA_OP_JUSTCHECK) { 78330f712c9SDave Chinner xfs_trans_brelse(tp, lbp); 7842451337dSDave Chinner return use_block == -1 ? -ENOSPC : 0; 78530f712c9SDave Chinner } 78630f712c9SDave Chinner /* 78730f712c9SDave Chinner * If no allocations are allowed, return now before we've 78830f712c9SDave Chinner * changed anything. 78930f712c9SDave Chinner */ 79030f712c9SDave Chinner if (args->total == 0 && use_block == -1) { 79130f712c9SDave Chinner xfs_trans_brelse(tp, lbp); 7922451337dSDave Chinner return -ENOSPC; 79330f712c9SDave Chinner } 79430f712c9SDave Chinner /* 79530f712c9SDave Chinner * Need to compact the leaf entries, removing stale ones. 79630f712c9SDave Chinner * Leave one stale entry behind - the one closest to our 79730f712c9SDave Chinner * insertion index - and we'll shift that one to our insertion 79830f712c9SDave Chinner * point later. 79930f712c9SDave Chinner */ 80030f712c9SDave Chinner if (compact) { 80130f712c9SDave Chinner xfs_dir3_leaf_compact_x1(&leafhdr, ents, &index, &lowstale, 80230f712c9SDave Chinner &highstale, &lfloglow, &lfloghigh); 80330f712c9SDave Chinner } 80430f712c9SDave Chinner /* 80530f712c9SDave Chinner * There are stale entries, so we'll need log-low and log-high 80630f712c9SDave Chinner * impossibly bad values later. 80730f712c9SDave Chinner */ 80830f712c9SDave Chinner else if (leafhdr.stale) { 80930f712c9SDave Chinner lfloglow = leafhdr.count; 81030f712c9SDave Chinner lfloghigh = -1; 81130f712c9SDave Chinner } 81230f712c9SDave Chinner /* 81330f712c9SDave Chinner * If there was no data block space found, we need to allocate 81430f712c9SDave Chinner * a new one. 81530f712c9SDave Chinner */ 81630f712c9SDave Chinner if (use_block == -1) { 81730f712c9SDave Chinner /* 81830f712c9SDave Chinner * Add the new data block. 81930f712c9SDave Chinner */ 82030f712c9SDave Chinner if ((error = xfs_dir2_grow_inode(args, XFS_DIR2_DATA_SPACE, 82130f712c9SDave Chinner &use_block))) { 82230f712c9SDave Chinner xfs_trans_brelse(tp, lbp); 82330f712c9SDave Chinner return error; 82430f712c9SDave Chinner } 82530f712c9SDave Chinner /* 82630f712c9SDave Chinner * Initialize the block. 82730f712c9SDave Chinner */ 82830f712c9SDave Chinner if ((error = xfs_dir3_data_init(args, use_block, &dbp))) { 82930f712c9SDave Chinner xfs_trans_brelse(tp, lbp); 83030f712c9SDave Chinner return error; 83130f712c9SDave Chinner } 83230f712c9SDave Chinner /* 83330f712c9SDave Chinner * If we're adding a new data block on the end we need to 83430f712c9SDave Chinner * extend the bests table. Copy it up one entry. 83530f712c9SDave Chinner */ 83630f712c9SDave Chinner if (use_block >= be32_to_cpu(ltp->bestcount)) { 83730f712c9SDave Chinner bestsp--; 83830f712c9SDave Chinner memmove(&bestsp[0], &bestsp[1], 83930f712c9SDave Chinner be32_to_cpu(ltp->bestcount) * sizeof(bestsp[0])); 84030f712c9SDave Chinner be32_add_cpu(<p->bestcount, 1); 84130f712c9SDave Chinner xfs_dir3_leaf_log_tail(args, lbp); 84230f712c9SDave Chinner xfs_dir3_leaf_log_bests(args, lbp, 0, 84330f712c9SDave Chinner be32_to_cpu(ltp->bestcount) - 1); 84430f712c9SDave Chinner } 84530f712c9SDave Chinner /* 84630f712c9SDave Chinner * If we're filling in a previously empty block just log it. 84730f712c9SDave Chinner */ 84830f712c9SDave Chinner else 84930f712c9SDave Chinner xfs_dir3_leaf_log_bests(args, lbp, use_block, use_block); 85030f712c9SDave Chinner hdr = dbp->b_addr; 85130f712c9SDave Chinner bf = dp->d_ops->data_bestfree_p(hdr); 85230f712c9SDave Chinner bestsp[use_block] = bf[0].length; 85330f712c9SDave Chinner grown = 1; 85430f712c9SDave Chinner } else { 85530f712c9SDave Chinner /* 85630f712c9SDave Chinner * Already had space in some data block. 85730f712c9SDave Chinner * Just read that one in. 85830f712c9SDave Chinner */ 85930f712c9SDave Chinner error = xfs_dir3_data_read(tp, dp, 86030f712c9SDave Chinner xfs_dir2_db_to_da(args->geo, use_block), 86130f712c9SDave Chinner -1, &dbp); 86230f712c9SDave Chinner if (error) { 86330f712c9SDave Chinner xfs_trans_brelse(tp, lbp); 86430f712c9SDave Chinner return error; 86530f712c9SDave Chinner } 86630f712c9SDave Chinner hdr = dbp->b_addr; 86730f712c9SDave Chinner bf = dp->d_ops->data_bestfree_p(hdr); 86830f712c9SDave Chinner grown = 0; 86930f712c9SDave Chinner } 87030f712c9SDave Chinner /* 87130f712c9SDave Chinner * Point to the biggest freespace in our data block. 87230f712c9SDave Chinner */ 87330f712c9SDave Chinner dup = (xfs_dir2_data_unused_t *) 87430f712c9SDave Chinner ((char *)hdr + be16_to_cpu(bf[0].offset)); 87530f712c9SDave Chinner ASSERT(be16_to_cpu(dup->length) >= length); 87630f712c9SDave Chinner needscan = needlog = 0; 87730f712c9SDave Chinner /* 87830f712c9SDave Chinner * Mark the initial part of our freespace in use for the new entry. 87930f712c9SDave Chinner */ 88030f712c9SDave Chinner xfs_dir2_data_use_free(args, dbp, dup, 88130f712c9SDave Chinner (xfs_dir2_data_aoff_t)((char *)dup - (char *)hdr), length, 88230f712c9SDave Chinner &needlog, &needscan); 88330f712c9SDave Chinner /* 88430f712c9SDave Chinner * Initialize our new entry (at last). 88530f712c9SDave Chinner */ 88630f712c9SDave Chinner dep = (xfs_dir2_data_entry_t *)dup; 88730f712c9SDave Chinner dep->inumber = cpu_to_be64(args->inumber); 88830f712c9SDave Chinner dep->namelen = args->namelen; 88930f712c9SDave Chinner memcpy(dep->name, args->name, dep->namelen); 89030f712c9SDave Chinner dp->d_ops->data_put_ftype(dep, args->filetype); 89130f712c9SDave Chinner tagp = dp->d_ops->data_entry_tag_p(dep); 89230f712c9SDave Chinner *tagp = cpu_to_be16((char *)dep - (char *)hdr); 89330f712c9SDave Chinner /* 89430f712c9SDave Chinner * Need to scan fix up the bestfree table. 89530f712c9SDave Chinner */ 89630f712c9SDave Chinner if (needscan) 89730f712c9SDave Chinner xfs_dir2_data_freescan(dp, hdr, &needlog); 89830f712c9SDave Chinner /* 89930f712c9SDave Chinner * Need to log the data block's header. 90030f712c9SDave Chinner */ 90130f712c9SDave Chinner if (needlog) 90230f712c9SDave Chinner xfs_dir2_data_log_header(args, dbp); 90330f712c9SDave Chinner xfs_dir2_data_log_entry(args, dbp, dep); 90430f712c9SDave Chinner /* 90530f712c9SDave Chinner * If the bests table needs to be changed, do it. 90630f712c9SDave Chinner * Log the change unless we've already done that. 90730f712c9SDave Chinner */ 90830f712c9SDave Chinner if (be16_to_cpu(bestsp[use_block]) != be16_to_cpu(bf[0].length)) { 90930f712c9SDave Chinner bestsp[use_block] = bf[0].length; 91030f712c9SDave Chinner if (!grown) 91130f712c9SDave Chinner xfs_dir3_leaf_log_bests(args, lbp, use_block, use_block); 91230f712c9SDave Chinner } 91330f712c9SDave Chinner 91430f712c9SDave Chinner lep = xfs_dir3_leaf_find_entry(&leafhdr, ents, index, compact, lowstale, 91530f712c9SDave Chinner highstale, &lfloglow, &lfloghigh); 91630f712c9SDave Chinner 91730f712c9SDave Chinner /* 91830f712c9SDave Chinner * Fill in the new leaf entry. 91930f712c9SDave Chinner */ 92030f712c9SDave Chinner lep->hashval = cpu_to_be32(args->hashval); 92130f712c9SDave Chinner lep->address = cpu_to_be32( 92230f712c9SDave Chinner xfs_dir2_db_off_to_dataptr(args->geo, use_block, 92330f712c9SDave Chinner be16_to_cpu(*tagp))); 92430f712c9SDave Chinner /* 92530f712c9SDave Chinner * Log the leaf fields and give up the buffers. 92630f712c9SDave Chinner */ 92730f712c9SDave Chinner dp->d_ops->leaf_hdr_to_disk(leaf, &leafhdr); 92830f712c9SDave Chinner xfs_dir3_leaf_log_header(args, lbp); 92930f712c9SDave Chinner xfs_dir3_leaf_log_ents(args, lbp, lfloglow, lfloghigh); 93030f712c9SDave Chinner xfs_dir3_leaf_check(dp, lbp); 93130f712c9SDave Chinner xfs_dir3_data_check(dp, dbp); 93230f712c9SDave Chinner return 0; 93330f712c9SDave Chinner } 93430f712c9SDave Chinner 93530f712c9SDave Chinner /* 93630f712c9SDave Chinner * Compact out any stale entries in the leaf. 93730f712c9SDave Chinner * Log the header and changed leaf entries, if any. 93830f712c9SDave Chinner */ 93930f712c9SDave Chinner void 94030f712c9SDave Chinner xfs_dir3_leaf_compact( 94130f712c9SDave Chinner xfs_da_args_t *args, /* operation arguments */ 94230f712c9SDave Chinner struct xfs_dir3_icleaf_hdr *leafhdr, 94330f712c9SDave Chinner struct xfs_buf *bp) /* leaf buffer */ 94430f712c9SDave Chinner { 94530f712c9SDave Chinner int from; /* source leaf index */ 94630f712c9SDave Chinner xfs_dir2_leaf_t *leaf; /* leaf structure */ 94730f712c9SDave Chinner int loglow; /* first leaf entry to log */ 94830f712c9SDave Chinner int to; /* target leaf index */ 94930f712c9SDave Chinner struct xfs_dir2_leaf_entry *ents; 95030f712c9SDave Chinner struct xfs_inode *dp = args->dp; 95130f712c9SDave Chinner 95230f712c9SDave Chinner leaf = bp->b_addr; 95330f712c9SDave Chinner if (!leafhdr->stale) 95430f712c9SDave Chinner return; 95530f712c9SDave Chinner 95630f712c9SDave Chinner /* 95730f712c9SDave Chinner * Compress out the stale entries in place. 95830f712c9SDave Chinner */ 95930f712c9SDave Chinner ents = dp->d_ops->leaf_ents_p(leaf); 96030f712c9SDave Chinner for (from = to = 0, loglow = -1; from < leafhdr->count; from++) { 96130f712c9SDave Chinner if (ents[from].address == cpu_to_be32(XFS_DIR2_NULL_DATAPTR)) 96230f712c9SDave Chinner continue; 96330f712c9SDave Chinner /* 96430f712c9SDave Chinner * Only actually copy the entries that are different. 96530f712c9SDave Chinner */ 96630f712c9SDave Chinner if (from > to) { 96730f712c9SDave Chinner if (loglow == -1) 96830f712c9SDave Chinner loglow = to; 96930f712c9SDave Chinner ents[to] = ents[from]; 97030f712c9SDave Chinner } 97130f712c9SDave Chinner to++; 97230f712c9SDave Chinner } 97330f712c9SDave Chinner /* 97430f712c9SDave Chinner * Update and log the header, log the leaf entries. 97530f712c9SDave Chinner */ 97630f712c9SDave Chinner ASSERT(leafhdr->stale == from - to); 97730f712c9SDave Chinner leafhdr->count -= leafhdr->stale; 97830f712c9SDave Chinner leafhdr->stale = 0; 97930f712c9SDave Chinner 98030f712c9SDave Chinner dp->d_ops->leaf_hdr_to_disk(leaf, leafhdr); 98130f712c9SDave Chinner xfs_dir3_leaf_log_header(args, bp); 98230f712c9SDave Chinner if (loglow != -1) 98330f712c9SDave Chinner xfs_dir3_leaf_log_ents(args, bp, loglow, to - 1); 98430f712c9SDave Chinner } 98530f712c9SDave Chinner 98630f712c9SDave Chinner /* 98730f712c9SDave Chinner * Compact the leaf entries, removing stale ones. 98830f712c9SDave Chinner * Leave one stale entry behind - the one closest to our 98930f712c9SDave Chinner * insertion index - and the caller will shift that one to our insertion 99030f712c9SDave Chinner * point later. 99130f712c9SDave Chinner * Return new insertion index, where the remaining stale entry is, 99230f712c9SDave Chinner * and leaf logging indices. 99330f712c9SDave Chinner */ 99430f712c9SDave Chinner void 99530f712c9SDave Chinner xfs_dir3_leaf_compact_x1( 99630f712c9SDave Chinner struct xfs_dir3_icleaf_hdr *leafhdr, 99730f712c9SDave Chinner struct xfs_dir2_leaf_entry *ents, 99830f712c9SDave Chinner int *indexp, /* insertion index */ 99930f712c9SDave Chinner int *lowstalep, /* out: stale entry before us */ 100030f712c9SDave Chinner int *highstalep, /* out: stale entry after us */ 100130f712c9SDave Chinner int *lowlogp, /* out: low log index */ 100230f712c9SDave Chinner int *highlogp) /* out: high log index */ 100330f712c9SDave Chinner { 100430f712c9SDave Chinner int from; /* source copy index */ 100530f712c9SDave Chinner int highstale; /* stale entry at/after index */ 100630f712c9SDave Chinner int index; /* insertion index */ 100730f712c9SDave Chinner int keepstale; /* source index of kept stale */ 100830f712c9SDave Chinner int lowstale; /* stale entry before index */ 100930f712c9SDave Chinner int newindex=0; /* new insertion index */ 101030f712c9SDave Chinner int to; /* destination copy index */ 101130f712c9SDave Chinner 101230f712c9SDave Chinner ASSERT(leafhdr->stale > 1); 101330f712c9SDave Chinner index = *indexp; 101430f712c9SDave Chinner 101530f712c9SDave Chinner xfs_dir3_leaf_find_stale(leafhdr, ents, index, &lowstale, &highstale); 101630f712c9SDave Chinner 101730f712c9SDave Chinner /* 101830f712c9SDave Chinner * Pick the better of lowstale and highstale. 101930f712c9SDave Chinner */ 102030f712c9SDave Chinner if (lowstale >= 0 && 102130f712c9SDave Chinner (highstale == leafhdr->count || 102230f712c9SDave Chinner index - lowstale <= highstale - index)) 102330f712c9SDave Chinner keepstale = lowstale; 102430f712c9SDave Chinner else 102530f712c9SDave Chinner keepstale = highstale; 102630f712c9SDave Chinner /* 102730f712c9SDave Chinner * Copy the entries in place, removing all the stale entries 102830f712c9SDave Chinner * except keepstale. 102930f712c9SDave Chinner */ 103030f712c9SDave Chinner for (from = to = 0; from < leafhdr->count; from++) { 103130f712c9SDave Chinner /* 103230f712c9SDave Chinner * Notice the new value of index. 103330f712c9SDave Chinner */ 103430f712c9SDave Chinner if (index == from) 103530f712c9SDave Chinner newindex = to; 103630f712c9SDave Chinner if (from != keepstale && 103730f712c9SDave Chinner ents[from].address == cpu_to_be32(XFS_DIR2_NULL_DATAPTR)) { 103830f712c9SDave Chinner if (from == to) 103930f712c9SDave Chinner *lowlogp = to; 104030f712c9SDave Chinner continue; 104130f712c9SDave Chinner } 104230f712c9SDave Chinner /* 104330f712c9SDave Chinner * Record the new keepstale value for the insertion. 104430f712c9SDave Chinner */ 104530f712c9SDave Chinner if (from == keepstale) 104630f712c9SDave Chinner lowstale = highstale = to; 104730f712c9SDave Chinner /* 104830f712c9SDave Chinner * Copy only the entries that have moved. 104930f712c9SDave Chinner */ 105030f712c9SDave Chinner if (from > to) 105130f712c9SDave Chinner ents[to] = ents[from]; 105230f712c9SDave Chinner to++; 105330f712c9SDave Chinner } 105430f712c9SDave Chinner ASSERT(from > to); 105530f712c9SDave Chinner /* 105630f712c9SDave Chinner * If the insertion point was past the last entry, 105730f712c9SDave Chinner * set the new insertion point accordingly. 105830f712c9SDave Chinner */ 105930f712c9SDave Chinner if (index == from) 106030f712c9SDave Chinner newindex = to; 106130f712c9SDave Chinner *indexp = newindex; 106230f712c9SDave Chinner /* 106330f712c9SDave Chinner * Adjust the leaf header values. 106430f712c9SDave Chinner */ 106530f712c9SDave Chinner leafhdr->count -= from - to; 106630f712c9SDave Chinner leafhdr->stale = 1; 106730f712c9SDave Chinner /* 106830f712c9SDave Chinner * Remember the low/high stale value only in the "right" 106930f712c9SDave Chinner * direction. 107030f712c9SDave Chinner */ 107130f712c9SDave Chinner if (lowstale >= newindex) 107230f712c9SDave Chinner lowstale = -1; 107330f712c9SDave Chinner else 107430f712c9SDave Chinner highstale = leafhdr->count; 107530f712c9SDave Chinner *highlogp = leafhdr->count - 1; 107630f712c9SDave Chinner *lowstalep = lowstale; 107730f712c9SDave Chinner *highstalep = highstale; 107830f712c9SDave Chinner } 107930f712c9SDave Chinner 108030f712c9SDave Chinner /* 108130f712c9SDave Chinner * Log the bests entries indicated from a leaf1 block. 108230f712c9SDave Chinner */ 108330f712c9SDave Chinner static void 108430f712c9SDave Chinner xfs_dir3_leaf_log_bests( 108530f712c9SDave Chinner struct xfs_da_args *args, 108630f712c9SDave Chinner struct xfs_buf *bp, /* leaf buffer */ 108730f712c9SDave Chinner int first, /* first entry to log */ 108830f712c9SDave Chinner int last) /* last entry to log */ 108930f712c9SDave Chinner { 109030f712c9SDave Chinner __be16 *firstb; /* pointer to first entry */ 109130f712c9SDave Chinner __be16 *lastb; /* pointer to last entry */ 109230f712c9SDave Chinner struct xfs_dir2_leaf *leaf = bp->b_addr; 109330f712c9SDave Chinner xfs_dir2_leaf_tail_t *ltp; /* leaf tail structure */ 109430f712c9SDave Chinner 109530f712c9SDave Chinner ASSERT(leaf->hdr.info.magic == cpu_to_be16(XFS_DIR2_LEAF1_MAGIC) || 109630f712c9SDave Chinner leaf->hdr.info.magic == cpu_to_be16(XFS_DIR3_LEAF1_MAGIC)); 109730f712c9SDave Chinner 109830f712c9SDave Chinner ltp = xfs_dir2_leaf_tail_p(args->geo, leaf); 109930f712c9SDave Chinner firstb = xfs_dir2_leaf_bests_p(ltp) + first; 110030f712c9SDave Chinner lastb = xfs_dir2_leaf_bests_p(ltp) + last; 110130f712c9SDave Chinner xfs_trans_log_buf(args->trans, bp, 110230f712c9SDave Chinner (uint)((char *)firstb - (char *)leaf), 110330f712c9SDave Chinner (uint)((char *)lastb - (char *)leaf + sizeof(*lastb) - 1)); 110430f712c9SDave Chinner } 110530f712c9SDave Chinner 110630f712c9SDave Chinner /* 110730f712c9SDave Chinner * Log the leaf entries indicated from a leaf1 or leafn block. 110830f712c9SDave Chinner */ 110930f712c9SDave Chinner void 111030f712c9SDave Chinner xfs_dir3_leaf_log_ents( 111130f712c9SDave Chinner struct xfs_da_args *args, 111230f712c9SDave Chinner struct xfs_buf *bp, 111330f712c9SDave Chinner int first, 111430f712c9SDave Chinner int last) 111530f712c9SDave Chinner { 111630f712c9SDave Chinner xfs_dir2_leaf_entry_t *firstlep; /* pointer to first entry */ 111730f712c9SDave Chinner xfs_dir2_leaf_entry_t *lastlep; /* pointer to last entry */ 111830f712c9SDave Chinner struct xfs_dir2_leaf *leaf = bp->b_addr; 111930f712c9SDave Chinner struct xfs_dir2_leaf_entry *ents; 112030f712c9SDave Chinner 112130f712c9SDave Chinner ASSERT(leaf->hdr.info.magic == cpu_to_be16(XFS_DIR2_LEAF1_MAGIC) || 112230f712c9SDave Chinner leaf->hdr.info.magic == cpu_to_be16(XFS_DIR3_LEAF1_MAGIC) || 112330f712c9SDave Chinner leaf->hdr.info.magic == cpu_to_be16(XFS_DIR2_LEAFN_MAGIC) || 112430f712c9SDave Chinner leaf->hdr.info.magic == cpu_to_be16(XFS_DIR3_LEAFN_MAGIC)); 112530f712c9SDave Chinner 112630f712c9SDave Chinner ents = args->dp->d_ops->leaf_ents_p(leaf); 112730f712c9SDave Chinner firstlep = &ents[first]; 112830f712c9SDave Chinner lastlep = &ents[last]; 112930f712c9SDave Chinner xfs_trans_log_buf(args->trans, bp, 113030f712c9SDave Chinner (uint)((char *)firstlep - (char *)leaf), 113130f712c9SDave Chinner (uint)((char *)lastlep - (char *)leaf + sizeof(*lastlep) - 1)); 113230f712c9SDave Chinner } 113330f712c9SDave Chinner 113430f712c9SDave Chinner /* 113530f712c9SDave Chinner * Log the header of the leaf1 or leafn block. 113630f712c9SDave Chinner */ 113730f712c9SDave Chinner void 113830f712c9SDave Chinner xfs_dir3_leaf_log_header( 113930f712c9SDave Chinner struct xfs_da_args *args, 114030f712c9SDave Chinner struct xfs_buf *bp) 114130f712c9SDave Chinner { 114230f712c9SDave Chinner struct xfs_dir2_leaf *leaf = bp->b_addr; 114330f712c9SDave Chinner 114430f712c9SDave Chinner ASSERT(leaf->hdr.info.magic == cpu_to_be16(XFS_DIR2_LEAF1_MAGIC) || 114530f712c9SDave Chinner leaf->hdr.info.magic == cpu_to_be16(XFS_DIR3_LEAF1_MAGIC) || 114630f712c9SDave Chinner leaf->hdr.info.magic == cpu_to_be16(XFS_DIR2_LEAFN_MAGIC) || 114730f712c9SDave Chinner leaf->hdr.info.magic == cpu_to_be16(XFS_DIR3_LEAFN_MAGIC)); 114830f712c9SDave Chinner 114930f712c9SDave Chinner xfs_trans_log_buf(args->trans, bp, 115030f712c9SDave Chinner (uint)((char *)&leaf->hdr - (char *)leaf), 115130f712c9SDave Chinner args->dp->d_ops->leaf_hdr_size - 1); 115230f712c9SDave Chinner } 115330f712c9SDave Chinner 115430f712c9SDave Chinner /* 115530f712c9SDave Chinner * Log the tail of the leaf1 block. 115630f712c9SDave Chinner */ 115730f712c9SDave Chinner STATIC void 115830f712c9SDave Chinner xfs_dir3_leaf_log_tail( 115930f712c9SDave Chinner struct xfs_da_args *args, 116030f712c9SDave Chinner struct xfs_buf *bp) 116130f712c9SDave Chinner { 116230f712c9SDave Chinner struct xfs_dir2_leaf *leaf = bp->b_addr; 116330f712c9SDave Chinner xfs_dir2_leaf_tail_t *ltp; /* leaf tail structure */ 116430f712c9SDave Chinner 116530f712c9SDave Chinner ASSERT(leaf->hdr.info.magic == cpu_to_be16(XFS_DIR2_LEAF1_MAGIC) || 116630f712c9SDave Chinner leaf->hdr.info.magic == cpu_to_be16(XFS_DIR3_LEAF1_MAGIC) || 116730f712c9SDave Chinner leaf->hdr.info.magic == cpu_to_be16(XFS_DIR2_LEAFN_MAGIC) || 116830f712c9SDave Chinner leaf->hdr.info.magic == cpu_to_be16(XFS_DIR3_LEAFN_MAGIC)); 116930f712c9SDave Chinner 117030f712c9SDave Chinner ltp = xfs_dir2_leaf_tail_p(args->geo, leaf); 117130f712c9SDave Chinner xfs_trans_log_buf(args->trans, bp, (uint)((char *)ltp - (char *)leaf), 117230f712c9SDave Chinner (uint)(args->geo->blksize - 1)); 117330f712c9SDave Chinner } 117430f712c9SDave Chinner 117530f712c9SDave Chinner /* 117630f712c9SDave Chinner * Look up the entry referred to by args in the leaf format directory. 117730f712c9SDave Chinner * Most of the work is done by the xfs_dir2_leaf_lookup_int routine which 117830f712c9SDave Chinner * is also used by the node-format code. 117930f712c9SDave Chinner */ 118030f712c9SDave Chinner int 118130f712c9SDave Chinner xfs_dir2_leaf_lookup( 118230f712c9SDave Chinner xfs_da_args_t *args) /* operation arguments */ 118330f712c9SDave Chinner { 118430f712c9SDave Chinner struct xfs_buf *dbp; /* data block buffer */ 118530f712c9SDave Chinner xfs_dir2_data_entry_t *dep; /* data block entry */ 118630f712c9SDave Chinner xfs_inode_t *dp; /* incore directory inode */ 118730f712c9SDave Chinner int error; /* error return code */ 118830f712c9SDave Chinner int index; /* found entry index */ 118930f712c9SDave Chinner struct xfs_buf *lbp; /* leaf buffer */ 119030f712c9SDave Chinner xfs_dir2_leaf_t *leaf; /* leaf structure */ 119130f712c9SDave Chinner xfs_dir2_leaf_entry_t *lep; /* leaf entry */ 119230f712c9SDave Chinner xfs_trans_t *tp; /* transaction pointer */ 119330f712c9SDave Chinner struct xfs_dir2_leaf_entry *ents; 119430f712c9SDave Chinner 119530f712c9SDave Chinner trace_xfs_dir2_leaf_lookup(args); 119630f712c9SDave Chinner 119730f712c9SDave Chinner /* 119830f712c9SDave Chinner * Look up name in the leaf block, returning both buffers and index. 119930f712c9SDave Chinner */ 120030f712c9SDave Chinner if ((error = xfs_dir2_leaf_lookup_int(args, &lbp, &index, &dbp))) { 120130f712c9SDave Chinner return error; 120230f712c9SDave Chinner } 120330f712c9SDave Chinner tp = args->trans; 120430f712c9SDave Chinner dp = args->dp; 120530f712c9SDave Chinner xfs_dir3_leaf_check(dp, lbp); 120630f712c9SDave Chinner leaf = lbp->b_addr; 120730f712c9SDave Chinner ents = dp->d_ops->leaf_ents_p(leaf); 120830f712c9SDave Chinner /* 120930f712c9SDave Chinner * Get to the leaf entry and contained data entry address. 121030f712c9SDave Chinner */ 121130f712c9SDave Chinner lep = &ents[index]; 121230f712c9SDave Chinner 121330f712c9SDave Chinner /* 121430f712c9SDave Chinner * Point to the data entry. 121530f712c9SDave Chinner */ 121630f712c9SDave Chinner dep = (xfs_dir2_data_entry_t *) 121730f712c9SDave Chinner ((char *)dbp->b_addr + 121830f712c9SDave Chinner xfs_dir2_dataptr_to_off(args->geo, be32_to_cpu(lep->address))); 121930f712c9SDave Chinner /* 122030f712c9SDave Chinner * Return the found inode number & CI name if appropriate 122130f712c9SDave Chinner */ 122230f712c9SDave Chinner args->inumber = be64_to_cpu(dep->inumber); 122330f712c9SDave Chinner args->filetype = dp->d_ops->data_get_ftype(dep); 122430f712c9SDave Chinner error = xfs_dir_cilookup_result(args, dep->name, dep->namelen); 122530f712c9SDave Chinner xfs_trans_brelse(tp, dbp); 122630f712c9SDave Chinner xfs_trans_brelse(tp, lbp); 122730f712c9SDave Chinner return error; 122830f712c9SDave Chinner } 122930f712c9SDave Chinner 123030f712c9SDave Chinner /* 123130f712c9SDave Chinner * Look up name/hash in the leaf block. 123230f712c9SDave Chinner * Fill in indexp with the found index, and dbpp with the data buffer. 123330f712c9SDave Chinner * If not found dbpp will be NULL, and ENOENT comes back. 123430f712c9SDave Chinner * lbpp will always be filled in with the leaf buffer unless there's an error. 123530f712c9SDave Chinner */ 123630f712c9SDave Chinner static int /* error */ 123730f712c9SDave Chinner xfs_dir2_leaf_lookup_int( 123830f712c9SDave Chinner xfs_da_args_t *args, /* operation arguments */ 123930f712c9SDave Chinner struct xfs_buf **lbpp, /* out: leaf buffer */ 124030f712c9SDave Chinner int *indexp, /* out: index in leaf block */ 124130f712c9SDave Chinner struct xfs_buf **dbpp) /* out: data buffer */ 124230f712c9SDave Chinner { 124330f712c9SDave Chinner xfs_dir2_db_t curdb = -1; /* current data block number */ 124430f712c9SDave Chinner struct xfs_buf *dbp = NULL; /* data buffer */ 124530f712c9SDave Chinner xfs_dir2_data_entry_t *dep; /* data entry */ 124630f712c9SDave Chinner xfs_inode_t *dp; /* incore directory inode */ 124730f712c9SDave Chinner int error; /* error return code */ 124830f712c9SDave Chinner int index; /* index in leaf block */ 124930f712c9SDave Chinner struct xfs_buf *lbp; /* leaf buffer */ 125030f712c9SDave Chinner xfs_dir2_leaf_entry_t *lep; /* leaf entry */ 125130f712c9SDave Chinner xfs_dir2_leaf_t *leaf; /* leaf structure */ 125230f712c9SDave Chinner xfs_mount_t *mp; /* filesystem mount point */ 125330f712c9SDave Chinner xfs_dir2_db_t newdb; /* new data block number */ 125430f712c9SDave Chinner xfs_trans_t *tp; /* transaction pointer */ 125530f712c9SDave Chinner xfs_dir2_db_t cidb = -1; /* case match data block no. */ 125630f712c9SDave Chinner enum xfs_dacmp cmp; /* name compare result */ 125730f712c9SDave Chinner struct xfs_dir2_leaf_entry *ents; 125830f712c9SDave Chinner struct xfs_dir3_icleaf_hdr leafhdr; 125930f712c9SDave Chinner 126030f712c9SDave Chinner dp = args->dp; 126130f712c9SDave Chinner tp = args->trans; 126230f712c9SDave Chinner mp = dp->i_mount; 126330f712c9SDave Chinner 126430f712c9SDave Chinner error = xfs_dir3_leaf_read(tp, dp, args->geo->leafblk, -1, &lbp); 126530f712c9SDave Chinner if (error) 126630f712c9SDave Chinner return error; 126730f712c9SDave Chinner 126830f712c9SDave Chinner *lbpp = lbp; 126930f712c9SDave Chinner leaf = lbp->b_addr; 127030f712c9SDave Chinner xfs_dir3_leaf_check(dp, lbp); 127130f712c9SDave Chinner ents = dp->d_ops->leaf_ents_p(leaf); 127230f712c9SDave Chinner dp->d_ops->leaf_hdr_from_disk(&leafhdr, leaf); 127330f712c9SDave Chinner 127430f712c9SDave Chinner /* 127530f712c9SDave Chinner * Look for the first leaf entry with our hash value. 127630f712c9SDave Chinner */ 127730f712c9SDave Chinner index = xfs_dir2_leaf_search_hash(args, lbp); 127830f712c9SDave Chinner /* 127930f712c9SDave Chinner * Loop over all the entries with the right hash value 128030f712c9SDave Chinner * looking to match the name. 128130f712c9SDave Chinner */ 128230f712c9SDave Chinner for (lep = &ents[index]; 128330f712c9SDave Chinner index < leafhdr.count && be32_to_cpu(lep->hashval) == args->hashval; 128430f712c9SDave Chinner lep++, index++) { 128530f712c9SDave Chinner /* 128630f712c9SDave Chinner * Skip over stale leaf entries. 128730f712c9SDave Chinner */ 128830f712c9SDave Chinner if (be32_to_cpu(lep->address) == XFS_DIR2_NULL_DATAPTR) 128930f712c9SDave Chinner continue; 129030f712c9SDave Chinner /* 129130f712c9SDave Chinner * Get the new data block number. 129230f712c9SDave Chinner */ 129330f712c9SDave Chinner newdb = xfs_dir2_dataptr_to_db(args->geo, 129430f712c9SDave Chinner be32_to_cpu(lep->address)); 129530f712c9SDave Chinner /* 129630f712c9SDave Chinner * If it's not the same as the old data block number, 129730f712c9SDave Chinner * need to pitch the old one and read the new one. 129830f712c9SDave Chinner */ 129930f712c9SDave Chinner if (newdb != curdb) { 130030f712c9SDave Chinner if (dbp) 130130f712c9SDave Chinner xfs_trans_brelse(tp, dbp); 130230f712c9SDave Chinner error = xfs_dir3_data_read(tp, dp, 130330f712c9SDave Chinner xfs_dir2_db_to_da(args->geo, newdb), 130430f712c9SDave Chinner -1, &dbp); 130530f712c9SDave Chinner if (error) { 130630f712c9SDave Chinner xfs_trans_brelse(tp, lbp); 130730f712c9SDave Chinner return error; 130830f712c9SDave Chinner } 130930f712c9SDave Chinner curdb = newdb; 131030f712c9SDave Chinner } 131130f712c9SDave Chinner /* 131230f712c9SDave Chinner * Point to the data entry. 131330f712c9SDave Chinner */ 131430f712c9SDave Chinner dep = (xfs_dir2_data_entry_t *)((char *)dbp->b_addr + 131530f712c9SDave Chinner xfs_dir2_dataptr_to_off(args->geo, 131630f712c9SDave Chinner be32_to_cpu(lep->address))); 131730f712c9SDave Chinner /* 131830f712c9SDave Chinner * Compare name and if it's an exact match, return the index 131930f712c9SDave Chinner * and buffer. If it's the first case-insensitive match, store 132030f712c9SDave Chinner * the index and buffer and continue looking for an exact match. 132130f712c9SDave Chinner */ 132230f712c9SDave Chinner cmp = mp->m_dirnameops->compname(args, dep->name, dep->namelen); 132330f712c9SDave Chinner if (cmp != XFS_CMP_DIFFERENT && cmp != args->cmpresult) { 132430f712c9SDave Chinner args->cmpresult = cmp; 132530f712c9SDave Chinner *indexp = index; 132630f712c9SDave Chinner /* case exact match: return the current buffer. */ 132730f712c9SDave Chinner if (cmp == XFS_CMP_EXACT) { 132830f712c9SDave Chinner *dbpp = dbp; 132930f712c9SDave Chinner return 0; 133030f712c9SDave Chinner } 133130f712c9SDave Chinner cidb = curdb; 133230f712c9SDave Chinner } 133330f712c9SDave Chinner } 133430f712c9SDave Chinner ASSERT(args->op_flags & XFS_DA_OP_OKNOENT); 133530f712c9SDave Chinner /* 133630f712c9SDave Chinner * Here, we can only be doing a lookup (not a rename or remove). 133730f712c9SDave Chinner * If a case-insensitive match was found earlier, re-read the 133830f712c9SDave Chinner * appropriate data block if required and return it. 133930f712c9SDave Chinner */ 134030f712c9SDave Chinner if (args->cmpresult == XFS_CMP_CASE) { 134130f712c9SDave Chinner ASSERT(cidb != -1); 134230f712c9SDave Chinner if (cidb != curdb) { 134330f712c9SDave Chinner xfs_trans_brelse(tp, dbp); 134430f712c9SDave Chinner error = xfs_dir3_data_read(tp, dp, 134530f712c9SDave Chinner xfs_dir2_db_to_da(args->geo, cidb), 134630f712c9SDave Chinner -1, &dbp); 134730f712c9SDave Chinner if (error) { 134830f712c9SDave Chinner xfs_trans_brelse(tp, lbp); 134930f712c9SDave Chinner return error; 135030f712c9SDave Chinner } 135130f712c9SDave Chinner } 135230f712c9SDave Chinner *dbpp = dbp; 135330f712c9SDave Chinner return 0; 135430f712c9SDave Chinner } 135530f712c9SDave Chinner /* 13562451337dSDave Chinner * No match found, return -ENOENT. 135730f712c9SDave Chinner */ 135830f712c9SDave Chinner ASSERT(cidb == -1); 135930f712c9SDave Chinner if (dbp) 136030f712c9SDave Chinner xfs_trans_brelse(tp, dbp); 136130f712c9SDave Chinner xfs_trans_brelse(tp, lbp); 13622451337dSDave Chinner return -ENOENT; 136330f712c9SDave Chinner } 136430f712c9SDave Chinner 136530f712c9SDave Chinner /* 136630f712c9SDave Chinner * Remove an entry from a leaf format directory. 136730f712c9SDave Chinner */ 136830f712c9SDave Chinner int /* error */ 136930f712c9SDave Chinner xfs_dir2_leaf_removename( 137030f712c9SDave Chinner xfs_da_args_t *args) /* operation arguments */ 137130f712c9SDave Chinner { 137230f712c9SDave Chinner __be16 *bestsp; /* leaf block best freespace */ 137330f712c9SDave Chinner xfs_dir2_data_hdr_t *hdr; /* data block header */ 137430f712c9SDave Chinner xfs_dir2_db_t db; /* data block number */ 137530f712c9SDave Chinner struct xfs_buf *dbp; /* data block buffer */ 137630f712c9SDave Chinner xfs_dir2_data_entry_t *dep; /* data entry structure */ 137730f712c9SDave Chinner xfs_inode_t *dp; /* incore directory inode */ 137830f712c9SDave Chinner int error; /* error return code */ 137930f712c9SDave Chinner xfs_dir2_db_t i; /* temporary data block # */ 138030f712c9SDave Chinner int index; /* index into leaf entries */ 138130f712c9SDave Chinner struct xfs_buf *lbp; /* leaf buffer */ 138230f712c9SDave Chinner xfs_dir2_leaf_t *leaf; /* leaf structure */ 138330f712c9SDave Chinner xfs_dir2_leaf_entry_t *lep; /* leaf entry */ 138430f712c9SDave Chinner xfs_dir2_leaf_tail_t *ltp; /* leaf tail structure */ 138530f712c9SDave Chinner int needlog; /* need to log data header */ 138630f712c9SDave Chinner int needscan; /* need to rescan data frees */ 138730f712c9SDave Chinner xfs_dir2_data_off_t oldbest; /* old value of best free */ 138830f712c9SDave Chinner struct xfs_dir2_data_free *bf; /* bestfree table */ 138930f712c9SDave Chinner struct xfs_dir2_leaf_entry *ents; 139030f712c9SDave Chinner struct xfs_dir3_icleaf_hdr leafhdr; 139130f712c9SDave Chinner 139230f712c9SDave Chinner trace_xfs_dir2_leaf_removename(args); 139330f712c9SDave Chinner 139430f712c9SDave Chinner /* 139530f712c9SDave Chinner * Lookup the leaf entry, get the leaf and data blocks read in. 139630f712c9SDave Chinner */ 139730f712c9SDave Chinner if ((error = xfs_dir2_leaf_lookup_int(args, &lbp, &index, &dbp))) { 139830f712c9SDave Chinner return error; 139930f712c9SDave Chinner } 140030f712c9SDave Chinner dp = args->dp; 140130f712c9SDave Chinner leaf = lbp->b_addr; 140230f712c9SDave Chinner hdr = dbp->b_addr; 140330f712c9SDave Chinner xfs_dir3_data_check(dp, dbp); 140430f712c9SDave Chinner bf = dp->d_ops->data_bestfree_p(hdr); 140530f712c9SDave Chinner dp->d_ops->leaf_hdr_from_disk(&leafhdr, leaf); 140630f712c9SDave Chinner ents = dp->d_ops->leaf_ents_p(leaf); 140730f712c9SDave Chinner /* 140830f712c9SDave Chinner * Point to the leaf entry, use that to point to the data entry. 140930f712c9SDave Chinner */ 141030f712c9SDave Chinner lep = &ents[index]; 141130f712c9SDave Chinner db = xfs_dir2_dataptr_to_db(args->geo, be32_to_cpu(lep->address)); 141230f712c9SDave Chinner dep = (xfs_dir2_data_entry_t *)((char *)hdr + 141330f712c9SDave Chinner xfs_dir2_dataptr_to_off(args->geo, be32_to_cpu(lep->address))); 141430f712c9SDave Chinner needscan = needlog = 0; 141530f712c9SDave Chinner oldbest = be16_to_cpu(bf[0].length); 141630f712c9SDave Chinner ltp = xfs_dir2_leaf_tail_p(args->geo, leaf); 141730f712c9SDave Chinner bestsp = xfs_dir2_leaf_bests_p(ltp); 14183f883f5bSDarrick J. Wong if (be16_to_cpu(bestsp[db]) != oldbest) 14193f883f5bSDarrick J. Wong return -EFSCORRUPTED; 142030f712c9SDave Chinner /* 142130f712c9SDave Chinner * Mark the former data entry unused. 142230f712c9SDave Chinner */ 142330f712c9SDave Chinner xfs_dir2_data_make_free(args, dbp, 142430f712c9SDave Chinner (xfs_dir2_data_aoff_t)((char *)dep - (char *)hdr), 142530f712c9SDave Chinner dp->d_ops->data_entsize(dep->namelen), &needlog, &needscan); 142630f712c9SDave Chinner /* 142730f712c9SDave Chinner * We just mark the leaf entry stale by putting a null in it. 142830f712c9SDave Chinner */ 142930f712c9SDave Chinner leafhdr.stale++; 143030f712c9SDave Chinner dp->d_ops->leaf_hdr_to_disk(leaf, &leafhdr); 143130f712c9SDave Chinner xfs_dir3_leaf_log_header(args, lbp); 143230f712c9SDave Chinner 143330f712c9SDave Chinner lep->address = cpu_to_be32(XFS_DIR2_NULL_DATAPTR); 143430f712c9SDave Chinner xfs_dir3_leaf_log_ents(args, lbp, index, index); 143530f712c9SDave Chinner 143630f712c9SDave Chinner /* 143730f712c9SDave Chinner * Scan the freespace in the data block again if necessary, 143830f712c9SDave Chinner * log the data block header if necessary. 143930f712c9SDave Chinner */ 144030f712c9SDave Chinner if (needscan) 144130f712c9SDave Chinner xfs_dir2_data_freescan(dp, hdr, &needlog); 144230f712c9SDave Chinner if (needlog) 144330f712c9SDave Chinner xfs_dir2_data_log_header(args, dbp); 144430f712c9SDave Chinner /* 144530f712c9SDave Chinner * If the longest freespace in the data block has changed, 144630f712c9SDave Chinner * put the new value in the bests table and log that. 144730f712c9SDave Chinner */ 144830f712c9SDave Chinner if (be16_to_cpu(bf[0].length) != oldbest) { 144930f712c9SDave Chinner bestsp[db] = bf[0].length; 145030f712c9SDave Chinner xfs_dir3_leaf_log_bests(args, lbp, db, db); 145130f712c9SDave Chinner } 145230f712c9SDave Chinner xfs_dir3_data_check(dp, dbp); 145330f712c9SDave Chinner /* 145430f712c9SDave Chinner * If the data block is now empty then get rid of the data block. 145530f712c9SDave Chinner */ 145630f712c9SDave Chinner if (be16_to_cpu(bf[0].length) == 145730f712c9SDave Chinner args->geo->blksize - dp->d_ops->data_entry_offset) { 145830f712c9SDave Chinner ASSERT(db != args->geo->datablk); 145930f712c9SDave Chinner if ((error = xfs_dir2_shrink_inode(args, db, dbp))) { 146030f712c9SDave Chinner /* 146130f712c9SDave Chinner * Nope, can't get rid of it because it caused 146230f712c9SDave Chinner * allocation of a bmap btree block to do so. 146330f712c9SDave Chinner * Just go on, returning success, leaving the 146430f712c9SDave Chinner * empty block in place. 146530f712c9SDave Chinner */ 14662451337dSDave Chinner if (error == -ENOSPC && args->total == 0) 146730f712c9SDave Chinner error = 0; 146830f712c9SDave Chinner xfs_dir3_leaf_check(dp, lbp); 146930f712c9SDave Chinner return error; 147030f712c9SDave Chinner } 147130f712c9SDave Chinner dbp = NULL; 147230f712c9SDave Chinner /* 147330f712c9SDave Chinner * If this is the last data block then compact the 147430f712c9SDave Chinner * bests table by getting rid of entries. 147530f712c9SDave Chinner */ 147630f712c9SDave Chinner if (db == be32_to_cpu(ltp->bestcount) - 1) { 147730f712c9SDave Chinner /* 147830f712c9SDave Chinner * Look for the last active entry (i). 147930f712c9SDave Chinner */ 148030f712c9SDave Chinner for (i = db - 1; i > 0; i--) { 148130f712c9SDave Chinner if (bestsp[i] != cpu_to_be16(NULLDATAOFF)) 148230f712c9SDave Chinner break; 148330f712c9SDave Chinner } 148430f712c9SDave Chinner /* 148530f712c9SDave Chinner * Copy the table down so inactive entries at the 148630f712c9SDave Chinner * end are removed. 148730f712c9SDave Chinner */ 148830f712c9SDave Chinner memmove(&bestsp[db - i], bestsp, 148930f712c9SDave Chinner (be32_to_cpu(ltp->bestcount) - (db - i)) * sizeof(*bestsp)); 149030f712c9SDave Chinner be32_add_cpu(<p->bestcount, -(db - i)); 149130f712c9SDave Chinner xfs_dir3_leaf_log_tail(args, lbp); 149230f712c9SDave Chinner xfs_dir3_leaf_log_bests(args, lbp, 0, 149330f712c9SDave Chinner be32_to_cpu(ltp->bestcount) - 1); 149430f712c9SDave Chinner } else 149530f712c9SDave Chinner bestsp[db] = cpu_to_be16(NULLDATAOFF); 149630f712c9SDave Chinner } 149730f712c9SDave Chinner /* 149830f712c9SDave Chinner * If the data block was not the first one, drop it. 149930f712c9SDave Chinner */ 150030f712c9SDave Chinner else if (db != args->geo->datablk) 150130f712c9SDave Chinner dbp = NULL; 150230f712c9SDave Chinner 150330f712c9SDave Chinner xfs_dir3_leaf_check(dp, lbp); 150430f712c9SDave Chinner /* 150530f712c9SDave Chinner * See if we can convert to block form. 150630f712c9SDave Chinner */ 150730f712c9SDave Chinner return xfs_dir2_leaf_to_block(args, lbp, dbp); 150830f712c9SDave Chinner } 150930f712c9SDave Chinner 151030f712c9SDave Chinner /* 151130f712c9SDave Chinner * Replace the inode number in a leaf format directory entry. 151230f712c9SDave Chinner */ 151330f712c9SDave Chinner int /* error */ 151430f712c9SDave Chinner xfs_dir2_leaf_replace( 151530f712c9SDave Chinner xfs_da_args_t *args) /* operation arguments */ 151630f712c9SDave Chinner { 151730f712c9SDave Chinner struct xfs_buf *dbp; /* data block buffer */ 151830f712c9SDave Chinner xfs_dir2_data_entry_t *dep; /* data block entry */ 151930f712c9SDave Chinner xfs_inode_t *dp; /* incore directory inode */ 152030f712c9SDave Chinner int error; /* error return code */ 152130f712c9SDave Chinner int index; /* index of leaf entry */ 152230f712c9SDave Chinner struct xfs_buf *lbp; /* leaf buffer */ 152330f712c9SDave Chinner xfs_dir2_leaf_t *leaf; /* leaf structure */ 152430f712c9SDave Chinner xfs_dir2_leaf_entry_t *lep; /* leaf entry */ 152530f712c9SDave Chinner xfs_trans_t *tp; /* transaction pointer */ 152630f712c9SDave Chinner struct xfs_dir2_leaf_entry *ents; 152730f712c9SDave Chinner 152830f712c9SDave Chinner trace_xfs_dir2_leaf_replace(args); 152930f712c9SDave Chinner 153030f712c9SDave Chinner /* 153130f712c9SDave Chinner * Look up the entry. 153230f712c9SDave Chinner */ 153330f712c9SDave Chinner if ((error = xfs_dir2_leaf_lookup_int(args, &lbp, &index, &dbp))) { 153430f712c9SDave Chinner return error; 153530f712c9SDave Chinner } 153630f712c9SDave Chinner dp = args->dp; 153730f712c9SDave Chinner leaf = lbp->b_addr; 153830f712c9SDave Chinner ents = dp->d_ops->leaf_ents_p(leaf); 153930f712c9SDave Chinner /* 154030f712c9SDave Chinner * Point to the leaf entry, get data address from it. 154130f712c9SDave Chinner */ 154230f712c9SDave Chinner lep = &ents[index]; 154330f712c9SDave Chinner /* 154430f712c9SDave Chinner * Point to the data entry. 154530f712c9SDave Chinner */ 154630f712c9SDave Chinner dep = (xfs_dir2_data_entry_t *) 154730f712c9SDave Chinner ((char *)dbp->b_addr + 154830f712c9SDave Chinner xfs_dir2_dataptr_to_off(args->geo, be32_to_cpu(lep->address))); 154930f712c9SDave Chinner ASSERT(args->inumber != be64_to_cpu(dep->inumber)); 155030f712c9SDave Chinner /* 155130f712c9SDave Chinner * Put the new inode number in, log it. 155230f712c9SDave Chinner */ 155330f712c9SDave Chinner dep->inumber = cpu_to_be64(args->inumber); 155430f712c9SDave Chinner dp->d_ops->data_put_ftype(dep, args->filetype); 155530f712c9SDave Chinner tp = args->trans; 155630f712c9SDave Chinner xfs_dir2_data_log_entry(args, dbp, dep); 155730f712c9SDave Chinner xfs_dir3_leaf_check(dp, lbp); 155830f712c9SDave Chinner xfs_trans_brelse(tp, lbp); 155930f712c9SDave Chinner return 0; 156030f712c9SDave Chinner } 156130f712c9SDave Chinner 156230f712c9SDave Chinner /* 156330f712c9SDave Chinner * Return index in the leaf block (lbp) which is either the first 156430f712c9SDave Chinner * one with this hash value, or if there are none, the insert point 156530f712c9SDave Chinner * for that hash value. 156630f712c9SDave Chinner */ 156730f712c9SDave Chinner int /* index value */ 156830f712c9SDave Chinner xfs_dir2_leaf_search_hash( 156930f712c9SDave Chinner xfs_da_args_t *args, /* operation arguments */ 157030f712c9SDave Chinner struct xfs_buf *lbp) /* leaf buffer */ 157130f712c9SDave Chinner { 157230f712c9SDave Chinner xfs_dahash_t hash=0; /* hash from this entry */ 157330f712c9SDave Chinner xfs_dahash_t hashwant; /* hash value looking for */ 157430f712c9SDave Chinner int high; /* high leaf index */ 157530f712c9SDave Chinner int low; /* low leaf index */ 157630f712c9SDave Chinner xfs_dir2_leaf_t *leaf; /* leaf structure */ 157730f712c9SDave Chinner xfs_dir2_leaf_entry_t *lep; /* leaf entry */ 157830f712c9SDave Chinner int mid=0; /* current leaf index */ 157930f712c9SDave Chinner struct xfs_dir2_leaf_entry *ents; 158030f712c9SDave Chinner struct xfs_dir3_icleaf_hdr leafhdr; 158130f712c9SDave Chinner 158230f712c9SDave Chinner leaf = lbp->b_addr; 158330f712c9SDave Chinner ents = args->dp->d_ops->leaf_ents_p(leaf); 158430f712c9SDave Chinner args->dp->d_ops->leaf_hdr_from_disk(&leafhdr, leaf); 158530f712c9SDave Chinner 158630f712c9SDave Chinner /* 158730f712c9SDave Chinner * Note, the table cannot be empty, so we have to go through the loop. 158830f712c9SDave Chinner * Binary search the leaf entries looking for our hash value. 158930f712c9SDave Chinner */ 159030f712c9SDave Chinner for (lep = ents, low = 0, high = leafhdr.count - 1, 159130f712c9SDave Chinner hashwant = args->hashval; 159230f712c9SDave Chinner low <= high; ) { 159330f712c9SDave Chinner mid = (low + high) >> 1; 159430f712c9SDave Chinner if ((hash = be32_to_cpu(lep[mid].hashval)) == hashwant) 159530f712c9SDave Chinner break; 159630f712c9SDave Chinner if (hash < hashwant) 159730f712c9SDave Chinner low = mid + 1; 159830f712c9SDave Chinner else 159930f712c9SDave Chinner high = mid - 1; 160030f712c9SDave Chinner } 160130f712c9SDave Chinner /* 160230f712c9SDave Chinner * Found one, back up through all the equal hash values. 160330f712c9SDave Chinner */ 160430f712c9SDave Chinner if (hash == hashwant) { 160530f712c9SDave Chinner while (mid > 0 && be32_to_cpu(lep[mid - 1].hashval) == hashwant) { 160630f712c9SDave Chinner mid--; 160730f712c9SDave Chinner } 160830f712c9SDave Chinner } 160930f712c9SDave Chinner /* 161030f712c9SDave Chinner * Need to point to an entry higher than ours. 161130f712c9SDave Chinner */ 161230f712c9SDave Chinner else if (hash < hashwant) 161330f712c9SDave Chinner mid++; 161430f712c9SDave Chinner return mid; 161530f712c9SDave Chinner } 161630f712c9SDave Chinner 161730f712c9SDave Chinner /* 161830f712c9SDave Chinner * Trim off a trailing data block. We know it's empty since the leaf 161930f712c9SDave Chinner * freespace table says so. 162030f712c9SDave Chinner */ 162130f712c9SDave Chinner int /* error */ 162230f712c9SDave Chinner xfs_dir2_leaf_trim_data( 162330f712c9SDave Chinner xfs_da_args_t *args, /* operation arguments */ 162430f712c9SDave Chinner struct xfs_buf *lbp, /* leaf buffer */ 162530f712c9SDave Chinner xfs_dir2_db_t db) /* data block number */ 162630f712c9SDave Chinner { 162730f712c9SDave Chinner __be16 *bestsp; /* leaf bests table */ 162830f712c9SDave Chinner struct xfs_buf *dbp; /* data block buffer */ 162930f712c9SDave Chinner xfs_inode_t *dp; /* incore directory inode */ 163030f712c9SDave Chinner int error; /* error return value */ 163130f712c9SDave Chinner xfs_dir2_leaf_t *leaf; /* leaf structure */ 163230f712c9SDave Chinner xfs_dir2_leaf_tail_t *ltp; /* leaf tail structure */ 163330f712c9SDave Chinner xfs_trans_t *tp; /* transaction pointer */ 163430f712c9SDave Chinner 163530f712c9SDave Chinner dp = args->dp; 163630f712c9SDave Chinner tp = args->trans; 163730f712c9SDave Chinner /* 163830f712c9SDave Chinner * Read the offending data block. We need its buffer. 163930f712c9SDave Chinner */ 164030f712c9SDave Chinner error = xfs_dir3_data_read(tp, dp, xfs_dir2_db_to_da(args->geo, db), 164130f712c9SDave Chinner -1, &dbp); 164230f712c9SDave Chinner if (error) 164330f712c9SDave Chinner return error; 164430f712c9SDave Chinner 164530f712c9SDave Chinner leaf = lbp->b_addr; 164630f712c9SDave Chinner ltp = xfs_dir2_leaf_tail_p(args->geo, leaf); 164730f712c9SDave Chinner 164830f712c9SDave Chinner #ifdef DEBUG 164930f712c9SDave Chinner { 165030f712c9SDave Chinner struct xfs_dir2_data_hdr *hdr = dbp->b_addr; 165130f712c9SDave Chinner struct xfs_dir2_data_free *bf = dp->d_ops->data_bestfree_p(hdr); 165230f712c9SDave Chinner 165330f712c9SDave Chinner ASSERT(hdr->magic == cpu_to_be32(XFS_DIR2_DATA_MAGIC) || 165430f712c9SDave Chinner hdr->magic == cpu_to_be32(XFS_DIR3_DATA_MAGIC)); 165530f712c9SDave Chinner ASSERT(be16_to_cpu(bf[0].length) == 165630f712c9SDave Chinner args->geo->blksize - dp->d_ops->data_entry_offset); 165730f712c9SDave Chinner ASSERT(db == be32_to_cpu(ltp->bestcount) - 1); 165830f712c9SDave Chinner } 165930f712c9SDave Chinner #endif 166030f712c9SDave Chinner 166130f712c9SDave Chinner /* 166230f712c9SDave Chinner * Get rid of the data block. 166330f712c9SDave Chinner */ 166430f712c9SDave Chinner if ((error = xfs_dir2_shrink_inode(args, db, dbp))) { 16652451337dSDave Chinner ASSERT(error != -ENOSPC); 166630f712c9SDave Chinner xfs_trans_brelse(tp, dbp); 166730f712c9SDave Chinner return error; 166830f712c9SDave Chinner } 166930f712c9SDave Chinner /* 167030f712c9SDave Chinner * Eliminate the last bests entry from the table. 167130f712c9SDave Chinner */ 167230f712c9SDave Chinner bestsp = xfs_dir2_leaf_bests_p(ltp); 167330f712c9SDave Chinner be32_add_cpu(<p->bestcount, -1); 167430f712c9SDave Chinner memmove(&bestsp[1], &bestsp[0], be32_to_cpu(ltp->bestcount) * sizeof(*bestsp)); 167530f712c9SDave Chinner xfs_dir3_leaf_log_tail(args, lbp); 167630f712c9SDave Chinner xfs_dir3_leaf_log_bests(args, lbp, 0, be32_to_cpu(ltp->bestcount) - 1); 167730f712c9SDave Chinner return 0; 167830f712c9SDave Chinner } 167930f712c9SDave Chinner 168030f712c9SDave Chinner static inline size_t 168130f712c9SDave Chinner xfs_dir3_leaf_size( 168230f712c9SDave Chinner struct xfs_dir3_icleaf_hdr *hdr, 168330f712c9SDave Chinner int counts) 168430f712c9SDave Chinner { 168530f712c9SDave Chinner int entries; 168630f712c9SDave Chinner int hdrsize; 168730f712c9SDave Chinner 168830f712c9SDave Chinner entries = hdr->count - hdr->stale; 168930f712c9SDave Chinner if (hdr->magic == XFS_DIR2_LEAF1_MAGIC || 169030f712c9SDave Chinner hdr->magic == XFS_DIR2_LEAFN_MAGIC) 169130f712c9SDave Chinner hdrsize = sizeof(struct xfs_dir2_leaf_hdr); 169230f712c9SDave Chinner else 169330f712c9SDave Chinner hdrsize = sizeof(struct xfs_dir3_leaf_hdr); 169430f712c9SDave Chinner 169530f712c9SDave Chinner return hdrsize + entries * sizeof(xfs_dir2_leaf_entry_t) 169630f712c9SDave Chinner + counts * sizeof(xfs_dir2_data_off_t) 169730f712c9SDave Chinner + sizeof(xfs_dir2_leaf_tail_t); 169830f712c9SDave Chinner } 169930f712c9SDave Chinner 170030f712c9SDave Chinner /* 170130f712c9SDave Chinner * Convert node form directory to leaf form directory. 170230f712c9SDave Chinner * The root of the node form dir needs to already be a LEAFN block. 170330f712c9SDave Chinner * Just return if we can't do anything. 170430f712c9SDave Chinner */ 170530f712c9SDave Chinner int /* error */ 170630f712c9SDave Chinner xfs_dir2_node_to_leaf( 170730f712c9SDave Chinner xfs_da_state_t *state) /* directory operation state */ 170830f712c9SDave Chinner { 170930f712c9SDave Chinner xfs_da_args_t *args; /* operation arguments */ 171030f712c9SDave Chinner xfs_inode_t *dp; /* incore directory inode */ 171130f712c9SDave Chinner int error; /* error return code */ 171230f712c9SDave Chinner struct xfs_buf *fbp; /* buffer for freespace block */ 171330f712c9SDave Chinner xfs_fileoff_t fo; /* freespace file offset */ 171430f712c9SDave Chinner xfs_dir2_free_t *free; /* freespace structure */ 171530f712c9SDave Chinner struct xfs_buf *lbp; /* buffer for leaf block */ 171630f712c9SDave Chinner xfs_dir2_leaf_tail_t *ltp; /* tail of leaf structure */ 171730f712c9SDave Chinner xfs_dir2_leaf_t *leaf; /* leaf structure */ 171830f712c9SDave Chinner xfs_mount_t *mp; /* filesystem mount point */ 171930f712c9SDave Chinner int rval; /* successful free trim? */ 172030f712c9SDave Chinner xfs_trans_t *tp; /* transaction pointer */ 172130f712c9SDave Chinner struct xfs_dir3_icleaf_hdr leafhdr; 172230f712c9SDave Chinner struct xfs_dir3_icfree_hdr freehdr; 172330f712c9SDave Chinner 172430f712c9SDave Chinner /* 172530f712c9SDave Chinner * There's more than a leaf level in the btree, so there must 172630f712c9SDave Chinner * be multiple leafn blocks. Give up. 172730f712c9SDave Chinner */ 172830f712c9SDave Chinner if (state->path.active > 1) 172930f712c9SDave Chinner return 0; 173030f712c9SDave Chinner args = state->args; 173130f712c9SDave Chinner 173230f712c9SDave Chinner trace_xfs_dir2_node_to_leaf(args); 173330f712c9SDave Chinner 173430f712c9SDave Chinner mp = state->mp; 173530f712c9SDave Chinner dp = args->dp; 173630f712c9SDave Chinner tp = args->trans; 173730f712c9SDave Chinner /* 173830f712c9SDave Chinner * Get the last offset in the file. 173930f712c9SDave Chinner */ 174030f712c9SDave Chinner if ((error = xfs_bmap_last_offset(dp, &fo, XFS_DATA_FORK))) { 174130f712c9SDave Chinner return error; 174230f712c9SDave Chinner } 174330f712c9SDave Chinner fo -= args->geo->fsbcount; 174430f712c9SDave Chinner /* 174530f712c9SDave Chinner * If there are freespace blocks other than the first one, 174630f712c9SDave Chinner * take this opportunity to remove trailing empty freespace blocks 174730f712c9SDave Chinner * that may have been left behind during no-space-reservation 174830f712c9SDave Chinner * operations. 174930f712c9SDave Chinner */ 175030f712c9SDave Chinner while (fo > args->geo->freeblk) { 175130f712c9SDave Chinner if ((error = xfs_dir2_node_trim_free(args, fo, &rval))) { 175230f712c9SDave Chinner return error; 175330f712c9SDave Chinner } 175430f712c9SDave Chinner if (rval) 175530f712c9SDave Chinner fo -= args->geo->fsbcount; 175630f712c9SDave Chinner else 175730f712c9SDave Chinner return 0; 175830f712c9SDave Chinner } 175930f712c9SDave Chinner /* 176030f712c9SDave Chinner * Now find the block just before the freespace block. 176130f712c9SDave Chinner */ 176230f712c9SDave Chinner if ((error = xfs_bmap_last_before(tp, dp, &fo, XFS_DATA_FORK))) { 176330f712c9SDave Chinner return error; 176430f712c9SDave Chinner } 176530f712c9SDave Chinner /* 176630f712c9SDave Chinner * If it's not the single leaf block, give up. 176730f712c9SDave Chinner */ 176830f712c9SDave Chinner if (XFS_FSB_TO_B(mp, fo) > XFS_DIR2_LEAF_OFFSET + args->geo->blksize) 176930f712c9SDave Chinner return 0; 177030f712c9SDave Chinner lbp = state->path.blk[0].bp; 177130f712c9SDave Chinner leaf = lbp->b_addr; 177230f712c9SDave Chinner dp->d_ops->leaf_hdr_from_disk(&leafhdr, leaf); 177330f712c9SDave Chinner 177430f712c9SDave Chinner ASSERT(leafhdr.magic == XFS_DIR2_LEAFN_MAGIC || 177530f712c9SDave Chinner leafhdr.magic == XFS_DIR3_LEAFN_MAGIC); 177630f712c9SDave Chinner 177730f712c9SDave Chinner /* 177830f712c9SDave Chinner * Read the freespace block. 177930f712c9SDave Chinner */ 178030f712c9SDave Chinner error = xfs_dir2_free_read(tp, dp, args->geo->freeblk, &fbp); 178130f712c9SDave Chinner if (error) 178230f712c9SDave Chinner return error; 178330f712c9SDave Chinner free = fbp->b_addr; 178430f712c9SDave Chinner dp->d_ops->free_hdr_from_disk(&freehdr, free); 178530f712c9SDave Chinner 178630f712c9SDave Chinner ASSERT(!freehdr.firstdb); 178730f712c9SDave Chinner 178830f712c9SDave Chinner /* 178930f712c9SDave Chinner * Now see if the leafn and free data will fit in a leaf1. 179030f712c9SDave Chinner * If not, release the buffer and give up. 179130f712c9SDave Chinner */ 179230f712c9SDave Chinner if (xfs_dir3_leaf_size(&leafhdr, freehdr.nvalid) > args->geo->blksize) { 179330f712c9SDave Chinner xfs_trans_brelse(tp, fbp); 179430f712c9SDave Chinner return 0; 179530f712c9SDave Chinner } 179630f712c9SDave Chinner 179730f712c9SDave Chinner /* 179830f712c9SDave Chinner * If the leaf has any stale entries in it, compress them out. 179930f712c9SDave Chinner */ 180030f712c9SDave Chinner if (leafhdr.stale) 180130f712c9SDave Chinner xfs_dir3_leaf_compact(args, &leafhdr, lbp); 180230f712c9SDave Chinner 180330f712c9SDave Chinner lbp->b_ops = &xfs_dir3_leaf1_buf_ops; 180430f712c9SDave Chinner xfs_trans_buf_set_type(tp, lbp, XFS_BLFT_DIR_LEAF1_BUF); 180530f712c9SDave Chinner leafhdr.magic = (leafhdr.magic == XFS_DIR2_LEAFN_MAGIC) 180630f712c9SDave Chinner ? XFS_DIR2_LEAF1_MAGIC 180730f712c9SDave Chinner : XFS_DIR3_LEAF1_MAGIC; 180830f712c9SDave Chinner 180930f712c9SDave Chinner /* 181030f712c9SDave Chinner * Set up the leaf tail from the freespace block. 181130f712c9SDave Chinner */ 181230f712c9SDave Chinner ltp = xfs_dir2_leaf_tail_p(args->geo, leaf); 181330f712c9SDave Chinner ltp->bestcount = cpu_to_be32(freehdr.nvalid); 181430f712c9SDave Chinner 181530f712c9SDave Chinner /* 181630f712c9SDave Chinner * Set up the leaf bests table. 181730f712c9SDave Chinner */ 181830f712c9SDave Chinner memcpy(xfs_dir2_leaf_bests_p(ltp), dp->d_ops->free_bests_p(free), 181930f712c9SDave Chinner freehdr.nvalid * sizeof(xfs_dir2_data_off_t)); 182030f712c9SDave Chinner 182130f712c9SDave Chinner dp->d_ops->leaf_hdr_to_disk(leaf, &leafhdr); 182230f712c9SDave Chinner xfs_dir3_leaf_log_header(args, lbp); 182330f712c9SDave Chinner xfs_dir3_leaf_log_bests(args, lbp, 0, be32_to_cpu(ltp->bestcount) - 1); 182430f712c9SDave Chinner xfs_dir3_leaf_log_tail(args, lbp); 182530f712c9SDave Chinner xfs_dir3_leaf_check(dp, lbp); 182630f712c9SDave Chinner 182730f712c9SDave Chinner /* 182830f712c9SDave Chinner * Get rid of the freespace block. 182930f712c9SDave Chinner */ 183030f712c9SDave Chinner error = xfs_dir2_shrink_inode(args, 183130f712c9SDave Chinner xfs_dir2_byte_to_db(args->geo, XFS_DIR2_FREE_OFFSET), 183230f712c9SDave Chinner fbp); 183330f712c9SDave Chinner if (error) { 183430f712c9SDave Chinner /* 183530f712c9SDave Chinner * This can't fail here because it can only happen when 183630f712c9SDave Chinner * punching out the middle of an extent, and this is an 183730f712c9SDave Chinner * isolated block. 183830f712c9SDave Chinner */ 18392451337dSDave Chinner ASSERT(error != -ENOSPC); 184030f712c9SDave Chinner return error; 184130f712c9SDave Chinner } 184230f712c9SDave Chinner fbp = NULL; 184330f712c9SDave Chinner /* 184430f712c9SDave Chinner * Now see if we can convert the single-leaf directory 184530f712c9SDave Chinner * down to a block form directory. 184630f712c9SDave Chinner * This routine always kills the dabuf for the leaf, so 184730f712c9SDave Chinner * eliminate it from the path. 184830f712c9SDave Chinner */ 184930f712c9SDave Chinner error = xfs_dir2_leaf_to_block(args, lbp, NULL); 185030f712c9SDave Chinner state->path.blk[0].bp = NULL; 185130f712c9SDave Chinner return error; 185230f712c9SDave Chinner } 1853