xref: /openbmc/linux/fs/xfs/libxfs/xfs_dir2_node.c (revision b55725974c9d3a5afcdf83daff6fba7d3f91ffca)
130f712c9SDave Chinner /*
230f712c9SDave Chinner  * Copyright (c) 2000-2005 Silicon Graphics, Inc.
330f712c9SDave Chinner  * Copyright (c) 2013 Red Hat, Inc.
430f712c9SDave Chinner  * All Rights Reserved.
530f712c9SDave Chinner  *
630f712c9SDave Chinner  * This program is free software; you can redistribute it and/or
730f712c9SDave Chinner  * modify it under the terms of the GNU General Public License as
830f712c9SDave Chinner  * published by the Free Software Foundation.
930f712c9SDave Chinner  *
1030f712c9SDave Chinner  * This program is distributed in the hope that it would be useful,
1130f712c9SDave Chinner  * but WITHOUT ANY WARRANTY; without even the implied warranty of
1230f712c9SDave Chinner  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
1330f712c9SDave Chinner  * GNU General Public License for more details.
1430f712c9SDave Chinner  *
1530f712c9SDave Chinner  * You should have received a copy of the GNU General Public License
1630f712c9SDave Chinner  * along with this program; if not, write the Free Software Foundation,
1730f712c9SDave Chinner  * Inc.,  51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
1830f712c9SDave Chinner  */
1930f712c9SDave Chinner #include "xfs.h"
2030f712c9SDave Chinner #include "xfs_fs.h"
2130f712c9SDave Chinner #include "xfs_format.h"
2230f712c9SDave Chinner #include "xfs_log_format.h"
2330f712c9SDave Chinner #include "xfs_trans_resv.h"
2430f712c9SDave Chinner #include "xfs_mount.h"
2530f712c9SDave Chinner #include "xfs_da_format.h"
2630f712c9SDave Chinner #include "xfs_da_btree.h"
2730f712c9SDave Chinner #include "xfs_inode.h"
2830f712c9SDave Chinner #include "xfs_bmap.h"
2930f712c9SDave Chinner #include "xfs_dir2.h"
3030f712c9SDave Chinner #include "xfs_dir2_priv.h"
3130f712c9SDave Chinner #include "xfs_error.h"
3230f712c9SDave Chinner #include "xfs_trace.h"
3330f712c9SDave Chinner #include "xfs_trans.h"
3430f712c9SDave Chinner #include "xfs_buf_item.h"
3530f712c9SDave Chinner #include "xfs_cksum.h"
36a45086e2SBrian Foster #include "xfs_log.h"
3730f712c9SDave Chinner 
3830f712c9SDave Chinner /*
3930f712c9SDave Chinner  * Function declarations.
4030f712c9SDave Chinner  */
4130f712c9SDave Chinner static int xfs_dir2_leafn_add(struct xfs_buf *bp, xfs_da_args_t *args,
4230f712c9SDave Chinner 			      int index);
4330f712c9SDave Chinner static void xfs_dir2_leafn_rebalance(xfs_da_state_t *state,
4430f712c9SDave Chinner 				     xfs_da_state_blk_t *blk1,
4530f712c9SDave Chinner 				     xfs_da_state_blk_t *blk2);
4630f712c9SDave Chinner static int xfs_dir2_leafn_remove(xfs_da_args_t *args, struct xfs_buf *bp,
4730f712c9SDave Chinner 				 int index, xfs_da_state_blk_t *dblk,
4830f712c9SDave Chinner 				 int *rval);
4930f712c9SDave Chinner static int xfs_dir2_node_addname_int(xfs_da_args_t *args,
5030f712c9SDave Chinner 				     xfs_da_state_blk_t *fblk);
5130f712c9SDave Chinner 
5230f712c9SDave Chinner /*
5330f712c9SDave Chinner  * Check internal consistency of a leafn block.
5430f712c9SDave Chinner  */
5530f712c9SDave Chinner #ifdef DEBUG
56a6a781a5SDarrick J. Wong static xfs_failaddr_t
5730f712c9SDave Chinner xfs_dir3_leafn_check(
5830f712c9SDave Chinner 	struct xfs_inode	*dp,
5930f712c9SDave Chinner 	struct xfs_buf		*bp)
6030f712c9SDave Chinner {
6130f712c9SDave Chinner 	struct xfs_dir2_leaf	*leaf = bp->b_addr;
6230f712c9SDave Chinner 	struct xfs_dir3_icleaf_hdr leafhdr;
6330f712c9SDave Chinner 
6430f712c9SDave Chinner 	dp->d_ops->leaf_hdr_from_disk(&leafhdr, leaf);
6530f712c9SDave Chinner 
6630f712c9SDave Chinner 	if (leafhdr.magic == XFS_DIR3_LEAFN_MAGIC) {
6730f712c9SDave Chinner 		struct xfs_dir3_leaf_hdr *leaf3 = bp->b_addr;
6830f712c9SDave Chinner 		if (be64_to_cpu(leaf3->info.blkno) != bp->b_bn)
69a6a781a5SDarrick J. Wong 			return __this_address;
7030f712c9SDave Chinner 	} else if (leafhdr.magic != XFS_DIR2_LEAFN_MAGIC)
71a6a781a5SDarrick J. Wong 		return __this_address;
7230f712c9SDave Chinner 
7330f712c9SDave Chinner 	return xfs_dir3_leaf_check_int(dp->i_mount, dp, &leafhdr, leaf);
7430f712c9SDave Chinner }
75a6a781a5SDarrick J. Wong 
76a6a781a5SDarrick J. Wong static inline void
77a6a781a5SDarrick J. Wong xfs_dir3_leaf_check(
78a6a781a5SDarrick J. Wong 	struct xfs_inode	*dp,
79a6a781a5SDarrick J. Wong 	struct xfs_buf		*bp)
80a6a781a5SDarrick J. Wong {
81a6a781a5SDarrick J. Wong 	xfs_failaddr_t		fa;
82a6a781a5SDarrick J. Wong 
83a6a781a5SDarrick J. Wong 	fa = xfs_dir3_leafn_check(dp, bp);
84a6a781a5SDarrick J. Wong 	if (!fa)
85a6a781a5SDarrick J. Wong 		return;
86a6a781a5SDarrick J. Wong 	xfs_corruption_error(__func__, XFS_ERRLEVEL_LOW, dp->i_mount,
87a6a781a5SDarrick J. Wong 			bp->b_addr, __FILE__, __LINE__, fa);
88a6a781a5SDarrick J. Wong 	ASSERT(0);
89a6a781a5SDarrick J. Wong }
9030f712c9SDave Chinner #else
9130f712c9SDave Chinner #define	xfs_dir3_leaf_check(dp, bp)
9230f712c9SDave Chinner #endif
9330f712c9SDave Chinner 
94a6a781a5SDarrick J. Wong static xfs_failaddr_t
9530f712c9SDave Chinner xfs_dir3_free_verify(
9630f712c9SDave Chinner 	struct xfs_buf		*bp)
9730f712c9SDave Chinner {
9830f712c9SDave Chinner 	struct xfs_mount	*mp = bp->b_target->bt_mount;
9930f712c9SDave Chinner 	struct xfs_dir2_free_hdr *hdr = bp->b_addr;
10030f712c9SDave Chinner 
10130f712c9SDave Chinner 	if (xfs_sb_version_hascrc(&mp->m_sb)) {
10230f712c9SDave Chinner 		struct xfs_dir3_blk_hdr *hdr3 = bp->b_addr;
10330f712c9SDave Chinner 
10430f712c9SDave Chinner 		if (hdr3->magic != cpu_to_be32(XFS_DIR3_FREE_MAGIC))
105a6a781a5SDarrick J. Wong 			return __this_address;
106ce748eaaSEric Sandeen 		if (!uuid_equal(&hdr3->uuid, &mp->m_sb.sb_meta_uuid))
107a6a781a5SDarrick J. Wong 			return __this_address;
10830f712c9SDave Chinner 		if (be64_to_cpu(hdr3->blkno) != bp->b_bn)
109a6a781a5SDarrick J. Wong 			return __this_address;
110a45086e2SBrian Foster 		if (!xfs_log_check_lsn(mp, be64_to_cpu(hdr3->lsn)))
111a6a781a5SDarrick J. Wong 			return __this_address;
11230f712c9SDave Chinner 	} else {
11330f712c9SDave Chinner 		if (hdr->magic != cpu_to_be32(XFS_DIR2_FREE_MAGIC))
114a6a781a5SDarrick J. Wong 			return __this_address;
11530f712c9SDave Chinner 	}
11630f712c9SDave Chinner 
11730f712c9SDave Chinner 	/* XXX: should bounds check the xfs_dir3_icfree_hdr here */
11830f712c9SDave Chinner 
119a6a781a5SDarrick J. Wong 	return NULL;
12030f712c9SDave Chinner }
12130f712c9SDave Chinner 
12230f712c9SDave Chinner static void
12330f712c9SDave Chinner xfs_dir3_free_read_verify(
12430f712c9SDave Chinner 	struct xfs_buf	*bp)
12530f712c9SDave Chinner {
12630f712c9SDave Chinner 	struct xfs_mount	*mp = bp->b_target->bt_mount;
127bc1a09b8SDarrick J. Wong 	xfs_failaddr_t		fa;
12830f712c9SDave Chinner 
12930f712c9SDave Chinner 	if (xfs_sb_version_hascrc(&mp->m_sb) &&
13030f712c9SDave Chinner 	    !xfs_buf_verify_cksum(bp, XFS_DIR3_FREE_CRC_OFF))
131bc1a09b8SDarrick J. Wong 		xfs_verifier_error(bp, -EFSBADCRC, __this_address);
132bc1a09b8SDarrick J. Wong 	else {
133bc1a09b8SDarrick J. Wong 		fa = xfs_dir3_free_verify(bp);
134bc1a09b8SDarrick J. Wong 		if (fa)
135bc1a09b8SDarrick J. Wong 			xfs_verifier_error(bp, -EFSCORRUPTED, fa);
136bc1a09b8SDarrick J. Wong 	}
13730f712c9SDave Chinner }
13830f712c9SDave Chinner 
13930f712c9SDave Chinner static void
14030f712c9SDave Chinner xfs_dir3_free_write_verify(
14130f712c9SDave Chinner 	struct xfs_buf	*bp)
14230f712c9SDave Chinner {
14330f712c9SDave Chinner 	struct xfs_mount	*mp = bp->b_target->bt_mount;
14430f712c9SDave Chinner 	struct xfs_buf_log_item	*bip = bp->b_fspriv;
14530f712c9SDave Chinner 	struct xfs_dir3_blk_hdr	*hdr3 = bp->b_addr;
146bc1a09b8SDarrick J. Wong 	xfs_failaddr_t		fa;
14730f712c9SDave Chinner 
148bc1a09b8SDarrick J. Wong 	fa = xfs_dir3_free_verify(bp);
149bc1a09b8SDarrick J. Wong 	if (fa) {
150bc1a09b8SDarrick J. Wong 		xfs_verifier_error(bp, -EFSCORRUPTED, fa);
15130f712c9SDave Chinner 		return;
15230f712c9SDave Chinner 	}
15330f712c9SDave Chinner 
15430f712c9SDave Chinner 	if (!xfs_sb_version_hascrc(&mp->m_sb))
15530f712c9SDave Chinner 		return;
15630f712c9SDave Chinner 
15730f712c9SDave Chinner 	if (bip)
15830f712c9SDave Chinner 		hdr3->lsn = cpu_to_be64(bip->bli_item.li_lsn);
15930f712c9SDave Chinner 
16030f712c9SDave Chinner 	xfs_buf_update_cksum(bp, XFS_DIR3_FREE_CRC_OFF);
16130f712c9SDave Chinner }
16230f712c9SDave Chinner 
16330f712c9SDave Chinner const struct xfs_buf_ops xfs_dir3_free_buf_ops = {
164233135b7SEric Sandeen 	.name = "xfs_dir3_free",
16530f712c9SDave Chinner 	.verify_read = xfs_dir3_free_read_verify,
16630f712c9SDave Chinner 	.verify_write = xfs_dir3_free_write_verify,
167*b5572597SDarrick J. Wong 	.verify_struct = xfs_dir3_free_verify,
16830f712c9SDave Chinner };
16930f712c9SDave Chinner 
170de14c5f5SDarrick J. Wong /* Everything ok in the free block header? */
171bc1a09b8SDarrick J. Wong static xfs_failaddr_t
172de14c5f5SDarrick J. Wong xfs_dir3_free_header_check(
173de14c5f5SDarrick J. Wong 	struct xfs_inode	*dp,
174de14c5f5SDarrick J. Wong 	xfs_dablk_t		fbno,
175de14c5f5SDarrick J. Wong 	struct xfs_buf		*bp)
176de14c5f5SDarrick J. Wong {
177de14c5f5SDarrick J. Wong 	struct xfs_mount	*mp = dp->i_mount;
178de14c5f5SDarrick J. Wong 	unsigned int		firstdb;
179de14c5f5SDarrick J. Wong 	int			maxbests;
180de14c5f5SDarrick J. Wong 
181de14c5f5SDarrick J. Wong 	maxbests = dp->d_ops->free_max_bests(mp->m_dir_geo);
182de14c5f5SDarrick J. Wong 	firstdb = (xfs_dir2_da_to_db(mp->m_dir_geo, fbno) -
183de14c5f5SDarrick J. Wong 		   xfs_dir2_byte_to_db(mp->m_dir_geo, XFS_DIR2_FREE_OFFSET)) *
184de14c5f5SDarrick J. Wong 			maxbests;
185de14c5f5SDarrick J. Wong 	if (xfs_sb_version_hascrc(&mp->m_sb)) {
186de14c5f5SDarrick J. Wong 		struct xfs_dir3_free_hdr *hdr3 = bp->b_addr;
187de14c5f5SDarrick J. Wong 
188de14c5f5SDarrick J. Wong 		if (be32_to_cpu(hdr3->firstdb) != firstdb)
189a6a781a5SDarrick J. Wong 			return __this_address;
190de14c5f5SDarrick J. Wong 		if (be32_to_cpu(hdr3->nvalid) > maxbests)
191a6a781a5SDarrick J. Wong 			return __this_address;
192de14c5f5SDarrick J. Wong 		if (be32_to_cpu(hdr3->nvalid) < be32_to_cpu(hdr3->nused))
193a6a781a5SDarrick J. Wong 			return __this_address;
194de14c5f5SDarrick J. Wong 	} else {
195de14c5f5SDarrick J. Wong 		struct xfs_dir2_free_hdr *hdr = bp->b_addr;
196de14c5f5SDarrick J. Wong 
197de14c5f5SDarrick J. Wong 		if (be32_to_cpu(hdr->firstdb) != firstdb)
198a6a781a5SDarrick J. Wong 			return __this_address;
199de14c5f5SDarrick J. Wong 		if (be32_to_cpu(hdr->nvalid) > maxbests)
200a6a781a5SDarrick J. Wong 			return __this_address;
201de14c5f5SDarrick J. Wong 		if (be32_to_cpu(hdr->nvalid) < be32_to_cpu(hdr->nused))
202a6a781a5SDarrick J. Wong 			return __this_address;
203de14c5f5SDarrick J. Wong 	}
204a6a781a5SDarrick J. Wong 	return NULL;
205de14c5f5SDarrick J. Wong }
20630f712c9SDave Chinner 
20730f712c9SDave Chinner static int
20830f712c9SDave Chinner __xfs_dir3_free_read(
20930f712c9SDave Chinner 	struct xfs_trans	*tp,
21030f712c9SDave Chinner 	struct xfs_inode	*dp,
21130f712c9SDave Chinner 	xfs_dablk_t		fbno,
21230f712c9SDave Chinner 	xfs_daddr_t		mappedbno,
21330f712c9SDave Chinner 	struct xfs_buf		**bpp)
21430f712c9SDave Chinner {
215bc1a09b8SDarrick J. Wong 	xfs_failaddr_t		fa;
21630f712c9SDave Chinner 	int			err;
21730f712c9SDave Chinner 
21830f712c9SDave Chinner 	err = xfs_da_read_buf(tp, dp, fbno, mappedbno, bpp,
21930f712c9SDave Chinner 				XFS_DATA_FORK, &xfs_dir3_free_buf_ops);
220de14c5f5SDarrick J. Wong 	if (err || !*bpp)
221de14c5f5SDarrick J. Wong 		return err;
222de14c5f5SDarrick J. Wong 
223de14c5f5SDarrick J. Wong 	/* Check things that we can't do in the verifier. */
224bc1a09b8SDarrick J. Wong 	fa = xfs_dir3_free_header_check(dp, fbno, *bpp);
225bc1a09b8SDarrick J. Wong 	if (fa) {
226bc1a09b8SDarrick J. Wong 		xfs_verifier_error(*bpp, -EFSCORRUPTED, fa);
227de14c5f5SDarrick J. Wong 		xfs_trans_brelse(tp, *bpp);
228de14c5f5SDarrick J. Wong 		return -EFSCORRUPTED;
229de14c5f5SDarrick J. Wong 	}
23030f712c9SDave Chinner 
23130f712c9SDave Chinner 	/* try read returns without an error or *bpp if it lands in a hole */
232de14c5f5SDarrick J. Wong 	if (tp)
23330f712c9SDave Chinner 		xfs_trans_buf_set_type(tp, *bpp, XFS_BLFT_DIR_FREE_BUF);
234de14c5f5SDarrick J. Wong 
235de14c5f5SDarrick J. Wong 	return 0;
23630f712c9SDave Chinner }
23730f712c9SDave Chinner 
23830f712c9SDave Chinner int
23930f712c9SDave Chinner xfs_dir2_free_read(
24030f712c9SDave Chinner 	struct xfs_trans	*tp,
24130f712c9SDave Chinner 	struct xfs_inode	*dp,
24230f712c9SDave Chinner 	xfs_dablk_t		fbno,
24330f712c9SDave Chinner 	struct xfs_buf		**bpp)
24430f712c9SDave Chinner {
24530f712c9SDave Chinner 	return __xfs_dir3_free_read(tp, dp, fbno, -1, bpp);
24630f712c9SDave Chinner }
24730f712c9SDave Chinner 
24830f712c9SDave Chinner static int
24930f712c9SDave Chinner xfs_dir2_free_try_read(
25030f712c9SDave Chinner 	struct xfs_trans	*tp,
25130f712c9SDave Chinner 	struct xfs_inode	*dp,
25230f712c9SDave Chinner 	xfs_dablk_t		fbno,
25330f712c9SDave Chinner 	struct xfs_buf		**bpp)
25430f712c9SDave Chinner {
25530f712c9SDave Chinner 	return __xfs_dir3_free_read(tp, dp, fbno, -2, bpp);
25630f712c9SDave Chinner }
25730f712c9SDave Chinner 
25830f712c9SDave Chinner static int
25930f712c9SDave Chinner xfs_dir3_free_get_buf(
26030f712c9SDave Chinner 	xfs_da_args_t		*args,
26130f712c9SDave Chinner 	xfs_dir2_db_t		fbno,
26230f712c9SDave Chinner 	struct xfs_buf		**bpp)
26330f712c9SDave Chinner {
26430f712c9SDave Chinner 	struct xfs_trans	*tp = args->trans;
26530f712c9SDave Chinner 	struct xfs_inode	*dp = args->dp;
26630f712c9SDave Chinner 	struct xfs_mount	*mp = dp->i_mount;
26730f712c9SDave Chinner 	struct xfs_buf		*bp;
26830f712c9SDave Chinner 	int			error;
26930f712c9SDave Chinner 	struct xfs_dir3_icfree_hdr hdr;
27030f712c9SDave Chinner 
27130f712c9SDave Chinner 	error = xfs_da_get_buf(tp, dp, xfs_dir2_db_to_da(args->geo, fbno),
27230f712c9SDave Chinner 				   -1, &bp, XFS_DATA_FORK);
27330f712c9SDave Chinner 	if (error)
27430f712c9SDave Chinner 		return error;
27530f712c9SDave Chinner 
27630f712c9SDave Chinner 	xfs_trans_buf_set_type(tp, bp, XFS_BLFT_DIR_FREE_BUF);
27730f712c9SDave Chinner 	bp->b_ops = &xfs_dir3_free_buf_ops;
27830f712c9SDave Chinner 
27930f712c9SDave Chinner 	/*
28030f712c9SDave Chinner 	 * Initialize the new block to be empty, and remember
28130f712c9SDave Chinner 	 * its first slot as our empty slot.
28230f712c9SDave Chinner 	 */
28330f712c9SDave Chinner 	memset(bp->b_addr, 0, sizeof(struct xfs_dir3_free_hdr));
28430f712c9SDave Chinner 	memset(&hdr, 0, sizeof(hdr));
28530f712c9SDave Chinner 
28630f712c9SDave Chinner 	if (xfs_sb_version_hascrc(&mp->m_sb)) {
28730f712c9SDave Chinner 		struct xfs_dir3_free_hdr *hdr3 = bp->b_addr;
28830f712c9SDave Chinner 
28930f712c9SDave Chinner 		hdr.magic = XFS_DIR3_FREE_MAGIC;
29030f712c9SDave Chinner 
29130f712c9SDave Chinner 		hdr3->hdr.blkno = cpu_to_be64(bp->b_bn);
29230f712c9SDave Chinner 		hdr3->hdr.owner = cpu_to_be64(dp->i_ino);
293ce748eaaSEric Sandeen 		uuid_copy(&hdr3->hdr.uuid, &mp->m_sb.sb_meta_uuid);
29430f712c9SDave Chinner 	} else
29530f712c9SDave Chinner 		hdr.magic = XFS_DIR2_FREE_MAGIC;
29630f712c9SDave Chinner 	dp->d_ops->free_hdr_to_disk(bp->b_addr, &hdr);
29730f712c9SDave Chinner 	*bpp = bp;
29830f712c9SDave Chinner 	return 0;
29930f712c9SDave Chinner }
30030f712c9SDave Chinner 
30130f712c9SDave Chinner /*
30230f712c9SDave Chinner  * Log entries from a freespace block.
30330f712c9SDave Chinner  */
30430f712c9SDave Chinner STATIC void
30530f712c9SDave Chinner xfs_dir2_free_log_bests(
30630f712c9SDave Chinner 	struct xfs_da_args	*args,
30730f712c9SDave Chinner 	struct xfs_buf		*bp,
30830f712c9SDave Chinner 	int			first,		/* first entry to log */
30930f712c9SDave Chinner 	int			last)		/* last entry to log */
31030f712c9SDave Chinner {
31130f712c9SDave Chinner 	xfs_dir2_free_t		*free;		/* freespace structure */
31230f712c9SDave Chinner 	__be16			*bests;
31330f712c9SDave Chinner 
31430f712c9SDave Chinner 	free = bp->b_addr;
31530f712c9SDave Chinner 	bests = args->dp->d_ops->free_bests_p(free);
31630f712c9SDave Chinner 	ASSERT(free->hdr.magic == cpu_to_be32(XFS_DIR2_FREE_MAGIC) ||
31730f712c9SDave Chinner 	       free->hdr.magic == cpu_to_be32(XFS_DIR3_FREE_MAGIC));
31830f712c9SDave Chinner 	xfs_trans_log_buf(args->trans, bp,
31930f712c9SDave Chinner 		(uint)((char *)&bests[first] - (char *)free),
32030f712c9SDave Chinner 		(uint)((char *)&bests[last] - (char *)free +
32130f712c9SDave Chinner 		       sizeof(bests[0]) - 1));
32230f712c9SDave Chinner }
32330f712c9SDave Chinner 
32430f712c9SDave Chinner /*
32530f712c9SDave Chinner  * Log header from a freespace block.
32630f712c9SDave Chinner  */
32730f712c9SDave Chinner static void
32830f712c9SDave Chinner xfs_dir2_free_log_header(
32930f712c9SDave Chinner 	struct xfs_da_args	*args,
33030f712c9SDave Chinner 	struct xfs_buf		*bp)
33130f712c9SDave Chinner {
33230f712c9SDave Chinner #ifdef DEBUG
33330f712c9SDave Chinner 	xfs_dir2_free_t		*free;		/* freespace structure */
33430f712c9SDave Chinner 
33530f712c9SDave Chinner 	free = bp->b_addr;
33630f712c9SDave Chinner 	ASSERT(free->hdr.magic == cpu_to_be32(XFS_DIR2_FREE_MAGIC) ||
33730f712c9SDave Chinner 	       free->hdr.magic == cpu_to_be32(XFS_DIR3_FREE_MAGIC));
33830f712c9SDave Chinner #endif
33930f712c9SDave Chinner 	xfs_trans_log_buf(args->trans, bp, 0,
34030f712c9SDave Chinner 			  args->dp->d_ops->free_hdr_size - 1);
34130f712c9SDave Chinner }
34230f712c9SDave Chinner 
34330f712c9SDave Chinner /*
34430f712c9SDave Chinner  * Convert a leaf-format directory to a node-format directory.
34530f712c9SDave Chinner  * We need to change the magic number of the leaf block, and copy
34630f712c9SDave Chinner  * the freespace table out of the leaf block into its own block.
34730f712c9SDave Chinner  */
34830f712c9SDave Chinner int						/* error */
34930f712c9SDave Chinner xfs_dir2_leaf_to_node(
35030f712c9SDave Chinner 	xfs_da_args_t		*args,		/* operation arguments */
35130f712c9SDave Chinner 	struct xfs_buf		*lbp)		/* leaf buffer */
35230f712c9SDave Chinner {
35330f712c9SDave Chinner 	xfs_inode_t		*dp;		/* incore directory inode */
35430f712c9SDave Chinner 	int			error;		/* error return value */
35530f712c9SDave Chinner 	struct xfs_buf		*fbp;		/* freespace buffer */
35630f712c9SDave Chinner 	xfs_dir2_db_t		fdb;		/* freespace block number */
35730f712c9SDave Chinner 	xfs_dir2_free_t		*free;		/* freespace structure */
35830f712c9SDave Chinner 	__be16			*from;		/* pointer to freespace entry */
35930f712c9SDave Chinner 	int			i;		/* leaf freespace index */
36030f712c9SDave Chinner 	xfs_dir2_leaf_t		*leaf;		/* leaf structure */
36130f712c9SDave Chinner 	xfs_dir2_leaf_tail_t	*ltp;		/* leaf tail structure */
36230f712c9SDave Chinner 	int			n;		/* count of live freespc ents */
36330f712c9SDave Chinner 	xfs_dir2_data_off_t	off;		/* freespace entry value */
36430f712c9SDave Chinner 	__be16			*to;		/* pointer to freespace entry */
36530f712c9SDave Chinner 	xfs_trans_t		*tp;		/* transaction pointer */
36630f712c9SDave Chinner 	struct xfs_dir3_icfree_hdr freehdr;
36730f712c9SDave Chinner 
36830f712c9SDave Chinner 	trace_xfs_dir2_leaf_to_node(args);
36930f712c9SDave Chinner 
37030f712c9SDave Chinner 	dp = args->dp;
37130f712c9SDave Chinner 	tp = args->trans;
37230f712c9SDave Chinner 	/*
37330f712c9SDave Chinner 	 * Add a freespace block to the directory.
37430f712c9SDave Chinner 	 */
37530f712c9SDave Chinner 	if ((error = xfs_dir2_grow_inode(args, XFS_DIR2_FREE_SPACE, &fdb))) {
37630f712c9SDave Chinner 		return error;
37730f712c9SDave Chinner 	}
37830f712c9SDave Chinner 	ASSERT(fdb == xfs_dir2_byte_to_db(args->geo, XFS_DIR2_FREE_OFFSET));
37930f712c9SDave Chinner 	/*
38030f712c9SDave Chinner 	 * Get the buffer for the new freespace block.
38130f712c9SDave Chinner 	 */
38230f712c9SDave Chinner 	error = xfs_dir3_free_get_buf(args, fdb, &fbp);
38330f712c9SDave Chinner 	if (error)
38430f712c9SDave Chinner 		return error;
38530f712c9SDave Chinner 
38630f712c9SDave Chinner 	free = fbp->b_addr;
38730f712c9SDave Chinner 	dp->d_ops->free_hdr_from_disk(&freehdr, free);
38830f712c9SDave Chinner 	leaf = lbp->b_addr;
38930f712c9SDave Chinner 	ltp = xfs_dir2_leaf_tail_p(args->geo, leaf);
39030f712c9SDave Chinner 	ASSERT(be32_to_cpu(ltp->bestcount) <=
39130f712c9SDave Chinner 				(uint)dp->i_d.di_size / args->geo->blksize);
39230f712c9SDave Chinner 
39330f712c9SDave Chinner 	/*
39430f712c9SDave Chinner 	 * Copy freespace entries from the leaf block to the new block.
39530f712c9SDave Chinner 	 * Count active entries.
39630f712c9SDave Chinner 	 */
39730f712c9SDave Chinner 	from = xfs_dir2_leaf_bests_p(ltp);
39830f712c9SDave Chinner 	to = dp->d_ops->free_bests_p(free);
39930f712c9SDave Chinner 	for (i = n = 0; i < be32_to_cpu(ltp->bestcount); i++, from++, to++) {
40030f712c9SDave Chinner 		if ((off = be16_to_cpu(*from)) != NULLDATAOFF)
40130f712c9SDave Chinner 			n++;
40230f712c9SDave Chinner 		*to = cpu_to_be16(off);
40330f712c9SDave Chinner 	}
40430f712c9SDave Chinner 
40530f712c9SDave Chinner 	/*
40630f712c9SDave Chinner 	 * Now initialize the freespace block header.
40730f712c9SDave Chinner 	 */
40830f712c9SDave Chinner 	freehdr.nused = n;
40930f712c9SDave Chinner 	freehdr.nvalid = be32_to_cpu(ltp->bestcount);
41030f712c9SDave Chinner 
41130f712c9SDave Chinner 	dp->d_ops->free_hdr_to_disk(fbp->b_addr, &freehdr);
41230f712c9SDave Chinner 	xfs_dir2_free_log_bests(args, fbp, 0, freehdr.nvalid - 1);
41330f712c9SDave Chinner 	xfs_dir2_free_log_header(args, fbp);
41430f712c9SDave Chinner 
41530f712c9SDave Chinner 	/*
41630f712c9SDave Chinner 	 * Converting the leaf to a leafnode is just a matter of changing the
41730f712c9SDave Chinner 	 * magic number and the ops. Do the change directly to the buffer as
41830f712c9SDave Chinner 	 * it's less work (and less code) than decoding the header to host
41930f712c9SDave Chinner 	 * format and back again.
42030f712c9SDave Chinner 	 */
42130f712c9SDave Chinner 	if (leaf->hdr.info.magic == cpu_to_be16(XFS_DIR2_LEAF1_MAGIC))
42230f712c9SDave Chinner 		leaf->hdr.info.magic = cpu_to_be16(XFS_DIR2_LEAFN_MAGIC);
42330f712c9SDave Chinner 	else
42430f712c9SDave Chinner 		leaf->hdr.info.magic = cpu_to_be16(XFS_DIR3_LEAFN_MAGIC);
42530f712c9SDave Chinner 	lbp->b_ops = &xfs_dir3_leafn_buf_ops;
42630f712c9SDave Chinner 	xfs_trans_buf_set_type(tp, lbp, XFS_BLFT_DIR_LEAFN_BUF);
42730f712c9SDave Chinner 	xfs_dir3_leaf_log_header(args, lbp);
42830f712c9SDave Chinner 	xfs_dir3_leaf_check(dp, lbp);
42930f712c9SDave Chinner 	return 0;
43030f712c9SDave Chinner }
43130f712c9SDave Chinner 
43230f712c9SDave Chinner /*
43330f712c9SDave Chinner  * Add a leaf entry to a leaf block in a node-form directory.
43430f712c9SDave Chinner  * The other work necessary is done from the caller.
43530f712c9SDave Chinner  */
43630f712c9SDave Chinner static int					/* error */
43730f712c9SDave Chinner xfs_dir2_leafn_add(
43830f712c9SDave Chinner 	struct xfs_buf		*bp,		/* leaf buffer */
43930f712c9SDave Chinner 	xfs_da_args_t		*args,		/* operation arguments */
44030f712c9SDave Chinner 	int			index)		/* insertion pt for new entry */
44130f712c9SDave Chinner {
44230f712c9SDave Chinner 	int			compact;	/* compacting stale leaves */
44330f712c9SDave Chinner 	xfs_inode_t		*dp;		/* incore directory inode */
44430f712c9SDave Chinner 	int			highstale;	/* next stale entry */
44530f712c9SDave Chinner 	xfs_dir2_leaf_t		*leaf;		/* leaf structure */
44630f712c9SDave Chinner 	xfs_dir2_leaf_entry_t	*lep;		/* leaf entry */
44730f712c9SDave Chinner 	int			lfloghigh;	/* high leaf entry logging */
44830f712c9SDave Chinner 	int			lfloglow;	/* low leaf entry logging */
44930f712c9SDave Chinner 	int			lowstale;	/* previous stale entry */
45030f712c9SDave Chinner 	struct xfs_dir3_icleaf_hdr leafhdr;
45130f712c9SDave Chinner 	struct xfs_dir2_leaf_entry *ents;
45230f712c9SDave Chinner 
45330f712c9SDave Chinner 	trace_xfs_dir2_leafn_add(args, index);
45430f712c9SDave Chinner 
45530f712c9SDave Chinner 	dp = args->dp;
45630f712c9SDave Chinner 	leaf = bp->b_addr;
45730f712c9SDave Chinner 	dp->d_ops->leaf_hdr_from_disk(&leafhdr, leaf);
45830f712c9SDave Chinner 	ents = dp->d_ops->leaf_ents_p(leaf);
45930f712c9SDave Chinner 
46030f712c9SDave Chinner 	/*
46130f712c9SDave Chinner 	 * Quick check just to make sure we are not going to index
46230f712c9SDave Chinner 	 * into other peoples memory
46330f712c9SDave Chinner 	 */
46430f712c9SDave Chinner 	if (index < 0)
4652451337dSDave Chinner 		return -EFSCORRUPTED;
46630f712c9SDave Chinner 
46730f712c9SDave Chinner 	/*
46830f712c9SDave Chinner 	 * If there are already the maximum number of leaf entries in
46930f712c9SDave Chinner 	 * the block, if there are no stale entries it won't fit.
47030f712c9SDave Chinner 	 * Caller will do a split.  If there are stale entries we'll do
47130f712c9SDave Chinner 	 * a compact.
47230f712c9SDave Chinner 	 */
47330f712c9SDave Chinner 
47430f712c9SDave Chinner 	if (leafhdr.count == dp->d_ops->leaf_max_ents(args->geo)) {
47530f712c9SDave Chinner 		if (!leafhdr.stale)
4762451337dSDave Chinner 			return -ENOSPC;
47730f712c9SDave Chinner 		compact = leafhdr.stale > 1;
47830f712c9SDave Chinner 	} else
47930f712c9SDave Chinner 		compact = 0;
48030f712c9SDave Chinner 	ASSERT(index == 0 || be32_to_cpu(ents[index - 1].hashval) <= args->hashval);
48130f712c9SDave Chinner 	ASSERT(index == leafhdr.count ||
48230f712c9SDave Chinner 	       be32_to_cpu(ents[index].hashval) >= args->hashval);
48330f712c9SDave Chinner 
48430f712c9SDave Chinner 	if (args->op_flags & XFS_DA_OP_JUSTCHECK)
48530f712c9SDave Chinner 		return 0;
48630f712c9SDave Chinner 
48730f712c9SDave Chinner 	/*
48830f712c9SDave Chinner 	 * Compact out all but one stale leaf entry.  Leaves behind
48930f712c9SDave Chinner 	 * the entry closest to index.
49030f712c9SDave Chinner 	 */
49130f712c9SDave Chinner 	if (compact)
49230f712c9SDave Chinner 		xfs_dir3_leaf_compact_x1(&leafhdr, ents, &index, &lowstale,
49330f712c9SDave Chinner 					 &highstale, &lfloglow, &lfloghigh);
49430f712c9SDave Chinner 	else if (leafhdr.stale) {
49530f712c9SDave Chinner 		/*
49630f712c9SDave Chinner 		 * Set impossible logging indices for this case.
49730f712c9SDave Chinner 		 */
49830f712c9SDave Chinner 		lfloglow = leafhdr.count;
49930f712c9SDave Chinner 		lfloghigh = -1;
50030f712c9SDave Chinner 	}
50130f712c9SDave Chinner 
50230f712c9SDave Chinner 	/*
50330f712c9SDave Chinner 	 * Insert the new entry, log everything.
50430f712c9SDave Chinner 	 */
50530f712c9SDave Chinner 	lep = xfs_dir3_leaf_find_entry(&leafhdr, ents, index, compact, lowstale,
50630f712c9SDave Chinner 				       highstale, &lfloglow, &lfloghigh);
50730f712c9SDave Chinner 
50830f712c9SDave Chinner 	lep->hashval = cpu_to_be32(args->hashval);
50930f712c9SDave Chinner 	lep->address = cpu_to_be32(xfs_dir2_db_off_to_dataptr(args->geo,
51030f712c9SDave Chinner 				args->blkno, args->index));
51130f712c9SDave Chinner 
51230f712c9SDave Chinner 	dp->d_ops->leaf_hdr_to_disk(leaf, &leafhdr);
51330f712c9SDave Chinner 	xfs_dir3_leaf_log_header(args, bp);
51430f712c9SDave Chinner 	xfs_dir3_leaf_log_ents(args, bp, lfloglow, lfloghigh);
51530f712c9SDave Chinner 	xfs_dir3_leaf_check(dp, bp);
51630f712c9SDave Chinner 	return 0;
51730f712c9SDave Chinner }
51830f712c9SDave Chinner 
#ifdef DEBUG
/*
 * Debug-only sanity check of a free block header against data block db:
 * firstdb must be a multiple of the per-block maximum number of bests,
 * and db must fall within [firstdb, firstdb + nvalid).
 */
static void
xfs_dir2_free_hdr_check(
	struct xfs_inode	*dp,
	struct xfs_buf		*bp,
	xfs_dir2_db_t		db)
{
	struct xfs_dir3_icfree_hdr	hdr;

	/* Work on the decoded, in-core copy of the on-disk header. */
	dp->d_ops->free_hdr_from_disk(&hdr, bp->b_addr);

	ASSERT((hdr.firstdb %
		dp->d_ops->free_max_bests(dp->i_mount->m_dir_geo)) == 0);
	ASSERT(hdr.firstdb <= db);
	ASSERT(db < hdr.firstdb + hdr.nvalid);
}
#else
/* Non-DEBUG builds: the check compiles away to nothing. */
#define xfs_dir2_free_hdr_check(dp, bp, db)
#endif	/* DEBUG */
53830f712c9SDave Chinner 
53930f712c9SDave Chinner /*
54030f712c9SDave Chinner  * Return the last hash value in the leaf.
54130f712c9SDave Chinner  * Stale entries are ok.
54230f712c9SDave Chinner  */
54330f712c9SDave Chinner xfs_dahash_t					/* hash value */
5448e8877e6SDarrick J. Wong xfs_dir2_leaf_lasthash(
54530f712c9SDave Chinner 	struct xfs_inode *dp,
54630f712c9SDave Chinner 	struct xfs_buf	*bp,			/* leaf buffer */
54730f712c9SDave Chinner 	int		*count)			/* count of entries in leaf */
54830f712c9SDave Chinner {
54930f712c9SDave Chinner 	struct xfs_dir2_leaf	*leaf = bp->b_addr;
55030f712c9SDave Chinner 	struct xfs_dir2_leaf_entry *ents;
55130f712c9SDave Chinner 	struct xfs_dir3_icleaf_hdr leafhdr;
55230f712c9SDave Chinner 
55330f712c9SDave Chinner 	dp->d_ops->leaf_hdr_from_disk(&leafhdr, leaf);
55430f712c9SDave Chinner 
55530f712c9SDave Chinner 	ASSERT(leafhdr.magic == XFS_DIR2_LEAFN_MAGIC ||
5568e8877e6SDarrick J. Wong 	       leafhdr.magic == XFS_DIR3_LEAFN_MAGIC ||
5578e8877e6SDarrick J. Wong 	       leafhdr.magic == XFS_DIR2_LEAF1_MAGIC ||
5588e8877e6SDarrick J. Wong 	       leafhdr.magic == XFS_DIR3_LEAF1_MAGIC);
55930f712c9SDave Chinner 
56030f712c9SDave Chinner 	if (count)
56130f712c9SDave Chinner 		*count = leafhdr.count;
56230f712c9SDave Chinner 	if (!leafhdr.count)
56330f712c9SDave Chinner 		return 0;
56430f712c9SDave Chinner 
56530f712c9SDave Chinner 	ents = dp->d_ops->leaf_ents_p(leaf);
56630f712c9SDave Chinner 	return be32_to_cpu(ents[leafhdr.count - 1].hashval);
56730f712c9SDave Chinner }
56830f712c9SDave Chinner 
56930f712c9SDave Chinner /*
57030f712c9SDave Chinner  * Look up a leaf entry for space to add a name in a node-format leaf block.
57130f712c9SDave Chinner  * The extrablk in state is a freespace block.
57230f712c9SDave Chinner  */
57330f712c9SDave Chinner STATIC int
57430f712c9SDave Chinner xfs_dir2_leafn_lookup_for_addname(
57530f712c9SDave Chinner 	struct xfs_buf		*bp,		/* leaf buffer */
57630f712c9SDave Chinner 	xfs_da_args_t		*args,		/* operation arguments */
57730f712c9SDave Chinner 	int			*indexp,	/* out: leaf entry index */
57830f712c9SDave Chinner 	xfs_da_state_t		*state)		/* state to fill in */
57930f712c9SDave Chinner {
58030f712c9SDave Chinner 	struct xfs_buf		*curbp = NULL;	/* current data/free buffer */
58130f712c9SDave Chinner 	xfs_dir2_db_t		curdb = -1;	/* current data block number */
58230f712c9SDave Chinner 	xfs_dir2_db_t		curfdb = -1;	/* current free block number */
58330f712c9SDave Chinner 	xfs_inode_t		*dp;		/* incore directory inode */
58430f712c9SDave Chinner 	int			error;		/* error return value */
58530f712c9SDave Chinner 	int			fi;		/* free entry index */
58630f712c9SDave Chinner 	xfs_dir2_free_t		*free = NULL;	/* free block structure */
58730f712c9SDave Chinner 	int			index;		/* leaf entry index */
58830f712c9SDave Chinner 	xfs_dir2_leaf_t		*leaf;		/* leaf structure */
58930f712c9SDave Chinner 	int			length;		/* length of new data entry */
59030f712c9SDave Chinner 	xfs_dir2_leaf_entry_t	*lep;		/* leaf entry */
59130f712c9SDave Chinner 	xfs_mount_t		*mp;		/* filesystem mount point */
59230f712c9SDave Chinner 	xfs_dir2_db_t		newdb;		/* new data block number */
59330f712c9SDave Chinner 	xfs_dir2_db_t		newfdb;		/* new free block number */
59430f712c9SDave Chinner 	xfs_trans_t		*tp;		/* transaction pointer */
59530f712c9SDave Chinner 	struct xfs_dir2_leaf_entry *ents;
59630f712c9SDave Chinner 	struct xfs_dir3_icleaf_hdr leafhdr;
59730f712c9SDave Chinner 
59830f712c9SDave Chinner 	dp = args->dp;
59930f712c9SDave Chinner 	tp = args->trans;
60030f712c9SDave Chinner 	mp = dp->i_mount;
60130f712c9SDave Chinner 	leaf = bp->b_addr;
60230f712c9SDave Chinner 	dp->d_ops->leaf_hdr_from_disk(&leafhdr, leaf);
60330f712c9SDave Chinner 	ents = dp->d_ops->leaf_ents_p(leaf);
60430f712c9SDave Chinner 
60530f712c9SDave Chinner 	xfs_dir3_leaf_check(dp, bp);
60630f712c9SDave Chinner 	ASSERT(leafhdr.count > 0);
60730f712c9SDave Chinner 
60830f712c9SDave Chinner 	/*
60930f712c9SDave Chinner 	 * Look up the hash value in the leaf entries.
61030f712c9SDave Chinner 	 */
61130f712c9SDave Chinner 	index = xfs_dir2_leaf_search_hash(args, bp);
61230f712c9SDave Chinner 	/*
61330f712c9SDave Chinner 	 * Do we have a buffer coming in?
61430f712c9SDave Chinner 	 */
61530f712c9SDave Chinner 	if (state->extravalid) {
61630f712c9SDave Chinner 		/* If so, it's a free block buffer, get the block number. */
61730f712c9SDave Chinner 		curbp = state->extrablk.bp;
61830f712c9SDave Chinner 		curfdb = state->extrablk.blkno;
61930f712c9SDave Chinner 		free = curbp->b_addr;
62030f712c9SDave Chinner 		ASSERT(free->hdr.magic == cpu_to_be32(XFS_DIR2_FREE_MAGIC) ||
62130f712c9SDave Chinner 		       free->hdr.magic == cpu_to_be32(XFS_DIR3_FREE_MAGIC));
62230f712c9SDave Chinner 	}
62330f712c9SDave Chinner 	length = dp->d_ops->data_entsize(args->namelen);
62430f712c9SDave Chinner 	/*
62530f712c9SDave Chinner 	 * Loop over leaf entries with the right hash value.
62630f712c9SDave Chinner 	 */
62730f712c9SDave Chinner 	for (lep = &ents[index];
62830f712c9SDave Chinner 	     index < leafhdr.count && be32_to_cpu(lep->hashval) == args->hashval;
62930f712c9SDave Chinner 	     lep++, index++) {
63030f712c9SDave Chinner 		/*
63130f712c9SDave Chinner 		 * Skip stale leaf entries.
63230f712c9SDave Chinner 		 */
63330f712c9SDave Chinner 		if (be32_to_cpu(lep->address) == XFS_DIR2_NULL_DATAPTR)
63430f712c9SDave Chinner 			continue;
63530f712c9SDave Chinner 		/*
63630f712c9SDave Chinner 		 * Pull the data block number from the entry.
63730f712c9SDave Chinner 		 */
63830f712c9SDave Chinner 		newdb = xfs_dir2_dataptr_to_db(args->geo,
63930f712c9SDave Chinner 					       be32_to_cpu(lep->address));
64030f712c9SDave Chinner 		/*
64130f712c9SDave Chinner 		 * For addname, we're looking for a place to put the new entry.
64230f712c9SDave Chinner 		 * We want to use a data block with an entry of equal
64330f712c9SDave Chinner 		 * hash value to ours if there is one with room.
64430f712c9SDave Chinner 		 *
64530f712c9SDave Chinner 		 * If this block isn't the data block we already have
64630f712c9SDave Chinner 		 * in hand, take a look at it.
64730f712c9SDave Chinner 		 */
64830f712c9SDave Chinner 		if (newdb != curdb) {
64930f712c9SDave Chinner 			__be16 *bests;
65030f712c9SDave Chinner 
65130f712c9SDave Chinner 			curdb = newdb;
65230f712c9SDave Chinner 			/*
65330f712c9SDave Chinner 			 * Convert the data block to the free block
65430f712c9SDave Chinner 			 * holding its freespace information.
65530f712c9SDave Chinner 			 */
65630f712c9SDave Chinner 			newfdb = dp->d_ops->db_to_fdb(args->geo, newdb);
65730f712c9SDave Chinner 			/*
65830f712c9SDave Chinner 			 * If it's not the one we have in hand, read it in.
65930f712c9SDave Chinner 			 */
66030f712c9SDave Chinner 			if (newfdb != curfdb) {
66130f712c9SDave Chinner 				/*
66230f712c9SDave Chinner 				 * If we had one before, drop it.
66330f712c9SDave Chinner 				 */
66430f712c9SDave Chinner 				if (curbp)
66530f712c9SDave Chinner 					xfs_trans_brelse(tp, curbp);
66630f712c9SDave Chinner 
66730f712c9SDave Chinner 				error = xfs_dir2_free_read(tp, dp,
66830f712c9SDave Chinner 						xfs_dir2_db_to_da(args->geo,
66930f712c9SDave Chinner 								  newfdb),
67030f712c9SDave Chinner 						&curbp);
67130f712c9SDave Chinner 				if (error)
67230f712c9SDave Chinner 					return error;
67330f712c9SDave Chinner 				free = curbp->b_addr;
67430f712c9SDave Chinner 
67530f712c9SDave Chinner 				xfs_dir2_free_hdr_check(dp, curbp, curdb);
67630f712c9SDave Chinner 			}
67730f712c9SDave Chinner 			/*
67830f712c9SDave Chinner 			 * Get the index for our entry.
67930f712c9SDave Chinner 			 */
68030f712c9SDave Chinner 			fi = dp->d_ops->db_to_fdindex(args->geo, curdb);
68130f712c9SDave Chinner 			/*
68230f712c9SDave Chinner 			 * If it has room, return it.
68330f712c9SDave Chinner 			 */
68430f712c9SDave Chinner 			bests = dp->d_ops->free_bests_p(free);
68530f712c9SDave Chinner 			if (unlikely(bests[fi] == cpu_to_be16(NULLDATAOFF))) {
68630f712c9SDave Chinner 				XFS_ERROR_REPORT("xfs_dir2_leafn_lookup_int",
68730f712c9SDave Chinner 							XFS_ERRLEVEL_LOW, mp);
68830f712c9SDave Chinner 				if (curfdb != newfdb)
68930f712c9SDave Chinner 					xfs_trans_brelse(tp, curbp);
6902451337dSDave Chinner 				return -EFSCORRUPTED;
69130f712c9SDave Chinner 			}
69230f712c9SDave Chinner 			curfdb = newfdb;
69330f712c9SDave Chinner 			if (be16_to_cpu(bests[fi]) >= length)
69430f712c9SDave Chinner 				goto out;
69530f712c9SDave Chinner 		}
69630f712c9SDave Chinner 	}
69730f712c9SDave Chinner 	/* Didn't find any space */
69830f712c9SDave Chinner 	fi = -1;
69930f712c9SDave Chinner out:
70030f712c9SDave Chinner 	ASSERT(args->op_flags & XFS_DA_OP_OKNOENT);
70130f712c9SDave Chinner 	if (curbp) {
70230f712c9SDave Chinner 		/* Giving back a free block. */
70330f712c9SDave Chinner 		state->extravalid = 1;
70430f712c9SDave Chinner 		state->extrablk.bp = curbp;
70530f712c9SDave Chinner 		state->extrablk.index = fi;
70630f712c9SDave Chinner 		state->extrablk.blkno = curfdb;
70730f712c9SDave Chinner 
70830f712c9SDave Chinner 		/*
70930f712c9SDave Chinner 		 * Important: this magic number is not in the buffer - it's for
71030f712c9SDave Chinner 		 * buffer type information and therefore only the free/data type
71130f712c9SDave Chinner 		 * matters here, not whether CRCs are enabled or not.
71230f712c9SDave Chinner 		 */
71330f712c9SDave Chinner 		state->extrablk.magic = XFS_DIR2_FREE_MAGIC;
71430f712c9SDave Chinner 	} else {
71530f712c9SDave Chinner 		state->extravalid = 0;
71630f712c9SDave Chinner 	}
71730f712c9SDave Chinner 	/*
71830f712c9SDave Chinner 	 * Return the index, that will be the insertion point.
71930f712c9SDave Chinner 	 */
72030f712c9SDave Chinner 	*indexp = index;
7212451337dSDave Chinner 	return -ENOENT;
72230f712c9SDave Chinner }
72330f712c9SDave Chinner 
72430f712c9SDave Chinner /*
72530f712c9SDave Chinner  * Look up a leaf entry in a node-format leaf block.
72630f712c9SDave Chinner  * The extrablk in state a data block.
72730f712c9SDave Chinner  */
72830f712c9SDave Chinner STATIC int
72930f712c9SDave Chinner xfs_dir2_leafn_lookup_for_entry(
73030f712c9SDave Chinner 	struct xfs_buf		*bp,		/* leaf buffer */
73130f712c9SDave Chinner 	xfs_da_args_t		*args,		/* operation arguments */
73230f712c9SDave Chinner 	int			*indexp,	/* out: leaf entry index */
73330f712c9SDave Chinner 	xfs_da_state_t		*state)		/* state to fill in */
73430f712c9SDave Chinner {
73530f712c9SDave Chinner 	struct xfs_buf		*curbp = NULL;	/* current data/free buffer */
73630f712c9SDave Chinner 	xfs_dir2_db_t		curdb = -1;	/* current data block number */
73730f712c9SDave Chinner 	xfs_dir2_data_entry_t	*dep;		/* data block entry */
73830f712c9SDave Chinner 	xfs_inode_t		*dp;		/* incore directory inode */
73930f712c9SDave Chinner 	int			error;		/* error return value */
74030f712c9SDave Chinner 	int			index;		/* leaf entry index */
74130f712c9SDave Chinner 	xfs_dir2_leaf_t		*leaf;		/* leaf structure */
74230f712c9SDave Chinner 	xfs_dir2_leaf_entry_t	*lep;		/* leaf entry */
74330f712c9SDave Chinner 	xfs_mount_t		*mp;		/* filesystem mount point */
74430f712c9SDave Chinner 	xfs_dir2_db_t		newdb;		/* new data block number */
74530f712c9SDave Chinner 	xfs_trans_t		*tp;		/* transaction pointer */
74630f712c9SDave Chinner 	enum xfs_dacmp		cmp;		/* comparison result */
74730f712c9SDave Chinner 	struct xfs_dir2_leaf_entry *ents;
74830f712c9SDave Chinner 	struct xfs_dir3_icleaf_hdr leafhdr;
74930f712c9SDave Chinner 
75030f712c9SDave Chinner 	dp = args->dp;
75130f712c9SDave Chinner 	tp = args->trans;
75230f712c9SDave Chinner 	mp = dp->i_mount;
75330f712c9SDave Chinner 	leaf = bp->b_addr;
75430f712c9SDave Chinner 	dp->d_ops->leaf_hdr_from_disk(&leafhdr, leaf);
75530f712c9SDave Chinner 	ents = dp->d_ops->leaf_ents_p(leaf);
75630f712c9SDave Chinner 
75730f712c9SDave Chinner 	xfs_dir3_leaf_check(dp, bp);
75830f712c9SDave Chinner 	ASSERT(leafhdr.count > 0);
75930f712c9SDave Chinner 
76030f712c9SDave Chinner 	/*
76130f712c9SDave Chinner 	 * Look up the hash value in the leaf entries.
76230f712c9SDave Chinner 	 */
76330f712c9SDave Chinner 	index = xfs_dir2_leaf_search_hash(args, bp);
76430f712c9SDave Chinner 	/*
76530f712c9SDave Chinner 	 * Do we have a buffer coming in?
76630f712c9SDave Chinner 	 */
76730f712c9SDave Chinner 	if (state->extravalid) {
76830f712c9SDave Chinner 		curbp = state->extrablk.bp;
76930f712c9SDave Chinner 		curdb = state->extrablk.blkno;
77030f712c9SDave Chinner 	}
77130f712c9SDave Chinner 	/*
77230f712c9SDave Chinner 	 * Loop over leaf entries with the right hash value.
77330f712c9SDave Chinner 	 */
77430f712c9SDave Chinner 	for (lep = &ents[index];
77530f712c9SDave Chinner 	     index < leafhdr.count && be32_to_cpu(lep->hashval) == args->hashval;
77630f712c9SDave Chinner 	     lep++, index++) {
77730f712c9SDave Chinner 		/*
77830f712c9SDave Chinner 		 * Skip stale leaf entries.
77930f712c9SDave Chinner 		 */
78030f712c9SDave Chinner 		if (be32_to_cpu(lep->address) == XFS_DIR2_NULL_DATAPTR)
78130f712c9SDave Chinner 			continue;
78230f712c9SDave Chinner 		/*
78330f712c9SDave Chinner 		 * Pull the data block number from the entry.
78430f712c9SDave Chinner 		 */
78530f712c9SDave Chinner 		newdb = xfs_dir2_dataptr_to_db(args->geo,
78630f712c9SDave Chinner 					       be32_to_cpu(lep->address));
78730f712c9SDave Chinner 		/*
78830f712c9SDave Chinner 		 * Not adding a new entry, so we really want to find
78930f712c9SDave Chinner 		 * the name given to us.
79030f712c9SDave Chinner 		 *
79130f712c9SDave Chinner 		 * If it's a different data block, go get it.
79230f712c9SDave Chinner 		 */
79330f712c9SDave Chinner 		if (newdb != curdb) {
79430f712c9SDave Chinner 			/*
79530f712c9SDave Chinner 			 * If we had a block before that we aren't saving
79630f712c9SDave Chinner 			 * for a CI name, drop it
79730f712c9SDave Chinner 			 */
79830f712c9SDave Chinner 			if (curbp && (args->cmpresult == XFS_CMP_DIFFERENT ||
79930f712c9SDave Chinner 						curdb != state->extrablk.blkno))
80030f712c9SDave Chinner 				xfs_trans_brelse(tp, curbp);
80130f712c9SDave Chinner 			/*
80230f712c9SDave Chinner 			 * If needing the block that is saved with a CI match,
80330f712c9SDave Chinner 			 * use it otherwise read in the new data block.
80430f712c9SDave Chinner 			 */
80530f712c9SDave Chinner 			if (args->cmpresult != XFS_CMP_DIFFERENT &&
80630f712c9SDave Chinner 					newdb == state->extrablk.blkno) {
80730f712c9SDave Chinner 				ASSERT(state->extravalid);
80830f712c9SDave Chinner 				curbp = state->extrablk.bp;
80930f712c9SDave Chinner 			} else {
81030f712c9SDave Chinner 				error = xfs_dir3_data_read(tp, dp,
81130f712c9SDave Chinner 						xfs_dir2_db_to_da(args->geo,
81230f712c9SDave Chinner 								  newdb),
81330f712c9SDave Chinner 						-1, &curbp);
81430f712c9SDave Chinner 				if (error)
81530f712c9SDave Chinner 					return error;
81630f712c9SDave Chinner 			}
81730f712c9SDave Chinner 			xfs_dir3_data_check(dp, curbp);
81830f712c9SDave Chinner 			curdb = newdb;
81930f712c9SDave Chinner 		}
82030f712c9SDave Chinner 		/*
82130f712c9SDave Chinner 		 * Point to the data entry.
82230f712c9SDave Chinner 		 */
82330f712c9SDave Chinner 		dep = (xfs_dir2_data_entry_t *)((char *)curbp->b_addr +
82430f712c9SDave Chinner 			xfs_dir2_dataptr_to_off(args->geo,
82530f712c9SDave Chinner 						be32_to_cpu(lep->address)));
82630f712c9SDave Chinner 		/*
82730f712c9SDave Chinner 		 * Compare the entry and if it's an exact match, return
82830f712c9SDave Chinner 		 * EEXIST immediately. If it's the first case-insensitive
82930f712c9SDave Chinner 		 * match, store the block & inode number and continue looking.
83030f712c9SDave Chinner 		 */
83130f712c9SDave Chinner 		cmp = mp->m_dirnameops->compname(args, dep->name, dep->namelen);
83230f712c9SDave Chinner 		if (cmp != XFS_CMP_DIFFERENT && cmp != args->cmpresult) {
83330f712c9SDave Chinner 			/* If there is a CI match block, drop it */
83430f712c9SDave Chinner 			if (args->cmpresult != XFS_CMP_DIFFERENT &&
83530f712c9SDave Chinner 						curdb != state->extrablk.blkno)
83630f712c9SDave Chinner 				xfs_trans_brelse(tp, state->extrablk.bp);
83730f712c9SDave Chinner 			args->cmpresult = cmp;
83830f712c9SDave Chinner 			args->inumber = be64_to_cpu(dep->inumber);
83930f712c9SDave Chinner 			args->filetype = dp->d_ops->data_get_ftype(dep);
84030f712c9SDave Chinner 			*indexp = index;
84130f712c9SDave Chinner 			state->extravalid = 1;
84230f712c9SDave Chinner 			state->extrablk.bp = curbp;
84330f712c9SDave Chinner 			state->extrablk.blkno = curdb;
84430f712c9SDave Chinner 			state->extrablk.index = (int)((char *)dep -
84530f712c9SDave Chinner 							(char *)curbp->b_addr);
84630f712c9SDave Chinner 			state->extrablk.magic = XFS_DIR2_DATA_MAGIC;
84730f712c9SDave Chinner 			curbp->b_ops = &xfs_dir3_data_buf_ops;
84830f712c9SDave Chinner 			xfs_trans_buf_set_type(tp, curbp, XFS_BLFT_DIR_DATA_BUF);
84930f712c9SDave Chinner 			if (cmp == XFS_CMP_EXACT)
8502451337dSDave Chinner 				return -EEXIST;
85130f712c9SDave Chinner 		}
85230f712c9SDave Chinner 	}
85330f712c9SDave Chinner 	ASSERT(index == leafhdr.count || (args->op_flags & XFS_DA_OP_OKNOENT));
85430f712c9SDave Chinner 	if (curbp) {
85530f712c9SDave Chinner 		if (args->cmpresult == XFS_CMP_DIFFERENT) {
85630f712c9SDave Chinner 			/* Giving back last used data block. */
85730f712c9SDave Chinner 			state->extravalid = 1;
85830f712c9SDave Chinner 			state->extrablk.bp = curbp;
85930f712c9SDave Chinner 			state->extrablk.index = -1;
86030f712c9SDave Chinner 			state->extrablk.blkno = curdb;
86130f712c9SDave Chinner 			state->extrablk.magic = XFS_DIR2_DATA_MAGIC;
86230f712c9SDave Chinner 			curbp->b_ops = &xfs_dir3_data_buf_ops;
86330f712c9SDave Chinner 			xfs_trans_buf_set_type(tp, curbp, XFS_BLFT_DIR_DATA_BUF);
86430f712c9SDave Chinner 		} else {
86530f712c9SDave Chinner 			/* If the curbp is not the CI match block, drop it */
86630f712c9SDave Chinner 			if (state->extrablk.bp != curbp)
86730f712c9SDave Chinner 				xfs_trans_brelse(tp, curbp);
86830f712c9SDave Chinner 		}
86930f712c9SDave Chinner 	} else {
87030f712c9SDave Chinner 		state->extravalid = 0;
87130f712c9SDave Chinner 	}
87230f712c9SDave Chinner 	*indexp = index;
8732451337dSDave Chinner 	return -ENOENT;
87430f712c9SDave Chinner }
87530f712c9SDave Chinner 
87630f712c9SDave Chinner /*
87730f712c9SDave Chinner  * Look up a leaf entry in a node-format leaf block.
87830f712c9SDave Chinner  * If this is an addname then the extrablk in state is a freespace block,
87930f712c9SDave Chinner  * otherwise it's a data block.
88030f712c9SDave Chinner  */
88130f712c9SDave Chinner int
88230f712c9SDave Chinner xfs_dir2_leafn_lookup_int(
88330f712c9SDave Chinner 	struct xfs_buf		*bp,		/* leaf buffer */
88430f712c9SDave Chinner 	xfs_da_args_t		*args,		/* operation arguments */
88530f712c9SDave Chinner 	int			*indexp,	/* out: leaf entry index */
88630f712c9SDave Chinner 	xfs_da_state_t		*state)		/* state to fill in */
88730f712c9SDave Chinner {
88830f712c9SDave Chinner 	if (args->op_flags & XFS_DA_OP_ADDNAME)
88930f712c9SDave Chinner 		return xfs_dir2_leafn_lookup_for_addname(bp, args, indexp,
89030f712c9SDave Chinner 							state);
89130f712c9SDave Chinner 	return xfs_dir2_leafn_lookup_for_entry(bp, args, indexp, state);
89230f712c9SDave Chinner }
89330f712c9SDave Chinner 
89430f712c9SDave Chinner /*
89530f712c9SDave Chinner  * Move count leaf entries from source to destination leaf.
89630f712c9SDave Chinner  * Log entries and headers.  Stale entries are preserved.
89730f712c9SDave Chinner  */
89830f712c9SDave Chinner static void
89930f712c9SDave Chinner xfs_dir3_leafn_moveents(
90030f712c9SDave Chinner 	xfs_da_args_t			*args,	/* operation arguments */
90130f712c9SDave Chinner 	struct xfs_buf			*bp_s,	/* source */
90230f712c9SDave Chinner 	struct xfs_dir3_icleaf_hdr	*shdr,
90330f712c9SDave Chinner 	struct xfs_dir2_leaf_entry	*sents,
90430f712c9SDave Chinner 	int				start_s,/* source leaf index */
90530f712c9SDave Chinner 	struct xfs_buf			*bp_d,	/* destination */
90630f712c9SDave Chinner 	struct xfs_dir3_icleaf_hdr	*dhdr,
90730f712c9SDave Chinner 	struct xfs_dir2_leaf_entry	*dents,
90830f712c9SDave Chinner 	int				start_d,/* destination leaf index */
90930f712c9SDave Chinner 	int				count)	/* count of leaves to copy */
91030f712c9SDave Chinner {
91130f712c9SDave Chinner 	int				stale;	/* count stale leaves copied */
91230f712c9SDave Chinner 
91330f712c9SDave Chinner 	trace_xfs_dir2_leafn_moveents(args, start_s, start_d, count);
91430f712c9SDave Chinner 
91530f712c9SDave Chinner 	/*
91630f712c9SDave Chinner 	 * Silently return if nothing to do.
91730f712c9SDave Chinner 	 */
91830f712c9SDave Chinner 	if (count == 0)
91930f712c9SDave Chinner 		return;
92030f712c9SDave Chinner 
92130f712c9SDave Chinner 	/*
92230f712c9SDave Chinner 	 * If the destination index is not the end of the current
92330f712c9SDave Chinner 	 * destination leaf entries, open up a hole in the destination
92430f712c9SDave Chinner 	 * to hold the new entries.
92530f712c9SDave Chinner 	 */
92630f712c9SDave Chinner 	if (start_d < dhdr->count) {
92730f712c9SDave Chinner 		memmove(&dents[start_d + count], &dents[start_d],
92830f712c9SDave Chinner 			(dhdr->count - start_d) * sizeof(xfs_dir2_leaf_entry_t));
92930f712c9SDave Chinner 		xfs_dir3_leaf_log_ents(args, bp_d, start_d + count,
93030f712c9SDave Chinner 				       count + dhdr->count - 1);
93130f712c9SDave Chinner 	}
93230f712c9SDave Chinner 	/*
93330f712c9SDave Chinner 	 * If the source has stale leaves, count the ones in the copy range
93430f712c9SDave Chinner 	 * so we can update the header correctly.
93530f712c9SDave Chinner 	 */
93630f712c9SDave Chinner 	if (shdr->stale) {
93730f712c9SDave Chinner 		int	i;			/* temp leaf index */
93830f712c9SDave Chinner 
93930f712c9SDave Chinner 		for (i = start_s, stale = 0; i < start_s + count; i++) {
94030f712c9SDave Chinner 			if (sents[i].address ==
94130f712c9SDave Chinner 					cpu_to_be32(XFS_DIR2_NULL_DATAPTR))
94230f712c9SDave Chinner 				stale++;
94330f712c9SDave Chinner 		}
94430f712c9SDave Chinner 	} else
94530f712c9SDave Chinner 		stale = 0;
94630f712c9SDave Chinner 	/*
94730f712c9SDave Chinner 	 * Copy the leaf entries from source to destination.
94830f712c9SDave Chinner 	 */
94930f712c9SDave Chinner 	memcpy(&dents[start_d], &sents[start_s],
95030f712c9SDave Chinner 		count * sizeof(xfs_dir2_leaf_entry_t));
95130f712c9SDave Chinner 	xfs_dir3_leaf_log_ents(args, bp_d, start_d, start_d + count - 1);
95230f712c9SDave Chinner 
95330f712c9SDave Chinner 	/*
95430f712c9SDave Chinner 	 * If there are source entries after the ones we copied,
95530f712c9SDave Chinner 	 * delete the ones we copied by sliding the next ones down.
95630f712c9SDave Chinner 	 */
95730f712c9SDave Chinner 	if (start_s + count < shdr->count) {
95830f712c9SDave Chinner 		memmove(&sents[start_s], &sents[start_s + count],
95930f712c9SDave Chinner 			count * sizeof(xfs_dir2_leaf_entry_t));
96030f712c9SDave Chinner 		xfs_dir3_leaf_log_ents(args, bp_s, start_s, start_s + count - 1);
96130f712c9SDave Chinner 	}
96230f712c9SDave Chinner 
96330f712c9SDave Chinner 	/*
96430f712c9SDave Chinner 	 * Update the headers and log them.
96530f712c9SDave Chinner 	 */
96630f712c9SDave Chinner 	shdr->count -= count;
96730f712c9SDave Chinner 	shdr->stale -= stale;
96830f712c9SDave Chinner 	dhdr->count += count;
96930f712c9SDave Chinner 	dhdr->stale += stale;
97030f712c9SDave Chinner }
97130f712c9SDave Chinner 
97230f712c9SDave Chinner /*
97330f712c9SDave Chinner  * Determine the sort order of two leaf blocks.
97430f712c9SDave Chinner  * Returns 1 if both are valid and leaf2 should be before leaf1, else 0.
97530f712c9SDave Chinner  */
97630f712c9SDave Chinner int						/* sort order */
97730f712c9SDave Chinner xfs_dir2_leafn_order(
97830f712c9SDave Chinner 	struct xfs_inode	*dp,
97930f712c9SDave Chinner 	struct xfs_buf		*leaf1_bp,		/* leaf1 buffer */
98030f712c9SDave Chinner 	struct xfs_buf		*leaf2_bp)		/* leaf2 buffer */
98130f712c9SDave Chinner {
98230f712c9SDave Chinner 	struct xfs_dir2_leaf	*leaf1 = leaf1_bp->b_addr;
98330f712c9SDave Chinner 	struct xfs_dir2_leaf	*leaf2 = leaf2_bp->b_addr;
98430f712c9SDave Chinner 	struct xfs_dir2_leaf_entry *ents1;
98530f712c9SDave Chinner 	struct xfs_dir2_leaf_entry *ents2;
98630f712c9SDave Chinner 	struct xfs_dir3_icleaf_hdr hdr1;
98730f712c9SDave Chinner 	struct xfs_dir3_icleaf_hdr hdr2;
98830f712c9SDave Chinner 
98930f712c9SDave Chinner 	dp->d_ops->leaf_hdr_from_disk(&hdr1, leaf1);
99030f712c9SDave Chinner 	dp->d_ops->leaf_hdr_from_disk(&hdr2, leaf2);
99130f712c9SDave Chinner 	ents1 = dp->d_ops->leaf_ents_p(leaf1);
99230f712c9SDave Chinner 	ents2 = dp->d_ops->leaf_ents_p(leaf2);
99330f712c9SDave Chinner 
99430f712c9SDave Chinner 	if (hdr1.count > 0 && hdr2.count > 0 &&
99530f712c9SDave Chinner 	    (be32_to_cpu(ents2[0].hashval) < be32_to_cpu(ents1[0].hashval) ||
99630f712c9SDave Chinner 	     be32_to_cpu(ents2[hdr2.count - 1].hashval) <
99730f712c9SDave Chinner 				be32_to_cpu(ents1[hdr1.count - 1].hashval)))
99830f712c9SDave Chinner 		return 1;
99930f712c9SDave Chinner 	return 0;
100030f712c9SDave Chinner }
100130f712c9SDave Chinner 
100230f712c9SDave Chinner /*
100330f712c9SDave Chinner  * Rebalance leaf entries between two leaf blocks.
100430f712c9SDave Chinner  * This is actually only called when the second block is new,
100530f712c9SDave Chinner  * though the code deals with the general case.
100630f712c9SDave Chinner  * A new entry will be inserted in one of the blocks, and that
100730f712c9SDave Chinner  * entry is taken into account when balancing.
100830f712c9SDave Chinner  */
100930f712c9SDave Chinner static void
101030f712c9SDave Chinner xfs_dir2_leafn_rebalance(
101130f712c9SDave Chinner 	xfs_da_state_t		*state,		/* btree cursor */
101230f712c9SDave Chinner 	xfs_da_state_blk_t	*blk1,		/* first btree block */
101330f712c9SDave Chinner 	xfs_da_state_blk_t	*blk2)		/* second btree block */
101430f712c9SDave Chinner {
101530f712c9SDave Chinner 	xfs_da_args_t		*args;		/* operation arguments */
101630f712c9SDave Chinner 	int			count;		/* count (& direction) leaves */
101730f712c9SDave Chinner 	int			isleft;		/* new goes in left leaf */
101830f712c9SDave Chinner 	xfs_dir2_leaf_t		*leaf1;		/* first leaf structure */
101930f712c9SDave Chinner 	xfs_dir2_leaf_t		*leaf2;		/* second leaf structure */
102030f712c9SDave Chinner 	int			mid;		/* midpoint leaf index */
102130f712c9SDave Chinner #if defined(DEBUG) || defined(XFS_WARN)
102230f712c9SDave Chinner 	int			oldstale;	/* old count of stale leaves */
102330f712c9SDave Chinner #endif
102430f712c9SDave Chinner 	int			oldsum;		/* old total leaf count */
102530f712c9SDave Chinner 	int			swap;		/* swapped leaf blocks */
102630f712c9SDave Chinner 	struct xfs_dir2_leaf_entry *ents1;
102730f712c9SDave Chinner 	struct xfs_dir2_leaf_entry *ents2;
102830f712c9SDave Chinner 	struct xfs_dir3_icleaf_hdr hdr1;
102930f712c9SDave Chinner 	struct xfs_dir3_icleaf_hdr hdr2;
103030f712c9SDave Chinner 	struct xfs_inode	*dp = state->args->dp;
103130f712c9SDave Chinner 
103230f712c9SDave Chinner 	args = state->args;
103330f712c9SDave Chinner 	/*
103430f712c9SDave Chinner 	 * If the block order is wrong, swap the arguments.
103530f712c9SDave Chinner 	 */
103630f712c9SDave Chinner 	if ((swap = xfs_dir2_leafn_order(dp, blk1->bp, blk2->bp))) {
103730f712c9SDave Chinner 		xfs_da_state_blk_t	*tmp;	/* temp for block swap */
103830f712c9SDave Chinner 
103930f712c9SDave Chinner 		tmp = blk1;
104030f712c9SDave Chinner 		blk1 = blk2;
104130f712c9SDave Chinner 		blk2 = tmp;
104230f712c9SDave Chinner 	}
104330f712c9SDave Chinner 	leaf1 = blk1->bp->b_addr;
104430f712c9SDave Chinner 	leaf2 = blk2->bp->b_addr;
104530f712c9SDave Chinner 	dp->d_ops->leaf_hdr_from_disk(&hdr1, leaf1);
104630f712c9SDave Chinner 	dp->d_ops->leaf_hdr_from_disk(&hdr2, leaf2);
104730f712c9SDave Chinner 	ents1 = dp->d_ops->leaf_ents_p(leaf1);
104830f712c9SDave Chinner 	ents2 = dp->d_ops->leaf_ents_p(leaf2);
104930f712c9SDave Chinner 
105030f712c9SDave Chinner 	oldsum = hdr1.count + hdr2.count;
105130f712c9SDave Chinner #if defined(DEBUG) || defined(XFS_WARN)
105230f712c9SDave Chinner 	oldstale = hdr1.stale + hdr2.stale;
105330f712c9SDave Chinner #endif
105430f712c9SDave Chinner 	mid = oldsum >> 1;
105530f712c9SDave Chinner 
105630f712c9SDave Chinner 	/*
105730f712c9SDave Chinner 	 * If the old leaf count was odd then the new one will be even,
105830f712c9SDave Chinner 	 * so we need to divide the new count evenly.
105930f712c9SDave Chinner 	 */
106030f712c9SDave Chinner 	if (oldsum & 1) {
106130f712c9SDave Chinner 		xfs_dahash_t	midhash;	/* middle entry hash value */
106230f712c9SDave Chinner 
106330f712c9SDave Chinner 		if (mid >= hdr1.count)
106430f712c9SDave Chinner 			midhash = be32_to_cpu(ents2[mid - hdr1.count].hashval);
106530f712c9SDave Chinner 		else
106630f712c9SDave Chinner 			midhash = be32_to_cpu(ents1[mid].hashval);
106730f712c9SDave Chinner 		isleft = args->hashval <= midhash;
106830f712c9SDave Chinner 	}
106930f712c9SDave Chinner 	/*
107030f712c9SDave Chinner 	 * If the old count is even then the new count is odd, so there's
107130f712c9SDave Chinner 	 * no preferred side for the new entry.
107230f712c9SDave Chinner 	 * Pick the left one.
107330f712c9SDave Chinner 	 */
107430f712c9SDave Chinner 	else
107530f712c9SDave Chinner 		isleft = 1;
107630f712c9SDave Chinner 	/*
107730f712c9SDave Chinner 	 * Calculate moved entry count.  Positive means left-to-right,
107830f712c9SDave Chinner 	 * negative means right-to-left.  Then move the entries.
107930f712c9SDave Chinner 	 */
108030f712c9SDave Chinner 	count = hdr1.count - mid + (isleft == 0);
108130f712c9SDave Chinner 	if (count > 0)
108230f712c9SDave Chinner 		xfs_dir3_leafn_moveents(args, blk1->bp, &hdr1, ents1,
108330f712c9SDave Chinner 					hdr1.count - count, blk2->bp,
108430f712c9SDave Chinner 					&hdr2, ents2, 0, count);
108530f712c9SDave Chinner 	else if (count < 0)
108630f712c9SDave Chinner 		xfs_dir3_leafn_moveents(args, blk2->bp, &hdr2, ents2, 0,
108730f712c9SDave Chinner 					blk1->bp, &hdr1, ents1,
108830f712c9SDave Chinner 					hdr1.count, count);
108930f712c9SDave Chinner 
109030f712c9SDave Chinner 	ASSERT(hdr1.count + hdr2.count == oldsum);
109130f712c9SDave Chinner 	ASSERT(hdr1.stale + hdr2.stale == oldstale);
109230f712c9SDave Chinner 
109330f712c9SDave Chinner 	/* log the changes made when moving the entries */
109430f712c9SDave Chinner 	dp->d_ops->leaf_hdr_to_disk(leaf1, &hdr1);
109530f712c9SDave Chinner 	dp->d_ops->leaf_hdr_to_disk(leaf2, &hdr2);
109630f712c9SDave Chinner 	xfs_dir3_leaf_log_header(args, blk1->bp);
109730f712c9SDave Chinner 	xfs_dir3_leaf_log_header(args, blk2->bp);
109830f712c9SDave Chinner 
109930f712c9SDave Chinner 	xfs_dir3_leaf_check(dp, blk1->bp);
110030f712c9SDave Chinner 	xfs_dir3_leaf_check(dp, blk2->bp);
110130f712c9SDave Chinner 
110230f712c9SDave Chinner 	/*
110330f712c9SDave Chinner 	 * Mark whether we're inserting into the old or new leaf.
110430f712c9SDave Chinner 	 */
110530f712c9SDave Chinner 	if (hdr1.count < hdr2.count)
110630f712c9SDave Chinner 		state->inleaf = swap;
110730f712c9SDave Chinner 	else if (hdr1.count > hdr2.count)
110830f712c9SDave Chinner 		state->inleaf = !swap;
110930f712c9SDave Chinner 	else
111030f712c9SDave Chinner 		state->inleaf = swap ^ (blk1->index <= hdr1.count);
111130f712c9SDave Chinner 	/*
111230f712c9SDave Chinner 	 * Adjust the expected index for insertion.
111330f712c9SDave Chinner 	 */
111430f712c9SDave Chinner 	if (!state->inleaf)
111530f712c9SDave Chinner 		blk2->index = blk1->index - hdr1.count;
111630f712c9SDave Chinner 
111730f712c9SDave Chinner 	/*
111830f712c9SDave Chinner 	 * Finally sanity check just to make sure we are not returning a
111930f712c9SDave Chinner 	 * negative index
112030f712c9SDave Chinner 	 */
112130f712c9SDave Chinner 	if (blk2->index < 0) {
112230f712c9SDave Chinner 		state->inleaf = 1;
112330f712c9SDave Chinner 		blk2->index = 0;
112430f712c9SDave Chinner 		xfs_alert(dp->i_mount,
112530f712c9SDave Chinner 	"%s: picked the wrong leaf? reverting original leaf: blk1->index %d",
112630f712c9SDave Chinner 			__func__, blk1->index);
112730f712c9SDave Chinner 	}
112830f712c9SDave Chinner }
112930f712c9SDave Chinner 
113030f712c9SDave Chinner static int
113130f712c9SDave Chinner xfs_dir3_data_block_free(
113230f712c9SDave Chinner 	xfs_da_args_t		*args,
113330f712c9SDave Chinner 	struct xfs_dir2_data_hdr *hdr,
113430f712c9SDave Chinner 	struct xfs_dir2_free	*free,
113530f712c9SDave Chinner 	xfs_dir2_db_t		fdb,
113630f712c9SDave Chinner 	int			findex,
113730f712c9SDave Chinner 	struct xfs_buf		*fbp,
113830f712c9SDave Chinner 	int			longest)
113930f712c9SDave Chinner {
114030f712c9SDave Chinner 	int			logfree = 0;
114130f712c9SDave Chinner 	__be16			*bests;
114230f712c9SDave Chinner 	struct xfs_dir3_icfree_hdr freehdr;
114330f712c9SDave Chinner 	struct xfs_inode	*dp = args->dp;
114430f712c9SDave Chinner 
114530f712c9SDave Chinner 	dp->d_ops->free_hdr_from_disk(&freehdr, free);
114630f712c9SDave Chinner 	bests = dp->d_ops->free_bests_p(free);
114730f712c9SDave Chinner 	if (hdr) {
114830f712c9SDave Chinner 		/*
114930f712c9SDave Chinner 		 * Data block is not empty, just set the free entry to the new
115030f712c9SDave Chinner 		 * value.
115130f712c9SDave Chinner 		 */
115230f712c9SDave Chinner 		bests[findex] = cpu_to_be16(longest);
115330f712c9SDave Chinner 		xfs_dir2_free_log_bests(args, fbp, findex, findex);
115430f712c9SDave Chinner 		return 0;
115530f712c9SDave Chinner 	}
115630f712c9SDave Chinner 
115730f712c9SDave Chinner 	/* One less used entry in the free table. */
115830f712c9SDave Chinner 	freehdr.nused--;
115930f712c9SDave Chinner 
116030f712c9SDave Chinner 	/*
116130f712c9SDave Chinner 	 * If this was the last entry in the table, we can trim the table size
116230f712c9SDave Chinner 	 * back.  There might be other entries at the end referring to
116330f712c9SDave Chinner 	 * non-existent data blocks, get those too.
116430f712c9SDave Chinner 	 */
116530f712c9SDave Chinner 	if (findex == freehdr.nvalid - 1) {
116630f712c9SDave Chinner 		int	i;		/* free entry index */
116730f712c9SDave Chinner 
116830f712c9SDave Chinner 		for (i = findex - 1; i >= 0; i--) {
116930f712c9SDave Chinner 			if (bests[i] != cpu_to_be16(NULLDATAOFF))
117030f712c9SDave Chinner 				break;
117130f712c9SDave Chinner 		}
117230f712c9SDave Chinner 		freehdr.nvalid = i + 1;
117330f712c9SDave Chinner 		logfree = 0;
117430f712c9SDave Chinner 	} else {
117530f712c9SDave Chinner 		/* Not the last entry, just punch it out.  */
117630f712c9SDave Chinner 		bests[findex] = cpu_to_be16(NULLDATAOFF);
117730f712c9SDave Chinner 		logfree = 1;
117830f712c9SDave Chinner 	}
117930f712c9SDave Chinner 
118030f712c9SDave Chinner 	dp->d_ops->free_hdr_to_disk(free, &freehdr);
118130f712c9SDave Chinner 	xfs_dir2_free_log_header(args, fbp);
118230f712c9SDave Chinner 
118330f712c9SDave Chinner 	/*
118430f712c9SDave Chinner 	 * If there are no useful entries left in the block, get rid of the
118530f712c9SDave Chinner 	 * block if we can.
118630f712c9SDave Chinner 	 */
118730f712c9SDave Chinner 	if (!freehdr.nused) {
118830f712c9SDave Chinner 		int error;
118930f712c9SDave Chinner 
119030f712c9SDave Chinner 		error = xfs_dir2_shrink_inode(args, fdb, fbp);
119130f712c9SDave Chinner 		if (error == 0) {
119230f712c9SDave Chinner 			fbp = NULL;
119330f712c9SDave Chinner 			logfree = 0;
11942451337dSDave Chinner 		} else if (error != -ENOSPC || args->total != 0)
119530f712c9SDave Chinner 			return error;
119630f712c9SDave Chinner 		/*
119730f712c9SDave Chinner 		 * It's possible to get ENOSPC if there is no
119830f712c9SDave Chinner 		 * space reservation.  In this case some one
119930f712c9SDave Chinner 		 * else will eventually get rid of this block.
120030f712c9SDave Chinner 		 */
120130f712c9SDave Chinner 	}
120230f712c9SDave Chinner 
120330f712c9SDave Chinner 	/* Log the free entry that changed, unless we got rid of it.  */
120430f712c9SDave Chinner 	if (logfree)
120530f712c9SDave Chinner 		xfs_dir2_free_log_bests(args, fbp, findex, findex);
120630f712c9SDave Chinner 	return 0;
120730f712c9SDave Chinner }
120830f712c9SDave Chinner 
120930f712c9SDave Chinner /*
121030f712c9SDave Chinner  * Remove an entry from a node directory.
121130f712c9SDave Chinner  * This removes the leaf entry and the data entry,
121230f712c9SDave Chinner  * and updates the free block if necessary.
121330f712c9SDave Chinner  */
121430f712c9SDave Chinner static int					/* error */
121530f712c9SDave Chinner xfs_dir2_leafn_remove(
121630f712c9SDave Chinner 	xfs_da_args_t		*args,		/* operation arguments */
121730f712c9SDave Chinner 	struct xfs_buf		*bp,		/* leaf buffer */
121830f712c9SDave Chinner 	int			index,		/* leaf entry index */
121930f712c9SDave Chinner 	xfs_da_state_blk_t	*dblk,		/* data block */
122030f712c9SDave Chinner 	int			*rval)		/* resulting block needs join */
122130f712c9SDave Chinner {
122230f712c9SDave Chinner 	xfs_dir2_data_hdr_t	*hdr;		/* data block header */
122330f712c9SDave Chinner 	xfs_dir2_db_t		db;		/* data block number */
122430f712c9SDave Chinner 	struct xfs_buf		*dbp;		/* data block buffer */
122530f712c9SDave Chinner 	xfs_dir2_data_entry_t	*dep;		/* data block entry */
122630f712c9SDave Chinner 	xfs_inode_t		*dp;		/* incore directory inode */
122730f712c9SDave Chinner 	xfs_dir2_leaf_t		*leaf;		/* leaf structure */
122830f712c9SDave Chinner 	xfs_dir2_leaf_entry_t	*lep;		/* leaf entry */
122930f712c9SDave Chinner 	int			longest;	/* longest data free entry */
123030f712c9SDave Chinner 	int			off;		/* data block entry offset */
123130f712c9SDave Chinner 	int			needlog;	/* need to log data header */
123230f712c9SDave Chinner 	int			needscan;	/* need to rescan data frees */
123330f712c9SDave Chinner 	xfs_trans_t		*tp;		/* transaction pointer */
123430f712c9SDave Chinner 	struct xfs_dir2_data_free *bf;		/* bestfree table */
123530f712c9SDave Chinner 	struct xfs_dir3_icleaf_hdr leafhdr;
123630f712c9SDave Chinner 	struct xfs_dir2_leaf_entry *ents;
123730f712c9SDave Chinner 
123830f712c9SDave Chinner 	trace_xfs_dir2_leafn_remove(args, index);
123930f712c9SDave Chinner 
124030f712c9SDave Chinner 	dp = args->dp;
124130f712c9SDave Chinner 	tp = args->trans;
124230f712c9SDave Chinner 	leaf = bp->b_addr;
124330f712c9SDave Chinner 	dp->d_ops->leaf_hdr_from_disk(&leafhdr, leaf);
124430f712c9SDave Chinner 	ents = dp->d_ops->leaf_ents_p(leaf);
124530f712c9SDave Chinner 
124630f712c9SDave Chinner 	/*
124730f712c9SDave Chinner 	 * Point to the entry we're removing.
124830f712c9SDave Chinner 	 */
124930f712c9SDave Chinner 	lep = &ents[index];
125030f712c9SDave Chinner 
125130f712c9SDave Chinner 	/*
125230f712c9SDave Chinner 	 * Extract the data block and offset from the entry.
125330f712c9SDave Chinner 	 */
125430f712c9SDave Chinner 	db = xfs_dir2_dataptr_to_db(args->geo, be32_to_cpu(lep->address));
125530f712c9SDave Chinner 	ASSERT(dblk->blkno == db);
125630f712c9SDave Chinner 	off = xfs_dir2_dataptr_to_off(args->geo, be32_to_cpu(lep->address));
125730f712c9SDave Chinner 	ASSERT(dblk->index == off);
125830f712c9SDave Chinner 
125930f712c9SDave Chinner 	/*
126030f712c9SDave Chinner 	 * Kill the leaf entry by marking it stale.
126130f712c9SDave Chinner 	 * Log the leaf block changes.
126230f712c9SDave Chinner 	 */
126330f712c9SDave Chinner 	leafhdr.stale++;
126430f712c9SDave Chinner 	dp->d_ops->leaf_hdr_to_disk(leaf, &leafhdr);
126530f712c9SDave Chinner 	xfs_dir3_leaf_log_header(args, bp);
126630f712c9SDave Chinner 
126730f712c9SDave Chinner 	lep->address = cpu_to_be32(XFS_DIR2_NULL_DATAPTR);
126830f712c9SDave Chinner 	xfs_dir3_leaf_log_ents(args, bp, index, index);
126930f712c9SDave Chinner 
127030f712c9SDave Chinner 	/*
127130f712c9SDave Chinner 	 * Make the data entry free.  Keep track of the longest freespace
127230f712c9SDave Chinner 	 * in the data block in case it changes.
127330f712c9SDave Chinner 	 */
127430f712c9SDave Chinner 	dbp = dblk->bp;
127530f712c9SDave Chinner 	hdr = dbp->b_addr;
127630f712c9SDave Chinner 	dep = (xfs_dir2_data_entry_t *)((char *)hdr + off);
127730f712c9SDave Chinner 	bf = dp->d_ops->data_bestfree_p(hdr);
127830f712c9SDave Chinner 	longest = be16_to_cpu(bf[0].length);
127930f712c9SDave Chinner 	needlog = needscan = 0;
128030f712c9SDave Chinner 	xfs_dir2_data_make_free(args, dbp, off,
128130f712c9SDave Chinner 		dp->d_ops->data_entsize(dep->namelen), &needlog, &needscan);
128230f712c9SDave Chinner 	/*
128330f712c9SDave Chinner 	 * Rescan the data block freespaces for bestfree.
128430f712c9SDave Chinner 	 * Log the data block header if needed.
128530f712c9SDave Chinner 	 */
128630f712c9SDave Chinner 	if (needscan)
128730f712c9SDave Chinner 		xfs_dir2_data_freescan(dp, hdr, &needlog);
128830f712c9SDave Chinner 	if (needlog)
128930f712c9SDave Chinner 		xfs_dir2_data_log_header(args, dbp);
129030f712c9SDave Chinner 	xfs_dir3_data_check(dp, dbp);
129130f712c9SDave Chinner 	/*
129230f712c9SDave Chinner 	 * If the longest data block freespace changes, need to update
129330f712c9SDave Chinner 	 * the corresponding freeblock entry.
129430f712c9SDave Chinner 	 */
129530f712c9SDave Chinner 	if (longest < be16_to_cpu(bf[0].length)) {
129630f712c9SDave Chinner 		int		error;		/* error return value */
129730f712c9SDave Chinner 		struct xfs_buf	*fbp;		/* freeblock buffer */
129830f712c9SDave Chinner 		xfs_dir2_db_t	fdb;		/* freeblock block number */
129930f712c9SDave Chinner 		int		findex;		/* index in freeblock entries */
130030f712c9SDave Chinner 		xfs_dir2_free_t	*free;		/* freeblock structure */
130130f712c9SDave Chinner 
130230f712c9SDave Chinner 		/*
130330f712c9SDave Chinner 		 * Convert the data block number to a free block,
130430f712c9SDave Chinner 		 * read in the free block.
130530f712c9SDave Chinner 		 */
130630f712c9SDave Chinner 		fdb = dp->d_ops->db_to_fdb(args->geo, db);
130730f712c9SDave Chinner 		error = xfs_dir2_free_read(tp, dp,
130830f712c9SDave Chinner 					   xfs_dir2_db_to_da(args->geo, fdb),
130930f712c9SDave Chinner 					   &fbp);
131030f712c9SDave Chinner 		if (error)
131130f712c9SDave Chinner 			return error;
131230f712c9SDave Chinner 		free = fbp->b_addr;
131330f712c9SDave Chinner #ifdef DEBUG
131430f712c9SDave Chinner 	{
131530f712c9SDave Chinner 		struct xfs_dir3_icfree_hdr freehdr;
131630f712c9SDave Chinner 		dp->d_ops->free_hdr_from_disk(&freehdr, free);
131730f712c9SDave Chinner 		ASSERT(freehdr.firstdb == dp->d_ops->free_max_bests(args->geo) *
131830f712c9SDave Chinner 			(fdb - xfs_dir2_byte_to_db(args->geo,
131930f712c9SDave Chinner 						   XFS_DIR2_FREE_OFFSET)));
132030f712c9SDave Chinner 	}
132130f712c9SDave Chinner #endif
132230f712c9SDave Chinner 		/*
132330f712c9SDave Chinner 		 * Calculate which entry we need to fix.
132430f712c9SDave Chinner 		 */
132530f712c9SDave Chinner 		findex = dp->d_ops->db_to_fdindex(args->geo, db);
132630f712c9SDave Chinner 		longest = be16_to_cpu(bf[0].length);
132730f712c9SDave Chinner 		/*
132830f712c9SDave Chinner 		 * If the data block is now empty we can get rid of it
132930f712c9SDave Chinner 		 * (usually).
133030f712c9SDave Chinner 		 */
133130f712c9SDave Chinner 		if (longest == args->geo->blksize -
133230f712c9SDave Chinner 			       dp->d_ops->data_entry_offset) {
133330f712c9SDave Chinner 			/*
133430f712c9SDave Chinner 			 * Try to punch out the data block.
133530f712c9SDave Chinner 			 */
133630f712c9SDave Chinner 			error = xfs_dir2_shrink_inode(args, db, dbp);
133730f712c9SDave Chinner 			if (error == 0) {
133830f712c9SDave Chinner 				dblk->bp = NULL;
133930f712c9SDave Chinner 				hdr = NULL;
134030f712c9SDave Chinner 			}
134130f712c9SDave Chinner 			/*
134230f712c9SDave Chinner 			 * We can get ENOSPC if there's no space reservation.
134330f712c9SDave Chinner 			 * In this case just drop the buffer and some one else
134430f712c9SDave Chinner 			 * will eventually get rid of the empty block.
134530f712c9SDave Chinner 			 */
13462451337dSDave Chinner 			else if (!(error == -ENOSPC && args->total == 0))
134730f712c9SDave Chinner 				return error;
134830f712c9SDave Chinner 		}
134930f712c9SDave Chinner 		/*
135030f712c9SDave Chinner 		 * If we got rid of the data block, we can eliminate that entry
135130f712c9SDave Chinner 		 * in the free block.
135230f712c9SDave Chinner 		 */
135330f712c9SDave Chinner 		error = xfs_dir3_data_block_free(args, hdr, free,
135430f712c9SDave Chinner 						 fdb, findex, fbp, longest);
135530f712c9SDave Chinner 		if (error)
135630f712c9SDave Chinner 			return error;
135730f712c9SDave Chinner 	}
135830f712c9SDave Chinner 
135930f712c9SDave Chinner 	xfs_dir3_leaf_check(dp, bp);
136030f712c9SDave Chinner 	/*
136130f712c9SDave Chinner 	 * Return indication of whether this leaf block is empty enough
136230f712c9SDave Chinner 	 * to justify trying to join it with a neighbor.
136330f712c9SDave Chinner 	 */
136430f712c9SDave Chinner 	*rval = (dp->d_ops->leaf_hdr_size +
136530f712c9SDave Chinner 		 (uint)sizeof(ents[0]) * (leafhdr.count - leafhdr.stale)) <
136630f712c9SDave Chinner 		args->geo->magicpct;
136730f712c9SDave Chinner 	return 0;
136830f712c9SDave Chinner }
136930f712c9SDave Chinner 
137030f712c9SDave Chinner /*
137130f712c9SDave Chinner  * Split the leaf entries in the old block into old and new blocks.
137230f712c9SDave Chinner  */
137330f712c9SDave Chinner int						/* error */
137430f712c9SDave Chinner xfs_dir2_leafn_split(
137530f712c9SDave Chinner 	xfs_da_state_t		*state,		/* btree cursor */
137630f712c9SDave Chinner 	xfs_da_state_blk_t	*oldblk,	/* original block */
137730f712c9SDave Chinner 	xfs_da_state_blk_t	*newblk)	/* newly created block */
137830f712c9SDave Chinner {
137930f712c9SDave Chinner 	xfs_da_args_t		*args;		/* operation arguments */
138030f712c9SDave Chinner 	xfs_dablk_t		blkno;		/* new leaf block number */
138130f712c9SDave Chinner 	int			error;		/* error return value */
138230f712c9SDave Chinner 	struct xfs_inode	*dp;
138330f712c9SDave Chinner 
138430f712c9SDave Chinner 	/*
138530f712c9SDave Chinner 	 * Allocate space for a new leaf node.
138630f712c9SDave Chinner 	 */
138730f712c9SDave Chinner 	args = state->args;
138830f712c9SDave Chinner 	dp = args->dp;
138930f712c9SDave Chinner 	ASSERT(oldblk->magic == XFS_DIR2_LEAFN_MAGIC);
139030f712c9SDave Chinner 	error = xfs_da_grow_inode(args, &blkno);
139130f712c9SDave Chinner 	if (error) {
139230f712c9SDave Chinner 		return error;
139330f712c9SDave Chinner 	}
139430f712c9SDave Chinner 	/*
139530f712c9SDave Chinner 	 * Initialize the new leaf block.
139630f712c9SDave Chinner 	 */
139730f712c9SDave Chinner 	error = xfs_dir3_leaf_get_buf(args, xfs_dir2_da_to_db(args->geo, blkno),
139830f712c9SDave Chinner 				      &newblk->bp, XFS_DIR2_LEAFN_MAGIC);
139930f712c9SDave Chinner 	if (error)
140030f712c9SDave Chinner 		return error;
140130f712c9SDave Chinner 
140230f712c9SDave Chinner 	newblk->blkno = blkno;
140330f712c9SDave Chinner 	newblk->magic = XFS_DIR2_LEAFN_MAGIC;
140430f712c9SDave Chinner 	/*
140530f712c9SDave Chinner 	 * Rebalance the entries across the two leaves, link the new
140630f712c9SDave Chinner 	 * block into the leaves.
140730f712c9SDave Chinner 	 */
140830f712c9SDave Chinner 	xfs_dir2_leafn_rebalance(state, oldblk, newblk);
140930f712c9SDave Chinner 	error = xfs_da3_blk_link(state, oldblk, newblk);
141030f712c9SDave Chinner 	if (error) {
141130f712c9SDave Chinner 		return error;
141230f712c9SDave Chinner 	}
141330f712c9SDave Chinner 	/*
141430f712c9SDave Chinner 	 * Insert the new entry in the correct block.
141530f712c9SDave Chinner 	 */
141630f712c9SDave Chinner 	if (state->inleaf)
141730f712c9SDave Chinner 		error = xfs_dir2_leafn_add(oldblk->bp, args, oldblk->index);
141830f712c9SDave Chinner 	else
141930f712c9SDave Chinner 		error = xfs_dir2_leafn_add(newblk->bp, args, newblk->index);
142030f712c9SDave Chinner 	/*
142130f712c9SDave Chinner 	 * Update last hashval in each block since we added the name.
142230f712c9SDave Chinner 	 */
14238e8877e6SDarrick J. Wong 	oldblk->hashval = xfs_dir2_leaf_lasthash(dp, oldblk->bp, NULL);
14248e8877e6SDarrick J. Wong 	newblk->hashval = xfs_dir2_leaf_lasthash(dp, newblk->bp, NULL);
142530f712c9SDave Chinner 	xfs_dir3_leaf_check(dp, oldblk->bp);
142630f712c9SDave Chinner 	xfs_dir3_leaf_check(dp, newblk->bp);
142730f712c9SDave Chinner 	return error;
142830f712c9SDave Chinner }
142930f712c9SDave Chinner 
143030f712c9SDave Chinner /*
143130f712c9SDave Chinner  * Check a leaf block and its neighbors to see if the block should be
143230f712c9SDave Chinner  * collapsed into one or the other neighbor.  Always keep the block
143330f712c9SDave Chinner  * with the smaller block number.
143430f712c9SDave Chinner  * If the current block is over 50% full, don't try to join it, return 0.
143530f712c9SDave Chinner  * If the block is empty, fill in the state structure and return 2.
143630f712c9SDave Chinner  * If it can be collapsed, fill in the state structure and return 1.
143730f712c9SDave Chinner  * If nothing can be done, return 0.
143830f712c9SDave Chinner  */
143930f712c9SDave Chinner int						/* error */
144030f712c9SDave Chinner xfs_dir2_leafn_toosmall(
144130f712c9SDave Chinner 	xfs_da_state_t		*state,		/* btree cursor */
144230f712c9SDave Chinner 	int			*action)	/* resulting action to take */
144330f712c9SDave Chinner {
144430f712c9SDave Chinner 	xfs_da_state_blk_t	*blk;		/* leaf block */
144530f712c9SDave Chinner 	xfs_dablk_t		blkno;		/* leaf block number */
144630f712c9SDave Chinner 	struct xfs_buf		*bp;		/* leaf buffer */
144730f712c9SDave Chinner 	int			bytes;		/* bytes in use */
144830f712c9SDave Chinner 	int			count;		/* leaf live entry count */
144930f712c9SDave Chinner 	int			error;		/* error return value */
145030f712c9SDave Chinner 	int			forward;	/* sibling block direction */
145130f712c9SDave Chinner 	int			i;		/* sibling counter */
145230f712c9SDave Chinner 	xfs_dir2_leaf_t		*leaf;		/* leaf structure */
145330f712c9SDave Chinner 	int			rval;		/* result from path_shift */
145430f712c9SDave Chinner 	struct xfs_dir3_icleaf_hdr leafhdr;
145530f712c9SDave Chinner 	struct xfs_dir2_leaf_entry *ents;
145630f712c9SDave Chinner 	struct xfs_inode	*dp = state->args->dp;
145730f712c9SDave Chinner 
145830f712c9SDave Chinner 	/*
145930f712c9SDave Chinner 	 * Check for the degenerate case of the block being over 50% full.
146030f712c9SDave Chinner 	 * If so, it's not worth even looking to see if we might be able
146130f712c9SDave Chinner 	 * to coalesce with a sibling.
146230f712c9SDave Chinner 	 */
146330f712c9SDave Chinner 	blk = &state->path.blk[state->path.active - 1];
146430f712c9SDave Chinner 	leaf = blk->bp->b_addr;
146530f712c9SDave Chinner 	dp->d_ops->leaf_hdr_from_disk(&leafhdr, leaf);
146630f712c9SDave Chinner 	ents = dp->d_ops->leaf_ents_p(leaf);
146730f712c9SDave Chinner 	xfs_dir3_leaf_check(dp, blk->bp);
146830f712c9SDave Chinner 
146930f712c9SDave Chinner 	count = leafhdr.count - leafhdr.stale;
147030f712c9SDave Chinner 	bytes = dp->d_ops->leaf_hdr_size + count * sizeof(ents[0]);
147130f712c9SDave Chinner 	if (bytes > (state->args->geo->blksize >> 1)) {
147230f712c9SDave Chinner 		/*
147330f712c9SDave Chinner 		 * Blk over 50%, don't try to join.
147430f712c9SDave Chinner 		 */
147530f712c9SDave Chinner 		*action = 0;
147630f712c9SDave Chinner 		return 0;
147730f712c9SDave Chinner 	}
147830f712c9SDave Chinner 	/*
147930f712c9SDave Chinner 	 * Check for the degenerate case of the block being empty.
148030f712c9SDave Chinner 	 * If the block is empty, we'll simply delete it, no need to
148130f712c9SDave Chinner 	 * coalesce it with a sibling block.  We choose (arbitrarily)
148230f712c9SDave Chinner 	 * to merge with the forward block unless it is NULL.
148330f712c9SDave Chinner 	 */
148430f712c9SDave Chinner 	if (count == 0) {
148530f712c9SDave Chinner 		/*
148630f712c9SDave Chinner 		 * Make altpath point to the block we want to keep and
148730f712c9SDave Chinner 		 * path point to the block we want to drop (this one).
148830f712c9SDave Chinner 		 */
148930f712c9SDave Chinner 		forward = (leafhdr.forw != 0);
149030f712c9SDave Chinner 		memcpy(&state->altpath, &state->path, sizeof(state->path));
149130f712c9SDave Chinner 		error = xfs_da3_path_shift(state, &state->altpath, forward, 0,
149230f712c9SDave Chinner 			&rval);
149330f712c9SDave Chinner 		if (error)
149430f712c9SDave Chinner 			return error;
149530f712c9SDave Chinner 		*action = rval ? 2 : 0;
149630f712c9SDave Chinner 		return 0;
149730f712c9SDave Chinner 	}
149830f712c9SDave Chinner 	/*
149930f712c9SDave Chinner 	 * Examine each sibling block to see if we can coalesce with
150030f712c9SDave Chinner 	 * at least 25% free space to spare.  We need to figure out
150130f712c9SDave Chinner 	 * whether to merge with the forward or the backward block.
150230f712c9SDave Chinner 	 * We prefer coalescing with the lower numbered sibling so as
150330f712c9SDave Chinner 	 * to shrink a directory over time.
150430f712c9SDave Chinner 	 */
150530f712c9SDave Chinner 	forward = leafhdr.forw < leafhdr.back;
150630f712c9SDave Chinner 	for (i = 0, bp = NULL; i < 2; forward = !forward, i++) {
150730f712c9SDave Chinner 		struct xfs_dir3_icleaf_hdr hdr2;
150830f712c9SDave Chinner 
150930f712c9SDave Chinner 		blkno = forward ? leafhdr.forw : leafhdr.back;
151030f712c9SDave Chinner 		if (blkno == 0)
151130f712c9SDave Chinner 			continue;
151230f712c9SDave Chinner 		/*
151330f712c9SDave Chinner 		 * Read the sibling leaf block.
151430f712c9SDave Chinner 		 */
151530f712c9SDave Chinner 		error = xfs_dir3_leafn_read(state->args->trans, dp,
151630f712c9SDave Chinner 					    blkno, -1, &bp);
151730f712c9SDave Chinner 		if (error)
151830f712c9SDave Chinner 			return error;
151930f712c9SDave Chinner 
152030f712c9SDave Chinner 		/*
152130f712c9SDave Chinner 		 * Count bytes in the two blocks combined.
152230f712c9SDave Chinner 		 */
152330f712c9SDave Chinner 		count = leafhdr.count - leafhdr.stale;
152430f712c9SDave Chinner 		bytes = state->args->geo->blksize -
152530f712c9SDave Chinner 			(state->args->geo->blksize >> 2);
152630f712c9SDave Chinner 
152730f712c9SDave Chinner 		leaf = bp->b_addr;
152830f712c9SDave Chinner 		dp->d_ops->leaf_hdr_from_disk(&hdr2, leaf);
152930f712c9SDave Chinner 		ents = dp->d_ops->leaf_ents_p(leaf);
153030f712c9SDave Chinner 		count += hdr2.count - hdr2.stale;
153130f712c9SDave Chinner 		bytes -= count * sizeof(ents[0]);
153230f712c9SDave Chinner 
153330f712c9SDave Chinner 		/*
153430f712c9SDave Chinner 		 * Fits with at least 25% to spare.
153530f712c9SDave Chinner 		 */
153630f712c9SDave Chinner 		if (bytes >= 0)
153730f712c9SDave Chinner 			break;
153830f712c9SDave Chinner 		xfs_trans_brelse(state->args->trans, bp);
153930f712c9SDave Chinner 	}
154030f712c9SDave Chinner 	/*
154130f712c9SDave Chinner 	 * Didn't like either block, give up.
154230f712c9SDave Chinner 	 */
154330f712c9SDave Chinner 	if (i >= 2) {
154430f712c9SDave Chinner 		*action = 0;
154530f712c9SDave Chinner 		return 0;
154630f712c9SDave Chinner 	}
154730f712c9SDave Chinner 
154830f712c9SDave Chinner 	/*
154930f712c9SDave Chinner 	 * Make altpath point to the block we want to keep (the lower
155030f712c9SDave Chinner 	 * numbered block) and path point to the block we want to drop.
155130f712c9SDave Chinner 	 */
155230f712c9SDave Chinner 	memcpy(&state->altpath, &state->path, sizeof(state->path));
155330f712c9SDave Chinner 	if (blkno < blk->blkno)
155430f712c9SDave Chinner 		error = xfs_da3_path_shift(state, &state->altpath, forward, 0,
155530f712c9SDave Chinner 			&rval);
155630f712c9SDave Chinner 	else
155730f712c9SDave Chinner 		error = xfs_da3_path_shift(state, &state->path, forward, 0,
155830f712c9SDave Chinner 			&rval);
155930f712c9SDave Chinner 	if (error) {
156030f712c9SDave Chinner 		return error;
156130f712c9SDave Chinner 	}
156230f712c9SDave Chinner 	*action = rval ? 0 : 1;
156330f712c9SDave Chinner 	return 0;
156430f712c9SDave Chinner }
156530f712c9SDave Chinner 
156630f712c9SDave Chinner /*
156730f712c9SDave Chinner  * Move all the leaf entries from drop_blk to save_blk.
156830f712c9SDave Chinner  * This is done as part of a join operation.
156930f712c9SDave Chinner  */
157030f712c9SDave Chinner void
157130f712c9SDave Chinner xfs_dir2_leafn_unbalance(
157230f712c9SDave Chinner 	xfs_da_state_t		*state,		/* cursor */
157330f712c9SDave Chinner 	xfs_da_state_blk_t	*drop_blk,	/* dead block */
157430f712c9SDave Chinner 	xfs_da_state_blk_t	*save_blk)	/* surviving block */
157530f712c9SDave Chinner {
157630f712c9SDave Chinner 	xfs_da_args_t		*args;		/* operation arguments */
157730f712c9SDave Chinner 	xfs_dir2_leaf_t		*drop_leaf;	/* dead leaf structure */
157830f712c9SDave Chinner 	xfs_dir2_leaf_t		*save_leaf;	/* surviving leaf structure */
157930f712c9SDave Chinner 	struct xfs_dir3_icleaf_hdr savehdr;
158030f712c9SDave Chinner 	struct xfs_dir3_icleaf_hdr drophdr;
158130f712c9SDave Chinner 	struct xfs_dir2_leaf_entry *sents;
158230f712c9SDave Chinner 	struct xfs_dir2_leaf_entry *dents;
158330f712c9SDave Chinner 	struct xfs_inode	*dp = state->args->dp;
158430f712c9SDave Chinner 
158530f712c9SDave Chinner 	args = state->args;
158630f712c9SDave Chinner 	ASSERT(drop_blk->magic == XFS_DIR2_LEAFN_MAGIC);
158730f712c9SDave Chinner 	ASSERT(save_blk->magic == XFS_DIR2_LEAFN_MAGIC);
158830f712c9SDave Chinner 	drop_leaf = drop_blk->bp->b_addr;
158930f712c9SDave Chinner 	save_leaf = save_blk->bp->b_addr;
159030f712c9SDave Chinner 
159130f712c9SDave Chinner 	dp->d_ops->leaf_hdr_from_disk(&savehdr, save_leaf);
159230f712c9SDave Chinner 	dp->d_ops->leaf_hdr_from_disk(&drophdr, drop_leaf);
159330f712c9SDave Chinner 	sents = dp->d_ops->leaf_ents_p(save_leaf);
159430f712c9SDave Chinner 	dents = dp->d_ops->leaf_ents_p(drop_leaf);
159530f712c9SDave Chinner 
159630f712c9SDave Chinner 	/*
159730f712c9SDave Chinner 	 * If there are any stale leaf entries, take this opportunity
159830f712c9SDave Chinner 	 * to purge them.
159930f712c9SDave Chinner 	 */
160030f712c9SDave Chinner 	if (drophdr.stale)
160130f712c9SDave Chinner 		xfs_dir3_leaf_compact(args, &drophdr, drop_blk->bp);
160230f712c9SDave Chinner 	if (savehdr.stale)
160330f712c9SDave Chinner 		xfs_dir3_leaf_compact(args, &savehdr, save_blk->bp);
160430f712c9SDave Chinner 
160530f712c9SDave Chinner 	/*
160630f712c9SDave Chinner 	 * Move the entries from drop to the appropriate end of save.
160730f712c9SDave Chinner 	 */
160830f712c9SDave Chinner 	drop_blk->hashval = be32_to_cpu(dents[drophdr.count - 1].hashval);
160930f712c9SDave Chinner 	if (xfs_dir2_leafn_order(dp, save_blk->bp, drop_blk->bp))
161030f712c9SDave Chinner 		xfs_dir3_leafn_moveents(args, drop_blk->bp, &drophdr, dents, 0,
161130f712c9SDave Chinner 					save_blk->bp, &savehdr, sents, 0,
161230f712c9SDave Chinner 					drophdr.count);
161330f712c9SDave Chinner 	else
161430f712c9SDave Chinner 		xfs_dir3_leafn_moveents(args, drop_blk->bp, &drophdr, dents, 0,
161530f712c9SDave Chinner 					save_blk->bp, &savehdr, sents,
161630f712c9SDave Chinner 					savehdr.count, drophdr.count);
161730f712c9SDave Chinner 	save_blk->hashval = be32_to_cpu(sents[savehdr.count - 1].hashval);
161830f712c9SDave Chinner 
161930f712c9SDave Chinner 	/* log the changes made when moving the entries */
162030f712c9SDave Chinner 	dp->d_ops->leaf_hdr_to_disk(save_leaf, &savehdr);
162130f712c9SDave Chinner 	dp->d_ops->leaf_hdr_to_disk(drop_leaf, &drophdr);
162230f712c9SDave Chinner 	xfs_dir3_leaf_log_header(args, save_blk->bp);
162330f712c9SDave Chinner 	xfs_dir3_leaf_log_header(args, drop_blk->bp);
162430f712c9SDave Chinner 
162530f712c9SDave Chinner 	xfs_dir3_leaf_check(dp, save_blk->bp);
162630f712c9SDave Chinner 	xfs_dir3_leaf_check(dp, drop_blk->bp);
162730f712c9SDave Chinner }
162830f712c9SDave Chinner 
162930f712c9SDave Chinner /*
163030f712c9SDave Chinner  * Top-level node form directory addname routine.
163130f712c9SDave Chinner  */
163230f712c9SDave Chinner int						/* error */
163330f712c9SDave Chinner xfs_dir2_node_addname(
163430f712c9SDave Chinner 	xfs_da_args_t		*args)		/* operation arguments */
163530f712c9SDave Chinner {
163630f712c9SDave Chinner 	xfs_da_state_blk_t	*blk;		/* leaf block for insert */
163730f712c9SDave Chinner 	int			error;		/* error return value */
163830f712c9SDave Chinner 	int			rval;		/* sub-return value */
163930f712c9SDave Chinner 	xfs_da_state_t		*state;		/* btree cursor */
164030f712c9SDave Chinner 
164130f712c9SDave Chinner 	trace_xfs_dir2_node_addname(args);
164230f712c9SDave Chinner 
164330f712c9SDave Chinner 	/*
164430f712c9SDave Chinner 	 * Allocate and initialize the state (btree cursor).
164530f712c9SDave Chinner 	 */
164630f712c9SDave Chinner 	state = xfs_da_state_alloc();
164730f712c9SDave Chinner 	state->args = args;
164830f712c9SDave Chinner 	state->mp = args->dp->i_mount;
164930f712c9SDave Chinner 	/*
165030f712c9SDave Chinner 	 * Look up the name.  We're not supposed to find it, but
165130f712c9SDave Chinner 	 * this gives us the insertion point.
165230f712c9SDave Chinner 	 */
165330f712c9SDave Chinner 	error = xfs_da3_node_lookup_int(state, &rval);
165430f712c9SDave Chinner 	if (error)
165530f712c9SDave Chinner 		rval = error;
16562451337dSDave Chinner 	if (rval != -ENOENT) {
165730f712c9SDave Chinner 		goto done;
165830f712c9SDave Chinner 	}
165930f712c9SDave Chinner 	/*
166030f712c9SDave Chinner 	 * Add the data entry to a data block.
166130f712c9SDave Chinner 	 * Extravalid is set to a freeblock found by lookup.
166230f712c9SDave Chinner 	 */
166330f712c9SDave Chinner 	rval = xfs_dir2_node_addname_int(args,
166430f712c9SDave Chinner 		state->extravalid ? &state->extrablk : NULL);
166530f712c9SDave Chinner 	if (rval) {
166630f712c9SDave Chinner 		goto done;
166730f712c9SDave Chinner 	}
166830f712c9SDave Chinner 	blk = &state->path.blk[state->path.active - 1];
166930f712c9SDave Chinner 	ASSERT(blk->magic == XFS_DIR2_LEAFN_MAGIC);
167030f712c9SDave Chinner 	/*
167130f712c9SDave Chinner 	 * Add the new leaf entry.
167230f712c9SDave Chinner 	 */
167330f712c9SDave Chinner 	rval = xfs_dir2_leafn_add(blk->bp, args, blk->index);
167430f712c9SDave Chinner 	if (rval == 0) {
167530f712c9SDave Chinner 		/*
167630f712c9SDave Chinner 		 * It worked, fix the hash values up the btree.
167730f712c9SDave Chinner 		 */
167830f712c9SDave Chinner 		if (!(args->op_flags & XFS_DA_OP_JUSTCHECK))
167930f712c9SDave Chinner 			xfs_da3_fixhashpath(state, &state->path);
168030f712c9SDave Chinner 	} else {
168130f712c9SDave Chinner 		/*
168230f712c9SDave Chinner 		 * It didn't work, we need to split the leaf block.
168330f712c9SDave Chinner 		 */
168430f712c9SDave Chinner 		if (args->total == 0) {
16852451337dSDave Chinner 			ASSERT(rval == -ENOSPC);
168630f712c9SDave Chinner 			goto done;
168730f712c9SDave Chinner 		}
168830f712c9SDave Chinner 		/*
168930f712c9SDave Chinner 		 * Split the leaf block and insert the new entry.
169030f712c9SDave Chinner 		 */
169130f712c9SDave Chinner 		rval = xfs_da3_split(state);
169230f712c9SDave Chinner 	}
169330f712c9SDave Chinner done:
169430f712c9SDave Chinner 	xfs_da_state_free(state);
169530f712c9SDave Chinner 	return rval;
169630f712c9SDave Chinner }
169730f712c9SDave Chinner 
169830f712c9SDave Chinner /*
169930f712c9SDave Chinner  * Add the data entry for a node-format directory name addition.
170030f712c9SDave Chinner  * The leaf entry is added in xfs_dir2_leafn_add.
170130f712c9SDave Chinner  * We may enter with a freespace block that the lookup found.
170230f712c9SDave Chinner  */
170330f712c9SDave Chinner static int					/* error */
170430f712c9SDave Chinner xfs_dir2_node_addname_int(
170530f712c9SDave Chinner 	xfs_da_args_t		*args,		/* operation arguments */
170630f712c9SDave Chinner 	xfs_da_state_blk_t	*fblk)		/* optional freespace block */
170730f712c9SDave Chinner {
170830f712c9SDave Chinner 	xfs_dir2_data_hdr_t	*hdr;		/* data block header */
170930f712c9SDave Chinner 	xfs_dir2_db_t		dbno;		/* data block number */
171030f712c9SDave Chinner 	struct xfs_buf		*dbp;		/* data block buffer */
171130f712c9SDave Chinner 	xfs_dir2_data_entry_t	*dep;		/* data entry pointer */
171230f712c9SDave Chinner 	xfs_inode_t		*dp;		/* incore directory inode */
171330f712c9SDave Chinner 	xfs_dir2_data_unused_t	*dup;		/* data unused entry pointer */
171430f712c9SDave Chinner 	int			error;		/* error return value */
171530f712c9SDave Chinner 	xfs_dir2_db_t		fbno;		/* freespace block number */
171630f712c9SDave Chinner 	struct xfs_buf		*fbp;		/* freespace buffer */
171730f712c9SDave Chinner 	int			findex;		/* freespace entry index */
171830f712c9SDave Chinner 	xfs_dir2_free_t		*free=NULL;	/* freespace block structure */
171930f712c9SDave Chinner 	xfs_dir2_db_t		ifbno;		/* initial freespace block no */
172030f712c9SDave Chinner 	xfs_dir2_db_t		lastfbno=0;	/* highest freespace block no */
172130f712c9SDave Chinner 	int			length;		/* length of the new entry */
172230f712c9SDave Chinner 	int			logfree;	/* need to log free entry */
172330f712c9SDave Chinner 	xfs_mount_t		*mp;		/* filesystem mount point */
172430f712c9SDave Chinner 	int			needlog;	/* need to log data header */
172530f712c9SDave Chinner 	int			needscan;	/* need to rescan data frees */
172630f712c9SDave Chinner 	__be16			*tagp;		/* data entry tag pointer */
172730f712c9SDave Chinner 	xfs_trans_t		*tp;		/* transaction pointer */
172830f712c9SDave Chinner 	__be16			*bests;
172930f712c9SDave Chinner 	struct xfs_dir3_icfree_hdr freehdr;
173030f712c9SDave Chinner 	struct xfs_dir2_data_free *bf;
173130f712c9SDave Chinner 
173230f712c9SDave Chinner 	dp = args->dp;
173330f712c9SDave Chinner 	mp = dp->i_mount;
173430f712c9SDave Chinner 	tp = args->trans;
173530f712c9SDave Chinner 	length = dp->d_ops->data_entsize(args->namelen);
173630f712c9SDave Chinner 	/*
173730f712c9SDave Chinner 	 * If we came in with a freespace block that means that lookup
173830f712c9SDave Chinner 	 * found an entry with our hash value.  This is the freespace
173930f712c9SDave Chinner 	 * block for that data entry.
174030f712c9SDave Chinner 	 */
174130f712c9SDave Chinner 	if (fblk) {
174230f712c9SDave Chinner 		fbp = fblk->bp;
174330f712c9SDave Chinner 		/*
174430f712c9SDave Chinner 		 * Remember initial freespace block number.
174530f712c9SDave Chinner 		 */
174630f712c9SDave Chinner 		ifbno = fblk->blkno;
174730f712c9SDave Chinner 		free = fbp->b_addr;
174830f712c9SDave Chinner 		findex = fblk->index;
174930f712c9SDave Chinner 		bests = dp->d_ops->free_bests_p(free);
175030f712c9SDave Chinner 		dp->d_ops->free_hdr_from_disk(&freehdr, free);
175130f712c9SDave Chinner 
175230f712c9SDave Chinner 		/*
175330f712c9SDave Chinner 		 * This means the free entry showed that the data block had
175430f712c9SDave Chinner 		 * space for our entry, so we remembered it.
175530f712c9SDave Chinner 		 * Use that data block.
175630f712c9SDave Chinner 		 */
175730f712c9SDave Chinner 		if (findex >= 0) {
175830f712c9SDave Chinner 			ASSERT(findex < freehdr.nvalid);
175930f712c9SDave Chinner 			ASSERT(be16_to_cpu(bests[findex]) != NULLDATAOFF);
176030f712c9SDave Chinner 			ASSERT(be16_to_cpu(bests[findex]) >= length);
176130f712c9SDave Chinner 			dbno = freehdr.firstdb + findex;
176230f712c9SDave Chinner 		} else {
176330f712c9SDave Chinner 			/*
176430f712c9SDave Chinner 			 * The data block looked at didn't have enough room.
176530f712c9SDave Chinner 			 * We'll start at the beginning of the freespace entries.
176630f712c9SDave Chinner 			 */
176730f712c9SDave Chinner 			dbno = -1;
176830f712c9SDave Chinner 			findex = 0;
176930f712c9SDave Chinner 		}
177030f712c9SDave Chinner 	} else {
177130f712c9SDave Chinner 		/*
177230f712c9SDave Chinner 		 * Didn't come in with a freespace block, so no data block.
177330f712c9SDave Chinner 		 */
177430f712c9SDave Chinner 		ifbno = dbno = -1;
177530f712c9SDave Chinner 		fbp = NULL;
177630f712c9SDave Chinner 		findex = 0;
177730f712c9SDave Chinner 	}
177830f712c9SDave Chinner 
177930f712c9SDave Chinner 	/*
178030f712c9SDave Chinner 	 * If we don't have a data block yet, we're going to scan the
178130f712c9SDave Chinner 	 * freespace blocks looking for one.  Figure out what the
178230f712c9SDave Chinner 	 * highest freespace block number is.
178330f712c9SDave Chinner 	 */
178430f712c9SDave Chinner 	if (dbno == -1) {
178530f712c9SDave Chinner 		xfs_fileoff_t	fo;		/* freespace block number */
178630f712c9SDave Chinner 
178730f712c9SDave Chinner 		if ((error = xfs_bmap_last_offset(dp, &fo, XFS_DATA_FORK)))
178830f712c9SDave Chinner 			return error;
178930f712c9SDave Chinner 		lastfbno = xfs_dir2_da_to_db(args->geo, (xfs_dablk_t)fo);
179030f712c9SDave Chinner 		fbno = ifbno;
179130f712c9SDave Chinner 	}
179230f712c9SDave Chinner 	/*
179330f712c9SDave Chinner 	 * While we haven't identified a data block, search the freeblock
179430f712c9SDave Chinner 	 * data for a good data block.  If we find a null freeblock entry,
179530f712c9SDave Chinner 	 * indicating a hole in the data blocks, remember that.
179630f712c9SDave Chinner 	 */
179730f712c9SDave Chinner 	while (dbno == -1) {
179830f712c9SDave Chinner 		/*
179930f712c9SDave Chinner 		 * If we don't have a freeblock in hand, get the next one.
180030f712c9SDave Chinner 		 */
180130f712c9SDave Chinner 		if (fbp == NULL) {
180230f712c9SDave Chinner 			/*
180330f712c9SDave Chinner 			 * Happens the first time through unless lookup gave
180430f712c9SDave Chinner 			 * us a freespace block to start with.
180530f712c9SDave Chinner 			 */
180630f712c9SDave Chinner 			if (++fbno == 0)
180730f712c9SDave Chinner 				fbno = xfs_dir2_byte_to_db(args->geo,
180830f712c9SDave Chinner 							XFS_DIR2_FREE_OFFSET);
180930f712c9SDave Chinner 			/*
181030f712c9SDave Chinner 			 * If it's ifbno we already looked at it.
181130f712c9SDave Chinner 			 */
181230f712c9SDave Chinner 			if (fbno == ifbno)
181330f712c9SDave Chinner 				fbno++;
181430f712c9SDave Chinner 			/*
181530f712c9SDave Chinner 			 * If it's off the end we're done.
181630f712c9SDave Chinner 			 */
181730f712c9SDave Chinner 			if (fbno >= lastfbno)
181830f712c9SDave Chinner 				break;
181930f712c9SDave Chinner 			/*
182030f712c9SDave Chinner 			 * Read the block.  There can be holes in the
182130f712c9SDave Chinner 			 * freespace blocks, so this might not succeed.
182230f712c9SDave Chinner 			 * This should be really rare, so there's no reason
182330f712c9SDave Chinner 			 * to avoid it.
182430f712c9SDave Chinner 			 */
182530f712c9SDave Chinner 			error = xfs_dir2_free_try_read(tp, dp,
182630f712c9SDave Chinner 					xfs_dir2_db_to_da(args->geo, fbno),
182730f712c9SDave Chinner 					&fbp);
182830f712c9SDave Chinner 			if (error)
182930f712c9SDave Chinner 				return error;
183030f712c9SDave Chinner 			if (!fbp)
183130f712c9SDave Chinner 				continue;
183230f712c9SDave Chinner 			free = fbp->b_addr;
183330f712c9SDave Chinner 			findex = 0;
183430f712c9SDave Chinner 		}
183530f712c9SDave Chinner 		/*
183630f712c9SDave Chinner 		 * Look at the current free entry.  Is it good enough?
183730f712c9SDave Chinner 		 *
183830f712c9SDave Chinner 		 * The bests initialisation should be where the buffer is read in
183930f712c9SDave Chinner 		 * the above branch. But gcc is too stupid to realise that bests
184030f712c9SDave Chinner 		 * and the freehdr are actually initialised if they are placed
184130f712c9SDave Chinner 		 * there, so we have to do it here to avoid warnings. Blech.
184230f712c9SDave Chinner 		 */
184330f712c9SDave Chinner 		bests = dp->d_ops->free_bests_p(free);
184430f712c9SDave Chinner 		dp->d_ops->free_hdr_from_disk(&freehdr, free);
184530f712c9SDave Chinner 		if (be16_to_cpu(bests[findex]) != NULLDATAOFF &&
184630f712c9SDave Chinner 		    be16_to_cpu(bests[findex]) >= length)
184730f712c9SDave Chinner 			dbno = freehdr.firstdb + findex;
184830f712c9SDave Chinner 		else {
184930f712c9SDave Chinner 			/*
185030f712c9SDave Chinner 			 * Are we done with the freeblock?
185130f712c9SDave Chinner 			 */
185230f712c9SDave Chinner 			if (++findex == freehdr.nvalid) {
185330f712c9SDave Chinner 				/*
185430f712c9SDave Chinner 				 * Drop the block.
185530f712c9SDave Chinner 				 */
185630f712c9SDave Chinner 				xfs_trans_brelse(tp, fbp);
185730f712c9SDave Chinner 				fbp = NULL;
185830f712c9SDave Chinner 				if (fblk && fblk->bp)
185930f712c9SDave Chinner 					fblk->bp = NULL;
186030f712c9SDave Chinner 			}
186130f712c9SDave Chinner 		}
186230f712c9SDave Chinner 	}
186330f712c9SDave Chinner 	/*
186430f712c9SDave Chinner 	 * If we don't have a data block, we need to allocate one and make
186530f712c9SDave Chinner 	 * the freespace entries refer to it.
186630f712c9SDave Chinner 	 */
186730f712c9SDave Chinner 	if (unlikely(dbno == -1)) {
186830f712c9SDave Chinner 		/*
186930f712c9SDave Chinner 		 * Not allowed to allocate, return failure.
187030f712c9SDave Chinner 		 */
187130f712c9SDave Chinner 		if ((args->op_flags & XFS_DA_OP_JUSTCHECK) || args->total == 0)
18722451337dSDave Chinner 			return -ENOSPC;
187330f712c9SDave Chinner 
187430f712c9SDave Chinner 		/*
187530f712c9SDave Chinner 		 * Allocate and initialize the new data block.
187630f712c9SDave Chinner 		 */
187730f712c9SDave Chinner 		if (unlikely((error = xfs_dir2_grow_inode(args,
187830f712c9SDave Chinner 							 XFS_DIR2_DATA_SPACE,
187930f712c9SDave Chinner 							 &dbno)) ||
188030f712c9SDave Chinner 		    (error = xfs_dir3_data_init(args, dbno, &dbp))))
188130f712c9SDave Chinner 			return error;
188230f712c9SDave Chinner 
188330f712c9SDave Chinner 		/*
188430f712c9SDave Chinner 		 * If (somehow) we have a freespace block, get rid of it.
188530f712c9SDave Chinner 		 */
188630f712c9SDave Chinner 		if (fbp)
188730f712c9SDave Chinner 			xfs_trans_brelse(tp, fbp);
188830f712c9SDave Chinner 		if (fblk && fblk->bp)
188930f712c9SDave Chinner 			fblk->bp = NULL;
189030f712c9SDave Chinner 
189130f712c9SDave Chinner 		/*
189230f712c9SDave Chinner 		 * Get the freespace block corresponding to the data block
189330f712c9SDave Chinner 		 * that was just allocated.
189430f712c9SDave Chinner 		 */
189530f712c9SDave Chinner 		fbno = dp->d_ops->db_to_fdb(args->geo, dbno);
189630f712c9SDave Chinner 		error = xfs_dir2_free_try_read(tp, dp,
189730f712c9SDave Chinner 				       xfs_dir2_db_to_da(args->geo, fbno),
189830f712c9SDave Chinner 				       &fbp);
189930f712c9SDave Chinner 		if (error)
190030f712c9SDave Chinner 			return error;
190130f712c9SDave Chinner 
190230f712c9SDave Chinner 		/*
190330f712c9SDave Chinner 		 * If there wasn't a freespace block, the read will
190430f712c9SDave Chinner 		 * return a NULL fbp.  Allocate and initialize a new one.
190530f712c9SDave Chinner 		 */
190630f712c9SDave Chinner 		if (!fbp) {
190730f712c9SDave Chinner 			error = xfs_dir2_grow_inode(args, XFS_DIR2_FREE_SPACE,
190830f712c9SDave Chinner 						    &fbno);
190930f712c9SDave Chinner 			if (error)
191030f712c9SDave Chinner 				return error;
191130f712c9SDave Chinner 
191230f712c9SDave Chinner 			if (dp->d_ops->db_to_fdb(args->geo, dbno) != fbno) {
191330f712c9SDave Chinner 				xfs_alert(mp,
1914f41febd2SJoe Perches "%s: dir ino %llu needed freesp block %lld for data block %lld, got %lld ifbno %llu lastfbno %d",
191530f712c9SDave Chinner 					__func__, (unsigned long long)dp->i_ino,
191630f712c9SDave Chinner 					(long long)dp->d_ops->db_to_fdb(
191730f712c9SDave Chinner 								args->geo, dbno),
191830f712c9SDave Chinner 					(long long)dbno, (long long)fbno,
191930f712c9SDave Chinner 					(unsigned long long)ifbno, lastfbno);
192030f712c9SDave Chinner 				if (fblk) {
192130f712c9SDave Chinner 					xfs_alert(mp,
192230f712c9SDave Chinner 				" fblk 0x%p blkno %llu index %d magic 0x%x",
192330f712c9SDave Chinner 						fblk,
192430f712c9SDave Chinner 						(unsigned long long)fblk->blkno,
192530f712c9SDave Chinner 						fblk->index,
192630f712c9SDave Chinner 						fblk->magic);
192730f712c9SDave Chinner 				} else {
192830f712c9SDave Chinner 					xfs_alert(mp, " ... fblk is NULL");
192930f712c9SDave Chinner 				}
193030f712c9SDave Chinner 				XFS_ERROR_REPORT("xfs_dir2_node_addname_int",
193130f712c9SDave Chinner 						 XFS_ERRLEVEL_LOW, mp);
19322451337dSDave Chinner 				return -EFSCORRUPTED;
193330f712c9SDave Chinner 			}
193430f712c9SDave Chinner 
193530f712c9SDave Chinner 			/*
193630f712c9SDave Chinner 			 * Get a buffer for the new block.
193730f712c9SDave Chinner 			 */
193830f712c9SDave Chinner 			error = xfs_dir3_free_get_buf(args, fbno, &fbp);
193930f712c9SDave Chinner 			if (error)
194030f712c9SDave Chinner 				return error;
194130f712c9SDave Chinner 			free = fbp->b_addr;
194230f712c9SDave Chinner 			bests = dp->d_ops->free_bests_p(free);
194330f712c9SDave Chinner 			dp->d_ops->free_hdr_from_disk(&freehdr, free);
194430f712c9SDave Chinner 
194530f712c9SDave Chinner 			/*
194630f712c9SDave Chinner 			 * Remember the first slot as our empty slot.
194730f712c9SDave Chinner 			 */
194830f712c9SDave Chinner 			freehdr.firstdb =
194930f712c9SDave Chinner 				(fbno - xfs_dir2_byte_to_db(args->geo,
195030f712c9SDave Chinner 							XFS_DIR2_FREE_OFFSET)) *
195130f712c9SDave Chinner 					dp->d_ops->free_max_bests(args->geo);
195230f712c9SDave Chinner 		} else {
195330f712c9SDave Chinner 			free = fbp->b_addr;
195430f712c9SDave Chinner 			bests = dp->d_ops->free_bests_p(free);
195530f712c9SDave Chinner 			dp->d_ops->free_hdr_from_disk(&freehdr, free);
195630f712c9SDave Chinner 		}
195730f712c9SDave Chinner 
195830f712c9SDave Chinner 		/*
195930f712c9SDave Chinner 		 * Set the freespace block index from the data block number.
196030f712c9SDave Chinner 		 */
196130f712c9SDave Chinner 		findex = dp->d_ops->db_to_fdindex(args->geo, dbno);
196230f712c9SDave Chinner 		/*
196330f712c9SDave Chinner 		 * If it's after the end of the current entries in the
196430f712c9SDave Chinner 		 * freespace block, extend that table.
196530f712c9SDave Chinner 		 */
196630f712c9SDave Chinner 		if (findex >= freehdr.nvalid) {
196730f712c9SDave Chinner 			ASSERT(findex < dp->d_ops->free_max_bests(args->geo));
196830f712c9SDave Chinner 			freehdr.nvalid = findex + 1;
196930f712c9SDave Chinner 			/*
197030f712c9SDave Chinner 			 * Tag new entry so nused will go up.
197130f712c9SDave Chinner 			 */
197230f712c9SDave Chinner 			bests[findex] = cpu_to_be16(NULLDATAOFF);
197330f712c9SDave Chinner 		}
197430f712c9SDave Chinner 		/*
197530f712c9SDave Chinner 		 * If this entry was for an empty data block
197630f712c9SDave Chinner 		 * (this should always be true) then update the header.
197730f712c9SDave Chinner 		 */
197830f712c9SDave Chinner 		if (bests[findex] == cpu_to_be16(NULLDATAOFF)) {
197930f712c9SDave Chinner 			freehdr.nused++;
198030f712c9SDave Chinner 			dp->d_ops->free_hdr_to_disk(fbp->b_addr, &freehdr);
198130f712c9SDave Chinner 			xfs_dir2_free_log_header(args, fbp);
198230f712c9SDave Chinner 		}
198330f712c9SDave Chinner 		/*
198430f712c9SDave Chinner 		 * Update the real value in the table.
198530f712c9SDave Chinner 		 * We haven't allocated the data entry yet so this will
198630f712c9SDave Chinner 		 * change again.
198730f712c9SDave Chinner 		 */
198830f712c9SDave Chinner 		hdr = dbp->b_addr;
198930f712c9SDave Chinner 		bf = dp->d_ops->data_bestfree_p(hdr);
199030f712c9SDave Chinner 		bests[findex] = bf[0].length;
199130f712c9SDave Chinner 		logfree = 1;
199230f712c9SDave Chinner 	}
199330f712c9SDave Chinner 	/*
199430f712c9SDave Chinner 	 * We had a data block so we don't have to make a new one.
199530f712c9SDave Chinner 	 */
199630f712c9SDave Chinner 	else {
199730f712c9SDave Chinner 		/*
199830f712c9SDave Chinner 		 * If just checking, we succeeded.
199930f712c9SDave Chinner 		 */
200030f712c9SDave Chinner 		if (args->op_flags & XFS_DA_OP_JUSTCHECK)
200130f712c9SDave Chinner 			return 0;
200230f712c9SDave Chinner 
200330f712c9SDave Chinner 		/*
200430f712c9SDave Chinner 		 * Read the data block in.
200530f712c9SDave Chinner 		 */
200630f712c9SDave Chinner 		error = xfs_dir3_data_read(tp, dp,
200730f712c9SDave Chinner 					   xfs_dir2_db_to_da(args->geo, dbno),
200830f712c9SDave Chinner 					   -1, &dbp);
200930f712c9SDave Chinner 		if (error)
201030f712c9SDave Chinner 			return error;
201130f712c9SDave Chinner 		hdr = dbp->b_addr;
201230f712c9SDave Chinner 		bf = dp->d_ops->data_bestfree_p(hdr);
201330f712c9SDave Chinner 		logfree = 0;
201430f712c9SDave Chinner 	}
201530f712c9SDave Chinner 	ASSERT(be16_to_cpu(bf[0].length) >= length);
201630f712c9SDave Chinner 	/*
201730f712c9SDave Chinner 	 * Point to the existing unused space.
201830f712c9SDave Chinner 	 */
201930f712c9SDave Chinner 	dup = (xfs_dir2_data_unused_t *)
202030f712c9SDave Chinner 	      ((char *)hdr + be16_to_cpu(bf[0].offset));
202130f712c9SDave Chinner 	needscan = needlog = 0;
202230f712c9SDave Chinner 	/*
202330f712c9SDave Chinner 	 * Mark the first part of the unused space, inuse for us.
202430f712c9SDave Chinner 	 */
202530f712c9SDave Chinner 	xfs_dir2_data_use_free(args, dbp, dup,
202630f712c9SDave Chinner 		(xfs_dir2_data_aoff_t)((char *)dup - (char *)hdr), length,
202730f712c9SDave Chinner 		&needlog, &needscan);
202830f712c9SDave Chinner 	/*
202930f712c9SDave Chinner 	 * Fill in the new entry and log it.
203030f712c9SDave Chinner 	 */
203130f712c9SDave Chinner 	dep = (xfs_dir2_data_entry_t *)dup;
203230f712c9SDave Chinner 	dep->inumber = cpu_to_be64(args->inumber);
203330f712c9SDave Chinner 	dep->namelen = args->namelen;
203430f712c9SDave Chinner 	memcpy(dep->name, args->name, dep->namelen);
203530f712c9SDave Chinner 	dp->d_ops->data_put_ftype(dep, args->filetype);
203630f712c9SDave Chinner 	tagp = dp->d_ops->data_entry_tag_p(dep);
203730f712c9SDave Chinner 	*tagp = cpu_to_be16((char *)dep - (char *)hdr);
203830f712c9SDave Chinner 	xfs_dir2_data_log_entry(args, dbp, dep);
203930f712c9SDave Chinner 	/*
204030f712c9SDave Chinner 	 * Rescan the block for bestfree if needed.
204130f712c9SDave Chinner 	 */
204230f712c9SDave Chinner 	if (needscan)
204330f712c9SDave Chinner 		xfs_dir2_data_freescan(dp, hdr, &needlog);
204430f712c9SDave Chinner 	/*
204530f712c9SDave Chinner 	 * Log the data block header if needed.
204630f712c9SDave Chinner 	 */
204730f712c9SDave Chinner 	if (needlog)
204830f712c9SDave Chinner 		xfs_dir2_data_log_header(args, dbp);
204930f712c9SDave Chinner 	/*
205030f712c9SDave Chinner 	 * If the freespace entry is now wrong, update it.
205130f712c9SDave Chinner 	 */
205230f712c9SDave Chinner 	bests = dp->d_ops->free_bests_p(free); /* gcc is so stupid */
205330f712c9SDave Chinner 	if (be16_to_cpu(bests[findex]) != be16_to_cpu(bf[0].length)) {
205430f712c9SDave Chinner 		bests[findex] = bf[0].length;
205530f712c9SDave Chinner 		logfree = 1;
205630f712c9SDave Chinner 	}
205730f712c9SDave Chinner 	/*
205830f712c9SDave Chinner 	 * Log the freespace entry if needed.
205930f712c9SDave Chinner 	 */
206030f712c9SDave Chinner 	if (logfree)
206130f712c9SDave Chinner 		xfs_dir2_free_log_bests(args, fbp, findex, findex);
206230f712c9SDave Chinner 	/*
206330f712c9SDave Chinner 	 * Return the data block and offset in args, then drop the data block.
206430f712c9SDave Chinner 	 */
206530f712c9SDave Chinner 	args->blkno = (xfs_dablk_t)dbno;
206630f712c9SDave Chinner 	args->index = be16_to_cpu(*tagp);
206730f712c9SDave Chinner 	return 0;
206830f712c9SDave Chinner }
206930f712c9SDave Chinner 
207030f712c9SDave Chinner /*
207130f712c9SDave Chinner  * Lookup an entry in a node-format directory.
207230f712c9SDave Chinner  * All the real work happens in xfs_da3_node_lookup_int.
207330f712c9SDave Chinner  * The only real output is the inode number of the entry.
207430f712c9SDave Chinner  */
207530f712c9SDave Chinner int						/* error */
207630f712c9SDave Chinner xfs_dir2_node_lookup(
207730f712c9SDave Chinner 	xfs_da_args_t	*args)			/* operation arguments */
207830f712c9SDave Chinner {
207930f712c9SDave Chinner 	int		error;			/* error return value */
208030f712c9SDave Chinner 	int		i;			/* btree level */
208130f712c9SDave Chinner 	int		rval;			/* operation return value */
208230f712c9SDave Chinner 	xfs_da_state_t	*state;			/* btree cursor */
208330f712c9SDave Chinner 
208430f712c9SDave Chinner 	trace_xfs_dir2_node_lookup(args);
208530f712c9SDave Chinner 
208630f712c9SDave Chinner 	/*
208730f712c9SDave Chinner 	 * Allocate and initialize the btree cursor.
208830f712c9SDave Chinner 	 */
208930f712c9SDave Chinner 	state = xfs_da_state_alloc();
209030f712c9SDave Chinner 	state->args = args;
209130f712c9SDave Chinner 	state->mp = args->dp->i_mount;
209230f712c9SDave Chinner 	/*
209330f712c9SDave Chinner 	 * Fill in the path to the entry in the cursor.
209430f712c9SDave Chinner 	 */
209530f712c9SDave Chinner 	error = xfs_da3_node_lookup_int(state, &rval);
209630f712c9SDave Chinner 	if (error)
209730f712c9SDave Chinner 		rval = error;
20982451337dSDave Chinner 	else if (rval == -ENOENT && args->cmpresult == XFS_CMP_CASE) {
20992451337dSDave Chinner 		/* If a CI match, dup the actual name and return -EEXIST */
210030f712c9SDave Chinner 		xfs_dir2_data_entry_t	*dep;
210130f712c9SDave Chinner 
210230f712c9SDave Chinner 		dep = (xfs_dir2_data_entry_t *)
210330f712c9SDave Chinner 			((char *)state->extrablk.bp->b_addr +
210430f712c9SDave Chinner 						 state->extrablk.index);
210530f712c9SDave Chinner 		rval = xfs_dir_cilookup_result(args, dep->name, dep->namelen);
210630f712c9SDave Chinner 	}
210730f712c9SDave Chinner 	/*
210830f712c9SDave Chinner 	 * Release the btree blocks and leaf block.
210930f712c9SDave Chinner 	 */
211030f712c9SDave Chinner 	for (i = 0; i < state->path.active; i++) {
211130f712c9SDave Chinner 		xfs_trans_brelse(args->trans, state->path.blk[i].bp);
211230f712c9SDave Chinner 		state->path.blk[i].bp = NULL;
211330f712c9SDave Chinner 	}
211430f712c9SDave Chinner 	/*
211530f712c9SDave Chinner 	 * Release the data block if we have it.
211630f712c9SDave Chinner 	 */
211730f712c9SDave Chinner 	if (state->extravalid && state->extrablk.bp) {
211830f712c9SDave Chinner 		xfs_trans_brelse(args->trans, state->extrablk.bp);
211930f712c9SDave Chinner 		state->extrablk.bp = NULL;
212030f712c9SDave Chinner 	}
212130f712c9SDave Chinner 	xfs_da_state_free(state);
212230f712c9SDave Chinner 	return rval;
212330f712c9SDave Chinner }
212430f712c9SDave Chinner 
212530f712c9SDave Chinner /*
212630f712c9SDave Chinner  * Remove an entry from a node-format directory.
212730f712c9SDave Chinner  */
212830f712c9SDave Chinner int						/* error */
212930f712c9SDave Chinner xfs_dir2_node_removename(
213030f712c9SDave Chinner 	struct xfs_da_args	*args)		/* operation arguments */
213130f712c9SDave Chinner {
213230f712c9SDave Chinner 	struct xfs_da_state_blk	*blk;		/* leaf block */
213330f712c9SDave Chinner 	int			error;		/* error return value */
213430f712c9SDave Chinner 	int			rval;		/* operation return value */
213530f712c9SDave Chinner 	struct xfs_da_state	*state;		/* btree cursor */
213630f712c9SDave Chinner 
213730f712c9SDave Chinner 	trace_xfs_dir2_node_removename(args);
213830f712c9SDave Chinner 
213930f712c9SDave Chinner 	/*
214030f712c9SDave Chinner 	 * Allocate and initialize the btree cursor.
214130f712c9SDave Chinner 	 */
214230f712c9SDave Chinner 	state = xfs_da_state_alloc();
214330f712c9SDave Chinner 	state->args = args;
214430f712c9SDave Chinner 	state->mp = args->dp->i_mount;
214530f712c9SDave Chinner 
214630f712c9SDave Chinner 	/* Look up the entry we're deleting, set up the cursor. */
214730f712c9SDave Chinner 	error = xfs_da3_node_lookup_int(state, &rval);
214830f712c9SDave Chinner 	if (error)
214930f712c9SDave Chinner 		goto out_free;
215030f712c9SDave Chinner 
215130f712c9SDave Chinner 	/* Didn't find it, upper layer screwed up. */
21522451337dSDave Chinner 	if (rval != -EEXIST) {
215330f712c9SDave Chinner 		error = rval;
215430f712c9SDave Chinner 		goto out_free;
215530f712c9SDave Chinner 	}
215630f712c9SDave Chinner 
215730f712c9SDave Chinner 	blk = &state->path.blk[state->path.active - 1];
215830f712c9SDave Chinner 	ASSERT(blk->magic == XFS_DIR2_LEAFN_MAGIC);
215930f712c9SDave Chinner 	ASSERT(state->extravalid);
216030f712c9SDave Chinner 	/*
216130f712c9SDave Chinner 	 * Remove the leaf and data entries.
216230f712c9SDave Chinner 	 * Extrablk refers to the data block.
216330f712c9SDave Chinner 	 */
216430f712c9SDave Chinner 	error = xfs_dir2_leafn_remove(args, blk->bp, blk->index,
216530f712c9SDave Chinner 		&state->extrablk, &rval);
216630f712c9SDave Chinner 	if (error)
216730f712c9SDave Chinner 		goto out_free;
216830f712c9SDave Chinner 	/*
216930f712c9SDave Chinner 	 * Fix the hash values up the btree.
217030f712c9SDave Chinner 	 */
217130f712c9SDave Chinner 	xfs_da3_fixhashpath(state, &state->path);
217230f712c9SDave Chinner 	/*
217330f712c9SDave Chinner 	 * If we need to join leaf blocks, do it.
217430f712c9SDave Chinner 	 */
217530f712c9SDave Chinner 	if (rval && state->path.active > 1)
217630f712c9SDave Chinner 		error = xfs_da3_join(state);
217730f712c9SDave Chinner 	/*
217830f712c9SDave Chinner 	 * If no errors so far, try conversion to leaf format.
217930f712c9SDave Chinner 	 */
218030f712c9SDave Chinner 	if (!error)
218130f712c9SDave Chinner 		error = xfs_dir2_node_to_leaf(state);
218230f712c9SDave Chinner out_free:
218330f712c9SDave Chinner 	xfs_da_state_free(state);
218430f712c9SDave Chinner 	return error;
218530f712c9SDave Chinner }
218630f712c9SDave Chinner 
218730f712c9SDave Chinner /*
218830f712c9SDave Chinner  * Replace an entry's inode number in a node-format directory.
218930f712c9SDave Chinner  */
219030f712c9SDave Chinner int						/* error */
219130f712c9SDave Chinner xfs_dir2_node_replace(
219230f712c9SDave Chinner 	xfs_da_args_t		*args)		/* operation arguments */
219330f712c9SDave Chinner {
219430f712c9SDave Chinner 	xfs_da_state_blk_t	*blk;		/* leaf block */
219530f712c9SDave Chinner 	xfs_dir2_data_hdr_t	*hdr;		/* data block header */
219630f712c9SDave Chinner 	xfs_dir2_data_entry_t	*dep;		/* data entry changed */
219730f712c9SDave Chinner 	int			error;		/* error return value */
219830f712c9SDave Chinner 	int			i;		/* btree level */
219930f712c9SDave Chinner 	xfs_ino_t		inum;		/* new inode number */
220003754234SJan Kara 	int			ftype;		/* new file type */
220130f712c9SDave Chinner 	xfs_dir2_leaf_t		*leaf;		/* leaf structure */
220230f712c9SDave Chinner 	xfs_dir2_leaf_entry_t	*lep;		/* leaf entry being changed */
220330f712c9SDave Chinner 	int			rval;		/* internal return value */
220430f712c9SDave Chinner 	xfs_da_state_t		*state;		/* btree cursor */
220530f712c9SDave Chinner 
220630f712c9SDave Chinner 	trace_xfs_dir2_node_replace(args);
220730f712c9SDave Chinner 
220830f712c9SDave Chinner 	/*
220930f712c9SDave Chinner 	 * Allocate and initialize the btree cursor.
221030f712c9SDave Chinner 	 */
221130f712c9SDave Chinner 	state = xfs_da_state_alloc();
221230f712c9SDave Chinner 	state->args = args;
221330f712c9SDave Chinner 	state->mp = args->dp->i_mount;
221403754234SJan Kara 
221503754234SJan Kara 	/*
221603754234SJan Kara 	 * We have to save new inode number and ftype since
221703754234SJan Kara 	 * xfs_da3_node_lookup_int() is going to overwrite them
221803754234SJan Kara 	 */
221930f712c9SDave Chinner 	inum = args->inumber;
222003754234SJan Kara 	ftype = args->filetype;
222103754234SJan Kara 
222230f712c9SDave Chinner 	/*
222330f712c9SDave Chinner 	 * Lookup the entry to change in the btree.
222430f712c9SDave Chinner 	 */
222530f712c9SDave Chinner 	error = xfs_da3_node_lookup_int(state, &rval);
222630f712c9SDave Chinner 	if (error) {
222730f712c9SDave Chinner 		rval = error;
222830f712c9SDave Chinner 	}
222930f712c9SDave Chinner 	/*
223030f712c9SDave Chinner 	 * It should be found, since the vnodeops layer has looked it up
223130f712c9SDave Chinner 	 * and locked it.  But paranoia is good.
223230f712c9SDave Chinner 	 */
22332451337dSDave Chinner 	if (rval == -EEXIST) {
223430f712c9SDave Chinner 		struct xfs_dir2_leaf_entry *ents;
223530f712c9SDave Chinner 		/*
223630f712c9SDave Chinner 		 * Find the leaf entry.
223730f712c9SDave Chinner 		 */
223830f712c9SDave Chinner 		blk = &state->path.blk[state->path.active - 1];
223930f712c9SDave Chinner 		ASSERT(blk->magic == XFS_DIR2_LEAFN_MAGIC);
224030f712c9SDave Chinner 		leaf = blk->bp->b_addr;
224130f712c9SDave Chinner 		ents = args->dp->d_ops->leaf_ents_p(leaf);
224230f712c9SDave Chinner 		lep = &ents[blk->index];
224330f712c9SDave Chinner 		ASSERT(state->extravalid);
224430f712c9SDave Chinner 		/*
224530f712c9SDave Chinner 		 * Point to the data entry.
224630f712c9SDave Chinner 		 */
224730f712c9SDave Chinner 		hdr = state->extrablk.bp->b_addr;
224830f712c9SDave Chinner 		ASSERT(hdr->magic == cpu_to_be32(XFS_DIR2_DATA_MAGIC) ||
224930f712c9SDave Chinner 		       hdr->magic == cpu_to_be32(XFS_DIR3_DATA_MAGIC));
225030f712c9SDave Chinner 		dep = (xfs_dir2_data_entry_t *)
225130f712c9SDave Chinner 		      ((char *)hdr +
225230f712c9SDave Chinner 		       xfs_dir2_dataptr_to_off(args->geo,
225330f712c9SDave Chinner 					       be32_to_cpu(lep->address)));
225430f712c9SDave Chinner 		ASSERT(inum != be64_to_cpu(dep->inumber));
225530f712c9SDave Chinner 		/*
225630f712c9SDave Chinner 		 * Fill in the new inode number and log the entry.
225730f712c9SDave Chinner 		 */
225830f712c9SDave Chinner 		dep->inumber = cpu_to_be64(inum);
225903754234SJan Kara 		args->dp->d_ops->data_put_ftype(dep, ftype);
226030f712c9SDave Chinner 		xfs_dir2_data_log_entry(args, state->extrablk.bp, dep);
226130f712c9SDave Chinner 		rval = 0;
226230f712c9SDave Chinner 	}
226330f712c9SDave Chinner 	/*
226430f712c9SDave Chinner 	 * Didn't find it, and we're holding a data block.  Drop it.
226530f712c9SDave Chinner 	 */
226630f712c9SDave Chinner 	else if (state->extravalid) {
226730f712c9SDave Chinner 		xfs_trans_brelse(args->trans, state->extrablk.bp);
226830f712c9SDave Chinner 		state->extrablk.bp = NULL;
226930f712c9SDave Chinner 	}
227030f712c9SDave Chinner 	/*
227130f712c9SDave Chinner 	 * Release all the buffers in the cursor.
227230f712c9SDave Chinner 	 */
227330f712c9SDave Chinner 	for (i = 0; i < state->path.active; i++) {
227430f712c9SDave Chinner 		xfs_trans_brelse(args->trans, state->path.blk[i].bp);
227530f712c9SDave Chinner 		state->path.blk[i].bp = NULL;
227630f712c9SDave Chinner 	}
227730f712c9SDave Chinner 	xfs_da_state_free(state);
227830f712c9SDave Chinner 	return rval;
227930f712c9SDave Chinner }
228030f712c9SDave Chinner 
228130f712c9SDave Chinner /*
228230f712c9SDave Chinner  * Trim off a trailing empty freespace block.
228330f712c9SDave Chinner  * Return (in rvalp) 1 if we did it, 0 if not.
228430f712c9SDave Chinner  */
228530f712c9SDave Chinner int						/* error */
228630f712c9SDave Chinner xfs_dir2_node_trim_free(
228730f712c9SDave Chinner 	xfs_da_args_t		*args,		/* operation arguments */
228830f712c9SDave Chinner 	xfs_fileoff_t		fo,		/* free block number */
228930f712c9SDave Chinner 	int			*rvalp)		/* out: did something */
229030f712c9SDave Chinner {
229130f712c9SDave Chinner 	struct xfs_buf		*bp;		/* freespace buffer */
229230f712c9SDave Chinner 	xfs_inode_t		*dp;		/* incore directory inode */
229330f712c9SDave Chinner 	int			error;		/* error return code */
229430f712c9SDave Chinner 	xfs_dir2_free_t		*free;		/* freespace structure */
229530f712c9SDave Chinner 	xfs_trans_t		*tp;		/* transaction pointer */
229630f712c9SDave Chinner 	struct xfs_dir3_icfree_hdr freehdr;
229730f712c9SDave Chinner 
229830f712c9SDave Chinner 	dp = args->dp;
229930f712c9SDave Chinner 	tp = args->trans;
2300355cced4SChristoph Hellwig 
2301355cced4SChristoph Hellwig 	*rvalp = 0;
2302355cced4SChristoph Hellwig 
230330f712c9SDave Chinner 	/*
230430f712c9SDave Chinner 	 * Read the freespace block.
230530f712c9SDave Chinner 	 */
230630f712c9SDave Chinner 	error = xfs_dir2_free_try_read(tp, dp, fo, &bp);
230730f712c9SDave Chinner 	if (error)
230830f712c9SDave Chinner 		return error;
230930f712c9SDave Chinner 	/*
231030f712c9SDave Chinner 	 * There can be holes in freespace.  If fo is a hole, there's
231130f712c9SDave Chinner 	 * nothing to do.
231230f712c9SDave Chinner 	 */
231330f712c9SDave Chinner 	if (!bp)
231430f712c9SDave Chinner 		return 0;
231530f712c9SDave Chinner 	free = bp->b_addr;
231630f712c9SDave Chinner 	dp->d_ops->free_hdr_from_disk(&freehdr, free);
231730f712c9SDave Chinner 
231830f712c9SDave Chinner 	/*
231930f712c9SDave Chinner 	 * If there are used entries, there's nothing to do.
232030f712c9SDave Chinner 	 */
232130f712c9SDave Chinner 	if (freehdr.nused > 0) {
232230f712c9SDave Chinner 		xfs_trans_brelse(tp, bp);
232330f712c9SDave Chinner 		return 0;
232430f712c9SDave Chinner 	}
232530f712c9SDave Chinner 	/*
232630f712c9SDave Chinner 	 * Blow the block away.
232730f712c9SDave Chinner 	 */
232830f712c9SDave Chinner 	error = xfs_dir2_shrink_inode(args,
232930f712c9SDave Chinner 			xfs_dir2_da_to_db(args->geo, (xfs_dablk_t)fo), bp);
233030f712c9SDave Chinner 	if (error) {
233130f712c9SDave Chinner 		/*
233230f712c9SDave Chinner 		 * Can't fail with ENOSPC since that only happens with no
233330f712c9SDave Chinner 		 * space reservation, when breaking up an extent into two
233430f712c9SDave Chinner 		 * pieces.  This is the last block of an extent.
233530f712c9SDave Chinner 		 */
23362451337dSDave Chinner 		ASSERT(error != -ENOSPC);
233730f712c9SDave Chinner 		xfs_trans_brelse(tp, bp);
233830f712c9SDave Chinner 		return error;
233930f712c9SDave Chinner 	}
234030f712c9SDave Chinner 	/*
234130f712c9SDave Chinner 	 * Return that we succeeded.
234230f712c9SDave Chinner 	 */
234330f712c9SDave Chinner 	*rvalp = 1;
234430f712c9SDave Chinner 	return 0;
234530f712c9SDave Chinner }
2346