xref: /openbmc/linux/fs/xfs/xfs_itable.c (revision cd57e594adc624dd9ee4c0ded3949da21ec24b2f)
11da177e4SLinus Torvalds /*
27b718769SNathan Scott  * Copyright (c) 2000-2002,2005 Silicon Graphics, Inc.
37b718769SNathan Scott  * All Rights Reserved.
41da177e4SLinus Torvalds  *
57b718769SNathan Scott  * This program is free software; you can redistribute it and/or
67b718769SNathan Scott  * modify it under the terms of the GNU General Public License as
71da177e4SLinus Torvalds  * published by the Free Software Foundation.
81da177e4SLinus Torvalds  *
97b718769SNathan Scott  * This program is distributed in the hope that it would be useful,
107b718769SNathan Scott  * but WITHOUT ANY WARRANTY; without even the implied warranty of
117b718769SNathan Scott  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
127b718769SNathan Scott  * GNU General Public License for more details.
131da177e4SLinus Torvalds  *
147b718769SNathan Scott  * You should have received a copy of the GNU General Public License
157b718769SNathan Scott  * along with this program; if not, write the Free Software Foundation,
167b718769SNathan Scott  * Inc.,  51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
171da177e4SLinus Torvalds  */
181da177e4SLinus Torvalds #include "xfs.h"
19a844f451SNathan Scott #include "xfs_fs.h"
201da177e4SLinus Torvalds #include "xfs_types.h"
21a844f451SNathan Scott #include "xfs_bit.h"
221da177e4SLinus Torvalds #include "xfs_log.h"
23a844f451SNathan Scott #include "xfs_inum.h"
241da177e4SLinus Torvalds #include "xfs_trans.h"
251da177e4SLinus Torvalds #include "xfs_sb.h"
26a844f451SNathan Scott #include "xfs_ag.h"
271da177e4SLinus Torvalds #include "xfs_dir2.h"
281da177e4SLinus Torvalds #include "xfs_dmapi.h"
291da177e4SLinus Torvalds #include "xfs_mount.h"
301da177e4SLinus Torvalds #include "xfs_bmap_btree.h"
31a844f451SNathan Scott #include "xfs_alloc_btree.h"
321da177e4SLinus Torvalds #include "xfs_ialloc_btree.h"
331da177e4SLinus Torvalds #include "xfs_dir2_sf.h"
34a844f451SNathan Scott #include "xfs_attr_sf.h"
351da177e4SLinus Torvalds #include "xfs_dinode.h"
361da177e4SLinus Torvalds #include "xfs_inode.h"
371da177e4SLinus Torvalds #include "xfs_ialloc.h"
381da177e4SLinus Torvalds #include "xfs_itable.h"
391da177e4SLinus Torvalds #include "xfs_error.h"
40a844f451SNathan Scott #include "xfs_btree.h"
411da177e4SLinus Torvalds 
426f1f2168SVlad Apostolov int
436f1f2168SVlad Apostolov xfs_internal_inum(
446f1f2168SVlad Apostolov 	xfs_mount_t	*mp,
456f1f2168SVlad Apostolov 	xfs_ino_t	ino)
466f1f2168SVlad Apostolov {
476f1f2168SVlad Apostolov 	return (ino == mp->m_sb.sb_rbmino || ino == mp->m_sb.sb_rsumino ||
486f1f2168SVlad Apostolov 		(XFS_SB_VERSION_HASQUOTA(&mp->m_sb) &&
496f1f2168SVlad Apostolov 		 (ino == mp->m_sb.sb_uquotino || ino == mp->m_sb.sb_gquotino)));
506f1f2168SVlad Apostolov }
516f1f2168SVlad Apostolov 
521da177e4SLinus Torvalds STATIC int
531da177e4SLinus Torvalds xfs_bulkstat_one_iget(
541da177e4SLinus Torvalds 	xfs_mount_t	*mp,		/* mount point for filesystem */
551da177e4SLinus Torvalds 	xfs_ino_t	ino,		/* inode number to get data for */
561da177e4SLinus Torvalds 	xfs_daddr_t	bno,		/* starting bno of inode cluster */
571da177e4SLinus Torvalds 	xfs_bstat_t	*buf,		/* return buffer */
581da177e4SLinus Torvalds 	int		*stat)		/* BULKSTAT_RV_... */
591da177e4SLinus Torvalds {
60347d1c01SChristoph Hellwig 	xfs_icdinode_t	*dic;	/* dinode core info pointer */
611da177e4SLinus Torvalds 	xfs_inode_t	*ip;		/* incore inode pointer */
6267fcaa73SNathan Scott 	bhv_vnode_t	*vp;
631da177e4SLinus Torvalds 	int		error;
641da177e4SLinus Torvalds 
65745b1f47SNathan Scott 	error = xfs_iget(mp, NULL, ino,
66745b1f47SNathan Scott 			 XFS_IGET_BULKSTAT, XFS_ILOCK_SHARED, &ip, bno);
671da177e4SLinus Torvalds 	if (error) {
681da177e4SLinus Torvalds 		*stat = BULKSTAT_RV_NOTHING;
691da177e4SLinus Torvalds 		return error;
701da177e4SLinus Torvalds 	}
711da177e4SLinus Torvalds 
721da177e4SLinus Torvalds 	ASSERT(ip != NULL);
731da177e4SLinus Torvalds 	ASSERT(ip->i_blkno != (xfs_daddr_t)0);
741da177e4SLinus Torvalds 	if (ip->i_d.di_mode == 0) {
751da177e4SLinus Torvalds 		*stat = BULKSTAT_RV_NOTHING;
761da177e4SLinus Torvalds 		error = XFS_ERROR(ENOENT);
771da177e4SLinus Torvalds 		goto out_iput;
781da177e4SLinus Torvalds 	}
791da177e4SLinus Torvalds 
8042fe2b1fSChristoph Hellwig 	vp = XFS_ITOV(ip);
811da177e4SLinus Torvalds 	dic = &ip->i_d;
821da177e4SLinus Torvalds 
831da177e4SLinus Torvalds 	/* xfs_iget returns the following without needing
841da177e4SLinus Torvalds 	 * further change.
851da177e4SLinus Torvalds 	 */
861da177e4SLinus Torvalds 	buf->bs_nlink = dic->di_nlink;
871da177e4SLinus Torvalds 	buf->bs_projid = dic->di_projid;
881da177e4SLinus Torvalds 	buf->bs_ino = ino;
891da177e4SLinus Torvalds 	buf->bs_mode = dic->di_mode;
901da177e4SLinus Torvalds 	buf->bs_uid = dic->di_uid;
911da177e4SLinus Torvalds 	buf->bs_gid = dic->di_gid;
921da177e4SLinus Torvalds 	buf->bs_size = dic->di_size;
93ca5ccbf9SNathan Scott 	vn_atime_to_bstime(vp, &buf->bs_atime);
941da177e4SLinus Torvalds 	buf->bs_mtime.tv_sec = dic->di_mtime.t_sec;
951da177e4SLinus Torvalds 	buf->bs_mtime.tv_nsec = dic->di_mtime.t_nsec;
961da177e4SLinus Torvalds 	buf->bs_ctime.tv_sec = dic->di_ctime.t_sec;
971da177e4SLinus Torvalds 	buf->bs_ctime.tv_nsec = dic->di_ctime.t_nsec;
981da177e4SLinus Torvalds 	buf->bs_xflags = xfs_ip2xflags(ip);
991da177e4SLinus Torvalds 	buf->bs_extsize = dic->di_extsize << mp->m_sb.sb_blocklog;
1001da177e4SLinus Torvalds 	buf->bs_extents = dic->di_nextents;
1011da177e4SLinus Torvalds 	buf->bs_gen = dic->di_gen;
1021da177e4SLinus Torvalds 	memset(buf->bs_pad, 0, sizeof(buf->bs_pad));
1031da177e4SLinus Torvalds 	buf->bs_dmevmask = dic->di_dmevmask;
1041da177e4SLinus Torvalds 	buf->bs_dmstate = dic->di_dmstate;
1051da177e4SLinus Torvalds 	buf->bs_aextents = dic->di_anextents;
1061da177e4SLinus Torvalds 
1071da177e4SLinus Torvalds 	switch (dic->di_format) {
1081da177e4SLinus Torvalds 	case XFS_DINODE_FMT_DEV:
1091da177e4SLinus Torvalds 		buf->bs_rdev = ip->i_df.if_u2.if_rdev;
1101da177e4SLinus Torvalds 		buf->bs_blksize = BLKDEV_IOSIZE;
1111da177e4SLinus Torvalds 		buf->bs_blocks = 0;
1121da177e4SLinus Torvalds 		break;
1131da177e4SLinus Torvalds 	case XFS_DINODE_FMT_LOCAL:
1141da177e4SLinus Torvalds 	case XFS_DINODE_FMT_UUID:
1151da177e4SLinus Torvalds 		buf->bs_rdev = 0;
1161da177e4SLinus Torvalds 		buf->bs_blksize = mp->m_sb.sb_blocksize;
1171da177e4SLinus Torvalds 		buf->bs_blocks = 0;
1181da177e4SLinus Torvalds 		break;
1191da177e4SLinus Torvalds 	case XFS_DINODE_FMT_EXTENTS:
1201da177e4SLinus Torvalds 	case XFS_DINODE_FMT_BTREE:
1211da177e4SLinus Torvalds 		buf->bs_rdev = 0;
1221da177e4SLinus Torvalds 		buf->bs_blksize = mp->m_sb.sb_blocksize;
1231da177e4SLinus Torvalds 		buf->bs_blocks = dic->di_nblocks + ip->i_delayed_blks;
1241da177e4SLinus Torvalds 		break;
1251da177e4SLinus Torvalds 	}
1261da177e4SLinus Torvalds 
1271da177e4SLinus Torvalds  out_iput:
1281da177e4SLinus Torvalds 	xfs_iput(ip, XFS_ILOCK_SHARED);
1291da177e4SLinus Torvalds 	return error;
1301da177e4SLinus Torvalds }
1311da177e4SLinus Torvalds 
1321da177e4SLinus Torvalds STATIC int
1331da177e4SLinus Torvalds xfs_bulkstat_one_dinode(
1341da177e4SLinus Torvalds 	xfs_mount_t	*mp,		/* mount point for filesystem */
1351da177e4SLinus Torvalds 	xfs_ino_t	ino,		/* inode number to get data for */
1361da177e4SLinus Torvalds 	xfs_dinode_t	*dip,		/* dinode inode pointer */
1371da177e4SLinus Torvalds 	xfs_bstat_t	*buf)		/* return buffer */
1381da177e4SLinus Torvalds {
1391da177e4SLinus Torvalds 	xfs_dinode_core_t *dic;		/* dinode core info pointer */
1401da177e4SLinus Torvalds 
1411da177e4SLinus Torvalds 	dic = &dip->di_core;
1421da177e4SLinus Torvalds 
1431da177e4SLinus Torvalds 	/*
1441da177e4SLinus Torvalds 	 * The inode format changed when we moved the link count and
1451da177e4SLinus Torvalds 	 * made it 32 bits long.  If this is an old format inode,
1461da177e4SLinus Torvalds 	 * convert it in memory to look like a new one.  If it gets
1471da177e4SLinus Torvalds 	 * flushed to disk we will convert back before flushing or
1481da177e4SLinus Torvalds 	 * logging it.  We zero out the new projid field and the old link
1491da177e4SLinus Torvalds 	 * count field.  We'll handle clearing the pad field (the remains
1501da177e4SLinus Torvalds 	 * of the old uuid field) when we actually convert the inode to
1511da177e4SLinus Torvalds 	 * the new format. We don't change the version number so that we
1521da177e4SLinus Torvalds 	 * can distinguish this from a real new format inode.
1531da177e4SLinus Torvalds 	 */
154347d1c01SChristoph Hellwig 	if (dic->di_version == XFS_DINODE_VERSION_1) {
155347d1c01SChristoph Hellwig 		buf->bs_nlink = be16_to_cpu(dic->di_onlink);
1561da177e4SLinus Torvalds 		buf->bs_projid = 0;
1571da177e4SLinus Torvalds 	} else {
158347d1c01SChristoph Hellwig 		buf->bs_nlink = be32_to_cpu(dic->di_nlink);
159347d1c01SChristoph Hellwig 		buf->bs_projid = be16_to_cpu(dic->di_projid);
1601da177e4SLinus Torvalds 	}
1611da177e4SLinus Torvalds 
1621da177e4SLinus Torvalds 	buf->bs_ino = ino;
163347d1c01SChristoph Hellwig 	buf->bs_mode = be16_to_cpu(dic->di_mode);
164347d1c01SChristoph Hellwig 	buf->bs_uid = be32_to_cpu(dic->di_uid);
165347d1c01SChristoph Hellwig 	buf->bs_gid = be32_to_cpu(dic->di_gid);
166347d1c01SChristoph Hellwig 	buf->bs_size = be64_to_cpu(dic->di_size);
167347d1c01SChristoph Hellwig 	buf->bs_atime.tv_sec = be32_to_cpu(dic->di_atime.t_sec);
168347d1c01SChristoph Hellwig 	buf->bs_atime.tv_nsec = be32_to_cpu(dic->di_atime.t_nsec);
169347d1c01SChristoph Hellwig 	buf->bs_mtime.tv_sec = be32_to_cpu(dic->di_mtime.t_sec);
170347d1c01SChristoph Hellwig 	buf->bs_mtime.tv_nsec = be32_to_cpu(dic->di_mtime.t_nsec);
171347d1c01SChristoph Hellwig 	buf->bs_ctime.tv_sec = be32_to_cpu(dic->di_ctime.t_sec);
172347d1c01SChristoph Hellwig 	buf->bs_ctime.tv_nsec = be32_to_cpu(dic->di_ctime.t_nsec);
1731da177e4SLinus Torvalds 	buf->bs_xflags = xfs_dic2xflags(dic);
174347d1c01SChristoph Hellwig 	buf->bs_extsize = be32_to_cpu(dic->di_extsize) << mp->m_sb.sb_blocklog;
175347d1c01SChristoph Hellwig 	buf->bs_extents = be32_to_cpu(dic->di_nextents);
176347d1c01SChristoph Hellwig 	buf->bs_gen = be32_to_cpu(dic->di_gen);
1771da177e4SLinus Torvalds 	memset(buf->bs_pad, 0, sizeof(buf->bs_pad));
178347d1c01SChristoph Hellwig 	buf->bs_dmevmask = be32_to_cpu(dic->di_dmevmask);
179347d1c01SChristoph Hellwig 	buf->bs_dmstate = be16_to_cpu(dic->di_dmstate);
180347d1c01SChristoph Hellwig 	buf->bs_aextents = be16_to_cpu(dic->di_anextents);
1811da177e4SLinus Torvalds 
182347d1c01SChristoph Hellwig 	switch (dic->di_format) {
1831da177e4SLinus Torvalds 	case XFS_DINODE_FMT_DEV:
184347d1c01SChristoph Hellwig 		buf->bs_rdev = be32_to_cpu(dip->di_u.di_dev);
1851da177e4SLinus Torvalds 		buf->bs_blksize = BLKDEV_IOSIZE;
1861da177e4SLinus Torvalds 		buf->bs_blocks = 0;
1871da177e4SLinus Torvalds 		break;
1881da177e4SLinus Torvalds 	case XFS_DINODE_FMT_LOCAL:
1891da177e4SLinus Torvalds 	case XFS_DINODE_FMT_UUID:
1901da177e4SLinus Torvalds 		buf->bs_rdev = 0;
1911da177e4SLinus Torvalds 		buf->bs_blksize = mp->m_sb.sb_blocksize;
1921da177e4SLinus Torvalds 		buf->bs_blocks = 0;
1931da177e4SLinus Torvalds 		break;
1941da177e4SLinus Torvalds 	case XFS_DINODE_FMT_EXTENTS:
1951da177e4SLinus Torvalds 	case XFS_DINODE_FMT_BTREE:
1961da177e4SLinus Torvalds 		buf->bs_rdev = 0;
1971da177e4SLinus Torvalds 		buf->bs_blksize = mp->m_sb.sb_blocksize;
198347d1c01SChristoph Hellwig 		buf->bs_blocks = be64_to_cpu(dic->di_nblocks);
1991da177e4SLinus Torvalds 		break;
2001da177e4SLinus Torvalds 	}
2011da177e4SLinus Torvalds 
2021da177e4SLinus Torvalds 	return 0;
2031da177e4SLinus Torvalds }
2041da177e4SLinus Torvalds 
205faa63e95SMichal Marek STATIC int
206faa63e95SMichal Marek xfs_bulkstat_one_fmt(
207faa63e95SMichal Marek 	void			__user *ubuffer,
208faa63e95SMichal Marek 	const xfs_bstat_t	*buffer)
209faa63e95SMichal Marek {
210faa63e95SMichal Marek 	if (copy_to_user(ubuffer, buffer, sizeof(*buffer)))
211faa63e95SMichal Marek 		return -EFAULT;
212faa63e95SMichal Marek 	return sizeof(*buffer);
213faa63e95SMichal Marek }
214faa63e95SMichal Marek 
2151da177e4SLinus Torvalds /*
2161da177e4SLinus Torvalds  * Return stat information for one inode.
2171da177e4SLinus Torvalds  * Return 0 if ok, else errno.
2181da177e4SLinus Torvalds  */
2191da177e4SLinus Torvalds int		       		/* error status */
2201da177e4SLinus Torvalds xfs_bulkstat_one(
2211da177e4SLinus Torvalds 	xfs_mount_t	*mp,		/* mount point for filesystem */
2221da177e4SLinus Torvalds 	xfs_ino_t	ino,		/* inode number to get data for */
2231da177e4SLinus Torvalds 	void		__user *buffer,	/* buffer to place output in */
2241da177e4SLinus Torvalds 	int		ubsize,		/* size of buffer */
2251da177e4SLinus Torvalds 	void		*private_data,	/* my private data */
2261da177e4SLinus Torvalds 	xfs_daddr_t	bno,		/* starting bno of inode cluster */
2271da177e4SLinus Torvalds 	int		*ubused,	/* bytes used by me */
2281da177e4SLinus Torvalds 	void		*dibuff,	/* on-disk inode buffer */
2291da177e4SLinus Torvalds 	int		*stat)		/* BULKSTAT_RV_... */
2301da177e4SLinus Torvalds {
2311da177e4SLinus Torvalds 	xfs_bstat_t	*buf;		/* return buffer */
2321da177e4SLinus Torvalds 	int		error = 0;	/* error value */
2331da177e4SLinus Torvalds 	xfs_dinode_t	*dip;		/* dinode inode pointer */
234faa63e95SMichal Marek 	bulkstat_one_fmt_pf formatter = private_data ? : xfs_bulkstat_one_fmt;
2351da177e4SLinus Torvalds 
2361da177e4SLinus Torvalds 	dip = (xfs_dinode_t *)dibuff;
2376f1f2168SVlad Apostolov 	*stat = BULKSTAT_RV_NOTHING;
2381da177e4SLinus Torvalds 
2396f1f2168SVlad Apostolov 	if (!buffer || xfs_internal_inum(mp, ino))
2401da177e4SLinus Torvalds 		return XFS_ERROR(EINVAL);
2416f1f2168SVlad Apostolov 	if (ubsize < sizeof(*buf))
2421da177e4SLinus Torvalds 		return XFS_ERROR(ENOMEM);
2431da177e4SLinus Torvalds 
2441da177e4SLinus Torvalds 	buf = kmem_alloc(sizeof(*buf), KM_SLEEP);
2451da177e4SLinus Torvalds 
2461da177e4SLinus Torvalds 	if (dip == NULL) {
2471da177e4SLinus Torvalds 		/* We're not being passed a pointer to a dinode.  This happens
2481da177e4SLinus Torvalds 		 * if BULKSTAT_FG_IGET is selected.  Do the iget.
2491da177e4SLinus Torvalds 		 */
2501da177e4SLinus Torvalds 		error = xfs_bulkstat_one_iget(mp, ino, bno, buf, stat);
2511da177e4SLinus Torvalds 		if (error)
2521da177e4SLinus Torvalds 			goto out_free;
2531da177e4SLinus Torvalds 	} else {
2541da177e4SLinus Torvalds 		xfs_bulkstat_one_dinode(mp, ino, dip, buf);
2551da177e4SLinus Torvalds 	}
2561da177e4SLinus Torvalds 
257faa63e95SMichal Marek 	error = formatter(buffer, buf);
258faa63e95SMichal Marek 	if (error < 0)  {
2591da177e4SLinus Torvalds 		error = EFAULT;
2601da177e4SLinus Torvalds 		goto out_free;
2611da177e4SLinus Torvalds 	}
2621da177e4SLinus Torvalds 
2631da177e4SLinus Torvalds 	*stat = BULKSTAT_RV_DIDONE;
2641da177e4SLinus Torvalds 	if (ubused)
265faa63e95SMichal Marek 		*ubused = error;
2661da177e4SLinus Torvalds 
2671da177e4SLinus Torvalds  out_free:
2681da177e4SLinus Torvalds 	kmem_free(buf, sizeof(*buf));
2691da177e4SLinus Torvalds 	return error;
2701da177e4SLinus Torvalds }
2711da177e4SLinus Torvalds 
2721da177e4SLinus Torvalds /*
2738b56f083SNathan Scott  * Test to see whether we can use the ondisk inode directly, based
2748b56f083SNathan Scott  * on the given bulkstat flags, filling in dipp accordingly.
2758b56f083SNathan Scott  * Returns zero if the inode is dodgey.
2768b56f083SNathan Scott  */
2778b56f083SNathan Scott STATIC int
2788b56f083SNathan Scott xfs_bulkstat_use_dinode(
2798b56f083SNathan Scott 	xfs_mount_t	*mp,
2808b56f083SNathan Scott 	int		flags,
2818b56f083SNathan Scott 	xfs_buf_t	*bp,
2828b56f083SNathan Scott 	int		clustidx,
2838b56f083SNathan Scott 	xfs_dinode_t	**dipp)
2848b56f083SNathan Scott {
2858b56f083SNathan Scott 	xfs_dinode_t	*dip;
2868b56f083SNathan Scott 	unsigned int	aformat;
2878b56f083SNathan Scott 
2888b56f083SNathan Scott 	*dipp = NULL;
2898b56f083SNathan Scott 	if (!bp || (flags & BULKSTAT_FG_IGET))
2908b56f083SNathan Scott 		return 1;
2918b56f083SNathan Scott 	dip = (xfs_dinode_t *)
2928b56f083SNathan Scott 			xfs_buf_offset(bp, clustidx << mp->m_sb.sb_inodelog);
293859d7182SVlad Apostolov 	/*
294859d7182SVlad Apostolov 	 * Check the buffer containing the on-disk inode for di_nlink == 0.
295859d7182SVlad Apostolov 	 * This is to prevent xfs_bulkstat from picking up just reclaimed
296859d7182SVlad Apostolov 	 * inodes that have their in-core state initialized but not flushed
297859d7182SVlad Apostolov 	 * to disk yet. This is a temporary hack that would require a proper
298859d7182SVlad Apostolov 	 * fix in the future.
299859d7182SVlad Apostolov 	 */
300347d1c01SChristoph Hellwig 	if (be16_to_cpu(dip->di_core.di_magic) != XFS_DINODE_MAGIC ||
301859d7182SVlad Apostolov 	    !XFS_DINODE_GOOD_VERSION(dip->di_core.di_version) ||
302859d7182SVlad Apostolov 	    !dip->di_core.di_nlink)
3038b56f083SNathan Scott 		return 0;
3048b56f083SNathan Scott 	if (flags & BULKSTAT_FG_QUICK) {
3058b56f083SNathan Scott 		*dipp = dip;
3068b56f083SNathan Scott 		return 1;
3078b56f083SNathan Scott 	}
3088b56f083SNathan Scott 	/* BULKSTAT_FG_INLINE: if attr fork is local, or not there, use it */
309347d1c01SChristoph Hellwig 	aformat = dip->di_core.di_aformat;
3108b56f083SNathan Scott 	if ((XFS_CFORK_Q(&dip->di_core) == 0) ||
3118b56f083SNathan Scott 	    (aformat == XFS_DINODE_FMT_LOCAL) ||
3128b56f083SNathan Scott 	    (aformat == XFS_DINODE_FMT_EXTENTS && !dip->di_core.di_anextents)) {
3138b56f083SNathan Scott 		*dipp = dip;
3148b56f083SNathan Scott 		return 1;
3158b56f083SNathan Scott 	}
3168b56f083SNathan Scott 	return 1;
3178b56f083SNathan Scott }
3188b56f083SNathan Scott 
/*
 * True while the user buffer still has room for at least one more stat
 * structure.  Must be expanded in a scope that provides statstruct_size.
 *
 * A negative byte count means "no room".  Comparing it directly against
 * the unsigned statstruct_size would convert it to a huge positive value
 * and wrongly report space.  The argument is evaluated twice, so pass a
 * plain variable.
 */
#define XFS_BULKSTAT_UBLEFT(ubleft)	\
	((ubleft) >= 0 && (size_t)(ubleft) >= statstruct_size)
320*cd57e594SLachlan McIlroy 
3218b56f083SNathan Scott /*
3221da177e4SLinus Torvalds  * Return stat information in bulk (by-inode) for the filesystem.
3231da177e4SLinus Torvalds  */
3241da177e4SLinus Torvalds int					/* error status */
3251da177e4SLinus Torvalds xfs_bulkstat(
3261da177e4SLinus Torvalds 	xfs_mount_t		*mp,	/* mount point for filesystem */
3271da177e4SLinus Torvalds 	xfs_ino_t		*lastinop, /* last inode returned */
3281da177e4SLinus Torvalds 	int			*ubcountp, /* size of buffer/count returned */
3291da177e4SLinus Torvalds 	bulkstat_one_pf		formatter, /* func that'd fill a single buf */
3301da177e4SLinus Torvalds 	void			*private_data,/* private data for formatter */
3311da177e4SLinus Torvalds 	size_t			statstruct_size, /* sizeof struct filling */
3321da177e4SLinus Torvalds 	char			__user *ubuffer, /* buffer with inode stats */
3331da177e4SLinus Torvalds 	int			flags,	/* defined in xfs_itable.h */
334c41564b5SNathan Scott 	int			*done)	/* 1 if there are more stats to get */
3351da177e4SLinus Torvalds {
3361da177e4SLinus Torvalds 	xfs_agblock_t		agbno=0;/* allocation group block number */
3371da177e4SLinus Torvalds 	xfs_buf_t		*agbp;	/* agi header buffer */
3381da177e4SLinus Torvalds 	xfs_agi_t		*agi;	/* agi header data */
3391da177e4SLinus Torvalds 	xfs_agino_t		agino;	/* inode # in allocation group */
3401da177e4SLinus Torvalds 	xfs_agnumber_t		agno;	/* allocation group number */
3411da177e4SLinus Torvalds 	xfs_daddr_t		bno;	/* inode cluster start daddr */
3421da177e4SLinus Torvalds 	int			chunkidx; /* current index into inode chunk */
3431da177e4SLinus Torvalds 	int			clustidx; /* current index into inode cluster */
3441da177e4SLinus Torvalds 	xfs_btree_cur_t		*cur;	/* btree cursor for ialloc btree */
3451da177e4SLinus Torvalds 	int			end_of_ag; /* set if we've seen the ag end */
3461da177e4SLinus Torvalds 	int			error;	/* error code */
3471da177e4SLinus Torvalds 	int                     fmterror;/* bulkstat formatter result */
3481da177e4SLinus Torvalds 	__int32_t		gcnt;	/* current btree rec's count */
3491da177e4SLinus Torvalds 	xfs_inofree_t		gfree;	/* current btree rec's free mask */
3501da177e4SLinus Torvalds 	xfs_agino_t		gino;	/* current btree rec's start inode */
3511da177e4SLinus Torvalds 	int			i;	/* loop index */
3521da177e4SLinus Torvalds 	int			icount;	/* count of inodes good in irbuf */
353215101c3SNathan Scott 	size_t			irbsize; /* size of irec buffer in bytes */
3541da177e4SLinus Torvalds 	xfs_ino_t		ino;	/* inode number (filesystem) */
35526275093SNathan Scott 	xfs_inobt_rec_incore_t	*irbp;	/* current irec buffer pointer */
35626275093SNathan Scott 	xfs_inobt_rec_incore_t	*irbuf;	/* start of irec buffer */
35726275093SNathan Scott 	xfs_inobt_rec_incore_t	*irbufend; /* end of good irec buffer entries */
358*cd57e594SLachlan McIlroy 	xfs_ino_t		lastino; /* last inode number returned */
3591da177e4SLinus Torvalds 	int			nbcluster; /* # of blocks in a cluster */
3601da177e4SLinus Torvalds 	int			nicluster; /* # of inodes in a cluster */
3611da177e4SLinus Torvalds 	int			nimask;	/* mask for inode clusters */
3621da177e4SLinus Torvalds 	int			nirbuf;	/* size of irbuf */
3631da177e4SLinus Torvalds 	int			rval;	/* return value error code */
3641da177e4SLinus Torvalds 	int			tmp;	/* result value from btree calls */
3651da177e4SLinus Torvalds 	int			ubcount; /* size of user's buffer */
3661da177e4SLinus Torvalds 	int			ubleft;	/* bytes left in user's buffer */
3671da177e4SLinus Torvalds 	char			__user *ubufp;	/* pointer into user's buffer */
3681da177e4SLinus Torvalds 	int			ubelem;	/* spaces used in user's buffer */
3691da177e4SLinus Torvalds 	int			ubused;	/* bytes used by formatter */
3701da177e4SLinus Torvalds 	xfs_buf_t		*bp;	/* ptr to on-disk inode cluster buf */
3711da177e4SLinus Torvalds 	xfs_dinode_t		*dip;	/* ptr into bp for specific inode */
3721da177e4SLinus Torvalds 	xfs_inode_t		*ip;	/* ptr to in-core inode struct */
3731da177e4SLinus Torvalds 
3741da177e4SLinus Torvalds 	/*
3751da177e4SLinus Torvalds 	 * Get the last inode value, see if there's nothing to do.
3761da177e4SLinus Torvalds 	 */
3771da177e4SLinus Torvalds 	ino = (xfs_ino_t)*lastinop;
378*cd57e594SLachlan McIlroy 	lastino = ino;
3791da177e4SLinus Torvalds 	dip = NULL;
3801da177e4SLinus Torvalds 	agno = XFS_INO_TO_AGNO(mp, ino);
3811da177e4SLinus Torvalds 	agino = XFS_INO_TO_AGINO(mp, ino);
3821da177e4SLinus Torvalds 	if (agno >= mp->m_sb.sb_agcount ||
3831da177e4SLinus Torvalds 	    ino != XFS_AGINO_TO_INO(mp, agno, agino)) {
3841da177e4SLinus Torvalds 		*done = 1;
3851da177e4SLinus Torvalds 		*ubcountp = 0;
3861da177e4SLinus Torvalds 		return 0;
3871da177e4SLinus Torvalds 	}
388*cd57e594SLachlan McIlroy 	if (!ubcountp || *ubcountp <= 0) {
389*cd57e594SLachlan McIlroy 		return EINVAL;
390*cd57e594SLachlan McIlroy 	}
3911da177e4SLinus Torvalds 	ubcount = *ubcountp; /* statstruct's */
3921da177e4SLinus Torvalds 	ubleft = ubcount * statstruct_size; /* bytes */
3931da177e4SLinus Torvalds 	*ubcountp = ubelem = 0;
3941da177e4SLinus Torvalds 	*done = 0;
3951da177e4SLinus Torvalds 	fmterror = 0;
3961da177e4SLinus Torvalds 	ubufp = ubuffer;
3971da177e4SLinus Torvalds 	nicluster = mp->m_sb.sb_blocksize >= XFS_INODE_CLUSTER_SIZE(mp) ?
3981da177e4SLinus Torvalds 		mp->m_sb.sb_inopblock :
3991da177e4SLinus Torvalds 		(XFS_INODE_CLUSTER_SIZE(mp) >> mp->m_sb.sb_inodelog);
4001da177e4SLinus Torvalds 	nimask = ~(nicluster - 1);
4011da177e4SLinus Torvalds 	nbcluster = nicluster >> mp->m_sb.sb_inopblog;
40277e4635aSNathan Scott 	irbuf = kmem_zalloc_greedy(&irbsize, NBPC, NBPC * 4,
40377e4635aSNathan Scott 				   KM_SLEEP | KM_MAYFAIL | KM_LARGE);
404bb3c7d29SNathan Scott 	nirbuf = irbsize / sizeof(*irbuf);
405bb3c7d29SNathan Scott 
4061da177e4SLinus Torvalds 	/*
4071da177e4SLinus Torvalds 	 * Loop over the allocation groups, starting from the last
4081da177e4SLinus Torvalds 	 * inode returned; 0 means start of the allocation group.
4091da177e4SLinus Torvalds 	 */
4101da177e4SLinus Torvalds 	rval = 0;
411*cd57e594SLachlan McIlroy 	while (XFS_BULKSTAT_UBLEFT(ubleft) && agno < mp->m_sb.sb_agcount) {
412*cd57e594SLachlan McIlroy 		cond_resched();
4131da177e4SLinus Torvalds 		bp = NULL;
4141da177e4SLinus Torvalds 		down_read(&mp->m_peraglock);
4151da177e4SLinus Torvalds 		error = xfs_ialloc_read_agi(mp, NULL, agno, &agbp);
4161da177e4SLinus Torvalds 		up_read(&mp->m_peraglock);
4171da177e4SLinus Torvalds 		if (error) {
4181da177e4SLinus Torvalds 			/*
4191da177e4SLinus Torvalds 			 * Skip this allocation group and go to the next one.
4201da177e4SLinus Torvalds 			 */
4211da177e4SLinus Torvalds 			agno++;
4221da177e4SLinus Torvalds 			agino = 0;
4231da177e4SLinus Torvalds 			continue;
4241da177e4SLinus Torvalds 		}
4251da177e4SLinus Torvalds 		agi = XFS_BUF_TO_AGI(agbp);
4261da177e4SLinus Torvalds 		/*
4271da177e4SLinus Torvalds 		 * Allocate and initialize a btree cursor for ialloc btree.
4281da177e4SLinus Torvalds 		 */
4291da177e4SLinus Torvalds 		cur = xfs_btree_init_cursor(mp, NULL, agbp, agno, XFS_BTNUM_INO,
4301da177e4SLinus Torvalds 						(xfs_inode_t *)0, 0);
4311da177e4SLinus Torvalds 		irbp = irbuf;
4321da177e4SLinus Torvalds 		irbufend = irbuf + nirbuf;
4331da177e4SLinus Torvalds 		end_of_ag = 0;
4341da177e4SLinus Torvalds 		/*
4351da177e4SLinus Torvalds 		 * If we're returning in the middle of an allocation group,
4361da177e4SLinus Torvalds 		 * we need to get the remainder of the chunk we're in.
4371da177e4SLinus Torvalds 		 */
4381da177e4SLinus Torvalds 		if (agino > 0) {
4391da177e4SLinus Torvalds 			/*
4401da177e4SLinus Torvalds 			 * Lookup the inode chunk that this inode lives in.
4411da177e4SLinus Torvalds 			 */
4421da177e4SLinus Torvalds 			error = xfs_inobt_lookup_le(cur, agino, 0, 0, &tmp);
4431da177e4SLinus Torvalds 			if (!error &&	/* no I/O error */
4441da177e4SLinus Torvalds 			    tmp &&	/* lookup succeeded */
4451da177e4SLinus Torvalds 					/* got the record, should always work */
4461da177e4SLinus Torvalds 			    !(error = xfs_inobt_get_rec(cur, &gino, &gcnt,
4471da177e4SLinus Torvalds 				    &gfree, &i)) &&
4481da177e4SLinus Torvalds 			    i == 1 &&
4491da177e4SLinus Torvalds 					/* this is the right chunk */
4501da177e4SLinus Torvalds 			    agino < gino + XFS_INODES_PER_CHUNK &&
4511da177e4SLinus Torvalds 					/* lastino was not last in chunk */
4521da177e4SLinus Torvalds 			    (chunkidx = agino - gino + 1) <
4531da177e4SLinus Torvalds 				    XFS_INODES_PER_CHUNK &&
4541da177e4SLinus Torvalds 					/* there are some left allocated */
4551da177e4SLinus Torvalds 			    XFS_INOBT_MASKN(chunkidx,
4561da177e4SLinus Torvalds 				    XFS_INODES_PER_CHUNK - chunkidx) & ~gfree) {
4571da177e4SLinus Torvalds 				/*
4581da177e4SLinus Torvalds 				 * Grab the chunk record.  Mark all the
4591da177e4SLinus Torvalds 				 * uninteresting inodes (because they're
4601da177e4SLinus Torvalds 				 * before our start point) free.
4611da177e4SLinus Torvalds 				 */
4621da177e4SLinus Torvalds 				for (i = 0; i < chunkidx; i++) {
4631da177e4SLinus Torvalds 					if (XFS_INOBT_MASK(i) & ~gfree)
4641da177e4SLinus Torvalds 						gcnt++;
4651da177e4SLinus Torvalds 				}
4661da177e4SLinus Torvalds 				gfree |= XFS_INOBT_MASKN(0, chunkidx);
46726275093SNathan Scott 				irbp->ir_startino = gino;
46826275093SNathan Scott 				irbp->ir_freecount = gcnt;
46926275093SNathan Scott 				irbp->ir_free = gfree;
4701da177e4SLinus Torvalds 				irbp++;
4711da177e4SLinus Torvalds 				agino = gino + XFS_INODES_PER_CHUNK;
4721da177e4SLinus Torvalds 				icount = XFS_INODES_PER_CHUNK - gcnt;
4731da177e4SLinus Torvalds 			} else {
4741da177e4SLinus Torvalds 				/*
4751da177e4SLinus Torvalds 				 * If any of those tests failed, bump the
4761da177e4SLinus Torvalds 				 * inode number (just in case).
4771da177e4SLinus Torvalds 				 */
4781da177e4SLinus Torvalds 				agino++;
4791da177e4SLinus Torvalds 				icount = 0;
4801da177e4SLinus Torvalds 			}
4811da177e4SLinus Torvalds 			/*
4821da177e4SLinus Torvalds 			 * In any case, increment to the next record.
4831da177e4SLinus Torvalds 			 */
4841da177e4SLinus Torvalds 			if (!error)
4851da177e4SLinus Torvalds 				error = xfs_inobt_increment(cur, 0, &tmp);
4861da177e4SLinus Torvalds 		} else {
4871da177e4SLinus Torvalds 			/*
4881da177e4SLinus Torvalds 			 * Start of ag.  Lookup the first inode chunk.
4891da177e4SLinus Torvalds 			 */
4901da177e4SLinus Torvalds 			error = xfs_inobt_lookup_ge(cur, 0, 0, 0, &tmp);
4911da177e4SLinus Torvalds 			icount = 0;
4921da177e4SLinus Torvalds 		}
4931da177e4SLinus Torvalds 		/*
4941da177e4SLinus Torvalds 		 * Loop through inode btree records in this ag,
4951da177e4SLinus Torvalds 		 * until we run out of inodes or space in the buffer.
4961da177e4SLinus Torvalds 		 */
4971da177e4SLinus Torvalds 		while (irbp < irbufend && icount < ubcount) {
4981da177e4SLinus Torvalds 			/*
4991da177e4SLinus Torvalds 			 * Loop as long as we're unable to read the
5001da177e4SLinus Torvalds 			 * inode btree.
5011da177e4SLinus Torvalds 			 */
5021da177e4SLinus Torvalds 			while (error) {
5031da177e4SLinus Torvalds 				agino += XFS_INODES_PER_CHUNK;
5041da177e4SLinus Torvalds 				if (XFS_AGINO_TO_AGBNO(mp, agino) >=
50516259e7dSChristoph Hellwig 						be32_to_cpu(agi->agi_length))
5061da177e4SLinus Torvalds 					break;
5071da177e4SLinus Torvalds 				error = xfs_inobt_lookup_ge(cur, agino, 0, 0,
5081da177e4SLinus Torvalds 							    &tmp);
509*cd57e594SLachlan McIlroy 				cond_resched();
5101da177e4SLinus Torvalds 			}
5111da177e4SLinus Torvalds 			/*
5121da177e4SLinus Torvalds 			 * If ran off the end of the ag either with an error,
5131da177e4SLinus Torvalds 			 * or the normal way, set end and stop collecting.
5141da177e4SLinus Torvalds 			 */
5151da177e4SLinus Torvalds 			if (error ||
5161da177e4SLinus Torvalds 			    (error = xfs_inobt_get_rec(cur, &gino, &gcnt,
5171da177e4SLinus Torvalds 				    &gfree, &i)) ||
5181da177e4SLinus Torvalds 			    i == 0) {
5191da177e4SLinus Torvalds 				end_of_ag = 1;
5201da177e4SLinus Torvalds 				break;
5211da177e4SLinus Torvalds 			}
5221da177e4SLinus Torvalds 			/*
5231da177e4SLinus Torvalds 			 * If this chunk has any allocated inodes, save it.
52426275093SNathan Scott 			 * Also start read-ahead now for this chunk.
5251da177e4SLinus Torvalds 			 */
5261da177e4SLinus Torvalds 			if (gcnt < XFS_INODES_PER_CHUNK) {
52726275093SNathan Scott 				/*
52826275093SNathan Scott 				 * Loop over all clusters in the next chunk.
52926275093SNathan Scott 				 * Do a readahead if there are any allocated
53026275093SNathan Scott 				 * inodes in that cluster.
53126275093SNathan Scott 				 */
53226275093SNathan Scott 				for (agbno = XFS_AGINO_TO_AGBNO(mp, gino),
53326275093SNathan Scott 				     chunkidx = 0;
53426275093SNathan Scott 				     chunkidx < XFS_INODES_PER_CHUNK;
53526275093SNathan Scott 				     chunkidx += nicluster,
53626275093SNathan Scott 				     agbno += nbcluster) {
53726275093SNathan Scott 					if (XFS_INOBT_MASKN(chunkidx,
53826275093SNathan Scott 							    nicluster) & ~gfree)
53926275093SNathan Scott 						xfs_btree_reada_bufs(mp, agno,
54026275093SNathan Scott 							agbno, nbcluster);
54126275093SNathan Scott 				}
54226275093SNathan Scott 				irbp->ir_startino = gino;
54326275093SNathan Scott 				irbp->ir_freecount = gcnt;
54426275093SNathan Scott 				irbp->ir_free = gfree;
5451da177e4SLinus Torvalds 				irbp++;
5461da177e4SLinus Torvalds 				icount += XFS_INODES_PER_CHUNK - gcnt;
5471da177e4SLinus Torvalds 			}
5481da177e4SLinus Torvalds 			/*
5491da177e4SLinus Torvalds 			 * Set agino to after this chunk and bump the cursor.
5501da177e4SLinus Torvalds 			 */
5511da177e4SLinus Torvalds 			agino = gino + XFS_INODES_PER_CHUNK;
5521da177e4SLinus Torvalds 			error = xfs_inobt_increment(cur, 0, &tmp);
553*cd57e594SLachlan McIlroy 			cond_resched();
5541da177e4SLinus Torvalds 		}
5551da177e4SLinus Torvalds 		/*
5561da177e4SLinus Torvalds 		 * Drop the btree buffers and the agi buffer.
5571da177e4SLinus Torvalds 		 * We can't hold any of the locks these represent
5581da177e4SLinus Torvalds 		 * when calling iget.
5591da177e4SLinus Torvalds 		 */
5601da177e4SLinus Torvalds 		xfs_btree_del_cursor(cur, XFS_BTREE_NOERROR);
5611da177e4SLinus Torvalds 		xfs_buf_relse(agbp);
5621da177e4SLinus Torvalds 		/*
5631da177e4SLinus Torvalds 		 * Now format all the good inodes into the user's buffer.
5641da177e4SLinus Torvalds 		 */
5651da177e4SLinus Torvalds 		irbufend = irbp;
5661da177e4SLinus Torvalds 		for (irbp = irbuf;
567*cd57e594SLachlan McIlroy 		     irbp < irbufend && XFS_BULKSTAT_UBLEFT(ubleft); irbp++) {
5681da177e4SLinus Torvalds 			/*
5691da177e4SLinus Torvalds 			 * Now process this chunk of inodes.
5701da177e4SLinus Torvalds 			 */
57126275093SNathan Scott 			for (agino = irbp->ir_startino, chunkidx = clustidx = 0;
572*cd57e594SLachlan McIlroy 			     XFS_BULKSTAT_UBLEFT(ubleft) &&
57326275093SNathan Scott 				irbp->ir_freecount < XFS_INODES_PER_CHUNK;
5741da177e4SLinus Torvalds 			     chunkidx++, clustidx++, agino++) {
5751da177e4SLinus Torvalds 				ASSERT(chunkidx < XFS_INODES_PER_CHUNK);
5761da177e4SLinus Torvalds 				/*
5771da177e4SLinus Torvalds 				 * Recompute agbno if this is the
5781da177e4SLinus Torvalds 				 * first inode of the cluster.
5791da177e4SLinus Torvalds 				 *
5801da177e4SLinus Torvalds 				 * Careful with clustidx.   There can be
5811da177e4SLinus Torvalds 				 * multiple clusters per chunk, a single
5821da177e4SLinus Torvalds 				 * cluster per chunk or a cluster that has
5831da177e4SLinus Torvalds 				 * inodes represented from several different
5841da177e4SLinus Torvalds 				 * chunks (if blocksize is large).
5851da177e4SLinus Torvalds 				 *
5861da177e4SLinus Torvalds 				 * Because of this, the starting clustidx is
5871da177e4SLinus Torvalds 				 * initialized to zero in this loop but must
5881da177e4SLinus Torvalds 				 * later be reset after reading in the cluster
5891da177e4SLinus Torvalds 				 * buffer.
5901da177e4SLinus Torvalds 				 */
5911da177e4SLinus Torvalds 				if ((chunkidx & (nicluster - 1)) == 0) {
5921da177e4SLinus Torvalds 					agbno = XFS_AGINO_TO_AGBNO(mp,
59326275093SNathan Scott 							irbp->ir_startino) +
5941da177e4SLinus Torvalds 						((chunkidx & nimask) >>
5951da177e4SLinus Torvalds 						 mp->m_sb.sb_inopblog);
5961da177e4SLinus Torvalds 
5978b56f083SNathan Scott 					if (flags & (BULKSTAT_FG_QUICK |
5988b56f083SNathan Scott 						     BULKSTAT_FG_INLINE)) {
5991da177e4SLinus Torvalds 						ino = XFS_AGINO_TO_INO(mp, agno,
6001da177e4SLinus Torvalds 								       agino);
6011da177e4SLinus Torvalds 						bno = XFS_AGB_TO_DADDR(mp, agno,
6021da177e4SLinus Torvalds 								       agbno);
6031da177e4SLinus Torvalds 
6041da177e4SLinus Torvalds 						/*
6051da177e4SLinus Torvalds 						 * Get the inode cluster buffer
6061da177e4SLinus Torvalds 						 */
6071da177e4SLinus Torvalds 						ASSERT(xfs_inode_zone != NULL);
6081da177e4SLinus Torvalds 						ip = kmem_zone_zalloc(xfs_inode_zone,
6091da177e4SLinus Torvalds 								      KM_SLEEP);
6101da177e4SLinus Torvalds 						ip->i_ino = ino;
6111da177e4SLinus Torvalds 						ip->i_mount = mp;
612f273ab84SDavid Chinner 						spin_lock_init(&ip->i_flags_lock);
6131da177e4SLinus Torvalds 						if (bp)
6141da177e4SLinus Torvalds 							xfs_buf_relse(bp);
6151da177e4SLinus Torvalds 						error = xfs_itobp(mp, NULL, ip,
616b12dd342SNathan Scott 								&dip, &bp, bno,
617b12dd342SNathan Scott 								XFS_IMAP_BULKSTAT);
6181da177e4SLinus Torvalds 						if (!error)
6191da177e4SLinus Torvalds 							clustidx = ip->i_boffset / mp->m_sb.sb_inodesize;
6201da177e4SLinus Torvalds 						kmem_zone_free(xfs_inode_zone, ip);
6211da177e4SLinus Torvalds 						if (XFS_TEST_ERROR(error != 0,
6221da177e4SLinus Torvalds 								   mp, XFS_ERRTAG_BULKSTAT_READ_CHUNK,
6231da177e4SLinus Torvalds 								   XFS_RANDOM_BULKSTAT_READ_CHUNK)) {
6241da177e4SLinus Torvalds 							bp = NULL;
625b12dd342SNathan Scott 							ubleft = 0;
626b12dd342SNathan Scott 							rval = error;
6271da177e4SLinus Torvalds 							break;
6281da177e4SLinus Torvalds 						}
6291da177e4SLinus Torvalds 					}
6301da177e4SLinus Torvalds 				}
631c2cba57eSLachlan McIlroy 				ino = XFS_AGINO_TO_INO(mp, agno, agino);
632c2cba57eSLachlan McIlroy 				bno = XFS_AGB_TO_DADDR(mp, agno, agbno);
6331da177e4SLinus Torvalds 				/*
6341da177e4SLinus Torvalds 				 * Skip if this inode is free.
6351da177e4SLinus Torvalds 				 */
636c2cba57eSLachlan McIlroy 				if (XFS_INOBT_MASK(chunkidx) & irbp->ir_free) {
637c2cba57eSLachlan McIlroy 					lastino = ino;
6381da177e4SLinus Torvalds 					continue;
639c2cba57eSLachlan McIlroy 				}
6401da177e4SLinus Torvalds 				/*
6411da177e4SLinus Torvalds 				 * Count used inodes as free so we can tell
6421da177e4SLinus Torvalds 				 * when the chunk is used up.
6431da177e4SLinus Torvalds 				 */
64426275093SNathan Scott 				irbp->ir_freecount++;
6458b56f083SNathan Scott 				if (!xfs_bulkstat_use_dinode(mp, flags, bp,
646c2cba57eSLachlan McIlroy 							     clustidx, &dip)) {
647c2cba57eSLachlan McIlroy 					lastino = ino;
6481da177e4SLinus Torvalds 					continue;
649c2cba57eSLachlan McIlroy 				}
6508b56f083SNathan Scott 				/*
6518b56f083SNathan Scott 				 * If we need to do an iget, cannot hold bp.
6528b56f083SNathan Scott 				 * Drop it, until starting the next cluster.
6538b56f083SNathan Scott 				 */
6548b56f083SNathan Scott 				if ((flags & BULKSTAT_FG_INLINE) && !dip) {
6558b56f083SNathan Scott 					if (bp)
6568b56f083SNathan Scott 						xfs_buf_relse(bp);
6578b56f083SNathan Scott 					bp = NULL;
6581da177e4SLinus Torvalds 				}
6591da177e4SLinus Torvalds 
6601da177e4SLinus Torvalds 				/*
6611da177e4SLinus Torvalds 				 * Get the inode and fill in a single buffer.
6621da177e4SLinus Torvalds 				 * BULKSTAT_FG_QUICK uses dip to fill it in.
6631da177e4SLinus Torvalds 				 * BULKSTAT_FG_IGET uses igets.
6648b56f083SNathan Scott 				 * BULKSTAT_FG_INLINE uses dip if we have an
6658b56f083SNathan Scott 				 * inline attr fork, else igets.
6661da177e4SLinus Torvalds 				 * See: xfs_bulkstat_one & xfs_dm_bulkstat_one.
6671da177e4SLinus Torvalds 				 * This is also used to count inodes/blks, etc
6681da177e4SLinus Torvalds 				 * in xfs_qm_quotacheck.
6691da177e4SLinus Torvalds 				 */
6701da177e4SLinus Torvalds 				ubused = statstruct_size;
6711da177e4SLinus Torvalds 				error = formatter(mp, ino, ubufp,
6721da177e4SLinus Torvalds 						ubleft, private_data,
6731da177e4SLinus Torvalds 						bno, &ubused, dip, &fmterror);
6741da177e4SLinus Torvalds 				if (fmterror == BULKSTAT_RV_NOTHING) {
675*cd57e594SLachlan McIlroy 					if (error && error != ENOENT &&
676*cd57e594SLachlan McIlroy 						error != EINVAL) {
67722de606aSVlad Apostolov 						ubleft = 0;
67822de606aSVlad Apostolov 						rval = error;
67922de606aSVlad Apostolov 						break;
68022de606aSVlad Apostolov 					}
6816e73b418SVlad Apostolov 					lastino = ino;
6821da177e4SLinus Torvalds 					continue;
6831da177e4SLinus Torvalds 				}
6841da177e4SLinus Torvalds 				if (fmterror == BULKSTAT_RV_GIVEUP) {
6851da177e4SLinus Torvalds 					ubleft = 0;
6861da177e4SLinus Torvalds 					ASSERT(error);
6871da177e4SLinus Torvalds 					rval = error;
6881da177e4SLinus Torvalds 					break;
6891da177e4SLinus Torvalds 				}
6901da177e4SLinus Torvalds 				if (ubufp)
6911da177e4SLinus Torvalds 					ubufp += ubused;
6921da177e4SLinus Torvalds 				ubleft -= ubused;
6931da177e4SLinus Torvalds 				ubelem++;
6941da177e4SLinus Torvalds 				lastino = ino;
6951da177e4SLinus Torvalds 			}
696*cd57e594SLachlan McIlroy 
697*cd57e594SLachlan McIlroy 			cond_resched();
6981da177e4SLinus Torvalds 		}
6991da177e4SLinus Torvalds 
7001da177e4SLinus Torvalds 		if (bp)
7011da177e4SLinus Torvalds 			xfs_buf_relse(bp);
7021da177e4SLinus Torvalds 
7031da177e4SLinus Torvalds 		/*
7041da177e4SLinus Torvalds 		 * Set up for the next loop iteration.
7051da177e4SLinus Torvalds 		 */
706*cd57e594SLachlan McIlroy 		if (XFS_BULKSTAT_UBLEFT(ubleft)) {
7071da177e4SLinus Torvalds 			if (end_of_ag) {
7081da177e4SLinus Torvalds 				agno++;
7091da177e4SLinus Torvalds 				agino = 0;
710*cd57e594SLachlan McIlroy 			} else
711*cd57e594SLachlan McIlroy 				agino = XFS_INO_TO_AGINO(mp, lastino);
7121da177e4SLinus Torvalds 		} else
7131da177e4SLinus Torvalds 			break;
7141da177e4SLinus Torvalds 	}
7151da177e4SLinus Torvalds 	/*
7161da177e4SLinus Torvalds 	 * Done, we're either out of filesystem or space to put the data.
7171da177e4SLinus Torvalds 	 */
718bb3c7d29SNathan Scott 	kmem_free(irbuf, irbsize);
7191da177e4SLinus Torvalds 	*ubcountp = ubelem;
720*cd57e594SLachlan McIlroy 	/*
721*cd57e594SLachlan McIlroy 	 * Found some inodes, return them now and return the error next time.
722*cd57e594SLachlan McIlroy 	 */
723*cd57e594SLachlan McIlroy 	if (ubelem)
724*cd57e594SLachlan McIlroy 		rval = 0;
7251da177e4SLinus Torvalds 	if (agno >= mp->m_sb.sb_agcount) {
7261da177e4SLinus Torvalds 		/*
7271da177e4SLinus Torvalds 		 * If we ran out of filesystem, mark lastino as off
7281da177e4SLinus Torvalds 		 * the end of the filesystem, so the next call
7291da177e4SLinus Torvalds 		 * will return immediately.
7301da177e4SLinus Torvalds 		 */
7311da177e4SLinus Torvalds 		*lastinop = (xfs_ino_t)XFS_AGINO_TO_INO(mp, agno, 0);
7321da177e4SLinus Torvalds 		*done = 1;
7331da177e4SLinus Torvalds 	} else
7341da177e4SLinus Torvalds 		*lastinop = (xfs_ino_t)lastino;
7351da177e4SLinus Torvalds 
7361da177e4SLinus Torvalds 	return rval;
7371da177e4SLinus Torvalds }
7381da177e4SLinus Torvalds 
7391da177e4SLinus Torvalds /*
7401da177e4SLinus Torvalds  * Return stat information in bulk (by-inode) for the filesystem.
7411da177e4SLinus Torvalds  * Special case for non-sequential one inode bulkstat.
7421da177e4SLinus Torvalds  */
7431da177e4SLinus Torvalds int					/* error status */
7441da177e4SLinus Torvalds xfs_bulkstat_single(
7451da177e4SLinus Torvalds 	xfs_mount_t		*mp,	/* mount point for filesystem */
7461da177e4SLinus Torvalds 	xfs_ino_t		*lastinop, /* inode to return */
7471da177e4SLinus Torvalds 	char			__user *buffer, /* buffer with inode stats */
748c41564b5SNathan Scott 	int			*done)	/* 1 if there are more stats to get */
7491da177e4SLinus Torvalds {
7501da177e4SLinus Torvalds 	int			count;	/* count value for bulkstat call */
7511da177e4SLinus Torvalds 	int			error;	/* return value */
7521da177e4SLinus Torvalds 	xfs_ino_t		ino;	/* filesystem inode number */
7531da177e4SLinus Torvalds 	int			res;	/* result from bs1 */
7541da177e4SLinus Torvalds 
7551da177e4SLinus Torvalds 	/*
7561da177e4SLinus Torvalds 	 * note that requesting valid inode numbers which are not allocated
7571da177e4SLinus Torvalds 	 * to inodes will most likely cause xfs_itobp to generate warning
7581da177e4SLinus Torvalds 	 * messages about bad magic numbers. This is ok. The fact that
7591da177e4SLinus Torvalds 	 * the inode isn't actually an inode is handled by the
7601da177e4SLinus Torvalds 	 * error check below. Done this way to make the usual case faster
7611da177e4SLinus Torvalds 	 * at the expense of the error case.
7621da177e4SLinus Torvalds 	 */
7631da177e4SLinus Torvalds 
7641da177e4SLinus Torvalds 	ino = (xfs_ino_t)*lastinop;
7651da177e4SLinus Torvalds 	error = xfs_bulkstat_one(mp, ino, buffer, sizeof(xfs_bstat_t),
7661da177e4SLinus Torvalds 				 NULL, 0, NULL, NULL, &res);
7671da177e4SLinus Torvalds 	if (error) {
7681da177e4SLinus Torvalds 		/*
7691da177e4SLinus Torvalds 		 * Special case way failed, do it the "long" way
7701da177e4SLinus Torvalds 		 * to see if that works.
7711da177e4SLinus Torvalds 		 */
7721da177e4SLinus Torvalds 		(*lastinop)--;
7731da177e4SLinus Torvalds 		count = 1;
7741da177e4SLinus Torvalds 		if (xfs_bulkstat(mp, lastinop, &count, xfs_bulkstat_one,
7751da177e4SLinus Torvalds 				NULL, sizeof(xfs_bstat_t), buffer,
7761da177e4SLinus Torvalds 				BULKSTAT_FG_IGET, done))
7771da177e4SLinus Torvalds 			return error;
7781da177e4SLinus Torvalds 		if (count == 0 || (xfs_ino_t)*lastinop != ino)
7791da177e4SLinus Torvalds 			return error == EFSCORRUPTED ?
7801da177e4SLinus Torvalds 				XFS_ERROR(EINVAL) : error;
7811da177e4SLinus Torvalds 		else
7821da177e4SLinus Torvalds 			return 0;
7831da177e4SLinus Torvalds 	}
7841da177e4SLinus Torvalds 	*done = 0;
7851da177e4SLinus Torvalds 	return 0;
7861da177e4SLinus Torvalds }
7871da177e4SLinus Torvalds 
788faa63e95SMichal Marek int
789faa63e95SMichal Marek xfs_inumbers_fmt(
790faa63e95SMichal Marek 	void			__user *ubuffer, /* buffer to write to */
791faa63e95SMichal Marek 	const xfs_inogrp_t	*buffer,	/* buffer to read from */
792faa63e95SMichal Marek 	long			count,		/* # of elements to read */
793faa63e95SMichal Marek 	long			*written)	/* # of bytes written */
794faa63e95SMichal Marek {
795faa63e95SMichal Marek 	if (copy_to_user(ubuffer, buffer, count * sizeof(*buffer)))
796faa63e95SMichal Marek 		return -EFAULT;
797faa63e95SMichal Marek 	*written = count * sizeof(*buffer);
798faa63e95SMichal Marek 	return 0;
799faa63e95SMichal Marek }
800faa63e95SMichal Marek 
8011da177e4SLinus Torvalds /*
8021da177e4SLinus Torvalds  * Return inode number table for the filesystem.
8031da177e4SLinus Torvalds  */
8041da177e4SLinus Torvalds int					/* error status */
8051da177e4SLinus Torvalds xfs_inumbers(
8061da177e4SLinus Torvalds 	xfs_mount_t	*mp,		/* mount point for filesystem */
8071da177e4SLinus Torvalds 	xfs_ino_t	*lastino,	/* last inode returned */
8081da177e4SLinus Torvalds 	int		*count,		/* size of buffer/count returned */
809faa63e95SMichal Marek 	void		__user *ubuffer,/* buffer with inode descriptions */
810faa63e95SMichal Marek 	inumbers_fmt_pf	formatter)
8111da177e4SLinus Torvalds {
8121da177e4SLinus Torvalds 	xfs_buf_t	*agbp;
8131da177e4SLinus Torvalds 	xfs_agino_t	agino;
8141da177e4SLinus Torvalds 	xfs_agnumber_t	agno;
8151da177e4SLinus Torvalds 	int		bcount;
8161da177e4SLinus Torvalds 	xfs_inogrp_t	*buffer;
8171da177e4SLinus Torvalds 	int		bufidx;
8181da177e4SLinus Torvalds 	xfs_btree_cur_t	*cur;
8191da177e4SLinus Torvalds 	int		error;
8201da177e4SLinus Torvalds 	__int32_t	gcnt;
8211da177e4SLinus Torvalds 	xfs_inofree_t	gfree;
8221da177e4SLinus Torvalds 	xfs_agino_t	gino;
8231da177e4SLinus Torvalds 	int		i;
8241da177e4SLinus Torvalds 	xfs_ino_t	ino;
8251da177e4SLinus Torvalds 	int		left;
8261da177e4SLinus Torvalds 	int		tmp;
8271da177e4SLinus Torvalds 
8281da177e4SLinus Torvalds 	ino = (xfs_ino_t)*lastino;
8291da177e4SLinus Torvalds 	agno = XFS_INO_TO_AGNO(mp, ino);
8301da177e4SLinus Torvalds 	agino = XFS_INO_TO_AGINO(mp, ino);
8311da177e4SLinus Torvalds 	left = *count;
8321da177e4SLinus Torvalds 	*count = 0;
8331da177e4SLinus Torvalds 	bcount = MIN(left, (int)(NBPP / sizeof(*buffer)));
8341da177e4SLinus Torvalds 	buffer = kmem_alloc(bcount * sizeof(*buffer), KM_SLEEP);
8351da177e4SLinus Torvalds 	error = bufidx = 0;
8361da177e4SLinus Torvalds 	cur = NULL;
8371da177e4SLinus Torvalds 	agbp = NULL;
8381da177e4SLinus Torvalds 	while (left > 0 && agno < mp->m_sb.sb_agcount) {
8391da177e4SLinus Torvalds 		if (agbp == NULL) {
8401da177e4SLinus Torvalds 			down_read(&mp->m_peraglock);
8411da177e4SLinus Torvalds 			error = xfs_ialloc_read_agi(mp, NULL, agno, &agbp);
8421da177e4SLinus Torvalds 			up_read(&mp->m_peraglock);
8431da177e4SLinus Torvalds 			if (error) {
8441da177e4SLinus Torvalds 				/*
8451da177e4SLinus Torvalds 				 * If we can't read the AGI of this ag,
8461da177e4SLinus Torvalds 				 * then just skip to the next one.
8471da177e4SLinus Torvalds 				 */
8481da177e4SLinus Torvalds 				ASSERT(cur == NULL);
8491da177e4SLinus Torvalds 				agbp = NULL;
8501da177e4SLinus Torvalds 				agno++;
8511da177e4SLinus Torvalds 				agino = 0;
8521da177e4SLinus Torvalds 				continue;
8531da177e4SLinus Torvalds 			}
8541da177e4SLinus Torvalds 			cur = xfs_btree_init_cursor(mp, NULL, agbp, agno,
8551da177e4SLinus Torvalds 				XFS_BTNUM_INO, (xfs_inode_t *)0, 0);
8561da177e4SLinus Torvalds 			error = xfs_inobt_lookup_ge(cur, agino, 0, 0, &tmp);
8571da177e4SLinus Torvalds 			if (error) {
8581da177e4SLinus Torvalds 				xfs_btree_del_cursor(cur, XFS_BTREE_ERROR);
8591da177e4SLinus Torvalds 				cur = NULL;
8601da177e4SLinus Torvalds 				xfs_buf_relse(agbp);
8611da177e4SLinus Torvalds 				agbp = NULL;
8621da177e4SLinus Torvalds 				/*
86359c51591SMichael Opdenacker 				 * Move up the last inode in the current
8641da177e4SLinus Torvalds 				 * chunk.  The lookup_ge will always get
8651da177e4SLinus Torvalds 				 * us the first inode in the next chunk.
8661da177e4SLinus Torvalds 				 */
8671da177e4SLinus Torvalds 				agino += XFS_INODES_PER_CHUNK - 1;
8681da177e4SLinus Torvalds 				continue;
8691da177e4SLinus Torvalds 			}
8701da177e4SLinus Torvalds 		}
8711da177e4SLinus Torvalds 		if ((error = xfs_inobt_get_rec(cur, &gino, &gcnt, &gfree,
8721da177e4SLinus Torvalds 			&i)) ||
8731da177e4SLinus Torvalds 		    i == 0) {
8741da177e4SLinus Torvalds 			xfs_buf_relse(agbp);
8751da177e4SLinus Torvalds 			agbp = NULL;
8761da177e4SLinus Torvalds 			xfs_btree_del_cursor(cur, XFS_BTREE_NOERROR);
8771da177e4SLinus Torvalds 			cur = NULL;
8781da177e4SLinus Torvalds 			agno++;
8791da177e4SLinus Torvalds 			agino = 0;
8801da177e4SLinus Torvalds 			continue;
8811da177e4SLinus Torvalds 		}
8821da177e4SLinus Torvalds 		agino = gino + XFS_INODES_PER_CHUNK - 1;
8831da177e4SLinus Torvalds 		buffer[bufidx].xi_startino = XFS_AGINO_TO_INO(mp, agno, gino);
8841da177e4SLinus Torvalds 		buffer[bufidx].xi_alloccount = XFS_INODES_PER_CHUNK - gcnt;
8851da177e4SLinus Torvalds 		buffer[bufidx].xi_allocmask = ~gfree;
8861da177e4SLinus Torvalds 		bufidx++;
8871da177e4SLinus Torvalds 		left--;
8881da177e4SLinus Torvalds 		if (bufidx == bcount) {
889faa63e95SMichal Marek 			long written;
890faa63e95SMichal Marek 			if (formatter(ubuffer, buffer, bufidx, &written)) {
8911da177e4SLinus Torvalds 				error = XFS_ERROR(EFAULT);
8921da177e4SLinus Torvalds 				break;
8931da177e4SLinus Torvalds 			}
894faa63e95SMichal Marek 			ubuffer += written;
8951da177e4SLinus Torvalds 			*count += bufidx;
8961da177e4SLinus Torvalds 			bufidx = 0;
8971da177e4SLinus Torvalds 		}
8981da177e4SLinus Torvalds 		if (left) {
8991da177e4SLinus Torvalds 			error = xfs_inobt_increment(cur, 0, &tmp);
9001da177e4SLinus Torvalds 			if (error) {
9011da177e4SLinus Torvalds 				xfs_btree_del_cursor(cur, XFS_BTREE_ERROR);
9021da177e4SLinus Torvalds 				cur = NULL;
9031da177e4SLinus Torvalds 				xfs_buf_relse(agbp);
9041da177e4SLinus Torvalds 				agbp = NULL;
9051da177e4SLinus Torvalds 				/*
9061da177e4SLinus Torvalds 				 * The agino value has already been bumped.
9071da177e4SLinus Torvalds 				 * Just try to skip up to it.
9081da177e4SLinus Torvalds 				 */
9091da177e4SLinus Torvalds 				agino += XFS_INODES_PER_CHUNK;
9101da177e4SLinus Torvalds 				continue;
9111da177e4SLinus Torvalds 			}
9121da177e4SLinus Torvalds 		}
9131da177e4SLinus Torvalds 	}
9141da177e4SLinus Torvalds 	if (!error) {
9151da177e4SLinus Torvalds 		if (bufidx) {
916faa63e95SMichal Marek 			long written;
917faa63e95SMichal Marek 			if (formatter(ubuffer, buffer, bufidx, &written))
9181da177e4SLinus Torvalds 				error = XFS_ERROR(EFAULT);
9191da177e4SLinus Torvalds 			else
9201da177e4SLinus Torvalds 				*count += bufidx;
9211da177e4SLinus Torvalds 		}
9221da177e4SLinus Torvalds 		*lastino = XFS_AGINO_TO_INO(mp, agno, agino);
9231da177e4SLinus Torvalds 	}
9241da177e4SLinus Torvalds 	kmem_free(buffer, bcount * sizeof(*buffer));
9251da177e4SLinus Torvalds 	if (cur)
9261da177e4SLinus Torvalds 		xfs_btree_del_cursor(cur, (error ? XFS_BTREE_ERROR :
9271da177e4SLinus Torvalds 					   XFS_BTREE_NOERROR));
9281da177e4SLinus Torvalds 	if (agbp)
9291da177e4SLinus Torvalds 		xfs_buf_relse(agbp);
9301da177e4SLinus Torvalds 	return error;
9311da177e4SLinus Torvalds }
932