xref: /openbmc/linux/fs/btrfs/tree-checker.c (revision c1bf973f57b7ca62e868c5bc7f3cbdf8ea8d5dc5)
1c1d7c514SDavid Sterba // SPDX-License-Identifier: GPL-2.0
2557ea5ddSQu Wenruo /*
3557ea5ddSQu Wenruo  * Copyright (C) Qu Wenruo 2017.  All rights reserved.
4557ea5ddSQu Wenruo  */
5557ea5ddSQu Wenruo 
/*
 * The module is used to catch unexpected/corrupted tree block data.
 * Such behavior can be caused either by a fuzzed image or bugs.
 *
 * The objective is to do leaf/node validation checks when tree block is read
 * from disk, and check *every* possible member, so other code won't
 * need to check them again.
 *
 * Due to the potential and unwanted damage, every checker needs to be
 * carefully reviewed, otherwise it may prevent mount of valid images.
 */
17557ea5ddSQu Wenruo 
1802529d7aSQu Wenruo #include <linux/types.h>
1902529d7aSQu Wenruo #include <linux/stddef.h>
2002529d7aSQu Wenruo #include <linux/error-injection.h>
219b569ea0SJosef Bacik #include "messages.h"
22557ea5ddSQu Wenruo #include "ctree.h"
23557ea5ddSQu Wenruo #include "tree-checker.h"
24557ea5ddSQu Wenruo #include "disk-io.h"
25557ea5ddSQu Wenruo #include "compression.h"
26fce466eaSQu Wenruo #include "volumes.h"
27c1499166SDavid Sterba #include "misc.h"
28c7f13d42SJosef Bacik #include "fs.h"
2907e81dc9SJosef Bacik #include "accessors.h"
306bfd0ffaSJosef Bacik #include "file-item.h"
31f541833cSJosef Bacik #include "inode-item.h"
32*c1bf973fSQu Wenruo #include "extent-tree.h"
33557ea5ddSQu Wenruo 
/*
 * Error message should follow the following format:
 * corrupt <type>: <identifier>, <reason>[, <bad_value>]
 *
 * @type:	leaf or node
 * @identifier:	the necessary info to locate the leaf/node.
 * 		It's recommended to decode key.objectid/offset if it's
 * 		meaningful.
 * @reason:	describe the error
 * @bad_value:	optional, it's recommended to output bad value and its
 *		expected value (range).
 *
 * Since comma is used to separate the components, only space is allowed
 * inside each component.
 */
49bba4f298SQu Wenruo 
50bba4f298SQu Wenruo /*
51bba4f298SQu Wenruo  * Append generic "corrupt leaf/node root=%llu block=%llu slot=%d: " to @fmt.
52bba4f298SQu Wenruo  * Allows callers to customize the output.
53bba4f298SQu Wenruo  */
5486a6be3aSDavid Sterba __printf(3, 4)
55e67c718bSDavid Sterba __cold
5686a6be3aSDavid Sterba static void generic_err(const struct extent_buffer *eb, int slot,
57bba4f298SQu Wenruo 			const char *fmt, ...)
58bba4f298SQu Wenruo {
5986a6be3aSDavid Sterba 	const struct btrfs_fs_info *fs_info = eb->fs_info;
60bba4f298SQu Wenruo 	struct va_format vaf;
61bba4f298SQu Wenruo 	va_list args;
62bba4f298SQu Wenruo 
63bba4f298SQu Wenruo 	va_start(args, fmt);
64bba4f298SQu Wenruo 
65bba4f298SQu Wenruo 	vaf.fmt = fmt;
66bba4f298SQu Wenruo 	vaf.va = &args;
67bba4f298SQu Wenruo 
682f659546SQu Wenruo 	btrfs_crit(fs_info,
69bba4f298SQu Wenruo 		"corrupt %s: root=%llu block=%llu slot=%d, %pV",
70bba4f298SQu Wenruo 		btrfs_header_level(eb) == 0 ? "leaf" : "node",
712f659546SQu Wenruo 		btrfs_header_owner(eb), btrfs_header_bytenr(eb), slot, &vaf);
72bba4f298SQu Wenruo 	va_end(args);
73bba4f298SQu Wenruo }
74bba4f298SQu Wenruo 
758806d718SQu Wenruo /*
768806d718SQu Wenruo  * Customized reporter for extent data item, since its key objectid and
778806d718SQu Wenruo  * offset has its own meaning.
788806d718SQu Wenruo  */
791fd715ffSDavid Sterba __printf(3, 4)
80e67c718bSDavid Sterba __cold
811fd715ffSDavid Sterba static void file_extent_err(const struct extent_buffer *eb, int slot,
828806d718SQu Wenruo 			    const char *fmt, ...)
838806d718SQu Wenruo {
841fd715ffSDavid Sterba 	const struct btrfs_fs_info *fs_info = eb->fs_info;
858806d718SQu Wenruo 	struct btrfs_key key;
868806d718SQu Wenruo 	struct va_format vaf;
878806d718SQu Wenruo 	va_list args;
888806d718SQu Wenruo 
898806d718SQu Wenruo 	btrfs_item_key_to_cpu(eb, &key, slot);
908806d718SQu Wenruo 	va_start(args, fmt);
918806d718SQu Wenruo 
928806d718SQu Wenruo 	vaf.fmt = fmt;
938806d718SQu Wenruo 	vaf.va = &args;
948806d718SQu Wenruo 
952f659546SQu Wenruo 	btrfs_crit(fs_info,
968806d718SQu Wenruo 	"corrupt %s: root=%llu block=%llu slot=%d ino=%llu file_offset=%llu, %pV",
972f659546SQu Wenruo 		btrfs_header_level(eb) == 0 ? "leaf" : "node",
982f659546SQu Wenruo 		btrfs_header_owner(eb), btrfs_header_bytenr(eb), slot,
992f659546SQu Wenruo 		key.objectid, key.offset, &vaf);
1008806d718SQu Wenruo 	va_end(args);
1018806d718SQu Wenruo }
1028806d718SQu Wenruo 
/*
 * Check the alignment of one member of a file extent item.
 *
 * Evaluates to 0 if btrfs_file_extent_##name is aligned to @alignment.
 * Otherwise the problem is reported through file_extent_err() and the macro
 * evaluates to 1.
 *
 * The member is read from @leaf only once and the alignment test is done only
 * once; the cached results are reused for the message and the final value.
 */
#define CHECK_FE_ALIGNED(leaf, slot, fi, name, alignment)		      \
({									      \
	const u64 __fe_val = btrfs_file_extent_##name((leaf), (fi));	      \
	const int __fe_unaligned = !IS_ALIGNED(__fe_val, (alignment));	      \
									      \
	if (unlikely(__fe_unaligned))					      \
		file_extent_err((leaf), (slot),				      \
	"invalid %s for file extent, have %llu, should be aligned to %u",     \
			(#name), __fe_val, (alignment));		      \
	__fe_unaligned;							      \
})
1178806d718SQu Wenruo 
1184e9845efSFilipe Manana static u64 file_extent_end(struct extent_buffer *leaf,
1194e9845efSFilipe Manana 			   struct btrfs_key *key,
1204e9845efSFilipe Manana 			   struct btrfs_file_extent_item *extent)
1214e9845efSFilipe Manana {
1224e9845efSFilipe Manana 	u64 end;
1234e9845efSFilipe Manana 	u64 len;
1244e9845efSFilipe Manana 
1254e9845efSFilipe Manana 	if (btrfs_file_extent_type(leaf, extent) == BTRFS_FILE_EXTENT_INLINE) {
1264e9845efSFilipe Manana 		len = btrfs_file_extent_ram_bytes(leaf, extent);
1274e9845efSFilipe Manana 		end = ALIGN(key->offset + len, leaf->fs_info->sectorsize);
1284e9845efSFilipe Manana 	} else {
1294e9845efSFilipe Manana 		len = btrfs_file_extent_num_bytes(leaf, extent);
1304e9845efSFilipe Manana 		end = key->offset + len;
1314e9845efSFilipe Manana 	}
1324e9845efSFilipe Manana 	return end;
1334e9845efSFilipe Manana }
1344e9845efSFilipe Manana 
13580d7fd1eSQu Wenruo /*
13680d7fd1eSQu Wenruo  * Customized report for dir_item, the only new important information is
13780d7fd1eSQu Wenruo  * key->objectid, which represents inode number
13880d7fd1eSQu Wenruo  */
13980d7fd1eSQu Wenruo __printf(3, 4)
14080d7fd1eSQu Wenruo __cold
14180d7fd1eSQu Wenruo static void dir_item_err(const struct extent_buffer *eb, int slot,
14280d7fd1eSQu Wenruo 			 const char *fmt, ...)
14380d7fd1eSQu Wenruo {
14480d7fd1eSQu Wenruo 	const struct btrfs_fs_info *fs_info = eb->fs_info;
14580d7fd1eSQu Wenruo 	struct btrfs_key key;
14680d7fd1eSQu Wenruo 	struct va_format vaf;
14780d7fd1eSQu Wenruo 	va_list args;
14880d7fd1eSQu Wenruo 
14980d7fd1eSQu Wenruo 	btrfs_item_key_to_cpu(eb, &key, slot);
15080d7fd1eSQu Wenruo 	va_start(args, fmt);
15180d7fd1eSQu Wenruo 
15280d7fd1eSQu Wenruo 	vaf.fmt = fmt;
15380d7fd1eSQu Wenruo 	vaf.va = &args;
15480d7fd1eSQu Wenruo 
15580d7fd1eSQu Wenruo 	btrfs_crit(fs_info,
15680d7fd1eSQu Wenruo 		"corrupt %s: root=%llu block=%llu slot=%d ino=%llu, %pV",
15780d7fd1eSQu Wenruo 		btrfs_header_level(eb) == 0 ? "leaf" : "node",
15880d7fd1eSQu Wenruo 		btrfs_header_owner(eb), btrfs_header_bytenr(eb), slot,
15980d7fd1eSQu Wenruo 		key.objectid, &vaf);
16080d7fd1eSQu Wenruo 	va_end(args);
16180d7fd1eSQu Wenruo }
16280d7fd1eSQu Wenruo 
16380d7fd1eSQu Wenruo /*
16480d7fd1eSQu Wenruo  * This functions checks prev_key->objectid, to ensure current key and prev_key
16580d7fd1eSQu Wenruo  * share the same objectid as inode number.
16680d7fd1eSQu Wenruo  *
16780d7fd1eSQu Wenruo  * This is to detect missing INODE_ITEM in subvolume trees.
16880d7fd1eSQu Wenruo  *
16980d7fd1eSQu Wenruo  * Return true if everything is OK or we don't need to check.
17080d7fd1eSQu Wenruo  * Return false if anything is wrong.
17180d7fd1eSQu Wenruo  */
17280d7fd1eSQu Wenruo static bool check_prev_ino(struct extent_buffer *leaf,
17380d7fd1eSQu Wenruo 			   struct btrfs_key *key, int slot,
17480d7fd1eSQu Wenruo 			   struct btrfs_key *prev_key)
17580d7fd1eSQu Wenruo {
17680d7fd1eSQu Wenruo 	/* No prev key, skip check */
17780d7fd1eSQu Wenruo 	if (slot == 0)
17880d7fd1eSQu Wenruo 		return true;
17980d7fd1eSQu Wenruo 
18080d7fd1eSQu Wenruo 	/* Only these key->types needs to be checked */
18180d7fd1eSQu Wenruo 	ASSERT(key->type == BTRFS_XATTR_ITEM_KEY ||
18280d7fd1eSQu Wenruo 	       key->type == BTRFS_INODE_REF_KEY ||
18380d7fd1eSQu Wenruo 	       key->type == BTRFS_DIR_INDEX_KEY ||
18480d7fd1eSQu Wenruo 	       key->type == BTRFS_DIR_ITEM_KEY ||
18580d7fd1eSQu Wenruo 	       key->type == BTRFS_EXTENT_DATA_KEY);
18680d7fd1eSQu Wenruo 
18780d7fd1eSQu Wenruo 	/*
18880d7fd1eSQu Wenruo 	 * Only subvolume trees along with their reloc trees need this check.
18980d7fd1eSQu Wenruo 	 * Things like log tree doesn't follow this ino requirement.
19080d7fd1eSQu Wenruo 	 */
19180d7fd1eSQu Wenruo 	if (!is_fstree(btrfs_header_owner(leaf)))
19280d7fd1eSQu Wenruo 		return true;
19380d7fd1eSQu Wenruo 
19480d7fd1eSQu Wenruo 	if (key->objectid == prev_key->objectid)
19580d7fd1eSQu Wenruo 		return true;
19680d7fd1eSQu Wenruo 
19780d7fd1eSQu Wenruo 	/* Error found */
19880d7fd1eSQu Wenruo 	dir_item_err(leaf, slot,
19980d7fd1eSQu Wenruo 		"invalid previous key objectid, have %llu expect %llu",
20080d7fd1eSQu Wenruo 		prev_key->objectid, key->objectid);
20180d7fd1eSQu Wenruo 	return false;
20280d7fd1eSQu Wenruo }
203ae2a19d8SDavid Sterba static int check_extent_data_item(struct extent_buffer *leaf,
2044e9845efSFilipe Manana 				  struct btrfs_key *key, int slot,
2054e9845efSFilipe Manana 				  struct btrfs_key *prev_key)
206557ea5ddSQu Wenruo {
207ae2a19d8SDavid Sterba 	struct btrfs_fs_info *fs_info = leaf->fs_info;
208557ea5ddSQu Wenruo 	struct btrfs_file_extent_item *fi;
2092f659546SQu Wenruo 	u32 sectorsize = fs_info->sectorsize;
2103212fa14SJosef Bacik 	u32 item_size = btrfs_item_size(leaf, slot);
2114c094c33SQu Wenruo 	u64 extent_end;
212557ea5ddSQu Wenruo 
213c7c01a4aSDavid Sterba 	if (unlikely(!IS_ALIGNED(key->offset, sectorsize))) {
2141fd715ffSDavid Sterba 		file_extent_err(leaf, slot,
2158806d718SQu Wenruo "unaligned file_offset for file extent, have %llu should be aligned to %u",
2168806d718SQu Wenruo 			key->offset, sectorsize);
217557ea5ddSQu Wenruo 		return -EUCLEAN;
218557ea5ddSQu Wenruo 	}
219557ea5ddSQu Wenruo 
220c18679ebSQu Wenruo 	/*
221c18679ebSQu Wenruo 	 * Previous key must have the same key->objectid (ino).
222c18679ebSQu Wenruo 	 * It can be XATTR_ITEM, INODE_ITEM or just another EXTENT_DATA.
223c18679ebSQu Wenruo 	 * But if objectids mismatch, it means we have a missing
224c18679ebSQu Wenruo 	 * INODE_ITEM.
225c18679ebSQu Wenruo 	 */
226c7c01a4aSDavid Sterba 	if (unlikely(!check_prev_ino(leaf, key, slot, prev_key)))
227c18679ebSQu Wenruo 		return -EUCLEAN;
228c18679ebSQu Wenruo 
229557ea5ddSQu Wenruo 	fi = btrfs_item_ptr(leaf, slot, struct btrfs_file_extent_item);
230557ea5ddSQu Wenruo 
231153a6d29SQu Wenruo 	/*
232153a6d29SQu Wenruo 	 * Make sure the item contains at least inline header, so the file
233153a6d29SQu Wenruo 	 * extent type is not some garbage.
234153a6d29SQu Wenruo 	 */
235c7c01a4aSDavid Sterba 	if (unlikely(item_size < BTRFS_FILE_EXTENT_INLINE_DATA_START)) {
236153a6d29SQu Wenruo 		file_extent_err(leaf, slot,
237994bf9cdSAndreas Färber 				"invalid item size, have %u expect [%zu, %u)",
238153a6d29SQu Wenruo 				item_size, BTRFS_FILE_EXTENT_INLINE_DATA_START,
239153a6d29SQu Wenruo 				SZ_4K);
240153a6d29SQu Wenruo 		return -EUCLEAN;
241153a6d29SQu Wenruo 	}
242c7c01a4aSDavid Sterba 	if (unlikely(btrfs_file_extent_type(leaf, fi) >=
243c7c01a4aSDavid Sterba 		     BTRFS_NR_FILE_EXTENT_TYPES)) {
2441fd715ffSDavid Sterba 		file_extent_err(leaf, slot,
2458806d718SQu Wenruo 		"invalid type for file extent, have %u expect range [0, %u]",
2468806d718SQu Wenruo 			btrfs_file_extent_type(leaf, fi),
247b9b1a53eSChengguang Xu 			BTRFS_NR_FILE_EXTENT_TYPES - 1);
248557ea5ddSQu Wenruo 		return -EUCLEAN;
249557ea5ddSQu Wenruo 	}
250557ea5ddSQu Wenruo 
251557ea5ddSQu Wenruo 	/*
25252042d8eSAndrea Gelmini 	 * Support for new compression/encryption must introduce incompat flag,
253557ea5ddSQu Wenruo 	 * and must be caught in open_ctree().
254557ea5ddSQu Wenruo 	 */
255c7c01a4aSDavid Sterba 	if (unlikely(btrfs_file_extent_compression(leaf, fi) >=
256c7c01a4aSDavid Sterba 		     BTRFS_NR_COMPRESS_TYPES)) {
2571fd715ffSDavid Sterba 		file_extent_err(leaf, slot,
2588806d718SQu Wenruo 	"invalid compression for file extent, have %u expect range [0, %u]",
2598806d718SQu Wenruo 			btrfs_file_extent_compression(leaf, fi),
260ce96b7ffSChengguang Xu 			BTRFS_NR_COMPRESS_TYPES - 1);
261557ea5ddSQu Wenruo 		return -EUCLEAN;
262557ea5ddSQu Wenruo 	}
263c7c01a4aSDavid Sterba 	if (unlikely(btrfs_file_extent_encryption(leaf, fi))) {
2641fd715ffSDavid Sterba 		file_extent_err(leaf, slot,
2658806d718SQu Wenruo 			"invalid encryption for file extent, have %u expect 0",
2668806d718SQu Wenruo 			btrfs_file_extent_encryption(leaf, fi));
267557ea5ddSQu Wenruo 		return -EUCLEAN;
268557ea5ddSQu Wenruo 	}
269557ea5ddSQu Wenruo 	if (btrfs_file_extent_type(leaf, fi) == BTRFS_FILE_EXTENT_INLINE) {
270557ea5ddSQu Wenruo 		/* Inline extent must have 0 as key offset */
271c7c01a4aSDavid Sterba 		if (unlikely(key->offset)) {
2721fd715ffSDavid Sterba 			file_extent_err(leaf, slot,
2738806d718SQu Wenruo 		"invalid file_offset for inline file extent, have %llu expect 0",
2748806d718SQu Wenruo 				key->offset);
275557ea5ddSQu Wenruo 			return -EUCLEAN;
276557ea5ddSQu Wenruo 		}
277557ea5ddSQu Wenruo 
278557ea5ddSQu Wenruo 		/* Compressed inline extent has no on-disk size, skip it */
279557ea5ddSQu Wenruo 		if (btrfs_file_extent_compression(leaf, fi) !=
280557ea5ddSQu Wenruo 		    BTRFS_COMPRESS_NONE)
281557ea5ddSQu Wenruo 			return 0;
282557ea5ddSQu Wenruo 
283557ea5ddSQu Wenruo 		/* Uncompressed inline extent size must match item size */
284c7c01a4aSDavid Sterba 		if (unlikely(item_size != BTRFS_FILE_EXTENT_INLINE_DATA_START +
285c7c01a4aSDavid Sterba 					  btrfs_file_extent_ram_bytes(leaf, fi))) {
2861fd715ffSDavid Sterba 			file_extent_err(leaf, slot,
2878806d718SQu Wenruo 	"invalid ram_bytes for uncompressed inline extent, have %u expect %llu",
2888806d718SQu Wenruo 				item_size, BTRFS_FILE_EXTENT_INLINE_DATA_START +
2898806d718SQu Wenruo 				btrfs_file_extent_ram_bytes(leaf, fi));
290557ea5ddSQu Wenruo 			return -EUCLEAN;
291557ea5ddSQu Wenruo 		}
292557ea5ddSQu Wenruo 		return 0;
293557ea5ddSQu Wenruo 	}
294557ea5ddSQu Wenruo 
295557ea5ddSQu Wenruo 	/* Regular or preallocated extent has fixed item size */
296c7c01a4aSDavid Sterba 	if (unlikely(item_size != sizeof(*fi))) {
2971fd715ffSDavid Sterba 		file_extent_err(leaf, slot,
298709a95c3SArnd Bergmann 	"invalid item size for reg/prealloc file extent, have %u expect %zu",
2998806d718SQu Wenruo 			item_size, sizeof(*fi));
300557ea5ddSQu Wenruo 		return -EUCLEAN;
301557ea5ddSQu Wenruo 	}
302c7c01a4aSDavid Sterba 	if (unlikely(CHECK_FE_ALIGNED(leaf, slot, fi, ram_bytes, sectorsize) ||
303033774dcSDavid Sterba 		     CHECK_FE_ALIGNED(leaf, slot, fi, disk_bytenr, sectorsize) ||
304033774dcSDavid Sterba 		     CHECK_FE_ALIGNED(leaf, slot, fi, disk_num_bytes, sectorsize) ||
305033774dcSDavid Sterba 		     CHECK_FE_ALIGNED(leaf, slot, fi, offset, sectorsize) ||
306c7c01a4aSDavid Sterba 		     CHECK_FE_ALIGNED(leaf, slot, fi, num_bytes, sectorsize)))
307557ea5ddSQu Wenruo 		return -EUCLEAN;
3084e9845efSFilipe Manana 
3094c094c33SQu Wenruo 	/* Catch extent end overflow */
310c7c01a4aSDavid Sterba 	if (unlikely(check_add_overflow(btrfs_file_extent_num_bytes(leaf, fi),
311c7c01a4aSDavid Sterba 					key->offset, &extent_end))) {
3124c094c33SQu Wenruo 		file_extent_err(leaf, slot,
3134c094c33SQu Wenruo 	"extent end overflow, have file offset %llu extent num bytes %llu",
3144c094c33SQu Wenruo 				key->offset,
3154c094c33SQu Wenruo 				btrfs_file_extent_num_bytes(leaf, fi));
3164c094c33SQu Wenruo 		return -EUCLEAN;
3174c094c33SQu Wenruo 	}
3184c094c33SQu Wenruo 
3194e9845efSFilipe Manana 	/*
3204e9845efSFilipe Manana 	 * Check that no two consecutive file extent items, in the same leaf,
3214e9845efSFilipe Manana 	 * present ranges that overlap each other.
3224e9845efSFilipe Manana 	 */
3234e9845efSFilipe Manana 	if (slot > 0 &&
3244e9845efSFilipe Manana 	    prev_key->objectid == key->objectid &&
3254e9845efSFilipe Manana 	    prev_key->type == BTRFS_EXTENT_DATA_KEY) {
3264e9845efSFilipe Manana 		struct btrfs_file_extent_item *prev_fi;
3274e9845efSFilipe Manana 		u64 prev_end;
3284e9845efSFilipe Manana 
3294e9845efSFilipe Manana 		prev_fi = btrfs_item_ptr(leaf, slot - 1,
3304e9845efSFilipe Manana 					 struct btrfs_file_extent_item);
3314e9845efSFilipe Manana 		prev_end = file_extent_end(leaf, prev_key, prev_fi);
332c7c01a4aSDavid Sterba 		if (unlikely(prev_end > key->offset)) {
3334e9845efSFilipe Manana 			file_extent_err(leaf, slot - 1,
3344e9845efSFilipe Manana "file extent end range (%llu) goes beyond start offset (%llu) of the next file extent",
3354e9845efSFilipe Manana 					prev_end, key->offset);
3364e9845efSFilipe Manana 			return -EUCLEAN;
3374e9845efSFilipe Manana 		}
3384e9845efSFilipe Manana 	}
3394e9845efSFilipe Manana 
340557ea5ddSQu Wenruo 	return 0;
341557ea5ddSQu Wenruo }
342557ea5ddSQu Wenruo 
34368128ce7SDavid Sterba static int check_csum_item(struct extent_buffer *leaf, struct btrfs_key *key,
344ad1d8c43SFilipe Manana 			   int slot, struct btrfs_key *prev_key)
345557ea5ddSQu Wenruo {
34668128ce7SDavid Sterba 	struct btrfs_fs_info *fs_info = leaf->fs_info;
3472f659546SQu Wenruo 	u32 sectorsize = fs_info->sectorsize;
348223486c2SDavid Sterba 	const u32 csumsize = fs_info->csum_size;
349557ea5ddSQu Wenruo 
350c7c01a4aSDavid Sterba 	if (unlikely(key->objectid != BTRFS_EXTENT_CSUM_OBJECTID)) {
35186a6be3aSDavid Sterba 		generic_err(leaf, slot,
352d508c5f0SQu Wenruo 		"invalid key objectid for csum item, have %llu expect %llu",
353d508c5f0SQu Wenruo 			key->objectid, BTRFS_EXTENT_CSUM_OBJECTID);
354557ea5ddSQu Wenruo 		return -EUCLEAN;
355557ea5ddSQu Wenruo 	}
356c7c01a4aSDavid Sterba 	if (unlikely(!IS_ALIGNED(key->offset, sectorsize))) {
35786a6be3aSDavid Sterba 		generic_err(leaf, slot,
358d508c5f0SQu Wenruo 	"unaligned key offset for csum item, have %llu should be aligned to %u",
359d508c5f0SQu Wenruo 			key->offset, sectorsize);
360557ea5ddSQu Wenruo 		return -EUCLEAN;
361557ea5ddSQu Wenruo 	}
3623212fa14SJosef Bacik 	if (unlikely(!IS_ALIGNED(btrfs_item_size(leaf, slot), csumsize))) {
36386a6be3aSDavid Sterba 		generic_err(leaf, slot,
364d508c5f0SQu Wenruo 	"unaligned item size for csum item, have %u should be aligned to %u",
3653212fa14SJosef Bacik 			btrfs_item_size(leaf, slot), csumsize);
366557ea5ddSQu Wenruo 		return -EUCLEAN;
367557ea5ddSQu Wenruo 	}
368ad1d8c43SFilipe Manana 	if (slot > 0 && prev_key->type == BTRFS_EXTENT_CSUM_KEY) {
369ad1d8c43SFilipe Manana 		u64 prev_csum_end;
370ad1d8c43SFilipe Manana 		u32 prev_item_size;
371ad1d8c43SFilipe Manana 
3723212fa14SJosef Bacik 		prev_item_size = btrfs_item_size(leaf, slot - 1);
373ad1d8c43SFilipe Manana 		prev_csum_end = (prev_item_size / csumsize) * sectorsize;
374ad1d8c43SFilipe Manana 		prev_csum_end += prev_key->offset;
375c7c01a4aSDavid Sterba 		if (unlikely(prev_csum_end > key->offset)) {
376ad1d8c43SFilipe Manana 			generic_err(leaf, slot - 1,
377ad1d8c43SFilipe Manana "csum end range (%llu) goes beyond the start range (%llu) of the next csum item",
378ad1d8c43SFilipe Manana 				    prev_csum_end, key->offset);
379ad1d8c43SFilipe Manana 			return -EUCLEAN;
380ad1d8c43SFilipe Manana 		}
381ad1d8c43SFilipe Manana 	}
382557ea5ddSQu Wenruo 	return 0;
383557ea5ddSQu Wenruo }
384557ea5ddSQu Wenruo 
385c23c77b0SQu Wenruo /* Inode item error output has the same format as dir_item_err() */
386c23c77b0SQu Wenruo #define inode_item_err(eb, slot, fmt, ...)			\
387c23c77b0SQu Wenruo 	dir_item_err(eb, slot, fmt, __VA_ARGS__)
388c23c77b0SQu Wenruo 
389c23c77b0SQu Wenruo static int check_inode_key(struct extent_buffer *leaf, struct btrfs_key *key,
390c23c77b0SQu Wenruo 			   int slot)
391c23c77b0SQu Wenruo {
392c23c77b0SQu Wenruo 	struct btrfs_key item_key;
393c23c77b0SQu Wenruo 	bool is_inode_item;
394c23c77b0SQu Wenruo 
395c23c77b0SQu Wenruo 	btrfs_item_key_to_cpu(leaf, &item_key, slot);
396c23c77b0SQu Wenruo 	is_inode_item = (item_key.type == BTRFS_INODE_ITEM_KEY);
397c23c77b0SQu Wenruo 
398c23c77b0SQu Wenruo 	/* For XATTR_ITEM, location key should be all 0 */
399c23c77b0SQu Wenruo 	if (item_key.type == BTRFS_XATTR_ITEM_KEY) {
400c7c01a4aSDavid Sterba 		if (unlikely(key->objectid != 0 || key->type != 0 ||
401c7c01a4aSDavid Sterba 			     key->offset != 0))
402c23c77b0SQu Wenruo 			return -EUCLEAN;
403c23c77b0SQu Wenruo 		return 0;
404c23c77b0SQu Wenruo 	}
405c23c77b0SQu Wenruo 
406c7c01a4aSDavid Sterba 	if (unlikely((key->objectid < BTRFS_FIRST_FREE_OBJECTID ||
407c23c77b0SQu Wenruo 		      key->objectid > BTRFS_LAST_FREE_OBJECTID) &&
408c23c77b0SQu Wenruo 		     key->objectid != BTRFS_ROOT_TREE_DIR_OBJECTID &&
409c7c01a4aSDavid Sterba 		     key->objectid != BTRFS_FREE_INO_OBJECTID)) {
410c23c77b0SQu Wenruo 		if (is_inode_item) {
411c23c77b0SQu Wenruo 			generic_err(leaf, slot,
412c23c77b0SQu Wenruo 	"invalid key objectid: has %llu expect %llu or [%llu, %llu] or %llu",
413c23c77b0SQu Wenruo 				key->objectid, BTRFS_ROOT_TREE_DIR_OBJECTID,
414c23c77b0SQu Wenruo 				BTRFS_FIRST_FREE_OBJECTID,
415c23c77b0SQu Wenruo 				BTRFS_LAST_FREE_OBJECTID,
416c23c77b0SQu Wenruo 				BTRFS_FREE_INO_OBJECTID);
417c23c77b0SQu Wenruo 		} else {
418c23c77b0SQu Wenruo 			dir_item_err(leaf, slot,
419c23c77b0SQu Wenruo "invalid location key objectid: has %llu expect %llu or [%llu, %llu] or %llu",
420c23c77b0SQu Wenruo 				key->objectid, BTRFS_ROOT_TREE_DIR_OBJECTID,
421c23c77b0SQu Wenruo 				BTRFS_FIRST_FREE_OBJECTID,
422c23c77b0SQu Wenruo 				BTRFS_LAST_FREE_OBJECTID,
423c23c77b0SQu Wenruo 				BTRFS_FREE_INO_OBJECTID);
424c23c77b0SQu Wenruo 		}
425c23c77b0SQu Wenruo 		return -EUCLEAN;
426c23c77b0SQu Wenruo 	}
427c7c01a4aSDavid Sterba 	if (unlikely(key->offset != 0)) {
428c23c77b0SQu Wenruo 		if (is_inode_item)
429c23c77b0SQu Wenruo 			inode_item_err(leaf, slot,
430c23c77b0SQu Wenruo 				       "invalid key offset: has %llu expect 0",
431c23c77b0SQu Wenruo 				       key->offset);
432c23c77b0SQu Wenruo 		else
433c23c77b0SQu Wenruo 			dir_item_err(leaf, slot,
434c23c77b0SQu Wenruo 				"invalid location key offset:has %llu expect 0",
435c23c77b0SQu Wenruo 				key->offset);
436c23c77b0SQu Wenruo 		return -EUCLEAN;
437c23c77b0SQu Wenruo 	}
438c23c77b0SQu Wenruo 	return 0;
439c23c77b0SQu Wenruo }
440c23c77b0SQu Wenruo 
44157a0e674SQu Wenruo static int check_root_key(struct extent_buffer *leaf, struct btrfs_key *key,
44257a0e674SQu Wenruo 			  int slot)
44357a0e674SQu Wenruo {
44457a0e674SQu Wenruo 	struct btrfs_key item_key;
44557a0e674SQu Wenruo 	bool is_root_item;
44657a0e674SQu Wenruo 
44757a0e674SQu Wenruo 	btrfs_item_key_to_cpu(leaf, &item_key, slot);
44857a0e674SQu Wenruo 	is_root_item = (item_key.type == BTRFS_ROOT_ITEM_KEY);
44957a0e674SQu Wenruo 
4506ebcd021SQu Wenruo 	/*
4516ebcd021SQu Wenruo 	 * Bad rootid for reloc trees.
4526ebcd021SQu Wenruo 	 *
4536ebcd021SQu Wenruo 	 * Reloc trees are only for subvolume trees, other trees only need
4546ebcd021SQu Wenruo 	 * to be COWed to be relocated.
4556ebcd021SQu Wenruo 	 */
4566ebcd021SQu Wenruo 	if (unlikely(is_root_item && key->objectid == BTRFS_TREE_RELOC_OBJECTID &&
4576ebcd021SQu Wenruo 		     !is_fstree(key->offset))) {
4586ebcd021SQu Wenruo 		generic_err(leaf, slot,
4596ebcd021SQu Wenruo 		"invalid reloc tree for root %lld, root id is not a subvolume tree",
4606ebcd021SQu Wenruo 			    key->offset);
4616ebcd021SQu Wenruo 		return -EUCLEAN;
4626ebcd021SQu Wenruo 	}
4636ebcd021SQu Wenruo 
46457a0e674SQu Wenruo 	/* No such tree id */
465c7c01a4aSDavid Sterba 	if (unlikely(key->objectid == 0)) {
46657a0e674SQu Wenruo 		if (is_root_item)
46757a0e674SQu Wenruo 			generic_err(leaf, slot, "invalid root id 0");
46857a0e674SQu Wenruo 		else
46957a0e674SQu Wenruo 			dir_item_err(leaf, slot,
47057a0e674SQu Wenruo 				     "invalid location key root id 0");
47157a0e674SQu Wenruo 		return -EUCLEAN;
47257a0e674SQu Wenruo 	}
47357a0e674SQu Wenruo 
47457a0e674SQu Wenruo 	/* DIR_ITEM/INDEX/INODE_REF is not allowed to point to non-fs trees */
475c7c01a4aSDavid Sterba 	if (unlikely(!is_fstree(key->objectid) && !is_root_item)) {
47657a0e674SQu Wenruo 		dir_item_err(leaf, slot,
47757a0e674SQu Wenruo 		"invalid location key objectid, have %llu expect [%llu, %llu]",
47857a0e674SQu Wenruo 				key->objectid, BTRFS_FIRST_FREE_OBJECTID,
47957a0e674SQu Wenruo 				BTRFS_LAST_FREE_OBJECTID);
48057a0e674SQu Wenruo 		return -EUCLEAN;
48157a0e674SQu Wenruo 	}
48257a0e674SQu Wenruo 
48357a0e674SQu Wenruo 	/*
48457a0e674SQu Wenruo 	 * ROOT_ITEM with non-zero offset means this is a snapshot, created at
48557a0e674SQu Wenruo 	 * @offset transid.
48657a0e674SQu Wenruo 	 * Furthermore, for location key in DIR_ITEM, its offset is always -1.
48757a0e674SQu Wenruo 	 *
48857a0e674SQu Wenruo 	 * So here we only check offset for reloc tree whose key->offset must
48957a0e674SQu Wenruo 	 * be a valid tree.
49057a0e674SQu Wenruo 	 */
491c7c01a4aSDavid Sterba 	if (unlikely(key->objectid == BTRFS_TREE_RELOC_OBJECTID &&
492c7c01a4aSDavid Sterba 		     key->offset == 0)) {
49357a0e674SQu Wenruo 		generic_err(leaf, slot, "invalid root id 0 for reloc tree");
49457a0e674SQu Wenruo 		return -EUCLEAN;
49557a0e674SQu Wenruo 	}
49657a0e674SQu Wenruo 	return 0;
49757a0e674SQu Wenruo }
49857a0e674SQu Wenruo 
499ce4252c0SDavid Sterba static int check_dir_item(struct extent_buffer *leaf,
500c18679ebSQu Wenruo 			  struct btrfs_key *key, struct btrfs_key *prev_key,
501c18679ebSQu Wenruo 			  int slot)
502ad7b0368SQu Wenruo {
503ce4252c0SDavid Sterba 	struct btrfs_fs_info *fs_info = leaf->fs_info;
504ad7b0368SQu Wenruo 	struct btrfs_dir_item *di;
5053212fa14SJosef Bacik 	u32 item_size = btrfs_item_size(leaf, slot);
506ad7b0368SQu Wenruo 	u32 cur = 0;
507ad7b0368SQu Wenruo 
508c7c01a4aSDavid Sterba 	if (unlikely(!check_prev_ino(leaf, key, slot, prev_key)))
509c18679ebSQu Wenruo 		return -EUCLEAN;
510c7c01a4aSDavid Sterba 
511ad7b0368SQu Wenruo 	di = btrfs_item_ptr(leaf, slot, struct btrfs_dir_item);
512ad7b0368SQu Wenruo 	while (cur < item_size) {
513147a097cSQu Wenruo 		struct btrfs_key location_key;
514ad7b0368SQu Wenruo 		u32 name_len;
515ad7b0368SQu Wenruo 		u32 data_len;
516ad7b0368SQu Wenruo 		u32 max_name_len;
517ad7b0368SQu Wenruo 		u32 total_size;
518ad7b0368SQu Wenruo 		u32 name_hash;
519ad7b0368SQu Wenruo 		u8 dir_type;
520147a097cSQu Wenruo 		int ret;
521ad7b0368SQu Wenruo 
522ad7b0368SQu Wenruo 		/* header itself should not cross item boundary */
523c7c01a4aSDavid Sterba 		if (unlikely(cur + sizeof(*di) > item_size)) {
524d98ced68SDavid Sterba 			dir_item_err(leaf, slot,
5257cfad652SArnd Bergmann 		"dir item header crosses item boundary, have %zu boundary %u",
526ad7b0368SQu Wenruo 				cur + sizeof(*di), item_size);
527ad7b0368SQu Wenruo 			return -EUCLEAN;
528ad7b0368SQu Wenruo 		}
529ad7b0368SQu Wenruo 
530147a097cSQu Wenruo 		/* Location key check */
531147a097cSQu Wenruo 		btrfs_dir_item_key_to_cpu(leaf, di, &location_key);
532147a097cSQu Wenruo 		if (location_key.type == BTRFS_ROOT_ITEM_KEY) {
533147a097cSQu Wenruo 			ret = check_root_key(leaf, &location_key, slot);
534c7c01a4aSDavid Sterba 			if (unlikely(ret < 0))
535147a097cSQu Wenruo 				return ret;
536147a097cSQu Wenruo 		} else if (location_key.type == BTRFS_INODE_ITEM_KEY ||
537147a097cSQu Wenruo 			   location_key.type == 0) {
538147a097cSQu Wenruo 			ret = check_inode_key(leaf, &location_key, slot);
539c7c01a4aSDavid Sterba 			if (unlikely(ret < 0))
540147a097cSQu Wenruo 				return ret;
541147a097cSQu Wenruo 		} else {
542147a097cSQu Wenruo 			dir_item_err(leaf, slot,
543147a097cSQu Wenruo 			"invalid location key type, have %u, expect %u or %u",
544147a097cSQu Wenruo 				     location_key.type, BTRFS_ROOT_ITEM_KEY,
545147a097cSQu Wenruo 				     BTRFS_INODE_ITEM_KEY);
546147a097cSQu Wenruo 			return -EUCLEAN;
547147a097cSQu Wenruo 		}
548147a097cSQu Wenruo 
549ad7b0368SQu Wenruo 		/* dir type check */
55094a48aefSOmar Sandoval 		dir_type = btrfs_dir_ftype(leaf, di);
551c7c01a4aSDavid Sterba 		if (unlikely(dir_type >= BTRFS_FT_MAX)) {
552d98ced68SDavid Sterba 			dir_item_err(leaf, slot,
553ad7b0368SQu Wenruo 			"invalid dir item type, have %u expect [0, %u)",
554ad7b0368SQu Wenruo 				dir_type, BTRFS_FT_MAX);
555ad7b0368SQu Wenruo 			return -EUCLEAN;
556ad7b0368SQu Wenruo 		}
557ad7b0368SQu Wenruo 
558c7c01a4aSDavid Sterba 		if (unlikely(key->type == BTRFS_XATTR_ITEM_KEY &&
559c7c01a4aSDavid Sterba 			     dir_type != BTRFS_FT_XATTR)) {
560d98ced68SDavid Sterba 			dir_item_err(leaf, slot,
561ad7b0368SQu Wenruo 		"invalid dir item type for XATTR key, have %u expect %u",
562ad7b0368SQu Wenruo 				dir_type, BTRFS_FT_XATTR);
563ad7b0368SQu Wenruo 			return -EUCLEAN;
564ad7b0368SQu Wenruo 		}
565c7c01a4aSDavid Sterba 		if (unlikely(dir_type == BTRFS_FT_XATTR &&
566c7c01a4aSDavid Sterba 			     key->type != BTRFS_XATTR_ITEM_KEY)) {
567d98ced68SDavid Sterba 			dir_item_err(leaf, slot,
568ad7b0368SQu Wenruo 			"xattr dir type found for non-XATTR key");
569ad7b0368SQu Wenruo 			return -EUCLEAN;
570ad7b0368SQu Wenruo 		}
571ad7b0368SQu Wenruo 		if (dir_type == BTRFS_FT_XATTR)
572ad7b0368SQu Wenruo 			max_name_len = XATTR_NAME_MAX;
573ad7b0368SQu Wenruo 		else
574ad7b0368SQu Wenruo 			max_name_len = BTRFS_NAME_LEN;
575ad7b0368SQu Wenruo 
576ad7b0368SQu Wenruo 		/* Name/data length check */
577ad7b0368SQu Wenruo 		name_len = btrfs_dir_name_len(leaf, di);
578ad7b0368SQu Wenruo 		data_len = btrfs_dir_data_len(leaf, di);
579c7c01a4aSDavid Sterba 		if (unlikely(name_len > max_name_len)) {
580d98ced68SDavid Sterba 			dir_item_err(leaf, slot,
581ad7b0368SQu Wenruo 			"dir item name len too long, have %u max %u",
582ad7b0368SQu Wenruo 				name_len, max_name_len);
583ad7b0368SQu Wenruo 			return -EUCLEAN;
584ad7b0368SQu Wenruo 		}
585c7c01a4aSDavid Sterba 		if (unlikely(name_len + data_len > BTRFS_MAX_XATTR_SIZE(fs_info))) {
586d98ced68SDavid Sterba 			dir_item_err(leaf, slot,
587ad7b0368SQu Wenruo 			"dir item name and data len too long, have %u max %u",
588ad7b0368SQu Wenruo 				name_len + data_len,
5892f659546SQu Wenruo 				BTRFS_MAX_XATTR_SIZE(fs_info));
590ad7b0368SQu Wenruo 			return -EUCLEAN;
591ad7b0368SQu Wenruo 		}
592ad7b0368SQu Wenruo 
593c7c01a4aSDavid Sterba 		if (unlikely(data_len && dir_type != BTRFS_FT_XATTR)) {
594d98ced68SDavid Sterba 			dir_item_err(leaf, slot,
595ad7b0368SQu Wenruo 			"dir item with invalid data len, have %u expect 0",
596ad7b0368SQu Wenruo 				data_len);
597ad7b0368SQu Wenruo 			return -EUCLEAN;
598ad7b0368SQu Wenruo 		}
599ad7b0368SQu Wenruo 
600ad7b0368SQu Wenruo 		total_size = sizeof(*di) + name_len + data_len;
601ad7b0368SQu Wenruo 
602ad7b0368SQu Wenruo 		/* header and name/data should not cross item boundary */
603c7c01a4aSDavid Sterba 		if (unlikely(cur + total_size > item_size)) {
604d98ced68SDavid Sterba 			dir_item_err(leaf, slot,
605ad7b0368SQu Wenruo 		"dir item data crosses item boundary, have %u boundary %u",
606ad7b0368SQu Wenruo 				cur + total_size, item_size);
607ad7b0368SQu Wenruo 			return -EUCLEAN;
608ad7b0368SQu Wenruo 		}
609ad7b0368SQu Wenruo 
610ad7b0368SQu Wenruo 		/*
611ad7b0368SQu Wenruo 		 * Special check for XATTR/DIR_ITEM, as key->offset is name
612ad7b0368SQu Wenruo 		 * hash, should match its name
613ad7b0368SQu Wenruo 		 */
614ad7b0368SQu Wenruo 		if (key->type == BTRFS_DIR_ITEM_KEY ||
615ad7b0368SQu Wenruo 		    key->type == BTRFS_XATTR_ITEM_KEY) {
616e2683fc9SDavid Sterba 			char namebuf[max(BTRFS_NAME_LEN, XATTR_NAME_MAX)];
617e2683fc9SDavid Sterba 
618ad7b0368SQu Wenruo 			read_extent_buffer(leaf, namebuf,
619ad7b0368SQu Wenruo 					(unsigned long)(di + 1), name_len);
620ad7b0368SQu Wenruo 			name_hash = btrfs_name_hash(namebuf, name_len);
621c7c01a4aSDavid Sterba 			if (unlikely(key->offset != name_hash)) {
622d98ced68SDavid Sterba 				dir_item_err(leaf, slot,
623ad7b0368SQu Wenruo 		"name hash mismatch with key, have 0x%016x expect 0x%016llx",
624ad7b0368SQu Wenruo 					name_hash, key->offset);
625ad7b0368SQu Wenruo 				return -EUCLEAN;
626ad7b0368SQu Wenruo 			}
627ad7b0368SQu Wenruo 		}
628ad7b0368SQu Wenruo 		cur += total_size;
629ad7b0368SQu Wenruo 		di = (struct btrfs_dir_item *)((void *)di + total_size);
630ad7b0368SQu Wenruo 	}
631ad7b0368SQu Wenruo 	return 0;
632ad7b0368SQu Wenruo }
633ad7b0368SQu Wenruo 
6344806bd88SDavid Sterba __printf(3, 4)
635fce466eaSQu Wenruo __cold
6364806bd88SDavid Sterba static void block_group_err(const struct extent_buffer *eb, int slot,
637fce466eaSQu Wenruo 			    const char *fmt, ...)
638fce466eaSQu Wenruo {
6394806bd88SDavid Sterba 	const struct btrfs_fs_info *fs_info = eb->fs_info;
640fce466eaSQu Wenruo 	struct btrfs_key key;
641fce466eaSQu Wenruo 	struct va_format vaf;
642fce466eaSQu Wenruo 	va_list args;
643fce466eaSQu Wenruo 
644fce466eaSQu Wenruo 	btrfs_item_key_to_cpu(eb, &key, slot);
645fce466eaSQu Wenruo 	va_start(args, fmt);
646fce466eaSQu Wenruo 
647fce466eaSQu Wenruo 	vaf.fmt = fmt;
648fce466eaSQu Wenruo 	vaf.va = &args;
649fce466eaSQu Wenruo 
650fce466eaSQu Wenruo 	btrfs_crit(fs_info,
651fce466eaSQu Wenruo 	"corrupt %s: root=%llu block=%llu slot=%d bg_start=%llu bg_len=%llu, %pV",
652fce466eaSQu Wenruo 		btrfs_header_level(eb) == 0 ? "leaf" : "node",
653fce466eaSQu Wenruo 		btrfs_header_owner(eb), btrfs_header_bytenr(eb), slot,
654fce466eaSQu Wenruo 		key.objectid, key.offset, &vaf);
655fce466eaSQu Wenruo 	va_end(args);
656fce466eaSQu Wenruo }
657fce466eaSQu Wenruo 
658af60ce2bSDavid Sterba static int check_block_group_item(struct extent_buffer *leaf,
659fce466eaSQu Wenruo 				  struct btrfs_key *key, int slot)
660fce466eaSQu Wenruo {
661f7238e50SJosef Bacik 	struct btrfs_fs_info *fs_info = leaf->fs_info;
662fce466eaSQu Wenruo 	struct btrfs_block_group_item bgi;
6633212fa14SJosef Bacik 	u32 item_size = btrfs_item_size(leaf, slot);
664f7238e50SJosef Bacik 	u64 chunk_objectid;
665fce466eaSQu Wenruo 	u64 flags;
666fce466eaSQu Wenruo 	u64 type;
667fce466eaSQu Wenruo 
668fce466eaSQu Wenruo 	/*
669fce466eaSQu Wenruo 	 * Here we don't really care about alignment since extent allocator can
67010950929SQu Wenruo 	 * handle it.  We care more about the size.
671fce466eaSQu Wenruo 	 */
672c7c01a4aSDavid Sterba 	if (unlikely(key->offset == 0)) {
6734806bd88SDavid Sterba 		block_group_err(leaf, slot,
67410950929SQu Wenruo 				"invalid block group size 0");
675fce466eaSQu Wenruo 		return -EUCLEAN;
676fce466eaSQu Wenruo 	}
677fce466eaSQu Wenruo 
678c7c01a4aSDavid Sterba 	if (unlikely(item_size != sizeof(bgi))) {
6794806bd88SDavid Sterba 		block_group_err(leaf, slot,
680fce466eaSQu Wenruo 			"invalid item size, have %u expect %zu",
681fce466eaSQu Wenruo 				item_size, sizeof(bgi));
682fce466eaSQu Wenruo 		return -EUCLEAN;
683fce466eaSQu Wenruo 	}
684fce466eaSQu Wenruo 
685fce466eaSQu Wenruo 	read_extent_buffer(leaf, &bgi, btrfs_item_ptr_offset(leaf, slot),
686fce466eaSQu Wenruo 			   sizeof(bgi));
687f7238e50SJosef Bacik 	chunk_objectid = btrfs_stack_block_group_chunk_objectid(&bgi);
688f7238e50SJosef Bacik 	if (btrfs_fs_incompat(fs_info, EXTENT_TREE_V2)) {
689f7238e50SJosef Bacik 		/*
690f7238e50SJosef Bacik 		 * We don't init the nr_global_roots until we load the global
691f7238e50SJosef Bacik 		 * roots, so this could be 0 at mount time.  If it's 0 we'll
692f7238e50SJosef Bacik 		 * just assume we're fine, and later we'll check against our
693f7238e50SJosef Bacik 		 * actual value.
694f7238e50SJosef Bacik 		 */
695f7238e50SJosef Bacik 		if (unlikely(fs_info->nr_global_roots &&
696f7238e50SJosef Bacik 			     chunk_objectid >= fs_info->nr_global_roots)) {
697f7238e50SJosef Bacik 			block_group_err(leaf, slot,
698f7238e50SJosef Bacik 	"invalid block group global root id, have %llu, needs to be <= %llu",
699f7238e50SJosef Bacik 					chunk_objectid,
700f7238e50SJosef Bacik 					fs_info->nr_global_roots);
701f7238e50SJosef Bacik 			return -EUCLEAN;
702f7238e50SJosef Bacik 		}
703f7238e50SJosef Bacik 	} else if (unlikely(chunk_objectid != BTRFS_FIRST_CHUNK_TREE_OBJECTID)) {
7044806bd88SDavid Sterba 		block_group_err(leaf, slot,
705fce466eaSQu Wenruo 		"invalid block group chunk objectid, have %llu expect %llu",
706de0dc456SDavid Sterba 				btrfs_stack_block_group_chunk_objectid(&bgi),
707fce466eaSQu Wenruo 				BTRFS_FIRST_CHUNK_TREE_OBJECTID);
708fce466eaSQu Wenruo 		return -EUCLEAN;
709fce466eaSQu Wenruo 	}
710fce466eaSQu Wenruo 
711c7c01a4aSDavid Sterba 	if (unlikely(btrfs_stack_block_group_used(&bgi) > key->offset)) {
7124806bd88SDavid Sterba 		block_group_err(leaf, slot,
713fce466eaSQu Wenruo 			"invalid block group used, have %llu expect [0, %llu)",
714de0dc456SDavid Sterba 				btrfs_stack_block_group_used(&bgi), key->offset);
715fce466eaSQu Wenruo 		return -EUCLEAN;
716fce466eaSQu Wenruo 	}
717fce466eaSQu Wenruo 
718de0dc456SDavid Sterba 	flags = btrfs_stack_block_group_flags(&bgi);
719c7c01a4aSDavid Sterba 	if (unlikely(hweight64(flags & BTRFS_BLOCK_GROUP_PROFILE_MASK) > 1)) {
7204806bd88SDavid Sterba 		block_group_err(leaf, slot,
721fce466eaSQu Wenruo "invalid profile flags, have 0x%llx (%lu bits set) expect no more than 1 bit set",
722fce466eaSQu Wenruo 			flags & BTRFS_BLOCK_GROUP_PROFILE_MASK,
723fce466eaSQu Wenruo 			hweight64(flags & BTRFS_BLOCK_GROUP_PROFILE_MASK));
724fce466eaSQu Wenruo 		return -EUCLEAN;
725fce466eaSQu Wenruo 	}
726fce466eaSQu Wenruo 
727fce466eaSQu Wenruo 	type = flags & BTRFS_BLOCK_GROUP_TYPE_MASK;
728c7c01a4aSDavid Sterba 	if (unlikely(type != BTRFS_BLOCK_GROUP_DATA &&
729fce466eaSQu Wenruo 		     type != BTRFS_BLOCK_GROUP_METADATA &&
730fce466eaSQu Wenruo 		     type != BTRFS_BLOCK_GROUP_SYSTEM &&
731fce466eaSQu Wenruo 		     type != (BTRFS_BLOCK_GROUP_METADATA |
732c7c01a4aSDavid Sterba 			      BTRFS_BLOCK_GROUP_DATA))) {
7334806bd88SDavid Sterba 		block_group_err(leaf, slot,
734761333f2SShaokun Zhang "invalid type, have 0x%llx (%lu bits set) expect either 0x%llx, 0x%llx, 0x%llx or 0x%llx",
735fce466eaSQu Wenruo 			type, hweight64(type),
736fce466eaSQu Wenruo 			BTRFS_BLOCK_GROUP_DATA, BTRFS_BLOCK_GROUP_METADATA,
737fce466eaSQu Wenruo 			BTRFS_BLOCK_GROUP_SYSTEM,
738fce466eaSQu Wenruo 			BTRFS_BLOCK_GROUP_METADATA | BTRFS_BLOCK_GROUP_DATA);
739fce466eaSQu Wenruo 		return -EUCLEAN;
740fce466eaSQu Wenruo 	}
741fce466eaSQu Wenruo 	return 0;
742fce466eaSQu Wenruo }
743fce466eaSQu Wenruo 
744d001e4a3SDavid Sterba __printf(4, 5)
745f1140243SQu Wenruo __cold
746d001e4a3SDavid Sterba static void chunk_err(const struct extent_buffer *leaf,
747f1140243SQu Wenruo 		      const struct btrfs_chunk *chunk, u64 logical,
748f1140243SQu Wenruo 		      const char *fmt, ...)
749f1140243SQu Wenruo {
750d001e4a3SDavid Sterba 	const struct btrfs_fs_info *fs_info = leaf->fs_info;
751f1140243SQu Wenruo 	bool is_sb;
752f1140243SQu Wenruo 	struct va_format vaf;
753f1140243SQu Wenruo 	va_list args;
754f1140243SQu Wenruo 	int i;
755f1140243SQu Wenruo 	int slot = -1;
756f1140243SQu Wenruo 
757f1140243SQu Wenruo 	/* Only superblock eb is able to have such small offset */
758f1140243SQu Wenruo 	is_sb = (leaf->start == BTRFS_SUPER_INFO_OFFSET);
759f1140243SQu Wenruo 
760f1140243SQu Wenruo 	if (!is_sb) {
761f1140243SQu Wenruo 		/*
762f1140243SQu Wenruo 		 * Get the slot number by iterating through all slots, this
763f1140243SQu Wenruo 		 * would provide better readability.
764f1140243SQu Wenruo 		 */
765f1140243SQu Wenruo 		for (i = 0; i < btrfs_header_nritems(leaf); i++) {
766f1140243SQu Wenruo 			if (btrfs_item_ptr_offset(leaf, i) ==
767f1140243SQu Wenruo 					(unsigned long)chunk) {
768f1140243SQu Wenruo 				slot = i;
769f1140243SQu Wenruo 				break;
770f1140243SQu Wenruo 			}
771f1140243SQu Wenruo 		}
772f1140243SQu Wenruo 	}
773f1140243SQu Wenruo 	va_start(args, fmt);
774f1140243SQu Wenruo 	vaf.fmt = fmt;
775f1140243SQu Wenruo 	vaf.va = &args;
776f1140243SQu Wenruo 
777f1140243SQu Wenruo 	if (is_sb)
778f1140243SQu Wenruo 		btrfs_crit(fs_info,
779f1140243SQu Wenruo 		"corrupt superblock syschunk array: chunk_start=%llu, %pV",
780f1140243SQu Wenruo 			   logical, &vaf);
781f1140243SQu Wenruo 	else
782f1140243SQu Wenruo 		btrfs_crit(fs_info,
783f1140243SQu Wenruo 	"corrupt leaf: root=%llu block=%llu slot=%d chunk_start=%llu, %pV",
784f1140243SQu Wenruo 			   BTRFS_CHUNK_TREE_OBJECTID, leaf->start, slot,
785f1140243SQu Wenruo 			   logical, &vaf);
786f1140243SQu Wenruo 	va_end(args);
787f1140243SQu Wenruo }
788f1140243SQu Wenruo 
789ad7b0368SQu Wenruo /*
79082fc28fbSQu Wenruo  * The common chunk check which could also work on super block sys chunk array.
79182fc28fbSQu Wenruo  *
792bf871c3bSQu Wenruo  * Return -EUCLEAN if anything is corrupted.
79382fc28fbSQu Wenruo  * Return 0 if everything is OK.
79482fc28fbSQu Wenruo  */
795ddaf1d5aSDavid Sterba int btrfs_check_chunk_valid(struct extent_buffer *leaf,
79682fc28fbSQu Wenruo 			    struct btrfs_chunk *chunk, u64 logical)
79782fc28fbSQu Wenruo {
798ddaf1d5aSDavid Sterba 	struct btrfs_fs_info *fs_info = leaf->fs_info;
79982fc28fbSQu Wenruo 	u64 length;
800347fb0cfSSu Yue 	u64 chunk_end;
80182fc28fbSQu Wenruo 	u64 stripe_len;
80282fc28fbSQu Wenruo 	u16 num_stripes;
80382fc28fbSQu Wenruo 	u16 sub_stripes;
80482fc28fbSQu Wenruo 	u64 type;
80582fc28fbSQu Wenruo 	u64 features;
80682fc28fbSQu Wenruo 	bool mixed = false;
80785d07fbeSDaniel Xu 	int raid_index;
80885d07fbeSDaniel Xu 	int nparity;
80985d07fbeSDaniel Xu 	int ncopies;
81082fc28fbSQu Wenruo 
81182fc28fbSQu Wenruo 	length = btrfs_chunk_length(leaf, chunk);
81282fc28fbSQu Wenruo 	stripe_len = btrfs_chunk_stripe_len(leaf, chunk);
81382fc28fbSQu Wenruo 	num_stripes = btrfs_chunk_num_stripes(leaf, chunk);
81482fc28fbSQu Wenruo 	sub_stripes = btrfs_chunk_sub_stripes(leaf, chunk);
81582fc28fbSQu Wenruo 	type = btrfs_chunk_type(leaf, chunk);
81685d07fbeSDaniel Xu 	raid_index = btrfs_bg_flags_to_raid_index(type);
81785d07fbeSDaniel Xu 	ncopies = btrfs_raid_array[raid_index].ncopies;
81885d07fbeSDaniel Xu 	nparity = btrfs_raid_array[raid_index].nparity;
81982fc28fbSQu Wenruo 
820c7c01a4aSDavid Sterba 	if (unlikely(!num_stripes)) {
821d001e4a3SDavid Sterba 		chunk_err(leaf, chunk, logical,
822f1140243SQu Wenruo 			  "invalid chunk num_stripes, have %u", num_stripes);
823bf871c3bSQu Wenruo 		return -EUCLEAN;
82482fc28fbSQu Wenruo 	}
825c7c01a4aSDavid Sterba 	if (unlikely(num_stripes < ncopies)) {
82685d07fbeSDaniel Xu 		chunk_err(leaf, chunk, logical,
82785d07fbeSDaniel Xu 			  "invalid chunk num_stripes < ncopies, have %u < %d",
82885d07fbeSDaniel Xu 			  num_stripes, ncopies);
82985d07fbeSDaniel Xu 		return -EUCLEAN;
83085d07fbeSDaniel Xu 	}
831c7c01a4aSDavid Sterba 	if (unlikely(nparity && num_stripes == nparity)) {
83285d07fbeSDaniel Xu 		chunk_err(leaf, chunk, logical,
83385d07fbeSDaniel Xu 			  "invalid chunk num_stripes == nparity, have %u == %d",
83485d07fbeSDaniel Xu 			  num_stripes, nparity);
83585d07fbeSDaniel Xu 		return -EUCLEAN;
83685d07fbeSDaniel Xu 	}
837c7c01a4aSDavid Sterba 	if (unlikely(!IS_ALIGNED(logical, fs_info->sectorsize))) {
838d001e4a3SDavid Sterba 		chunk_err(leaf, chunk, logical,
839f1140243SQu Wenruo 		"invalid chunk logical, have %llu should aligned to %u",
840f1140243SQu Wenruo 			  logical, fs_info->sectorsize);
841bf871c3bSQu Wenruo 		return -EUCLEAN;
84282fc28fbSQu Wenruo 	}
843c7c01a4aSDavid Sterba 	if (unlikely(btrfs_chunk_sector_size(leaf, chunk) != fs_info->sectorsize)) {
844d001e4a3SDavid Sterba 		chunk_err(leaf, chunk, logical,
845f1140243SQu Wenruo 			  "invalid chunk sectorsize, have %u expect %u",
846f1140243SQu Wenruo 			  btrfs_chunk_sector_size(leaf, chunk),
847f1140243SQu Wenruo 			  fs_info->sectorsize);
848bf871c3bSQu Wenruo 		return -EUCLEAN;
84982fc28fbSQu Wenruo 	}
850c7c01a4aSDavid Sterba 	if (unlikely(!length || !IS_ALIGNED(length, fs_info->sectorsize))) {
851d001e4a3SDavid Sterba 		chunk_err(leaf, chunk, logical,
852f1140243SQu Wenruo 			  "invalid chunk length, have %llu", length);
853bf871c3bSQu Wenruo 		return -EUCLEAN;
85482fc28fbSQu Wenruo 	}
855347fb0cfSSu Yue 	if (unlikely(check_add_overflow(logical, length, &chunk_end))) {
856347fb0cfSSu Yue 		chunk_err(leaf, chunk, logical,
857347fb0cfSSu Yue "invalid chunk logical start and length, have logical start %llu length %llu",
858347fb0cfSSu Yue 			  logical, length);
859347fb0cfSSu Yue 		return -EUCLEAN;
860347fb0cfSSu Yue 	}
861c7c01a4aSDavid Sterba 	if (unlikely(!is_power_of_2(stripe_len) || stripe_len != BTRFS_STRIPE_LEN)) {
862d001e4a3SDavid Sterba 		chunk_err(leaf, chunk, logical,
863f1140243SQu Wenruo 			  "invalid chunk stripe length: %llu",
86482fc28fbSQu Wenruo 			  stripe_len);
865bf871c3bSQu Wenruo 		return -EUCLEAN;
86682fc28fbSQu Wenruo 	}
8676ded22c1SQu Wenruo 	/*
8686ded22c1SQu Wenruo 	 * We artificially limit the chunk size, so that the number of stripes
8696ded22c1SQu Wenruo 	 * inside a chunk can be fit into a U32.  The current limit (256G) is
8706ded22c1SQu Wenruo 	 * way too large for real world usage anyway, and it's also much larger
8716ded22c1SQu Wenruo 	 * than our existing limit (10G).
8726ded22c1SQu Wenruo 	 *
8736ded22c1SQu Wenruo 	 * Thus it should be a good way to catch obvious bitflips.
8746ded22c1SQu Wenruo 	 */
875cb091225SQu Wenruo 	if (unlikely(length >= btrfs_stripe_nr_to_offset(U32_MAX))) {
8766ded22c1SQu Wenruo 		chunk_err(leaf, chunk, logical,
8776ded22c1SQu Wenruo 			  "chunk length too large: have %llu limit %llu",
878cb091225SQu Wenruo 			  length, btrfs_stripe_nr_to_offset(U32_MAX));
8796ded22c1SQu Wenruo 		return -EUCLEAN;
8806ded22c1SQu Wenruo 	}
881c7c01a4aSDavid Sterba 	if (unlikely(type & ~(BTRFS_BLOCK_GROUP_TYPE_MASK |
882c7c01a4aSDavid Sterba 			      BTRFS_BLOCK_GROUP_PROFILE_MASK))) {
883d001e4a3SDavid Sterba 		chunk_err(leaf, chunk, logical,
884f1140243SQu Wenruo 			  "unrecognized chunk type: 0x%llx",
88582fc28fbSQu Wenruo 			  ~(BTRFS_BLOCK_GROUP_TYPE_MASK |
88682fc28fbSQu Wenruo 			    BTRFS_BLOCK_GROUP_PROFILE_MASK) &
88782fc28fbSQu Wenruo 			  btrfs_chunk_type(leaf, chunk));
888bf871c3bSQu Wenruo 		return -EUCLEAN;
88982fc28fbSQu Wenruo 	}
89082fc28fbSQu Wenruo 
891c7c01a4aSDavid Sterba 	if (unlikely(!has_single_bit_set(type & BTRFS_BLOCK_GROUP_PROFILE_MASK) &&
892c7c01a4aSDavid Sterba 		     (type & BTRFS_BLOCK_GROUP_PROFILE_MASK) != 0)) {
893d001e4a3SDavid Sterba 		chunk_err(leaf, chunk, logical,
89480e46cf2SQu Wenruo 		"invalid chunk profile flag: 0x%llx, expect 0 or 1 bit set",
89580e46cf2SQu Wenruo 			  type & BTRFS_BLOCK_GROUP_PROFILE_MASK);
89680e46cf2SQu Wenruo 		return -EUCLEAN;
89780e46cf2SQu Wenruo 	}
898c7c01a4aSDavid Sterba 	if (unlikely((type & BTRFS_BLOCK_GROUP_TYPE_MASK) == 0)) {
899d001e4a3SDavid Sterba 		chunk_err(leaf, chunk, logical,
900f1140243SQu Wenruo 	"missing chunk type flag, have 0x%llx one bit must be set in 0x%llx",
901f1140243SQu Wenruo 			  type, BTRFS_BLOCK_GROUP_TYPE_MASK);
902bf871c3bSQu Wenruo 		return -EUCLEAN;
90382fc28fbSQu Wenruo 	}
90482fc28fbSQu Wenruo 
905c7c01a4aSDavid Sterba 	if (unlikely((type & BTRFS_BLOCK_GROUP_SYSTEM) &&
906c7c01a4aSDavid Sterba 		     (type & (BTRFS_BLOCK_GROUP_METADATA |
907c7c01a4aSDavid Sterba 			      BTRFS_BLOCK_GROUP_DATA)))) {
908d001e4a3SDavid Sterba 		chunk_err(leaf, chunk, logical,
909f1140243SQu Wenruo 			  "system chunk with data or metadata type: 0x%llx",
910f1140243SQu Wenruo 			  type);
911bf871c3bSQu Wenruo 		return -EUCLEAN;
91282fc28fbSQu Wenruo 	}
91382fc28fbSQu Wenruo 
91482fc28fbSQu Wenruo 	features = btrfs_super_incompat_flags(fs_info->super_copy);
91582fc28fbSQu Wenruo 	if (features & BTRFS_FEATURE_INCOMPAT_MIXED_GROUPS)
91682fc28fbSQu Wenruo 		mixed = true;
91782fc28fbSQu Wenruo 
91882fc28fbSQu Wenruo 	if (!mixed) {
919c7c01a4aSDavid Sterba 		if (unlikely((type & BTRFS_BLOCK_GROUP_METADATA) &&
920c7c01a4aSDavid Sterba 			     (type & BTRFS_BLOCK_GROUP_DATA))) {
921d001e4a3SDavid Sterba 			chunk_err(leaf, chunk, logical,
92282fc28fbSQu Wenruo 			"mixed chunk type in non-mixed mode: 0x%llx", type);
923bf871c3bSQu Wenruo 			return -EUCLEAN;
92482fc28fbSQu Wenruo 		}
92582fc28fbSQu Wenruo 	}
92682fc28fbSQu Wenruo 
9270ac6e06bSDavid Sterba 	if (unlikely((type & BTRFS_BLOCK_GROUP_RAID10 &&
9280ac6e06bSDavid Sterba 		      sub_stripes != btrfs_raid_array[BTRFS_RAID_RAID10].sub_stripes) ||
9290ac6e06bSDavid Sterba 		     (type & BTRFS_BLOCK_GROUP_RAID1 &&
9300ac6e06bSDavid Sterba 		      num_stripes != btrfs_raid_array[BTRFS_RAID_RAID1].devs_min) ||
9316c154ba4SDavid Sterba 		     (type & BTRFS_BLOCK_GROUP_RAID1C3 &&
9326c154ba4SDavid Sterba 		      num_stripes != btrfs_raid_array[BTRFS_RAID_RAID1C3].devs_min) ||
9336c154ba4SDavid Sterba 		     (type & BTRFS_BLOCK_GROUP_RAID1C4 &&
9346c154ba4SDavid Sterba 		      num_stripes != btrfs_raid_array[BTRFS_RAID_RAID1C4].devs_min) ||
9350ac6e06bSDavid Sterba 		     (type & BTRFS_BLOCK_GROUP_RAID5 &&
9360ac6e06bSDavid Sterba 		      num_stripes < btrfs_raid_array[BTRFS_RAID_RAID5].devs_min) ||
9370ac6e06bSDavid Sterba 		     (type & BTRFS_BLOCK_GROUP_RAID6 &&
9380ac6e06bSDavid Sterba 		      num_stripes < btrfs_raid_array[BTRFS_RAID_RAID6].devs_min) ||
9390ac6e06bSDavid Sterba 		     (type & BTRFS_BLOCK_GROUP_DUP &&
9400ac6e06bSDavid Sterba 		      num_stripes != btrfs_raid_array[BTRFS_RAID_DUP].dev_stripes) ||
941c7c01a4aSDavid Sterba 		     ((type & BTRFS_BLOCK_GROUP_PROFILE_MASK) == 0 &&
9420ac6e06bSDavid Sterba 		      num_stripes != btrfs_raid_array[BTRFS_RAID_SINGLE].dev_stripes))) {
943d001e4a3SDavid Sterba 		chunk_err(leaf, chunk, logical,
94482fc28fbSQu Wenruo 			"invalid num_stripes:sub_stripes %u:%u for profile %llu",
94582fc28fbSQu Wenruo 			num_stripes, sub_stripes,
94682fc28fbSQu Wenruo 			type & BTRFS_BLOCK_GROUP_PROFILE_MASK);
947bf871c3bSQu Wenruo 		return -EUCLEAN;
94882fc28fbSQu Wenruo 	}
94982fc28fbSQu Wenruo 
95082fc28fbSQu Wenruo 	return 0;
95182fc28fbSQu Wenruo }
95282fc28fbSQu Wenruo 
953f6d2a5c2SQu Wenruo /*
954f6d2a5c2SQu Wenruo  * Enhanced version of chunk item checker.
955f6d2a5c2SQu Wenruo  *
956f6d2a5c2SQu Wenruo  * The common btrfs_check_chunk_valid() doesn't check item size since it needs
957f6d2a5c2SQu Wenruo  * to work on super block sys_chunk_array which doesn't have full item ptr.
958f6d2a5c2SQu Wenruo  */
959f6d2a5c2SQu Wenruo static int check_leaf_chunk_item(struct extent_buffer *leaf,
960f6d2a5c2SQu Wenruo 				 struct btrfs_chunk *chunk,
961f6d2a5c2SQu Wenruo 				 struct btrfs_key *key, int slot)
962f6d2a5c2SQu Wenruo {
963f6d2a5c2SQu Wenruo 	int num_stripes;
964f6d2a5c2SQu Wenruo 
9653212fa14SJosef Bacik 	if (unlikely(btrfs_item_size(leaf, slot) < sizeof(struct btrfs_chunk))) {
966f6d2a5c2SQu Wenruo 		chunk_err(leaf, chunk, key->offset,
967f6d2a5c2SQu Wenruo 			"invalid chunk item size: have %u expect [%zu, %u)",
9683212fa14SJosef Bacik 			btrfs_item_size(leaf, slot),
969f6d2a5c2SQu Wenruo 			sizeof(struct btrfs_chunk),
970f6d2a5c2SQu Wenruo 			BTRFS_LEAF_DATA_SIZE(leaf->fs_info));
971f6d2a5c2SQu Wenruo 		return -EUCLEAN;
972f6d2a5c2SQu Wenruo 	}
973f6d2a5c2SQu Wenruo 
974f6d2a5c2SQu Wenruo 	num_stripes = btrfs_chunk_num_stripes(leaf, chunk);
975f6d2a5c2SQu Wenruo 	/* Let btrfs_check_chunk_valid() handle this error type */
976f6d2a5c2SQu Wenruo 	if (num_stripes == 0)
977f6d2a5c2SQu Wenruo 		goto out;
978f6d2a5c2SQu Wenruo 
979c7c01a4aSDavid Sterba 	if (unlikely(btrfs_chunk_item_size(num_stripes) !=
9803212fa14SJosef Bacik 		     btrfs_item_size(leaf, slot))) {
981f6d2a5c2SQu Wenruo 		chunk_err(leaf, chunk, key->offset,
982f6d2a5c2SQu Wenruo 			"invalid chunk item size: have %u expect %lu",
9833212fa14SJosef Bacik 			btrfs_item_size(leaf, slot),
984f6d2a5c2SQu Wenruo 			btrfs_chunk_item_size(num_stripes));
985f6d2a5c2SQu Wenruo 		return -EUCLEAN;
986f6d2a5c2SQu Wenruo 	}
987f6d2a5c2SQu Wenruo out:
988f6d2a5c2SQu Wenruo 	return btrfs_check_chunk_valid(leaf, chunk, key->offset);
989f6d2a5c2SQu Wenruo }
990f6d2a5c2SQu Wenruo 
9915617ed80SDavid Sterba __printf(3, 4)
992ab4ba2e1SQu Wenruo __cold
9935617ed80SDavid Sterba static void dev_item_err(const struct extent_buffer *eb, int slot,
994ab4ba2e1SQu Wenruo 			 const char *fmt, ...)
995ab4ba2e1SQu Wenruo {
996ab4ba2e1SQu Wenruo 	struct btrfs_key key;
997ab4ba2e1SQu Wenruo 	struct va_format vaf;
998ab4ba2e1SQu Wenruo 	va_list args;
999ab4ba2e1SQu Wenruo 
1000ab4ba2e1SQu Wenruo 	btrfs_item_key_to_cpu(eb, &key, slot);
1001ab4ba2e1SQu Wenruo 	va_start(args, fmt);
1002ab4ba2e1SQu Wenruo 
1003ab4ba2e1SQu Wenruo 	vaf.fmt = fmt;
1004ab4ba2e1SQu Wenruo 	vaf.va = &args;
1005ab4ba2e1SQu Wenruo 
10065617ed80SDavid Sterba 	btrfs_crit(eb->fs_info,
1007ab4ba2e1SQu Wenruo 	"corrupt %s: root=%llu block=%llu slot=%d devid=%llu %pV",
1008ab4ba2e1SQu Wenruo 		btrfs_header_level(eb) == 0 ? "leaf" : "node",
1009ab4ba2e1SQu Wenruo 		btrfs_header_owner(eb), btrfs_header_bytenr(eb), slot,
1010ab4ba2e1SQu Wenruo 		key.objectid, &vaf);
1011ab4ba2e1SQu Wenruo 	va_end(args);
1012ab4ba2e1SQu Wenruo }
1013ab4ba2e1SQu Wenruo 
1014412a2312SDavid Sterba static int check_dev_item(struct extent_buffer *leaf,
1015ab4ba2e1SQu Wenruo 			  struct btrfs_key *key, int slot)
1016ab4ba2e1SQu Wenruo {
1017ab4ba2e1SQu Wenruo 	struct btrfs_dev_item *ditem;
1018ea1d1ca4SSu Yue 	const u32 item_size = btrfs_item_size(leaf, slot);
1019ab4ba2e1SQu Wenruo 
1020c7c01a4aSDavid Sterba 	if (unlikely(key->objectid != BTRFS_DEV_ITEMS_OBJECTID)) {
10215617ed80SDavid Sterba 		dev_item_err(leaf, slot,
1022ab4ba2e1SQu Wenruo 			     "invalid objectid: has=%llu expect=%llu",
1023ab4ba2e1SQu Wenruo 			     key->objectid, BTRFS_DEV_ITEMS_OBJECTID);
1024ab4ba2e1SQu Wenruo 		return -EUCLEAN;
1025ab4ba2e1SQu Wenruo 	}
1026ea1d1ca4SSu Yue 
1027ea1d1ca4SSu Yue 	if (unlikely(item_size != sizeof(*ditem))) {
1028ea1d1ca4SSu Yue 		dev_item_err(leaf, slot, "invalid item size: has %u expect %zu",
1029ea1d1ca4SSu Yue 			     item_size, sizeof(*ditem));
1030ea1d1ca4SSu Yue 		return -EUCLEAN;
1031ea1d1ca4SSu Yue 	}
1032ea1d1ca4SSu Yue 
1033ab4ba2e1SQu Wenruo 	ditem = btrfs_item_ptr(leaf, slot, struct btrfs_dev_item);
1034c7c01a4aSDavid Sterba 	if (unlikely(btrfs_device_id(leaf, ditem) != key->offset)) {
10355617ed80SDavid Sterba 		dev_item_err(leaf, slot,
1036ab4ba2e1SQu Wenruo 			     "devid mismatch: key has=%llu item has=%llu",
1037ab4ba2e1SQu Wenruo 			     key->offset, btrfs_device_id(leaf, ditem));
1038ab4ba2e1SQu Wenruo 		return -EUCLEAN;
1039ab4ba2e1SQu Wenruo 	}
1040ab4ba2e1SQu Wenruo 
1041ab4ba2e1SQu Wenruo 	/*
1042ab4ba2e1SQu Wenruo 	 * For device total_bytes, we don't have reliable way to check it, as
1043ab4ba2e1SQu Wenruo 	 * it can be 0 for device removal. Device size check can only be done
1044ab4ba2e1SQu Wenruo 	 * by dev extents check.
1045ab4ba2e1SQu Wenruo 	 */
1046c7c01a4aSDavid Sterba 	if (unlikely(btrfs_device_bytes_used(leaf, ditem) >
1047c7c01a4aSDavid Sterba 		     btrfs_device_total_bytes(leaf, ditem))) {
10485617ed80SDavid Sterba 		dev_item_err(leaf, slot,
1049ab4ba2e1SQu Wenruo 			     "invalid bytes used: have %llu expect [0, %llu]",
1050ab4ba2e1SQu Wenruo 			     btrfs_device_bytes_used(leaf, ditem),
1051ab4ba2e1SQu Wenruo 			     btrfs_device_total_bytes(leaf, ditem));
1052ab4ba2e1SQu Wenruo 		return -EUCLEAN;
1053ab4ba2e1SQu Wenruo 	}
1054ab4ba2e1SQu Wenruo 	/*
1055ab4ba2e1SQu Wenruo 	 * Remaining members like io_align/type/gen/dev_group aren't really
1056ab4ba2e1SQu Wenruo 	 * utilized.  Skip them to make later usage of them easier.
1057ab4ba2e1SQu Wenruo 	 */
1058ab4ba2e1SQu Wenruo 	return 0;
1059ab4ba2e1SQu Wenruo }
1060ab4ba2e1SQu Wenruo 
106139e57f49SDavid Sterba static int check_inode_item(struct extent_buffer *leaf,
1062496245caSQu Wenruo 			    struct btrfs_key *key, int slot)
1063496245caSQu Wenruo {
106439e57f49SDavid Sterba 	struct btrfs_fs_info *fs_info = leaf->fs_info;
1065496245caSQu Wenruo 	struct btrfs_inode_item *iitem;
1066496245caSQu Wenruo 	u64 super_gen = btrfs_super_generation(fs_info->super_copy);
1067496245caSQu Wenruo 	u32 valid_mask = (S_IFMT | S_ISUID | S_ISGID | S_ISVTX | 0777);
10680c982944SSu Yue 	const u32 item_size = btrfs_item_size(leaf, slot);
1069496245caSQu Wenruo 	u32 mode;
1070c23c77b0SQu Wenruo 	int ret;
107177eea05eSBoris Burkov 	u32 flags;
107277eea05eSBoris Burkov 	u32 ro_flags;
1073496245caSQu Wenruo 
1074c23c77b0SQu Wenruo 	ret = check_inode_key(leaf, key, slot);
1075c7c01a4aSDavid Sterba 	if (unlikely(ret < 0))
1076c23c77b0SQu Wenruo 		return ret;
1077c23c77b0SQu Wenruo 
10780c982944SSu Yue 	if (unlikely(item_size != sizeof(*iitem))) {
10790c982944SSu Yue 		generic_err(leaf, slot, "invalid item size: has %u expect %zu",
10800c982944SSu Yue 			    item_size, sizeof(*iitem));
10810c982944SSu Yue 		return -EUCLEAN;
10820c982944SSu Yue 	}
10830c982944SSu Yue 
1084496245caSQu Wenruo 	iitem = btrfs_item_ptr(leaf, slot, struct btrfs_inode_item);
1085496245caSQu Wenruo 
1086496245caSQu Wenruo 	/* Here we use super block generation + 1 to handle log tree */
1087c7c01a4aSDavid Sterba 	if (unlikely(btrfs_inode_generation(leaf, iitem) > super_gen + 1)) {
1088c3053ebbSQu Wenruo 		inode_item_err(leaf, slot,
1089496245caSQu Wenruo 			"invalid inode generation: has %llu expect (0, %llu]",
1090496245caSQu Wenruo 			       btrfs_inode_generation(leaf, iitem),
1091496245caSQu Wenruo 			       super_gen + 1);
1092496245caSQu Wenruo 		return -EUCLEAN;
1093496245caSQu Wenruo 	}
1094496245caSQu Wenruo 	/* Note for ROOT_TREE_DIR_ITEM, mkfs could set its transid 0 */
1095c7c01a4aSDavid Sterba 	if (unlikely(btrfs_inode_transid(leaf, iitem) > super_gen + 1)) {
1096c3053ebbSQu Wenruo 		inode_item_err(leaf, slot,
1097f96d6960SQu Wenruo 			"invalid inode transid: has %llu expect [0, %llu]",
1098496245caSQu Wenruo 			       btrfs_inode_transid(leaf, iitem), super_gen + 1);
1099496245caSQu Wenruo 		return -EUCLEAN;
1100496245caSQu Wenruo 	}
1101496245caSQu Wenruo 
1102496245caSQu Wenruo 	/*
1103496245caSQu Wenruo 	 * For size and nbytes it's better not to be too strict, as for dir
1104496245caSQu Wenruo 	 * item its size/nbytes can easily get wrong, but doesn't affect
1105496245caSQu Wenruo 	 * anything in the fs. So here we skip the check.
1106496245caSQu Wenruo 	 */
1107496245caSQu Wenruo 	mode = btrfs_inode_mode(leaf, iitem);
1108c7c01a4aSDavid Sterba 	if (unlikely(mode & ~valid_mask)) {
1109c3053ebbSQu Wenruo 		inode_item_err(leaf, slot,
1110496245caSQu Wenruo 			       "unknown mode bit detected: 0x%x",
1111496245caSQu Wenruo 			       mode & ~valid_mask);
1112496245caSQu Wenruo 		return -EUCLEAN;
1113496245caSQu Wenruo 	}
1114496245caSQu Wenruo 
1115496245caSQu Wenruo 	/*
1116c1499166SDavid Sterba 	 * S_IFMT is not bit mapped so we can't completely rely on
1117c1499166SDavid Sterba 	 * is_power_of_2/has_single_bit_set, but it can save us from checking
1118c1499166SDavid Sterba 	 * FIFO/CHR/DIR/REG.  Only needs to check BLK, LNK and SOCKS
1119496245caSQu Wenruo 	 */
1120c1499166SDavid Sterba 	if (!has_single_bit_set(mode & S_IFMT)) {
1121c7c01a4aSDavid Sterba 		if (unlikely(!S_ISLNK(mode) && !S_ISBLK(mode) && !S_ISSOCK(mode))) {
1122c3053ebbSQu Wenruo 			inode_item_err(leaf, slot,
1123496245caSQu Wenruo 			"invalid mode: has 0%o expect valid S_IF* bit(s)",
1124496245caSQu Wenruo 				       mode & S_IFMT);
1125496245caSQu Wenruo 			return -EUCLEAN;
1126496245caSQu Wenruo 		}
1127496245caSQu Wenruo 	}
1128c7c01a4aSDavid Sterba 	if (unlikely(S_ISDIR(mode) && btrfs_inode_nlink(leaf, iitem) > 1)) {
1129c3053ebbSQu Wenruo 		inode_item_err(leaf, slot,
1130496245caSQu Wenruo 		       "invalid nlink: has %u expect no more than 1 for dir",
1131496245caSQu Wenruo 			btrfs_inode_nlink(leaf, iitem));
1132496245caSQu Wenruo 		return -EUCLEAN;
1133496245caSQu Wenruo 	}
113477eea05eSBoris Burkov 	btrfs_inode_split_flags(btrfs_inode_flags(leaf, iitem), &flags, &ro_flags);
113577eea05eSBoris Burkov 	if (unlikely(flags & ~BTRFS_INODE_FLAG_MASK)) {
1136c3053ebbSQu Wenruo 		inode_item_err(leaf, slot,
113777eea05eSBoris Burkov 			       "unknown incompat flags detected: 0x%x", flags);
113877eea05eSBoris Burkov 		return -EUCLEAN;
113977eea05eSBoris Burkov 	}
114077eea05eSBoris Burkov 	if (unlikely(!sb_rdonly(fs_info->sb) &&
114177eea05eSBoris Burkov 		     (ro_flags & ~BTRFS_INODE_RO_FLAG_MASK))) {
114277eea05eSBoris Burkov 		inode_item_err(leaf, slot,
114377eea05eSBoris Burkov 			"unknown ro-compat flags detected on writeable mount: 0x%x",
114477eea05eSBoris Burkov 			ro_flags);
1145496245caSQu Wenruo 		return -EUCLEAN;
1146496245caSQu Wenruo 	}
1147496245caSQu Wenruo 	return 0;
1148496245caSQu Wenruo }
1149496245caSQu Wenruo 
1150259ee775SQu Wenruo static int check_root_item(struct extent_buffer *leaf, struct btrfs_key *key,
1151259ee775SQu Wenruo 			   int slot)
1152259ee775SQu Wenruo {
1153259ee775SQu Wenruo 	struct btrfs_fs_info *fs_info = leaf->fs_info;
11541465af12SQu Wenruo 	struct btrfs_root_item ri = { 0 };
1155259ee775SQu Wenruo 	const u64 valid_root_flags = BTRFS_ROOT_SUBVOL_RDONLY |
1156259ee775SQu Wenruo 				     BTRFS_ROOT_SUBVOL_DEAD;
115757a0e674SQu Wenruo 	int ret;
1158259ee775SQu Wenruo 
115957a0e674SQu Wenruo 	ret = check_root_key(leaf, key, slot);
1160c7c01a4aSDavid Sterba 	if (unlikely(ret < 0))
116157a0e674SQu Wenruo 		return ret;
1162259ee775SQu Wenruo 
11633212fa14SJosef Bacik 	if (unlikely(btrfs_item_size(leaf, slot) != sizeof(ri) &&
11643212fa14SJosef Bacik 		     btrfs_item_size(leaf, slot) !=
1165c7c01a4aSDavid Sterba 		     btrfs_legacy_root_item_size())) {
1166259ee775SQu Wenruo 		generic_err(leaf, slot,
11671465af12SQu Wenruo 			    "invalid root item size, have %u expect %zu or %u",
11683212fa14SJosef Bacik 			    btrfs_item_size(leaf, slot), sizeof(ri),
11691465af12SQu Wenruo 			    btrfs_legacy_root_item_size());
11701a49a97dSDaniel Xu 		return -EUCLEAN;
1171259ee775SQu Wenruo 	}
1172259ee775SQu Wenruo 
11731465af12SQu Wenruo 	/*
11741465af12SQu Wenruo 	 * For legacy root item, the members starting at generation_v2 will be
11751465af12SQu Wenruo 	 * all filled with 0.
	 * And since we allow generation_v2 as 0, it will still pass the check.
11771465af12SQu Wenruo 	 */
1178259ee775SQu Wenruo 	read_extent_buffer(leaf, &ri, btrfs_item_ptr_offset(leaf, slot),
11793212fa14SJosef Bacik 			   btrfs_item_size(leaf, slot));
1180259ee775SQu Wenruo 
1181259ee775SQu Wenruo 	/* Generation related */
1182c7c01a4aSDavid Sterba 	if (unlikely(btrfs_root_generation(&ri) >
1183c7c01a4aSDavid Sterba 		     btrfs_super_generation(fs_info->super_copy) + 1)) {
1184259ee775SQu Wenruo 		generic_err(leaf, slot,
1185259ee775SQu Wenruo 			"invalid root generation, have %llu expect (0, %llu]",
1186259ee775SQu Wenruo 			    btrfs_root_generation(&ri),
1187259ee775SQu Wenruo 			    btrfs_super_generation(fs_info->super_copy) + 1);
1188259ee775SQu Wenruo 		return -EUCLEAN;
1189259ee775SQu Wenruo 	}
1190c7c01a4aSDavid Sterba 	if (unlikely(btrfs_root_generation_v2(&ri) >
1191c7c01a4aSDavid Sterba 		     btrfs_super_generation(fs_info->super_copy) + 1)) {
1192259ee775SQu Wenruo 		generic_err(leaf, slot,
1193259ee775SQu Wenruo 		"invalid root v2 generation, have %llu expect (0, %llu]",
1194259ee775SQu Wenruo 			    btrfs_root_generation_v2(&ri),
1195259ee775SQu Wenruo 			    btrfs_super_generation(fs_info->super_copy) + 1);
1196259ee775SQu Wenruo 		return -EUCLEAN;
1197259ee775SQu Wenruo 	}
1198c7c01a4aSDavid Sterba 	if (unlikely(btrfs_root_last_snapshot(&ri) >
1199c7c01a4aSDavid Sterba 		     btrfs_super_generation(fs_info->super_copy) + 1)) {
1200259ee775SQu Wenruo 		generic_err(leaf, slot,
1201259ee775SQu Wenruo 		"invalid root last_snapshot, have %llu expect (0, %llu]",
1202259ee775SQu Wenruo 			    btrfs_root_last_snapshot(&ri),
1203259ee775SQu Wenruo 			    btrfs_super_generation(fs_info->super_copy) + 1);
1204259ee775SQu Wenruo 		return -EUCLEAN;
1205259ee775SQu Wenruo 	}
1206259ee775SQu Wenruo 
1207259ee775SQu Wenruo 	/* Alignment and level check */
1208c7c01a4aSDavid Sterba 	if (unlikely(!IS_ALIGNED(btrfs_root_bytenr(&ri), fs_info->sectorsize))) {
1209259ee775SQu Wenruo 		generic_err(leaf, slot,
1210259ee775SQu Wenruo 		"invalid root bytenr, have %llu expect to be aligned to %u",
1211259ee775SQu Wenruo 			    btrfs_root_bytenr(&ri), fs_info->sectorsize);
1212259ee775SQu Wenruo 		return -EUCLEAN;
1213259ee775SQu Wenruo 	}
1214c7c01a4aSDavid Sterba 	if (unlikely(btrfs_root_level(&ri) >= BTRFS_MAX_LEVEL)) {
1215259ee775SQu Wenruo 		generic_err(leaf, slot,
1216259ee775SQu Wenruo 			    "invalid root level, have %u expect [0, %u]",
1217259ee775SQu Wenruo 			    btrfs_root_level(&ri), BTRFS_MAX_LEVEL - 1);
1218259ee775SQu Wenruo 		return -EUCLEAN;
1219259ee775SQu Wenruo 	}
1220c7c01a4aSDavid Sterba 	if (unlikely(btrfs_root_drop_level(&ri) >= BTRFS_MAX_LEVEL)) {
1221259ee775SQu Wenruo 		generic_err(leaf, slot,
1222259ee775SQu Wenruo 			    "invalid root level, have %u expect [0, %u]",
1223c8422684SDavid Sterba 			    btrfs_root_drop_level(&ri), BTRFS_MAX_LEVEL - 1);
1224259ee775SQu Wenruo 		return -EUCLEAN;
1225259ee775SQu Wenruo 	}
1226259ee775SQu Wenruo 
1227259ee775SQu Wenruo 	/* Flags check */
1228c7c01a4aSDavid Sterba 	if (unlikely(btrfs_root_flags(&ri) & ~valid_root_flags)) {
1229259ee775SQu Wenruo 		generic_err(leaf, slot,
1230259ee775SQu Wenruo 			    "invalid root flags, have 0x%llx expect mask 0x%llx",
1231259ee775SQu Wenruo 			    btrfs_root_flags(&ri), valid_root_flags);
1232259ee775SQu Wenruo 		return -EUCLEAN;
1233259ee775SQu Wenruo 	}
1234259ee775SQu Wenruo 	return 0;
1235259ee775SQu Wenruo }
1236259ee775SQu Wenruo 
1237f82d1c7cSQu Wenruo __printf(3,4)
1238f82d1c7cSQu Wenruo __cold
1239f82d1c7cSQu Wenruo static void extent_err(const struct extent_buffer *eb, int slot,
1240f82d1c7cSQu Wenruo 		       const char *fmt, ...)
1241f82d1c7cSQu Wenruo {
1242f82d1c7cSQu Wenruo 	struct btrfs_key key;
1243f82d1c7cSQu Wenruo 	struct va_format vaf;
1244f82d1c7cSQu Wenruo 	va_list args;
1245f82d1c7cSQu Wenruo 	u64 bytenr;
1246f82d1c7cSQu Wenruo 	u64 len;
1247f82d1c7cSQu Wenruo 
1248f82d1c7cSQu Wenruo 	btrfs_item_key_to_cpu(eb, &key, slot);
1249f82d1c7cSQu Wenruo 	bytenr = key.objectid;
1250e2406a6fSQu Wenruo 	if (key.type == BTRFS_METADATA_ITEM_KEY ||
1251e2406a6fSQu Wenruo 	    key.type == BTRFS_TREE_BLOCK_REF_KEY ||
1252e2406a6fSQu Wenruo 	    key.type == BTRFS_SHARED_BLOCK_REF_KEY)
1253f82d1c7cSQu Wenruo 		len = eb->fs_info->nodesize;
1254f82d1c7cSQu Wenruo 	else
1255f82d1c7cSQu Wenruo 		len = key.offset;
1256f82d1c7cSQu Wenruo 	va_start(args, fmt);
1257f82d1c7cSQu Wenruo 
1258f82d1c7cSQu Wenruo 	vaf.fmt = fmt;
1259f82d1c7cSQu Wenruo 	vaf.va = &args;
1260f82d1c7cSQu Wenruo 
1261f82d1c7cSQu Wenruo 	btrfs_crit(eb->fs_info,
1262f82d1c7cSQu Wenruo 	"corrupt %s: block=%llu slot=%d extent bytenr=%llu len=%llu %pV",
1263f82d1c7cSQu Wenruo 		btrfs_header_level(eb) == 0 ? "leaf" : "node",
1264f82d1c7cSQu Wenruo 		eb->start, slot, bytenr, len, &vaf);
1265f82d1c7cSQu Wenruo 	va_end(args);
1266f82d1c7cSQu Wenruo }
1267f82d1c7cSQu Wenruo 
1268f82d1c7cSQu Wenruo static int check_extent_item(struct extent_buffer *leaf,
1269899b7f69SJosef Bacik 			     struct btrfs_key *key, int slot,
1270899b7f69SJosef Bacik 			     struct btrfs_key *prev_key)
1271f82d1c7cSQu Wenruo {
1272f82d1c7cSQu Wenruo 	struct btrfs_fs_info *fs_info = leaf->fs_info;
1273f82d1c7cSQu Wenruo 	struct btrfs_extent_item *ei;
1274f82d1c7cSQu Wenruo 	bool is_tree_block = false;
1275f82d1c7cSQu Wenruo 	unsigned long ptr;	/* Current pointer inside inline refs */
1276f82d1c7cSQu Wenruo 	unsigned long end;	/* Extent item end */
12773212fa14SJosef Bacik 	const u32 item_size = btrfs_item_size(leaf, slot);
1278*c1bf973fSQu Wenruo 	u8 last_type = 0;
1279*c1bf973fSQu Wenruo 	u64 last_seq = U64_MAX;
1280f82d1c7cSQu Wenruo 	u64 flags;
1281f82d1c7cSQu Wenruo 	u64 generation;
1282f82d1c7cSQu Wenruo 	u64 total_refs;		/* Total refs in btrfs_extent_item */
1283f82d1c7cSQu Wenruo 	u64 inline_refs = 0;	/* found total inline refs */
1284f82d1c7cSQu Wenruo 
1285c7c01a4aSDavid Sterba 	if (unlikely(key->type == BTRFS_METADATA_ITEM_KEY &&
1286c7c01a4aSDavid Sterba 		     !btrfs_fs_incompat(fs_info, SKINNY_METADATA))) {
1287f82d1c7cSQu Wenruo 		generic_err(leaf, slot,
1288f82d1c7cSQu Wenruo "invalid key type, METADATA_ITEM type invalid when SKINNY_METADATA feature disabled");
1289f82d1c7cSQu Wenruo 		return -EUCLEAN;
1290f82d1c7cSQu Wenruo 	}
1291f82d1c7cSQu Wenruo 	/* key->objectid is the bytenr for both key types */
1292c7c01a4aSDavid Sterba 	if (unlikely(!IS_ALIGNED(key->objectid, fs_info->sectorsize))) {
1293f82d1c7cSQu Wenruo 		generic_err(leaf, slot,
1294f82d1c7cSQu Wenruo 		"invalid key objectid, have %llu expect to be aligned to %u",
1295f82d1c7cSQu Wenruo 			   key->objectid, fs_info->sectorsize);
1296f82d1c7cSQu Wenruo 		return -EUCLEAN;
1297f82d1c7cSQu Wenruo 	}
1298f82d1c7cSQu Wenruo 
1299f82d1c7cSQu Wenruo 	/* key->offset is tree level for METADATA_ITEM_KEY */
1300c7c01a4aSDavid Sterba 	if (unlikely(key->type == BTRFS_METADATA_ITEM_KEY &&
1301c7c01a4aSDavid Sterba 		     key->offset >= BTRFS_MAX_LEVEL)) {
1302f82d1c7cSQu Wenruo 		extent_err(leaf, slot,
1303f82d1c7cSQu Wenruo 			   "invalid tree level, have %llu expect [0, %u]",
1304f82d1c7cSQu Wenruo 			   key->offset, BTRFS_MAX_LEVEL - 1);
1305f82d1c7cSQu Wenruo 		return -EUCLEAN;
1306f82d1c7cSQu Wenruo 	}
1307f82d1c7cSQu Wenruo 
1308f82d1c7cSQu Wenruo 	/*
1309f82d1c7cSQu Wenruo 	 * EXTENT/METADATA_ITEM consists of:
1310f82d1c7cSQu Wenruo 	 * 1) One btrfs_extent_item
1311f82d1c7cSQu Wenruo 	 *    Records the total refs, type and generation of the extent.
1312f82d1c7cSQu Wenruo 	 *
1313f82d1c7cSQu Wenruo 	 * 2) One btrfs_tree_block_info (for EXTENT_ITEM and tree backref only)
1314f82d1c7cSQu Wenruo 	 *    Records the first key and level of the tree block.
1315f82d1c7cSQu Wenruo 	 *
1316f82d1c7cSQu Wenruo 	 * 2) Zero or more btrfs_extent_inline_ref(s)
1317f82d1c7cSQu Wenruo 	 *    Each inline ref has one btrfs_extent_inline_ref shows:
1318f82d1c7cSQu Wenruo 	 *    2.1) The ref type, one of the 4
1319f82d1c7cSQu Wenruo 	 *         TREE_BLOCK_REF	Tree block only
1320f82d1c7cSQu Wenruo 	 *         SHARED_BLOCK_REF	Tree block only
1321f82d1c7cSQu Wenruo 	 *         EXTENT_DATA_REF	Data only
1322f82d1c7cSQu Wenruo 	 *         SHARED_DATA_REF	Data only
1323f82d1c7cSQu Wenruo 	 *    2.2) Ref type specific data
1324f82d1c7cSQu Wenruo 	 *         Either using btrfs_extent_inline_ref::offset, or specific
1325f82d1c7cSQu Wenruo 	 *         data structure.
1326*c1bf973fSQu Wenruo 	 *
1327*c1bf973fSQu Wenruo 	 *    All above inline items should follow the order:
1328*c1bf973fSQu Wenruo 	 *
1329*c1bf973fSQu Wenruo 	 *    - All btrfs_extent_inline_ref::type should be in an ascending
1330*c1bf973fSQu Wenruo 	 *      order
1331*c1bf973fSQu Wenruo 	 *
1332*c1bf973fSQu Wenruo 	 *    - Within the same type, the items should follow a descending
1333*c1bf973fSQu Wenruo 	 *      order by their sequence number. The sequence number is
1334*c1bf973fSQu Wenruo 	 *      determined by:
1335*c1bf973fSQu Wenruo 	 *      * btrfs_extent_inline_ref::offset for all types  other than
1336*c1bf973fSQu Wenruo 	 *        EXTENT_DATA_REF
1337*c1bf973fSQu Wenruo 	 *      * hash_extent_data_ref() for EXTENT_DATA_REF
1338f82d1c7cSQu Wenruo 	 */
1339c7c01a4aSDavid Sterba 	if (unlikely(item_size < sizeof(*ei))) {
1340f82d1c7cSQu Wenruo 		extent_err(leaf, slot,
1341f82d1c7cSQu Wenruo 			   "invalid item size, have %u expect [%zu, %u)",
1342f82d1c7cSQu Wenruo 			   item_size, sizeof(*ei),
1343f82d1c7cSQu Wenruo 			   BTRFS_LEAF_DATA_SIZE(fs_info));
1344f82d1c7cSQu Wenruo 		return -EUCLEAN;
1345f82d1c7cSQu Wenruo 	}
1346f82d1c7cSQu Wenruo 	end = item_size + btrfs_item_ptr_offset(leaf, slot);
1347f82d1c7cSQu Wenruo 
1348f82d1c7cSQu Wenruo 	/* Checks against extent_item */
1349f82d1c7cSQu Wenruo 	ei = btrfs_item_ptr(leaf, slot, struct btrfs_extent_item);
1350f82d1c7cSQu Wenruo 	flags = btrfs_extent_flags(leaf, ei);
1351f82d1c7cSQu Wenruo 	total_refs = btrfs_extent_refs(leaf, ei);
1352f82d1c7cSQu Wenruo 	generation = btrfs_extent_generation(leaf, ei);
1353c7c01a4aSDavid Sterba 	if (unlikely(generation >
1354c7c01a4aSDavid Sterba 		     btrfs_super_generation(fs_info->super_copy) + 1)) {
1355f82d1c7cSQu Wenruo 		extent_err(leaf, slot,
1356f82d1c7cSQu Wenruo 			   "invalid generation, have %llu expect (0, %llu]",
1357f82d1c7cSQu Wenruo 			   generation,
1358f82d1c7cSQu Wenruo 			   btrfs_super_generation(fs_info->super_copy) + 1);
1359f82d1c7cSQu Wenruo 		return -EUCLEAN;
1360f82d1c7cSQu Wenruo 	}
1361c7c01a4aSDavid Sterba 	if (unlikely(!has_single_bit_set(flags & (BTRFS_EXTENT_FLAG_DATA |
1362c7c01a4aSDavid Sterba 						  BTRFS_EXTENT_FLAG_TREE_BLOCK)))) {
1363f82d1c7cSQu Wenruo 		extent_err(leaf, slot,
1364f82d1c7cSQu Wenruo 		"invalid extent flag, have 0x%llx expect 1 bit set in 0x%llx",
1365f82d1c7cSQu Wenruo 			flags, BTRFS_EXTENT_FLAG_DATA |
1366f82d1c7cSQu Wenruo 			BTRFS_EXTENT_FLAG_TREE_BLOCK);
1367f82d1c7cSQu Wenruo 		return -EUCLEAN;
1368f82d1c7cSQu Wenruo 	}
1369f82d1c7cSQu Wenruo 	is_tree_block = !!(flags & BTRFS_EXTENT_FLAG_TREE_BLOCK);
1370f82d1c7cSQu Wenruo 	if (is_tree_block) {
1371c7c01a4aSDavid Sterba 		if (unlikely(key->type == BTRFS_EXTENT_ITEM_KEY &&
1372c7c01a4aSDavid Sterba 			     key->offset != fs_info->nodesize)) {
1373f82d1c7cSQu Wenruo 			extent_err(leaf, slot,
1374f82d1c7cSQu Wenruo 				   "invalid extent length, have %llu expect %u",
1375f82d1c7cSQu Wenruo 				   key->offset, fs_info->nodesize);
1376f82d1c7cSQu Wenruo 			return -EUCLEAN;
1377f82d1c7cSQu Wenruo 		}
1378f82d1c7cSQu Wenruo 	} else {
1379c7c01a4aSDavid Sterba 		if (unlikely(key->type != BTRFS_EXTENT_ITEM_KEY)) {
1380f82d1c7cSQu Wenruo 			extent_err(leaf, slot,
1381f82d1c7cSQu Wenruo 			"invalid key type, have %u expect %u for data backref",
1382f82d1c7cSQu Wenruo 				   key->type, BTRFS_EXTENT_ITEM_KEY);
1383f82d1c7cSQu Wenruo 			return -EUCLEAN;
1384f82d1c7cSQu Wenruo 		}
1385c7c01a4aSDavid Sterba 		if (unlikely(!IS_ALIGNED(key->offset, fs_info->sectorsize))) {
1386f82d1c7cSQu Wenruo 			extent_err(leaf, slot,
1387f82d1c7cSQu Wenruo 			"invalid extent length, have %llu expect aligned to %u",
1388f82d1c7cSQu Wenruo 				   key->offset, fs_info->sectorsize);
1389f82d1c7cSQu Wenruo 			return -EUCLEAN;
1390f82d1c7cSQu Wenruo 		}
13910ebb6bbbSJosef Bacik 		if (unlikely(flags & BTRFS_BLOCK_FLAG_FULL_BACKREF)) {
13920ebb6bbbSJosef Bacik 			extent_err(leaf, slot,
13930ebb6bbbSJosef Bacik 			"invalid extent flag, data has full backref set");
13940ebb6bbbSJosef Bacik 			return -EUCLEAN;
13950ebb6bbbSJosef Bacik 		}
1396f82d1c7cSQu Wenruo 	}
1397f82d1c7cSQu Wenruo 	ptr = (unsigned long)(struct btrfs_extent_item *)(ei + 1);
1398f82d1c7cSQu Wenruo 
1399f82d1c7cSQu Wenruo 	/* Check the special case of btrfs_tree_block_info */
1400f82d1c7cSQu Wenruo 	if (is_tree_block && key->type != BTRFS_METADATA_ITEM_KEY) {
1401f82d1c7cSQu Wenruo 		struct btrfs_tree_block_info *info;
1402f82d1c7cSQu Wenruo 
1403f82d1c7cSQu Wenruo 		info = (struct btrfs_tree_block_info *)ptr;
1404c7c01a4aSDavid Sterba 		if (unlikely(btrfs_tree_block_level(leaf, info) >= BTRFS_MAX_LEVEL)) {
1405f82d1c7cSQu Wenruo 			extent_err(leaf, slot,
1406f82d1c7cSQu Wenruo 			"invalid tree block info level, have %u expect [0, %u]",
1407f82d1c7cSQu Wenruo 				   btrfs_tree_block_level(leaf, info),
1408f82d1c7cSQu Wenruo 				   BTRFS_MAX_LEVEL - 1);
1409f82d1c7cSQu Wenruo 			return -EUCLEAN;
1410f82d1c7cSQu Wenruo 		}
1411f82d1c7cSQu Wenruo 		ptr = (unsigned long)(struct btrfs_tree_block_info *)(info + 1);
1412f82d1c7cSQu Wenruo 	}
1413f82d1c7cSQu Wenruo 
1414f82d1c7cSQu Wenruo 	/* Check inline refs */
1415f82d1c7cSQu Wenruo 	while (ptr < end) {
1416f82d1c7cSQu Wenruo 		struct btrfs_extent_inline_ref *iref;
1417f82d1c7cSQu Wenruo 		struct btrfs_extent_data_ref *dref;
1418f82d1c7cSQu Wenruo 		struct btrfs_shared_data_ref *sref;
1419*c1bf973fSQu Wenruo 		u64 seq;
1420f82d1c7cSQu Wenruo 		u64 dref_offset;
1421f82d1c7cSQu Wenruo 		u64 inline_offset;
1422f82d1c7cSQu Wenruo 		u8 inline_type;
1423f82d1c7cSQu Wenruo 
1424c7c01a4aSDavid Sterba 		if (unlikely(ptr + sizeof(*iref) > end)) {
1425f82d1c7cSQu Wenruo 			extent_err(leaf, slot,
1426f82d1c7cSQu Wenruo "inline ref item overflows extent item, ptr %lu iref size %zu end %lu",
1427f82d1c7cSQu Wenruo 				   ptr, sizeof(*iref), end);
1428f82d1c7cSQu Wenruo 			return -EUCLEAN;
1429f82d1c7cSQu Wenruo 		}
1430f82d1c7cSQu Wenruo 		iref = (struct btrfs_extent_inline_ref *)ptr;
1431f82d1c7cSQu Wenruo 		inline_type = btrfs_extent_inline_ref_type(leaf, iref);
1432f82d1c7cSQu Wenruo 		inline_offset = btrfs_extent_inline_ref_offset(leaf, iref);
1433*c1bf973fSQu Wenruo 		seq = inline_offset;
1434c7c01a4aSDavid Sterba 		if (unlikely(ptr + btrfs_extent_inline_ref_size(inline_type) > end)) {
1435f82d1c7cSQu Wenruo 			extent_err(leaf, slot,
1436f82d1c7cSQu Wenruo "inline ref item overflows extent item, ptr %lu iref size %u end %lu",
1437ad854a86SChung-Chiang Cheng 				   ptr, btrfs_extent_inline_ref_size(inline_type), end);
1438f82d1c7cSQu Wenruo 			return -EUCLEAN;
1439f82d1c7cSQu Wenruo 		}
1440f82d1c7cSQu Wenruo 
1441f82d1c7cSQu Wenruo 		switch (inline_type) {
1442f82d1c7cSQu Wenruo 		/* inline_offset is subvolid of the owner, no need to check */
1443f82d1c7cSQu Wenruo 		case BTRFS_TREE_BLOCK_REF_KEY:
1444f82d1c7cSQu Wenruo 			inline_refs++;
1445f82d1c7cSQu Wenruo 			break;
1446f82d1c7cSQu Wenruo 		/* Contains parent bytenr */
1447f82d1c7cSQu Wenruo 		case BTRFS_SHARED_BLOCK_REF_KEY:
1448c7c01a4aSDavid Sterba 			if (unlikely(!IS_ALIGNED(inline_offset,
1449c7c01a4aSDavid Sterba 						 fs_info->sectorsize))) {
1450f82d1c7cSQu Wenruo 				extent_err(leaf, slot,
1451f82d1c7cSQu Wenruo 		"invalid tree parent bytenr, have %llu expect aligned to %u",
1452f82d1c7cSQu Wenruo 					   inline_offset, fs_info->sectorsize);
1453f82d1c7cSQu Wenruo 				return -EUCLEAN;
1454f82d1c7cSQu Wenruo 			}
1455f82d1c7cSQu Wenruo 			inline_refs++;
1456f82d1c7cSQu Wenruo 			break;
1457f82d1c7cSQu Wenruo 		/*
1458f82d1c7cSQu Wenruo 		 * Contains owner subvolid, owner key objectid, adjusted offset.
1459f82d1c7cSQu Wenruo 		 * The only obvious corruption can happen in that offset.
1460f82d1c7cSQu Wenruo 		 */
1461f82d1c7cSQu Wenruo 		case BTRFS_EXTENT_DATA_REF_KEY:
1462f82d1c7cSQu Wenruo 			dref = (struct btrfs_extent_data_ref *)(&iref->offset);
1463f82d1c7cSQu Wenruo 			dref_offset = btrfs_extent_data_ref_offset(leaf, dref);
1464*c1bf973fSQu Wenruo 			seq = hash_extent_data_ref(
1465*c1bf973fSQu Wenruo 					btrfs_extent_data_ref_root(leaf, dref),
1466*c1bf973fSQu Wenruo 					btrfs_extent_data_ref_objectid(leaf, dref),
1467*c1bf973fSQu Wenruo 					btrfs_extent_data_ref_offset(leaf, dref));
1468c7c01a4aSDavid Sterba 			if (unlikely(!IS_ALIGNED(dref_offset,
1469c7c01a4aSDavid Sterba 						 fs_info->sectorsize))) {
1470f82d1c7cSQu Wenruo 				extent_err(leaf, slot,
1471f82d1c7cSQu Wenruo 		"invalid data ref offset, have %llu expect aligned to %u",
1472f82d1c7cSQu Wenruo 					   dref_offset, fs_info->sectorsize);
1473f82d1c7cSQu Wenruo 				return -EUCLEAN;
1474f82d1c7cSQu Wenruo 			}
1475f82d1c7cSQu Wenruo 			inline_refs += btrfs_extent_data_ref_count(leaf, dref);
1476f82d1c7cSQu Wenruo 			break;
1477f82d1c7cSQu Wenruo 		/* Contains parent bytenr and ref count */
1478f82d1c7cSQu Wenruo 		case BTRFS_SHARED_DATA_REF_KEY:
1479f82d1c7cSQu Wenruo 			sref = (struct btrfs_shared_data_ref *)(iref + 1);
1480c7c01a4aSDavid Sterba 			if (unlikely(!IS_ALIGNED(inline_offset,
1481c7c01a4aSDavid Sterba 						 fs_info->sectorsize))) {
1482f82d1c7cSQu Wenruo 				extent_err(leaf, slot,
1483f82d1c7cSQu Wenruo 		"invalid data parent bytenr, have %llu expect aligned to %u",
1484f82d1c7cSQu Wenruo 					   inline_offset, fs_info->sectorsize);
1485f82d1c7cSQu Wenruo 				return -EUCLEAN;
1486f82d1c7cSQu Wenruo 			}
1487f82d1c7cSQu Wenruo 			inline_refs += btrfs_shared_data_ref_count(leaf, sref);
1488f82d1c7cSQu Wenruo 			break;
1489f82d1c7cSQu Wenruo 		default:
1490f82d1c7cSQu Wenruo 			extent_err(leaf, slot, "unknown inline ref type: %u",
1491f82d1c7cSQu Wenruo 				   inline_type);
1492f82d1c7cSQu Wenruo 			return -EUCLEAN;
1493f82d1c7cSQu Wenruo 		}
1494*c1bf973fSQu Wenruo 		if (inline_type < last_type) {
1495*c1bf973fSQu Wenruo 			extent_err(leaf, slot,
1496*c1bf973fSQu Wenruo 				   "inline ref out-of-order: has type %u, prev type %u",
1497*c1bf973fSQu Wenruo 				   inline_type, last_type);
1498*c1bf973fSQu Wenruo 			return -EUCLEAN;
1499*c1bf973fSQu Wenruo 		}
1500*c1bf973fSQu Wenruo 		/* Type changed, allow the sequence starts from U64_MAX again. */
1501*c1bf973fSQu Wenruo 		if (inline_type > last_type)
1502*c1bf973fSQu Wenruo 			last_seq = U64_MAX;
1503*c1bf973fSQu Wenruo 		if (seq > last_seq) {
1504*c1bf973fSQu Wenruo 			extent_err(leaf, slot,
1505*c1bf973fSQu Wenruo "inline ref out-of-order: has type %u offset %llu seq 0x%llx, prev type %u seq 0x%llx",
1506*c1bf973fSQu Wenruo 				   inline_type, inline_offset, seq,
1507*c1bf973fSQu Wenruo 				   last_type, last_seq);
1508*c1bf973fSQu Wenruo 			return -EUCLEAN;
1509*c1bf973fSQu Wenruo 		}
1510*c1bf973fSQu Wenruo 		last_type = inline_type;
1511*c1bf973fSQu Wenruo 		last_seq = seq;
1512f82d1c7cSQu Wenruo 		ptr += btrfs_extent_inline_ref_size(inline_type);
1513f82d1c7cSQu Wenruo 	}
1514f82d1c7cSQu Wenruo 	/* No padding is allowed */
1515c7c01a4aSDavid Sterba 	if (unlikely(ptr != end)) {
1516f82d1c7cSQu Wenruo 		extent_err(leaf, slot,
1517f82d1c7cSQu Wenruo 			   "invalid extent item size, padding bytes found");
1518f82d1c7cSQu Wenruo 		return -EUCLEAN;
1519f82d1c7cSQu Wenruo 	}
1520f82d1c7cSQu Wenruo 
1521f82d1c7cSQu Wenruo 	/* Finally, check the inline refs against total refs */
1522c7c01a4aSDavid Sterba 	if (unlikely(inline_refs > total_refs)) {
1523f82d1c7cSQu Wenruo 		extent_err(leaf, slot,
1524f82d1c7cSQu Wenruo 			"invalid extent refs, have %llu expect >= inline %llu",
1525f82d1c7cSQu Wenruo 			   total_refs, inline_refs);
1526f82d1c7cSQu Wenruo 		return -EUCLEAN;
1527f82d1c7cSQu Wenruo 	}
1528899b7f69SJosef Bacik 
1529899b7f69SJosef Bacik 	if ((prev_key->type == BTRFS_EXTENT_ITEM_KEY) ||
1530899b7f69SJosef Bacik 	    (prev_key->type == BTRFS_METADATA_ITEM_KEY)) {
1531899b7f69SJosef Bacik 		u64 prev_end = prev_key->objectid;
1532899b7f69SJosef Bacik 
1533899b7f69SJosef Bacik 		if (prev_key->type == BTRFS_METADATA_ITEM_KEY)
1534899b7f69SJosef Bacik 			prev_end += fs_info->nodesize;
1535899b7f69SJosef Bacik 		else
1536899b7f69SJosef Bacik 			prev_end += prev_key->offset;
1537899b7f69SJosef Bacik 
1538899b7f69SJosef Bacik 		if (unlikely(prev_end > key->objectid)) {
1539899b7f69SJosef Bacik 			extent_err(leaf, slot,
1540899b7f69SJosef Bacik 	"previous extent [%llu %u %llu] overlaps current extent [%llu %u %llu]",
1541899b7f69SJosef Bacik 				   prev_key->objectid, prev_key->type,
1542899b7f69SJosef Bacik 				   prev_key->offset, key->objectid, key->type,
1543899b7f69SJosef Bacik 				   key->offset);
1544899b7f69SJosef Bacik 			return -EUCLEAN;
1545899b7f69SJosef Bacik 		}
1546899b7f69SJosef Bacik 	}
1547899b7f69SJosef Bacik 
1548f82d1c7cSQu Wenruo 	return 0;
1549f82d1c7cSQu Wenruo }
1550f82d1c7cSQu Wenruo 
1551e2406a6fSQu Wenruo static int check_simple_keyed_refs(struct extent_buffer *leaf,
1552e2406a6fSQu Wenruo 				   struct btrfs_key *key, int slot)
1553e2406a6fSQu Wenruo {
1554e2406a6fSQu Wenruo 	u32 expect_item_size = 0;
1555e2406a6fSQu Wenruo 
1556e2406a6fSQu Wenruo 	if (key->type == BTRFS_SHARED_DATA_REF_KEY)
1557e2406a6fSQu Wenruo 		expect_item_size = sizeof(struct btrfs_shared_data_ref);
1558e2406a6fSQu Wenruo 
15593212fa14SJosef Bacik 	if (unlikely(btrfs_item_size(leaf, slot) != expect_item_size)) {
1560e2406a6fSQu Wenruo 		generic_err(leaf, slot,
1561e2406a6fSQu Wenruo 		"invalid item size, have %u expect %u for key type %u",
15623212fa14SJosef Bacik 			    btrfs_item_size(leaf, slot),
1563e2406a6fSQu Wenruo 			    expect_item_size, key->type);
1564e2406a6fSQu Wenruo 		return -EUCLEAN;
1565e2406a6fSQu Wenruo 	}
1566c7c01a4aSDavid Sterba 	if (unlikely(!IS_ALIGNED(key->objectid, leaf->fs_info->sectorsize))) {
1567e2406a6fSQu Wenruo 		generic_err(leaf, slot,
1568e2406a6fSQu Wenruo "invalid key objectid for shared block ref, have %llu expect aligned to %u",
1569e2406a6fSQu Wenruo 			    key->objectid, leaf->fs_info->sectorsize);
1570e2406a6fSQu Wenruo 		return -EUCLEAN;
1571e2406a6fSQu Wenruo 	}
1572c7c01a4aSDavid Sterba 	if (unlikely(key->type != BTRFS_TREE_BLOCK_REF_KEY &&
1573c7c01a4aSDavid Sterba 		     !IS_ALIGNED(key->offset, leaf->fs_info->sectorsize))) {
1574e2406a6fSQu Wenruo 		extent_err(leaf, slot,
1575e2406a6fSQu Wenruo 		"invalid tree parent bytenr, have %llu expect aligned to %u",
1576e2406a6fSQu Wenruo 			   key->offset, leaf->fs_info->sectorsize);
1577e2406a6fSQu Wenruo 		return -EUCLEAN;
1578e2406a6fSQu Wenruo 	}
1579e2406a6fSQu Wenruo 	return 0;
1580e2406a6fSQu Wenruo }
1581e2406a6fSQu Wenruo 
15820785a9aaSQu Wenruo static int check_extent_data_ref(struct extent_buffer *leaf,
15830785a9aaSQu Wenruo 				 struct btrfs_key *key, int slot)
15840785a9aaSQu Wenruo {
15850785a9aaSQu Wenruo 	struct btrfs_extent_data_ref *dref;
15860785a9aaSQu Wenruo 	unsigned long ptr = btrfs_item_ptr_offset(leaf, slot);
15873212fa14SJosef Bacik 	const unsigned long end = ptr + btrfs_item_size(leaf, slot);
15880785a9aaSQu Wenruo 
15893212fa14SJosef Bacik 	if (unlikely(btrfs_item_size(leaf, slot) % sizeof(*dref) != 0)) {
15900785a9aaSQu Wenruo 		generic_err(leaf, slot,
15910785a9aaSQu Wenruo 	"invalid item size, have %u expect aligned to %zu for key type %u",
15923212fa14SJosef Bacik 			    btrfs_item_size(leaf, slot),
15930785a9aaSQu Wenruo 			    sizeof(*dref), key->type);
15946d06b0adSDavid Sterba 		return -EUCLEAN;
15950785a9aaSQu Wenruo 	}
1596c7c01a4aSDavid Sterba 	if (unlikely(!IS_ALIGNED(key->objectid, leaf->fs_info->sectorsize))) {
15970785a9aaSQu Wenruo 		generic_err(leaf, slot,
15980785a9aaSQu Wenruo "invalid key objectid for shared block ref, have %llu expect aligned to %u",
15990785a9aaSQu Wenruo 			    key->objectid, leaf->fs_info->sectorsize);
16000785a9aaSQu Wenruo 		return -EUCLEAN;
16010785a9aaSQu Wenruo 	}
16020785a9aaSQu Wenruo 	for (; ptr < end; ptr += sizeof(*dref)) {
16030785a9aaSQu Wenruo 		u64 offset;
16040785a9aaSQu Wenruo 
16051119a72eSJosef Bacik 		/*
16061119a72eSJosef Bacik 		 * We cannot check the extent_data_ref hash due to possible
16071119a72eSJosef Bacik 		 * overflow from the leaf due to hash collisions.
16081119a72eSJosef Bacik 		 */
16090785a9aaSQu Wenruo 		dref = (struct btrfs_extent_data_ref *)ptr;
16100785a9aaSQu Wenruo 		offset = btrfs_extent_data_ref_offset(leaf, dref);
1611c7c01a4aSDavid Sterba 		if (unlikely(!IS_ALIGNED(offset, leaf->fs_info->sectorsize))) {
16120785a9aaSQu Wenruo 			extent_err(leaf, slot,
16130785a9aaSQu Wenruo 	"invalid extent data backref offset, have %llu expect aligned to %u",
16140785a9aaSQu Wenruo 				   offset, leaf->fs_info->sectorsize);
16156d06b0adSDavid Sterba 			return -EUCLEAN;
16160785a9aaSQu Wenruo 		}
16170785a9aaSQu Wenruo 	}
16180785a9aaSQu Wenruo 	return 0;
16190785a9aaSQu Wenruo }
16200785a9aaSQu Wenruo 
1621c3053ebbSQu Wenruo #define inode_ref_err(eb, slot, fmt, args...)			\
1622c3053ebbSQu Wenruo 	inode_item_err(eb, slot, fmt, ##args)
162371bf92a9SQu Wenruo static int check_inode_ref(struct extent_buffer *leaf,
162471bf92a9SQu Wenruo 			   struct btrfs_key *key, struct btrfs_key *prev_key,
162571bf92a9SQu Wenruo 			   int slot)
162671bf92a9SQu Wenruo {
162771bf92a9SQu Wenruo 	struct btrfs_inode_ref *iref;
162871bf92a9SQu Wenruo 	unsigned long ptr;
162971bf92a9SQu Wenruo 	unsigned long end;
163071bf92a9SQu Wenruo 
1631c7c01a4aSDavid Sterba 	if (unlikely(!check_prev_ino(leaf, key, slot, prev_key)))
163280d7fd1eSQu Wenruo 		return -EUCLEAN;
163371bf92a9SQu Wenruo 	/* namelen can't be 0, so item_size == sizeof() is also invalid */
16343212fa14SJosef Bacik 	if (unlikely(btrfs_item_size(leaf, slot) <= sizeof(*iref))) {
1635c3053ebbSQu Wenruo 		inode_ref_err(leaf, slot,
163671bf92a9SQu Wenruo 			"invalid item size, have %u expect (%zu, %u)",
16373212fa14SJosef Bacik 			btrfs_item_size(leaf, slot),
163871bf92a9SQu Wenruo 			sizeof(*iref), BTRFS_LEAF_DATA_SIZE(leaf->fs_info));
163971bf92a9SQu Wenruo 		return -EUCLEAN;
164071bf92a9SQu Wenruo 	}
164171bf92a9SQu Wenruo 
164271bf92a9SQu Wenruo 	ptr = btrfs_item_ptr_offset(leaf, slot);
16433212fa14SJosef Bacik 	end = ptr + btrfs_item_size(leaf, slot);
164471bf92a9SQu Wenruo 	while (ptr < end) {
164571bf92a9SQu Wenruo 		u16 namelen;
164671bf92a9SQu Wenruo 
1647c7c01a4aSDavid Sterba 		if (unlikely(ptr + sizeof(iref) > end)) {
1648c3053ebbSQu Wenruo 			inode_ref_err(leaf, slot,
164971bf92a9SQu Wenruo 			"inode ref overflow, ptr %lu end %lu inode_ref_size %zu",
165071bf92a9SQu Wenruo 				ptr, end, sizeof(iref));
165171bf92a9SQu Wenruo 			return -EUCLEAN;
165271bf92a9SQu Wenruo 		}
165371bf92a9SQu Wenruo 
165471bf92a9SQu Wenruo 		iref = (struct btrfs_inode_ref *)ptr;
165571bf92a9SQu Wenruo 		namelen = btrfs_inode_ref_name_len(leaf, iref);
1656c7c01a4aSDavid Sterba 		if (unlikely(ptr + sizeof(*iref) + namelen > end)) {
1657c3053ebbSQu Wenruo 			inode_ref_err(leaf, slot,
165871bf92a9SQu Wenruo 				"inode ref overflow, ptr %lu end %lu namelen %u",
165971bf92a9SQu Wenruo 				ptr, end, namelen);
166071bf92a9SQu Wenruo 			return -EUCLEAN;
166171bf92a9SQu Wenruo 		}
166271bf92a9SQu Wenruo 
166371bf92a9SQu Wenruo 		/*
166471bf92a9SQu Wenruo 		 * NOTE: In theory we should record all found index numbers
166571bf92a9SQu Wenruo 		 * to find any duplicated indexes, but that will be too time
166671bf92a9SQu Wenruo 		 * consuming for inodes with too many hard links.
166771bf92a9SQu Wenruo 		 */
166871bf92a9SQu Wenruo 		ptr += sizeof(*iref) + namelen;
166971bf92a9SQu Wenruo 	}
167071bf92a9SQu Wenruo 	return 0;
167171bf92a9SQu Wenruo }
167271bf92a9SQu Wenruo 
167382fc28fbSQu Wenruo /*
1674557ea5ddSQu Wenruo  * Common point to switch the item-specific validation.
1675557ea5ddSQu Wenruo  */
1676c8d54215SJosef Bacik static enum btrfs_tree_block_status check_leaf_item(struct extent_buffer *leaf,
1677c8d54215SJosef Bacik 						    struct btrfs_key *key,
1678c8d54215SJosef Bacik 						    int slot,
16794e9845efSFilipe Manana 						    struct btrfs_key *prev_key)
1680557ea5ddSQu Wenruo {
1681557ea5ddSQu Wenruo 	int ret = 0;
1682075cb3c7SQu Wenruo 	struct btrfs_chunk *chunk;
1683557ea5ddSQu Wenruo 
1684557ea5ddSQu Wenruo 	switch (key->type) {
1685557ea5ddSQu Wenruo 	case BTRFS_EXTENT_DATA_KEY:
16864e9845efSFilipe Manana 		ret = check_extent_data_item(leaf, key, slot, prev_key);
1687557ea5ddSQu Wenruo 		break;
1688557ea5ddSQu Wenruo 	case BTRFS_EXTENT_CSUM_KEY:
1689ad1d8c43SFilipe Manana 		ret = check_csum_item(leaf, key, slot, prev_key);
1690557ea5ddSQu Wenruo 		break;
1691ad7b0368SQu Wenruo 	case BTRFS_DIR_ITEM_KEY:
1692ad7b0368SQu Wenruo 	case BTRFS_DIR_INDEX_KEY:
1693ad7b0368SQu Wenruo 	case BTRFS_XATTR_ITEM_KEY:
1694c18679ebSQu Wenruo 		ret = check_dir_item(leaf, key, prev_key, slot);
1695ad7b0368SQu Wenruo 		break;
169671bf92a9SQu Wenruo 	case BTRFS_INODE_REF_KEY:
169771bf92a9SQu Wenruo 		ret = check_inode_ref(leaf, key, prev_key, slot);
169871bf92a9SQu Wenruo 		break;
1699fce466eaSQu Wenruo 	case BTRFS_BLOCK_GROUP_ITEM_KEY:
1700af60ce2bSDavid Sterba 		ret = check_block_group_item(leaf, key, slot);
1701fce466eaSQu Wenruo 		break;
1702075cb3c7SQu Wenruo 	case BTRFS_CHUNK_ITEM_KEY:
1703075cb3c7SQu Wenruo 		chunk = btrfs_item_ptr(leaf, slot, struct btrfs_chunk);
1704f6d2a5c2SQu Wenruo 		ret = check_leaf_chunk_item(leaf, chunk, key, slot);
1705075cb3c7SQu Wenruo 		break;
1706ab4ba2e1SQu Wenruo 	case BTRFS_DEV_ITEM_KEY:
1707412a2312SDavid Sterba 		ret = check_dev_item(leaf, key, slot);
1708ab4ba2e1SQu Wenruo 		break;
1709496245caSQu Wenruo 	case BTRFS_INODE_ITEM_KEY:
171039e57f49SDavid Sterba 		ret = check_inode_item(leaf, key, slot);
1711496245caSQu Wenruo 		break;
1712259ee775SQu Wenruo 	case BTRFS_ROOT_ITEM_KEY:
1713259ee775SQu Wenruo 		ret = check_root_item(leaf, key, slot);
1714259ee775SQu Wenruo 		break;
1715f82d1c7cSQu Wenruo 	case BTRFS_EXTENT_ITEM_KEY:
1716f82d1c7cSQu Wenruo 	case BTRFS_METADATA_ITEM_KEY:
1717899b7f69SJosef Bacik 		ret = check_extent_item(leaf, key, slot, prev_key);
1718f82d1c7cSQu Wenruo 		break;
1719e2406a6fSQu Wenruo 	case BTRFS_TREE_BLOCK_REF_KEY:
1720e2406a6fSQu Wenruo 	case BTRFS_SHARED_DATA_REF_KEY:
1721e2406a6fSQu Wenruo 	case BTRFS_SHARED_BLOCK_REF_KEY:
1722e2406a6fSQu Wenruo 		ret = check_simple_keyed_refs(leaf, key, slot);
1723e2406a6fSQu Wenruo 		break;
17240785a9aaSQu Wenruo 	case BTRFS_EXTENT_DATA_REF_KEY:
17250785a9aaSQu Wenruo 		ret = check_extent_data_ref(leaf, key, slot);
17260785a9aaSQu Wenruo 		break;
1727557ea5ddSQu Wenruo 	}
1728c8d54215SJosef Bacik 
1729c8d54215SJosef Bacik 	if (ret)
1730c8d54215SJosef Bacik 		return BTRFS_TREE_BLOCK_INVALID_ITEM;
1731c8d54215SJosef Bacik 	return BTRFS_TREE_BLOCK_CLEAN;
1732557ea5ddSQu Wenruo }
1733557ea5ddSQu Wenruo 
1734924452c8SJosef Bacik enum btrfs_tree_block_status __btrfs_check_leaf(struct extent_buffer *leaf)
1735557ea5ddSQu Wenruo {
1736e2ccd361SDavid Sterba 	struct btrfs_fs_info *fs_info = leaf->fs_info;
1737557ea5ddSQu Wenruo 	/* No valid key type is 0, so all key should be larger than this key */
1738557ea5ddSQu Wenruo 	struct btrfs_key prev_key = {0, 0, 0};
1739557ea5ddSQu Wenruo 	struct btrfs_key key;
1740557ea5ddSQu Wenruo 	u32 nritems = btrfs_header_nritems(leaf);
1741557ea5ddSQu Wenruo 	int slot;
1742557ea5ddSQu Wenruo 
1743c7c01a4aSDavid Sterba 	if (unlikely(btrfs_header_level(leaf) != 0)) {
174486a6be3aSDavid Sterba 		generic_err(leaf, 0,
1745f556faa4SQu Wenruo 			"invalid level for leaf, have %d expect 0",
1746f556faa4SQu Wenruo 			btrfs_header_level(leaf));
1747924452c8SJosef Bacik 		return BTRFS_TREE_BLOCK_INVALID_LEVEL;
1748f556faa4SQu Wenruo 	}
1749f556faa4SQu Wenruo 
1750557ea5ddSQu Wenruo 	/*
1751557ea5ddSQu Wenruo 	 * Extent buffers from a relocation tree have a owner field that
1752557ea5ddSQu Wenruo 	 * corresponds to the subvolume tree they are based on. So just from an
1753557ea5ddSQu Wenruo 	 * extent buffer alone we can not find out what is the id of the
1754557ea5ddSQu Wenruo 	 * corresponding subvolume tree, so we can not figure out if the extent
1755557ea5ddSQu Wenruo 	 * buffer corresponds to the root of the relocation tree or not. So
1756557ea5ddSQu Wenruo 	 * skip this check for relocation trees.
1757557ea5ddSQu Wenruo 	 */
1758557ea5ddSQu Wenruo 	if (nritems == 0 && !btrfs_header_flag(leaf, BTRFS_HEADER_FLAG_RELOC)) {
1759ba480dd4SQu Wenruo 		u64 owner = btrfs_header_owner(leaf);
1760557ea5ddSQu Wenruo 
1761ba480dd4SQu Wenruo 		/* These trees must never be empty */
1762c7c01a4aSDavid Sterba 		if (unlikely(owner == BTRFS_ROOT_TREE_OBJECTID ||
1763ba480dd4SQu Wenruo 			     owner == BTRFS_CHUNK_TREE_OBJECTID ||
1764ba480dd4SQu Wenruo 			     owner == BTRFS_DEV_TREE_OBJECTID ||
1765ba480dd4SQu Wenruo 			     owner == BTRFS_FS_TREE_OBJECTID ||
1766c7c01a4aSDavid Sterba 			     owner == BTRFS_DATA_RELOC_TREE_OBJECTID)) {
176786a6be3aSDavid Sterba 			generic_err(leaf, 0,
1768ba480dd4SQu Wenruo 			"invalid root, root %llu must never be empty",
1769ba480dd4SQu Wenruo 				    owner);
1770924452c8SJosef Bacik 			return BTRFS_TREE_BLOCK_INVALID_NRITEMS;
1771ba480dd4SQu Wenruo 		}
1772c2fa821cSJosef Bacik 
177362fdaa52SQu Wenruo 		/* Unknown tree */
1774c7c01a4aSDavid Sterba 		if (unlikely(owner == 0)) {
177562fdaa52SQu Wenruo 			generic_err(leaf, 0,
177662fdaa52SQu Wenruo 				"invalid owner, root 0 is not defined");
1777924452c8SJosef Bacik 			return BTRFS_TREE_BLOCK_INVALID_OWNER;
177862fdaa52SQu Wenruo 		}
1779c2fa821cSJosef Bacik 
1780c2fa821cSJosef Bacik 		/* EXTENT_TREE_V2 can have empty extent trees. */
1781c2fa821cSJosef Bacik 		if (btrfs_fs_incompat(fs_info, EXTENT_TREE_V2))
1782924452c8SJosef Bacik 			return BTRFS_TREE_BLOCK_CLEAN;
1783c2fa821cSJosef Bacik 
1784c2fa821cSJosef Bacik 		if (unlikely(owner == BTRFS_EXTENT_TREE_OBJECTID)) {
1785c2fa821cSJosef Bacik 			generic_err(leaf, 0,
1786c2fa821cSJosef Bacik 			"invalid root, root %llu must never be empty",
1787c2fa821cSJosef Bacik 				    owner);
1788924452c8SJosef Bacik 			return BTRFS_TREE_BLOCK_INVALID_NRITEMS;
1789c2fa821cSJosef Bacik 		}
1790c2fa821cSJosef Bacik 
1791924452c8SJosef Bacik 		return BTRFS_TREE_BLOCK_CLEAN;
1792557ea5ddSQu Wenruo 	}
1793557ea5ddSQu Wenruo 
1794c7c01a4aSDavid Sterba 	if (unlikely(nritems == 0))
1795924452c8SJosef Bacik 		return BTRFS_TREE_BLOCK_CLEAN;
1796557ea5ddSQu Wenruo 
1797557ea5ddSQu Wenruo 	/*
1798557ea5ddSQu Wenruo 	 * Check the following things to make sure this is a good leaf, and
1799557ea5ddSQu Wenruo 	 * leaf users won't need to bother with similar sanity checks:
1800557ea5ddSQu Wenruo 	 *
1801557ea5ddSQu Wenruo 	 * 1) key ordering
1802557ea5ddSQu Wenruo 	 * 2) item offset and size
1803557ea5ddSQu Wenruo 	 *    No overlap, no hole, all inside the leaf.
1804557ea5ddSQu Wenruo 	 * 3) item content
1805557ea5ddSQu Wenruo 	 *    If possible, do comprehensive sanity check.
1806557ea5ddSQu Wenruo 	 *    NOTE: All checks must only rely on the item data itself.
1807557ea5ddSQu Wenruo 	 */
1808557ea5ddSQu Wenruo 	for (slot = 0; slot < nritems; slot++) {
1809557ea5ddSQu Wenruo 		u32 item_end_expected;
1810a6ab66ebSSu Yue 		u64 item_data_end;
1811557ea5ddSQu Wenruo 
1812557ea5ddSQu Wenruo 		btrfs_item_key_to_cpu(leaf, &key, slot);
1813557ea5ddSQu Wenruo 
1814557ea5ddSQu Wenruo 		/* Make sure the keys are in the right order */
1815c7c01a4aSDavid Sterba 		if (unlikely(btrfs_comp_cpu_keys(&prev_key, &key) >= 0)) {
181686a6be3aSDavid Sterba 			generic_err(leaf, slot,
1817478d01b3SQu Wenruo 	"bad key order, prev (%llu %u %llu) current (%llu %u %llu)",
1818478d01b3SQu Wenruo 				prev_key.objectid, prev_key.type,
1819478d01b3SQu Wenruo 				prev_key.offset, key.objectid, key.type,
1820478d01b3SQu Wenruo 				key.offset);
1821924452c8SJosef Bacik 			return BTRFS_TREE_BLOCK_BAD_KEY_ORDER;
1822557ea5ddSQu Wenruo 		}
1823557ea5ddSQu Wenruo 
1824a6ab66ebSSu Yue 		item_data_end = (u64)btrfs_item_offset(leaf, slot) +
1825a6ab66ebSSu Yue 				btrfs_item_size(leaf, slot);
1826557ea5ddSQu Wenruo 		/*
1827557ea5ddSQu Wenruo 		 * Make sure the offset and ends are right, remember that the
1828557ea5ddSQu Wenruo 		 * item data starts at the end of the leaf and grows towards the
1829557ea5ddSQu Wenruo 		 * front.
1830557ea5ddSQu Wenruo 		 */
1831557ea5ddSQu Wenruo 		if (slot == 0)
1832557ea5ddSQu Wenruo 			item_end_expected = BTRFS_LEAF_DATA_SIZE(fs_info);
1833557ea5ddSQu Wenruo 		else
18343212fa14SJosef Bacik 			item_end_expected = btrfs_item_offset(leaf,
1835557ea5ddSQu Wenruo 								 slot - 1);
1836a6ab66ebSSu Yue 		if (unlikely(item_data_end != item_end_expected)) {
183786a6be3aSDavid Sterba 			generic_err(leaf, slot,
1838a6ab66ebSSu Yue 				"unexpected item end, have %llu expect %u",
1839a6ab66ebSSu Yue 				item_data_end, item_end_expected);
1840924452c8SJosef Bacik 			return BTRFS_TREE_BLOCK_INVALID_OFFSETS;
1841557ea5ddSQu Wenruo 		}
1842557ea5ddSQu Wenruo 
1843557ea5ddSQu Wenruo 		/*
1844557ea5ddSQu Wenruo 		 * Check to make sure that we don't point outside of the leaf,
1845557ea5ddSQu Wenruo 		 * just in case all the items are consistent to each other, but
1846557ea5ddSQu Wenruo 		 * all point outside of the leaf.
1847557ea5ddSQu Wenruo 		 */
1848a6ab66ebSSu Yue 		if (unlikely(item_data_end > BTRFS_LEAF_DATA_SIZE(fs_info))) {
184986a6be3aSDavid Sterba 			generic_err(leaf, slot,
1850a6ab66ebSSu Yue 			"slot end outside of leaf, have %llu expect range [0, %u]",
1851a6ab66ebSSu Yue 				item_data_end, BTRFS_LEAF_DATA_SIZE(fs_info));
1852924452c8SJosef Bacik 			return BTRFS_TREE_BLOCK_INVALID_OFFSETS;
1853557ea5ddSQu Wenruo 		}
1854557ea5ddSQu Wenruo 
1855557ea5ddSQu Wenruo 		/* Also check if the item pointer overlaps with btrfs item. */
1856c7c01a4aSDavid Sterba 		if (unlikely(btrfs_item_ptr_offset(leaf, slot) <
185742c9419aSJosef Bacik 			     btrfs_item_nr_offset(leaf, slot) + sizeof(struct btrfs_item))) {
185886a6be3aSDavid Sterba 			generic_err(leaf, slot,
1859478d01b3SQu Wenruo 		"slot overlaps with its data, item end %lu data start %lu",
186042c9419aSJosef Bacik 				btrfs_item_nr_offset(leaf, slot) +
1861478d01b3SQu Wenruo 				sizeof(struct btrfs_item),
1862478d01b3SQu Wenruo 				btrfs_item_ptr_offset(leaf, slot));
1863924452c8SJosef Bacik 			return BTRFS_TREE_BLOCK_INVALID_OFFSETS;
1864557ea5ddSQu Wenruo 		}
1865557ea5ddSQu Wenruo 
186685d8a826SJosef Bacik 		/*
186785d8a826SJosef Bacik 		 * We only want to do this if WRITTEN is set, otherwise the leaf
186885d8a826SJosef Bacik 		 * may be in some intermediate state and won't appear valid.
186985d8a826SJosef Bacik 		 */
187085d8a826SJosef Bacik 		if (btrfs_header_flag(leaf, BTRFS_HEADER_FLAG_WRITTEN)) {
1871c8d54215SJosef Bacik 			enum btrfs_tree_block_status ret;
1872c8d54215SJosef Bacik 
187369fc6cbbSQu Wenruo 			/*
187469fc6cbbSQu Wenruo 			 * Check if the item size and content meet other
187569fc6cbbSQu Wenruo 			 * criteria
187669fc6cbbSQu Wenruo 			 */
18774e9845efSFilipe Manana 			ret = check_leaf_item(leaf, &key, slot, &prev_key);
1878c8d54215SJosef Bacik 			if (unlikely(ret != BTRFS_TREE_BLOCK_CLEAN))
1879557ea5ddSQu Wenruo 				return ret;
188069fc6cbbSQu Wenruo 		}
1881557ea5ddSQu Wenruo 
1882557ea5ddSQu Wenruo 		prev_key.objectid = key.objectid;
1883557ea5ddSQu Wenruo 		prev_key.type = key.type;
1884557ea5ddSQu Wenruo 		prev_key.offset = key.offset;
1885557ea5ddSQu Wenruo 	}
1886557ea5ddSQu Wenruo 
1887924452c8SJosef Bacik 	return BTRFS_TREE_BLOCK_CLEAN;
1888924452c8SJosef Bacik }
1889924452c8SJosef Bacik 
1890924452c8SJosef Bacik int btrfs_check_leaf(struct extent_buffer *leaf)
1891924452c8SJosef Bacik {
1892924452c8SJosef Bacik 	enum btrfs_tree_block_status ret;
1893924452c8SJosef Bacik 
1894924452c8SJosef Bacik 	ret = __btrfs_check_leaf(leaf);
1895924452c8SJosef Bacik 	if (unlikely(ret != BTRFS_TREE_BLOCK_CLEAN))
1896924452c8SJosef Bacik 		return -EUCLEAN;
1897557ea5ddSQu Wenruo 	return 0;
1898557ea5ddSQu Wenruo }
189985d8a826SJosef Bacik ALLOW_ERROR_INJECTION(btrfs_check_leaf, ERRNO);
1900557ea5ddSQu Wenruo 
1901c26fa931SJosef Bacik enum btrfs_tree_block_status __btrfs_check_node(struct extent_buffer *node)
1902557ea5ddSQu Wenruo {
1903813fd1dcSDavid Sterba 	struct btrfs_fs_info *fs_info = node->fs_info;
1904557ea5ddSQu Wenruo 	unsigned long nr = btrfs_header_nritems(node);
1905557ea5ddSQu Wenruo 	struct btrfs_key key, next_key;
1906557ea5ddSQu Wenruo 	int slot;
1907f556faa4SQu Wenruo 	int level = btrfs_header_level(node);
1908557ea5ddSQu Wenruo 	u64 bytenr;
1909557ea5ddSQu Wenruo 
1910c7c01a4aSDavid Sterba 	if (unlikely(level <= 0 || level >= BTRFS_MAX_LEVEL)) {
191186a6be3aSDavid Sterba 		generic_err(node, 0,
1912f556faa4SQu Wenruo 			"invalid level for node, have %d expect [1, %d]",
1913f556faa4SQu Wenruo 			level, BTRFS_MAX_LEVEL - 1);
1914c26fa931SJosef Bacik 		return BTRFS_TREE_BLOCK_INVALID_LEVEL;
1915f556faa4SQu Wenruo 	}
1916c7c01a4aSDavid Sterba 	if (unlikely(nr == 0 || nr > BTRFS_NODEPTRS_PER_BLOCK(fs_info))) {
19172f659546SQu Wenruo 		btrfs_crit(fs_info,
1918bba4f298SQu Wenruo "corrupt node: root=%llu block=%llu, nritems too %s, have %lu expect range [1,%u]",
19192f659546SQu Wenruo 			   btrfs_header_owner(node), node->start,
1920bba4f298SQu Wenruo 			   nr == 0 ? "small" : "large", nr,
19212f659546SQu Wenruo 			   BTRFS_NODEPTRS_PER_BLOCK(fs_info));
1922c26fa931SJosef Bacik 		return BTRFS_TREE_BLOCK_INVALID_NRITEMS;
1923557ea5ddSQu Wenruo 	}
1924557ea5ddSQu Wenruo 
1925557ea5ddSQu Wenruo 	for (slot = 0; slot < nr - 1; slot++) {
1926557ea5ddSQu Wenruo 		bytenr = btrfs_node_blockptr(node, slot);
1927557ea5ddSQu Wenruo 		btrfs_node_key_to_cpu(node, &key, slot);
1928557ea5ddSQu Wenruo 		btrfs_node_key_to_cpu(node, &next_key, slot + 1);
1929557ea5ddSQu Wenruo 
1930c7c01a4aSDavid Sterba 		if (unlikely(!bytenr)) {
193186a6be3aSDavid Sterba 			generic_err(node, slot,
1932bba4f298SQu Wenruo 				"invalid NULL node pointer");
1933c26fa931SJosef Bacik 			return BTRFS_TREE_BLOCK_INVALID_BLOCKPTR;
1934bba4f298SQu Wenruo 		}
1935c7c01a4aSDavid Sterba 		if (unlikely(!IS_ALIGNED(bytenr, fs_info->sectorsize))) {
193686a6be3aSDavid Sterba 			generic_err(node, slot,
1937bba4f298SQu Wenruo 			"unaligned pointer, have %llu should be aligned to %u",
19382f659546SQu Wenruo 				bytenr, fs_info->sectorsize);
1939c26fa931SJosef Bacik 			return BTRFS_TREE_BLOCK_INVALID_BLOCKPTR;
1940557ea5ddSQu Wenruo 		}
1941557ea5ddSQu Wenruo 
1942c7c01a4aSDavid Sterba 		if (unlikely(btrfs_comp_cpu_keys(&key, &next_key) >= 0)) {
194386a6be3aSDavid Sterba 			generic_err(node, slot,
1944bba4f298SQu Wenruo 	"bad key order, current (%llu %u %llu) next (%llu %u %llu)",
1945bba4f298SQu Wenruo 				key.objectid, key.type, key.offset,
1946bba4f298SQu Wenruo 				next_key.objectid, next_key.type,
1947bba4f298SQu Wenruo 				next_key.offset);
1948c26fa931SJosef Bacik 			return BTRFS_TREE_BLOCK_BAD_KEY_ORDER;
1949557ea5ddSQu Wenruo 		}
1950557ea5ddSQu Wenruo 	}
1951c26fa931SJosef Bacik 	return BTRFS_TREE_BLOCK_CLEAN;
1952c26fa931SJosef Bacik }
1953c26fa931SJosef Bacik 
1954c26fa931SJosef Bacik int btrfs_check_node(struct extent_buffer *node)
1955c26fa931SJosef Bacik {
1956c26fa931SJosef Bacik 	enum btrfs_tree_block_status ret;
1957c26fa931SJosef Bacik 
1958c26fa931SJosef Bacik 	ret = __btrfs_check_node(node);
1959c26fa931SJosef Bacik 	if (unlikely(ret != BTRFS_TREE_BLOCK_CLEAN))
1960c26fa931SJosef Bacik 		return -EUCLEAN;
1961c26fa931SJosef Bacik 	return 0;
1962557ea5ddSQu Wenruo }
196302529d7aSQu Wenruo ALLOW_ERROR_INJECTION(btrfs_check_node, ERRNO);
196488c602abSQu Wenruo 
196588c602abSQu Wenruo int btrfs_check_eb_owner(const struct extent_buffer *eb, u64 root_owner)
196688c602abSQu Wenruo {
196788c602abSQu Wenruo 	const bool is_subvol = is_fstree(root_owner);
196888c602abSQu Wenruo 	const u64 eb_owner = btrfs_header_owner(eb);
196988c602abSQu Wenruo 
197088c602abSQu Wenruo 	/*
197188c602abSQu Wenruo 	 * Skip dummy fs, as selftests don't create unique ebs for each dummy
197288c602abSQu Wenruo 	 * root.
197388c602abSQu Wenruo 	 */
197488c602abSQu Wenruo 	if (test_bit(BTRFS_FS_STATE_DUMMY_FS_INFO, &eb->fs_info->fs_state))
197588c602abSQu Wenruo 		return 0;
197688c602abSQu Wenruo 	/*
197788c602abSQu Wenruo 	 * There are several call sites (backref walking, qgroup, and data
197888c602abSQu Wenruo 	 * reloc) passing 0 as @root_owner, as they are not holding the
197988c602abSQu Wenruo 	 * tree root.  In that case, we can not do a reliable ownership check,
198088c602abSQu Wenruo 	 * so just exit.
198188c602abSQu Wenruo 	 */
198288c602abSQu Wenruo 	if (root_owner == 0)
198388c602abSQu Wenruo 		return 0;
198488c602abSQu Wenruo 	/*
198588c602abSQu Wenruo 	 * These trees use key.offset as their owner, our callers don't have
198688c602abSQu Wenruo 	 * the extra capacity to pass key.offset here.  So we just skip them.
198788c602abSQu Wenruo 	 */
198888c602abSQu Wenruo 	if (root_owner == BTRFS_TREE_LOG_OBJECTID ||
198988c602abSQu Wenruo 	    root_owner == BTRFS_TREE_RELOC_OBJECTID)
199088c602abSQu Wenruo 		return 0;
199188c602abSQu Wenruo 
199288c602abSQu Wenruo 	if (!is_subvol) {
199388c602abSQu Wenruo 		/* For non-subvolume trees, the eb owner should match root owner */
199488c602abSQu Wenruo 		if (unlikely(root_owner != eb_owner)) {
199588c602abSQu Wenruo 			btrfs_crit(eb->fs_info,
199688c602abSQu Wenruo "corrupted %s, root=%llu block=%llu owner mismatch, have %llu expect %llu",
199788c602abSQu Wenruo 				btrfs_header_level(eb) == 0 ? "leaf" : "node",
199888c602abSQu Wenruo 				root_owner, btrfs_header_bytenr(eb), eb_owner,
199988c602abSQu Wenruo 				root_owner);
200088c602abSQu Wenruo 			return -EUCLEAN;
200188c602abSQu Wenruo 		}
200288c602abSQu Wenruo 		return 0;
200388c602abSQu Wenruo 	}
200488c602abSQu Wenruo 
200588c602abSQu Wenruo 	/*
200688c602abSQu Wenruo 	 * For subvolume trees, owners can mismatch, but they should all belong
200788c602abSQu Wenruo 	 * to subvolume trees.
200888c602abSQu Wenruo 	 */
200988c602abSQu Wenruo 	if (unlikely(is_subvol != is_fstree(eb_owner))) {
201088c602abSQu Wenruo 		btrfs_crit(eb->fs_info,
201188c602abSQu Wenruo "corrupted %s, root=%llu block=%llu owner mismatch, have %llu expect [%llu, %llu]",
201288c602abSQu Wenruo 			btrfs_header_level(eb) == 0 ? "leaf" : "node",
201388c602abSQu Wenruo 			root_owner, btrfs_header_bytenr(eb), eb_owner,
201488c602abSQu Wenruo 			BTRFS_FIRST_FREE_OBJECTID, BTRFS_LAST_FREE_OBJECTID);
201588c602abSQu Wenruo 		return -EUCLEAN;
201688c602abSQu Wenruo 	}
201788c602abSQu Wenruo 	return 0;
201888c602abSQu Wenruo }
20192cac5af1SJosef Bacik 
20202cac5af1SJosef Bacik int btrfs_verify_level_key(struct extent_buffer *eb, int level,
20212cac5af1SJosef Bacik 			   struct btrfs_key *first_key, u64 parent_transid)
20222cac5af1SJosef Bacik {
20232cac5af1SJosef Bacik 	struct btrfs_fs_info *fs_info = eb->fs_info;
20242cac5af1SJosef Bacik 	int found_level;
20252cac5af1SJosef Bacik 	struct btrfs_key found_key;
20262cac5af1SJosef Bacik 	int ret;
20272cac5af1SJosef Bacik 
20282cac5af1SJosef Bacik 	found_level = btrfs_header_level(eb);
20292cac5af1SJosef Bacik 	if (found_level != level) {
20302cac5af1SJosef Bacik 		WARN(IS_ENABLED(CONFIG_BTRFS_DEBUG),
20312cac5af1SJosef Bacik 		     KERN_ERR "BTRFS: tree level check failed\n");
20322cac5af1SJosef Bacik 		btrfs_err(fs_info,
20332cac5af1SJosef Bacik "tree level mismatch detected, bytenr=%llu level expected=%u has=%u",
20342cac5af1SJosef Bacik 			  eb->start, level, found_level);
20352cac5af1SJosef Bacik 		return -EIO;
20362cac5af1SJosef Bacik 	}
20372cac5af1SJosef Bacik 
20382cac5af1SJosef Bacik 	if (!first_key)
20392cac5af1SJosef Bacik 		return 0;
20402cac5af1SJosef Bacik 
20412cac5af1SJosef Bacik 	/*
20422cac5af1SJosef Bacik 	 * For live tree block (new tree blocks in current transaction),
20432cac5af1SJosef Bacik 	 * we need proper lock context to avoid race, which is impossible here.
20442cac5af1SJosef Bacik 	 * So we only checks tree blocks which is read from disk, whose
20452cac5af1SJosef Bacik 	 * generation <= fs_info->last_trans_committed.
20462cac5af1SJosef Bacik 	 */
20472cac5af1SJosef Bacik 	if (btrfs_header_generation(eb) > fs_info->last_trans_committed)
20482cac5af1SJosef Bacik 		return 0;
20492cac5af1SJosef Bacik 
20502cac5af1SJosef Bacik 	/* We have @first_key, so this @eb must have at least one item */
20512cac5af1SJosef Bacik 	if (btrfs_header_nritems(eb) == 0) {
20522cac5af1SJosef Bacik 		btrfs_err(fs_info,
20532cac5af1SJosef Bacik 		"invalid tree nritems, bytenr=%llu nritems=0 expect >0",
20542cac5af1SJosef Bacik 			  eb->start);
20552cac5af1SJosef Bacik 		WARN_ON(IS_ENABLED(CONFIG_BTRFS_DEBUG));
20562cac5af1SJosef Bacik 		return -EUCLEAN;
20572cac5af1SJosef Bacik 	}
20582cac5af1SJosef Bacik 
20592cac5af1SJosef Bacik 	if (found_level)
20602cac5af1SJosef Bacik 		btrfs_node_key_to_cpu(eb, &found_key, 0);
20612cac5af1SJosef Bacik 	else
20622cac5af1SJosef Bacik 		btrfs_item_key_to_cpu(eb, &found_key, 0);
20632cac5af1SJosef Bacik 	ret = btrfs_comp_cpu_keys(first_key, &found_key);
20642cac5af1SJosef Bacik 
20652cac5af1SJosef Bacik 	if (ret) {
20662cac5af1SJosef Bacik 		WARN(IS_ENABLED(CONFIG_BTRFS_DEBUG),
20672cac5af1SJosef Bacik 		     KERN_ERR "BTRFS: tree first key check failed\n");
20682cac5af1SJosef Bacik 		btrfs_err(fs_info,
20692cac5af1SJosef Bacik "tree first key mismatch detected, bytenr=%llu parent_transid=%llu key expected=(%llu,%u,%llu) has=(%llu,%u,%llu)",
20702cac5af1SJosef Bacik 			  eb->start, parent_transid, first_key->objectid,
20712cac5af1SJosef Bacik 			  first_key->type, first_key->offset,
20722cac5af1SJosef Bacik 			  found_key.objectid, found_key.type,
20732cac5af1SJosef Bacik 			  found_key.offset);
20742cac5af1SJosef Bacik 	}
20752cac5af1SJosef Bacik 	return ret;
20762cac5af1SJosef Bacik }
2077