xref: /openbmc/linux/fs/btrfs/super.c (revision 34d97007)
16cbd5570SChris Mason /*
26cbd5570SChris Mason  * Copyright (C) 2007 Oracle.  All rights reserved.
36cbd5570SChris Mason  *
46cbd5570SChris Mason  * This program is free software; you can redistribute it and/or
56cbd5570SChris Mason  * modify it under the terms of the GNU General Public
66cbd5570SChris Mason  * License v2 as published by the Free Software Foundation.
76cbd5570SChris Mason  *
86cbd5570SChris Mason  * This program is distributed in the hope that it will be useful,
96cbd5570SChris Mason  * but WITHOUT ANY WARRANTY; without even the implied warranty of
106cbd5570SChris Mason  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
116cbd5570SChris Mason  * General Public License for more details.
126cbd5570SChris Mason  *
136cbd5570SChris Mason  * You should have received a copy of the GNU General Public
146cbd5570SChris Mason  * License along with this program; if not, write to the
156cbd5570SChris Mason  * Free Software Foundation, Inc., 59 Temple Place - Suite 330,
166cbd5570SChris Mason  * Boston, MA 021110-1307, USA.
176cbd5570SChris Mason  */
186cbd5570SChris Mason 
194b82d6e4SYan #include <linux/blkdev.h>
202e635a27SChris Mason #include <linux/module.h>
21e20d96d6SChris Mason #include <linux/buffer_head.h>
222e635a27SChris Mason #include <linux/fs.h>
232e635a27SChris Mason #include <linux/pagemap.h>
242e635a27SChris Mason #include <linux/highmem.h>
252e635a27SChris Mason #include <linux/time.h>
262e635a27SChris Mason #include <linux/init.h>
27a9572a15SEric Paris #include <linux/seq_file.h>
282e635a27SChris Mason #include <linux/string.h>
292e635a27SChris Mason #include <linux/backing-dev.h>
304b82d6e4SYan #include <linux/mount.h>
31dee26a9fSChris Mason #include <linux/mpage.h>
3275dfe396SChris Mason #include <linux/swap.h>
3375dfe396SChris Mason #include <linux/writeback.h>
348fd17795SChris Mason #include <linux/statfs.h>
3508607c1bSChris Mason #include <linux/compat.h>
3695e05289SChris Mason #include <linux/parser.h>
37c59f8951SChris Mason #include <linux/ctype.h>
386da6abaeSChris Mason #include <linux/namei.h>
39a9218f6bSChris Mason #include <linux/miscdevice.h>
401bcbf313SQinghuang Feng #include <linux/magic.h>
415a0e3ad6STejun Heo #include <linux/slab.h>
4290a887c9SDan Magenheimer #include <linux/cleancache.h>
4322c44fe6SJosef Bacik #include <linux/ratelimit.h>
4455e301fdSFilipe Brandenburger #include <linux/btrfs.h>
4516cdcec7SMiao Xie #include "delayed-inode.h"
462e635a27SChris Mason #include "ctree.h"
47e20d96d6SChris Mason #include "disk-io.h"
48d5719762SChris Mason #include "transaction.h"
492c90e5d6SChris Mason #include "btrfs_inode.h"
503a686375SChris Mason #include "print-tree.h"
5114a958e6SFilipe David Borba Manana #include "hash.h"
5263541927SFilipe David Borba Manana #include "props.h"
535103e947SJosef Bacik #include "xattr.h"
548a4b83ccSChris Mason #include "volumes.h"
55be6e8dc0SBalaji Rao #include "export.h"
56c8b97818SChris Mason #include "compression.h"
579c5085c1SJosef Bacik #include "rcu-string.h"
588dabb742SStefan Behrens #include "dev-replace.h"
5974255aa0SJosef Bacik #include "free-space-cache.h"
60b9e9a6cbSWang Shilong #include "backref.h"
61dc11dd5dSJosef Bacik #include "tests/btrfs-tests.h"
622e635a27SChris Mason 
63d3982100SMark Fasheh #include "qgroup.h"
641abe9b8aSliubo #define CREATE_TRACE_POINTS
651abe9b8aSliubo #include <trace/events/btrfs.h>
661abe9b8aSliubo 
67b87221deSAlexey Dobriyan static const struct super_operations btrfs_super_ops;
68830c4adbSJosef Bacik static struct file_system_type btrfs_fs_type;
69e20d96d6SChris Mason 
700723a047SHarald Hoyer static int btrfs_remount(struct super_block *sb, int *flags, char *data);
710723a047SHarald Hoyer 
72e33e17eeSJeff Mahoney const char *btrfs_decode_error(int errno)
73acce952bSliubo {
7408748810SDavid Sterba 	char *errstr = "unknown";
75acce952bSliubo 
76acce952bSliubo 	switch (errno) {
77acce952bSliubo 	case -EIO:
78acce952bSliubo 		errstr = "IO failure";
79acce952bSliubo 		break;
80acce952bSliubo 	case -ENOMEM:
81acce952bSliubo 		errstr = "Out of memory";
82acce952bSliubo 		break;
83acce952bSliubo 	case -EROFS:
84acce952bSliubo 		errstr = "Readonly filesystem";
85acce952bSliubo 		break;
868c342930SJeff Mahoney 	case -EEXIST:
878c342930SJeff Mahoney 		errstr = "Object already exists";
888c342930SJeff Mahoney 		break;
8994ef7280SDavid Sterba 	case -ENOSPC:
9094ef7280SDavid Sterba 		errstr = "No space left";
9194ef7280SDavid Sterba 		break;
9294ef7280SDavid Sterba 	case -ENOENT:
9394ef7280SDavid Sterba 		errstr = "No such entry";
9494ef7280SDavid Sterba 		break;
95acce952bSliubo 	}
96acce952bSliubo 
97acce952bSliubo 	return errstr;
98acce952bSliubo }
99acce952bSliubo 
100bbece8a3SDavid Sterba static void save_error_info(struct btrfs_fs_info *fs_info)
101acce952bSliubo {
102acce952bSliubo 	/*
103acce952bSliubo 	 * today we only save the error info into ram.  Long term we'll
104acce952bSliubo 	 * also send it down to the disk
105acce952bSliubo 	 */
10687533c47SMiao Xie 	set_bit(BTRFS_FS_STATE_ERROR, &fs_info->fs_state);
107acce952bSliubo }
108acce952bSliubo 
109acce952bSliubo /* btrfs handle error by forcing the filesystem readonly */
110acce952bSliubo static void btrfs_handle_error(struct btrfs_fs_info *fs_info)
111acce952bSliubo {
112acce952bSliubo 	struct super_block *sb = fs_info->sb;
113acce952bSliubo 
114acce952bSliubo 	if (sb->s_flags & MS_RDONLY)
115acce952bSliubo 		return;
116acce952bSliubo 
11787533c47SMiao Xie 	if (test_bit(BTRFS_FS_STATE_ERROR, &fs_info->fs_state)) {
118acce952bSliubo 		sb->s_flags |= MS_RDONLY;
119c2cf52ebSSimon Kirby 		btrfs_info(fs_info, "forced readonly");
1201acd6831SStefan Behrens 		/*
1211acd6831SStefan Behrens 		 * Note that a running device replace operation is not
1221acd6831SStefan Behrens 		 * canceled here although there is no way to update
1231acd6831SStefan Behrens 		 * the progress. It would add the risk of a deadlock,
1241acd6831SStefan Behrens 		 * therefore the canceling is ommited. The only penalty
1251acd6831SStefan Behrens 		 * is that some I/O remains active until the procedure
1261acd6831SStefan Behrens 		 * completes. The next time when the filesystem is
1271acd6831SStefan Behrens 		 * mounted writeable again, the device replace
1281acd6831SStefan Behrens 		 * operation continues.
1291acd6831SStefan Behrens 		 */
130acce952bSliubo 	}
131acce952bSliubo }
132acce952bSliubo 
133acce952bSliubo /*
134*34d97007SAnand Jain  * __btrfs_handle_fs_error decodes expected errors from the caller and
135acce952bSliubo  * invokes the approciate error response.
136acce952bSliubo  */
137c0d19e2bSDavid Sterba __cold
138*34d97007SAnand Jain void __btrfs_handle_fs_error(struct btrfs_fs_info *fs_info, const char *function,
1394da35113SJeff Mahoney 		       unsigned int line, int errno, const char *fmt, ...)
140acce952bSliubo {
141acce952bSliubo 	struct super_block *sb = fs_info->sb;
14257d816a1SAnand Jain #ifdef CONFIG_PRINTK
143acce952bSliubo 	const char *errstr;
14457d816a1SAnand Jain #endif
145acce952bSliubo 
146acce952bSliubo 	/*
147acce952bSliubo 	 * Special case: if the error is EROFS, and we're already
148acce952bSliubo 	 * under MS_RDONLY, then it is safe here.
149acce952bSliubo 	 */
150acce952bSliubo 	if (errno == -EROFS && (sb->s_flags & MS_RDONLY))
151acce952bSliubo   		return;
152acce952bSliubo 
15357d816a1SAnand Jain #ifdef CONFIG_PRINTK
15408748810SDavid Sterba 	errstr = btrfs_decode_error(errno);
1554da35113SJeff Mahoney 	if (fmt) {
15637252a66SEric Sandeen 		struct va_format vaf;
15737252a66SEric Sandeen 		va_list args;
15837252a66SEric Sandeen 
15937252a66SEric Sandeen 		va_start(args, fmt);
16037252a66SEric Sandeen 		vaf.fmt = fmt;
16137252a66SEric Sandeen 		vaf.va = &args;
1624da35113SJeff Mahoney 
163efe120a0SFrank Holton 		printk(KERN_CRIT
164efe120a0SFrank Holton 			"BTRFS: error (device %s) in %s:%d: errno=%d %s (%pV)\n",
16508748810SDavid Sterba 			sb->s_id, function, line, errno, errstr, &vaf);
16637252a66SEric Sandeen 		va_end(args);
1674da35113SJeff Mahoney 	} else {
168efe120a0SFrank Holton 		printk(KERN_CRIT "BTRFS: error (device %s) in %s:%d: errno=%d %s\n",
16908748810SDavid Sterba 			sb->s_id, function, line, errno, errstr);
1704da35113SJeff Mahoney 	}
17157d816a1SAnand Jain #endif
172acce952bSliubo 
1734da35113SJeff Mahoney 	/* Don't go through full error handling during mount */
1744da35113SJeff Mahoney 	save_error_info(fs_info);
175cf79ffb5SJosef Bacik 	if (sb->s_flags & MS_BORN)
176acce952bSliubo 		btrfs_handle_error(fs_info);
177acce952bSliubo }
1784da35113SJeff Mahoney 
17957d816a1SAnand Jain #ifdef CONFIG_PRINTK
180533574c6SJoe Perches static const char * const logtypes[] = {
1814da35113SJeff Mahoney 	"emergency",
1824da35113SJeff Mahoney 	"alert",
1834da35113SJeff Mahoney 	"critical",
1844da35113SJeff Mahoney 	"error",
1854da35113SJeff Mahoney 	"warning",
1864da35113SJeff Mahoney 	"notice",
1874da35113SJeff Mahoney 	"info",
1884da35113SJeff Mahoney 	"debug",
1894da35113SJeff Mahoney };
1904da35113SJeff Mahoney 
191c2cf52ebSSimon Kirby void btrfs_printk(const struct btrfs_fs_info *fs_info, const char *fmt, ...)
1924da35113SJeff Mahoney {
1934da35113SJeff Mahoney 	struct super_block *sb = fs_info->sb;
1944da35113SJeff Mahoney 	char lvl[4];
1954da35113SJeff Mahoney 	struct va_format vaf;
1964da35113SJeff Mahoney 	va_list args;
1974da35113SJeff Mahoney 	const char *type = logtypes[4];
198533574c6SJoe Perches 	int kern_level;
1994da35113SJeff Mahoney 
2004da35113SJeff Mahoney 	va_start(args, fmt);
2014da35113SJeff Mahoney 
202533574c6SJoe Perches 	kern_level = printk_get_level(fmt);
203533574c6SJoe Perches 	if (kern_level) {
204533574c6SJoe Perches 		size_t size = printk_skip_level(fmt) - fmt;
205533574c6SJoe Perches 		memcpy(lvl, fmt,  size);
206533574c6SJoe Perches 		lvl[size] = '\0';
207533574c6SJoe Perches 		fmt += size;
208533574c6SJoe Perches 		type = logtypes[kern_level - '0'];
2094da35113SJeff Mahoney 	} else
2104da35113SJeff Mahoney 		*lvl = '\0';
2114da35113SJeff Mahoney 
2124da35113SJeff Mahoney 	vaf.fmt = fmt;
2134da35113SJeff Mahoney 	vaf.va = &args;
214533574c6SJoe Perches 
215c2cf52ebSSimon Kirby 	printk("%sBTRFS %s (device %s): %pV\n", lvl, type, sb->s_id, &vaf);
216533574c6SJoe Perches 
217533574c6SJoe Perches 	va_end(args);
2184da35113SJeff Mahoney }
219533574c6SJoe Perches #endif
220533574c6SJoe Perches 
2218c342930SJeff Mahoney /*
22249b25e05SJeff Mahoney  * We only mark the transaction aborted and then set the file system read-only.
22349b25e05SJeff Mahoney  * This will prevent new transactions from starting or trying to join this
22449b25e05SJeff Mahoney  * one.
22549b25e05SJeff Mahoney  *
22649b25e05SJeff Mahoney  * This means that error recovery at the call site is limited to freeing
22749b25e05SJeff Mahoney  * any local memory allocations and passing the error code up without
22849b25e05SJeff Mahoney  * further cleanup. The transaction should complete as it normally would
22949b25e05SJeff Mahoney  * in the call path but will return -EIO.
23049b25e05SJeff Mahoney  *
23149b25e05SJeff Mahoney  * We'll complete the cleanup in btrfs_end_transaction and
23249b25e05SJeff Mahoney  * btrfs_commit_transaction.
23349b25e05SJeff Mahoney  */
234c0d19e2bSDavid Sterba __cold
23549b25e05SJeff Mahoney void __btrfs_abort_transaction(struct btrfs_trans_handle *trans,
23649b25e05SJeff Mahoney 			       struct btrfs_root *root, const char *function,
23749b25e05SJeff Mahoney 			       unsigned int line, int errno)
23849b25e05SJeff Mahoney {
23949b25e05SJeff Mahoney 	trans->aborted = errno;
24049b25e05SJeff Mahoney 	/* Nothing used. The other threads that have joined this
24149b25e05SJeff Mahoney 	 * transaction may be able to continue. */
242c92f6be3SFilipe Manana 	if (!trans->blocks_used && list_empty(&trans->new_bgs)) {
24369ce977aSMiao Xie 		const char *errstr;
24469ce977aSMiao Xie 
24508748810SDavid Sterba 		errstr = btrfs_decode_error(errno);
246c2cf52ebSSimon Kirby 		btrfs_warn(root->fs_info,
247c2cf52ebSSimon Kirby 		           "%s:%d: Aborting unused transaction(%s).",
24869ce977aSMiao Xie 		           function, line, errstr);
24949b25e05SJeff Mahoney 		return;
25049b25e05SJeff Mahoney 	}
2518d25a086SMiao Xie 	ACCESS_ONCE(trans->transaction->aborted) = errno;
252501407aaSJosef Bacik 	/* Wake up anybody who may be waiting on this transaction */
253501407aaSJosef Bacik 	wake_up(&root->fs_info->transaction_wait);
254501407aaSJosef Bacik 	wake_up(&root->fs_info->transaction_blocked_wait);
255*34d97007SAnand Jain 	__btrfs_handle_fs_error(root->fs_info, function, line, errno, NULL);
25649b25e05SJeff Mahoney }
25749b25e05SJeff Mahoney /*
2588c342930SJeff Mahoney  * __btrfs_panic decodes unexpected, fatal errors from the caller,
2598c342930SJeff Mahoney  * issues an alert, and either panics or BUGs, depending on mount options.
2608c342930SJeff Mahoney  */
261c0d19e2bSDavid Sterba __cold
2628c342930SJeff Mahoney void __btrfs_panic(struct btrfs_fs_info *fs_info, const char *function,
2638c342930SJeff Mahoney 		   unsigned int line, int errno, const char *fmt, ...)
2648c342930SJeff Mahoney {
2658c342930SJeff Mahoney 	char *s_id = "<unknown>";
2668c342930SJeff Mahoney 	const char *errstr;
2678c342930SJeff Mahoney 	struct va_format vaf = { .fmt = fmt };
2688c342930SJeff Mahoney 	va_list args;
2698c342930SJeff Mahoney 
2708c342930SJeff Mahoney 	if (fs_info)
2718c342930SJeff Mahoney 		s_id = fs_info->sb->s_id;
2728c342930SJeff Mahoney 
2738c342930SJeff Mahoney 	va_start(args, fmt);
2748c342930SJeff Mahoney 	vaf.va = &args;
2758c342930SJeff Mahoney 
27608748810SDavid Sterba 	errstr = btrfs_decode_error(errno);
277aa43a17cSEric Sandeen 	if (fs_info && (fs_info->mount_opt & BTRFS_MOUNT_PANIC_ON_FATAL_ERROR))
27808748810SDavid Sterba 		panic(KERN_CRIT "BTRFS panic (device %s) in %s:%d: %pV (errno=%d %s)\n",
27908748810SDavid Sterba 			s_id, function, line, &vaf, errno, errstr);
2808c342930SJeff Mahoney 
281efe120a0SFrank Holton 	btrfs_crit(fs_info, "panic in %s:%d: %pV (errno=%d %s)",
282efe120a0SFrank Holton 		   function, line, &vaf, errno, errstr);
2838c342930SJeff Mahoney 	va_end(args);
2848c342930SJeff Mahoney 	/* Caller calls BUG() */
2858c342930SJeff Mahoney }
286acce952bSliubo 
287e20d96d6SChris Mason static void btrfs_put_super(struct super_block *sb)
288e20d96d6SChris Mason {
2893abdbd78SDavid Sterba 	close_ctree(btrfs_sb(sb)->tree_root);
290e20d96d6SChris Mason }
2912e635a27SChris Mason 
29295e05289SChris Mason enum {
29373f73415SJosef Bacik 	Opt_degraded, Opt_subvol, Opt_subvolid, Opt_device, Opt_nodatasum,
294287a0ab9SJosef Bacik 	Opt_nodatacow, Opt_max_inline, Opt_alloc_start, Opt_nobarrier, Opt_ssd,
295287a0ab9SJosef Bacik 	Opt_nossd, Opt_ssd_spread, Opt_thread_pool, Opt_noacl, Opt_compress,
296261507a0SLi Zefan 	Opt_compress_type, Opt_compress_force, Opt_compress_force_type,
297261507a0SLi Zefan 	Opt_notreelog, Opt_ratio, Opt_flushoncommit, Opt_discard,
29870f6d82eSOmar Sandoval 	Opt_space_cache, Opt_space_cache_version, Opt_clear_cache,
29970f6d82eSOmar Sandoval 	Opt_user_subvol_rm_allowed, Opt_enospc_debug, Opt_subvolrootid,
30070f6d82eSOmar Sandoval 	Opt_defrag, Opt_inode_cache, Opt_no_space_cache, Opt_recovery,
30170f6d82eSOmar Sandoval 	Opt_skip_balance, Opt_check_integrity,
30270f6d82eSOmar Sandoval 	Opt_check_integrity_including_extent_data,
303f420ee1eSStefan Behrens 	Opt_check_integrity_print_mask, Opt_fatal_errors, Opt_rescan_uuid_tree,
304e07a2adeSQu Wenruo 	Opt_commit_interval, Opt_barrier, Opt_nodefrag, Opt_nodiscard,
305a258af7aSQu Wenruo 	Opt_noenospc_debug, Opt_noflushoncommit, Opt_acl, Opt_datacow,
3068dcddfa0SQu Wenruo 	Opt_datasum, Opt_treelog, Opt_noinode_cache, Opt_usebackuproot,
307fed8f166SQu Wenruo 	Opt_nologreplay, Opt_norecovery,
308d0bd4560SJosef Bacik #ifdef CONFIG_BTRFS_DEBUG
309d0bd4560SJosef Bacik 	Opt_fragment_data, Opt_fragment_metadata, Opt_fragment_all,
310d0bd4560SJosef Bacik #endif
3119555c6c1SIlya Dryomov 	Opt_err,
31295e05289SChris Mason };
31395e05289SChris Mason 
3144d4ab6d6SDavid Sterba static const match_table_t tokens = {
315dfe25020SChris Mason 	{Opt_degraded, "degraded"},
31695e05289SChris Mason 	{Opt_subvol, "subvol=%s"},
3171493381fSWang Shilong 	{Opt_subvolid, "subvolid=%s"},
31843e570b0SChristoph Hellwig 	{Opt_device, "device=%s"},
319b6cda9bcSChris Mason 	{Opt_nodatasum, "nodatasum"},
320d399167dSQu Wenruo 	{Opt_datasum, "datasum"},
321be20aa9dSChris Mason 	{Opt_nodatacow, "nodatacow"},
322a258af7aSQu Wenruo 	{Opt_datacow, "datacow"},
32321ad10cfSChris Mason 	{Opt_nobarrier, "nobarrier"},
324842bef58SQu Wenruo 	{Opt_barrier, "barrier"},
3256f568d35SChris Mason 	{Opt_max_inline, "max_inline=%s"},
3268f662a76SChris Mason 	{Opt_alloc_start, "alloc_start=%s"},
3274543df7eSChris Mason 	{Opt_thread_pool, "thread_pool=%d"},
328c8b97818SChris Mason 	{Opt_compress, "compress"},
329261507a0SLi Zefan 	{Opt_compress_type, "compress=%s"},
330a555f810SChris Mason 	{Opt_compress_force, "compress-force"},
331261507a0SLi Zefan 	{Opt_compress_force_type, "compress-force=%s"},
332e18e4809SChris Mason 	{Opt_ssd, "ssd"},
333451d7585SChris Mason 	{Opt_ssd_spread, "ssd_spread"},
3343b30c22fSChris Mason 	{Opt_nossd, "nossd"},
335bd0330adSQu Wenruo 	{Opt_acl, "acl"},
33633268eafSJosef Bacik 	{Opt_noacl, "noacl"},
3373a5e1404SSage Weil 	{Opt_notreelog, "notreelog"},
338a88998f2SQu Wenruo 	{Opt_treelog, "treelog"},
33996da0919SQu Wenruo 	{Opt_nologreplay, "nologreplay"},
340fed8f166SQu Wenruo 	{Opt_norecovery, "norecovery"},
341dccae999SSage Weil 	{Opt_flushoncommit, "flushoncommit"},
3422c9ee856SQu Wenruo 	{Opt_noflushoncommit, "noflushoncommit"},
34397e728d4SJosef Bacik 	{Opt_ratio, "metadata_ratio=%d"},
344e244a0aeSChristoph Hellwig 	{Opt_discard, "discard"},
345e07a2adeSQu Wenruo 	{Opt_nodiscard, "nodiscard"},
3460af3d00bSJosef Bacik 	{Opt_space_cache, "space_cache"},
34770f6d82eSOmar Sandoval 	{Opt_space_cache_version, "space_cache=%s"},
34888c2ba3bSJosef Bacik 	{Opt_clear_cache, "clear_cache"},
3494260f7c7SSage Weil 	{Opt_user_subvol_rm_allowed, "user_subvol_rm_allowed"},
35091435650SChris Mason 	{Opt_enospc_debug, "enospc_debug"},
35153036293SQu Wenruo 	{Opt_noenospc_debug, "noenospc_debug"},
352e15d0542SXin Zhong 	{Opt_subvolrootid, "subvolrootid=%d"},
3534cb5300bSChris Mason 	{Opt_defrag, "autodefrag"},
354fc0ca9afSQu Wenruo 	{Opt_nodefrag, "noautodefrag"},
3554b9465cbSChris Mason 	{Opt_inode_cache, "inode_cache"},
3563818aea2SQu Wenruo 	{Opt_noinode_cache, "noinode_cache"},
3578965593eSDavid Sterba 	{Opt_no_space_cache, "nospace_cache"},
3588dcddfa0SQu Wenruo 	{Opt_recovery, "recovery"}, /* deprecated */
3598dcddfa0SQu Wenruo 	{Opt_usebackuproot, "usebackuproot"},
3609555c6c1SIlya Dryomov 	{Opt_skip_balance, "skip_balance"},
36121adbd5cSStefan Behrens 	{Opt_check_integrity, "check_int"},
36221adbd5cSStefan Behrens 	{Opt_check_integrity_including_extent_data, "check_int_data"},
36321adbd5cSStefan Behrens 	{Opt_check_integrity_print_mask, "check_int_print_mask=%d"},
364f420ee1eSStefan Behrens 	{Opt_rescan_uuid_tree, "rescan_uuid_tree"},
3658c342930SJeff Mahoney 	{Opt_fatal_errors, "fatal_errors=%s"},
3668b87dc17SDavid Sterba 	{Opt_commit_interval, "commit=%d"},
367d0bd4560SJosef Bacik #ifdef CONFIG_BTRFS_DEBUG
368d0bd4560SJosef Bacik 	{Opt_fragment_data, "fragment=data"},
369d0bd4560SJosef Bacik 	{Opt_fragment_metadata, "fragment=metadata"},
370d0bd4560SJosef Bacik 	{Opt_fragment_all, "fragment=all"},
371d0bd4560SJosef Bacik #endif
37233268eafSJosef Bacik 	{Opt_err, NULL},
37395e05289SChris Mason };
37495e05289SChris Mason 
375edf24abeSChristoph Hellwig /*
376edf24abeSChristoph Hellwig  * Regular mount options parser.  Everything that is needed only when
377edf24abeSChristoph Hellwig  * reading in a new superblock is parsed here.
37849b25e05SJeff Mahoney  * XXX JDM: This needs to be cleaned up for remount.
379edf24abeSChristoph Hellwig  */
38096da0919SQu Wenruo int btrfs_parse_options(struct btrfs_root *root, char *options,
38196da0919SQu Wenruo 			unsigned long new_flags)
38295e05289SChris Mason {
383edf24abeSChristoph Hellwig 	struct btrfs_fs_info *info = root->fs_info;
38495e05289SChris Mason 	substring_t args[MAX_OPT_ARGS];
38573bc1876SJosef Bacik 	char *p, *num, *orig = NULL;
38673bc1876SJosef Bacik 	u64 cache_gen;
3874543df7eSChris Mason 	int intarg;
388a7a3f7caSSage Weil 	int ret = 0;
389261507a0SLi Zefan 	char *compress_type;
390261507a0SLi Zefan 	bool compress_force = false;
391b7c47bbbSTsutomu Itoh 	enum btrfs_compression_type saved_compress_type;
392b7c47bbbSTsutomu Itoh 	bool saved_compress_force;
393b7c47bbbSTsutomu Itoh 	int no_compress = 0;
394b6cda9bcSChris Mason 
3956c41761fSDavid Sterba 	cache_gen = btrfs_super_cache_generation(root->fs_info->super_copy);
39670f6d82eSOmar Sandoval 	if (btrfs_fs_compat_ro(root->fs_info, FREE_SPACE_TREE))
39770f6d82eSOmar Sandoval 		btrfs_set_opt(info->mount_opt, FREE_SPACE_TREE);
39870f6d82eSOmar Sandoval 	else if (cache_gen)
39973bc1876SJosef Bacik 		btrfs_set_opt(info->mount_opt, SPACE_CACHE);
40073bc1876SJosef Bacik 
40196da0919SQu Wenruo 	/*
40296da0919SQu Wenruo 	 * Even the options are empty, we still need to do extra check
40396da0919SQu Wenruo 	 * against new flags
40496da0919SQu Wenruo 	 */
40595e05289SChris Mason 	if (!options)
40696da0919SQu Wenruo 		goto check;
40795e05289SChris Mason 
408be20aa9dSChris Mason 	/*
409be20aa9dSChris Mason 	 * strsep changes the string, duplicate it because parse_options
410be20aa9dSChris Mason 	 * gets called twice
411be20aa9dSChris Mason 	 */
412be20aa9dSChris Mason 	options = kstrdup(options, GFP_NOFS);
413be20aa9dSChris Mason 	if (!options)
414be20aa9dSChris Mason 		return -ENOMEM;
415be20aa9dSChris Mason 
416da495eccSJosef Bacik 	orig = options;
417be20aa9dSChris Mason 
41895e05289SChris Mason 	while ((p = strsep(&options, ",")) != NULL) {
41995e05289SChris Mason 		int token;
42095e05289SChris Mason 		if (!*p)
42195e05289SChris Mason 			continue;
42295e05289SChris Mason 
42395e05289SChris Mason 		token = match_token(p, tokens, args);
42495e05289SChris Mason 		switch (token) {
425dfe25020SChris Mason 		case Opt_degraded:
426efe120a0SFrank Holton 			btrfs_info(root->fs_info, "allowing degraded mounts");
427dfe25020SChris Mason 			btrfs_set_opt(info->mount_opt, DEGRADED);
428dfe25020SChris Mason 			break;
42995e05289SChris Mason 		case Opt_subvol:
43073f73415SJosef Bacik 		case Opt_subvolid:
431e15d0542SXin Zhong 		case Opt_subvolrootid:
43243e570b0SChristoph Hellwig 		case Opt_device:
433edf24abeSChristoph Hellwig 			/*
43443e570b0SChristoph Hellwig 			 * These are parsed by btrfs_parse_early_options
435edf24abeSChristoph Hellwig 			 * and can be happily ignored here.
436edf24abeSChristoph Hellwig 			 */
43795e05289SChris Mason 			break;
438b6cda9bcSChris Mason 		case Opt_nodatasum:
43907802534SQu Wenruo 			btrfs_set_and_info(root, NODATASUM,
44007802534SQu Wenruo 					   "setting nodatasum");
441be20aa9dSChris Mason 			break;
442d399167dSQu Wenruo 		case Opt_datasum:
44307802534SQu Wenruo 			if (btrfs_test_opt(root, NODATASUM)) {
444d399167dSQu Wenruo 				if (btrfs_test_opt(root, NODATACOW))
445d399167dSQu Wenruo 					btrfs_info(root->fs_info, "setting datasum, datacow enabled");
446d399167dSQu Wenruo 				else
447d399167dSQu Wenruo 					btrfs_info(root->fs_info, "setting datasum");
44807802534SQu Wenruo 			}
449d399167dSQu Wenruo 			btrfs_clear_opt(info->mount_opt, NODATACOW);
450d399167dSQu Wenruo 			btrfs_clear_opt(info->mount_opt, NODATASUM);
451d399167dSQu Wenruo 			break;
452be20aa9dSChris Mason 		case Opt_nodatacow:
45307802534SQu Wenruo 			if (!btrfs_test_opt(root, NODATACOW)) {
454bedb2ccaSAndrei Popa 				if (!btrfs_test_opt(root, COMPRESS) ||
455bedb2ccaSAndrei Popa 				    !btrfs_test_opt(root, FORCE_COMPRESS)) {
456efe120a0SFrank Holton 					btrfs_info(root->fs_info,
457efe120a0SFrank Holton 						   "setting nodatacow, compression disabled");
458bedb2ccaSAndrei Popa 				} else {
459efe120a0SFrank Holton 					btrfs_info(root->fs_info, "setting nodatacow");
460bedb2ccaSAndrei Popa 				}
46107802534SQu Wenruo 			}
462bedb2ccaSAndrei Popa 			btrfs_clear_opt(info->mount_opt, COMPRESS);
463bedb2ccaSAndrei Popa 			btrfs_clear_opt(info->mount_opt, FORCE_COMPRESS);
464be20aa9dSChris Mason 			btrfs_set_opt(info->mount_opt, NODATACOW);
465be20aa9dSChris Mason 			btrfs_set_opt(info->mount_opt, NODATASUM);
466b6cda9bcSChris Mason 			break;
467a258af7aSQu Wenruo 		case Opt_datacow:
46807802534SQu Wenruo 			btrfs_clear_and_info(root, NODATACOW,
46907802534SQu Wenruo 					     "setting datacow");
470a258af7aSQu Wenruo 			break;
471a555f810SChris Mason 		case Opt_compress_force:
472261507a0SLi Zefan 		case Opt_compress_force_type:
473261507a0SLi Zefan 			compress_force = true;
4741c697d4aSEric Sandeen 			/* Fallthrough */
475261507a0SLi Zefan 		case Opt_compress:
476261507a0SLi Zefan 		case Opt_compress_type:
477b7c47bbbSTsutomu Itoh 			saved_compress_type = btrfs_test_opt(root, COMPRESS) ?
478b7c47bbbSTsutomu Itoh 				info->compress_type : BTRFS_COMPRESS_NONE;
479b7c47bbbSTsutomu Itoh 			saved_compress_force =
480b7c47bbbSTsutomu Itoh 				btrfs_test_opt(root, FORCE_COMPRESS);
481261507a0SLi Zefan 			if (token == Opt_compress ||
482261507a0SLi Zefan 			    token == Opt_compress_force ||
483261507a0SLi Zefan 			    strcmp(args[0].from, "zlib") == 0) {
484261507a0SLi Zefan 				compress_type = "zlib";
485261507a0SLi Zefan 				info->compress_type = BTRFS_COMPRESS_ZLIB;
486063849eaSArnd Hannemann 				btrfs_set_opt(info->mount_opt, COMPRESS);
487bedb2ccaSAndrei Popa 				btrfs_clear_opt(info->mount_opt, NODATACOW);
488bedb2ccaSAndrei Popa 				btrfs_clear_opt(info->mount_opt, NODATASUM);
489b7c47bbbSTsutomu Itoh 				no_compress = 0;
490a6fa6faeSLi Zefan 			} else if (strcmp(args[0].from, "lzo") == 0) {
491a6fa6faeSLi Zefan 				compress_type = "lzo";
492a6fa6faeSLi Zefan 				info->compress_type = BTRFS_COMPRESS_LZO;
493063849eaSArnd Hannemann 				btrfs_set_opt(info->mount_opt, COMPRESS);
494bedb2ccaSAndrei Popa 				btrfs_clear_opt(info->mount_opt, NODATACOW);
495bedb2ccaSAndrei Popa 				btrfs_clear_opt(info->mount_opt, NODATASUM);
4962b0ce2c2SMitch Harder 				btrfs_set_fs_incompat(info, COMPRESS_LZO);
497b7c47bbbSTsutomu Itoh 				no_compress = 0;
498063849eaSArnd Hannemann 			} else if (strncmp(args[0].from, "no", 2) == 0) {
499063849eaSArnd Hannemann 				compress_type = "no";
500063849eaSArnd Hannemann 				btrfs_clear_opt(info->mount_opt, COMPRESS);
501063849eaSArnd Hannemann 				btrfs_clear_opt(info->mount_opt, FORCE_COMPRESS);
502063849eaSArnd Hannemann 				compress_force = false;
503b7c47bbbSTsutomu Itoh 				no_compress++;
504261507a0SLi Zefan 			} else {
505261507a0SLi Zefan 				ret = -EINVAL;
506261507a0SLi Zefan 				goto out;
507261507a0SLi Zefan 			}
508261507a0SLi Zefan 
509261507a0SLi Zefan 			if (compress_force) {
510b7c47bbbSTsutomu Itoh 				btrfs_set_opt(info->mount_opt, FORCE_COMPRESS);
511143f3636SDavid Sterba 			} else {
5124027e0f4SWang Shilong 				/*
5134027e0f4SWang Shilong 				 * If we remount from compress-force=xxx to
5144027e0f4SWang Shilong 				 * compress=xxx, we need clear FORCE_COMPRESS
5154027e0f4SWang Shilong 				 * flag, otherwise, there is no way for users
5164027e0f4SWang Shilong 				 * to disable forcible compression separately.
5174027e0f4SWang Shilong 				 */
5184027e0f4SWang Shilong 				btrfs_clear_opt(info->mount_opt, FORCE_COMPRESS);
519a7e252afSMiao Xie 			}
520b7c47bbbSTsutomu Itoh 			if ((btrfs_test_opt(root, COMPRESS) &&
521b7c47bbbSTsutomu Itoh 			     (info->compress_type != saved_compress_type ||
522b7c47bbbSTsutomu Itoh 			      compress_force != saved_compress_force)) ||
523b7c47bbbSTsutomu Itoh 			    (!btrfs_test_opt(root, COMPRESS) &&
524b7c47bbbSTsutomu Itoh 			     no_compress == 1)) {
525b7c47bbbSTsutomu Itoh 				btrfs_info(root->fs_info,
526b7c47bbbSTsutomu Itoh 					   "%s %s compression",
527b7c47bbbSTsutomu Itoh 					   (compress_force) ? "force" : "use",
528b7c47bbbSTsutomu Itoh 					   compress_type);
529b7c47bbbSTsutomu Itoh 			}
530b7c47bbbSTsutomu Itoh 			compress_force = false;
531a555f810SChris Mason 			break;
532e18e4809SChris Mason 		case Opt_ssd:
53307802534SQu Wenruo 			btrfs_set_and_info(root, SSD,
53407802534SQu Wenruo 					   "use ssd allocation scheme");
535e18e4809SChris Mason 			break;
536451d7585SChris Mason 		case Opt_ssd_spread:
53707802534SQu Wenruo 			btrfs_set_and_info(root, SSD_SPREAD,
53807802534SQu Wenruo 					   "use spread ssd allocation scheme");
5392aa06a35SEric Sandeen 			btrfs_set_opt(info->mount_opt, SSD);
540451d7585SChris Mason 			break;
5413b30c22fSChris Mason 		case Opt_nossd:
5422aa06a35SEric Sandeen 			btrfs_set_and_info(root, NOSSD,
54307802534SQu Wenruo 					     "not using ssd allocation scheme");
5443b30c22fSChris Mason 			btrfs_clear_opt(info->mount_opt, SSD);
5453b30c22fSChris Mason 			break;
546842bef58SQu Wenruo 		case Opt_barrier:
54707802534SQu Wenruo 			btrfs_clear_and_info(root, NOBARRIER,
54807802534SQu Wenruo 					     "turning on barriers");
549842bef58SQu Wenruo 			break;
55021ad10cfSChris Mason 		case Opt_nobarrier:
55107802534SQu Wenruo 			btrfs_set_and_info(root, NOBARRIER,
55207802534SQu Wenruo 					   "turning off barriers");
55321ad10cfSChris Mason 			break;
5544543df7eSChris Mason 		case Opt_thread_pool:
5552c334e87SWang Shilong 			ret = match_int(&args[0], &intarg);
5562c334e87SWang Shilong 			if (ret) {
5572c334e87SWang Shilong 				goto out;
5582c334e87SWang Shilong 			} else if (intarg > 0) {
5594543df7eSChris Mason 				info->thread_pool_size = intarg;
5602c334e87SWang Shilong 			} else {
5612c334e87SWang Shilong 				ret = -EINVAL;
5622c334e87SWang Shilong 				goto out;
5632c334e87SWang Shilong 			}
5644543df7eSChris Mason 			break;
5656f568d35SChris Mason 		case Opt_max_inline:
566edf24abeSChristoph Hellwig 			num = match_strdup(&args[0]);
5676f568d35SChris Mason 			if (num) {
56891748467SAkinobu Mita 				info->max_inline = memparse(num, NULL);
5696f568d35SChris Mason 				kfree(num);
5706f568d35SChris Mason 
57115ada040SChris Mason 				if (info->max_inline) {
572feb5f965SMitch Harder 					info->max_inline = min_t(u64,
57315ada040SChris Mason 						info->max_inline,
57415ada040SChris Mason 						root->sectorsize);
57515ada040SChris Mason 				}
576efe120a0SFrank Holton 				btrfs_info(root->fs_info, "max_inline at %llu",
577c1c9ff7cSGeert Uytterhoeven 					info->max_inline);
5782c334e87SWang Shilong 			} else {
5792c334e87SWang Shilong 				ret = -ENOMEM;
5802c334e87SWang Shilong 				goto out;
5816f568d35SChris Mason 			}
5826f568d35SChris Mason 			break;
5838f662a76SChris Mason 		case Opt_alloc_start:
584edf24abeSChristoph Hellwig 			num = match_strdup(&args[0]);
5858f662a76SChris Mason 			if (num) {
586c018daecSMiao Xie 				mutex_lock(&info->chunk_mutex);
58791748467SAkinobu Mita 				info->alloc_start = memparse(num, NULL);
588c018daecSMiao Xie 				mutex_unlock(&info->chunk_mutex);
5898f662a76SChris Mason 				kfree(num);
590efe120a0SFrank Holton 				btrfs_info(root->fs_info, "allocations start at %llu",
591c1c9ff7cSGeert Uytterhoeven 					info->alloc_start);
5922c334e87SWang Shilong 			} else {
5932c334e87SWang Shilong 				ret = -ENOMEM;
5942c334e87SWang Shilong 				goto out;
5958f662a76SChris Mason 			}
5968f662a76SChris Mason 			break;
597bd0330adSQu Wenruo 		case Opt_acl:
59845ff35d6SGuangliang Zhao #ifdef CONFIG_BTRFS_FS_POSIX_ACL
599bd0330adSQu Wenruo 			root->fs_info->sb->s_flags |= MS_POSIXACL;
600bd0330adSQu Wenruo 			break;
60145ff35d6SGuangliang Zhao #else
60245ff35d6SGuangliang Zhao 			btrfs_err(root->fs_info,
60345ff35d6SGuangliang Zhao 				"support for ACL not compiled in!");
60445ff35d6SGuangliang Zhao 			ret = -EINVAL;
60545ff35d6SGuangliang Zhao 			goto out;
60645ff35d6SGuangliang Zhao #endif
60733268eafSJosef Bacik 		case Opt_noacl:
60833268eafSJosef Bacik 			root->fs_info->sb->s_flags &= ~MS_POSIXACL;
60933268eafSJosef Bacik 			break;
6103a5e1404SSage Weil 		case Opt_notreelog:
61107802534SQu Wenruo 			btrfs_set_and_info(root, NOTREELOG,
61207802534SQu Wenruo 					   "disabling tree log");
6133a5e1404SSage Weil 			break;
614a88998f2SQu Wenruo 		case Opt_treelog:
61507802534SQu Wenruo 			btrfs_clear_and_info(root, NOTREELOG,
61607802534SQu Wenruo 					     "enabling tree log");
617a88998f2SQu Wenruo 			break;
618fed8f166SQu Wenruo 		case Opt_norecovery:
61996da0919SQu Wenruo 		case Opt_nologreplay:
62096da0919SQu Wenruo 			btrfs_set_and_info(root, NOLOGREPLAY,
62196da0919SQu Wenruo 					   "disabling log replay at mount time");
62296da0919SQu Wenruo 			break;
623dccae999SSage Weil 		case Opt_flushoncommit:
62407802534SQu Wenruo 			btrfs_set_and_info(root, FLUSHONCOMMIT,
62507802534SQu Wenruo 					   "turning on flush-on-commit");
626dccae999SSage Weil 			break;
6272c9ee856SQu Wenruo 		case Opt_noflushoncommit:
62807802534SQu Wenruo 			btrfs_clear_and_info(root, FLUSHONCOMMIT,
62907802534SQu Wenruo 					     "turning off flush-on-commit");
6302c9ee856SQu Wenruo 			break;
63197e728d4SJosef Bacik 		case Opt_ratio:
6322c334e87SWang Shilong 			ret = match_int(&args[0], &intarg);
6332c334e87SWang Shilong 			if (ret) {
6342c334e87SWang Shilong 				goto out;
6352c334e87SWang Shilong 			} else if (intarg >= 0) {
63697e728d4SJosef Bacik 				info->metadata_ratio = intarg;
637efe120a0SFrank Holton 				btrfs_info(root->fs_info, "metadata ratio %d",
63897e728d4SJosef Bacik 				       info->metadata_ratio);
6392c334e87SWang Shilong 			} else {
6402c334e87SWang Shilong 				ret = -EINVAL;
6412c334e87SWang Shilong 				goto out;
64297e728d4SJosef Bacik 			}
64397e728d4SJosef Bacik 			break;
644e244a0aeSChristoph Hellwig 		case Opt_discard:
64507802534SQu Wenruo 			btrfs_set_and_info(root, DISCARD,
64607802534SQu Wenruo 					   "turning on discard");
647e244a0aeSChristoph Hellwig 			break;
648e07a2adeSQu Wenruo 		case Opt_nodiscard:
64907802534SQu Wenruo 			btrfs_clear_and_info(root, DISCARD,
65007802534SQu Wenruo 					     "turning off discard");
651e07a2adeSQu Wenruo 			break;
6520af3d00bSJosef Bacik 		case Opt_space_cache:
65370f6d82eSOmar Sandoval 		case Opt_space_cache_version:
65470f6d82eSOmar Sandoval 			if (token == Opt_space_cache ||
65570f6d82eSOmar Sandoval 			    strcmp(args[0].from, "v1") == 0) {
65670f6d82eSOmar Sandoval 				btrfs_clear_opt(root->fs_info->mount_opt,
65770f6d82eSOmar Sandoval 						FREE_SPACE_TREE);
65807802534SQu Wenruo 				btrfs_set_and_info(root, SPACE_CACHE,
65907802534SQu Wenruo 						   "enabling disk space caching");
66070f6d82eSOmar Sandoval 			} else if (strcmp(args[0].from, "v2") == 0) {
66170f6d82eSOmar Sandoval 				btrfs_clear_opt(root->fs_info->mount_opt,
66270f6d82eSOmar Sandoval 						SPACE_CACHE);
66370f6d82eSOmar Sandoval 				btrfs_set_and_info(root, FREE_SPACE_TREE,
66470f6d82eSOmar Sandoval 						   "enabling free space tree");
66570f6d82eSOmar Sandoval 			} else {
66670f6d82eSOmar Sandoval 				ret = -EINVAL;
66770f6d82eSOmar Sandoval 				goto out;
66870f6d82eSOmar Sandoval 			}
6690de90876SJosef Bacik 			break;
670f420ee1eSStefan Behrens 		case Opt_rescan_uuid_tree:
671f420ee1eSStefan Behrens 			btrfs_set_opt(info->mount_opt, RESCAN_UUID_TREE);
672f420ee1eSStefan Behrens 			break;
67373bc1876SJosef Bacik 		case Opt_no_space_cache:
67470f6d82eSOmar Sandoval 			if (btrfs_test_opt(root, SPACE_CACHE)) {
67507802534SQu Wenruo 				btrfs_clear_and_info(root, SPACE_CACHE,
67607802534SQu Wenruo 						     "disabling disk space caching");
67770f6d82eSOmar Sandoval 			}
67870f6d82eSOmar Sandoval 			if (btrfs_test_opt(root, FREE_SPACE_TREE)) {
67970f6d82eSOmar Sandoval 				btrfs_clear_and_info(root, FREE_SPACE_TREE,
68070f6d82eSOmar Sandoval 						     "disabling free space tree");
68170f6d82eSOmar Sandoval 			}
68273bc1876SJosef Bacik 			break;
6834b9465cbSChris Mason 		case Opt_inode_cache:
6847e1876acSDavid Sterba 			btrfs_set_pending_and_info(info, INODE_MAP_CACHE,
68507802534SQu Wenruo 					   "enabling inode map caching");
6863818aea2SQu Wenruo 			break;
6873818aea2SQu Wenruo 		case Opt_noinode_cache:
6887e1876acSDavid Sterba 			btrfs_clear_pending_and_info(info, INODE_MAP_CACHE,
68907802534SQu Wenruo 					     "disabling inode map caching");
6904b9465cbSChris Mason 			break;
69188c2ba3bSJosef Bacik 		case Opt_clear_cache:
69207802534SQu Wenruo 			btrfs_set_and_info(root, CLEAR_CACHE,
69307802534SQu Wenruo 					   "force clearing of disk cache");
6940af3d00bSJosef Bacik 			break;
6954260f7c7SSage Weil 		case Opt_user_subvol_rm_allowed:
6964260f7c7SSage Weil 			btrfs_set_opt(info->mount_opt, USER_SUBVOL_RM_ALLOWED);
6974260f7c7SSage Weil 			break;
69891435650SChris Mason 		case Opt_enospc_debug:
69991435650SChris Mason 			btrfs_set_opt(info->mount_opt, ENOSPC_DEBUG);
70091435650SChris Mason 			break;
70153036293SQu Wenruo 		case Opt_noenospc_debug:
70253036293SQu Wenruo 			btrfs_clear_opt(info->mount_opt, ENOSPC_DEBUG);
70353036293SQu Wenruo 			break;
7044cb5300bSChris Mason 		case Opt_defrag:
70507802534SQu Wenruo 			btrfs_set_and_info(root, AUTO_DEFRAG,
70607802534SQu Wenruo 					   "enabling auto defrag");
7074cb5300bSChris Mason 			break;
708fc0ca9afSQu Wenruo 		case Opt_nodefrag:
70907802534SQu Wenruo 			btrfs_clear_and_info(root, AUTO_DEFRAG,
71007802534SQu Wenruo 					     "disabling auto defrag");
711fc0ca9afSQu Wenruo 			break;
712af31f5e5SChris Mason 		case Opt_recovery:
7138dcddfa0SQu Wenruo 			btrfs_warn(root->fs_info,
7148dcddfa0SQu Wenruo 				   "'recovery' is deprecated, use 'usebackuproot' instead");
7158dcddfa0SQu Wenruo 		case Opt_usebackuproot:
7168dcddfa0SQu Wenruo 			btrfs_info(root->fs_info,
7178dcddfa0SQu Wenruo 				   "trying to use backup root at mount time");
7188dcddfa0SQu Wenruo 			btrfs_set_opt(info->mount_opt, USEBACKUPROOT);
719af31f5e5SChris Mason 			break;
7209555c6c1SIlya Dryomov 		case Opt_skip_balance:
7219555c6c1SIlya Dryomov 			btrfs_set_opt(info->mount_opt, SKIP_BALANCE);
7229555c6c1SIlya Dryomov 			break;
72321adbd5cSStefan Behrens #ifdef CONFIG_BTRFS_FS_CHECK_INTEGRITY
72421adbd5cSStefan Behrens 		case Opt_check_integrity_including_extent_data:
725efe120a0SFrank Holton 			btrfs_info(root->fs_info,
726efe120a0SFrank Holton 				   "enabling check integrity including extent data");
72721adbd5cSStefan Behrens 			btrfs_set_opt(info->mount_opt,
72821adbd5cSStefan Behrens 				      CHECK_INTEGRITY_INCLUDING_EXTENT_DATA);
72921adbd5cSStefan Behrens 			btrfs_set_opt(info->mount_opt, CHECK_INTEGRITY);
73021adbd5cSStefan Behrens 			break;
73121adbd5cSStefan Behrens 		case Opt_check_integrity:
732efe120a0SFrank Holton 			btrfs_info(root->fs_info, "enabling check integrity");
73321adbd5cSStefan Behrens 			btrfs_set_opt(info->mount_opt, CHECK_INTEGRITY);
73421adbd5cSStefan Behrens 			break;
73521adbd5cSStefan Behrens 		case Opt_check_integrity_print_mask:
7362c334e87SWang Shilong 			ret = match_int(&args[0], &intarg);
7372c334e87SWang Shilong 			if (ret) {
7382c334e87SWang Shilong 				goto out;
7392c334e87SWang Shilong 			} else if (intarg >= 0) {
74021adbd5cSStefan Behrens 				info->check_integrity_print_mask = intarg;
741efe120a0SFrank Holton 				btrfs_info(root->fs_info, "check_integrity_print_mask 0x%x",
74221adbd5cSStefan Behrens 				       info->check_integrity_print_mask);
7432c334e87SWang Shilong 			} else {
7442c334e87SWang Shilong 				ret = -EINVAL;
7452c334e87SWang Shilong 				goto out;
74621adbd5cSStefan Behrens 			}
74721adbd5cSStefan Behrens 			break;
74821adbd5cSStefan Behrens #else
74921adbd5cSStefan Behrens 		case Opt_check_integrity_including_extent_data:
75021adbd5cSStefan Behrens 		case Opt_check_integrity:
75121adbd5cSStefan Behrens 		case Opt_check_integrity_print_mask:
752efe120a0SFrank Holton 			btrfs_err(root->fs_info,
753efe120a0SFrank Holton 				"support for check_integrity* not compiled in!");
75421adbd5cSStefan Behrens 			ret = -EINVAL;
75521adbd5cSStefan Behrens 			goto out;
75621adbd5cSStefan Behrens #endif
7578c342930SJeff Mahoney 		case Opt_fatal_errors:
7588c342930SJeff Mahoney 			if (strcmp(args[0].from, "panic") == 0)
7598c342930SJeff Mahoney 				btrfs_set_opt(info->mount_opt,
7608c342930SJeff Mahoney 					      PANIC_ON_FATAL_ERROR);
7618c342930SJeff Mahoney 			else if (strcmp(args[0].from, "bug") == 0)
7628c342930SJeff Mahoney 				btrfs_clear_opt(info->mount_opt,
7638c342930SJeff Mahoney 					      PANIC_ON_FATAL_ERROR);
7648c342930SJeff Mahoney 			else {
7658c342930SJeff Mahoney 				ret = -EINVAL;
7668c342930SJeff Mahoney 				goto out;
7678c342930SJeff Mahoney 			}
7688c342930SJeff Mahoney 			break;
7698b87dc17SDavid Sterba 		case Opt_commit_interval:
7708b87dc17SDavid Sterba 			intarg = 0;
7718b87dc17SDavid Sterba 			ret = match_int(&args[0], &intarg);
7728b87dc17SDavid Sterba 			if (ret < 0) {
773efe120a0SFrank Holton 				btrfs_err(root->fs_info, "invalid commit interval");
7748b87dc17SDavid Sterba 				ret = -EINVAL;
7758b87dc17SDavid Sterba 				goto out;
7768b87dc17SDavid Sterba 			}
7778b87dc17SDavid Sterba 			if (intarg > 0) {
7788b87dc17SDavid Sterba 				if (intarg > 300) {
779efe120a0SFrank Holton 					btrfs_warn(root->fs_info, "excessive commit interval %d",
7808b87dc17SDavid Sterba 							intarg);
7818b87dc17SDavid Sterba 				}
7828b87dc17SDavid Sterba 				info->commit_interval = intarg;
7838b87dc17SDavid Sterba 			} else {
784efe120a0SFrank Holton 				btrfs_info(root->fs_info, "using default commit interval %ds",
7858b87dc17SDavid Sterba 				    BTRFS_DEFAULT_COMMIT_INTERVAL);
7868b87dc17SDavid Sterba 				info->commit_interval = BTRFS_DEFAULT_COMMIT_INTERVAL;
7878b87dc17SDavid Sterba 			}
7888b87dc17SDavid Sterba 			break;
789d0bd4560SJosef Bacik #ifdef CONFIG_BTRFS_DEBUG
790d0bd4560SJosef Bacik 		case Opt_fragment_all:
791d0bd4560SJosef Bacik 			btrfs_info(root->fs_info, "fragmenting all space");
792d0bd4560SJosef Bacik 			btrfs_set_opt(info->mount_opt, FRAGMENT_DATA);
793d0bd4560SJosef Bacik 			btrfs_set_opt(info->mount_opt, FRAGMENT_METADATA);
794d0bd4560SJosef Bacik 			break;
795d0bd4560SJosef Bacik 		case Opt_fragment_metadata:
796d0bd4560SJosef Bacik 			btrfs_info(root->fs_info, "fragmenting metadata");
797d0bd4560SJosef Bacik 			btrfs_set_opt(info->mount_opt,
798d0bd4560SJosef Bacik 				      FRAGMENT_METADATA);
799d0bd4560SJosef Bacik 			break;
800d0bd4560SJosef Bacik 		case Opt_fragment_data:
801d0bd4560SJosef Bacik 			btrfs_info(root->fs_info, "fragmenting data");
802d0bd4560SJosef Bacik 			btrfs_set_opt(info->mount_opt, FRAGMENT_DATA);
803d0bd4560SJosef Bacik 			break;
804d0bd4560SJosef Bacik #endif
805a7a3f7caSSage Weil 		case Opt_err:
806efe120a0SFrank Holton 			btrfs_info(root->fs_info, "unrecognized mount option '%s'", p);
807a7a3f7caSSage Weil 			ret = -EINVAL;
808a7a3f7caSSage Weil 			goto out;
80995e05289SChris Mason 		default:
810be20aa9dSChris Mason 			break;
81195e05289SChris Mason 		}
81295e05289SChris Mason 	}
81396da0919SQu Wenruo check:
81496da0919SQu Wenruo 	/*
81596da0919SQu Wenruo 	 * Extra check for current option against current flag
81696da0919SQu Wenruo 	 */
81796da0919SQu Wenruo 	if (btrfs_test_opt(root, NOLOGREPLAY) && !(new_flags & MS_RDONLY)) {
81896da0919SQu Wenruo 		btrfs_err(root->fs_info,
81996da0919SQu Wenruo 			  "nologreplay must be used with ro mount option");
82096da0919SQu Wenruo 		ret = -EINVAL;
82196da0919SQu Wenruo 	}
822a7a3f7caSSage Weil out:
82370f6d82eSOmar Sandoval 	if (btrfs_fs_compat_ro(root->fs_info, FREE_SPACE_TREE) &&
82470f6d82eSOmar Sandoval 	    !btrfs_test_opt(root, FREE_SPACE_TREE) &&
82570f6d82eSOmar Sandoval 	    !btrfs_test_opt(root, CLEAR_CACHE)) {
82670f6d82eSOmar Sandoval 		btrfs_err(root->fs_info, "cannot disable free space tree");
82770f6d82eSOmar Sandoval 		ret = -EINVAL;
82870f6d82eSOmar Sandoval 
82970f6d82eSOmar Sandoval 	}
83073bc1876SJosef Bacik 	if (!ret && btrfs_test_opt(root, SPACE_CACHE))
831efe120a0SFrank Holton 		btrfs_info(root->fs_info, "disk space caching is enabled");
83270f6d82eSOmar Sandoval 	if (!ret && btrfs_test_opt(root, FREE_SPACE_TREE))
83370f6d82eSOmar Sandoval 		btrfs_info(root->fs_info, "using free space tree");
834da495eccSJosef Bacik 	kfree(orig);
835a7a3f7caSSage Weil 	return ret;
836edf24abeSChristoph Hellwig }
837edf24abeSChristoph Hellwig 
838edf24abeSChristoph Hellwig /*
839edf24abeSChristoph Hellwig  * Parse mount options that are required early in the mount process.
840edf24abeSChristoph Hellwig  *
841edf24abeSChristoph Hellwig  * All other options will be parsed on much later in the mount process and
842edf24abeSChristoph Hellwig  * only when we need to allocate a new super block.
843edf24abeSChristoph Hellwig  */
84497288f2cSChristoph Hellwig static int btrfs_parse_early_options(const char *options, fmode_t flags,
84573f73415SJosef Bacik 		void *holder, char **subvol_name, u64 *subvol_objectid,
8465e2a4b25SDavid Sterba 		struct btrfs_fs_devices **fs_devices)
847edf24abeSChristoph Hellwig {
848edf24abeSChristoph Hellwig 	substring_t args[MAX_OPT_ARGS];
84983c8c9bdSJeff Liu 	char *device_name, *opts, *orig, *p;
8501493381fSWang Shilong 	char *num = NULL;
851edf24abeSChristoph Hellwig 	int error = 0;
852edf24abeSChristoph Hellwig 
853edf24abeSChristoph Hellwig 	if (!options)
854830c4adbSJosef Bacik 		return 0;
855edf24abeSChristoph Hellwig 
856edf24abeSChristoph Hellwig 	/*
857edf24abeSChristoph Hellwig 	 * strsep changes the string, duplicate it because parse_options
858edf24abeSChristoph Hellwig 	 * gets called twice
859edf24abeSChristoph Hellwig 	 */
860edf24abeSChristoph Hellwig 	opts = kstrdup(options, GFP_KERNEL);
861edf24abeSChristoph Hellwig 	if (!opts)
862edf24abeSChristoph Hellwig 		return -ENOMEM;
8633f3d0bc0STero Roponen 	orig = opts;
864edf24abeSChristoph Hellwig 
865edf24abeSChristoph Hellwig 	while ((p = strsep(&opts, ",")) != NULL) {
866edf24abeSChristoph Hellwig 		int token;
867edf24abeSChristoph Hellwig 		if (!*p)
868edf24abeSChristoph Hellwig 			continue;
869edf24abeSChristoph Hellwig 
870edf24abeSChristoph Hellwig 		token = match_token(p, tokens, args);
871edf24abeSChristoph Hellwig 		switch (token) {
872edf24abeSChristoph Hellwig 		case Opt_subvol:
873a90e8b6fSIlya Dryomov 			kfree(*subvol_name);
874edf24abeSChristoph Hellwig 			*subvol_name = match_strdup(&args[0]);
8752c334e87SWang Shilong 			if (!*subvol_name) {
8762c334e87SWang Shilong 				error = -ENOMEM;
8772c334e87SWang Shilong 				goto out;
8782c334e87SWang Shilong 			}
879edf24abeSChristoph Hellwig 			break;
88073f73415SJosef Bacik 		case Opt_subvolid:
8811493381fSWang Shilong 			num = match_strdup(&args[0]);
8821493381fSWang Shilong 			if (num) {
8831493381fSWang Shilong 				*subvol_objectid = memparse(num, NULL);
8841493381fSWang Shilong 				kfree(num);
8854849f01dSJosef Bacik 				/* we want the original fs_tree */
8861493381fSWang Shilong 				if (!*subvol_objectid)
8874849f01dSJosef Bacik 					*subvol_objectid =
8884849f01dSJosef Bacik 						BTRFS_FS_TREE_OBJECTID;
8892c334e87SWang Shilong 			} else {
8902c334e87SWang Shilong 				error = -EINVAL;
8912c334e87SWang Shilong 				goto out;
8924849f01dSJosef Bacik 			}
89373f73415SJosef Bacik 			break;
894e15d0542SXin Zhong 		case Opt_subvolrootid:
8955e2a4b25SDavid Sterba 			printk(KERN_WARNING
896efe120a0SFrank Holton 				"BTRFS: 'subvolrootid' mount option is deprecated and has "
897efe120a0SFrank Holton 				"no effect\n");
898e15d0542SXin Zhong 			break;
89943e570b0SChristoph Hellwig 		case Opt_device:
90083c8c9bdSJeff Liu 			device_name = match_strdup(&args[0]);
90183c8c9bdSJeff Liu 			if (!device_name) {
90283c8c9bdSJeff Liu 				error = -ENOMEM;
90383c8c9bdSJeff Liu 				goto out;
90483c8c9bdSJeff Liu 			}
90583c8c9bdSJeff Liu 			error = btrfs_scan_one_device(device_name,
90643e570b0SChristoph Hellwig 					flags, holder, fs_devices);
90783c8c9bdSJeff Liu 			kfree(device_name);
90843e570b0SChristoph Hellwig 			if (error)
909830c4adbSJosef Bacik 				goto out;
91043e570b0SChristoph Hellwig 			break;
911edf24abeSChristoph Hellwig 		default:
912edf24abeSChristoph Hellwig 			break;
913edf24abeSChristoph Hellwig 		}
914edf24abeSChristoph Hellwig 	}
915edf24abeSChristoph Hellwig 
916edf24abeSChristoph Hellwig out:
917830c4adbSJosef Bacik 	kfree(orig);
918edf24abeSChristoph Hellwig 	return error;
91995e05289SChris Mason }
92095e05289SChris Mason 
92105dbe683SOmar Sandoval static char *get_subvol_name_from_objectid(struct btrfs_fs_info *fs_info,
92273f73415SJosef Bacik 					   u64 subvol_objectid)
92373f73415SJosef Bacik {
924815745cfSAl Viro 	struct btrfs_root *root = fs_info->tree_root;
92505dbe683SOmar Sandoval 	struct btrfs_root *fs_root;
92605dbe683SOmar Sandoval 	struct btrfs_root_ref *root_ref;
92705dbe683SOmar Sandoval 	struct btrfs_inode_ref *inode_ref;
92805dbe683SOmar Sandoval 	struct btrfs_key key;
92905dbe683SOmar Sandoval 	struct btrfs_path *path = NULL;
93005dbe683SOmar Sandoval 	char *name = NULL, *ptr;
93105dbe683SOmar Sandoval 	u64 dirid;
93205dbe683SOmar Sandoval 	int len;
93305dbe683SOmar Sandoval 	int ret;
93405dbe683SOmar Sandoval 
93505dbe683SOmar Sandoval 	path = btrfs_alloc_path();
93605dbe683SOmar Sandoval 	if (!path) {
93705dbe683SOmar Sandoval 		ret = -ENOMEM;
93805dbe683SOmar Sandoval 		goto err;
93905dbe683SOmar Sandoval 	}
94005dbe683SOmar Sandoval 	path->leave_spinning = 1;
94105dbe683SOmar Sandoval 
94205dbe683SOmar Sandoval 	name = kmalloc(PATH_MAX, GFP_NOFS);
94305dbe683SOmar Sandoval 	if (!name) {
94405dbe683SOmar Sandoval 		ret = -ENOMEM;
94505dbe683SOmar Sandoval 		goto err;
94605dbe683SOmar Sandoval 	}
94705dbe683SOmar Sandoval 	ptr = name + PATH_MAX - 1;
94805dbe683SOmar Sandoval 	ptr[0] = '\0';
94905dbe683SOmar Sandoval 
95005dbe683SOmar Sandoval 	/*
95105dbe683SOmar Sandoval 	 * Walk up the subvolume trees in the tree of tree roots by root
95205dbe683SOmar Sandoval 	 * backrefs until we hit the top-level subvolume.
95305dbe683SOmar Sandoval 	 */
95405dbe683SOmar Sandoval 	while (subvol_objectid != BTRFS_FS_TREE_OBJECTID) {
95505dbe683SOmar Sandoval 		key.objectid = subvol_objectid;
95605dbe683SOmar Sandoval 		key.type = BTRFS_ROOT_BACKREF_KEY;
95705dbe683SOmar Sandoval 		key.offset = (u64)-1;
95805dbe683SOmar Sandoval 
95905dbe683SOmar Sandoval 		ret = btrfs_search_slot(NULL, root, &key, path, 0, 0);
96005dbe683SOmar Sandoval 		if (ret < 0) {
96105dbe683SOmar Sandoval 			goto err;
96205dbe683SOmar Sandoval 		} else if (ret > 0) {
96305dbe683SOmar Sandoval 			ret = btrfs_previous_item(root, path, subvol_objectid,
96405dbe683SOmar Sandoval 						  BTRFS_ROOT_BACKREF_KEY);
96505dbe683SOmar Sandoval 			if (ret < 0) {
96605dbe683SOmar Sandoval 				goto err;
96705dbe683SOmar Sandoval 			} else if (ret > 0) {
96805dbe683SOmar Sandoval 				ret = -ENOENT;
96905dbe683SOmar Sandoval 				goto err;
97005dbe683SOmar Sandoval 			}
97105dbe683SOmar Sandoval 		}
97205dbe683SOmar Sandoval 
97305dbe683SOmar Sandoval 		btrfs_item_key_to_cpu(path->nodes[0], &key, path->slots[0]);
97405dbe683SOmar Sandoval 		subvol_objectid = key.offset;
97505dbe683SOmar Sandoval 
97605dbe683SOmar Sandoval 		root_ref = btrfs_item_ptr(path->nodes[0], path->slots[0],
97705dbe683SOmar Sandoval 					  struct btrfs_root_ref);
97805dbe683SOmar Sandoval 		len = btrfs_root_ref_name_len(path->nodes[0], root_ref);
97905dbe683SOmar Sandoval 		ptr -= len + 1;
98005dbe683SOmar Sandoval 		if (ptr < name) {
98105dbe683SOmar Sandoval 			ret = -ENAMETOOLONG;
98205dbe683SOmar Sandoval 			goto err;
98305dbe683SOmar Sandoval 		}
98405dbe683SOmar Sandoval 		read_extent_buffer(path->nodes[0], ptr + 1,
98505dbe683SOmar Sandoval 				   (unsigned long)(root_ref + 1), len);
98605dbe683SOmar Sandoval 		ptr[0] = '/';
98705dbe683SOmar Sandoval 		dirid = btrfs_root_ref_dirid(path->nodes[0], root_ref);
98805dbe683SOmar Sandoval 		btrfs_release_path(path);
98905dbe683SOmar Sandoval 
99005dbe683SOmar Sandoval 		key.objectid = subvol_objectid;
99105dbe683SOmar Sandoval 		key.type = BTRFS_ROOT_ITEM_KEY;
99205dbe683SOmar Sandoval 		key.offset = (u64)-1;
99305dbe683SOmar Sandoval 		fs_root = btrfs_read_fs_root_no_name(fs_info, &key);
99405dbe683SOmar Sandoval 		if (IS_ERR(fs_root)) {
99505dbe683SOmar Sandoval 			ret = PTR_ERR(fs_root);
99605dbe683SOmar Sandoval 			goto err;
99705dbe683SOmar Sandoval 		}
99805dbe683SOmar Sandoval 
99905dbe683SOmar Sandoval 		/*
100005dbe683SOmar Sandoval 		 * Walk up the filesystem tree by inode refs until we hit the
100105dbe683SOmar Sandoval 		 * root directory.
100205dbe683SOmar Sandoval 		 */
100305dbe683SOmar Sandoval 		while (dirid != BTRFS_FIRST_FREE_OBJECTID) {
100405dbe683SOmar Sandoval 			key.objectid = dirid;
100505dbe683SOmar Sandoval 			key.type = BTRFS_INODE_REF_KEY;
100605dbe683SOmar Sandoval 			key.offset = (u64)-1;
100705dbe683SOmar Sandoval 
100805dbe683SOmar Sandoval 			ret = btrfs_search_slot(NULL, fs_root, &key, path, 0, 0);
100905dbe683SOmar Sandoval 			if (ret < 0) {
101005dbe683SOmar Sandoval 				goto err;
101105dbe683SOmar Sandoval 			} else if (ret > 0) {
101205dbe683SOmar Sandoval 				ret = btrfs_previous_item(fs_root, path, dirid,
101305dbe683SOmar Sandoval 							  BTRFS_INODE_REF_KEY);
101405dbe683SOmar Sandoval 				if (ret < 0) {
101505dbe683SOmar Sandoval 					goto err;
101605dbe683SOmar Sandoval 				} else if (ret > 0) {
101705dbe683SOmar Sandoval 					ret = -ENOENT;
101805dbe683SOmar Sandoval 					goto err;
101905dbe683SOmar Sandoval 				}
102005dbe683SOmar Sandoval 			}
102105dbe683SOmar Sandoval 
102205dbe683SOmar Sandoval 			btrfs_item_key_to_cpu(path->nodes[0], &key, path->slots[0]);
102305dbe683SOmar Sandoval 			dirid = key.offset;
102405dbe683SOmar Sandoval 
102505dbe683SOmar Sandoval 			inode_ref = btrfs_item_ptr(path->nodes[0],
102605dbe683SOmar Sandoval 						   path->slots[0],
102705dbe683SOmar Sandoval 						   struct btrfs_inode_ref);
102805dbe683SOmar Sandoval 			len = btrfs_inode_ref_name_len(path->nodes[0],
102905dbe683SOmar Sandoval 						       inode_ref);
103005dbe683SOmar Sandoval 			ptr -= len + 1;
103105dbe683SOmar Sandoval 			if (ptr < name) {
103205dbe683SOmar Sandoval 				ret = -ENAMETOOLONG;
103305dbe683SOmar Sandoval 				goto err;
103405dbe683SOmar Sandoval 			}
103505dbe683SOmar Sandoval 			read_extent_buffer(path->nodes[0], ptr + 1,
103605dbe683SOmar Sandoval 					   (unsigned long)(inode_ref + 1), len);
103705dbe683SOmar Sandoval 			ptr[0] = '/';
103805dbe683SOmar Sandoval 			btrfs_release_path(path);
103905dbe683SOmar Sandoval 		}
104005dbe683SOmar Sandoval 	}
104105dbe683SOmar Sandoval 
104205dbe683SOmar Sandoval 	btrfs_free_path(path);
104305dbe683SOmar Sandoval 	if (ptr == name + PATH_MAX - 1) {
104405dbe683SOmar Sandoval 		name[0] = '/';
104505dbe683SOmar Sandoval 		name[1] = '\0';
104605dbe683SOmar Sandoval 	} else {
104705dbe683SOmar Sandoval 		memmove(name, ptr, name + PATH_MAX - ptr);
104805dbe683SOmar Sandoval 	}
104905dbe683SOmar Sandoval 	return name;
105005dbe683SOmar Sandoval 
105105dbe683SOmar Sandoval err:
105205dbe683SOmar Sandoval 	btrfs_free_path(path);
105305dbe683SOmar Sandoval 	kfree(name);
105405dbe683SOmar Sandoval 	return ERR_PTR(ret);
105505dbe683SOmar Sandoval }
105605dbe683SOmar Sandoval 
105705dbe683SOmar Sandoval static int get_default_subvol_objectid(struct btrfs_fs_info *fs_info, u64 *objectid)
105805dbe683SOmar Sandoval {
105905dbe683SOmar Sandoval 	struct btrfs_root *root = fs_info->tree_root;
106073f73415SJosef Bacik 	struct btrfs_dir_item *di;
106173f73415SJosef Bacik 	struct btrfs_path *path;
106273f73415SJosef Bacik 	struct btrfs_key location;
106373f73415SJosef Bacik 	u64 dir_id;
106473f73415SJosef Bacik 
106573f73415SJosef Bacik 	path = btrfs_alloc_path();
106673f73415SJosef Bacik 	if (!path)
106705dbe683SOmar Sandoval 		return -ENOMEM;
106873f73415SJosef Bacik 	path->leave_spinning = 1;
106973f73415SJosef Bacik 
107073f73415SJosef Bacik 	/*
107173f73415SJosef Bacik 	 * Find the "default" dir item which points to the root item that we
107273f73415SJosef Bacik 	 * will mount by default if we haven't been given a specific subvolume
107373f73415SJosef Bacik 	 * to mount.
107473f73415SJosef Bacik 	 */
1075815745cfSAl Viro 	dir_id = btrfs_super_root_dir(fs_info->super_copy);
107673f73415SJosef Bacik 	di = btrfs_lookup_dir_item(NULL, root, path, dir_id, "default", 7, 0);
1077b0839166SJulia Lawall 	if (IS_ERR(di)) {
1078b0839166SJulia Lawall 		btrfs_free_path(path);
107905dbe683SOmar Sandoval 		return PTR_ERR(di);
1080b0839166SJulia Lawall 	}
108173f73415SJosef Bacik 	if (!di) {
108273f73415SJosef Bacik 		/*
108373f73415SJosef Bacik 		 * Ok the default dir item isn't there.  This is weird since
108473f73415SJosef Bacik 		 * it's always been there, but don't freak out, just try and
108505dbe683SOmar Sandoval 		 * mount the top-level subvolume.
108673f73415SJosef Bacik 		 */
108773f73415SJosef Bacik 		btrfs_free_path(path);
108805dbe683SOmar Sandoval 		*objectid = BTRFS_FS_TREE_OBJECTID;
108905dbe683SOmar Sandoval 		return 0;
109073f73415SJosef Bacik 	}
109173f73415SJosef Bacik 
109273f73415SJosef Bacik 	btrfs_dir_item_key_to_cpu(path->nodes[0], di, &location);
109373f73415SJosef Bacik 	btrfs_free_path(path);
109405dbe683SOmar Sandoval 	*objectid = location.objectid;
109505dbe683SOmar Sandoval 	return 0;
109673f73415SJosef Bacik }
109773f73415SJosef Bacik 
10988a4b83ccSChris Mason static int btrfs_fill_super(struct super_block *sb,
10998a4b83ccSChris Mason 			    struct btrfs_fs_devices *fs_devices,
11008a4b83ccSChris Mason 			    void *data, int silent)
11012e635a27SChris Mason {
11022e635a27SChris Mason 	struct inode *inode;
1103815745cfSAl Viro 	struct btrfs_fs_info *fs_info = btrfs_sb(sb);
11045d4f98a2SYan Zheng 	struct btrfs_key key;
110539279cc3SChris Mason 	int err;
11062e635a27SChris Mason 
11072e635a27SChris Mason 	sb->s_maxbytes = MAX_LFS_FILESIZE;
11082e635a27SChris Mason 	sb->s_magic = BTRFS_SUPER_MAGIC;
1109e20d96d6SChris Mason 	sb->s_op = &btrfs_super_ops;
1110af53d29aSAl Viro 	sb->s_d_op = &btrfs_dentry_operations;
1111be6e8dc0SBalaji Rao 	sb->s_export_op = &btrfs_export_ops;
11125103e947SJosef Bacik 	sb->s_xattr = btrfs_xattr_handlers;
11132e635a27SChris Mason 	sb->s_time_gran = 1;
11140eda294dSChris Mason #ifdef CONFIG_BTRFS_FS_POSIX_ACL
111533268eafSJosef Bacik 	sb->s_flags |= MS_POSIXACL;
111649cf6f45SChris Ball #endif
11170c4d2d95SJosef Bacik 	sb->s_flags |= MS_I_VERSION;
1118da2f0f74SChris Mason 	sb->s_iflags |= SB_I_CGROUPWB;
1119ad2b2c80SAl Viro 	err = open_ctree(sb, fs_devices, (char *)data);
1120ad2b2c80SAl Viro 	if (err) {
1121efe120a0SFrank Holton 		printk(KERN_ERR "BTRFS: open_ctree failed\n");
1122ad2b2c80SAl Viro 		return err;
1123e20d96d6SChris Mason 	}
1124b888db2bSChris Mason 
11255d4f98a2SYan Zheng 	key.objectid = BTRFS_FIRST_FREE_OBJECTID;
11265d4f98a2SYan Zheng 	key.type = BTRFS_INODE_ITEM_KEY;
11275d4f98a2SYan Zheng 	key.offset = 0;
112898c7089cSAl Viro 	inode = btrfs_iget(sb, &key, fs_info->fs_root, NULL);
11295d4f98a2SYan Zheng 	if (IS_ERR(inode)) {
11305d4f98a2SYan Zheng 		err = PTR_ERR(inode);
113139279cc3SChris Mason 		goto fail_close;
113239279cc3SChris Mason 	}
11332e635a27SChris Mason 
113448fde701SAl Viro 	sb->s_root = d_make_root(inode);
113548fde701SAl Viro 	if (!sb->s_root) {
113639279cc3SChris Mason 		err = -ENOMEM;
113739279cc3SChris Mason 		goto fail_close;
11382e635a27SChris Mason 	}
113958176a96SJosef Bacik 
11406885f308SChris Mason 	save_mount_options(sb, data);
114190a887c9SDan Magenheimer 	cleancache_init_fs(sb);
114259553edfSAl Viro 	sb->s_flags |= MS_ACTIVE;
11432e635a27SChris Mason 	return 0;
11442e635a27SChris Mason 
114539279cc3SChris Mason fail_close:
1146815745cfSAl Viro 	close_ctree(fs_info->tree_root);
1147d5719762SChris Mason 	return err;
1148d5719762SChris Mason }
1149d5719762SChris Mason 
11506bf13c0cSSage Weil int btrfs_sync_fs(struct super_block *sb, int wait)
1151d5719762SChris Mason {
1152d5719762SChris Mason 	struct btrfs_trans_handle *trans;
1153815745cfSAl Viro 	struct btrfs_fs_info *fs_info = btrfs_sb(sb);
1154815745cfSAl Viro 	struct btrfs_root *root = fs_info->tree_root;
1155df2ce34cSChris Mason 
11561abe9b8aSliubo 	trace_btrfs_sync_fs(wait);
11571abe9b8aSliubo 
1158d561c025SChris Mason 	if (!wait) {
1159815745cfSAl Viro 		filemap_flush(fs_info->btree_inode->i_mapping);
1160df2ce34cSChris Mason 		return 0;
1161d561c025SChris Mason 	}
1162771ed689SChris Mason 
1163b0244199SMiao Xie 	btrfs_wait_ordered_roots(fs_info, -1);
1164771ed689SChris Mason 
1165d4edf39bSMiao Xie 	trans = btrfs_attach_transaction_barrier(root);
116660376ce4SJosef Bacik 	if (IS_ERR(trans)) {
1167354aa0fbSMiao Xie 		/* no transaction, don't bother */
11686b5fe46dSDavid Sterba 		if (PTR_ERR(trans) == -ENOENT) {
11696b5fe46dSDavid Sterba 			/*
11706b5fe46dSDavid Sterba 			 * Exit unless we have some pending changes
11716b5fe46dSDavid Sterba 			 * that need to go through commit
11726b5fe46dSDavid Sterba 			 */
11736b5fe46dSDavid Sterba 			if (fs_info->pending_changes == 0)
1174bd7de2c9SJosef Bacik 				return 0;
1175a53f4f8eSQu Wenruo 			/*
1176a53f4f8eSQu Wenruo 			 * A non-blocking test if the fs is frozen. We must not
1177a53f4f8eSQu Wenruo 			 * start a new transaction here otherwise a deadlock
1178a53f4f8eSQu Wenruo 			 * happens. The pending operations are delayed to the
1179a53f4f8eSQu Wenruo 			 * next commit after thawing.
1180a53f4f8eSQu Wenruo 			 */
1181a53f4f8eSQu Wenruo 			if (__sb_start_write(sb, SB_FREEZE_WRITE, false))
1182a53f4f8eSQu Wenruo 				__sb_end_write(sb, SB_FREEZE_WRITE);
1183a53f4f8eSQu Wenruo 			else
1184a53f4f8eSQu Wenruo 				return 0;
11856b5fe46dSDavid Sterba 			trans = btrfs_start_transaction(root, 0);
118660376ce4SJosef Bacik 		}
118798bd5c54SDavid Sterba 		if (IS_ERR(trans))
118898bd5c54SDavid Sterba 			return PTR_ERR(trans);
11896b5fe46dSDavid Sterba 	}
1190bd7de2c9SJosef Bacik 	return btrfs_commit_transaction(trans, root);
1191d5719762SChris Mason }
1192d5719762SChris Mason 
119334c80b1dSAl Viro static int btrfs_show_options(struct seq_file *seq, struct dentry *dentry)
1194a9572a15SEric Paris {
1195815745cfSAl Viro 	struct btrfs_fs_info *info = btrfs_sb(dentry->d_sb);
1196815745cfSAl Viro 	struct btrfs_root *root = info->tree_root;
1197200da64eSTsutomu Itoh 	char *compress_type;
1198a9572a15SEric Paris 
1199a9572a15SEric Paris 	if (btrfs_test_opt(root, DEGRADED))
1200a9572a15SEric Paris 		seq_puts(seq, ",degraded");
1201a9572a15SEric Paris 	if (btrfs_test_opt(root, NODATASUM))
1202a9572a15SEric Paris 		seq_puts(seq, ",nodatasum");
1203a9572a15SEric Paris 	if (btrfs_test_opt(root, NODATACOW))
1204a9572a15SEric Paris 		seq_puts(seq, ",nodatacow");
1205a9572a15SEric Paris 	if (btrfs_test_opt(root, NOBARRIER))
1206a9572a15SEric Paris 		seq_puts(seq, ",nobarrier");
120795ac567aSFilipe David Borba Manana 	if (info->max_inline != BTRFS_DEFAULT_MAX_INLINE)
1208c1c9ff7cSGeert Uytterhoeven 		seq_printf(seq, ",max_inline=%llu", info->max_inline);
1209a9572a15SEric Paris 	if (info->alloc_start != 0)
1210c1c9ff7cSGeert Uytterhoeven 		seq_printf(seq, ",alloc_start=%llu", info->alloc_start);
1211a9572a15SEric Paris 	if (info->thread_pool_size !=  min_t(unsigned long,
1212a9572a15SEric Paris 					     num_online_cpus() + 2, 8))
1213a9572a15SEric Paris 		seq_printf(seq, ",thread_pool=%d", info->thread_pool_size);
1214200da64eSTsutomu Itoh 	if (btrfs_test_opt(root, COMPRESS)) {
1215200da64eSTsutomu Itoh 		if (info->compress_type == BTRFS_COMPRESS_ZLIB)
1216200da64eSTsutomu Itoh 			compress_type = "zlib";
1217200da64eSTsutomu Itoh 		else
1218200da64eSTsutomu Itoh 			compress_type = "lzo";
1219200da64eSTsutomu Itoh 		if (btrfs_test_opt(root, FORCE_COMPRESS))
1220200da64eSTsutomu Itoh 			seq_printf(seq, ",compress-force=%s", compress_type);
1221200da64eSTsutomu Itoh 		else
1222200da64eSTsutomu Itoh 			seq_printf(seq, ",compress=%s", compress_type);
1223200da64eSTsutomu Itoh 	}
1224c289811cSChris Mason 	if (btrfs_test_opt(root, NOSSD))
1225c289811cSChris Mason 		seq_puts(seq, ",nossd");
1226451d7585SChris Mason 	if (btrfs_test_opt(root, SSD_SPREAD))
1227451d7585SChris Mason 		seq_puts(seq, ",ssd_spread");
1228451d7585SChris Mason 	else if (btrfs_test_opt(root, SSD))
1229a9572a15SEric Paris 		seq_puts(seq, ",ssd");
12303a5e1404SSage Weil 	if (btrfs_test_opt(root, NOTREELOG))
12316b65c5c6SSage Weil 		seq_puts(seq, ",notreelog");
123296da0919SQu Wenruo 	if (btrfs_test_opt(root, NOLOGREPLAY))
123396da0919SQu Wenruo 		seq_puts(seq, ",nologreplay");
1234dccae999SSage Weil 	if (btrfs_test_opt(root, FLUSHONCOMMIT))
12356b65c5c6SSage Weil 		seq_puts(seq, ",flushoncommit");
123620a5239aSMatthew Wilcox 	if (btrfs_test_opt(root, DISCARD))
123720a5239aSMatthew Wilcox 		seq_puts(seq, ",discard");
1238a9572a15SEric Paris 	if (!(root->fs_info->sb->s_flags & MS_POSIXACL))
1239a9572a15SEric Paris 		seq_puts(seq, ",noacl");
1240200da64eSTsutomu Itoh 	if (btrfs_test_opt(root, SPACE_CACHE))
1241200da64eSTsutomu Itoh 		seq_puts(seq, ",space_cache");
124270f6d82eSOmar Sandoval 	else if (btrfs_test_opt(root, FREE_SPACE_TREE))
124370f6d82eSOmar Sandoval 		seq_puts(seq, ",space_cache=v2");
124473bc1876SJosef Bacik 	else
12458965593eSDavid Sterba 		seq_puts(seq, ",nospace_cache");
1246f420ee1eSStefan Behrens 	if (btrfs_test_opt(root, RESCAN_UUID_TREE))
1247f420ee1eSStefan Behrens 		seq_puts(seq, ",rescan_uuid_tree");
1248200da64eSTsutomu Itoh 	if (btrfs_test_opt(root, CLEAR_CACHE))
1249200da64eSTsutomu Itoh 		seq_puts(seq, ",clear_cache");
1250200da64eSTsutomu Itoh 	if (btrfs_test_opt(root, USER_SUBVOL_RM_ALLOWED))
1251200da64eSTsutomu Itoh 		seq_puts(seq, ",user_subvol_rm_allowed");
12520942caa3SDavid Sterba 	if (btrfs_test_opt(root, ENOSPC_DEBUG))
12530942caa3SDavid Sterba 		seq_puts(seq, ",enospc_debug");
12540942caa3SDavid Sterba 	if (btrfs_test_opt(root, AUTO_DEFRAG))
12550942caa3SDavid Sterba 		seq_puts(seq, ",autodefrag");
12560942caa3SDavid Sterba 	if (btrfs_test_opt(root, INODE_MAP_CACHE))
12570942caa3SDavid Sterba 		seq_puts(seq, ",inode_cache");
12589555c6c1SIlya Dryomov 	if (btrfs_test_opt(root, SKIP_BALANCE))
12599555c6c1SIlya Dryomov 		seq_puts(seq, ",skip_balance");
12608507d216SWang Shilong #ifdef CONFIG_BTRFS_FS_CHECK_INTEGRITY
12618507d216SWang Shilong 	if (btrfs_test_opt(root, CHECK_INTEGRITY_INCLUDING_EXTENT_DATA))
12628507d216SWang Shilong 		seq_puts(seq, ",check_int_data");
12638507d216SWang Shilong 	else if (btrfs_test_opt(root, CHECK_INTEGRITY))
12648507d216SWang Shilong 		seq_puts(seq, ",check_int");
12658507d216SWang Shilong 	if (info->check_integrity_print_mask)
12668507d216SWang Shilong 		seq_printf(seq, ",check_int_print_mask=%d",
12678507d216SWang Shilong 				info->check_integrity_print_mask);
12688507d216SWang Shilong #endif
12698507d216SWang Shilong 	if (info->metadata_ratio)
12708507d216SWang Shilong 		seq_printf(seq, ",metadata_ratio=%d",
12718507d216SWang Shilong 				info->metadata_ratio);
12728c342930SJeff Mahoney 	if (btrfs_test_opt(root, PANIC_ON_FATAL_ERROR))
12738c342930SJeff Mahoney 		seq_puts(seq, ",fatal_errors=panic");
12748b87dc17SDavid Sterba 	if (info->commit_interval != BTRFS_DEFAULT_COMMIT_INTERVAL)
12758b87dc17SDavid Sterba 		seq_printf(seq, ",commit=%d", info->commit_interval);
1276d0bd4560SJosef Bacik #ifdef CONFIG_BTRFS_DEBUG
1277d0bd4560SJosef Bacik 	if (btrfs_test_opt(root, FRAGMENT_DATA))
1278d0bd4560SJosef Bacik 		seq_puts(seq, ",fragment=data");
1279d0bd4560SJosef Bacik 	if (btrfs_test_opt(root, FRAGMENT_METADATA))
1280d0bd4560SJosef Bacik 		seq_puts(seq, ",fragment=metadata");
1281d0bd4560SJosef Bacik #endif
1282c8d3fe02SOmar Sandoval 	seq_printf(seq, ",subvolid=%llu",
1283c8d3fe02SOmar Sandoval 		  BTRFS_I(d_inode(dentry))->root->root_key.objectid);
1284c8d3fe02SOmar Sandoval 	seq_puts(seq, ",subvol=");
1285c8d3fe02SOmar Sandoval 	seq_dentry(seq, dentry, " \t\n\\");
1286a9572a15SEric Paris 	return 0;
1287a9572a15SEric Paris }
1288a9572a15SEric Paris 
1289a061fc8dSChris Mason static int btrfs_test_super(struct super_block *s, void *data)
12902e635a27SChris Mason {
1291815745cfSAl Viro 	struct btrfs_fs_info *p = data;
1292815745cfSAl Viro 	struct btrfs_fs_info *fs_info = btrfs_sb(s);
12934b82d6e4SYan 
1294815745cfSAl Viro 	return fs_info->fs_devices == p->fs_devices;
12954b82d6e4SYan }
12964b82d6e4SYan 
1297450ba0eaSJosef Bacik static int btrfs_set_super(struct super_block *s, void *data)
1298450ba0eaSJosef Bacik {
12996de1d09dSAl Viro 	int err = set_anon_super(s, data);
13006de1d09dSAl Viro 	if (!err)
1301450ba0eaSJosef Bacik 		s->s_fs_info = data;
13026de1d09dSAl Viro 	return err;
1303450ba0eaSJosef Bacik }
1304450ba0eaSJosef Bacik 
1305830c4adbSJosef Bacik /*
1306f9d9ef62SDavid Sterba  * subvolumes are identified by ino 256
1307f9d9ef62SDavid Sterba  */
1308f9d9ef62SDavid Sterba static inline int is_subvolume_inode(struct inode *inode)
1309f9d9ef62SDavid Sterba {
1310f9d9ef62SDavid Sterba 	if (inode && inode->i_ino == BTRFS_FIRST_FREE_OBJECTID)
1311f9d9ef62SDavid Sterba 		return 1;
1312f9d9ef62SDavid Sterba 	return 0;
1313f9d9ef62SDavid Sterba }
1314f9d9ef62SDavid Sterba 
1315f9d9ef62SDavid Sterba /*
1316e6e4dbe8SOmar Sandoval  * This will add subvolid=0 to the argument string while removing any subvol=
1317e6e4dbe8SOmar Sandoval  * and subvolid= arguments to make sure we get the top-level root for path
1318e6e4dbe8SOmar Sandoval  * walking to the subvol we want.
1319830c4adbSJosef Bacik  */
1320830c4adbSJosef Bacik static char *setup_root_args(char *args)
1321830c4adbSJosef Bacik {
1322e6e4dbe8SOmar Sandoval 	char *buf, *dst, *sep;
1323830c4adbSJosef Bacik 
1324e6e4dbe8SOmar Sandoval 	if (!args)
1325e6e4dbe8SOmar Sandoval 		return kstrdup("subvolid=0", GFP_NOFS);
1326830c4adbSJosef Bacik 
1327e6e4dbe8SOmar Sandoval 	/* The worst case is that we add ",subvolid=0" to the end. */
1328e6e4dbe8SOmar Sandoval 	buf = dst = kmalloc(strlen(args) + strlen(",subvolid=0") + 1, GFP_NOFS);
1329f60d16a8SJim Meyering 	if (!buf)
1330f60d16a8SJim Meyering 		return NULL;
1331830c4adbSJosef Bacik 
1332e6e4dbe8SOmar Sandoval 	while (1) {
1333e6e4dbe8SOmar Sandoval 		sep = strchrnul(args, ',');
1334e6e4dbe8SOmar Sandoval 		if (!strstarts(args, "subvol=") &&
1335e6e4dbe8SOmar Sandoval 		    !strstarts(args, "subvolid=")) {
1336e6e4dbe8SOmar Sandoval 			memcpy(dst, args, sep - args);
1337e6e4dbe8SOmar Sandoval 			dst += sep - args;
1338e6e4dbe8SOmar Sandoval 			*dst++ = ',';
1339830c4adbSJosef Bacik 		}
1340e6e4dbe8SOmar Sandoval 		if (*sep)
1341e6e4dbe8SOmar Sandoval 			args = sep + 1;
1342e6e4dbe8SOmar Sandoval 		else
1343e6e4dbe8SOmar Sandoval 			break;
1344e6e4dbe8SOmar Sandoval 	}
1345f60d16a8SJim Meyering 	strcpy(dst, "subvolid=0");
1346830c4adbSJosef Bacik 
1347f60d16a8SJim Meyering 	return buf;
1348830c4adbSJosef Bacik }
1349830c4adbSJosef Bacik 
1350bb289b7bSOmar Sandoval static struct dentry *mount_subvol(const char *subvol_name, u64 subvol_objectid,
1351bb289b7bSOmar Sandoval 				   int flags, const char *device_name,
1352bb289b7bSOmar Sandoval 				   char *data)
1353830c4adbSJosef Bacik {
1354830c4adbSJosef Bacik 	struct dentry *root;
1355fa330659SOmar Sandoval 	struct vfsmount *mnt = NULL;
1356830c4adbSJosef Bacik 	char *newargs;
1357fa330659SOmar Sandoval 	int ret;
1358830c4adbSJosef Bacik 
1359830c4adbSJosef Bacik 	newargs = setup_root_args(data);
1360fa330659SOmar Sandoval 	if (!newargs) {
1361fa330659SOmar Sandoval 		root = ERR_PTR(-ENOMEM);
1362fa330659SOmar Sandoval 		goto out;
1363fa330659SOmar Sandoval 	}
13640723a047SHarald Hoyer 
1365fa330659SOmar Sandoval 	mnt = vfs_kern_mount(&btrfs_fs_type, flags, device_name, newargs);
1366fa330659SOmar Sandoval 	if (PTR_ERR_OR_ZERO(mnt) == -EBUSY) {
13670723a047SHarald Hoyer 		if (flags & MS_RDONLY) {
1368fa330659SOmar Sandoval 			mnt = vfs_kern_mount(&btrfs_fs_type, flags & ~MS_RDONLY,
1369fa330659SOmar Sandoval 					     device_name, newargs);
13700723a047SHarald Hoyer 		} else {
1371fa330659SOmar Sandoval 			mnt = vfs_kern_mount(&btrfs_fs_type, flags | MS_RDONLY,
1372fa330659SOmar Sandoval 					     device_name, newargs);
13730040e606SChristoph Jaeger 			if (IS_ERR(mnt)) {
1374fa330659SOmar Sandoval 				root = ERR_CAST(mnt);
1375fa330659SOmar Sandoval 				mnt = NULL;
1376fa330659SOmar Sandoval 				goto out;
13770040e606SChristoph Jaeger 			}
13780723a047SHarald Hoyer 
1379773cd04eSOmar Sandoval 			down_write(&mnt->mnt_sb->s_umount);
1380fa330659SOmar Sandoval 			ret = btrfs_remount(mnt->mnt_sb, &flags, NULL);
1381773cd04eSOmar Sandoval 			up_write(&mnt->mnt_sb->s_umount);
1382fa330659SOmar Sandoval 			if (ret < 0) {
1383fa330659SOmar Sandoval 				root = ERR_PTR(ret);
1384fa330659SOmar Sandoval 				goto out;
13850723a047SHarald Hoyer 			}
13860723a047SHarald Hoyer 		}
13870723a047SHarald Hoyer 	}
1388fa330659SOmar Sandoval 	if (IS_ERR(mnt)) {
1389fa330659SOmar Sandoval 		root = ERR_CAST(mnt);
1390fa330659SOmar Sandoval 		mnt = NULL;
1391fa330659SOmar Sandoval 		goto out;
1392fa330659SOmar Sandoval 	}
1393830c4adbSJosef Bacik 
139405dbe683SOmar Sandoval 	if (!subvol_name) {
139505dbe683SOmar Sandoval 		if (!subvol_objectid) {
139605dbe683SOmar Sandoval 			ret = get_default_subvol_objectid(btrfs_sb(mnt->mnt_sb),
139705dbe683SOmar Sandoval 							  &subvol_objectid);
139805dbe683SOmar Sandoval 			if (ret) {
139905dbe683SOmar Sandoval 				root = ERR_PTR(ret);
140005dbe683SOmar Sandoval 				goto out;
140105dbe683SOmar Sandoval 			}
140205dbe683SOmar Sandoval 		}
140305dbe683SOmar Sandoval 		subvol_name = get_subvol_name_from_objectid(btrfs_sb(mnt->mnt_sb),
140405dbe683SOmar Sandoval 							    subvol_objectid);
140505dbe683SOmar Sandoval 		if (IS_ERR(subvol_name)) {
140605dbe683SOmar Sandoval 			root = ERR_CAST(subvol_name);
140705dbe683SOmar Sandoval 			subvol_name = NULL;
140805dbe683SOmar Sandoval 			goto out;
140905dbe683SOmar Sandoval 		}
141005dbe683SOmar Sandoval 
141105dbe683SOmar Sandoval 	}
141205dbe683SOmar Sandoval 
1413ea441d11SAl Viro 	root = mount_subtree(mnt, subvol_name);
1414fa330659SOmar Sandoval 	/* mount_subtree() drops our reference on the vfsmount. */
1415fa330659SOmar Sandoval 	mnt = NULL;
1416830c4adbSJosef Bacik 
1417bb289b7bSOmar Sandoval 	if (!IS_ERR(root)) {
1418ea441d11SAl Viro 		struct super_block *s = root->d_sb;
1419bb289b7bSOmar Sandoval 		struct inode *root_inode = d_inode(root);
1420bb289b7bSOmar Sandoval 		u64 root_objectid = BTRFS_I(root_inode)->root->root_key.objectid;
1421bb289b7bSOmar Sandoval 
1422bb289b7bSOmar Sandoval 		ret = 0;
1423bb289b7bSOmar Sandoval 		if (!is_subvolume_inode(root_inode)) {
1424bb289b7bSOmar Sandoval 			pr_err("BTRFS: '%s' is not a valid subvolume\n",
1425bb289b7bSOmar Sandoval 			       subvol_name);
1426bb289b7bSOmar Sandoval 			ret = -EINVAL;
1427bb289b7bSOmar Sandoval 		}
1428bb289b7bSOmar Sandoval 		if (subvol_objectid && root_objectid != subvol_objectid) {
142905dbe683SOmar Sandoval 			/*
143005dbe683SOmar Sandoval 			 * This will also catch a race condition where a
143105dbe683SOmar Sandoval 			 * subvolume which was passed by ID is renamed and
143205dbe683SOmar Sandoval 			 * another subvolume is renamed over the old location.
143305dbe683SOmar Sandoval 			 */
1434bb289b7bSOmar Sandoval 			pr_err("BTRFS: subvol '%s' does not match subvolid %llu\n",
1435bb289b7bSOmar Sandoval 			       subvol_name, subvol_objectid);
1436bb289b7bSOmar Sandoval 			ret = -EINVAL;
1437bb289b7bSOmar Sandoval 		}
1438bb289b7bSOmar Sandoval 		if (ret) {
1439ea441d11SAl Viro 			dput(root);
1440bb289b7bSOmar Sandoval 			root = ERR_PTR(ret);
1441ea441d11SAl Viro 			deactivate_locked_super(s);
1442bb289b7bSOmar Sandoval 		}
1443f9d9ef62SDavid Sterba 	}
1444f9d9ef62SDavid Sterba 
1445fa330659SOmar Sandoval out:
1446fa330659SOmar Sandoval 	mntput(mnt);
1447fa330659SOmar Sandoval 	kfree(newargs);
1448fa330659SOmar Sandoval 	kfree(subvol_name);
1449830c4adbSJosef Bacik 	return root;
1450830c4adbSJosef Bacik }
1451450ba0eaSJosef Bacik 
1452f667aef6SQu Wenruo static int parse_security_options(char *orig_opts,
1453f667aef6SQu Wenruo 				  struct security_mnt_opts *sec_opts)
1454f667aef6SQu Wenruo {
1455f667aef6SQu Wenruo 	char *secdata = NULL;
1456f667aef6SQu Wenruo 	int ret = 0;
1457f667aef6SQu Wenruo 
1458f667aef6SQu Wenruo 	secdata = alloc_secdata();
1459f667aef6SQu Wenruo 	if (!secdata)
1460f667aef6SQu Wenruo 		return -ENOMEM;
1461f667aef6SQu Wenruo 	ret = security_sb_copy_data(orig_opts, secdata);
1462f667aef6SQu Wenruo 	if (ret) {
1463f667aef6SQu Wenruo 		free_secdata(secdata);
1464f667aef6SQu Wenruo 		return ret;
1465f667aef6SQu Wenruo 	}
1466f667aef6SQu Wenruo 	ret = security_sb_parse_opts_str(secdata, sec_opts);
1467f667aef6SQu Wenruo 	free_secdata(secdata);
1468f667aef6SQu Wenruo 	return ret;
1469f667aef6SQu Wenruo }
1470f667aef6SQu Wenruo 
1471f667aef6SQu Wenruo static int setup_security_options(struct btrfs_fs_info *fs_info,
1472f667aef6SQu Wenruo 				  struct super_block *sb,
1473f667aef6SQu Wenruo 				  struct security_mnt_opts *sec_opts)
1474f667aef6SQu Wenruo {
1475f667aef6SQu Wenruo 	int ret = 0;
1476f667aef6SQu Wenruo 
1477f667aef6SQu Wenruo 	/*
1478f667aef6SQu Wenruo 	 * Call security_sb_set_mnt_opts() to check whether new sec_opts
1479f667aef6SQu Wenruo 	 * is valid.
1480f667aef6SQu Wenruo 	 */
1481f667aef6SQu Wenruo 	ret = security_sb_set_mnt_opts(sb, sec_opts, 0, NULL);
1482f667aef6SQu Wenruo 	if (ret)
1483f667aef6SQu Wenruo 		return ret;
1484f667aef6SQu Wenruo 
1485a43bb39bSQu Wenruo #ifdef CONFIG_SECURITY
1486f667aef6SQu Wenruo 	if (!fs_info->security_opts.num_mnt_opts) {
1487f667aef6SQu Wenruo 		/* first time security setup, copy sec_opts to fs_info */
1488f667aef6SQu Wenruo 		memcpy(&fs_info->security_opts, sec_opts, sizeof(*sec_opts));
1489f667aef6SQu Wenruo 	} else {
1490f667aef6SQu Wenruo 		/*
1491f667aef6SQu Wenruo 		 * Since SELinux(the only one supports security_mnt_opts) does
1492f667aef6SQu Wenruo 		 * NOT support changing context during remount/mount same sb,
1493f667aef6SQu Wenruo 		 * This must be the same or part of the same security options,
1494f667aef6SQu Wenruo 		 * just free it.
1495f667aef6SQu Wenruo 		 */
1496f667aef6SQu Wenruo 		security_free_mnt_opts(sec_opts);
1497f667aef6SQu Wenruo 	}
1498a43bb39bSQu Wenruo #endif
1499f667aef6SQu Wenruo 	return ret;
1500f667aef6SQu Wenruo }
1501f667aef6SQu Wenruo 
1502edf24abeSChristoph Hellwig /*
1503edf24abeSChristoph Hellwig  * Find a superblock for the given device / mount point.
1504edf24abeSChristoph Hellwig  *
1505edf24abeSChristoph Hellwig  * Note:  This is based on get_sb_bdev from fs/super.c with a few additions
1506edf24abeSChristoph Hellwig  *	  for multiple device setup.  Make sure to keep it in sync.
1507edf24abeSChristoph Hellwig  */
1508061dbc6bSAl Viro static struct dentry *btrfs_mount(struct file_system_type *fs_type, int flags,
1509306e16ceSDavid Sterba 		const char *device_name, void *data)
15104b82d6e4SYan {
15114b82d6e4SYan 	struct block_device *bdev = NULL;
15124b82d6e4SYan 	struct super_block *s;
15138a4b83ccSChris Mason 	struct btrfs_fs_devices *fs_devices = NULL;
1514450ba0eaSJosef Bacik 	struct btrfs_fs_info *fs_info = NULL;
1515f667aef6SQu Wenruo 	struct security_mnt_opts new_sec_opts;
151697288f2cSChristoph Hellwig 	fmode_t mode = FMODE_READ;
151773f73415SJosef Bacik 	char *subvol_name = NULL;
151873f73415SJosef Bacik 	u64 subvol_objectid = 0;
15194b82d6e4SYan 	int error = 0;
15204b82d6e4SYan 
152197288f2cSChristoph Hellwig 	if (!(flags & MS_RDONLY))
152297288f2cSChristoph Hellwig 		mode |= FMODE_WRITE;
152397288f2cSChristoph Hellwig 
152497288f2cSChristoph Hellwig 	error = btrfs_parse_early_options(data, mode, fs_type,
152573f73415SJosef Bacik 					  &subvol_name, &subvol_objectid,
15265e2a4b25SDavid Sterba 					  &fs_devices);
1527f23c8af8SIlya Dryomov 	if (error) {
1528f23c8af8SIlya Dryomov 		kfree(subvol_name);
1529061dbc6bSAl Viro 		return ERR_PTR(error);
1530f23c8af8SIlya Dryomov 	}
1531edf24abeSChristoph Hellwig 
153205dbe683SOmar Sandoval 	if (subvol_name || subvol_objectid != BTRFS_FS_TREE_OBJECTID) {
1533fa330659SOmar Sandoval 		/* mount_subvol() will free subvol_name. */
1534bb289b7bSOmar Sandoval 		return mount_subvol(subvol_name, subvol_objectid, flags,
1535bb289b7bSOmar Sandoval 				    device_name, data);
1536830c4adbSJosef Bacik 	}
1537830c4adbSJosef Bacik 
1538f667aef6SQu Wenruo 	security_init_mnt_opts(&new_sec_opts);
1539f667aef6SQu Wenruo 	if (data) {
1540f667aef6SQu Wenruo 		error = parse_security_options(data, &new_sec_opts);
15418a4b83ccSChris Mason 		if (error)
1542830c4adbSJosef Bacik 			return ERR_PTR(error);
1543f667aef6SQu Wenruo 	}
1544f667aef6SQu Wenruo 
1545f667aef6SQu Wenruo 	error = btrfs_scan_one_device(device_name, mode, fs_type, &fs_devices);
1546f667aef6SQu Wenruo 	if (error)
1547f667aef6SQu Wenruo 		goto error_sec_opts;
15484b82d6e4SYan 
1549450ba0eaSJosef Bacik 	/*
1550450ba0eaSJosef Bacik 	 * Setup a dummy root and fs_info for test/set super.  This is because
1551450ba0eaSJosef Bacik 	 * we don't actually fill this stuff out until open_ctree, but we need
1552450ba0eaSJosef Bacik 	 * it for searching for existing supers, so this lets us do that and
1553450ba0eaSJosef Bacik 	 * then open_ctree will properly initialize everything later.
1554450ba0eaSJosef Bacik 	 */
1555450ba0eaSJosef Bacik 	fs_info = kzalloc(sizeof(struct btrfs_fs_info), GFP_NOFS);
1556f667aef6SQu Wenruo 	if (!fs_info) {
1557f667aef6SQu Wenruo 		error = -ENOMEM;
1558f667aef6SQu Wenruo 		goto error_sec_opts;
1559f667aef6SQu Wenruo 	}
156004d21a24SIlya Dryomov 
1561450ba0eaSJosef Bacik 	fs_info->fs_devices = fs_devices;
1562450ba0eaSJosef Bacik 
15636c41761fSDavid Sterba 	fs_info->super_copy = kzalloc(BTRFS_SUPER_INFO_SIZE, GFP_NOFS);
15646c41761fSDavid Sterba 	fs_info->super_for_commit = kzalloc(BTRFS_SUPER_INFO_SIZE, GFP_NOFS);
1565f667aef6SQu Wenruo 	security_init_mnt_opts(&fs_info->security_opts);
15666c41761fSDavid Sterba 	if (!fs_info->super_copy || !fs_info->super_for_commit) {
15676c41761fSDavid Sterba 		error = -ENOMEM;
156804d21a24SIlya Dryomov 		goto error_fs_info;
156904d21a24SIlya Dryomov 	}
157004d21a24SIlya Dryomov 
157104d21a24SIlya Dryomov 	error = btrfs_open_devices(fs_devices, mode, fs_type);
157204d21a24SIlya Dryomov 	if (error)
157304d21a24SIlya Dryomov 		goto error_fs_info;
157404d21a24SIlya Dryomov 
157504d21a24SIlya Dryomov 	if (!(flags & MS_RDONLY) && fs_devices->rw_devices == 0) {
157604d21a24SIlya Dryomov 		error = -EACCES;
15776c41761fSDavid Sterba 		goto error_close_devices;
15786c41761fSDavid Sterba 	}
15796c41761fSDavid Sterba 
1580dfe25020SChris Mason 	bdev = fs_devices->latest_bdev;
15819249e17fSDavid Howells 	s = sget(fs_type, btrfs_test_super, btrfs_set_super, flags | MS_NOSEC,
15829249e17fSDavid Howells 		 fs_info);
1583830c4adbSJosef Bacik 	if (IS_ERR(s)) {
1584830c4adbSJosef Bacik 		error = PTR_ERR(s);
1585830c4adbSJosef Bacik 		goto error_close_devices;
1586830c4adbSJosef Bacik 	}
15874b82d6e4SYan 
15884b82d6e4SYan 	if (s->s_root) {
15892b82032cSYan Zheng 		btrfs_close_devices(fs_devices);
15906c41761fSDavid Sterba 		free_fs_info(fs_info);
159159553edfSAl Viro 		if ((flags ^ s->s_flags) & MS_RDONLY)
159259553edfSAl Viro 			error = -EBUSY;
15934b82d6e4SYan 	} else {
1594a1c6f057SDmitry Monakhov 		snprintf(s->s_id, sizeof(s->s_id), "%pg", bdev);
1595815745cfSAl Viro 		btrfs_sb(s)->bdev_holder = fs_type;
15968a4b83ccSChris Mason 		error = btrfs_fill_super(s, fs_devices, data,
15978a4b83ccSChris Mason 					 flags & MS_SILENT ? 1 : 0);
15984b82d6e4SYan 	}
159905dbe683SOmar Sandoval 	if (error) {
1600e15d0542SXin Zhong 		deactivate_locked_super(s);
1601f667aef6SQu Wenruo 		goto error_sec_opts;
1602f667aef6SQu Wenruo 	}
1603f667aef6SQu Wenruo 
1604f667aef6SQu Wenruo 	fs_info = btrfs_sb(s);
1605f667aef6SQu Wenruo 	error = setup_security_options(fs_info, s, &new_sec_opts);
1606f667aef6SQu Wenruo 	if (error) {
1607f667aef6SQu Wenruo 		deactivate_locked_super(s);
1608f667aef6SQu Wenruo 		goto error_sec_opts;
1609f667aef6SQu Wenruo 	}
16104b82d6e4SYan 
161105dbe683SOmar Sandoval 	return dget(s->s_root);
16124b82d6e4SYan 
1613c146afadSYan Zheng error_close_devices:
16148a4b83ccSChris Mason 	btrfs_close_devices(fs_devices);
161504d21a24SIlya Dryomov error_fs_info:
16166c41761fSDavid Sterba 	free_fs_info(fs_info);
1617f667aef6SQu Wenruo error_sec_opts:
1618f667aef6SQu Wenruo 	security_free_mnt_opts(&new_sec_opts);
1619061dbc6bSAl Viro 	return ERR_PTR(error);
16204b82d6e4SYan }
16212e635a27SChris Mason 
16220d2450abSSergei Trofimovich static void btrfs_resize_thread_pool(struct btrfs_fs_info *fs_info,
16230d2450abSSergei Trofimovich 				     int new_pool_size, int old_pool_size)
16240d2450abSSergei Trofimovich {
16250d2450abSSergei Trofimovich 	if (new_pool_size == old_pool_size)
16260d2450abSSergei Trofimovich 		return;
16270d2450abSSergei Trofimovich 
16280d2450abSSergei Trofimovich 	fs_info->thread_pool_size = new_pool_size;
16290d2450abSSergei Trofimovich 
1630efe120a0SFrank Holton 	btrfs_info(fs_info, "resize thread pool %d -> %d",
16310d2450abSSergei Trofimovich 	       old_pool_size, new_pool_size);
16320d2450abSSergei Trofimovich 
16335cdc7ad3SQu Wenruo 	btrfs_workqueue_set_max(fs_info->workers, new_pool_size);
1634afe3d242SQu Wenruo 	btrfs_workqueue_set_max(fs_info->delalloc_workers, new_pool_size);
1635a8c93d4eSQu Wenruo 	btrfs_workqueue_set_max(fs_info->submit_workers, new_pool_size);
1636e66f0bb1SQu Wenruo 	btrfs_workqueue_set_max(fs_info->caching_workers, new_pool_size);
1637fccb5d86SQu Wenruo 	btrfs_workqueue_set_max(fs_info->endio_workers, new_pool_size);
1638fccb5d86SQu Wenruo 	btrfs_workqueue_set_max(fs_info->endio_meta_workers, new_pool_size);
1639fccb5d86SQu Wenruo 	btrfs_workqueue_set_max(fs_info->endio_meta_write_workers,
1640fccb5d86SQu Wenruo 				new_pool_size);
1641fccb5d86SQu Wenruo 	btrfs_workqueue_set_max(fs_info->endio_write_workers, new_pool_size);
1642fccb5d86SQu Wenruo 	btrfs_workqueue_set_max(fs_info->endio_freespace_worker, new_pool_size);
16435b3bc44eSQu Wenruo 	btrfs_workqueue_set_max(fs_info->delayed_workers, new_pool_size);
1644736cfa15SQu Wenruo 	btrfs_workqueue_set_max(fs_info->readahead_workers, new_pool_size);
16450339ef2fSQu Wenruo 	btrfs_workqueue_set_max(fs_info->scrub_wr_completion_workers,
1646ff023aacSStefan Behrens 				new_pool_size);
16470d2450abSSergei Trofimovich }
16480d2450abSSergei Trofimovich 
1649f42a34b2SMiao Xie static inline void btrfs_remount_prepare(struct btrfs_fs_info *fs_info)
1650dc81cdc5SMiao Xie {
1651dc81cdc5SMiao Xie 	set_bit(BTRFS_FS_STATE_REMOUNTING, &fs_info->fs_state);
1652f42a34b2SMiao Xie }
1653dc81cdc5SMiao Xie 
1654f42a34b2SMiao Xie static inline void btrfs_remount_begin(struct btrfs_fs_info *fs_info,
1655f42a34b2SMiao Xie 				       unsigned long old_opts, int flags)
1656f42a34b2SMiao Xie {
1657dc81cdc5SMiao Xie 	if (btrfs_raw_test_opt(old_opts, AUTO_DEFRAG) &&
1658dc81cdc5SMiao Xie 	    (!btrfs_raw_test_opt(fs_info->mount_opt, AUTO_DEFRAG) ||
1659dc81cdc5SMiao Xie 	     (flags & MS_RDONLY))) {
1660dc81cdc5SMiao Xie 		/* wait for any defraggers to finish */
1661dc81cdc5SMiao Xie 		wait_event(fs_info->transaction_wait,
1662dc81cdc5SMiao Xie 			   (atomic_read(&fs_info->defrag_running) == 0));
1663dc81cdc5SMiao Xie 		if (flags & MS_RDONLY)
1664dc81cdc5SMiao Xie 			sync_filesystem(fs_info->sb);
1665dc81cdc5SMiao Xie 	}
1666dc81cdc5SMiao Xie }
1667dc81cdc5SMiao Xie 
1668dc81cdc5SMiao Xie static inline void btrfs_remount_cleanup(struct btrfs_fs_info *fs_info,
1669dc81cdc5SMiao Xie 					 unsigned long old_opts)
1670dc81cdc5SMiao Xie {
1671dc81cdc5SMiao Xie 	/*
1672dc81cdc5SMiao Xie 	 * We need cleanup all defragable inodes if the autodefragment is
1673dc81cdc5SMiao Xie 	 * close or the fs is R/O.
1674dc81cdc5SMiao Xie 	 */
1675dc81cdc5SMiao Xie 	if (btrfs_raw_test_opt(old_opts, AUTO_DEFRAG) &&
1676dc81cdc5SMiao Xie 	    (!btrfs_raw_test_opt(fs_info->mount_opt, AUTO_DEFRAG) ||
1677dc81cdc5SMiao Xie 	     (fs_info->sb->s_flags & MS_RDONLY))) {
1678dc81cdc5SMiao Xie 		btrfs_cleanup_defrag_inodes(fs_info);
1679dc81cdc5SMiao Xie 	}
1680dc81cdc5SMiao Xie 
1681dc81cdc5SMiao Xie 	clear_bit(BTRFS_FS_STATE_REMOUNTING, &fs_info->fs_state);
1682dc81cdc5SMiao Xie }
1683dc81cdc5SMiao Xie 
1684c146afadSYan Zheng static int btrfs_remount(struct super_block *sb, int *flags, char *data)
1685c146afadSYan Zheng {
1686815745cfSAl Viro 	struct btrfs_fs_info *fs_info = btrfs_sb(sb);
1687815745cfSAl Viro 	struct btrfs_root *root = fs_info->tree_root;
168849b25e05SJeff Mahoney 	unsigned old_flags = sb->s_flags;
168949b25e05SJeff Mahoney 	unsigned long old_opts = fs_info->mount_opt;
169049b25e05SJeff Mahoney 	unsigned long old_compress_type = fs_info->compress_type;
169149b25e05SJeff Mahoney 	u64 old_max_inline = fs_info->max_inline;
169249b25e05SJeff Mahoney 	u64 old_alloc_start = fs_info->alloc_start;
169349b25e05SJeff Mahoney 	int old_thread_pool_size = fs_info->thread_pool_size;
169449b25e05SJeff Mahoney 	unsigned int old_metadata_ratio = fs_info->metadata_ratio;
1695c146afadSYan Zheng 	int ret;
1696c146afadSYan Zheng 
169702b9984dSTheodore Ts'o 	sync_filesystem(sb);
1698f42a34b2SMiao Xie 	btrfs_remount_prepare(fs_info);
1699dc81cdc5SMiao Xie 
1700f667aef6SQu Wenruo 	if (data) {
1701f667aef6SQu Wenruo 		struct security_mnt_opts new_sec_opts;
1702f667aef6SQu Wenruo 
1703f667aef6SQu Wenruo 		security_init_mnt_opts(&new_sec_opts);
1704f667aef6SQu Wenruo 		ret = parse_security_options(data, &new_sec_opts);
1705f667aef6SQu Wenruo 		if (ret)
1706f667aef6SQu Wenruo 			goto restore;
1707f667aef6SQu Wenruo 		ret = setup_security_options(fs_info, sb,
1708f667aef6SQu Wenruo 					     &new_sec_opts);
1709f667aef6SQu Wenruo 		if (ret) {
1710f667aef6SQu Wenruo 			security_free_mnt_opts(&new_sec_opts);
1711f667aef6SQu Wenruo 			goto restore;
1712f667aef6SQu Wenruo 		}
1713f667aef6SQu Wenruo 	}
1714f667aef6SQu Wenruo 
171596da0919SQu Wenruo 	ret = btrfs_parse_options(root, data, *flags);
171649b25e05SJeff Mahoney 	if (ret) {
171749b25e05SJeff Mahoney 		ret = -EINVAL;
171849b25e05SJeff Mahoney 		goto restore;
171949b25e05SJeff Mahoney 	}
1720b288052eSChris Mason 
1721f42a34b2SMiao Xie 	btrfs_remount_begin(fs_info, old_opts, *flags);
17220d2450abSSergei Trofimovich 	btrfs_resize_thread_pool(fs_info,
17230d2450abSSergei Trofimovich 		fs_info->thread_pool_size, old_thread_pool_size);
17240d2450abSSergei Trofimovich 
1725c146afadSYan Zheng 	if ((*flags & MS_RDONLY) == (sb->s_flags & MS_RDONLY))
1726dc81cdc5SMiao Xie 		goto out;
1727c146afadSYan Zheng 
1728c146afadSYan Zheng 	if (*flags & MS_RDONLY) {
17298dabb742SStefan Behrens 		/*
17308dabb742SStefan Behrens 		 * this also happens on 'umount -rf' or on shutdown, when
17318dabb742SStefan Behrens 		 * the filesystem is busy.
17328dabb742SStefan Behrens 		 */
173321c7e756SMiao Xie 		cancel_work_sync(&fs_info->async_reclaim_work);
1734361c093dSStefan Behrens 
1735361c093dSStefan Behrens 		/* wait for the uuid_scan task to finish */
1736361c093dSStefan Behrens 		down(&fs_info->uuid_tree_rescan_sem);
1737361c093dSStefan Behrens 		/* avoid complains from lockdep et al. */
1738361c093dSStefan Behrens 		up(&fs_info->uuid_tree_rescan_sem);
1739361c093dSStefan Behrens 
1740c146afadSYan Zheng 		sb->s_flags |= MS_RDONLY;
1741c146afadSYan Zheng 
1742e44163e1SJeff Mahoney 		/*
1743e44163e1SJeff Mahoney 		 * Setting MS_RDONLY will put the cleaner thread to
1744e44163e1SJeff Mahoney 		 * sleep at the next loop if it's already active.
1745e44163e1SJeff Mahoney 		 * If it's already asleep, we'll leave unused block
1746e44163e1SJeff Mahoney 		 * groups on disk until we're mounted read-write again
1747e44163e1SJeff Mahoney 		 * unless we clean them up here.
1748e44163e1SJeff Mahoney 		 */
1749e44163e1SJeff Mahoney 		btrfs_delete_unused_bgs(fs_info);
1750e44163e1SJeff Mahoney 
17518dabb742SStefan Behrens 		btrfs_dev_replace_suspend_for_unmount(fs_info);
17528dabb742SStefan Behrens 		btrfs_scrub_cancel(fs_info);
1753061594efSMiao Xie 		btrfs_pause_balance(fs_info);
17548dabb742SStefan Behrens 
1755c146afadSYan Zheng 		ret = btrfs_commit_super(root);
175649b25e05SJeff Mahoney 		if (ret)
175749b25e05SJeff Mahoney 			goto restore;
1758c146afadSYan Zheng 	} else {
17596ef3de9cSDavid Sterba 		if (test_bit(BTRFS_FS_STATE_ERROR, &root->fs_info->fs_state)) {
17606ef3de9cSDavid Sterba 			btrfs_err(fs_info,
1761efe120a0SFrank Holton 				"Remounting read-write after error is not allowed");
17626ef3de9cSDavid Sterba 			ret = -EINVAL;
17636ef3de9cSDavid Sterba 			goto restore;
17646ef3de9cSDavid Sterba 		}
17658a3db184SSergei Trofimovich 		if (fs_info->fs_devices->rw_devices == 0) {
176649b25e05SJeff Mahoney 			ret = -EACCES;
176749b25e05SJeff Mahoney 			goto restore;
17688a3db184SSergei Trofimovich 		}
17692b82032cSYan Zheng 
1770292fd7fcSStefan Behrens 		if (fs_info->fs_devices->missing_devices >
1771292fd7fcSStefan Behrens 		     fs_info->num_tolerated_disk_barrier_failures &&
1772292fd7fcSStefan Behrens 		    !(*flags & MS_RDONLY)) {
1773efe120a0SFrank Holton 			btrfs_warn(fs_info,
1774efe120a0SFrank Holton 				"too many missing devices, writeable remount is not allowed");
1775292fd7fcSStefan Behrens 			ret = -EACCES;
1776292fd7fcSStefan Behrens 			goto restore;
1777292fd7fcSStefan Behrens 		}
1778292fd7fcSStefan Behrens 
17798a3db184SSergei Trofimovich 		if (btrfs_super_log_root(fs_info->super_copy) != 0) {
178049b25e05SJeff Mahoney 			ret = -EINVAL;
178149b25e05SJeff Mahoney 			goto restore;
17828a3db184SSergei Trofimovich 		}
1783c146afadSYan Zheng 
1784815745cfSAl Viro 		ret = btrfs_cleanup_fs_roots(fs_info);
178549b25e05SJeff Mahoney 		if (ret)
178649b25e05SJeff Mahoney 			goto restore;
1787c146afadSYan Zheng 
1788d68fc57bSYan, Zheng 		/* recover relocation */
17895f316481SWang Shilong 		mutex_lock(&fs_info->cleaner_mutex);
1790d68fc57bSYan, Zheng 		ret = btrfs_recover_relocation(root);
17915f316481SWang Shilong 		mutex_unlock(&fs_info->cleaner_mutex);
179249b25e05SJeff Mahoney 		if (ret)
179349b25e05SJeff Mahoney 			goto restore;
1794c146afadSYan Zheng 
17952b6ba629SIlya Dryomov 		ret = btrfs_resume_balance_async(fs_info);
17962b6ba629SIlya Dryomov 		if (ret)
17972b6ba629SIlya Dryomov 			goto restore;
17982b6ba629SIlya Dryomov 
17998dabb742SStefan Behrens 		ret = btrfs_resume_dev_replace_async(fs_info);
18008dabb742SStefan Behrens 		if (ret) {
1801efe120a0SFrank Holton 			btrfs_warn(fs_info, "failed to resume dev_replace");
18028dabb742SStefan Behrens 			goto restore;
18038dabb742SStefan Behrens 		}
180494aebfb2SJosef Bacik 
180594aebfb2SJosef Bacik 		if (!fs_info->uuid_root) {
1806efe120a0SFrank Holton 			btrfs_info(fs_info, "creating UUID tree");
180794aebfb2SJosef Bacik 			ret = btrfs_create_uuid_tree(fs_info);
180894aebfb2SJosef Bacik 			if (ret) {
1809efe120a0SFrank Holton 				btrfs_warn(fs_info, "failed to create the UUID tree %d", ret);
181094aebfb2SJosef Bacik 				goto restore;
181194aebfb2SJosef Bacik 			}
181294aebfb2SJosef Bacik 		}
1813c146afadSYan Zheng 		sb->s_flags &= ~MS_RDONLY;
1814c146afadSYan Zheng 	}
1815dc81cdc5SMiao Xie out:
18162c6a92b0SJustin Maggard 	wake_up_process(fs_info->transaction_kthread);
1817dc81cdc5SMiao Xie 	btrfs_remount_cleanup(fs_info, old_opts);
1818c146afadSYan Zheng 	return 0;
181949b25e05SJeff Mahoney 
182049b25e05SJeff Mahoney restore:
182149b25e05SJeff Mahoney 	/* We've hit an error - don't reset MS_RDONLY */
182249b25e05SJeff Mahoney 	if (sb->s_flags & MS_RDONLY)
182349b25e05SJeff Mahoney 		old_flags |= MS_RDONLY;
182449b25e05SJeff Mahoney 	sb->s_flags = old_flags;
182549b25e05SJeff Mahoney 	fs_info->mount_opt = old_opts;
182649b25e05SJeff Mahoney 	fs_info->compress_type = old_compress_type;
182749b25e05SJeff Mahoney 	fs_info->max_inline = old_max_inline;
1828c018daecSMiao Xie 	mutex_lock(&fs_info->chunk_mutex);
182949b25e05SJeff Mahoney 	fs_info->alloc_start = old_alloc_start;
1830c018daecSMiao Xie 	mutex_unlock(&fs_info->chunk_mutex);
18310d2450abSSergei Trofimovich 	btrfs_resize_thread_pool(fs_info,
18320d2450abSSergei Trofimovich 		old_thread_pool_size, fs_info->thread_pool_size);
183349b25e05SJeff Mahoney 	fs_info->metadata_ratio = old_metadata_ratio;
1834dc81cdc5SMiao Xie 	btrfs_remount_cleanup(fs_info, old_opts);
183549b25e05SJeff Mahoney 	return ret;
1836c146afadSYan Zheng }
1837c146afadSYan Zheng 
1838bcd53741SArne Jansen /* Used to sort the devices by max_avail(descending sort) */
1839bcd53741SArne Jansen static int btrfs_cmp_device_free_bytes(const void *dev_info1,
1840bcd53741SArne Jansen 				       const void *dev_info2)
1841bcd53741SArne Jansen {
1842bcd53741SArne Jansen 	if (((struct btrfs_device_info *)dev_info1)->max_avail >
1843bcd53741SArne Jansen 	    ((struct btrfs_device_info *)dev_info2)->max_avail)
1844bcd53741SArne Jansen 		return -1;
1845bcd53741SArne Jansen 	else if (((struct btrfs_device_info *)dev_info1)->max_avail <
1846bcd53741SArne Jansen 		 ((struct btrfs_device_info *)dev_info2)->max_avail)
1847bcd53741SArne Jansen 		return 1;
1848bcd53741SArne Jansen 	else
1849bcd53741SArne Jansen 	return 0;
1850bcd53741SArne Jansen }
1851bcd53741SArne Jansen 
1852bcd53741SArne Jansen /*
1853bcd53741SArne Jansen  * sort the devices by max_avail, in which max free extent size of each device
1854bcd53741SArne Jansen  * is stored.(Descending Sort)
1855bcd53741SArne Jansen  */
1856bcd53741SArne Jansen static inline void btrfs_descending_sort_devices(
1857bcd53741SArne Jansen 					struct btrfs_device_info *devices,
1858bcd53741SArne Jansen 					size_t nr_devices)
1859bcd53741SArne Jansen {
1860bcd53741SArne Jansen 	sort(devices, nr_devices, sizeof(struct btrfs_device_info),
1861bcd53741SArne Jansen 	     btrfs_cmp_device_free_bytes, NULL);
1862bcd53741SArne Jansen }
1863bcd53741SArne Jansen 
18646d07bcecSMiao Xie /*
18656d07bcecSMiao Xie  * The helper to calc the free space on the devices that can be used to store
18666d07bcecSMiao Xie  * file data.
18676d07bcecSMiao Xie  */
18686d07bcecSMiao Xie static int btrfs_calc_avail_data_space(struct btrfs_root *root, u64 *free_bytes)
18696d07bcecSMiao Xie {
18706d07bcecSMiao Xie 	struct btrfs_fs_info *fs_info = root->fs_info;
18716d07bcecSMiao Xie 	struct btrfs_device_info *devices_info;
18726d07bcecSMiao Xie 	struct btrfs_fs_devices *fs_devices = fs_info->fs_devices;
18736d07bcecSMiao Xie 	struct btrfs_device *device;
18746d07bcecSMiao Xie 	u64 skip_space;
18756d07bcecSMiao Xie 	u64 type;
18766d07bcecSMiao Xie 	u64 avail_space;
18776d07bcecSMiao Xie 	u64 used_space;
18786d07bcecSMiao Xie 	u64 min_stripe_size;
187939fb26c3SMiao Xie 	int min_stripes = 1, num_stripes = 1;
18806d07bcecSMiao Xie 	int i = 0, nr_devices;
18816d07bcecSMiao Xie 	int ret;
18826d07bcecSMiao Xie 
18837e33fd99SJosef Bacik 	/*
18847e33fd99SJosef Bacik 	 * We aren't under the device list lock, so this is racey-ish, but good
18857e33fd99SJosef Bacik 	 * enough for our purposes.
18867e33fd99SJosef Bacik 	 */
1887b772a86eSLi Zefan 	nr_devices = fs_info->fs_devices->open_devices;
18887e33fd99SJosef Bacik 	if (!nr_devices) {
18897e33fd99SJosef Bacik 		smp_mb();
18907e33fd99SJosef Bacik 		nr_devices = fs_info->fs_devices->open_devices;
18917e33fd99SJosef Bacik 		ASSERT(nr_devices);
18927e33fd99SJosef Bacik 		if (!nr_devices) {
18937e33fd99SJosef Bacik 			*free_bytes = 0;
18947e33fd99SJosef Bacik 			return 0;
18957e33fd99SJosef Bacik 		}
18967e33fd99SJosef Bacik 	}
18976d07bcecSMiao Xie 
1898d9b0d9baSDulshani Gunawardhana 	devices_info = kmalloc_array(nr_devices, sizeof(*devices_info),
18996d07bcecSMiao Xie 			       GFP_NOFS);
19006d07bcecSMiao Xie 	if (!devices_info)
19016d07bcecSMiao Xie 		return -ENOMEM;
19026d07bcecSMiao Xie 
19036d07bcecSMiao Xie 	/* calc min stripe number for data space alloction */
19046d07bcecSMiao Xie 	type = btrfs_get_alloc_profile(root, 1);
190539fb26c3SMiao Xie 	if (type & BTRFS_BLOCK_GROUP_RAID0) {
19066d07bcecSMiao Xie 		min_stripes = 2;
190739fb26c3SMiao Xie 		num_stripes = nr_devices;
190839fb26c3SMiao Xie 	} else if (type & BTRFS_BLOCK_GROUP_RAID1) {
19096d07bcecSMiao Xie 		min_stripes = 2;
191039fb26c3SMiao Xie 		num_stripes = 2;
191139fb26c3SMiao Xie 	} else if (type & BTRFS_BLOCK_GROUP_RAID10) {
19126d07bcecSMiao Xie 		min_stripes = 4;
191339fb26c3SMiao Xie 		num_stripes = 4;
191439fb26c3SMiao Xie 	}
19156d07bcecSMiao Xie 
19166d07bcecSMiao Xie 	if (type & BTRFS_BLOCK_GROUP_DUP)
19176d07bcecSMiao Xie 		min_stripe_size = 2 * BTRFS_STRIPE_LEN;
19186d07bcecSMiao Xie 	else
19196d07bcecSMiao Xie 		min_stripe_size = BTRFS_STRIPE_LEN;
19206d07bcecSMiao Xie 
19217e33fd99SJosef Bacik 	if (fs_info->alloc_start)
19227e33fd99SJosef Bacik 		mutex_lock(&fs_devices->device_list_mutex);
19237e33fd99SJosef Bacik 	rcu_read_lock();
19247e33fd99SJosef Bacik 	list_for_each_entry_rcu(device, &fs_devices->devices, dev_list) {
192563a212abSStefan Behrens 		if (!device->in_fs_metadata || !device->bdev ||
192663a212abSStefan Behrens 		    device->is_tgtdev_for_dev_replace)
19276d07bcecSMiao Xie 			continue;
19286d07bcecSMiao Xie 
19297e33fd99SJosef Bacik 		if (i >= nr_devices)
19307e33fd99SJosef Bacik 			break;
19317e33fd99SJosef Bacik 
19326d07bcecSMiao Xie 		avail_space = device->total_bytes - device->bytes_used;
19336d07bcecSMiao Xie 
19346d07bcecSMiao Xie 		/* align with stripe_len */
1935f8c269d7SDavid Sterba 		avail_space = div_u64(avail_space, BTRFS_STRIPE_LEN);
19366d07bcecSMiao Xie 		avail_space *= BTRFS_STRIPE_LEN;
19376d07bcecSMiao Xie 
19386d07bcecSMiao Xie 		/*
19396d07bcecSMiao Xie 		 * In order to avoid overwritting the superblock on the drive,
19406d07bcecSMiao Xie 		 * btrfs starts at an offset of at least 1MB when doing chunk
19416d07bcecSMiao Xie 		 * allocation.
19426d07bcecSMiao Xie 		 */
1943ee22184bSByongho Lee 		skip_space = SZ_1M;
19446d07bcecSMiao Xie 
19456d07bcecSMiao Xie 		/* user can set the offset in fs_info->alloc_start. */
19467e33fd99SJosef Bacik 		if (fs_info->alloc_start &&
19477e33fd99SJosef Bacik 		    fs_info->alloc_start + BTRFS_STRIPE_LEN <=
19487e33fd99SJosef Bacik 		    device->total_bytes) {
19497e33fd99SJosef Bacik 			rcu_read_unlock();
19506d07bcecSMiao Xie 			skip_space = max(fs_info->alloc_start, skip_space);
19516d07bcecSMiao Xie 
19526d07bcecSMiao Xie 			/*
19537e33fd99SJosef Bacik 			 * btrfs can not use the free space in
19547e33fd99SJosef Bacik 			 * [0, skip_space - 1], we must subtract it from the
19557e33fd99SJosef Bacik 			 * total. In order to implement it, we account the used
19567e33fd99SJosef Bacik 			 * space in this range first.
19576d07bcecSMiao Xie 			 */
19587e33fd99SJosef Bacik 			ret = btrfs_account_dev_extents_size(device, 0,
19597e33fd99SJosef Bacik 							     skip_space - 1,
19606d07bcecSMiao Xie 							     &used_space);
19616d07bcecSMiao Xie 			if (ret) {
19626d07bcecSMiao Xie 				kfree(devices_info);
19637e33fd99SJosef Bacik 				mutex_unlock(&fs_devices->device_list_mutex);
19646d07bcecSMiao Xie 				return ret;
19656d07bcecSMiao Xie 			}
19666d07bcecSMiao Xie 
19677e33fd99SJosef Bacik 			rcu_read_lock();
19687e33fd99SJosef Bacik 
19696d07bcecSMiao Xie 			/* calc the free space in [0, skip_space - 1] */
19706d07bcecSMiao Xie 			skip_space -= used_space;
19717e33fd99SJosef Bacik 		}
19726d07bcecSMiao Xie 
19736d07bcecSMiao Xie 		/*
19746d07bcecSMiao Xie 		 * we can use the free space in [0, skip_space - 1], subtract
19756d07bcecSMiao Xie 		 * it from the total.
19766d07bcecSMiao Xie 		 */
19776d07bcecSMiao Xie 		if (avail_space && avail_space >= skip_space)
19786d07bcecSMiao Xie 			avail_space -= skip_space;
19796d07bcecSMiao Xie 		else
19806d07bcecSMiao Xie 			avail_space = 0;
19816d07bcecSMiao Xie 
19826d07bcecSMiao Xie 		if (avail_space < min_stripe_size)
19836d07bcecSMiao Xie 			continue;
19846d07bcecSMiao Xie 
19856d07bcecSMiao Xie 		devices_info[i].dev = device;
19866d07bcecSMiao Xie 		devices_info[i].max_avail = avail_space;
19876d07bcecSMiao Xie 
19886d07bcecSMiao Xie 		i++;
19896d07bcecSMiao Xie 	}
19907e33fd99SJosef Bacik 	rcu_read_unlock();
19917e33fd99SJosef Bacik 	if (fs_info->alloc_start)
19927e33fd99SJosef Bacik 		mutex_unlock(&fs_devices->device_list_mutex);
19936d07bcecSMiao Xie 
19946d07bcecSMiao Xie 	nr_devices = i;
19956d07bcecSMiao Xie 
19966d07bcecSMiao Xie 	btrfs_descending_sort_devices(devices_info, nr_devices);
19976d07bcecSMiao Xie 
19986d07bcecSMiao Xie 	i = nr_devices - 1;
19996d07bcecSMiao Xie 	avail_space = 0;
20006d07bcecSMiao Xie 	while (nr_devices >= min_stripes) {
200139fb26c3SMiao Xie 		if (num_stripes > nr_devices)
200239fb26c3SMiao Xie 			num_stripes = nr_devices;
200339fb26c3SMiao Xie 
20046d07bcecSMiao Xie 		if (devices_info[i].max_avail >= min_stripe_size) {
20056d07bcecSMiao Xie 			int j;
20066d07bcecSMiao Xie 			u64 alloc_size;
20076d07bcecSMiao Xie 
200839fb26c3SMiao Xie 			avail_space += devices_info[i].max_avail * num_stripes;
20096d07bcecSMiao Xie 			alloc_size = devices_info[i].max_avail;
201039fb26c3SMiao Xie 			for (j = i + 1 - num_stripes; j <= i; j++)
20116d07bcecSMiao Xie 				devices_info[j].max_avail -= alloc_size;
20126d07bcecSMiao Xie 		}
20136d07bcecSMiao Xie 		i--;
20146d07bcecSMiao Xie 		nr_devices--;
20156d07bcecSMiao Xie 	}
20166d07bcecSMiao Xie 
20176d07bcecSMiao Xie 	kfree(devices_info);
20186d07bcecSMiao Xie 	*free_bytes = avail_space;
20196d07bcecSMiao Xie 	return 0;
20206d07bcecSMiao Xie }
20216d07bcecSMiao Xie 
2022ba7b6e62SDavid Sterba /*
2023ba7b6e62SDavid Sterba  * Calculate numbers for 'df', pessimistic in case of mixed raid profiles.
2024ba7b6e62SDavid Sterba  *
2025ba7b6e62SDavid Sterba  * If there's a redundant raid level at DATA block groups, use the respective
2026ba7b6e62SDavid Sterba  * multiplier to scale the sizes.
2027ba7b6e62SDavid Sterba  *
2028ba7b6e62SDavid Sterba  * Unused device space usage is based on simulating the chunk allocator
2029ba7b6e62SDavid Sterba  * algorithm that respects the device sizes, order of allocations and the
2030ba7b6e62SDavid Sterba  * 'alloc_start' value, this is a close approximation of the actual use but
2031ba7b6e62SDavid Sterba  * there are other factors that may change the result (like a new metadata
2032ba7b6e62SDavid Sterba  * chunk).
2033ba7b6e62SDavid Sterba  *
2034ca8a51b3SDavid Sterba  * If metadata is exhausted, f_bavail will be 0.
2035ca8a51b3SDavid Sterba  *
2036ba7b6e62SDavid Sterba  * FIXME: not accurate for mixed block groups, total and free/used are ok,
2037ba7b6e62SDavid Sterba  * available appears slightly larger.
2038ba7b6e62SDavid Sterba  */
20398fd17795SChris Mason static int btrfs_statfs(struct dentry *dentry, struct kstatfs *buf)
20408fd17795SChris Mason {
2041815745cfSAl Viro 	struct btrfs_fs_info *fs_info = btrfs_sb(dentry->d_sb);
2042815745cfSAl Viro 	struct btrfs_super_block *disk_super = fs_info->super_copy;
2043815745cfSAl Viro 	struct list_head *head = &fs_info->space_info;
2044bd4d1088SJosef Bacik 	struct btrfs_space_info *found;
2045bd4d1088SJosef Bacik 	u64 total_used = 0;
20466d07bcecSMiao Xie 	u64 total_free_data = 0;
2047ca8a51b3SDavid Sterba 	u64 total_free_meta = 0;
2048db94535dSChris Mason 	int bits = dentry->d_sb->s_blocksize_bits;
2049815745cfSAl Viro 	__be32 *fsid = (__be32 *)fs_info->fsid;
2050ba7b6e62SDavid Sterba 	unsigned factor = 1;
2051ba7b6e62SDavid Sterba 	struct btrfs_block_rsv *block_rsv = &fs_info->global_block_rsv;
20526d07bcecSMiao Xie 	int ret;
2053ca8a51b3SDavid Sterba 	u64 thresh = 0;
20548fd17795SChris Mason 
205515484377SMiao Xie 	/*
205615484377SMiao Xie 	 * holding chunk_muext to avoid allocating new chunks, holding
205715484377SMiao Xie 	 * device_list_mutex to avoid the device being removed
205815484377SMiao Xie 	 */
2059bd4d1088SJosef Bacik 	rcu_read_lock();
206089a55897SJosef Bacik 	list_for_each_entry_rcu(found, head, list) {
20616d07bcecSMiao Xie 		if (found->flags & BTRFS_BLOCK_GROUP_DATA) {
2062ba7b6e62SDavid Sterba 			int i;
2063ba7b6e62SDavid Sterba 
20646d07bcecSMiao Xie 			total_free_data += found->disk_total - found->disk_used;
20656d07bcecSMiao Xie 			total_free_data -=
20666d07bcecSMiao Xie 				btrfs_account_ro_block_groups_free_space(found);
2067ba7b6e62SDavid Sterba 
2068ba7b6e62SDavid Sterba 			for (i = 0; i < BTRFS_NR_RAID_TYPES; i++) {
2069ba7b6e62SDavid Sterba 				if (!list_empty(&found->block_groups[i])) {
2070ba7b6e62SDavid Sterba 					switch (i) {
2071ba7b6e62SDavid Sterba 					case BTRFS_RAID_DUP:
2072ba7b6e62SDavid Sterba 					case BTRFS_RAID_RAID1:
2073ba7b6e62SDavid Sterba 					case BTRFS_RAID_RAID10:
2074ba7b6e62SDavid Sterba 						factor = 2;
2075ba7b6e62SDavid Sterba 					}
2076ba7b6e62SDavid Sterba 				}
2077ba7b6e62SDavid Sterba 			}
20786d07bcecSMiao Xie 		}
2079ca8a51b3SDavid Sterba 		if (found->flags & BTRFS_BLOCK_GROUP_METADATA)
2080ca8a51b3SDavid Sterba 			total_free_meta += found->disk_total - found->disk_used;
20816d07bcecSMiao Xie 
2082b742bb82SYan, Zheng 		total_used += found->disk_used;
208389a55897SJosef Bacik 	}
2084ba7b6e62SDavid Sterba 
2085bd4d1088SJosef Bacik 	rcu_read_unlock();
2086bd4d1088SJosef Bacik 
2087ba7b6e62SDavid Sterba 	buf->f_blocks = div_u64(btrfs_super_total_bytes(disk_super), factor);
2088ba7b6e62SDavid Sterba 	buf->f_blocks >>= bits;
2089ba7b6e62SDavid Sterba 	buf->f_bfree = buf->f_blocks - (div_u64(total_used, factor) >> bits);
2090ba7b6e62SDavid Sterba 
2091ba7b6e62SDavid Sterba 	/* Account global block reserve as used, it's in logical size already */
2092ba7b6e62SDavid Sterba 	spin_lock(&block_rsv->lock);
2093ba7b6e62SDavid Sterba 	buf->f_bfree -= block_rsv->size >> bits;
2094ba7b6e62SDavid Sterba 	spin_unlock(&block_rsv->lock);
2095ba7b6e62SDavid Sterba 
20960d95c1beSDavid Sterba 	buf->f_bavail = div_u64(total_free_data, factor);
2097815745cfSAl Viro 	ret = btrfs_calc_avail_data_space(fs_info->tree_root, &total_free_data);
20987e33fd99SJosef Bacik 	if (ret)
20996d07bcecSMiao Xie 		return ret;
2100ba7b6e62SDavid Sterba 	buf->f_bavail += div_u64(total_free_data, factor);
21016d07bcecSMiao Xie 	buf->f_bavail = buf->f_bavail >> bits;
2102d397712bSChris Mason 
2103ca8a51b3SDavid Sterba 	/*
2104ca8a51b3SDavid Sterba 	 * We calculate the remaining metadata space minus global reserve. If
2105ca8a51b3SDavid Sterba 	 * this is (supposedly) smaller than zero, there's no space. But this
2106ca8a51b3SDavid Sterba 	 * does not hold in practice, the exhausted state happens where's still
2107ca8a51b3SDavid Sterba 	 * some positive delta. So we apply some guesswork and compare the
2108ca8a51b3SDavid Sterba 	 * delta to a 4M threshold.  (Practically observed delta was ~2M.)
2109ca8a51b3SDavid Sterba 	 *
2110ca8a51b3SDavid Sterba 	 * We probably cannot calculate the exact threshold value because this
2111ca8a51b3SDavid Sterba 	 * depends on the internal reservations requested by various
2112ca8a51b3SDavid Sterba 	 * operations, so some operations that consume a few metadata will
2113ca8a51b3SDavid Sterba 	 * succeed even if the Avail is zero. But this is better than the other
2114ca8a51b3SDavid Sterba 	 * way around.
2115ca8a51b3SDavid Sterba 	 */
2116ca8a51b3SDavid Sterba 	thresh = 4 * 1024 * 1024;
2117ca8a51b3SDavid Sterba 
2118ca8a51b3SDavid Sterba 	if (total_free_meta - thresh < block_rsv->size)
2119ca8a51b3SDavid Sterba 		buf->f_bavail = 0;
2120ca8a51b3SDavid Sterba 
2121ba7b6e62SDavid Sterba 	buf->f_type = BTRFS_SUPER_MAGIC;
2122ba7b6e62SDavid Sterba 	buf->f_bsize = dentry->d_sb->s_blocksize;
2123ba7b6e62SDavid Sterba 	buf->f_namelen = BTRFS_NAME_LEN;
2124ba7b6e62SDavid Sterba 
21259d03632eSDavid Woodhouse 	/* We treat it as constant endianness (it doesn't matter _which_)
21269d03632eSDavid Woodhouse 	   because we want the fsid to come out the same whether mounted
21279d03632eSDavid Woodhouse 	   on a big-endian or little-endian host */
21289d03632eSDavid Woodhouse 	buf->f_fsid.val[0] = be32_to_cpu(fsid[0]) ^ be32_to_cpu(fsid[2]);
21299d03632eSDavid Woodhouse 	buf->f_fsid.val[1] = be32_to_cpu(fsid[1]) ^ be32_to_cpu(fsid[3]);
213032d48fa1SDavid Woodhouse 	/* Mask in the root object ID too, to disambiguate subvols */
21312b0143b5SDavid Howells 	buf->f_fsid.val[0] ^= BTRFS_I(d_inode(dentry))->root->objectid >> 32;
21322b0143b5SDavid Howells 	buf->f_fsid.val[1] ^= BTRFS_I(d_inode(dentry))->root->objectid;
213332d48fa1SDavid Woodhouse 
21348fd17795SChris Mason 	return 0;
21358fd17795SChris Mason }
2136b5133862SChris Mason 
2137aea52e19SAl Viro static void btrfs_kill_super(struct super_block *sb)
2138aea52e19SAl Viro {
2139815745cfSAl Viro 	struct btrfs_fs_info *fs_info = btrfs_sb(sb);
2140aea52e19SAl Viro 	kill_anon_super(sb);
2141aea52e19SAl Viro 	free_fs_info(fs_info);
2142aea52e19SAl Viro }
2143aea52e19SAl Viro 
21442e635a27SChris Mason static struct file_system_type btrfs_fs_type = {
21452e635a27SChris Mason 	.owner		= THIS_MODULE,
21462e635a27SChris Mason 	.name		= "btrfs",
2147061dbc6bSAl Viro 	.mount		= btrfs_mount,
2148aea52e19SAl Viro 	.kill_sb	= btrfs_kill_super,
2149f667aef6SQu Wenruo 	.fs_flags	= FS_REQUIRES_DEV | FS_BINARY_MOUNTDATA,
21502e635a27SChris Mason };
21517f78e035SEric W. Biederman MODULE_ALIAS_FS("btrfs");
2152a9218f6bSChris Mason 
2153d8620958STom Van Braeckel static int btrfs_control_open(struct inode *inode, struct file *file)
2154d8620958STom Van Braeckel {
2155d8620958STom Van Braeckel 	/*
2156d8620958STom Van Braeckel 	 * The control file's private_data is used to hold the
2157d8620958STom Van Braeckel 	 * transaction when it is started and is used to keep
2158d8620958STom Van Braeckel 	 * track of whether a transaction is already in progress.
2159d8620958STom Van Braeckel 	 */
2160d8620958STom Van Braeckel 	file->private_data = NULL;
2161d8620958STom Van Braeckel 	return 0;
2162d8620958STom Van Braeckel }
2163d8620958STom Van Braeckel 
2164d352ac68SChris Mason /*
2165d352ac68SChris Mason  * used by btrfsctl to scan devices when no FS is mounted
2166d352ac68SChris Mason  */
21678a4b83ccSChris Mason static long btrfs_control_ioctl(struct file *file, unsigned int cmd,
21688a4b83ccSChris Mason 				unsigned long arg)
21698a4b83ccSChris Mason {
21708a4b83ccSChris Mason 	struct btrfs_ioctl_vol_args *vol;
21718a4b83ccSChris Mason 	struct btrfs_fs_devices *fs_devices;
2172c071fcfdSChris Mason 	int ret = -ENOTTY;
21738a4b83ccSChris Mason 
2174e441d54dSChris Mason 	if (!capable(CAP_SYS_ADMIN))
2175e441d54dSChris Mason 		return -EPERM;
2176e441d54dSChris Mason 
2177dae7b665SLi Zefan 	vol = memdup_user((void __user *)arg, sizeof(*vol));
2178dae7b665SLi Zefan 	if (IS_ERR(vol))
2179dae7b665SLi Zefan 		return PTR_ERR(vol);
2180c071fcfdSChris Mason 
21818a4b83ccSChris Mason 	switch (cmd) {
21828a4b83ccSChris Mason 	case BTRFS_IOC_SCAN_DEV:
218397288f2cSChristoph Hellwig 		ret = btrfs_scan_one_device(vol->name, FMODE_READ,
21848a4b83ccSChris Mason 					    &btrfs_fs_type, &fs_devices);
21858a4b83ccSChris Mason 		break;
218602db0844SJosef Bacik 	case BTRFS_IOC_DEVICES_READY:
218702db0844SJosef Bacik 		ret = btrfs_scan_one_device(vol->name, FMODE_READ,
218802db0844SJosef Bacik 					    &btrfs_fs_type, &fs_devices);
218902db0844SJosef Bacik 		if (ret)
219002db0844SJosef Bacik 			break;
219102db0844SJosef Bacik 		ret = !(fs_devices->num_devices == fs_devices->total_devices);
219202db0844SJosef Bacik 		break;
2193c5868f83SDavid Sterba 	case BTRFS_IOC_GET_SUPPORTED_FEATURES:
2194d5131b65SDavid Sterba 		ret = btrfs_ioctl_get_supported_features((void __user*)arg);
2195c5868f83SDavid Sterba 		break;
21968a4b83ccSChris Mason 	}
2197dae7b665SLi Zefan 
21988a4b83ccSChris Mason 	kfree(vol);
2199f819d837SLinda Knippers 	return ret;
22008a4b83ccSChris Mason }
22018a4b83ccSChris Mason 
22020176260fSLinus Torvalds static int btrfs_freeze(struct super_block *sb)
2203ed0dab6bSYan {
2204354aa0fbSMiao Xie 	struct btrfs_trans_handle *trans;
2205354aa0fbSMiao Xie 	struct btrfs_root *root = btrfs_sb(sb)->tree_root;
2206354aa0fbSMiao Xie 
2207d4edf39bSMiao Xie 	trans = btrfs_attach_transaction_barrier(root);
2208354aa0fbSMiao Xie 	if (IS_ERR(trans)) {
2209354aa0fbSMiao Xie 		/* no transaction, don't bother */
2210354aa0fbSMiao Xie 		if (PTR_ERR(trans) == -ENOENT)
22110176260fSLinus Torvalds 			return 0;
2212354aa0fbSMiao Xie 		return PTR_ERR(trans);
2213354aa0fbSMiao Xie 	}
2214354aa0fbSMiao Xie 	return btrfs_commit_transaction(trans, root);
2215ed0dab6bSYan }
2216ed0dab6bSYan 
22179c5085c1SJosef Bacik static int btrfs_show_devname(struct seq_file *m, struct dentry *root)
22189c5085c1SJosef Bacik {
22199c5085c1SJosef Bacik 	struct btrfs_fs_info *fs_info = btrfs_sb(root->d_sb);
22209c5085c1SJosef Bacik 	struct btrfs_fs_devices *cur_devices;
22219c5085c1SJosef Bacik 	struct btrfs_device *dev, *first_dev = NULL;
22229c5085c1SJosef Bacik 	struct list_head *head;
22239c5085c1SJosef Bacik 	struct rcu_string *name;
22249c5085c1SJosef Bacik 
22259c5085c1SJosef Bacik 	mutex_lock(&fs_info->fs_devices->device_list_mutex);
22269c5085c1SJosef Bacik 	cur_devices = fs_info->fs_devices;
22279c5085c1SJosef Bacik 	while (cur_devices) {
22289c5085c1SJosef Bacik 		head = &cur_devices->devices;
22299c5085c1SJosef Bacik 		list_for_each_entry(dev, head, dev_list) {
2230aa9ddcd4SJosef Bacik 			if (dev->missing)
2231aa9ddcd4SJosef Bacik 				continue;
22320aeb8a6eSAnand Jain 			if (!dev->name)
22330aeb8a6eSAnand Jain 				continue;
22349c5085c1SJosef Bacik 			if (!first_dev || dev->devid < first_dev->devid)
22359c5085c1SJosef Bacik 				first_dev = dev;
22369c5085c1SJosef Bacik 		}
22379c5085c1SJosef Bacik 		cur_devices = cur_devices->seed;
22389c5085c1SJosef Bacik 	}
22399c5085c1SJosef Bacik 
22409c5085c1SJosef Bacik 	if (first_dev) {
22419c5085c1SJosef Bacik 		rcu_read_lock();
22429c5085c1SJosef Bacik 		name = rcu_dereference(first_dev->name);
22439c5085c1SJosef Bacik 		seq_escape(m, name->str, " \t\n\\");
22449c5085c1SJosef Bacik 		rcu_read_unlock();
22459c5085c1SJosef Bacik 	} else {
22469c5085c1SJosef Bacik 		WARN_ON(1);
22479c5085c1SJosef Bacik 	}
22489c5085c1SJosef Bacik 	mutex_unlock(&fs_info->fs_devices->device_list_mutex);
22499c5085c1SJosef Bacik 	return 0;
22509c5085c1SJosef Bacik }
22519c5085c1SJosef Bacik 
2252b87221deSAlexey Dobriyan static const struct super_operations btrfs_super_ops = {
225376dda93cSYan, Zheng 	.drop_inode	= btrfs_drop_inode,
2254bd555975SAl Viro 	.evict_inode	= btrfs_evict_inode,
2255e20d96d6SChris Mason 	.put_super	= btrfs_put_super,
2256d5719762SChris Mason 	.sync_fs	= btrfs_sync_fs,
2257a9572a15SEric Paris 	.show_options	= btrfs_show_options,
22589c5085c1SJosef Bacik 	.show_devname	= btrfs_show_devname,
22594730a4bcSChris Mason 	.write_inode	= btrfs_write_inode,
22602c90e5d6SChris Mason 	.alloc_inode	= btrfs_alloc_inode,
22612c90e5d6SChris Mason 	.destroy_inode	= btrfs_destroy_inode,
22628fd17795SChris Mason 	.statfs		= btrfs_statfs,
2263c146afadSYan Zheng 	.remount_fs	= btrfs_remount,
22640176260fSLinus Torvalds 	.freeze_fs	= btrfs_freeze,
2265e20d96d6SChris Mason };
2266a9218f6bSChris Mason 
2267a9218f6bSChris Mason static const struct file_operations btrfs_ctl_fops = {
2268d8620958STom Van Braeckel 	.open = btrfs_control_open,
2269a9218f6bSChris Mason 	.unlocked_ioctl	 = btrfs_control_ioctl,
2270a9218f6bSChris Mason 	.compat_ioctl = btrfs_control_ioctl,
2271a9218f6bSChris Mason 	.owner	 = THIS_MODULE,
22726038f373SArnd Bergmann 	.llseek = noop_llseek,
2273a9218f6bSChris Mason };
2274a9218f6bSChris Mason 
2275a9218f6bSChris Mason static struct miscdevice btrfs_misc = {
2276578454ffSKay Sievers 	.minor		= BTRFS_MINOR,
2277a9218f6bSChris Mason 	.name		= "btrfs-control",
2278a9218f6bSChris Mason 	.fops		= &btrfs_ctl_fops
2279a9218f6bSChris Mason };
2280a9218f6bSChris Mason 
2281578454ffSKay Sievers MODULE_ALIAS_MISCDEV(BTRFS_MINOR);
2282578454ffSKay Sievers MODULE_ALIAS("devname:btrfs-control");
2283578454ffSKay Sievers 
2284a9218f6bSChris Mason static int btrfs_interface_init(void)
2285a9218f6bSChris Mason {
2286a9218f6bSChris Mason 	return misc_register(&btrfs_misc);
2287a9218f6bSChris Mason }
2288a9218f6bSChris Mason 
2289b2950863SChristoph Hellwig static void btrfs_interface_exit(void)
2290a9218f6bSChris Mason {
2291f368ed60SGreg Kroah-Hartman 	misc_deregister(&btrfs_misc);
2292a9218f6bSChris Mason }
2293a9218f6bSChris Mason 
22948ae1af3cSAnand Jain static void btrfs_print_mod_info(void)
229585965600SDavid Sterba {
229685965600SDavid Sterba 	printk(KERN_INFO "Btrfs loaded"
229785965600SDavid Sterba #ifdef CONFIG_BTRFS_DEBUG
229885965600SDavid Sterba 			", debug=on"
229985965600SDavid Sterba #endif
230079556c3dSStefan Behrens #ifdef CONFIG_BTRFS_ASSERT
230179556c3dSStefan Behrens 			", assert=on"
230279556c3dSStefan Behrens #endif
230385965600SDavid Sterba #ifdef CONFIG_BTRFS_FS_CHECK_INTEGRITY
230485965600SDavid Sterba 			", integrity-checker=on"
230585965600SDavid Sterba #endif
230685965600SDavid Sterba 			"\n");
230785965600SDavid Sterba }
230885965600SDavid Sterba 
2309dc11dd5dSJosef Bacik static int btrfs_run_sanity_tests(void)
2310dc11dd5dSJosef Bacik {
231106ea65a3SJosef Bacik 	int ret;
231206ea65a3SJosef Bacik 
2313294e30feSJosef Bacik 	ret = btrfs_init_test_fs();
231406ea65a3SJosef Bacik 	if (ret)
231506ea65a3SJosef Bacik 		return ret;
2316294e30feSJosef Bacik 
2317294e30feSJosef Bacik 	ret = btrfs_test_free_space_cache();
2318294e30feSJosef Bacik 	if (ret)
2319294e30feSJosef Bacik 		goto out;
2320294e30feSJosef Bacik 	ret = btrfs_test_extent_buffer_operations();
2321294e30feSJosef Bacik 	if (ret)
2322294e30feSJosef Bacik 		goto out;
2323294e30feSJosef Bacik 	ret = btrfs_test_extent_io();
2324aaedb55bSJosef Bacik 	if (ret)
2325aaedb55bSJosef Bacik 		goto out;
2326aaedb55bSJosef Bacik 	ret = btrfs_test_inodes();
2327faa2dbf0SJosef Bacik 	if (ret)
2328faa2dbf0SJosef Bacik 		goto out;
2329faa2dbf0SJosef Bacik 	ret = btrfs_test_qgroups();
23307c55ee0cSOmar Sandoval 	if (ret)
23317c55ee0cSOmar Sandoval 		goto out;
23327c55ee0cSOmar Sandoval 	ret = btrfs_test_free_space_tree();
2333294e30feSJosef Bacik out:
2334294e30feSJosef Bacik 	btrfs_destroy_test_fs();
2335294e30feSJosef Bacik 	return ret;
2336dc11dd5dSJosef Bacik }
2337dc11dd5dSJosef Bacik 
23382e635a27SChris Mason static int __init init_btrfs_fs(void)
23392e635a27SChris Mason {
23402c90e5d6SChris Mason 	int err;
234158176a96SJosef Bacik 
234214a958e6SFilipe David Borba Manana 	err = btrfs_hash_init();
234314a958e6SFilipe David Borba Manana 	if (err)
234414a958e6SFilipe David Borba Manana 		return err;
234514a958e6SFilipe David Borba Manana 
234663541927SFilipe David Borba Manana 	btrfs_props_init();
234763541927SFilipe David Borba Manana 
234858176a96SJosef Bacik 	err = btrfs_init_sysfs();
234958176a96SJosef Bacik 	if (err)
235014a958e6SFilipe David Borba Manana 		goto free_hash;
235158176a96SJosef Bacik 
2352143bede5SJeff Mahoney 	btrfs_init_compress();
2353d1310b2eSChris Mason 
2354261507a0SLi Zefan 	err = btrfs_init_cachep();
2355261507a0SLi Zefan 	if (err)
2356261507a0SLi Zefan 		goto free_compress;
2357261507a0SLi Zefan 
2358d1310b2eSChris Mason 	err = extent_io_init();
23592f4cbe64SWyatt Banks 	if (err)
23602f4cbe64SWyatt Banks 		goto free_cachep;
23612f4cbe64SWyatt Banks 
2362d1310b2eSChris Mason 	err = extent_map_init();
2363d1310b2eSChris Mason 	if (err)
2364d1310b2eSChris Mason 		goto free_extent_io;
2365d1310b2eSChris Mason 
23666352b91dSMiao Xie 	err = ordered_data_init();
23672f4cbe64SWyatt Banks 	if (err)
23682f4cbe64SWyatt Banks 		goto free_extent_map;
2369c8b97818SChris Mason 
23706352b91dSMiao Xie 	err = btrfs_delayed_inode_init();
23716352b91dSMiao Xie 	if (err)
23726352b91dSMiao Xie 		goto free_ordered_data;
23736352b91dSMiao Xie 
23749247f317SMiao Xie 	err = btrfs_auto_defrag_init();
237516cdcec7SMiao Xie 	if (err)
237616cdcec7SMiao Xie 		goto free_delayed_inode;
237716cdcec7SMiao Xie 
237878a6184aSMiao Xie 	err = btrfs_delayed_ref_init();
23799247f317SMiao Xie 	if (err)
23809247f317SMiao Xie 		goto free_auto_defrag;
23819247f317SMiao Xie 
2382b9e9a6cbSWang Shilong 	err = btrfs_prelim_ref_init();
2383b9e9a6cbSWang Shilong 	if (err)
2384af13b492SDavid Sterba 		goto free_delayed_ref;
2385b9e9a6cbSWang Shilong 
238697eb6b69SDavid Sterba 	err = btrfs_end_io_wq_init();
238778a6184aSMiao Xie 	if (err)
2388af13b492SDavid Sterba 		goto free_prelim_ref;
238978a6184aSMiao Xie 
239097eb6b69SDavid Sterba 	err = btrfs_interface_init();
239197eb6b69SDavid Sterba 	if (err)
239297eb6b69SDavid Sterba 		goto free_end_io_wq;
239397eb6b69SDavid Sterba 
2394e565d4b9SJan Schmidt 	btrfs_init_lockdep();
2395e565d4b9SJan Schmidt 
23968ae1af3cSAnand Jain 	btrfs_print_mod_info();
2397dc11dd5dSJosef Bacik 
2398dc11dd5dSJosef Bacik 	err = btrfs_run_sanity_tests();
2399dc11dd5dSJosef Bacik 	if (err)
2400dc11dd5dSJosef Bacik 		goto unregister_ioctl;
2401dc11dd5dSJosef Bacik 
2402dc11dd5dSJosef Bacik 	err = register_filesystem(&btrfs_fs_type);
2403dc11dd5dSJosef Bacik 	if (err)
2404dc11dd5dSJosef Bacik 		goto unregister_ioctl;
240574255aa0SJosef Bacik 
24062f4cbe64SWyatt Banks 	return 0;
24072f4cbe64SWyatt Banks 
2408a9218f6bSChris Mason unregister_ioctl:
2409a9218f6bSChris Mason 	btrfs_interface_exit();
241097eb6b69SDavid Sterba free_end_io_wq:
241197eb6b69SDavid Sterba 	btrfs_end_io_wq_exit();
2412b9e9a6cbSWang Shilong free_prelim_ref:
2413b9e9a6cbSWang Shilong 	btrfs_prelim_ref_exit();
241478a6184aSMiao Xie free_delayed_ref:
241578a6184aSMiao Xie 	btrfs_delayed_ref_exit();
24169247f317SMiao Xie free_auto_defrag:
24179247f317SMiao Xie 	btrfs_auto_defrag_exit();
241816cdcec7SMiao Xie free_delayed_inode:
241916cdcec7SMiao Xie 	btrfs_delayed_inode_exit();
24206352b91dSMiao Xie free_ordered_data:
24216352b91dSMiao Xie 	ordered_data_exit();
24222f4cbe64SWyatt Banks free_extent_map:
24232f4cbe64SWyatt Banks 	extent_map_exit();
2424d1310b2eSChris Mason free_extent_io:
2425d1310b2eSChris Mason 	extent_io_exit();
24262f4cbe64SWyatt Banks free_cachep:
24272f4cbe64SWyatt Banks 	btrfs_destroy_cachep();
2428261507a0SLi Zefan free_compress:
2429261507a0SLi Zefan 	btrfs_exit_compress();
24302f4cbe64SWyatt Banks 	btrfs_exit_sysfs();
243114a958e6SFilipe David Borba Manana free_hash:
243214a958e6SFilipe David Borba Manana 	btrfs_hash_exit();
24332c90e5d6SChris Mason 	return err;
24342e635a27SChris Mason }
24352e635a27SChris Mason 
24362e635a27SChris Mason static void __exit exit_btrfs_fs(void)
24372e635a27SChris Mason {
243839279cc3SChris Mason 	btrfs_destroy_cachep();
243978a6184aSMiao Xie 	btrfs_delayed_ref_exit();
24409247f317SMiao Xie 	btrfs_auto_defrag_exit();
244116cdcec7SMiao Xie 	btrfs_delayed_inode_exit();
2442b9e9a6cbSWang Shilong 	btrfs_prelim_ref_exit();
24436352b91dSMiao Xie 	ordered_data_exit();
2444a52d9a80SChris Mason 	extent_map_exit();
2445d1310b2eSChris Mason 	extent_io_exit();
2446a9218f6bSChris Mason 	btrfs_interface_exit();
24475ed5f588SJosef Bacik 	btrfs_end_io_wq_exit();
24482e635a27SChris Mason 	unregister_filesystem(&btrfs_fs_type);
244958176a96SJosef Bacik 	btrfs_exit_sysfs();
24508a4b83ccSChris Mason 	btrfs_cleanup_fs_uuids();
2451261507a0SLi Zefan 	btrfs_exit_compress();
245214a958e6SFilipe David Borba Manana 	btrfs_hash_exit();
24532e635a27SChris Mason }
24542e635a27SChris Mason 
245560efa5ebSFilipe David Borba Manana late_initcall(init_btrfs_fs);
24562e635a27SChris Mason module_exit(exit_btrfs_fs)
24572e635a27SChris Mason 
24582e635a27SChris Mason MODULE_LICENSE("GPL");
2459