1f5166768STheodore Ts'o // SPDX-License-Identifier: GPL-2.0
2ac27a0ecSDave Kleikamp /*
3617ba13bSMingming Cao * linux/fs/ext4/super.c
4ac27a0ecSDave Kleikamp *
5ac27a0ecSDave Kleikamp * Copyright (C) 1992, 1993, 1994, 1995
6ac27a0ecSDave Kleikamp * Remy Card (card@masi.ibp.fr)
7ac27a0ecSDave Kleikamp * Laboratoire MASI - Institut Blaise Pascal
8ac27a0ecSDave Kleikamp * Universite Pierre et Marie Curie (Paris VI)
9ac27a0ecSDave Kleikamp *
10ac27a0ecSDave Kleikamp * from
11ac27a0ecSDave Kleikamp *
12ac27a0ecSDave Kleikamp * linux/fs/minix/inode.c
13ac27a0ecSDave Kleikamp *
14ac27a0ecSDave Kleikamp * Copyright (C) 1991, 1992 Linus Torvalds
15ac27a0ecSDave Kleikamp *
16ac27a0ecSDave Kleikamp * Big-endian to little-endian byte-swapping/bitmaps by
17ac27a0ecSDave Kleikamp * David S. Miller (davem@caip.rutgers.edu), 1995
18ac27a0ecSDave Kleikamp */
19ac27a0ecSDave Kleikamp
20ac27a0ecSDave Kleikamp #include <linux/module.h>
21ac27a0ecSDave Kleikamp #include <linux/string.h>
22ac27a0ecSDave Kleikamp #include <linux/fs.h>
23ac27a0ecSDave Kleikamp #include <linux/time.h>
24c5ca7c76STheodore Ts'o #include <linux/vmalloc.h>
25ac27a0ecSDave Kleikamp #include <linux/slab.h>
26ac27a0ecSDave Kleikamp #include <linux/init.h>
27ac27a0ecSDave Kleikamp #include <linux/blkdev.h>
2866114cadSTejun Heo #include <linux/backing-dev.h>
29ac27a0ecSDave Kleikamp #include <linux/parser.h>
30ac27a0ecSDave Kleikamp #include <linux/buffer_head.h>
31a5694255SChristoph Hellwig #include <linux/exportfs.h>
32ac27a0ecSDave Kleikamp #include <linux/vfs.h>
33ac27a0ecSDave Kleikamp #include <linux/random.h>
34ac27a0ecSDave Kleikamp #include <linux/mount.h>
35ac27a0ecSDave Kleikamp #include <linux/namei.h>
36ac27a0ecSDave Kleikamp #include <linux/quotaops.h>
37ac27a0ecSDave Kleikamp #include <linux/seq_file.h>
383197ebdbSTheodore Ts'o #include <linux/ctype.h>
391330593eSVignesh Babu #include <linux/log2.h>
40717d50e4SAndreas Dilger #include <linux/crc16.h>
41ef510424SDan Williams #include <linux/dax.h>
427c0f6ba6SLinus Torvalds #include <linux/uaccess.h>
43ee73f9a5SJeff Layton #include <linux/iversion.h>
44c83ad55eSGabriel Krisman Bertazi #include <linux/unicode.h>
45c6a564ffSChristoph Hellwig #include <linux/part_stat.h>
46bfff6873SLukas Czerner #include <linux/kthread.h>
47bfff6873SLukas Czerner #include <linux/freezer.h>
489a089b21SGabriel Krisman Bertazi #include <linux/fsnotify.h>
49e5a185c2SLukas Czerner #include <linux/fs_context.h>
50e5a185c2SLukas Czerner #include <linux/fs_parser.h>
51bfff6873SLukas Czerner
523dcf5451SChristoph Hellwig #include "ext4.h"
534a092d73STheodore Ts'o #include "ext4_extents.h" /* Needed for trace points definition */
543dcf5451SChristoph Hellwig #include "ext4_jbd2.h"
55ac27a0ecSDave Kleikamp #include "xattr.h"
56ac27a0ecSDave Kleikamp #include "acl.h"
573661d286STheodore Ts'o #include "mballoc.h"
580c9ec4beSDarrick J. Wong #include "fsmap.h"
59ac27a0ecSDave Kleikamp
609bffad1eSTheodore Ts'o #define CREATE_TRACE_POINTS
619bffad1eSTheodore Ts'o #include <trace/events/ext4.h>
629bffad1eSTheodore Ts'o
630b75a840SLukas Czerner static struct ext4_lazy_init *ext4_li_info;
6459ebc7fdSZheng Yongjun static DEFINE_MUTEX(ext4_li_mtx);
65e294a537STheodore Ts'o static struct ratelimit_state ext4_mount_msg_ratelimit;
669f6200bbSTheodore Ts'o
67617ba13bSMingming Cao static int ext4_load_journal(struct super_block *, struct ext4_super_block *,
68ac27a0ecSDave Kleikamp unsigned long journal_devnum);
692adf6da8STheodore Ts'o static int ext4_show_options(struct seq_file *seq, struct dentry *root);
702d01ddc8SJan Kara static void ext4_update_super(struct super_block *sb);
714392fbc4SJan Kara static int ext4_commit_super(struct super_block *sb);
7211215630SJan Kara static int ext4_mark_recovery_complete(struct super_block *sb,
73617ba13bSMingming Cao struct ext4_super_block *es);
7411215630SJan Kara static int ext4_clear_journal_err(struct super_block *sb,
75617ba13bSMingming Cao struct ext4_super_block *es);
76617ba13bSMingming Cao static int ext4_sync_fs(struct super_block *sb, int wait);
77617ba13bSMingming Cao static int ext4_statfs(struct dentry *dentry, struct kstatfs *buf);
78c4be0c1dSTakashi Sato static int ext4_unfreeze(struct super_block *sb);
79c4be0c1dSTakashi Sato static int ext4_freeze(struct super_block *sb);
802035e776STheodore Ts'o static inline int ext2_feature_set_ok(struct super_block *sb);
812035e776STheodore Ts'o static inline int ext3_feature_set_ok(struct super_block *sb);
82bfff6873SLukas Czerner static void ext4_destroy_lazyinit_thread(void);
83bfff6873SLukas Czerner static void ext4_unregister_li_request(struct super_block *sb);
848f1f7453SEric Sandeen static void ext4_clear_request_list(void);
85c6cb7e77SEric Whitney static struct inode *ext4_get_journal_inode(struct super_block *sb,
86c6cb7e77SEric Whitney unsigned int journal_inum);
87da812f61SLukas Czerner static int ext4_validate_options(struct fs_context *fc);
88b6bd2435SLukas Czerner static int ext4_check_opt_consistency(struct fs_context *fc,
89e6e268cbSLukas Czerner struct super_block *sb);
9085456054SEric Biggers static void ext4_apply_options(struct fs_context *fc, struct super_block *sb);
9102f960f8SLukas Czerner static int ext4_parse_param(struct fs_context *fc, struct fs_parameter *param);
92cebe85d5SLukas Czerner static int ext4_get_tree(struct fs_context *fc);
93cebe85d5SLukas Czerner static int ext4_reconfigure(struct fs_context *fc);
94cebe85d5SLukas Czerner static void ext4_fc_free(struct fs_context *fc);
95cebe85d5SLukas Czerner static int ext4_init_fs_context(struct fs_context *fc);
961489dffdSChristoph Hellwig static void ext4_kill_sb(struct super_block *sb);
97cebe85d5SLukas Czerner static const struct fs_parameter_spec ext4_param_specs[];
98ac27a0ecSDave Kleikamp
/*
 * Lock ordering
 *
 * page fault path:
 * mmap_lock -> sb_start_pagefault -> invalidate_lock (r) -> transaction start
 *   -> page lock -> i_data_sem (rw)
 *
 * buffered write path:
 * sb_start_write -> i_mutex -> mmap_lock
 * sb_start_write -> i_mutex -> transaction start -> page lock ->
 *   i_data_sem (rw)
 *
 * truncate:
 * sb_start_write -> i_mutex -> invalidate_lock (w) -> i_mmap_rwsem (w) ->
 *   page lock
 * sb_start_write -> i_mutex -> invalidate_lock (w) -> transaction start ->
 *   i_data_sem (rw)
 *
 * direct IO:
 * sb_start_write -> i_mutex -> mmap_lock
 * sb_start_write -> i_mutex -> transaction start -> i_data_sem (rw)
 *
 * writepages:
 * transaction start -> page lock(s) -> i_data_sem (rw)
 */
124e74031fdSJan Kara
12502f960f8SLukas Czerner static const struct fs_context_operations ext4_context_ops = {
12602f960f8SLukas Czerner .parse_param = ext4_parse_param,
127cebe85d5SLukas Czerner .get_tree = ext4_get_tree,
128cebe85d5SLukas Czerner .reconfigure = ext4_reconfigure,
129cebe85d5SLukas Czerner .free = ext4_fc_free,
13002f960f8SLukas Czerner };
13102f960f8SLukas Czerner
13202f960f8SLukas Czerner
/*
 * An "ext2" file system type is only provided by this file when no native
 * ext2 driver is configured (built-in or module) and
 * CONFIG_EXT4_USE_FOR_EXT2 is set.  Otherwise IS_EXT2_SB() is constant 0.
 */
#if !defined(CONFIG_EXT2_FS) && !defined(CONFIG_EXT2_FS_MODULE) && defined(CONFIG_EXT4_USE_FOR_EXT2)
static struct file_system_type ext2_fs_type = {
	.name			= "ext2",
	.owner			= THIS_MODULE,
	.fs_flags		= FS_REQUIRES_DEV,
	.init_fs_context	= ext4_init_fs_context,
	.parameters		= ext4_param_specs,
	.kill_sb		= ext4_kill_sb,
};
MODULE_ALIAS_FS("ext2");
MODULE_ALIAS("ext2");
/* True when @sb was mounted through the "ext2" file system type above. */
#define IS_EXT2_SB(sb) ((sb)->s_type == &ext2_fs_type)
#else
#define IS_EXT2_SB(sb) (0)
#endif
1482035e776STheodore Ts'o
1492035e776STheodore Ts'o
150ba69f9abSJan Kara static struct file_system_type ext3_fs_type = {
151ba69f9abSJan Kara .owner = THIS_MODULE,
152ba69f9abSJan Kara .name = "ext3",
153cebe85d5SLukas Czerner .init_fs_context = ext4_init_fs_context,
154cebe85d5SLukas Czerner .parameters = ext4_param_specs,
1551489dffdSChristoph Hellwig .kill_sb = ext4_kill_sb,
156ba69f9abSJan Kara .fs_flags = FS_REQUIRES_DEV,
157ba69f9abSJan Kara };
1587f78e035SEric W. Biederman MODULE_ALIAS_FS("ext3");
159fa7614ddSEric W. Biederman MODULE_ALIAS("ext3");
1604b41828bSChristoph Hellwig #define IS_EXT3_SB(sb) ((sb)->s_type == &ext3_fs_type)
161bd81d8eeSLaurent Vivier
162fa491b14Szhangyi (F)
/*
 * Submit a read for @bh, or fake a failed one.
 *
 * @bh:        buffer to read
 * @op_flags:  extra request flags OR-ed into REQ_OP_READ
 * @end_io:    completion handler; end_buffer_read_sync is used when NULL
 * @simu_fail: when true no I/O is issued: the buffer is marked not uptodate
 *             and unlocked, as if the read had failed
 */
static inline void __ext4_read_bh(struct buffer_head *bh, blk_opf_t op_flags,
				  bh_end_io_t *end_io, bool simu_fail)
{
	bh_end_io_t *handler = end_io;

	if (simu_fail) {
		clear_buffer_uptodate(bh);
		unlock_buffer(bh);
		return;
	}

	/*
	 * The buffer is about to be re-read from disk (e.g. after a write-out
	 * error), so an earlier "verified" mark no longer applies.  Drop it so
	 * the contents get checked again.
	 */
	clear_buffer_verified(bh);

	if (!handler)
		handler = end_buffer_read_sync;
	bh->b_end_io = handler;

	/* Take an extra reference before handing the buffer to the block layer. */
	get_bh(bh);
	submit_bh(op_flags | REQ_OP_READ, bh);
}
183fa491b14Szhangyi (F)
/*
 * Start a read of @bh without waiting for it to complete.
 *
 * @bh must be locked on entry (enforced with BUG_ON).  If the buffer is
 * already uptodate it is simply unlocked; otherwise the read is handed to
 * __ext4_read_bh() with the given @op_flags, @end_io and @simu_fail.
 */
void ext4_read_bh_nowait(struct buffer_head *bh, blk_opf_t op_flags,
			 bh_end_io_t *end_io, bool simu_fail)
{
	BUG_ON(!buffer_locked(bh));

	if (!ext4_buffer_uptodate(bh)) {
		__ext4_read_bh(bh, op_flags, end_io, simu_fail);
		return;
	}

	unlock_buffer(bh);
}
195fa491b14Szhangyi (F)
/*
 * Read @bh and wait for the result.
 *
 * @bh must be locked on entry (enforced with BUG_ON).  An already uptodate
 * buffer is unlocked and reported as success without any I/O.
 *
 * Returns 0 if the buffer is uptodate afterwards, -EIO otherwise.
 */
int ext4_read_bh(struct buffer_head *bh, blk_opf_t op_flags,
		 bh_end_io_t *end_io, bool simu_fail)
{
	BUG_ON(!buffer_locked(bh));

	if (!ext4_buffer_uptodate(bh)) {
		__ext4_read_bh(bh, op_flags, end_io, simu_fail);
		wait_on_buffer(bh);
		return buffer_uptodate(bh) ? 0 : -EIO;
	}

	unlock_buffer(bh);
	return 0;
}
213fa491b14Szhangyi (F)
/*
 * Lock @bh and read it.
 *
 * With @wait set, the result of ext4_read_bh() is returned.  Without it the
 * read is only started through ext4_read_bh_nowait() and 0 is returned
 * unconditionally.
 */
int ext4_read_bh_lock(struct buffer_head *bh, blk_opf_t op_flags, bool wait)
{
	lock_buffer(bh);

	if (wait)
		return ext4_read_bh(bh, op_flags, NULL, false);

	ext4_read_bh_nowait(bh, op_flags, NULL, false);
	return 0;
}
223fa491b14Szhangyi (F)
224fb265c9cSTheodore Ts'o /*
2258394a6abSzhangyi (F) * This works like __bread_gfp() except it uses ERR_PTR for error
226fb265c9cSTheodore Ts'o * returns. Currently with sb_bread it's impossible to distinguish
227fb265c9cSTheodore Ts'o * between ENOMEM and EIO situations (since both result in a NULL
228fb265c9cSTheodore Ts'o * return.
229fb265c9cSTheodore Ts'o */
__ext4_sb_bread_gfp(struct super_block * sb,sector_t block,blk_opf_t op_flags,gfp_t gfp)2308394a6abSzhangyi (F) static struct buffer_head *__ext4_sb_bread_gfp(struct super_block *sb,
23167c0f556SBart Van Assche sector_t block,
23267c0f556SBart Van Assche blk_opf_t op_flags, gfp_t gfp)
233fb265c9cSTheodore Ts'o {
2342d069c08Szhangyi (F) struct buffer_head *bh;
2352d069c08Szhangyi (F) int ret;
236fb265c9cSTheodore Ts'o
2378394a6abSzhangyi (F) bh = sb_getblk_gfp(sb, block, gfp);
238fb265c9cSTheodore Ts'o if (bh == NULL)
239fb265c9cSTheodore Ts'o return ERR_PTR(-ENOMEM);
240cf2834a5STheodore Ts'o if (ext4_buffer_uptodate(bh))
241fb265c9cSTheodore Ts'o return bh;
2422d069c08Szhangyi (F)
2432d069c08Szhangyi (F) ret = ext4_read_bh_lock(bh, REQ_META | op_flags, true);
2442d069c08Szhangyi (F) if (ret) {
245fb265c9cSTheodore Ts'o put_bh(bh);
2462d069c08Szhangyi (F) return ERR_PTR(ret);
2472d069c08Szhangyi (F) }
2482d069c08Szhangyi (F) return bh;
249fb265c9cSTheodore Ts'o }
250fb265c9cSTheodore Ts'o
/*
 * Read block @block of @sb, asking for the buffer with __GFP_MOVABLE.
 * Returns a buffer head or an ERR_PTR(); see __ext4_sb_bread_gfp().
 */
struct buffer_head *ext4_sb_bread(struct super_block *sb, sector_t block,
				  blk_opf_t op_flags)
{
	const gfp_t gfp = __GFP_MOVABLE;

	return __ext4_sb_bread_gfp(sb, block, op_flags, gfp);
}
2568394a6abSzhangyi (F)
/*
 * Read block @block of @sb with no extra request flags and no extra gfp
 * flags (in particular without __GFP_MOVABLE).
 * Returns a buffer head or an ERR_PTR(); see __ext4_sb_bread_gfp().
 */
struct buffer_head *ext4_sb_bread_unmovable(struct super_block *sb,
					    sector_t block)
{
	const blk_opf_t no_op_flags = 0;
	const gfp_t no_gfp = 0;

	return __ext4_sb_bread_gfp(sb, block, no_op_flags, no_gfp);
}
2628394a6abSzhangyi (F)
/*
 * Best-effort readahead of block @block of @sb.
 *
 * Nothing is reported to the caller: if no buffer can be obtained, or the
 * buffer lock cannot be taken immediately, the function silently does
 * nothing.  Otherwise a REQ_RAHEAD read is started without waiting for it.
 */
void ext4_sb_breadahead_unmovable(struct super_block *sb, sector_t block)
{
	struct buffer_head *bh;

	bh = sb_getblk_gfp(sb, block, 0);
	if (unlikely(!bh))
		return;

	if (trylock_buffer(bh))
		ext4_read_bh_nowait(bh, REQ_RAHEAD, NULL, false);
	brelse(bh);
}
273a9c47317SDarrick J. Wong
ext4_verify_csum_type(struct super_block * sb,struct ext4_super_block * es)274a9c47317SDarrick J. Wong static int ext4_verify_csum_type(struct super_block *sb,
2759aa5d32bSDmitry Monakhov struct ext4_super_block *es)
276a9c47317SDarrick J. Wong {
277a9c47317SDarrick J. Wong if (!ext4_has_feature_metadata_csum(sb))
278a9c47317SDarrick J. Wong return 1;
279a9c47317SDarrick J. Wong
280a9c47317SDarrick J. Wong return es->s_checksum_type == EXT4_CRC32C_CHKSUM;
28106db49e6STheodore Ts'o }
282a9c47317SDarrick J. Wong
ext4_superblock_csum(struct super_block * sb,struct ext4_super_block * es)283bbc605cdSLukas Czerner __le32 ext4_superblock_csum(struct super_block *sb,
284a9c47317SDarrick J. Wong struct ext4_super_block *es)
285a9c47317SDarrick J. Wong {
286a9c47317SDarrick J. Wong struct ext4_sb_info *sbi = EXT4_SB(sb);
287a9c47317SDarrick J. Wong int offset = offsetof(struct ext4_super_block, s_checksum);
288a9c47317SDarrick J. Wong __u32 csum;
289a9c47317SDarrick J. Wong
290a9c47317SDarrick J. Wong csum = ext4_chksum(sbi, ~0, (char *)es, offset);
291a9c47317SDarrick J. Wong
292a9c47317SDarrick J. Wong return cpu_to_le32(csum);
293a9c47317SDarrick J. Wong }
294a9c47317SDarrick J. Wong
ext4_superblock_csum_verify(struct super_block * sb,struct ext4_super_block * es)295a9c47317SDarrick J. Wong static int ext4_superblock_csum_verify(struct super_block *sb,
296a9c47317SDarrick J. Wong struct ext4_super_block *es)
297a9c47317SDarrick J. Wong {
298a9c47317SDarrick J. Wong if (!ext4_has_metadata_csum(sb))
299a9c47317SDarrick J. Wong return 1;
300a9c47317SDarrick J. Wong
301a9c47317SDarrick J. Wong return es->s_checksum == ext4_superblock_csum(sb, es);
302a9c47317SDarrick J. Wong }
303a9c47317SDarrick J. Wong
ext4_superblock_csum_set(struct super_block * sb)304a9c47317SDarrick J. Wong void ext4_superblock_csum_set(struct super_block *sb)
305a9c47317SDarrick J. Wong {
30606db49e6STheodore Ts'o struct ext4_super_block *es = EXT4_SB(sb)->s_es;
30706db49e6STheodore Ts'o
3089aa5d32bSDmitry Monakhov if (!ext4_has_metadata_csum(sb))
309a9c47317SDarrick J. Wong return;
310a9c47317SDarrick J. Wong
311a9c47317SDarrick J. Wong es->s_checksum = ext4_superblock_csum(sb, es);
312a9c47317SDarrick J. Wong }
313a9c47317SDarrick J. Wong
ext4_block_bitmap(struct super_block * sb,struct ext4_group_desc * bg)3148fadc143SAlexandre Ratchov ext4_fsblk_t ext4_block_bitmap(struct super_block *sb,
3158fadc143SAlexandre Ratchov struct ext4_group_desc *bg)
316bd81d8eeSLaurent Vivier {
3173a14589cSAneesh Kumar K.V return le32_to_cpu(bg->bg_block_bitmap_lo) |
3188fadc143SAlexandre Ratchov (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
3198fadc143SAlexandre Ratchov (ext4_fsblk_t)le32_to_cpu(bg->bg_block_bitmap_hi) << 32 : 0);
320bd81d8eeSLaurent Vivier }
321bd81d8eeSLaurent Vivier
ext4_inode_bitmap(struct super_block * sb,struct ext4_group_desc * bg)3228fadc143SAlexandre Ratchov ext4_fsblk_t ext4_inode_bitmap(struct super_block *sb,
3238fadc143SAlexandre Ratchov struct ext4_group_desc *bg)
324bd81d8eeSLaurent Vivier {
3255272f837SAneesh Kumar K.V return le32_to_cpu(bg->bg_inode_bitmap_lo) |
3268fadc143SAlexandre Ratchov (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
3278fadc143SAlexandre Ratchov (ext4_fsblk_t)le32_to_cpu(bg->bg_inode_bitmap_hi) << 32 : 0);
328bd81d8eeSLaurent Vivier }
329bd81d8eeSLaurent Vivier
ext4_inode_table(struct super_block * sb,struct ext4_group_desc * bg)3308fadc143SAlexandre Ratchov ext4_fsblk_t ext4_inode_table(struct super_block *sb,
3318fadc143SAlexandre Ratchov struct ext4_group_desc *bg)
332bd81d8eeSLaurent Vivier {
3335272f837SAneesh Kumar K.V return le32_to_cpu(bg->bg_inode_table_lo) |
3348fadc143SAlexandre Ratchov (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
3358fadc143SAlexandre Ratchov (ext4_fsblk_t)le32_to_cpu(bg->bg_inode_table_hi) << 32 : 0);
336bd81d8eeSLaurent Vivier }
337bd81d8eeSLaurent Vivier
ext4_free_group_clusters(struct super_block * sb,struct ext4_group_desc * bg)338021b65bbSTheodore Ts'o __u32 ext4_free_group_clusters(struct super_block *sb,
339560671a0SAneesh Kumar K.V struct ext4_group_desc *bg)
340560671a0SAneesh Kumar K.V {
341560671a0SAneesh Kumar K.V return le16_to_cpu(bg->bg_free_blocks_count_lo) |
342560671a0SAneesh Kumar K.V (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
343560671a0SAneesh Kumar K.V (__u32)le16_to_cpu(bg->bg_free_blocks_count_hi) << 16 : 0);
344560671a0SAneesh Kumar K.V }
345560671a0SAneesh Kumar K.V
ext4_free_inodes_count(struct super_block * sb,struct ext4_group_desc * bg)346560671a0SAneesh Kumar K.V __u32 ext4_free_inodes_count(struct super_block *sb,
347560671a0SAneesh Kumar K.V struct ext4_group_desc *bg)
348560671a0SAneesh Kumar K.V {
349786a5527SJeongjun Park return le16_to_cpu(READ_ONCE(bg->bg_free_inodes_count_lo)) |
350560671a0SAneesh Kumar K.V (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
351786a5527SJeongjun Park (__u32)le16_to_cpu(READ_ONCE(bg->bg_free_inodes_count_hi)) << 16 : 0);
352560671a0SAneesh Kumar K.V }
353560671a0SAneesh Kumar K.V
ext4_used_dirs_count(struct super_block * sb,struct ext4_group_desc * bg)354560671a0SAneesh Kumar K.V __u32 ext4_used_dirs_count(struct super_block *sb,
355560671a0SAneesh Kumar K.V struct ext4_group_desc *bg)
356560671a0SAneesh Kumar K.V {
357560671a0SAneesh Kumar K.V return le16_to_cpu(bg->bg_used_dirs_count_lo) |
358560671a0SAneesh Kumar K.V (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
359560671a0SAneesh Kumar K.V (__u32)le16_to_cpu(bg->bg_used_dirs_count_hi) << 16 : 0);
360560671a0SAneesh Kumar K.V }
361560671a0SAneesh Kumar K.V
ext4_itable_unused_count(struct super_block * sb,struct ext4_group_desc * bg)362560671a0SAneesh Kumar K.V __u32 ext4_itable_unused_count(struct super_block *sb,
363560671a0SAneesh Kumar K.V struct ext4_group_desc *bg)
364560671a0SAneesh Kumar K.V {
365560671a0SAneesh Kumar K.V return le16_to_cpu(bg->bg_itable_unused_lo) |
366560671a0SAneesh Kumar K.V (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
367560671a0SAneesh Kumar K.V (__u32)le16_to_cpu(bg->bg_itable_unused_hi) << 16 : 0);
368560671a0SAneesh Kumar K.V }
369560671a0SAneesh Kumar K.V
/*
 * Store @blk as the block bitmap location in group descriptor @bg.
 * The high 32 bits are only written when the descriptor size is at least
 * EXT4_MIN_DESC_SIZE_64BIT.
 */
void ext4_block_bitmap_set(struct super_block *sb,
			   struct ext4_group_desc *bg, ext4_fsblk_t blk)
{
	bg->bg_block_bitmap_lo = cpu_to_le32(lower_32_bits(blk));

	if (EXT4_DESC_SIZE(sb) < EXT4_MIN_DESC_SIZE_64BIT)
		return;

	bg->bg_block_bitmap_hi = cpu_to_le32(upper_32_bits(blk));
}
377bd81d8eeSLaurent Vivier
/*
 * Store @blk as the inode bitmap location in group descriptor @bg.
 * The high 32 bits are only written when the descriptor size is at least
 * EXT4_MIN_DESC_SIZE_64BIT.
 */
void ext4_inode_bitmap_set(struct super_block *sb,
			   struct ext4_group_desc *bg, ext4_fsblk_t blk)
{
	bg->bg_inode_bitmap_lo = cpu_to_le32(lower_32_bits(blk));

	if (EXT4_DESC_SIZE(sb) < EXT4_MIN_DESC_SIZE_64BIT)
		return;

	bg->bg_inode_bitmap_hi = cpu_to_le32(upper_32_bits(blk));
}
385bd81d8eeSLaurent Vivier
/*
 * Store @blk as the inode table location in group descriptor @bg.
 * The high 32 bits are only written when the descriptor size is at least
 * EXT4_MIN_DESC_SIZE_64BIT.
 */
void ext4_inode_table_set(struct super_block *sb,
			  struct ext4_group_desc *bg, ext4_fsblk_t blk)
{
	bg->bg_inode_table_lo = cpu_to_le32(lower_32_bits(blk));

	if (EXT4_DESC_SIZE(sb) < EXT4_MIN_DESC_SIZE_64BIT)
		return;

	bg->bg_inode_table_hi = cpu_to_le32(upper_32_bits(blk));
}
393bd81d8eeSLaurent Vivier
/*
 * Store @count in @bg's bg_free_blocks_count_{lo,hi}.
 * The high 16 bits are only written when the descriptor size is at least
 * EXT4_MIN_DESC_SIZE_64BIT.
 */
void ext4_free_group_clusters_set(struct super_block *sb,
				  struct ext4_group_desc *bg, __u32 count)
{
	bg->bg_free_blocks_count_lo = cpu_to_le16(count & 0xffff);

	if (EXT4_DESC_SIZE(sb) < EXT4_MIN_DESC_SIZE_64BIT)
		return;

	bg->bg_free_blocks_count_hi = cpu_to_le16(count >> 16);
}
401560671a0SAneesh Kumar K.V
/*
 * Store @count as the free inode count in group descriptor @bg.
 * Both halves are stored with WRITE_ONCE(); the high 16 bits are only
 * written when the descriptor size is at least EXT4_MIN_DESC_SIZE_64BIT.
 */
void ext4_free_inodes_set(struct super_block *sb,
			  struct ext4_group_desc *bg, __u32 count)
{
	WRITE_ONCE(bg->bg_free_inodes_count_lo, cpu_to_le16(count & 0xffff));

	if (EXT4_DESC_SIZE(sb) < EXT4_MIN_DESC_SIZE_64BIT)
		return;

	WRITE_ONCE(bg->bg_free_inodes_count_hi, cpu_to_le16(count >> 16));
}
409560671a0SAneesh Kumar K.V
/*
 * Store @count as the used directories count in group descriptor @bg.
 * The high 16 bits are only written when the descriptor size is at least
 * EXT4_MIN_DESC_SIZE_64BIT.
 */
void ext4_used_dirs_set(struct super_block *sb,
			struct ext4_group_desc *bg, __u32 count)
{
	bg->bg_used_dirs_count_lo = cpu_to_le16(count & 0xffff);

	if (EXT4_DESC_SIZE(sb) < EXT4_MIN_DESC_SIZE_64BIT)
		return;

	bg->bg_used_dirs_count_hi = cpu_to_le16(count >> 16);
}
417560671a0SAneesh Kumar K.V
/*
 * Store @count in @bg's bg_itable_unused_{lo,hi}.
 * The high 16 bits are only written when the descriptor size is at least
 * EXT4_MIN_DESC_SIZE_64BIT.
 */
void ext4_itable_unused_set(struct super_block *sb,
			    struct ext4_group_desc *bg, __u32 count)
{
	bg->bg_itable_unused_lo = cpu_to_le16(count & 0xffff);

	if (EXT4_DESC_SIZE(sb) < EXT4_MIN_DESC_SIZE_64BIT)
		return;

	bg->bg_itable_unused_hi = cpu_to_le16(count >> 16);
}
425560671a0SAneesh Kumar K.V
/*
 * Store timestamp @now as a 32-bit little-endian low part (*@lo) plus an
 * 8-bit high part (*@hi).  @now is first clamped to [0, 2^40 - 1], the
 * range those 40 bits can hold.
 */
static void __ext4_update_tstamp(__le32 *lo, __u8 *hi, time64_t now)
{
	const time64_t max_secs = (1ull << 40) - 1;

	now = clamp_val(now, 0, max_secs);

	*lo = cpu_to_le32(lower_32_bits(now));
	*hi = upper_32_bits(now);
}
4336a0678a7SArnd Bergmann
__ext4_get_tstamp(__le32 * lo,__u8 * hi)4346a0678a7SArnd Bergmann static time64_t __ext4_get_tstamp(__le32 *lo, __u8 *hi)
4356a0678a7SArnd Bergmann {
4366a0678a7SArnd Bergmann return ((time64_t)(*hi) << 32) + le32_to_cpu(*lo);
4376a0678a7SArnd Bergmann }
/*
 * ext4_update_tstamp(es, field): stamp the current wall-clock time
 * (ktime_get_real_seconds()) into es->field and es->field_hi.
 */
#define ext4_update_tstamp(es, tstamp)					\
	__ext4_update_tstamp(&(es)->tstamp, &(es)->tstamp ## _hi,	\
			     ktime_get_real_seconds())

/*
 * ext4_get_tstamp(es, field): read back the timestamp held in es->field
 * and es->field_hi.
 */
#define ext4_get_tstamp(es, tstamp)					\
	__ext4_get_tstamp(&(es)->tstamp, &(es)->tstamp ## _hi)
443d3d1faf6SCurt Wohlgemuth
444ff0722deSVitaliy Kuznetsov #define EXT4_SB_REFRESH_INTERVAL_SEC (3600) /* seconds (1 hour) */
445ff0722deSVitaliy Kuznetsov #define EXT4_SB_REFRESH_INTERVAL_KB (16384) /* kilobytes (16MB) */
446ff0722deSVitaliy Kuznetsov
447ff0722deSVitaliy Kuznetsov /*
448ff0722deSVitaliy Kuznetsov * The ext4_maybe_update_superblock() function checks and updates the
449ff0722deSVitaliy Kuznetsov * superblock if needed.
450ff0722deSVitaliy Kuznetsov *
451ff0722deSVitaliy Kuznetsov * This function is designed to update the on-disk superblock only under
452ff0722deSVitaliy Kuznetsov * certain conditions to prevent excessive disk writes and unnecessary
453ff0722deSVitaliy Kuznetsov * waking of the disk from sleep. The superblock will be updated if:
454ff0722deSVitaliy Kuznetsov * 1. More than an hour has passed since the last superblock update, and
455ff0722deSVitaliy Kuznetsov * 2. More than 16MB have been written since the last superblock update.
456ff0722deSVitaliy Kuznetsov *
457ff0722deSVitaliy Kuznetsov * @sb: The superblock
458ff0722deSVitaliy Kuznetsov */
ext4_maybe_update_superblock(struct super_block * sb)459ff0722deSVitaliy Kuznetsov static void ext4_maybe_update_superblock(struct super_block *sb)
460ff0722deSVitaliy Kuznetsov {
461ff0722deSVitaliy Kuznetsov struct ext4_sb_info *sbi = EXT4_SB(sb);
462ff0722deSVitaliy Kuznetsov struct ext4_super_block *es = sbi->s_es;
463ff0722deSVitaliy Kuznetsov journal_t *journal = sbi->s_journal;
464ff0722deSVitaliy Kuznetsov time64_t now;
465ff0722deSVitaliy Kuznetsov __u64 last_update;
466ff0722deSVitaliy Kuznetsov __u64 lifetime_write_kbytes;
467ff0722deSVitaliy Kuznetsov __u64 diff_size;
468ff0722deSVitaliy Kuznetsov
469ff0722deSVitaliy Kuznetsov if (sb_rdonly(sb) || !(sb->s_flags & SB_ACTIVE) ||
470ff0722deSVitaliy Kuznetsov !journal || (journal->j_flags & JBD2_UNMOUNT))
471ff0722deSVitaliy Kuznetsov return;
472ff0722deSVitaliy Kuznetsov
473ff0722deSVitaliy Kuznetsov now = ktime_get_real_seconds();
474ff0722deSVitaliy Kuznetsov last_update = ext4_get_tstamp(es, s_wtime);
475ff0722deSVitaliy Kuznetsov
476ff0722deSVitaliy Kuznetsov if (likely(now - last_update < EXT4_SB_REFRESH_INTERVAL_SEC))
477ff0722deSVitaliy Kuznetsov return;
478ff0722deSVitaliy Kuznetsov
479ff0722deSVitaliy Kuznetsov lifetime_write_kbytes = sbi->s_kbytes_written +
480ff0722deSVitaliy Kuznetsov ((part_stat_read(sb->s_bdev, sectors[STAT_WRITE]) -
481ff0722deSVitaliy Kuznetsov sbi->s_sectors_written_start) >> 1);
482ff0722deSVitaliy Kuznetsov
483ff0722deSVitaliy Kuznetsov /* Get the number of kilobytes not written to disk to account
484ff0722deSVitaliy Kuznetsov * for statistics and compare with a multiple of 16 MB. This
485ff0722deSVitaliy Kuznetsov * is used to determine when the next superblock commit should
486ff0722deSVitaliy Kuznetsov * occur (i.e. not more often than once per 16MB if there was
487ff0722deSVitaliy Kuznetsov * less written in an hour).
488ff0722deSVitaliy Kuznetsov */
489ff0722deSVitaliy Kuznetsov diff_size = lifetime_write_kbytes - le64_to_cpu(es->s_kbytes_written);
490ff0722deSVitaliy Kuznetsov
491ff0722deSVitaliy Kuznetsov if (diff_size > EXT4_SB_REFRESH_INTERVAL_KB)
492bb15cea2STheodore Ts'o schedule_work(&EXT4_SB(sb)->s_sb_upd_work);
493ff0722deSVitaliy Kuznetsov }
494ff0722deSVitaliy Kuznetsov
495bdfe0cbdSTheodore Ts'o /*
496bdfe0cbdSTheodore Ts'o * The del_gendisk() function uninitializes the disk-specific data
497bdfe0cbdSTheodore Ts'o * structures, including the bdi structure, without telling anyone
498bdfe0cbdSTheodore Ts'o * else. Once this happens, any attempt to call mark_buffer_dirty()
499bdfe0cbdSTheodore Ts'o * (for example, by ext4_commit_super), will cause a kernel OOPS.
500bdfe0cbdSTheodore Ts'o * This is a kludge to prevent these oops until we can put in a proper
501bdfe0cbdSTheodore Ts'o * hook in del_gendisk() to inform the VFS and file system layers.
502bdfe0cbdSTheodore Ts'o */
block_device_ejected(struct super_block * sb)503bdfe0cbdSTheodore Ts'o static int block_device_ejected(struct super_block *sb)
504bdfe0cbdSTheodore Ts'o {
505bdfe0cbdSTheodore Ts'o struct inode *bd_inode = sb->s_bdev->bd_inode;
506bdfe0cbdSTheodore Ts'o struct backing_dev_info *bdi = inode_to_bdi(bd_inode);
507bdfe0cbdSTheodore Ts'o
508bdfe0cbdSTheodore Ts'o return bdi->dev == NULL;
509bdfe0cbdSTheodore Ts'o }
510bdfe0cbdSTheodore Ts'o
/*
 * Journal commit callback for transaction @txn of @journal.
 *
 * Processes the data freed by the transaction, gives the superblock a
 * chance to be refreshed, and then runs every callback queued on the
 * transaction's private list.  Each callback receives the journal's
 * aborted state, sampled once on entry, as its error argument.
 */
static void ext4_journal_commit_callback(journal_t *journal, transaction_t *txn)
{
	struct super_block *sb = journal->j_private;
	struct ext4_sb_info *sbi = EXT4_SB(sb);
	int error = is_journal_aborted(journal);
	struct list_head *pending = &txn->t_private_list;
	struct ext4_journal_cb_entry *entry;

	BUG_ON(txn->t_state == T_FINISHED);

	ext4_process_freed_data(sb, txn->t_tid);
	ext4_maybe_update_superblock(sb);

	/*
	 * s_md_lock protects the list itself; it is dropped around each
	 * callback invocation and re-taken before the list is looked at again.
	 */
	spin_lock(&sbi->s_md_lock);
	while (!list_empty(pending)) {
		entry = list_first_entry(pending, struct ext4_journal_cb_entry,
					 jce_list);
		list_del_init(&entry->jce_list);
		spin_unlock(&sbi->s_md_lock);

		entry->jce_func(sb, entry, error);

		spin_lock(&sbi->s_md_lock);
	}
	spin_unlock(&sbi->s_md_lock);
}
5341c13d5c0STheodore Ts'o
535afb585a9SMauricio Faria de Oliveira /*
536afb585a9SMauricio Faria de Oliveira * This writepage callback for write_cache_pages()
537afb585a9SMauricio Faria de Oliveira * takes care of a few cases after page cleaning.
538afb585a9SMauricio Faria de Oliveira *
539afb585a9SMauricio Faria de Oliveira * write_cache_pages() already checks for dirty pages
540afb585a9SMauricio Faria de Oliveira * and calls clear_page_dirty_for_io(), which we want,
541afb585a9SMauricio Faria de Oliveira * to write protect the pages.
542afb585a9SMauricio Faria de Oliveira *
543afb585a9SMauricio Faria de Oliveira * However, we may have to redirty a page (see below.)
544afb585a9SMauricio Faria de Oliveira */
ext4_journalled_writepage_callback(struct folio * folio,struct writeback_control * wbc,void * data)545d585bdbeSMatthew Wilcox (Oracle) static int ext4_journalled_writepage_callback(struct folio *folio,
546afb585a9SMauricio Faria de Oliveira struct writeback_control *wbc,
547afb585a9SMauricio Faria de Oliveira void *data)
548afb585a9SMauricio Faria de Oliveira {
549afb585a9SMauricio Faria de Oliveira transaction_t *transaction = (transaction_t *) data;
550afb585a9SMauricio Faria de Oliveira struct buffer_head *bh, *head;
551afb585a9SMauricio Faria de Oliveira struct journal_head *jh;
552afb585a9SMauricio Faria de Oliveira
553d585bdbeSMatthew Wilcox (Oracle) bh = head = folio_buffers(folio);
554afb585a9SMauricio Faria de Oliveira do {
555afb585a9SMauricio Faria de Oliveira /*
556afb585a9SMauricio Faria de Oliveira * We have to redirty a page in these cases:
557afb585a9SMauricio Faria de Oliveira * 1) If buffer is dirty, it means the page was dirty because it
558afb585a9SMauricio Faria de Oliveira * contains a buffer that needs checkpointing. So the dirty bit
559afb585a9SMauricio Faria de Oliveira * needs to be preserved so that checkpointing writes the buffer
560afb585a9SMauricio Faria de Oliveira * properly.
561afb585a9SMauricio Faria de Oliveira * 2) If buffer is not part of the committing transaction
562afb585a9SMauricio Faria de Oliveira * (we may have just accidentally come across this buffer because
563afb585a9SMauricio Faria de Oliveira * inode range tracking is not exact) or if the currently running
564afb585a9SMauricio Faria de Oliveira * transaction already contains this buffer as well, dirty bit
565afb585a9SMauricio Faria de Oliveira * needs to be preserved so that the buffer gets writeprotected
566afb585a9SMauricio Faria de Oliveira * properly on running transaction's commit.
567afb585a9SMauricio Faria de Oliveira */
568afb585a9SMauricio Faria de Oliveira jh = bh2jh(bh);
569afb585a9SMauricio Faria de Oliveira if (buffer_dirty(bh) ||
570afb585a9SMauricio Faria de Oliveira (jh && (jh->b_transaction != transaction ||
571afb585a9SMauricio Faria de Oliveira jh->b_next_transaction))) {
572d585bdbeSMatthew Wilcox (Oracle) folio_redirty_for_writepage(wbc, folio);
573afb585a9SMauricio Faria de Oliveira goto out;
574afb585a9SMauricio Faria de Oliveira }
575afb585a9SMauricio Faria de Oliveira } while ((bh = bh->b_this_page) != head);
576afb585a9SMauricio Faria de Oliveira
577afb585a9SMauricio Faria de Oliveira out:
578afb585a9SMauricio Faria de Oliveira return AOP_WRITEPAGE_ACTIVATE;
579afb585a9SMauricio Faria de Oliveira }
580afb585a9SMauricio Faria de Oliveira
ext4_journalled_submit_inode_data_buffers(struct jbd2_inode * jinode)581afb585a9SMauricio Faria de Oliveira static int ext4_journalled_submit_inode_data_buffers(struct jbd2_inode *jinode)
582afb585a9SMauricio Faria de Oliveira {
583afb585a9SMauricio Faria de Oliveira struct address_space *mapping = jinode->i_vfs_inode->i_mapping;
584afb585a9SMauricio Faria de Oliveira struct writeback_control wbc = {
585afb585a9SMauricio Faria de Oliveira .sync_mode = WB_SYNC_ALL,
586afb585a9SMauricio Faria de Oliveira .nr_to_write = LONG_MAX,
587afb585a9SMauricio Faria de Oliveira .range_start = jinode->i_dirty_start,
588afb585a9SMauricio Faria de Oliveira .range_end = jinode->i_dirty_end,
589afb585a9SMauricio Faria de Oliveira };
590afb585a9SMauricio Faria de Oliveira
591afb585a9SMauricio Faria de Oliveira return write_cache_pages(mapping, &wbc,
592afb585a9SMauricio Faria de Oliveira ext4_journalled_writepage_callback,
593afb585a9SMauricio Faria de Oliveira jinode->i_transaction);
594afb585a9SMauricio Faria de Oliveira }
595afb585a9SMauricio Faria de Oliveira
ext4_journal_submit_inode_data_buffers(struct jbd2_inode * jinode)596afb585a9SMauricio Faria de Oliveira static int ext4_journal_submit_inode_data_buffers(struct jbd2_inode *jinode)
597afb585a9SMauricio Faria de Oliveira {
598afb585a9SMauricio Faria de Oliveira int ret;
599afb585a9SMauricio Faria de Oliveira
600afb585a9SMauricio Faria de Oliveira if (ext4_should_journal_data(jinode->i_vfs_inode))
601afb585a9SMauricio Faria de Oliveira ret = ext4_journalled_submit_inode_data_buffers(jinode);
602afb585a9SMauricio Faria de Oliveira else
60359205c8dSJan Kara ret = ext4_normal_submit_inode_data_buffers(jinode);
604afb585a9SMauricio Faria de Oliveira return ret;
605afb585a9SMauricio Faria de Oliveira }
606afb585a9SMauricio Faria de Oliveira
ext4_journal_finish_inode_data_buffers(struct jbd2_inode * jinode)607afb585a9SMauricio Faria de Oliveira static int ext4_journal_finish_inode_data_buffers(struct jbd2_inode *jinode)
608afb585a9SMauricio Faria de Oliveira {
609afb585a9SMauricio Faria de Oliveira int ret = 0;
610afb585a9SMauricio Faria de Oliveira
611afb585a9SMauricio Faria de Oliveira if (!ext4_should_journal_data(jinode->i_vfs_inode))
612afb585a9SMauricio Faria de Oliveira ret = jbd2_journal_finish_inode_data_buffers(jinode);
613afb585a9SMauricio Faria de Oliveira
614afb585a9SMauricio Faria de Oliveira return ret;
615afb585a9SMauricio Faria de Oliveira }
616afb585a9SMauricio Faria de Oliveira
system_going_down(void)6171dc1097fSJan Kara static bool system_going_down(void)
6181dc1097fSJan Kara {
6191dc1097fSJan Kara return system_state == SYSTEM_HALT || system_state == SYSTEM_POWER_OFF
6201dc1097fSJan Kara || system_state == SYSTEM_RESTART;
6211dc1097fSJan Kara }
6221dc1097fSJan Kara
62302a7780eSJan Kara struct ext4_err_translation {
62402a7780eSJan Kara int code;
62502a7780eSJan Kara int errno;
62602a7780eSJan Kara };
62702a7780eSJan Kara
62802a7780eSJan Kara #define EXT4_ERR_TRANSLATE(err) { .code = EXT4_ERR_##err, .errno = err }
62902a7780eSJan Kara
63002a7780eSJan Kara static struct ext4_err_translation err_translation[] = {
63102a7780eSJan Kara EXT4_ERR_TRANSLATE(EIO),
63202a7780eSJan Kara EXT4_ERR_TRANSLATE(ENOMEM),
63302a7780eSJan Kara EXT4_ERR_TRANSLATE(EFSBADCRC),
63402a7780eSJan Kara EXT4_ERR_TRANSLATE(EFSCORRUPTED),
63502a7780eSJan Kara EXT4_ERR_TRANSLATE(ENOSPC),
63602a7780eSJan Kara EXT4_ERR_TRANSLATE(ENOKEY),
63702a7780eSJan Kara EXT4_ERR_TRANSLATE(EROFS),
63802a7780eSJan Kara EXT4_ERR_TRANSLATE(EFBIG),
63902a7780eSJan Kara EXT4_ERR_TRANSLATE(EEXIST),
64002a7780eSJan Kara EXT4_ERR_TRANSLATE(ERANGE),
64102a7780eSJan Kara EXT4_ERR_TRANSLATE(EOVERFLOW),
64202a7780eSJan Kara EXT4_ERR_TRANSLATE(EBUSY),
64302a7780eSJan Kara EXT4_ERR_TRANSLATE(ENOTDIR),
64402a7780eSJan Kara EXT4_ERR_TRANSLATE(ENOTEMPTY),
64502a7780eSJan Kara EXT4_ERR_TRANSLATE(ESHUTDOWN),
64602a7780eSJan Kara EXT4_ERR_TRANSLATE(EFAULT),
64702a7780eSJan Kara };
64802a7780eSJan Kara
ext4_errno_to_code(int errno)64902a7780eSJan Kara static int ext4_errno_to_code(int errno)
65002a7780eSJan Kara {
65102a7780eSJan Kara int i;
65202a7780eSJan Kara
65302a7780eSJan Kara for (i = 0; i < ARRAY_SIZE(err_translation); i++)
65402a7780eSJan Kara if (err_translation[i].errno == errno)
65502a7780eSJan Kara return err_translation[i].code;
65602a7780eSJan Kara return EXT4_ERR_UNKNOWN;
65702a7780eSJan Kara }
65802a7780eSJan Kara
/*
 * Record an error in the in-memory superblock info, under s_error_lock.
 *
 * The "last error" fields are always overwritten and the pending error
 * count is bumped.  The "first error" fields are filled in only while no
 * first-error time has been recorded yet.  An @error of 0 is stored as
 * EFSCORRUPTED.
 */
static void save_error_info(struct super_block *sb, int error,
			    __u32 ino, __u64 block,
			    const char *func, unsigned int line)
{
	struct ext4_sb_info *sbi = EXT4_SB(sb);
	bool is_first;

	/* We default to EFSCORRUPTED error... */
	if (!error)
		error = EFSCORRUPTED;

	spin_lock(&sbi->s_error_lock);
	is_first = !sbi->s_first_error_time;

	sbi->s_add_error_count++;
	sbi->s_last_error_code = error;
	sbi->s_last_error_line = line;
	sbi->s_last_error_ino = ino;
	sbi->s_last_error_block = block;
	sbi->s_last_error_func = func;
	sbi->s_last_error_time = ktime_get_real_seconds();

	if (is_first) {
		sbi->s_first_error_code = error;
		sbi->s_first_error_line = line;
		sbi->s_first_error_ino = ino;
		sbi->s_first_error_block = block;
		sbi->s_first_error_func = func;
		sbi->s_first_error_time = sbi->s_last_error_time;
	}
	spin_unlock(&sbi->s_error_lock);
}
68740676623SJan Kara
688ac27a0ecSDave Kleikamp /* Deal with the reporting of failure conditions on a filesystem such as
689ac27a0ecSDave Kleikamp * inconsistencies detected or read IO failures.
690ac27a0ecSDave Kleikamp *
691ac27a0ecSDave Kleikamp * On ext2, we can store the error state of the filesystem in the
692617ba13bSMingming Cao * superblock. That is not possible on ext4, because we may have other
693ac27a0ecSDave Kleikamp * write ordering constraints on the superblock which prevent us from
694ac27a0ecSDave Kleikamp * writing it out straight away; and given that the journal is about to
695ac27a0ecSDave Kleikamp * be aborted, we can't rely on the current, or future, transactions to
696ac27a0ecSDave Kleikamp * write out the superblock safely.
697ac27a0ecSDave Kleikamp *
698dab291afSMingming Cao * We'll just use the jbd2_journal_abort() error code to record an error in
699d6b198bcSThadeu Lima de Souza Cascardo * the journal instead. On recovery, the journal will complain about
700ac27a0ecSDave Kleikamp * that error until we've noted it down and cleared it.
701014c9caaSJan Kara *
702014c9caaSJan Kara * If force_ro is set, we unconditionally force the filesystem into an
703014c9caaSJan Kara * ABORT|READONLY state, unless the error response on the fs has been set to
704014c9caaSJan Kara * panic in which case we take the easy way out and panic immediately. This is
705014c9caaSJan Kara * used to deal with unrecoverable failures such as journal IO errors or ENOMEM
706014c9caaSJan Kara * at a critical moment in log management.
707ac27a0ecSDave Kleikamp */
ext4_handle_error(struct super_block * sb,bool force_ro,int error,__u32 ino,__u64 block,const char * func,unsigned int line)708e789ca0cSJan Kara static void ext4_handle_error(struct super_block *sb, bool force_ro, int error,
709e789ca0cSJan Kara __u32 ino, __u64 block,
710e789ca0cSJan Kara const char *func, unsigned int line)
711ac27a0ecSDave Kleikamp {
712b08070ecSJan Kara journal_t *journal = EXT4_SB(sb)->s_journal;
7132d01ddc8SJan Kara bool continue_fs = !force_ro && test_opt(sb, ERRORS_CONT);
714b08070ecSJan Kara
715e789ca0cSJan Kara EXT4_SB(sb)->s_mount_state |= EXT4_ERROR_FS;
716327eaf73STheodore Ts'o if (test_opt(sb, WARN_ON_ERROR))
717327eaf73STheodore Ts'o WARN_ON_ONCE(1);
718327eaf73STheodore Ts'o
7192d01ddc8SJan Kara if (!continue_fs && !sb_rdonly(sb)) {
72095257987SJan Kara set_bit(EXT4_FLAGS_SHUTDOWN, &EXT4_SB(sb)->s_ext4_flags);
721ac27a0ecSDave Kleikamp if (journal)
722dab291afSMingming Cao jbd2_journal_abort(journal, -EIO);
7232d01ddc8SJan Kara }
7242d01ddc8SJan Kara
7252d01ddc8SJan Kara if (!bdev_read_only(sb->s_bdev)) {
7262d01ddc8SJan Kara save_error_info(sb, error, ino, block, func, line);
7272d01ddc8SJan Kara /*
7282d01ddc8SJan Kara * In case the fs should keep running, we need to writeout
7292d01ddc8SJan Kara * superblock through the journal. Due to lock ordering
7302d01ddc8SJan Kara * constraints, it may not be safe to do it right here so we
7312d01ddc8SJan Kara * defer superblock flushing to a workqueue.
7322d01ddc8SJan Kara */
733bb9464e0Syangerkun if (continue_fs && journal)
734bb15cea2STheodore Ts'o schedule_work(&EXT4_SB(sb)->s_sb_upd_work);
7352d01ddc8SJan Kara else
7362d01ddc8SJan Kara ext4_commit_super(sb);
7372d01ddc8SJan Kara }
7382d01ddc8SJan Kara
7391dc1097fSJan Kara /*
7401dc1097fSJan Kara * We force ERRORS_RO behavior when system is rebooting. Otherwise we
7411dc1097fSJan Kara * could panic during 'reboot -f' as the underlying device got already
7421dc1097fSJan Kara * disabled.
7431dc1097fSJan Kara */
744014c9caaSJan Kara if (test_opt(sb, ERRORS_PANIC) && !system_going_down()) {
745617ba13bSMingming Cao panic("EXT4-fs (device %s): panic forced after error\n",
746ac27a0ecSDave Kleikamp sb->s_id);
747ac27a0ecSDave Kleikamp }
748ac2f7ca5SYe Bin
749ac2f7ca5SYe Bin if (sb_rdonly(sb) || continue_fs)
750ac2f7ca5SYe Bin return;
751ac2f7ca5SYe Bin
752014c9caaSJan Kara ext4_msg(sb, KERN_CRIT, "Remounting filesystem read-only");
753014c9caaSJan Kara /*
75458c0648eSJan Kara * EXT4_FLAGS_SHUTDOWN was set which stops all filesystem
75558c0648eSJan Kara * modifications. We don't set SB_RDONLY because that requires
75658c0648eSJan Kara * sb->s_umount semaphore and setting it without proper remount
75758c0648eSJan Kara * procedure is confusing code such as freeze_super() leading to
75858c0648eSJan Kara * deadlocks and other problems.
759014c9caaSJan Kara */
7604327ba52SDaeho Jeong }
761ac27a0ecSDave Kleikamp
update_super_work(struct work_struct * work)762bb15cea2STheodore Ts'o static void update_super_work(struct work_struct *work)
763c92dc856SJan Kara {
764c92dc856SJan Kara struct ext4_sb_info *sbi = container_of(work, struct ext4_sb_info,
765bb15cea2STheodore Ts'o s_sb_upd_work);
7662d01ddc8SJan Kara journal_t *journal = sbi->s_journal;
7672d01ddc8SJan Kara handle_t *handle;
768c92dc856SJan Kara
7692d01ddc8SJan Kara /*
7702d01ddc8SJan Kara * If the journal is still running, we have to write out superblock
7712d01ddc8SJan Kara * through the journal to avoid collisions of other journalled sb
7722d01ddc8SJan Kara * updates.
7732d01ddc8SJan Kara *
7742d01ddc8SJan Kara * We use directly jbd2 functions here to avoid recursing back into
7752d01ddc8SJan Kara * ext4 error handling code during handling of previous errors.
7762d01ddc8SJan Kara */
7772d01ddc8SJan Kara if (!sb_rdonly(sbi->s_sb) && journal) {
778558d6450SYe Bin struct buffer_head *sbh = sbi->s_sbh;
779b9945f90STheodore Ts'o bool call_notify_err = false;
780b9945f90STheodore Ts'o
7812d01ddc8SJan Kara handle = jbd2_journal_start(journal, 1);
7822d01ddc8SJan Kara if (IS_ERR(handle))
7832d01ddc8SJan Kara goto write_directly;
784558d6450SYe Bin if (jbd2_journal_get_write_access(handle, sbh)) {
7852d01ddc8SJan Kara jbd2_journal_stop(handle);
7862d01ddc8SJan Kara goto write_directly;
7872d01ddc8SJan Kara }
788ff0722deSVitaliy Kuznetsov
789ff0722deSVitaliy Kuznetsov if (sbi->s_add_error_count > 0)
790ff0722deSVitaliy Kuznetsov call_notify_err = true;
791ff0722deSVitaliy Kuznetsov
7922d01ddc8SJan Kara ext4_update_super(sbi->s_sb);
793558d6450SYe Bin if (buffer_write_io_error(sbh) || !buffer_uptodate(sbh)) {
794558d6450SYe Bin ext4_msg(sbi->s_sb, KERN_ERR, "previous I/O error to "
795558d6450SYe Bin "superblock detected");
796558d6450SYe Bin clear_buffer_write_io_error(sbh);
797558d6450SYe Bin set_buffer_uptodate(sbh);
798558d6450SYe Bin }
799558d6450SYe Bin
800558d6450SYe Bin if (jbd2_journal_dirty_metadata(handle, sbh)) {
8012d01ddc8SJan Kara jbd2_journal_stop(handle);
8022d01ddc8SJan Kara goto write_directly;
8032d01ddc8SJan Kara }
8042d01ddc8SJan Kara jbd2_journal_stop(handle);
805ff0722deSVitaliy Kuznetsov
806ff0722deSVitaliy Kuznetsov if (call_notify_err)
807d578b994SJonathan Davies ext4_notify_error_sysfs(sbi);
808ff0722deSVitaliy Kuznetsov
8092d01ddc8SJan Kara return;
8102d01ddc8SJan Kara }
8112d01ddc8SJan Kara write_directly:
8122d01ddc8SJan Kara /*
8132d01ddc8SJan Kara * Write through journal failed. Write sb directly to get error info
8142d01ddc8SJan Kara * out and hope for the best.
8152d01ddc8SJan Kara */
8164392fbc4SJan Kara ext4_commit_super(sbi->s_sb);
817d578b994SJonathan Davies ext4_notify_error_sysfs(sbi);
818ac27a0ecSDave Kleikamp }
819ac27a0ecSDave Kleikamp
/*
 * Consult the per-superblock error ratelimit state; callers in this file
 * only print their "EXT4-fs error" message when this evaluates nonzero.
 */
#define ext4_error_ratelimit(sb)					\
	___ratelimit(&EXT4_SB(sb)->s_err_ratelimit_state, "EXT4-fs error")
823efbed4dcSTheodore Ts'o
__ext4_error(struct super_block * sb,const char * function,unsigned int line,bool force_ro,int error,__u64 block,const char * fmt,...)82412062dddSEric Sandeen void __ext4_error(struct super_block *sb, const char *function,
825014c9caaSJan Kara unsigned int line, bool force_ro, int error, __u64 block,
82654d3adbcSTheodore Ts'o const char *fmt, ...)
827ac27a0ecSDave Kleikamp {
8280ff2ea7dSJoe Perches struct va_format vaf;
829ac27a0ecSDave Kleikamp va_list args;
830ac27a0ecSDave Kleikamp
831eb8ab444SJan Kara if (unlikely(ext4_forced_shutdown(sb)))
8320db1ff22STheodore Ts'o return;
8330db1ff22STheodore Ts'o
834ccf0f32aSTheodore Ts'o trace_ext4_error(sb, function, line);
835efbed4dcSTheodore Ts'o if (ext4_error_ratelimit(sb)) {
836ac27a0ecSDave Kleikamp va_start(args, fmt);
8370ff2ea7dSJoe Perches vaf.fmt = fmt;
8380ff2ea7dSJoe Perches vaf.va = &args;
839efbed4dcSTheodore Ts'o printk(KERN_CRIT
840efbed4dcSTheodore Ts'o "EXT4-fs error (device %s): %s:%d: comm %s: %pV\n",
8410ff2ea7dSJoe Perches sb->s_id, function, line, current->comm, &vaf);
842ac27a0ecSDave Kleikamp va_end(args);
843efbed4dcSTheodore Ts'o }
8449a089b21SGabriel Krisman Bertazi fsnotify_sb_error(sb, NULL, error ? error : EFSCORRUPTED);
8459a089b21SGabriel Krisman Bertazi
846e789ca0cSJan Kara ext4_handle_error(sb, force_ro, error, 0, block, function, line);
847ac27a0ecSDave Kleikamp }
848ac27a0ecSDave Kleikamp
__ext4_error_inode(struct inode * inode,const char * function,unsigned int line,ext4_fsblk_t block,int error,const char * fmt,...)849e7c96e8eSJoe Perches void __ext4_error_inode(struct inode *inode, const char *function,
85054d3adbcSTheodore Ts'o unsigned int line, ext4_fsblk_t block, int error,
851273df556SFrank Mayhar const char *fmt, ...)
852273df556SFrank Mayhar {
853273df556SFrank Mayhar va_list args;
854f7c21177STheodore Ts'o struct va_format vaf;
855273df556SFrank Mayhar
856eb8ab444SJan Kara if (unlikely(ext4_forced_shutdown(inode->i_sb)))
8570db1ff22STheodore Ts'o return;
8580db1ff22STheodore Ts'o
859ccf0f32aSTheodore Ts'o trace_ext4_error(inode->i_sb, function, line);
860efbed4dcSTheodore Ts'o if (ext4_error_ratelimit(inode->i_sb)) {
861273df556SFrank Mayhar va_start(args, fmt);
862f7c21177STheodore Ts'o vaf.fmt = fmt;
863f7c21177STheodore Ts'o vaf.va = &args;
864c398eda0STheodore Ts'o if (block)
865d9ee81daSJoe Perches printk(KERN_CRIT "EXT4-fs error (device %s): %s:%d: "
866d9ee81daSJoe Perches "inode #%lu: block %llu: comm %s: %pV\n",
867d9ee81daSJoe Perches inode->i_sb->s_id, function, line, inode->i_ino,
868d9ee81daSJoe Perches block, current->comm, &vaf);
869d9ee81daSJoe Perches else
870d9ee81daSJoe Perches printk(KERN_CRIT "EXT4-fs error (device %s): %s:%d: "
871d9ee81daSJoe Perches "inode #%lu: comm %s: %pV\n",
872d9ee81daSJoe Perches inode->i_sb->s_id, function, line, inode->i_ino,
873d9ee81daSJoe Perches current->comm, &vaf);
874273df556SFrank Mayhar va_end(args);
875efbed4dcSTheodore Ts'o }
8769a089b21SGabriel Krisman Bertazi fsnotify_sb_error(inode->i_sb, inode, error ? error : EFSCORRUPTED);
8779a089b21SGabriel Krisman Bertazi
878e789ca0cSJan Kara ext4_handle_error(inode->i_sb, false, error, inode->i_ino, block,
87954d3adbcSTheodore Ts'o function, line);
880273df556SFrank Mayhar }
881273df556SFrank Mayhar
/*
 * Report an error against the inode behind @file.
 *
 * The message additionally names the file's path, resolved into an
 * 80-byte buffer; "(unknown)" is printed when the lookup fails.  The
 * error is always reported as EFSCORRUPTED and the filesystem is never
 * forced read-only from here.
 */
void __ext4_error_file(struct file *file, const char *function,
		       unsigned int line, ext4_fsblk_t block,
		       const char *fmt, ...)
{
	struct inode *inode = file_inode(file);
	struct super_block *sb = inode->i_sb;

	if (unlikely(ext4_forced_shutdown(sb)))
		return;

	trace_ext4_error(sb, function, line);
	if (ext4_error_ratelimit(sb)) {
		char pathname[80];
		char *path;
		struct va_format vaf;
		va_list ap;

		path = file_path(file, pathname, sizeof(pathname));
		if (IS_ERR(path))
			path = "(unknown)";

		va_start(ap, fmt);
		vaf.fmt = fmt;
		vaf.va = &ap;
		if (block)
			printk(KERN_CRIT
			       "EXT4-fs error (device %s): %s:%d: inode #%lu: "
			       "block %llu: comm %s: path %s: %pV\n",
			       sb->s_id, function, line, inode->i_ino,
			       block, current->comm, path, &vaf);
		else
			printk(KERN_CRIT
			       "EXT4-fs error (device %s): %s:%d: inode #%lu: "
			       "comm %s: path %s: %pV\n",
			       sb->s_id, function, line, inode->i_ino,
			       current->comm, path, &vaf);
		va_end(ap);
	}

	fsnotify_sb_error(sb, inode, EFSCORRUPTED);

	ext4_handle_error(sb, false, EFSCORRUPTED, inode->i_ino, block,
			  function, line);
}
921273df556SFrank Mayhar
ext4_decode_error(struct super_block * sb,int errno,char nbuf[16])922722887ddSTheodore Ts'o const char *ext4_decode_error(struct super_block *sb, int errno,
923ac27a0ecSDave Kleikamp char nbuf[16])
924ac27a0ecSDave Kleikamp {
925ac27a0ecSDave Kleikamp char *errstr = NULL;
926ac27a0ecSDave Kleikamp
927ac27a0ecSDave Kleikamp switch (errno) {
9286a797d27SDarrick J. Wong case -EFSCORRUPTED:
9296a797d27SDarrick J. Wong errstr = "Corrupt filesystem";
9306a797d27SDarrick J. Wong break;
9316a797d27SDarrick J. Wong case -EFSBADCRC:
9326a797d27SDarrick J. Wong errstr = "Filesystem failed CRC";
9336a797d27SDarrick J. Wong break;
934ac27a0ecSDave Kleikamp case -EIO:
935ac27a0ecSDave Kleikamp errstr = "IO failure";
936ac27a0ecSDave Kleikamp break;
937ac27a0ecSDave Kleikamp case -ENOMEM:
938ac27a0ecSDave Kleikamp errstr = "Out of memory";
939ac27a0ecSDave Kleikamp break;
940ac27a0ecSDave Kleikamp case -EROFS:
94178f1ddbbSTheodore Ts'o if (!sb || (EXT4_SB(sb)->s_journal &&
94278f1ddbbSTheodore Ts'o EXT4_SB(sb)->s_journal->j_flags & JBD2_ABORT))
943ac27a0ecSDave Kleikamp errstr = "Journal has aborted";
944ac27a0ecSDave Kleikamp else
945ac27a0ecSDave Kleikamp errstr = "Readonly filesystem";
946ac27a0ecSDave Kleikamp break;
947ac27a0ecSDave Kleikamp default:
948ac27a0ecSDave Kleikamp /* If the caller passed in an extra buffer for unknown
949ac27a0ecSDave Kleikamp * errors, textualise them now. Else we just return
950ac27a0ecSDave Kleikamp * NULL. */
951ac27a0ecSDave Kleikamp if (nbuf) {
952ac27a0ecSDave Kleikamp /* Check for truncated error codes... */
953ac27a0ecSDave Kleikamp if (snprintf(nbuf, 16, "error %d", -errno) >= 0)
954ac27a0ecSDave Kleikamp errstr = nbuf;
955ac27a0ecSDave Kleikamp }
956ac27a0ecSDave Kleikamp break;
957ac27a0ecSDave Kleikamp }
958ac27a0ecSDave Kleikamp
959ac27a0ecSDave Kleikamp return errstr;
960ac27a0ecSDave Kleikamp }
961ac27a0ecSDave Kleikamp
962617ba13bSMingming Cao /* __ext4_std_error decodes expected errors from journaling functions
963ac27a0ecSDave Kleikamp * automatically and invokes the appropriate error response. */
964ac27a0ecSDave Kleikamp
__ext4_std_error(struct super_block * sb,const char * function,unsigned int line,int errno)965c398eda0STheodore Ts'o void __ext4_std_error(struct super_block *sb, const char *function,
966c398eda0STheodore Ts'o unsigned int line, int errno)
967ac27a0ecSDave Kleikamp {
968ac27a0ecSDave Kleikamp char nbuf[16];
969ac27a0ecSDave Kleikamp const char *errstr;
970ac27a0ecSDave Kleikamp
971eb8ab444SJan Kara if (unlikely(ext4_forced_shutdown(sb)))
9720db1ff22STheodore Ts'o return;
9730db1ff22STheodore Ts'o
974ac27a0ecSDave Kleikamp /* Special case: if the error is EROFS, and we're not already
975ac27a0ecSDave Kleikamp * inside a transaction, then there's really no point in logging
976ac27a0ecSDave Kleikamp * an error. */
977bc98a42cSDavid Howells if (errno == -EROFS && journal_current_handle() == NULL && sb_rdonly(sb))
978ac27a0ecSDave Kleikamp return;
979ac27a0ecSDave Kleikamp
980efbed4dcSTheodore Ts'o if (ext4_error_ratelimit(sb)) {
981617ba13bSMingming Cao errstr = ext4_decode_error(sb, errno, nbuf);
982c398eda0STheodore Ts'o printk(KERN_CRIT "EXT4-fs error (device %s) in %s:%d: %s\n",
983c398eda0STheodore Ts'o sb->s_id, function, line, errstr);
984efbed4dcSTheodore Ts'o }
9859a089b21SGabriel Krisman Bertazi fsnotify_sb_error(sb, NULL, errno ? errno : EFSCORRUPTED);
986ac27a0ecSDave Kleikamp
987e789ca0cSJan Kara ext4_handle_error(sb, false, -errno, 0, 0, function, line);
988ac27a0ecSDave Kleikamp }
989ac27a0ecSDave Kleikamp
__ext4_msg(struct super_block * sb,const char * prefix,const char * fmt,...)990e7c96e8eSJoe Perches void __ext4_msg(struct super_block *sb,
991e7c96e8eSJoe Perches const char *prefix, const char *fmt, ...)
992b31e1552SEric Sandeen {
9930ff2ea7dSJoe Perches struct va_format vaf;
994b31e1552SEric Sandeen va_list args;
995b31e1552SEric Sandeen
996da812f61SLukas Czerner if (sb) {
9971cf006edSDmitry Monakhov atomic_inc(&EXT4_SB(sb)->s_msg_count);
998da812f61SLukas Czerner if (!___ratelimit(&(EXT4_SB(sb)->s_msg_ratelimit_state),
999da812f61SLukas Czerner "EXT4-fs"))
1000efbed4dcSTheodore Ts'o return;
1001da812f61SLukas Czerner }
1002efbed4dcSTheodore Ts'o
1003b31e1552SEric Sandeen va_start(args, fmt);
10040ff2ea7dSJoe Perches vaf.fmt = fmt;
10050ff2ea7dSJoe Perches vaf.va = &args;
1006da812f61SLukas Czerner if (sb)
10070ff2ea7dSJoe Perches printk("%sEXT4-fs (%s): %pV\n", prefix, sb->s_id, &vaf);
1008da812f61SLukas Czerner else
1009da812f61SLukas Czerner printk("%sEXT4-fs: %pV\n", prefix, &vaf);
1010b31e1552SEric Sandeen va_end(args);
1011b31e1552SEric Sandeen }
1012b31e1552SEric Sandeen
ext4_warning_ratelimit(struct super_block * sb)10131cf006edSDmitry Monakhov static int ext4_warning_ratelimit(struct super_block *sb)
10141cf006edSDmitry Monakhov {
10151cf006edSDmitry Monakhov atomic_inc(&EXT4_SB(sb)->s_warning_count);
10161cf006edSDmitry Monakhov return ___ratelimit(&(EXT4_SB(sb)->s_warning_ratelimit_state),
10171cf006edSDmitry Monakhov "EXT4-fs warning");
10181cf006edSDmitry Monakhov }
1019b03a2f7eSAndreas Dilger
__ext4_warning(struct super_block * sb,const char * function,unsigned int line,const char * fmt,...)102012062dddSEric Sandeen void __ext4_warning(struct super_block *sb, const char *function,
1021c398eda0STheodore Ts'o unsigned int line, const char *fmt, ...)
1022ac27a0ecSDave Kleikamp {
10230ff2ea7dSJoe Perches struct va_format vaf;
1024ac27a0ecSDave Kleikamp va_list args;
1025ac27a0ecSDave Kleikamp
1026b03a2f7eSAndreas Dilger if (!ext4_warning_ratelimit(sb))
1027efbed4dcSTheodore Ts'o return;
1028efbed4dcSTheodore Ts'o
1029ac27a0ecSDave Kleikamp va_start(args, fmt);
10300ff2ea7dSJoe Perches vaf.fmt = fmt;
10310ff2ea7dSJoe Perches vaf.va = &args;
10320ff2ea7dSJoe Perches printk(KERN_WARNING "EXT4-fs warning (device %s): %s:%d: %pV\n",
10330ff2ea7dSJoe Perches sb->s_id, function, line, &vaf);
1034ac27a0ecSDave Kleikamp va_end(args);
1035ac27a0ecSDave Kleikamp }
1036ac27a0ecSDave Kleikamp
__ext4_warning_inode(const struct inode * inode,const char * function,unsigned int line,const char * fmt,...)1037b03a2f7eSAndreas Dilger void __ext4_warning_inode(const struct inode *inode, const char *function,
1038b03a2f7eSAndreas Dilger unsigned int line, const char *fmt, ...)
1039b03a2f7eSAndreas Dilger {
1040b03a2f7eSAndreas Dilger struct va_format vaf;
1041b03a2f7eSAndreas Dilger va_list args;
1042b03a2f7eSAndreas Dilger
1043b03a2f7eSAndreas Dilger if (!ext4_warning_ratelimit(inode->i_sb))
1044b03a2f7eSAndreas Dilger return;
1045b03a2f7eSAndreas Dilger
1046b03a2f7eSAndreas Dilger va_start(args, fmt);
1047b03a2f7eSAndreas Dilger vaf.fmt = fmt;
1048b03a2f7eSAndreas Dilger vaf.va = &args;
1049b03a2f7eSAndreas Dilger printk(KERN_WARNING "EXT4-fs warning (device %s): %s:%d: "
1050b03a2f7eSAndreas Dilger "inode #%lu: comm %s: %pV\n", inode->i_sb->s_id,
1051b03a2f7eSAndreas Dilger function, line, inode->i_ino, current->comm, &vaf);
1052b03a2f7eSAndreas Dilger va_end(args);
1053b03a2f7eSAndreas Dilger }
1054b03a2f7eSAndreas Dilger
/*
 * Report an error for block group @grp.  The sparse annotations below
 * mark the function as releasing and re-acquiring the group bitlock.
 *
 * With errors=continue the error is only recorded and the superblock
 * update work is scheduled; the group lock is not touched.  Otherwise the
 * group lock is dropped around ext4_handle_error() and taken again before
 * returning, so the caller's locking state is unchanged.
 */
void __ext4_grp_locked_error(const char *function, unsigned int line,
			     struct super_block *sb, ext4_group_t grp,
			     unsigned long ino, ext4_fsblk_t block,
			     const char *fmt, ...)
__releases(bitlock)
__acquires(bitlock)
{
	if (unlikely(ext4_forced_shutdown(sb)))
		return;

	trace_ext4_error(sb, function, line);
	if (ext4_error_ratelimit(sb)) {
		struct va_format vaf;
		va_list ap;

		va_start(ap, fmt);
		vaf.fmt = fmt;
		vaf.va = &ap;
		printk(KERN_CRIT "EXT4-fs error (device %s): %s:%d: group %u, ",
		       sb->s_id, function, line, grp);
		if (ino)
			printk(KERN_CONT "inode %lu: ", ino);
		if (block)
			printk(KERN_CONT "block %llu:",
			       (unsigned long long) block);
		printk(KERN_CONT "%pV\n", &vaf);
		va_end(ap);
	}

	if (!test_opt(sb, ERRORS_CONT)) {
		/*
		 * Not continuing on errors: run the full error response
		 * with the group lock released, then retake it.
		 */
		ext4_unlock_group(sb, grp);
		ext4_handle_error(sb, false, EFSCORRUPTED, ino, block,
				  function, line);
		ext4_lock_group(sb, grp);
		return;
	}

	/* errors=continue: note the error and defer the superblock write. */
	if (test_opt(sb, WARN_ON_ERROR))
		WARN_ON_ONCE(1);
	EXT4_SB(sb)->s_mount_state |= EXT4_ERROR_FS;
	if (!bdev_read_only(sb->s_bdev)) {
		save_error_info(sb, EFSCORRUPTED, ino, block, function, line);
		schedule_work(&EXT4_SB(sb)->s_sb_upd_work);
	}
}
11115d1b1b3fSAneesh Kumar K.V
/*
 * Flag the block and/or inode bitmap of @group as corrupted, as selected
 * by @flags.
 *
 * The first time each corruption bit is set, the group's free count is
 * subtracted from the matching filesystem-wide free counter.  Nothing is
 * done when the group info or group descriptor cannot be obtained.
 */
void ext4_mark_group_bitmap_corrupted(struct super_block *sb,
				      ext4_group_t group,
				      unsigned int flags)
{
	struct ext4_sb_info *sbi = EXT4_SB(sb);
	struct ext4_group_info *grp = ext4_get_group_info(sb, group);
	struct ext4_group_desc *gdp = ext4_get_group_desc(sb, group, NULL);

	if (!grp || !gdp)
		return;

	if ((flags & EXT4_GROUP_INFO_BBITMAP_CORRUPT) &&
	    !ext4_test_and_set_bit(EXT4_GROUP_INFO_BBITMAP_CORRUPT_BIT,
				   &grp->bb_state))
		percpu_counter_sub(&sbi->s_freeclusters_counter,
				   grp->bb_free);

	if ((flags & EXT4_GROUP_INFO_IBITMAP_CORRUPT) &&
	    !ext4_test_and_set_bit(EXT4_GROUP_INFO_IBITMAP_CORRUPT_BIT,
				   &grp->bb_state)) {
		int free_inodes = ext4_free_inodes_count(sb, gdp);

		percpu_counter_sub(&sbi->s_freeinodes_counter, free_inodes);
	}
}
1143db79e6d1SWang Shilong
ext4_update_dynamic_rev(struct super_block * sb)1144617ba13bSMingming Cao void ext4_update_dynamic_rev(struct super_block *sb)
1145ac27a0ecSDave Kleikamp {
1146617ba13bSMingming Cao struct ext4_super_block *es = EXT4_SB(sb)->s_es;
1147ac27a0ecSDave Kleikamp
1148617ba13bSMingming Cao if (le32_to_cpu(es->s_rev_level) > EXT4_GOOD_OLD_REV)
1149ac27a0ecSDave Kleikamp return;
1150ac27a0ecSDave Kleikamp
115112062dddSEric Sandeen ext4_warning(sb,
1152ac27a0ecSDave Kleikamp "updating to rev %d because of new feature flag, "
1153ac27a0ecSDave Kleikamp "running e2fsck is recommended",
1154617ba13bSMingming Cao EXT4_DYNAMIC_REV);
1155ac27a0ecSDave Kleikamp
1156617ba13bSMingming Cao es->s_first_ino = cpu_to_le32(EXT4_GOOD_OLD_FIRST_INO);
1157617ba13bSMingming Cao es->s_inode_size = cpu_to_le16(EXT4_GOOD_OLD_INODE_SIZE);
1158617ba13bSMingming Cao es->s_rev_level = cpu_to_le32(EXT4_DYNAMIC_REV);
1159ac27a0ecSDave Kleikamp /* leave es->s_feature_*compat flags alone */
1160ac27a0ecSDave Kleikamp /* es->s_uuid will be set by e2fsck if empty */
1161ac27a0ecSDave Kleikamp
1162ac27a0ecSDave Kleikamp /*
1163ac27a0ecSDave Kleikamp * The rest of the superblock fields should be zero, and if not it
1164ac27a0ecSDave Kleikamp * means they are likely already in use, so leave them alone. We
1165ac27a0ecSDave Kleikamp * can leave it up to e2fsck to clean up any inconsistencies there.
1166ac27a0ecSDave Kleikamp */
1167ac27a0ecSDave Kleikamp }
1168ac27a0ecSDave Kleikamp
orphan_list_entry(struct list_head * l)1169ac27a0ecSDave Kleikamp static inline struct inode *orphan_list_entry(struct list_head *l)
1170ac27a0ecSDave Kleikamp {
1171617ba13bSMingming Cao return &list_entry(l, struct ext4_inode_info, i_orphan)->vfs_inode;
1172ac27a0ecSDave Kleikamp }
1173ac27a0ecSDave Kleikamp
dump_orphan_list(struct super_block * sb,struct ext4_sb_info * sbi)1174617ba13bSMingming Cao static void dump_orphan_list(struct super_block *sb, struct ext4_sb_info *sbi)
1175ac27a0ecSDave Kleikamp {
1176ac27a0ecSDave Kleikamp struct list_head *l;
1177ac27a0ecSDave Kleikamp
1178b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "sb orphan head is %d",
1179ac27a0ecSDave Kleikamp le32_to_cpu(sbi->s_es->s_last_orphan));
1180ac27a0ecSDave Kleikamp
1181ac27a0ecSDave Kleikamp printk(KERN_ERR "sb_info orphan list:\n");
1182ac27a0ecSDave Kleikamp list_for_each(l, &sbi->s_orphan) {
1183ac27a0ecSDave Kleikamp struct inode *inode = orphan_list_entry(l);
1184ac27a0ecSDave Kleikamp printk(KERN_ERR " "
1185ac27a0ecSDave Kleikamp "inode %s:%lu at %p: mode %o, nlink %d, next %d\n",
1186ac27a0ecSDave Kleikamp inode->i_sb->s_id, inode->i_ino, inode,
1187ac27a0ecSDave Kleikamp inode->i_mode, inode->i_nlink,
1188ac27a0ecSDave Kleikamp NEXT_ORPHAN(inode));
1189ac27a0ecSDave Kleikamp }
1190ac27a0ecSDave Kleikamp }
1191ac27a0ecSDave Kleikamp
1192957153fcSJan Kara #ifdef CONFIG_QUOTA
1193957153fcSJan Kara static int ext4_quota_off(struct super_block *sb, int type);
1194957153fcSJan Kara
ext4_quotas_off(struct super_block * sb,int type)1195f3c1c42eSBaokun Li static inline void ext4_quotas_off(struct super_block *sb, int type)
1196957153fcSJan Kara {
1197f3c1c42eSBaokun Li BUG_ON(type > EXT4_MAXQUOTAS);
1198957153fcSJan Kara
1199957153fcSJan Kara /* Use our quota_off function to clear inode flags etc. */
1200f3c1c42eSBaokun Li for (type--; type >= 0; type--)
1201957153fcSJan Kara ext4_quota_off(sb, type);
1202957153fcSJan Kara }
120333458eabSTheodore Ts'o
120433458eabSTheodore Ts'o /*
120533458eabSTheodore Ts'o * This is a helper function which is used in the mount/remount
120633458eabSTheodore Ts'o * codepaths (which holds s_umount) to fetch the quota file name.
120733458eabSTheodore Ts'o */
get_qf_name(struct super_block * sb,struct ext4_sb_info * sbi,int type)120833458eabSTheodore Ts'o static inline char *get_qf_name(struct super_block *sb,
120933458eabSTheodore Ts'o struct ext4_sb_info *sbi,
121033458eabSTheodore Ts'o int type)
121133458eabSTheodore Ts'o {
121233458eabSTheodore Ts'o return rcu_dereference_protected(sbi->s_qf_names[type],
121333458eabSTheodore Ts'o lockdep_is_held(&sb->s_umount));
121433458eabSTheodore Ts'o }
1215957153fcSJan Kara #else
/* !CONFIG_QUOTA variant: quota support is compiled out, so this is a no-op. */
static inline void ext4_quotas_off(struct super_block *sb, int type)
{
}
1219957153fcSJan Kara #endif
1220957153fcSJan Kara
ext4_percpu_param_init(struct ext4_sb_info * sbi)12211f79467cSJason Yan static int ext4_percpu_param_init(struct ext4_sb_info *sbi)
12221f79467cSJason Yan {
12231f79467cSJason Yan ext4_fsblk_t block;
12241f79467cSJason Yan int err;
12251f79467cSJason Yan
12261f79467cSJason Yan block = ext4_count_free_clusters(sbi->s_sb);
12271f79467cSJason Yan ext4_free_blocks_count_set(sbi->s_es, EXT4_C2B(sbi, block));
12281f79467cSJason Yan err = percpu_counter_init(&sbi->s_freeclusters_counter, block,
12291f79467cSJason Yan GFP_KERNEL);
12301f79467cSJason Yan if (!err) {
12311f79467cSJason Yan unsigned long freei = ext4_count_free_inodes(sbi->s_sb);
12321f79467cSJason Yan sbi->s_es->s_free_inodes_count = cpu_to_le32(freei);
12331f79467cSJason Yan err = percpu_counter_init(&sbi->s_freeinodes_counter, freei,
12341f79467cSJason Yan GFP_KERNEL);
12351f79467cSJason Yan }
12361f79467cSJason Yan if (!err)
12371f79467cSJason Yan err = percpu_counter_init(&sbi->s_dirs_counter,
12381f79467cSJason Yan ext4_count_dirs(sbi->s_sb), GFP_KERNEL);
12391f79467cSJason Yan if (!err)
12401f79467cSJason Yan err = percpu_counter_init(&sbi->s_dirtyclusters_counter, 0,
12411f79467cSJason Yan GFP_KERNEL);
12421f79467cSJason Yan if (!err)
12431f79467cSJason Yan err = percpu_counter_init(&sbi->s_sra_exceeded_retry_limit, 0,
12441f79467cSJason Yan GFP_KERNEL);
12451f79467cSJason Yan if (!err)
12461f79467cSJason Yan err = percpu_init_rwsem(&sbi->s_writepages_rwsem);
12471f79467cSJason Yan
12481f79467cSJason Yan if (err)
12491f79467cSJason Yan ext4_msg(sbi->s_sb, KERN_ERR, "insufficient memory");
12501f79467cSJason Yan
12511f79467cSJason Yan return err;
12521f79467cSJason Yan }
12531f79467cSJason Yan
ext4_percpu_param_destroy(struct ext4_sb_info * sbi)12541f79467cSJason Yan static void ext4_percpu_param_destroy(struct ext4_sb_info *sbi)
12551f79467cSJason Yan {
12561f79467cSJason Yan percpu_counter_destroy(&sbi->s_freeclusters_counter);
12571f79467cSJason Yan percpu_counter_destroy(&sbi->s_freeinodes_counter);
12581f79467cSJason Yan percpu_counter_destroy(&sbi->s_dirs_counter);
12591f79467cSJason Yan percpu_counter_destroy(&sbi->s_dirtyclusters_counter);
12601f79467cSJason Yan percpu_counter_destroy(&sbi->s_sra_exceeded_retry_limit);
12611f79467cSJason Yan percpu_free_rwsem(&sbi->s_writepages_rwsem);
12621f79467cSJason Yan }
12631f79467cSJason Yan
ext4_group_desc_free(struct ext4_sb_info * sbi)12646ef68498SJason Yan static void ext4_group_desc_free(struct ext4_sb_info *sbi)
12656ef68498SJason Yan {
12666ef68498SJason Yan struct buffer_head **group_desc;
12676ef68498SJason Yan int i;
12686ef68498SJason Yan
12696ef68498SJason Yan rcu_read_lock();
12706ef68498SJason Yan group_desc = rcu_dereference(sbi->s_group_desc);
12716ef68498SJason Yan for (i = 0; i < sbi->s_gdb_count; i++)
12726ef68498SJason Yan brelse(group_desc[i]);
12736ef68498SJason Yan kvfree(group_desc);
12746ef68498SJason Yan rcu_read_unlock();
12756ef68498SJason Yan }
12766ef68498SJason Yan
ext4_flex_groups_free(struct ext4_sb_info * sbi)1277dcbf8758SJason Yan static void ext4_flex_groups_free(struct ext4_sb_info *sbi)
1278dcbf8758SJason Yan {
1279dcbf8758SJason Yan struct flex_groups **flex_groups;
1280dcbf8758SJason Yan int i;
1281dcbf8758SJason Yan
1282dcbf8758SJason Yan rcu_read_lock();
1283dcbf8758SJason Yan flex_groups = rcu_dereference(sbi->s_flex_groups);
1284dcbf8758SJason Yan if (flex_groups) {
1285dcbf8758SJason Yan for (i = 0; i < sbi->s_flex_groups_allocated; i++)
1286dcbf8758SJason Yan kvfree(flex_groups[i]);
1287dcbf8758SJason Yan kvfree(flex_groups);
1288dcbf8758SJason Yan }
1289dcbf8758SJason Yan rcu_read_unlock();
1290dcbf8758SJason Yan }
1291dcbf8758SJason Yan
/*
 * Tear down an ext4 superblock; installed as the .put_super callback in
 * ext4_sops.
 *
 * The order of the steps below matters (see the individual comments).  In
 * outline: stop everything that can still reach the filesystem (sysfs, lazy
 * init request, quotas, pending superblock-update work), destroy the journal,
 * release the in-memory allocator/extent state, write the superblock one last
 * time if the filesystem is writable, free the remaining per-sb structures,
 * flush and invalidate the block device(s), and finally free @sbi itself.
 */
static void ext4_put_super(struct super_block *sb)
{
	struct ext4_sb_info *sbi = EXT4_SB(sb);
	struct ext4_super_block *es = sbi->s_es;
	int aborted = 0;
	int err;

	/*
	 * Unregister sysfs before destroying the jbd2 journal: the
	 * attr_journal_task attribute could otherwise still be read through
	 * sysfs while sbi->s_journal->j_task is NULL.
	 *
	 * Unregister sysfs before flushing sbi->s_sb_upd_work as well: a
	 * user may read /proc/fs/ext4/xx/mb_groups during umount, and if
	 * metadata verification fails on that read, error work gets queued.
	 * update_super_work would then call start_this_handle, which may
	 * trigger a BUG_ON.
	 */
	ext4_unregister_sysfs(sb);

	if (___ratelimit(&ext4_mount_msg_ratelimit, "EXT4-fs unmount"))
		ext4_msg(sb, KERN_INFO, "unmounting filesystem %pU.",
			 &sb->s_uuid);

	ext4_unregister_li_request(sb);
	ext4_quotas_off(sb, EXT4_MAXQUOTAS);

	flush_work(&sbi->s_sb_upd_work);
	destroy_workqueue(sbi->rsv_conversion_wq);
	ext4_release_orphan_info(sb);

	if (sbi->s_journal) {
		/* Sample the abort state before the journal goes away. */
		aborted = is_journal_aborted(sbi->s_journal);
		err = jbd2_journal_destroy(sbi->s_journal);
		sbi->s_journal = NULL;
		/* Only report a failed shutdown of a journal that was healthy. */
		if ((err < 0) && !aborted) {
			ext4_abort(sb, -err, "Couldn't clean up the journal");
		}
	}

	ext4_es_unregister_shrinker(sbi);
	timer_shutdown_sync(&sbi->s_err_report);
	ext4_release_system_zone(sb);
	ext4_mb_release(sb);
	ext4_ext_release(sb);

	/*
	 * On a writable filesystem whose journal was not aborted, clear the
	 * "needs recovery" and "orphan present" features and record the
	 * current mount state in the superblock.
	 */
	if (!sb_rdonly(sb) && !aborted) {
		ext4_clear_feature_journal_needs_recovery(sb);
		ext4_clear_feature_orphan_present(sb);
		es->s_state = cpu_to_le16(sbi->s_mount_state);
	}
	/* The superblock is committed on any writable fs, aborted or not. */
	if (!sb_rdonly(sb))
		ext4_commit_super(sb);

	ext4_group_desc_free(sbi);
	ext4_flex_groups_free(sbi);
	ext4_percpu_param_destroy(sbi);
#ifdef CONFIG_QUOTA
	for (int i = 0; i < EXT4_MAXQUOTAS; i++)
		kfree(get_qf_name(sb, sbi, i));
#endif

	/*
	 * Debugging code just in case the in-memory inode orphan list
	 * isn't empty.  The on-disk one can be non-empty if we've
	 * detected an error and taken the fs readonly, but the
	 * in-memory list had better be clean by this point.
	 */
	if (!list_empty(&sbi->s_orphan))
		dump_orphan_list(sb, sbi);
	ASSERT(list_empty(&sbi->s_orphan));

	sync_blockdev(sb->s_bdev);
	invalidate_bdev(sb->s_bdev);
	if (sbi->s_journal_bdev) {
		/*
		 * Invalidate the journal device's buffers.  We don't want them
		 * floating about in memory - the physical journal device may
		 * be hotswapped, and it breaks the `ro-after' testing code.
		 */
		sync_blockdev(sbi->s_journal_bdev);
		invalidate_bdev(sbi->s_journal_bdev);
	}

	ext4_xattr_destroy_cache(sbi->s_ea_inode_cache);
	sbi->s_ea_inode_cache = NULL;

	ext4_xattr_destroy_cache(sbi->s_ea_block_cache);
	sbi->s_ea_block_cache = NULL;

	ext4_stop_mmpd(sbi);

	brelse(sbi->s_sbh);
	sb->s_fs_info = NULL;
	/*
	 * Now that we are completely done shutting down the
	 * superblock, we need to actually destroy the kobject.
	 */
	kobject_put(&sbi->s_kobj);
	/* sbi embeds the kobject, so wait for its release before freeing sbi. */
	wait_for_completion(&sbi->s_kobj_unregister);
	if (sbi->s_chksum_driver)
		crypto_free_shash(sbi->s_chksum_driver);
	kfree(sbi->s_blockgroup_lock);
	fs_put_dax(sbi->s_daxdev, NULL);
	fscrypt_free_dummy_policy(&sbi->s_dummy_enc_policy);
#if IS_ENABLED(CONFIG_UNICODE)
	utf8_unload(sb->s_encoding);
#endif
	kfree(sbi);
}
1399ac27a0ecSDave Kleikamp
/*
 * Slab cache from which struct ext4_inode_info objects are allocated.
 * Created by init_inodecache() and destroyed by destroy_inodecache().
 */
static struct kmem_cache *ext4_inode_cachep;
1401ac27a0ecSDave Kleikamp
/*
 * Allocate an ext4 in-core inode and return its embedded VFS inode, or NULL
 * if the allocation fails.  Installed as .alloc_inode in ext4_sops.
 *
 * Called inside transaction, so use GFP_NOFS.
 *
 * Only the fields listed here are reset for each allocation; i_orphan,
 * xattr_sem, i_data_sem and the VFS inode itself are set up by init_once(),
 * the cache constructor.
 */
static struct inode *ext4_alloc_inode(struct super_block *sb)
{
	struct ext4_inode_info *ei;

	ei = alloc_inode_sb(sb, ext4_inode_cachep, GFP_NOFS);
	if (!ei)
		return NULL;

	inode_set_iversion(&ei->vfs_inode, 1);
	ei->i_flags = 0;
	spin_lock_init(&ei->i_raw_lock);
	/* Preallocation bookkeeping starts out empty. */
	ei->i_prealloc_node = RB_ROOT;
	atomic_set(&ei->i_prealloc_active, 0);
	rwlock_init(&ei->i_prealloc_lock);
	/* Extent status tree and its counters. */
	ext4_es_init_tree(&ei->i_es_tree);
	rwlock_init(&ei->i_es_lock);
	INIT_LIST_HEAD(&ei->i_es_list);
	ei->i_es_all_nr = 0;
	ei->i_es_shk_nr = 0;
	ei->i_es_shrink_lblk = 0;
	/* Block reservation state. */
	ei->i_reserved_data_blocks = 0;
	spin_lock_init(&(ei->i_block_reservation_lock));
	ext4_init_pending_tree(&ei->i_pending_tree);
#ifdef CONFIG_QUOTA
	ei->i_reserved_quota = 0;
	memset(&ei->i_dquot, 0, sizeof(ei->i_dquot));
#endif
	/* No jbd2 inode attached yet; ext4_clear_inode() frees one if set. */
	ei->jinode = NULL;
	INIT_LIST_HEAD(&ei->i_rsv_conversion_list);
	spin_lock_init(&ei->i_completed_io_lock);
	ei->i_sync_tid = 0;
	ei->i_datasync_tid = 0;
	atomic_set(&ei->i_unwritten, 0);
	INIT_WORK(&ei->i_rsv_conversion_work, ext4_end_io_rsv_work);
	/* Fast-commit state. */
	ext4_fc_init_inode(&ei->vfs_inode);
	mutex_init(&ei->i_fc_lock);
	return &ei->vfs_inode;
}
1443ac27a0ecSDave Kleikamp
/*
 * Decide whether @inode should be dropped; installed as .drop_inode in
 * ext4_sops.  The generic VFS answer is used when it is non-zero, otherwise
 * fscrypt is consulted.  The decision is traced and returned.
 */
static int ext4_drop_inode(struct inode *inode)
{
	int drop;

	drop = generic_drop_inode(inode);
	if (drop == 0)
		drop = fscrypt_drop_inode(inode);

	trace_ext4_drop_inode(inode, drop);
	return drop;
}
14547ff9c073STheodore Ts'o
ext4_free_in_core_inode(struct inode * inode)145594053139SAl Viro static void ext4_free_in_core_inode(struct inode *inode)
1456fa0d7e3dSNick Piggin {
14572c58d548SEric Biggers fscrypt_free_inode(inode);
1458aa75f4d3SHarshad Shirwadkar if (!list_empty(&(EXT4_I(inode)->i_fc_list))) {
1459aa75f4d3SHarshad Shirwadkar pr_warn("%s: inode %ld still in fc list",
1460aa75f4d3SHarshad Shirwadkar __func__, inode->i_ino);
1461aa75f4d3SHarshad Shirwadkar }
1462fa0d7e3dSNick Piggin kmem_cache_free(ext4_inode_cachep, EXT4_I(inode));
1463fa0d7e3dSNick Piggin }
1464fa0d7e3dSNick Piggin
ext4_destroy_inode(struct inode * inode)1465617ba13bSMingming Cao static void ext4_destroy_inode(struct inode *inode)
1466ac27a0ecSDave Kleikamp {
14679f7dd93dSVasily Averin if (!list_empty(&(EXT4_I(inode)->i_orphan))) {
1468b31e1552SEric Sandeen ext4_msg(inode->i_sb, KERN_ERR,
1469b31e1552SEric Sandeen "Inode %lu (%p): orphan list check failed!",
1470b31e1552SEric Sandeen inode->i_ino, EXT4_I(inode));
14719f7dd93dSVasily Averin print_hex_dump(KERN_INFO, "", DUMP_PREFIX_ADDRESS, 16, 4,
14729f7dd93dSVasily Averin EXT4_I(inode), sizeof(struct ext4_inode_info),
14739f7dd93dSVasily Averin true);
14749f7dd93dSVasily Averin dump_stack();
14759f7dd93dSVasily Averin }
14766fed8395SJeffle Xu
14776fed8395SJeffle Xu if (EXT4_I(inode)->i_reserved_data_blocks)
14786fed8395SJeffle Xu ext4_msg(inode->i_sb, KERN_ERR,
14796fed8395SJeffle Xu "Inode %lu (%p): i_reserved_data_blocks (%u) not cleared!",
14806fed8395SJeffle Xu inode->i_ino, EXT4_I(inode),
14816fed8395SJeffle Xu EXT4_I(inode)->i_reserved_data_blocks);
1482ac27a0ecSDave Kleikamp }
1483ac27a0ecSDave Kleikamp
/*
 * .shutdown callback in ext4_sops: force the filesystem down via
 * ext4_force_shutdown() with the EXT4_GOING_FLAGS_NOLOGFLUSH mode.
 */
static void ext4_shutdown(struct super_block *sb)
{
	ext4_force_shutdown(sb, EXT4_GOING_FLAGS_NOLOGFLUSH);
}
1488f5db130dSChristoph Hellwig
/*
 * Constructor callback handed to kmem_cache_create_usercopy() for
 * ext4_inode_cachep (see init_inodecache()).  @foo points at a
 * struct ext4_inode_info.
 *
 * It sets up the parts of the object that ext4_alloc_inode() does not
 * re-initialise: the orphan list node, xattr_sem, i_data_sem and the
 * embedded VFS inode, plus the fast-commit state.
 */
static void init_once(void *foo)
{
	struct ext4_inode_info *ei = foo;

	INIT_LIST_HEAD(&ei->i_orphan);
	init_rwsem(&ei->xattr_sem);
	init_rwsem(&ei->i_data_sem);
	inode_init_once(&ei->vfs_inode);
	ext4_fc_init_inode(&ei->vfs_inode);
}
1499ac27a0ecSDave Kleikamp
init_inodecache(void)1500e67bc2b3SFabian Frederick static int __init init_inodecache(void)
1501ac27a0ecSDave Kleikamp {
1502f8dd7c70SDavid Windsor ext4_inode_cachep = kmem_cache_create_usercopy("ext4_inode_cache",
1503f8dd7c70SDavid Windsor sizeof(struct ext4_inode_info), 0,
1504f8dd7c70SDavid Windsor (SLAB_RECLAIM_ACCOUNT|SLAB_MEM_SPREAD|
1505f8dd7c70SDavid Windsor SLAB_ACCOUNT),
1506f8dd7c70SDavid Windsor offsetof(struct ext4_inode_info, i_data),
1507f8dd7c70SDavid Windsor sizeof_field(struct ext4_inode_info, i_data),
150820c2df83SPaul Mundt init_once);
1509617ba13bSMingming Cao if (ext4_inode_cachep == NULL)
1510ac27a0ecSDave Kleikamp return -ENOMEM;
1511ac27a0ecSDave Kleikamp return 0;
1512ac27a0ecSDave Kleikamp }
1513ac27a0ecSDave Kleikamp
/* Destroy the ext4_inode_info slab cache created by init_inodecache(). */
static void destroy_inodecache(void)
{
	/*
	 * Make sure all delayed rcu free inodes are flushed before we
	 * destroy cache.
	 */
	rcu_barrier();
	kmem_cache_destroy(ext4_inode_cachep);
}
1523ac27a0ecSDave Kleikamp
ext4_clear_inode(struct inode * inode)15240930fcc1SAl Viro void ext4_clear_inode(struct inode *inode)
1525ac27a0ecSDave Kleikamp {
1526aa75f4d3SHarshad Shirwadkar ext4_fc_del(inode);
15270930fcc1SAl Viro invalidate_inode_buffers(inode);
1528dbd5768fSJan Kara clear_inode(inode);
152927bc446eSbrookxu ext4_discard_preallocations(inode, 0);
153051865fdaSZheng Liu ext4_es_remove_extent(inode, 0, EXT_MAX_BLOCKS);
1531f4c2d372SJan Kara dquot_drop(inode);
15328aefcd55STheodore Ts'o if (EXT4_I(inode)->jinode) {
15338aefcd55STheodore Ts'o jbd2_journal_release_jbd_inode(EXT4_JOURNAL(inode),
15348aefcd55STheodore Ts'o EXT4_I(inode)->jinode);
15358aefcd55STheodore Ts'o jbd2_free_inode(EXT4_I(inode)->jinode);
15368aefcd55STheodore Ts'o EXT4_I(inode)->jinode = NULL;
15378aefcd55STheodore Ts'o }
15383d204e24SEric Biggers fscrypt_put_encryption_info(inode);
1539c93d8f88SEric Biggers fsverity_cleanup_inode(inode);
1540ac27a0ecSDave Kleikamp }
1541ac27a0ecSDave Kleikamp
/*
 * Inode lookup callback used when decoding file handles (passed to
 * generic_fh_to_dentry() / generic_fh_to_parent() below).
 *
 * Returns the inode for @ino, the error from ext4_iget() if the lookup
 * fails, or ERR_PTR(-ESTALE) when @generation is non-zero and does not match
 * the inode's generation.
 */
static struct inode *ext4_nfs_get_inode(struct super_block *sb,
					u64 ino, u32 generation)
{
	struct inode *inode;

	inode = ext4_iget(sb, ino, EXT4_IGET_HANDLE);
	if (IS_ERR(inode))
		return ERR_CAST(inode);

	/*
	 * Currently we don't know the generation for parent directory, so
	 * a generation of 0 means "accept any"
	 */
	if (!generation || inode->i_generation == generation)
		return inode;

	iput(inode);
	return ERR_PTR(-ESTALE);
}
15611b961ac0SChristoph Hellwig
/*
 * .fh_to_dentry export operation: hand the file handle to
 * generic_fh_to_dentry(), with ext4_nfs_get_inode() as the inode lookup
 * callback.
 */
static struct dentry *ext4_fh_to_dentry(struct super_block *sb, struct fid *fid,
					int fh_len, int fh_type)
{
	return generic_fh_to_dentry(sb, fid, fh_len, fh_type,
				    ext4_nfs_get_inode);
}
15681b961ac0SChristoph Hellwig
/*
 * .fh_to_parent export operation: hand the file handle to
 * generic_fh_to_parent(), with ext4_nfs_get_inode() as the inode lookup
 * callback.
 */
static struct dentry *ext4_fh_to_parent(struct super_block *sb, struct fid *fid,
					int fh_len, int fh_type)
{
	return generic_fh_to_parent(sb, fid, fh_len, fh_type,
				    ext4_nfs_get_inode);
}
1575ac27a0ecSDave Kleikamp
ext4_nfs_commit_metadata(struct inode * inode)1576fde87268STheodore Ts'o static int ext4_nfs_commit_metadata(struct inode *inode)
1577fde87268STheodore Ts'o {
1578fde87268STheodore Ts'o struct writeback_control wbc = {
1579fde87268STheodore Ts'o .sync_mode = WB_SYNC_ALL
1580fde87268STheodore Ts'o };
1581fde87268STheodore Ts'o
1582fde87268STheodore Ts'o trace_ext4_nfs_commit_metadata(inode);
1583fde87268STheodore Ts'o return ext4_write_inode(inode, &wbc);
1584fde87268STheodore Ts'o }
1585fde87268STheodore Ts'o
1586ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
/* Quota type names, indexed by quota type; QTYPE2NAME() looks one up. */
static const char * const quotatypes[] = INITQFNAMES;
#define QTYPE2NAME(t) (quotatypes[t])

/*
 * Forward declarations of the quota callbacks defined later in this file;
 * they are needed by the operation tables below.
 */
static int ext4_write_dquot(struct dquot *dquot);
static int ext4_acquire_dquot(struct dquot *dquot);
static int ext4_release_dquot(struct dquot *dquot);
static int ext4_mark_dquot_dirty(struct dquot *dquot);
static int ext4_write_info(struct super_block *sb, int type);
static int ext4_quota_on(struct super_block *sb, int type, int format_id,
			 const struct path *path);
static ssize_t ext4_quota_read(struct super_block *sb, int type, char *data,
			       size_t len, loff_t off);
static ssize_t ext4_quota_write(struct super_block *sb, int type,
				const char *data, size_t len, loff_t off);
static int ext4_quota_enable(struct super_block *sb, int type, int format_id,
			     unsigned int flags);
1603ac27a0ecSDave Kleikamp
/* .get_dquots callback in ext4_sops: return the inode's i_dquot array. */
static struct dquot __rcu **ext4_get_dquots(struct inode *inode)
{
	return EXT4_I(inode)->i_dquot;
}
160896c7e0d9SJan Kara
/*
 * dquot operations for ext4.  The ext4_* entries are ext4's own
 * implementations; alloc/destroy/get_next_id use the generic dquot_* helpers.
 */
static const struct dquot_operations ext4_quota_operations = {
	.get_reserved_space	= ext4_get_reserved_space,
	.write_dquot		= ext4_write_dquot,
	.acquire_dquot		= ext4_acquire_dquot,
	.release_dquot		= ext4_release_dquot,
	.mark_dirty		= ext4_mark_dquot_dirty,
	.write_info		= ext4_write_info,
	.alloc_dquot		= dquot_alloc,
	.destroy_dquot		= dquot_destroy,
	.get_projid		= ext4_get_projid,
	.get_inode_usage	= ext4_get_inode_usage,
	.get_next_id		= dquot_get_next_id,
};
1622ac27a0ecSDave Kleikamp
/*
 * quotactl operations for ext4.  Only quota_on/quota_off are ext4-specific;
 * every other entry is the generic dquot_* implementation.
 */
static const struct quotactl_ops ext4_qctl_operations = {
	.quota_on	= ext4_quota_on,
	.quota_off	= ext4_quota_off,
	.quota_sync	= dquot_quota_sync,
	.get_state	= dquot_get_state,
	.set_info	= dquot_set_dqinfo,
	.get_dqblk	= dquot_get_dqblk,
	.set_dqblk	= dquot_set_dqblk,
	.get_nextdqblk	= dquot_get_next_dqblk,
};
1633ac27a0ecSDave Kleikamp #endif
1634ac27a0ecSDave Kleikamp
/*
 * Superblock operations for ext4.  The quota read/write/get_dquots hooks are
 * only present when CONFIG_QUOTA is enabled.
 */
static const struct super_operations ext4_sops = {
	.alloc_inode	= ext4_alloc_inode,
	.free_inode	= ext4_free_in_core_inode,
	.destroy_inode	= ext4_destroy_inode,
	.write_inode	= ext4_write_inode,
	.dirty_inode	= ext4_dirty_inode,
	.drop_inode	= ext4_drop_inode,
	.evict_inode	= ext4_evict_inode,
	.put_super	= ext4_put_super,
	.sync_fs	= ext4_sync_fs,
	.freeze_fs	= ext4_freeze,
	.unfreeze_fs	= ext4_unfreeze,
	.statfs		= ext4_statfs,
	.show_options	= ext4_show_options,
	.shutdown	= ext4_shutdown,
#ifdef CONFIG_QUOTA
	.quota_read	= ext4_quota_read,
	.quota_write	= ext4_quota_write,
	.get_dquots	= ext4_get_dquots,
#endif
};
1656ac27a0ecSDave Kleikamp
/* Export operations for ext4: file-handle decoding and metadata commit. */
static const struct export_operations ext4_export_ops = {
	.fh_to_dentry = ext4_fh_to_dentry,
	.fh_to_parent = ext4_fh_to_parent,
	.get_parent = ext4_get_parent,
	.commit_metadata = ext4_nfs_commit_metadata,
};
1663ac27a0ecSDave Kleikamp
/*
 * Identifiers for the mount options ext4 knows about.  Some of them
 * (Opt_data_err_*, Opt_dax_*) also serve as the values in the constant
 * tables that follow.  The Opt_fc_debug_* identifiers only exist when
 * CONFIG_EXT4_DEBUG is enabled.
 */
enum {
	Opt_bsd_df, Opt_minix_df, Opt_grpid, Opt_nogrpid,
	Opt_resgid, Opt_resuid, Opt_sb,
	Opt_nouid32, Opt_debug, Opt_removed,
	Opt_user_xattr, Opt_acl,
	Opt_auto_da_alloc, Opt_noauto_da_alloc, Opt_noload,
	Opt_commit, Opt_min_batch_time, Opt_max_batch_time, Opt_journal_dev,
	Opt_journal_path, Opt_journal_checksum, Opt_journal_async_commit,
	Opt_abort, Opt_data_journal, Opt_data_ordered, Opt_data_writeback,
	Opt_data_err_abort, Opt_data_err_ignore, Opt_test_dummy_encryption,
	Opt_inlinecrypt,
	Opt_usrjquota, Opt_grpjquota, Opt_quota,
	Opt_noquota, Opt_barrier, Opt_nobarrier, Opt_err,
	Opt_usrquota, Opt_grpquota, Opt_prjquota,
	Opt_dax, Opt_dax_always, Opt_dax_inode, Opt_dax_never,
	Opt_stripe, Opt_delalloc, Opt_nodelalloc, Opt_warn_on_error,
	Opt_nowarn_on_error, Opt_mblk_io_submit, Opt_debug_want_extra_isize,
	Opt_nomblk_io_submit, Opt_block_validity, Opt_noblock_validity,
	Opt_inode_readahead_blks, Opt_journal_ioprio,
	Opt_dioread_nolock, Opt_dioread_lock,
	Opt_discard, Opt_nodiscard, Opt_init_itable, Opt_noinit_itable,
	Opt_max_dir_size_kb, Opt_nojournal_checksum, Opt_nombcache,
	Opt_no_prefetch_block_bitmaps, Opt_mb_optimize_scan,
	Opt_errors, Opt_data, Opt_data_err, Opt_jqfmt, Opt_dax_type,
#ifdef CONFIG_EXT4_DEBUG
	Opt_fc_debug_max_replay, Opt_fc_debug_force
#endif
};
1692ac27a0ecSDave Kleikamp
1693e5a185c2SLukas Czerner static const struct constant_table ext4_param_errors[] = {
1694ba2e524dSLukas Czerner {"continue", EXT4_MOUNT_ERRORS_CONT},
1695ba2e524dSLukas Czerner {"panic", EXT4_MOUNT_ERRORS_PANIC},
1696ba2e524dSLukas Czerner {"remount-ro", EXT4_MOUNT_ERRORS_RO},
1697e5a185c2SLukas Czerner {}
1698e5a185c2SLukas Czerner };
1699e5a185c2SLukas Czerner
1700e5a185c2SLukas Czerner static const struct constant_table ext4_param_data[] = {
1701ba2e524dSLukas Czerner {"journal", EXT4_MOUNT_JOURNAL_DATA},
1702ba2e524dSLukas Czerner {"ordered", EXT4_MOUNT_ORDERED_DATA},
1703ba2e524dSLukas Czerner {"writeback", EXT4_MOUNT_WRITEBACK_DATA},
1704e5a185c2SLukas Czerner {}
1705e5a185c2SLukas Czerner };
1706e5a185c2SLukas Czerner
1707e5a185c2SLukas Czerner static const struct constant_table ext4_param_data_err[] = {
1708e5a185c2SLukas Czerner {"abort", Opt_data_err_abort},
1709e5a185c2SLukas Czerner {"ignore", Opt_data_err_ignore},
1710e5a185c2SLukas Czerner {}
1711e5a185c2SLukas Czerner };
1712e5a185c2SLukas Czerner
1713e5a185c2SLukas Czerner static const struct constant_table ext4_param_jqfmt[] = {
1714ba2e524dSLukas Czerner {"vfsold", QFMT_VFS_OLD},
1715ba2e524dSLukas Czerner {"vfsv0", QFMT_VFS_V0},
1716ba2e524dSLukas Czerner {"vfsv1", QFMT_VFS_V1},
1717e5a185c2SLukas Czerner {}
1718e5a185c2SLukas Czerner };
1719e5a185c2SLukas Czerner
1720e5a185c2SLukas Czerner static const struct constant_table ext4_param_dax[] = {
1721e5a185c2SLukas Czerner {"always", Opt_dax_always},
1722e5a185c2SLukas Czerner {"inode", Opt_dax_inode},
1723e5a185c2SLukas Czerner {"never", Opt_dax_never},
1724e5a185c2SLukas Czerner {}
1725e5a185c2SLukas Czerner };
1726e5a185c2SLukas Czerner
/*
 * Like a plain string parameter, but flagged fs_param_can_be_empty so
 * that an empty argument is accepted as well.
 */
#define fsparam_string_empty(NAME, OPT)					\
	__fsparam(fs_param_is_string, NAME, OPT,			\
		  fs_param_can_be_empty, NULL)
1730e5a185c2SLukas Czerner
1731e5a185c2SLukas Czerner /*
1732e5a185c2SLukas Czerner * Mount option specification
1733e5a185c2SLukas Czerner * We don't use fsparam_flag_no because of the way we set the
1734e5a185c2SLukas Czerner * options and the way we show them in _ext4_show_options(). To
1735e5a185c2SLukas Czerner * keep the changes to a minimum, let's keep the negative options
1736e5a185c2SLukas Czerner * separate for now.
1737e5a185c2SLukas Czerner */
1738e5a185c2SLukas Czerner static const struct fs_parameter_spec ext4_param_specs[] = {
1739e5a185c2SLukas Czerner fsparam_flag ("bsddf", Opt_bsd_df),
1740e5a185c2SLukas Czerner fsparam_flag ("minixdf", Opt_minix_df),
1741e5a185c2SLukas Czerner fsparam_flag ("grpid", Opt_grpid),
1742e5a185c2SLukas Czerner fsparam_flag ("bsdgroups", Opt_grpid),
1743e5a185c2SLukas Czerner fsparam_flag ("nogrpid", Opt_nogrpid),
1744e5a185c2SLukas Czerner fsparam_flag ("sysvgroups", Opt_nogrpid),
1745e5a185c2SLukas Czerner fsparam_u32 ("resgid", Opt_resgid),
1746e5a185c2SLukas Czerner fsparam_u32 ("resuid", Opt_resuid),
1747e5a185c2SLukas Czerner fsparam_u32 ("sb", Opt_sb),
1748e5a185c2SLukas Czerner fsparam_enum ("errors", Opt_errors, ext4_param_errors),
1749e5a185c2SLukas Czerner fsparam_flag ("nouid32", Opt_nouid32),
1750e5a185c2SLukas Czerner fsparam_flag ("debug", Opt_debug),
1751e5a185c2SLukas Czerner fsparam_flag ("oldalloc", Opt_removed),
1752e5a185c2SLukas Czerner fsparam_flag ("orlov", Opt_removed),
1753e5a185c2SLukas Czerner fsparam_flag ("user_xattr", Opt_user_xattr),
1754e5a185c2SLukas Czerner fsparam_flag ("acl", Opt_acl),
1755e5a185c2SLukas Czerner fsparam_flag ("norecovery", Opt_noload),
1756e5a185c2SLukas Czerner fsparam_flag ("noload", Opt_noload),
1757e5a185c2SLukas Czerner fsparam_flag ("bh", Opt_removed),
1758e5a185c2SLukas Czerner fsparam_flag ("nobh", Opt_removed),
1759e5a185c2SLukas Czerner fsparam_u32 ("commit", Opt_commit),
1760e5a185c2SLukas Czerner fsparam_u32 ("min_batch_time", Opt_min_batch_time),
1761e5a185c2SLukas Czerner fsparam_u32 ("max_batch_time", Opt_max_batch_time),
1762e5a185c2SLukas Czerner fsparam_u32 ("journal_dev", Opt_journal_dev),
1763e5a185c2SLukas Czerner fsparam_bdev ("journal_path", Opt_journal_path),
1764e5a185c2SLukas Czerner fsparam_flag ("journal_checksum", Opt_journal_checksum),
1765e5a185c2SLukas Czerner fsparam_flag ("nojournal_checksum", Opt_nojournal_checksum),
1766e5a185c2SLukas Czerner fsparam_flag ("journal_async_commit",Opt_journal_async_commit),
1767e5a185c2SLukas Czerner fsparam_flag ("abort", Opt_abort),
1768e5a185c2SLukas Czerner fsparam_enum ("data", Opt_data, ext4_param_data),
1769e5a185c2SLukas Czerner fsparam_enum ("data_err", Opt_data_err,
1770e5a185c2SLukas Czerner ext4_param_data_err),
1771e5a185c2SLukas Czerner fsparam_string_empty
1772e5a185c2SLukas Czerner ("usrjquota", Opt_usrjquota),
1773e5a185c2SLukas Czerner fsparam_string_empty
1774e5a185c2SLukas Czerner ("grpjquota", Opt_grpjquota),
1775e5a185c2SLukas Czerner fsparam_enum ("jqfmt", Opt_jqfmt, ext4_param_jqfmt),
1776e5a185c2SLukas Czerner fsparam_flag ("grpquota", Opt_grpquota),
1777e5a185c2SLukas Czerner fsparam_flag ("quota", Opt_quota),
1778e5a185c2SLukas Czerner fsparam_flag ("noquota", Opt_noquota),
1779e5a185c2SLukas Czerner fsparam_flag ("usrquota", Opt_usrquota),
1780e5a185c2SLukas Czerner fsparam_flag ("prjquota", Opt_prjquota),
1781e5a185c2SLukas Czerner fsparam_flag ("barrier", Opt_barrier),
1782e5a185c2SLukas Czerner fsparam_u32 ("barrier", Opt_barrier),
1783e5a185c2SLukas Czerner fsparam_flag ("nobarrier", Opt_nobarrier),
17841ff20307SJeff Layton fsparam_flag ("i_version", Opt_removed),
1785e5a185c2SLukas Czerner fsparam_flag ("dax", Opt_dax),
1786e5a185c2SLukas Czerner fsparam_enum ("dax", Opt_dax_type, ext4_param_dax),
1787e5a185c2SLukas Czerner fsparam_u32 ("stripe", Opt_stripe),
1788e5a185c2SLukas Czerner fsparam_flag ("delalloc", Opt_delalloc),
1789e5a185c2SLukas Czerner fsparam_flag ("nodelalloc", Opt_nodelalloc),
1790e5a185c2SLukas Czerner fsparam_flag ("warn_on_error", Opt_warn_on_error),
1791e5a185c2SLukas Czerner fsparam_flag ("nowarn_on_error", Opt_nowarn_on_error),
1792e5a185c2SLukas Czerner fsparam_u32 ("debug_want_extra_isize",
1793e5a185c2SLukas Czerner Opt_debug_want_extra_isize),
1794e5a185c2SLukas Czerner fsparam_flag ("mblk_io_submit", Opt_removed),
1795e5a185c2SLukas Czerner fsparam_flag ("nomblk_io_submit", Opt_removed),
1796e5a185c2SLukas Czerner fsparam_flag ("block_validity", Opt_block_validity),
1797e5a185c2SLukas Czerner fsparam_flag ("noblock_validity", Opt_noblock_validity),
1798e5a185c2SLukas Czerner fsparam_u32 ("inode_readahead_blks",
1799e5a185c2SLukas Czerner Opt_inode_readahead_blks),
1800e5a185c2SLukas Czerner fsparam_u32 ("journal_ioprio", Opt_journal_ioprio),
1801e5a185c2SLukas Czerner fsparam_u32 ("auto_da_alloc", Opt_auto_da_alloc),
1802e5a185c2SLukas Czerner fsparam_flag ("auto_da_alloc", Opt_auto_da_alloc),
1803e5a185c2SLukas Czerner fsparam_flag ("noauto_da_alloc", Opt_noauto_da_alloc),
1804e5a185c2SLukas Czerner fsparam_flag ("dioread_nolock", Opt_dioread_nolock),
1805e5a185c2SLukas Czerner fsparam_flag ("nodioread_nolock", Opt_dioread_lock),
1806e5a185c2SLukas Czerner fsparam_flag ("dioread_lock", Opt_dioread_lock),
1807e5a185c2SLukas Czerner fsparam_flag ("discard", Opt_discard),
1808e5a185c2SLukas Czerner fsparam_flag ("nodiscard", Opt_nodiscard),
1809e5a185c2SLukas Czerner fsparam_u32 ("init_itable", Opt_init_itable),
1810e5a185c2SLukas Czerner fsparam_flag ("init_itable", Opt_init_itable),
1811e5a185c2SLukas Czerner fsparam_flag ("noinit_itable", Opt_noinit_itable),
1812e5a185c2SLukas Czerner #ifdef CONFIG_EXT4_DEBUG
1813e5a185c2SLukas Czerner fsparam_flag ("fc_debug_force", Opt_fc_debug_force),
1814e5a185c2SLukas Czerner fsparam_u32 ("fc_debug_max_replay", Opt_fc_debug_max_replay),
1815e5a185c2SLukas Czerner #endif
1816e5a185c2SLukas Czerner fsparam_u32 ("max_dir_size_kb", Opt_max_dir_size_kb),
1817e5a185c2SLukas Czerner fsparam_flag ("test_dummy_encryption",
1818e5a185c2SLukas Czerner Opt_test_dummy_encryption),
1819e5a185c2SLukas Czerner fsparam_string ("test_dummy_encryption",
1820e5a185c2SLukas Czerner Opt_test_dummy_encryption),
1821e5a185c2SLukas Czerner fsparam_flag ("inlinecrypt", Opt_inlinecrypt),
1822e5a185c2SLukas Czerner fsparam_flag ("nombcache", Opt_nombcache),
1823e5a185c2SLukas Czerner fsparam_flag ("no_mbcache", Opt_nombcache), /* for backward compatibility */
1824e5a185c2SLukas Czerner fsparam_flag ("prefetch_block_bitmaps",
1825e5a185c2SLukas Czerner Opt_removed),
1826e5a185c2SLukas Czerner fsparam_flag ("no_prefetch_block_bitmaps",
1827e5a185c2SLukas Czerner Opt_no_prefetch_block_bitmaps),
1828e5a185c2SLukas Czerner fsparam_s32 ("mb_optimize_scan", Opt_mb_optimize_scan),
1829e5a185c2SLukas Czerner fsparam_string ("check", Opt_removed), /* mount option from ext2/3 */
1830e5a185c2SLukas Czerner fsparam_flag ("nocheck", Opt_removed), /* mount option from ext2/3 */
1831e5a185c2SLukas Czerner fsparam_flag ("reservation", Opt_removed), /* mount option from ext2/3 */
1832e5a185c2SLukas Czerner fsparam_flag ("noreservation", Opt_removed), /* mount option from ext2/3 */
1833e5a185c2SLukas Czerner fsparam_u32 ("journal", Opt_removed), /* mount option from ext2/3 */
1834e5a185c2SLukas Czerner {}
1835e5a185c2SLukas Czerner };
1836e5a185c2SLukas Czerner
/* Default journal I/O priority: class IOPRIO_CLASS_BE, priority data 3 */
#define DEFAULT_JOURNAL_IOPRIO \
	(IOPRIO_PRIO_VALUE(IOPRIO_CLASS_BE, 3))
1838196e402aSHarshad Shirwadkar
/*
 * Per-option behaviour flags stored in the 'flags' member of
 * ext4_mount_opts and accumulated into ext4_fs_context::opt_flags by
 * ext4_parse_param().
 *
 * MOPT_EXPLICIT   - ext4_parse_param() additionally records an
 *                   EXT4_MOUNT2_EXPLICIT_* bit for the option.
 * MOPT_NOSUPPORT  - ext4_parse_param() logs "<key> option not
 *                   supported" and returns 0 without applying it.
 * MOPT_Q/MOPT_QFMT - quota options; both collapse to MOPT_NOSUPPORT
 *                   when CONFIG_QUOTA is not set.
 * MOPT_2          - used on entries whose mount_opt is an EXT4_MOUNT2_*
 *                   bit (presumably selects s_mount_opt2; the consumer
 *                   is outside this excerpt).
 *
 * NOTE(review): MOPT_SET/MOPT_CLEAR presumably mean "set/clear the
 * mount_opt bits", and MOPT_NO_EXT2/MOPT_NO_EXT3 presumably reject the
 * option for ext2/ext3 mounts; the code that interprets them (and
 * MOPT_SKIP) is not visible here - confirm against the parser.
 */
#define MOPT_SET	(1 << 0)
#define MOPT_CLEAR	(1 << 1)
#define MOPT_NOSUPPORT	(1 << 2)
#define MOPT_EXPLICIT	(1 << 3)
#ifdef CONFIG_QUOTA
#define MOPT_Q		0
#define MOPT_QFMT	(1 << 4)
#else
#define MOPT_Q		MOPT_NOSUPPORT
#define MOPT_QFMT	MOPT_NOSUPPORT
#endif
#define MOPT_NO_EXT2	(1 << 5)
#define MOPT_NO_EXT3	(1 << 6)
#define MOPT_EXT4_ONLY	(MOPT_NO_EXT2 | MOPT_NO_EXT3)
#define MOPT_SKIP	(1 << 7)
#define MOPT_2		(1 << 8)
185526092bf5STheodore Ts'o
185626092bf5STheodore Ts'o static const struct mount_opts {
185726092bf5STheodore Ts'o int token;
185826092bf5STheodore Ts'o int mount_opt;
185926092bf5STheodore Ts'o int flags;
186026092bf5STheodore Ts'o } ext4_mount_opts[] = {
186126092bf5STheodore Ts'o {Opt_minix_df, EXT4_MOUNT_MINIX_DF, MOPT_SET},
186226092bf5STheodore Ts'o {Opt_bsd_df, EXT4_MOUNT_MINIX_DF, MOPT_CLEAR},
186326092bf5STheodore Ts'o {Opt_grpid, EXT4_MOUNT_GRPID, MOPT_SET},
186426092bf5STheodore Ts'o {Opt_nogrpid, EXT4_MOUNT_GRPID, MOPT_CLEAR},
186526092bf5STheodore Ts'o {Opt_block_validity, EXT4_MOUNT_BLOCK_VALIDITY, MOPT_SET},
186626092bf5STheodore Ts'o {Opt_noblock_validity, EXT4_MOUNT_BLOCK_VALIDITY, MOPT_CLEAR},
18678dc0aa8cSTheodore Ts'o {Opt_dioread_nolock, EXT4_MOUNT_DIOREAD_NOLOCK,
18688dc0aa8cSTheodore Ts'o MOPT_EXT4_ONLY | MOPT_SET},
18698dc0aa8cSTheodore Ts'o {Opt_dioread_lock, EXT4_MOUNT_DIOREAD_NOLOCK,
18708dc0aa8cSTheodore Ts'o MOPT_EXT4_ONLY | MOPT_CLEAR},
187126092bf5STheodore Ts'o {Opt_discard, EXT4_MOUNT_DISCARD, MOPT_SET},
187226092bf5STheodore Ts'o {Opt_nodiscard, EXT4_MOUNT_DISCARD, MOPT_CLEAR},
18738dc0aa8cSTheodore Ts'o {Opt_delalloc, EXT4_MOUNT_DELALLOC,
18748dc0aa8cSTheodore Ts'o MOPT_EXT4_ONLY | MOPT_SET | MOPT_EXPLICIT},
18758dc0aa8cSTheodore Ts'o {Opt_nodelalloc, EXT4_MOUNT_DELALLOC,
187659d9fa5cSTheodore Ts'o MOPT_EXT4_ONLY | MOPT_CLEAR},
1877327eaf73STheodore Ts'o {Opt_warn_on_error, EXT4_MOUNT_WARN_ON_ERROR, MOPT_SET},
1878327eaf73STheodore Ts'o {Opt_nowarn_on_error, EXT4_MOUNT_WARN_ON_ERROR, MOPT_CLEAR},
1879cb8435dcSEric Biggers {Opt_commit, 0, MOPT_NO_EXT2},
1880c6d3d56dSDarrick J. Wong {Opt_nojournal_checksum, EXT4_MOUNT_JOURNAL_CHECKSUM,
1881c6d3d56dSDarrick J. Wong MOPT_EXT4_ONLY | MOPT_CLEAR},
18828dc0aa8cSTheodore Ts'o {Opt_journal_checksum, EXT4_MOUNT_JOURNAL_CHECKSUM,
18831e381f60SDmitry Monakhov MOPT_EXT4_ONLY | MOPT_SET | MOPT_EXPLICIT},
188426092bf5STheodore Ts'o {Opt_journal_async_commit, (EXT4_MOUNT_JOURNAL_ASYNC_COMMIT |
18858dc0aa8cSTheodore Ts'o EXT4_MOUNT_JOURNAL_CHECKSUM),
18861e381f60SDmitry Monakhov MOPT_EXT4_ONLY | MOPT_SET | MOPT_EXPLICIT},
18878dc0aa8cSTheodore Ts'o {Opt_noload, EXT4_MOUNT_NOLOAD, MOPT_NO_EXT2 | MOPT_SET},
1888ba2e524dSLukas Czerner {Opt_data_err, EXT4_MOUNT_DATA_ERR_ABORT, MOPT_NO_EXT2},
188926092bf5STheodore Ts'o {Opt_barrier, EXT4_MOUNT_BARRIER, MOPT_SET},
189026092bf5STheodore Ts'o {Opt_nobarrier, EXT4_MOUNT_BARRIER, MOPT_CLEAR},
189126092bf5STheodore Ts'o {Opt_noauto_da_alloc, EXT4_MOUNT_NO_AUTO_DA_ALLOC, MOPT_SET},
189226092bf5STheodore Ts'o {Opt_auto_da_alloc, EXT4_MOUNT_NO_AUTO_DA_ALLOC, MOPT_CLEAR},
189326092bf5STheodore Ts'o {Opt_noinit_itable, EXT4_MOUNT_INIT_INODE_TABLE, MOPT_CLEAR},
1894ba2e524dSLukas Czerner {Opt_dax_type, 0, MOPT_EXT4_ONLY},
1895ba2e524dSLukas Czerner {Opt_journal_dev, 0, MOPT_NO_EXT2},
1896ba2e524dSLukas Czerner {Opt_journal_path, 0, MOPT_NO_EXT2},
1897ba2e524dSLukas Czerner {Opt_journal_ioprio, 0, MOPT_NO_EXT2},
1898ba2e524dSLukas Czerner {Opt_data, 0, MOPT_NO_EXT2},
189926092bf5STheodore Ts'o {Opt_user_xattr, EXT4_MOUNT_XATTR_USER, MOPT_SET},
190026092bf5STheodore Ts'o #ifdef CONFIG_EXT4_FS_POSIX_ACL
190126092bf5STheodore Ts'o {Opt_acl, EXT4_MOUNT_POSIX_ACL, MOPT_SET},
190226092bf5STheodore Ts'o #else
190326092bf5STheodore Ts'o {Opt_acl, 0, MOPT_NOSUPPORT},
190426092bf5STheodore Ts'o #endif
190526092bf5STheodore Ts'o {Opt_nouid32, EXT4_MOUNT_NO_UID32, MOPT_SET},
190626092bf5STheodore Ts'o {Opt_debug, EXT4_MOUNT_DEBUG, MOPT_SET},
190726092bf5STheodore Ts'o {Opt_quota, EXT4_MOUNT_QUOTA | EXT4_MOUNT_USRQUOTA, MOPT_SET | MOPT_Q},
190826092bf5STheodore Ts'o {Opt_usrquota, EXT4_MOUNT_QUOTA | EXT4_MOUNT_USRQUOTA,
190926092bf5STheodore Ts'o MOPT_SET | MOPT_Q},
191026092bf5STheodore Ts'o {Opt_grpquota, EXT4_MOUNT_QUOTA | EXT4_MOUNT_GRPQUOTA,
191126092bf5STheodore Ts'o MOPT_SET | MOPT_Q},
191249da9392SJan Kara {Opt_prjquota, EXT4_MOUNT_QUOTA | EXT4_MOUNT_PRJQUOTA,
191349da9392SJan Kara MOPT_SET | MOPT_Q},
191426092bf5STheodore Ts'o {Opt_noquota, (EXT4_MOUNT_QUOTA | EXT4_MOUNT_USRQUOTA |
191549da9392SJan Kara EXT4_MOUNT_GRPQUOTA | EXT4_MOUNT_PRJQUOTA),
191649da9392SJan Kara MOPT_CLEAR | MOPT_Q},
1917ba2e524dSLukas Czerner {Opt_usrjquota, 0, MOPT_Q},
1918ba2e524dSLukas Czerner {Opt_grpjquota, 0, MOPT_Q},
1919ba2e524dSLukas Czerner {Opt_jqfmt, 0, MOPT_QFMT},
1920cdb7ee4cSTahsin Erdogan {Opt_nombcache, EXT4_MOUNT_NO_MBCACHE, MOPT_SET},
192121175ca4SHarshad Shirwadkar {Opt_no_prefetch_block_bitmaps, EXT4_MOUNT_NO_PREFETCH_BLOCK_BITMAPS,
19223d392b26STheodore Ts'o MOPT_SET},
192399c880deSHarshad Shirwadkar #ifdef CONFIG_EXT4_DEBUG
19240f0672ffSHarshad Shirwadkar {Opt_fc_debug_force, EXT4_MOUNT2_JOURNAL_FAST_COMMIT,
19250f0672ffSHarshad Shirwadkar MOPT_SET | MOPT_2 | MOPT_EXT4_ONLY},
19268016e29fSHarshad Shirwadkar #endif
192722b8d707SJan Kara {Opt_abort, EXT4_MOUNT2_ABORT, MOPT_SET | MOPT_2},
192826092bf5STheodore Ts'o {Opt_err, 0, 0}
192926092bf5STheodore Ts'o };
193026092bf5STheodore Ts'o
19315298d4bfSChristoph Hellwig #if IS_ENABLED(CONFIG_UNICODE)
1932c83ad55eSGabriel Krisman Bertazi static const struct ext4_sb_encodings {
1933c83ad55eSGabriel Krisman Bertazi __u16 magic;
1934c83ad55eSGabriel Krisman Bertazi char *name;
193549bd03ccSChristoph Hellwig unsigned int version;
1936c83ad55eSGabriel Krisman Bertazi } ext4_sb_encoding_map[] = {
193749bd03ccSChristoph Hellwig {EXT4_ENC_UTF8_12_1, "utf8", UNICODE_AGE(12, 1, 0)},
1938c83ad55eSGabriel Krisman Bertazi };
1939c83ad55eSGabriel Krisman Bertazi
1940aa8bf298SChristoph Hellwig static const struct ext4_sb_encodings *
ext4_sb_read_encoding(const struct ext4_super_block * es)1941aa8bf298SChristoph Hellwig ext4_sb_read_encoding(const struct ext4_super_block *es)
1942c83ad55eSGabriel Krisman Bertazi {
1943c83ad55eSGabriel Krisman Bertazi __u16 magic = le16_to_cpu(es->s_encoding);
1944c83ad55eSGabriel Krisman Bertazi int i;
1945c83ad55eSGabriel Krisman Bertazi
1946c83ad55eSGabriel Krisman Bertazi for (i = 0; i < ARRAY_SIZE(ext4_sb_encoding_map); i++)
1947c83ad55eSGabriel Krisman Bertazi if (magic == ext4_sb_encoding_map[i].magic)
1948aa8bf298SChristoph Hellwig return &ext4_sb_encoding_map[i];
1949c83ad55eSGabriel Krisman Bertazi
1950aa8bf298SChristoph Hellwig return NULL;
1951c83ad55eSGabriel Krisman Bertazi }
1952c83ad55eSGabriel Krisman Bertazi #endif
1953c83ad55eSGabriel Krisman Bertazi
/*
 * Bits for ext4_fs_context::spec.  The parser sets one of these when
 * the matching option was given (e.g. EXT4_SPEC_JQUOTA in
 * note_qf_name(), EXT4_SPEC_s_commit_interval for "commit=").
 * Bit 6 is not assigned.
 */
#define EXT4_SPEC_JQUOTA			(1 <<  0)
#define EXT4_SPEC_JQFMT				(1 <<  1)
#define EXT4_SPEC_DATAJ				(1 <<  2)
#define EXT4_SPEC_SB_BLOCK			(1 <<  3)
#define EXT4_SPEC_JOURNAL_DEV			(1 <<  4)
#define EXT4_SPEC_JOURNAL_IOPRIO		(1 <<  5)
#define EXT4_SPEC_s_want_extra_isize		(1 <<  7)
#define EXT4_SPEC_s_max_batch_time		(1 <<  8)
#define EXT4_SPEC_s_min_batch_time		(1 <<  9)
#define EXT4_SPEC_s_inode_readahead_blks	(1 << 10)
#define EXT4_SPEC_s_li_wait_mult		(1 << 11)
#define EXT4_SPEC_s_max_dir_size_kb		(1 << 12)
#define EXT4_SPEC_s_stripe			(1 << 13)
#define EXT4_SPEC_s_resuid			(1 << 14)
#define EXT4_SPEC_s_resgid			(1 << 15)
#define EXT4_SPEC_s_commit_interval		(1 << 16)
#define EXT4_SPEC_s_fc_debug_max_replay		(1 << 17)
#define EXT4_SPEC_s_sb_block			(1 << 18)
#define EXT4_SPEC_mb_optimize_scan		(1 << 19)
19736e47a3ccSLukas Czerner
1974461c3af0SLukas Czerner struct ext4_fs_context {
1975e6e268cbSLukas Czerner char *s_qf_names[EXT4_MAXQUOTAS];
197685456054SEric Biggers struct fscrypt_dummy_policy dummy_enc_policy;
1977e6e268cbSLukas Czerner int s_jquota_fmt; /* Format of quota to use */
19786e47a3ccSLukas Czerner #ifdef CONFIG_EXT4_DEBUG
19796e47a3ccSLukas Czerner int s_fc_debug_max_replay;
19806e47a3ccSLukas Czerner #endif
19816e47a3ccSLukas Czerner unsigned short qname_spec;
19826e47a3ccSLukas Czerner unsigned long vals_s_flags; /* Bits to set in s_flags */
19836e47a3ccSLukas Czerner unsigned long mask_s_flags; /* Bits changed in s_flags */
19846e47a3ccSLukas Czerner unsigned long journal_devnum;
19856e47a3ccSLukas Czerner unsigned long s_commit_interval;
19866e47a3ccSLukas Czerner unsigned long s_stripe;
19876e47a3ccSLukas Czerner unsigned int s_inode_readahead_blks;
19886e47a3ccSLukas Czerner unsigned int s_want_extra_isize;
19896e47a3ccSLukas Czerner unsigned int s_li_wait_mult;
19906e47a3ccSLukas Czerner unsigned int s_max_dir_size_kb;
19916e47a3ccSLukas Czerner unsigned int journal_ioprio;
19926e47a3ccSLukas Czerner unsigned int vals_s_mount_opt;
19936e47a3ccSLukas Czerner unsigned int mask_s_mount_opt;
19946e47a3ccSLukas Czerner unsigned int vals_s_mount_opt2;
19956e47a3ccSLukas Czerner unsigned int mask_s_mount_opt2;
1996b6bd2435SLukas Czerner unsigned int opt_flags; /* MOPT flags */
19976e47a3ccSLukas Czerner unsigned int spec;
19986e47a3ccSLukas Czerner u32 s_max_batch_time;
19996e47a3ccSLukas Czerner u32 s_min_batch_time;
20006e47a3ccSLukas Czerner kuid_t s_resuid;
20016e47a3ccSLukas Czerner kgid_t s_resgid;
20027edfd85bSLukas Czerner ext4_fsblk_t s_sb_block;
2003b237e304SHarshad Shirwadkar };
2004b237e304SHarshad Shirwadkar
ext4_fc_free(struct fs_context * fc)2005cebe85d5SLukas Czerner static void ext4_fc_free(struct fs_context *fc)
2006cebe85d5SLukas Czerner {
2007cebe85d5SLukas Czerner struct ext4_fs_context *ctx = fc->fs_private;
2008cebe85d5SLukas Czerner int i;
2009cebe85d5SLukas Czerner
2010cebe85d5SLukas Czerner if (!ctx)
2011cebe85d5SLukas Czerner return;
2012cebe85d5SLukas Czerner
2013cebe85d5SLukas Czerner for (i = 0; i < EXT4_MAXQUOTAS; i++)
2014cebe85d5SLukas Czerner kfree(ctx->s_qf_names[i]);
2015cebe85d5SLukas Czerner
201685456054SEric Biggers fscrypt_free_dummy_policy(&ctx->dummy_enc_policy);
2017cebe85d5SLukas Czerner kfree(ctx);
2018cebe85d5SLukas Czerner }
2019cebe85d5SLukas Czerner
ext4_init_fs_context(struct fs_context * fc)2020cebe85d5SLukas Czerner int ext4_init_fs_context(struct fs_context *fc)
2021cebe85d5SLukas Czerner {
2022da9e4802SDan Carpenter struct ext4_fs_context *ctx;
2023cebe85d5SLukas Czerner
2024cebe85d5SLukas Czerner ctx = kzalloc(sizeof(struct ext4_fs_context), GFP_KERNEL);
2025cebe85d5SLukas Czerner if (!ctx)
2026cebe85d5SLukas Czerner return -ENOMEM;
2027cebe85d5SLukas Czerner
2028cebe85d5SLukas Czerner fc->fs_private = ctx;
2029cebe85d5SLukas Czerner fc->ops = &ext4_context_ops;
2030cebe85d5SLukas Czerner
2031cebe85d5SLukas Czerner return 0;
2032cebe85d5SLukas Czerner }
2033cebe85d5SLukas Czerner
2034e6e268cbSLukas Czerner #ifdef CONFIG_QUOTA
2035e6e268cbSLukas Czerner /*
2036e6e268cbSLukas Czerner * Note the name of the specified quota file.
2037e6e268cbSLukas Czerner */
note_qf_name(struct fs_context * fc,int qtype,struct fs_parameter * param)2038e6e268cbSLukas Czerner static int note_qf_name(struct fs_context *fc, int qtype,
2039e6e268cbSLukas Czerner struct fs_parameter *param)
2040e6e268cbSLukas Czerner {
2041e6e268cbSLukas Czerner struct ext4_fs_context *ctx = fc->fs_private;
2042e6e268cbSLukas Czerner char *qname;
2043e6e268cbSLukas Czerner
2044e6e268cbSLukas Czerner if (param->size < 1) {
2045e6e268cbSLukas Czerner ext4_msg(NULL, KERN_ERR, "Missing quota name");
2046e6e268cbSLukas Czerner return -EINVAL;
2047e6e268cbSLukas Czerner }
2048e6e268cbSLukas Czerner if (strchr(param->string, '/')) {
2049e6e268cbSLukas Czerner ext4_msg(NULL, KERN_ERR,
2050e6e268cbSLukas Czerner "quotafile must be on filesystem root");
2051e6e268cbSLukas Czerner return -EINVAL;
2052e6e268cbSLukas Czerner }
2053e6e268cbSLukas Czerner if (ctx->s_qf_names[qtype]) {
2054e6e268cbSLukas Czerner if (strcmp(ctx->s_qf_names[qtype], param->string) != 0) {
2055e6e268cbSLukas Czerner ext4_msg(NULL, KERN_ERR,
2056e6e268cbSLukas Czerner "%s quota file already specified",
2057e6e268cbSLukas Czerner QTYPE2NAME(qtype));
2058e6e268cbSLukas Czerner return -EINVAL;
2059e6e268cbSLukas Czerner }
2060e6e268cbSLukas Czerner return 0;
2061e6e268cbSLukas Czerner }
2062e6e268cbSLukas Czerner
2063e6e268cbSLukas Czerner qname = kmemdup_nul(param->string, param->size, GFP_KERNEL);
2064e6e268cbSLukas Czerner if (!qname) {
2065e6e268cbSLukas Czerner ext4_msg(NULL, KERN_ERR,
2066e6e268cbSLukas Czerner "Not enough memory for storing quotafile name");
2067e6e268cbSLukas Czerner return -ENOMEM;
2068e6e268cbSLukas Czerner }
2069e6e268cbSLukas Czerner ctx->s_qf_names[qtype] = qname;
2070e6e268cbSLukas Czerner ctx->qname_spec |= 1 << qtype;
20716e47a3ccSLukas Czerner ctx->spec |= EXT4_SPEC_JQUOTA;
2072e6e268cbSLukas Czerner return 0;
2073e6e268cbSLukas Czerner }
2074e6e268cbSLukas Czerner
2075e6e268cbSLukas Czerner /*
2076e6e268cbSLukas Czerner * Clear the name of the specified quota file.
2077e6e268cbSLukas Czerner */
unnote_qf_name(struct fs_context * fc,int qtype)2078e6e268cbSLukas Czerner static int unnote_qf_name(struct fs_context *fc, int qtype)
2079e6e268cbSLukas Czerner {
2080e6e268cbSLukas Czerner struct ext4_fs_context *ctx = fc->fs_private;
2081e6e268cbSLukas Czerner
2082e6e268cbSLukas Czerner if (ctx->s_qf_names[qtype])
2083e6e268cbSLukas Czerner kfree(ctx->s_qf_names[qtype]);
2084e6e268cbSLukas Czerner
2085e6e268cbSLukas Czerner ctx->s_qf_names[qtype] = NULL;
2086e6e268cbSLukas Czerner ctx->qname_spec |= 1 << qtype;
20876e47a3ccSLukas Czerner ctx->spec |= EXT4_SPEC_JQUOTA;
2088e6e268cbSLukas Czerner return 0;
2089e6e268cbSLukas Czerner }
2090e6e268cbSLukas Czerner #endif
2091e6e268cbSLukas Czerner
ext4_parse_test_dummy_encryption(const struct fs_parameter * param,struct ext4_fs_context * ctx)209285456054SEric Biggers static int ext4_parse_test_dummy_encryption(const struct fs_parameter *param,
209385456054SEric Biggers struct ext4_fs_context *ctx)
209485456054SEric Biggers {
209585456054SEric Biggers int err;
209685456054SEric Biggers
209785456054SEric Biggers if (!IS_ENABLED(CONFIG_FS_ENCRYPTION)) {
209885456054SEric Biggers ext4_msg(NULL, KERN_WARNING,
209985456054SEric Biggers "test_dummy_encryption option not supported");
210085456054SEric Biggers return -EINVAL;
210185456054SEric Biggers }
210285456054SEric Biggers err = fscrypt_parse_test_dummy_encryption(param,
210385456054SEric Biggers &ctx->dummy_enc_policy);
210485456054SEric Biggers if (err == -EINVAL) {
210585456054SEric Biggers ext4_msg(NULL, KERN_WARNING,
210685456054SEric Biggers "Value of option \"%s\" is unrecognized", param->key);
210785456054SEric Biggers } else if (err == -EEXIST) {
210885456054SEric Biggers ext4_msg(NULL, KERN_WARNING,
210985456054SEric Biggers "Conflicting test_dummy_encryption options");
211085456054SEric Biggers return -EINVAL;
211185456054SEric Biggers }
211285456054SEric Biggers return err;
211385456054SEric Biggers }
211485456054SEric Biggers
21156e47a3ccSLukas Czerner #define EXT4_SET_CTX(name) \
21164c246728SLukas Czerner static inline void ctx_set_##name(struct ext4_fs_context *ctx, \
21174c246728SLukas Czerner unsigned long flag) \
21186e47a3ccSLukas Czerner { \
21196e47a3ccSLukas Czerner ctx->mask_s_##name |= flag; \
21206e47a3ccSLukas Czerner ctx->vals_s_##name |= flag; \
2121e3952fccSLukas Czerner }
2122e3952fccSLukas Czerner
2123e3952fccSLukas Czerner #define EXT4_CLEAR_CTX(name) \
21244c246728SLukas Czerner static inline void ctx_clear_##name(struct ext4_fs_context *ctx, \
21254c246728SLukas Czerner unsigned long flag) \
21266e47a3ccSLukas Czerner { \
21276e47a3ccSLukas Czerner ctx->mask_s_##name |= flag; \
21286e47a3ccSLukas Czerner ctx->vals_s_##name &= ~flag; \
2129e3952fccSLukas Czerner }
2130e3952fccSLukas Czerner
2131e3952fccSLukas Czerner #define EXT4_TEST_CTX(name) \
21324c246728SLukas Czerner static inline unsigned long \
21334c246728SLukas Czerner ctx_test_##name(struct ext4_fs_context *ctx, unsigned long flag) \
21346e47a3ccSLukas Czerner { \
21354c246728SLukas Czerner return (ctx->vals_s_##name & flag); \
2136e3952fccSLukas Czerner }
21376e47a3ccSLukas Czerner
2138e3952fccSLukas Czerner EXT4_SET_CTX(flags); /* set only */
21396e47a3ccSLukas Czerner EXT4_SET_CTX(mount_opt);
2140e3952fccSLukas Czerner EXT4_CLEAR_CTX(mount_opt);
2141e3952fccSLukas Czerner EXT4_TEST_CTX(mount_opt);
21426e47a3ccSLukas Czerner EXT4_SET_CTX(mount_opt2);
2143e3952fccSLukas Czerner EXT4_CLEAR_CTX(mount_opt2);
2144e3952fccSLukas Czerner EXT4_TEST_CTX(mount_opt2);
2145e3952fccSLukas Czerner
ext4_parse_param(struct fs_context * fc,struct fs_parameter * param)214602f960f8SLukas Czerner static int ext4_parse_param(struct fs_context *fc, struct fs_parameter *param)
214726092bf5STheodore Ts'o {
2148461c3af0SLukas Czerner struct ext4_fs_context *ctx = fc->fs_private;
2149461c3af0SLukas Czerner struct fs_parse_result result;
215026092bf5STheodore Ts'o const struct mount_opts *m;
2151461c3af0SLukas Czerner int is_remount;
215208cefc7aSEric W. Biederman kuid_t uid;
215308cefc7aSEric W. Biederman kgid_t gid;
2154461c3af0SLukas Czerner int token;
2155461c3af0SLukas Czerner
2156461c3af0SLukas Czerner token = fs_parse(fc, ext4_param_specs, param, &result);
2157461c3af0SLukas Czerner if (token < 0)
2158461c3af0SLukas Czerner return token;
2159461c3af0SLukas Czerner is_remount = fc->purpose == FS_CONTEXT_FOR_RECONFIGURE;
216026092bf5STheodore Ts'o
2161ba2e524dSLukas Czerner for (m = ext4_mount_opts; m->token != Opt_err; m++)
2162ba2e524dSLukas Czerner if (token == m->token)
2163ba2e524dSLukas Czerner break;
2164ba2e524dSLukas Czerner
2165ba2e524dSLukas Czerner ctx->opt_flags |= m->flags;
2166ba2e524dSLukas Czerner
2167ba2e524dSLukas Czerner if (m->flags & MOPT_EXPLICIT) {
2168ba2e524dSLukas Czerner if (m->mount_opt & EXT4_MOUNT_DELALLOC) {
2169ba2e524dSLukas Czerner ctx_set_mount_opt2(ctx, EXT4_MOUNT2_EXPLICIT_DELALLOC);
2170ba2e524dSLukas Czerner } else if (m->mount_opt & EXT4_MOUNT_JOURNAL_CHECKSUM) {
2171ba2e524dSLukas Czerner ctx_set_mount_opt2(ctx,
2172ba2e524dSLukas Czerner EXT4_MOUNT2_EXPLICIT_JOURNAL_CHECKSUM);
2173ba2e524dSLukas Czerner } else
2174ba2e524dSLukas Czerner return -EINVAL;
2175ba2e524dSLukas Czerner }
2176ba2e524dSLukas Czerner
2177ba2e524dSLukas Czerner if (m->flags & MOPT_NOSUPPORT) {
2178ba2e524dSLukas Czerner ext4_msg(NULL, KERN_ERR, "%s option not supported",
2179ba2e524dSLukas Czerner param->key);
2180ba2e524dSLukas Czerner return 0;
2181ba2e524dSLukas Czerner }
2182ba2e524dSLukas Czerner
2183ba2e524dSLukas Czerner switch (token) {
218457f73c2cSTheodore Ts'o #ifdef CONFIG_QUOTA
2185ba2e524dSLukas Czerner case Opt_usrjquota:
2186461c3af0SLukas Czerner if (!*param->string)
2187e6e268cbSLukas Czerner return unnote_qf_name(fc, USRQUOTA);
2188461c3af0SLukas Czerner else
2189e6e268cbSLukas Czerner return note_qf_name(fc, USRQUOTA, param);
2190ba2e524dSLukas Czerner case Opt_grpjquota:
2191461c3af0SLukas Czerner if (!*param->string)
2192e6e268cbSLukas Czerner return unnote_qf_name(fc, GRPQUOTA);
2193461c3af0SLukas Czerner else
2194e6e268cbSLukas Czerner return note_qf_name(fc, GRPQUOTA, param);
219557f73c2cSTheodore Ts'o #endif
219626092bf5STheodore Ts'o case Opt_sb:
21977edfd85bSLukas Czerner if (fc->purpose == FS_CONTEXT_FOR_RECONFIGURE) {
21987edfd85bSLukas Czerner ext4_msg(NULL, KERN_WARNING,
21997edfd85bSLukas Czerner "Ignoring %s option on remount", param->key);
22007edfd85bSLukas Czerner } else {
22017edfd85bSLukas Czerner ctx->s_sb_block = result.uint_32;
22027edfd85bSLukas Czerner ctx->spec |= EXT4_SPEC_s_sb_block;
22037edfd85bSLukas Czerner }
220402f960f8SLukas Czerner return 0;
220526092bf5STheodore Ts'o case Opt_removed:
2206da812f61SLukas Czerner ext4_msg(NULL, KERN_WARNING, "Ignoring removed %s option",
2207461c3af0SLukas Czerner param->key);
220802f960f8SLukas Czerner return 0;
22094f74d15fSEric Biggers case Opt_inlinecrypt:
22104f74d15fSEric Biggers #ifdef CONFIG_FS_ENCRYPTION_INLINE_CRYPT
22116e47a3ccSLukas Czerner ctx_set_flags(ctx, SB_INLINECRYPT);
22124f74d15fSEric Biggers #else
2213da812f61SLukas Czerner ext4_msg(NULL, KERN_ERR, "inline encryption not supported");
22144f74d15fSEric Biggers #endif
221502f960f8SLukas Czerner return 0;
2216461c3af0SLukas Czerner case Opt_errors:
22176e47a3ccSLukas Czerner ctx_clear_mount_opt(ctx, EXT4_MOUNT_ERRORS_MASK);
2218ba2e524dSLukas Czerner ctx_set_mount_opt(ctx, result.uint_32);
2219ba2e524dSLukas Czerner return 0;
2220ba2e524dSLukas Czerner #ifdef CONFIG_QUOTA
2221ba2e524dSLukas Czerner case Opt_jqfmt:
2222ba2e524dSLukas Czerner ctx->s_jquota_fmt = result.uint_32;
2223ba2e524dSLukas Czerner ctx->spec |= EXT4_SPEC_JQFMT;
2224ba2e524dSLukas Czerner return 0;
2225ba2e524dSLukas Czerner #endif
2226ba2e524dSLukas Czerner case Opt_data:
2227ba2e524dSLukas Czerner ctx_clear_mount_opt(ctx, EXT4_MOUNT_DATA_FLAGS);
2228ba2e524dSLukas Czerner ctx_set_mount_opt(ctx, result.uint_32);
2229ba2e524dSLukas Czerner ctx->spec |= EXT4_SPEC_DATAJ;
2230ba2e524dSLukas Czerner return 0;
2231ba2e524dSLukas Czerner case Opt_commit:
2232461c3af0SLukas Czerner if (result.uint_32 == 0)
2233934b0de1SWang Jianjian result.uint_32 = JBD2_DEFAULT_MAX_COMMIT_AGE;
2234461c3af0SLukas Czerner else if (result.uint_32 > INT_MAX / HZ) {
2235da812f61SLukas Czerner ext4_msg(NULL, KERN_ERR,
22369ba55543Szhangyi (F) "Invalid commit interval %d, "
22379ba55543Szhangyi (F) "must be smaller than %d",
2238461c3af0SLukas Czerner result.uint_32, INT_MAX / HZ);
2239da812f61SLukas Czerner return -EINVAL;
22409ba55543Szhangyi (F) }
22416e47a3ccSLukas Czerner ctx->s_commit_interval = HZ * result.uint_32;
22426e47a3ccSLukas Czerner ctx->spec |= EXT4_SPEC_s_commit_interval;
2243ba2e524dSLukas Czerner return 0;
2244ba2e524dSLukas Czerner case Opt_debug_want_extra_isize:
22456e47a3ccSLukas Czerner if ((result.uint_32 & 1) || (result.uint_32 < 4)) {
2246da812f61SLukas Czerner ext4_msg(NULL, KERN_ERR,
2247461c3af0SLukas Czerner "Invalid want_extra_isize %d", result.uint_32);
2248da812f61SLukas Czerner return -EINVAL;
22499803387cSTheodore Ts'o }
22506e47a3ccSLukas Czerner ctx->s_want_extra_isize = result.uint_32;
22516e47a3ccSLukas Czerner ctx->spec |= EXT4_SPEC_s_want_extra_isize;
2252ba2e524dSLukas Czerner return 0;
2253ba2e524dSLukas Czerner case Opt_max_batch_time:
22546e47a3ccSLukas Czerner ctx->s_max_batch_time = result.uint_32;
22556e47a3ccSLukas Czerner ctx->spec |= EXT4_SPEC_s_max_batch_time;
2256ba2e524dSLukas Czerner return 0;
2257ba2e524dSLukas Czerner case Opt_min_batch_time:
22586e47a3ccSLukas Czerner ctx->s_min_batch_time = result.uint_32;
22596e47a3ccSLukas Czerner ctx->spec |= EXT4_SPEC_s_min_batch_time;
2260ba2e524dSLukas Czerner return 0;
2261ba2e524dSLukas Czerner case Opt_inode_readahead_blks:
2262461c3af0SLukas Czerner if (result.uint_32 &&
2263461c3af0SLukas Czerner (result.uint_32 > (1 << 30) ||
2264461c3af0SLukas Czerner !is_power_of_2(result.uint_32))) {
2265da812f61SLukas Czerner ext4_msg(NULL, KERN_ERR,
2266e33e60eaSJan Kara "EXT4-fs: inode_readahead_blks must be "
2267e33e60eaSJan Kara "0 or a power of 2 smaller than 2^31");
2268da812f61SLukas Czerner return -EINVAL;
226926092bf5STheodore Ts'o }
22706e47a3ccSLukas Czerner ctx->s_inode_readahead_blks = result.uint_32;
22716e47a3ccSLukas Czerner ctx->spec |= EXT4_SPEC_s_inode_readahead_blks;
2272ba2e524dSLukas Czerner return 0;
2273ba2e524dSLukas Czerner case Opt_init_itable:
22746e47a3ccSLukas Czerner ctx_set_mount_opt(ctx, EXT4_MOUNT_INIT_INODE_TABLE);
22756e47a3ccSLukas Czerner ctx->s_li_wait_mult = EXT4_DEF_LI_WAIT_MULT;
2276461c3af0SLukas Czerner if (param->type == fs_value_is_string)
22776e47a3ccSLukas Czerner ctx->s_li_wait_mult = result.uint_32;
22786e47a3ccSLukas Czerner ctx->spec |= EXT4_SPEC_s_li_wait_mult;
2279ba2e524dSLukas Czerner return 0;
2280ba2e524dSLukas Czerner case Opt_max_dir_size_kb:
22816e47a3ccSLukas Czerner ctx->s_max_dir_size_kb = result.uint_32;
22826e47a3ccSLukas Czerner ctx->spec |= EXT4_SPEC_s_max_dir_size_kb;
2283ba2e524dSLukas Czerner return 0;
22848016e29fSHarshad Shirwadkar #ifdef CONFIG_EXT4_DEBUG
2285ba2e524dSLukas Czerner case Opt_fc_debug_max_replay:
22866e47a3ccSLukas Czerner ctx->s_fc_debug_max_replay = result.uint_32;
22876e47a3ccSLukas Czerner ctx->spec |= EXT4_SPEC_s_fc_debug_max_replay;
2288ba2e524dSLukas Czerner return 0;
22898016e29fSHarshad Shirwadkar #endif
2290ba2e524dSLukas Czerner case Opt_stripe:
22916e47a3ccSLukas Czerner ctx->s_stripe = result.uint_32;
22926e47a3ccSLukas Czerner ctx->spec |= EXT4_SPEC_s_stripe;
2293ba2e524dSLukas Czerner return 0;
2294ba2e524dSLukas Czerner case Opt_resuid:
2295461c3af0SLukas Czerner uid = make_kuid(current_user_ns(), result.uint_32);
22960efb3b23SJan Kara if (!uid_valid(uid)) {
2297da812f61SLukas Czerner ext4_msg(NULL, KERN_ERR, "Invalid uid value %d",
2298461c3af0SLukas Czerner result.uint_32);
2299da812f61SLukas Czerner return -EINVAL;
23000efb3b23SJan Kara }
23016e47a3ccSLukas Czerner ctx->s_resuid = uid;
23026e47a3ccSLukas Czerner ctx->spec |= EXT4_SPEC_s_resuid;
2303ba2e524dSLukas Czerner return 0;
2304ba2e524dSLukas Czerner case Opt_resgid:
2305461c3af0SLukas Czerner gid = make_kgid(current_user_ns(), result.uint_32);
23060efb3b23SJan Kara if (!gid_valid(gid)) {
2307da812f61SLukas Czerner ext4_msg(NULL, KERN_ERR, "Invalid gid value %d",
2308461c3af0SLukas Czerner result.uint_32);
2309da812f61SLukas Czerner return -EINVAL;
23100efb3b23SJan Kara }
23116e47a3ccSLukas Czerner ctx->s_resgid = gid;
23126e47a3ccSLukas Czerner ctx->spec |= EXT4_SPEC_s_resgid;
2313ba2e524dSLukas Czerner return 0;
2314ba2e524dSLukas Czerner case Opt_journal_dev:
23150efb3b23SJan Kara if (is_remount) {
2316da812f61SLukas Czerner ext4_msg(NULL, KERN_ERR,
23170efb3b23SJan Kara "Cannot specify journal on remount");
2318da812f61SLukas Czerner return -EINVAL;
23190efb3b23SJan Kara }
2320461c3af0SLukas Czerner ctx->journal_devnum = result.uint_32;
23216e47a3ccSLukas Czerner ctx->spec |= EXT4_SPEC_JOURNAL_DEV;
2322ba2e524dSLukas Czerner return 0;
2323ba2e524dSLukas Czerner case Opt_journal_path:
2324ba2e524dSLukas Czerner {
2325ad4eec61SEric Sandeen struct inode *journal_inode;
2326ad4eec61SEric Sandeen struct path path;
2327ad4eec61SEric Sandeen int error;
2328ad4eec61SEric Sandeen
2329ad4eec61SEric Sandeen if (is_remount) {
2330da812f61SLukas Czerner ext4_msg(NULL, KERN_ERR,
2331ad4eec61SEric Sandeen "Cannot specify journal on remount");
2332da812f61SLukas Czerner return -EINVAL;
2333ad4eec61SEric Sandeen }
2334ad4eec61SEric Sandeen
2335e3ea75eeSLukas Czerner error = fs_lookup_param(fc, param, 1, LOOKUP_FOLLOW, &path);
2336ad4eec61SEric Sandeen if (error) {
2337da812f61SLukas Czerner ext4_msg(NULL, KERN_ERR, "error: could not find "
2338461c3af0SLukas Czerner "journal device path");
2339da812f61SLukas Czerner return -EINVAL;
2340ad4eec61SEric Sandeen }
2341ad4eec61SEric Sandeen
23422b0143b5SDavid Howells journal_inode = d_inode(path.dentry);
2343461c3af0SLukas Czerner ctx->journal_devnum = new_encode_dev(journal_inode->i_rdev);
23446e47a3ccSLukas Czerner ctx->spec |= EXT4_SPEC_JOURNAL_DEV;
2345ad4eec61SEric Sandeen path_put(&path);
2346ba2e524dSLukas Czerner return 0;
2347ba2e524dSLukas Czerner }
2348ba2e524dSLukas Czerner case Opt_journal_ioprio:
2349461c3af0SLukas Czerner if (result.uint_32 > 7) {
2350da812f61SLukas Czerner ext4_msg(NULL, KERN_ERR, "Invalid journal IO priority"
23510efb3b23SJan Kara " (must be 0-7)");
2352da812f61SLukas Czerner return -EINVAL;
23530efb3b23SJan Kara }
2354461c3af0SLukas Czerner ctx->journal_ioprio =
2355461c3af0SLukas Czerner IOPRIO_PRIO_VALUE(IOPRIO_CLASS_BE, result.uint_32);
23566e47a3ccSLukas Czerner ctx->spec |= EXT4_SPEC_JOURNAL_IOPRIO;
2357ba2e524dSLukas Czerner return 0;
2358ba2e524dSLukas Czerner case Opt_test_dummy_encryption:
235985456054SEric Biggers return ext4_parse_test_dummy_encryption(param, ctx);
2360ba2e524dSLukas Czerner case Opt_dax:
2361ba2e524dSLukas Czerner case Opt_dax_type:
2362ef83b6e8SDan Williams #ifdef CONFIG_FS_DAX
2363ba2e524dSLukas Czerner {
2364ba2e524dSLukas Czerner int type = (token == Opt_dax) ?
2365ba2e524dSLukas Czerner Opt_dax : result.uint_32;
2366ba2e524dSLukas Czerner
2367ba2e524dSLukas Czerner switch (type) {
23689cb20f94SIra Weiny case Opt_dax:
23699cb20f94SIra Weiny case Opt_dax_always:
2370ba2e524dSLukas Czerner ctx_set_mount_opt(ctx, EXT4_MOUNT_DAX_ALWAYS);
23716e47a3ccSLukas Czerner ctx_clear_mount_opt2(ctx, EXT4_MOUNT2_DAX_NEVER);
23729cb20f94SIra Weiny break;
23739cb20f94SIra Weiny case Opt_dax_never:
2374ba2e524dSLukas Czerner ctx_set_mount_opt2(ctx, EXT4_MOUNT2_DAX_NEVER);
23756e47a3ccSLukas Czerner ctx_clear_mount_opt(ctx, EXT4_MOUNT_DAX_ALWAYS);
23769cb20f94SIra Weiny break;
23779cb20f94SIra Weiny case Opt_dax_inode:
23786e47a3ccSLukas Czerner ctx_clear_mount_opt(ctx, EXT4_MOUNT_DAX_ALWAYS);
23796e47a3ccSLukas Czerner ctx_clear_mount_opt2(ctx, EXT4_MOUNT2_DAX_NEVER);
23809cb20f94SIra Weiny /* Strictly for printing options */
2381ba2e524dSLukas Czerner ctx_set_mount_opt2(ctx, EXT4_MOUNT2_DAX_INODE);
23829cb20f94SIra Weiny break;
23839cb20f94SIra Weiny }
2384ba2e524dSLukas Czerner return 0;
2385ba2e524dSLukas Czerner }
2386ef83b6e8SDan Williams #else
2387da812f61SLukas Czerner ext4_msg(NULL, KERN_INFO, "dax option not supported");
2388da812f61SLukas Czerner return -EINVAL;
2389923ae0ffSRoss Zwisler #endif
2390ba2e524dSLukas Czerner case Opt_data_err:
2391ba2e524dSLukas Czerner if (result.uint_32 == Opt_data_err_abort)
23926e47a3ccSLukas Czerner ctx_set_mount_opt(ctx, m->mount_opt);
2393ba2e524dSLukas Czerner else if (result.uint_32 == Opt_data_err_ignore)
23946e47a3ccSLukas Czerner ctx_clear_mount_opt(ctx, m->mount_opt);
2395ba2e524dSLukas Czerner return 0;
2396ba2e524dSLukas Czerner case Opt_mb_optimize_scan:
239727b38686SOjaswin Mujoo if (result.int_32 == 1) {
239827b38686SOjaswin Mujoo ctx_set_mount_opt2(ctx, EXT4_MOUNT2_MB_OPTIMIZE_SCAN);
239927b38686SOjaswin Mujoo ctx->spec |= EXT4_SPEC_mb_optimize_scan;
240027b38686SOjaswin Mujoo } else if (result.int_32 == 0) {
240127b38686SOjaswin Mujoo ctx_clear_mount_opt2(ctx, EXT4_MOUNT2_MB_OPTIMIZE_SCAN);
240227b38686SOjaswin Mujoo ctx->spec |= EXT4_SPEC_mb_optimize_scan;
240327b38686SOjaswin Mujoo } else {
2404da812f61SLukas Czerner ext4_msg(NULL, KERN_WARNING,
2405196e402aSHarshad Shirwadkar "mb_optimize_scan should be set to 0 or 1.");
2406da812f61SLukas Czerner return -EINVAL;
2407196e402aSHarshad Shirwadkar }
2408ba2e524dSLukas Czerner return 0;
2409ba2e524dSLukas Czerner }
2410ba2e524dSLukas Czerner
2411ba2e524dSLukas Czerner /*
2412ba2e524dSLukas Czerner * At this point we should only be getting options requiring MOPT_SET,
2413ba2e524dSLukas Czerner * or MOPT_CLEAR. Anything else is a bug
2414ba2e524dSLukas Czerner */
2415ba2e524dSLukas Czerner if (m->token == Opt_err) {
2416ba2e524dSLukas Czerner ext4_msg(NULL, KERN_WARNING, "buggy handling of option %s",
2417ba2e524dSLukas Czerner param->key);
2418ba2e524dSLukas Czerner WARN_ON(1);
2419ba2e524dSLukas Czerner return -EINVAL;
2420ba2e524dSLukas Czerner }
2421ba2e524dSLukas Czerner
2422ba2e524dSLukas Czerner else {
2423461c3af0SLukas Czerner unsigned int set = 0;
2424461c3af0SLukas Czerner
2425461c3af0SLukas Czerner if ((param->type == fs_value_is_flag) ||
2426461c3af0SLukas Czerner result.uint_32 > 0)
2427461c3af0SLukas Czerner set = 1;
2428461c3af0SLukas Czerner
242926092bf5STheodore Ts'o if (m->flags & MOPT_CLEAR)
2430461c3af0SLukas Czerner set = !set;
243126092bf5STheodore Ts'o else if (unlikely(!(m->flags & MOPT_SET))) {
2432da812f61SLukas Czerner ext4_msg(NULL, KERN_WARNING,
2433461c3af0SLukas Czerner "buggy handling of option %s",
2434461c3af0SLukas Czerner param->key);
243526092bf5STheodore Ts'o WARN_ON(1);
2436da812f61SLukas Czerner return -EINVAL;
243726092bf5STheodore Ts'o }
2438995a3ed6SHarshad Shirwadkar if (m->flags & MOPT_2) {
2439461c3af0SLukas Czerner if (set != 0)
24406e47a3ccSLukas Czerner ctx_set_mount_opt2(ctx, m->mount_opt);
2441995a3ed6SHarshad Shirwadkar else
24426e47a3ccSLukas Czerner ctx_clear_mount_opt2(ctx, m->mount_opt);
2443995a3ed6SHarshad Shirwadkar } else {
2444461c3af0SLukas Czerner if (set != 0)
24456e47a3ccSLukas Czerner ctx_set_mount_opt(ctx, m->mount_opt);
244626092bf5STheodore Ts'o else
24476e47a3ccSLukas Czerner ctx_clear_mount_opt(ctx, m->mount_opt);
244826092bf5STheodore Ts'o }
2449995a3ed6SHarshad Shirwadkar }
2450ba2e524dSLukas Czerner
245102f960f8SLukas Czerner return 0;
245226092bf5STheodore Ts'o }
245326092bf5STheodore Ts'o
parse_options(struct fs_context * fc,char * options)24547edfd85bSLukas Czerner static int parse_options(struct fs_context *fc, char *options)
2455ac27a0ecSDave Kleikamp {
2456461c3af0SLukas Czerner struct fs_parameter param;
2457461c3af0SLukas Czerner int ret;
2458461c3af0SLukas Czerner char *key;
2459ac27a0ecSDave Kleikamp
2460ac27a0ecSDave Kleikamp if (!options)
24617edfd85bSLukas Czerner return 0;
2462461c3af0SLukas Czerner
2463461c3af0SLukas Czerner while ((key = strsep(&options, ",")) != NULL) {
2464461c3af0SLukas Czerner if (*key) {
2465461c3af0SLukas Czerner size_t v_len = 0;
2466461c3af0SLukas Czerner char *value = strchr(key, '=');
2467461c3af0SLukas Czerner
2468461c3af0SLukas Czerner param.type = fs_value_is_flag;
2469461c3af0SLukas Czerner param.string = NULL;
2470461c3af0SLukas Czerner
2471461c3af0SLukas Czerner if (value) {
2472461c3af0SLukas Czerner if (value == key)
2473ac27a0ecSDave Kleikamp continue;
2474461c3af0SLukas Czerner
2475461c3af0SLukas Czerner *value++ = 0;
2476461c3af0SLukas Czerner v_len = strlen(value);
2477461c3af0SLukas Czerner param.string = kmemdup_nul(value, v_len,
2478461c3af0SLukas Czerner GFP_KERNEL);
2479461c3af0SLukas Czerner if (!param.string)
24807edfd85bSLukas Czerner return -ENOMEM;
2481461c3af0SLukas Czerner param.type = fs_value_is_string;
2482461c3af0SLukas Czerner }
2483461c3af0SLukas Czerner
2484461c3af0SLukas Czerner param.key = key;
2485461c3af0SLukas Czerner param.size = v_len;
2486461c3af0SLukas Czerner
248702f960f8SLukas Czerner ret = ext4_parse_param(fc, ¶m);
2488461c3af0SLukas Czerner if (param.string)
2489461c3af0SLukas Czerner kfree(param.string);
2490461c3af0SLukas Czerner if (ret < 0)
24917edfd85bSLukas Czerner return ret;
2492ac27a0ecSDave Kleikamp }
2493461c3af0SLukas Czerner }
2494461c3af0SLukas Czerner
24957edfd85bSLukas Czerner ret = ext4_validate_options(fc);
2496da812f61SLukas Czerner if (ret < 0)
24977edfd85bSLukas Czerner return ret;
24987edfd85bSLukas Czerner
24997edfd85bSLukas Czerner return 0;
25007edfd85bSLukas Czerner }
25017edfd85bSLukas Czerner
parse_apply_sb_mount_options(struct super_block * sb,struct ext4_fs_context * m_ctx)25027edfd85bSLukas Czerner static int parse_apply_sb_mount_options(struct super_block *sb,
25037edfd85bSLukas Czerner struct ext4_fs_context *m_ctx)
25047edfd85bSLukas Czerner {
25057edfd85bSLukas Czerner struct ext4_sb_info *sbi = EXT4_SB(sb);
25067edfd85bSLukas Czerner char *s_mount_opts = NULL;
25077edfd85bSLukas Czerner struct ext4_fs_context *s_ctx = NULL;
25087edfd85bSLukas Czerner struct fs_context *fc = NULL;
25097edfd85bSLukas Czerner int ret = -ENOMEM;
25107edfd85bSLukas Czerner
25117edfd85bSLukas Czerner if (!sbi->s_es->s_mount_opts[0])
2512da812f61SLukas Czerner return 0;
2513da812f61SLukas Czerner
25147edfd85bSLukas Czerner s_mount_opts = kstrndup(sbi->s_es->s_mount_opts,
25157edfd85bSLukas Czerner sizeof(sbi->s_es->s_mount_opts),
25167edfd85bSLukas Czerner GFP_KERNEL);
25177edfd85bSLukas Czerner if (!s_mount_opts)
25187edfd85bSLukas Czerner return ret;
2519e6e268cbSLukas Czerner
25207edfd85bSLukas Czerner fc = kzalloc(sizeof(struct fs_context), GFP_KERNEL);
25217edfd85bSLukas Czerner if (!fc)
25227edfd85bSLukas Czerner goto out_free;
2523e6e268cbSLukas Czerner
25247edfd85bSLukas Czerner s_ctx = kzalloc(sizeof(struct ext4_fs_context), GFP_KERNEL);
25257edfd85bSLukas Czerner if (!s_ctx)
25267edfd85bSLukas Czerner goto out_free;
25277edfd85bSLukas Czerner
25287edfd85bSLukas Czerner fc->fs_private = s_ctx;
25297edfd85bSLukas Czerner fc->s_fs_info = sbi;
25307edfd85bSLukas Czerner
25317edfd85bSLukas Czerner ret = parse_options(fc, s_mount_opts);
25327edfd85bSLukas Czerner if (ret < 0)
25337edfd85bSLukas Czerner goto parse_failed;
25347edfd85bSLukas Czerner
25357edfd85bSLukas Czerner ret = ext4_check_opt_consistency(fc, sb);
25367edfd85bSLukas Czerner if (ret < 0) {
25377edfd85bSLukas Czerner parse_failed:
25387edfd85bSLukas Czerner ext4_msg(sb, KERN_WARNING,
25397edfd85bSLukas Czerner "failed to parse options in superblock: %s",
25407edfd85bSLukas Czerner s_mount_opts);
25417edfd85bSLukas Czerner ret = 0;
25427edfd85bSLukas Czerner goto out_free;
25437edfd85bSLukas Czerner }
25447edfd85bSLukas Czerner
25457edfd85bSLukas Czerner if (s_ctx->spec & EXT4_SPEC_JOURNAL_DEV)
25467edfd85bSLukas Czerner m_ctx->journal_devnum = s_ctx->journal_devnum;
25477edfd85bSLukas Czerner if (s_ctx->spec & EXT4_SPEC_JOURNAL_IOPRIO)
25487edfd85bSLukas Czerner m_ctx->journal_ioprio = s_ctx->journal_ioprio;
25497edfd85bSLukas Czerner
255085456054SEric Biggers ext4_apply_options(fc, sb);
255185456054SEric Biggers ret = 0;
25527edfd85bSLukas Czerner
25537edfd85bSLukas Czerner out_free:
2554c069db76SEric Biggers if (fc) {
2555c069db76SEric Biggers ext4_fc_free(fc);
25567edfd85bSLukas Czerner kfree(fc);
2557c069db76SEric Biggers }
25587edfd85bSLukas Czerner kfree(s_mount_opts);
25597edfd85bSLukas Czerner return ret;
25604c94bff9SLukas Czerner }
25614c94bff9SLukas Czerner
/*
 * Transfer the journaled-quota settings collected in the context to the
 * superblock info.  Does nothing when the filesystem has the quota feature
 * or when CONFIG_QUOTA is disabled.
 *
 * For every quota type whose name was specified, the name string moves from
 * the context into sbi->s_qf_names[] and the previous string, if any, is
 * released through kfree_rcu_mightsleep().
 */
static void ext4_apply_quota_options(struct fs_context *fc,
				     struct super_block *sb)
{
#ifdef CONFIG_QUOTA
	struct ext4_fs_context *ctx = fc->fs_private;
	struct ext4_sb_info *sbi = EXT4_SB(sb);
	int type;

	if (ext4_has_feature_quota(sb))
		return;

	if (ctx->spec & EXT4_SPEC_JQUOTA) {
		for (type = 0; type < EXT4_MAXQUOTAS; type++) {
			char *incoming, *stale;

			if (!(ctx->qname_spec & (1 << type)))
				continue;

			/* Take the string away from the context. */
			incoming = ctx->s_qf_names[type];	/* May be NULL */
			ctx->s_qf_names[type] = NULL;
			if (incoming)
				set_opt(sb, QUOTA);

			stale = rcu_replace_pointer(sbi->s_qf_names[type],
						incoming,
						lockdep_is_held(&sb->s_umount));
			if (stale)
				kfree_rcu_mightsleep(stale);
		}
	}

	if (ctx->spec & EXT4_SPEC_JQFMT)
		sbi->s_jquota_fmt = ctx->s_jquota_fmt;
#endif
}
2595e6e268cbSLukas Czerner
/*
 * Check quota settings consistency.
 *
 * Compares the quota options requested in @fc with the state already held by
 * @sb.  Returns 0 if the combination is acceptable and -EINVAL (after logging
 * the reason) otherwise.  Always returns 0 when CONFIG_QUOTA is disabled.
 *
 * Note that this may clear the USRQUOTA/GRPQUOTA options in the context when
 * a quota file name is in effect for the respective type.
 */
static int ext4_check_quota_consistency(struct fs_context *fc,
					struct super_block *sb)
{
#ifdef CONFIG_QUOTA
	struct ext4_fs_context *ctx = fc->fs_private;
	struct ext4_sb_info *sbi = EXT4_SB(sb);
	bool quota_feature = ext4_has_feature_quota(sb);
	bool quota_loaded = sb_any_quota_loaded(sb);
	bool named_usr, named_grp, plain_usr, plain_grp;
	int quota_flags, type;

	/*
	 * Only project quota is tied to a feature flag here; 'usrquota' and
	 * 'grpquota' stay usable without the quota feature so that legacy
	 * quota files keep working.
	 */
	if (ctx_test_mount_opt(ctx, EXT4_MOUNT_PRJQUOTA) &&
	    !ext4_has_feature_project(sb)) {
		ext4_msg(NULL, KERN_ERR,
			 "Project quota feature not enabled. "
			 "Cannot enable project quota enforcement.");
		return -EINVAL;
	}

	quota_flags = EXT4_MOUNT_QUOTA | EXT4_MOUNT_USRQUOTA |
		      EXT4_MOUNT_GRPQUOTA | EXT4_MOUNT_PRJQUOTA;
	if (quota_loaded &&
	    (ctx->mask_s_mount_opt & quota_flags) &&
	    !ctx_test_mount_opt(ctx, quota_flags)) {
		ext4_msg(NULL, KERN_ERR,
			 "Cannot change quota options when quota turned on");
		return -EINVAL;
	}

	if (ctx->spec & EXT4_SPEC_JQUOTA) {
		for (type = 0; type < EXT4_MAXQUOTAS; type++) {
			if (!(ctx->qname_spec & (1 << type)))
				continue;

			/* Adding or dropping a name while quota is loaded. */
			if (quota_loaded &&
			    !!sbi->s_qf_names[type] != !!ctx->s_qf_names[type])
				goto err_jquota_change;

			if (!sbi->s_qf_names[type] || !ctx->s_qf_names[type])
				continue;

			/* Both sides name a file: they have to agree. */
			if (strcmp(get_qf_name(sb, sbi, type),
				   ctx->s_qf_names[type]) != 0) {
				ext4_msg(NULL, KERN_ERR,
					 "%s quota file already specified",
					 QTYPE2NAME(type));
				return -EINVAL;
			}
		}

		if (quota_feature) {
			ext4_msg(NULL, KERN_INFO,
				 "Journaled quota options ignored when "
				 "QUOTA feature is enabled");
			return 0;
		}
	}

	if (ctx->spec & EXT4_SPEC_JQFMT) {
		if (quota_loaded && sbi->s_jquota_fmt != ctx->s_jquota_fmt)
			goto err_jquota_change;
		if (quota_feature) {
			ext4_msg(NULL, KERN_INFO,
				 "Quota format mount options "
				 "ignored when QUOTA feature is enabled");
			return 0;
		}
	}

	/* Make sure we don't mix old and new quota format */
	named_usr = (get_qf_name(sb, sbi, USRQUOTA) ||
		     ctx->s_qf_names[USRQUOTA]);
	named_grp = (get_qf_name(sb, sbi, GRPQUOTA) ||
		     ctx->s_qf_names[GRPQUOTA]);

	plain_usr = (ctx_test_mount_opt(ctx, EXT4_MOUNT_USRQUOTA) ||
		     test_opt(sb, USRQUOTA));
	plain_grp = (ctx_test_mount_opt(ctx, EXT4_MOUNT_GRPQUOTA) ||
		     test_opt(sb, GRPQUOTA));

	/* A file name for a type overrides the plain option of that type. */
	if (named_usr) {
		ctx_clear_mount_opt(ctx, EXT4_MOUNT_USRQUOTA);
		plain_usr = false;
	}
	if (named_grp) {
		ctx_clear_mount_opt(ctx, EXT4_MOUNT_GRPQUOTA);
		plain_grp = false;
	}

	if (!named_usr && !named_grp)
		return 0;

	if (plain_usr || plain_grp) {
		ext4_msg(NULL, KERN_ERR, "old and new quota format mixing");
		return -EINVAL;
	}

	if (!(ctx->spec & EXT4_SPEC_JQFMT) && !sbi->s_jquota_fmt) {
		ext4_msg(NULL, KERN_ERR,
			 "journaled quota format not specified");
		return -EINVAL;
	}

	return 0;

err_jquota_change:
	ext4_msg(NULL, KERN_ERR,
		 "Cannot change journaled quota options when quota turned on");
	return -EINVAL;
#else
	return 0;
#endif
}
2716e6e268cbSLukas Czerner
ext4_check_test_dummy_encryption(const struct fs_context * fc,struct super_block * sb)27175f41fdaeSEric Biggers static int ext4_check_test_dummy_encryption(const struct fs_context *fc,
27185f41fdaeSEric Biggers struct super_block *sb)
27195f41fdaeSEric Biggers {
27205f41fdaeSEric Biggers const struct ext4_fs_context *ctx = fc->fs_private;
27215f41fdaeSEric Biggers const struct ext4_sb_info *sbi = EXT4_SB(sb);
27225f41fdaeSEric Biggers
272385456054SEric Biggers if (!fscrypt_is_dummy_policy_set(&ctx->dummy_enc_policy))
27245f41fdaeSEric Biggers return 0;
27255f41fdaeSEric Biggers
27265f41fdaeSEric Biggers if (!ext4_has_feature_encrypt(sb)) {
27275f41fdaeSEric Biggers ext4_msg(NULL, KERN_WARNING,
27285f41fdaeSEric Biggers "test_dummy_encryption requires encrypt feature");
27295f41fdaeSEric Biggers return -EINVAL;
27305f41fdaeSEric Biggers }
27315f41fdaeSEric Biggers /*
27325f41fdaeSEric Biggers * This mount option is just for testing, and it's not worthwhile to
27335f41fdaeSEric Biggers * implement the extra complexity (e.g. RCU protection) that would be
27345f41fdaeSEric Biggers * needed to allow it to be set or changed during remount. We do allow
27355f41fdaeSEric Biggers * it to be specified during remount, but only if there is no change.
27365f41fdaeSEric Biggers */
273785456054SEric Biggers if (fc->purpose == FS_CONTEXT_FOR_RECONFIGURE) {
273885456054SEric Biggers if (fscrypt_dummy_policies_equal(&sbi->s_dummy_enc_policy,
273985456054SEric Biggers &ctx->dummy_enc_policy))
274085456054SEric Biggers return 0;
27415f41fdaeSEric Biggers ext4_msg(NULL, KERN_WARNING,
274285456054SEric Biggers "Can't set or change test_dummy_encryption on remount");
27435f41fdaeSEric Biggers return -EINVAL;
27445f41fdaeSEric Biggers }
274585456054SEric Biggers /* Also make sure s_mount_opts didn't contain a conflicting value. */
274685456054SEric Biggers if (fscrypt_is_dummy_policy_set(&sbi->s_dummy_enc_policy)) {
274785456054SEric Biggers if (fscrypt_dummy_policies_equal(&sbi->s_dummy_enc_policy,
274885456054SEric Biggers &ctx->dummy_enc_policy))
27495f41fdaeSEric Biggers return 0;
275085456054SEric Biggers ext4_msg(NULL, KERN_WARNING,
275185456054SEric Biggers "Conflicting test_dummy_encryption options");
275285456054SEric Biggers return -EINVAL;
275385456054SEric Biggers }
27547959eb19SEric Biggers return 0;
275585456054SEric Biggers }
275685456054SEric Biggers
ext4_apply_test_dummy_encryption(struct ext4_fs_context * ctx,struct super_block * sb)275785456054SEric Biggers static void ext4_apply_test_dummy_encryption(struct ext4_fs_context *ctx,
275885456054SEric Biggers struct super_block *sb)
275985456054SEric Biggers {
276085456054SEric Biggers if (!fscrypt_is_dummy_policy_set(&ctx->dummy_enc_policy) ||
276185456054SEric Biggers /* if already set, it was already verified to be the same */
276285456054SEric Biggers fscrypt_is_dummy_policy_set(&EXT4_SB(sb)->s_dummy_enc_policy))
276385456054SEric Biggers return;
276485456054SEric Biggers EXT4_SB(sb)->s_dummy_enc_policy = ctx->dummy_enc_policy;
276585456054SEric Biggers memset(&ctx->dummy_enc_policy, 0, sizeof(ctx->dummy_enc_policy));
276685456054SEric Biggers ext4_msg(sb, KERN_WARNING, "Test dummy encryption mode enabled");
27675f41fdaeSEric Biggers }
27685f41fdaeSEric Biggers
ext4_check_opt_consistency(struct fs_context * fc,struct super_block * sb)2769b6bd2435SLukas Czerner static int ext4_check_opt_consistency(struct fs_context *fc,
2770b6bd2435SLukas Czerner struct super_block *sb)
2771b6bd2435SLukas Czerner {
2772b6bd2435SLukas Czerner struct ext4_fs_context *ctx = fc->fs_private;
27736e47a3ccSLukas Czerner struct ext4_sb_info *sbi = fc->s_fs_info;
27746e47a3ccSLukas Czerner int is_remount = fc->purpose == FS_CONTEXT_FOR_RECONFIGURE;
27755f41fdaeSEric Biggers int err;
2776b6bd2435SLukas Czerner
2777b6bd2435SLukas Czerner if ((ctx->opt_flags & MOPT_NO_EXT2) && IS_EXT2_SB(sb)) {
2778b6bd2435SLukas Czerner ext4_msg(NULL, KERN_ERR,
2779b6bd2435SLukas Czerner "Mount option(s) incompatible with ext2");
2780b6bd2435SLukas Czerner return -EINVAL;
2781b6bd2435SLukas Czerner }
2782b6bd2435SLukas Czerner if ((ctx->opt_flags & MOPT_NO_EXT3) && IS_EXT3_SB(sb)) {
2783b6bd2435SLukas Czerner ext4_msg(NULL, KERN_ERR,
2784b6bd2435SLukas Czerner "Mount option(s) incompatible with ext3");
2785b6bd2435SLukas Czerner return -EINVAL;
2786b6bd2435SLukas Czerner }
2787b6bd2435SLukas Czerner
27886e47a3ccSLukas Czerner if (ctx->s_want_extra_isize >
27896e47a3ccSLukas Czerner (sbi->s_inode_size - EXT4_GOOD_OLD_INODE_SIZE)) {
27906e47a3ccSLukas Czerner ext4_msg(NULL, KERN_ERR,
27916e47a3ccSLukas Czerner "Invalid want_extra_isize %d",
27926e47a3ccSLukas Czerner ctx->s_want_extra_isize);
27936e47a3ccSLukas Czerner return -EINVAL;
27946e47a3ccSLukas Czerner }
27956e47a3ccSLukas Czerner
27966e47a3ccSLukas Czerner if (ctx_test_mount_opt(ctx, EXT4_MOUNT_DIOREAD_NOLOCK)) {
27976e47a3ccSLukas Czerner int blocksize =
27986e47a3ccSLukas Czerner BLOCK_SIZE << le32_to_cpu(sbi->s_es->s_log_block_size);
27996e47a3ccSLukas Czerner if (blocksize < PAGE_SIZE)
28006e47a3ccSLukas Czerner ext4_msg(NULL, KERN_WARNING, "Warning: mounting with an "
28016e47a3ccSLukas Czerner "experimental mount option 'dioread_nolock' "
28026e47a3ccSLukas Czerner "for blocksize < PAGE_SIZE");
28036e47a3ccSLukas Czerner }
28046e47a3ccSLukas Czerner
28055f41fdaeSEric Biggers err = ext4_check_test_dummy_encryption(fc, sb);
28065f41fdaeSEric Biggers if (err)
28075f41fdaeSEric Biggers return err;
28086e47a3ccSLukas Czerner
28096e47a3ccSLukas Czerner if ((ctx->spec & EXT4_SPEC_DATAJ) && is_remount) {
28106e47a3ccSLukas Czerner if (!sbi->s_journal) {
28116e47a3ccSLukas Czerner ext4_msg(NULL, KERN_WARNING,
28126e47a3ccSLukas Czerner "Remounting file system with no journal "
28136e47a3ccSLukas Czerner "so ignoring journalled data option");
28146e47a3ccSLukas Czerner ctx_clear_mount_opt(ctx, EXT4_MOUNT_DATA_FLAGS);
28154c246728SLukas Czerner } else if (ctx_test_mount_opt(ctx, EXT4_MOUNT_DATA_FLAGS) !=
28164c246728SLukas Czerner test_opt(sb, DATA_FLAGS)) {
28176e47a3ccSLukas Czerner ext4_msg(NULL, KERN_ERR, "Cannot change data mode "
28186e47a3ccSLukas Czerner "on remount");
28196e47a3ccSLukas Czerner return -EINVAL;
28206e47a3ccSLukas Czerner }
28216e47a3ccSLukas Czerner }
28226e47a3ccSLukas Czerner
28236e47a3ccSLukas Czerner if (is_remount) {
28246e47a3ccSLukas Czerner if (ctx_test_mount_opt(ctx, EXT4_MOUNT_DAX_ALWAYS) &&
28256e47a3ccSLukas Czerner (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_JOURNAL_DATA)) {
28266e47a3ccSLukas Czerner ext4_msg(NULL, KERN_ERR, "can't mount with "
28276e47a3ccSLukas Czerner "both data=journal and dax");
28286e47a3ccSLukas Czerner return -EINVAL;
28296e47a3ccSLukas Czerner }
28306e47a3ccSLukas Czerner
28316e47a3ccSLukas Czerner if (ctx_test_mount_opt(ctx, EXT4_MOUNT_DAX_ALWAYS) &&
28326e47a3ccSLukas Czerner (!(sbi->s_mount_opt & EXT4_MOUNT_DAX_ALWAYS) ||
28336e47a3ccSLukas Czerner (sbi->s_mount_opt2 & EXT4_MOUNT2_DAX_NEVER))) {
28346e47a3ccSLukas Czerner fail_dax_change_remount:
28356e47a3ccSLukas Czerner ext4_msg(NULL, KERN_ERR, "can't change "
28366e47a3ccSLukas Czerner "dax mount option while remounting");
28376e47a3ccSLukas Czerner return -EINVAL;
28386e47a3ccSLukas Czerner } else if (ctx_test_mount_opt2(ctx, EXT4_MOUNT2_DAX_NEVER) &&
28396e47a3ccSLukas Czerner (!(sbi->s_mount_opt2 & EXT4_MOUNT2_DAX_NEVER) ||
28406e47a3ccSLukas Czerner (sbi->s_mount_opt & EXT4_MOUNT_DAX_ALWAYS))) {
28416e47a3ccSLukas Czerner goto fail_dax_change_remount;
28426e47a3ccSLukas Czerner } else if (ctx_test_mount_opt2(ctx, EXT4_MOUNT2_DAX_INODE) &&
28436e47a3ccSLukas Czerner ((sbi->s_mount_opt & EXT4_MOUNT_DAX_ALWAYS) ||
28446e47a3ccSLukas Czerner (sbi->s_mount_opt2 & EXT4_MOUNT2_DAX_NEVER) ||
28456e47a3ccSLukas Czerner !(sbi->s_mount_opt2 & EXT4_MOUNT2_DAX_INODE))) {
28466e47a3ccSLukas Czerner goto fail_dax_change_remount;
28476e47a3ccSLukas Czerner }
28486e47a3ccSLukas Czerner }
28496e47a3ccSLukas Czerner
2850b6bd2435SLukas Czerner return ext4_check_quota_consistency(fc, sb);
2851b6bd2435SLukas Czerner }
2852b6bd2435SLukas Czerner
ext4_apply_options(struct fs_context * fc,struct super_block * sb)285385456054SEric Biggers static void ext4_apply_options(struct fs_context *fc, struct super_block *sb)
28546e47a3ccSLukas Czerner {
28556e47a3ccSLukas Czerner struct ext4_fs_context *ctx = fc->fs_private;
28566e47a3ccSLukas Czerner struct ext4_sb_info *sbi = fc->s_fs_info;
28576e47a3ccSLukas Czerner
28586e47a3ccSLukas Czerner sbi->s_mount_opt &= ~ctx->mask_s_mount_opt;
28596e47a3ccSLukas Czerner sbi->s_mount_opt |= ctx->vals_s_mount_opt;
28606e47a3ccSLukas Czerner sbi->s_mount_opt2 &= ~ctx->mask_s_mount_opt2;
28616e47a3ccSLukas Czerner sbi->s_mount_opt2 |= ctx->vals_s_mount_opt2;
28626e47a3ccSLukas Czerner sb->s_flags &= ~ctx->mask_s_flags;
28636e47a3ccSLukas Czerner sb->s_flags |= ctx->vals_s_flags;
28646e47a3ccSLukas Czerner
28656e47a3ccSLukas Czerner #define APPLY(X) ({ if (ctx->spec & EXT4_SPEC_##X) sbi->X = ctx->X; })
28666e47a3ccSLukas Czerner APPLY(s_commit_interval);
28676e47a3ccSLukas Czerner APPLY(s_stripe);
28686e47a3ccSLukas Czerner APPLY(s_max_batch_time);
28696e47a3ccSLukas Czerner APPLY(s_min_batch_time);
28706e47a3ccSLukas Czerner APPLY(s_want_extra_isize);
28716e47a3ccSLukas Czerner APPLY(s_inode_readahead_blks);
28726e47a3ccSLukas Czerner APPLY(s_max_dir_size_kb);
28736e47a3ccSLukas Czerner APPLY(s_li_wait_mult);
28746e47a3ccSLukas Czerner APPLY(s_resgid);
28756e47a3ccSLukas Czerner APPLY(s_resuid);
28766e47a3ccSLukas Czerner
28776e47a3ccSLukas Czerner #ifdef CONFIG_EXT4_DEBUG
28786e47a3ccSLukas Czerner APPLY(s_fc_debug_max_replay);
28796e47a3ccSLukas Czerner #endif
28806e47a3ccSLukas Czerner
28816e47a3ccSLukas Czerner ext4_apply_quota_options(fc, sb);
288285456054SEric Biggers ext4_apply_test_dummy_encryption(ctx, sb);
28836e47a3ccSLukas Czerner }
28846e47a3ccSLukas Czerner
28856e47a3ccSLukas Czerner
/*
 * Check the quota options gathered in the filesystem context.
 *
 * If a quota file name was supplied for a quota type, the matching
 * EXT4_MOUNT_USRQUOTA / EXT4_MOUNT_GRPQUOTA flag is dropped from the
 * context.  Should either flag still be set afterwards, the options are
 * rejected as a mix of old and new quota formats.
 *
 * Returns 1 when the options are acceptable and -EINVAL otherwise.
 * Without CONFIG_QUOTA there is nothing to check and 1 is returned.
 */
static int ext4_validate_options(struct fs_context *fc)
{
#ifdef CONFIG_QUOTA
	struct ext4_fs_context *ctx = fc->fs_private;
	char *usr_name = ctx->s_qf_names[USRQUOTA];
	char *grp_name = ctx->s_qf_names[GRPQUOTA];

	/* No quota file names given: nothing can conflict. */
	if (!usr_name && !grp_name)
		return 1;

	if (usr_name && ctx_test_mount_opt(ctx, EXT4_MOUNT_USRQUOTA))
		ctx_clear_mount_opt(ctx, EXT4_MOUNT_USRQUOTA);

	if (grp_name && ctx_test_mount_opt(ctx, EXT4_MOUNT_GRPQUOTA))
		ctx_clear_mount_opt(ctx, EXT4_MOUNT_GRPQUOTA);

	if (ctx_test_mount_opt(ctx, EXT4_MOUNT_USRQUOTA) ||
	    ctx_test_mount_opt(ctx, EXT4_MOUNT_GRPQUOTA)) {
		ext4_msg(NULL, KERN_ERR, "old and new quota "
			 "format mixing");
		return -EINVAL;
	}
#endif
	return 1;
}
2912ac27a0ecSDave Kleikamp
/*
 * Append the quota-related mount options of @sb to @seq: ",jqfmt=<name>"
 * when a journaled quota format is set, followed by the "usrjquota" and
 * "grpjquota" file names when present.  Compiles to an empty function
 * without CONFIG_QUOTA.
 */
static inline void ext4_show_quota_options(struct seq_file *seq,
					   struct super_block *sb)
{
#if defined(CONFIG_QUOTA)
	struct ext4_sb_info *sbi = EXT4_SB(sb);
	char *usr_name, *grp_name;

	if (sbi->s_jquota_fmt) {
		/* Formats not listed below are printed as an empty name. */
		char *fmt = "";

		switch (sbi->s_jquota_fmt) {
		case QFMT_VFS_OLD:
			fmt = "vfsold";
			break;
		case QFMT_VFS_V0:
			fmt = "vfsv0";
			break;
		case QFMT_VFS_V1:
			fmt = "vfsv1";
			break;
		}
		seq_printf(seq, ",jqfmt=%s", fmt);
	}

	/* The name pointers are fetched and used inside one RCU read section. */
	rcu_read_lock();
	usr_name = rcu_dereference(sbi->s_qf_names[USRQUOTA]);
	grp_name = rcu_dereference(sbi->s_qf_names[GRPQUOTA]);
	if (usr_name)
		seq_show_option(seq, "usrjquota", usr_name);
	if (grp_name)
		seq_show_option(seq, "grpjquota", grp_name);
	rcu_read_unlock();
#endif
}
29472adf6da8STheodore Ts'o
token2str(int token)29485a916be1STheodore Ts'o static const char *token2str(int token)
29495a916be1STheodore Ts'o {
295097d8a670SLukas Czerner const struct fs_parameter_spec *spec;
29515a916be1STheodore Ts'o
295297d8a670SLukas Czerner for (spec = ext4_param_specs; spec->name != NULL; spec++)
295397d8a670SLukas Czerner if (spec->opt == token && !spec->type)
29545a916be1STheodore Ts'o break;
295597d8a670SLukas Czerner return spec->name;
29565a916be1STheodore Ts'o }
29575a916be1STheodore Ts'o
29582adf6da8STheodore Ts'o /*
29592adf6da8STheodore Ts'o * Show an option if
29602adf6da8STheodore Ts'o * - it's set to a non-default value OR
29612adf6da8STheodore Ts'o * - if the per-sb default is different from the global default
29622adf6da8STheodore Ts'o */
_ext4_show_options(struct seq_file * seq,struct super_block * sb,int nodefs)296366acdcf4STheodore Ts'o static int _ext4_show_options(struct seq_file *seq, struct super_block *sb,
296466acdcf4STheodore Ts'o int nodefs)
29652adf6da8STheodore Ts'o {
29662adf6da8STheodore Ts'o struct ext4_sb_info *sbi = EXT4_SB(sb);
29672adf6da8STheodore Ts'o struct ext4_super_block *es = sbi->s_es;
2968e3645d72SZhang Yi int def_errors;
29695a916be1STheodore Ts'o const struct mount_opts *m;
297066acdcf4STheodore Ts'o char sep = nodefs ? '\n' : ',';
29712adf6da8STheodore Ts'o
297266acdcf4STheodore Ts'o #define SEQ_OPTS_PUTS(str) seq_printf(seq, "%c" str, sep)
297366acdcf4STheodore Ts'o #define SEQ_OPTS_PRINT(str, arg) seq_printf(seq, "%c" str, sep, arg)
29742adf6da8STheodore Ts'o
29752adf6da8STheodore Ts'o if (sbi->s_sb_block != 1)
29765a916be1STheodore Ts'o SEQ_OPTS_PRINT("sb=%llu", sbi->s_sb_block);
29775a916be1STheodore Ts'o
29785a916be1STheodore Ts'o for (m = ext4_mount_opts; m->token != Opt_err; m++) {
29795a916be1STheodore Ts'o int want_set = m->flags & MOPT_SET;
2980e3645d72SZhang Yi int opt_2 = m->flags & MOPT_2;
2981e3645d72SZhang Yi unsigned int mount_opt, def_mount_opt;
2982e3645d72SZhang Yi
29835a916be1STheodore Ts'o if (((m->flags & (MOPT_SET|MOPT_CLEAR)) == 0) ||
2984ba2e524dSLukas Czerner m->flags & MOPT_SKIP)
29855a916be1STheodore Ts'o continue;
2986e3645d72SZhang Yi
2987e3645d72SZhang Yi if (opt_2) {
2988e3645d72SZhang Yi mount_opt = sbi->s_mount_opt2;
2989e3645d72SZhang Yi def_mount_opt = sbi->s_def_mount_opt2;
2990e3645d72SZhang Yi } else {
2991e3645d72SZhang Yi mount_opt = sbi->s_mount_opt;
2992e3645d72SZhang Yi def_mount_opt = sbi->s_def_mount_opt;
2993e3645d72SZhang Yi }
2994e3645d72SZhang Yi /* skip if same as the default */
2995e3645d72SZhang Yi if (!nodefs && !(m->mount_opt & (mount_opt ^ def_mount_opt)))
2996e3645d72SZhang Yi continue;
2997e3645d72SZhang Yi /* select Opt_noFoo vs Opt_Foo */
29985a916be1STheodore Ts'o if ((want_set &&
2999e3645d72SZhang Yi (mount_opt & m->mount_opt) != m->mount_opt) ||
3000e3645d72SZhang Yi (!want_set && (mount_opt & m->mount_opt)))
3001e3645d72SZhang Yi continue;
30025a916be1STheodore Ts'o SEQ_OPTS_PRINT("%s", token2str(m->token));
30035a916be1STheodore Ts'o }
30045a916be1STheodore Ts'o
300508cefc7aSEric W. Biederman if (nodefs || !uid_eq(sbi->s_resuid, make_kuid(&init_user_ns, EXT4_DEF_RESUID)) ||
30065a916be1STheodore Ts'o le16_to_cpu(es->s_def_resuid) != EXT4_DEF_RESUID)
300708cefc7aSEric W. Biederman SEQ_OPTS_PRINT("resuid=%u",
300808cefc7aSEric W. Biederman from_kuid_munged(&init_user_ns, sbi->s_resuid));
300908cefc7aSEric W. Biederman if (nodefs || !gid_eq(sbi->s_resgid, make_kgid(&init_user_ns, EXT4_DEF_RESGID)) ||
30105a916be1STheodore Ts'o le16_to_cpu(es->s_def_resgid) != EXT4_DEF_RESGID)
301108cefc7aSEric W. Biederman SEQ_OPTS_PRINT("resgid=%u",
301208cefc7aSEric W. Biederman from_kgid_munged(&init_user_ns, sbi->s_resgid));
301366acdcf4STheodore Ts'o def_errors = nodefs ? -1 : le16_to_cpu(es->s_errors);
30145a916be1STheodore Ts'o if (test_opt(sb, ERRORS_RO) && def_errors != EXT4_ERRORS_RO)
30155a916be1STheodore Ts'o SEQ_OPTS_PUTS("errors=remount-ro");
30162adf6da8STheodore Ts'o if (test_opt(sb, ERRORS_CONT) && def_errors != EXT4_ERRORS_CONTINUE)
30175a916be1STheodore Ts'o SEQ_OPTS_PUTS("errors=continue");
30182adf6da8STheodore Ts'o if (test_opt(sb, ERRORS_PANIC) && def_errors != EXT4_ERRORS_PANIC)
30195a916be1STheodore Ts'o SEQ_OPTS_PUTS("errors=panic");
302066acdcf4STheodore Ts'o if (nodefs || sbi->s_commit_interval != JBD2_DEFAULT_MAX_COMMIT_AGE*HZ)
30215a916be1STheodore Ts'o SEQ_OPTS_PRINT("commit=%lu", sbi->s_commit_interval / HZ);
302266acdcf4STheodore Ts'o if (nodefs || sbi->s_min_batch_time != EXT4_DEF_MIN_BATCH_TIME)
30235a916be1STheodore Ts'o SEQ_OPTS_PRINT("min_batch_time=%u", sbi->s_min_batch_time);
302466acdcf4STheodore Ts'o if (nodefs || sbi->s_max_batch_time != EXT4_DEF_MAX_BATCH_TIME)
30255a916be1STheodore Ts'o SEQ_OPTS_PRINT("max_batch_time=%u", sbi->s_max_batch_time);
302666acdcf4STheodore Ts'o if (nodefs || sbi->s_stripe)
30275a916be1STheodore Ts'o SEQ_OPTS_PRINT("stripe=%lu", sbi->s_stripe);
302868afa7e0STyson Nottingham if (nodefs || EXT4_MOUNT_DATA_FLAGS &
3029e3645d72SZhang Yi (sbi->s_mount_opt ^ sbi->s_def_mount_opt)) {
30302adf6da8STheodore Ts'o if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_JOURNAL_DATA)
30315a916be1STheodore Ts'o SEQ_OPTS_PUTS("data=journal");
30322adf6da8STheodore Ts'o else if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_ORDERED_DATA)
30335a916be1STheodore Ts'o SEQ_OPTS_PUTS("data=ordered");
30342adf6da8STheodore Ts'o else if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_WRITEBACK_DATA)
30355a916be1STheodore Ts'o SEQ_OPTS_PUTS("data=writeback");
30365a916be1STheodore Ts'o }
303766acdcf4STheodore Ts'o if (nodefs ||
303866acdcf4STheodore Ts'o sbi->s_inode_readahead_blks != EXT4_DEF_INODE_READAHEAD_BLKS)
30395a916be1STheodore Ts'o SEQ_OPTS_PRINT("inode_readahead_blks=%u",
30402adf6da8STheodore Ts'o sbi->s_inode_readahead_blks);
30412adf6da8STheodore Ts'o
3042ceec0376STyson Nottingham if (test_opt(sb, INIT_INODE_TABLE) && (nodefs ||
304366acdcf4STheodore Ts'o (sbi->s_li_wait_mult != EXT4_DEF_LI_WAIT_MULT)))
30445a916be1STheodore Ts'o SEQ_OPTS_PRINT("init_itable=%u", sbi->s_li_wait_mult);
3045df981d03STheodore Ts'o if (nodefs || sbi->s_max_dir_size_kb)
3046df981d03STheodore Ts'o SEQ_OPTS_PRINT("max_dir_size_kb=%u", sbi->s_max_dir_size_kb);
30477915a861SAles Novak if (test_opt(sb, DATA_ERR_ABORT))
30487915a861SAles Novak SEQ_OPTS_PUTS("data_err=abort");
3049ed318a6cSEric Biggers
3050ed318a6cSEric Biggers fscrypt_show_test_dummy_encryption(seq, sep, sb);
30512adf6da8STheodore Ts'o
30524f74d15fSEric Biggers if (sb->s_flags & SB_INLINECRYPT)
30534f74d15fSEric Biggers SEQ_OPTS_PUTS("inlinecrypt");
30544f74d15fSEric Biggers
30559cb20f94SIra Weiny if (test_opt(sb, DAX_ALWAYS)) {
30569cb20f94SIra Weiny if (IS_EXT2_SB(sb))
30579cb20f94SIra Weiny SEQ_OPTS_PUTS("dax");
30589cb20f94SIra Weiny else
30599cb20f94SIra Weiny SEQ_OPTS_PUTS("dax=always");
30609cb20f94SIra Weiny } else if (test_opt2(sb, DAX_NEVER)) {
30619cb20f94SIra Weiny SEQ_OPTS_PUTS("dax=never");
30629cb20f94SIra Weiny } else if (test_opt2(sb, DAX_INODE)) {
30639cb20f94SIra Weiny SEQ_OPTS_PUTS("dax=inode");
30649cb20f94SIra Weiny }
30653fa5d23eSOjaswin Mujoo
30663fa5d23eSOjaswin Mujoo if (sbi->s_groups_count >= MB_DEFAULT_LINEAR_SCAN_THRESHOLD &&
30673fa5d23eSOjaswin Mujoo !test_opt2(sb, MB_OPTIMIZE_SCAN)) {
30683fa5d23eSOjaswin Mujoo SEQ_OPTS_PUTS("mb_optimize_scan=0");
30693fa5d23eSOjaswin Mujoo } else if (sbi->s_groups_count < MB_DEFAULT_LINEAR_SCAN_THRESHOLD &&
30703fa5d23eSOjaswin Mujoo test_opt2(sb, MB_OPTIMIZE_SCAN)) {
30713fa5d23eSOjaswin Mujoo SEQ_OPTS_PUTS("mb_optimize_scan=1");
30723fa5d23eSOjaswin Mujoo }
30733fa5d23eSOjaswin Mujoo
30742adf6da8STheodore Ts'o ext4_show_quota_options(seq, sb);
30752adf6da8STheodore Ts'o return 0;
30762adf6da8STheodore Ts'o }
30772adf6da8STheodore Ts'o
ext4_show_options(struct seq_file * seq,struct dentry * root)307866acdcf4STheodore Ts'o static int ext4_show_options(struct seq_file *seq, struct dentry *root)
307966acdcf4STheodore Ts'o {
308066acdcf4STheodore Ts'o return _ext4_show_options(seq, root->d_sb, 0);
308166acdcf4STheodore Ts'o }
308266acdcf4STheodore Ts'o
ext4_seq_options_show(struct seq_file * seq,void * offset)3083ebd173beSTheodore Ts'o int ext4_seq_options_show(struct seq_file *seq, void *offset)
308466acdcf4STheodore Ts'o {
308566acdcf4STheodore Ts'o struct super_block *sb = seq->private;
308666acdcf4STheodore Ts'o int rc;
308766acdcf4STheodore Ts'o
3088bc98a42cSDavid Howells seq_puts(seq, sb_rdonly(sb) ? "ro" : "rw");
308966acdcf4STheodore Ts'o rc = _ext4_show_options(seq, sb, 1);
309066acdcf4STheodore Ts'o seq_puts(seq, "\n");
309166acdcf4STheodore Ts'o return rc;
309266acdcf4STheodore Ts'o }
309366acdcf4STheodore Ts'o
ext4_setup_super(struct super_block * sb,struct ext4_super_block * es,int read_only)3094617ba13bSMingming Cao static int ext4_setup_super(struct super_block *sb, struct ext4_super_block *es,
3095ac27a0ecSDave Kleikamp int read_only)
3096ac27a0ecSDave Kleikamp {
3097617ba13bSMingming Cao struct ext4_sb_info *sbi = EXT4_SB(sb);
3098c89128a0SJaegeuk Kim int err = 0;
3099ac27a0ecSDave Kleikamp
3100617ba13bSMingming Cao if (le32_to_cpu(es->s_rev_level) > EXT4_MAX_SUPP_REV) {
3101b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "revision level too high, "
3102b31e1552SEric Sandeen "forcing read-only mode");
3103c89128a0SJaegeuk Kim err = -EROFS;
31045adaccacSyangerkun goto done;
3105ac27a0ecSDave Kleikamp }
3106ac27a0ecSDave Kleikamp if (read_only)
3107281b5995STheodore Ts'o goto done;
3108617ba13bSMingming Cao if (!(sbi->s_mount_state & EXT4_VALID_FS))
3109b31e1552SEric Sandeen ext4_msg(sb, KERN_WARNING, "warning: mounting unchecked fs, "
3110b31e1552SEric Sandeen "running e2fsck is recommended");
3111c8b459f4SLukas Czerner else if (sbi->s_mount_state & EXT4_ERROR_FS)
3112b31e1552SEric Sandeen ext4_msg(sb, KERN_WARNING,
3113b31e1552SEric Sandeen "warning: mounting fs with errors, "
3114b31e1552SEric Sandeen "running e2fsck is recommended");
3115ed3ce80aSTao Ma else if ((__s16) le16_to_cpu(es->s_max_mnt_count) > 0 &&
3116ac27a0ecSDave Kleikamp le16_to_cpu(es->s_mnt_count) >=
3117ac27a0ecSDave Kleikamp (unsigned short) (__s16) le16_to_cpu(es->s_max_mnt_count))
3118b31e1552SEric Sandeen ext4_msg(sb, KERN_WARNING,
3119b31e1552SEric Sandeen "warning: maximal mount count reached, "
3120b31e1552SEric Sandeen "running e2fsck is recommended");
3121ac27a0ecSDave Kleikamp else if (le32_to_cpu(es->s_checkinterval) &&
31226a0678a7SArnd Bergmann (ext4_get_tstamp(es, s_lastcheck) +
31236a0678a7SArnd Bergmann le32_to_cpu(es->s_checkinterval) <= ktime_get_real_seconds()))
3124b31e1552SEric Sandeen ext4_msg(sb, KERN_WARNING,
3125b31e1552SEric Sandeen "warning: checktime reached, "
3126b31e1552SEric Sandeen "running e2fsck is recommended");
31270390131bSFrank Mayhar if (!sbi->s_journal)
3128216c34b2SMarcin Slusarz es->s_state &= cpu_to_le16(~EXT4_VALID_FS);
3129ac27a0ecSDave Kleikamp if (!(__s16) le16_to_cpu(es->s_max_mnt_count))
3130617ba13bSMingming Cao es->s_max_mnt_count = cpu_to_le16(EXT4_DFL_MAX_MNT_COUNT);
3131e8546d06SMarcin Slusarz le16_add_cpu(&es->s_mnt_count, 1);
31326a0678a7SArnd Bergmann ext4_update_tstamp(es, s_mtime);
313302f310fcSJan Kara if (sbi->s_journal) {
3134e2b911c5SDarrick J. Wong ext4_set_feature_journal_needs_recovery(sb);
313502f310fcSJan Kara if (ext4_has_feature_orphan_file(sb))
313602f310fcSJan Kara ext4_set_feature_orphan_present(sb);
313702f310fcSJan Kara }
3138ac27a0ecSDave Kleikamp
31394392fbc4SJan Kara err = ext4_commit_super(sb);
3140281b5995STheodore Ts'o done:
3141ac27a0ecSDave Kleikamp if (test_opt(sb, DEBUG))
3142a9df9a49STheodore Ts'o printk(KERN_INFO "[EXT4 FS bs=%lu, gc=%u, "
3143a2595b8aSTheodore Ts'o "bpg=%lu, ipg=%lu, mo=%04x, mo2=%04x]\n",
3144ac27a0ecSDave Kleikamp sb->s_blocksize,
3145ac27a0ecSDave Kleikamp sbi->s_groups_count,
3146617ba13bSMingming Cao EXT4_BLOCKS_PER_GROUP(sb),
3147617ba13bSMingming Cao EXT4_INODES_PER_GROUP(sb),
3148a2595b8aSTheodore Ts'o sbi->s_mount_opt, sbi->s_mount_opt2);
3149c89128a0SJaegeuk Kim return err;
3150ac27a0ecSDave Kleikamp }
3151ac27a0ecSDave Kleikamp
/*
 * Grow the array of flex group pointers so that it covers @ngroup block
 * groups.
 *
 * Nothing is done when flex groups are not in use or the array is already
 * large enough.  Otherwise a new pointer array is allocated, new
 * flex_groups structures are allocated for the added slots, the existing
 * pointers are copied over, and the new array is published with
 * rcu_assign_pointer(); the old array is handed to
 * ext4_kvfree_array_rcu().
 *
 * Returns 0 on success or -ENOMEM if an allocation fails.
 */
int ext4_alloc_flex_bg_array(struct super_block *sb, ext4_group_t ngroup)
{
	struct ext4_sb_info *sbi = EXT4_SB(sb);
	struct flex_groups **new_groups, **old_groups;
	int size, i;

	if (!sbi->s_log_groups_per_flex)
		return 0;

	size = ext4_flex_group(sbi, ngroup - 1) + 1;
	if (size <= sbi->s_flex_groups_allocated)
		return 0;

	new_groups = kvzalloc(roundup_pow_of_two(size *
			      sizeof(*sbi->s_flex_groups)), GFP_KERNEL);
	if (!new_groups) {
		ext4_msg(sb, KERN_ERR,
			 "not enough memory for %d flex group pointers", size);
		return -ENOMEM;
	}

	/* Populate only the slots beyond what is already allocated. */
	for (i = sbi->s_flex_groups_allocated; i < size; i++) {
		new_groups[i] = kvzalloc(roundup_pow_of_two(
					 sizeof(struct flex_groups)),
					 GFP_KERNEL);
		if (new_groups[i])
			continue;

		/* Undo the entries allocated by this call, then the array. */
		while (i-- > sbi->s_flex_groups_allocated)
			kvfree(new_groups[i]);
		kvfree(new_groups);
		ext4_msg(sb, KERN_ERR,
			 "not enough memory for %d flex groups", size);
		return -ENOMEM;
	}

	rcu_read_lock();
	old_groups = rcu_dereference(sbi->s_flex_groups);
	if (old_groups)
		memcpy(new_groups, old_groups,
		       (sbi->s_flex_groups_allocated *
			sizeof(struct flex_groups *)));
	rcu_read_unlock();

	rcu_assign_pointer(sbi->s_flex_groups, new_groups);
	sbi->s_flex_groups_allocated = size;
	if (old_groups)
		ext4_kvfree_array_rcu(old_groups);

	return 0;
}
3198117fff10STheodore Ts'o
ext4_fill_flex_info(struct super_block * sb)3199772cb7c8SJose R. Santos static int ext4_fill_flex_info(struct super_block *sb)
3200772cb7c8SJose R. Santos {
3201772cb7c8SJose R. Santos struct ext4_sb_info *sbi = EXT4_SB(sb);
3202772cb7c8SJose R. Santos struct ext4_group_desc *gdp = NULL;
32037c990728SSuraj Jitindar Singh struct flex_groups *fg;
3204772cb7c8SJose R. Santos ext4_group_t flex_group;
3205117fff10STheodore Ts'o int i, err;
3206772cb7c8SJose R. Santos
3207503358aeSTheodore Ts'o sbi->s_log_groups_per_flex = sbi->s_es->s_log_groups_per_flex;
3208d50f2ab6SXi Wang if (sbi->s_log_groups_per_flex < 1 || sbi->s_log_groups_per_flex > 31) {
3209772cb7c8SJose R. Santos sbi->s_log_groups_per_flex = 0;
3210772cb7c8SJose R. Santos return 1;
3211772cb7c8SJose R. Santos }
3212772cb7c8SJose R. Santos
3213117fff10STheodore Ts'o err = ext4_alloc_flex_bg_array(sb, sbi->s_groups_count);
3214117fff10STheodore Ts'o if (err)
3215772cb7c8SJose R. Santos goto failed;
3216772cb7c8SJose R. Santos
3217772cb7c8SJose R. Santos for (i = 0; i < sbi->s_groups_count; i++) {
321888b6edd1STheodore Ts'o gdp = ext4_get_group_desc(sb, i, NULL);
3219772cb7c8SJose R. Santos
3220772cb7c8SJose R. Santos flex_group = ext4_flex_group(sbi, i);
32217c990728SSuraj Jitindar Singh fg = sbi_array_rcu_deref(sbi, s_flex_groups, flex_group);
32227c990728SSuraj Jitindar Singh atomic_add(ext4_free_inodes_count(sb, gdp), &fg->free_inodes);
322390ba983fSTheodore Ts'o atomic64_add(ext4_free_group_clusters(sb, gdp),
32247c990728SSuraj Jitindar Singh &fg->free_clusters);
32257c990728SSuraj Jitindar Singh atomic_add(ext4_used_dirs_count(sb, gdp), &fg->used_dirs);
3226772cb7c8SJose R. Santos }
3227772cb7c8SJose R. Santos
3228772cb7c8SJose R. Santos return 1;
3229772cb7c8SJose R. Santos failed:
3230772cb7c8SJose R. Santos return 0;
3231772cb7c8SJose R. Santos }
3232772cb7c8SJose R. Santos
ext4_group_desc_csum(struct super_block * sb,__u32 block_group,struct ext4_group_desc * gdp)3233e2b911c5SDarrick J. Wong static __le16 ext4_group_desc_csum(struct super_block *sb, __u32 block_group,
3234717d50e4SAndreas Dilger struct ext4_group_desc *gdp)
3235717d50e4SAndreas Dilger {
3236b47820edSDaeho Jeong int offset = offsetof(struct ext4_group_desc, bg_checksum);
3237717d50e4SAndreas Dilger __u16 crc = 0;
3238717d50e4SAndreas Dilger __le32 le_group = cpu_to_le32(block_group);
3239e2b911c5SDarrick J. Wong struct ext4_sb_info *sbi = EXT4_SB(sb);
3240717d50e4SAndreas Dilger
32419aa5d32bSDmitry Monakhov if (ext4_has_metadata_csum(sbi->s_sb)) {
3242feb0ab32SDarrick J. Wong /* Use new metadata_csum algorithm */
3243feb0ab32SDarrick J. Wong __u32 csum32;
3244b47820edSDaeho Jeong __u16 dummy_csum = 0;
3245feb0ab32SDarrick J. Wong
3246feb0ab32SDarrick J. Wong csum32 = ext4_chksum(sbi, sbi->s_csum_seed, (__u8 *)&le_group,
3247feb0ab32SDarrick J. Wong sizeof(le_group));
3248b47820edSDaeho Jeong csum32 = ext4_chksum(sbi, csum32, (__u8 *)gdp, offset);
3249b47820edSDaeho Jeong csum32 = ext4_chksum(sbi, csum32, (__u8 *)&dummy_csum,
3250b47820edSDaeho Jeong sizeof(dummy_csum));
3251b47820edSDaeho Jeong offset += sizeof(dummy_csum);
3252b47820edSDaeho Jeong if (offset < sbi->s_desc_size)
3253b47820edSDaeho Jeong csum32 = ext4_chksum(sbi, csum32, (__u8 *)gdp + offset,
3254b47820edSDaeho Jeong sbi->s_desc_size - offset);
3255feb0ab32SDarrick J. Wong
3256feb0ab32SDarrick J. Wong crc = csum32 & 0xFFFF;
3257feb0ab32SDarrick J. Wong goto out;
3258feb0ab32SDarrick J. Wong }
3259feb0ab32SDarrick J. Wong
3260feb0ab32SDarrick J. Wong /* old crc16 code */
3261e2b911c5SDarrick J. Wong if (!ext4_has_feature_gdt_csum(sb))
3262813d32f9SDarrick J. Wong return 0;
3263813d32f9SDarrick J. Wong
3264717d50e4SAndreas Dilger crc = crc16(~0, sbi->s_es->s_uuid, sizeof(sbi->s_es->s_uuid));
3265717d50e4SAndreas Dilger crc = crc16(crc, (__u8 *)&le_group, sizeof(le_group));
3266717d50e4SAndreas Dilger crc = crc16(crc, (__u8 *)gdp, offset);
3267717d50e4SAndreas Dilger offset += sizeof(gdp->bg_checksum); /* skip checksum */
3268717d50e4SAndreas Dilger /* for checksum of struct ext4_group_desc do the rest...*/
32694f043518STudor Ambarus if (ext4_has_feature_64bit(sb) && offset < sbi->s_desc_size)
3270717d50e4SAndreas Dilger crc = crc16(crc, (__u8 *)gdp + offset,
32714f043518STudor Ambarus sbi->s_desc_size - offset);
3272717d50e4SAndreas Dilger
3273feb0ab32SDarrick J. Wong out:
3274717d50e4SAndreas Dilger return cpu_to_le16(crc);
3275717d50e4SAndreas Dilger }
3276717d50e4SAndreas Dilger
/*
 * Check the stored checksum of group descriptor @gdp.
 *
 * Returns 1 if group descriptor checksums are not in use or the stored
 * value matches the computed one, and 0 on a mismatch.
 */
int ext4_group_desc_csum_verify(struct super_block *sb, __u32 block_group,
				struct ext4_group_desc *gdp)
{
	if (!ext4_has_group_desc_csum(sb))
		return 1;

	if (gdp->bg_checksum == ext4_group_desc_csum(sb, block_group, gdp))
		return 1;

	return 0;
}
3286717d50e4SAndreas Dilger
/*
 * Recompute and store the checksum of group descriptor @gdp.  Does nothing
 * when group descriptor checksums are not in use.
 */
void ext4_group_desc_csum_set(struct super_block *sb, __u32 block_group,
			      struct ext4_group_desc *gdp)
{
	if (ext4_has_group_desc_csum(sb))
		gdp->bg_checksum = ext4_group_desc_csum(sb, block_group, gdp);
}
3294feb0ab32SDarrick J. Wong
3295ac27a0ecSDave Kleikamp /* Called at mount-time, super-block is locked */
ext4_check_descriptors(struct super_block * sb,ext4_fsblk_t sb_block,ext4_group_t * first_not_zeroed)3296bfff6873SLukas Czerner static int ext4_check_descriptors(struct super_block *sb,
3297829fa70dSTheodore Ts'o ext4_fsblk_t sb_block,
3298bfff6873SLukas Czerner ext4_group_t *first_not_zeroed)
3299ac27a0ecSDave Kleikamp {
3300617ba13bSMingming Cao struct ext4_sb_info *sbi = EXT4_SB(sb);
3301617ba13bSMingming Cao ext4_fsblk_t first_block = le32_to_cpu(sbi->s_es->s_first_data_block);
3302617ba13bSMingming Cao ext4_fsblk_t last_block;
330344de022cSTheodore Ts'o ext4_fsblk_t last_bg_block = sb_block + ext4_bg_num_gdb(sb, 0);
3304bd81d8eeSLaurent Vivier ext4_fsblk_t block_bitmap;
3305bd81d8eeSLaurent Vivier ext4_fsblk_t inode_bitmap;
3306bd81d8eeSLaurent Vivier ext4_fsblk_t inode_table;
3307ce421581SJose R. Santos int flexbg_flag = 0;
3308bfff6873SLukas Czerner ext4_group_t i, grp = sbi->s_groups_count;
3309ac27a0ecSDave Kleikamp
3310e2b911c5SDarrick J. Wong if (ext4_has_feature_flex_bg(sb))
3311ce421581SJose R. Santos flexbg_flag = 1;
3312ce421581SJose R. Santos
3313617ba13bSMingming Cao ext4_debug("Checking group descriptors");
3314ac27a0ecSDave Kleikamp
3315197cd65aSAkinobu Mita for (i = 0; i < sbi->s_groups_count; i++) {
3316197cd65aSAkinobu Mita struct ext4_group_desc *gdp = ext4_get_group_desc(sb, i, NULL);
3317197cd65aSAkinobu Mita
3318ce421581SJose R. Santos if (i == sbi->s_groups_count - 1 || flexbg_flag)
3319bd81d8eeSLaurent Vivier last_block = ext4_blocks_count(sbi->s_es) - 1;
3320ac27a0ecSDave Kleikamp else
3321ac27a0ecSDave Kleikamp last_block = first_block +
3322617ba13bSMingming Cao (EXT4_BLOCKS_PER_GROUP(sb) - 1);
3323ac27a0ecSDave Kleikamp
3324bfff6873SLukas Czerner if ((grp == sbi->s_groups_count) &&
3325bfff6873SLukas Czerner !(gdp->bg_flags & cpu_to_le16(EXT4_BG_INODE_ZEROED)))
3326bfff6873SLukas Czerner grp = i;
3327bfff6873SLukas Czerner
33288fadc143SAlexandre Ratchov block_bitmap = ext4_block_bitmap(sb, gdp);
3329829fa70dSTheodore Ts'o if (block_bitmap == sb_block) {
3330829fa70dSTheodore Ts'o ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
3331829fa70dSTheodore Ts'o "Block bitmap for group %u overlaps "
3332829fa70dSTheodore Ts'o "superblock", i);
333318db4b4eSTheodore Ts'o if (!sb_rdonly(sb))
333418db4b4eSTheodore Ts'o return 0;
3335829fa70dSTheodore Ts'o }
333677260807STheodore Ts'o if (block_bitmap >= sb_block + 1 &&
333777260807STheodore Ts'o block_bitmap <= last_bg_block) {
333877260807STheodore Ts'o ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
333977260807STheodore Ts'o "Block bitmap for group %u overlaps "
334077260807STheodore Ts'o "block group descriptors", i);
334177260807STheodore Ts'o if (!sb_rdonly(sb))
334277260807STheodore Ts'o return 0;
334377260807STheodore Ts'o }
33442b2d6d01STheodore Ts'o if (block_bitmap < first_block || block_bitmap > last_block) {
3345b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
3346a9df9a49STheodore Ts'o "Block bitmap for group %u not in group "
3347b31e1552SEric Sandeen "(block %llu)!", i, block_bitmap);
3348ac27a0ecSDave Kleikamp return 0;
3349ac27a0ecSDave Kleikamp }
33508fadc143SAlexandre Ratchov inode_bitmap = ext4_inode_bitmap(sb, gdp);
3351829fa70dSTheodore Ts'o if (inode_bitmap == sb_block) {
3352829fa70dSTheodore Ts'o ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
3353829fa70dSTheodore Ts'o "Inode bitmap for group %u overlaps "
3354829fa70dSTheodore Ts'o "superblock", i);
335518db4b4eSTheodore Ts'o if (!sb_rdonly(sb))
335618db4b4eSTheodore Ts'o return 0;
3357829fa70dSTheodore Ts'o }
335877260807STheodore Ts'o if (inode_bitmap >= sb_block + 1 &&
335977260807STheodore Ts'o inode_bitmap <= last_bg_block) {
336077260807STheodore Ts'o ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
336177260807STheodore Ts'o "Inode bitmap for group %u overlaps "
336277260807STheodore Ts'o "block group descriptors", i);
336377260807STheodore Ts'o if (!sb_rdonly(sb))
336477260807STheodore Ts'o return 0;
336577260807STheodore Ts'o }
33662b2d6d01STheodore Ts'o if (inode_bitmap < first_block || inode_bitmap > last_block) {
3367b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
3368a9df9a49STheodore Ts'o "Inode bitmap for group %u not in group "
3369b31e1552SEric Sandeen "(block %llu)!", i, inode_bitmap);
3370ac27a0ecSDave Kleikamp return 0;
3371ac27a0ecSDave Kleikamp }
33728fadc143SAlexandre Ratchov inode_table = ext4_inode_table(sb, gdp);
3373829fa70dSTheodore Ts'o if (inode_table == sb_block) {
3374829fa70dSTheodore Ts'o ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
3375829fa70dSTheodore Ts'o "Inode table for group %u overlaps "
3376829fa70dSTheodore Ts'o "superblock", i);
337718db4b4eSTheodore Ts'o if (!sb_rdonly(sb))
337818db4b4eSTheodore Ts'o return 0;
3379829fa70dSTheodore Ts'o }
338077260807STheodore Ts'o if (inode_table >= sb_block + 1 &&
338177260807STheodore Ts'o inode_table <= last_bg_block) {
338277260807STheodore Ts'o ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
338377260807STheodore Ts'o "Inode table for group %u overlaps "
338477260807STheodore Ts'o "block group descriptors", i);
338577260807STheodore Ts'o if (!sb_rdonly(sb))
338677260807STheodore Ts'o return 0;
338777260807STheodore Ts'o }
3388bd81d8eeSLaurent Vivier if (inode_table < first_block ||
33892b2d6d01STheodore Ts'o inode_table + sbi->s_itb_per_group - 1 > last_block) {
3390b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
3391a9df9a49STheodore Ts'o "Inode table for group %u not in group "
3392b31e1552SEric Sandeen "(block %llu)!", i, inode_table);
3393ac27a0ecSDave Kleikamp return 0;
3394ac27a0ecSDave Kleikamp }
3395955ce5f5SAneesh Kumar K.V ext4_lock_group(sb, i);
3396feb0ab32SDarrick J. Wong if (!ext4_group_desc_csum_verify(sb, i, gdp)) {
3397b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
3398b31e1552SEric Sandeen "Checksum for group %u failed (%u!=%u)",
3399e2b911c5SDarrick J. Wong i, le16_to_cpu(ext4_group_desc_csum(sb, i,
3400fd2d4291SAvantika Mathur gdp)), le16_to_cpu(gdp->bg_checksum));
3401bc98a42cSDavid Howells if (!sb_rdonly(sb)) {
3402955ce5f5SAneesh Kumar K.V ext4_unlock_group(sb, i);
3403717d50e4SAndreas Dilger return 0;
3404717d50e4SAndreas Dilger }
34057ee1ec4cSLi Zefan }
3406955ce5f5SAneesh Kumar K.V ext4_unlock_group(sb, i);
3407ce421581SJose R. Santos if (!flexbg_flag)
3408617ba13bSMingming Cao first_block += EXT4_BLOCKS_PER_GROUP(sb);
3409ac27a0ecSDave Kleikamp }
3410bfff6873SLukas Czerner if (NULL != first_not_zeroed)
3411bfff6873SLukas Czerner *first_not_zeroed = grp;
3412ac27a0ecSDave Kleikamp return 1;
3413ac27a0ecSDave Kleikamp }
3414ac27a0ecSDave Kleikamp
3415cd2291a4SEric Sandeen /*
3416cd2291a4SEric Sandeen * Maximal extent format file size.
3417cd2291a4SEric Sandeen * Resulting logical blkno at s_maxbytes must fit in our on-disk
3418cd2291a4SEric Sandeen * extent format containers, within a sector_t, and within i_blocks
3419cd2291a4SEric Sandeen * in the vfs. ext4 inode has 48 bits of i_block in fsblock units,
3420cd2291a4SEric Sandeen * so that won't be a limiting factor.
3421cd2291a4SEric Sandeen *
3422f17722f9SLukas Czerner * However there is other limiting factor. We do store extents in the form
3423f17722f9SLukas Czerner * of starting block and length, hence the resulting length of the extent
3424f17722f9SLukas Czerner * covering maximum file size must fit into on-disk format containers as
3425f17722f9SLukas Czerner * well. Given that length is always by 1 unit bigger than max unit (because
3426f17722f9SLukas Czerner * we count 0 as well) we have to lower the s_maxbytes by one fs block.
3427f17722f9SLukas Czerner *
3428cd2291a4SEric Sandeen * Note, this does *not* consider any metadata overhead for vfs i_blocks.
3429cd2291a4SEric Sandeen */
ext4_max_size(int blkbits,int has_huge_files)3430f287a1a5STheodore Ts'o static loff_t ext4_max_size(int blkbits, int has_huge_files)
3431cd2291a4SEric Sandeen {
3432cd2291a4SEric Sandeen loff_t res;
3433cd2291a4SEric Sandeen loff_t upper_limit = MAX_LFS_FILESIZE;
3434cd2291a4SEric Sandeen
343572deb455SChristoph Hellwig BUILD_BUG_ON(sizeof(blkcnt_t) < sizeof(u64));
343672deb455SChristoph Hellwig
343772deb455SChristoph Hellwig if (!has_huge_files) {
3438cd2291a4SEric Sandeen upper_limit = (1LL << 32) - 1;
3439cd2291a4SEric Sandeen
3440cd2291a4SEric Sandeen /* total blocks in file system block size */
3441cd2291a4SEric Sandeen upper_limit >>= (blkbits - 9);
3442cd2291a4SEric Sandeen upper_limit <<= blkbits;
3443cd2291a4SEric Sandeen }
3444cd2291a4SEric Sandeen
3445f17722f9SLukas Czerner /*
3446f17722f9SLukas Czerner * 32-bit extent-start container, ee_block. We lower the maxbytes
3447f17722f9SLukas Czerner * by one fs block, so ee_len can cover the extent of maximum file
3448f17722f9SLukas Czerner * size
3449f17722f9SLukas Czerner */
3450f17722f9SLukas Czerner res = (1LL << 32) - 1;
3451cd2291a4SEric Sandeen res <<= blkbits;
3452cd2291a4SEric Sandeen
3453cd2291a4SEric Sandeen /* Sanity check against vm- & vfs- imposed limits */
3454cd2291a4SEric Sandeen if (res > upper_limit)
3455cd2291a4SEric Sandeen res = upper_limit;
3456cd2291a4SEric Sandeen
3457cd2291a4SEric Sandeen return res;
3458cd2291a4SEric Sandeen }
3459ac27a0ecSDave Kleikamp
3460ac27a0ecSDave Kleikamp /*
3461cd2291a4SEric Sandeen * Maximal bitmap file size. There is a direct, and {,double-,triple-}indirect
34620fc1b451SAneesh Kumar K.V * block limit, and also a limit of (2^48 - 1) 512-byte sectors in i_blocks.
34630fc1b451SAneesh Kumar K.V * We need to be 1 filesystem block less than the 2^48 sector limit.
3464ac27a0ecSDave Kleikamp */
ext4_max_bitmap_size(int bits,int has_huge_files)3465f287a1a5STheodore Ts'o static loff_t ext4_max_bitmap_size(int bits, int has_huge_files)
3466ac27a0ecSDave Kleikamp {
34675c93e8ecSZhang Yi loff_t upper_limit, res = EXT4_NDIR_BLOCKS;
34680fc1b451SAneesh Kumar K.V int meta_blocks;
34695c93e8ecSZhang Yi unsigned int ppb = 1 << (bits - 2);
347075ca6ad4SRitesh Harjani
347175ca6ad4SRitesh Harjani /*
347275ca6ad4SRitesh Harjani * This is calculated to be the largest file size for a dense, block
34730b8e58a1SAndreas Dilger * mapped file such that the file's total number of 512-byte sectors,
34740b8e58a1SAndreas Dilger * including data and all indirect blocks, does not exceed (2^48 - 1).
34750b8e58a1SAndreas Dilger *
34760b8e58a1SAndreas Dilger * __u32 i_blocks_lo and _u16 i_blocks_high represent the total
34770b8e58a1SAndreas Dilger * number of 512-byte sectors of the file.
34780fc1b451SAneesh Kumar K.V */
347972deb455SChristoph Hellwig if (!has_huge_files) {
34800fc1b451SAneesh Kumar K.V /*
348172deb455SChristoph Hellwig * !has_huge_files or implies that the inode i_block field
348272deb455SChristoph Hellwig * represents total file blocks in 2^32 512-byte sectors ==
348372deb455SChristoph Hellwig * size of vfs inode i_blocks * 8
34840fc1b451SAneesh Kumar K.V */
34850fc1b451SAneesh Kumar K.V upper_limit = (1LL << 32) - 1;
34860fc1b451SAneesh Kumar K.V
34870fc1b451SAneesh Kumar K.V /* total blocks in file system block size */
34880fc1b451SAneesh Kumar K.V upper_limit >>= (bits - 9);
34890fc1b451SAneesh Kumar K.V
34900fc1b451SAneesh Kumar K.V } else {
34918180a562SAneesh Kumar K.V /*
34928180a562SAneesh Kumar K.V * We use 48 bit ext4_inode i_blocks
34938180a562SAneesh Kumar K.V * With EXT4_HUGE_FILE_FL set the i_blocks
34948180a562SAneesh Kumar K.V * represent total number of blocks in
34958180a562SAneesh Kumar K.V * file system block size
34968180a562SAneesh Kumar K.V */
34970fc1b451SAneesh Kumar K.V upper_limit = (1LL << 48) - 1;
34980fc1b451SAneesh Kumar K.V
34990fc1b451SAneesh Kumar K.V }
35000fc1b451SAneesh Kumar K.V
35015c93e8ecSZhang Yi /* Compute how many blocks we can address by block tree */
35025c93e8ecSZhang Yi res += ppb;
35035c93e8ecSZhang Yi res += ppb * ppb;
35045c93e8ecSZhang Yi res += ((loff_t)ppb) * ppb * ppb;
35055c93e8ecSZhang Yi /* Compute how many metadata blocks are needed */
35065c93e8ecSZhang Yi meta_blocks = 1;
35075c93e8ecSZhang Yi meta_blocks += 1 + ppb;
35085c93e8ecSZhang Yi meta_blocks += 1 + ppb + ppb * ppb;
35095c93e8ecSZhang Yi /* Does block tree limit file size? */
35105c93e8ecSZhang Yi if (res + meta_blocks <= upper_limit)
35115c93e8ecSZhang Yi goto check_lfs;
35125c93e8ecSZhang Yi
35135c93e8ecSZhang Yi res = upper_limit;
35145c93e8ecSZhang Yi /* How many metadata blocks are needed for addressing upper_limit? */
35155c93e8ecSZhang Yi upper_limit -= EXT4_NDIR_BLOCKS;
35160fc1b451SAneesh Kumar K.V /* indirect blocks */
35170fc1b451SAneesh Kumar K.V meta_blocks = 1;
35185c93e8ecSZhang Yi upper_limit -= ppb;
35190fc1b451SAneesh Kumar K.V /* double indirect blocks */
35205c93e8ecSZhang Yi if (upper_limit < ppb * ppb) {
35215c93e8ecSZhang Yi meta_blocks += 1 + DIV_ROUND_UP_ULL(upper_limit, ppb);
35225c93e8ecSZhang Yi res -= meta_blocks;
35235c93e8ecSZhang Yi goto check_lfs;
35245c93e8ecSZhang Yi }
35255c93e8ecSZhang Yi meta_blocks += 1 + ppb;
35265c93e8ecSZhang Yi upper_limit -= ppb * ppb;
35275c93e8ecSZhang Yi /* tripple indirect blocks for the rest */
35285c93e8ecSZhang Yi meta_blocks += 1 + DIV_ROUND_UP_ULL(upper_limit, ppb) +
35295c93e8ecSZhang Yi DIV_ROUND_UP_ULL(upper_limit, ppb*ppb);
35305c93e8ecSZhang Yi res -= meta_blocks;
35315c93e8ecSZhang Yi check_lfs:
3532ac27a0ecSDave Kleikamp res <<= bits;
35330fc1b451SAneesh Kumar K.V if (res > MAX_LFS_FILESIZE)
35340fc1b451SAneesh Kumar K.V res = MAX_LFS_FILESIZE;
35350fc1b451SAneesh Kumar K.V
35365c93e8ecSZhang Yi return res;
3537ac27a0ecSDave Kleikamp }
3538ac27a0ecSDave Kleikamp
/*
 * Return the filesystem block that holds group descriptor block number @nr.
 *
 * @sb:               super block of the filesystem
 * @logical_sb_block: block number of the superblock in use
 * @nr:               index of the wanted descriptor block
 *
 * Without the meta_bg feature, or for descriptor blocks below
 * s_first_meta_bg, the descriptors directly follow the superblock.
 * Otherwise the block is located at the start of the first group described
 * by it, after that group's superblock backup when it has one.
 */
static ext4_fsblk_t descriptor_loc(struct super_block *sb,
				   ext4_fsblk_t logical_sb_block, int nr)
{
	struct ext4_sb_info *sbi = EXT4_SB(sb);
	struct ext4_super_block *es = sbi->s_es;
	ext4_group_t meta_start = le32_to_cpu(es->s_first_meta_bg);
	ext4_group_t grp;
	int skip;

	if (!ext4_has_feature_meta_bg(sb) || nr < meta_start)
		return logical_sb_block + nr + 1;

	/* First group covered by descriptor block @nr. */
	grp = sbi->s_desc_per_block * nr;
	skip = ext4_bg_has_super(sb, grp) ? 1 : 0;

	/*
	 * On a meta_bg filesystem with 1k blocks, group 0's GDT lives at
	 * block 2, not 1.  When s_first_data_block == 0 (bigalloc on modern
	 * mke2fs, or blksize > 1k on older mke2fs) we have to compensate by
	 * skipping one more block.
	 */
	if (nr == 0 && sb->s_blocksize == 1024 &&
	    le32_to_cpu(es->s_first_data_block) == 0)
		skip++;

	return skip + ext4_group_first_block_no(sb, grp);
}
3566ac27a0ecSDave Kleikamp
3567c9de560dSAlex Tomas /**
3568c9de560dSAlex Tomas * ext4_get_stripe_size: Get the stripe size.
3569c9de560dSAlex Tomas * @sbi: In memory super block info
3570c9de560dSAlex Tomas *
3571c9de560dSAlex Tomas * If we have specified it via mount option, then
3572c9de560dSAlex Tomas * use the mount option value. If the value specified at mount time is
3573c9de560dSAlex Tomas * greater than the blocks per group use the super block value.
3574c9de560dSAlex Tomas * If the super block value is greater than blocks per group return 0.
3575c9de560dSAlex Tomas * Allocator needs it be less than blocks per group.
3576c9de560dSAlex Tomas *
3577c9de560dSAlex Tomas */
ext4_get_stripe_size(struct ext4_sb_info * sbi)3578c9de560dSAlex Tomas static unsigned long ext4_get_stripe_size(struct ext4_sb_info *sbi)
3579c9de560dSAlex Tomas {
3580c9de560dSAlex Tomas unsigned long stride = le16_to_cpu(sbi->s_es->s_raid_stride);
3581c9de560dSAlex Tomas unsigned long stripe_width =
3582c9de560dSAlex Tomas le32_to_cpu(sbi->s_es->s_raid_stripe_width);
35833eb08658SDan Ehrenberg int ret;
3584c9de560dSAlex Tomas
3585c9de560dSAlex Tomas if (sbi->s_stripe && sbi->s_stripe <= sbi->s_blocks_per_group)
35863eb08658SDan Ehrenberg ret = sbi->s_stripe;
35875469d7c3SJan Kara else if (stripe_width && stripe_width <= sbi->s_blocks_per_group)
35883eb08658SDan Ehrenberg ret = stripe_width;
35895469d7c3SJan Kara else if (stride && stride <= sbi->s_blocks_per_group)
35903eb08658SDan Ehrenberg ret = stride;
35913eb08658SDan Ehrenberg else
35923eb08658SDan Ehrenberg ret = 0;
3593c9de560dSAlex Tomas
35943eb08658SDan Ehrenberg /*
35953eb08658SDan Ehrenberg * If the stripe width is 1, this makes no sense and
35963eb08658SDan Ehrenberg * we set it to 0 to turn off stripe handling code.
35973eb08658SDan Ehrenberg */
35983eb08658SDan Ehrenberg if (ret <= 1)
35993eb08658SDan Ehrenberg ret = 0;
3600c9de560dSAlex Tomas
36013eb08658SDan Ehrenberg return ret;
3602c9de560dSAlex Tomas }
3603ac27a0ecSDave Kleikamp
3604a13fb1a4SEric Sandeen /*
3605a13fb1a4SEric Sandeen * Check whether this filesystem can be mounted based on
3606a13fb1a4SEric Sandeen * the features present and the RDONLY/RDWR mount requested.
3607a13fb1a4SEric Sandeen * Returns 1 if this filesystem can be mounted as requested,
3608a13fb1a4SEric Sandeen * 0 if it cannot be.
3609a13fb1a4SEric Sandeen */
ext4_feature_set_ok(struct super_block * sb,int readonly)361025c6d98fSJan Kara int ext4_feature_set_ok(struct super_block *sb, int readonly)
3611a13fb1a4SEric Sandeen {
3612e2b911c5SDarrick J. Wong if (ext4_has_unknown_ext4_incompat_features(sb)) {
3613a13fb1a4SEric Sandeen ext4_msg(sb, KERN_ERR,
3614a13fb1a4SEric Sandeen "Couldn't mount because of "
3615a13fb1a4SEric Sandeen "unsupported optional features (%x)",
3616a13fb1a4SEric Sandeen (le32_to_cpu(EXT4_SB(sb)->s_es->s_feature_incompat) &
3617a13fb1a4SEric Sandeen ~EXT4_FEATURE_INCOMPAT_SUPP));
3618a13fb1a4SEric Sandeen return 0;
3619a13fb1a4SEric Sandeen }
3620a13fb1a4SEric Sandeen
36215298d4bfSChristoph Hellwig #if !IS_ENABLED(CONFIG_UNICODE)
3622c83ad55eSGabriel Krisman Bertazi if (ext4_has_feature_casefold(sb)) {
3623c83ad55eSGabriel Krisman Bertazi ext4_msg(sb, KERN_ERR,
3624c83ad55eSGabriel Krisman Bertazi "Filesystem with casefold feature cannot be "
3625c83ad55eSGabriel Krisman Bertazi "mounted without CONFIG_UNICODE");
3626c83ad55eSGabriel Krisman Bertazi return 0;
3627c83ad55eSGabriel Krisman Bertazi }
3628c83ad55eSGabriel Krisman Bertazi #endif
3629c83ad55eSGabriel Krisman Bertazi
3630a13fb1a4SEric Sandeen if (readonly)
3631a13fb1a4SEric Sandeen return 1;
3632a13fb1a4SEric Sandeen
3633e2b911c5SDarrick J. Wong if (ext4_has_feature_readonly(sb)) {
36342cb5cc8bSDarrick J. Wong ext4_msg(sb, KERN_INFO, "filesystem is read-only");
36351751e8a6SLinus Torvalds sb->s_flags |= SB_RDONLY;
36362cb5cc8bSDarrick J. Wong return 1;
36372cb5cc8bSDarrick J. Wong }
36382cb5cc8bSDarrick J. Wong
3639a13fb1a4SEric Sandeen /* Check that feature set is OK for a read-write mount */
3640e2b911c5SDarrick J. Wong if (ext4_has_unknown_ext4_ro_compat_features(sb)) {
3641a13fb1a4SEric Sandeen ext4_msg(sb, KERN_ERR, "couldn't mount RDWR because of "
3642a13fb1a4SEric Sandeen "unsupported optional features (%x)",
3643a13fb1a4SEric Sandeen (le32_to_cpu(EXT4_SB(sb)->s_es->s_feature_ro_compat) &
3644a13fb1a4SEric Sandeen ~EXT4_FEATURE_RO_COMPAT_SUPP));
3645a13fb1a4SEric Sandeen return 0;
3646a13fb1a4SEric Sandeen }
3647e2b911c5SDarrick J. Wong if (ext4_has_feature_bigalloc(sb) && !ext4_has_feature_extents(sb)) {
3648bab08ab9STheodore Ts'o ext4_msg(sb, KERN_ERR,
3649bab08ab9STheodore Ts'o "Can't support bigalloc feature without "
3650bab08ab9STheodore Ts'o "extents feature\n");
3651bab08ab9STheodore Ts'o return 0;
3652bab08ab9STheodore Ts'o }
36537c319d32SAditya Kali
36549db176bcSJan Kara #if !IS_ENABLED(CONFIG_QUOTA) || !IS_ENABLED(CONFIG_QFMT_V2)
3655d65d87a0STheodore Ts'o if (!readonly && (ext4_has_feature_quota(sb) ||
3656d65d87a0STheodore Ts'o ext4_has_feature_project(sb))) {
36577c319d32SAditya Kali ext4_msg(sb, KERN_ERR,
3658d65d87a0STheodore Ts'o "The kernel was not built with CONFIG_QUOTA and CONFIG_QFMT_V2");
3659689c958cSLi Xi return 0;
3660689c958cSLi Xi }
36617c319d32SAditya Kali #endif /* CONFIG_QUOTA */
3662a13fb1a4SEric Sandeen return 1;
3663a13fb1a4SEric Sandeen }
3664a13fb1a4SEric Sandeen
366566e61a9eSTheodore Ts'o /*
366666e61a9eSTheodore Ts'o * This function is called once a day if we have errors logged
366766e61a9eSTheodore Ts'o * on the file system
366866e61a9eSTheodore Ts'o */
print_daily_error_info(struct timer_list * t)3669235699a8SKees Cook static void print_daily_error_info(struct timer_list *t)
367066e61a9eSTheodore Ts'o {
3671235699a8SKees Cook struct ext4_sb_info *sbi = from_timer(sbi, t, s_err_report);
3672235699a8SKees Cook struct super_block *sb = sbi->s_sb;
3673235699a8SKees Cook struct ext4_super_block *es = sbi->s_es;
367466e61a9eSTheodore Ts'o
367566e61a9eSTheodore Ts'o if (es->s_error_count)
3676ae0f78deSTheodore Ts'o /* fsck newer than v1.41.13 is needed to clean this condition. */
3677ae0f78deSTheodore Ts'o ext4_msg(sb, KERN_NOTICE, "error count since last fsck: %u",
367866e61a9eSTheodore Ts'o le32_to_cpu(es->s_error_count));
367966e61a9eSTheodore Ts'o if (es->s_first_error_time) {
36806a0678a7SArnd Bergmann printk(KERN_NOTICE "EXT4-fs (%s): initial error at time %llu: %.*s:%d",
36816a0678a7SArnd Bergmann sb->s_id,
36826a0678a7SArnd Bergmann ext4_get_tstamp(es, s_first_error_time),
368366e61a9eSTheodore Ts'o (int) sizeof(es->s_first_error_func),
368466e61a9eSTheodore Ts'o es->s_first_error_func,
368566e61a9eSTheodore Ts'o le32_to_cpu(es->s_first_error_line));
368666e61a9eSTheodore Ts'o if (es->s_first_error_ino)
3687651e1c3bSJoe Perches printk(KERN_CONT ": inode %u",
368866e61a9eSTheodore Ts'o le32_to_cpu(es->s_first_error_ino));
368966e61a9eSTheodore Ts'o if (es->s_first_error_block)
3690651e1c3bSJoe Perches printk(KERN_CONT ": block %llu", (unsigned long long)
369166e61a9eSTheodore Ts'o le64_to_cpu(es->s_first_error_block));
3692651e1c3bSJoe Perches printk(KERN_CONT "\n");
369366e61a9eSTheodore Ts'o }
369466e61a9eSTheodore Ts'o if (es->s_last_error_time) {
36956a0678a7SArnd Bergmann printk(KERN_NOTICE "EXT4-fs (%s): last error at time %llu: %.*s:%d",
36966a0678a7SArnd Bergmann sb->s_id,
36976a0678a7SArnd Bergmann ext4_get_tstamp(es, s_last_error_time),
369866e61a9eSTheodore Ts'o (int) sizeof(es->s_last_error_func),
369966e61a9eSTheodore Ts'o es->s_last_error_func,
370066e61a9eSTheodore Ts'o le32_to_cpu(es->s_last_error_line));
370166e61a9eSTheodore Ts'o if (es->s_last_error_ino)
3702651e1c3bSJoe Perches printk(KERN_CONT ": inode %u",
370366e61a9eSTheodore Ts'o le32_to_cpu(es->s_last_error_ino));
370466e61a9eSTheodore Ts'o if (es->s_last_error_block)
3705651e1c3bSJoe Perches printk(KERN_CONT ": block %llu", (unsigned long long)
370666e61a9eSTheodore Ts'o le64_to_cpu(es->s_last_error_block));
3707651e1c3bSJoe Perches printk(KERN_CONT "\n");
370866e61a9eSTheodore Ts'o }
370966e61a9eSTheodore Ts'o mod_timer(&sbi->s_err_report, jiffies + 24*60*60*HZ); /* Once a day */
371066e61a9eSTheodore Ts'o }
371166e61a9eSTheodore Ts'o
3712bfff6873SLukas Czerner /* Find next suitable group and run ext4_init_inode_table */
ext4_run_li_request(struct ext4_li_request * elr)3713bfff6873SLukas Czerner static int ext4_run_li_request(struct ext4_li_request *elr)
3714bfff6873SLukas Czerner {
3715bfff6873SLukas Czerner struct ext4_group_desc *gdp = NULL;
37163d392b26STheodore Ts'o struct super_block *sb = elr->lr_super;
37173d392b26STheodore Ts'o ext4_group_t ngroups = EXT4_SB(sb)->s_groups_count;
37183d392b26STheodore Ts'o ext4_group_t group = elr->lr_next_group;
37193d392b26STheodore Ts'o unsigned int prefetch_ios = 0;
3720bfff6873SLukas Czerner int ret = 0;
37214f3d1e45SOjaswin Mujoo int nr = EXT4_SB(sb)->s_mb_prefetch;
372239fec688SShaoying Xu u64 start_time;
3723bfff6873SLukas Czerner
37243d392b26STheodore Ts'o if (elr->lr_mode == EXT4_LI_MODE_PREFETCH_BBITMAP) {
37254f3d1e45SOjaswin Mujoo elr->lr_next_group = ext4_mb_prefetch(sb, group, nr, &prefetch_ios);
37264f3d1e45SOjaswin Mujoo ext4_mb_prefetch_fini(sb, elr->lr_next_group, nr);
37274f3d1e45SOjaswin Mujoo trace_ext4_prefetch_bitmaps(sb, group, elr->lr_next_group, nr);
37283d392b26STheodore Ts'o if (group >= elr->lr_next_group) {
37293d392b26STheodore Ts'o ret = 1;
37303d392b26STheodore Ts'o if (elr->lr_first_not_zeroed != ngroups &&
37313d392b26STheodore Ts'o !sb_rdonly(sb) && test_opt(sb, INIT_INODE_TABLE)) {
37323d392b26STheodore Ts'o elr->lr_next_group = elr->lr_first_not_zeroed;
37333d392b26STheodore Ts'o elr->lr_mode = EXT4_LI_MODE_ITABLE;
37343d392b26STheodore Ts'o ret = 0;
37353d392b26STheodore Ts'o }
37363d392b26STheodore Ts'o }
37373d392b26STheodore Ts'o return ret;
37383d392b26STheodore Ts'o }
3739bfff6873SLukas Czerner
37403d392b26STheodore Ts'o for (; group < ngroups; group++) {
3741bfff6873SLukas Czerner gdp = ext4_get_group_desc(sb, group, NULL);
3742bfff6873SLukas Czerner if (!gdp) {
3743bfff6873SLukas Czerner ret = 1;
3744bfff6873SLukas Czerner break;
3745bfff6873SLukas Czerner }
3746bfff6873SLukas Czerner
3747bfff6873SLukas Czerner if (!(gdp->bg_flags & cpu_to_le16(EXT4_BG_INODE_ZEROED)))
3748bfff6873SLukas Czerner break;
3749bfff6873SLukas Czerner }
3750bfff6873SLukas Czerner
37517f511862STheodore Ts'o if (group >= ngroups)
3752bfff6873SLukas Czerner ret = 1;
3753bfff6873SLukas Czerner
3754bfff6873SLukas Czerner if (!ret) {
375539fec688SShaoying Xu start_time = ktime_get_real_ns();
3756bfff6873SLukas Czerner ret = ext4_init_inode_table(sb, group,
3757bfff6873SLukas Czerner elr->lr_timeout ? 0 : 1);
37583d392b26STheodore Ts'o trace_ext4_lazy_itable_init(sb, group);
3759bfff6873SLukas Czerner if (elr->lr_timeout == 0) {
376039fec688SShaoying Xu elr->lr_timeout = nsecs_to_jiffies((ktime_get_real_ns() - start_time) *
376139fec688SShaoying Xu EXT4_SB(elr->lr_super)->s_li_wait_mult);
3762bfff6873SLukas Czerner }
3763bfff6873SLukas Czerner elr->lr_next_sched = jiffies + elr->lr_timeout;
3764bfff6873SLukas Czerner elr->lr_next_group = group + 1;
3765bfff6873SLukas Czerner }
3766bfff6873SLukas Czerner return ret;
3767bfff6873SLukas Czerner }
3768bfff6873SLukas Czerner
3769bfff6873SLukas Czerner /*
3770bfff6873SLukas Czerner * Remove lr_request from the list_request and free the
37714ed5c033SLukas Czerner * request structure. Should be called with li_list_mtx held
3772bfff6873SLukas Czerner */
ext4_remove_li_request(struct ext4_li_request * elr)3773bfff6873SLukas Czerner static void ext4_remove_li_request(struct ext4_li_request *elr)
3774bfff6873SLukas Czerner {
3775bfff6873SLukas Czerner if (!elr)
3776bfff6873SLukas Czerner return;
3777bfff6873SLukas Czerner
3778bfff6873SLukas Czerner list_del(&elr->lr_request);
37793d392b26STheodore Ts'o EXT4_SB(elr->lr_super)->s_li_request = NULL;
3780bfff6873SLukas Czerner kfree(elr);
3781bfff6873SLukas Czerner }
3782bfff6873SLukas Czerner
ext4_unregister_li_request(struct super_block * sb)3783bfff6873SLukas Czerner static void ext4_unregister_li_request(struct super_block *sb)
3784bfff6873SLukas Czerner {
37851bb933fbSLukas Czerner mutex_lock(&ext4_li_mtx);
37861bb933fbSLukas Czerner if (!ext4_li_info) {
37871bb933fbSLukas Czerner mutex_unlock(&ext4_li_mtx);
3788bfff6873SLukas Czerner return;
37891bb933fbSLukas Czerner }
3790bfff6873SLukas Czerner
3791bfff6873SLukas Czerner mutex_lock(&ext4_li_info->li_list_mtx);
37921bb933fbSLukas Czerner ext4_remove_li_request(EXT4_SB(sb)->s_li_request);
3793bfff6873SLukas Czerner mutex_unlock(&ext4_li_info->li_list_mtx);
37941bb933fbSLukas Czerner mutex_unlock(&ext4_li_mtx);
3795bfff6873SLukas Czerner }
3796bfff6873SLukas Czerner
37978f1f7453SEric Sandeen static struct task_struct *ext4_lazyinit_task;
37988f1f7453SEric Sandeen
3799bfff6873SLukas Czerner /*
3800bfff6873SLukas Czerner * This is the function where ext4lazyinit thread lives. It walks
3801bfff6873SLukas Czerner * through the request list searching for next scheduled filesystem.
3802bfff6873SLukas Czerner * When such a fs is found, run the lazy initialization request
3803bfff6873SLukas Czerner * (ext4_rn_li_request) and keep track of the time spend in this
3804bfff6873SLukas Czerner * function. Based on that time we compute next schedule time of
3805bfff6873SLukas Czerner * the request. When walking through the list is complete, compute
3806bfff6873SLukas Czerner * next waking time and put itself into sleep.
3807bfff6873SLukas Czerner */
ext4_lazyinit_thread(void * arg)3808bfff6873SLukas Czerner static int ext4_lazyinit_thread(void *arg)
3809bfff6873SLukas Czerner {
3810c30365b9SYu Zhe struct ext4_lazy_init *eli = arg;
3811bfff6873SLukas Czerner struct list_head *pos, *n;
3812bfff6873SLukas Czerner struct ext4_li_request *elr;
38134ed5c033SLukas Czerner unsigned long next_wakeup, cur;
3814bfff6873SLukas Czerner
3815bfff6873SLukas Czerner BUG_ON(NULL == eli);
38163b575495SLalith Rajendran set_freezable();
3817bfff6873SLukas Czerner
3818bfff6873SLukas Czerner cont_thread:
3819bfff6873SLukas Czerner while (true) {
3820bfff6873SLukas Czerner next_wakeup = MAX_JIFFY_OFFSET;
3821bfff6873SLukas Czerner
3822bfff6873SLukas Czerner mutex_lock(&eli->li_list_mtx);
3823bfff6873SLukas Czerner if (list_empty(&eli->li_request_list)) {
3824bfff6873SLukas Czerner mutex_unlock(&eli->li_list_mtx);
3825bfff6873SLukas Czerner goto exit_thread;
3826bfff6873SLukas Czerner }
3827bfff6873SLukas Czerner list_for_each_safe(pos, n, &eli->li_request_list) {
3828e22834f0SDmitry Monakhov int err = 0;
3829e22834f0SDmitry Monakhov int progress = 0;
3830bfff6873SLukas Czerner elr = list_entry(pos, struct ext4_li_request,
3831bfff6873SLukas Czerner lr_request);
3832bfff6873SLukas Czerner
3833e22834f0SDmitry Monakhov if (time_before(jiffies, elr->lr_next_sched)) {
3834e22834f0SDmitry Monakhov if (time_before(elr->lr_next_sched, next_wakeup))
3835e22834f0SDmitry Monakhov next_wakeup = elr->lr_next_sched;
3836e22834f0SDmitry Monakhov continue;
3837e22834f0SDmitry Monakhov }
3838e22834f0SDmitry Monakhov if (down_read_trylock(&elr->lr_super->s_umount)) {
3839e22834f0SDmitry Monakhov if (sb_start_write_trylock(elr->lr_super)) {
3840e22834f0SDmitry Monakhov progress = 1;
3841e22834f0SDmitry Monakhov /*
3842e22834f0SDmitry Monakhov * We hold sb->s_umount, sb can not
3843e22834f0SDmitry Monakhov * be removed from the list, it is
3844e22834f0SDmitry Monakhov * now safe to drop li_list_mtx
3845e22834f0SDmitry Monakhov */
3846e22834f0SDmitry Monakhov mutex_unlock(&eli->li_list_mtx);
3847e22834f0SDmitry Monakhov err = ext4_run_li_request(elr);
3848e22834f0SDmitry Monakhov sb_end_write(elr->lr_super);
3849e22834f0SDmitry Monakhov mutex_lock(&eli->li_list_mtx);
3850e22834f0SDmitry Monakhov n = pos->next;
3851e22834f0SDmitry Monakhov }
3852e22834f0SDmitry Monakhov up_read((&elr->lr_super->s_umount));
3853e22834f0SDmitry Monakhov }
3854b2c78cd0STheodore Ts'o /* error, remove the lazy_init job */
3855e22834f0SDmitry Monakhov if (err) {
3856bfff6873SLukas Czerner ext4_remove_li_request(elr);
3857bfff6873SLukas Czerner continue;
3858bfff6873SLukas Czerner }
3859e22834f0SDmitry Monakhov if (!progress) {
3860e22834f0SDmitry Monakhov elr->lr_next_sched = jiffies +
38618032bf12SJason A. Donenfeld get_random_u32_below(EXT4_DEF_LI_MAX_START_DELAY * HZ);
3862b2c78cd0STheodore Ts'o }
3863bfff6873SLukas Czerner if (time_before(elr->lr_next_sched, next_wakeup))
3864bfff6873SLukas Czerner next_wakeup = elr->lr_next_sched;
3865bfff6873SLukas Czerner }
3866bfff6873SLukas Czerner mutex_unlock(&eli->li_list_mtx);
3867bfff6873SLukas Czerner
3868a0acae0eSTejun Heo try_to_freeze();
3869bfff6873SLukas Czerner
38704ed5c033SLukas Czerner cur = jiffies;
38714ed5c033SLukas Czerner if ((time_after_eq(cur, next_wakeup)) ||
3872f4245bd4SLukas Czerner (MAX_JIFFY_OFFSET == next_wakeup)) {
3873bfff6873SLukas Czerner cond_resched();
3874bfff6873SLukas Czerner continue;
3875bfff6873SLukas Czerner }
3876bfff6873SLukas Czerner
38774ed5c033SLukas Czerner schedule_timeout_interruptible(next_wakeup - cur);
38784ed5c033SLukas Czerner
38798f1f7453SEric Sandeen if (kthread_should_stop()) {
38808f1f7453SEric Sandeen ext4_clear_request_list();
38818f1f7453SEric Sandeen goto exit_thread;
38828f1f7453SEric Sandeen }
3883bfff6873SLukas Czerner }
3884bfff6873SLukas Czerner
3885bfff6873SLukas Czerner exit_thread:
3886bfff6873SLukas Czerner /*
3887bfff6873SLukas Czerner * It looks like the request list is empty, but we need
3888bfff6873SLukas Czerner * to check it under the li_list_mtx lock, to prevent any
3889bfff6873SLukas Czerner * additions into it, and of course we should lock ext4_li_mtx
3890bfff6873SLukas Czerner * to atomically free the list and ext4_li_info, because at
3891bfff6873SLukas Czerner * this point another ext4 filesystem could be registering
3892bfff6873SLukas Czerner * new one.
3893bfff6873SLukas Czerner */
3894bfff6873SLukas Czerner mutex_lock(&ext4_li_mtx);
3895bfff6873SLukas Czerner mutex_lock(&eli->li_list_mtx);
3896bfff6873SLukas Czerner if (!list_empty(&eli->li_request_list)) {
3897bfff6873SLukas Czerner mutex_unlock(&eli->li_list_mtx);
3898bfff6873SLukas Czerner mutex_unlock(&ext4_li_mtx);
3899bfff6873SLukas Czerner goto cont_thread;
3900bfff6873SLukas Czerner }
3901bfff6873SLukas Czerner mutex_unlock(&eli->li_list_mtx);
3902bfff6873SLukas Czerner kfree(ext4_li_info);
3903bfff6873SLukas Czerner ext4_li_info = NULL;
3904bfff6873SLukas Czerner mutex_unlock(&ext4_li_mtx);
3905bfff6873SLukas Czerner
3906bfff6873SLukas Czerner return 0;
3907bfff6873SLukas Czerner }
3908bfff6873SLukas Czerner
ext4_clear_request_list(void)3909bfff6873SLukas Czerner static void ext4_clear_request_list(void)
3910bfff6873SLukas Czerner {
3911bfff6873SLukas Czerner struct list_head *pos, *n;
3912bfff6873SLukas Czerner struct ext4_li_request *elr;
3913bfff6873SLukas Czerner
3914bfff6873SLukas Czerner mutex_lock(&ext4_li_info->li_list_mtx);
3915bfff6873SLukas Czerner list_for_each_safe(pos, n, &ext4_li_info->li_request_list) {
3916bfff6873SLukas Czerner elr = list_entry(pos, struct ext4_li_request,
3917bfff6873SLukas Czerner lr_request);
3918bfff6873SLukas Czerner ext4_remove_li_request(elr);
3919bfff6873SLukas Czerner }
3920bfff6873SLukas Czerner mutex_unlock(&ext4_li_info->li_list_mtx);
3921bfff6873SLukas Czerner }
3922bfff6873SLukas Czerner
ext4_run_lazyinit_thread(void)3923bfff6873SLukas Czerner static int ext4_run_lazyinit_thread(void)
3924bfff6873SLukas Czerner {
39258f1f7453SEric Sandeen ext4_lazyinit_task = kthread_run(ext4_lazyinit_thread,
39268f1f7453SEric Sandeen ext4_li_info, "ext4lazyinit");
39278f1f7453SEric Sandeen if (IS_ERR(ext4_lazyinit_task)) {
39288f1f7453SEric Sandeen int err = PTR_ERR(ext4_lazyinit_task);
3929bfff6873SLukas Czerner ext4_clear_request_list();
3930bfff6873SLukas Czerner kfree(ext4_li_info);
3931bfff6873SLukas Czerner ext4_li_info = NULL;
393292b97816STheodore Ts'o printk(KERN_CRIT "EXT4-fs: error %d creating inode table "
3933bfff6873SLukas Czerner "initialization thread\n",
3934bfff6873SLukas Czerner err);
3935bfff6873SLukas Czerner return err;
3936bfff6873SLukas Czerner }
3937bfff6873SLukas Czerner ext4_li_info->li_state |= EXT4_LAZYINIT_RUNNING;
3938bfff6873SLukas Czerner return 0;
3939bfff6873SLukas Czerner }
3940bfff6873SLukas Czerner
3941bfff6873SLukas Czerner /*
3942bfff6873SLukas Czerner * Check whether it make sense to run itable init. thread or not.
3943bfff6873SLukas Czerner * If there is at least one uninitialized inode table, return
3944bfff6873SLukas Czerner * corresponding group number, else the loop goes through all
3945bfff6873SLukas Czerner * groups and return total number of groups.
3946bfff6873SLukas Czerner */
ext4_has_uninit_itable(struct super_block * sb)3947bfff6873SLukas Czerner static ext4_group_t ext4_has_uninit_itable(struct super_block *sb)
3948bfff6873SLukas Czerner {
3949bfff6873SLukas Czerner ext4_group_t group, ngroups = EXT4_SB(sb)->s_groups_count;
3950bfff6873SLukas Czerner struct ext4_group_desc *gdp = NULL;
3951bfff6873SLukas Czerner
39528844618dSTheodore Ts'o if (!ext4_has_group_desc_csum(sb))
39538844618dSTheodore Ts'o return ngroups;
39548844618dSTheodore Ts'o
3955bfff6873SLukas Czerner for (group = 0; group < ngroups; group++) {
3956bfff6873SLukas Czerner gdp = ext4_get_group_desc(sb, group, NULL);
3957bfff6873SLukas Czerner if (!gdp)
3958bfff6873SLukas Czerner continue;
3959bfff6873SLukas Czerner
396050122847STheodore Ts'o if (!(gdp->bg_flags & cpu_to_le16(EXT4_BG_INODE_ZEROED)))
3961bfff6873SLukas Czerner break;
3962bfff6873SLukas Czerner }
3963bfff6873SLukas Czerner
3964bfff6873SLukas Czerner return group;
3965bfff6873SLukas Czerner }
3966bfff6873SLukas Czerner
ext4_li_info_new(void)3967bfff6873SLukas Czerner static int ext4_li_info_new(void)
3968bfff6873SLukas Czerner {
3969bfff6873SLukas Czerner struct ext4_lazy_init *eli = NULL;
3970bfff6873SLukas Czerner
3971bfff6873SLukas Czerner eli = kzalloc(sizeof(*eli), GFP_KERNEL);
3972bfff6873SLukas Czerner if (!eli)
3973bfff6873SLukas Czerner return -ENOMEM;
3974bfff6873SLukas Czerner
3975bfff6873SLukas Czerner INIT_LIST_HEAD(&eli->li_request_list);
3976bfff6873SLukas Czerner mutex_init(&eli->li_list_mtx);
3977bfff6873SLukas Czerner
3978bfff6873SLukas Czerner eli->li_state |= EXT4_LAZYINIT_QUIT;
3979bfff6873SLukas Czerner
3980bfff6873SLukas Czerner ext4_li_info = eli;
3981bfff6873SLukas Czerner
3982bfff6873SLukas Czerner return 0;
3983bfff6873SLukas Czerner }
3984bfff6873SLukas Czerner
/*
 * Allocate a lazy-init request for @sb.
 *
 * @sb:    super block the request belongs to
 * @start: first group whose inode table is not zeroed yet
 *
 * With NO_PREFETCH_BLOCK_BITMAPS set the request starts directly in inode
 * table mode at group @start; otherwise it starts in block bitmap prefetch
 * mode.
 *
 * Returns the new request, or NULL if the allocation fails.
 */
static struct ext4_li_request *ext4_li_request_new(struct super_block *sb,
					    ext4_group_t start)
{
	struct ext4_li_request *req = kzalloc(sizeof(*req), GFP_KERNEL);

	if (!req)
		return NULL;

	req->lr_super = sb;
	req->lr_first_not_zeroed = start;
	if (!test_opt(sb, NO_PREFETCH_BLOCK_BITMAPS)) {
		/* lr_next_group keeps the zero provided by kzalloc(). */
		req->lr_mode = EXT4_LI_MODE_PREFETCH_BBITMAP;
	} else {
		req->lr_mode = EXT4_LI_MODE_ITABLE;
		req->lr_next_group = start;
	}

	/*
	 * Pick a random first schedule time so that the inode table
	 * initialization requests are spread out better.
	 */
	req->lr_next_sched = jiffies +
		get_random_u32_below(EXT4_DEF_LI_MAX_START_DELAY * HZ);
	return req;
}
4011bfff6873SLukas Czerner
/*
 * Register a lazyinit request for @sb, creating the global lazyinit
 * bookkeeping and starting the lazyinit thread when necessary.
 *
 * Nothing is registered (and 0 is returned) when the file system already
 * has a request, is read-only, or has bitmap prefetching disabled and
 * either every group is already zeroed or INIT_INODE_TABLE is off.
 *
 * Returns 0 on success, -ENOMEM if the request cannot be allocated, or
 * the error reported by ext4_li_info_new()/ext4_run_lazyinit_thread().
 */
int ext4_register_li_request(struct super_block *sb,
			     ext4_group_t first_not_zeroed)
{
	struct ext4_sb_info *sbi = EXT4_SB(sb);
	ext4_group_t ngroups = sbi->s_groups_count;
	struct ext4_li_request *req = NULL;
	int err = 0;

	mutex_lock(&ext4_li_mtx);

	if (sbi->s_li_request) {
		/*
		 * A request already exists.  Clear its timeout so it gets
		 * recomputed, since s_li_wait_mult might have changed.
		 */
		sbi->s_li_request->lr_timeout = 0;
		goto unlock;
	}

	if (sb_rdonly(sb))
		goto unlock;
	if (test_opt(sb, NO_PREFETCH_BLOCK_BITMAPS) &&
	    (first_not_zeroed == ngroups || !test_opt(sb, INIT_INODE_TABLE)))
		goto unlock;

	req = ext4_li_request_new(sb, first_not_zeroed);
	if (!req) {
		err = -ENOMEM;
		goto unlock;
	}

	if (!ext4_li_info) {
		err = ext4_li_info_new();
		if (err)
			goto unlock;
	}

	mutex_lock(&ext4_li_info->li_list_mtx);
	list_add(&req->lr_request, &ext4_li_info->li_request_list);
	mutex_unlock(&ext4_li_info->li_list_mtx);

	sbi->s_li_request = req;
	/*
	 * The request now lives on the request list; removing and freeing
	 * it is handled by ext4_clear_request_list from here on, so drop
	 * our pointer to keep the kfree() below from touching it.
	 */
	req = NULL;

	if (!(ext4_li_info->li_state & EXT4_LAZYINIT_RUNNING))
		err = ext4_run_lazyinit_thread();

unlock:
	mutex_unlock(&ext4_li_mtx);
	if (err)
		kfree(req);
	return err;
}
4070bfff6873SLukas Czerner
4071bfff6873SLukas Czerner /*
4072bfff6873SLukas Czerner * We do not need to lock anything since this is called on
4073bfff6873SLukas Czerner * module unload.
4074bfff6873SLukas Czerner */
ext4_destroy_lazyinit_thread(void)4075bfff6873SLukas Czerner static void ext4_destroy_lazyinit_thread(void)
4076bfff6873SLukas Czerner {
4077bfff6873SLukas Czerner /*
4078bfff6873SLukas Czerner * If thread exited earlier
4079bfff6873SLukas Czerner * there's nothing to be done.
4080bfff6873SLukas Czerner */
40818f1f7453SEric Sandeen if (!ext4_li_info || !ext4_lazyinit_task)
4082bfff6873SLukas Czerner return;
4083bfff6873SLukas Czerner
40848f1f7453SEric Sandeen kthread_stop(ext4_lazyinit_task);
4085bfff6873SLukas Czerner }
4086bfff6873SLukas Czerner
set_journal_csum_feature_set(struct super_block * sb)408725ed6e8aSDarrick J. Wong static int set_journal_csum_feature_set(struct super_block *sb)
408825ed6e8aSDarrick J. Wong {
408925ed6e8aSDarrick J. Wong int ret = 1;
409025ed6e8aSDarrick J. Wong int compat, incompat;
409125ed6e8aSDarrick J. Wong struct ext4_sb_info *sbi = EXT4_SB(sb);
409225ed6e8aSDarrick J. Wong
40939aa5d32bSDmitry Monakhov if (ext4_has_metadata_csum(sb)) {
4094db9ee220SDarrick J. Wong /* journal checksum v3 */
409525ed6e8aSDarrick J. Wong compat = 0;
4096db9ee220SDarrick J. Wong incompat = JBD2_FEATURE_INCOMPAT_CSUM_V3;
409725ed6e8aSDarrick J. Wong } else {
409825ed6e8aSDarrick J. Wong /* journal checksum v1 */
409925ed6e8aSDarrick J. Wong compat = JBD2_FEATURE_COMPAT_CHECKSUM;
410025ed6e8aSDarrick J. Wong incompat = 0;
410125ed6e8aSDarrick J. Wong }
410225ed6e8aSDarrick J. Wong
4103feb8c6d3SDarrick J. Wong jbd2_journal_clear_features(sbi->s_journal,
4104feb8c6d3SDarrick J. Wong JBD2_FEATURE_COMPAT_CHECKSUM, 0,
4105feb8c6d3SDarrick J. Wong JBD2_FEATURE_INCOMPAT_CSUM_V3 |
4106feb8c6d3SDarrick J. Wong JBD2_FEATURE_INCOMPAT_CSUM_V2);
410725ed6e8aSDarrick J. Wong if (test_opt(sb, JOURNAL_ASYNC_COMMIT)) {
410825ed6e8aSDarrick J. Wong ret = jbd2_journal_set_features(sbi->s_journal,
410925ed6e8aSDarrick J. Wong compat, 0,
411025ed6e8aSDarrick J. Wong JBD2_FEATURE_INCOMPAT_ASYNC_COMMIT |
411125ed6e8aSDarrick J. Wong incompat);
411225ed6e8aSDarrick J. Wong } else if (test_opt(sb, JOURNAL_CHECKSUM)) {
411325ed6e8aSDarrick J. Wong ret = jbd2_journal_set_features(sbi->s_journal,
411425ed6e8aSDarrick J. Wong compat, 0,
411525ed6e8aSDarrick J. Wong incompat);
411625ed6e8aSDarrick J. Wong jbd2_journal_clear_features(sbi->s_journal, 0, 0,
411725ed6e8aSDarrick J. Wong JBD2_FEATURE_INCOMPAT_ASYNC_COMMIT);
411825ed6e8aSDarrick J. Wong } else {
4119feb8c6d3SDarrick J. Wong jbd2_journal_clear_features(sbi->s_journal, 0, 0,
4120feb8c6d3SDarrick J. Wong JBD2_FEATURE_INCOMPAT_ASYNC_COMMIT);
412125ed6e8aSDarrick J. Wong }
412225ed6e8aSDarrick J. Wong
412325ed6e8aSDarrick J. Wong return ret;
412425ed6e8aSDarrick J. Wong }
412525ed6e8aSDarrick J. Wong
4126952fc18eSTheodore Ts'o /*
4127952fc18eSTheodore Ts'o * Note: calculating the overhead so we can be compatible with
4128952fc18eSTheodore Ts'o * historical BSD practice is quite difficult in the face of
4129952fc18eSTheodore Ts'o * clusters/bigalloc. This is because multiple metadata blocks from
4130952fc18eSTheodore Ts'o * different block group can end up in the same allocation cluster.
4131952fc18eSTheodore Ts'o * Calculating the exact overhead in the face of clustered allocation
4132952fc18eSTheodore Ts'o * requires either O(all block bitmaps) in memory or O(number of block
4133952fc18eSTheodore Ts'o * groups**2) in time. We will still calculate the superblock for
4134952fc18eSTheodore Ts'o * older file systems --- and if we come across with a bigalloc file
4135952fc18eSTheodore Ts'o * system with zero in s_overhead_clusters the estimate will be close to
4136952fc18eSTheodore Ts'o * correct especially for very large cluster sizes --- but for newer
4137952fc18eSTheodore Ts'o * file systems, it's better to calculate this figure once at mkfs
4138952fc18eSTheodore Ts'o * time, and store it in the superblock. If the superblock value is
4139952fc18eSTheodore Ts'o * present (even for non-bigalloc file systems), we will use it.
4140952fc18eSTheodore Ts'o */
count_overhead(struct super_block * sb,ext4_group_t grp,char * buf)4141952fc18eSTheodore Ts'o static int count_overhead(struct super_block *sb, ext4_group_t grp,
4142952fc18eSTheodore Ts'o char *buf)
4143952fc18eSTheodore Ts'o {
4144952fc18eSTheodore Ts'o struct ext4_sb_info *sbi = EXT4_SB(sb);
4145952fc18eSTheodore Ts'o struct ext4_group_desc *gdp;
4146952fc18eSTheodore Ts'o ext4_fsblk_t first_block, last_block, b;
4147952fc18eSTheodore Ts'o ext4_group_t i, ngroups = ext4_get_groups_count(sb);
4148952fc18eSTheodore Ts'o int s, j, count = 0;
414910b01ee9STheodore Ts'o int has_super = ext4_bg_has_super(sb, grp);
4150952fc18eSTheodore Ts'o
4151e2b911c5SDarrick J. Wong if (!ext4_has_feature_bigalloc(sb))
415210b01ee9STheodore Ts'o return (has_super + ext4_bg_num_gdb(sb, grp) +
415310b01ee9STheodore Ts'o (has_super ? le16_to_cpu(sbi->s_es->s_reserved_gdt_blocks) : 0) +
41540548bbb8STheodore Ts'o sbi->s_itb_per_group + 2);
41550548bbb8STheodore Ts'o
4156952fc18eSTheodore Ts'o first_block = le32_to_cpu(sbi->s_es->s_first_data_block) +
4157952fc18eSTheodore Ts'o (grp * EXT4_BLOCKS_PER_GROUP(sb));
4158952fc18eSTheodore Ts'o last_block = first_block + EXT4_BLOCKS_PER_GROUP(sb) - 1;
4159952fc18eSTheodore Ts'o for (i = 0; i < ngroups; i++) {
4160952fc18eSTheodore Ts'o gdp = ext4_get_group_desc(sb, i, NULL);
4161952fc18eSTheodore Ts'o b = ext4_block_bitmap(sb, gdp);
4162952fc18eSTheodore Ts'o if (b >= first_block && b <= last_block) {
4163952fc18eSTheodore Ts'o ext4_set_bit(EXT4_B2C(sbi, b - first_block), buf);
4164952fc18eSTheodore Ts'o count++;
4165952fc18eSTheodore Ts'o }
4166952fc18eSTheodore Ts'o b = ext4_inode_bitmap(sb, gdp);
4167952fc18eSTheodore Ts'o if (b >= first_block && b <= last_block) {
4168952fc18eSTheodore Ts'o ext4_set_bit(EXT4_B2C(sbi, b - first_block), buf);
4169952fc18eSTheodore Ts'o count++;
4170952fc18eSTheodore Ts'o }
4171952fc18eSTheodore Ts'o b = ext4_inode_table(sb, gdp);
4172952fc18eSTheodore Ts'o if (b >= first_block && b + sbi->s_itb_per_group <= last_block)
4173952fc18eSTheodore Ts'o for (j = 0; j < sbi->s_itb_per_group; j++, b++) {
4174952fc18eSTheodore Ts'o int c = EXT4_B2C(sbi, b - first_block);
4175952fc18eSTheodore Ts'o ext4_set_bit(c, buf);
4176952fc18eSTheodore Ts'o count++;
4177952fc18eSTheodore Ts'o }
4178952fc18eSTheodore Ts'o if (i != grp)
4179952fc18eSTheodore Ts'o continue;
4180952fc18eSTheodore Ts'o s = 0;
4181952fc18eSTheodore Ts'o if (ext4_bg_has_super(sb, grp)) {
4182952fc18eSTheodore Ts'o ext4_set_bit(s++, buf);
4183952fc18eSTheodore Ts'o count++;
4184952fc18eSTheodore Ts'o }
4185c48ae41bSTheodore Ts'o j = ext4_bg_num_gdb(sb, grp);
4186c48ae41bSTheodore Ts'o if (s + j > EXT4_BLOCKS_PER_GROUP(sb)) {
4187c48ae41bSTheodore Ts'o ext4_error(sb, "Invalid number of block group "
4188c48ae41bSTheodore Ts'o "descriptor blocks: %d", j);
4189c48ae41bSTheodore Ts'o j = EXT4_BLOCKS_PER_GROUP(sb) - s;
4190952fc18eSTheodore Ts'o }
4191c48ae41bSTheodore Ts'o count += j;
4192c48ae41bSTheodore Ts'o for (; j > 0; j--)
4193c48ae41bSTheodore Ts'o ext4_set_bit(EXT4_B2C(sbi, s++), buf);
4194952fc18eSTheodore Ts'o }
4195952fc18eSTheodore Ts'o if (!count)
4196952fc18eSTheodore Ts'o return 0;
4197952fc18eSTheodore Ts'o return EXT4_CLUSTERS_PER_GROUP(sb) -
4198952fc18eSTheodore Ts'o ext4_count_free(buf, EXT4_CLUSTERS_PER_GROUP(sb) / 8);
4199952fc18eSTheodore Ts'o }
4200952fc18eSTheodore Ts'o
4201952fc18eSTheodore Ts'o /*
4202952fc18eSTheodore Ts'o * Compute the overhead and stash it in sbi->s_overhead
4203952fc18eSTheodore Ts'o */
ext4_calculate_overhead(struct super_block * sb)4204952fc18eSTheodore Ts'o int ext4_calculate_overhead(struct super_block *sb)
4205952fc18eSTheodore Ts'o {
4206952fc18eSTheodore Ts'o struct ext4_sb_info *sbi = EXT4_SB(sb);
4207952fc18eSTheodore Ts'o struct ext4_super_block *es = sbi->s_es;
42083c816dedSEric Whitney struct inode *j_inode;
42093c816dedSEric Whitney unsigned int j_blocks, j_inum = le32_to_cpu(es->s_journal_inum);
4210952fc18eSTheodore Ts'o ext4_group_t i, ngroups = ext4_get_groups_count(sb);
4211952fc18eSTheodore Ts'o ext4_fsblk_t overhead = 0;
42124fdb5543SDmitry Monakhov char *buf = (char *) get_zeroed_page(GFP_NOFS);
4213952fc18eSTheodore Ts'o
4214952fc18eSTheodore Ts'o if (!buf)
4215952fc18eSTheodore Ts'o return -ENOMEM;
4216952fc18eSTheodore Ts'o
4217952fc18eSTheodore Ts'o /*
4218952fc18eSTheodore Ts'o * Compute the overhead (FS structures). This is constant
4219952fc18eSTheodore Ts'o * for a given filesystem unless the number of block groups
4220952fc18eSTheodore Ts'o * changes so we cache the previous value until it does.
4221952fc18eSTheodore Ts'o */
4222952fc18eSTheodore Ts'o
4223952fc18eSTheodore Ts'o /*
4224952fc18eSTheodore Ts'o * All of the blocks before first_data_block are overhead
4225952fc18eSTheodore Ts'o */
4226952fc18eSTheodore Ts'o overhead = EXT4_B2C(sbi, le32_to_cpu(es->s_first_data_block));
4227952fc18eSTheodore Ts'o
4228952fc18eSTheodore Ts'o /*
4229952fc18eSTheodore Ts'o * Add the overhead found in each block group
4230952fc18eSTheodore Ts'o */
4231952fc18eSTheodore Ts'o for (i = 0; i < ngroups; i++) {
4232952fc18eSTheodore Ts'o int blks;
4233952fc18eSTheodore Ts'o
4234952fc18eSTheodore Ts'o blks = count_overhead(sb, i, buf);
4235952fc18eSTheodore Ts'o overhead += blks;
4236952fc18eSTheodore Ts'o if (blks)
4237952fc18eSTheodore Ts'o memset(buf, 0, PAGE_SIZE);
4238952fc18eSTheodore Ts'o cond_resched();
4239952fc18eSTheodore Ts'o }
42403c816dedSEric Whitney
42413c816dedSEric Whitney /*
42423c816dedSEric Whitney * Add the internal journal blocks whether the journal has been
42433c816dedSEric Whitney * loaded or not
42443c816dedSEric Whitney */
4245ee7ed3aaSChunguang Xu if (sbi->s_journal && !sbi->s_journal_bdev)
4246ede7dc7fSHarshad Shirwadkar overhead += EXT4_NUM_B2C(sbi, sbi->s_journal->j_total_len);
4247f1eec3b0SRitesh Harjani else if (ext4_has_feature_journal(sb) && !sbi->s_journal && j_inum) {
4248f1eec3b0SRitesh Harjani /* j_inum for internal journal is non-zero */
42493c816dedSEric Whitney j_inode = ext4_get_journal_inode(sb, j_inum);
4250ee5c8071SZhang Yi if (!IS_ERR(j_inode)) {
42513c816dedSEric Whitney j_blocks = j_inode->i_size >> sb->s_blocksize_bits;
42523c816dedSEric Whitney overhead += EXT4_NUM_B2C(sbi, j_blocks);
42533c816dedSEric Whitney iput(j_inode);
42543c816dedSEric Whitney } else {
42553c816dedSEric Whitney ext4_msg(sb, KERN_ERR, "can't get journal size");
42563c816dedSEric Whitney }
42573c816dedSEric Whitney }
4258952fc18eSTheodore Ts'o sbi->s_overhead = overhead;
4259952fc18eSTheodore Ts'o smp_wmb();
4260952fc18eSTheodore Ts'o free_page((unsigned long) buf);
4261952fc18eSTheodore Ts'o return 0;
4262952fc18eSTheodore Ts'o }
4263952fc18eSTheodore Ts'o
ext4_set_resv_clusters(struct super_block * sb)4264b5799018STheodore Ts'o static void ext4_set_resv_clusters(struct super_block *sb)
426527dd4385SLukas Czerner {
426627dd4385SLukas Czerner ext4_fsblk_t resv_clusters;
4267b5799018STheodore Ts'o struct ext4_sb_info *sbi = EXT4_SB(sb);
426827dd4385SLukas Czerner
426927dd4385SLukas Czerner /*
427030fac0f7SJan Kara * There's no need to reserve anything when we aren't using extents.
427130fac0f7SJan Kara * The space estimates are exact, there are no unwritten extents,
427230fac0f7SJan Kara * hole punching doesn't need new metadata... This is needed especially
427330fac0f7SJan Kara * to keep ext2/3 backward compatibility.
427430fac0f7SJan Kara */
4275e2b911c5SDarrick J. Wong if (!ext4_has_feature_extents(sb))
4276b5799018STheodore Ts'o return;
427730fac0f7SJan Kara /*
427827dd4385SLukas Czerner * By default we reserve 2% or 4096 clusters, whichever is smaller.
427927dd4385SLukas Czerner * This should cover the situations where we can not afford to run
428027dd4385SLukas Czerner * out of space like for example punch hole, or converting
4281556615dcSLukas Czerner * unwritten extents in delalloc path. In most cases such
428227dd4385SLukas Czerner * allocation would require 1, or 2 blocks, higher numbers are
428327dd4385SLukas Czerner * very rare.
428427dd4385SLukas Czerner */
4285b5799018STheodore Ts'o resv_clusters = (ext4_blocks_count(sbi->s_es) >>
4286b5799018STheodore Ts'o sbi->s_cluster_bits);
428727dd4385SLukas Czerner
428827dd4385SLukas Czerner do_div(resv_clusters, 50);
428927dd4385SLukas Czerner resv_clusters = min_t(ext4_fsblk_t, resv_clusters, 4096);
429027dd4385SLukas Czerner
4291b5799018STheodore Ts'o atomic64_set(&sbi->s_resv_clusters, resv_clusters);
429227dd4385SLukas Czerner }
429327dd4385SLukas Czerner
/*
 * Return a short string naming the quota mode of @sb: "disabled" when
 * the kernel is built without CONFIG_QUOTA, "none" when the file system
 * is not quota capable, "journalled" when there is a journal and quota
 * is journalled, and "writeback" otherwise.
 */
static const char *ext4_quota_mode(struct super_block *sb)
{
#ifdef CONFIG_QUOTA
	if (!ext4_quota_capable(sb))
		return "none";

	return (EXT4_SB(sb)->s_journal && ext4_is_quota_journalled(sb)) ?
		"journalled" : "writeback";
#else
	return "disabled";
#endif
}
4308ca9b404fSRoman Anufriev
/*
 * Install @trigger as the t_frozen callback of the journal trigger slot
 * selected by @type, and record @sb in that slot.
 */
static void ext4_setup_csum_trigger(struct super_block *sb,
				    enum ext4_journal_trigger_type type,
				    void (*trigger)(
					struct jbd2_buffer_trigger_type *type,
					struct buffer_head *bh,
					void *mapped_data,
					size_t size))
{
	struct ext4_sb_info *info = EXT4_SB(sb);

	info->s_journal_triggers[type].tr_triggers.t_frozen = trigger;
	info->s_journal_triggers[type].sb = sb;
}
4322188c299eSJan Kara
ext4_free_sbi(struct ext4_sb_info * sbi)43237edfd85bSLukas Czerner static void ext4_free_sbi(struct ext4_sb_info *sbi)
4324ac27a0ecSDave Kleikamp {
43257edfd85bSLukas Czerner if (!sbi)
43267edfd85bSLukas Czerner return;
43277edfd85bSLukas Czerner
43287edfd85bSLukas Czerner kfree(sbi->s_blockgroup_lock);
43298012b866SShiyang Ruan fs_put_dax(sbi->s_daxdev, NULL);
43307edfd85bSLukas Czerner kfree(sbi);
43317edfd85bSLukas Czerner }
43327edfd85bSLukas Czerner
ext4_alloc_sbi(struct super_block * sb)43337edfd85bSLukas Czerner static struct ext4_sb_info *ext4_alloc_sbi(struct super_block *sb)
43347edfd85bSLukas Czerner {
43357edfd85bSLukas Czerner struct ext4_sb_info *sbi;
43367edfd85bSLukas Czerner
43377edfd85bSLukas Czerner sbi = kzalloc(sizeof(*sbi), GFP_KERNEL);
43387edfd85bSLukas Czerner if (!sbi)
43397edfd85bSLukas Czerner return NULL;
43407edfd85bSLukas Czerner
43418012b866SShiyang Ruan sbi->s_daxdev = fs_dax_get_by_bdev(sb->s_bdev, &sbi->s_dax_part_off,
43428012b866SShiyang Ruan NULL, NULL);
43437edfd85bSLukas Czerner
43447edfd85bSLukas Czerner sbi->s_blockgroup_lock =
43457edfd85bSLukas Czerner kzalloc(sizeof(struct blockgroup_lock), GFP_KERNEL);
43467edfd85bSLukas Czerner
43477edfd85bSLukas Czerner if (!sbi->s_blockgroup_lock)
43487edfd85bSLukas Czerner goto err_out;
43497edfd85bSLukas Czerner
43507edfd85bSLukas Czerner sb->s_fs_info = sbi;
43517edfd85bSLukas Czerner sbi->s_sb = sb;
43527edfd85bSLukas Czerner return sbi;
43537edfd85bSLukas Czerner err_out:
43548012b866SShiyang Ruan fs_put_dax(sbi->s_daxdev, NULL);
43557edfd85bSLukas Czerner kfree(sbi);
43567edfd85bSLukas Czerner return NULL;
43577edfd85bSLukas Czerner }
43587edfd85bSLukas Czerner
ext4_set_def_opts(struct super_block * sb,struct ext4_super_block * es)43595f6d662dSJason Yan static void ext4_set_def_opts(struct super_block *sb,
43605f6d662dSJason Yan struct ext4_super_block *es)
43615f6d662dSJason Yan {
43625f6d662dSJason Yan unsigned long def_mount_opts;
43635f6d662dSJason Yan
43645f6d662dSJason Yan /* Set defaults before we parse the mount options */
43655f6d662dSJason Yan def_mount_opts = le32_to_cpu(es->s_default_mount_opts);
43665f6d662dSJason Yan set_opt(sb, INIT_INODE_TABLE);
43675f6d662dSJason Yan if (def_mount_opts & EXT4_DEFM_DEBUG)
43685f6d662dSJason Yan set_opt(sb, DEBUG);
43695f6d662dSJason Yan if (def_mount_opts & EXT4_DEFM_BSDGROUPS)
43705f6d662dSJason Yan set_opt(sb, GRPID);
43715f6d662dSJason Yan if (def_mount_opts & EXT4_DEFM_UID16)
43725f6d662dSJason Yan set_opt(sb, NO_UID32);
43735f6d662dSJason Yan /* xattr user namespace & acls are now defaulted on */
43745f6d662dSJason Yan set_opt(sb, XATTR_USER);
43755f6d662dSJason Yan #ifdef CONFIG_EXT4_FS_POSIX_ACL
43765f6d662dSJason Yan set_opt(sb, POSIX_ACL);
43775f6d662dSJason Yan #endif
43785f6d662dSJason Yan if (ext4_has_feature_fast_commit(sb))
43795f6d662dSJason Yan set_opt2(sb, JOURNAL_FAST_COMMIT);
43805f6d662dSJason Yan /* don't forget to enable journal_csum when metadata_csum is enabled. */
43815f6d662dSJason Yan if (ext4_has_metadata_csum(sb))
43825f6d662dSJason Yan set_opt(sb, JOURNAL_CHECKSUM);
43835f6d662dSJason Yan
43845f6d662dSJason Yan if ((def_mount_opts & EXT4_DEFM_JMODE) == EXT4_DEFM_JMODE_DATA)
43855f6d662dSJason Yan set_opt(sb, JOURNAL_DATA);
43865f6d662dSJason Yan else if ((def_mount_opts & EXT4_DEFM_JMODE) == EXT4_DEFM_JMODE_ORDERED)
43875f6d662dSJason Yan set_opt(sb, ORDERED_DATA);
43885f6d662dSJason Yan else if ((def_mount_opts & EXT4_DEFM_JMODE) == EXT4_DEFM_JMODE_WBACK)
43895f6d662dSJason Yan set_opt(sb, WRITEBACK_DATA);
43905f6d662dSJason Yan
43915f6d662dSJason Yan if (le16_to_cpu(es->s_errors) == EXT4_ERRORS_PANIC)
43925f6d662dSJason Yan set_opt(sb, ERRORS_PANIC);
43935f6d662dSJason Yan else if (le16_to_cpu(es->s_errors) == EXT4_ERRORS_CONTINUE)
43945f6d662dSJason Yan set_opt(sb, ERRORS_CONT);
43955f6d662dSJason Yan else
43965f6d662dSJason Yan set_opt(sb, ERRORS_RO);
43975f6d662dSJason Yan /* block_validity enabled by default; disable with noblock_validity */
43985f6d662dSJason Yan set_opt(sb, BLOCK_VALIDITY);
43995f6d662dSJason Yan if (def_mount_opts & EXT4_DEFM_DISCARD)
44005f6d662dSJason Yan set_opt(sb, DISCARD);
44015f6d662dSJason Yan
44025f6d662dSJason Yan if ((def_mount_opts & EXT4_DEFM_NOBARRIER) == 0)
44035f6d662dSJason Yan set_opt(sb, BARRIER);
44045f6d662dSJason Yan
44055f6d662dSJason Yan /*
44065f6d662dSJason Yan * enable delayed allocation by default
44075f6d662dSJason Yan * Use -o nodelalloc to turn it off
44085f6d662dSJason Yan */
44095f6d662dSJason Yan if (!IS_EXT3_SB(sb) && !IS_EXT2_SB(sb) &&
44105f6d662dSJason Yan ((def_mount_opts & EXT4_DEFM_NODELALLOC) == 0))
44115f6d662dSJason Yan set_opt(sb, DELALLOC);
44123df11e27SJason Yan
44133df11e27SJason Yan if (sb->s_blocksize == PAGE_SIZE)
44143df11e27SJason Yan set_opt(sb, DIOREAD_NOLOCK);
44155f6d662dSJason Yan }
44165f6d662dSJason Yan
ext4_handle_clustersize(struct super_block * sb)4417c8267c51SJason Yan static int ext4_handle_clustersize(struct super_block *sb)
44184a8557b0SJason Yan {
44194a8557b0SJason Yan struct ext4_sb_info *sbi = EXT4_SB(sb);
44204a8557b0SJason Yan struct ext4_super_block *es = sbi->s_es;
44214a8557b0SJason Yan int clustersize;
44224a8557b0SJason Yan
44234a8557b0SJason Yan /* Handle clustersize */
44244a8557b0SJason Yan clustersize = BLOCK_SIZE << le32_to_cpu(es->s_log_cluster_size);
44254a8557b0SJason Yan if (ext4_has_feature_bigalloc(sb)) {
4426c8267c51SJason Yan if (clustersize < sb->s_blocksize) {
44274a8557b0SJason Yan ext4_msg(sb, KERN_ERR,
44284a8557b0SJason Yan "cluster size (%d) smaller than "
4429c8267c51SJason Yan "block size (%lu)", clustersize, sb->s_blocksize);
44304a8557b0SJason Yan return -EINVAL;
44314a8557b0SJason Yan }
44324a8557b0SJason Yan sbi->s_cluster_bits = le32_to_cpu(es->s_log_cluster_size) -
44334a8557b0SJason Yan le32_to_cpu(es->s_log_block_size);
44344a8557b0SJason Yan sbi->s_clusters_per_group =
44354a8557b0SJason Yan le32_to_cpu(es->s_clusters_per_group);
4436c8267c51SJason Yan if (sbi->s_clusters_per_group > sb->s_blocksize * 8) {
44374a8557b0SJason Yan ext4_msg(sb, KERN_ERR,
44384a8557b0SJason Yan "#clusters per group too big: %lu",
44394a8557b0SJason Yan sbi->s_clusters_per_group);
44404a8557b0SJason Yan return -EINVAL;
44414a8557b0SJason Yan }
44424a8557b0SJason Yan if (sbi->s_blocks_per_group !=
4443c8267c51SJason Yan (sbi->s_clusters_per_group * (clustersize / sb->s_blocksize))) {
44444a8557b0SJason Yan ext4_msg(sb, KERN_ERR, "blocks per group (%lu) and "
44454a8557b0SJason Yan "clusters per group (%lu) inconsistent",
44464a8557b0SJason Yan sbi->s_blocks_per_group,
44474a8557b0SJason Yan sbi->s_clusters_per_group);
44484a8557b0SJason Yan return -EINVAL;
44494a8557b0SJason Yan }
44504a8557b0SJason Yan } else {
4451c8267c51SJason Yan if (clustersize != sb->s_blocksize) {
44524a8557b0SJason Yan ext4_msg(sb, KERN_ERR,
44534a8557b0SJason Yan "fragment/cluster size (%d) != "
4454c8267c51SJason Yan "block size (%lu)", clustersize, sb->s_blocksize);
44554a8557b0SJason Yan return -EINVAL;
44564a8557b0SJason Yan }
4457c8267c51SJason Yan if (sbi->s_blocks_per_group > sb->s_blocksize * 8) {
44584a8557b0SJason Yan ext4_msg(sb, KERN_ERR,
44594a8557b0SJason Yan "#blocks per group too big: %lu",
44604a8557b0SJason Yan sbi->s_blocks_per_group);
44614a8557b0SJason Yan return -EINVAL;
44624a8557b0SJason Yan }
44634a8557b0SJason Yan sbi->s_clusters_per_group = sbi->s_blocks_per_group;
44644a8557b0SJason Yan sbi->s_cluster_bits = 0;
44654a8557b0SJason Yan }
4466c8267c51SJason Yan sbi->s_cluster_ratio = clustersize / sb->s_blocksize;
44674a8557b0SJason Yan
44684a8557b0SJason Yan /* Do we have standard group size of clustersize * 8 blocks ? */
44694a8557b0SJason Yan if (sbi->s_blocks_per_group == clustersize << 3)
44704a8557b0SJason Yan set_opt2(sb, STD_GROUP_SIZE);
44714a8557b0SJason Yan
44724a8557b0SJason Yan return 0;
44734a8557b0SJason Yan }
44744a8557b0SJason Yan
ext4_fast_commit_init(struct super_block * sb)4475f7314a67SJason Yan static void ext4_fast_commit_init(struct super_block *sb)
4476f7314a67SJason Yan {
4477f7314a67SJason Yan struct ext4_sb_info *sbi = EXT4_SB(sb);
4478f7314a67SJason Yan
4479f7314a67SJason Yan /* Initialize fast commit stuff */
4480f7314a67SJason Yan atomic_set(&sbi->s_fc_subtid, 0);
4481f7314a67SJason Yan INIT_LIST_HEAD(&sbi->s_fc_q[FC_Q_MAIN]);
4482f7314a67SJason Yan INIT_LIST_HEAD(&sbi->s_fc_q[FC_Q_STAGING]);
4483f7314a67SJason Yan INIT_LIST_HEAD(&sbi->s_fc_dentry_q[FC_Q_MAIN]);
4484f7314a67SJason Yan INIT_LIST_HEAD(&sbi->s_fc_dentry_q[FC_Q_STAGING]);
4485f7314a67SJason Yan sbi->s_fc_bytes = 0;
4486f7314a67SJason Yan ext4_clear_mount_flag(sb, EXT4_MF_FC_INELIGIBLE);
4487f7314a67SJason Yan sbi->s_fc_ineligible_tid = 0;
4488f7314a67SJason Yan spin_lock_init(&sbi->s_fc_lock);
4489f7314a67SJason Yan memset(&sbi->s_fc_stats, 0, sizeof(sbi->s_fc_stats));
4490f7314a67SJason Yan sbi->s_fc_replay_state.fc_regions = NULL;
4491f7314a67SJason Yan sbi->s_fc_replay_state.fc_regions_size = 0;
4492f7314a67SJason Yan sbi->s_fc_replay_state.fc_regions_used = 0;
4493f7314a67SJason Yan sbi->s_fc_replay_state.fc_regions_valid = 0;
4494f7314a67SJason Yan sbi->s_fc_replay_state.fc_modified_inodes = NULL;
4495f7314a67SJason Yan sbi->s_fc_replay_state.fc_modified_inodes_size = 0;
4496f7314a67SJason Yan sbi->s_fc_replay_state.fc_modified_inodes_used = 0;
4497f7314a67SJason Yan }
4498f7314a67SJason Yan
ext4_inode_info_init(struct super_block * sb,struct ext4_super_block * es)44990e495f7cSJason Yan static int ext4_inode_info_init(struct super_block *sb,
4500c8267c51SJason Yan struct ext4_super_block *es)
45010e495f7cSJason Yan {
45020e495f7cSJason Yan struct ext4_sb_info *sbi = EXT4_SB(sb);
45030e495f7cSJason Yan
45040e495f7cSJason Yan if (le32_to_cpu(es->s_rev_level) == EXT4_GOOD_OLD_REV) {
45050e495f7cSJason Yan sbi->s_inode_size = EXT4_GOOD_OLD_INODE_SIZE;
45060e495f7cSJason Yan sbi->s_first_ino = EXT4_GOOD_OLD_FIRST_INO;
45070e495f7cSJason Yan } else {
45080e495f7cSJason Yan sbi->s_inode_size = le16_to_cpu(es->s_inode_size);
45090e495f7cSJason Yan sbi->s_first_ino = le32_to_cpu(es->s_first_ino);
45100e495f7cSJason Yan if (sbi->s_first_ino < EXT4_GOOD_OLD_FIRST_INO) {
45110e495f7cSJason Yan ext4_msg(sb, KERN_ERR, "invalid first ino: %u",
45120e495f7cSJason Yan sbi->s_first_ino);
45130e495f7cSJason Yan return -EINVAL;
45140e495f7cSJason Yan }
45150e495f7cSJason Yan if ((sbi->s_inode_size < EXT4_GOOD_OLD_INODE_SIZE) ||
45160e495f7cSJason Yan (!is_power_of_2(sbi->s_inode_size)) ||
4517c8267c51SJason Yan (sbi->s_inode_size > sb->s_blocksize)) {
45180e495f7cSJason Yan ext4_msg(sb, KERN_ERR,
45190e495f7cSJason Yan "unsupported inode size: %d",
45200e495f7cSJason Yan sbi->s_inode_size);
4521c8267c51SJason Yan ext4_msg(sb, KERN_ERR, "blocksize: %lu", sb->s_blocksize);
45220e495f7cSJason Yan return -EINVAL;
45230e495f7cSJason Yan }
45240e495f7cSJason Yan /*
45250e495f7cSJason Yan * i_atime_extra is the last extra field available for
45260e495f7cSJason Yan * [acm]times in struct ext4_inode. Checking for that
45270e495f7cSJason Yan * field should suffice to ensure we have extra space
45280e495f7cSJason Yan * for all three.
45290e495f7cSJason Yan */
45300e495f7cSJason Yan if (sbi->s_inode_size >= offsetof(struct ext4_inode, i_atime_extra) +
45310e495f7cSJason Yan sizeof(((struct ext4_inode *)0)->i_atime_extra)) {
45320e495f7cSJason Yan sb->s_time_gran = 1;
45330e495f7cSJason Yan sb->s_time_max = EXT4_EXTRA_TIMESTAMP_MAX;
45340e495f7cSJason Yan } else {
45350e495f7cSJason Yan sb->s_time_gran = NSEC_PER_SEC;
45360e495f7cSJason Yan sb->s_time_max = EXT4_NON_EXTRA_TIMESTAMP_MAX;
45370e495f7cSJason Yan }
45380e495f7cSJason Yan sb->s_time_min = EXT4_TIMESTAMP_MIN;
45390e495f7cSJason Yan }
45400e495f7cSJason Yan
45410e495f7cSJason Yan if (sbi->s_inode_size > EXT4_GOOD_OLD_INODE_SIZE) {
45420e495f7cSJason Yan sbi->s_want_extra_isize = sizeof(struct ext4_inode) -
45430e495f7cSJason Yan EXT4_GOOD_OLD_INODE_SIZE;
45440e495f7cSJason Yan if (ext4_has_feature_extra_isize(sb)) {
45450e495f7cSJason Yan unsigned v, max = (sbi->s_inode_size -
45460e495f7cSJason Yan EXT4_GOOD_OLD_INODE_SIZE);
45470e495f7cSJason Yan
45480e495f7cSJason Yan v = le16_to_cpu(es->s_want_extra_isize);
45490e495f7cSJason Yan if (v > max) {
45500e495f7cSJason Yan ext4_msg(sb, KERN_ERR,
45510e495f7cSJason Yan "bad s_want_extra_isize: %d", v);
45520e495f7cSJason Yan return -EINVAL;
45530e495f7cSJason Yan }
45540e495f7cSJason Yan if (sbi->s_want_extra_isize < v)
45550e495f7cSJason Yan sbi->s_want_extra_isize = v;
45560e495f7cSJason Yan
45570e495f7cSJason Yan v = le16_to_cpu(es->s_min_extra_isize);
45580e495f7cSJason Yan if (v > max) {
45590e495f7cSJason Yan ext4_msg(sb, KERN_ERR,
45600e495f7cSJason Yan "bad s_min_extra_isize: %d", v);
45610e495f7cSJason Yan return -EINVAL;
45620e495f7cSJason Yan }
45630e495f7cSJason Yan if (sbi->s_want_extra_isize < v)
45640e495f7cSJason Yan sbi->s_want_extra_isize = v;
45650e495f7cSJason Yan }
45660e495f7cSJason Yan }
45670e495f7cSJason Yan
45680e495f7cSJason Yan return 0;
45690e495f7cSJason Yan }
45700e495f7cSJason Yan
457139c135b0SJason Yan #if IS_ENABLED(CONFIG_UNICODE)
ext4_encoding_init(struct super_block * sb,struct ext4_super_block * es)457239c135b0SJason Yan static int ext4_encoding_init(struct super_block *sb, struct ext4_super_block *es)
457339c135b0SJason Yan {
457439c135b0SJason Yan const struct ext4_sb_encodings *encoding_info;
457539c135b0SJason Yan struct unicode_map *encoding;
457639c135b0SJason Yan __u16 encoding_flags = le16_to_cpu(es->s_encoding_flags);
457739c135b0SJason Yan
457839c135b0SJason Yan if (!ext4_has_feature_casefold(sb) || sb->s_encoding)
457939c135b0SJason Yan return 0;
458039c135b0SJason Yan
458139c135b0SJason Yan encoding_info = ext4_sb_read_encoding(es);
458239c135b0SJason Yan if (!encoding_info) {
458339c135b0SJason Yan ext4_msg(sb, KERN_ERR,
458439c135b0SJason Yan "Encoding requested by superblock is unknown");
458539c135b0SJason Yan return -EINVAL;
458639c135b0SJason Yan }
458739c135b0SJason Yan
458839c135b0SJason Yan encoding = utf8_load(encoding_info->version);
458939c135b0SJason Yan if (IS_ERR(encoding)) {
459039c135b0SJason Yan ext4_msg(sb, KERN_ERR,
459139c135b0SJason Yan "can't mount with superblock charset: %s-%u.%u.%u "
459239c135b0SJason Yan "not supported by the kernel. flags: 0x%x.",
459339c135b0SJason Yan encoding_info->name,
459439c135b0SJason Yan unicode_major(encoding_info->version),
459539c135b0SJason Yan unicode_minor(encoding_info->version),
459639c135b0SJason Yan unicode_rev(encoding_info->version),
459739c135b0SJason Yan encoding_flags);
459839c135b0SJason Yan return -EINVAL;
459939c135b0SJason Yan }
460039c135b0SJason Yan ext4_msg(sb, KERN_INFO,"Using encoding defined by superblock: "
460139c135b0SJason Yan "%s-%u.%u.%u with flags 0x%hx", encoding_info->name,
460239c135b0SJason Yan unicode_major(encoding_info->version),
460339c135b0SJason Yan unicode_minor(encoding_info->version),
460439c135b0SJason Yan unicode_rev(encoding_info->version),
460539c135b0SJason Yan encoding_flags);
460639c135b0SJason Yan
460739c135b0SJason Yan sb->s_encoding = encoding;
460839c135b0SJason Yan sb->s_encoding_flags = encoding_flags;
460939c135b0SJason Yan
461039c135b0SJason Yan return 0;
461139c135b0SJason Yan }
461239c135b0SJason Yan #else
ext4_encoding_init(struct super_block * sb,struct ext4_super_block * es)461339c135b0SJason Yan static inline int ext4_encoding_init(struct super_block *sb, struct ext4_super_block *es)
461439c135b0SJason Yan {
461539c135b0SJason Yan return 0;
461639c135b0SJason Yan }
461739c135b0SJason Yan #endif
461839c135b0SJason Yan
ext4_init_metadata_csum(struct super_block * sb,struct ext4_super_block * es)4619b26458d1SJason Yan static int ext4_init_metadata_csum(struct super_block *sb, struct ext4_super_block *es)
4620b26458d1SJason Yan {
4621b26458d1SJason Yan struct ext4_sb_info *sbi = EXT4_SB(sb);
4622b26458d1SJason Yan
4623b26458d1SJason Yan /* Warn if metadata_csum and gdt_csum are both set. */
4624b26458d1SJason Yan if (ext4_has_feature_metadata_csum(sb) &&
4625b26458d1SJason Yan ext4_has_feature_gdt_csum(sb))
4626b26458d1SJason Yan ext4_warning(sb, "metadata_csum and uninit_bg are "
4627b26458d1SJason Yan "redundant flags; please run fsck.");
4628b26458d1SJason Yan
4629b26458d1SJason Yan /* Check for a known checksum algorithm */
4630b26458d1SJason Yan if (!ext4_verify_csum_type(sb, es)) {
4631b26458d1SJason Yan ext4_msg(sb, KERN_ERR, "VFS: Found ext4 filesystem with "
4632b26458d1SJason Yan "unknown checksum algorithm.");
4633b26458d1SJason Yan return -EINVAL;
4634b26458d1SJason Yan }
4635b26458d1SJason Yan ext4_setup_csum_trigger(sb, EXT4_JTR_ORPHAN_FILE,
4636b26458d1SJason Yan ext4_orphan_file_block_trigger);
4637b26458d1SJason Yan
4638b26458d1SJason Yan /* Load the checksum driver */
4639b26458d1SJason Yan sbi->s_chksum_driver = crypto_alloc_shash("crc32c", 0, 0);
4640b26458d1SJason Yan if (IS_ERR(sbi->s_chksum_driver)) {
4641b26458d1SJason Yan int ret = PTR_ERR(sbi->s_chksum_driver);
4642b26458d1SJason Yan ext4_msg(sb, KERN_ERR, "Cannot load crc32c driver.");
4643b26458d1SJason Yan sbi->s_chksum_driver = NULL;
4644b26458d1SJason Yan return ret;
4645b26458d1SJason Yan }
4646b26458d1SJason Yan
4647b26458d1SJason Yan /* Check superblock checksum */
4648b26458d1SJason Yan if (!ext4_superblock_csum_verify(sb, es)) {
4649b26458d1SJason Yan ext4_msg(sb, KERN_ERR, "VFS: Found ext4 filesystem with "
4650b26458d1SJason Yan "invalid superblock checksum. Run e2fsck?");
4651b26458d1SJason Yan return -EFSBADCRC;
4652b26458d1SJason Yan }
4653b26458d1SJason Yan
4654b26458d1SJason Yan /* Precompute checksum seed for all metadata */
4655b26458d1SJason Yan if (ext4_has_feature_csum_seed(sb))
4656b26458d1SJason Yan sbi->s_csum_seed = le32_to_cpu(es->s_checksum_seed);
4657b26458d1SJason Yan else if (ext4_has_metadata_csum(sb) || ext4_has_feature_ea_inode(sb))
4658b26458d1SJason Yan sbi->s_csum_seed = ext4_chksum(sbi, ~0, es->s_uuid,
4659b26458d1SJason Yan sizeof(es->s_uuid));
4660b26458d1SJason Yan return 0;
4661b26458d1SJason Yan }
4662b26458d1SJason Yan
ext4_check_feature_compatibility(struct super_block * sb,struct ext4_super_block * es,int silent)4663d7f3542bSJason Yan static int ext4_check_feature_compatibility(struct super_block *sb,
4664d7f3542bSJason Yan struct ext4_super_block *es,
4665d7f3542bSJason Yan int silent)
4666d7f3542bSJason Yan {
466754902099SJason Yan struct ext4_sb_info *sbi = EXT4_SB(sb);
466854902099SJason Yan
4669d7f3542bSJason Yan if (le32_to_cpu(es->s_rev_level) == EXT4_GOOD_OLD_REV &&
4670d7f3542bSJason Yan (ext4_has_compat_features(sb) ||
4671d7f3542bSJason Yan ext4_has_ro_compat_features(sb) ||
4672d7f3542bSJason Yan ext4_has_incompat_features(sb)))
4673d7f3542bSJason Yan ext4_msg(sb, KERN_WARNING,
4674d7f3542bSJason Yan "feature flags set on rev 0 fs, "
4675d7f3542bSJason Yan "running e2fsck is recommended");
4676d7f3542bSJason Yan
4677d7f3542bSJason Yan if (es->s_creator_os == cpu_to_le32(EXT4_OS_HURD)) {
4678d7f3542bSJason Yan set_opt2(sb, HURD_COMPAT);
4679d7f3542bSJason Yan if (ext4_has_feature_64bit(sb)) {
4680d7f3542bSJason Yan ext4_msg(sb, KERN_ERR,
4681d7f3542bSJason Yan "The Hurd can't support 64-bit file systems");
4682d7f3542bSJason Yan return -EINVAL;
4683d7f3542bSJason Yan }
4684d7f3542bSJason Yan
4685d7f3542bSJason Yan /*
4686d7f3542bSJason Yan * ea_inode feature uses l_i_version field which is not
4687d7f3542bSJason Yan * available in HURD_COMPAT mode.
4688d7f3542bSJason Yan */
4689d7f3542bSJason Yan if (ext4_has_feature_ea_inode(sb)) {
4690d7f3542bSJason Yan ext4_msg(sb, KERN_ERR,
4691d7f3542bSJason Yan "ea_inode feature is not supported for Hurd");
4692d7f3542bSJason Yan return -EINVAL;
4693d7f3542bSJason Yan }
4694d7f3542bSJason Yan }
4695d7f3542bSJason Yan
4696d7f3542bSJason Yan if (IS_EXT2_SB(sb)) {
4697d7f3542bSJason Yan if (ext2_feature_set_ok(sb))
4698d7f3542bSJason Yan ext4_msg(sb, KERN_INFO, "mounting ext2 file system "
4699d7f3542bSJason Yan "using the ext4 subsystem");
4700d7f3542bSJason Yan else {
4701d7f3542bSJason Yan /*
4702d7f3542bSJason Yan * If we're probing be silent, if this looks like
4703d7f3542bSJason Yan * it's actually an ext[34] filesystem.
4704d7f3542bSJason Yan */
4705d7f3542bSJason Yan if (silent && ext4_feature_set_ok(sb, sb_rdonly(sb)))
4706d7f3542bSJason Yan return -EINVAL;
4707d7f3542bSJason Yan ext4_msg(sb, KERN_ERR, "couldn't mount as ext2 due "
4708d7f3542bSJason Yan "to feature incompatibilities");
4709d7f3542bSJason Yan return -EINVAL;
4710d7f3542bSJason Yan }
4711d7f3542bSJason Yan }
4712d7f3542bSJason Yan
4713d7f3542bSJason Yan if (IS_EXT3_SB(sb)) {
4714d7f3542bSJason Yan if (ext3_feature_set_ok(sb))
4715d7f3542bSJason Yan ext4_msg(sb, KERN_INFO, "mounting ext3 file system "
4716d7f3542bSJason Yan "using the ext4 subsystem");
4717d7f3542bSJason Yan else {
4718d7f3542bSJason Yan /*
4719d7f3542bSJason Yan * If we're probing be silent, if this looks like
4720d7f3542bSJason Yan * it's actually an ext4 filesystem.
4721d7f3542bSJason Yan */
4722d7f3542bSJason Yan if (silent && ext4_feature_set_ok(sb, sb_rdonly(sb)))
4723d7f3542bSJason Yan return -EINVAL;
4724d7f3542bSJason Yan ext4_msg(sb, KERN_ERR, "couldn't mount as ext3 due "
4725d7f3542bSJason Yan "to feature incompatibilities");
4726d7f3542bSJason Yan return -EINVAL;
4727d7f3542bSJason Yan }
4728d7f3542bSJason Yan }
4729d7f3542bSJason Yan
4730d7f3542bSJason Yan /*
4731d7f3542bSJason Yan * Check feature flags regardless of the revision level, since we
4732d7f3542bSJason Yan * previously didn't change the revision level when setting the flags,
4733d7f3542bSJason Yan * so there is a chance incompat flags are set on a rev 0 filesystem.
4734d7f3542bSJason Yan */
4735d7f3542bSJason Yan if (!ext4_feature_set_ok(sb, (sb_rdonly(sb))))
4736d7f3542bSJason Yan return -EINVAL;
4737d7f3542bSJason Yan
473854902099SJason Yan if (sbi->s_daxdev) {
473954902099SJason Yan if (sb->s_blocksize == PAGE_SIZE)
474054902099SJason Yan set_bit(EXT4_FLAGS_BDEV_IS_DAX, &sbi->s_ext4_flags);
474154902099SJason Yan else
474254902099SJason Yan ext4_msg(sb, KERN_ERR, "unsupported blocksize for DAX\n");
474354902099SJason Yan }
474454902099SJason Yan
474554902099SJason Yan if (sbi->s_mount_opt & EXT4_MOUNT_DAX_ALWAYS) {
474654902099SJason Yan if (ext4_has_feature_inline_data(sb)) {
474754902099SJason Yan ext4_msg(sb, KERN_ERR, "Cannot use DAX on a filesystem"
474854902099SJason Yan " that may contain inline data");
474954902099SJason Yan return -EINVAL;
475054902099SJason Yan }
475154902099SJason Yan if (!test_bit(EXT4_FLAGS_BDEV_IS_DAX, &sbi->s_ext4_flags)) {
475254902099SJason Yan ext4_msg(sb, KERN_ERR,
475354902099SJason Yan "DAX unsupported by block device.");
475454902099SJason Yan return -EINVAL;
475554902099SJason Yan }
475654902099SJason Yan }
475754902099SJason Yan
475854902099SJason Yan if (ext4_has_feature_encrypt(sb) && es->s_encryption_level) {
475954902099SJason Yan ext4_msg(sb, KERN_ERR, "Unsupported encryption level %d",
476054902099SJason Yan es->s_encryption_level);
476154902099SJason Yan return -EINVAL;
476254902099SJason Yan }
476354902099SJason Yan
4764d7f3542bSJason Yan return 0;
4765d7f3542bSJason Yan }
4766d7f3542bSJason Yan
ext4_check_geometry(struct super_block * sb,struct ext4_super_block * es)476768e62439SJason Yan static int ext4_check_geometry(struct super_block *sb,
4768bc62dbf9SJason Yan struct ext4_super_block *es)
4769bc62dbf9SJason Yan {
4770bc62dbf9SJason Yan struct ext4_sb_info *sbi = EXT4_SB(sb);
4771bc62dbf9SJason Yan __u64 blocks_count;
4772269e9226SJason Yan int err;
4773269e9226SJason Yan
4774269e9226SJason Yan if (le16_to_cpu(sbi->s_es->s_reserved_gdt_blocks) > (sb->s_blocksize / 4)) {
4775269e9226SJason Yan ext4_msg(sb, KERN_ERR,
4776269e9226SJason Yan "Number of reserved GDT blocks insanely large: %d",
4777269e9226SJason Yan le16_to_cpu(sbi->s_es->s_reserved_gdt_blocks));
4778269e9226SJason Yan return -EINVAL;
4779269e9226SJason Yan }
4780269e9226SJason Yan /*
4781269e9226SJason Yan * Test whether we have more sectors than will fit in sector_t,
4782269e9226SJason Yan * and whether the max offset is addressable by the page cache.
4783269e9226SJason Yan */
4784269e9226SJason Yan err = generic_check_addressable(sb->s_blocksize_bits,
4785269e9226SJason Yan ext4_blocks_count(es));
4786269e9226SJason Yan if (err) {
4787269e9226SJason Yan ext4_msg(sb, KERN_ERR, "filesystem"
4788269e9226SJason Yan " too large to mount safely on this system");
4789269e9226SJason Yan return err;
4790269e9226SJason Yan }
4791bc62dbf9SJason Yan
4792bc62dbf9SJason Yan /* check blocks count against device size */
4793bc62dbf9SJason Yan blocks_count = sb_bdev_nr_blocks(sb);
4794bc62dbf9SJason Yan if (blocks_count && ext4_blocks_count(es) > blocks_count) {
4795bc62dbf9SJason Yan ext4_msg(sb, KERN_WARNING, "bad geometry: block count %llu "
4796bc62dbf9SJason Yan "exceeds size of device (%llu blocks)",
4797bc62dbf9SJason Yan ext4_blocks_count(es), blocks_count);
4798bc62dbf9SJason Yan return -EINVAL;
4799bc62dbf9SJason Yan }
4800bc62dbf9SJason Yan
4801bc62dbf9SJason Yan /*
4802bc62dbf9SJason Yan * It makes no sense for the first data block to be beyond the end
4803bc62dbf9SJason Yan * of the filesystem.
4804bc62dbf9SJason Yan */
4805bc62dbf9SJason Yan if (le32_to_cpu(es->s_first_data_block) >= ext4_blocks_count(es)) {
4806bc62dbf9SJason Yan ext4_msg(sb, KERN_WARNING, "bad geometry: first data "
4807bc62dbf9SJason Yan "block %u is beyond end of filesystem (%llu)",
4808bc62dbf9SJason Yan le32_to_cpu(es->s_first_data_block),
4809bc62dbf9SJason Yan ext4_blocks_count(es));
4810bc62dbf9SJason Yan return -EINVAL;
4811bc62dbf9SJason Yan }
4812bc62dbf9SJason Yan if ((es->s_first_data_block == 0) && (es->s_log_block_size == 0) &&
4813bc62dbf9SJason Yan (sbi->s_cluster_ratio == 1)) {
4814bc62dbf9SJason Yan ext4_msg(sb, KERN_WARNING, "bad geometry: first data "
4815bc62dbf9SJason Yan "block is 0 with a 1k block and cluster size");
4816bc62dbf9SJason Yan return -EINVAL;
4817bc62dbf9SJason Yan }
4818bc62dbf9SJason Yan
4819bc62dbf9SJason Yan blocks_count = (ext4_blocks_count(es) -
4820bc62dbf9SJason Yan le32_to_cpu(es->s_first_data_block) +
4821bc62dbf9SJason Yan EXT4_BLOCKS_PER_GROUP(sb) - 1);
4822bc62dbf9SJason Yan do_div(blocks_count, EXT4_BLOCKS_PER_GROUP(sb));
4823bc62dbf9SJason Yan if (blocks_count > ((uint64_t)1<<32) - EXT4_DESC_PER_BLOCK(sb)) {
4824bc62dbf9SJason Yan ext4_msg(sb, KERN_WARNING, "groups count too large: %llu "
4825bc62dbf9SJason Yan "(block count %llu, first data block %u, "
4826bc62dbf9SJason Yan "blocks per group %lu)", blocks_count,
4827bc62dbf9SJason Yan ext4_blocks_count(es),
4828bc62dbf9SJason Yan le32_to_cpu(es->s_first_data_block),
4829bc62dbf9SJason Yan EXT4_BLOCKS_PER_GROUP(sb));
4830bc62dbf9SJason Yan return -EINVAL;
4831bc62dbf9SJason Yan }
4832bc62dbf9SJason Yan sbi->s_groups_count = blocks_count;
4833bc62dbf9SJason Yan sbi->s_blockfile_groups = min_t(ext4_group_t, sbi->s_groups_count,
4834bc62dbf9SJason Yan (EXT4_MAX_BLOCK_FILE_PHYS / EXT4_BLOCKS_PER_GROUP(sb)));
4835bc62dbf9SJason Yan if (((u64)sbi->s_groups_count * sbi->s_inodes_per_group) !=
4836bc62dbf9SJason Yan le32_to_cpu(es->s_inodes_count)) {
4837bc62dbf9SJason Yan ext4_msg(sb, KERN_ERR, "inodes count not valid: %u vs %llu",
4838bc62dbf9SJason Yan le32_to_cpu(es->s_inodes_count),
4839bc62dbf9SJason Yan ((u64)sbi->s_groups_count * sbi->s_inodes_per_group));
4840bc62dbf9SJason Yan return -EINVAL;
4841bc62dbf9SJason Yan }
4842bc62dbf9SJason Yan
4843bc62dbf9SJason Yan return 0;
4844bc62dbf9SJason Yan }
4845bc62dbf9SJason Yan
/*
 * Allocate the group descriptor buffer array and read every group
 * descriptor block into it.
 *
 * @sb:               superblock being mounted
 * @es:               on-disk superblock
 * @logical_sb_block: block number of the superblock, passed on to
 *                    descriptor_loc() and ext4_check_descriptors()
 * @first_not_zeroed: passed through to ext4_check_descriptors()
 *
 * sbi->s_gdb_count is set to the number of descriptor buffers actually
 * stored, including on a read failure, where it holds the count read so far.
 *
 * Returns 0 on success, -EINVAL when s_first_meta_bg is out of range,
 * -ENOMEM when the array cannot be allocated, the read error when a
 * descriptor block cannot be read, or -EFSCORRUPTED when
 * ext4_check_descriptors() rejects the descriptors.
 */
static int ext4_group_desc_init(struct super_block *sb,
				struct ext4_super_block *es,
				ext4_fsblk_t logical_sb_block,
				ext4_group_t *first_not_zeroed)
{
	struct ext4_sb_info *sbi = EXT4_SB(sb);
	struct buffer_head *bh;
	unsigned int db_count;
	ext4_fsblk_t block;
	void *descs;
	int i;

	/* Number of descriptor blocks, rounded up. */
	db_count = (sbi->s_groups_count + EXT4_DESC_PER_BLOCK(sb) - 1) /
		   EXT4_DESC_PER_BLOCK(sb);

	if (ext4_has_feature_meta_bg(sb) &&
	    le32_to_cpu(es->s_first_meta_bg) > db_count) {
		ext4_msg(sb, KERN_WARNING,
			 "first meta block group too large: %u (group descriptor block count %u)",
			 le32_to_cpu(es->s_first_meta_bg), db_count);
		return -EINVAL;
	}

	descs = kvmalloc_array(db_count, sizeof(struct buffer_head *),
			       GFP_KERNEL);
	rcu_assign_pointer(sbi->s_group_desc, descs);
	if (!descs) {
		ext4_msg(sb, KERN_ERR, "not enough memory");
		return -ENOMEM;
	}

	bgl_lock_init(sbi->s_blockgroup_lock);

	/* Pre-read the descriptors into the buffer cache */
	for (i = 0; i < db_count; i++) {
		block = descriptor_loc(sb, logical_sb_block, i);
		ext4_sb_breadahead_unmovable(sb, block);
	}

	for (i = 0; i < db_count; i++) {
		block = descriptor_loc(sb, logical_sb_block, i);
		bh = ext4_sb_bread_unmovable(sb, block);
		if (IS_ERR(bh)) {
			ext4_msg(sb, KERN_ERR,
				 "can't read group descriptor %d", i);
			/* Record how many buffers were stored before failing. */
			sbi->s_gdb_count = i;
			return PTR_ERR(bh);
		}
		rcu_read_lock();
		rcu_dereference(sbi->s_group_desc)[i] = bh;
		rcu_read_unlock();
	}
	sbi->s_gdb_count = db_count;

	if (!ext4_check_descriptors(sb, logical_sb_block, first_not_zeroed)) {
		ext4_msg(sb, KERN_ERR, "group descriptors corrupted!");
		return -EFSCORRUPTED;
	}

	return 0;
}
4907a4e6a511SJason Yan
ext4_load_and_init_journal(struct super_block * sb,struct ext4_super_block * es,struct ext4_fs_context * ctx)49089c1dd22dSJason Yan static int ext4_load_and_init_journal(struct super_block *sb,
49099c1dd22dSJason Yan struct ext4_super_block *es,
49109c1dd22dSJason Yan struct ext4_fs_context *ctx)
49119c1dd22dSJason Yan {
49129c1dd22dSJason Yan struct ext4_sb_info *sbi = EXT4_SB(sb);
49139c1dd22dSJason Yan int err;
49149c1dd22dSJason Yan
49159c1dd22dSJason Yan err = ext4_load_journal(sb, es, ctx->journal_devnum);
49169c1dd22dSJason Yan if (err)
49179c1dd22dSJason Yan return err;
49189c1dd22dSJason Yan
49199c1dd22dSJason Yan if (ext4_has_feature_64bit(sb) &&
49209c1dd22dSJason Yan !jbd2_journal_set_features(EXT4_SB(sb)->s_journal, 0, 0,
49219c1dd22dSJason Yan JBD2_FEATURE_INCOMPAT_64BIT)) {
49229c1dd22dSJason Yan ext4_msg(sb, KERN_ERR, "Failed to set 64-bit journal feature");
49239c1dd22dSJason Yan goto out;
49249c1dd22dSJason Yan }
49259c1dd22dSJason Yan
49269c1dd22dSJason Yan if (!set_journal_csum_feature_set(sb)) {
49279c1dd22dSJason Yan ext4_msg(sb, KERN_ERR, "Failed to set journal checksum "
49289c1dd22dSJason Yan "feature set");
49299c1dd22dSJason Yan goto out;
49309c1dd22dSJason Yan }
49319c1dd22dSJason Yan
49329c1dd22dSJason Yan if (test_opt2(sb, JOURNAL_FAST_COMMIT) &&
49339c1dd22dSJason Yan !jbd2_journal_set_features(EXT4_SB(sb)->s_journal, 0, 0,
49349c1dd22dSJason Yan JBD2_FEATURE_INCOMPAT_FAST_COMMIT)) {
49359c1dd22dSJason Yan ext4_msg(sb, KERN_ERR,
49369c1dd22dSJason Yan "Failed to set fast commit journal feature");
49379c1dd22dSJason Yan goto out;
49389c1dd22dSJason Yan }
49399c1dd22dSJason Yan
49409c1dd22dSJason Yan /* We have now updated the journal if required, so we can
49419c1dd22dSJason Yan * validate the data journaling mode. */
49429c1dd22dSJason Yan switch (test_opt(sb, DATA_FLAGS)) {
49439c1dd22dSJason Yan case 0:
49449c1dd22dSJason Yan /* No mode set, assume a default based on the journal
49459c1dd22dSJason Yan * capabilities: ORDERED_DATA if the journal can
49469c1dd22dSJason Yan * cope, else JOURNAL_DATA
49479c1dd22dSJason Yan */
49489c1dd22dSJason Yan if (jbd2_journal_check_available_features
49499c1dd22dSJason Yan (sbi->s_journal, 0, 0, JBD2_FEATURE_INCOMPAT_REVOKE)) {
49509c1dd22dSJason Yan set_opt(sb, ORDERED_DATA);
49519c1dd22dSJason Yan sbi->s_def_mount_opt |= EXT4_MOUNT_ORDERED_DATA;
49529c1dd22dSJason Yan } else {
49539c1dd22dSJason Yan set_opt(sb, JOURNAL_DATA);
49549c1dd22dSJason Yan sbi->s_def_mount_opt |= EXT4_MOUNT_JOURNAL_DATA;
49559c1dd22dSJason Yan }
49569c1dd22dSJason Yan break;
49579c1dd22dSJason Yan
49589c1dd22dSJason Yan case EXT4_MOUNT_ORDERED_DATA:
49599c1dd22dSJason Yan case EXT4_MOUNT_WRITEBACK_DATA:
49609c1dd22dSJason Yan if (!jbd2_journal_check_available_features
49619c1dd22dSJason Yan (sbi->s_journal, 0, 0, JBD2_FEATURE_INCOMPAT_REVOKE)) {
49629c1dd22dSJason Yan ext4_msg(sb, KERN_ERR, "Journal does not support "
49639c1dd22dSJason Yan "requested data journaling mode");
49649c1dd22dSJason Yan goto out;
49659c1dd22dSJason Yan }
49669c1dd22dSJason Yan break;
49679c1dd22dSJason Yan default:
49689c1dd22dSJason Yan break;
49699c1dd22dSJason Yan }
49709c1dd22dSJason Yan
49719c1dd22dSJason Yan if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_ORDERED_DATA &&
49729c1dd22dSJason Yan test_opt(sb, JOURNAL_ASYNC_COMMIT)) {
49739c1dd22dSJason Yan ext4_msg(sb, KERN_ERR, "can't mount with "
49749c1dd22dSJason Yan "journal_async_commit in data=ordered mode");
49759c1dd22dSJason Yan goto out;
49769c1dd22dSJason Yan }
49779c1dd22dSJason Yan
49789c1dd22dSJason Yan set_task_ioprio(sbi->s_journal->j_task, ctx->journal_ioprio);
49799c1dd22dSJason Yan
49809c1dd22dSJason Yan sbi->s_journal->j_submit_inode_data_buffers =
49819c1dd22dSJason Yan ext4_journal_submit_inode_data_buffers;
49829c1dd22dSJason Yan sbi->s_journal->j_finish_inode_data_buffers =
49839c1dd22dSJason Yan ext4_journal_finish_inode_data_buffers;
49849c1dd22dSJason Yan
49859c1dd22dSJason Yan return 0;
49869c1dd22dSJason Yan
49879c1dd22dSJason Yan out:
4988bb15cea2STheodore Ts'o /* flush s_sb_upd_work before destroying the journal. */
4989bb15cea2STheodore Ts'o flush_work(&sbi->s_sb_upd_work);
49909c1dd22dSJason Yan jbd2_journal_destroy(sbi->s_journal);
49919c1dd22dSJason Yan sbi->s_journal = NULL;
49929f2a1d9fSJason Yan return -EINVAL;
49939c1dd22dSJason Yan }
49949c1dd22dSJason Yan
ext4_check_journal_data_mode(struct super_block * sb)499568e62439SJason Yan static int ext4_check_journal_data_mode(struct super_block *sb)
4996a5991e53SJason Yan {
4997a5991e53SJason Yan if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_JOURNAL_DATA) {
4998a5991e53SJason Yan printk_once(KERN_WARNING "EXT4-fs: Warning: mounting with "
4999a5991e53SJason Yan "data=journal disables delayed allocation, "
5000a5991e53SJason Yan "dioread_nolock, O_DIRECT and fast_commit support!\n");
5001a5991e53SJason Yan /* can't mount with both data=journal and dioread_nolock. */
5002a5991e53SJason Yan clear_opt(sb, DIOREAD_NOLOCK);
5003a5991e53SJason Yan clear_opt2(sb, JOURNAL_FAST_COMMIT);
5004a5991e53SJason Yan if (test_opt2(sb, EXPLICIT_DELALLOC)) {
5005a5991e53SJason Yan ext4_msg(sb, KERN_ERR, "can't mount with "
5006a5991e53SJason Yan "both data=journal and delalloc");
5007a5991e53SJason Yan return -EINVAL;
5008a5991e53SJason Yan }
5009a5991e53SJason Yan if (test_opt(sb, DAX_ALWAYS)) {
5010a5991e53SJason Yan ext4_msg(sb, KERN_ERR, "can't mount with "
5011a5991e53SJason Yan "both data=journal and dax");
5012a5991e53SJason Yan return -EINVAL;
5013a5991e53SJason Yan }
5014a5991e53SJason Yan if (ext4_has_feature_encrypt(sb)) {
5015a5991e53SJason Yan ext4_msg(sb, KERN_WARNING,
5016a5991e53SJason Yan "encrypted files will use data=ordered "
5017a5991e53SJason Yan "instead of data journaling mode");
5018a5991e53SJason Yan }
5019a5991e53SJason Yan if (test_opt(sb, DELALLOC))
5020a5991e53SJason Yan clear_opt(sb, DELALLOC);
5021a5991e53SJason Yan } else {
5022a5991e53SJason Yan sb->s_iflags |= SB_I_CGROUPWB;
5023a5991e53SJason Yan }
5024a5991e53SJason Yan
5025a5991e53SJason Yan return 0;
5026a5991e53SJason Yan }
5027a5991e53SJason Yan
/*
 * Read the on-disk superblock and settle on the filesystem block size.
 *
 * @sb:     superblock being mounted
 * @lsb:    on success, receives the logical block number that holds the
 *          superblock
 * @silent: non-zero to suppress the "Can't find ext4 filesystem" message
 *
 * The superblock is first read using the minimum block size.  If the block
 * size recorded in it differs from the one in use, the block size is
 * switched and the superblock is read a second time.
 *
 * On success sbi->s_sbh holds the superblock buffer, sbi->s_es points into
 * it and sb->s_magic is set.  Returns 0 on success, the read error when the
 * superblock cannot be read, or -EINVAL for any other failure.
 */
static int ext4_load_super(struct super_block *sb, ext4_fsblk_t *lsb,
			   int silent)
{
	struct ext4_sb_info *sbi = EXT4_SB(sb);
	struct ext4_super_block *es;
	struct buffer_head *bh;
	ext4_fsblk_t sb_block;
	unsigned long offset = 0;
	int blocksize;
	int ret = -EINVAL;

	blocksize = sb_min_blocksize(sb, EXT4_MIN_BLOCK_SIZE);
	if (!blocksize) {
		ext4_msg(sb, KERN_ERR, "unable to set blocksize");
		return -EINVAL;
	}

	/*
	 * The ext4 superblock will not be buffer aligned for other than 1kB
	 * block sizes.  We need to calculate the offset from buffer start.
	 */
	if (blocksize == EXT4_MIN_BLOCK_SIZE) {
		sb_block = sbi->s_sb_block;
	} else {
		sb_block = sbi->s_sb_block * EXT4_MIN_BLOCK_SIZE;
		offset = do_div(sb_block, blocksize);
	}

	bh = ext4_sb_bread_unmovable(sb, sb_block);
	if (IS_ERR(bh)) {
		ext4_msg(sb, KERN_ERR, "unable to read superblock");
		return PTR_ERR(bh);
	}

	/*
	 * Note: s_es must be initialized as soon as possible because
	 * some ext4 macro-instructions depend on its value
	 */
	es = (struct ext4_super_block *)(bh->b_data + offset);
	sbi->s_es = es;
	sb->s_magic = le16_to_cpu(es->s_magic);
	if (sb->s_magic != EXT4_SUPER_MAGIC) {
		if (!silent)
			ext4_msg(sb, KERN_ERR, "VFS: Can't find ext4 filesystem");
		goto out;
	}

	if (le32_to_cpu(es->s_log_block_size) >
	    (EXT4_MAX_BLOCK_LOG_SIZE - EXT4_MIN_BLOCK_LOG_SIZE)) {
		ext4_msg(sb, KERN_ERR, "Invalid log block size: %u",
			 le32_to_cpu(es->s_log_block_size));
		goto out;
	}
	if (le32_to_cpu(es->s_log_cluster_size) >
	    (EXT4_MAX_CLUSTER_LOG_SIZE - EXT4_MIN_BLOCK_LOG_SIZE)) {
		ext4_msg(sb, KERN_ERR, "Invalid log cluster size: %u",
			 le32_to_cpu(es->s_log_cluster_size));
		goto out;
	}

	blocksize = EXT4_MIN_BLOCK_SIZE << le32_to_cpu(es->s_log_block_size);

	/*
	 * If the default block size is the same as the real block size,
	 * the buffer we already hold is the one to keep.
	 */
	if (sb->s_blocksize == blocksize)
		goto done;

	/*
	 * bh must be released before kill_bdev(), otherwise
	 * it won't be freed and its page also. kill_bdev()
	 * is called by sb_set_blocksize().
	 */
	brelse(bh);

	/* Validate the filesystem blocksize */
	if (!sb_set_blocksize(sb, blocksize)) {
		ext4_msg(sb, KERN_ERR, "bad block size %d", blocksize);
		/* The buffer has already been released above. */
		return -EINVAL;
	}

	/* Re-read the superblock using the real block size. */
	sb_block = sbi->s_sb_block * EXT4_MIN_BLOCK_SIZE;
	offset = do_div(sb_block, blocksize);
	bh = ext4_sb_bread_unmovable(sb, sb_block);
	if (IS_ERR(bh)) {
		ext4_msg(sb, KERN_ERR, "Can't read superblock on 2nd try");
		return PTR_ERR(bh);
	}
	es = (struct ext4_super_block *)(bh->b_data + offset);
	sbi->s_es = es;
	if (es->s_magic != cpu_to_le16(EXT4_SUPER_MAGIC)) {
		ext4_msg(sb, KERN_ERR, "Magic mismatch, very weird!");
		goto out;
	}

done:
	*lsb = sb_block;
	sbi->s_sbh = bh;
	return 0;

out:
	brelse(bh);
	return ret;
}
5137a7a79c29SJason Yan
ext4_hash_info_init(struct super_block * sb)5138db9345d9SJason Yan static void ext4_hash_info_init(struct super_block *sb)
5139db9345d9SJason Yan {
5140db9345d9SJason Yan struct ext4_sb_info *sbi = EXT4_SB(sb);
5141db9345d9SJason Yan struct ext4_super_block *es = sbi->s_es;
5142db9345d9SJason Yan unsigned int i;
5143db9345d9SJason Yan
5144db9345d9SJason Yan for (i = 0; i < 4; i++)
5145db9345d9SJason Yan sbi->s_hash_seed[i] = le32_to_cpu(es->s_hash_seed[i]);
5146db9345d9SJason Yan
5147db9345d9SJason Yan sbi->s_def_hash_version = es->s_def_hash_version;
5148db9345d9SJason Yan if (ext4_has_feature_dir_index(sb)) {
5149db9345d9SJason Yan i = le32_to_cpu(es->s_flags);
5150db9345d9SJason Yan if (i & EXT2_FLAGS_UNSIGNED_HASH)
5151db9345d9SJason Yan sbi->s_hash_unsigned = 3;
5152db9345d9SJason Yan else if ((i & EXT2_FLAGS_SIGNED_HASH) == 0) {
5153db9345d9SJason Yan #ifdef __CHAR_UNSIGNED__
5154db9345d9SJason Yan if (!sb_rdonly(sb))
5155db9345d9SJason Yan es->s_flags |=
5156db9345d9SJason Yan cpu_to_le32(EXT2_FLAGS_UNSIGNED_HASH);
5157db9345d9SJason Yan sbi->s_hash_unsigned = 3;
5158db9345d9SJason Yan #else
5159db9345d9SJason Yan if (!sb_rdonly(sb))
5160db9345d9SJason Yan es->s_flags |=
5161db9345d9SJason Yan cpu_to_le32(EXT2_FLAGS_SIGNED_HASH);
5162db9345d9SJason Yan #endif
5163db9345d9SJason Yan }
5164db9345d9SJason Yan }
5165db9345d9SJason Yan }
5166db9345d9SJason Yan
ext4_block_group_meta_init(struct super_block * sb,int silent)5167107d2be9SJason Yan static int ext4_block_group_meta_init(struct super_block *sb, int silent)
5168107d2be9SJason Yan {
5169107d2be9SJason Yan struct ext4_sb_info *sbi = EXT4_SB(sb);
5170107d2be9SJason Yan struct ext4_super_block *es = sbi->s_es;
5171107d2be9SJason Yan int has_huge_files;
5172107d2be9SJason Yan
5173107d2be9SJason Yan has_huge_files = ext4_has_feature_huge_file(sb);
5174107d2be9SJason Yan sbi->s_bitmap_maxbytes = ext4_max_bitmap_size(sb->s_blocksize_bits,
5175107d2be9SJason Yan has_huge_files);
5176107d2be9SJason Yan sb->s_maxbytes = ext4_max_size(sb->s_blocksize_bits, has_huge_files);
5177107d2be9SJason Yan
5178107d2be9SJason Yan sbi->s_desc_size = le16_to_cpu(es->s_desc_size);
5179107d2be9SJason Yan if (ext4_has_feature_64bit(sb)) {
5180107d2be9SJason Yan if (sbi->s_desc_size < EXT4_MIN_DESC_SIZE_64BIT ||
5181107d2be9SJason Yan sbi->s_desc_size > EXT4_MAX_DESC_SIZE ||
5182107d2be9SJason Yan !is_power_of_2(sbi->s_desc_size)) {
5183107d2be9SJason Yan ext4_msg(sb, KERN_ERR,
5184107d2be9SJason Yan "unsupported descriptor size %lu",
5185107d2be9SJason Yan sbi->s_desc_size);
5186107d2be9SJason Yan return -EINVAL;
5187107d2be9SJason Yan }
5188107d2be9SJason Yan } else
5189107d2be9SJason Yan sbi->s_desc_size = EXT4_MIN_DESC_SIZE;
5190107d2be9SJason Yan
5191107d2be9SJason Yan sbi->s_blocks_per_group = le32_to_cpu(es->s_blocks_per_group);
5192107d2be9SJason Yan sbi->s_inodes_per_group = le32_to_cpu(es->s_inodes_per_group);
5193107d2be9SJason Yan
5194107d2be9SJason Yan sbi->s_inodes_per_block = sb->s_blocksize / EXT4_INODE_SIZE(sb);
5195107d2be9SJason Yan if (sbi->s_inodes_per_block == 0 || sbi->s_blocks_per_group == 0) {
5196107d2be9SJason Yan if (!silent)
5197107d2be9SJason Yan ext4_msg(sb, KERN_ERR, "VFS: Can't find ext4 filesystem");
5198107d2be9SJason Yan return -EINVAL;
5199107d2be9SJason Yan }
5200107d2be9SJason Yan if (sbi->s_inodes_per_group < sbi->s_inodes_per_block ||
5201107d2be9SJason Yan sbi->s_inodes_per_group > sb->s_blocksize * 8) {
5202107d2be9SJason Yan ext4_msg(sb, KERN_ERR, "invalid inodes per group: %lu\n",
5203107d2be9SJason Yan sbi->s_inodes_per_group);
5204107d2be9SJason Yan return -EINVAL;
5205107d2be9SJason Yan }
5206107d2be9SJason Yan sbi->s_itb_per_group = sbi->s_inodes_per_group /
5207107d2be9SJason Yan sbi->s_inodes_per_block;
5208107d2be9SJason Yan sbi->s_desc_per_block = sb->s_blocksize / EXT4_DESC_SIZE(sb);
5209107d2be9SJason Yan sbi->s_mount_state = le16_to_cpu(es->s_state) & ~EXT4_FC_REPLAY;
5210107d2be9SJason Yan sbi->s_addr_per_block_bits = ilog2(EXT4_ADDR_PER_BLOCK(sb));
5211107d2be9SJason Yan sbi->s_desc_per_block_bits = ilog2(EXT4_DESC_PER_BLOCK(sb));
5212107d2be9SJason Yan
5213107d2be9SJason Yan return 0;
5214107d2be9SJason Yan }
5215107d2be9SJason Yan
5216faeff8b1SOjaswin Mujoo /*
5217faeff8b1SOjaswin Mujoo * It's hard to get stripe aligned blocks if stripe is not aligned with
5218faeff8b1SOjaswin Mujoo * cluster, just disable stripe and alert user to simplify code and avoid
5219faeff8b1SOjaswin Mujoo * stripe aligned allocation which will rarely succeed.
5220faeff8b1SOjaswin Mujoo */
ext4_is_stripe_incompatible(struct super_block * sb,unsigned long stripe)5221faeff8b1SOjaswin Mujoo static bool ext4_is_stripe_incompatible(struct super_block *sb, unsigned long stripe)
5222faeff8b1SOjaswin Mujoo {
5223faeff8b1SOjaswin Mujoo struct ext4_sb_info *sbi = EXT4_SB(sb);
5224faeff8b1SOjaswin Mujoo return (stripe > 0 && sbi->s_cluster_ratio > 1 &&
5225faeff8b1SOjaswin Mujoo stripe % sbi->s_cluster_ratio != 0);
5226faeff8b1SOjaswin Mujoo }
5227faeff8b1SOjaswin Mujoo
/*
 * __ext4_fill_super() - perform the bulk of an ext4 mount.
 * @fc: filesystem context; fc->fs_private is the parsed ext4_fs_context and
 *      fc->sb_flags supplies SB_SILENT.
 * @sb: superblock being set up.  EXT4_SB(sb) is read and dereferenced right
 *      away, so the ext4_sb_info must already be attached by the caller.
 *
 * In order, this loads the on-disk superblock, applies defaults and mount
 * options, checks feature compatibility and geometry, initialises the group
 * descriptors, sets up the superblock operation tables, loads the journal
 * (or validates the no-journal configuration), creates the xattr caches and
 * the rsv-conversion workqueue, reads the root inode, initialises mballoc,
 * orphan info and quotas, runs orphan cleanup and finally registers sysfs.
 *
 * Returns 0 on success or a negative errno.  Failures unwind through the
 * failed_mount* labels at the bottom; every failure path ends by clearing
 * sb->s_fs_info.
 */
__ext4_fill_super(struct fs_context * fc,struct super_block * sb)5228960e0ab6SLukas Czerner static int __ext4_fill_super(struct fs_context *fc, struct super_block *sb)
52297edfd85bSLukas Czerner {
5230617ba13bSMingming Cao struct ext4_super_block *es = NULL;
52317edfd85bSLukas Czerner struct ext4_sb_info *sbi = EXT4_SB(sb);
523270bbb3e0SAndrew Morton ext4_fsblk_t logical_sb_block;
5233ac27a0ecSDave Kleikamp struct inode *root;
5234107d2be9SJason Yan int needs_recovery;
5235d4fab7b2STheodore Ts'o int err;
5236bfff6873SLukas Czerner ext4_group_t first_not_zeroed;
52377edfd85bSLukas Czerner struct ext4_fs_context *ctx = fc->fs_private;
5238960e0ab6SLukas Czerner int silent = fc->sb_flags & SB_SILENT;
5239b237e304SHarshad Shirwadkar
5240b237e304SHarshad Shirwadkar /* Set defaults for the variables that will be set during parsing */
5241e4e58e5dSOjaswin Mujoo if (!(ctx->spec & EXT4_SPEC_JOURNAL_IOPRIO))
52427edfd85bSLukas Czerner ctx->journal_ioprio = DEFAULT_JOURNAL_IOPRIO;
5243ac27a0ecSDave Kleikamp
5244240799cdSTheodore Ts'o sbi->s_inode_readahead_blks = EXT4_DEF_INODE_READAHEAD_BLKS;
5245f613dfcbSTheodore Ts'o sbi->s_sectors_written_start =
52468446fe92SChristoph Hellwig part_stat_read(sb->s_bdev, sectors[STAT_WRITE]);
5247ac27a0ecSDave Kleikamp
5248a7a79c29SJason Yan err = ext4_load_super(sb, &logical_sb_block, silent);
5249a7a79c29SJason Yan if (err)
5250ac27a0ecSDave Kleikamp goto out_fail;
5251ac27a0ecSDave Kleikamp
5252a7a79c29SJason Yan es = sbi->s_es;
5253afc32f7eSTheodore Ts'o sbi->s_kbytes_written = le64_to_cpu(es->s_kbytes_written);
5254ac27a0ecSDave Kleikamp
5255b26458d1SJason Yan err = ext4_init_metadata_csum(sb, es);
5256b26458d1SJason Yan if (err)
5257a5fc5119SJason Yan goto failed_mount;
5258a9c47317SDarrick J. Wong
52595f6d662dSJason Yan ext4_set_def_opts(sb, es);
5260ac27a0ecSDave Kleikamp
526108cefc7aSEric W. Biederman sbi->s_resuid = make_kuid(&init_user_ns, le16_to_cpu(es->s_def_resuid));
526208cefc7aSEric W. Biederman sbi->s_resgid = make_kgid(&init_user_ns, le16_to_cpu(es->s_def_resgid));
526330773840STheodore Ts'o sbi->s_commit_interval = JBD2_DEFAULT_MAX_COMMIT_AGE * HZ;
526430773840STheodore Ts'o sbi->s_min_batch_time = EXT4_DEF_MIN_BATCH_TIME;
526530773840STheodore Ts'o sbi->s_max_batch_time = EXT4_DEF_MAX_BATCH_TIME;
5266ac27a0ecSDave Kleikamp
526751ce6511SLukas Czerner /*
526851ce6511SLukas Czerner * set default s_li_wait_mult for lazyinit, for the case there is
526951ce6511SLukas Czerner * no mount option specified.
527051ce6511SLukas Czerner */
527151ce6511SLukas Czerner sbi->s_li_wait_mult = EXT4_DEF_LI_WAIT_MULT;
527251ce6511SLukas Czerner
5273d4fab7b2STheodore Ts'o err = ext4_inode_info_init(sb, es);
5274d4fab7b2STheodore Ts'o if (err)
52759803387cSTheodore Ts'o goto failed_mount;
52769803387cSTheodore Ts'o
52777edfd85bSLukas Czerner err = parse_apply_sb_mount_options(sb, ctx);
52787edfd85bSLukas Czerner if (err < 0)
52795aee0f8aSTheodore Ts'o goto failed_mount;
52807edfd85bSLukas Czerner
52815a916be1STheodore Ts'o sbi->s_def_mount_opt = sbi->s_mount_opt;
5282e3645d72SZhang Yi sbi->s_def_mount_opt2 = sbi->s_mount_opt2;
52837edfd85bSLukas Czerner
52847edfd85bSLukas Czerner err = ext4_check_opt_consistency(fc, sb);
52857edfd85bSLukas Czerner if (err < 0)
52867edfd85bSLukas Czerner goto failed_mount;
52877edfd85bSLukas Czerner
528885456054SEric Biggers ext4_apply_options(fc, sb);
5289ac27a0ecSDave Kleikamp
5290d4fab7b2STheodore Ts'o err = ext4_encoding_init(sb, es);
5291d4fab7b2STheodore Ts'o if (err)
5292c83ad55eSGabriel Krisman Bertazi goto failed_mount;
5293c83ad55eSGabriel Krisman Bertazi
5294d4fab7b2STheodore Ts'o err = ext4_check_journal_data_mode(sb);
5295d4fab7b2STheodore Ts'o if (err)
529656889787STheodore Ts'o goto failed_mount;
529756889787STheodore Ts'o
52981751e8a6SLinus Torvalds sb->s_flags = (sb->s_flags & ~SB_POSIXACL) |
52991751e8a6SLinus Torvalds (test_opt(sb, POSIX_ACL) ? SB_POSIXACL : 0);
5300ac27a0ecSDave Kleikamp
53011ff20307SJeff Layton /* i_version is always enabled now */
53021ff20307SJeff Layton sb->s_flags |= SB_I_VERSION;
53031ff20307SJeff Layton
5304d4fab7b2STheodore Ts'o err = ext4_check_feature_compatibility(sb, es, silent);
5305d4fab7b2STheodore Ts'o if (err)
5306ac27a0ecSDave Kleikamp goto failed_mount;
5307a13fb1a4SEric Sandeen
5308d4fab7b2STheodore Ts'o err = ext4_block_group_meta_init(sb, silent);
5309d4fab7b2STheodore Ts'o if (err)
53105b9554dcSTheodore Ts'o goto failed_mount;
53115b9554dcSTheodore Ts'o
5312db9345d9SJason Yan ext4_hash_info_init(sb);
5313ac27a0ecSDave Kleikamp
5314d4fab7b2STheodore Ts'o err = ext4_handle_clustersize(sb);
5315d4fab7b2STheodore Ts'o if (err)
5316281b5995STheodore Ts'o goto failed_mount;
5317960fd856STheodore Ts'o
5318d4fab7b2STheodore Ts'o err = ext4_check_geometry(sb, es);
5319d4fab7b2STheodore Ts'o if (err)
53200f2ddca6SFrom: Thiemo Nagel goto failed_mount;
53210f2ddca6SFrom: Thiemo Nagel
5322235699a8SKees Cook timer_setup(&sbi->s_err_report, print_daily_error_info, 0);
5323c92dc856SJan Kara spin_lock_init(&sbi->s_error_lock);
5324bb15cea2STheodore Ts'o INIT_WORK(&sbi->s_sb_upd_work, update_super_work);
532504496411STao Ma
5326172e344eSYe Bin err = ext4_group_desc_init(sb, es, logical_sb_block, &first_not_zeroed);
5327172e344eSYe Bin if (err)
5328172e344eSYe Bin goto failed_mount3;
5329172e344eSYe Bin
5330d4fab7b2STheodore Ts'o err = ext4_es_register_shrinker(sbi);
5331d4fab7b2STheodore Ts'o if (err)
5332ce7e010aSTheodore Ts'o goto failed_mount3;
5333ce7e010aSTheodore Ts'o
5334c9de560dSAlex Tomas sbi->s_stripe = ext4_get_stripe_size(sbi);
5335faeff8b1SOjaswin Mujoo if (ext4_is_stripe_incompatible(sb, sbi->s_stripe)) {
5336c3defd99SKemeng Shi ext4_msg(sb, KERN_WARNING,
5337c3defd99SKemeng Shi "stripe (%lu) is not aligned with cluster size (%u), "
5338c3defd99SKemeng Shi "stripe is disabled",
5339c3defd99SKemeng Shi sbi->s_stripe, sbi->s_cluster_ratio);
5340c3defd99SKemeng Shi sbi->s_stripe = 0;
5341c3defd99SKemeng Shi }
534267a5da56SZheng Liu sbi->s_extent_max_zeroout_kb = 32;
5343c9de560dSAlex Tomas
5344f9ae9cf5STheodore Ts'o /*
5345f9ae9cf5STheodore Ts'o * set up enough so that it can read an inode
5346f9ae9cf5STheodore Ts'o */
5347f9ae9cf5STheodore Ts'o sb->s_op = &ext4_sops;
5348617ba13bSMingming Cao sb->s_export_op = &ext4_export_ops;
5349617ba13bSMingming Cao sb->s_xattr = ext4_xattr_handlers;
5350643fa961SChandan Rajendra #ifdef CONFIG_FS_ENCRYPTION
5351a7550b30SJaegeuk Kim sb->s_cop = &ext4_cryptops;
5352ffcc4182SEric Biggers #endif
5353c93d8f88SEric Biggers #ifdef CONFIG_FS_VERITY
5354c93d8f88SEric Biggers sb->s_vop = &ext4_verityops;
5355c93d8f88SEric Biggers #endif
5356ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
5357617ba13bSMingming Cao sb->dq_op = &ext4_quota_operations;
5358e2b911c5SDarrick J. Wong if (ext4_has_feature_quota(sb))
53591fa5efe3SJan Kara sb->s_qcop = &dquot_quotactl_sysfile_ops;
5360262b4662SJan Kara else
5361262b4662SJan Kara sb->s_qcop = &ext4_qctl_operations;
5362689c958cSLi Xi sb->s_quota_types = QTYPE_MASK_USR | QTYPE_MASK_GRP | QTYPE_MASK_PRJ;
5363ac27a0ecSDave Kleikamp #endif
536485787090SChristoph Hellwig memcpy(&sb->s_uuid, es->s_uuid, sizeof(es->s_uuid));
5365f2fa2ffcSAneesh Kumar K.V
5366ac27a0ecSDave Kleikamp INIT_LIST_HEAD(&sbi->s_orphan); /* unlinked but open files */
53673b9d4ed2STheodore Ts'o mutex_init(&sbi->s_orphan_lock);
5368ac27a0ecSDave Kleikamp
5369*6e35f560SLuis Henriques (SUSE) spin_lock_init(&sbi->s_bdev_wb_lock);
5370*6e35f560SLuis Henriques (SUSE)
5371f7314a67SJason Yan ext4_fast_commit_init(sb);
5372aa75f4d3SHarshad Shirwadkar
5373ac27a0ecSDave Kleikamp sb->s_root = NULL;
5374ac27a0ecSDave Kleikamp
5375ac27a0ecSDave Kleikamp needs_recovery = (es->s_last_orphan != 0 ||
537602f310fcSJan Kara ext4_has_feature_orphan_present(sb) ||
5377e2b911c5SDarrick J. Wong ext4_has_feature_journal_needs_recovery(sb));
5378ac27a0ecSDave Kleikamp
53793b50d501STheodore Ts'o if (ext4_has_feature_mmp(sb) && !sb_rdonly(sb)) {
53803b50d501STheodore Ts'o err = ext4_multi_mount_protect(sb, le64_to_cpu(es->s_mmp_block));
53813b50d501STheodore Ts'o if (err)
538250460fe8SDarrick J. Wong goto failed_mount3a;
53833b50d501STheodore Ts'o }
5384c5e06d10SJohann Lombardi
/*
 * Default error for the option-conflict checks below, which jump to
 * failed_mount3a without assigning err themselves.
 */
5385d4fab7b2STheodore Ts'o err = -EINVAL;
5386ac27a0ecSDave Kleikamp /*
5387ac27a0ecSDave Kleikamp * The first inode we look at is the journal inode. Don't try
5388ac27a0ecSDave Kleikamp * root first: it may be modified in the journal!
5389ac27a0ecSDave Kleikamp */
5390e2b911c5SDarrick J. Wong if (!test_opt(sb, NOLOAD) && ext4_has_feature_journal(sb)) {
53919c1dd22dSJason Yan err = ext4_load_and_init_journal(sb, es, ctx);
53924753d8a2STheodore Ts'o if (err)
539350460fe8SDarrick J. Wong goto failed_mount3a;
5394bc98a42cSDavid Howells } else if (test_opt(sb, NOLOAD) && !sb_rdonly(sb) &&
5395e2b911c5SDarrick J. Wong ext4_has_feature_journal_needs_recovery(sb)) {
5396b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "required journal recovery "
5397b31e1552SEric Sandeen "suppressed and not mounted read-only");
539843bd6f1bSJason Yan goto failed_mount3a;
5399ac27a0ecSDave Kleikamp } else {
54001e381f60SDmitry Monakhov /* Nojournal mode, all journal mount options are illegal */
54011e381f60SDmitry Monakhov if (test_opt(sb, JOURNAL_ASYNC_COMMIT)) {
54021e381f60SDmitry Monakhov ext4_msg(sb, KERN_ERR, "can't mount with "
54031e381f60SDmitry Monakhov "journal_async_commit, fs mounted w/o journal");
540443bd6f1bSJason Yan goto failed_mount3a;
54051e381f60SDmitry Monakhov }
540689481b5fSBaokun Li
540789481b5fSBaokun Li if (test_opt2(sb, EXPLICIT_JOURNAL_CHECKSUM)) {
540889481b5fSBaokun Li ext4_msg(sb, KERN_ERR, "can't mount with "
540989481b5fSBaokun Li "journal_checksum, fs mounted w/o journal");
541089481b5fSBaokun Li goto failed_mount3a;
541189481b5fSBaokun Li }
54121e381f60SDmitry Monakhov if (sbi->s_commit_interval != JBD2_DEFAULT_MAX_COMMIT_AGE*HZ) {
54131e381f60SDmitry Monakhov ext4_msg(sb, KERN_ERR, "can't mount with "
54141e381f60SDmitry Monakhov "commit=%lu, fs mounted w/o journal",
54151e381f60SDmitry Monakhov sbi->s_commit_interval / HZ);
541643bd6f1bSJason Yan goto failed_mount3a;
54171e381f60SDmitry Monakhov }
54181e381f60SDmitry Monakhov if (EXT4_MOUNT_DATA_FLAGS &
54191e381f60SDmitry Monakhov (sbi->s_mount_opt ^ sbi->s_def_mount_opt)) {
54201e381f60SDmitry Monakhov ext4_msg(sb, KERN_ERR, "can't mount with "
54211e381f60SDmitry Monakhov "data=, fs mounted w/o journal");
542243bd6f1bSJason Yan goto failed_mount3a;
54231e381f60SDmitry Monakhov }
542450b29d8fSDebabrata Banerjee sbi->s_def_mount_opt &= ~EXT4_MOUNT_JOURNAL_CHECKSUM;
54251e381f60SDmitry Monakhov clear_opt(sb, JOURNAL_CHECKSUM);
5426fd8c37ecSTheodore Ts'o clear_opt(sb, DATA_FLAGS);
5427995a3ed6SHarshad Shirwadkar clear_opt2(sb, JOURNAL_FAST_COMMIT);
54280390131bSFrank Mayhar sbi->s_journal = NULL;
54290390131bSFrank Mayhar needs_recovery = 0;
5430ac27a0ecSDave Kleikamp }
5431ac27a0ecSDave Kleikamp
5432cdb7ee4cSTahsin Erdogan if (!test_opt(sb, NO_MBCACHE)) {
543347387409STahsin Erdogan sbi->s_ea_block_cache = ext4_xattr_create_cache();
543447387409STahsin Erdogan if (!sbi->s_ea_block_cache) {
5435cdb7ee4cSTahsin Erdogan ext4_msg(sb, KERN_ERR,
5436cdb7ee4cSTahsin Erdogan "Failed to create ea_block_cache");
5437d4fab7b2STheodore Ts'o err = -EINVAL;
54389c191f70ST Makphaibulchoke goto failed_mount_wq;
54399c191f70ST Makphaibulchoke }
54409c191f70ST Makphaibulchoke
5441dec214d0STahsin Erdogan if (ext4_has_feature_ea_inode(sb)) {
5442dec214d0STahsin Erdogan sbi->s_ea_inode_cache = ext4_xattr_create_cache();
5443dec214d0STahsin Erdogan if (!sbi->s_ea_inode_cache) {
5444dec214d0STahsin Erdogan ext4_msg(sb, KERN_ERR,
5445dec214d0STahsin Erdogan "Failed to create ea_inode_cache");
5446d4fab7b2STheodore Ts'o err = -EINVAL;
5447dec214d0STahsin Erdogan goto failed_mount_wq;
5448dec214d0STahsin Erdogan }
5449dec214d0STahsin Erdogan }
5450cdb7ee4cSTahsin Erdogan }
5451dec214d0STahsin Erdogan
5452fd89d5f2STejun Heo /*
5453952fc18eSTheodore Ts'o * Get the # of file system overhead blocks from the
5454952fc18eSTheodore Ts'o * superblock if present.
5455952fc18eSTheodore Ts'o */
5456952fc18eSTheodore Ts'o sbi->s_overhead = le32_to_cpu(es->s_overhead_clusters);
545785d825dbSTheodore Ts'o /* ignore the precalculated value if it is ridiculous */
545885d825dbSTheodore Ts'o if (sbi->s_overhead > ext4_blocks_count(es))
545985d825dbSTheodore Ts'o sbi->s_overhead = 0;
546085d825dbSTheodore Ts'o /*
546185d825dbSTheodore Ts'o * If the bigalloc feature is not enabled recalculating the
546285d825dbSTheodore Ts'o * overhead doesn't take long, so we might as well just redo
546385d825dbSTheodore Ts'o * it to make sure we are using the correct value.
546485d825dbSTheodore Ts'o */
546585d825dbSTheodore Ts'o if (!ext4_has_feature_bigalloc(sb))
546685d825dbSTheodore Ts'o sbi->s_overhead = 0;
546785d825dbSTheodore Ts'o if (sbi->s_overhead == 0) {
546807aa2ea1SLukas Czerner err = ext4_calculate_overhead(sb);
546907aa2ea1SLukas Czerner if (err)
5470952fc18eSTheodore Ts'o goto failed_mount_wq;
5471952fc18eSTheodore Ts'o }
5472952fc18eSTheodore Ts'o
5473952fc18eSTheodore Ts'o /*
5474fd89d5f2STejun Heo * The maximum number of concurrent works can be high and
5475fd89d5f2STejun Heo * concurrency isn't really necessary. Limit it to 1.
5476fd89d5f2STejun Heo */
54772e8fa54eSJan Kara EXT4_SB(sb)->rsv_conversion_wq =
54782e8fa54eSJan Kara alloc_workqueue("ext4-rsv-conversion", WQ_MEM_RECLAIM | WQ_UNBOUND, 1);
54792e8fa54eSJan Kara if (!EXT4_SB(sb)->rsv_conversion_wq) {
54802e8fa54eSJan Kara printk(KERN_ERR "EXT4-fs: failed to create workqueue\n");
5481d4fab7b2STheodore Ts'o err = -ENOMEM;
54822e8fa54eSJan Kara goto failed_mount4;
54832e8fa54eSJan Kara }
54842e8fa54eSJan Kara
5485ac27a0ecSDave Kleikamp /*
5486dab291afSMingming Cao * The jbd2_journal_load will have done any necessary log recovery,
5487ac27a0ecSDave Kleikamp * so we can safely mount the rest of the filesystem now.
5488ac27a0ecSDave Kleikamp */
5489ac27a0ecSDave Kleikamp
54908a363970STheodore Ts'o root = ext4_iget(sb, EXT4_ROOT_INO, EXT4_IGET_SPECIAL);
54911d1fe1eeSDavid Howells if (IS_ERR(root)) {
5492b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "get root inode failed");
5493d4fab7b2STheodore Ts'o err = PTR_ERR(root);
549432a9bb57SManish Katiyar root = NULL;
5495ac27a0ecSDave Kleikamp goto failed_mount4;
5496ac27a0ecSDave Kleikamp }
5497ac27a0ecSDave Kleikamp if (!S_ISDIR(root->i_mode) || !root->i_blocks || !root->i_size) {
5498b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "corrupt root inode, run e2fsck");
549994bf608aSAl Viro iput(root);
5500d4fab7b2STheodore Ts'o err = -EFSCORRUPTED;
5501ac27a0ecSDave Kleikamp goto failed_mount4;
5502ac27a0ecSDave Kleikamp }
5503b886ee3eSGabriel Krisman Bertazi
550448fde701SAl Viro sb->s_root = d_make_root(root);
55051d1fe1eeSDavid Howells if (!sb->s_root) {
5506b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "get root dentry failed");
5507d4fab7b2STheodore Ts'o err = -ENOMEM;
55081d1fe1eeSDavid Howells goto failed_mount4;
55091d1fe1eeSDavid Howells }
5510ac27a0ecSDave Kleikamp
/*
 * -EROFS from ext4_setup_super() is not fatal: the superblock is marked
 * read-only and the mount continues.  Any other error aborts the mount.
 */
5511d4fab7b2STheodore Ts'o err = ext4_setup_super(sb, es, sb_rdonly(sb));
5512d4fab7b2STheodore Ts'o if (err == -EROFS) {
55131751e8a6SLinus Torvalds sb->s_flags |= SB_RDONLY;
5514d4fab7b2STheodore Ts'o } else if (err)
5515c89128a0SJaegeuk Kim goto failed_mount4a;
5516ef7f3835SKalpak Shah
5517b5799018STheodore Ts'o ext4_set_resv_clusters(sb);
551827dd4385SLukas Czerner
55190f5bde1dSJan Kara if (test_opt(sb, BLOCK_VALIDITY)) {
55206fd058f7STheodore Ts'o err = ext4_setup_system_zone(sb);
55216fd058f7STheodore Ts'o if (err) {
5522b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "failed to initialize system "
5523fbe845ddSCurt Wohlgemuth "zone (%d)", err);
5524f9ae9cf5STheodore Ts'o goto failed_mount4a;
5525f9ae9cf5STheodore Ts'o }
55260f5bde1dSJan Kara }
55278016e29fSHarshad Shirwadkar ext4_fc_replay_cleanup(sb);
5528f9ae9cf5STheodore Ts'o
5529f9ae9cf5STheodore Ts'o ext4_ext_init(sb);
5530196e402aSHarshad Shirwadkar
5531196e402aSHarshad Shirwadkar /*
5532196e402aSHarshad Shirwadkar * Enable optimize_scan if number of groups is > threshold. This can be
5533196e402aSHarshad Shirwadkar * turned off by passing "mb_optimize_scan=0". This can also be
5534196e402aSHarshad Shirwadkar * turned on forcefully by passing "mb_optimize_scan=1".
5535196e402aSHarshad Shirwadkar */
553627b38686SOjaswin Mujoo if (!(ctx->spec & EXT4_SPEC_mb_optimize_scan)) {
553727b38686SOjaswin Mujoo if (sbi->s_groups_count >= MB_DEFAULT_LINEAR_SCAN_THRESHOLD)
5538196e402aSHarshad Shirwadkar set_opt2(sb, MB_OPTIMIZE_SCAN);
553927b38686SOjaswin Mujoo else
5540196e402aSHarshad Shirwadkar clear_opt2(sb, MB_OPTIMIZE_SCAN);
554127b38686SOjaswin Mujoo }
5542196e402aSHarshad Shirwadkar
5543f9ae9cf5STheodore Ts'o err = ext4_mb_init(sb);
5544f9ae9cf5STheodore Ts'o if (err) {
5545f9ae9cf5STheodore Ts'o ext4_msg(sb, KERN_ERR, "failed to initialize mballoc (%d)",
5546f9ae9cf5STheodore Ts'o err);
5547dcf2d804STao Ma goto failed_mount5;
5548c2774d84SAneesh Kumar K.V }
5549c2774d84SAneesh Kumar K.V
5550027f14f5STheodore Ts'o /*
5551027f14f5STheodore Ts'o * We can only set up the journal commit callback once
5552027f14f5STheodore Ts'o * mballoc is initialized
5553027f14f5STheodore Ts'o */
5554027f14f5STheodore Ts'o if (sbi->s_journal)
5555027f14f5STheodore Ts'o sbi->s_journal->j_commit_callback =
5556027f14f5STheodore Ts'o ext4_journal_commit_callback;
5557027f14f5STheodore Ts'o
5558d5e72c4eSTheodore Ts'o err = ext4_percpu_param_init(sbi);
5559d5e72c4eSTheodore Ts'o if (err)
5560d5e03cbbSTheodore Ts'o goto failed_mount6;
5561d5e03cbbSTheodore Ts'o
5562e2b911c5SDarrick J. Wong if (ext4_has_feature_flex_bg(sb))
5563d5e03cbbSTheodore Ts'o if (!ext4_fill_flex_info(sb)) {
5564d5e03cbbSTheodore Ts'o ext4_msg(sb, KERN_ERR,
5565d5e03cbbSTheodore Ts'o "unable to initialize "
5566d5e03cbbSTheodore Ts'o "flex_bg meta info!");
5567d4fab7b2STheodore Ts'o err = -ENOMEM;
5568d5e03cbbSTheodore Ts'o goto failed_mount6;
5569d5e03cbbSTheodore Ts'o }
5570d5e03cbbSTheodore Ts'o
5571bfff6873SLukas Czerner err = ext4_register_li_request(sb, first_not_zeroed);
5572bfff6873SLukas Czerner if (err)
5573dcf2d804STao Ma goto failed_mount6;
5574bfff6873SLukas Czerner
557502f310fcSJan Kara err = ext4_init_orphan_info(sb);
557602f310fcSJan Kara if (err)
557723afcd52SBaokun Li goto failed_mount7;
55789b2ff357SJan Kara #ifdef CONFIG_QUOTA
55799b2ff357SJan Kara /* Enable quota usage during mount. */
5580bc98a42cSDavid Howells if (ext4_has_feature_quota(sb) && !sb_rdonly(sb)) {
55819b2ff357SJan Kara err = ext4_enable_quotas(sb);
55829b2ff357SJan Kara if (err)
558323afcd52SBaokun Li goto failed_mount8;
55849b2ff357SJan Kara }
55859b2ff357SJan Kara #endif /* CONFIG_QUOTA */
55869b2ff357SJan Kara
5587bc71726cSzhangyi (F) /*
5588bc71726cSzhangyi (F) * Save the original bdev mapping's wb_err value which could be
5589bc71726cSzhangyi (F) * used to detect the metadata async write error.
5590bc71726cSzhangyi (F) */
5591bc71726cSzhangyi (F) errseq_check_and_advance(&sb->s_bdev->bd_inode->i_mapping->wb_err,
5592bc71726cSzhangyi (F) &sbi->s_bdev_wb_err);
5593617ba13bSMingming Cao EXT4_SB(sb)->s_mount_state |= EXT4_ORPHAN_FS;
5594617ba13bSMingming Cao ext4_orphan_cleanup(sb, es);
5595617ba13bSMingming Cao EXT4_SB(sb)->s_mount_state &= ~EXT4_ORPHAN_FS;
55969b6641ddSYe Bin /*
55979b6641ddSYe Bin * Update the checksum after updating free space/inode counters and
55989b6641ddSYe Bin * ext4_orphan_cleanup. Otherwise the superblock can have an incorrect
55999b6641ddSYe Bin * checksum in the buffer cache until it is written out and
56009b6641ddSYe Bin * e2fsprogs programs trying to open a file system immediately
56019b6641ddSYe Bin * after it is mounted can fail.
56029b6641ddSYe Bin */
56039b6641ddSYe Bin ext4_superblock_csum_set(sb);
56040390131bSFrank Mayhar if (needs_recovery) {
5605b31e1552SEric Sandeen ext4_msg(sb, KERN_INFO, "recovery complete");
560611215630SJan Kara err = ext4_mark_recovery_complete(sb, es);
560711215630SJan Kara if (err)
560823afcd52SBaokun Li goto failed_mount9;
56090390131bSFrank Mayhar }
56100390131bSFrank Mayhar
561170200574SChristoph Hellwig if (test_opt(sb, DISCARD) && !bdev_max_discard_sectors(sb->s_bdev))
561279add3a3SLukas Czerner ext4_msg(sb, KERN_WARNING,
561370200574SChristoph Hellwig "mounting with \"discard\" option, but the device does not support discard");
561479add3a3SLukas Czerner
561566e61a9eSTheodore Ts'o if (es->s_error_count)
561666e61a9eSTheodore Ts'o mod_timer(&sbi->s_err_report, jiffies + 300*HZ); /* 5 minutes */
5617ac27a0ecSDave Kleikamp
5618efbed4dcSTheodore Ts'o /* Enable message ratelimiting. Default is 10 messages per 5 secs. */
5619efbed4dcSTheodore Ts'o ratelimit_state_init(&sbi->s_err_ratelimit_state, 5 * HZ, 10);
5620efbed4dcSTheodore Ts'o ratelimit_state_init(&sbi->s_warning_ratelimit_state, 5 * HZ, 10);
5621efbed4dcSTheodore Ts'o ratelimit_state_init(&sbi->s_msg_ratelimit_state, 5 * HZ, 10);
56221cf006edSDmitry Monakhov atomic_set(&sbi->s_warning_count, 0);
56231cf006edSDmitry Monakhov atomic_set(&sbi->s_msg_count, 0);
5624efbed4dcSTheodore Ts'o
562523afcd52SBaokun Li /* Register sysfs after all initializations are complete. */
562623afcd52SBaokun Li err = ext4_register_sysfs(sb);
562723afcd52SBaokun Li if (err)
562823afcd52SBaokun Li goto failed_mount9;
562923afcd52SBaokun Li
5630ac27a0ecSDave Kleikamp return 0;
5631ac27a0ecSDave Kleikamp
/*
 * Error unwinding.  Each label falls through into the ones below it, so a
 * goto to one label also runs every cleanup step that follows it.
 */
563223afcd52SBaokun Li failed_mount9:
5633f3c1c42eSBaokun Li ext4_quotas_off(sb, EXT4_MAXQUOTAS);
/* The only goto to failed_mount8 sits under CONFIG_QUOTA, hence __maybe_unused. */
563423afcd52SBaokun Li failed_mount8: __maybe_unused
563502f310fcSJan Kara ext4_release_orphan_info(sb);
5636dcf2d804STao Ma failed_mount7:
5637dcf2d804STao Ma ext4_unregister_li_request(sb);
5638dcf2d804STao Ma failed_mount6:
5639f9ae9cf5STheodore Ts'o ext4_mb_release(sb);
5640dcbf8758SJason Yan ext4_flex_groups_free(sbi);
56411f79467cSJason Yan ext4_percpu_param_destroy(sbi);
564200764937SAzat Khuzhin failed_mount5:
5643f9ae9cf5STheodore Ts'o ext4_ext_release(sb);
5644f9ae9cf5STheodore Ts'o ext4_release_system_zone(sb);
5645f9ae9cf5STheodore Ts'o failed_mount4a:
564694bf608aSAl Viro dput(sb->s_root);
564732a9bb57SManish Katiyar sb->s_root = NULL;
564894bf608aSAl Viro failed_mount4:
5649b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "mount failed");
56502e8fa54eSJan Kara if (EXT4_SB(sb)->rsv_conversion_wq)
56512e8fa54eSJan Kara destroy_workqueue(EXT4_SB(sb)->rsv_conversion_wq);
56524c0425ffSMingming Cao failed_mount_wq:
5653dec214d0STahsin Erdogan ext4_xattr_destroy_cache(sbi->s_ea_inode_cache);
5654dec214d0STahsin Erdogan sbi->s_ea_inode_cache = NULL;
565550c15df6SChengguang Xu
565647387409STahsin Erdogan ext4_xattr_destroy_cache(sbi->s_ea_block_cache);
565747387409STahsin Erdogan sbi->s_ea_block_cache = NULL;
565850c15df6SChengguang Xu
56590390131bSFrank Mayhar if (sbi->s_journal) {
5660bb15cea2STheodore Ts'o /* flush s_sb_upd_work before journal destroy. */
5661bb15cea2STheodore Ts'o flush_work(&sbi->s_sb_upd_work);
5662dab291afSMingming Cao jbd2_journal_destroy(sbi->s_journal);
566347b4a50bSJan Kara sbi->s_journal = NULL;
56640390131bSFrank Mayhar }
566550460fe8SDarrick J. Wong failed_mount3a:
5666d3922a77SZheng Liu ext4_es_unregister_shrinker(sbi);
5667eb68d0e2SZheng Liu failed_mount3:
5668bb15cea2STheodore Ts'o /* flush s_sb_upd_work before sbi destroy */
5669bb15cea2STheodore Ts'o flush_work(&sbi->s_sb_upd_work);
5670618f0031SPavel Skripkin ext4_stop_mmpd(sbi);
56719203817bSXiaxi Shen del_timer_sync(&sbi->s_err_report);
5672a4e6a511SJason Yan ext4_group_desc_free(sbi);
5673ac27a0ecSDave Kleikamp failed_mount:
56740441984aSDarrick J. Wong if (sbi->s_chksum_driver)
56750441984aSDarrick J. Wong crypto_free_shash(sbi->s_chksum_driver);
5676c83ad55eSGabriel Krisman Bertazi
56775298d4bfSChristoph Hellwig #if IS_ENABLED(CONFIG_UNICODE)
5678f8f4acb6SDaniel Rosenberg utf8_unload(sb->s_encoding);
5679c83ad55eSGabriel Krisman Bertazi #endif
5680c83ad55eSGabriel Krisman Bertazi
5681ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
5682856dd6c5SNathan Chancellor for (unsigned int i = 0; i < EXT4_MAXQUOTAS; i++)
56830ba33facSTheodore Ts'o kfree(get_qf_name(sb, sbi, i));
5684ac27a0ecSDave Kleikamp #endif
5685ac4acb1fSEric Biggers fscrypt_free_dummy_policy(&sbi->s_dummy_enc_policy);
5686a7a79c29SJason Yan brelse(sbi->s_sbh);
56871489dffdSChristoph Hellwig if (sbi->s_journal_bdev) {
56881489dffdSChristoph Hellwig invalidate_bdev(sbi->s_journal_bdev);
56891489dffdSChristoph Hellwig blkdev_put(sbi->s_journal_bdev, sb);
56901489dffdSChristoph Hellwig }
5691ac27a0ecSDave Kleikamp out_fail:
569226fb5290SZhihao Cheng invalidate_bdev(sb->s_bdev);
5693ac27a0ecSDave Kleikamp sb->s_fs_info = NULL;
5694d4fab7b2STheodore Ts'o return err;
5695ac27a0ecSDave Kleikamp }
5696ac27a0ecSDave Kleikamp
ext4_fill_super(struct super_block * sb,struct fs_context * fc)5697cebe85d5SLukas Czerner static int ext4_fill_super(struct super_block *sb, struct fs_context *fc)
56987edfd85bSLukas Czerner {
5699cebe85d5SLukas Czerner struct ext4_fs_context *ctx = fc->fs_private;
57007edfd85bSLukas Czerner struct ext4_sb_info *sbi;
57017edfd85bSLukas Czerner const char *descr;
5702cebe85d5SLukas Czerner int ret;
57037edfd85bSLukas Czerner
5704cebe85d5SLukas Czerner sbi = ext4_alloc_sbi(sb);
5705cebe85d5SLukas Czerner if (!sbi)
57067c268d4cSLukas Czerner return -ENOMEM;
5707cebe85d5SLukas Czerner
5708cebe85d5SLukas Czerner fc->s_fs_info = sbi;
57097edfd85bSLukas Czerner
57107edfd85bSLukas Czerner /* Cleanup superblock name */
57117edfd85bSLukas Czerner strreplace(sb->s_id, '/', '!');
57127edfd85bSLukas Czerner
57137edfd85bSLukas Czerner sbi->s_sb_block = 1; /* Default super block location */
5714cebe85d5SLukas Czerner if (ctx->spec & EXT4_SPEC_s_sb_block)
5715cebe85d5SLukas Czerner sbi->s_sb_block = ctx->s_sb_block;
57167edfd85bSLukas Czerner
5717960e0ab6SLukas Czerner ret = __ext4_fill_super(fc, sb);
57187edfd85bSLukas Czerner if (ret < 0)
57197edfd85bSLukas Czerner goto free_sbi;
57207edfd85bSLukas Czerner
5721cebe85d5SLukas Czerner if (sbi->s_journal) {
57227edfd85bSLukas Czerner if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_JOURNAL_DATA)
57237edfd85bSLukas Czerner descr = " journalled data mode";
57247edfd85bSLukas Czerner else if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_ORDERED_DATA)
57257edfd85bSLukas Czerner descr = " ordered data mode";
57267edfd85bSLukas Czerner else
57277edfd85bSLukas Czerner descr = " writeback data mode";
57287edfd85bSLukas Czerner } else
57297edfd85bSLukas Czerner descr = "out journal";
57307edfd85bSLukas Czerner
57317edfd85bSLukas Czerner if (___ratelimit(&ext4_mount_msg_ratelimit, "EXT4-fs mount"))
57326dcc98fbSTheodore Ts'o ext4_msg(sb, KERN_INFO, "mounted filesystem %pU %s with%s. "
57336dcc98fbSTheodore Ts'o "Quota mode: %s.", &sb->s_uuid,
57346dcc98fbSTheodore Ts'o sb_rdonly(sb) ? "ro" : "r/w", descr,
5735bb0fbc78SLukas Czerner ext4_quota_mode(sb));
57367edfd85bSLukas Czerner
5737eb705421STheodore Ts'o /* Update the s_overhead_clusters if necessary */
5738827891a3STheodore Ts'o ext4_update_overhead(sb, false);
57397edfd85bSLukas Czerner return 0;
5740cebe85d5SLukas Czerner
57417edfd85bSLukas Czerner free_sbi:
57427edfd85bSLukas Czerner ext4_free_sbi(sbi);
5743cebe85d5SLukas Czerner fc->s_fs_info = NULL;
57447edfd85bSLukas Czerner return ret;
57457edfd85bSLukas Czerner }
57467edfd85bSLukas Czerner
ext4_get_tree(struct fs_context * fc)5747cebe85d5SLukas Czerner static int ext4_get_tree(struct fs_context *fc)
5748cebe85d5SLukas Czerner {
5749cebe85d5SLukas Czerner return get_tree_bdev(fc, ext4_fill_super);
5750cebe85d5SLukas Czerner }
5751cebe85d5SLukas Czerner
5752ac27a0ecSDave Kleikamp /*
5753ac27a0ecSDave Kleikamp * Setup any per-fs journal parameters now. We'll do this both on
5754ac27a0ecSDave Kleikamp * initial mount, once the journal has been initialised but before we've
5755ac27a0ecSDave Kleikamp * done any recovery; and again on any subsequent remount.
5756ac27a0ecSDave Kleikamp */
ext4_init_journal_params(struct super_block * sb,journal_t * journal)5757617ba13bSMingming Cao static void ext4_init_journal_params(struct super_block *sb, journal_t *journal)
5758ac27a0ecSDave Kleikamp {
5759617ba13bSMingming Cao struct ext4_sb_info *sbi = EXT4_SB(sb);
5760ac27a0ecSDave Kleikamp
5761ac27a0ecSDave Kleikamp journal->j_commit_interval = sbi->s_commit_interval;
576230773840STheodore Ts'o journal->j_min_batch_time = sbi->s_min_batch_time;
576330773840STheodore Ts'o journal->j_max_batch_time = sbi->s_max_batch_time;
57646866d7b3SHarshad Shirwadkar ext4_fc_init(sb, journal);
5765ac27a0ecSDave Kleikamp
5766a931da6aSTheodore Ts'o write_lock(&journal->j_state_lock);
5767ac27a0ecSDave Kleikamp if (test_opt(sb, BARRIER))
5768dab291afSMingming Cao journal->j_flags |= JBD2_BARRIER;
5769ac27a0ecSDave Kleikamp else
5770dab291afSMingming Cao journal->j_flags &= ~JBD2_BARRIER;
57715bf5683aSHidehiro Kawai if (test_opt(sb, DATA_ERR_ABORT))
57725bf5683aSHidehiro Kawai journal->j_flags |= JBD2_ABORT_ON_SYNCDATA_ERR;
57735bf5683aSHidehiro Kawai else
57745bf5683aSHidehiro Kawai journal->j_flags &= ~JBD2_ABORT_ON_SYNCDATA_ERR;
577572945058SZhang Yi /*
577672945058SZhang Yi * Always enable journal cycle record option, letting the journal
577772945058SZhang Yi * records log transactions continuously between each mount.
577872945058SZhang Yi */
577972945058SZhang Yi journal->j_flags |= JBD2_CYCLE_RECORD;
5780a931da6aSTheodore Ts'o write_unlock(&journal->j_state_lock);
5781ac27a0ecSDave Kleikamp }
5782ac27a0ecSDave Kleikamp
ext4_get_journal_inode(struct super_block * sb,unsigned int journal_inum)5783c6cb7e77SEric Whitney static struct inode *ext4_get_journal_inode(struct super_block *sb,
5784ac27a0ecSDave Kleikamp unsigned int journal_inum)
5785ac27a0ecSDave Kleikamp {
5786ac27a0ecSDave Kleikamp struct inode *journal_inode;
5787ac27a0ecSDave Kleikamp
5788c6cb7e77SEric Whitney /*
5789c6cb7e77SEric Whitney * Test for the existence of a valid inode on disk. Bad things
5790c6cb7e77SEric Whitney * happen if we iget() an unused inode, as the subsequent iput()
5791c6cb7e77SEric Whitney * will try to delete it.
5792c6cb7e77SEric Whitney */
57938a363970STheodore Ts'o journal_inode = ext4_iget(sb, journal_inum, EXT4_IGET_SPECIAL);
57941d1fe1eeSDavid Howells if (IS_ERR(journal_inode)) {
5795b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "no journal found");
5796ee5c8071SZhang Yi return ERR_CAST(journal_inode);
5797ac27a0ecSDave Kleikamp }
5798ac27a0ecSDave Kleikamp if (!journal_inode->i_nlink) {
5799ac27a0ecSDave Kleikamp make_bad_inode(journal_inode);
5800ac27a0ecSDave Kleikamp iput(journal_inode);
5801b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "journal inode is deleted");
5802ee5c8071SZhang Yi return ERR_PTR(-EFSCORRUPTED);
5803ac27a0ecSDave Kleikamp }
5804105c78e1SEric Biggers if (!S_ISREG(journal_inode->i_mode) || IS_ENCRYPTED(journal_inode)) {
5805b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "invalid journal inode");
5806ac27a0ecSDave Kleikamp iput(journal_inode);
5807ee5c8071SZhang Yi return ERR_PTR(-EFSCORRUPTED);
5808c6cb7e77SEric Whitney }
5809c6cb7e77SEric Whitney
5810c6cb7e77SEric Whitney ext4_debug("Journal inode found at %p: %lld bytes\n",
5811c6cb7e77SEric Whitney journal_inode, journal_inode->i_size);
5812c6cb7e77SEric Whitney return journal_inode;
5813c6cb7e77SEric Whitney }
5814c6cb7e77SEric Whitney
/*
 * ext4_journal_bmap() - map a block of the journal inode for jbd2.
 * @journal: journal whose j_inode is used for the lookup
 * @block:   in: block number within the journal inode;
 *           out: map.m_pblk as filled in by ext4_map_blocks().  Only
 *           written when the lookup succeeds.
 *
 * Returns 0 on success, and also 0 (leaving *block untouched) when the
 * journal has no inode.  When ext4_map_blocks() fails or returns 0, the
 * journal is aborted and a negative errno is returned; a zero result is
 * reported as -EIO.
 *
 * The value returned on failure is the same one passed to
 * jbd2_journal_abort().  Previously a zero result from ext4_map_blocks()
 * was returned as-is, so the caller saw success while *block still held
 * the untranslated input.
 */
static int ext4_journal_bmap(journal_t *journal, sector_t *block)
{
	struct ext4_map_blocks map;
	int ret;

	if (journal->j_inode == NULL)
		return 0;

	map.m_lblk = *block;
	map.m_len = 1;
	ret = ext4_map_blocks(NULL, journal->j_inode, &map, 0);
	if (ret <= 0) {
		/* Never report success (0) for a block that was not mapped. */
		int err = ret ? ret : -EIO;

		ext4_msg(journal->j_inode->i_sb, KERN_CRIT,
			 "journal bmap failed: block %llu ret %d\n",
			 *block, ret);
		jbd2_journal_abort(journal, err);
		return err;
	}
	*block = map.m_pblk;
	return 0;
}
583662913ae9STheodore Ts'o
ext4_open_inode_journal(struct super_block * sb,unsigned int journal_inum)5837ee5c8071SZhang Yi static journal_t *ext4_open_inode_journal(struct super_block *sb,
5838c6cb7e77SEric Whitney unsigned int journal_inum)
5839c6cb7e77SEric Whitney {
5840c6cb7e77SEric Whitney struct inode *journal_inode;
5841c6cb7e77SEric Whitney journal_t *journal;
5842c6cb7e77SEric Whitney
5843c6cb7e77SEric Whitney journal_inode = ext4_get_journal_inode(sb, journal_inum);
5844ee5c8071SZhang Yi if (IS_ERR(journal_inode))
5845ee5c8071SZhang Yi return ERR_CAST(journal_inode);
5846ac27a0ecSDave Kleikamp
5847dab291afSMingming Cao journal = jbd2_journal_init_inode(journal_inode);
58488e6cf5fbSZhang Yi if (IS_ERR(journal)) {
5849b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "Could not load journal inode");
5850ac27a0ecSDave Kleikamp iput(journal_inode);
5851ee5c8071SZhang Yi return ERR_CAST(journal);
5852ac27a0ecSDave Kleikamp }
5853ac27a0ecSDave Kleikamp journal->j_private = sb;
585462913ae9STheodore Ts'o journal->j_bmap = ext4_journal_bmap;
5855617ba13bSMingming Cao ext4_init_journal_params(sb, journal);
5856ac27a0ecSDave Kleikamp return journal;
5857ac27a0ecSDave Kleikamp }
5858ac27a0ecSDave Kleikamp
/*
 * Open the external journal device @j_dev and validate the ext4 superblock
 * stored on it.
 *
 * On success the opened block device is returned, *j_start is set to the
 * block following the journal device's superblock and *j_len to the block
 * count recorded in that superblock.  On failure the device is released
 * again (if it was opened) and an ERR_PTR() is returned.
 */
static struct block_device *ext4_get_journal_blkdev(struct super_block *sb,
					dev_t j_dev, ext4_fsblk_t *j_start,
					ext4_fsblk_t *j_len)
{
	struct block_device *jbdev;
	struct buffer_head *sb_bh;
	struct ext4_super_block *jsb;
	ext4_fsblk_t sb_block;
	unsigned long offset;
	int blocksize, hblock;
	int err;

	/* see get_tree_bdev why this is needed and safe */
	up_write(&sb->s_umount);
	jbdev = blkdev_get_by_dev(j_dev, BLK_OPEN_READ | BLK_OPEN_WRITE, sb,
				  &fs_holder_ops);
	down_write(&sb->s_umount);
	if (IS_ERR(jbdev)) {
		ext4_msg(sb, KERN_ERR,
			 "failed to open journal device unknown-block(%u,%u) %ld",
			 MAJOR(j_dev), MINOR(j_dev), PTR_ERR(jbdev));
		return ERR_CAST(jbdev);
	}

	/* The filesystem block size must cover the device's logical block. */
	blocksize = sb->s_blocksize;
	hblock = bdev_logical_block_size(jbdev);
	if (blocksize < hblock) {
		ext4_msg(sb, KERN_ERR,
			 "blocksize too small for journal device");
		err = -EINVAL;
		goto out_bdev;
	}

	/*
	 * The superblock sits at byte offset EXT4_MIN_BLOCK_SIZE; work out
	 * which block holds it and where it starts inside that block.
	 */
	sb_block = EXT4_MIN_BLOCK_SIZE / blocksize;
	offset = EXT4_MIN_BLOCK_SIZE % blocksize;
	set_blocksize(jbdev, blocksize);
	sb_bh = __bread(jbdev, sb_block, blocksize);
	if (!sb_bh) {
		ext4_msg(sb, KERN_ERR, "couldn't read superblock of "
			 "external journal");
		err = -EINVAL;
		goto out_bdev;
	}

	jsb = (struct ext4_super_block *)(sb_bh->b_data + offset);

	/* Every validation failure below is reported as corruption. */
	err = -EFSCORRUPTED;

	if (le16_to_cpu(jsb->s_magic) != EXT4_SUPER_MAGIC ||
	    !(le32_to_cpu(jsb->s_feature_incompat) &
	      EXT4_FEATURE_INCOMPAT_JOURNAL_DEV)) {
		ext4_msg(sb, KERN_ERR, "external journal has bad superblock");
		goto out_bh;
	}

	/* The checksum is only verified when metadata_csum is advertised. */
	if ((le32_to_cpu(jsb->s_feature_ro_compat) &
	     EXT4_FEATURE_RO_COMPAT_METADATA_CSUM) &&
	    jsb->s_checksum != ext4_superblock_csum(sb, jsb)) {
		ext4_msg(sb, KERN_ERR, "external journal has corrupt superblock");
		goto out_bh;
	}

	/* The journal device must be the one this filesystem refers to. */
	if (memcmp(EXT4_SB(sb)->s_es->s_journal_uuid, jsb->s_uuid, 16)) {
		ext4_msg(sb, KERN_ERR, "journal UUID does not match");
		goto out_bh;
	}

	*j_start = sb_block + 1;
	*j_len = ext4_blocks_count(jsb);
	brelse(sb_bh);
	return jbdev;

out_bh:
	brelse(sb_bh);
out_bdev:
	blkdev_put(jbdev, sb);
	return ERR_PTR(err);
}
5937ac27a0ecSDave Kleikamp
ext4_open_dev_journal(struct super_block * sb,dev_t j_dev)5938ee5c8071SZhang Yi static journal_t *ext4_open_dev_journal(struct super_block *sb,
5939bc74e6a3SZhang Yi dev_t j_dev)
5940bc74e6a3SZhang Yi {
5941bc74e6a3SZhang Yi journal_t *journal;
5942bc74e6a3SZhang Yi ext4_fsblk_t j_start;
5943bc74e6a3SZhang Yi ext4_fsblk_t j_len;
5944bc74e6a3SZhang Yi struct block_device *journal_bdev;
5945ee5c8071SZhang Yi int errno = 0;
5946ac27a0ecSDave Kleikamp
5947bc74e6a3SZhang Yi journal_bdev = ext4_get_journal_blkdev(sb, j_dev, &j_start, &j_len);
5948ee5c8071SZhang Yi if (IS_ERR(journal_bdev))
5949ee5c8071SZhang Yi return ERR_CAST(journal_bdev);
5950bc74e6a3SZhang Yi
5951bc74e6a3SZhang Yi journal = jbd2_journal_init_dev(journal_bdev, sb->s_bdev, j_start,
5952bc74e6a3SZhang Yi j_len, sb->s_blocksize);
59538e6cf5fbSZhang Yi if (IS_ERR(journal)) {
5954b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "failed to create device journal");
5955ee5c8071SZhang Yi errno = PTR_ERR(journal);
5956ac27a0ecSDave Kleikamp goto out_bdev;
5957ac27a0ecSDave Kleikamp }
5958ac27a0ecSDave Kleikamp if (be32_to_cpu(journal->j_superblock->s_nr_users) != 1) {
5959b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "External journal has more than one "
5960b31e1552SEric Sandeen "user (unsupported) - %d",
5961ac27a0ecSDave Kleikamp be32_to_cpu(journal->j_superblock->s_nr_users));
5962ee5c8071SZhang Yi errno = -EINVAL;
5963ac27a0ecSDave Kleikamp goto out_journal;
5964ac27a0ecSDave Kleikamp }
5965bc74e6a3SZhang Yi journal->j_private = sb;
5966bc74e6a3SZhang Yi EXT4_SB(sb)->s_journal_bdev = journal_bdev;
5967617ba13bSMingming Cao ext4_init_journal_params(sb, journal);
5968ac27a0ecSDave Kleikamp return journal;
59690b8e58a1SAndreas Dilger
5970ac27a0ecSDave Kleikamp out_journal:
5971dab291afSMingming Cao jbd2_journal_destroy(journal);
5972ac27a0ecSDave Kleikamp out_bdev:
5973bc74e6a3SZhang Yi blkdev_put(journal_bdev, sb);
5974ee5c8071SZhang Yi return ERR_PTR(errno);
5975ac27a0ecSDave Kleikamp }
5976ac27a0ecSDave Kleikamp
ext4_load_journal(struct super_block * sb,struct ext4_super_block * es,unsigned long journal_devnum)5977617ba13bSMingming Cao static int ext4_load_journal(struct super_block *sb,
5978617ba13bSMingming Cao struct ext4_super_block *es,
5979ac27a0ecSDave Kleikamp unsigned long journal_devnum)
5980ac27a0ecSDave Kleikamp {
5981ac27a0ecSDave Kleikamp journal_t *journal;
5982ac27a0ecSDave Kleikamp unsigned int journal_inum = le32_to_cpu(es->s_journal_inum);
5983ac27a0ecSDave Kleikamp dev_t journal_dev;
5984ac27a0ecSDave Kleikamp int err = 0;
5985ac27a0ecSDave Kleikamp int really_read_only;
5986273108faSLukas Czerner int journal_dev_ro;
5987ac27a0ecSDave Kleikamp
598811215630SJan Kara if (WARN_ON_ONCE(!ext4_has_feature_journal(sb)))
598911215630SJan Kara return -EFSCORRUPTED;
59900390131bSFrank Mayhar
5991ac27a0ecSDave Kleikamp if (journal_devnum &&
5992ac27a0ecSDave Kleikamp journal_devnum != le32_to_cpu(es->s_journal_dev)) {
5993b31e1552SEric Sandeen ext4_msg(sb, KERN_INFO, "external journal device major/minor "
5994b31e1552SEric Sandeen "numbers have changed");
5995ac27a0ecSDave Kleikamp journal_dev = new_decode_dev(journal_devnum);
5996ac27a0ecSDave Kleikamp } else
5997ac27a0ecSDave Kleikamp journal_dev = new_decode_dev(le32_to_cpu(es->s_journal_dev));
5998ac27a0ecSDave Kleikamp
5999273108faSLukas Czerner if (journal_inum && journal_dev) {
6000273108faSLukas Czerner ext4_msg(sb, KERN_ERR,
6001273108faSLukas Czerner "filesystem has both journal inode and journal device!");
6002273108faSLukas Czerner return -EINVAL;
6003273108faSLukas Czerner }
6004273108faSLukas Czerner
6005273108faSLukas Czerner if (journal_inum) {
6006ee5c8071SZhang Yi journal = ext4_open_inode_journal(sb, journal_inum);
6007ee5c8071SZhang Yi if (IS_ERR(journal))
6008ee5c8071SZhang Yi return PTR_ERR(journal);
6009273108faSLukas Czerner } else {
6010ee5c8071SZhang Yi journal = ext4_open_dev_journal(sb, journal_dev);
6011ee5c8071SZhang Yi if (IS_ERR(journal))
6012ee5c8071SZhang Yi return PTR_ERR(journal);
6013273108faSLukas Czerner }
6014273108faSLukas Czerner
6015273108faSLukas Czerner journal_dev_ro = bdev_read_only(journal->j_dev);
6016273108faSLukas Czerner really_read_only = bdev_read_only(sb->s_bdev) | journal_dev_ro;
6017273108faSLukas Czerner
6018273108faSLukas Czerner if (journal_dev_ro && !sb_rdonly(sb)) {
6019273108faSLukas Czerner ext4_msg(sb, KERN_ERR,
6020273108faSLukas Czerner "journal device read-only, try mounting with '-o ro'");
6021273108faSLukas Czerner err = -EROFS;
6022273108faSLukas Czerner goto err_out;
6023273108faSLukas Czerner }
6024ac27a0ecSDave Kleikamp
6025ac27a0ecSDave Kleikamp /*
6026ac27a0ecSDave Kleikamp * Are we loading a blank journal or performing recovery after a
6027ac27a0ecSDave Kleikamp * crash? For recovery, we need to check in advance whether we
6028ac27a0ecSDave Kleikamp * can get read-write access to the device.
6029ac27a0ecSDave Kleikamp */
6030e2b911c5SDarrick J. Wong if (ext4_has_feature_journal_needs_recovery(sb)) {
6031bc98a42cSDavid Howells if (sb_rdonly(sb)) {
6032b31e1552SEric Sandeen ext4_msg(sb, KERN_INFO, "INFO: recovery "
6033b31e1552SEric Sandeen "required on readonly filesystem");
6034ac27a0ecSDave Kleikamp if (really_read_only) {
6035b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "write access "
6036d98bf8cdSSimon Ruderich "unavailable, cannot proceed "
6037d98bf8cdSSimon Ruderich "(try mounting with noload)");
6038273108faSLukas Czerner err = -EROFS;
6039273108faSLukas Czerner goto err_out;
6040ac27a0ecSDave Kleikamp }
6041b31e1552SEric Sandeen ext4_msg(sb, KERN_INFO, "write access will "
6042b31e1552SEric Sandeen "be enabled during recovery");
6043ac27a0ecSDave Kleikamp }
6044ac27a0ecSDave Kleikamp }
6045ac27a0ecSDave Kleikamp
604690576c0bSTheodore Ts'o if (!(journal->j_flags & JBD2_BARRIER))
6047b31e1552SEric Sandeen ext4_msg(sb, KERN_INFO, "barriers disabled");
60484776004fSTheodore Ts'o
6049e2b911c5SDarrick J. Wong if (!ext4_has_feature_journal_needs_recovery(sb))
6050dab291afSMingming Cao err = jbd2_journal_wipe(journal, !really_read_only);
60511c13d5c0STheodore Ts'o if (!err) {
60521c13d5c0STheodore Ts'o char *save = kmalloc(EXT4_S_ERR_LEN, GFP_KERNEL);
60532ef6c32aSTheodore Ts'o __le16 orig_state;
60542ef6c32aSTheodore Ts'o bool changed = false;
6055eee00237SYe Bin
60561c13d5c0STheodore Ts'o if (save)
60571c13d5c0STheodore Ts'o memcpy(save, ((char *) es) +
60581c13d5c0STheodore Ts'o EXT4_S_ERR_START, EXT4_S_ERR_LEN);
6059dab291afSMingming Cao err = jbd2_journal_load(journal);
60602ef6c32aSTheodore Ts'o if (save && memcmp(((char *) es) + EXT4_S_ERR_START,
60612ef6c32aSTheodore Ts'o save, EXT4_S_ERR_LEN)) {
60621c13d5c0STheodore Ts'o memcpy(((char *) es) + EXT4_S_ERR_START,
60631c13d5c0STheodore Ts'o save, EXT4_S_ERR_LEN);
60642ef6c32aSTheodore Ts'o changed = true;
60652ef6c32aSTheodore Ts'o }
60661c13d5c0STheodore Ts'o kfree(save);
60672ef6c32aSTheodore Ts'o orig_state = es->s_state;
6068eee00237SYe Bin es->s_state |= cpu_to_le16(EXT4_SB(sb)->s_mount_state &
6069eee00237SYe Bin EXT4_ERROR_FS);
60702ef6c32aSTheodore Ts'o if (orig_state != es->s_state)
60712ef6c32aSTheodore Ts'o changed = true;
6072eee00237SYe Bin /* Write out restored error information to the superblock */
60732ef6c32aSTheodore Ts'o if (changed && !really_read_only) {
6074eee00237SYe Bin int err2;
6075eee00237SYe Bin err2 = ext4_commit_super(sb);
6076eee00237SYe Bin err = err ? : err2;
6077eee00237SYe Bin }
60781c13d5c0STheodore Ts'o }
6079ac27a0ecSDave Kleikamp
6080ac27a0ecSDave Kleikamp if (err) {
6081b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "error loading journal");
6082273108faSLukas Czerner goto err_out;
6083ac27a0ecSDave Kleikamp }
6084ac27a0ecSDave Kleikamp
6085617ba13bSMingming Cao EXT4_SB(sb)->s_journal = journal;
608611215630SJan Kara err = ext4_clear_journal_err(sb, es);
608711215630SJan Kara if (err) {
608811215630SJan Kara EXT4_SB(sb)->s_journal = NULL;
608911215630SJan Kara jbd2_journal_destroy(journal);
609011215630SJan Kara return err;
609111215630SJan Kara }
6092ac27a0ecSDave Kleikamp
6093c41303ceSMaciej Żenczykowski if (!really_read_only && journal_devnum &&
6094ac27a0ecSDave Kleikamp journal_devnum != le32_to_cpu(es->s_journal_dev)) {
6095ac27a0ecSDave Kleikamp es->s_journal_dev = cpu_to_le32(journal_devnum);
60963039d8b8SBaokun Li ext4_commit_super(sb);
60973039d8b8SBaokun Li }
60983039d8b8SBaokun Li if (!really_read_only && journal_inum &&
60993039d8b8SBaokun Li journal_inum != le32_to_cpu(es->s_journal_inum)) {
61003039d8b8SBaokun Li es->s_journal_inum = cpu_to_le32(journal_inum);
61014392fbc4SJan Kara ext4_commit_super(sb);
6102ac27a0ecSDave Kleikamp }
6103ac27a0ecSDave Kleikamp
6104ac27a0ecSDave Kleikamp return 0;
6105273108faSLukas Czerner
6106273108faSLukas Czerner err_out:
6107273108faSLukas Czerner jbd2_journal_destroy(journal);
6108273108faSLukas Czerner return err;
6109ac27a0ecSDave Kleikamp }
6110ac27a0ecSDave Kleikamp
61112d01ddc8SJan Kara /* Copy state of EXT4_SB(sb) into buffer for on-disk superblock */
ext4_update_super(struct super_block * sb)61122d01ddc8SJan Kara static void ext4_update_super(struct super_block *sb)
6113ac27a0ecSDave Kleikamp {
6114c92dc856SJan Kara struct ext4_sb_info *sbi = EXT4_SB(sb);
6115e92ad03fSJan Kara struct ext4_super_block *es = sbi->s_es;
6116e92ad03fSJan Kara struct buffer_head *sbh = sbi->s_sbh;
6117ac27a0ecSDave Kleikamp
611805c2c00fSJan Kara lock_buffer(sbh);
6119a17712c8SJon Derrick /*
612071290b36STheodore Ts'o * If the file system is mounted read-only, don't update the
612171290b36STheodore Ts'o * superblock write time. This avoids updating the superblock
612271290b36STheodore Ts'o * write time when we are mounting the root file system
612371290b36STheodore Ts'o * read/only but we need to replay the journal; at that point,
612471290b36STheodore Ts'o * for people who are east of GMT and who make their clock
612571290b36STheodore Ts'o * tick in localtime for Windows bug-for-bug compatibility,
612671290b36STheodore Ts'o * the clock is set in the future, and this will cause e2fsck
612771290b36STheodore Ts'o * to complain and force a full file system check.
612871290b36STheodore Ts'o */
6129d5d020b3SJan Kara if (!sb_rdonly(sb))
61306a0678a7SArnd Bergmann ext4_update_tstamp(es, s_wtime);
6131afc32f7eSTheodore Ts'o es->s_kbytes_written =
6132e92ad03fSJan Kara cpu_to_le64(sbi->s_kbytes_written +
61338446fe92SChristoph Hellwig ((part_stat_read(sb->s_bdev, sectors[STAT_WRITE]) -
6134e92ad03fSJan Kara sbi->s_sectors_written_start) >> 1));
6135e92ad03fSJan Kara if (percpu_counter_initialized(&sbi->s_freeclusters_counter))
613657042651STheodore Ts'o ext4_free_blocks_count_set(es,
6137e92ad03fSJan Kara EXT4_C2B(sbi, percpu_counter_sum_positive(
6138e92ad03fSJan Kara &sbi->s_freeclusters_counter)));
6139e92ad03fSJan Kara if (percpu_counter_initialized(&sbi->s_freeinodes_counter))
61407f93cff9STheodore Ts'o es->s_free_inodes_count =
61417f93cff9STheodore Ts'o cpu_to_le32(percpu_counter_sum_positive(
6142e92ad03fSJan Kara &sbi->s_freeinodes_counter));
6143c92dc856SJan Kara /* Copy error information to the on-disk superblock */
6144c92dc856SJan Kara spin_lock(&sbi->s_error_lock);
6145c92dc856SJan Kara if (sbi->s_add_error_count > 0) {
6146c92dc856SJan Kara es->s_state |= cpu_to_le16(EXT4_ERROR_FS);
6147c92dc856SJan Kara if (!es->s_first_error_time && !es->s_first_error_time_hi) {
6148c92dc856SJan Kara __ext4_update_tstamp(&es->s_first_error_time,
6149c92dc856SJan Kara &es->s_first_error_time_hi,
6150c92dc856SJan Kara sbi->s_first_error_time);
6151c92dc856SJan Kara strncpy(es->s_first_error_func, sbi->s_first_error_func,
6152c92dc856SJan Kara sizeof(es->s_first_error_func));
6153c92dc856SJan Kara es->s_first_error_line =
6154c92dc856SJan Kara cpu_to_le32(sbi->s_first_error_line);
6155c92dc856SJan Kara es->s_first_error_ino =
6156c92dc856SJan Kara cpu_to_le32(sbi->s_first_error_ino);
6157c92dc856SJan Kara es->s_first_error_block =
6158c92dc856SJan Kara cpu_to_le64(sbi->s_first_error_block);
6159c92dc856SJan Kara es->s_first_error_errcode =
6160c92dc856SJan Kara ext4_errno_to_code(sbi->s_first_error_code);
6161c92dc856SJan Kara }
6162c92dc856SJan Kara __ext4_update_tstamp(&es->s_last_error_time,
6163c92dc856SJan Kara &es->s_last_error_time_hi,
6164c92dc856SJan Kara sbi->s_last_error_time);
6165c92dc856SJan Kara strncpy(es->s_last_error_func, sbi->s_last_error_func,
6166c92dc856SJan Kara sizeof(es->s_last_error_func));
6167c92dc856SJan Kara es->s_last_error_line = cpu_to_le32(sbi->s_last_error_line);
6168c92dc856SJan Kara es->s_last_error_ino = cpu_to_le32(sbi->s_last_error_ino);
6169c92dc856SJan Kara es->s_last_error_block = cpu_to_le64(sbi->s_last_error_block);
6170c92dc856SJan Kara es->s_last_error_errcode =
6171c92dc856SJan Kara ext4_errno_to_code(sbi->s_last_error_code);
6172c92dc856SJan Kara /*
6173c92dc856SJan Kara * Start the daily error reporting function if it hasn't been
6174c92dc856SJan Kara * started already
6175c92dc856SJan Kara */
6176c92dc856SJan Kara if (!es->s_error_count)
6177c92dc856SJan Kara mod_timer(&sbi->s_err_report, jiffies + 24*60*60*HZ);
6178c92dc856SJan Kara le32_add_cpu(&es->s_error_count, sbi->s_add_error_count);
6179c92dc856SJan Kara sbi->s_add_error_count = 0;
6180c92dc856SJan Kara }
6181c92dc856SJan Kara spin_unlock(&sbi->s_error_lock);
6182c92dc856SJan Kara
618306db49e6STheodore Ts'o ext4_superblock_csum_set(sb);
61842d01ddc8SJan Kara unlock_buffer(sbh);
61852d01ddc8SJan Kara }
61862d01ddc8SJan Kara
ext4_commit_super(struct super_block * sb)61872d01ddc8SJan Kara static int ext4_commit_super(struct super_block *sb)
61882d01ddc8SJan Kara {
61892d01ddc8SJan Kara struct buffer_head *sbh = EXT4_SB(sb)->s_sbh;
61902d01ddc8SJan Kara
6191f88f1466SFengnan Chang if (!sbh)
6192f88f1466SFengnan Chang return -EINVAL;
6193f88f1466SFengnan Chang if (block_device_ejected(sb))
6194f88f1466SFengnan Chang return -ENODEV;
61952d01ddc8SJan Kara
61962d01ddc8SJan Kara ext4_update_super(sb);
61972d01ddc8SJan Kara
619815baa7dcSZhang Yi lock_buffer(sbh);
619915baa7dcSZhang Yi /* Buffer got discarded which means block device got invalidated */
620015baa7dcSZhang Yi if (!buffer_mapped(sbh)) {
620115baa7dcSZhang Yi unlock_buffer(sbh);
620215baa7dcSZhang Yi return -EIO;
620315baa7dcSZhang Yi }
620415baa7dcSZhang Yi
6205e8680786STheodore Ts'o if (buffer_write_io_error(sbh) || !buffer_uptodate(sbh)) {
62064743f839SPranay Kr. Srivastava /*
62074743f839SPranay Kr. Srivastava * Oh, dear. A previous attempt to write the
62084743f839SPranay Kr. Srivastava * superblock failed. This could happen because the
62094743f839SPranay Kr. Srivastava * USB device was yanked out. Or it could happen to
62104743f839SPranay Kr. Srivastava * be a transient write error and maybe the block will
62114743f839SPranay Kr. Srivastava * be remapped. Nothing we can do but to retry the
62124743f839SPranay Kr. Srivastava * write and hope for the best.
62134743f839SPranay Kr. Srivastava */
62144743f839SPranay Kr. Srivastava ext4_msg(sb, KERN_ERR, "previous I/O error to "
62154743f839SPranay Kr. Srivastava "superblock detected");
62164743f839SPranay Kr. Srivastava clear_buffer_write_io_error(sbh);
62174743f839SPranay Kr. Srivastava set_buffer_uptodate(sbh);
62184743f839SPranay Kr. Srivastava }
621915baa7dcSZhang Yi get_bh(sbh);
622015baa7dcSZhang Yi /* Clear potential dirty bit if it was journalled update */
622115baa7dcSZhang Yi clear_buffer_dirty(sbh);
622215baa7dcSZhang Yi sbh->b_end_io = end_buffer_write_sync;
62231420c4a5SBart Van Assche submit_bh(REQ_OP_WRITE | REQ_SYNC |
62241420c4a5SBart Van Assche (test_opt(sb, BARRIER) ? REQ_FUA : 0), sbh);
622515baa7dcSZhang Yi wait_on_buffer(sbh);
6226c89128a0SJaegeuk Kim if (buffer_write_io_error(sbh)) {
6227b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "I/O error while writing "
6228b31e1552SEric Sandeen "superblock");
6229914258bfSTheodore Ts'o clear_buffer_write_io_error(sbh);
6230914258bfSTheodore Ts'o set_buffer_uptodate(sbh);
623115baa7dcSZhang Yi return -EIO;
6232914258bfSTheodore Ts'o }
623315baa7dcSZhang Yi return 0;
6234ac27a0ecSDave Kleikamp }
6235ac27a0ecSDave Kleikamp
6236ac27a0ecSDave Kleikamp /*
6237ac27a0ecSDave Kleikamp * Have we just finished recovery? If so, and if we are mounting (or
6238ac27a0ecSDave Kleikamp * remounting) the filesystem readonly, then we will end up with a
6239ac27a0ecSDave Kleikamp * consistent fs on disk. Record that fact.
6240ac27a0ecSDave Kleikamp */
ext4_mark_recovery_complete(struct super_block * sb,struct ext4_super_block * es)624111215630SJan Kara static int ext4_mark_recovery_complete(struct super_block *sb,
6242617ba13bSMingming Cao struct ext4_super_block *es)
6243ac27a0ecSDave Kleikamp {
624411215630SJan Kara int err;
6245617ba13bSMingming Cao journal_t *journal = EXT4_SB(sb)->s_journal;
6246ac27a0ecSDave Kleikamp
6247e2b911c5SDarrick J. Wong if (!ext4_has_feature_journal(sb)) {
624811215630SJan Kara if (journal != NULL) {
624911215630SJan Kara ext4_error(sb, "Journal got removed while the fs was "
625011215630SJan Kara "mounted!");
625111215630SJan Kara return -EFSCORRUPTED;
625211215630SJan Kara }
625311215630SJan Kara return 0;
62540390131bSFrank Mayhar }
6255dab291afSMingming Cao jbd2_journal_lock_updates(journal);
625601d5d965SLeah Rumancik err = jbd2_journal_flush(journal, 0);
625711215630SJan Kara if (err < 0)
62587ffe1ea8SHidehiro Kawai goto out;
62597ffe1ea8SHidehiro Kawai
626002f310fcSJan Kara if (sb_rdonly(sb) && (ext4_has_feature_journal_needs_recovery(sb) ||
626102f310fcSJan Kara ext4_has_feature_orphan_present(sb))) {
626202f310fcSJan Kara if (!ext4_orphan_file_empty(sb)) {
626302f310fcSJan Kara ext4_error(sb, "Orphan file not empty on read-only fs.");
626402f310fcSJan Kara err = -EFSCORRUPTED;
626502f310fcSJan Kara goto out;
626602f310fcSJan Kara }
6267e2b911c5SDarrick J. Wong ext4_clear_feature_journal_needs_recovery(sb);
626802f310fcSJan Kara ext4_clear_feature_orphan_present(sb);
62694392fbc4SJan Kara ext4_commit_super(sb);
6270ac27a0ecSDave Kleikamp }
62717ffe1ea8SHidehiro Kawai out:
6272dab291afSMingming Cao jbd2_journal_unlock_updates(journal);
627311215630SJan Kara return err;
6274ac27a0ecSDave Kleikamp }
6275ac27a0ecSDave Kleikamp
6276ac27a0ecSDave Kleikamp /*
6277ac27a0ecSDave Kleikamp * If we are mounting (or read-write remounting) a filesystem whose journal
6278ac27a0ecSDave Kleikamp * has recorded an error from a previous lifetime, move that error to the
6279ac27a0ecSDave Kleikamp * main filesystem now.
6280ac27a0ecSDave Kleikamp */
ext4_clear_journal_err(struct super_block * sb,struct ext4_super_block * es)628111215630SJan Kara static int ext4_clear_journal_err(struct super_block *sb,
6282617ba13bSMingming Cao struct ext4_super_block *es)
6283ac27a0ecSDave Kleikamp {
6284ac27a0ecSDave Kleikamp journal_t *journal;
6285ac27a0ecSDave Kleikamp int j_errno;
6286ac27a0ecSDave Kleikamp const char *errstr;
6287ac27a0ecSDave Kleikamp
628811215630SJan Kara if (!ext4_has_feature_journal(sb)) {
628911215630SJan Kara ext4_error(sb, "Journal got removed while the fs was mounted!");
629011215630SJan Kara return -EFSCORRUPTED;
629111215630SJan Kara }
62920390131bSFrank Mayhar
6293617ba13bSMingming Cao journal = EXT4_SB(sb)->s_journal;
6294ac27a0ecSDave Kleikamp
6295ac27a0ecSDave Kleikamp /*
6296ac27a0ecSDave Kleikamp * Now check for any error status which may have been recorded in the
6297617ba13bSMingming Cao * journal by a prior ext4_error() or ext4_abort()
6298ac27a0ecSDave Kleikamp */
6299ac27a0ecSDave Kleikamp
6300dab291afSMingming Cao j_errno = jbd2_journal_errno(journal);
6301ac27a0ecSDave Kleikamp if (j_errno) {
6302ac27a0ecSDave Kleikamp char nbuf[16];
6303ac27a0ecSDave Kleikamp
6304617ba13bSMingming Cao errstr = ext4_decode_error(sb, j_errno, nbuf);
630512062dddSEric Sandeen ext4_warning(sb, "Filesystem error recorded "
6306ac27a0ecSDave Kleikamp "from previous mount: %s", errstr);
6307ac27a0ecSDave Kleikamp
6308617ba13bSMingming Cao EXT4_SB(sb)->s_mount_state |= EXT4_ERROR_FS;
6309617ba13bSMingming Cao es->s_state |= cpu_to_le16(EXT4_ERROR_FS);
6310f57886caSYe Bin j_errno = ext4_commit_super(sb);
6311f57886caSYe Bin if (j_errno)
6312f57886caSYe Bin return j_errno;
6313f57886caSYe Bin ext4_warning(sb, "Marked fs in need of filesystem check.");
6314ac27a0ecSDave Kleikamp
6315dab291afSMingming Cao jbd2_journal_clear_err(journal);
6316d796c52eSTheodore Ts'o jbd2_journal_update_sb_errno(journal);
6317ac27a0ecSDave Kleikamp }
631811215630SJan Kara return 0;
6319ac27a0ecSDave Kleikamp }
6320ac27a0ecSDave Kleikamp
6321ac27a0ecSDave Kleikamp /*
6322ac27a0ecSDave Kleikamp * Force the running and committing transactions to commit,
6323ac27a0ecSDave Kleikamp * and wait on the commit.
6324ac27a0ecSDave Kleikamp */
ext4_force_commit(struct super_block * sb)6325617ba13bSMingming Cao int ext4_force_commit(struct super_block *sb)
6326ac27a0ecSDave Kleikamp {
6327889860e4SJan Kara return ext4_journal_force_commit(EXT4_SB(sb)->s_journal);
6328ac27a0ecSDave Kleikamp }
6329ac27a0ecSDave Kleikamp
ext4_sync_fs(struct super_block * sb,int wait)6330617ba13bSMingming Cao static int ext4_sync_fs(struct super_block *sb, int wait)
6331ac27a0ecSDave Kleikamp {
633214ce0cb4STheodore Ts'o int ret = 0;
63339eddacf9SJan Kara tid_t target;
633406a407f1SDmitry Monakhov bool needs_barrier = false;
63358d5d02e6SMingming Cao struct ext4_sb_info *sbi = EXT4_SB(sb);
6336ac27a0ecSDave Kleikamp
6337eb8ab444SJan Kara if (unlikely(ext4_forced_shutdown(sb)))
63380db1ff22STheodore Ts'o return 0;
63390db1ff22STheodore Ts'o
63409bffad1eSTheodore Ts'o trace_ext4_sync_fs(sb, wait);
63412e8fa54eSJan Kara flush_workqueue(sbi->rsv_conversion_wq);
6342a1177825SJan Kara /*
6343a1177825SJan Kara * Writeback quota in non-journalled quota case - journalled quota has
6344a1177825SJan Kara * no dirty dquots
6345a1177825SJan Kara */
6346a1177825SJan Kara dquot_writeback_dquots(sb, -1);
634706a407f1SDmitry Monakhov /*
634806a407f1SDmitry Monakhov * Data writeback is possible w/o journal transaction, so barrier must
634906a407f1SDmitry Monakhov * being sent at the end of the function. But we can skip it if
635006a407f1SDmitry Monakhov * transaction_commit will do it for us.
635106a407f1SDmitry Monakhov */
6352bda32530STheodore Ts'o if (sbi->s_journal) {
635306a407f1SDmitry Monakhov target = jbd2_get_latest_transaction(sbi->s_journal);
635406a407f1SDmitry Monakhov if (wait && sbi->s_journal->j_flags & JBD2_BARRIER &&
635506a407f1SDmitry Monakhov !jbd2_trans_will_send_data_barrier(sbi->s_journal, target))
635606a407f1SDmitry Monakhov needs_barrier = true;
635706a407f1SDmitry Monakhov
63588d5d02e6SMingming Cao if (jbd2_journal_start_commit(sbi->s_journal, &target)) {
6359ac27a0ecSDave Kleikamp if (wait)
6360bda32530STheodore Ts'o ret = jbd2_log_wait_commit(sbi->s_journal,
6361bda32530STheodore Ts'o target);
63620390131bSFrank Mayhar }
6363bda32530STheodore Ts'o } else if (wait && test_opt(sb, BARRIER))
6364bda32530STheodore Ts'o needs_barrier = true;
636506a407f1SDmitry Monakhov if (needs_barrier) {
636606a407f1SDmitry Monakhov int err;
6367c6bf3f0eSChristoph Hellwig err = blkdev_issue_flush(sb->s_bdev);
636806a407f1SDmitry Monakhov if (!ret)
636906a407f1SDmitry Monakhov ret = err;
637006a407f1SDmitry Monakhov }
637106a407f1SDmitry Monakhov
637206a407f1SDmitry Monakhov return ret;
637306a407f1SDmitry Monakhov }
637406a407f1SDmitry Monakhov
6375ac27a0ecSDave Kleikamp /*
6376ac27a0ecSDave Kleikamp * LVM calls this function before a (read-only) snapshot is created. This
6377ac27a0ecSDave Kleikamp * gives us a chance to flush the journal completely and mark the fs clean.
6378be4f27d3SYongqiang Yang *
6379be4f27d3SYongqiang Yang * Note that only this function cannot bring a filesystem to be in a clean
63808e8ad8a5SJan Kara * state independently. It relies on upper layer to stop all data & metadata
63818e8ad8a5SJan Kara * modifications.
6382ac27a0ecSDave Kleikamp */
ext4_freeze(struct super_block * sb)6383c4be0c1dSTakashi Sato static int ext4_freeze(struct super_block *sb)
6384ac27a0ecSDave Kleikamp {
6385c4be0c1dSTakashi Sato int error = 0;
638698175720SJan Kara journal_t *journal = EXT4_SB(sb)->s_journal;
6387ac27a0ecSDave Kleikamp
6388bb044576STheodore Ts'o if (journal) {
6389ac27a0ecSDave Kleikamp /* Now we set up the journal barrier. */
6390dab291afSMingming Cao jbd2_journal_lock_updates(journal);
63917ffe1ea8SHidehiro Kawai
63927ffe1ea8SHidehiro Kawai /*
6393bb044576STheodore Ts'o * Don't clear the needs_recovery flag if we failed to
6394bb044576STheodore Ts'o * flush the journal.
63957ffe1ea8SHidehiro Kawai */
639601d5d965SLeah Rumancik error = jbd2_journal_flush(journal, 0);
63976b0310fbSEric Sandeen if (error < 0)
63986b0310fbSEric Sandeen goto out;
6399ac27a0ecSDave Kleikamp
6400ac27a0ecSDave Kleikamp /* Journal blocked and flushed, clear needs_recovery flag. */
6401e2b911c5SDarrick J. Wong ext4_clear_feature_journal_needs_recovery(sb);
640202f310fcSJan Kara if (ext4_orphan_file_empty(sb))
640302f310fcSJan Kara ext4_clear_feature_orphan_present(sb);
6404c642dc9eSEric Sandeen }
6405c642dc9eSEric Sandeen
64064392fbc4SJan Kara error = ext4_commit_super(sb);
64076b0310fbSEric Sandeen out:
6408bb044576STheodore Ts'o if (journal)
64098e8ad8a5SJan Kara /* we rely on upper layer to stop further updates */
6410bb044576STheodore Ts'o jbd2_journal_unlock_updates(journal);
64116b0310fbSEric Sandeen return error;
6412ac27a0ecSDave Kleikamp }
6413ac27a0ecSDave Kleikamp
6414ac27a0ecSDave Kleikamp /*
6415ac27a0ecSDave Kleikamp * Called by LVM after the snapshot is done. We need to reset the RECOVER
6416ac27a0ecSDave Kleikamp * flag here, even though the filesystem is not technically dirty yet.
6417ac27a0ecSDave Kleikamp */
ext4_unfreeze(struct super_block * sb)6418c4be0c1dSTakashi Sato static int ext4_unfreeze(struct super_block *sb)
6419ac27a0ecSDave Kleikamp {
6420eb8ab444SJan Kara if (ext4_forced_shutdown(sb))
64219ca92389STheodore Ts'o return 0;
64229ca92389STheodore Ts'o
6423c642dc9eSEric Sandeen if (EXT4_SB(sb)->s_journal) {
64249ca92389STheodore Ts'o /* Reset the needs_recovery flag before the fs is unlocked. */
6425e2b911c5SDarrick J. Wong ext4_set_feature_journal_needs_recovery(sb);
642602f310fcSJan Kara if (ext4_has_feature_orphan_file(sb))
642702f310fcSJan Kara ext4_set_feature_orphan_present(sb);
6428c642dc9eSEric Sandeen }
6429c642dc9eSEric Sandeen
64304392fbc4SJan Kara ext4_commit_super(sb);
6431c4be0c1dSTakashi Sato return 0;
6432ac27a0ecSDave Kleikamp }
6433ac27a0ecSDave Kleikamp
6434673c6100STheodore Ts'o /*
6435673c6100STheodore Ts'o * Structure to save mount options for ext4_remount's benefit
6436673c6100STheodore Ts'o */
6437673c6100STheodore Ts'o struct ext4_mount_options {
6438673c6100STheodore Ts'o unsigned long s_mount_opt;
6439a2595b8aSTheodore Ts'o unsigned long s_mount_opt2;
644008cefc7aSEric W. Biederman kuid_t s_resuid;
644108cefc7aSEric W. Biederman kgid_t s_resgid;
6442673c6100STheodore Ts'o unsigned long s_commit_interval;
6443673c6100STheodore Ts'o u32 s_min_batch_time, s_max_batch_time;
6444673c6100STheodore Ts'o #ifdef CONFIG_QUOTA
6445673c6100STheodore Ts'o int s_jquota_fmt;
6446a2d4a646SJan Kara char *s_qf_names[EXT4_MAXQUOTAS];
6447673c6100STheodore Ts'o #endif
6448673c6100STheodore Ts'o };
6449673c6100STheodore Ts'o
/*
 * __ext4_remount() - apply a reconfigure (remount) request to a mounted fs.
 * @fc: filesystem context; fc->fs_private holds the parsed ext4 options and
 *      fc->sb_flags the requested superblock flags.
 * @sb: superblock being reconfigured.
 *
 * The current option state is saved first, the new options are applied, and
 * then option combinations and any ro <-> rw transition are processed.  Every
 * failure after the options have been applied jumps to restore_opts, which
 * writes the saved fields back.
 *
 * Return: 0 on success, a negative errno on failure.
 */
static int __ext4_remount(struct fs_context *fc, struct super_block *sb)
{
	struct ext4_fs_context *ctx = fc->fs_private;
	struct ext4_super_block *es;
	struct ext4_sb_info *sbi = EXT4_SB(sb);
	unsigned long old_sb_flags;
	struct ext4_mount_options old_opts;
	ext4_group_t g;
	int err = 0;
	int alloc_ctx;
#ifdef CONFIG_QUOTA
	int enable_quota = 0;
	int i, j;
	char *to_free[EXT4_MAXQUOTAS];
#endif


	/* Store the original options */
	old_sb_flags = sb->s_flags;
	old_opts.s_mount_opt = sbi->s_mount_opt;
	old_opts.s_mount_opt2 = sbi->s_mount_opt2;
	old_opts.s_resuid = sbi->s_resuid;
	old_opts.s_resgid = sbi->s_resgid;
	old_opts.s_commit_interval = sbi->s_commit_interval;
	old_opts.s_min_batch_time = sbi->s_min_batch_time;
	old_opts.s_max_batch_time = sbi->s_max_batch_time;
#ifdef CONFIG_QUOTA
	old_opts.s_jquota_fmt = sbi->s_jquota_fmt;
	/*
	 * Keep private copies of the quota file names.  If a copy cannot be
	 * allocated, free the ones made so far and fail before any option has
	 * been changed.
	 */
	for (i = 0; i < EXT4_MAXQUOTAS; i++)
		if (sbi->s_qf_names[i]) {
			char *qf_name = get_qf_name(sb, sbi, i);

			old_opts.s_qf_names[i] = kstrdup(qf_name, GFP_KERNEL);
			if (!old_opts.s_qf_names[i]) {
				for (j = 0; j < i; j++)
					kfree(old_opts.s_qf_names[j]);
				return -ENOMEM;
			}
		} else
			old_opts.s_qf_names[i] = NULL;
#endif
	/*
	 * No journal I/O priority in the request: take the journal task's
	 * current one if it has an io_context, otherwise the default, so that
	 * the set_task_ioprio() call below has a value to apply.
	 */
	if (!(ctx->spec & EXT4_SPEC_JOURNAL_IOPRIO)) {
		if (sbi->s_journal && sbi->s_journal->j_task->io_context)
			ctx->journal_ioprio =
				sbi->s_journal->j_task->io_context->ioprio;
		else
			ctx->journal_ioprio = DEFAULT_JOURNAL_IOPRIO;

	}

	/* An incompatible stripe value is warned about and replaced by 0. */
	if ((ctx->spec & EXT4_SPEC_s_stripe) &&
	    ext4_is_stripe_incompatible(sb, ctx->s_stripe)) {
		ext4_msg(sb, KERN_WARNING,
			 "stripe (%lu) is not aligned with cluster size (%u), "
			 "stripe is disabled",
			 ctx->s_stripe, sbi->s_cluster_ratio);
		ctx->s_stripe = 0;
	}

	/*
	 * Changing the DIOREAD_NOLOCK or DELALLOC mount options may cause
	 * two calls to ext4_should_dioread_nolock() to return inconsistent
	 * values, triggering WARN_ON in ext4_add_complete_io(). We grab
	 * s_writepages_rwsem here to avoid a race between writepages ops and
	 * remount.
	 */
	alloc_ctx = ext4_writepages_down_write(sb);
	ext4_apply_options(fc, sb);
	ext4_writepages_up_write(sb, alloc_ctx);

	/*
	 * journal_checksum may not change on remount: if the bit differs from
	 * the saved value, complain and flip it back.
	 */
	if ((old_opts.s_mount_opt & EXT4_MOUNT_JOURNAL_CHECKSUM) ^
	    test_opt(sb, JOURNAL_CHECKSUM)) {
		ext4_msg(sb, KERN_ERR, "changing journal_checksum "
			 "during remount not supported; ignoring");
		sbi->s_mount_opt ^= EXT4_MOUNT_JOURNAL_CHECKSUM;
	}

	/* Reject option combinations that conflict with the data mode. */
	if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_JOURNAL_DATA) {
		if (test_opt2(sb, EXPLICIT_DELALLOC)) {
			ext4_msg(sb, KERN_ERR, "can't mount with "
				 "both data=journal and delalloc");
			err = -EINVAL;
			goto restore_opts;
		}
		if (test_opt(sb, DIOREAD_NOLOCK)) {
			ext4_msg(sb, KERN_ERR, "can't mount with "
				 "both data=journal and dioread_nolock");
			err = -EINVAL;
			goto restore_opts;
		}
	} else if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_ORDERED_DATA) {
		if (test_opt(sb, JOURNAL_ASYNC_COMMIT)) {
			ext4_msg(sb, KERN_ERR, "can't mount with "
				 "journal_async_commit in data=ordered mode");
			err = -EINVAL;
			goto restore_opts;
		}
	}

	/* Any change of the NO_MBCACHE bit relative to the saved options fails. */
	if ((sbi->s_mount_opt ^ old_opts.s_mount_opt) & EXT4_MOUNT_NO_MBCACHE) {
		ext4_msg(sb, KERN_ERR, "can't enable nombcache during remount");
		err = -EINVAL;
		goto restore_opts;
	}

	/* Make SB_POSIXACL follow the (possibly updated) POSIX_ACL option. */
	sb->s_flags = (sb->s_flags & ~SB_POSIXACL) |
		(test_opt(sb, POSIX_ACL) ? SB_POSIXACL : 0);

	es = sbi->s_es;

	if (sbi->s_journal) {
		ext4_init_journal_params(sb, sbi->s_journal);
		set_task_ioprio(sbi->s_journal->j_task, ctx->journal_ioprio);
	}

	/* Flush outstanding errors before changing fs state */
	flush_work(&sbi->s_sb_upd_work);

	/* The requested read-only state differs from the current one. */
	if ((bool)(fc->sb_flags & SB_RDONLY) != sb_rdonly(sb)) {
		if (ext4_forced_shutdown(sb)) {
			err = -EROFS;
			goto restore_opts;
		}

		if (fc->sb_flags & SB_RDONLY) {
			/* rw -> ro: sync data and suspend quotas first. */
			err = sync_filesystem(sb);
			if (err < 0)
				goto restore_opts;
			err = dquot_suspend(sb, -1);
			if (err < 0)
				goto restore_opts;

			/*
			 * First of all, the unconditional stuff we have to do
			 * to disable replay of the journal when we next remount
			 */
			sb->s_flags |= SB_RDONLY;

			/*
			 * OK, test if we are remounting a valid rw partition
			 * readonly, and if so set the rdonly flag and then
			 * mark the partition as valid again.
			 */
			if (!(es->s_state & cpu_to_le16(EXT4_VALID_FS)) &&
			    (sbi->s_mount_state & EXT4_VALID_FS))
				es->s_state = cpu_to_le16(sbi->s_mount_state);

			if (sbi->s_journal) {
				/*
				 * We let remount-ro finish even if marking fs
				 * as clean failed...
				 */
				ext4_mark_recovery_complete(sb, es);
			}
		} else {
			/* Make sure we can mount this feature set readwrite */
			if (ext4_has_feature_readonly(sb) ||
			    !ext4_feature_set_ok(sb, 0)) {
				err = -EROFS;
				goto restore_opts;
			}
			/*
			 * Make sure the group descriptor checksums
			 * are sane.  If they aren't, refuse to remount r/w.
			 */
			for (g = 0; g < sbi->s_groups_count; g++) {
				struct ext4_group_desc *gdp =
					ext4_get_group_desc(sb, g, NULL);

				if (!ext4_group_desc_csum_verify(sb, g, gdp)) {
					ext4_msg(sb, KERN_ERR,
	       "ext4_remount: Checksum for group %u failed (%u!=%u)",
		g, le16_to_cpu(ext4_group_desc_csum(sb, g, gdp)),
					       le16_to_cpu(gdp->bg_checksum));
					err = -EFSBADCRC;
					goto restore_opts;
				}
			}

			/*
			 * If we have an unprocessed orphan list hanging
			 * around from a previously readonly bdev mount,
			 * require a full umount/remount for now.
			 */
			if (es->s_last_orphan || !ext4_orphan_file_empty(sb)) {
				ext4_msg(sb, KERN_WARNING, "Couldn't "
				       "remount RDWR because of unprocessed "
				       "orphan inode list.  Please "
				       "umount/remount instead");
				err = -EINVAL;
				goto restore_opts;
			}

			/*
			 * Mounting a RDONLY partition read-write, so reread
			 * and store the current valid flag.  (It may have
			 * been changed by e2fsck since we originally mounted
			 * the partition.)
			 */
			if (sbi->s_journal) {
				err = ext4_clear_journal_err(sb, es);
				if (err)
					goto restore_opts;
			}
			sbi->s_mount_state = (le16_to_cpu(es->s_state) &
					      ~EXT4_FC_REPLAY);

			err = ext4_setup_super(sb, es, 0);
			if (err)
				goto restore_opts;

			sb->s_flags &= ~SB_RDONLY;
			if (ext4_has_feature_mmp(sb)) {
				err = ext4_multi_mount_protect(sb,
						le64_to_cpu(es->s_mmp_block));
				if (err)
					goto restore_opts;
			}
#ifdef CONFIG_QUOTA
			/* Quotas are (re-)enabled further down. */
			enable_quota = 1;
#endif
		}
	}

	/*
	 * Handle creation of system zone data early because it can fail.
	 * Releasing of existing data is done when we are sure remount will
	 * succeed.
	 */
	if (test_opt(sb, BLOCK_VALIDITY) && !sbi->s_system_blks) {
		err = ext4_setup_system_zone(sb);
		if (err)
			goto restore_opts;
	}

	/* Without a journal, write the superblock if the fs was mounted rw. */
	if (sbi->s_journal == NULL && !(old_sb_flags & SB_RDONLY)) {
		err = ext4_commit_super(sb);
		if (err)
			goto restore_opts;
	}

#ifdef CONFIG_QUOTA
	if (enable_quota) {
		if (sb_any_quota_suspended(sb))
			dquot_resume(sb, -1);
		else if (ext4_has_feature_quota(sb)) {
			err = ext4_enable_quotas(sb);
			if (err)
				goto restore_opts;
		}
	}
	/* Release old quota file names */
	for (i = 0; i < EXT4_MAXQUOTAS; i++)
		kfree(old_opts.s_qf_names[i]);
#endif
	if (!test_opt(sb, BLOCK_VALIDITY) && sbi->s_system_blks)
		ext4_release_system_zone(sb);

	/*
	 * Reinitialize lazy itable initialization thread based on
	 * current settings
	 */
	if (sb_rdonly(sb) || !test_opt(sb, INIT_INODE_TABLE))
		ext4_unregister_li_request(sb);
	else {
		ext4_group_t first_not_zeroed;
		first_not_zeroed = ext4_has_uninit_itable(sb);
		ext4_register_li_request(sb, first_not_zeroed);
	}

	if (!ext4_has_feature_mmp(sb) || sb_rdonly(sb))
		ext4_stop_mmpd(sbi);

	/*
	 * Handle aborting the filesystem as the last thing during remount to
	 * avoid obscure errors during remount when some option changes fail to
	 * apply due to shutdown filesystem.
	 */
	if (test_opt2(sb, ABORT))
		ext4_abort(sb, ESHUTDOWN, "Abort forced by user");

	return 0;

restore_opts:
	/*
	 * If there was a failing r/w to ro transition, we may need to
	 * re-enable quota
	 */
	if (sb_rdonly(sb) && !(old_sb_flags & SB_RDONLY) &&
	    sb_any_quota_suspended(sb))
		dquot_resume(sb, -1);

	/* Write the saved fields back under the same lock used to apply them. */
	alloc_ctx = ext4_writepages_down_write(sb);
	sb->s_flags = old_sb_flags;
	sbi->s_mount_opt = old_opts.s_mount_opt;
	sbi->s_mount_opt2 = old_opts.s_mount_opt2;
	sbi->s_resuid = old_opts.s_resuid;
	sbi->s_resgid = old_opts.s_resgid;
	sbi->s_commit_interval = old_opts.s_commit_interval;
	sbi->s_min_batch_time = old_opts.s_min_batch_time;
	sbi->s_max_batch_time = old_opts.s_max_batch_time;
	ext4_writepages_up_write(sb, alloc_ctx);

	if (!test_opt(sb, BLOCK_VALIDITY) && sbi->s_system_blks)
		ext4_release_system_zone(sb);
#ifdef CONFIG_QUOTA
	sbi->s_jquota_fmt = old_opts.s_jquota_fmt;
	/*
	 * Swap the saved quota file names back in; the names being replaced
	 * are only freed after synchronize_rcu().
	 */
	for (i = 0; i < EXT4_MAXQUOTAS; i++) {
		to_free[i] = get_qf_name(sb, sbi, i);
		rcu_assign_pointer(sbi->s_qf_names[i], old_opts.s_qf_names[i]);
	}
	synchronize_rcu();
	for (i = 0; i < EXT4_MAXQUOTAS; i++)
		kfree(to_free[i]);
#endif
	if (!ext4_has_feature_mmp(sb) || sb_rdonly(sb))
		ext4_stop_mmpd(sbi);
	return err;
}
6769ac27a0ecSDave Kleikamp
ext4_reconfigure(struct fs_context * fc)6770cebe85d5SLukas Czerner static int ext4_reconfigure(struct fs_context *fc)
67717edfd85bSLukas Czerner {
6772cebe85d5SLukas Czerner struct super_block *sb = fc->root->d_sb;
67737edfd85bSLukas Czerner int ret;
67747edfd85bSLukas Czerner
6775cebe85d5SLukas Czerner fc->s_fs_info = EXT4_SB(sb);
67767edfd85bSLukas Czerner
6777cebe85d5SLukas Czerner ret = ext4_check_opt_consistency(fc, sb);
67787edfd85bSLukas Czerner if (ret < 0)
67797edfd85bSLukas Czerner return ret;
6780cebe85d5SLukas Czerner
6781960e0ab6SLukas Czerner ret = __ext4_remount(fc, sb);
6782cebe85d5SLukas Czerner if (ret < 0)
6783cebe85d5SLukas Czerner return ret;
6784cebe85d5SLukas Czerner
67856dcc98fbSTheodore Ts'o ext4_msg(sb, KERN_INFO, "re-mounted %pU %s. Quota mode: %s.",
67866dcc98fbSTheodore Ts'o &sb->s_uuid, sb_rdonly(sb) ? "ro" : "r/w",
67876dcc98fbSTheodore Ts'o ext4_quota_mode(sb));
6788cebe85d5SLukas Czerner
6789cebe85d5SLukas Czerner return 0;
67907edfd85bSLukas Czerner }
67917edfd85bSLukas Czerner
6792689c958cSLi Xi #ifdef CONFIG_QUOTA
/*
 * ext4_statfs_project() - narrow statfs results to a project quota.
 * @sb:     superblock the quota lives on.
 * @projid: project id whose limits are applied.
 * @buf:    statfs result, already filled with filesystem-wide values.
 *
 * For blocks and for inodes, the effective limit is the smaller non-zero
 * value of the soft and hard limits.  When a limit is set, the totals and
 * free counts in @buf are clamped to what the quota still allows.  They are
 * only ever lowered, so the result never claims more free space or inodes
 * than the filesystem-wide values passed in, and a reserved-block deduction
 * already applied to f_bavail is kept.
 *
 * Return: 0 on success, or the error from dqget() if the dquot is unavailable.
 */
static int ext4_statfs_project(struct super_block *sb,
			       kprojid_t projid, struct kstatfs *buf)
{
	struct kqid qid;
	struct dquot *dquot;
	u64 limit;
	u64 curblock;

	qid = make_kqid_projid(projid);
	dquot = dqget(sb, qid);
	if (IS_ERR(dquot))
		return PTR_ERR(dquot);
	spin_lock(&dquot->dq_dqb_lock);

	limit = min_not_zero(dquot->dq_dqb.dqb_bsoftlimit,
			     dquot->dq_dqb.dqb_bhardlimit);
	/* Convert the limit to filesystem blocks, like the usage below. */
	limit >>= sb->s_blocksize_bits;

	if (limit) {
		u64 remaining = 0;

		curblock = (dquot->dq_dqb.dqb_curspace +
			    dquot->dq_dqb.dqb_rsvspace) >> sb->s_blocksize_bits;
		if (limit > curblock)
			remaining = limit - curblock;

		/* Clamp, never raise: the fs itself may have less free. */
		buf->f_blocks = min(buf->f_blocks, limit);
		buf->f_bfree = min(buf->f_bfree, remaining);
		buf->f_bavail = min(buf->f_bavail, remaining);
	}

	limit = min_not_zero(dquot->dq_dqb.dqb_isoftlimit,
			     dquot->dq_dqb.dqb_ihardlimit);
	if (limit) {
		u64 remaining = 0;

		if (limit > dquot->dq_dqb.dqb_curinodes)
			remaining = limit - dquot->dq_dqb.dqb_curinodes;

		buf->f_files = min(buf->f_files, limit);
		buf->f_ffree = min(buf->f_ffree, remaining);
	}

	spin_unlock(&dquot->dq_dqb_lock);
	dqput(dquot);
	return 0;
}
6833689c958cSLi Xi #endif
6834689c958cSLi Xi
ext4_statfs(struct dentry * dentry,struct kstatfs * buf)6835617ba13bSMingming Cao static int ext4_statfs(struct dentry *dentry, struct kstatfs *buf)
6836ac27a0ecSDave Kleikamp {
6837ac27a0ecSDave Kleikamp struct super_block *sb = dentry->d_sb;
6838617ba13bSMingming Cao struct ext4_sb_info *sbi = EXT4_SB(sb);
6839617ba13bSMingming Cao struct ext4_super_block *es = sbi->s_es;
684027dd4385SLukas Czerner ext4_fsblk_t overhead = 0, resv_blocks;
6841d02a9391SKazuya Mio s64 bfree;
684227dd4385SLukas Czerner resv_blocks = EXT4_C2B(sbi, atomic64_read(&sbi->s_resv_clusters));
6843ac27a0ecSDave Kleikamp
6844952fc18eSTheodore Ts'o if (!test_opt(sb, MINIX_DF))
6845952fc18eSTheodore Ts'o overhead = sbi->s_overhead;
6846ac27a0ecSDave Kleikamp
6847617ba13bSMingming Cao buf->f_type = EXT4_SUPER_MAGIC;
6848ac27a0ecSDave Kleikamp buf->f_bsize = sb->s_blocksize;
6849b72f78cbSEric Sandeen buf->f_blocks = ext4_blocks_count(es) - EXT4_C2B(sbi, overhead);
685057042651STheodore Ts'o bfree = percpu_counter_sum_positive(&sbi->s_freeclusters_counter) -
685157042651STheodore Ts'o percpu_counter_sum_positive(&sbi->s_dirtyclusters_counter);
6852d02a9391SKazuya Mio /* prevent underflow in case that few free space is available */
685357042651STheodore Ts'o buf->f_bfree = EXT4_C2B(sbi, max_t(s64, bfree, 0));
685427dd4385SLukas Czerner buf->f_bavail = buf->f_bfree -
685527dd4385SLukas Czerner (ext4_r_blocks_count(es) + resv_blocks);
685627dd4385SLukas Czerner if (buf->f_bfree < (ext4_r_blocks_count(es) + resv_blocks))
6857ac27a0ecSDave Kleikamp buf->f_bavail = 0;
6858ac27a0ecSDave Kleikamp buf->f_files = le32_to_cpu(es->s_inodes_count);
685952d9f3b4SPeter Zijlstra buf->f_ffree = percpu_counter_sum_positive(&sbi->s_freeinodes_counter);
6860617ba13bSMingming Cao buf->f_namelen = EXT4_NAME_LEN;
68619591c3a3SAmir Goldstein buf->f_fsid = uuid_to_fsid(es->s_uuid);
68620b8e58a1SAndreas Dilger
6863689c958cSLi Xi #ifdef CONFIG_QUOTA
6864689c958cSLi Xi if (ext4_test_inode_flag(dentry->d_inode, EXT4_INODE_PROJINHERIT) &&
6865689c958cSLi Xi sb_has_quota_limits_enabled(sb, PRJQUOTA))
6866689c958cSLi Xi ext4_statfs_project(sb, EXT4_I(dentry->d_inode)->i_projid, buf);
6867689c958cSLi Xi #endif
6868ac27a0ecSDave Kleikamp return 0;
6869ac27a0ecSDave Kleikamp }
6870ac27a0ecSDave Kleikamp
6871ac27a0ecSDave Kleikamp
6872ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
6873ac27a0ecSDave Kleikamp
6874bc8230eeSJan Kara /*
6875bc8230eeSJan Kara * Helper functions so that transaction is started before we acquire dqio_sem
6876bc8230eeSJan Kara * to keep correct lock ordering of transaction > dqio_sem
6877bc8230eeSJan Kara */
dquot_to_inode(struct dquot * dquot)6878ac27a0ecSDave Kleikamp static inline struct inode *dquot_to_inode(struct dquot *dquot)
6879ac27a0ecSDave Kleikamp {
68804c376dcaSEric W. Biederman return sb_dqopt(dquot->dq_sb)->files[dquot->dq_id.type];
6881ac27a0ecSDave Kleikamp }
6882ac27a0ecSDave Kleikamp
ext4_write_dquot(struct dquot * dquot)6883617ba13bSMingming Cao static int ext4_write_dquot(struct dquot *dquot)
6884ac27a0ecSDave Kleikamp {
6885ac27a0ecSDave Kleikamp int ret, err;
6886ac27a0ecSDave Kleikamp handle_t *handle;
6887ac27a0ecSDave Kleikamp struct inode *inode;
6888ac27a0ecSDave Kleikamp
6889ac27a0ecSDave Kleikamp inode = dquot_to_inode(dquot);
68909924a92aSTheodore Ts'o handle = ext4_journal_start(inode, EXT4_HT_QUOTA,
6891617ba13bSMingming Cao EXT4_QUOTA_TRANS_BLOCKS(dquot->dq_sb));
6892ac27a0ecSDave Kleikamp if (IS_ERR(handle))
6893ac27a0ecSDave Kleikamp return PTR_ERR(handle);
6894ac27a0ecSDave Kleikamp ret = dquot_commit(dquot);
6895a5e76867SYe Bin if (ret < 0)
6896a5e76867SYe Bin ext4_error_err(dquot->dq_sb, -ret,
6897a5e76867SYe Bin "Failed to commit dquot type %d",
6898a5e76867SYe Bin dquot->dq_id.type);
6899617ba13bSMingming Cao err = ext4_journal_stop(handle);
6900ac27a0ecSDave Kleikamp if (!ret)
6901ac27a0ecSDave Kleikamp ret = err;
6902ac27a0ecSDave Kleikamp return ret;
6903ac27a0ecSDave Kleikamp }
6904ac27a0ecSDave Kleikamp
ext4_acquire_dquot(struct dquot * dquot)6905617ba13bSMingming Cao static int ext4_acquire_dquot(struct dquot *dquot)
6906ac27a0ecSDave Kleikamp {
6907ac27a0ecSDave Kleikamp int ret, err;
6908ac27a0ecSDave Kleikamp handle_t *handle;
6909ac27a0ecSDave Kleikamp
69109924a92aSTheodore Ts'o handle = ext4_journal_start(dquot_to_inode(dquot), EXT4_HT_QUOTA,
6911617ba13bSMingming Cao EXT4_QUOTA_INIT_BLOCKS(dquot->dq_sb));
6912ac27a0ecSDave Kleikamp if (IS_ERR(handle))
6913ac27a0ecSDave Kleikamp return PTR_ERR(handle);
6914ac27a0ecSDave Kleikamp ret = dquot_acquire(dquot);
6915a5e76867SYe Bin if (ret < 0)
6916a5e76867SYe Bin ext4_error_err(dquot->dq_sb, -ret,
6917a5e76867SYe Bin "Failed to acquire dquot type %d",
6918a5e76867SYe Bin dquot->dq_id.type);
6919617ba13bSMingming Cao err = ext4_journal_stop(handle);
6920ac27a0ecSDave Kleikamp if (!ret)
6921ac27a0ecSDave Kleikamp ret = err;
6922ac27a0ecSDave Kleikamp return ret;
6923ac27a0ecSDave Kleikamp }
6924ac27a0ecSDave Kleikamp
ext4_release_dquot(struct dquot * dquot)6925617ba13bSMingming Cao static int ext4_release_dquot(struct dquot *dquot)
6926ac27a0ecSDave Kleikamp {
6927ac27a0ecSDave Kleikamp int ret, err;
6928ac27a0ecSDave Kleikamp handle_t *handle;
6929ac27a0ecSDave Kleikamp
69309924a92aSTheodore Ts'o handle = ext4_journal_start(dquot_to_inode(dquot), EXT4_HT_QUOTA,
6931617ba13bSMingming Cao EXT4_QUOTA_DEL_BLOCKS(dquot->dq_sb));
69329c3013e9SJan Kara if (IS_ERR(handle)) {
69339c3013e9SJan Kara /* Release dquot anyway to avoid endless cycle in dqput() */
69349c3013e9SJan Kara dquot_release(dquot);
6935ac27a0ecSDave Kleikamp return PTR_ERR(handle);
69369c3013e9SJan Kara }
6937ac27a0ecSDave Kleikamp ret = dquot_release(dquot);
6938a5e76867SYe Bin if (ret < 0)
6939a5e76867SYe Bin ext4_error_err(dquot->dq_sb, -ret,
6940a5e76867SYe Bin "Failed to release dquot type %d",
6941a5e76867SYe Bin dquot->dq_id.type);
6942617ba13bSMingming Cao err = ext4_journal_stop(handle);
6943ac27a0ecSDave Kleikamp if (!ret)
6944ac27a0ecSDave Kleikamp ret = err;
6945ac27a0ecSDave Kleikamp return ret;
6946ac27a0ecSDave Kleikamp }
6947ac27a0ecSDave Kleikamp
ext4_mark_dquot_dirty(struct dquot * dquot)6948617ba13bSMingming Cao static int ext4_mark_dquot_dirty(struct dquot *dquot)
6949ac27a0ecSDave Kleikamp {
6950262b4662SJan Kara struct super_block *sb = dquot->dq_sb;
6951262b4662SJan Kara
6952f177ee08SRoman Anufriev if (ext4_is_quota_journalled(sb)) {
6953ac27a0ecSDave Kleikamp dquot_mark_dquot_dirty(dquot);
6954617ba13bSMingming Cao return ext4_write_dquot(dquot);
6955ac27a0ecSDave Kleikamp } else {
6956ac27a0ecSDave Kleikamp return dquot_mark_dquot_dirty(dquot);
6957ac27a0ecSDave Kleikamp }
6958ac27a0ecSDave Kleikamp }
6959ac27a0ecSDave Kleikamp
ext4_write_info(struct super_block * sb,int type)6960617ba13bSMingming Cao static int ext4_write_info(struct super_block *sb, int type)
6961ac27a0ecSDave Kleikamp {
6962ac27a0ecSDave Kleikamp int ret, err;
6963ac27a0ecSDave Kleikamp handle_t *handle;
6964ac27a0ecSDave Kleikamp
6965ac27a0ecSDave Kleikamp /* Data block + inode block */
6966f9c1f248SBaokun Li handle = ext4_journal_start_sb(sb, EXT4_HT_QUOTA, 2);
6967ac27a0ecSDave Kleikamp if (IS_ERR(handle))
6968ac27a0ecSDave Kleikamp return PTR_ERR(handle);
6969ac27a0ecSDave Kleikamp ret = dquot_commit_info(sb, type);
6970617ba13bSMingming Cao err = ext4_journal_stop(handle);
6971ac27a0ecSDave Kleikamp if (!ret)
6972ac27a0ecSDave Kleikamp ret = err;
6973ac27a0ecSDave Kleikamp return ret;
6974ac27a0ecSDave Kleikamp }
6975ac27a0ecSDave Kleikamp
/*
 * Set the lockdep subclass of @inode's i_data_sem to @subclass.  The callers
 * in this file pass I_DATA_SEM_QUOTA before turning quota on for the inode
 * and I_DATA_SEM_NORMAL when that fails.
 */
static void lockdep_set_quota_inode(struct inode *inode, int subclass)
{
	struct ext4_inode_info *ei = EXT4_I(inode);

	/* The first argument of lockdep_set_subclass has to be
	 * *exactly* the same as the argument to init_rwsem() --- in
	 * this case, in init_once() --- or lockdep gets unhappy
	 * because the name of the lock is set using the
	 * stringification of the argument to init_rwsem().
	 * Do not rename "ei" or rewrite the expression below.
	 */
	(void) ei;	/* shut up clang warning if !CONFIG_LOCKDEP */
	lockdep_set_subclass(&ei->i_data_sem, subclass);
}
6989daf647d2STheodore Ts'o
6990ac27a0ecSDave Kleikamp /*
6991ac27a0ecSDave Kleikamp * Standard function to be called on quota_on
6992ac27a0ecSDave Kleikamp */
ext4_quota_on(struct super_block * sb,int type,int format_id,const struct path * path)6993617ba13bSMingming Cao static int ext4_quota_on(struct super_block *sb, int type, int format_id,
69948c54ca9cSAl Viro const struct path *path)
6995ac27a0ecSDave Kleikamp {
6996ac27a0ecSDave Kleikamp int err;
6997ac27a0ecSDave Kleikamp
6998ac27a0ecSDave Kleikamp if (!test_opt(sb, QUOTA))
6999ac27a0ecSDave Kleikamp return -EINVAL;
70000623543bSJan Kara
7001ac27a0ecSDave Kleikamp /* Quotafile not on the same filesystem? */
7002d8c9584eSAl Viro if (path->dentry->d_sb != sb)
7003ac27a0ecSDave Kleikamp return -EXDEV;
7004e0770e91SJan Kara
7005e0770e91SJan Kara /* Quota already enabled for this file? */
7006e0770e91SJan Kara if (IS_NOQUOTA(d_inode(path->dentry)))
7007e0770e91SJan Kara return -EBUSY;
7008e0770e91SJan Kara
70090623543bSJan Kara /* Journaling quota? */
70100623543bSJan Kara if (EXT4_SB(sb)->s_qf_names[type]) {
70112b2d6d01STheodore Ts'o /* Quotafile not in fs root? */
7012f00c9e44SJan Kara if (path->dentry->d_parent != sb->s_root)
7013b31e1552SEric Sandeen ext4_msg(sb, KERN_WARNING,
7014b31e1552SEric Sandeen "Quota file not on filesystem root. "
7015b31e1552SEric Sandeen "Journaled quota will not work");
701691389240SJan Kara sb_dqopt(sb)->flags |= DQUOT_NOLIST_DIRTY;
701791389240SJan Kara } else {
701891389240SJan Kara /*
701991389240SJan Kara * Clear the flag just in case mount options changed since
702091389240SJan Kara * last time.
702191389240SJan Kara */
702291389240SJan Kara sb_dqopt(sb)->flags &= ~DQUOT_NOLIST_DIRTY;
70230623543bSJan Kara }
70240623543bSJan Kara
7025daf647d2STheodore Ts'o lockdep_set_quota_inode(path->dentry->d_inode, I_DATA_SEM_QUOTA);
7026daf647d2STheodore Ts'o err = dquot_quota_on(sb, type, format_id, path);
702715fc69bbSJan Kara if (!err) {
7028957153fcSJan Kara struct inode *inode = d_inode(path->dentry);
7029957153fcSJan Kara handle_t *handle;
7030957153fcSJan Kara
703161a92987SJan Kara /*
703261a92987SJan Kara * Set inode flags to prevent userspace from messing with quota
703361a92987SJan Kara * files. If this fails, we return success anyway since quotas
703461a92987SJan Kara * are already enabled and this is not a hard failure.
703561a92987SJan Kara */
7036957153fcSJan Kara inode_lock(inode);
7037957153fcSJan Kara handle = ext4_journal_start(inode, EXT4_HT_QUOTA, 1);
7038957153fcSJan Kara if (IS_ERR(handle))
7039957153fcSJan Kara goto unlock_inode;
7040957153fcSJan Kara EXT4_I(inode)->i_flags |= EXT4_NOATIME_FL | EXT4_IMMUTABLE_FL;
7041957153fcSJan Kara inode_set_flags(inode, S_NOATIME | S_IMMUTABLE,
7042957153fcSJan Kara S_NOATIME | S_IMMUTABLE);
70434209ae12SHarshad Shirwadkar err = ext4_mark_inode_dirty(handle, inode);
7044957153fcSJan Kara ext4_journal_stop(handle);
7045957153fcSJan Kara unlock_inode:
7046957153fcSJan Kara inode_unlock(inode);
704715fc69bbSJan Kara if (err)
704815fc69bbSJan Kara dquot_quota_off(sb, type);
7049957153fcSJan Kara }
705015fc69bbSJan Kara if (err)
705115fc69bbSJan Kara lockdep_set_quota_inode(path->dentry->d_inode,
705215fc69bbSJan Kara I_DATA_SEM_NORMAL);
7053daf647d2STheodore Ts'o return err;
7054ac27a0ecSDave Kleikamp }
7055ac27a0ecSDave Kleikamp
ext4_check_quota_inum(int type,unsigned long qf_inum)705607342ec2SBaokun Li static inline bool ext4_check_quota_inum(int type, unsigned long qf_inum)
705707342ec2SBaokun Li {
705807342ec2SBaokun Li switch (type) {
705907342ec2SBaokun Li case USRQUOTA:
706007342ec2SBaokun Li return qf_inum == EXT4_USR_QUOTA_INO;
706107342ec2SBaokun Li case GRPQUOTA:
706207342ec2SBaokun Li return qf_inum == EXT4_GRP_QUOTA_INO;
706307342ec2SBaokun Li case PRJQUOTA:
706407342ec2SBaokun Li return qf_inum >= EXT4_GOOD_OLD_FIRST_INO;
706507342ec2SBaokun Li default:
706607342ec2SBaokun Li BUG();
706707342ec2SBaokun Li }
706807342ec2SBaokun Li }
706907342ec2SBaokun Li
ext4_quota_enable(struct super_block * sb,int type,int format_id,unsigned int flags)70707c319d32SAditya Kali static int ext4_quota_enable(struct super_block *sb, int type, int format_id,
70717c319d32SAditya Kali unsigned int flags)
70727c319d32SAditya Kali {
70737c319d32SAditya Kali int err;
70747c319d32SAditya Kali struct inode *qf_inode;
7075a2d4a646SJan Kara unsigned long qf_inums[EXT4_MAXQUOTAS] = {
70767c319d32SAditya Kali le32_to_cpu(EXT4_SB(sb)->s_es->s_usr_quota_inum),
7077689c958cSLi Xi le32_to_cpu(EXT4_SB(sb)->s_es->s_grp_quota_inum),
7078689c958cSLi Xi le32_to_cpu(EXT4_SB(sb)->s_es->s_prj_quota_inum)
70797c319d32SAditya Kali };
70807c319d32SAditya Kali
7081e2b911c5SDarrick J. Wong BUG_ON(!ext4_has_feature_quota(sb));
70827c319d32SAditya Kali
70837c319d32SAditya Kali if (!qf_inums[type])
70847c319d32SAditya Kali return -EPERM;
70857c319d32SAditya Kali
708607342ec2SBaokun Li if (!ext4_check_quota_inum(type, qf_inums[type])) {
708707342ec2SBaokun Li ext4_error(sb, "Bad quota inum: %lu, type: %d",
708807342ec2SBaokun Li qf_inums[type], type);
708907342ec2SBaokun Li return -EUCLEAN;
709007342ec2SBaokun Li }
709107342ec2SBaokun Li
70928a363970STheodore Ts'o qf_inode = ext4_iget(sb, qf_inums[type], EXT4_IGET_SPECIAL);
70937c319d32SAditya Kali if (IS_ERR(qf_inode)) {
709407342ec2SBaokun Li ext4_error(sb, "Bad quota inode: %lu, type: %d",
709507342ec2SBaokun Li qf_inums[type], type);
70967c319d32SAditya Kali return PTR_ERR(qf_inode);
70977c319d32SAditya Kali }
70987c319d32SAditya Kali
7099bcb13850SJan Kara /* Don't account quota for quota files to avoid recursion */
7100bcb13850SJan Kara qf_inode->i_flags |= S_NOQUOTA;
7101daf647d2STheodore Ts'o lockdep_set_quota_inode(qf_inode, I_DATA_SEM_QUOTA);
71027212b95eSJan Kara err = dquot_load_quota_inode(qf_inode, type, format_id, flags);
7103daf647d2STheodore Ts'o if (err)
7104daf647d2STheodore Ts'o lockdep_set_quota_inode(qf_inode, I_DATA_SEM_NORMAL);
710561157b24SPan Bian iput(qf_inode);
71067c319d32SAditya Kali
71077c319d32SAditya Kali return err;
71087c319d32SAditya Kali }
71097c319d32SAditya Kali
71107c319d32SAditya Kali /* Enable usage tracking for all quota types. */
ext4_enable_quotas(struct super_block * sb)711125c6d98fSJan Kara int ext4_enable_quotas(struct super_block *sb)
71127c319d32SAditya Kali {
71137c319d32SAditya Kali int type, err = 0;
7114a2d4a646SJan Kara unsigned long qf_inums[EXT4_MAXQUOTAS] = {
71157c319d32SAditya Kali le32_to_cpu(EXT4_SB(sb)->s_es->s_usr_quota_inum),
7116689c958cSLi Xi le32_to_cpu(EXT4_SB(sb)->s_es->s_grp_quota_inum),
7117689c958cSLi Xi le32_to_cpu(EXT4_SB(sb)->s_es->s_prj_quota_inum)
71187c319d32SAditya Kali };
711949da9392SJan Kara bool quota_mopt[EXT4_MAXQUOTAS] = {
712049da9392SJan Kara test_opt(sb, USRQUOTA),
712149da9392SJan Kara test_opt(sb, GRPQUOTA),
712249da9392SJan Kara test_opt(sb, PRJQUOTA),
712349da9392SJan Kara };
71247c319d32SAditya Kali
712591389240SJan Kara sb_dqopt(sb)->flags |= DQUOT_QUOTA_SYS_FILE | DQUOT_NOLIST_DIRTY;
7126a2d4a646SJan Kara for (type = 0; type < EXT4_MAXQUOTAS; type++) {
71277c319d32SAditya Kali if (qf_inums[type]) {
71287c319d32SAditya Kali err = ext4_quota_enable(sb, type, QFMT_VFS_V1,
712949da9392SJan Kara DQUOT_USAGE_ENABLED |
713049da9392SJan Kara (quota_mopt[type] ? DQUOT_LIMITS_ENABLED : 0));
71317c319d32SAditya Kali if (err) {
71327c319d32SAditya Kali ext4_warning(sb,
713372ba7450STheodore Ts'o "Failed to enable quota tracking "
713407342ec2SBaokun Li "(type=%d, err=%d, ino=%lu). "
713507342ec2SBaokun Li "Please run e2fsck to fix.", type,
713607342ec2SBaokun Li err, qf_inums[type]);
71374013d47aSJan Kara
7138f3c1c42eSBaokun Li ext4_quotas_off(sb, type);
71397c319d32SAditya Kali return err;
71407c319d32SAditya Kali }
71417c319d32SAditya Kali }
71427c319d32SAditya Kali }
71437c319d32SAditya Kali return 0;
71447c319d32SAditya Kali }
71457c319d32SAditya Kali
ext4_quota_off(struct super_block * sb,int type)7146ca0e05e4SDmitry Monakhov static int ext4_quota_off(struct super_block *sb, int type)
7147ca0e05e4SDmitry Monakhov {
714821f97697SJan Kara struct inode *inode = sb_dqopt(sb)->files[type];
714921f97697SJan Kara handle_t *handle;
7150957153fcSJan Kara int err;
715121f97697SJan Kara
715287009d86SDmitry Monakhov /* Force all delayed allocation blocks to be allocated.
715387009d86SDmitry Monakhov * Caller already holds s_umount sem */
715487009d86SDmitry Monakhov if (test_opt(sb, DELALLOC))
7155ca0e05e4SDmitry Monakhov sync_filesystem(sb);
7156ca0e05e4SDmitry Monakhov
7157957153fcSJan Kara if (!inode || !igrab(inode))
71580b268590SAmir Goldstein goto out;
71590b268590SAmir Goldstein
7160957153fcSJan Kara err = dquot_quota_off(sb, type);
7161964edf66SJan Kara if (err || ext4_has_feature_quota(sb))
7162957153fcSJan Kara goto out_put;
7163e0e985f3SJan Kara /*
7164e0e985f3SJan Kara * When the filesystem was remounted read-only first, we cannot cleanup
7165e0e985f3SJan Kara * inode flags here. Bad luck but people should be using QUOTA feature
7166e0e985f3SJan Kara * these days anyway.
7167e0e985f3SJan Kara */
7168e0e985f3SJan Kara if (sb_rdonly(sb))
7169e0e985f3SJan Kara goto out_put;
7170957153fcSJan Kara
7171957153fcSJan Kara inode_lock(inode);
717261a92987SJan Kara /*
717361a92987SJan Kara * Update modification times of quota files when userspace can
717461a92987SJan Kara * start looking at them. If we fail, we return success anyway since
717561a92987SJan Kara * this is not a hard failure and quotas are already disabled.
717661a92987SJan Kara */
71779924a92aSTheodore Ts'o handle = ext4_journal_start(inode, EXT4_HT_QUOTA, 1);
71784209ae12SHarshad Shirwadkar if (IS_ERR(handle)) {
71794209ae12SHarshad Shirwadkar err = PTR_ERR(handle);
7180957153fcSJan Kara goto out_unlock;
71814209ae12SHarshad Shirwadkar }
7182957153fcSJan Kara EXT4_I(inode)->i_flags &= ~(EXT4_NOATIME_FL | EXT4_IMMUTABLE_FL);
7183957153fcSJan Kara inode_set_flags(inode, 0, S_NOATIME | S_IMMUTABLE);
7184fa42d5f1SJeff Layton inode_set_mtime_to_ts(inode, inode_set_ctime_current(inode));
71854209ae12SHarshad Shirwadkar err = ext4_mark_inode_dirty(handle, inode);
718621f97697SJan Kara ext4_journal_stop(handle);
7187957153fcSJan Kara out_unlock:
7188957153fcSJan Kara inode_unlock(inode);
7189957153fcSJan Kara out_put:
7190964edf66SJan Kara lockdep_set_quota_inode(inode, I_DATA_SEM_NORMAL);
7191957153fcSJan Kara iput(inode);
7192957153fcSJan Kara return err;
719321f97697SJan Kara out:
7194ca0e05e4SDmitry Monakhov return dquot_quota_off(sb, type);
7195ca0e05e4SDmitry Monakhov }
7196ca0e05e4SDmitry Monakhov
7197ac27a0ecSDave Kleikamp /* Read data from quotafile - avoid pagecache and such because we cannot afford
7198ac27a0ecSDave Kleikamp * acquiring the locks... As quota files are never truncated and quota code
7199ac27a0ecSDave Kleikamp * itself serializes the operations (and no one else should touch the files)
7200ac27a0ecSDave Kleikamp * we don't have to be afraid of races */
ext4_quota_read(struct super_block * sb,int type,char * data,size_t len,loff_t off)7201617ba13bSMingming Cao static ssize_t ext4_quota_read(struct super_block *sb, int type, char *data,
7202ac27a0ecSDave Kleikamp size_t len, loff_t off)
7203ac27a0ecSDave Kleikamp {
7204ac27a0ecSDave Kleikamp struct inode *inode = sb_dqopt(sb)->files[type];
7205725d26d3SAneesh Kumar K.V ext4_lblk_t blk = off >> EXT4_BLOCK_SIZE_BITS(sb);
7206ac27a0ecSDave Kleikamp int offset = off & (sb->s_blocksize - 1);
7207ac27a0ecSDave Kleikamp int tocopy;
7208ac27a0ecSDave Kleikamp size_t toread;
7209ac27a0ecSDave Kleikamp struct buffer_head *bh;
7210ac27a0ecSDave Kleikamp loff_t i_size = i_size_read(inode);
7211ac27a0ecSDave Kleikamp
7212ac27a0ecSDave Kleikamp if (off > i_size)
7213ac27a0ecSDave Kleikamp return 0;
7214ac27a0ecSDave Kleikamp if (off+len > i_size)
7215ac27a0ecSDave Kleikamp len = i_size-off;
7216ac27a0ecSDave Kleikamp toread = len;
7217ac27a0ecSDave Kleikamp while (toread > 0) {
721866267814SJiangshan Yi tocopy = min_t(unsigned long, sb->s_blocksize - offset, toread);
72191c215028STheodore Ts'o bh = ext4_bread(NULL, inode, blk, 0);
72201c215028STheodore Ts'o if (IS_ERR(bh))
72211c215028STheodore Ts'o return PTR_ERR(bh);
7222ac27a0ecSDave Kleikamp if (!bh) /* A hole? */
7223ac27a0ecSDave Kleikamp memset(data, 0, tocopy);
7224ac27a0ecSDave Kleikamp else
7225ac27a0ecSDave Kleikamp memcpy(data, bh->b_data+offset, tocopy);
7226ac27a0ecSDave Kleikamp brelse(bh);
7227ac27a0ecSDave Kleikamp offset = 0;
7228ac27a0ecSDave Kleikamp toread -= tocopy;
7229ac27a0ecSDave Kleikamp data += tocopy;
7230ac27a0ecSDave Kleikamp blk++;
7231ac27a0ecSDave Kleikamp }
7232ac27a0ecSDave Kleikamp return len;
7233ac27a0ecSDave Kleikamp }
7234ac27a0ecSDave Kleikamp
7235ac27a0ecSDave Kleikamp /* Write to quotafile (we know the transaction is already started and has
7236ac27a0ecSDave Kleikamp * enough credits) */
ext4_quota_write(struct super_block * sb,int type,const char * data,size_t len,loff_t off)7237617ba13bSMingming Cao static ssize_t ext4_quota_write(struct super_block *sb, int type,
7238ac27a0ecSDave Kleikamp const char *data, size_t len, loff_t off)
7239ac27a0ecSDave Kleikamp {
7240ac27a0ecSDave Kleikamp struct inode *inode = sb_dqopt(sb)->files[type];
7241725d26d3SAneesh Kumar K.V ext4_lblk_t blk = off >> EXT4_BLOCK_SIZE_BITS(sb);
72424209ae12SHarshad Shirwadkar int err = 0, err2 = 0, offset = off & (sb->s_blocksize - 1);
7243c5e298aeSTheodore Ts'o int retries = 0;
7244ac27a0ecSDave Kleikamp struct buffer_head *bh;
7245ac27a0ecSDave Kleikamp handle_t *handle = journal_current_handle();
7246ac27a0ecSDave Kleikamp
7247380a0091SYe Bin if (!handle) {
7248b31e1552SEric Sandeen ext4_msg(sb, KERN_WARNING, "Quota write (off=%llu, len=%llu)"
7249b31e1552SEric Sandeen " cancelled because transaction is not started",
72509c3013e9SJan Kara (unsigned long long)off, (unsigned long long)len);
72519c3013e9SJan Kara return -EIO;
72529c3013e9SJan Kara }
725367eeb568SDmitry Monakhov /*
725467eeb568SDmitry Monakhov * Since we account only one data block in transaction credits,
725567eeb568SDmitry Monakhov * then it is impossible to cross a block boundary.
725667eeb568SDmitry Monakhov */
725767eeb568SDmitry Monakhov if (sb->s_blocksize - offset < len) {
725867eeb568SDmitry Monakhov ext4_msg(sb, KERN_WARNING, "Quota write (off=%llu, len=%llu)"
725967eeb568SDmitry Monakhov " cancelled because not block aligned",
726067eeb568SDmitry Monakhov (unsigned long long)off, (unsigned long long)len);
726167eeb568SDmitry Monakhov return -EIO;
726267eeb568SDmitry Monakhov }
726367eeb568SDmitry Monakhov
7264c5e298aeSTheodore Ts'o do {
7265c5e298aeSTheodore Ts'o bh = ext4_bread(handle, inode, blk,
7266c5e298aeSTheodore Ts'o EXT4_GET_BLOCKS_CREATE |
7267c5e298aeSTheodore Ts'o EXT4_GET_BLOCKS_METADATA_NOFAIL);
726845586c70SMasahiro Yamada } while (PTR_ERR(bh) == -ENOSPC &&
7269c5e298aeSTheodore Ts'o ext4_should_retry_alloc(inode->i_sb, &retries));
72701c215028STheodore Ts'o if (IS_ERR(bh))
72711c215028STheodore Ts'o return PTR_ERR(bh);
7272ac27a0ecSDave Kleikamp if (!bh)
7273ac27a0ecSDave Kleikamp goto out;
72745d601255Sliang xie BUFFER_TRACE(bh, "get write access");
7275188c299eSJan Kara err = ext4_journal_get_write_access(handle, sb, bh, EXT4_JTR_NONE);
7276ac27a0ecSDave Kleikamp if (err) {
7277ac27a0ecSDave Kleikamp brelse(bh);
72781c215028STheodore Ts'o return err;
7279ac27a0ecSDave Kleikamp }
7280ac27a0ecSDave Kleikamp lock_buffer(bh);
728167eeb568SDmitry Monakhov memcpy(bh->b_data+offset, data, len);
7282ac27a0ecSDave Kleikamp flush_dcache_page(bh->b_page);
7283ac27a0ecSDave Kleikamp unlock_buffer(bh);
72840390131bSFrank Mayhar err = ext4_handle_dirty_metadata(handle, NULL, bh);
7285ac27a0ecSDave Kleikamp brelse(bh);
7286ac27a0ecSDave Kleikamp out:
728767eeb568SDmitry Monakhov if (inode->i_size < off + len) {
728867eeb568SDmitry Monakhov i_size_write(inode, off + len);
7289617ba13bSMingming Cao EXT4_I(inode)->i_disksize = inode->i_size;
72904209ae12SHarshad Shirwadkar err2 = ext4_mark_inode_dirty(handle, inode);
72914209ae12SHarshad Shirwadkar if (unlikely(err2 && !err))
72924209ae12SHarshad Shirwadkar err = err2;
729321f97697SJan Kara }
72944209ae12SHarshad Shirwadkar return err ? err : len;
7295ac27a0ecSDave Kleikamp }
7296ac27a0ecSDave Kleikamp #endif
7297ac27a0ecSDave Kleikamp
7298c290ea01SJan Kara #if !defined(CONFIG_EXT2_FS) && !defined(CONFIG_EXT2_FS_MODULE) && defined(CONFIG_EXT4_USE_FOR_EXT2)
register_as_ext2(void)729924b58424STheodore Ts'o static inline void register_as_ext2(void)
730024b58424STheodore Ts'o {
730124b58424STheodore Ts'o int err = register_filesystem(&ext2_fs_type);
730224b58424STheodore Ts'o if (err)
730324b58424STheodore Ts'o printk(KERN_WARNING
730424b58424STheodore Ts'o "EXT4-fs: Unable to register as ext2 (%d)\n", err);
730524b58424STheodore Ts'o }
730624b58424STheodore Ts'o
unregister_as_ext2(void)730724b58424STheodore Ts'o static inline void unregister_as_ext2(void)
730824b58424STheodore Ts'o {
730924b58424STheodore Ts'o unregister_filesystem(&ext2_fs_type);
731024b58424STheodore Ts'o }
73112035e776STheodore Ts'o
/*
 * Decide whether the feature set of @sb is acceptable for ext2.
 *
 * Returns 0 when unknown ext2 incompat features are present.  Otherwise
 * returns 1 for a read-only superblock, and for a writable one returns 1
 * only if no unknown ext2 ro_compat features are present.
 */
static inline int ext2_feature_set_ok(struct super_block *sb)
{
	if (ext4_has_unknown_ext2_incompat_features(sb))
		return 0;

	/* ro_compat features only matter when the fs can be written. */
	if (sb_rdonly(sb))
		return 1;

	return ext4_has_unknown_ext2_ro_compat_features(sb) ? 0 : 1;
}
732224b58424STheodore Ts'o #else
/* No-op variants for builds where the preceding #if condition is false. */
static inline void register_as_ext2(void)
{
}

static inline void unregister_as_ext2(void)
{
}

/* In this configuration no feature set is reported as acceptable. */
static inline int ext2_feature_set_ok(struct super_block *sb)
{
	return 0;
}
732624b58424STheodore Ts'o #endif
732724b58424STheodore Ts'o
register_as_ext3(void)732824b58424STheodore Ts'o static inline void register_as_ext3(void)
732924b58424STheodore Ts'o {
733024b58424STheodore Ts'o int err = register_filesystem(&ext3_fs_type);
733124b58424STheodore Ts'o if (err)
733224b58424STheodore Ts'o printk(KERN_WARNING
733324b58424STheodore Ts'o "EXT4-fs: Unable to register as ext3 (%d)\n", err);
733424b58424STheodore Ts'o }
733524b58424STheodore Ts'o
unregister_as_ext3(void)733624b58424STheodore Ts'o static inline void unregister_as_ext3(void)
733724b58424STheodore Ts'o {
733824b58424STheodore Ts'o unregister_filesystem(&ext3_fs_type);
733924b58424STheodore Ts'o }
73402035e776STheodore Ts'o
/*
 * Decide whether the feature set of @sb is acceptable for ext3.
 *
 * Returns 0 when unknown ext3 incompat features are present or the journal
 * feature is missing.  Otherwise returns 1 for a read-only superblock, and
 * for a writable one returns 1 only if no unknown ext3 ro_compat features
 * are present.
 */
static inline int ext3_feature_set_ok(struct super_block *sb)
{
	if (ext4_has_unknown_ext3_incompat_features(sb) ||
	    !ext4_has_feature_journal(sb))
		return 0;

	/* ro_compat features only matter when the fs can be written. */
	if (sb_rdonly(sb))
		return 1;

	return ext4_has_unknown_ext3_ro_compat_features(sb) ? 0 : 1;
}
735324b58424STheodore Ts'o
ext4_kill_sb(struct super_block * sb)73541489dffdSChristoph Hellwig static void ext4_kill_sb(struct super_block *sb)
73551489dffdSChristoph Hellwig {
73561489dffdSChristoph Hellwig struct ext4_sb_info *sbi = EXT4_SB(sb);
73571489dffdSChristoph Hellwig struct block_device *journal_bdev = sbi ? sbi->s_journal_bdev : NULL;
73581489dffdSChristoph Hellwig
73591489dffdSChristoph Hellwig kill_block_super(sb);
73601489dffdSChristoph Hellwig
73611489dffdSChristoph Hellwig if (journal_bdev)
73621489dffdSChristoph Hellwig blkdev_put(journal_bdev, sb);
73631489dffdSChristoph Hellwig }
73641489dffdSChristoph Hellwig
736503010a33STheodore Ts'o static struct file_system_type ext4_fs_type = {
7366ac27a0ecSDave Kleikamp .owner = THIS_MODULE,
736703010a33STheodore Ts'o .name = "ext4",
7368cebe85d5SLukas Czerner .init_fs_context = ext4_init_fs_context,
7369cebe85d5SLukas Czerner .parameters = ext4_param_specs,
73701489dffdSChristoph Hellwig .kill_sb = ext4_kill_sb,
737150ec1d72SChristian Brauner .fs_flags = FS_REQUIRES_DEV | FS_ALLOW_IDMAP,
7372ac27a0ecSDave Kleikamp };
73737f78e035SEric W. Biederman MODULE_ALIAS_FS("ext4");
7374ac27a0ecSDave Kleikamp
7375e9e3bcecSEric Sandeen /* Shared across all ext4 file systems */
7376e9e3bcecSEric Sandeen wait_queue_head_t ext4__ioend_wq[EXT4_WQ_HASH_SZ];
7377e9e3bcecSEric Sandeen
ext4_init_fs(void)73785dabfc78STheodore Ts'o static int __init ext4_init_fs(void)
7379ac27a0ecSDave Kleikamp {
7380e9e3bcecSEric Sandeen int i, err;
7381c9de560dSAlex Tomas
7382e294a537STheodore Ts'o ratelimit_state_init(&ext4_mount_msg_ratelimit, 30 * HZ, 64);
738307c0c5d8SAl Viro ext4_li_info = NULL;
738407c0c5d8SAl Viro
73859a4c8019SCarlos Maiolino /* Build-time check for flags consistency */
738612e9b892SDmitry Monakhov ext4_check_flag_values();
7387e9e3bcecSEric Sandeen
7388e142d052SJan Kara for (i = 0; i < EXT4_WQ_HASH_SZ; i++)
7389e9e3bcecSEric Sandeen init_waitqueue_head(&ext4__ioend_wq[i]);
7390e9e3bcecSEric Sandeen
739151865fdaSZheng Liu err = ext4_init_es();
73926fd058f7STheodore Ts'o if (err)
73936fd058f7STheodore Ts'o return err;
739451865fdaSZheng Liu
73951dc0aa46SEric Whitney err = ext4_init_pending();
73961dc0aa46SEric Whitney if (err)
739722cfe4b4SEric Biggers goto out7;
739822cfe4b4SEric Biggers
739922cfe4b4SEric Biggers err = ext4_init_post_read_processing();
740022cfe4b4SEric Biggers if (err)
74011dc0aa46SEric Whitney goto out6;
74021dc0aa46SEric Whitney
740351865fdaSZheng Liu err = ext4_init_pageio();
740451865fdaSZheng Liu if (err)
7405b5799018STheodore Ts'o goto out5;
740651865fdaSZheng Liu
74075dabfc78STheodore Ts'o err = ext4_init_system_zone();
7408bd2d0210STheodore Ts'o if (err)
7409b5799018STheodore Ts'o goto out4;
7410857ac889SLukas Czerner
7411b5799018STheodore Ts'o err = ext4_init_sysfs();
7412dd68314cSTheodore Ts'o if (err)
7413b5799018STheodore Ts'o goto out3;
7414857ac889SLukas Czerner
74155dabfc78STheodore Ts'o err = ext4_init_mballoc();
7416ac27a0ecSDave Kleikamp if (err)
7417c9de560dSAlex Tomas goto out2;
7418ac27a0ecSDave Kleikamp err = init_inodecache();
7419ac27a0ecSDave Kleikamp if (err)
7420ac27a0ecSDave Kleikamp goto out1;
7421aa75f4d3SHarshad Shirwadkar
7422aa75f4d3SHarshad Shirwadkar err = ext4_fc_init_dentry_cache();
7423aa75f4d3SHarshad Shirwadkar if (err)
7424aa75f4d3SHarshad Shirwadkar goto out05;
7425aa75f4d3SHarshad Shirwadkar
742624b58424STheodore Ts'o register_as_ext3();
74272035e776STheodore Ts'o register_as_ext2();
742803010a33STheodore Ts'o err = register_filesystem(&ext4_fs_type);
7429ac27a0ecSDave Kleikamp if (err)
7430ac27a0ecSDave Kleikamp goto out;
7431bfff6873SLukas Czerner
7432ac27a0ecSDave Kleikamp return 0;
7433ac27a0ecSDave Kleikamp out:
743424b58424STheodore Ts'o unregister_as_ext2();
743524b58424STheodore Ts'o unregister_as_ext3();
7436ab047d51SSebastian Andrzej Siewior ext4_fc_destroy_dentry_cache();
7437aa75f4d3SHarshad Shirwadkar out05:
7438ac27a0ecSDave Kleikamp destroy_inodecache();
7439ac27a0ecSDave Kleikamp out1:
74405dabfc78STheodore Ts'o ext4_exit_mballoc();
74419c191f70ST Makphaibulchoke out2:
7442b5799018STheodore Ts'o ext4_exit_sysfs();
7443b5799018STheodore Ts'o out3:
7444dd68314cSTheodore Ts'o ext4_exit_system_zone();
7445b5799018STheodore Ts'o out4:
74465dabfc78STheodore Ts'o ext4_exit_pageio();
7447b5799018STheodore Ts'o out5:
744822cfe4b4SEric Biggers ext4_exit_post_read_processing();
74491dc0aa46SEric Whitney out6:
745022cfe4b4SEric Biggers ext4_exit_pending();
745122cfe4b4SEric Biggers out7:
745251865fdaSZheng Liu ext4_exit_es();
745351865fdaSZheng Liu
7454ac27a0ecSDave Kleikamp return err;
7455ac27a0ecSDave Kleikamp }
7456ac27a0ecSDave Kleikamp
ext4_exit_fs(void)74575dabfc78STheodore Ts'o static void __exit ext4_exit_fs(void)
7458ac27a0ecSDave Kleikamp {
7459bfff6873SLukas Czerner ext4_destroy_lazyinit_thread();
746024b58424STheodore Ts'o unregister_as_ext2();
746124b58424STheodore Ts'o unregister_as_ext3();
746203010a33STheodore Ts'o unregister_filesystem(&ext4_fs_type);
7463ab047d51SSebastian Andrzej Siewior ext4_fc_destroy_dentry_cache();
7464ac27a0ecSDave Kleikamp destroy_inodecache();
74655dabfc78STheodore Ts'o ext4_exit_mballoc();
7466b5799018STheodore Ts'o ext4_exit_sysfs();
74675dabfc78STheodore Ts'o ext4_exit_system_zone();
74685dabfc78STheodore Ts'o ext4_exit_pageio();
746922cfe4b4SEric Biggers ext4_exit_post_read_processing();
7470dd12ed14SEric Sandeen ext4_exit_es();
74711dc0aa46SEric Whitney ext4_exit_pending();
7472ac27a0ecSDave Kleikamp }
7473ac27a0ecSDave Kleikamp
7474ac27a0ecSDave Kleikamp MODULE_AUTHOR("Remy Card, Stephen Tweedie, Andrew Morton, Andreas Dilger, Theodore Ts'o and others");
747583982b6fSTheodore Ts'o MODULE_DESCRIPTION("Fourth Extended Filesystem");
7476ac27a0ecSDave Kleikamp MODULE_LICENSE("GPL");
74777ef79ad5STheodore Ts'o MODULE_SOFTDEP("pre: crc32c");
74785dabfc78STheodore Ts'o module_init(ext4_init_fs)
74795dabfc78STheodore Ts'o module_exit(ext4_exit_fs)
7480