1ac27a0ecSDave Kleikamp /* 2617ba13bSMingming Cao * linux/fs/ext4/resize.c 3ac27a0ecSDave Kleikamp * 4617ba13bSMingming Cao * Support for resizing an ext4 filesystem while it is mounted. 5ac27a0ecSDave Kleikamp * 6ac27a0ecSDave Kleikamp * Copyright (C) 2001, 2002 Andreas Dilger <adilger@clusterfs.com> 7ac27a0ecSDave Kleikamp * 8ac27a0ecSDave Kleikamp * This could probably be made into a module, because it is not often in use. 9ac27a0ecSDave Kleikamp */ 10ac27a0ecSDave Kleikamp 11ac27a0ecSDave Kleikamp 12617ba13bSMingming Cao #define EXT4FS_DEBUG 13ac27a0ecSDave Kleikamp 14ac27a0ecSDave Kleikamp #include <linux/errno.h> 15ac27a0ecSDave Kleikamp #include <linux/slab.h> 16ac27a0ecSDave Kleikamp 173dcf5451SChristoph Hellwig #include "ext4_jbd2.h" 18ac27a0ecSDave Kleikamp 198f82f840SYongqiang Yang int ext4_resize_begin(struct super_block *sb) 208f82f840SYongqiang Yang { 218f82f840SYongqiang Yang int ret = 0; 228f82f840SYongqiang Yang 238f82f840SYongqiang Yang if (!capable(CAP_SYS_RESOURCE)) 248f82f840SYongqiang Yang return -EPERM; 258f82f840SYongqiang Yang 26ce723c31SYongqiang Yang /* 27ce723c31SYongqiang Yang * We are not allowed to do online-resizing on a filesystem mounted 28ce723c31SYongqiang Yang * with error, because it can destroy the filesystem easily. 
29ce723c31SYongqiang Yang */ 30ce723c31SYongqiang Yang if (EXT4_SB(sb)->s_mount_state & EXT4_ERROR_FS) { 31ce723c31SYongqiang Yang ext4_warning(sb, "There are errors in the filesystem, " 32ce723c31SYongqiang Yang "so online resizing is not allowed\n"); 33ce723c31SYongqiang Yang return -EPERM; 34ce723c31SYongqiang Yang } 35ce723c31SYongqiang Yang 368f82f840SYongqiang Yang if (test_and_set_bit_lock(EXT4_RESIZING, &EXT4_SB(sb)->s_resize_flags)) 378f82f840SYongqiang Yang ret = -EBUSY; 388f82f840SYongqiang Yang 398f82f840SYongqiang Yang return ret; 408f82f840SYongqiang Yang } 418f82f840SYongqiang Yang 428f82f840SYongqiang Yang void ext4_resize_end(struct super_block *sb) 438f82f840SYongqiang Yang { 448f82f840SYongqiang Yang clear_bit_unlock(EXT4_RESIZING, &EXT4_SB(sb)->s_resize_flags); 458f82f840SYongqiang Yang smp_mb__after_clear_bit(); 468f82f840SYongqiang Yang } 478f82f840SYongqiang Yang 48ac27a0ecSDave Kleikamp #define outside(b, first, last) ((b) < (first) || (b) >= (last)) 49ac27a0ecSDave Kleikamp #define inside(b, first, last) ((b) >= (first) && (b) < (last)) 50ac27a0ecSDave Kleikamp 51ac27a0ecSDave Kleikamp static int verify_group_input(struct super_block *sb, 52617ba13bSMingming Cao struct ext4_new_group_data *input) 53ac27a0ecSDave Kleikamp { 54617ba13bSMingming Cao struct ext4_sb_info *sbi = EXT4_SB(sb); 55617ba13bSMingming Cao struct ext4_super_block *es = sbi->s_es; 56bd81d8eeSLaurent Vivier ext4_fsblk_t start = ext4_blocks_count(es); 57617ba13bSMingming Cao ext4_fsblk_t end = start + input->blocks_count; 58fd2d4291SAvantika Mathur ext4_group_t group = input->group; 59617ba13bSMingming Cao ext4_fsblk_t itend = input->inode_table + sbi->s_itb_per_group; 60617ba13bSMingming Cao unsigned overhead = ext4_bg_has_super(sb, group) ? 
61617ba13bSMingming Cao (1 + ext4_bg_num_gdb(sb, group) + 62ac27a0ecSDave Kleikamp le16_to_cpu(es->s_reserved_gdt_blocks)) : 0; 63617ba13bSMingming Cao ext4_fsblk_t metaend = start + overhead; 64ac27a0ecSDave Kleikamp struct buffer_head *bh = NULL; 653a5b2ecdSMingming Cao ext4_grpblk_t free_blocks_count, offset; 66ac27a0ecSDave Kleikamp int err = -EINVAL; 67ac27a0ecSDave Kleikamp 68ac27a0ecSDave Kleikamp input->free_blocks_count = free_blocks_count = 69ac27a0ecSDave Kleikamp input->blocks_count - 2 - overhead - sbi->s_itb_per_group; 70ac27a0ecSDave Kleikamp 71ac27a0ecSDave Kleikamp if (test_opt(sb, DEBUG)) 72617ba13bSMingming Cao printk(KERN_DEBUG "EXT4-fs: adding %s group %u: %u blocks " 73ac27a0ecSDave Kleikamp "(%d free, %u reserved)\n", 74617ba13bSMingming Cao ext4_bg_has_super(sb, input->group) ? "normal" : 75ac27a0ecSDave Kleikamp "no-super", input->group, input->blocks_count, 76ac27a0ecSDave Kleikamp free_blocks_count, input->reserved_blocks); 77ac27a0ecSDave Kleikamp 783a5b2ecdSMingming Cao ext4_get_group_no_and_offset(sb, start, NULL, &offset); 79ac27a0ecSDave Kleikamp if (group != sbi->s_groups_count) 8012062dddSEric Sandeen ext4_warning(sb, "Cannot add at group %u (only %u groups)", 81ac27a0ecSDave Kleikamp input->group, sbi->s_groups_count); 823a5b2ecdSMingming Cao else if (offset != 0) 8312062dddSEric Sandeen ext4_warning(sb, "Last group not full"); 84ac27a0ecSDave Kleikamp else if (input->reserved_blocks > input->blocks_count / 5) 8512062dddSEric Sandeen ext4_warning(sb, "Reserved blocks too high (%u)", 86ac27a0ecSDave Kleikamp input->reserved_blocks); 87ac27a0ecSDave Kleikamp else if (free_blocks_count < 0) 8812062dddSEric Sandeen ext4_warning(sb, "Bad blocks count %u", 89ac27a0ecSDave Kleikamp input->blocks_count); 90ac27a0ecSDave Kleikamp else if (!(bh = sb_bread(sb, end - 1))) 9112062dddSEric Sandeen ext4_warning(sb, "Cannot read last block (%llu)", 92ac27a0ecSDave Kleikamp end - 1); 93ac27a0ecSDave Kleikamp else if (outside(input->block_bitmap, 
start, end)) 9412062dddSEric Sandeen ext4_warning(sb, "Block bitmap not in group (block %llu)", 951939e49aSRandy Dunlap (unsigned long long)input->block_bitmap); 96ac27a0ecSDave Kleikamp else if (outside(input->inode_bitmap, start, end)) 9712062dddSEric Sandeen ext4_warning(sb, "Inode bitmap not in group (block %llu)", 981939e49aSRandy Dunlap (unsigned long long)input->inode_bitmap); 99ac27a0ecSDave Kleikamp else if (outside(input->inode_table, start, end) || 100ac27a0ecSDave Kleikamp outside(itend - 1, start, end)) 10112062dddSEric Sandeen ext4_warning(sb, "Inode table not in group (blocks %llu-%llu)", 1021939e49aSRandy Dunlap (unsigned long long)input->inode_table, itend - 1); 103ac27a0ecSDave Kleikamp else if (input->inode_bitmap == input->block_bitmap) 10412062dddSEric Sandeen ext4_warning(sb, "Block bitmap same as inode bitmap (%llu)", 1051939e49aSRandy Dunlap (unsigned long long)input->block_bitmap); 106ac27a0ecSDave Kleikamp else if (inside(input->block_bitmap, input->inode_table, itend)) 10712062dddSEric Sandeen ext4_warning(sb, "Block bitmap (%llu) in inode table " 10812062dddSEric Sandeen "(%llu-%llu)", 1091939e49aSRandy Dunlap (unsigned long long)input->block_bitmap, 1101939e49aSRandy Dunlap (unsigned long long)input->inode_table, itend - 1); 111ac27a0ecSDave Kleikamp else if (inside(input->inode_bitmap, input->inode_table, itend)) 11212062dddSEric Sandeen ext4_warning(sb, "Inode bitmap (%llu) in inode table " 11312062dddSEric Sandeen "(%llu-%llu)", 1141939e49aSRandy Dunlap (unsigned long long)input->inode_bitmap, 1151939e49aSRandy Dunlap (unsigned long long)input->inode_table, itend - 1); 116ac27a0ecSDave Kleikamp else if (inside(input->block_bitmap, start, metaend)) 11712062dddSEric Sandeen ext4_warning(sb, "Block bitmap (%llu) in GDT table (%llu-%llu)", 1181939e49aSRandy Dunlap (unsigned long long)input->block_bitmap, 1191939e49aSRandy Dunlap start, metaend - 1); 120ac27a0ecSDave Kleikamp else if (inside(input->inode_bitmap, start, metaend)) 
12112062dddSEric Sandeen ext4_warning(sb, "Inode bitmap (%llu) in GDT table (%llu-%llu)", 1221939e49aSRandy Dunlap (unsigned long long)input->inode_bitmap, 1231939e49aSRandy Dunlap start, metaend - 1); 124ac27a0ecSDave Kleikamp else if (inside(input->inode_table, start, metaend) || 125ac27a0ecSDave Kleikamp inside(itend - 1, start, metaend)) 12612062dddSEric Sandeen ext4_warning(sb, "Inode table (%llu-%llu) overlaps GDT table " 12712062dddSEric Sandeen "(%llu-%llu)", 1281939e49aSRandy Dunlap (unsigned long long)input->inode_table, 1291939e49aSRandy Dunlap itend - 1, start, metaend - 1); 130ac27a0ecSDave Kleikamp else 131ac27a0ecSDave Kleikamp err = 0; 132ac27a0ecSDave Kleikamp brelse(bh); 133ac27a0ecSDave Kleikamp 134ac27a0ecSDave Kleikamp return err; 135ac27a0ecSDave Kleikamp } 136ac27a0ecSDave Kleikamp 13728c7bac0SYongqiang Yang /* 13828c7bac0SYongqiang Yang * ext4_new_flex_group_data is used by 64bit-resize interface to add a flex 13928c7bac0SYongqiang Yang * group each time. 14028c7bac0SYongqiang Yang */ 14128c7bac0SYongqiang Yang struct ext4_new_flex_group_data { 14228c7bac0SYongqiang Yang struct ext4_new_group_data *groups; /* new_group_data for groups 14328c7bac0SYongqiang Yang in the flex group */ 14428c7bac0SYongqiang Yang __u16 *bg_flags; /* block group flags of groups 14528c7bac0SYongqiang Yang in @groups */ 14628c7bac0SYongqiang Yang ext4_group_t count; /* number of groups in @groups 14728c7bac0SYongqiang Yang */ 14828c7bac0SYongqiang Yang }; 14928c7bac0SYongqiang Yang 15028c7bac0SYongqiang Yang /* 15128c7bac0SYongqiang Yang * alloc_flex_gd() allocates a ext4_new_flex_group_data with size of 15228c7bac0SYongqiang Yang * @flexbg_size. 15328c7bac0SYongqiang Yang * 15428c7bac0SYongqiang Yang * Returns NULL on failure otherwise address of the allocated structure. 
15528c7bac0SYongqiang Yang */ 15628c7bac0SYongqiang Yang static struct ext4_new_flex_group_data *alloc_flex_gd(unsigned long flexbg_size) 15728c7bac0SYongqiang Yang { 15828c7bac0SYongqiang Yang struct ext4_new_flex_group_data *flex_gd; 15928c7bac0SYongqiang Yang 16028c7bac0SYongqiang Yang flex_gd = kmalloc(sizeof(*flex_gd), GFP_NOFS); 16128c7bac0SYongqiang Yang if (flex_gd == NULL) 16228c7bac0SYongqiang Yang goto out3; 16328c7bac0SYongqiang Yang 16428c7bac0SYongqiang Yang flex_gd->count = flexbg_size; 16528c7bac0SYongqiang Yang 16628c7bac0SYongqiang Yang flex_gd->groups = kmalloc(sizeof(struct ext4_new_group_data) * 16728c7bac0SYongqiang Yang flexbg_size, GFP_NOFS); 16828c7bac0SYongqiang Yang if (flex_gd->groups == NULL) 16928c7bac0SYongqiang Yang goto out2; 17028c7bac0SYongqiang Yang 17128c7bac0SYongqiang Yang flex_gd->bg_flags = kmalloc(flexbg_size * sizeof(__u16), GFP_NOFS); 17228c7bac0SYongqiang Yang if (flex_gd->bg_flags == NULL) 17328c7bac0SYongqiang Yang goto out1; 17428c7bac0SYongqiang Yang 17528c7bac0SYongqiang Yang return flex_gd; 17628c7bac0SYongqiang Yang 17728c7bac0SYongqiang Yang out1: 17828c7bac0SYongqiang Yang kfree(flex_gd->groups); 17928c7bac0SYongqiang Yang out2: 18028c7bac0SYongqiang Yang kfree(flex_gd); 18128c7bac0SYongqiang Yang out3: 18228c7bac0SYongqiang Yang return NULL; 18328c7bac0SYongqiang Yang } 18428c7bac0SYongqiang Yang 18528c7bac0SYongqiang Yang static void free_flex_gd(struct ext4_new_flex_group_data *flex_gd) 18628c7bac0SYongqiang Yang { 18728c7bac0SYongqiang Yang kfree(flex_gd->bg_flags); 18828c7bac0SYongqiang Yang kfree(flex_gd->groups); 18928c7bac0SYongqiang Yang kfree(flex_gd); 19028c7bac0SYongqiang Yang } 19128c7bac0SYongqiang Yang 192ac27a0ecSDave Kleikamp static struct buffer_head *bclean(handle_t *handle, struct super_block *sb, 193617ba13bSMingming Cao ext4_fsblk_t blk) 194ac27a0ecSDave Kleikamp { 195ac27a0ecSDave Kleikamp struct buffer_head *bh; 196ac27a0ecSDave Kleikamp int err; 197ac27a0ecSDave Kleikamp 198ac27a0ecSDave 
Kleikamp bh = sb_getblk(sb, blk); 199ac27a0ecSDave Kleikamp if (!bh) 200ac27a0ecSDave Kleikamp return ERR_PTR(-EIO); 201617ba13bSMingming Cao if ((err = ext4_journal_get_write_access(handle, bh))) { 202ac27a0ecSDave Kleikamp brelse(bh); 203ac27a0ecSDave Kleikamp bh = ERR_PTR(err); 204ac27a0ecSDave Kleikamp } else { 205ac27a0ecSDave Kleikamp memset(bh->b_data, 0, sb->s_blocksize); 206ac27a0ecSDave Kleikamp set_buffer_uptodate(bh); 207ac27a0ecSDave Kleikamp } 208ac27a0ecSDave Kleikamp 209ac27a0ecSDave Kleikamp return bh; 210ac27a0ecSDave Kleikamp } 211ac27a0ecSDave Kleikamp 212ac27a0ecSDave Kleikamp /* 21314904107SEric Sandeen * If we have fewer than thresh credits, extend by EXT4_MAX_TRANS_DATA. 21414904107SEric Sandeen * If that fails, restart the transaction & regain write access for the 21514904107SEric Sandeen * buffer head which is used for block_bitmap modifications. 21614904107SEric Sandeen */ 2176d40bc5aSYongqiang Yang static int extend_or_restart_transaction(handle_t *handle, int thresh) 21814904107SEric Sandeen { 21914904107SEric Sandeen int err; 22014904107SEric Sandeen 2210390131bSFrank Mayhar if (ext4_handle_has_enough_credits(handle, thresh)) 22214904107SEric Sandeen return 0; 22314904107SEric Sandeen 22414904107SEric Sandeen err = ext4_journal_extend(handle, EXT4_MAX_TRANS_DATA); 22514904107SEric Sandeen if (err < 0) 22614904107SEric Sandeen return err; 22714904107SEric Sandeen if (err) { 2286d40bc5aSYongqiang Yang err = ext4_journal_restart(handle, EXT4_MAX_TRANS_DATA); 2296d40bc5aSYongqiang Yang if (err) 23014904107SEric Sandeen return err; 23114904107SEric Sandeen } 23214904107SEric Sandeen 23314904107SEric Sandeen return 0; 23414904107SEric Sandeen } 23514904107SEric Sandeen 23614904107SEric Sandeen /* 237*33afdcc5SYongqiang Yang * set_flexbg_block_bitmap() mark @count blocks starting from @block used. 238*33afdcc5SYongqiang Yang * 239*33afdcc5SYongqiang Yang * Helper function for ext4_setup_new_group_blocks() which set . 
240*33afdcc5SYongqiang Yang * 241*33afdcc5SYongqiang Yang * @sb: super block 242*33afdcc5SYongqiang Yang * @handle: journal handle 243*33afdcc5SYongqiang Yang * @flex_gd: flex group data 244*33afdcc5SYongqiang Yang */ 245*33afdcc5SYongqiang Yang static int set_flexbg_block_bitmap(struct super_block *sb, handle_t *handle, 246*33afdcc5SYongqiang Yang struct ext4_new_flex_group_data *flex_gd, 247*33afdcc5SYongqiang Yang ext4_fsblk_t block, ext4_group_t count) 248*33afdcc5SYongqiang Yang { 249*33afdcc5SYongqiang Yang ext4_group_t count2; 250*33afdcc5SYongqiang Yang 251*33afdcc5SYongqiang Yang ext4_debug("mark blocks [%llu/%u] used\n", block, count); 252*33afdcc5SYongqiang Yang for (count2 = count; count > 0; count -= count2, block += count2) { 253*33afdcc5SYongqiang Yang ext4_fsblk_t start; 254*33afdcc5SYongqiang Yang struct buffer_head *bh; 255*33afdcc5SYongqiang Yang ext4_group_t group; 256*33afdcc5SYongqiang Yang int err; 257*33afdcc5SYongqiang Yang 258*33afdcc5SYongqiang Yang ext4_get_group_no_and_offset(sb, block, &group, NULL); 259*33afdcc5SYongqiang Yang start = ext4_group_first_block_no(sb, group); 260*33afdcc5SYongqiang Yang group -= flex_gd->groups[0].group; 261*33afdcc5SYongqiang Yang 262*33afdcc5SYongqiang Yang count2 = sb->s_blocksize * 8 - (block - start); 263*33afdcc5SYongqiang Yang if (count2 > count) 264*33afdcc5SYongqiang Yang count2 = count; 265*33afdcc5SYongqiang Yang 266*33afdcc5SYongqiang Yang if (flex_gd->bg_flags[group] & EXT4_BG_BLOCK_UNINIT) { 267*33afdcc5SYongqiang Yang BUG_ON(flex_gd->count > 1); 268*33afdcc5SYongqiang Yang continue; 269*33afdcc5SYongqiang Yang } 270*33afdcc5SYongqiang Yang 271*33afdcc5SYongqiang Yang err = extend_or_restart_transaction(handle, 1); 272*33afdcc5SYongqiang Yang if (err) 273*33afdcc5SYongqiang Yang return err; 274*33afdcc5SYongqiang Yang 275*33afdcc5SYongqiang Yang bh = sb_getblk(sb, flex_gd->groups[group].block_bitmap); 276*33afdcc5SYongqiang Yang if (!bh) 277*33afdcc5SYongqiang Yang return -EIO; 
278*33afdcc5SYongqiang Yang 279*33afdcc5SYongqiang Yang err = ext4_journal_get_write_access(handle, bh); 280*33afdcc5SYongqiang Yang if (err) 281*33afdcc5SYongqiang Yang return err; 282*33afdcc5SYongqiang Yang ext4_debug("mark block bitmap %#04llx (+%llu/%u)\n", block, 283*33afdcc5SYongqiang Yang block - start, count2); 284*33afdcc5SYongqiang Yang ext4_set_bits(bh->b_data, block - start, count2); 285*33afdcc5SYongqiang Yang 286*33afdcc5SYongqiang Yang err = ext4_handle_dirty_metadata(handle, NULL, bh); 287*33afdcc5SYongqiang Yang if (unlikely(err)) 288*33afdcc5SYongqiang Yang return err; 289*33afdcc5SYongqiang Yang brelse(bh); 290*33afdcc5SYongqiang Yang } 291*33afdcc5SYongqiang Yang 292*33afdcc5SYongqiang Yang return 0; 293*33afdcc5SYongqiang Yang } 294*33afdcc5SYongqiang Yang 295*33afdcc5SYongqiang Yang /* 296*33afdcc5SYongqiang Yang * Set up the block and inode bitmaps, and the inode table for the new groups. 297*33afdcc5SYongqiang Yang * This doesn't need to be part of the main transaction, since we are only 298*33afdcc5SYongqiang Yang * changing blocks outside the actual filesystem. We still do journaling to 299*33afdcc5SYongqiang Yang * ensure the recovery is correct in case of a failure just after resize. 300*33afdcc5SYongqiang Yang * If any part of this fails, we simply abort the resize. 301*33afdcc5SYongqiang Yang * 302*33afdcc5SYongqiang Yang * setup_new_flex_group_blocks handles a flex group as follow: 303*33afdcc5SYongqiang Yang * 1. copy super block and GDT, and initialize group tables if necessary. 304*33afdcc5SYongqiang Yang * In this step, we only set bits in blocks bitmaps for blocks taken by 305*33afdcc5SYongqiang Yang * super block and GDT. 306*33afdcc5SYongqiang Yang * 2. allocate group tables in block bitmaps, that is, set bits in block 307*33afdcc5SYongqiang Yang * bitmap for blocks taken by group tables. 
308*33afdcc5SYongqiang Yang */ 309*33afdcc5SYongqiang Yang static int setup_new_flex_group_blocks(struct super_block *sb, 310*33afdcc5SYongqiang Yang struct ext4_new_flex_group_data *flex_gd) 311*33afdcc5SYongqiang Yang { 312*33afdcc5SYongqiang Yang int group_table_count[] = {1, 1, EXT4_SB(sb)->s_itb_per_group}; 313*33afdcc5SYongqiang Yang ext4_fsblk_t start; 314*33afdcc5SYongqiang Yang ext4_fsblk_t block; 315*33afdcc5SYongqiang Yang struct ext4_sb_info *sbi = EXT4_SB(sb); 316*33afdcc5SYongqiang Yang struct ext4_super_block *es = sbi->s_es; 317*33afdcc5SYongqiang Yang struct ext4_new_group_data *group_data = flex_gd->groups; 318*33afdcc5SYongqiang Yang __u16 *bg_flags = flex_gd->bg_flags; 319*33afdcc5SYongqiang Yang handle_t *handle; 320*33afdcc5SYongqiang Yang ext4_group_t group, count; 321*33afdcc5SYongqiang Yang struct buffer_head *bh = NULL; 322*33afdcc5SYongqiang Yang int reserved_gdb, i, j, err = 0, err2; 323*33afdcc5SYongqiang Yang 324*33afdcc5SYongqiang Yang BUG_ON(!flex_gd->count || !group_data || 325*33afdcc5SYongqiang Yang group_data[0].group != sbi->s_groups_count); 326*33afdcc5SYongqiang Yang 327*33afdcc5SYongqiang Yang reserved_gdb = le16_to_cpu(es->s_reserved_gdt_blocks); 328*33afdcc5SYongqiang Yang 329*33afdcc5SYongqiang Yang /* This transaction may be extended/restarted along the way */ 330*33afdcc5SYongqiang Yang handle = ext4_journal_start_sb(sb, EXT4_MAX_TRANS_DATA); 331*33afdcc5SYongqiang Yang if (IS_ERR(handle)) 332*33afdcc5SYongqiang Yang return PTR_ERR(handle); 333*33afdcc5SYongqiang Yang 334*33afdcc5SYongqiang Yang group = group_data[0].group; 335*33afdcc5SYongqiang Yang for (i = 0; i < flex_gd->count; i++, group++) { 336*33afdcc5SYongqiang Yang unsigned long gdblocks; 337*33afdcc5SYongqiang Yang 338*33afdcc5SYongqiang Yang gdblocks = ext4_bg_num_gdb(sb, group); 339*33afdcc5SYongqiang Yang start = ext4_group_first_block_no(sb, group); 340*33afdcc5SYongqiang Yang 341*33afdcc5SYongqiang Yang /* Copy all of the GDT blocks into the backup in 
this group */ 342*33afdcc5SYongqiang Yang for (j = 0, block = start + 1; j < gdblocks; j++, block++) { 343*33afdcc5SYongqiang Yang struct buffer_head *gdb; 344*33afdcc5SYongqiang Yang 345*33afdcc5SYongqiang Yang ext4_debug("update backup group %#04llx\n", block); 346*33afdcc5SYongqiang Yang err = extend_or_restart_transaction(handle, 1); 347*33afdcc5SYongqiang Yang if (err) 348*33afdcc5SYongqiang Yang goto out; 349*33afdcc5SYongqiang Yang 350*33afdcc5SYongqiang Yang gdb = sb_getblk(sb, block); 351*33afdcc5SYongqiang Yang if (!gdb) { 352*33afdcc5SYongqiang Yang err = -EIO; 353*33afdcc5SYongqiang Yang goto out; 354*33afdcc5SYongqiang Yang } 355*33afdcc5SYongqiang Yang 356*33afdcc5SYongqiang Yang err = ext4_journal_get_write_access(handle, gdb); 357*33afdcc5SYongqiang Yang if (err) { 358*33afdcc5SYongqiang Yang brelse(gdb); 359*33afdcc5SYongqiang Yang goto out; 360*33afdcc5SYongqiang Yang } 361*33afdcc5SYongqiang Yang memcpy(gdb->b_data, sbi->s_group_desc[j]->b_data, 362*33afdcc5SYongqiang Yang gdb->b_size); 363*33afdcc5SYongqiang Yang set_buffer_uptodate(gdb); 364*33afdcc5SYongqiang Yang 365*33afdcc5SYongqiang Yang err = ext4_handle_dirty_metadata(handle, NULL, gdb); 366*33afdcc5SYongqiang Yang if (unlikely(err)) { 367*33afdcc5SYongqiang Yang brelse(gdb); 368*33afdcc5SYongqiang Yang goto out; 369*33afdcc5SYongqiang Yang } 370*33afdcc5SYongqiang Yang brelse(gdb); 371*33afdcc5SYongqiang Yang } 372*33afdcc5SYongqiang Yang 373*33afdcc5SYongqiang Yang /* Zero out all of the reserved backup group descriptor 374*33afdcc5SYongqiang Yang * table blocks 375*33afdcc5SYongqiang Yang */ 376*33afdcc5SYongqiang Yang if (ext4_bg_has_super(sb, group)) { 377*33afdcc5SYongqiang Yang err = sb_issue_zeroout(sb, gdblocks + start + 1, 378*33afdcc5SYongqiang Yang reserved_gdb, GFP_NOFS); 379*33afdcc5SYongqiang Yang if (err) 380*33afdcc5SYongqiang Yang goto out; 381*33afdcc5SYongqiang Yang } 382*33afdcc5SYongqiang Yang 383*33afdcc5SYongqiang Yang /* Initialize group tables of the grop @group 
*/ 384*33afdcc5SYongqiang Yang if (!(bg_flags[i] & EXT4_BG_INODE_ZEROED)) 385*33afdcc5SYongqiang Yang goto handle_bb; 386*33afdcc5SYongqiang Yang 387*33afdcc5SYongqiang Yang /* Zero out all of the inode table blocks */ 388*33afdcc5SYongqiang Yang block = group_data[i].inode_table; 389*33afdcc5SYongqiang Yang ext4_debug("clear inode table blocks %#04llx -> %#04lx\n", 390*33afdcc5SYongqiang Yang block, sbi->s_itb_per_group); 391*33afdcc5SYongqiang Yang err = sb_issue_zeroout(sb, block, sbi->s_itb_per_group, 392*33afdcc5SYongqiang Yang GFP_NOFS); 393*33afdcc5SYongqiang Yang if (err) 394*33afdcc5SYongqiang Yang goto out; 395*33afdcc5SYongqiang Yang 396*33afdcc5SYongqiang Yang handle_bb: 397*33afdcc5SYongqiang Yang if (bg_flags[i] & EXT4_BG_BLOCK_UNINIT) 398*33afdcc5SYongqiang Yang goto handle_ib; 399*33afdcc5SYongqiang Yang 400*33afdcc5SYongqiang Yang /* Initialize block bitmap of the @group */ 401*33afdcc5SYongqiang Yang block = group_data[i].block_bitmap; 402*33afdcc5SYongqiang Yang err = extend_or_restart_transaction(handle, 1); 403*33afdcc5SYongqiang Yang if (err) 404*33afdcc5SYongqiang Yang goto out; 405*33afdcc5SYongqiang Yang 406*33afdcc5SYongqiang Yang bh = bclean(handle, sb, block); 407*33afdcc5SYongqiang Yang if (IS_ERR(bh)) { 408*33afdcc5SYongqiang Yang err = PTR_ERR(bh); 409*33afdcc5SYongqiang Yang goto out; 410*33afdcc5SYongqiang Yang } 411*33afdcc5SYongqiang Yang if (ext4_bg_has_super(sb, group)) { 412*33afdcc5SYongqiang Yang ext4_debug("mark backup superblock %#04llx (+0)\n", 413*33afdcc5SYongqiang Yang start); 414*33afdcc5SYongqiang Yang ext4_set_bits(bh->b_data, 0, gdblocks + reserved_gdb + 415*33afdcc5SYongqiang Yang 1); 416*33afdcc5SYongqiang Yang } 417*33afdcc5SYongqiang Yang ext4_mark_bitmap_end(group_data[i].blocks_count, 418*33afdcc5SYongqiang Yang sb->s_blocksize * 8, bh->b_data); 419*33afdcc5SYongqiang Yang err = ext4_handle_dirty_metadata(handle, NULL, bh); 420*33afdcc5SYongqiang Yang if (err) 421*33afdcc5SYongqiang Yang goto out; 
422*33afdcc5SYongqiang Yang brelse(bh); 423*33afdcc5SYongqiang Yang 424*33afdcc5SYongqiang Yang handle_ib: 425*33afdcc5SYongqiang Yang if (bg_flags[i] & EXT4_BG_INODE_UNINIT) 426*33afdcc5SYongqiang Yang continue; 427*33afdcc5SYongqiang Yang 428*33afdcc5SYongqiang Yang /* Initialize inode bitmap of the @group */ 429*33afdcc5SYongqiang Yang block = group_data[i].inode_bitmap; 430*33afdcc5SYongqiang Yang err = extend_or_restart_transaction(handle, 1); 431*33afdcc5SYongqiang Yang if (err) 432*33afdcc5SYongqiang Yang goto out; 433*33afdcc5SYongqiang Yang /* Mark unused entries in inode bitmap used */ 434*33afdcc5SYongqiang Yang bh = bclean(handle, sb, block); 435*33afdcc5SYongqiang Yang if (IS_ERR(bh)) { 436*33afdcc5SYongqiang Yang err = PTR_ERR(bh); 437*33afdcc5SYongqiang Yang goto out; 438*33afdcc5SYongqiang Yang } 439*33afdcc5SYongqiang Yang 440*33afdcc5SYongqiang Yang ext4_mark_bitmap_end(EXT4_INODES_PER_GROUP(sb), 441*33afdcc5SYongqiang Yang sb->s_blocksize * 8, bh->b_data); 442*33afdcc5SYongqiang Yang err = ext4_handle_dirty_metadata(handle, NULL, bh); 443*33afdcc5SYongqiang Yang if (err) 444*33afdcc5SYongqiang Yang goto out; 445*33afdcc5SYongqiang Yang brelse(bh); 446*33afdcc5SYongqiang Yang } 447*33afdcc5SYongqiang Yang bh = NULL; 448*33afdcc5SYongqiang Yang 449*33afdcc5SYongqiang Yang /* Mark group tables in block bitmap */ 450*33afdcc5SYongqiang Yang for (j = 0; j < GROUP_TABLE_COUNT; j++) { 451*33afdcc5SYongqiang Yang count = group_table_count[j]; 452*33afdcc5SYongqiang Yang start = (&group_data[0].block_bitmap)[j]; 453*33afdcc5SYongqiang Yang block = start; 454*33afdcc5SYongqiang Yang for (i = 1; i < flex_gd->count; i++) { 455*33afdcc5SYongqiang Yang block += group_table_count[j]; 456*33afdcc5SYongqiang Yang if (block == (&group_data[i].block_bitmap)[j]) { 457*33afdcc5SYongqiang Yang count += group_table_count[j]; 458*33afdcc5SYongqiang Yang continue; 459*33afdcc5SYongqiang Yang } 460*33afdcc5SYongqiang Yang err = set_flexbg_block_bitmap(sb, handle, 
461*33afdcc5SYongqiang Yang flex_gd, start, count); 462*33afdcc5SYongqiang Yang if (err) 463*33afdcc5SYongqiang Yang goto out; 464*33afdcc5SYongqiang Yang count = group_table_count[j]; 465*33afdcc5SYongqiang Yang start = group_data[i].block_bitmap; 466*33afdcc5SYongqiang Yang block = start; 467*33afdcc5SYongqiang Yang } 468*33afdcc5SYongqiang Yang 469*33afdcc5SYongqiang Yang if (count) { 470*33afdcc5SYongqiang Yang err = set_flexbg_block_bitmap(sb, handle, 471*33afdcc5SYongqiang Yang flex_gd, start, count); 472*33afdcc5SYongqiang Yang if (err) 473*33afdcc5SYongqiang Yang goto out; 474*33afdcc5SYongqiang Yang } 475*33afdcc5SYongqiang Yang } 476*33afdcc5SYongqiang Yang 477*33afdcc5SYongqiang Yang out: 478*33afdcc5SYongqiang Yang brelse(bh); 479*33afdcc5SYongqiang Yang err2 = ext4_journal_stop(handle); 480*33afdcc5SYongqiang Yang if (err2 && !err) 481*33afdcc5SYongqiang Yang err = err2; 482*33afdcc5SYongqiang Yang 483*33afdcc5SYongqiang Yang return err; 484*33afdcc5SYongqiang Yang } 485*33afdcc5SYongqiang Yang 486*33afdcc5SYongqiang Yang /* 487ac27a0ecSDave Kleikamp * Set up the block and inode bitmaps, and the inode table for the new group. 488ac27a0ecSDave Kleikamp * This doesn't need to be part of the main transaction, since we are only 489ac27a0ecSDave Kleikamp * changing blocks outside the actual filesystem. We still do journaling to 490ac27a0ecSDave Kleikamp * ensure the recovery is correct in case of a failure just after resize. 491ac27a0ecSDave Kleikamp * If any part of this fails, we simply abort the resize. 492ac27a0ecSDave Kleikamp */ 493ac27a0ecSDave Kleikamp static int setup_new_group_blocks(struct super_block *sb, 494617ba13bSMingming Cao struct ext4_new_group_data *input) 495ac27a0ecSDave Kleikamp { 496617ba13bSMingming Cao struct ext4_sb_info *sbi = EXT4_SB(sb); 497617ba13bSMingming Cao ext4_fsblk_t start = ext4_group_first_block_no(sb, input->group); 498617ba13bSMingming Cao int reserved_gdb = ext4_bg_has_super(sb, input->group) ? 
499ac27a0ecSDave Kleikamp le16_to_cpu(sbi->s_es->s_reserved_gdt_blocks) : 0; 500617ba13bSMingming Cao unsigned long gdblocks = ext4_bg_num_gdb(sb, input->group); 501ac27a0ecSDave Kleikamp struct buffer_head *bh; 502ac27a0ecSDave Kleikamp handle_t *handle; 503617ba13bSMingming Cao ext4_fsblk_t block; 504617ba13bSMingming Cao ext4_grpblk_t bit; 505ac27a0ecSDave Kleikamp int i; 506ac27a0ecSDave Kleikamp int err = 0, err2; 507ac27a0ecSDave Kleikamp 50814904107SEric Sandeen /* This transaction may be extended/restarted along the way */ 50914904107SEric Sandeen handle = ext4_journal_start_sb(sb, EXT4_MAX_TRANS_DATA); 51014904107SEric Sandeen 511ac27a0ecSDave Kleikamp if (IS_ERR(handle)) 512ac27a0ecSDave Kleikamp return PTR_ERR(handle); 513ac27a0ecSDave Kleikamp 5148f82f840SYongqiang Yang BUG_ON(input->group != sbi->s_groups_count); 515ac27a0ecSDave Kleikamp 516ac27a0ecSDave Kleikamp /* Copy all of the GDT blocks into the backup in this group */ 517ac27a0ecSDave Kleikamp for (i = 0, bit = 1, block = start + 1; 518ac27a0ecSDave Kleikamp i < gdblocks; i++, block++, bit++) { 519ac27a0ecSDave Kleikamp struct buffer_head *gdb; 520ac27a0ecSDave Kleikamp 521c549a95dSEric Sandeen ext4_debug("update backup group %#04llx (+%d)\n", block, bit); 5226d40bc5aSYongqiang Yang err = extend_or_restart_transaction(handle, 1); 5236d40bc5aSYongqiang Yang if (err) 5246d40bc5aSYongqiang Yang goto exit_journal; 52514904107SEric Sandeen 526ac27a0ecSDave Kleikamp gdb = sb_getblk(sb, block); 527ac27a0ecSDave Kleikamp if (!gdb) { 528ac27a0ecSDave Kleikamp err = -EIO; 5296d40bc5aSYongqiang Yang goto exit_journal; 530ac27a0ecSDave Kleikamp } 531617ba13bSMingming Cao if ((err = ext4_journal_get_write_access(handle, gdb))) { 532ac27a0ecSDave Kleikamp brelse(gdb); 5336d40bc5aSYongqiang Yang goto exit_journal; 534ac27a0ecSDave Kleikamp } 5355b615287SEric Sandeen memcpy(gdb->b_data, sbi->s_group_desc[i]->b_data, gdb->b_size); 536ac27a0ecSDave Kleikamp set_buffer_uptodate(gdb); 537b4097142STheodore Ts'o err 
= ext4_handle_dirty_metadata(handle, NULL, gdb); 538b4097142STheodore Ts'o if (unlikely(err)) { 539b4097142STheodore Ts'o brelse(gdb); 5406d40bc5aSYongqiang Yang goto exit_journal; 541b4097142STheodore Ts'o } 542ac27a0ecSDave Kleikamp brelse(gdb); 543ac27a0ecSDave Kleikamp } 544ac27a0ecSDave Kleikamp 545ac27a0ecSDave Kleikamp /* Zero out all of the reserved backup group descriptor table blocks */ 546da488945STheodore Ts'o ext4_debug("clear inode table blocks %#04llx -> %#04lx\n", 547a31437b8SLukas Czerner block, sbi->s_itb_per_group); 548a31437b8SLukas Czerner err = sb_issue_zeroout(sb, gdblocks + start + 1, reserved_gdb, 549a107e5a3STheodore Ts'o GFP_NOFS); 550a31437b8SLukas Czerner if (err) 5516d40bc5aSYongqiang Yang goto exit_journal; 5526d40bc5aSYongqiang Yang 5536d40bc5aSYongqiang Yang err = extend_or_restart_transaction(handle, 2); 5546d40bc5aSYongqiang Yang if (err) 5556d40bc5aSYongqiang Yang goto exit_journal; 5566d40bc5aSYongqiang Yang 5576d40bc5aSYongqiang Yang bh = bclean(handle, sb, input->block_bitmap); 5586d40bc5aSYongqiang Yang if (IS_ERR(bh)) { 5596d40bc5aSYongqiang Yang err = PTR_ERR(bh); 5606d40bc5aSYongqiang Yang goto exit_journal; 5616d40bc5aSYongqiang Yang } 562c3e94d1dSYongqiang Yang 563c3e94d1dSYongqiang Yang if (ext4_bg_has_super(sb, input->group)) { 564c3e94d1dSYongqiang Yang ext4_debug("mark backup group tables %#04llx (+0)\n", start); 565c3e94d1dSYongqiang Yang ext4_set_bits(bh->b_data, 0, gdblocks + reserved_gdb + 1); 566c3e94d1dSYongqiang Yang } 56714904107SEric Sandeen 568c549a95dSEric Sandeen ext4_debug("mark block bitmap %#04llx (+%llu)\n", input->block_bitmap, 569ac27a0ecSDave Kleikamp input->block_bitmap - start); 570617ba13bSMingming Cao ext4_set_bit(input->block_bitmap - start, bh->b_data); 571c549a95dSEric Sandeen ext4_debug("mark inode bitmap %#04llx (+%llu)\n", input->inode_bitmap, 572ac27a0ecSDave Kleikamp input->inode_bitmap - start); 573617ba13bSMingming Cao ext4_set_bit(input->inode_bitmap - start, bh->b_data); 
574ac27a0ecSDave Kleikamp 575ac27a0ecSDave Kleikamp /* Zero out all of the inode table blocks */ 576a31437b8SLukas Czerner block = input->inode_table; 577da488945STheodore Ts'o ext4_debug("clear inode table blocks %#04llx -> %#04lx\n", 578a31437b8SLukas Czerner block, sbi->s_itb_per_group); 579a107e5a3STheodore Ts'o err = sb_issue_zeroout(sb, block, sbi->s_itb_per_group, GFP_NOFS); 580a31437b8SLukas Czerner if (err) 58114904107SEric Sandeen goto exit_bh; 582c3e94d1dSYongqiang Yang ext4_set_bits(bh->b_data, input->inode_table - start, 583c3e94d1dSYongqiang Yang sbi->s_itb_per_group); 58414904107SEric Sandeen 58514904107SEric Sandeen 58661d08673STheodore Ts'o ext4_mark_bitmap_end(input->blocks_count, sb->s_blocksize * 8, 58761d08673STheodore Ts'o bh->b_data); 588b4097142STheodore Ts'o err = ext4_handle_dirty_metadata(handle, NULL, bh); 589b4097142STheodore Ts'o if (unlikely(err)) { 590b4097142STheodore Ts'o ext4_std_error(sb, err); 591b4097142STheodore Ts'o goto exit_bh; 592b4097142STheodore Ts'o } 593ac27a0ecSDave Kleikamp brelse(bh); 594ac27a0ecSDave Kleikamp /* Mark unused entries in inode bitmap used */ 595c549a95dSEric Sandeen ext4_debug("clear inode bitmap %#04llx (+%llu)\n", 596ac27a0ecSDave Kleikamp input->inode_bitmap, input->inode_bitmap - start); 597ac27a0ecSDave Kleikamp if (IS_ERR(bh = bclean(handle, sb, input->inode_bitmap))) { 598ac27a0ecSDave Kleikamp err = PTR_ERR(bh); 599ac27a0ecSDave Kleikamp goto exit_journal; 600ac27a0ecSDave Kleikamp } 601ac27a0ecSDave Kleikamp 60261d08673STheodore Ts'o ext4_mark_bitmap_end(EXT4_INODES_PER_GROUP(sb), sb->s_blocksize * 8, 603ac27a0ecSDave Kleikamp bh->b_data); 604b4097142STheodore Ts'o err = ext4_handle_dirty_metadata(handle, NULL, bh); 605b4097142STheodore Ts'o if (unlikely(err)) 606b4097142STheodore Ts'o ext4_std_error(sb, err); 607ac27a0ecSDave Kleikamp exit_bh: 608ac27a0ecSDave Kleikamp brelse(bh); 609ac27a0ecSDave Kleikamp 610ac27a0ecSDave Kleikamp exit_journal: 611617ba13bSMingming Cao if ((err2 = 
ext4_journal_stop(handle)) && !err) 612ac27a0ecSDave Kleikamp err = err2; 613ac27a0ecSDave Kleikamp 614ac27a0ecSDave Kleikamp return err; 615ac27a0ecSDave Kleikamp } 616ac27a0ecSDave Kleikamp 617ac27a0ecSDave Kleikamp /* 618ac27a0ecSDave Kleikamp * Iterate through the groups which hold BACKUP superblock/GDT copies in an 619617ba13bSMingming Cao * ext4 filesystem. The counters should be initialized to 1, 5, and 7 before 620ac27a0ecSDave Kleikamp * calling this for the first time. In a sparse filesystem it will be the 621ac27a0ecSDave Kleikamp * sequence of powers of 3, 5, and 7: 1, 3, 5, 7, 9, 25, 27, 49, 81, ... 622ac27a0ecSDave Kleikamp * For a non-sparse filesystem it will be every group: 1, 2, 3, 4, ... 623ac27a0ecSDave Kleikamp */ 624617ba13bSMingming Cao static unsigned ext4_list_backups(struct super_block *sb, unsigned *three, 625ac27a0ecSDave Kleikamp unsigned *five, unsigned *seven) 626ac27a0ecSDave Kleikamp { 627ac27a0ecSDave Kleikamp unsigned *min = three; 628ac27a0ecSDave Kleikamp int mult = 3; 629ac27a0ecSDave Kleikamp unsigned ret; 630ac27a0ecSDave Kleikamp 631617ba13bSMingming Cao if (!EXT4_HAS_RO_COMPAT_FEATURE(sb, 632617ba13bSMingming Cao EXT4_FEATURE_RO_COMPAT_SPARSE_SUPER)) { 633ac27a0ecSDave Kleikamp ret = *min; 634ac27a0ecSDave Kleikamp *min += 1; 635ac27a0ecSDave Kleikamp return ret; 636ac27a0ecSDave Kleikamp } 637ac27a0ecSDave Kleikamp 638ac27a0ecSDave Kleikamp if (*five < *min) { 639ac27a0ecSDave Kleikamp min = five; 640ac27a0ecSDave Kleikamp mult = 5; 641ac27a0ecSDave Kleikamp } 642ac27a0ecSDave Kleikamp if (*seven < *min) { 643ac27a0ecSDave Kleikamp min = seven; 644ac27a0ecSDave Kleikamp mult = 7; 645ac27a0ecSDave Kleikamp } 646ac27a0ecSDave Kleikamp 647ac27a0ecSDave Kleikamp ret = *min; 648ac27a0ecSDave Kleikamp *min *= mult; 649ac27a0ecSDave Kleikamp 650ac27a0ecSDave Kleikamp return ret; 651ac27a0ecSDave Kleikamp } 652ac27a0ecSDave Kleikamp 653ac27a0ecSDave Kleikamp /* 654ac27a0ecSDave Kleikamp * Check that all of the backup GDT blocks 
are held in the primary GDT block. 655ac27a0ecSDave Kleikamp * It is assumed that they are stored in group order. Returns the number of 656ac27a0ecSDave Kleikamp * groups in current filesystem that have BACKUPS, or -ve error code. 657ac27a0ecSDave Kleikamp */ 658ac27a0ecSDave Kleikamp static int verify_reserved_gdb(struct super_block *sb, 659ac27a0ecSDave Kleikamp struct buffer_head *primary) 660ac27a0ecSDave Kleikamp { 661617ba13bSMingming Cao const ext4_fsblk_t blk = primary->b_blocknr; 662fd2d4291SAvantika Mathur const ext4_group_t end = EXT4_SB(sb)->s_groups_count; 663ac27a0ecSDave Kleikamp unsigned three = 1; 664ac27a0ecSDave Kleikamp unsigned five = 5; 665ac27a0ecSDave Kleikamp unsigned seven = 7; 666ac27a0ecSDave Kleikamp unsigned grp; 667ac27a0ecSDave Kleikamp __le32 *p = (__le32 *)primary->b_data; 668ac27a0ecSDave Kleikamp int gdbackups = 0; 669ac27a0ecSDave Kleikamp 670617ba13bSMingming Cao while ((grp = ext4_list_backups(sb, &three, &five, &seven)) < end) { 671bd81d8eeSLaurent Vivier if (le32_to_cpu(*p++) != 672bd81d8eeSLaurent Vivier grp * EXT4_BLOCKS_PER_GROUP(sb) + blk){ 67312062dddSEric Sandeen ext4_warning(sb, "reserved GDT %llu" 6742ae02107SMingming Cao " missing grp %d (%llu)", 675ac27a0ecSDave Kleikamp blk, grp, 676bd81d8eeSLaurent Vivier grp * 677bd81d8eeSLaurent Vivier (ext4_fsblk_t)EXT4_BLOCKS_PER_GROUP(sb) + 678bd81d8eeSLaurent Vivier blk); 679ac27a0ecSDave Kleikamp return -EINVAL; 680ac27a0ecSDave Kleikamp } 681617ba13bSMingming Cao if (++gdbackups > EXT4_ADDR_PER_BLOCK(sb)) 682ac27a0ecSDave Kleikamp return -EFBIG; 683ac27a0ecSDave Kleikamp } 684ac27a0ecSDave Kleikamp 685ac27a0ecSDave Kleikamp return gdbackups; 686ac27a0ecSDave Kleikamp } 687ac27a0ecSDave Kleikamp 688ac27a0ecSDave Kleikamp /* 689ac27a0ecSDave Kleikamp * Called when we need to bring a reserved group descriptor table block into 690ac27a0ecSDave Kleikamp * use from the resize inode. 
The primary copy of the new GDT block currently 691ac27a0ecSDave Kleikamp * is an indirect block (under the double indirect block in the resize inode). 692ac27a0ecSDave Kleikamp * The new backup GDT blocks will be stored as leaf blocks in this indirect 693ac27a0ecSDave Kleikamp * block, in group order. Even though we know all the block numbers we need, 694ac27a0ecSDave Kleikamp * we check to ensure that the resize inode has actually reserved these blocks. 695ac27a0ecSDave Kleikamp * 696ac27a0ecSDave Kleikamp * Don't need to update the block bitmaps because the blocks are still in use. 697ac27a0ecSDave Kleikamp * 698ac27a0ecSDave Kleikamp * We get all of the error cases out of the way, so that we are sure to not 699ac27a0ecSDave Kleikamp * fail once we start modifying the data on disk, because JBD has no rollback. 700ac27a0ecSDave Kleikamp */ 701ac27a0ecSDave Kleikamp static int add_new_gdb(handle_t *handle, struct inode *inode, 7022f919710SYongqiang Yang ext4_group_t group) 703ac27a0ecSDave Kleikamp { 704ac27a0ecSDave Kleikamp struct super_block *sb = inode->i_sb; 705617ba13bSMingming Cao struct ext4_super_block *es = EXT4_SB(sb)->s_es; 7062f919710SYongqiang Yang unsigned long gdb_num = group / EXT4_DESC_PER_BLOCK(sb); 707617ba13bSMingming Cao ext4_fsblk_t gdblock = EXT4_SB(sb)->s_sbh->b_blocknr + 1 + gdb_num; 708ac27a0ecSDave Kleikamp struct buffer_head **o_group_desc, **n_group_desc; 709ac27a0ecSDave Kleikamp struct buffer_head *dind; 7102f919710SYongqiang Yang struct buffer_head *gdb_bh; 711ac27a0ecSDave Kleikamp int gdbackups; 712617ba13bSMingming Cao struct ext4_iloc iloc; 713ac27a0ecSDave Kleikamp __le32 *data; 714ac27a0ecSDave Kleikamp int err; 715ac27a0ecSDave Kleikamp 716ac27a0ecSDave Kleikamp if (test_opt(sb, DEBUG)) 717ac27a0ecSDave Kleikamp printk(KERN_DEBUG 718617ba13bSMingming Cao "EXT4-fs: ext4_add_new_gdb: adding group block %lu\n", 719ac27a0ecSDave Kleikamp gdb_num); 720ac27a0ecSDave Kleikamp 721ac27a0ecSDave Kleikamp /* 722ac27a0ecSDave Kleikamp * 
If we are not using the primary superblock/GDT copy don't resize, 723ac27a0ecSDave Kleikamp * because the user tools have no way of handling this. Probably a 724ac27a0ecSDave Kleikamp * bad time to do it anyways. 725ac27a0ecSDave Kleikamp */ 726617ba13bSMingming Cao if (EXT4_SB(sb)->s_sbh->b_blocknr != 727617ba13bSMingming Cao le32_to_cpu(EXT4_SB(sb)->s_es->s_first_data_block)) { 72812062dddSEric Sandeen ext4_warning(sb, "won't resize using backup superblock at %llu", 729617ba13bSMingming Cao (unsigned long long)EXT4_SB(sb)->s_sbh->b_blocknr); 730ac27a0ecSDave Kleikamp return -EPERM; 731ac27a0ecSDave Kleikamp } 732ac27a0ecSDave Kleikamp 7332f919710SYongqiang Yang gdb_bh = sb_bread(sb, gdblock); 7342f919710SYongqiang Yang if (!gdb_bh) 735ac27a0ecSDave Kleikamp return -EIO; 736ac27a0ecSDave Kleikamp 7372f919710SYongqiang Yang gdbackups = verify_reserved_gdb(sb, gdb_bh); 7382f919710SYongqiang Yang if (gdbackups < 0) { 739ac27a0ecSDave Kleikamp err = gdbackups; 740ac27a0ecSDave Kleikamp goto exit_bh; 741ac27a0ecSDave Kleikamp } 742ac27a0ecSDave Kleikamp 743617ba13bSMingming Cao data = EXT4_I(inode)->i_data + EXT4_DIND_BLOCK; 744ac27a0ecSDave Kleikamp dind = sb_bread(sb, le32_to_cpu(*data)); 745ac27a0ecSDave Kleikamp if (!dind) { 746ac27a0ecSDave Kleikamp err = -EIO; 747ac27a0ecSDave Kleikamp goto exit_bh; 748ac27a0ecSDave Kleikamp } 749ac27a0ecSDave Kleikamp 750ac27a0ecSDave Kleikamp data = (__le32 *)dind->b_data; 751617ba13bSMingming Cao if (le32_to_cpu(data[gdb_num % EXT4_ADDR_PER_BLOCK(sb)]) != gdblock) { 75212062dddSEric Sandeen ext4_warning(sb, "new group %u GDT block %llu not reserved", 7532f919710SYongqiang Yang group, gdblock); 754ac27a0ecSDave Kleikamp err = -EINVAL; 755ac27a0ecSDave Kleikamp goto exit_dind; 756ac27a0ecSDave Kleikamp } 757ac27a0ecSDave Kleikamp 758b4097142STheodore Ts'o err = ext4_journal_get_write_access(handle, EXT4_SB(sb)->s_sbh); 759b4097142STheodore Ts'o if (unlikely(err)) 760ac27a0ecSDave Kleikamp goto exit_dind; 761ac27a0ecSDave 
Kleikamp 7622f919710SYongqiang Yang err = ext4_journal_get_write_access(handle, gdb_bh); 763b4097142STheodore Ts'o if (unlikely(err)) 764ac27a0ecSDave Kleikamp goto exit_sbh; 765ac27a0ecSDave Kleikamp 766b4097142STheodore Ts'o err = ext4_journal_get_write_access(handle, dind); 767b4097142STheodore Ts'o if (unlikely(err)) 768b4097142STheodore Ts'o ext4_std_error(sb, err); 769ac27a0ecSDave Kleikamp 770617ba13bSMingming Cao /* ext4_reserve_inode_write() gets a reference on the iloc */ 771b4097142STheodore Ts'o err = ext4_reserve_inode_write(handle, inode, &iloc); 772b4097142STheodore Ts'o if (unlikely(err)) 773ac27a0ecSDave Kleikamp goto exit_dindj; 774ac27a0ecSDave Kleikamp 775f18a5f21STheodore Ts'o n_group_desc = ext4_kvmalloc((gdb_num + 1) * 776f18a5f21STheodore Ts'o sizeof(struct buffer_head *), 777216553c4SJosef Bacik GFP_NOFS); 778ac27a0ecSDave Kleikamp if (!n_group_desc) { 779ac27a0ecSDave Kleikamp err = -ENOMEM; 780f18a5f21STheodore Ts'o ext4_warning(sb, "not enough memory for %lu groups", 781f18a5f21STheodore Ts'o gdb_num + 1); 782ac27a0ecSDave Kleikamp goto exit_inode; 783ac27a0ecSDave Kleikamp } 784ac27a0ecSDave Kleikamp 785ac27a0ecSDave Kleikamp /* 786ac27a0ecSDave Kleikamp * Finally, we have all of the possible failures behind us... 787ac27a0ecSDave Kleikamp * 788ac27a0ecSDave Kleikamp * Remove new GDT block from inode double-indirect block and clear out 789ac27a0ecSDave Kleikamp * the new GDT block for use (which also "frees" the backup GDT blocks 790ac27a0ecSDave Kleikamp * from the reserved inode). We don't need to change the bitmaps for 791ac27a0ecSDave Kleikamp * these blocks, because they are marked as in-use from being in the 792ac27a0ecSDave Kleikamp * reserved inode, and will become GDT blocks (primary and backup). 
793ac27a0ecSDave Kleikamp */ 794617ba13bSMingming Cao data[gdb_num % EXT4_ADDR_PER_BLOCK(sb)] = 0; 795b4097142STheodore Ts'o err = ext4_handle_dirty_metadata(handle, NULL, dind); 796b4097142STheodore Ts'o if (unlikely(err)) { 797b4097142STheodore Ts'o ext4_std_error(sb, err); 798b4097142STheodore Ts'o goto exit_inode; 799b4097142STheodore Ts'o } 800ac27a0ecSDave Kleikamp inode->i_blocks -= (gdbackups + 1) * sb->s_blocksize >> 9; 801617ba13bSMingming Cao ext4_mark_iloc_dirty(handle, inode, &iloc); 8022f919710SYongqiang Yang memset(gdb_bh->b_data, 0, sb->s_blocksize); 8032f919710SYongqiang Yang err = ext4_handle_dirty_metadata(handle, NULL, gdb_bh); 804b4097142STheodore Ts'o if (unlikely(err)) { 805b4097142STheodore Ts'o ext4_std_error(sb, err); 806b4097142STheodore Ts'o goto exit_inode; 807b4097142STheodore Ts'o } 808b4097142STheodore Ts'o brelse(dind); 809ac27a0ecSDave Kleikamp 810617ba13bSMingming Cao o_group_desc = EXT4_SB(sb)->s_group_desc; 811ac27a0ecSDave Kleikamp memcpy(n_group_desc, o_group_desc, 812617ba13bSMingming Cao EXT4_SB(sb)->s_gdb_count * sizeof(struct buffer_head *)); 8132f919710SYongqiang Yang n_group_desc[gdb_num] = gdb_bh; 814617ba13bSMingming Cao EXT4_SB(sb)->s_group_desc = n_group_desc; 815617ba13bSMingming Cao EXT4_SB(sb)->s_gdb_count++; 816f18a5f21STheodore Ts'o ext4_kvfree(o_group_desc); 817ac27a0ecSDave Kleikamp 818e8546d06SMarcin Slusarz le16_add_cpu(&es->s_reserved_gdt_blocks, -1); 819b4097142STheodore Ts'o err = ext4_handle_dirty_metadata(handle, NULL, EXT4_SB(sb)->s_sbh); 820b4097142STheodore Ts'o if (err) 821b4097142STheodore Ts'o ext4_std_error(sb, err); 822ac27a0ecSDave Kleikamp 823b4097142STheodore Ts'o return err; 824ac27a0ecSDave Kleikamp 825ac27a0ecSDave Kleikamp exit_inode: 826f18a5f21STheodore Ts'o ext4_kvfree(n_group_desc); 827537a0310SAmir Goldstein /* ext4_handle_release_buffer(handle, iloc.bh); */ 828ac27a0ecSDave Kleikamp brelse(iloc.bh); 829ac27a0ecSDave Kleikamp exit_dindj: 830537a0310SAmir Goldstein /* 
ext4_handle_release_buffer(handle, dind); */ 831ac27a0ecSDave Kleikamp exit_sbh: 832537a0310SAmir Goldstein /* ext4_handle_release_buffer(handle, EXT4_SB(sb)->s_sbh); */ 833ac27a0ecSDave Kleikamp exit_dind: 834ac27a0ecSDave Kleikamp brelse(dind); 835ac27a0ecSDave Kleikamp exit_bh: 8362f919710SYongqiang Yang brelse(gdb_bh); 837ac27a0ecSDave Kleikamp 838617ba13bSMingming Cao ext4_debug("leaving with error %d\n", err); 839ac27a0ecSDave Kleikamp return err; 840ac27a0ecSDave Kleikamp } 841ac27a0ecSDave Kleikamp 842ac27a0ecSDave Kleikamp /* 843ac27a0ecSDave Kleikamp * Called when we are adding a new group which has a backup copy of each of 844ac27a0ecSDave Kleikamp * the GDT blocks (i.e. sparse group) and there are reserved GDT blocks. 845ac27a0ecSDave Kleikamp * We need to add these reserved backup GDT blocks to the resize inode, so 846ac27a0ecSDave Kleikamp * that they are kept for future resizing and not allocated to files. 847ac27a0ecSDave Kleikamp * 848ac27a0ecSDave Kleikamp * Each reserved backup GDT block will go into a different indirect block. 849ac27a0ecSDave Kleikamp * The indirect blocks are actually the primary reserved GDT blocks, 850ac27a0ecSDave Kleikamp * so we know in advance what their block numbers are. We only get the 851ac27a0ecSDave Kleikamp * double-indirect block to verify it is pointing to the primary reserved 852ac27a0ecSDave Kleikamp * GDT blocks so we don't overwrite a data block by accident. The reserved 853ac27a0ecSDave Kleikamp * backup GDT blocks are stored in their reserved primary GDT block. 
854ac27a0ecSDave Kleikamp */ 855ac27a0ecSDave Kleikamp static int reserve_backup_gdb(handle_t *handle, struct inode *inode, 856668f4dc5SYongqiang Yang ext4_group_t group) 857ac27a0ecSDave Kleikamp { 858ac27a0ecSDave Kleikamp struct super_block *sb = inode->i_sb; 859617ba13bSMingming Cao int reserved_gdb =le16_to_cpu(EXT4_SB(sb)->s_es->s_reserved_gdt_blocks); 860ac27a0ecSDave Kleikamp struct buffer_head **primary; 861ac27a0ecSDave Kleikamp struct buffer_head *dind; 862617ba13bSMingming Cao struct ext4_iloc iloc; 863617ba13bSMingming Cao ext4_fsblk_t blk; 864ac27a0ecSDave Kleikamp __le32 *data, *end; 865ac27a0ecSDave Kleikamp int gdbackups = 0; 866ac27a0ecSDave Kleikamp int res, i; 867ac27a0ecSDave Kleikamp int err; 868ac27a0ecSDave Kleikamp 869216553c4SJosef Bacik primary = kmalloc(reserved_gdb * sizeof(*primary), GFP_NOFS); 870ac27a0ecSDave Kleikamp if (!primary) 871ac27a0ecSDave Kleikamp return -ENOMEM; 872ac27a0ecSDave Kleikamp 873617ba13bSMingming Cao data = EXT4_I(inode)->i_data + EXT4_DIND_BLOCK; 874ac27a0ecSDave Kleikamp dind = sb_bread(sb, le32_to_cpu(*data)); 875ac27a0ecSDave Kleikamp if (!dind) { 876ac27a0ecSDave Kleikamp err = -EIO; 877ac27a0ecSDave Kleikamp goto exit_free; 878ac27a0ecSDave Kleikamp } 879ac27a0ecSDave Kleikamp 880617ba13bSMingming Cao blk = EXT4_SB(sb)->s_sbh->b_blocknr + 1 + EXT4_SB(sb)->s_gdb_count; 88194460093SJosef Bacik data = (__le32 *)dind->b_data + (EXT4_SB(sb)->s_gdb_count % 88294460093SJosef Bacik EXT4_ADDR_PER_BLOCK(sb)); 883617ba13bSMingming Cao end = (__le32 *)dind->b_data + EXT4_ADDR_PER_BLOCK(sb); 884ac27a0ecSDave Kleikamp 885ac27a0ecSDave Kleikamp /* Get each reserved primary GDT block and verify it holds backups */ 886ac27a0ecSDave Kleikamp for (res = 0; res < reserved_gdb; res++, blk++) { 887ac27a0ecSDave Kleikamp if (le32_to_cpu(*data) != blk) { 88812062dddSEric Sandeen ext4_warning(sb, "reserved block %llu" 889ac27a0ecSDave Kleikamp " not at offset %ld", 890ac27a0ecSDave Kleikamp blk, 891ac27a0ecSDave Kleikamp 
(long)(data - (__le32 *)dind->b_data)); 892ac27a0ecSDave Kleikamp err = -EINVAL; 893ac27a0ecSDave Kleikamp goto exit_bh; 894ac27a0ecSDave Kleikamp } 895ac27a0ecSDave Kleikamp primary[res] = sb_bread(sb, blk); 896ac27a0ecSDave Kleikamp if (!primary[res]) { 897ac27a0ecSDave Kleikamp err = -EIO; 898ac27a0ecSDave Kleikamp goto exit_bh; 899ac27a0ecSDave Kleikamp } 900ac27a0ecSDave Kleikamp if ((gdbackups = verify_reserved_gdb(sb, primary[res])) < 0) { 901ac27a0ecSDave Kleikamp brelse(primary[res]); 902ac27a0ecSDave Kleikamp err = gdbackups; 903ac27a0ecSDave Kleikamp goto exit_bh; 904ac27a0ecSDave Kleikamp } 905ac27a0ecSDave Kleikamp if (++data >= end) 906ac27a0ecSDave Kleikamp data = (__le32 *)dind->b_data; 907ac27a0ecSDave Kleikamp } 908ac27a0ecSDave Kleikamp 909ac27a0ecSDave Kleikamp for (i = 0; i < reserved_gdb; i++) { 910617ba13bSMingming Cao if ((err = ext4_journal_get_write_access(handle, primary[i]))) { 911ac27a0ecSDave Kleikamp /* 912ac27a0ecSDave Kleikamp int j; 913ac27a0ecSDave Kleikamp for (j = 0; j < i; j++) 914537a0310SAmir Goldstein ext4_handle_release_buffer(handle, primary[j]); 915ac27a0ecSDave Kleikamp */ 916ac27a0ecSDave Kleikamp goto exit_bh; 917ac27a0ecSDave Kleikamp } 918ac27a0ecSDave Kleikamp } 919ac27a0ecSDave Kleikamp 920617ba13bSMingming Cao if ((err = ext4_reserve_inode_write(handle, inode, &iloc))) 921ac27a0ecSDave Kleikamp goto exit_bh; 922ac27a0ecSDave Kleikamp 923ac27a0ecSDave Kleikamp /* 924ac27a0ecSDave Kleikamp * Finally we can add each of the reserved backup GDT blocks from 925ac27a0ecSDave Kleikamp * the new group to its reserved primary GDT block. 
926ac27a0ecSDave Kleikamp */ 927668f4dc5SYongqiang Yang blk = group * EXT4_BLOCKS_PER_GROUP(sb); 928ac27a0ecSDave Kleikamp for (i = 0; i < reserved_gdb; i++) { 929ac27a0ecSDave Kleikamp int err2; 930ac27a0ecSDave Kleikamp data = (__le32 *)primary[i]->b_data; 931ac27a0ecSDave Kleikamp /* printk("reserving backup %lu[%u] = %lu\n", 932ac27a0ecSDave Kleikamp primary[i]->b_blocknr, gdbackups, 933ac27a0ecSDave Kleikamp blk + primary[i]->b_blocknr); */ 934ac27a0ecSDave Kleikamp data[gdbackups] = cpu_to_le32(blk + primary[i]->b_blocknr); 9350390131bSFrank Mayhar err2 = ext4_handle_dirty_metadata(handle, NULL, primary[i]); 936ac27a0ecSDave Kleikamp if (!err) 937ac27a0ecSDave Kleikamp err = err2; 938ac27a0ecSDave Kleikamp } 939ac27a0ecSDave Kleikamp inode->i_blocks += reserved_gdb * sb->s_blocksize >> 9; 940617ba13bSMingming Cao ext4_mark_iloc_dirty(handle, inode, &iloc); 941ac27a0ecSDave Kleikamp 942ac27a0ecSDave Kleikamp exit_bh: 943ac27a0ecSDave Kleikamp while (--res >= 0) 944ac27a0ecSDave Kleikamp brelse(primary[res]); 945ac27a0ecSDave Kleikamp brelse(dind); 946ac27a0ecSDave Kleikamp 947ac27a0ecSDave Kleikamp exit_free: 948ac27a0ecSDave Kleikamp kfree(primary); 949ac27a0ecSDave Kleikamp 950ac27a0ecSDave Kleikamp return err; 951ac27a0ecSDave Kleikamp } 952ac27a0ecSDave Kleikamp 953ac27a0ecSDave Kleikamp /* 954617ba13bSMingming Cao * Update the backup copies of the ext4 metadata. These don't need to be part 955ac27a0ecSDave Kleikamp * of the main resize transaction, because e2fsck will re-write them if there 956ac27a0ecSDave Kleikamp * is a problem (basically only OOM will cause a problem). However, we 957ac27a0ecSDave Kleikamp * _should_ update the backups if possible, in case the primary gets trashed 958ac27a0ecSDave Kleikamp * for some reason and we need to run e2fsck from a backup superblock. 
The 959ac27a0ecSDave Kleikamp * important part is that the new block and inode counts are in the backup 960ac27a0ecSDave Kleikamp * superblocks, and the location of the new group metadata in the GDT backups. 961ac27a0ecSDave Kleikamp * 96232ed5058STheodore Ts'o * We do not need take the s_resize_lock for this, because these 96332ed5058STheodore Ts'o * blocks are not otherwise touched by the filesystem code when it is 96432ed5058STheodore Ts'o * mounted. We don't need to worry about last changing from 96532ed5058STheodore Ts'o * sbi->s_groups_count, because the worst that can happen is that we 96632ed5058STheodore Ts'o * do not copy the full number of backups at this time. The resize 96732ed5058STheodore Ts'o * which changed s_groups_count will backup again. 968ac27a0ecSDave Kleikamp */ 969ac27a0ecSDave Kleikamp static void update_backups(struct super_block *sb, 970ac27a0ecSDave Kleikamp int blk_off, char *data, int size) 971ac27a0ecSDave Kleikamp { 972617ba13bSMingming Cao struct ext4_sb_info *sbi = EXT4_SB(sb); 973fd2d4291SAvantika Mathur const ext4_group_t last = sbi->s_groups_count; 974617ba13bSMingming Cao const int bpg = EXT4_BLOCKS_PER_GROUP(sb); 975ac27a0ecSDave Kleikamp unsigned three = 1; 976ac27a0ecSDave Kleikamp unsigned five = 5; 977ac27a0ecSDave Kleikamp unsigned seven = 7; 978fd2d4291SAvantika Mathur ext4_group_t group; 979ac27a0ecSDave Kleikamp int rest = sb->s_blocksize - size; 980ac27a0ecSDave Kleikamp handle_t *handle; 981ac27a0ecSDave Kleikamp int err = 0, err2; 982ac27a0ecSDave Kleikamp 983617ba13bSMingming Cao handle = ext4_journal_start_sb(sb, EXT4_MAX_TRANS_DATA); 984ac27a0ecSDave Kleikamp if (IS_ERR(handle)) { 985ac27a0ecSDave Kleikamp group = 1; 986ac27a0ecSDave Kleikamp err = PTR_ERR(handle); 987ac27a0ecSDave Kleikamp goto exit_err; 988ac27a0ecSDave Kleikamp } 989ac27a0ecSDave Kleikamp 990617ba13bSMingming Cao while ((group = ext4_list_backups(sb, &three, &five, &seven)) < last) { 991ac27a0ecSDave Kleikamp struct buffer_head *bh; 
992ac27a0ecSDave Kleikamp 993ac27a0ecSDave Kleikamp /* Out of journal space, and can't get more - abort - so sad */ 9940390131bSFrank Mayhar if (ext4_handle_valid(handle) && 9950390131bSFrank Mayhar handle->h_buffer_credits == 0 && 996617ba13bSMingming Cao ext4_journal_extend(handle, EXT4_MAX_TRANS_DATA) && 997617ba13bSMingming Cao (err = ext4_journal_restart(handle, EXT4_MAX_TRANS_DATA))) 998ac27a0ecSDave Kleikamp break; 999ac27a0ecSDave Kleikamp 1000ac27a0ecSDave Kleikamp bh = sb_getblk(sb, group * bpg + blk_off); 1001ac27a0ecSDave Kleikamp if (!bh) { 1002ac27a0ecSDave Kleikamp err = -EIO; 1003ac27a0ecSDave Kleikamp break; 1004ac27a0ecSDave Kleikamp } 1005617ba13bSMingming Cao ext4_debug("update metadata backup %#04lx\n", 1006ac27a0ecSDave Kleikamp (unsigned long)bh->b_blocknr); 1007617ba13bSMingming Cao if ((err = ext4_journal_get_write_access(handle, bh))) 1008ac27a0ecSDave Kleikamp break; 1009ac27a0ecSDave Kleikamp lock_buffer(bh); 1010ac27a0ecSDave Kleikamp memcpy(bh->b_data, data, size); 1011ac27a0ecSDave Kleikamp if (rest) 1012ac27a0ecSDave Kleikamp memset(bh->b_data + size, 0, rest); 1013ac27a0ecSDave Kleikamp set_buffer_uptodate(bh); 1014ac27a0ecSDave Kleikamp unlock_buffer(bh); 1015b4097142STheodore Ts'o err = ext4_handle_dirty_metadata(handle, NULL, bh); 1016b4097142STheodore Ts'o if (unlikely(err)) 1017b4097142STheodore Ts'o ext4_std_error(sb, err); 1018ac27a0ecSDave Kleikamp brelse(bh); 1019ac27a0ecSDave Kleikamp } 1020617ba13bSMingming Cao if ((err2 = ext4_journal_stop(handle)) && !err) 1021ac27a0ecSDave Kleikamp err = err2; 1022ac27a0ecSDave Kleikamp 1023ac27a0ecSDave Kleikamp /* 1024ac27a0ecSDave Kleikamp * Ugh! Need to have e2fsck write the backup copies. It is too 1025ac27a0ecSDave Kleikamp * late to revert the resize, we shouldn't fail just because of 1026ac27a0ecSDave Kleikamp * the backup copies (they are only needed in case of corruption). 
1027ac27a0ecSDave Kleikamp * 1028ac27a0ecSDave Kleikamp * However, if we got here we have a journal problem too, so we 1029ac27a0ecSDave Kleikamp * can't really start a transaction to mark the superblock. 1030ac27a0ecSDave Kleikamp * Chicken out and just set the flag on the hope it will be written 1031ac27a0ecSDave Kleikamp * to disk, and if not - we will simply wait until next fsck. 1032ac27a0ecSDave Kleikamp */ 1033ac27a0ecSDave Kleikamp exit_err: 1034ac27a0ecSDave Kleikamp if (err) { 103512062dddSEric Sandeen ext4_warning(sb, "can't update backup for group %u (err %d), " 1036ac27a0ecSDave Kleikamp "forcing fsck on next reboot", group, err); 1037617ba13bSMingming Cao sbi->s_mount_state &= ~EXT4_VALID_FS; 1038617ba13bSMingming Cao sbi->s_es->s_state &= cpu_to_le16(~EXT4_VALID_FS); 1039ac27a0ecSDave Kleikamp mark_buffer_dirty(sbi->s_sbh); 1040ac27a0ecSDave Kleikamp } 1041ac27a0ecSDave Kleikamp } 1042ac27a0ecSDave Kleikamp 1043bb08c1e7SYongqiang Yang /* 1044bb08c1e7SYongqiang Yang * ext4_add_new_descs() adds @count group descriptor of groups 1045bb08c1e7SYongqiang Yang * starting at @group 1046bb08c1e7SYongqiang Yang * 1047bb08c1e7SYongqiang Yang * @handle: journal handle 1048bb08c1e7SYongqiang Yang * @sb: super block 1049bb08c1e7SYongqiang Yang * @group: the group no. 
of the first group desc to be added 1050bb08c1e7SYongqiang Yang * @resize_inode: the resize inode 1051bb08c1e7SYongqiang Yang * @count: number of group descriptors to be added 1052bb08c1e7SYongqiang Yang */ 1053bb08c1e7SYongqiang Yang static int ext4_add_new_descs(handle_t *handle, struct super_block *sb, 1054bb08c1e7SYongqiang Yang ext4_group_t group, struct inode *resize_inode, 1055bb08c1e7SYongqiang Yang ext4_group_t count) 1056bb08c1e7SYongqiang Yang { 1057bb08c1e7SYongqiang Yang struct ext4_sb_info *sbi = EXT4_SB(sb); 1058bb08c1e7SYongqiang Yang struct ext4_super_block *es = sbi->s_es; 1059bb08c1e7SYongqiang Yang struct buffer_head *gdb_bh; 1060bb08c1e7SYongqiang Yang int i, gdb_off, gdb_num, err = 0; 1061bb08c1e7SYongqiang Yang 1062bb08c1e7SYongqiang Yang for (i = 0; i < count; i++, group++) { 1063bb08c1e7SYongqiang Yang int reserved_gdb = ext4_bg_has_super(sb, group) ? 1064bb08c1e7SYongqiang Yang le16_to_cpu(es->s_reserved_gdt_blocks) : 0; 1065bb08c1e7SYongqiang Yang 1066bb08c1e7SYongqiang Yang gdb_off = group % EXT4_DESC_PER_BLOCK(sb); 1067bb08c1e7SYongqiang Yang gdb_num = group / EXT4_DESC_PER_BLOCK(sb); 1068bb08c1e7SYongqiang Yang 1069bb08c1e7SYongqiang Yang /* 1070bb08c1e7SYongqiang Yang * We will only either add reserved group blocks to a backup group 1071bb08c1e7SYongqiang Yang * or remove reserved blocks for the first group in a new group block. 1072bb08c1e7SYongqiang Yang * Doing both would be mean more complex code, and sane people don't 1073bb08c1e7SYongqiang Yang * use non-sparse filesystems anymore. This is already checked above. 
1074bb08c1e7SYongqiang Yang */ 1075bb08c1e7SYongqiang Yang if (gdb_off) { 1076bb08c1e7SYongqiang Yang gdb_bh = sbi->s_group_desc[gdb_num]; 1077bb08c1e7SYongqiang Yang err = ext4_journal_get_write_access(handle, gdb_bh); 1078bb08c1e7SYongqiang Yang 1079bb08c1e7SYongqiang Yang if (!err && reserved_gdb && ext4_bg_num_gdb(sb, group)) 1080bb08c1e7SYongqiang Yang err = reserve_backup_gdb(handle, resize_inode, group); 1081bb08c1e7SYongqiang Yang } else 1082bb08c1e7SYongqiang Yang err = add_new_gdb(handle, resize_inode, group); 1083bb08c1e7SYongqiang Yang if (err) 1084bb08c1e7SYongqiang Yang break; 1085bb08c1e7SYongqiang Yang } 1086bb08c1e7SYongqiang Yang return err; 1087bb08c1e7SYongqiang Yang } 1088bb08c1e7SYongqiang Yang 1089ac27a0ecSDave Kleikamp /* Add group descriptor data to an existing or new group descriptor block. 1090ac27a0ecSDave Kleikamp * Ensure we handle all possible error conditions _before_ we start modifying 1091ac27a0ecSDave Kleikamp * the filesystem, because we cannot abort the transaction and not have it 1092ac27a0ecSDave Kleikamp * write the data to disk. 1093ac27a0ecSDave Kleikamp * 1094ac27a0ecSDave Kleikamp * If we are on a GDT block boundary, we need to get the reserved GDT block. 1095ac27a0ecSDave Kleikamp * Otherwise, we may need to add backup GDT blocks for a sparse group. 1096ac27a0ecSDave Kleikamp * 1097ac27a0ecSDave Kleikamp * We only need to hold the superblock lock while we are actually adding 1098ac27a0ecSDave Kleikamp * in the new group's counts to the superblock. Prior to that we have 1099ac27a0ecSDave Kleikamp * not really "added" the group at all. We re-check that we are still 1100ac27a0ecSDave Kleikamp * adding in the last group in case things have changed since verifying. 
1101ac27a0ecSDave Kleikamp */ 1102617ba13bSMingming Cao int ext4_group_add(struct super_block *sb, struct ext4_new_group_data *input) 1103ac27a0ecSDave Kleikamp { 1104617ba13bSMingming Cao struct ext4_sb_info *sbi = EXT4_SB(sb); 1105617ba13bSMingming Cao struct ext4_super_block *es = sbi->s_es; 1106617ba13bSMingming Cao int reserved_gdb = ext4_bg_has_super(sb, input->group) ? 1107ac27a0ecSDave Kleikamp le16_to_cpu(es->s_reserved_gdt_blocks) : 0; 1108ac27a0ecSDave Kleikamp struct buffer_head *primary = NULL; 1109617ba13bSMingming Cao struct ext4_group_desc *gdp; 1110ac27a0ecSDave Kleikamp struct inode *inode = NULL; 1111ac27a0ecSDave Kleikamp handle_t *handle; 1112ac27a0ecSDave Kleikamp int gdb_off, gdb_num; 1113ac27a0ecSDave Kleikamp int err, err2; 1114ac27a0ecSDave Kleikamp 1115617ba13bSMingming Cao gdb_num = input->group / EXT4_DESC_PER_BLOCK(sb); 1116617ba13bSMingming Cao gdb_off = input->group % EXT4_DESC_PER_BLOCK(sb); 1117ac27a0ecSDave Kleikamp 1118617ba13bSMingming Cao if (gdb_off == 0 && !EXT4_HAS_RO_COMPAT_FEATURE(sb, 1119617ba13bSMingming Cao EXT4_FEATURE_RO_COMPAT_SPARSE_SUPER)) { 112012062dddSEric Sandeen ext4_warning(sb, "Can't resize non-sparse filesystem further"); 1121ac27a0ecSDave Kleikamp return -EPERM; 1122ac27a0ecSDave Kleikamp } 1123ac27a0ecSDave Kleikamp 1124bd81d8eeSLaurent Vivier if (ext4_blocks_count(es) + input->blocks_count < 1125bd81d8eeSLaurent Vivier ext4_blocks_count(es)) { 112612062dddSEric Sandeen ext4_warning(sb, "blocks_count overflow"); 1127ac27a0ecSDave Kleikamp return -EINVAL; 1128ac27a0ecSDave Kleikamp } 1129ac27a0ecSDave Kleikamp 1130617ba13bSMingming Cao if (le32_to_cpu(es->s_inodes_count) + EXT4_INODES_PER_GROUP(sb) < 1131ac27a0ecSDave Kleikamp le32_to_cpu(es->s_inodes_count)) { 113212062dddSEric Sandeen ext4_warning(sb, "inodes_count overflow"); 1133ac27a0ecSDave Kleikamp return -EINVAL; 1134ac27a0ecSDave Kleikamp } 1135ac27a0ecSDave Kleikamp 1136ac27a0ecSDave Kleikamp if (reserved_gdb || gdb_off == 0) { 
1137617ba13bSMingming Cao if (!EXT4_HAS_COMPAT_FEATURE(sb, 113837609fd5SJosef Bacik EXT4_FEATURE_COMPAT_RESIZE_INODE) 113937609fd5SJosef Bacik || !le16_to_cpu(es->s_reserved_gdt_blocks)) { 114012062dddSEric Sandeen ext4_warning(sb, 1141ac27a0ecSDave Kleikamp "No reserved GDT blocks, can't resize"); 1142ac27a0ecSDave Kleikamp return -EPERM; 1143ac27a0ecSDave Kleikamp } 11441d1fe1eeSDavid Howells inode = ext4_iget(sb, EXT4_RESIZE_INO); 11451d1fe1eeSDavid Howells if (IS_ERR(inode)) { 114612062dddSEric Sandeen ext4_warning(sb, "Error opening resize inode"); 11471d1fe1eeSDavid Howells return PTR_ERR(inode); 1148ac27a0ecSDave Kleikamp } 1149ac27a0ecSDave Kleikamp } 1150ac27a0ecSDave Kleikamp 1151920313a7SAneesh Kumar K.V 1152ac27a0ecSDave Kleikamp if ((err = verify_group_input(sb, input))) 1153ac27a0ecSDave Kleikamp goto exit_put; 1154ac27a0ecSDave Kleikamp 1155ac27a0ecSDave Kleikamp if ((err = setup_new_group_blocks(sb, input))) 1156ac27a0ecSDave Kleikamp goto exit_put; 1157ac27a0ecSDave Kleikamp 1158ac27a0ecSDave Kleikamp /* 1159ac27a0ecSDave Kleikamp * We will always be modifying at least the superblock and a GDT 1160ac27a0ecSDave Kleikamp * block. If we are adding a group past the last current GDT block, 1161ac27a0ecSDave Kleikamp * we will also modify the inode and the dindirect block. If we 1162ac27a0ecSDave Kleikamp * are adding a group with superblock/GDT backups we will also 1163ac27a0ecSDave Kleikamp * modify each of the reserved GDT dindirect blocks. 1164ac27a0ecSDave Kleikamp */ 1165617ba13bSMingming Cao handle = ext4_journal_start_sb(sb, 1166617ba13bSMingming Cao ext4_bg_has_super(sb, input->group) ? 
1167ac27a0ecSDave Kleikamp 3 + reserved_gdb : 4); 1168ac27a0ecSDave Kleikamp if (IS_ERR(handle)) { 1169ac27a0ecSDave Kleikamp err = PTR_ERR(handle); 1170ac27a0ecSDave Kleikamp goto exit_put; 1171ac27a0ecSDave Kleikamp } 1172ac27a0ecSDave Kleikamp 1173617ba13bSMingming Cao if ((err = ext4_journal_get_write_access(handle, sbi->s_sbh))) 1174ac27a0ecSDave Kleikamp goto exit_journal; 1175ac27a0ecSDave Kleikamp 1176ac27a0ecSDave Kleikamp /* 1177ac27a0ecSDave Kleikamp * We will only either add reserved group blocks to a backup group 1178ac27a0ecSDave Kleikamp * or remove reserved blocks for the first group in a new group block. 1179ac27a0ecSDave Kleikamp * Doing both would be mean more complex code, and sane people don't 1180ac27a0ecSDave Kleikamp * use non-sparse filesystems anymore. This is already checked above. 1181ac27a0ecSDave Kleikamp */ 1182ac27a0ecSDave Kleikamp if (gdb_off) { 1183ac27a0ecSDave Kleikamp primary = sbi->s_group_desc[gdb_num]; 1184617ba13bSMingming Cao if ((err = ext4_journal_get_write_access(handle, primary))) 1185ac27a0ecSDave Kleikamp goto exit_journal; 1186ac27a0ecSDave Kleikamp 1187668f4dc5SYongqiang Yang if (reserved_gdb && ext4_bg_num_gdb(sb, input->group)) { 1188668f4dc5SYongqiang Yang err = reserve_backup_gdb(handle, inode, input->group); 1189668f4dc5SYongqiang Yang if (err) 1190ac27a0ecSDave Kleikamp goto exit_journal; 1191668f4dc5SYongqiang Yang } 11922f919710SYongqiang Yang } else { 11932f919710SYongqiang Yang /* 11942f919710SYongqiang Yang * Note that we can access new group descriptor block safely 11952f919710SYongqiang Yang * only if add_new_gdb() succeeds. 
11962f919710SYongqiang Yang */ 11972f919710SYongqiang Yang err = add_new_gdb(handle, inode, input->group); 11982f919710SYongqiang Yang if (err) 1199ac27a0ecSDave Kleikamp goto exit_journal; 12002f919710SYongqiang Yang primary = sbi->s_group_desc[gdb_num]; 12012f919710SYongqiang Yang } 1202ac27a0ecSDave Kleikamp 1203ac27a0ecSDave Kleikamp /* 1204ac27a0ecSDave Kleikamp * OK, now we've set up the new group. Time to make it active. 1205ac27a0ecSDave Kleikamp * 1206ac27a0ecSDave Kleikamp * so we have to be safe wrt. concurrent accesses the group 1207ac27a0ecSDave Kleikamp * data. So we need to be careful to set all of the relevant 1208ac27a0ecSDave Kleikamp * group descriptor data etc. *before* we enable the group. 1209ac27a0ecSDave Kleikamp * 1210ac27a0ecSDave Kleikamp * The key field here is sbi->s_groups_count: as long as 1211ac27a0ecSDave Kleikamp * that retains its old value, nobody is going to access the new 1212ac27a0ecSDave Kleikamp * group. 1213ac27a0ecSDave Kleikamp * 1214ac27a0ecSDave Kleikamp * So first we update all the descriptor metadata for the new 1215ac27a0ecSDave Kleikamp * group; then we update the total disk blocks count; then we 1216ac27a0ecSDave Kleikamp * update the groups count to enable the group; then finally we 1217ac27a0ecSDave Kleikamp * update the free space counts so that the system can start 1218ac27a0ecSDave Kleikamp * using the new disk blocks. 
1219ac27a0ecSDave Kleikamp */ 1220ac27a0ecSDave Kleikamp 1221ac27a0ecSDave Kleikamp /* Update group descriptor block for new group */ 12222856922cSFrederic Bohe gdp = (struct ext4_group_desc *)((char *)primary->b_data + 12232856922cSFrederic Bohe gdb_off * EXT4_DESC_SIZE(sb)); 1224ac27a0ecSDave Kleikamp 1225fdff73f0STheodore Ts'o memset(gdp, 0, EXT4_DESC_SIZE(sb)); 12268fadc143SAlexandre Ratchov ext4_block_bitmap_set(sb, gdp, input->block_bitmap); /* LV FIXME */ 12278fadc143SAlexandre Ratchov ext4_inode_bitmap_set(sb, gdp, input->inode_bitmap); /* LV FIXME */ 12288fadc143SAlexandre Ratchov ext4_inode_table_set(sb, gdp, input->inode_table); /* LV FIXME */ 1229021b65bbSTheodore Ts'o ext4_free_group_clusters_set(sb, gdp, input->free_blocks_count); 1230560671a0SAneesh Kumar K.V ext4_free_inodes_set(sb, gdp, EXT4_INODES_PER_GROUP(sb)); 1231fdff73f0STheodore Ts'o gdp->bg_flags = cpu_to_le16(EXT4_BG_INODE_ZEROED); 1232717d50e4SAndreas Dilger gdp->bg_checksum = ext4_group_desc_csum(sbi, input->group, gdp); 1233ac27a0ecSDave Kleikamp 1234ac27a0ecSDave Kleikamp /* 12355f21b0e6SFrederic Bohe * We can allocate memory for mb_alloc based on the new group 12365f21b0e6SFrederic Bohe * descriptor 12375f21b0e6SFrederic Bohe */ 1238920313a7SAneesh Kumar K.V err = ext4_mb_add_groupinfo(sb, input->group, gdp); 123908c3a813SAneesh Kumar K.V if (err) 12405f21b0e6SFrederic Bohe goto exit_journal; 1241c2ea3fdeSTheodore Ts'o 12425f21b0e6SFrederic Bohe /* 1243ac27a0ecSDave Kleikamp * Make the new blocks and inodes valid next. We do this before 1244ac27a0ecSDave Kleikamp * increasing the group count so that once the group is enabled, 1245ac27a0ecSDave Kleikamp * all of its blocks and inodes are already valid. 
1246ac27a0ecSDave Kleikamp * 1247ac27a0ecSDave Kleikamp * We always allocate group-by-group, then block-by-block or 1248ac27a0ecSDave Kleikamp * inode-by-inode within a group, so enabling these 1249ac27a0ecSDave Kleikamp * blocks/inodes before the group is live won't actually let us 1250ac27a0ecSDave Kleikamp * allocate the new space yet. 1251ac27a0ecSDave Kleikamp */ 1252bd81d8eeSLaurent Vivier ext4_blocks_count_set(es, ext4_blocks_count(es) + 1253ac27a0ecSDave Kleikamp input->blocks_count); 1254e8546d06SMarcin Slusarz le32_add_cpu(&es->s_inodes_count, EXT4_INODES_PER_GROUP(sb)); 1255ac27a0ecSDave Kleikamp 1256ac27a0ecSDave Kleikamp /* 1257ac27a0ecSDave Kleikamp * We need to protect s_groups_count against other CPUs seeing 1258ac27a0ecSDave Kleikamp * inconsistent state in the superblock. 1259ac27a0ecSDave Kleikamp * 1260ac27a0ecSDave Kleikamp * The precise rules we use are: 1261ac27a0ecSDave Kleikamp * 1262ac27a0ecSDave Kleikamp * * Writers must perform a smp_wmb() after updating all dependent 1263ac27a0ecSDave Kleikamp * data and before modifying the groups count 1264ac27a0ecSDave Kleikamp * 1265ac27a0ecSDave Kleikamp * * Readers must perform an smp_rmb() after reading the groups count 1266ac27a0ecSDave Kleikamp * and before reading any dependent data. 1267ac27a0ecSDave Kleikamp * 1268ac27a0ecSDave Kleikamp * NB. These rules can be relaxed when checking the group count 1269ac27a0ecSDave Kleikamp * while freeing data, as we can only allocate from a block 1270ac27a0ecSDave Kleikamp * group after serialising against the group count, and we can 1271ac27a0ecSDave Kleikamp * only then free after serialising in turn against that 1272ac27a0ecSDave Kleikamp * allocation. 
1273ac27a0ecSDave Kleikamp */ 1274ac27a0ecSDave Kleikamp smp_wmb(); 1275ac27a0ecSDave Kleikamp 1276ac27a0ecSDave Kleikamp /* Update the global fs size fields */ 1277ac27a0ecSDave Kleikamp sbi->s_groups_count++; 1278ac27a0ecSDave Kleikamp 1279b4097142STheodore Ts'o err = ext4_handle_dirty_metadata(handle, NULL, primary); 1280b4097142STheodore Ts'o if (unlikely(err)) { 1281b4097142STheodore Ts'o ext4_std_error(sb, err); 1282b4097142STheodore Ts'o goto exit_journal; 1283b4097142STheodore Ts'o } 1284ac27a0ecSDave Kleikamp 1285ac27a0ecSDave Kleikamp /* Update the reserved block counts only once the new group is 1286ac27a0ecSDave Kleikamp * active. */ 1287bd81d8eeSLaurent Vivier ext4_r_blocks_count_set(es, ext4_r_blocks_count(es) + 1288ac27a0ecSDave Kleikamp input->reserved_blocks); 1289ac27a0ecSDave Kleikamp 1290ac27a0ecSDave Kleikamp /* Update the free space counts */ 129157042651STheodore Ts'o percpu_counter_add(&sbi->s_freeclusters_counter, 129257042651STheodore Ts'o EXT4_B2C(sbi, input->free_blocks_count)); 1293aa0dff2dSPeter Zijlstra percpu_counter_add(&sbi->s_freeinodes_counter, 1294617ba13bSMingming Cao EXT4_INODES_PER_GROUP(sb)); 1295ac27a0ecSDave Kleikamp 129642007efdSEric Sandeen if (EXT4_HAS_INCOMPAT_FEATURE(sb, EXT4_FEATURE_INCOMPAT_FLEX_BG) && 129742007efdSEric Sandeen sbi->s_log_groups_per_flex) { 1298c62a11fdSFrederic Bohe ext4_group_t flex_group; 1299c62a11fdSFrederic Bohe flex_group = ext4_flex_group(sbi, input->group); 130024aaa8efSTheodore Ts'o atomic_add(EXT4_B2C(sbi, input->free_blocks_count), 130124aaa8efSTheodore Ts'o &sbi->s_flex_groups[flex_group].free_clusters); 13029f24e420STheodore Ts'o atomic_add(EXT4_INODES_PER_GROUP(sb), 13039f24e420STheodore Ts'o &sbi->s_flex_groups[flex_group].free_inodes); 1304c62a11fdSFrederic Bohe } 1305c62a11fdSFrederic Bohe 1306a0375156STheodore Ts'o ext4_handle_dirty_super(handle, sb); 1307ac27a0ecSDave Kleikamp 1308ac27a0ecSDave Kleikamp exit_journal: 1309617ba13bSMingming Cao if ((err2 = 
ext4_journal_stop(handle)) && !err) 1310ac27a0ecSDave Kleikamp err = err2; 13112f919710SYongqiang Yang if (!err && primary) { 1312ac27a0ecSDave Kleikamp update_backups(sb, sbi->s_sbh->b_blocknr, (char *)es, 1313617ba13bSMingming Cao sizeof(struct ext4_super_block)); 1314ac27a0ecSDave Kleikamp update_backups(sb, primary->b_blocknr, primary->b_data, 1315ac27a0ecSDave Kleikamp primary->b_size); 1316ac27a0ecSDave Kleikamp } 1317ac27a0ecSDave Kleikamp exit_put: 1318ac27a0ecSDave Kleikamp iput(inode); 1319ac27a0ecSDave Kleikamp return err; 1320617ba13bSMingming Cao } /* ext4_group_add */ 1321ac27a0ecSDave Kleikamp

/*
 * Extend the last group by @add blocks without validating the request;
 * the caller is expected to have done all checking already.
 *
 * @sb:             super block of the filesystem being resized
 * @o_blocks_count: block count of the filesystem before the extension
 * @add:            number of blocks to append
 *
 * The superblock block count is raised to @o_blocks_count + @add and the
 * new range is handed to ext4_group_add_blocks(), all under one journal
 * handle.  The superblock is only marked dirty when adding the blocks
 * succeeded, and the superblock backups are only refreshed when the whole
 * transaction (including ext4_journal_stop()) reported no error.
 *
 * Returns 0 on success, otherwise the first error reported by the journal
 * or by ext4_group_add_blocks().
 */
static int ext4_group_extend_no_check(struct super_block *sb,
				      ext4_fsblk_t o_blocks_count,
				      ext4_grpblk_t add)
{
	struct ext4_super_block *es = EXT4_SB(sb)->s_es;
	handle_t *handle;
	int err = 0, err2;

	/* We will update the superblock, one block bitmap, and
	 * one group descriptor via ext4_group_add_blocks().
	 */
	handle = ext4_journal_start_sb(sb, 3);
	if (IS_ERR(handle)) {
		err = PTR_ERR(handle);
		ext4_warning(sb, "error %d on journal start", err);
		return err;
	}

	err = ext4_journal_get_write_access(handle, EXT4_SB(sb)->s_sbh);
	if (err) {
		ext4_warning(sb, "error %d on journal write access", err);
		goto errout;
	}

	ext4_blocks_count_set(es, o_blocks_count + add);
	ext4_debug("freeing blocks %llu through %llu\n", o_blocks_count,
		   o_blocks_count + add);
	/* We add the blocks to the bitmap and set the group need init bit */
	err = ext4_group_add_blocks(handle, sb, o_blocks_count, add);
	if (err)
		goto errout;
	ext4_handle_dirty_super(handle, sb);
	ext4_debug("freed blocks %llu through %llu\n", o_blocks_count,
		   o_blocks_count + add);
errout:
	/* Always close the handle; keep the earliest error we saw. */
	err2 = ext4_journal_stop(handle);
	if (err2 && !err)
		err = err2;

	if (!err) {
		if (test_opt(sb, DEBUG))
			printk(KERN_DEBUG "EXT4-fs: extended group to %llu "
			       "blocks\n", ext4_blocks_count(es));
		update_backups(sb, EXT4_SB(sb)->s_sbh->b_blocknr, (char *)es,
			       sizeof(struct ext4_super_block));
	}
	return err;
}

/*
 * Extend the filesystem to the new number of blocks specified.  This entry
 * point is only used to extend the current filesystem to the end of the last
 * existing group.  It can be accessed via ioctl, or by "remount,resize=<size>"
 * for emergencies (because it has no dependencies on reserved blocks).
 *
 * If we _really_ wanted, we could use default values to call ext4_group_add()
 * to allow the "remount" trick to work for arbitrary resizing, assuming enough
 * GDT blocks are reserved to grow to the desired size.
 *
 * @sb:             super block of the filesystem being resized
 * @es:             on-disk superblock; the current block count is read from it
 * @n_blocks_count: requested total number of blocks
 *
 * Returns:
 *   0        nothing to do (@n_blocks_count is 0 or equals the current size),
 *            or the extension succeeded
 *   -EINVAL  the new size does not fit in sector_t, would shrink the
 *            filesystem, or the block count would overflow
 *   -EPERM   the last group is already full (the current block count falls
 *            on a group boundary), so there is nothing left to finish here
 *   -ENOSPC  the last block of the extended range cannot be read
 *   other    error propagated from ext4_group_extend_no_check()
 *
 * NOTE(review): the journalled update is delegated to
 * ext4_group_extend_no_check(), which writes through EXT4_SB(sb)->s_es;
 * this presumes callers pass that same superblock as @es -- confirm.
 */
int ext4_group_extend(struct super_block *sb, struct ext4_super_block *es,
		      ext4_fsblk_t n_blocks_count)
{
	ext4_fsblk_t o_blocks_count;
	ext4_grpblk_t last;
	ext4_grpblk_t add;
	struct buffer_head *bh;
	ext4_group_t group;

	o_blocks_count = ext4_blocks_count(es);

	if (test_opt(sb, DEBUG))
		printk(KERN_DEBUG "EXT4-fs: extending last group from %llu to %llu blocks\n",
		       o_blocks_count, n_blocks_count);

	if (n_blocks_count == 0 || n_blocks_count == o_blocks_count)
		return 0;

	if (n_blocks_count > (sector_t)(~0ULL) >> (sb->s_blocksize_bits - 9)) {
		printk(KERN_ERR "EXT4-fs: filesystem on %s:"
			" too large to resize to %llu blocks safely\n",
			sb->s_id, n_blocks_count);
		if (sizeof(sector_t) < 8)
			ext4_warning(sb, "CONFIG_LBDAF not enabled");
		return -EINVAL;
	}

	if (n_blocks_count < o_blocks_count) {
		ext4_warning(sb, "can't shrink FS - resize aborted");
		return -EINVAL;
	}

	/* Handle the remaining blocks in the last group only. */
	ext4_get_group_no_and_offset(sb, o_blocks_count, &group, &last);

	if (last == 0) {
		ext4_warning(sb, "need to use ext2online to resize further");
		return -EPERM;
	}

	add = EXT4_BLOCKS_PER_GROUP(sb) - last;

	if (o_blocks_count + add < o_blocks_count) {
		ext4_warning(sb, "blocks_count overflow");
		return -EINVAL;
	}

	/* Never grow past what was asked for. */
	if (o_blocks_count + add > n_blocks_count)
		add = n_blocks_count - o_blocks_count;

	if (o_blocks_count + add < n_blocks_count)
		ext4_warning(sb, "will only finish group (%llu blocks, %u new)",
			     o_blocks_count + add, add);

	/* See if the device is actually as big as what was requested */
	bh = sb_bread(sb, o_blocks_count + add - 1);
	if (!bh) {
		ext4_warning(sb, "can't read last block, resize aborted");
		return -ENOSPC;
	}
	brelse(bh);

	/*
	 * All checks passed.  Let the shared helper perform the journalled
	 * update so that a failure in ext4_group_add_blocks() does not leave
	 * the enlarged block count marked dirty in the superblock.
	 */
	return ext4_group_extend_no_check(sb, o_blocks_count, add);
} /* ext4_group_extend */