1ac27a0ecSDave Kleikamp /* 2617ba13bSMingming Cao * linux/fs/ext4/resize.c 3ac27a0ecSDave Kleikamp * 4617ba13bSMingming Cao * Support for resizing an ext4 filesystem while it is mounted. 5ac27a0ecSDave Kleikamp * 6ac27a0ecSDave Kleikamp * Copyright (C) 2001, 2002 Andreas Dilger <adilger@clusterfs.com> 7ac27a0ecSDave Kleikamp * 8ac27a0ecSDave Kleikamp * This could probably be made into a module, because it is not often in use. 9ac27a0ecSDave Kleikamp */ 10ac27a0ecSDave Kleikamp 11ac27a0ecSDave Kleikamp 12617ba13bSMingming Cao #define EXT4FS_DEBUG 13ac27a0ecSDave Kleikamp 14ac27a0ecSDave Kleikamp #include <linux/errno.h> 15ac27a0ecSDave Kleikamp #include <linux/slab.h> 16ac27a0ecSDave Kleikamp 173dcf5451SChristoph Hellwig #include "ext4_jbd2.h" 18ac27a0ecSDave Kleikamp 198f82f840SYongqiang Yang int ext4_resize_begin(struct super_block *sb) 208f82f840SYongqiang Yang { 218f82f840SYongqiang Yang int ret = 0; 228f82f840SYongqiang Yang 238f82f840SYongqiang Yang if (!capable(CAP_SYS_RESOURCE)) 248f82f840SYongqiang Yang return -EPERM; 258f82f840SYongqiang Yang 26ce723c31SYongqiang Yang /* 27ce723c31SYongqiang Yang * We are not allowed to do online-resizing on a filesystem mounted 28ce723c31SYongqiang Yang * with error, because it can destroy the filesystem easily. 29ce723c31SYongqiang Yang */ 30ce723c31SYongqiang Yang if (EXT4_SB(sb)->s_mount_state & EXT4_ERROR_FS) { 31ce723c31SYongqiang Yang ext4_warning(sb, "There are errors in the filesystem, " 32ce723c31SYongqiang Yang "so online resizing is not allowed\n"); 33ce723c31SYongqiang Yang return -EPERM; 34ce723c31SYongqiang Yang } 35ce723c31SYongqiang Yang 368f82f840SYongqiang Yang if (test_and_set_bit_lock(EXT4_RESIZING, &EXT4_SB(sb)->s_resize_flags)) 378f82f840SYongqiang Yang ret = -EBUSY; 388f82f840SYongqiang Yang 398f82f840SYongqiang Yang return ret; 408f82f840SYongqiang Yang } 418f82f840SYongqiang Yang 428f82f840SYongqiang Yang void ext4_resize_end(struct super_block *sb) 438f82f840SYongqiang Yang { 448f82f840SYongqiang Yang clear_bit_unlock(EXT4_RESIZING, &EXT4_SB(sb)->s_resize_flags); 458f82f840SYongqiang Yang smp_mb__after_clear_bit(); 468f82f840SYongqiang Yang } 478f82f840SYongqiang Yang 48ac27a0ecSDave Kleikamp #define outside(b, first, last) ((b) < (first) || (b) >= (last)) 49ac27a0ecSDave Kleikamp #define inside(b, first, last) ((b) >= (first) && (b) < (last)) 50ac27a0ecSDave Kleikamp 51ac27a0ecSDave Kleikamp static int verify_group_input(struct super_block *sb, 52617ba13bSMingming Cao struct ext4_new_group_data *input) 53ac27a0ecSDave Kleikamp { 54617ba13bSMingming Cao struct ext4_sb_info *sbi = EXT4_SB(sb); 55617ba13bSMingming Cao struct ext4_super_block *es = sbi->s_es; 56bd81d8eeSLaurent Vivier ext4_fsblk_t start = ext4_blocks_count(es); 57617ba13bSMingming Cao ext4_fsblk_t end = start + input->blocks_count; 58fd2d4291SAvantika Mathur ext4_group_t group = input->group; 59617ba13bSMingming Cao ext4_fsblk_t itend = input->inode_table + sbi->s_itb_per_group; 60617ba13bSMingming Cao unsigned overhead = ext4_bg_has_super(sb, group) ? 61617ba13bSMingming Cao (1 + ext4_bg_num_gdb(sb, group) + 62ac27a0ecSDave Kleikamp le16_to_cpu(es->s_reserved_gdt_blocks)) : 0; 63617ba13bSMingming Cao ext4_fsblk_t metaend = start + overhead; 64ac27a0ecSDave Kleikamp struct buffer_head *bh = NULL; 653a5b2ecdSMingming Cao ext4_grpblk_t free_blocks_count, offset; 66ac27a0ecSDave Kleikamp int err = -EINVAL; 67ac27a0ecSDave Kleikamp 68ac27a0ecSDave Kleikamp input->free_blocks_count = free_blocks_count = 69ac27a0ecSDave Kleikamp input->blocks_count - 2 - overhead - sbi->s_itb_per_group; 70ac27a0ecSDave Kleikamp 71ac27a0ecSDave Kleikamp if (test_opt(sb, DEBUG)) 72617ba13bSMingming Cao printk(KERN_DEBUG "EXT4-fs: adding %s group %u: %u blocks " 73ac27a0ecSDave Kleikamp "(%d free, %u reserved)\n", 74617ba13bSMingming Cao ext4_bg_has_super(sb, input->group) ? "normal" : 75ac27a0ecSDave Kleikamp "no-super", input->group, input->blocks_count, 76ac27a0ecSDave Kleikamp free_blocks_count, input->reserved_blocks); 77ac27a0ecSDave Kleikamp 783a5b2ecdSMingming Cao ext4_get_group_no_and_offset(sb, start, NULL, &offset); 79ac27a0ecSDave Kleikamp if (group != sbi->s_groups_count) 8012062dddSEric Sandeen ext4_warning(sb, "Cannot add at group %u (only %u groups)", 81ac27a0ecSDave Kleikamp input->group, sbi->s_groups_count); 823a5b2ecdSMingming Cao else if (offset != 0) 8312062dddSEric Sandeen ext4_warning(sb, "Last group not full"); 84ac27a0ecSDave Kleikamp else if (input->reserved_blocks > input->blocks_count / 5) 8512062dddSEric Sandeen ext4_warning(sb, "Reserved blocks too high (%u)", 86ac27a0ecSDave Kleikamp input->reserved_blocks); 87ac27a0ecSDave Kleikamp else if (free_blocks_count < 0) 8812062dddSEric Sandeen ext4_warning(sb, "Bad blocks count %u", 89ac27a0ecSDave Kleikamp input->blocks_count); 90ac27a0ecSDave Kleikamp else if (!(bh = sb_bread(sb, end - 1))) 9112062dddSEric Sandeen ext4_warning(sb, "Cannot read last block (%llu)", 92ac27a0ecSDave Kleikamp end - 1); 93ac27a0ecSDave Kleikamp else if (outside(input->block_bitmap, start, end)) 9412062dddSEric Sandeen ext4_warning(sb, "Block bitmap not in group (block %llu)", 951939e49aSRandy Dunlap (unsigned long long)input->block_bitmap); 96ac27a0ecSDave Kleikamp else if (outside(input->inode_bitmap, start, end)) 9712062dddSEric Sandeen ext4_warning(sb, "Inode bitmap not in group (block %llu)", 981939e49aSRandy Dunlap (unsigned long long)input->inode_bitmap); 99ac27a0ecSDave Kleikamp else if (outside(input->inode_table, start, end) || 100ac27a0ecSDave Kleikamp outside(itend - 1, start, end)) 10112062dddSEric Sandeen ext4_warning(sb, "Inode table not in group (blocks %llu-%llu)", 1021939e49aSRandy Dunlap (unsigned long long)input->inode_table, itend - 1); 103ac27a0ecSDave Kleikamp else if (input->inode_bitmap == input->block_bitmap) 10412062dddSEric Sandeen ext4_warning(sb, "Block bitmap same as inode bitmap (%llu)", 1051939e49aSRandy Dunlap (unsigned long long)input->block_bitmap); 106ac27a0ecSDave Kleikamp else if (inside(input->block_bitmap, input->inode_table, itend)) 10712062dddSEric Sandeen ext4_warning(sb, "Block bitmap (%llu) in inode table " 10812062dddSEric Sandeen "(%llu-%llu)", 1091939e49aSRandy Dunlap (unsigned long long)input->block_bitmap, 1101939e49aSRandy Dunlap (unsigned long long)input->inode_table, itend - 1); 111ac27a0ecSDave Kleikamp else if (inside(input->inode_bitmap, input->inode_table, itend)) 11212062dddSEric Sandeen ext4_warning(sb, "Inode bitmap (%llu) in inode table " 11312062dddSEric Sandeen "(%llu-%llu)", 1141939e49aSRandy Dunlap (unsigned long long)input->inode_bitmap, 1151939e49aSRandy Dunlap (unsigned long long)input->inode_table, itend - 1); 116ac27a0ecSDave Kleikamp else if (inside(input->block_bitmap, start, metaend)) 11712062dddSEric Sandeen ext4_warning(sb, "Block bitmap (%llu) in GDT table (%llu-%llu)", 1181939e49aSRandy Dunlap (unsigned long long)input->block_bitmap, 1191939e49aSRandy Dunlap start, metaend - 1); 120ac27a0ecSDave Kleikamp else if (inside(input->inode_bitmap, start, metaend)) 12112062dddSEric Sandeen ext4_warning(sb, "Inode bitmap (%llu) in GDT table (%llu-%llu)", 1221939e49aSRandy Dunlap (unsigned long long)input->inode_bitmap, 1231939e49aSRandy Dunlap start, metaend - 1); 124ac27a0ecSDave Kleikamp else if (inside(input->inode_table, start, metaend) || 125ac27a0ecSDave Kleikamp inside(itend - 1, start, metaend)) 12612062dddSEric Sandeen ext4_warning(sb, "Inode table (%llu-%llu) overlaps GDT table " 12712062dddSEric Sandeen "(%llu-%llu)", 1281939e49aSRandy Dunlap (unsigned long long)input->inode_table, 1291939e49aSRandy Dunlap itend - 1, start, metaend - 1); 130ac27a0ecSDave Kleikamp else 131ac27a0ecSDave Kleikamp err = 0; 132ac27a0ecSDave Kleikamp brelse(bh); 133ac27a0ecSDave Kleikamp 134ac27a0ecSDave Kleikamp return err; 135ac27a0ecSDave Kleikamp } 136ac27a0ecSDave Kleikamp 13728c7bac0SYongqiang Yang /* 13828c7bac0SYongqiang Yang * ext4_new_flex_group_data is used by 64bit-resize interface to add a flex 13928c7bac0SYongqiang Yang * group each time. 14028c7bac0SYongqiang Yang */ 14128c7bac0SYongqiang Yang struct ext4_new_flex_group_data { 14228c7bac0SYongqiang Yang struct ext4_new_group_data *groups; /* new_group_data for groups 14328c7bac0SYongqiang Yang in the flex group */ 14428c7bac0SYongqiang Yang __u16 *bg_flags; /* block group flags of groups 14528c7bac0SYongqiang Yang in @groups */ 14628c7bac0SYongqiang Yang ext4_group_t count; /* number of groups in @groups 14728c7bac0SYongqiang Yang */ 14828c7bac0SYongqiang Yang }; 14928c7bac0SYongqiang Yang 15028c7bac0SYongqiang Yang /* 15128c7bac0SYongqiang Yang * alloc_flex_gd() allocates a ext4_new_flex_group_data with size of 15228c7bac0SYongqiang Yang * @flexbg_size. 15328c7bac0SYongqiang Yang * 15428c7bac0SYongqiang Yang * Returns NULL on failure otherwise address of the allocated structure. 15528c7bac0SYongqiang Yang */ 15628c7bac0SYongqiang Yang static struct ext4_new_flex_group_data *alloc_flex_gd(unsigned long flexbg_size) 15728c7bac0SYongqiang Yang { 15828c7bac0SYongqiang Yang struct ext4_new_flex_group_data *flex_gd; 15928c7bac0SYongqiang Yang 16028c7bac0SYongqiang Yang flex_gd = kmalloc(sizeof(*flex_gd), GFP_NOFS); 16128c7bac0SYongqiang Yang if (flex_gd == NULL) 16228c7bac0SYongqiang Yang goto out3; 16328c7bac0SYongqiang Yang 16428c7bac0SYongqiang Yang flex_gd->count = flexbg_size; 16528c7bac0SYongqiang Yang 16628c7bac0SYongqiang Yang flex_gd->groups = kmalloc(sizeof(struct ext4_new_group_data) * 16728c7bac0SYongqiang Yang flexbg_size, GFP_NOFS); 16828c7bac0SYongqiang Yang if (flex_gd->groups == NULL) 16928c7bac0SYongqiang Yang goto out2; 17028c7bac0SYongqiang Yang 17128c7bac0SYongqiang Yang flex_gd->bg_flags = kmalloc(flexbg_size * sizeof(__u16), GFP_NOFS); 17228c7bac0SYongqiang Yang if (flex_gd->bg_flags == NULL) 17328c7bac0SYongqiang Yang goto out1; 17428c7bac0SYongqiang Yang 17528c7bac0SYongqiang Yang return flex_gd; 17628c7bac0SYongqiang Yang 17728c7bac0SYongqiang Yang out1: 17828c7bac0SYongqiang Yang kfree(flex_gd->groups); 17928c7bac0SYongqiang Yang out2: 18028c7bac0SYongqiang Yang kfree(flex_gd); 18128c7bac0SYongqiang Yang out3: 18228c7bac0SYongqiang Yang return NULL; 18328c7bac0SYongqiang Yang } 18428c7bac0SYongqiang Yang 18528c7bac0SYongqiang Yang static void free_flex_gd(struct ext4_new_flex_group_data *flex_gd) 18628c7bac0SYongqiang Yang { 18728c7bac0SYongqiang Yang kfree(flex_gd->bg_flags); 18828c7bac0SYongqiang Yang kfree(flex_gd->groups); 18928c7bac0SYongqiang Yang kfree(flex_gd); 19028c7bac0SYongqiang Yang } 19128c7bac0SYongqiang Yang 192*3fbea4b3SYongqiang Yang /* 193*3fbea4b3SYongqiang Yang * ext4_alloc_group_tables() allocates block bitmaps, inode bitmaps 194*3fbea4b3SYongqiang Yang * and inode tables for a flex group. 195*3fbea4b3SYongqiang Yang * 196*3fbea4b3SYongqiang Yang * This function is used by 64bit-resize. Note that this function allocates 197*3fbea4b3SYongqiang Yang * group tables from the 1st group of groups contained by @flexgd, which may 198*3fbea4b3SYongqiang Yang * be a partial of a flex group. 199*3fbea4b3SYongqiang Yang * 200*3fbea4b3SYongqiang Yang * @sb: super block of fs to which the groups belongs 201*3fbea4b3SYongqiang Yang */ 202*3fbea4b3SYongqiang Yang static void ext4_alloc_group_tables(struct super_block *sb, 203*3fbea4b3SYongqiang Yang struct ext4_new_flex_group_data *flex_gd, 204*3fbea4b3SYongqiang Yang int flexbg_size) 205*3fbea4b3SYongqiang Yang { 206*3fbea4b3SYongqiang Yang struct ext4_new_group_data *group_data = flex_gd->groups; 207*3fbea4b3SYongqiang Yang struct ext4_super_block *es = EXT4_SB(sb)->s_es; 208*3fbea4b3SYongqiang Yang ext4_fsblk_t start_blk; 209*3fbea4b3SYongqiang Yang ext4_fsblk_t last_blk; 210*3fbea4b3SYongqiang Yang ext4_group_t src_group; 211*3fbea4b3SYongqiang Yang ext4_group_t bb_index = 0; 212*3fbea4b3SYongqiang Yang ext4_group_t ib_index = 0; 213*3fbea4b3SYongqiang Yang ext4_group_t it_index = 0; 214*3fbea4b3SYongqiang Yang ext4_group_t group; 215*3fbea4b3SYongqiang Yang ext4_group_t last_group; 216*3fbea4b3SYongqiang Yang unsigned overhead; 217*3fbea4b3SYongqiang Yang 218*3fbea4b3SYongqiang Yang BUG_ON(flex_gd->count == 0 || group_data == NULL); 219*3fbea4b3SYongqiang Yang 220*3fbea4b3SYongqiang Yang src_group = group_data[0].group; 221*3fbea4b3SYongqiang Yang last_group = src_group + flex_gd->count - 1; 222*3fbea4b3SYongqiang Yang 223*3fbea4b3SYongqiang Yang BUG_ON((flexbg_size > 1) && ((src_group & ~(flexbg_size - 1)) != 224*3fbea4b3SYongqiang Yang (last_group & ~(flexbg_size - 1)))); 225*3fbea4b3SYongqiang Yang next_group: 226*3fbea4b3SYongqiang Yang group = group_data[0].group; 227*3fbea4b3SYongqiang Yang start_blk = ext4_group_first_block_no(sb, src_group); 228*3fbea4b3SYongqiang Yang last_blk = start_blk + group_data[src_group - group].blocks_count; 229*3fbea4b3SYongqiang Yang 230*3fbea4b3SYongqiang Yang overhead = ext4_bg_has_super(sb, src_group) ? 231*3fbea4b3SYongqiang Yang (1 + ext4_bg_num_gdb(sb, src_group) + 232*3fbea4b3SYongqiang Yang le16_to_cpu(es->s_reserved_gdt_blocks)) : 0; 233*3fbea4b3SYongqiang Yang 234*3fbea4b3SYongqiang Yang start_blk += overhead; 235*3fbea4b3SYongqiang Yang 236*3fbea4b3SYongqiang Yang BUG_ON(src_group >= group_data[0].group + flex_gd->count); 237*3fbea4b3SYongqiang Yang /* We collect contiguous blocks as much as possible. */ 238*3fbea4b3SYongqiang Yang src_group++; 239*3fbea4b3SYongqiang Yang for (; src_group <= last_group; src_group++) 240*3fbea4b3SYongqiang Yang if (!ext4_bg_has_super(sb, src_group)) 241*3fbea4b3SYongqiang Yang last_blk += group_data[src_group - group].blocks_count; 242*3fbea4b3SYongqiang Yang else 243*3fbea4b3SYongqiang Yang break; 244*3fbea4b3SYongqiang Yang 245*3fbea4b3SYongqiang Yang /* Allocate block bitmaps */ 246*3fbea4b3SYongqiang Yang for (; bb_index < flex_gd->count; bb_index++) { 247*3fbea4b3SYongqiang Yang if (start_blk >= last_blk) 248*3fbea4b3SYongqiang Yang goto next_group; 249*3fbea4b3SYongqiang Yang group_data[bb_index].block_bitmap = start_blk++; 250*3fbea4b3SYongqiang Yang ext4_get_group_no_and_offset(sb, start_blk - 1, &group, NULL); 251*3fbea4b3SYongqiang Yang group -= group_data[0].group; 252*3fbea4b3SYongqiang Yang group_data[group].free_blocks_count--; 253*3fbea4b3SYongqiang Yang if (flexbg_size > 1) 254*3fbea4b3SYongqiang Yang flex_gd->bg_flags[group] &= ~EXT4_BG_BLOCK_UNINIT; 255*3fbea4b3SYongqiang Yang } 256*3fbea4b3SYongqiang Yang 257*3fbea4b3SYongqiang Yang /* Allocate inode bitmaps */ 258*3fbea4b3SYongqiang Yang for (; ib_index < flex_gd->count; ib_index++) { 259*3fbea4b3SYongqiang Yang if (start_blk >= last_blk) 260*3fbea4b3SYongqiang Yang goto next_group; 261*3fbea4b3SYongqiang Yang group_data[ib_index].inode_bitmap = start_blk++; 262*3fbea4b3SYongqiang Yang ext4_get_group_no_and_offset(sb, start_blk - 1, &group, NULL); 263*3fbea4b3SYongqiang Yang group -= group_data[0].group; 264*3fbea4b3SYongqiang Yang group_data[group].free_blocks_count--; 265*3fbea4b3SYongqiang Yang if (flexbg_size > 1) 266*3fbea4b3SYongqiang Yang flex_gd->bg_flags[group] &= ~EXT4_BG_BLOCK_UNINIT; 267*3fbea4b3SYongqiang Yang } 268*3fbea4b3SYongqiang Yang 269*3fbea4b3SYongqiang Yang /* Allocate inode tables */ 270*3fbea4b3SYongqiang Yang for (; it_index < flex_gd->count; it_index++) { 271*3fbea4b3SYongqiang Yang if (start_blk + EXT4_SB(sb)->s_itb_per_group > last_blk) 272*3fbea4b3SYongqiang Yang goto next_group; 273*3fbea4b3SYongqiang Yang group_data[it_index].inode_table = start_blk; 274*3fbea4b3SYongqiang Yang ext4_get_group_no_and_offset(sb, start_blk, &group, NULL); 275*3fbea4b3SYongqiang Yang group -= group_data[0].group; 276*3fbea4b3SYongqiang Yang group_data[group].free_blocks_count -= 277*3fbea4b3SYongqiang Yang EXT4_SB(sb)->s_itb_per_group; 278*3fbea4b3SYongqiang Yang if (flexbg_size > 1) 279*3fbea4b3SYongqiang Yang flex_gd->bg_flags[group] &= ~EXT4_BG_BLOCK_UNINIT; 280*3fbea4b3SYongqiang Yang 281*3fbea4b3SYongqiang Yang start_blk += EXT4_SB(sb)->s_itb_per_group; 282*3fbea4b3SYongqiang Yang } 283*3fbea4b3SYongqiang Yang 284*3fbea4b3SYongqiang Yang if (test_opt(sb, DEBUG)) { 285*3fbea4b3SYongqiang Yang int i; 286*3fbea4b3SYongqiang Yang group = group_data[0].group; 287*3fbea4b3SYongqiang Yang 288*3fbea4b3SYongqiang Yang printk(KERN_DEBUG "EXT4-fs: adding a flex group with " 289*3fbea4b3SYongqiang Yang "%d groups, flexbg size is %d:\n", flex_gd->count, 290*3fbea4b3SYongqiang Yang flexbg_size); 291*3fbea4b3SYongqiang Yang 292*3fbea4b3SYongqiang Yang for (i = 0; i < flex_gd->count; i++) { 293*3fbea4b3SYongqiang Yang printk(KERN_DEBUG "adding %s group %u: %u " 294*3fbea4b3SYongqiang Yang "blocks (%d free)\n", 295*3fbea4b3SYongqiang Yang ext4_bg_has_super(sb, group + i) ? "normal" : 296*3fbea4b3SYongqiang Yang "no-super", group + i, 297*3fbea4b3SYongqiang Yang group_data[i].blocks_count, 298*3fbea4b3SYongqiang Yang group_data[i].free_blocks_count); 299*3fbea4b3SYongqiang Yang } 300*3fbea4b3SYongqiang Yang } 301*3fbea4b3SYongqiang Yang } 302*3fbea4b3SYongqiang Yang 303ac27a0ecSDave Kleikamp static struct buffer_head *bclean(handle_t *handle, struct super_block *sb, 304617ba13bSMingming Cao ext4_fsblk_t blk) 305ac27a0ecSDave Kleikamp { 306ac27a0ecSDave Kleikamp struct buffer_head *bh; 307ac27a0ecSDave Kleikamp int err; 308ac27a0ecSDave Kleikamp 309ac27a0ecSDave Kleikamp bh = sb_getblk(sb, blk); 310ac27a0ecSDave Kleikamp if (!bh) 311ac27a0ecSDave Kleikamp return ERR_PTR(-EIO); 312617ba13bSMingming Cao if ((err = ext4_journal_get_write_access(handle, bh))) { 313ac27a0ecSDave Kleikamp brelse(bh); 314ac27a0ecSDave Kleikamp bh = ERR_PTR(err); 315ac27a0ecSDave Kleikamp } else { 316ac27a0ecSDave Kleikamp memset(bh->b_data, 0, sb->s_blocksize); 317ac27a0ecSDave Kleikamp set_buffer_uptodate(bh); 318ac27a0ecSDave Kleikamp } 319ac27a0ecSDave Kleikamp 320ac27a0ecSDave Kleikamp return bh; 321ac27a0ecSDave Kleikamp } 322ac27a0ecSDave Kleikamp 323ac27a0ecSDave Kleikamp /* 32414904107SEric Sandeen * If we have fewer than thresh credits, extend by EXT4_MAX_TRANS_DATA. 32514904107SEric Sandeen * If that fails, restart the transaction & regain write access for the 32614904107SEric Sandeen * buffer head which is used for block_bitmap modifications. 32714904107SEric Sandeen */ 3286d40bc5aSYongqiang Yang static int extend_or_restart_transaction(handle_t *handle, int thresh) 32914904107SEric Sandeen { 33014904107SEric Sandeen int err; 33114904107SEric Sandeen 3320390131bSFrank Mayhar if (ext4_handle_has_enough_credits(handle, thresh)) 33314904107SEric Sandeen return 0; 33414904107SEric Sandeen 33514904107SEric Sandeen err = ext4_journal_extend(handle, EXT4_MAX_TRANS_DATA); 33614904107SEric Sandeen if (err < 0) 33714904107SEric Sandeen return err; 33814904107SEric Sandeen if (err) { 3396d40bc5aSYongqiang Yang err = ext4_journal_restart(handle, EXT4_MAX_TRANS_DATA); 3406d40bc5aSYongqiang Yang if (err) 34114904107SEric Sandeen return err; 34214904107SEric Sandeen } 34314904107SEric Sandeen 34414904107SEric Sandeen return 0; 34514904107SEric Sandeen } 34614904107SEric Sandeen 34714904107SEric Sandeen /* 34833afdcc5SYongqiang Yang * set_flexbg_block_bitmap() mark @count blocks starting from @block used. 34933afdcc5SYongqiang Yang * 35033afdcc5SYongqiang Yang * Helper function for ext4_setup_new_group_blocks() which set . 35133afdcc5SYongqiang Yang * 35233afdcc5SYongqiang Yang * @sb: super block 35333afdcc5SYongqiang Yang * @handle: journal handle 35433afdcc5SYongqiang Yang * @flex_gd: flex group data 35533afdcc5SYongqiang Yang */ 35633afdcc5SYongqiang Yang static int set_flexbg_block_bitmap(struct super_block *sb, handle_t *handle, 35733afdcc5SYongqiang Yang struct ext4_new_flex_group_data *flex_gd, 35833afdcc5SYongqiang Yang ext4_fsblk_t block, ext4_group_t count) 35933afdcc5SYongqiang Yang { 36033afdcc5SYongqiang Yang ext4_group_t count2; 36133afdcc5SYongqiang Yang 36233afdcc5SYongqiang Yang ext4_debug("mark blocks [%llu/%u] used\n", block, count); 36333afdcc5SYongqiang Yang for (count2 = count; count > 0; count -= count2, block += count2) { 36433afdcc5SYongqiang Yang ext4_fsblk_t start; 36533afdcc5SYongqiang Yang struct buffer_head *bh; 36633afdcc5SYongqiang Yang ext4_group_t group; 36733afdcc5SYongqiang Yang int err; 36833afdcc5SYongqiang Yang 36933afdcc5SYongqiang Yang ext4_get_group_no_and_offset(sb, block, &group, NULL); 37033afdcc5SYongqiang Yang start = ext4_group_first_block_no(sb, group); 37133afdcc5SYongqiang Yang group -= flex_gd->groups[0].group; 37233afdcc5SYongqiang Yang 37333afdcc5SYongqiang Yang count2 = sb->s_blocksize * 8 - (block - start); 37433afdcc5SYongqiang Yang if (count2 > count) 37533afdcc5SYongqiang Yang count2 = count; 37633afdcc5SYongqiang Yang 37733afdcc5SYongqiang Yang if (flex_gd->bg_flags[group] & EXT4_BG_BLOCK_UNINIT) { 37833afdcc5SYongqiang Yang BUG_ON(flex_gd->count > 1); 37933afdcc5SYongqiang Yang continue; 38033afdcc5SYongqiang Yang } 38133afdcc5SYongqiang Yang 38233afdcc5SYongqiang Yang err = extend_or_restart_transaction(handle, 1); 38333afdcc5SYongqiang Yang if (err) 38433afdcc5SYongqiang Yang return err; 38533afdcc5SYongqiang Yang 38633afdcc5SYongqiang Yang bh = sb_getblk(sb, flex_gd->groups[group].block_bitmap); 38733afdcc5SYongqiang Yang if (!bh) 38833afdcc5SYongqiang Yang return -EIO; 38933afdcc5SYongqiang Yang 39033afdcc5SYongqiang Yang err = ext4_journal_get_write_access(handle, bh); 39133afdcc5SYongqiang Yang if (err) 39233afdcc5SYongqiang Yang return err; 39333afdcc5SYongqiang Yang ext4_debug("mark block bitmap %#04llx (+%llu/%u)\n", block, 39433afdcc5SYongqiang Yang block - start, count2); 39533afdcc5SYongqiang Yang ext4_set_bits(bh->b_data, block - start, count2); 39633afdcc5SYongqiang Yang 39733afdcc5SYongqiang Yang err = ext4_handle_dirty_metadata(handle, NULL, bh); 39833afdcc5SYongqiang Yang if (unlikely(err)) 39933afdcc5SYongqiang Yang return err; 40033afdcc5SYongqiang Yang brelse(bh); 40133afdcc5SYongqiang Yang } 40233afdcc5SYongqiang Yang 40333afdcc5SYongqiang Yang return 0; 40433afdcc5SYongqiang Yang } 40533afdcc5SYongqiang Yang 40633afdcc5SYongqiang Yang /* 40733afdcc5SYongqiang Yang * Set up the block and inode bitmaps, and the inode table for the new groups. 40833afdcc5SYongqiang Yang * This doesn't need to be part of the main transaction, since we are only 40933afdcc5SYongqiang Yang * changing blocks outside the actual filesystem. We still do journaling to 41033afdcc5SYongqiang Yang * ensure the recovery is correct in case of a failure just after resize. 41133afdcc5SYongqiang Yang * If any part of this fails, we simply abort the resize. 41233afdcc5SYongqiang Yang * 41333afdcc5SYongqiang Yang * setup_new_flex_group_blocks handles a flex group as follow: 41433afdcc5SYongqiang Yang * 1. copy super block and GDT, and initialize group tables if necessary. 41533afdcc5SYongqiang Yang * In this step, we only set bits in blocks bitmaps for blocks taken by 41633afdcc5SYongqiang Yang * super block and GDT. 41733afdcc5SYongqiang Yang * 2. allocate group tables in block bitmaps, that is, set bits in block 41833afdcc5SYongqiang Yang * bitmap for blocks taken by group tables. 41933afdcc5SYongqiang Yang */ 42033afdcc5SYongqiang Yang static int setup_new_flex_group_blocks(struct super_block *sb, 42133afdcc5SYongqiang Yang struct ext4_new_flex_group_data *flex_gd) 42233afdcc5SYongqiang Yang { 42333afdcc5SYongqiang Yang int group_table_count[] = {1, 1, EXT4_SB(sb)->s_itb_per_group}; 42433afdcc5SYongqiang Yang ext4_fsblk_t start; 42533afdcc5SYongqiang Yang ext4_fsblk_t block; 42633afdcc5SYongqiang Yang struct ext4_sb_info *sbi = EXT4_SB(sb); 42733afdcc5SYongqiang Yang struct ext4_super_block *es = sbi->s_es; 42833afdcc5SYongqiang Yang struct ext4_new_group_data *group_data = flex_gd->groups; 42933afdcc5SYongqiang Yang __u16 *bg_flags = flex_gd->bg_flags; 43033afdcc5SYongqiang Yang handle_t *handle; 43133afdcc5SYongqiang Yang ext4_group_t group, count; 43233afdcc5SYongqiang Yang struct buffer_head *bh = NULL; 43333afdcc5SYongqiang Yang int reserved_gdb, i, j, err = 0, err2; 43433afdcc5SYongqiang Yang 43533afdcc5SYongqiang Yang BUG_ON(!flex_gd->count || !group_data || 43633afdcc5SYongqiang Yang group_data[0].group != sbi->s_groups_count); 43733afdcc5SYongqiang Yang 43833afdcc5SYongqiang Yang reserved_gdb = le16_to_cpu(es->s_reserved_gdt_blocks); 43933afdcc5SYongqiang Yang 44033afdcc5SYongqiang Yang /* This transaction may be extended/restarted along the way */ 44133afdcc5SYongqiang Yang handle = ext4_journal_start_sb(sb, EXT4_MAX_TRANS_DATA); 44233afdcc5SYongqiang Yang if (IS_ERR(handle)) 44333afdcc5SYongqiang Yang return PTR_ERR(handle); 44433afdcc5SYongqiang Yang 44533afdcc5SYongqiang Yang group = group_data[0].group; 44633afdcc5SYongqiang Yang for (i = 0; i < flex_gd->count; i++, group++) { 44733afdcc5SYongqiang Yang unsigned long gdblocks; 44833afdcc5SYongqiang Yang 44933afdcc5SYongqiang Yang gdblocks = ext4_bg_num_gdb(sb, group); 45033afdcc5SYongqiang Yang start = ext4_group_first_block_no(sb, group); 45133afdcc5SYongqiang Yang 45233afdcc5SYongqiang Yang /* Copy all of the GDT blocks into the backup in this group */ 45333afdcc5SYongqiang Yang for (j = 0, block = start + 1; j < gdblocks; j++, block++) { 45433afdcc5SYongqiang Yang struct buffer_head *gdb; 45533afdcc5SYongqiang Yang 45633afdcc5SYongqiang Yang ext4_debug("update backup group %#04llx\n", block); 45733afdcc5SYongqiang Yang err = extend_or_restart_transaction(handle, 1); 45833afdcc5SYongqiang Yang if (err) 45933afdcc5SYongqiang Yang goto out; 46033afdcc5SYongqiang Yang 46133afdcc5SYongqiang Yang gdb = sb_getblk(sb, block); 46233afdcc5SYongqiang Yang if (!gdb) { 46333afdcc5SYongqiang Yang err = -EIO; 46433afdcc5SYongqiang Yang goto out; 46533afdcc5SYongqiang Yang } 46633afdcc5SYongqiang Yang 46733afdcc5SYongqiang Yang err = ext4_journal_get_write_access(handle, gdb); 46833afdcc5SYongqiang Yang if (err) { 46933afdcc5SYongqiang Yang brelse(gdb); 47033afdcc5SYongqiang Yang goto out; 47133afdcc5SYongqiang Yang } 47233afdcc5SYongqiang Yang memcpy(gdb->b_data, sbi->s_group_desc[j]->b_data, 47333afdcc5SYongqiang Yang gdb->b_size); 47433afdcc5SYongqiang Yang set_buffer_uptodate(gdb); 47533afdcc5SYongqiang Yang 47633afdcc5SYongqiang Yang err = ext4_handle_dirty_metadata(handle, NULL, gdb); 47733afdcc5SYongqiang Yang if (unlikely(err)) { 47833afdcc5SYongqiang Yang brelse(gdb); 47933afdcc5SYongqiang Yang goto out; 48033afdcc5SYongqiang Yang } 48133afdcc5SYongqiang Yang brelse(gdb); 48233afdcc5SYongqiang Yang } 48333afdcc5SYongqiang Yang 48433afdcc5SYongqiang Yang /* Zero out all of the reserved backup group descriptor 48533afdcc5SYongqiang Yang * table blocks 48633afdcc5SYongqiang Yang */ 48733afdcc5SYongqiang Yang if (ext4_bg_has_super(sb, group)) { 48833afdcc5SYongqiang Yang err = sb_issue_zeroout(sb, gdblocks + start + 1, 48933afdcc5SYongqiang Yang reserved_gdb, GFP_NOFS); 49033afdcc5SYongqiang Yang if (err) 49133afdcc5SYongqiang Yang goto out; 49233afdcc5SYongqiang Yang } 49333afdcc5SYongqiang Yang 49433afdcc5SYongqiang Yang /* Initialize group tables of the grop @group */ 49533afdcc5SYongqiang Yang if (!(bg_flags[i] & EXT4_BG_INODE_ZEROED)) 49633afdcc5SYongqiang Yang goto handle_bb; 49733afdcc5SYongqiang Yang 49833afdcc5SYongqiang Yang /* Zero out all of the inode table blocks */ 49933afdcc5SYongqiang Yang block = group_data[i].inode_table; 50033afdcc5SYongqiang Yang ext4_debug("clear inode table blocks %#04llx -> %#04lx\n", 50133afdcc5SYongqiang Yang block, sbi->s_itb_per_group); 50233afdcc5SYongqiang Yang err = sb_issue_zeroout(sb, block, sbi->s_itb_per_group, 50333afdcc5SYongqiang Yang GFP_NOFS); 50433afdcc5SYongqiang Yang if (err) 50533afdcc5SYongqiang Yang goto out; 50633afdcc5SYongqiang Yang 50733afdcc5SYongqiang Yang handle_bb: 50833afdcc5SYongqiang Yang if (bg_flags[i] & EXT4_BG_BLOCK_UNINIT) 50933afdcc5SYongqiang Yang goto handle_ib; 51033afdcc5SYongqiang Yang 51133afdcc5SYongqiang Yang /* Initialize block bitmap of the @group */ 51233afdcc5SYongqiang Yang block = group_data[i].block_bitmap; 51333afdcc5SYongqiang Yang err = extend_or_restart_transaction(handle, 1); 51433afdcc5SYongqiang Yang if (err) 51533afdcc5SYongqiang Yang goto out; 51633afdcc5SYongqiang Yang 51733afdcc5SYongqiang Yang bh = bclean(handle, sb, block); 51833afdcc5SYongqiang Yang if (IS_ERR(bh)) { 51933afdcc5SYongqiang Yang err = PTR_ERR(bh); 52033afdcc5SYongqiang Yang goto out; 52133afdcc5SYongqiang Yang } 52233afdcc5SYongqiang Yang if (ext4_bg_has_super(sb, group)) { 52333afdcc5SYongqiang Yang ext4_debug("mark backup superblock %#04llx (+0)\n", 52433afdcc5SYongqiang Yang start); 52533afdcc5SYongqiang Yang ext4_set_bits(bh->b_data, 0, gdblocks + reserved_gdb + 52633afdcc5SYongqiang Yang 1); 52733afdcc5SYongqiang Yang } 52833afdcc5SYongqiang Yang ext4_mark_bitmap_end(group_data[i].blocks_count, 52933afdcc5SYongqiang Yang sb->s_blocksize * 8, bh->b_data); 53033afdcc5SYongqiang Yang err = ext4_handle_dirty_metadata(handle, NULL, bh); 53133afdcc5SYongqiang Yang if (err) 53233afdcc5SYongqiang Yang goto out; 53333afdcc5SYongqiang Yang brelse(bh); 53433afdcc5SYongqiang Yang 53533afdcc5SYongqiang Yang handle_ib: 53633afdcc5SYongqiang Yang if (bg_flags[i] & EXT4_BG_INODE_UNINIT) 53733afdcc5SYongqiang Yang continue; 53833afdcc5SYongqiang Yang 53933afdcc5SYongqiang Yang /* Initialize inode bitmap of the @group */ 54033afdcc5SYongqiang Yang block = group_data[i].inode_bitmap; 54133afdcc5SYongqiang Yang err = extend_or_restart_transaction(handle, 1); 54233afdcc5SYongqiang Yang if (err) 54333afdcc5SYongqiang Yang goto out; 54433afdcc5SYongqiang Yang /* Mark unused entries in inode bitmap used */ 54533afdcc5SYongqiang Yang bh = bclean(handle, sb, block); 54633afdcc5SYongqiang Yang if (IS_ERR(bh)) { 54733afdcc5SYongqiang Yang err = PTR_ERR(bh); 54833afdcc5SYongqiang Yang goto out; 54933afdcc5SYongqiang Yang } 55033afdcc5SYongqiang Yang 55133afdcc5SYongqiang Yang ext4_mark_bitmap_end(EXT4_INODES_PER_GROUP(sb), 55233afdcc5SYongqiang Yang sb->s_blocksize * 8, bh->b_data); 55333afdcc5SYongqiang Yang err = ext4_handle_dirty_metadata(handle, NULL, bh); 55433afdcc5SYongqiang Yang if (err) 55533afdcc5SYongqiang Yang goto out; 55633afdcc5SYongqiang Yang brelse(bh); 55733afdcc5SYongqiang Yang } 55833afdcc5SYongqiang Yang bh = NULL; 55933afdcc5SYongqiang Yang 56033afdcc5SYongqiang Yang /* Mark group tables in block bitmap */ 56133afdcc5SYongqiang Yang for (j = 0; j < GROUP_TABLE_COUNT; j++) { 56233afdcc5SYongqiang Yang count = group_table_count[j]; 56333afdcc5SYongqiang Yang start = (&group_data[0].block_bitmap)[j]; 56433afdcc5SYongqiang Yang block = start; 56533afdcc5SYongqiang Yang for (i = 1; i < flex_gd->count; i++) { 56633afdcc5SYongqiang Yang block += group_table_count[j]; 56733afdcc5SYongqiang Yang if (block == (&group_data[i].block_bitmap)[j]) { 56833afdcc5SYongqiang Yang count += group_table_count[j]; 56933afdcc5SYongqiang Yang continue; 57033afdcc5SYongqiang Yang } 57133afdcc5SYongqiang Yang err = set_flexbg_block_bitmap(sb, handle, 57233afdcc5SYongqiang Yang flex_gd, start, count); 57333afdcc5SYongqiang Yang if (err) 57433afdcc5SYongqiang Yang goto out; 57533afdcc5SYongqiang Yang count = group_table_count[j]; 57633afdcc5SYongqiang Yang start = group_data[i].block_bitmap; 57733afdcc5SYongqiang Yang block = start; 57833afdcc5SYongqiang Yang } 57933afdcc5SYongqiang Yang 58033afdcc5SYongqiang Yang if (count) { 58133afdcc5SYongqiang Yang err = set_flexbg_block_bitmap(sb, handle, 58233afdcc5SYongqiang Yang flex_gd, start, count); 58333afdcc5SYongqiang Yang if (err) 58433afdcc5SYongqiang Yang goto out; 58533afdcc5SYongqiang Yang } 58633afdcc5SYongqiang Yang } 58733afdcc5SYongqiang Yang 58833afdcc5SYongqiang Yang out: 58933afdcc5SYongqiang Yang brelse(bh); 59033afdcc5SYongqiang Yang err2 = ext4_journal_stop(handle); 59133afdcc5SYongqiang Yang if (err2 && !err) 59233afdcc5SYongqiang Yang err = err2; 59333afdcc5SYongqiang Yang 59433afdcc5SYongqiang Yang return err; 59533afdcc5SYongqiang Yang } 59633afdcc5SYongqiang Yang 59733afdcc5SYongqiang Yang /* 598ac27a0ecSDave Kleikamp * Set up the block and inode bitmaps, and the inode table for the new group. 599ac27a0ecSDave Kleikamp * This doesn't need to be part of the main transaction, since we are only 600ac27a0ecSDave Kleikamp * changing blocks outside the actual filesystem. We still do journaling to 601ac27a0ecSDave Kleikamp * ensure the recovery is correct in case of a failure just after resize. 602ac27a0ecSDave Kleikamp * If any part of this fails, we simply abort the resize. 603ac27a0ecSDave Kleikamp */ 604ac27a0ecSDave Kleikamp static int setup_new_group_blocks(struct super_block *sb, 605617ba13bSMingming Cao struct ext4_new_group_data *input) 606ac27a0ecSDave Kleikamp { 607617ba13bSMingming Cao struct ext4_sb_info *sbi = EXT4_SB(sb); 608617ba13bSMingming Cao ext4_fsblk_t start = ext4_group_first_block_no(sb, input->group); 609617ba13bSMingming Cao int reserved_gdb = ext4_bg_has_super(sb, input->group) ? 610ac27a0ecSDave Kleikamp le16_to_cpu(sbi->s_es->s_reserved_gdt_blocks) : 0; 611617ba13bSMingming Cao unsigned long gdblocks = ext4_bg_num_gdb(sb, input->group); 612ac27a0ecSDave Kleikamp struct buffer_head *bh; 613ac27a0ecSDave Kleikamp handle_t *handle; 614617ba13bSMingming Cao ext4_fsblk_t block; 615617ba13bSMingming Cao ext4_grpblk_t bit; 616ac27a0ecSDave Kleikamp int i; 617ac27a0ecSDave Kleikamp int err = 0, err2; 618ac27a0ecSDave Kleikamp 61914904107SEric Sandeen /* This transaction may be extended/restarted along the way */ 62014904107SEric Sandeen handle = ext4_journal_start_sb(sb, EXT4_MAX_TRANS_DATA); 62114904107SEric Sandeen 622ac27a0ecSDave Kleikamp if (IS_ERR(handle)) 623ac27a0ecSDave Kleikamp return PTR_ERR(handle); 624ac27a0ecSDave Kleikamp 6258f82f840SYongqiang Yang BUG_ON(input->group != sbi->s_groups_count); 626ac27a0ecSDave Kleikamp 627ac27a0ecSDave Kleikamp /* Copy all of the GDT blocks into the backup in this group */ 628ac27a0ecSDave Kleikamp for (i = 0, bit = 1, block = start + 1; 629ac27a0ecSDave Kleikamp i < gdblocks; i++, block++, bit++) { 630ac27a0ecSDave Kleikamp struct buffer_head *gdb; 631ac27a0ecSDave Kleikamp 632c549a95dSEric Sandeen ext4_debug("update backup group %#04llx (+%d)\n", block, bit); 6336d40bc5aSYongqiang Yang err = extend_or_restart_transaction(handle, 1); 6346d40bc5aSYongqiang Yang if (err) 6356d40bc5aSYongqiang Yang goto exit_journal; 63614904107SEric Sandeen 637ac27a0ecSDave Kleikamp gdb = sb_getblk(sb, block); 638ac27a0ecSDave Kleikamp if (!gdb) { 639ac27a0ecSDave Kleikamp err = -EIO; 6406d40bc5aSYongqiang Yang goto exit_journal; 641ac27a0ecSDave Kleikamp } 642617ba13bSMingming Cao if ((err = ext4_journal_get_write_access(handle, gdb))) { 643ac27a0ecSDave Kleikamp brelse(gdb); 6446d40bc5aSYongqiang Yang goto exit_journal; 645ac27a0ecSDave Kleikamp } 6465b615287SEric Sandeen memcpy(gdb->b_data, sbi->s_group_desc[i]->b_data, gdb->b_size); 647ac27a0ecSDave Kleikamp set_buffer_uptodate(gdb); 648b4097142STheodore Ts'o err = ext4_handle_dirty_metadata(handle, NULL, gdb); 649b4097142STheodore Ts'o if (unlikely(err)) { 650b4097142STheodore Ts'o brelse(gdb); 6516d40bc5aSYongqiang Yang goto exit_journal; 652b4097142STheodore Ts'o } 653ac27a0ecSDave Kleikamp brelse(gdb); 654ac27a0ecSDave Kleikamp } 655ac27a0ecSDave Kleikamp 656ac27a0ecSDave Kleikamp /* Zero out all of the reserved backup group descriptor table blocks */ 657da488945STheodore Ts'o ext4_debug("clear inode table blocks %#04llx -> %#04lx\n", 658a31437b8SLukas Czerner block, sbi->s_itb_per_group); 659a31437b8SLukas Czerner err = sb_issue_zeroout(sb, gdblocks + start + 1, reserved_gdb, 660a107e5a3STheodore Ts'o GFP_NOFS); 661a31437b8SLukas Czerner if (err) 6626d40bc5aSYongqiang Yang goto exit_journal; 6636d40bc5aSYongqiang Yang 6646d40bc5aSYongqiang Yang err = extend_or_restart_transaction(handle, 2); 6656d40bc5aSYongqiang Yang if (err) 6666d40bc5aSYongqiang Yang goto exit_journal; 6676d40bc5aSYongqiang Yang 6686d40bc5aSYongqiang Yang bh = bclean(handle, sb, input->block_bitmap); 6696d40bc5aSYongqiang Yang if (IS_ERR(bh)) { 6706d40bc5aSYongqiang Yang err = PTR_ERR(bh); 6716d40bc5aSYongqiang Yang goto exit_journal; 6726d40bc5aSYongqiang Yang } 673c3e94d1dSYongqiang Yang 674c3e94d1dSYongqiang Yang if (ext4_bg_has_super(sb, input->group)) { 675c3e94d1dSYongqiang Yang ext4_debug("mark backup group tables %#04llx (+0)\n", start); 676c3e94d1dSYongqiang Yang ext4_set_bits(bh->b_data, 0, gdblocks + reserved_gdb + 1); 677c3e94d1dSYongqiang Yang } 67814904107SEric Sandeen 679c549a95dSEric Sandeen ext4_debug("mark block bitmap %#04llx (+%llu)\n", input->block_bitmap, 680ac27a0ecSDave Kleikamp input->block_bitmap - start); 681617ba13bSMingming Cao ext4_set_bit(input->block_bitmap - start, bh->b_data); 682c549a95dSEric Sandeen ext4_debug("mark inode bitmap %#04llx (+%llu)\n", input->inode_bitmap, 683ac27a0ecSDave Kleikamp input->inode_bitmap - start); 684617ba13bSMingming Cao ext4_set_bit(input->inode_bitmap - start, bh->b_data); 685ac27a0ecSDave Kleikamp 686ac27a0ecSDave Kleikamp /* Zero out all of the inode table blocks */ 687a31437b8SLukas Czerner block = input->inode_table; 688da488945STheodore Ts'o ext4_debug("clear inode table blocks %#04llx -> %#04lx\n", 689a31437b8SLukas Czerner block, sbi->s_itb_per_group); 690a107e5a3STheodore Ts'o err = sb_issue_zeroout(sb, block, sbi->s_itb_per_group, GFP_NOFS); 691a31437b8SLukas Czerner if (err) 69214904107SEric Sandeen goto exit_bh; 693c3e94d1dSYongqiang Yang ext4_set_bits(bh->b_data, input->inode_table - start, 694c3e94d1dSYongqiang Yang sbi->s_itb_per_group); 69514904107SEric Sandeen 69614904107SEric Sandeen 69761d08673STheodore Ts'o ext4_mark_bitmap_end(input->blocks_count, sb->s_blocksize * 8, 69861d08673STheodore Ts'o bh->b_data); 699b4097142STheodore Ts'o err = ext4_handle_dirty_metadata(handle, NULL, bh); 700b4097142STheodore Ts'o if (unlikely(err)) { 701b4097142STheodore Ts'o ext4_std_error(sb, err); 702b4097142STheodore Ts'o goto exit_bh; 703b4097142STheodore Ts'o } 704ac27a0ecSDave Kleikamp brelse(bh); 705ac27a0ecSDave Kleikamp /* Mark unused entries in inode bitmap used */ 706c549a95dSEric Sandeen ext4_debug("clear inode bitmap %#04llx (+%llu)\n", 707ac27a0ecSDave Kleikamp input->inode_bitmap, input->inode_bitmap - start); 708ac27a0ecSDave Kleikamp if (IS_ERR(bh = bclean(handle, sb, input->inode_bitmap))) { 709ac27a0ecSDave Kleikamp err = PTR_ERR(bh); 710ac27a0ecSDave Kleikamp goto exit_journal; 711ac27a0ecSDave Kleikamp } 712ac27a0ecSDave Kleikamp 71361d08673STheodore Ts'o ext4_mark_bitmap_end(EXT4_INODES_PER_GROUP(sb), sb->s_blocksize * 8, 714ac27a0ecSDave Kleikamp bh->b_data); 715b4097142STheodore Ts'o err = ext4_handle_dirty_metadata(handle, NULL, bh); 716b4097142STheodore Ts'o if (unlikely(err)) 717b4097142STheodore Ts'o ext4_std_error(sb, err); 718ac27a0ecSDave Kleikamp exit_bh: 719ac27a0ecSDave Kleikamp brelse(bh); 720ac27a0ecSDave Kleikamp 721ac27a0ecSDave Kleikamp exit_journal: 722617ba13bSMingming Cao if ((err2 = ext4_journal_stop(handle)) && !err) 723ac27a0ecSDave Kleikamp err = err2; 724ac27a0ecSDave Kleikamp 725ac27a0ecSDave Kleikamp return err; 726ac27a0ecSDave Kleikamp } 727ac27a0ecSDave Kleikamp 728ac27a0ecSDave Kleikamp /* 729ac27a0ecSDave Kleikamp * Iterate through the groups which hold BACKUP superblock/GDT copies in an 730617ba13bSMingming Cao * ext4 filesystem. The counters should be initialized to 1, 5, and 7 before 731ac27a0ecSDave Kleikamp * calling this for the first time. In a sparse filesystem it will be the 732ac27a0ecSDave Kleikamp * sequence of powers of 3, 5, and 7: 1, 3, 5, 7, 9, 25, 27, 49, 81, ... 733ac27a0ecSDave Kleikamp * For a non-sparse filesystem it will be every group: 1, 2, 3, 4, ... 734ac27a0ecSDave Kleikamp */ 735617ba13bSMingming Cao static unsigned ext4_list_backups(struct super_block *sb, unsigned *three, 736ac27a0ecSDave Kleikamp unsigned *five, unsigned *seven) 737ac27a0ecSDave Kleikamp { 738ac27a0ecSDave Kleikamp unsigned *min = three; 739ac27a0ecSDave Kleikamp int mult = 3; 740ac27a0ecSDave Kleikamp unsigned ret; 741ac27a0ecSDave Kleikamp 742617ba13bSMingming Cao if (!EXT4_HAS_RO_COMPAT_FEATURE(sb, 743617ba13bSMingming Cao EXT4_FEATURE_RO_COMPAT_SPARSE_SUPER)) { 744ac27a0ecSDave Kleikamp ret = *min; 745ac27a0ecSDave Kleikamp *min += 1; 746ac27a0ecSDave Kleikamp return ret; 747ac27a0ecSDave Kleikamp } 748ac27a0ecSDave Kleikamp 749ac27a0ecSDave Kleikamp if (*five < *min) { 750ac27a0ecSDave Kleikamp min = five; 751ac27a0ecSDave Kleikamp mult = 5; 752ac27a0ecSDave Kleikamp } 753ac27a0ecSDave Kleikamp if (*seven < *min) { 754ac27a0ecSDave Kleikamp min = seven; 755ac27a0ecSDave Kleikamp mult = 7; 756ac27a0ecSDave Kleikamp } 757ac27a0ecSDave Kleikamp 758ac27a0ecSDave Kleikamp ret = *min; 759ac27a0ecSDave Kleikamp *min *= mult; 760ac27a0ecSDave Kleikamp 761ac27a0ecSDave Kleikamp return ret; 762ac27a0ecSDave Kleikamp } 763ac27a0ecSDave Kleikamp 764ac27a0ecSDave Kleikamp /* 765ac27a0ecSDave Kleikamp * Check that all of the backup GDT blocks are held in the primary GDT block. 766ac27a0ecSDave Kleikamp * It is assumed that they are stored in group order. Returns the number of 767ac27a0ecSDave Kleikamp * groups in current filesystem that have BACKUPS, or -ve error code. 768ac27a0ecSDave Kleikamp */ 769ac27a0ecSDave Kleikamp static int verify_reserved_gdb(struct super_block *sb, 770c72df9f9SYongqiang Yang ext4_group_t end, 771ac27a0ecSDave Kleikamp struct buffer_head *primary) 772ac27a0ecSDave Kleikamp { 773617ba13bSMingming Cao const ext4_fsblk_t blk = primary->b_blocknr; 774ac27a0ecSDave Kleikamp unsigned three = 1; 775ac27a0ecSDave Kleikamp unsigned five = 5; 776ac27a0ecSDave Kleikamp unsigned seven = 7; 777ac27a0ecSDave Kleikamp unsigned grp; 778ac27a0ecSDave Kleikamp __le32 *p = (__le32 *)primary->b_data; 779ac27a0ecSDave Kleikamp int gdbackups = 0; 780ac27a0ecSDave Kleikamp 781617ba13bSMingming Cao while ((grp = ext4_list_backups(sb, &three, &five, &seven)) < end) { 782bd81d8eeSLaurent Vivier if (le32_to_cpu(*p++) != 783bd81d8eeSLaurent Vivier grp * EXT4_BLOCKS_PER_GROUP(sb) + blk){ 78412062dddSEric Sandeen ext4_warning(sb, "reserved GDT %llu" 7852ae02107SMingming Cao " missing grp %d (%llu)", 786ac27a0ecSDave Kleikamp blk, grp, 787bd81d8eeSLaurent Vivier grp * 788bd81d8eeSLaurent Vivier (ext4_fsblk_t)EXT4_BLOCKS_PER_GROUP(sb) + 789bd81d8eeSLaurent Vivier blk); 790ac27a0ecSDave Kleikamp return -EINVAL; 791ac27a0ecSDave Kleikamp } 792617ba13bSMingming Cao if (++gdbackups > EXT4_ADDR_PER_BLOCK(sb)) 793ac27a0ecSDave Kleikamp return -EFBIG; 794ac27a0ecSDave Kleikamp } 795ac27a0ecSDave Kleikamp 796ac27a0ecSDave Kleikamp return gdbackups; 797ac27a0ecSDave Kleikamp } 798ac27a0ecSDave Kleikamp 799ac27a0ecSDave Kleikamp /* 800ac27a0ecSDave Kleikamp * Called when we need to bring a reserved group descriptor table block into 801ac27a0ecSDave Kleikamp * use from the resize inode. The primary copy of the new GDT block currently 802ac27a0ecSDave Kleikamp * is an indirect block (under the double indirect block in the resize inode). 803ac27a0ecSDave Kleikamp * The new backup GDT blocks will be stored as leaf blocks in this indirect 804ac27a0ecSDave Kleikamp * block, in group order. Even though we know all the block numbers we need, 805ac27a0ecSDave Kleikamp * we check to ensure that the resize inode has actually reserved these blocks. 806ac27a0ecSDave Kleikamp * 807ac27a0ecSDave Kleikamp * Don't need to update the block bitmaps because the blocks are still in use. 808ac27a0ecSDave Kleikamp * 809ac27a0ecSDave Kleikamp * We get all of the error cases out of the way, so that we are sure to not 810ac27a0ecSDave Kleikamp * fail once we start modifying the data on disk, because JBD has no rollback. 811ac27a0ecSDave Kleikamp */ 812ac27a0ecSDave Kleikamp static int add_new_gdb(handle_t *handle, struct inode *inode, 8132f919710SYongqiang Yang ext4_group_t group) 814ac27a0ecSDave Kleikamp { 815ac27a0ecSDave Kleikamp struct super_block *sb = inode->i_sb; 816617ba13bSMingming Cao struct ext4_super_block *es = EXT4_SB(sb)->s_es; 8172f919710SYongqiang Yang unsigned long gdb_num = group / EXT4_DESC_PER_BLOCK(sb); 818617ba13bSMingming Cao ext4_fsblk_t gdblock = EXT4_SB(sb)->s_sbh->b_blocknr + 1 + gdb_num; 819ac27a0ecSDave Kleikamp struct buffer_head **o_group_desc, **n_group_desc; 820ac27a0ecSDave Kleikamp struct buffer_head *dind; 8212f919710SYongqiang Yang struct buffer_head *gdb_bh; 822ac27a0ecSDave Kleikamp int gdbackups; 823617ba13bSMingming Cao struct ext4_iloc iloc; 824ac27a0ecSDave Kleikamp __le32 *data; 825ac27a0ecSDave Kleikamp int err; 826ac27a0ecSDave Kleikamp 827ac27a0ecSDave Kleikamp if (test_opt(sb, DEBUG)) 828ac27a0ecSDave Kleikamp printk(KERN_DEBUG 829617ba13bSMingming Cao "EXT4-fs: ext4_add_new_gdb: adding group block %lu\n", 830ac27a0ecSDave Kleikamp gdb_num); 831ac27a0ecSDave Kleikamp 832ac27a0ecSDave Kleikamp /* 833ac27a0ecSDave Kleikamp * If we are not using the primary superblock/GDT copy don't resize, 834ac27a0ecSDave Kleikamp * because the user tools have no way of handling this. Probably a 835ac27a0ecSDave Kleikamp * bad time to do it anyways. 836ac27a0ecSDave Kleikamp */ 837617ba13bSMingming Cao if (EXT4_SB(sb)->s_sbh->b_blocknr != 838617ba13bSMingming Cao le32_to_cpu(EXT4_SB(sb)->s_es->s_first_data_block)) { 83912062dddSEric Sandeen ext4_warning(sb, "won't resize using backup superblock at %llu", 840617ba13bSMingming Cao (unsigned long long)EXT4_SB(sb)->s_sbh->b_blocknr); 841ac27a0ecSDave Kleikamp return -EPERM; 842ac27a0ecSDave Kleikamp } 843ac27a0ecSDave Kleikamp 8442f919710SYongqiang Yang gdb_bh = sb_bread(sb, gdblock); 8452f919710SYongqiang Yang if (!gdb_bh) 846ac27a0ecSDave Kleikamp return -EIO; 847ac27a0ecSDave Kleikamp 848c72df9f9SYongqiang Yang gdbackups = verify_reserved_gdb(sb, group, gdb_bh); 8492f919710SYongqiang Yang if (gdbackups < 0) { 850ac27a0ecSDave Kleikamp err = gdbackups; 851ac27a0ecSDave Kleikamp goto exit_bh; 852ac27a0ecSDave Kleikamp } 853ac27a0ecSDave Kleikamp 854617ba13bSMingming Cao data = EXT4_I(inode)->i_data + EXT4_DIND_BLOCK; 855ac27a0ecSDave Kleikamp dind = sb_bread(sb, le32_to_cpu(*data)); 856ac27a0ecSDave Kleikamp if (!dind) { 857ac27a0ecSDave Kleikamp err = -EIO; 858ac27a0ecSDave Kleikamp goto exit_bh; 859ac27a0ecSDave Kleikamp } 860ac27a0ecSDave Kleikamp 861ac27a0ecSDave Kleikamp data = (__le32 *)dind->b_data; 862617ba13bSMingming Cao if (le32_to_cpu(data[gdb_num % EXT4_ADDR_PER_BLOCK(sb)]) != gdblock) { 86312062dddSEric Sandeen ext4_warning(sb, "new group %u GDT block %llu not reserved", 8642f919710SYongqiang Yang group, gdblock); 865ac27a0ecSDave Kleikamp err = -EINVAL; 866ac27a0ecSDave Kleikamp goto exit_dind; 867ac27a0ecSDave Kleikamp } 868ac27a0ecSDave Kleikamp 869b4097142STheodore Ts'o err = ext4_journal_get_write_access(handle, EXT4_SB(sb)->s_sbh); 870b4097142STheodore Ts'o if (unlikely(err)) 871ac27a0ecSDave Kleikamp goto exit_dind; 872ac27a0ecSDave Kleikamp 8732f919710SYongqiang Yang err = ext4_journal_get_write_access(handle, gdb_bh); 874b4097142STheodore Ts'o if (unlikely(err)) 875ac27a0ecSDave Kleikamp goto exit_sbh; 876ac27a0ecSDave Kleikamp 877b4097142STheodore Ts'o err = ext4_journal_get_write_access(handle, dind); 878b4097142STheodore Ts'o if (unlikely(err)) 879b4097142STheodore Ts'o ext4_std_error(sb, err); 880ac27a0ecSDave Kleikamp 881617ba13bSMingming Cao /* ext4_reserve_inode_write() gets a reference on the iloc */ 882b4097142STheodore Ts'o err = ext4_reserve_inode_write(handle, inode, &iloc); 883b4097142STheodore Ts'o if (unlikely(err)) 884ac27a0ecSDave Kleikamp goto exit_dindj; 885ac27a0ecSDave Kleikamp 886f18a5f21STheodore Ts'o n_group_desc = ext4_kvmalloc((gdb_num + 1) * 887f18a5f21STheodore Ts'o sizeof(struct buffer_head *), 888216553c4SJosef Bacik GFP_NOFS); 889ac27a0ecSDave Kleikamp if (!n_group_desc) { 890ac27a0ecSDave Kleikamp err = -ENOMEM; 891f18a5f21STheodore Ts'o ext4_warning(sb, "not enough memory for %lu groups", 892f18a5f21STheodore Ts'o gdb_num + 1); 893ac27a0ecSDave Kleikamp goto exit_inode; 894ac27a0ecSDave Kleikamp } 895ac27a0ecSDave Kleikamp 896ac27a0ecSDave Kleikamp /* 897ac27a0ecSDave Kleikamp * Finally, we have all of the possible failures behind us... 898ac27a0ecSDave Kleikamp * 899ac27a0ecSDave Kleikamp * Remove new GDT block from inode double-indirect block and clear out 900ac27a0ecSDave Kleikamp * the new GDT block for use (which also "frees" the backup GDT blocks 901ac27a0ecSDave Kleikamp * from the reserved inode). We don't need to change the bitmaps for 902ac27a0ecSDave Kleikamp * these blocks, because they are marked as in-use from being in the 903ac27a0ecSDave Kleikamp * reserved inode, and will become GDT blocks (primary and backup). 904ac27a0ecSDave Kleikamp */ 905617ba13bSMingming Cao data[gdb_num % EXT4_ADDR_PER_BLOCK(sb)] = 0; 906b4097142STheodore Ts'o err = ext4_handle_dirty_metadata(handle, NULL, dind); 907b4097142STheodore Ts'o if (unlikely(err)) { 908b4097142STheodore Ts'o ext4_std_error(sb, err); 909b4097142STheodore Ts'o goto exit_inode; 910b4097142STheodore Ts'o } 911ac27a0ecSDave Kleikamp inode->i_blocks -= (gdbackups + 1) * sb->s_blocksize >> 9; 912617ba13bSMingming Cao ext4_mark_iloc_dirty(handle, inode, &iloc); 9132f919710SYongqiang Yang memset(gdb_bh->b_data, 0, sb->s_blocksize); 9142f919710SYongqiang Yang err = ext4_handle_dirty_metadata(handle, NULL, gdb_bh); 915b4097142STheodore Ts'o if (unlikely(err)) { 916b4097142STheodore Ts'o ext4_std_error(sb, err); 917b4097142STheodore Ts'o goto exit_inode; 918b4097142STheodore Ts'o } 919b4097142STheodore Ts'o brelse(dind); 920ac27a0ecSDave Kleikamp 921617ba13bSMingming Cao o_group_desc = EXT4_SB(sb)->s_group_desc; 922ac27a0ecSDave Kleikamp memcpy(n_group_desc, o_group_desc, 923617ba13bSMingming Cao EXT4_SB(sb)->s_gdb_count * sizeof(struct buffer_head *)); 9242f919710SYongqiang Yang n_group_desc[gdb_num] = gdb_bh; 925617ba13bSMingming Cao EXT4_SB(sb)->s_group_desc = n_group_desc; 926617ba13bSMingming Cao EXT4_SB(sb)->s_gdb_count++; 927f18a5f21STheodore Ts'o ext4_kvfree(o_group_desc); 928ac27a0ecSDave Kleikamp 929e8546d06SMarcin Slusarz le16_add_cpu(&es->s_reserved_gdt_blocks, -1); 930b4097142STheodore Ts'o err = ext4_handle_dirty_metadata(handle, NULL, EXT4_SB(sb)->s_sbh); 931b4097142STheodore Ts'o if (err) 932b4097142STheodore Ts'o ext4_std_error(sb, err); 933ac27a0ecSDave Kleikamp 934b4097142STheodore Ts'o return err; 935ac27a0ecSDave Kleikamp 936ac27a0ecSDave Kleikamp exit_inode: 937f18a5f21STheodore Ts'o ext4_kvfree(n_group_desc); 938537a0310SAmir Goldstein /* ext4_handle_release_buffer(handle, iloc.bh); */ 939ac27a0ecSDave Kleikamp brelse(iloc.bh); 940ac27a0ecSDave Kleikamp exit_dindj: 941537a0310SAmir Goldstein /* ext4_handle_release_buffer(handle, dind); */ 942ac27a0ecSDave Kleikamp exit_sbh: 943537a0310SAmir Goldstein /* ext4_handle_release_buffer(handle, EXT4_SB(sb)->s_sbh); */ 944ac27a0ecSDave Kleikamp exit_dind: 945ac27a0ecSDave Kleikamp brelse(dind); 946ac27a0ecSDave Kleikamp exit_bh: 9472f919710SYongqiang Yang brelse(gdb_bh); 948ac27a0ecSDave Kleikamp 949617ba13bSMingming Cao ext4_debug("leaving with error %d\n", err); 950ac27a0ecSDave Kleikamp return err; 951ac27a0ecSDave Kleikamp } 952ac27a0ecSDave Kleikamp 953ac27a0ecSDave Kleikamp /* 954ac27a0ecSDave Kleikamp * Called when we are adding a new group which has a backup copy of each of 955ac27a0ecSDave Kleikamp * the GDT blocks (i.e. sparse group) and there are reserved GDT blocks. 956ac27a0ecSDave Kleikamp * We need to add these reserved backup GDT blocks to the resize inode, so 957ac27a0ecSDave Kleikamp * that they are kept for future resizing and not allocated to files. 958ac27a0ecSDave Kleikamp * 959ac27a0ecSDave Kleikamp * Each reserved backup GDT block will go into a different indirect block. 960ac27a0ecSDave Kleikamp * The indirect blocks are actually the primary reserved GDT blocks, 961ac27a0ecSDave Kleikamp * so we know in advance what their block numbers are. We only get the 962ac27a0ecSDave Kleikamp * double-indirect block to verify it is pointing to the primary reserved 963ac27a0ecSDave Kleikamp * GDT blocks so we don't overwrite a data block by accident. The reserved 964ac27a0ecSDave Kleikamp * backup GDT blocks are stored in their reserved primary GDT block. 965ac27a0ecSDave Kleikamp */ 966ac27a0ecSDave Kleikamp static int reserve_backup_gdb(handle_t *handle, struct inode *inode, 967668f4dc5SYongqiang Yang ext4_group_t group) 968ac27a0ecSDave Kleikamp { 969ac27a0ecSDave Kleikamp struct super_block *sb = inode->i_sb; 970617ba13bSMingming Cao int reserved_gdb =le16_to_cpu(EXT4_SB(sb)->s_es->s_reserved_gdt_blocks); 971ac27a0ecSDave Kleikamp struct buffer_head **primary; 972ac27a0ecSDave Kleikamp struct buffer_head *dind; 973617ba13bSMingming Cao struct ext4_iloc iloc; 974617ba13bSMingming Cao ext4_fsblk_t blk; 975ac27a0ecSDave Kleikamp __le32 *data, *end; 976ac27a0ecSDave Kleikamp int gdbackups = 0; 977ac27a0ecSDave Kleikamp int res, i; 978ac27a0ecSDave Kleikamp int err; 979ac27a0ecSDave Kleikamp 980216553c4SJosef Bacik primary = kmalloc(reserved_gdb * sizeof(*primary), GFP_NOFS); 981ac27a0ecSDave Kleikamp if (!primary) 982ac27a0ecSDave Kleikamp return -ENOMEM; 983ac27a0ecSDave Kleikamp 984617ba13bSMingming Cao data = EXT4_I(inode)->i_data + EXT4_DIND_BLOCK; 985ac27a0ecSDave Kleikamp dind = sb_bread(sb, le32_to_cpu(*data)); 986ac27a0ecSDave Kleikamp if (!dind) { 987ac27a0ecSDave Kleikamp err = -EIO; 988ac27a0ecSDave Kleikamp goto exit_free; 989ac27a0ecSDave Kleikamp } 990ac27a0ecSDave Kleikamp 991617ba13bSMingming Cao blk = EXT4_SB(sb)->s_sbh->b_blocknr + 1 + EXT4_SB(sb)->s_gdb_count; 99294460093SJosef Bacik data = (__le32 *)dind->b_data + (EXT4_SB(sb)->s_gdb_count % 99394460093SJosef Bacik EXT4_ADDR_PER_BLOCK(sb)); 994617ba13bSMingming Cao end = (__le32 *)dind->b_data + EXT4_ADDR_PER_BLOCK(sb); 995ac27a0ecSDave Kleikamp 996ac27a0ecSDave Kleikamp /* Get each reserved primary GDT block and verify it holds backups */ 997ac27a0ecSDave Kleikamp for (res = 0; res < reserved_gdb; res++, blk++) { 998ac27a0ecSDave Kleikamp if (le32_to_cpu(*data) != blk) { 99912062dddSEric Sandeen ext4_warning(sb, "reserved block %llu" 1000ac27a0ecSDave Kleikamp " not at offset %ld", 1001ac27a0ecSDave Kleikamp blk, 1002ac27a0ecSDave Kleikamp (long)(data - (__le32 *)dind->b_data)); 1003ac27a0ecSDave Kleikamp err = -EINVAL; 1004ac27a0ecSDave Kleikamp goto exit_bh; 1005ac27a0ecSDave Kleikamp } 1006ac27a0ecSDave Kleikamp primary[res] = sb_bread(sb, blk); 1007ac27a0ecSDave Kleikamp if (!primary[res]) { 1008ac27a0ecSDave Kleikamp err = -EIO; 1009ac27a0ecSDave Kleikamp goto exit_bh; 1010ac27a0ecSDave Kleikamp } 1011c72df9f9SYongqiang Yang gdbackups = verify_reserved_gdb(sb, group, primary[res]); 1012c72df9f9SYongqiang Yang if (gdbackups < 0) { 1013ac27a0ecSDave Kleikamp brelse(primary[res]); 1014ac27a0ecSDave Kleikamp err = gdbackups; 1015ac27a0ecSDave Kleikamp goto exit_bh; 1016ac27a0ecSDave Kleikamp } 1017ac27a0ecSDave Kleikamp if (++data >= end) 1018ac27a0ecSDave Kleikamp data = (__le32 *)dind->b_data; 1019ac27a0ecSDave Kleikamp } 1020ac27a0ecSDave Kleikamp 1021ac27a0ecSDave Kleikamp for (i = 0; i < reserved_gdb; i++) { 1022617ba13bSMingming Cao if ((err = ext4_journal_get_write_access(handle, primary[i]))) { 1023ac27a0ecSDave Kleikamp /* 1024ac27a0ecSDave Kleikamp int j; 1025ac27a0ecSDave Kleikamp for (j = 0; j < i; j++) 1026537a0310SAmir Goldstein ext4_handle_release_buffer(handle, primary[j]); 1027ac27a0ecSDave Kleikamp */ 1028ac27a0ecSDave Kleikamp goto exit_bh; 1029ac27a0ecSDave Kleikamp } 1030ac27a0ecSDave Kleikamp } 1031ac27a0ecSDave Kleikamp 1032617ba13bSMingming Cao if ((err = ext4_reserve_inode_write(handle, inode, &iloc))) 1033ac27a0ecSDave Kleikamp goto exit_bh; 1034ac27a0ecSDave Kleikamp 1035ac27a0ecSDave Kleikamp /* 1036ac27a0ecSDave Kleikamp * Finally we can add each of the reserved backup GDT blocks from 1037ac27a0ecSDave Kleikamp * the new group to its reserved primary GDT block. 1038ac27a0ecSDave Kleikamp */ 1039668f4dc5SYongqiang Yang blk = group * EXT4_BLOCKS_PER_GROUP(sb); 1040ac27a0ecSDave Kleikamp for (i = 0; i < reserved_gdb; i++) { 1041ac27a0ecSDave Kleikamp int err2; 1042ac27a0ecSDave Kleikamp data = (__le32 *)primary[i]->b_data; 1043ac27a0ecSDave Kleikamp /* printk("reserving backup %lu[%u] = %lu\n", 1044ac27a0ecSDave Kleikamp primary[i]->b_blocknr, gdbackups, 1045ac27a0ecSDave Kleikamp blk + primary[i]->b_blocknr); */ 1046ac27a0ecSDave Kleikamp data[gdbackups] = cpu_to_le32(blk + primary[i]->b_blocknr); 10470390131bSFrank Mayhar err2 = ext4_handle_dirty_metadata(handle, NULL, primary[i]); 1048ac27a0ecSDave Kleikamp if (!err) 1049ac27a0ecSDave Kleikamp err = err2; 1050ac27a0ecSDave Kleikamp } 1051ac27a0ecSDave Kleikamp inode->i_blocks += reserved_gdb * sb->s_blocksize >> 9; 1052617ba13bSMingming Cao ext4_mark_iloc_dirty(handle, inode, &iloc); 1053ac27a0ecSDave Kleikamp 1054ac27a0ecSDave Kleikamp exit_bh: 1055ac27a0ecSDave Kleikamp while (--res >= 0) 1056ac27a0ecSDave Kleikamp brelse(primary[res]); 1057ac27a0ecSDave Kleikamp brelse(dind); 1058ac27a0ecSDave Kleikamp 1059ac27a0ecSDave Kleikamp exit_free: 1060ac27a0ecSDave Kleikamp kfree(primary); 1061ac27a0ecSDave Kleikamp 1062ac27a0ecSDave Kleikamp return err; 1063ac27a0ecSDave Kleikamp } 1064ac27a0ecSDave Kleikamp 1065ac27a0ecSDave Kleikamp /* 1066617ba13bSMingming Cao * Update the backup copies of the ext4 metadata. These don't need to be part 1067ac27a0ecSDave Kleikamp * of the main resize transaction, because e2fsck will re-write them if there 1068ac27a0ecSDave Kleikamp * is a problem (basically only OOM will cause a problem). However, we 1069ac27a0ecSDave Kleikamp * _should_ update the backups if possible, in case the primary gets trashed 1070ac27a0ecSDave Kleikamp * for some reason and we need to run e2fsck from a backup superblock. The 1071ac27a0ecSDave Kleikamp * important part is that the new block and inode counts are in the backup 1072ac27a0ecSDave Kleikamp * superblocks, and the location of the new group metadata in the GDT backups. 1073ac27a0ecSDave Kleikamp * 107432ed5058STheodore Ts'o * We do not need take the s_resize_lock for this, because these 107532ed5058STheodore Ts'o * blocks are not otherwise touched by the filesystem code when it is 107632ed5058STheodore Ts'o * mounted. We don't need to worry about last changing from 107732ed5058STheodore Ts'o * sbi->s_groups_count, because the worst that can happen is that we 107832ed5058STheodore Ts'o * do not copy the full number of backups at this time. The resize 107932ed5058STheodore Ts'o * which changed s_groups_count will backup again. 1080ac27a0ecSDave Kleikamp */ 1081ac27a0ecSDave Kleikamp static void update_backups(struct super_block *sb, 1082ac27a0ecSDave Kleikamp int blk_off, char *data, int size) 1083ac27a0ecSDave Kleikamp { 1084617ba13bSMingming Cao struct ext4_sb_info *sbi = EXT4_SB(sb); 1085fd2d4291SAvantika Mathur const ext4_group_t last = sbi->s_groups_count; 1086617ba13bSMingming Cao const int bpg = EXT4_BLOCKS_PER_GROUP(sb); 1087ac27a0ecSDave Kleikamp unsigned three = 1; 1088ac27a0ecSDave Kleikamp unsigned five = 5; 1089ac27a0ecSDave Kleikamp unsigned seven = 7; 1090fd2d4291SAvantika Mathur ext4_group_t group; 1091ac27a0ecSDave Kleikamp int rest = sb->s_blocksize - size; 1092ac27a0ecSDave Kleikamp handle_t *handle; 1093ac27a0ecSDave Kleikamp int err = 0, err2; 1094ac27a0ecSDave Kleikamp 1095617ba13bSMingming Cao handle = ext4_journal_start_sb(sb, EXT4_MAX_TRANS_DATA); 1096ac27a0ecSDave Kleikamp if (IS_ERR(handle)) { 1097ac27a0ecSDave Kleikamp group = 1; 1098ac27a0ecSDave Kleikamp err = PTR_ERR(handle); 1099ac27a0ecSDave Kleikamp goto exit_err; 1100ac27a0ecSDave Kleikamp } 1101ac27a0ecSDave Kleikamp 1102617ba13bSMingming Cao while ((group = ext4_list_backups(sb, &three, &five, &seven)) < last) { 1103ac27a0ecSDave Kleikamp struct buffer_head *bh; 1104ac27a0ecSDave Kleikamp 1105ac27a0ecSDave Kleikamp /* Out of journal space, and can't get more - abort - so sad */ 11060390131bSFrank Mayhar if (ext4_handle_valid(handle) && 11070390131bSFrank Mayhar handle->h_buffer_credits == 0 && 1108617ba13bSMingming Cao ext4_journal_extend(handle, EXT4_MAX_TRANS_DATA) && 1109617ba13bSMingming Cao (err = ext4_journal_restart(handle, EXT4_MAX_TRANS_DATA))) 1110ac27a0ecSDave Kleikamp break; 1111ac27a0ecSDave Kleikamp 1112ac27a0ecSDave Kleikamp bh = sb_getblk(sb, group * bpg + blk_off); 1113ac27a0ecSDave Kleikamp if (!bh) { 1114ac27a0ecSDave Kleikamp err = -EIO; 1115ac27a0ecSDave Kleikamp break; 1116ac27a0ecSDave Kleikamp } 1117617ba13bSMingming Cao ext4_debug("update metadata backup %#04lx\n", 1118ac27a0ecSDave Kleikamp (unsigned long)bh->b_blocknr); 1119617ba13bSMingming Cao if ((err = ext4_journal_get_write_access(handle, bh))) 1120ac27a0ecSDave Kleikamp break; 1121ac27a0ecSDave Kleikamp lock_buffer(bh); 1122ac27a0ecSDave Kleikamp memcpy(bh->b_data, data, size); 1123ac27a0ecSDave Kleikamp if (rest) 1124ac27a0ecSDave Kleikamp memset(bh->b_data + size, 0, rest); 1125ac27a0ecSDave Kleikamp set_buffer_uptodate(bh); 1126ac27a0ecSDave Kleikamp unlock_buffer(bh); 1127b4097142STheodore Ts'o err = ext4_handle_dirty_metadata(handle, NULL, bh); 1128b4097142STheodore Ts'o if (unlikely(err)) 1129b4097142STheodore Ts'o ext4_std_error(sb, err); 1130ac27a0ecSDave Kleikamp brelse(bh); 1131ac27a0ecSDave Kleikamp } 1132617ba13bSMingming Cao if ((err2 = ext4_journal_stop(handle)) && !err) 1133ac27a0ecSDave Kleikamp err = err2; 1134ac27a0ecSDave Kleikamp 1135ac27a0ecSDave Kleikamp /* 1136ac27a0ecSDave Kleikamp * Ugh! Need to have e2fsck write the backup copies. It is too 1137ac27a0ecSDave Kleikamp * late to revert the resize, we shouldn't fail just because of 1138ac27a0ecSDave Kleikamp * the backup copies (they are only needed in case of corruption). 1139ac27a0ecSDave Kleikamp * 1140ac27a0ecSDave Kleikamp * However, if we got here we have a journal problem too, so we 1141ac27a0ecSDave Kleikamp * can't really start a transaction to mark the superblock. 1142ac27a0ecSDave Kleikamp * Chicken out and just set the flag on the hope it will be written 1143ac27a0ecSDave Kleikamp * to disk, and if not - we will simply wait until next fsck. 1144ac27a0ecSDave Kleikamp */ 1145ac27a0ecSDave Kleikamp exit_err: 1146ac27a0ecSDave Kleikamp if (err) { 114712062dddSEric Sandeen ext4_warning(sb, "can't update backup for group %u (err %d), " 1148ac27a0ecSDave Kleikamp "forcing fsck on next reboot", group, err); 1149617ba13bSMingming Cao sbi->s_mount_state &= ~EXT4_VALID_FS; 1150617ba13bSMingming Cao sbi->s_es->s_state &= cpu_to_le16(~EXT4_VALID_FS); 1151ac27a0ecSDave Kleikamp mark_buffer_dirty(sbi->s_sbh); 1152ac27a0ecSDave Kleikamp } 1153ac27a0ecSDave Kleikamp } 1154ac27a0ecSDave Kleikamp 1155bb08c1e7SYongqiang Yang /* 1156bb08c1e7SYongqiang Yang * ext4_add_new_descs() adds @count group descriptor of groups 1157bb08c1e7SYongqiang Yang * starting at @group 1158bb08c1e7SYongqiang Yang * 1159bb08c1e7SYongqiang Yang * @handle: journal handle 1160bb08c1e7SYongqiang Yang * @sb: super block 1161bb08c1e7SYongqiang Yang * @group: the group no. of the first group desc to be added 1162bb08c1e7SYongqiang Yang * @resize_inode: the resize inode 1163bb08c1e7SYongqiang Yang * @count: number of group descriptors to be added 1164bb08c1e7SYongqiang Yang */ 1165bb08c1e7SYongqiang Yang static int ext4_add_new_descs(handle_t *handle, struct super_block *sb, 1166bb08c1e7SYongqiang Yang ext4_group_t group, struct inode *resize_inode, 1167bb08c1e7SYongqiang Yang ext4_group_t count) 1168bb08c1e7SYongqiang Yang { 1169bb08c1e7SYongqiang Yang struct ext4_sb_info *sbi = EXT4_SB(sb); 1170bb08c1e7SYongqiang Yang struct ext4_super_block *es = sbi->s_es; 1171bb08c1e7SYongqiang Yang struct buffer_head *gdb_bh; 1172bb08c1e7SYongqiang Yang int i, gdb_off, gdb_num, err = 0; 1173bb08c1e7SYongqiang Yang 1174bb08c1e7SYongqiang Yang for (i = 0; i < count; i++, group++) { 1175bb08c1e7SYongqiang Yang int reserved_gdb = ext4_bg_has_super(sb, group) ? 1176bb08c1e7SYongqiang Yang le16_to_cpu(es->s_reserved_gdt_blocks) : 0; 1177bb08c1e7SYongqiang Yang 1178bb08c1e7SYongqiang Yang gdb_off = group % EXT4_DESC_PER_BLOCK(sb); 1179bb08c1e7SYongqiang Yang gdb_num = group / EXT4_DESC_PER_BLOCK(sb); 1180bb08c1e7SYongqiang Yang 1181bb08c1e7SYongqiang Yang /* 1182bb08c1e7SYongqiang Yang * We will only either add reserved group blocks to a backup group 1183bb08c1e7SYongqiang Yang * or remove reserved blocks for the first group in a new group block. 1184bb08c1e7SYongqiang Yang * Doing both would be mean more complex code, and sane people don't 1185bb08c1e7SYongqiang Yang * use non-sparse filesystems anymore. This is already checked above. 1186bb08c1e7SYongqiang Yang */ 1187bb08c1e7SYongqiang Yang if (gdb_off) { 1188bb08c1e7SYongqiang Yang gdb_bh = sbi->s_group_desc[gdb_num]; 1189bb08c1e7SYongqiang Yang err = ext4_journal_get_write_access(handle, gdb_bh); 1190bb08c1e7SYongqiang Yang 1191bb08c1e7SYongqiang Yang if (!err && reserved_gdb && ext4_bg_num_gdb(sb, group)) 1192bb08c1e7SYongqiang Yang err = reserve_backup_gdb(handle, resize_inode, group); 1193bb08c1e7SYongqiang Yang } else 1194bb08c1e7SYongqiang Yang err = add_new_gdb(handle, resize_inode, group); 1195bb08c1e7SYongqiang Yang if (err) 1196bb08c1e7SYongqiang Yang break; 1197bb08c1e7SYongqiang Yang } 1198bb08c1e7SYongqiang Yang return err; 1199bb08c1e7SYongqiang Yang } 1200bb08c1e7SYongqiang Yang 1201083f5b24SYongqiang Yang /* 1202083f5b24SYongqiang Yang * ext4_setup_new_descs() will set up the group descriptor descriptors of a flex bg 1203083f5b24SYongqiang Yang */ 1204083f5b24SYongqiang Yang static int ext4_setup_new_descs(handle_t *handle, struct super_block *sb, 1205083f5b24SYongqiang Yang struct ext4_new_flex_group_data *flex_gd) 1206083f5b24SYongqiang Yang { 1207083f5b24SYongqiang Yang struct ext4_new_group_data *group_data = flex_gd->groups; 1208083f5b24SYongqiang Yang struct ext4_group_desc *gdp; 1209083f5b24SYongqiang Yang struct ext4_sb_info *sbi = EXT4_SB(sb); 1210083f5b24SYongqiang Yang struct buffer_head *gdb_bh; 1211083f5b24SYongqiang Yang ext4_group_t group; 1212083f5b24SYongqiang Yang __u16 *bg_flags = flex_gd->bg_flags; 1213083f5b24SYongqiang Yang int i, gdb_off, gdb_num, err = 0; 1214083f5b24SYongqiang Yang 1215083f5b24SYongqiang Yang 1216083f5b24SYongqiang Yang for (i = 0; i < flex_gd->count; i++, group_data++, bg_flags++) { 1217083f5b24SYongqiang Yang group = group_data->group; 1218083f5b24SYongqiang Yang 1219083f5b24SYongqiang Yang gdb_off = group % EXT4_DESC_PER_BLOCK(sb); 1220083f5b24SYongqiang Yang gdb_num = group / EXT4_DESC_PER_BLOCK(sb); 1221083f5b24SYongqiang Yang 1222083f5b24SYongqiang Yang /* 1223083f5b24SYongqiang Yang * get_write_access() has been called on gdb_bh by ext4_add_new_desc(). 1224083f5b24SYongqiang Yang */ 1225083f5b24SYongqiang Yang gdb_bh = sbi->s_group_desc[gdb_num]; 1226083f5b24SYongqiang Yang /* Update group descriptor block for new group */ 1227083f5b24SYongqiang Yang gdp = (struct ext4_group_desc *)((char *)gdb_bh->b_data + 1228083f5b24SYongqiang Yang gdb_off * EXT4_DESC_SIZE(sb)); 1229083f5b24SYongqiang Yang 1230083f5b24SYongqiang Yang memset(gdp, 0, EXT4_DESC_SIZE(sb)); 1231083f5b24SYongqiang Yang ext4_block_bitmap_set(sb, gdp, group_data->block_bitmap); 1232083f5b24SYongqiang Yang ext4_inode_bitmap_set(sb, gdp, group_data->inode_bitmap); 1233083f5b24SYongqiang Yang ext4_inode_table_set(sb, gdp, group_data->inode_table); 1234083f5b24SYongqiang Yang ext4_free_group_clusters_set(sb, gdp, 1235083f5b24SYongqiang Yang EXT4_B2C(sbi, group_data->free_blocks_count)); 1236083f5b24SYongqiang Yang ext4_free_inodes_set(sb, gdp, EXT4_INODES_PER_GROUP(sb)); 1237083f5b24SYongqiang Yang gdp->bg_flags = cpu_to_le16(*bg_flags); 1238083f5b24SYongqiang Yang gdp->bg_checksum = ext4_group_desc_csum(sbi, group, gdp); 1239083f5b24SYongqiang Yang 1240083f5b24SYongqiang Yang err = ext4_handle_dirty_metadata(handle, NULL, gdb_bh); 1241083f5b24SYongqiang Yang if (unlikely(err)) { 1242083f5b24SYongqiang Yang ext4_std_error(sb, err); 1243083f5b24SYongqiang Yang break; 1244083f5b24SYongqiang Yang } 1245083f5b24SYongqiang Yang 1246083f5b24SYongqiang Yang /* 1247083f5b24SYongqiang Yang * We can allocate memory for mb_alloc based on the new group 1248083f5b24SYongqiang Yang * descriptor 1249083f5b24SYongqiang Yang */ 1250083f5b24SYongqiang Yang err = ext4_mb_add_groupinfo(sb, group, gdp); 1251083f5b24SYongqiang Yang if (err) 1252083f5b24SYongqiang Yang break; 1253083f5b24SYongqiang Yang } 1254083f5b24SYongqiang Yang return err; 1255083f5b24SYongqiang Yang } 1256083f5b24SYongqiang Yang 12572e10e2f2SYongqiang Yang /* 12582e10e2f2SYongqiang Yang * ext4_update_super() updates the super block so that the newly added 12592e10e2f2SYongqiang Yang * groups can be seen by the filesystem. 12602e10e2f2SYongqiang Yang * 12612e10e2f2SYongqiang Yang * @sb: super block 12622e10e2f2SYongqiang Yang * @flex_gd: new added groups 12632e10e2f2SYongqiang Yang */ 12642e10e2f2SYongqiang Yang static void ext4_update_super(struct super_block *sb, 12652e10e2f2SYongqiang Yang struct ext4_new_flex_group_data *flex_gd) 12662e10e2f2SYongqiang Yang { 12672e10e2f2SYongqiang Yang ext4_fsblk_t blocks_count = 0; 12682e10e2f2SYongqiang Yang ext4_fsblk_t free_blocks = 0; 12692e10e2f2SYongqiang Yang ext4_fsblk_t reserved_blocks = 0; 12702e10e2f2SYongqiang Yang struct ext4_new_group_data *group_data = flex_gd->groups; 12712e10e2f2SYongqiang Yang struct ext4_sb_info *sbi = EXT4_SB(sb); 12722e10e2f2SYongqiang Yang struct ext4_super_block *es = sbi->s_es; 12732e10e2f2SYongqiang Yang int i; 12742e10e2f2SYongqiang Yang 12752e10e2f2SYongqiang Yang BUG_ON(flex_gd->count == 0 || group_data == NULL); 12762e10e2f2SYongqiang Yang /* 12772e10e2f2SYongqiang Yang * Make the new blocks and inodes valid next. We do this before 12782e10e2f2SYongqiang Yang * increasing the group count so that once the group is enabled, 12792e10e2f2SYongqiang Yang * all of its blocks and inodes are already valid. 12802e10e2f2SYongqiang Yang * 12812e10e2f2SYongqiang Yang * We always allocate group-by-group, then block-by-block or 12822e10e2f2SYongqiang Yang * inode-by-inode within a group, so enabling these 12832e10e2f2SYongqiang Yang * blocks/inodes before the group is live won't actually let us 12842e10e2f2SYongqiang Yang * allocate the new space yet. 12852e10e2f2SYongqiang Yang */ 12862e10e2f2SYongqiang Yang for (i = 0; i < flex_gd->count; i++) { 12872e10e2f2SYongqiang Yang blocks_count += group_data[i].blocks_count; 12882e10e2f2SYongqiang Yang free_blocks += group_data[i].free_blocks_count; 12892e10e2f2SYongqiang Yang } 12902e10e2f2SYongqiang Yang 12912e10e2f2SYongqiang Yang reserved_blocks = ext4_r_blocks_count(es) * 100; 12922e10e2f2SYongqiang Yang do_div(reserved_blocks, ext4_blocks_count(es)); 12932e10e2f2SYongqiang Yang reserved_blocks *= blocks_count; 12942e10e2f2SYongqiang Yang do_div(reserved_blocks, 100); 12952e10e2f2SYongqiang Yang 12962e10e2f2SYongqiang Yang ext4_blocks_count_set(es, ext4_blocks_count(es) + blocks_count); 12972e10e2f2SYongqiang Yang le32_add_cpu(&es->s_inodes_count, EXT4_INODES_PER_GROUP(sb) * 12982e10e2f2SYongqiang Yang flex_gd->count); 12992e10e2f2SYongqiang Yang 13002e10e2f2SYongqiang Yang /* 13012e10e2f2SYongqiang Yang * We need to protect s_groups_count against other CPUs seeing 13022e10e2f2SYongqiang Yang * inconsistent state in the superblock. 13032e10e2f2SYongqiang Yang * 13042e10e2f2SYongqiang Yang * The precise rules we use are: 13052e10e2f2SYongqiang Yang * 13062e10e2f2SYongqiang Yang * * Writers must perform a smp_wmb() after updating all 13072e10e2f2SYongqiang Yang * dependent data and before modifying the groups count 13082e10e2f2SYongqiang Yang * 13092e10e2f2SYongqiang Yang * * Readers must perform an smp_rmb() after reading the groups 13102e10e2f2SYongqiang Yang * count and before reading any dependent data. 13112e10e2f2SYongqiang Yang * 13122e10e2f2SYongqiang Yang * NB. These rules can be relaxed when checking the group count 13132e10e2f2SYongqiang Yang * while freeing data, as we can only allocate from a block 13142e10e2f2SYongqiang Yang * group after serialising against the group count, and we can 13152e10e2f2SYongqiang Yang * only then free after serialising in turn against that 13162e10e2f2SYongqiang Yang * allocation. 13172e10e2f2SYongqiang Yang */ 13182e10e2f2SYongqiang Yang smp_wmb(); 13192e10e2f2SYongqiang Yang 13202e10e2f2SYongqiang Yang /* Update the global fs size fields */ 13212e10e2f2SYongqiang Yang sbi->s_groups_count += flex_gd->count; 13222e10e2f2SYongqiang Yang 13232e10e2f2SYongqiang Yang /* Update the reserved block counts only once the new group is 13242e10e2f2SYongqiang Yang * active. */ 13252e10e2f2SYongqiang Yang ext4_r_blocks_count_set(es, ext4_r_blocks_count(es) + 13262e10e2f2SYongqiang Yang reserved_blocks); 13272e10e2f2SYongqiang Yang 13282e10e2f2SYongqiang Yang /* Update the free space counts */ 13292e10e2f2SYongqiang Yang percpu_counter_add(&sbi->s_freeclusters_counter, 13302e10e2f2SYongqiang Yang EXT4_B2C(sbi, free_blocks)); 13312e10e2f2SYongqiang Yang percpu_counter_add(&sbi->s_freeinodes_counter, 13322e10e2f2SYongqiang Yang EXT4_INODES_PER_GROUP(sb) * flex_gd->count); 13332e10e2f2SYongqiang Yang 13342e10e2f2SYongqiang Yang if (EXT4_HAS_INCOMPAT_FEATURE(sb, 13352e10e2f2SYongqiang Yang EXT4_FEATURE_INCOMPAT_FLEX_BG) && 13362e10e2f2SYongqiang Yang sbi->s_log_groups_per_flex) { 13372e10e2f2SYongqiang Yang ext4_group_t flex_group; 13382e10e2f2SYongqiang Yang flex_group = ext4_flex_group(sbi, group_data[0].group); 13392e10e2f2SYongqiang Yang atomic_add(EXT4_B2C(sbi, free_blocks), 13402e10e2f2SYongqiang Yang &sbi->s_flex_groups[flex_group].free_clusters); 13412e10e2f2SYongqiang Yang atomic_add(EXT4_INODES_PER_GROUP(sb) * flex_gd->count, 13422e10e2f2SYongqiang Yang &sbi->s_flex_groups[flex_group].free_inodes); 13432e10e2f2SYongqiang Yang } 13442e10e2f2SYongqiang Yang 13452e10e2f2SYongqiang Yang if (test_opt(sb, DEBUG)) 13462e10e2f2SYongqiang Yang printk(KERN_DEBUG "EXT4-fs: added group %u:" 13472e10e2f2SYongqiang Yang "%llu blocks(%llu free %llu reserved)\n", flex_gd->count, 13482e10e2f2SYongqiang Yang blocks_count, free_blocks, reserved_blocks); 13492e10e2f2SYongqiang Yang } 13502e10e2f2SYongqiang Yang 1351ac27a0ecSDave Kleikamp /* Add group descriptor data to an existing or new group descriptor block. 1352ac27a0ecSDave Kleikamp * Ensure we handle all possible error conditions _before_ we start modifying 1353ac27a0ecSDave Kleikamp * the filesystem, because we cannot abort the transaction and not have it 1354ac27a0ecSDave Kleikamp * write the data to disk. 1355ac27a0ecSDave Kleikamp * 1356ac27a0ecSDave Kleikamp * If we are on a GDT block boundary, we need to get the reserved GDT block. 1357ac27a0ecSDave Kleikamp * Otherwise, we may need to add backup GDT blocks for a sparse group. 1358ac27a0ecSDave Kleikamp * 1359ac27a0ecSDave Kleikamp * We only need to hold the superblock lock while we are actually adding 1360ac27a0ecSDave Kleikamp * in the new group's counts to the superblock. Prior to that we have 1361ac27a0ecSDave Kleikamp * not really "added" the group at all. We re-check that we are still 1362ac27a0ecSDave Kleikamp * adding in the last group in case things have changed since verifying. 1363ac27a0ecSDave Kleikamp */ 1364617ba13bSMingming Cao int ext4_group_add(struct super_block *sb, struct ext4_new_group_data *input) 1365ac27a0ecSDave Kleikamp { 1366617ba13bSMingming Cao struct ext4_sb_info *sbi = EXT4_SB(sb); 1367617ba13bSMingming Cao struct ext4_super_block *es = sbi->s_es; 1368617ba13bSMingming Cao int reserved_gdb = ext4_bg_has_super(sb, input->group) ? 1369ac27a0ecSDave Kleikamp le16_to_cpu(es->s_reserved_gdt_blocks) : 0; 1370ac27a0ecSDave Kleikamp struct buffer_head *primary = NULL; 1371617ba13bSMingming Cao struct ext4_group_desc *gdp; 1372ac27a0ecSDave Kleikamp struct inode *inode = NULL; 1373ac27a0ecSDave Kleikamp handle_t *handle; 1374ac27a0ecSDave Kleikamp int gdb_off, gdb_num; 1375ac27a0ecSDave Kleikamp int err, err2; 1376ac27a0ecSDave Kleikamp 1377617ba13bSMingming Cao gdb_num = input->group / EXT4_DESC_PER_BLOCK(sb); 1378617ba13bSMingming Cao gdb_off = input->group % EXT4_DESC_PER_BLOCK(sb); 1379ac27a0ecSDave Kleikamp 1380617ba13bSMingming Cao if (gdb_off == 0 && !EXT4_HAS_RO_COMPAT_FEATURE(sb, 1381617ba13bSMingming Cao EXT4_FEATURE_RO_COMPAT_SPARSE_SUPER)) { 138212062dddSEric Sandeen ext4_warning(sb, "Can't resize non-sparse filesystem further"); 1383ac27a0ecSDave Kleikamp return -EPERM; 1384ac27a0ecSDave Kleikamp } 1385ac27a0ecSDave Kleikamp 1386bd81d8eeSLaurent Vivier if (ext4_blocks_count(es) + input->blocks_count < 1387bd81d8eeSLaurent Vivier ext4_blocks_count(es)) { 138812062dddSEric Sandeen ext4_warning(sb, "blocks_count overflow"); 1389ac27a0ecSDave Kleikamp return -EINVAL; 1390ac27a0ecSDave Kleikamp } 1391ac27a0ecSDave Kleikamp 1392617ba13bSMingming Cao if (le32_to_cpu(es->s_inodes_count) + EXT4_INODES_PER_GROUP(sb) < 1393ac27a0ecSDave Kleikamp le32_to_cpu(es->s_inodes_count)) { 139412062dddSEric Sandeen ext4_warning(sb, "inodes_count overflow"); 1395ac27a0ecSDave Kleikamp return -EINVAL; 1396ac27a0ecSDave Kleikamp } 1397ac27a0ecSDave Kleikamp 1398ac27a0ecSDave Kleikamp if (reserved_gdb || gdb_off == 0) { 1399617ba13bSMingming Cao if (!EXT4_HAS_COMPAT_FEATURE(sb, 140037609fd5SJosef Bacik EXT4_FEATURE_COMPAT_RESIZE_INODE) 140137609fd5SJosef Bacik || !le16_to_cpu(es->s_reserved_gdt_blocks)) { 140212062dddSEric Sandeen ext4_warning(sb, 1403ac27a0ecSDave Kleikamp "No reserved GDT blocks, can't resize"); 1404ac27a0ecSDave Kleikamp return -EPERM; 1405ac27a0ecSDave Kleikamp } 14061d1fe1eeSDavid Howells inode = ext4_iget(sb, EXT4_RESIZE_INO); 14071d1fe1eeSDavid Howells if (IS_ERR(inode)) { 140812062dddSEric Sandeen ext4_warning(sb, "Error opening resize inode"); 14091d1fe1eeSDavid Howells return PTR_ERR(inode); 1410ac27a0ecSDave Kleikamp } 1411ac27a0ecSDave Kleikamp } 1412ac27a0ecSDave Kleikamp 1413920313a7SAneesh Kumar K.V 1414ac27a0ecSDave Kleikamp if ((err = verify_group_input(sb, input))) 1415ac27a0ecSDave Kleikamp goto exit_put; 1416ac27a0ecSDave Kleikamp 1417ac27a0ecSDave Kleikamp if ((err = setup_new_group_blocks(sb, input))) 1418ac27a0ecSDave Kleikamp goto exit_put; 1419ac27a0ecSDave Kleikamp 1420ac27a0ecSDave Kleikamp /* 1421ac27a0ecSDave Kleikamp * We will always be modifying at least the superblock and a GDT 1422ac27a0ecSDave Kleikamp * block. If we are adding a group past the last current GDT block, 1423ac27a0ecSDave Kleikamp * we will also modify the inode and the dindirect block. If we 1424ac27a0ecSDave Kleikamp * are adding a group with superblock/GDT backups we will also 1425ac27a0ecSDave Kleikamp * modify each of the reserved GDT dindirect blocks. 1426ac27a0ecSDave Kleikamp */ 1427617ba13bSMingming Cao handle = ext4_journal_start_sb(sb, 1428617ba13bSMingming Cao ext4_bg_has_super(sb, input->group) ? 1429ac27a0ecSDave Kleikamp 3 + reserved_gdb : 4); 1430ac27a0ecSDave Kleikamp if (IS_ERR(handle)) { 1431ac27a0ecSDave Kleikamp err = PTR_ERR(handle); 1432ac27a0ecSDave Kleikamp goto exit_put; 1433ac27a0ecSDave Kleikamp } 1434ac27a0ecSDave Kleikamp 1435617ba13bSMingming Cao if ((err = ext4_journal_get_write_access(handle, sbi->s_sbh))) 1436ac27a0ecSDave Kleikamp goto exit_journal; 1437ac27a0ecSDave Kleikamp 1438ac27a0ecSDave Kleikamp /* 1439ac27a0ecSDave Kleikamp * We will only either add reserved group blocks to a backup group 1440ac27a0ecSDave Kleikamp * or remove reserved blocks for the first group in a new group block. 1441ac27a0ecSDave Kleikamp * Doing both would be mean more complex code, and sane people don't 1442ac27a0ecSDave Kleikamp * use non-sparse filesystems anymore. This is already checked above. 1443ac27a0ecSDave Kleikamp */ 1444ac27a0ecSDave Kleikamp if (gdb_off) { 1445ac27a0ecSDave Kleikamp primary = sbi->s_group_desc[gdb_num]; 1446617ba13bSMingming Cao if ((err = ext4_journal_get_write_access(handle, primary))) 1447ac27a0ecSDave Kleikamp goto exit_journal; 1448ac27a0ecSDave Kleikamp 1449668f4dc5SYongqiang Yang if (reserved_gdb && ext4_bg_num_gdb(sb, input->group)) { 1450668f4dc5SYongqiang Yang err = reserve_backup_gdb(handle, inode, input->group); 1451668f4dc5SYongqiang Yang if (err) 1452ac27a0ecSDave Kleikamp goto exit_journal; 1453668f4dc5SYongqiang Yang } 14542f919710SYongqiang Yang } else { 14552f919710SYongqiang Yang /* 14562f919710SYongqiang Yang * Note that we can access new group descriptor block safely 14572f919710SYongqiang Yang * only if add_new_gdb() succeeds. 14582f919710SYongqiang Yang */ 14592f919710SYongqiang Yang err = add_new_gdb(handle, inode, input->group); 14602f919710SYongqiang Yang if (err) 1461ac27a0ecSDave Kleikamp goto exit_journal; 14622f919710SYongqiang Yang primary = sbi->s_group_desc[gdb_num]; 14632f919710SYongqiang Yang } 1464ac27a0ecSDave Kleikamp 1465ac27a0ecSDave Kleikamp /* 1466ac27a0ecSDave Kleikamp * OK, now we've set up the new group. Time to make it active. 1467ac27a0ecSDave Kleikamp * 1468ac27a0ecSDave Kleikamp * so we have to be safe wrt. concurrent accesses the group 1469ac27a0ecSDave Kleikamp * data. So we need to be careful to set all of the relevant 1470ac27a0ecSDave Kleikamp * group descriptor data etc. *before* we enable the group. 1471ac27a0ecSDave Kleikamp * 1472ac27a0ecSDave Kleikamp * The key field here is sbi->s_groups_count: as long as 1473ac27a0ecSDave Kleikamp * that retains its old value, nobody is going to access the new 1474ac27a0ecSDave Kleikamp * group. 1475ac27a0ecSDave Kleikamp * 1476ac27a0ecSDave Kleikamp * So first we update all the descriptor metadata for the new 1477ac27a0ecSDave Kleikamp * group; then we update the total disk blocks count; then we 1478ac27a0ecSDave Kleikamp * update the groups count to enable the group; then finally we 1479ac27a0ecSDave Kleikamp * update the free space counts so that the system can start 1480ac27a0ecSDave Kleikamp * using the new disk blocks. 1481ac27a0ecSDave Kleikamp */ 1482ac27a0ecSDave Kleikamp 1483ac27a0ecSDave Kleikamp /* Update group descriptor block for new group */ 14842856922cSFrederic Bohe gdp = (struct ext4_group_desc *)((char *)primary->b_data + 14852856922cSFrederic Bohe gdb_off * EXT4_DESC_SIZE(sb)); 1486ac27a0ecSDave Kleikamp 1487fdff73f0STheodore Ts'o memset(gdp, 0, EXT4_DESC_SIZE(sb)); 14888fadc143SAlexandre Ratchov ext4_block_bitmap_set(sb, gdp, input->block_bitmap); /* LV FIXME */ 14898fadc143SAlexandre Ratchov ext4_inode_bitmap_set(sb, gdp, input->inode_bitmap); /* LV FIXME */ 14908fadc143SAlexandre Ratchov ext4_inode_table_set(sb, gdp, input->inode_table); /* LV FIXME */ 1491021b65bbSTheodore Ts'o ext4_free_group_clusters_set(sb, gdp, input->free_blocks_count); 1492560671a0SAneesh Kumar K.V ext4_free_inodes_set(sb, gdp, EXT4_INODES_PER_GROUP(sb)); 1493fdff73f0STheodore Ts'o gdp->bg_flags = cpu_to_le16(EXT4_BG_INODE_ZEROED); 1494717d50e4SAndreas Dilger gdp->bg_checksum = ext4_group_desc_csum(sbi, input->group, gdp); 1495ac27a0ecSDave Kleikamp 1496ac27a0ecSDave Kleikamp /* 14975f21b0e6SFrederic Bohe * We can allocate memory for mb_alloc based on the new group 14985f21b0e6SFrederic Bohe * descriptor 14995f21b0e6SFrederic Bohe */ 1500920313a7SAneesh Kumar K.V err = ext4_mb_add_groupinfo(sb, input->group, gdp); 150108c3a813SAneesh Kumar K.V if (err) 15025f21b0e6SFrederic Bohe goto exit_journal; 1503c2ea3fdeSTheodore Ts'o 15045f21b0e6SFrederic Bohe /* 1505ac27a0ecSDave Kleikamp * Make the new blocks and inodes valid next. We do this before 1506ac27a0ecSDave Kleikamp * increasing the group count so that once the group is enabled, 1507ac27a0ecSDave Kleikamp * all of its blocks and inodes are already valid. 1508ac27a0ecSDave Kleikamp * 1509ac27a0ecSDave Kleikamp * We always allocate group-by-group, then block-by-block or 1510ac27a0ecSDave Kleikamp * inode-by-inode within a group, so enabling these 1511ac27a0ecSDave Kleikamp * blocks/inodes before the group is live won't actually let us 1512ac27a0ecSDave Kleikamp * allocate the new space yet. 1513ac27a0ecSDave Kleikamp */ 1514bd81d8eeSLaurent Vivier ext4_blocks_count_set(es, ext4_blocks_count(es) + 1515ac27a0ecSDave Kleikamp input->blocks_count); 1516e8546d06SMarcin Slusarz le32_add_cpu(&es->s_inodes_count, EXT4_INODES_PER_GROUP(sb)); 1517ac27a0ecSDave Kleikamp 1518ac27a0ecSDave Kleikamp /* 1519ac27a0ecSDave Kleikamp * We need to protect s_groups_count against other CPUs seeing 1520ac27a0ecSDave Kleikamp * inconsistent state in the superblock. 1521ac27a0ecSDave Kleikamp * 1522ac27a0ecSDave Kleikamp * The precise rules we use are: 1523ac27a0ecSDave Kleikamp * 1524ac27a0ecSDave Kleikamp * * Writers must perform a smp_wmb() after updating all dependent 1525ac27a0ecSDave Kleikamp * data and before modifying the groups count 1526ac27a0ecSDave Kleikamp * 1527ac27a0ecSDave Kleikamp * * Readers must perform an smp_rmb() after reading the groups count 1528ac27a0ecSDave Kleikamp * and before reading any dependent data. 1529ac27a0ecSDave Kleikamp * 1530ac27a0ecSDave Kleikamp * NB. These rules can be relaxed when checking the group count 1531ac27a0ecSDave Kleikamp * while freeing data, as we can only allocate from a block 1532ac27a0ecSDave Kleikamp * group after serialising against the group count, and we can 1533ac27a0ecSDave Kleikamp * only then free after serialising in turn against that 1534ac27a0ecSDave Kleikamp * allocation. 1535ac27a0ecSDave Kleikamp */ 1536ac27a0ecSDave Kleikamp smp_wmb(); 1537ac27a0ecSDave Kleikamp 1538ac27a0ecSDave Kleikamp /* Update the global fs size fields */ 1539ac27a0ecSDave Kleikamp sbi->s_groups_count++; 1540ac27a0ecSDave Kleikamp 1541b4097142STheodore Ts'o err = ext4_handle_dirty_metadata(handle, NULL, primary); 1542b4097142STheodore Ts'o if (unlikely(err)) { 1543b4097142STheodore Ts'o ext4_std_error(sb, err); 1544b4097142STheodore Ts'o goto exit_journal; 1545b4097142STheodore Ts'o } 1546ac27a0ecSDave Kleikamp 1547ac27a0ecSDave Kleikamp /* Update the reserved block counts only once the new group is 1548ac27a0ecSDave Kleikamp * active. */ 1549bd81d8eeSLaurent Vivier ext4_r_blocks_count_set(es, ext4_r_blocks_count(es) + 1550ac27a0ecSDave Kleikamp input->reserved_blocks); 1551ac27a0ecSDave Kleikamp 1552ac27a0ecSDave Kleikamp /* Update the free space counts */ 155357042651STheodore Ts'o percpu_counter_add(&sbi->s_freeclusters_counter, 155457042651STheodore Ts'o EXT4_B2C(sbi, input->free_blocks_count)); 1555aa0dff2dSPeter Zijlstra percpu_counter_add(&sbi->s_freeinodes_counter, 1556617ba13bSMingming Cao EXT4_INODES_PER_GROUP(sb)); 1557ac27a0ecSDave Kleikamp 155842007efdSEric Sandeen if (EXT4_HAS_INCOMPAT_FEATURE(sb, EXT4_FEATURE_INCOMPAT_FLEX_BG) && 155942007efdSEric Sandeen sbi->s_log_groups_per_flex) { 1560c62a11fdSFrederic Bohe ext4_group_t flex_group; 1561c62a11fdSFrederic Bohe flex_group = ext4_flex_group(sbi, input->group); 156224aaa8efSTheodore Ts'o atomic_add(EXT4_B2C(sbi, input->free_blocks_count), 156324aaa8efSTheodore Ts'o &sbi->s_flex_groups[flex_group].free_clusters); 15649f24e420STheodore Ts'o atomic_add(EXT4_INODES_PER_GROUP(sb), 15659f24e420STheodore Ts'o &sbi->s_flex_groups[flex_group].free_inodes); 1566c62a11fdSFrederic Bohe } 1567c62a11fdSFrederic Bohe 1568a0375156STheodore Ts'o ext4_handle_dirty_super(handle, sb); 1569ac27a0ecSDave Kleikamp 1570ac27a0ecSDave Kleikamp exit_journal: 1571617ba13bSMingming Cao if ((err2 = ext4_journal_stop(handle)) && !err) 1572ac27a0ecSDave Kleikamp err = err2; 15732f919710SYongqiang Yang if (!err && primary) { 1574ac27a0ecSDave Kleikamp update_backups(sb, sbi->s_sbh->b_blocknr, (char *)es, 1575617ba13bSMingming Cao sizeof(struct ext4_super_block)); 1576ac27a0ecSDave Kleikamp update_backups(sb, primary->b_blocknr, primary->b_data, 1577ac27a0ecSDave Kleikamp primary->b_size); 1578ac27a0ecSDave Kleikamp } 1579ac27a0ecSDave Kleikamp exit_put: 1580ac27a0ecSDave Kleikamp iput(inode); 1581ac27a0ecSDave Kleikamp return err; 1582617ba13bSMingming Cao } /* ext4_group_add */ 1583ac27a0ecSDave Kleikamp 15842b2d6d01STheodore Ts'o /* 158518e31438SYongqiang Yang * extend a group without checking assuming that checking has been done. 158618e31438SYongqiang Yang */ 158718e31438SYongqiang Yang static int ext4_group_extend_no_check(struct super_block *sb, 158818e31438SYongqiang Yang ext4_fsblk_t o_blocks_count, ext4_grpblk_t add) 158918e31438SYongqiang Yang { 159018e31438SYongqiang Yang struct ext4_super_block *es = EXT4_SB(sb)->s_es; 159118e31438SYongqiang Yang handle_t *handle; 159218e31438SYongqiang Yang int err = 0, err2; 159318e31438SYongqiang Yang 159418e31438SYongqiang Yang /* We will update the superblock, one block bitmap, and 159518e31438SYongqiang Yang * one group descriptor via ext4_group_add_blocks(). 159618e31438SYongqiang Yang */ 159718e31438SYongqiang Yang handle = ext4_journal_start_sb(sb, 3); 159818e31438SYongqiang Yang if (IS_ERR(handle)) { 159918e31438SYongqiang Yang err = PTR_ERR(handle); 160018e31438SYongqiang Yang ext4_warning(sb, "error %d on journal start", err); 160118e31438SYongqiang Yang return err; 160218e31438SYongqiang Yang } 160318e31438SYongqiang Yang 160418e31438SYongqiang Yang err = ext4_journal_get_write_access(handle, EXT4_SB(sb)->s_sbh); 160518e31438SYongqiang Yang if (err) { 160618e31438SYongqiang Yang ext4_warning(sb, "error %d on journal write access", err); 160718e31438SYongqiang Yang goto errout; 160818e31438SYongqiang Yang } 160918e31438SYongqiang Yang 161018e31438SYongqiang Yang ext4_blocks_count_set(es, o_blocks_count + add); 161118e31438SYongqiang Yang ext4_debug("freeing blocks %llu through %llu\n", o_blocks_count, 161218e31438SYongqiang Yang o_blocks_count + add); 161318e31438SYongqiang Yang /* We add the blocks to the bitmap and set the group need init bit */ 161418e31438SYongqiang Yang err = ext4_group_add_blocks(handle, sb, o_blocks_count, add); 161518e31438SYongqiang Yang if (err) 161618e31438SYongqiang Yang goto errout; 161718e31438SYongqiang Yang ext4_handle_dirty_super(handle, sb); 161818e31438SYongqiang Yang ext4_debug("freed blocks %llu through %llu\n", o_blocks_count, 161918e31438SYongqiang Yang o_blocks_count + add); 162018e31438SYongqiang Yang errout: 162118e31438SYongqiang Yang err2 = ext4_journal_stop(handle); 162218e31438SYongqiang Yang if (err2 && !err) 162318e31438SYongqiang Yang err = err2; 162418e31438SYongqiang Yang 162518e31438SYongqiang Yang if (!err) { 162618e31438SYongqiang Yang if (test_opt(sb, DEBUG)) 162718e31438SYongqiang Yang printk(KERN_DEBUG "EXT4-fs: extended group to %llu " 162818e31438SYongqiang Yang "blocks\n", ext4_blocks_count(es)); 162918e31438SYongqiang Yang update_backups(sb, EXT4_SB(sb)->s_sbh->b_blocknr, (char *)es, 163018e31438SYongqiang Yang sizeof(struct ext4_super_block)); 163118e31438SYongqiang Yang } 163218e31438SYongqiang Yang return err; 163318e31438SYongqiang Yang } 163418e31438SYongqiang Yang 163518e31438SYongqiang Yang /* 16362b2d6d01STheodore Ts'o * Extend the filesystem to the new number of blocks specified. This entry 1637ac27a0ecSDave Kleikamp * point is only used to extend the current filesystem to the end of the last 1638ac27a0ecSDave Kleikamp * existing group. It can be accessed via ioctl, or by "remount,resize=<size>" 1639ac27a0ecSDave Kleikamp * for emergencies (because it has no dependencies on reserved blocks). 1640ac27a0ecSDave Kleikamp * 1641617ba13bSMingming Cao * If we _really_ wanted, we could use default values to call ext4_group_add() 1642ac27a0ecSDave Kleikamp * allow the "remount" trick to work for arbitrary resizing, assuming enough 1643ac27a0ecSDave Kleikamp * GDT blocks are reserved to grow to the desired size. 1644ac27a0ecSDave Kleikamp */ 1645617ba13bSMingming Cao int ext4_group_extend(struct super_block *sb, struct ext4_super_block *es, 1646617ba13bSMingming Cao ext4_fsblk_t n_blocks_count) 1647ac27a0ecSDave Kleikamp { 1648617ba13bSMingming Cao ext4_fsblk_t o_blocks_count; 1649617ba13bSMingming Cao ext4_grpblk_t last; 1650617ba13bSMingming Cao ext4_grpblk_t add; 1651ac27a0ecSDave Kleikamp struct buffer_head *bh; 1652ac27a0ecSDave Kleikamp handle_t *handle; 1653cc7365dfSYongqiang Yang int err, err2; 16545f21b0e6SFrederic Bohe ext4_group_t group; 1655ac27a0ecSDave Kleikamp 1656bd81d8eeSLaurent Vivier o_blocks_count = ext4_blocks_count(es); 1657ac27a0ecSDave Kleikamp 1658ac27a0ecSDave Kleikamp if (test_opt(sb, DEBUG)) 16592b79b09dSYongqiang Yang printk(KERN_DEBUG "EXT4-fs: extending last group from %llu to %llu blocks\n", 1660ac27a0ecSDave Kleikamp o_blocks_count, n_blocks_count); 1661ac27a0ecSDave Kleikamp 1662ac27a0ecSDave Kleikamp if (n_blocks_count == 0 || n_blocks_count == o_blocks_count) 1663ac27a0ecSDave Kleikamp return 0; 1664ac27a0ecSDave Kleikamp 1665ac27a0ecSDave Kleikamp if (n_blocks_count > (sector_t)(~0ULL) >> (sb->s_blocksize_bits - 9)) { 1666617ba13bSMingming Cao printk(KERN_ERR "EXT4-fs: filesystem on %s:" 16672ae02107SMingming Cao " too large to resize to %llu blocks safely\n", 1668ac27a0ecSDave Kleikamp sb->s_id, n_blocks_count); 1669ac27a0ecSDave Kleikamp if (sizeof(sector_t) < 8) 167012062dddSEric Sandeen ext4_warning(sb, "CONFIG_LBDAF not enabled"); 1671ac27a0ecSDave Kleikamp return -EINVAL; 1672ac27a0ecSDave Kleikamp } 1673ac27a0ecSDave Kleikamp 1674ac27a0ecSDave Kleikamp if (n_blocks_count < o_blocks_count) { 167512062dddSEric Sandeen ext4_warning(sb, "can't shrink FS - resize aborted"); 16768f82f840SYongqiang Yang return -EINVAL; 1677ac27a0ecSDave Kleikamp } 1678ac27a0ecSDave Kleikamp 1679ac27a0ecSDave Kleikamp /* Handle the remaining blocks in the last group only. */ 16805f21b0e6SFrederic Bohe ext4_get_group_no_and_offset(sb, o_blocks_count, &group, &last); 1681ac27a0ecSDave Kleikamp 1682ac27a0ecSDave Kleikamp if (last == 0) { 168312062dddSEric Sandeen ext4_warning(sb, "need to use ext2online to resize further"); 1684ac27a0ecSDave Kleikamp return -EPERM; 1685ac27a0ecSDave Kleikamp } 1686ac27a0ecSDave Kleikamp 1687617ba13bSMingming Cao add = EXT4_BLOCKS_PER_GROUP(sb) - last; 1688ac27a0ecSDave Kleikamp 1689ac27a0ecSDave Kleikamp if (o_blocks_count + add < o_blocks_count) { 169012062dddSEric Sandeen ext4_warning(sb, "blocks_count overflow"); 1691ac27a0ecSDave Kleikamp return -EINVAL; 1692ac27a0ecSDave Kleikamp } 1693ac27a0ecSDave Kleikamp 1694ac27a0ecSDave Kleikamp if (o_blocks_count + add > n_blocks_count) 1695ac27a0ecSDave Kleikamp add = n_blocks_count - o_blocks_count; 1696ac27a0ecSDave Kleikamp 1697ac27a0ecSDave Kleikamp if (o_blocks_count + add < n_blocks_count) 169812062dddSEric Sandeen ext4_warning(sb, "will only finish group (%llu blocks, %u new)", 1699ac27a0ecSDave Kleikamp o_blocks_count + add, add); 1700ac27a0ecSDave Kleikamp 1701ac27a0ecSDave Kleikamp /* See if the device is actually as big as what was requested */ 1702ac27a0ecSDave Kleikamp bh = sb_bread(sb, o_blocks_count + add - 1); 1703ac27a0ecSDave Kleikamp if (!bh) { 170412062dddSEric Sandeen ext4_warning(sb, "can't read last block, resize aborted"); 1705ac27a0ecSDave Kleikamp return -ENOSPC; 1706ac27a0ecSDave Kleikamp } 1707ac27a0ecSDave Kleikamp brelse(bh); 1708ac27a0ecSDave Kleikamp 1709ac27a0ecSDave Kleikamp /* We will update the superblock, one block bitmap, and 1710617ba13bSMingming Cao * one group descriptor via ext4_free_blocks(). 1711ac27a0ecSDave Kleikamp */ 1712617ba13bSMingming Cao handle = ext4_journal_start_sb(sb, 3); 1713ac27a0ecSDave Kleikamp if (IS_ERR(handle)) { 1714ac27a0ecSDave Kleikamp err = PTR_ERR(handle); 171512062dddSEric Sandeen ext4_warning(sb, "error %d on journal start", err); 1716ac27a0ecSDave Kleikamp goto exit_put; 1717ac27a0ecSDave Kleikamp } 1718ac27a0ecSDave Kleikamp 1719617ba13bSMingming Cao if ((err = ext4_journal_get_write_access(handle, 1720617ba13bSMingming Cao EXT4_SB(sb)->s_sbh))) { 172112062dddSEric Sandeen ext4_warning(sb, "error %d on journal write access", err); 1722617ba13bSMingming Cao ext4_journal_stop(handle); 1723ac27a0ecSDave Kleikamp goto exit_put; 1724ac27a0ecSDave Kleikamp } 1725bd81d8eeSLaurent Vivier ext4_blocks_count_set(es, o_blocks_count + add); 1726c549a95dSEric Sandeen ext4_debug("freeing blocks %llu through %llu\n", o_blocks_count, 1727ac27a0ecSDave Kleikamp o_blocks_count + add); 1728e21675d4SAneesh Kumar K.V /* We add the blocks to the bitmap and set the group need init bit */ 1729cc7365dfSYongqiang Yang err = ext4_group_add_blocks(handle, sb, o_blocks_count, add); 1730a0375156STheodore Ts'o ext4_handle_dirty_super(handle, sb); 17312ae02107SMingming Cao ext4_debug("freed blocks %llu through %llu\n", o_blocks_count, 1732ac27a0ecSDave Kleikamp o_blocks_count + add); 1733cc7365dfSYongqiang Yang err2 = ext4_journal_stop(handle); 1734cc7365dfSYongqiang Yang if (!err && err2) 1735cc7365dfSYongqiang Yang err = err2; 1736cc7365dfSYongqiang Yang 1737cc7365dfSYongqiang Yang if (err) 1738ac27a0ecSDave Kleikamp goto exit_put; 17395f21b0e6SFrederic Bohe 1740ac27a0ecSDave Kleikamp if (test_opt(sb, DEBUG)) 1741bd81d8eeSLaurent Vivier printk(KERN_DEBUG "EXT4-fs: extended group to %llu blocks\n", 1742bd81d8eeSLaurent Vivier ext4_blocks_count(es)); 1743617ba13bSMingming Cao update_backups(sb, EXT4_SB(sb)->s_sbh->b_blocknr, (char *)es, 1744617ba13bSMingming Cao sizeof(struct ext4_super_block)); 1745ac27a0ecSDave Kleikamp exit_put: 1746ac27a0ecSDave Kleikamp return err; 1747617ba13bSMingming Cao } /* ext4_group_extend */ 1748