1 /* 2 * Copyright (C) International Business Machines Corp., 2000-2004 3 * 4 * This program is free software; you can redistribute it and/or modify 5 * it under the terms of the GNU General Public License as published by 6 * the Free Software Foundation; either version 2 of the License, or 7 * (at your option) any later version. 8 * 9 * This program is distributed in the hope that it will be useful, 10 * but WITHOUT ANY WARRANTY; without even the implied warranty of 11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See 12 * the GNU General Public License for more details. 13 * 14 * You should have received a copy of the GNU General Public License 15 * along with this program; if not, write to the Free Software 16 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA 17 */ 18 19 #include <linux/fs.h> 20 #include <linux/buffer_head.h> 21 #include <linux/quotaops.h> 22 #include "jfs_incore.h" 23 #include "jfs_filsys.h" 24 #include "jfs_metapage.h" 25 #include "jfs_dinode.h" 26 #include "jfs_imap.h" 27 #include "jfs_dmap.h" 28 #include "jfs_superblock.h" 29 #include "jfs_txnmgr.h" 30 #include "jfs_debug.h" 31 32 #define BITSPERPAGE (PSIZE << 3) 33 #define L2MEGABYTE 20 34 #define MEGABYTE (1 << L2MEGABYTE) 35 #define MEGABYTE32 (MEGABYTE << 5) 36 37 /* convert block number to bmap file page number */ 38 #define BLKTODMAPN(b)\ 39 (((b) >> 13) + ((b) >> 23) + ((b) >> 33) + 3 + 1) 40 41 /* 42 * jfs_extendfs() 43 * 44 * function: extend file system; 45 * 46 * |-------------------------------|----------|----------| 47 * file system space fsck inline log 48 * workspace space 49 * 50 * input: 51 * new LVSize: in LV blocks (required) 52 * new LogSize: in LV blocks (optional) 53 * new FSSize: in LV blocks (optional) 54 * 55 * new configuration: 56 * 1. set new LogSize as specified or default from new LVSize; 57 * 2. compute new FSCKSize from new LVSize; 58 * 3. set new FSSize as MIN(FSSize, LVSize-(LogSize+FSCKSize)) where 59 * assert(new FSSize >= old FSSize), 60 * i.e., file system must not be shrunk; 61 */ 62 int jfs_extendfs(struct super_block *sb, s64 newLVSize, int newLogSize) 63 { 64 int rc = 0; 65 struct jfs_sb_info *sbi = JFS_SBI(sb); 66 struct inode *ipbmap = sbi->ipbmap; 67 struct inode *ipbmap2; 68 struct inode *ipimap = sbi->ipimap; 69 struct jfs_log *log = sbi->log; 70 struct bmap *bmp = sbi->bmap; 71 s64 newLogAddress, newFSCKAddress; 72 int newFSCKSize; 73 s64 newMapSize = 0, mapSize; 74 s64 XAddress, XSize, nblocks, xoff, xaddr, t64; 75 s64 oldLVSize; 76 s64 newFSSize; 77 s64 VolumeSize; 78 int newNpages = 0, nPages, newPage, xlen, t32; 79 int tid; 80 int log_formatted = 0; 81 struct inode *iplist[1]; 82 struct jfs_superblock *j_sb, *j_sb2; 83 s64 old_agsize; 84 int agsizechanged = 0; 85 struct buffer_head *bh, *bh2; 86 87 /* If the volume hasn't grown, get out now */ 88 89 if (sbi->mntflag & JFS_INLINELOG) 90 oldLVSize = addressPXD(&sbi->logpxd) + lengthPXD(&sbi->logpxd); 91 else 92 oldLVSize = addressPXD(&sbi->fsckpxd) + 93 lengthPXD(&sbi->fsckpxd); 94 95 if (oldLVSize >= newLVSize) { 96 printk(KERN_WARNING 97 "jfs_extendfs: volume hasn't grown, returning\n"); 98 goto out; 99 } 100 101 VolumeSize = sb->s_bdev->bd_inode->i_size >> sb->s_blocksize_bits; 102 103 if (VolumeSize) { 104 if (newLVSize > VolumeSize) { 105 printk(KERN_WARNING "jfs_extendfs: invalid size\n"); 106 rc = -EINVAL; 107 goto out; 108 } 109 } else { 110 /* check the device */ 111 bh = sb_bread(sb, newLVSize - 1); 112 if (!bh) { 113 printk(KERN_WARNING "jfs_extendfs: invalid size\n"); 114 rc = -EINVAL; 115 goto out; 116 } 117 bforget(bh); 118 } 119 120 /* Can't extend write-protected drive */ 121 122 if (isReadOnly(ipbmap)) { 123 printk(KERN_WARNING "jfs_extendfs: read-only file system\n"); 124 rc = -EROFS; 125 goto out; 126 } 127 128 /* 129 * reconfigure LV spaces 130 * --------------------- 131 * 132 * validate new size, or, if not specified, determine new size 133 */ 134 135 /* 136 * reconfigure inline log space: 137 */ 138 if ((sbi->mntflag & JFS_INLINELOG)) { 139 if (newLogSize == 0) { 140 /* 141 * no size specified: default to 1/256 of aggregate 142 * size; rounded up to a megabyte boundary; 143 */ 144 newLogSize = newLVSize >> 8; 145 t32 = (1 << (20 - sbi->l2bsize)) - 1; 146 newLogSize = (newLogSize + t32) & ~t32; 147 newLogSize = 148 min(newLogSize, MEGABYTE32 >> sbi->l2bsize); 149 } else { 150 /* 151 * convert the newLogSize to fs blocks. 152 * 153 * Since this is given in megabytes, it will always be 154 * an even number of pages. 155 */ 156 newLogSize = (newLogSize * MEGABYTE) >> sbi->l2bsize; 157 } 158 159 } else 160 newLogSize = 0; 161 162 newLogAddress = newLVSize - newLogSize; 163 164 /* 165 * reconfigure fsck work space: 166 * 167 * configure it to the end of the logical volume regardless of 168 * whether file system extends to the end of the aggregate; 169 * Need enough 4k pages to cover: 170 * - 1 bit per block in aggregate rounded up to BPERDMAP boundary 171 * - 1 extra page to handle control page and intermediate level pages 172 * - 50 extra pages for the chkdsk service log 173 */ 174 t64 = ((newLVSize - newLogSize + BPERDMAP - 1) >> L2BPERDMAP) 175 << L2BPERDMAP; 176 t32 = DIV_ROUND_UP(t64, BITSPERPAGE) + 1 + 50; 177 newFSCKSize = t32 << sbi->l2nbperpage; 178 newFSCKAddress = newLogAddress - newFSCKSize; 179 180 /* 181 * compute new file system space; 182 */ 183 newFSSize = newLVSize - newLogSize - newFSCKSize; 184 185 /* file system cannot be shrunk */ 186 if (newFSSize < bmp->db_mapsize) { 187 rc = -EINVAL; 188 goto out; 189 } 190 191 /* 192 * If we're expanding enough that the inline log does not overlap 193 * the old one, we can format the new log before we quiesce the 194 * filesystem. 195 */ 196 if ((sbi->mntflag & JFS_INLINELOG) && (newLogAddress > oldLVSize)) { 197 if ((rc = lmLogFormat(log, newLogAddress, newLogSize))) 198 goto out; 199 log_formatted = 1; 200 } 201 /* 202 * quiesce file system 203 * 204 * (prepare to move the inline log and to prevent map update) 205 * 206 * block any new transactions and wait for completion of 207 * all wip transactions and flush modified pages s.t. 208 * on-disk file system is in consistent state and 209 * log is not required for recovery. 210 */ 211 txQuiesce(sb); 212 213 /* Reset size of direct inode */ 214 sbi->direct_inode->i_size = sb->s_bdev->bd_inode->i_size; 215 216 if (sbi->mntflag & JFS_INLINELOG) { 217 /* 218 * deactivate old inline log 219 */ 220 lmLogShutdown(log); 221 222 /* 223 * mark on-disk super block for fs in transition; 224 * 225 * update on-disk superblock for the new space configuration 226 * of inline log space and fsck work space descriptors: 227 * N.B. FS descriptor is NOT updated; 228 * 229 * crash recovery: 230 * logredo(): if FM_EXTENDFS, return to fsck() for cleanup; 231 * fsck(): if FM_EXTENDFS, reformat inline log and fsck 232 * workspace from superblock inline log descriptor and fsck 233 * workspace descriptor; 234 */ 235 236 /* read in superblock */ 237 if ((rc = readSuper(sb, &bh))) 238 goto error_out; 239 j_sb = (struct jfs_superblock *)bh->b_data; 240 241 /* mark extendfs() in progress */ 242 j_sb->s_state |= cpu_to_le32(FM_EXTENDFS); 243 j_sb->s_xsize = cpu_to_le64(newFSSize); 244 PXDaddress(&j_sb->s_xfsckpxd, newFSCKAddress); 245 PXDlength(&j_sb->s_xfsckpxd, newFSCKSize); 246 PXDaddress(&j_sb->s_xlogpxd, newLogAddress); 247 PXDlength(&j_sb->s_xlogpxd, newLogSize); 248 249 /* synchronously update superblock */ 250 mark_buffer_dirty(bh); 251 sync_dirty_buffer(bh); 252 brelse(bh); 253 254 /* 255 * format new inline log synchronously; 256 * 257 * crash recovery: if log move in progress, 258 * reformat log and exit success; 259 */ 260 if (!log_formatted) 261 if ((rc = lmLogFormat(log, newLogAddress, newLogSize))) 262 goto error_out; 263 264 /* 265 * activate new log 266 */ 267 log->base = newLogAddress; 268 log->size = newLogSize >> (L2LOGPSIZE - sb->s_blocksize_bits); 269 if ((rc = lmLogInit(log))) 270 goto error_out; 271 } 272 273 /* 274 * extend block allocation map 275 * --------------------------- 276 * 277 * extendfs() for new extension, retry after crash recovery; 278 * 279 * note: both logredo() and fsck() rebuild map from 280 * the bitmap and configuration parameter from superblock 281 * (disregarding all other control information in the map); 282 * 283 * superblock: 284 * s_size: aggregate size in physical blocks; 285 */ 286 /* 287 * compute the new block allocation map configuration 288 * 289 * map dinode: 290 * di_size: map file size in byte; 291 * di_nblocks: number of blocks allocated for map file; 292 * di_mapsize: number of blocks in aggregate (covered by map); 293 * map control page: 294 * db_mapsize: number of blocks in aggregate (covered by map); 295 */ 296 newMapSize = newFSSize; 297 /* number of data pages of new bmap file: 298 * roundup new size to full dmap page boundary and 299 * add 1 extra dmap page for next extendfs() 300 */ 301 t64 = (newMapSize - 1) + BPERDMAP; 302 newNpages = BLKTODMAPN(t64) + 1; 303 304 /* 305 * extend map from current map (WITHOUT growing mapfile) 306 * 307 * map new extension with unmapped part of the last partial 308 * dmap page, if applicable, and extra page(s) allocated 309 * at end of bmap by mkfs() or previous extendfs(); 310 */ 311 extendBmap: 312 /* compute number of blocks requested to extend */ 313 mapSize = bmp->db_mapsize; 314 XAddress = mapSize; /* eXtension Address */ 315 XSize = newMapSize - mapSize; /* eXtension Size */ 316 old_agsize = bmp->db_agsize; /* We need to know if this changes */ 317 318 /* compute number of blocks that can be extended by current mapfile */ 319 t64 = dbMapFileSizeToMapSize(ipbmap); 320 if (mapSize > t64) { 321 printk(KERN_ERR "jfs_extendfs: mapSize (0x%Lx) > t64 (0x%Lx)\n", 322 (long long) mapSize, (long long) t64); 323 rc = -EIO; 324 goto error_out; 325 } 326 nblocks = min(t64 - mapSize, XSize); 327 328 /* 329 * update map pages for new extension: 330 * 331 * update/init dmap and bubble up the control hierarchy 332 * incrementally fold up dmaps into upper levels; 333 * update bmap control page; 334 */ 335 if ((rc = dbExtendFS(ipbmap, XAddress, nblocks))) 336 goto error_out; 337 338 agsizechanged |= (bmp->db_agsize != old_agsize); 339 340 /* 341 * the map now has extended to cover additional nblocks: 342 * dn_mapsize = oldMapsize + nblocks; 343 */ 344 /* ipbmap->i_mapsize += nblocks; */ 345 XSize -= nblocks; 346 347 /* 348 * grow map file to cover remaining extension 349 * and/or one extra dmap page for next extendfs(); 350 * 351 * allocate new map pages and its backing blocks, and 352 * update map file xtree 353 */ 354 /* compute number of data pages of current bmap file */ 355 nPages = ipbmap->i_size >> L2PSIZE; 356 357 /* need to grow map file ? */ 358 if (nPages == newNpages) 359 goto finalizeBmap; 360 361 /* 362 * grow bmap file for the new map pages required: 363 * 364 * allocate growth at the start of newly extended region; 365 * bmap file only grows sequentially, i.e., both data pages 366 * and possibly xtree index pages may grow in append mode, 367 * s.t. logredo() can reconstruct pre-extension state 368 * by washing away bmap file of pages outside s_size boundary; 369 */ 370 /* 371 * journal map file growth as if a regular file growth: 372 * (note: bmap is created with di_mode = IFJOURNAL|IFREG); 373 * 374 * journaling of bmap file growth is not required since 375 * logredo() do/can not use log records of bmap file growth 376 * but it provides careful write semantics, pmap update, etc.; 377 */ 378 /* synchronous write of data pages: bmap data pages are 379 * cached in meta-data cache, and not written out 380 * by txCommit(); 381 */ 382 filemap_fdatawait(ipbmap->i_mapping); 383 filemap_write_and_wait(ipbmap->i_mapping); 384 diWriteSpecial(ipbmap, 0); 385 386 newPage = nPages; /* first new page number */ 387 xoff = newPage << sbi->l2nbperpage; 388 xlen = (newNpages - nPages) << sbi->l2nbperpage; 389 xlen = min(xlen, (int) nblocks) & ~(sbi->nbperpage - 1); 390 xaddr = XAddress; 391 392 tid = txBegin(sb, COMMIT_FORCE); 393 394 if ((rc = xtAppend(tid, ipbmap, 0, xoff, nblocks, &xlen, &xaddr, 0))) { 395 txEnd(tid); 396 goto error_out; 397 } 398 /* update bmap file size */ 399 ipbmap->i_size += xlen << sbi->l2bsize; 400 inode_add_bytes(ipbmap, xlen << sbi->l2bsize); 401 402 iplist[0] = ipbmap; 403 rc = txCommit(tid, 1, &iplist[0], COMMIT_FORCE); 404 405 txEnd(tid); 406 407 if (rc) 408 goto error_out; 409 410 /* 411 * map file has been grown now to cover extension to further out; 412 * di_size = new map file size; 413 * 414 * if huge extension, the previous extension based on previous 415 * map file size may not have been sufficient to cover whole extension 416 * (it could have been used up for new map pages), 417 * but the newly grown map file now covers lot bigger new free space 418 * available for further extension of map; 419 */ 420 /* any more blocks to extend ? */ 421 if (XSize) 422 goto extendBmap; 423 424 finalizeBmap: 425 /* finalize bmap */ 426 dbFinalizeBmap(ipbmap); 427 428 /* 429 * update inode allocation map 430 * --------------------------- 431 * 432 * move iag lists from old to new iag; 433 * agstart field is not updated for logredo() to reconstruct 434 * iag lists if system crash occurs. 435 * (computation of ag number from agstart based on agsize 436 * will correctly identify the new ag); 437 */ 438 /* if new AG size the same as old AG size, done! */ 439 if (agsizechanged) { 440 if ((rc = diExtendFS(ipimap, ipbmap))) 441 goto error_out; 442 443 /* finalize imap */ 444 if ((rc = diSync(ipimap))) 445 goto error_out; 446 } 447 448 /* 449 * finalize 450 * -------- 451 * 452 * extension is committed when on-disk super block is 453 * updated with new descriptors: logredo will recover 454 * crash before it to pre-extension state; 455 */ 456 457 /* sync log to skip log replay of bmap file growth transaction; */ 458 /* lmLogSync(log, 1); */ 459 460 /* 461 * synchronous write bmap global control page; 462 * for crash before completion of write 463 * logredo() will recover to pre-extendfs state; 464 * for crash after completion of write, 465 * logredo() will recover post-extendfs state; 466 */ 467 if ((rc = dbSync(ipbmap))) 468 goto error_out; 469 470 /* 471 * copy primary bmap inode to secondary bmap inode 472 */ 473 474 ipbmap2 = diReadSpecial(sb, BMAP_I, 1); 475 if (ipbmap2 == NULL) { 476 printk(KERN_ERR "jfs_extendfs: diReadSpecial(bmap) failed\n"); 477 goto error_out; 478 } 479 memcpy(&JFS_IP(ipbmap2)->i_xtroot, &JFS_IP(ipbmap)->i_xtroot, 288); 480 ipbmap2->i_size = ipbmap->i_size; 481 ipbmap2->i_blocks = ipbmap->i_blocks; 482 483 diWriteSpecial(ipbmap2, 1); 484 diFreeSpecial(ipbmap2); 485 486 /* 487 * update superblock 488 */ 489 if ((rc = readSuper(sb, &bh))) 490 goto error_out; 491 j_sb = (struct jfs_superblock *)bh->b_data; 492 493 /* mark extendfs() completion */ 494 j_sb->s_state &= cpu_to_le32(~FM_EXTENDFS); 495 j_sb->s_size = cpu_to_le64(bmp->db_mapsize << 496 le16_to_cpu(j_sb->s_l2bfactor)); 497 j_sb->s_agsize = cpu_to_le32(bmp->db_agsize); 498 499 /* update inline log space descriptor */ 500 if (sbi->mntflag & JFS_INLINELOG) { 501 PXDaddress(&(j_sb->s_logpxd), newLogAddress); 502 PXDlength(&(j_sb->s_logpxd), newLogSize); 503 } 504 505 /* record log's mount serial number */ 506 j_sb->s_logserial = cpu_to_le32(log->serial); 507 508 /* update fsck work space descriptor */ 509 PXDaddress(&(j_sb->s_fsckpxd), newFSCKAddress); 510 PXDlength(&(j_sb->s_fsckpxd), newFSCKSize); 511 j_sb->s_fscklog = 1; 512 /* sb->s_fsckloglen remains the same */ 513 514 /* Update secondary superblock */ 515 bh2 = sb_bread(sb, SUPER2_OFF >> sb->s_blocksize_bits); 516 if (bh2) { 517 j_sb2 = (struct jfs_superblock *)bh2->b_data; 518 memcpy(j_sb2, j_sb, sizeof (struct jfs_superblock)); 519 520 mark_buffer_dirty(bh); 521 sync_dirty_buffer(bh2); 522 brelse(bh2); 523 } 524 525 /* write primary superblock */ 526 mark_buffer_dirty(bh); 527 sync_dirty_buffer(bh); 528 brelse(bh); 529 530 goto resume; 531 532 error_out: 533 jfs_error(sb, "jfs_extendfs"); 534 535 resume: 536 /* 537 * resume file system transactions 538 */ 539 txResume(sb); 540 541 out: 542 return rc; 543 } 544