1748de673SAkira Fujita /* 2748de673SAkira Fujita * Copyright (c) 2008,2009 NEC Software Tohoku, Ltd. 3748de673SAkira Fujita * Written by Takashi Sato <t-sato@yk.jp.nec.com> 4748de673SAkira Fujita * Akira Fujita <a-fujita@rs.jp.nec.com> 5748de673SAkira Fujita * 6748de673SAkira Fujita * This program is free software; you can redistribute it and/or modify it 7748de673SAkira Fujita * under the terms of version 2.1 of the GNU Lesser General Public License 8748de673SAkira Fujita * as published by the Free Software Foundation. 9748de673SAkira Fujita * 10748de673SAkira Fujita * This program is distributed in the hope that it will be useful, 11748de673SAkira Fujita * but WITHOUT ANY WARRANTY; without even the implied warranty of 12748de673SAkira Fujita * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 13748de673SAkira Fujita * GNU General Public License for more details. 14748de673SAkira Fujita */ 15748de673SAkira Fujita 16748de673SAkira Fujita #include <linux/fs.h> 17748de673SAkira Fujita #include <linux/quotaops.h> 18748de673SAkira Fujita #include "ext4_jbd2.h" 19748de673SAkira Fujita #include "ext4_extents.h" 20748de673SAkira Fujita #include "ext4.h" 21748de673SAkira Fujita 22e8505970SAkira Fujita /** 23e8505970SAkira Fujita * get_ext_path - Find an extent path for designated logical block number. 24e8505970SAkira Fujita * 25e8505970SAkira Fujita * @inode: an inode which is searched 26e8505970SAkira Fujita * @lblock: logical block number to find an extent path 27e8505970SAkira Fujita * @path: pointer to an extent path pointer (for output) 28e8505970SAkira Fujita * 29e8505970SAkira Fujita * ext4_ext_find_extent wrapper. Return 0 on success, or a negative error value 30e8505970SAkira Fujita * on failure. 
31e8505970SAkira Fujita */ 32e8505970SAkira Fujita static inline int 33e8505970SAkira Fujita get_ext_path(struct inode *inode, ext4_lblk_t lblock, 34e8505970SAkira Fujita struct ext4_ext_path **path) 35e8505970SAkira Fujita { 36e8505970SAkira Fujita int ret = 0; 37e8505970SAkira Fujita 38e8505970SAkira Fujita *path = ext4_ext_find_extent(inode, lblock, *path); 39e8505970SAkira Fujita if (IS_ERR(*path)) { 40e8505970SAkira Fujita ret = PTR_ERR(*path); 41e8505970SAkira Fujita *path = NULL; 42347fa6f1SAkira Fujita } else if ((*path)[ext_depth(inode)].p_ext == NULL) 43347fa6f1SAkira Fujita ret = -ENODATA; 44347fa6f1SAkira Fujita 45e8505970SAkira Fujita return ret; 46e8505970SAkira Fujita } 47748de673SAkira Fujita 48748de673SAkira Fujita /** 49748de673SAkira Fujita * copy_extent_status - Copy the extent's initialization status 50748de673SAkira Fujita * 51748de673SAkira Fujita * @src: an extent for getting initialize status 52748de673SAkira Fujita * @dest: an extent to be set the status 53748de673SAkira Fujita */ 54748de673SAkira Fujita static void 55748de673SAkira Fujita copy_extent_status(struct ext4_extent *src, struct ext4_extent *dest) 56748de673SAkira Fujita { 57748de673SAkira Fujita if (ext4_ext_is_uninitialized(src)) 58748de673SAkira Fujita ext4_ext_mark_uninitialized(dest); 59748de673SAkira Fujita else 60748de673SAkira Fujita dest->ee_len = cpu_to_le16(ext4_ext_get_actual_len(dest)); 61748de673SAkira Fujita } 62748de673SAkira Fujita 63748de673SAkira Fujita /** 64748de673SAkira Fujita * mext_next_extent - Search for the next extent and set it to "extent" 65748de673SAkira Fujita * 66748de673SAkira Fujita * @inode: inode which is searched 67748de673SAkira Fujita * @path: this will obtain data for the next extent 68748de673SAkira Fujita * @extent: pointer to the next extent we have just gotten 69748de673SAkira Fujita * 70748de673SAkira Fujita * Search the next extent in the array of ext4_ext_path structure (@path) 71748de673SAkira Fujita * and set it to ext4_extent 
structure (@extent). In addition, the member of 72748de673SAkira Fujita * @path (->p_ext) also points the next extent. Return 0 on success, 1 if 73748de673SAkira Fujita * ext4_ext_path structure refers to the last extent, or a negative error 74748de673SAkira Fujita * value on failure. 75748de673SAkira Fujita */ 76748de673SAkira Fujita static int 77748de673SAkira Fujita mext_next_extent(struct inode *inode, struct ext4_ext_path *path, 78748de673SAkira Fujita struct ext4_extent **extent) 79748de673SAkira Fujita { 80fc04cb49SAkira Fujita struct ext4_extent_header *eh; 81748de673SAkira Fujita int ppos, leaf_ppos = path->p_depth; 82748de673SAkira Fujita 83748de673SAkira Fujita ppos = leaf_ppos; 84748de673SAkira Fujita if (EXT_LAST_EXTENT(path[ppos].p_hdr) > path[ppos].p_ext) { 85748de673SAkira Fujita /* leaf block */ 86748de673SAkira Fujita *extent = ++path[ppos].p_ext; 87fc04cb49SAkira Fujita path[ppos].p_block = ext_pblock(path[ppos].p_ext); 88748de673SAkira Fujita return 0; 89748de673SAkira Fujita } 90748de673SAkira Fujita 91748de673SAkira Fujita while (--ppos >= 0) { 92748de673SAkira Fujita if (EXT_LAST_INDEX(path[ppos].p_hdr) > 93748de673SAkira Fujita path[ppos].p_idx) { 94748de673SAkira Fujita int cur_ppos = ppos; 95748de673SAkira Fujita 96748de673SAkira Fujita /* index block */ 97748de673SAkira Fujita path[ppos].p_idx++; 98748de673SAkira Fujita path[ppos].p_block = idx_pblock(path[ppos].p_idx); 99748de673SAkira Fujita if (path[ppos+1].p_bh) 100748de673SAkira Fujita brelse(path[ppos+1].p_bh); 101748de673SAkira Fujita path[ppos+1].p_bh = 102748de673SAkira Fujita sb_bread(inode->i_sb, path[ppos].p_block); 103748de673SAkira Fujita if (!path[ppos+1].p_bh) 104748de673SAkira Fujita return -EIO; 105748de673SAkira Fujita path[ppos+1].p_hdr = 106748de673SAkira Fujita ext_block_hdr(path[ppos+1].p_bh); 107748de673SAkira Fujita 108748de673SAkira Fujita /* Halfway index block */ 109748de673SAkira Fujita while (++cur_ppos < leaf_ppos) { 110748de673SAkira Fujita 
path[cur_ppos].p_idx = 111748de673SAkira Fujita EXT_FIRST_INDEX(path[cur_ppos].p_hdr); 112748de673SAkira Fujita path[cur_ppos].p_block = 113748de673SAkira Fujita idx_pblock(path[cur_ppos].p_idx); 114748de673SAkira Fujita if (path[cur_ppos+1].p_bh) 115748de673SAkira Fujita brelse(path[cur_ppos+1].p_bh); 116748de673SAkira Fujita path[cur_ppos+1].p_bh = sb_bread(inode->i_sb, 117748de673SAkira Fujita path[cur_ppos].p_block); 118748de673SAkira Fujita if (!path[cur_ppos+1].p_bh) 119748de673SAkira Fujita return -EIO; 120748de673SAkira Fujita path[cur_ppos+1].p_hdr = 121748de673SAkira Fujita ext_block_hdr(path[cur_ppos+1].p_bh); 122748de673SAkira Fujita } 123748de673SAkira Fujita 124fc04cb49SAkira Fujita path[leaf_ppos].p_ext = *extent = NULL; 125fc04cb49SAkira Fujita 126fc04cb49SAkira Fujita eh = path[leaf_ppos].p_hdr; 127fc04cb49SAkira Fujita if (le16_to_cpu(eh->eh_entries) == 0) 128fc04cb49SAkira Fujita /* empty leaf is found */ 129fc04cb49SAkira Fujita return -ENODATA; 130fc04cb49SAkira Fujita 131748de673SAkira Fujita /* leaf block */ 132748de673SAkira Fujita path[leaf_ppos].p_ext = *extent = 133748de673SAkira Fujita EXT_FIRST_EXTENT(path[leaf_ppos].p_hdr); 134fc04cb49SAkira Fujita path[leaf_ppos].p_block = 135fc04cb49SAkira Fujita ext_pblock(path[leaf_ppos].p_ext); 136748de673SAkira Fujita return 0; 137748de673SAkira Fujita } 138748de673SAkira Fujita } 139748de673SAkira Fujita /* We found the last extent */ 140748de673SAkira Fujita return 1; 141748de673SAkira Fujita } 142748de673SAkira Fujita 143748de673SAkira Fujita /** 1442147b1a6SAkira Fujita * mext_check_null_inode - NULL check for two inodes 1452147b1a6SAkira Fujita * 1462147b1a6SAkira Fujita * If inode1 or inode2 is NULL, return -EIO. Otherwise, return 0. 
1472147b1a6SAkira Fujita */ 1482147b1a6SAkira Fujita static int 1492147b1a6SAkira Fujita mext_check_null_inode(struct inode *inode1, struct inode *inode2, 1502147b1a6SAkira Fujita const char *function) 1512147b1a6SAkira Fujita { 1522147b1a6SAkira Fujita int ret = 0; 1532147b1a6SAkira Fujita 1542147b1a6SAkira Fujita if (inode1 == NULL) { 1552147b1a6SAkira Fujita ext4_error(inode2->i_sb, function, 1562147b1a6SAkira Fujita "Both inodes should not be NULL: " 1572147b1a6SAkira Fujita "inode1 NULL inode2 %lu", inode2->i_ino); 1582147b1a6SAkira Fujita ret = -EIO; 1592147b1a6SAkira Fujita } else if (inode2 == NULL) { 1602147b1a6SAkira Fujita ext4_error(inode1->i_sb, function, 1612147b1a6SAkira Fujita "Both inodes should not be NULL: " 1622147b1a6SAkira Fujita "inode1 %lu inode2 NULL", inode1->i_ino); 1632147b1a6SAkira Fujita ret = -EIO; 1642147b1a6SAkira Fujita } 1652147b1a6SAkira Fujita return ret; 1662147b1a6SAkira Fujita } 1672147b1a6SAkira Fujita 1682147b1a6SAkira Fujita /** 169fc04cb49SAkira Fujita * double_down_write_data_sem - Acquire two inodes' write lock of i_data_sem 170748de673SAkira Fujita * 171748de673SAkira Fujita * @orig_inode: original inode structure 172748de673SAkira Fujita * @donor_inode: donor inode structure 173fc04cb49SAkira Fujita * Acquire write lock of i_data_sem of the two inodes (orig and donor) by 174fc04cb49SAkira Fujita * i_ino order. 175748de673SAkira Fujita */ 176748de673SAkira Fujita static void 177fc04cb49SAkira Fujita double_down_write_data_sem(struct inode *orig_inode, struct inode *donor_inode) 178748de673SAkira Fujita { 179748de673SAkira Fujita struct inode *first = orig_inode, *second = donor_inode; 180748de673SAkira Fujita 181748de673SAkira Fujita /* 182748de673SAkira Fujita * Use the inode number to provide the stable locking order instead 183748de673SAkira Fujita * of its address, because the C language doesn't guarantee you can 184748de673SAkira Fujita * compare pointers that don't come from the same array. 
185748de673SAkira Fujita */ 186748de673SAkira Fujita if (donor_inode->i_ino < orig_inode->i_ino) { 187748de673SAkira Fujita first = donor_inode; 188748de673SAkira Fujita second = orig_inode; 189748de673SAkira Fujita } 190748de673SAkira Fujita 191748de673SAkira Fujita down_write(&EXT4_I(first)->i_data_sem); 19249bd22bcSAkira Fujita down_write_nested(&EXT4_I(second)->i_data_sem, SINGLE_DEPTH_NESTING); 193748de673SAkira Fujita } 194748de673SAkira Fujita 195748de673SAkira Fujita /** 196fc04cb49SAkira Fujita * double_up_write_data_sem - Release two inodes' write lock of i_data_sem 197748de673SAkira Fujita * 198748de673SAkira Fujita * @orig_inode: original inode structure to be released its lock first 199748de673SAkira Fujita * @donor_inode: donor inode structure to be released its lock second 200fc04cb49SAkira Fujita * Release write lock of i_data_sem of two inodes (orig and donor). 201748de673SAkira Fujita */ 202748de673SAkira Fujita static void 203fc04cb49SAkira Fujita double_up_write_data_sem(struct inode *orig_inode, struct inode *donor_inode) 204748de673SAkira Fujita { 205748de673SAkira Fujita up_write(&EXT4_I(orig_inode)->i_data_sem); 206748de673SAkira Fujita up_write(&EXT4_I(donor_inode)->i_data_sem); 207748de673SAkira Fujita } 208748de673SAkira Fujita 209748de673SAkira Fujita /** 210748de673SAkira Fujita * mext_insert_across_blocks - Insert extents across leaf block 211748de673SAkira Fujita * 212748de673SAkira Fujita * @handle: journal handle 213748de673SAkira Fujita * @orig_inode: original inode 214748de673SAkira Fujita * @o_start: first original extent to be changed 215748de673SAkira Fujita * @o_end: last original extent to be changed 216748de673SAkira Fujita * @start_ext: first new extent to be inserted 217748de673SAkira Fujita * @new_ext: middle of new extent to be inserted 218748de673SAkira Fujita * @end_ext: last new extent to be inserted 219748de673SAkira Fujita * 220748de673SAkira Fujita * Allocate a new leaf block and insert extents into it. 
Return 0 on success, 221748de673SAkira Fujita * or a negative error value on failure. 222748de673SAkira Fujita */ 223748de673SAkira Fujita static int 224748de673SAkira Fujita mext_insert_across_blocks(handle_t *handle, struct inode *orig_inode, 225748de673SAkira Fujita struct ext4_extent *o_start, struct ext4_extent *o_end, 226748de673SAkira Fujita struct ext4_extent *start_ext, struct ext4_extent *new_ext, 227748de673SAkira Fujita struct ext4_extent *end_ext) 228748de673SAkira Fujita { 229748de673SAkira Fujita struct ext4_ext_path *orig_path = NULL; 230748de673SAkira Fujita ext4_lblk_t eblock = 0; 231748de673SAkira Fujita int new_flag = 0; 232748de673SAkira Fujita int end_flag = 0; 233748de673SAkira Fujita int err = 0; 234748de673SAkira Fujita 235748de673SAkira Fujita if (start_ext->ee_len && new_ext->ee_len && end_ext->ee_len) { 236748de673SAkira Fujita if (o_start == o_end) { 237748de673SAkira Fujita 238748de673SAkira Fujita /* start_ext new_ext end_ext 239748de673SAkira Fujita * donor |---------|-----------|--------| 240748de673SAkira Fujita * orig |------------------------------| 241748de673SAkira Fujita */ 242748de673SAkira Fujita end_flag = 1; 243748de673SAkira Fujita } else { 244748de673SAkira Fujita 245748de673SAkira Fujita /* start_ext new_ext end_ext 246748de673SAkira Fujita * donor |---------|----------|---------| 247748de673SAkira Fujita * orig |---------------|--------------| 248748de673SAkira Fujita */ 249748de673SAkira Fujita o_end->ee_block = end_ext->ee_block; 250748de673SAkira Fujita o_end->ee_len = end_ext->ee_len; 251748de673SAkira Fujita ext4_ext_store_pblock(o_end, ext_pblock(end_ext)); 252748de673SAkira Fujita } 253748de673SAkira Fujita 254748de673SAkira Fujita o_start->ee_len = start_ext->ee_len; 255748de673SAkira Fujita new_flag = 1; 256748de673SAkira Fujita 257748de673SAkira Fujita } else if (start_ext->ee_len && new_ext->ee_len && 258748de673SAkira Fujita !end_ext->ee_len && o_start == o_end) { 259748de673SAkira Fujita 260748de673SAkira 
Fujita /* start_ext new_ext 261748de673SAkira Fujita * donor |--------------|---------------| 262748de673SAkira Fujita * orig |------------------------------| 263748de673SAkira Fujita */ 264748de673SAkira Fujita o_start->ee_len = start_ext->ee_len; 265748de673SAkira Fujita new_flag = 1; 266748de673SAkira Fujita 267748de673SAkira Fujita } else if (!start_ext->ee_len && new_ext->ee_len && 268748de673SAkira Fujita end_ext->ee_len && o_start == o_end) { 269748de673SAkira Fujita 270748de673SAkira Fujita /* new_ext end_ext 271748de673SAkira Fujita * donor |--------------|---------------| 272748de673SAkira Fujita * orig |------------------------------| 273748de673SAkira Fujita */ 274748de673SAkira Fujita o_end->ee_block = end_ext->ee_block; 275748de673SAkira Fujita o_end->ee_len = end_ext->ee_len; 276748de673SAkira Fujita ext4_ext_store_pblock(o_end, ext_pblock(end_ext)); 277748de673SAkira Fujita 278748de673SAkira Fujita /* 279748de673SAkira Fujita * Set 0 to the extent block if new_ext was 280748de673SAkira Fujita * the first block. 
281748de673SAkira Fujita */ 282748de673SAkira Fujita if (new_ext->ee_block) 283748de673SAkira Fujita eblock = le32_to_cpu(new_ext->ee_block); 284748de673SAkira Fujita 285748de673SAkira Fujita new_flag = 1; 286748de673SAkira Fujita } else { 287748de673SAkira Fujita ext4_debug("ext4 move extent: Unexpected insert case\n"); 288748de673SAkira Fujita return -EIO; 289748de673SAkira Fujita } 290748de673SAkira Fujita 291748de673SAkira Fujita if (new_flag) { 292e8505970SAkira Fujita err = get_ext_path(orig_inode, eblock, &orig_path); 293347fa6f1SAkira Fujita if (err) 294748de673SAkira Fujita goto out; 295748de673SAkira Fujita 296748de673SAkira Fujita if (ext4_ext_insert_extent(handle, orig_inode, 2970031462bSMingming Cao orig_path, new_ext, 0)) 298748de673SAkira Fujita goto out; 299748de673SAkira Fujita } 300748de673SAkira Fujita 301748de673SAkira Fujita if (end_flag) { 302e8505970SAkira Fujita err = get_ext_path(orig_inode, 303e8505970SAkira Fujita le32_to_cpu(end_ext->ee_block) - 1, &orig_path); 304347fa6f1SAkira Fujita if (err) 305748de673SAkira Fujita goto out; 306748de673SAkira Fujita 307748de673SAkira Fujita if (ext4_ext_insert_extent(handle, orig_inode, 3080031462bSMingming Cao orig_path, end_ext, 0)) 309748de673SAkira Fujita goto out; 310748de673SAkira Fujita } 311748de673SAkira Fujita out: 312748de673SAkira Fujita if (orig_path) { 313748de673SAkira Fujita ext4_ext_drop_refs(orig_path); 314748de673SAkira Fujita kfree(orig_path); 315748de673SAkira Fujita } 316748de673SAkira Fujita 317748de673SAkira Fujita return err; 318748de673SAkira Fujita 319748de673SAkira Fujita } 320748de673SAkira Fujita 321748de673SAkira Fujita /** 322748de673SAkira Fujita * mext_insert_inside_block - Insert new extent to the extent block 323748de673SAkira Fujita * 324748de673SAkira Fujita * @o_start: first original extent to be moved 325748de673SAkira Fujita * @o_end: last original extent to be moved 326748de673SAkira Fujita * @start_ext: first new extent to be inserted 327748de673SAkira 
Fujita * @new_ext: middle of new extent to be inserted 328748de673SAkira Fujita * @end_ext: last new extent to be inserted 329748de673SAkira Fujita * @eh: extent header of target leaf block 330748de673SAkira Fujita * @range_to_move: used to decide how to insert extent 331748de673SAkira Fujita * 332748de673SAkira Fujita * Insert extents into the leaf block. The extent (@o_start) is overwritten 333748de673SAkira Fujita * by inserted extents. 334748de673SAkira Fujita */ 335748de673SAkira Fujita static void 336748de673SAkira Fujita mext_insert_inside_block(struct ext4_extent *o_start, 337748de673SAkira Fujita struct ext4_extent *o_end, 338748de673SAkira Fujita struct ext4_extent *start_ext, 339748de673SAkira Fujita struct ext4_extent *new_ext, 340748de673SAkira Fujita struct ext4_extent *end_ext, 341748de673SAkira Fujita struct ext4_extent_header *eh, 342748de673SAkira Fujita int range_to_move) 343748de673SAkira Fujita { 344748de673SAkira Fujita int i = 0; 345748de673SAkira Fujita unsigned long len; 346748de673SAkira Fujita 347748de673SAkira Fujita /* Move the existing extents */ 348748de673SAkira Fujita if (range_to_move && o_end < EXT_LAST_EXTENT(eh)) { 349748de673SAkira Fujita len = (unsigned long)(EXT_LAST_EXTENT(eh) + 1) - 350748de673SAkira Fujita (unsigned long)(o_end + 1); 351748de673SAkira Fujita memmove(o_end + 1 + range_to_move, o_end + 1, len); 352748de673SAkira Fujita } 353748de673SAkira Fujita 354748de673SAkira Fujita /* Insert start entry */ 355748de673SAkira Fujita if (start_ext->ee_len) 356748de673SAkira Fujita o_start[i++].ee_len = start_ext->ee_len; 357748de673SAkira Fujita 358748de673SAkira Fujita /* Insert new entry */ 359748de673SAkira Fujita if (new_ext->ee_len) { 360748de673SAkira Fujita o_start[i] = *new_ext; 361748de673SAkira Fujita ext4_ext_store_pblock(&o_start[i++], ext_pblock(new_ext)); 362748de673SAkira Fujita } 363748de673SAkira Fujita 364748de673SAkira Fujita /* Insert end entry */ 365748de673SAkira Fujita if (end_ext->ee_len) 
366748de673SAkira Fujita o_start[i] = *end_ext; 367748de673SAkira Fujita 368748de673SAkira Fujita /* Increment the total entries counter on the extent block */ 369748de673SAkira Fujita le16_add_cpu(&eh->eh_entries, range_to_move); 370748de673SAkira Fujita } 371748de673SAkira Fujita 372748de673SAkira Fujita /** 373748de673SAkira Fujita * mext_insert_extents - Insert new extent 374748de673SAkira Fujita * 375748de673SAkira Fujita * @handle: journal handle 376748de673SAkira Fujita * @orig_inode: original inode 377748de673SAkira Fujita * @orig_path: path indicates first extent to be changed 378748de673SAkira Fujita * @o_start: first original extent to be changed 379748de673SAkira Fujita * @o_end: last original extent to be changed 380748de673SAkira Fujita * @start_ext: first new extent to be inserted 381748de673SAkira Fujita * @new_ext: middle of new extent to be inserted 382748de673SAkira Fujita * @end_ext: last new extent to be inserted 383748de673SAkira Fujita * 384748de673SAkira Fujita * Call the function to insert extents. If we cannot add more extents into 385748de673SAkira Fujita * the leaf block, we call mext_insert_across_blocks() to create a 386748de673SAkira Fujita * new leaf block. Otherwise call mext_insert_inside_block(). Return 0 387748de673SAkira Fujita * on success, or a negative error value on failure. 
388748de673SAkira Fujita */ 389748de673SAkira Fujita static int 390748de673SAkira Fujita mext_insert_extents(handle_t *handle, struct inode *orig_inode, 391748de673SAkira Fujita struct ext4_ext_path *orig_path, 392748de673SAkira Fujita struct ext4_extent *o_start, 393748de673SAkira Fujita struct ext4_extent *o_end, 394748de673SAkira Fujita struct ext4_extent *start_ext, 395748de673SAkira Fujita struct ext4_extent *new_ext, 396748de673SAkira Fujita struct ext4_extent *end_ext) 397748de673SAkira Fujita { 398748de673SAkira Fujita struct ext4_extent_header *eh; 399748de673SAkira Fujita unsigned long need_slots, slots_range; 400748de673SAkira Fujita int range_to_move, depth, ret; 401748de673SAkira Fujita 402748de673SAkira Fujita /* 403748de673SAkira Fujita * The extents need to be inserted 404748de673SAkira Fujita * start_extent + new_extent + end_extent. 405748de673SAkira Fujita */ 406748de673SAkira Fujita need_slots = (start_ext->ee_len ? 1 : 0) + (end_ext->ee_len ? 1 : 0) + 407748de673SAkira Fujita (new_ext->ee_len ? 
1 : 0); 408748de673SAkira Fujita 409748de673SAkira Fujita /* The number of slots between start and end */ 410748de673SAkira Fujita slots_range = ((unsigned long)(o_end + 1) - (unsigned long)o_start + 1) 411748de673SAkira Fujita / sizeof(struct ext4_extent); 412748de673SAkira Fujita 413748de673SAkira Fujita /* Range to move the end of extent */ 414748de673SAkira Fujita range_to_move = need_slots - slots_range; 415748de673SAkira Fujita depth = orig_path->p_depth; 416748de673SAkira Fujita orig_path += depth; 417748de673SAkira Fujita eh = orig_path->p_hdr; 418748de673SAkira Fujita 419748de673SAkira Fujita if (depth) { 420748de673SAkira Fujita /* Register to journal */ 421748de673SAkira Fujita ret = ext4_journal_get_write_access(handle, orig_path->p_bh); 422748de673SAkira Fujita if (ret) 423748de673SAkira Fujita return ret; 424748de673SAkira Fujita } 425748de673SAkira Fujita 426748de673SAkira Fujita /* Expansion */ 427748de673SAkira Fujita if (range_to_move > 0 && 428748de673SAkira Fujita (range_to_move > le16_to_cpu(eh->eh_max) 429748de673SAkira Fujita - le16_to_cpu(eh->eh_entries))) { 430748de673SAkira Fujita 431748de673SAkira Fujita ret = mext_insert_across_blocks(handle, orig_inode, o_start, 432748de673SAkira Fujita o_end, start_ext, new_ext, end_ext); 433748de673SAkira Fujita if (ret < 0) 434748de673SAkira Fujita return ret; 435748de673SAkira Fujita } else 436748de673SAkira Fujita mext_insert_inside_block(o_start, o_end, start_ext, new_ext, 437748de673SAkira Fujita end_ext, eh, range_to_move); 438748de673SAkira Fujita 439748de673SAkira Fujita if (depth) { 440748de673SAkira Fujita ret = ext4_handle_dirty_metadata(handle, orig_inode, 441748de673SAkira Fujita orig_path->p_bh); 442748de673SAkira Fujita if (ret) 443748de673SAkira Fujita return ret; 444748de673SAkira Fujita } else { 445748de673SAkira Fujita ret = ext4_mark_inode_dirty(handle, orig_inode); 446748de673SAkira Fujita if (ret < 0) 447748de673SAkira Fujita return ret; 448748de673SAkira Fujita } 
449748de673SAkira Fujita 450748de673SAkira Fujita return 0; 451748de673SAkira Fujita } 452748de673SAkira Fujita 453748de673SAkira Fujita /** 454748de673SAkira Fujita * mext_leaf_block - Move one leaf extent block into the inode. 455748de673SAkira Fujita * 456748de673SAkira Fujita * @handle: journal handle 457748de673SAkira Fujita * @orig_inode: original inode 458748de673SAkira Fujita * @orig_path: path indicates first extent to be changed 459748de673SAkira Fujita * @dext: donor extent 460748de673SAkira Fujita * @from: start offset on the target file 461748de673SAkira Fujita * 462748de673SAkira Fujita * In order to insert extents into the leaf block, we must divide the extent 463748de673SAkira Fujita * in the leaf block into three extents. The one is located to be inserted 464748de673SAkira Fujita * extents, and the others are located around it. 465748de673SAkira Fujita * 466748de673SAkira Fujita * Therefore, this function creates structures to save extents of the leaf 467748de673SAkira Fujita * block, and inserts extents by calling mext_insert_extents() with 468748de673SAkira Fujita * created extents. Return 0 on success, or a negative error value on failure. 
469748de673SAkira Fujita */ 470748de673SAkira Fujita static int 471748de673SAkira Fujita mext_leaf_block(handle_t *handle, struct inode *orig_inode, 472748de673SAkira Fujita struct ext4_ext_path *orig_path, struct ext4_extent *dext, 473748de673SAkira Fujita ext4_lblk_t *from) 474748de673SAkira Fujita { 475748de673SAkira Fujita struct ext4_extent *oext, *o_start, *o_end, *prev_ext; 476748de673SAkira Fujita struct ext4_extent new_ext, start_ext, end_ext; 477748de673SAkira Fujita ext4_lblk_t new_ext_end; 478748de673SAkira Fujita ext4_fsblk_t new_phys_end; 479748de673SAkira Fujita int oext_alen, new_ext_alen, end_ext_alen; 480748de673SAkira Fujita int depth = ext_depth(orig_inode); 481748de673SAkira Fujita int ret; 482748de673SAkira Fujita 483748de673SAkira Fujita o_start = o_end = oext = orig_path[depth].p_ext; 484748de673SAkira Fujita oext_alen = ext4_ext_get_actual_len(oext); 485748de673SAkira Fujita start_ext.ee_len = end_ext.ee_len = 0; 486748de673SAkira Fujita 487748de673SAkira Fujita new_ext.ee_block = cpu_to_le32(*from); 488748de673SAkira Fujita ext4_ext_store_pblock(&new_ext, ext_pblock(dext)); 489748de673SAkira Fujita new_ext.ee_len = dext->ee_len; 490748de673SAkira Fujita new_ext_alen = ext4_ext_get_actual_len(&new_ext); 491748de673SAkira Fujita new_ext_end = le32_to_cpu(new_ext.ee_block) + new_ext_alen - 1; 492748de673SAkira Fujita new_phys_end = ext_pblock(&new_ext) + new_ext_alen - 1; 493748de673SAkira Fujita 494748de673SAkira Fujita /* 495748de673SAkira Fujita * Case: original extent is first 496748de673SAkira Fujita * oext |--------| 497748de673SAkira Fujita * new_ext |--| 498748de673SAkira Fujita * start_ext |--| 499748de673SAkira Fujita */ 500748de673SAkira Fujita if (le32_to_cpu(oext->ee_block) < le32_to_cpu(new_ext.ee_block) && 501748de673SAkira Fujita le32_to_cpu(new_ext.ee_block) < 502748de673SAkira Fujita le32_to_cpu(oext->ee_block) + oext_alen) { 503748de673SAkira Fujita start_ext.ee_len = cpu_to_le16(le32_to_cpu(new_ext.ee_block) - 
504748de673SAkira Fujita le32_to_cpu(oext->ee_block)); 505748de673SAkira Fujita copy_extent_status(oext, &start_ext); 506748de673SAkira Fujita } else if (oext > EXT_FIRST_EXTENT(orig_path[depth].p_hdr)) { 507748de673SAkira Fujita prev_ext = oext - 1; 508748de673SAkira Fujita /* 509748de673SAkira Fujita * We can merge new_ext into previous extent, 510748de673SAkira Fujita * if these are contiguous and same extent type. 511748de673SAkira Fujita */ 512748de673SAkira Fujita if (ext4_can_extents_be_merged(orig_inode, prev_ext, 513748de673SAkira Fujita &new_ext)) { 514748de673SAkira Fujita o_start = prev_ext; 515748de673SAkira Fujita start_ext.ee_len = cpu_to_le16( 516748de673SAkira Fujita ext4_ext_get_actual_len(prev_ext) + 517748de673SAkira Fujita new_ext_alen); 518748de673SAkira Fujita copy_extent_status(prev_ext, &start_ext); 519748de673SAkira Fujita new_ext.ee_len = 0; 520748de673SAkira Fujita } 521748de673SAkira Fujita } 522748de673SAkira Fujita 523748de673SAkira Fujita /* 524748de673SAkira Fujita * Case: new_ext_end must be less than oext 525748de673SAkira Fujita * oext |-----------| 526748de673SAkira Fujita * new_ext |-------| 527748de673SAkira Fujita */ 5282147b1a6SAkira Fujita if (le32_to_cpu(oext->ee_block) + oext_alen - 1 < new_ext_end) { 5292147b1a6SAkira Fujita ext4_error(orig_inode->i_sb, __func__, 5302147b1a6SAkira Fujita "new_ext_end(%u) should be less than or equal to " 5312147b1a6SAkira Fujita "oext->ee_block(%u) + oext_alen(%d) - 1", 5322147b1a6SAkira Fujita new_ext_end, le32_to_cpu(oext->ee_block), 5332147b1a6SAkira Fujita oext_alen); 5342147b1a6SAkira Fujita ret = -EIO; 5352147b1a6SAkira Fujita goto out; 5362147b1a6SAkira Fujita } 537748de673SAkira Fujita 538748de673SAkira Fujita /* 539748de673SAkira Fujita * Case: new_ext is smaller than original extent 540748de673SAkira Fujita * oext |---------------| 541748de673SAkira Fujita * new_ext |-----------| 542748de673SAkira Fujita * end_ext |---| 543748de673SAkira Fujita */ 544748de673SAkira Fujita if 
(le32_to_cpu(oext->ee_block) <= new_ext_end && 545748de673SAkira Fujita new_ext_end < le32_to_cpu(oext->ee_block) + oext_alen - 1) { 546748de673SAkira Fujita end_ext.ee_len = 547748de673SAkira Fujita cpu_to_le16(le32_to_cpu(oext->ee_block) + 548748de673SAkira Fujita oext_alen - 1 - new_ext_end); 549748de673SAkira Fujita copy_extent_status(oext, &end_ext); 550748de673SAkira Fujita end_ext_alen = ext4_ext_get_actual_len(&end_ext); 551748de673SAkira Fujita ext4_ext_store_pblock(&end_ext, 552748de673SAkira Fujita (ext_pblock(o_end) + oext_alen - end_ext_alen)); 553748de673SAkira Fujita end_ext.ee_block = 554748de673SAkira Fujita cpu_to_le32(le32_to_cpu(o_end->ee_block) + 555748de673SAkira Fujita oext_alen - end_ext_alen); 556748de673SAkira Fujita } 557748de673SAkira Fujita 558748de673SAkira Fujita ret = mext_insert_extents(handle, orig_inode, orig_path, o_start, 559748de673SAkira Fujita o_end, &start_ext, &new_ext, &end_ext); 5602147b1a6SAkira Fujita out: 561748de673SAkira Fujita return ret; 562748de673SAkira Fujita } 563748de673SAkira Fujita 564748de673SAkira Fujita /** 565748de673SAkira Fujita * mext_calc_swap_extents - Calculate extents for extent swapping. 566748de673SAkira Fujita * 567748de673SAkira Fujita * @tmp_dext: the extent that will belong to the original inode 568748de673SAkira Fujita * @tmp_oext: the extent that will belong to the donor inode 569748de673SAkira Fujita * @orig_off: block offset of original inode 570748de673SAkira Fujita * @donor_off: block offset of donor inode 571748de673SAkira Fujita * @max_count: the maximun length of extents 572c40ce3c9SAkira Fujita * 573c40ce3c9SAkira Fujita * Return 0 on success, or a negative error value on failure. 
574748de673SAkira Fujita */ 575c40ce3c9SAkira Fujita static int 576748de673SAkira Fujita mext_calc_swap_extents(struct ext4_extent *tmp_dext, 577748de673SAkira Fujita struct ext4_extent *tmp_oext, 578748de673SAkira Fujita ext4_lblk_t orig_off, ext4_lblk_t donor_off, 579748de673SAkira Fujita ext4_lblk_t max_count) 580748de673SAkira Fujita { 581748de673SAkira Fujita ext4_lblk_t diff, orig_diff; 582748de673SAkira Fujita struct ext4_extent dext_old, oext_old; 583748de673SAkira Fujita 584c40ce3c9SAkira Fujita BUG_ON(orig_off != donor_off); 585c40ce3c9SAkira Fujita 586c40ce3c9SAkira Fujita /* original and donor extents have to cover the same block offset */ 587c40ce3c9SAkira Fujita if (orig_off < le32_to_cpu(tmp_oext->ee_block) || 588c40ce3c9SAkira Fujita le32_to_cpu(tmp_oext->ee_block) + 589c40ce3c9SAkira Fujita ext4_ext_get_actual_len(tmp_oext) - 1 < orig_off) 590c40ce3c9SAkira Fujita return -ENODATA; 591c40ce3c9SAkira Fujita 592c40ce3c9SAkira Fujita if (orig_off < le32_to_cpu(tmp_dext->ee_block) || 593c40ce3c9SAkira Fujita le32_to_cpu(tmp_dext->ee_block) + 594c40ce3c9SAkira Fujita ext4_ext_get_actual_len(tmp_dext) - 1 < orig_off) 595c40ce3c9SAkira Fujita return -ENODATA; 596c40ce3c9SAkira Fujita 597748de673SAkira Fujita dext_old = *tmp_dext; 598748de673SAkira Fujita oext_old = *tmp_oext; 599748de673SAkira Fujita 600748de673SAkira Fujita /* When tmp_dext is too large, pick up the target range. 
*/ 601748de673SAkira Fujita diff = donor_off - le32_to_cpu(tmp_dext->ee_block); 602748de673SAkira Fujita 603748de673SAkira Fujita ext4_ext_store_pblock(tmp_dext, ext_pblock(tmp_dext) + diff); 604748de673SAkira Fujita tmp_dext->ee_block = 605748de673SAkira Fujita cpu_to_le32(le32_to_cpu(tmp_dext->ee_block) + diff); 606748de673SAkira Fujita tmp_dext->ee_len = cpu_to_le16(le16_to_cpu(tmp_dext->ee_len) - diff); 607748de673SAkira Fujita 608748de673SAkira Fujita if (max_count < ext4_ext_get_actual_len(tmp_dext)) 609748de673SAkira Fujita tmp_dext->ee_len = cpu_to_le16(max_count); 610748de673SAkira Fujita 611748de673SAkira Fujita orig_diff = orig_off - le32_to_cpu(tmp_oext->ee_block); 612748de673SAkira Fujita ext4_ext_store_pblock(tmp_oext, ext_pblock(tmp_oext) + orig_diff); 613748de673SAkira Fujita 614748de673SAkira Fujita /* Adjust extent length if donor extent is larger than orig */ 615748de673SAkira Fujita if (ext4_ext_get_actual_len(tmp_dext) > 616748de673SAkira Fujita ext4_ext_get_actual_len(tmp_oext) - orig_diff) 617748de673SAkira Fujita tmp_dext->ee_len = cpu_to_le16(le16_to_cpu(tmp_oext->ee_len) - 618748de673SAkira Fujita orig_diff); 619748de673SAkira Fujita 620748de673SAkira Fujita tmp_oext->ee_len = cpu_to_le16(ext4_ext_get_actual_len(tmp_dext)); 621748de673SAkira Fujita 622748de673SAkira Fujita copy_extent_status(&oext_old, tmp_dext); 623748de673SAkira Fujita copy_extent_status(&dext_old, tmp_oext); 624c40ce3c9SAkira Fujita 625c40ce3c9SAkira Fujita return 0; 626748de673SAkira Fujita } 627748de673SAkira Fujita 628748de673SAkira Fujita /** 629748de673SAkira Fujita * mext_replace_branches - Replace original extents with new extents 630748de673SAkira Fujita * 631748de673SAkira Fujita * @handle: journal handle 632748de673SAkira Fujita * @orig_inode: original inode 633748de673SAkira Fujita * @donor_inode: donor inode 634748de673SAkira Fujita * @from: block offset of orig_inode 635748de673SAkira Fujita * @count: block count to be replaced 636f868a48dSAkira Fujita * 
@err: pointer to save return value 637748de673SAkira Fujita * 638748de673SAkira Fujita * Replace original inode extents and donor inode extents page by page. 639748de673SAkira Fujita * We implement this replacement in the following three steps: 640748de673SAkira Fujita * 1. Save the block information of original and donor inodes into 641748de673SAkira Fujita * dummy extents. 642748de673SAkira Fujita * 2. Change the block information of original inode to point at the 643748de673SAkira Fujita * donor inode blocks. 644748de673SAkira Fujita * 3. Change the block information of donor inode to point at the saved 645748de673SAkira Fujita * original inode blocks in the dummy extents. 646748de673SAkira Fujita * 647f868a48dSAkira Fujita * Return replaced block count. 648748de673SAkira Fujita */ 649748de673SAkira Fujita static int 650748de673SAkira Fujita mext_replace_branches(handle_t *handle, struct inode *orig_inode, 651748de673SAkira Fujita struct inode *donor_inode, ext4_lblk_t from, 652f868a48dSAkira Fujita ext4_lblk_t count, int *err) 653748de673SAkira Fujita { 654748de673SAkira Fujita struct ext4_ext_path *orig_path = NULL; 655748de673SAkira Fujita struct ext4_ext_path *donor_path = NULL; 656748de673SAkira Fujita struct ext4_extent *oext, *dext; 657748de673SAkira Fujita struct ext4_extent tmp_dext, tmp_oext; 658748de673SAkira Fujita ext4_lblk_t orig_off = from, donor_off = from; 659748de673SAkira Fujita int depth; 660748de673SAkira Fujita int replaced_count = 0; 661748de673SAkira Fujita int dext_alen; 662748de673SAkira Fujita 663748de673SAkira Fujita /* Get the original extent for the block "orig_off" */ 664f868a48dSAkira Fujita *err = get_ext_path(orig_inode, orig_off, &orig_path); 665f868a48dSAkira Fujita if (*err) 666748de673SAkira Fujita goto out; 667748de673SAkira Fujita 668748de673SAkira Fujita /* Get the donor extent for the head */ 669f868a48dSAkira Fujita *err = get_ext_path(donor_inode, donor_off, &donor_path); 670f868a48dSAkira Fujita if (*err) 
671748de673SAkira Fujita goto out; 672748de673SAkira Fujita depth = ext_depth(orig_inode); 673748de673SAkira Fujita oext = orig_path[depth].p_ext; 674748de673SAkira Fujita tmp_oext = *oext; 675748de673SAkira Fujita 676748de673SAkira Fujita depth = ext_depth(donor_inode); 677748de673SAkira Fujita dext = donor_path[depth].p_ext; 678748de673SAkira Fujita tmp_dext = *dext; 679748de673SAkira Fujita 680f868a48dSAkira Fujita *err = mext_calc_swap_extents(&tmp_dext, &tmp_oext, orig_off, 681748de673SAkira Fujita donor_off, count); 682f868a48dSAkira Fujita if (*err) 683c40ce3c9SAkira Fujita goto out; 684748de673SAkira Fujita 685748de673SAkira Fujita /* Loop for the donor extents */ 686748de673SAkira Fujita while (1) { 687748de673SAkira Fujita /* The extent for donor must be found. */ 6882147b1a6SAkira Fujita if (!dext) { 6892147b1a6SAkira Fujita ext4_error(donor_inode->i_sb, __func__, 6902147b1a6SAkira Fujita "The extent for donor must be found"); 691f868a48dSAkira Fujita *err = -EIO; 6922147b1a6SAkira Fujita goto out; 6932147b1a6SAkira Fujita } else if (donor_off != le32_to_cpu(tmp_dext.ee_block)) { 6942147b1a6SAkira Fujita ext4_error(donor_inode->i_sb, __func__, 6952147b1a6SAkira Fujita "Donor offset(%u) and the first block of donor " 6962147b1a6SAkira Fujita "extent(%u) should be equal", 6972147b1a6SAkira Fujita donor_off, 6982147b1a6SAkira Fujita le32_to_cpu(tmp_dext.ee_block)); 699f868a48dSAkira Fujita *err = -EIO; 7002147b1a6SAkira Fujita goto out; 7012147b1a6SAkira Fujita } 702748de673SAkira Fujita 703748de673SAkira Fujita /* Set donor extent to orig extent */ 704f868a48dSAkira Fujita *err = mext_leaf_block(handle, orig_inode, 705748de673SAkira Fujita orig_path, &tmp_dext, &orig_off); 706f868a48dSAkira Fujita if (*err) 707748de673SAkira Fujita goto out; 708748de673SAkira Fujita 709748de673SAkira Fujita /* Set orig extent to donor extent */ 710f868a48dSAkira Fujita *err = mext_leaf_block(handle, donor_inode, 711748de673SAkira Fujita donor_path, &tmp_oext, &donor_off); 
712f868a48dSAkira Fujita if (*err) 713748de673SAkira Fujita goto out; 714748de673SAkira Fujita 715748de673SAkira Fujita dext_alen = ext4_ext_get_actual_len(&tmp_dext); 716748de673SAkira Fujita replaced_count += dext_alen; 717748de673SAkira Fujita donor_off += dext_alen; 718748de673SAkira Fujita orig_off += dext_alen; 719748de673SAkira Fujita 720748de673SAkira Fujita /* Already moved the expected blocks */ 721748de673SAkira Fujita if (replaced_count >= count) 722748de673SAkira Fujita break; 723748de673SAkira Fujita 724748de673SAkira Fujita if (orig_path) 725748de673SAkira Fujita ext4_ext_drop_refs(orig_path); 726f868a48dSAkira Fujita *err = get_ext_path(orig_inode, orig_off, &orig_path); 727f868a48dSAkira Fujita if (*err) 728748de673SAkira Fujita goto out; 729748de673SAkira Fujita depth = ext_depth(orig_inode); 730748de673SAkira Fujita oext = orig_path[depth].p_ext; 731748de673SAkira Fujita tmp_oext = *oext; 732748de673SAkira Fujita 733748de673SAkira Fujita if (donor_path) 734748de673SAkira Fujita ext4_ext_drop_refs(donor_path); 735f868a48dSAkira Fujita *err = get_ext_path(donor_inode, donor_off, &donor_path); 736f868a48dSAkira Fujita if (*err) 737748de673SAkira Fujita goto out; 738748de673SAkira Fujita depth = ext_depth(donor_inode); 739748de673SAkira Fujita dext = donor_path[depth].p_ext; 740748de673SAkira Fujita tmp_dext = *dext; 741748de673SAkira Fujita 742f868a48dSAkira Fujita *err = mext_calc_swap_extents(&tmp_dext, &tmp_oext, orig_off, 743c40ce3c9SAkira Fujita donor_off, count - replaced_count); 744f868a48dSAkira Fujita if (*err) 745c40ce3c9SAkira Fujita goto out; 746748de673SAkira Fujita } 747748de673SAkira Fujita 748748de673SAkira Fujita out: 749748de673SAkira Fujita if (orig_path) { 750748de673SAkira Fujita ext4_ext_drop_refs(orig_path); 751748de673SAkira Fujita kfree(orig_path); 752748de673SAkira Fujita } 753748de673SAkira Fujita if (donor_path) { 754748de673SAkira Fujita ext4_ext_drop_refs(donor_path); 755748de673SAkira Fujita kfree(donor_path); 
756748de673SAkira Fujita } 757748de673SAkira Fujita 758f868a48dSAkira Fujita return replaced_count; 759748de673SAkira Fujita } 760748de673SAkira Fujita 761748de673SAkira Fujita /** 762748de673SAkira Fujita * move_extent_per_page - Move extent data per page 763748de673SAkira Fujita * 764748de673SAkira Fujita * @o_filp: file structure of original file 765748de673SAkira Fujita * @donor_inode: donor inode 766748de673SAkira Fujita * @orig_page_offset: page index on original file 767748de673SAkira Fujita * @data_offset_in_page: block index where data swapping starts 768748de673SAkira Fujita * @block_len_in_page: the number of blocks to be swapped 769748de673SAkira Fujita * @uninit: orig extent is uninitialized or not 770f868a48dSAkira Fujita * @err: pointer to save return value 771748de673SAkira Fujita * 772748de673SAkira Fujita * Save the data in original inode blocks and replace original inode extents 773748de673SAkira Fujita * with donor inode extents by calling mext_replace_branches(). 774f868a48dSAkira Fujita * Finally, write out the saved data in new original inode blocks. Return 775f868a48dSAkira Fujita * replaced block count. 
776748de673SAkira Fujita */ 777748de673SAkira Fujita static int 77844fc48f7SAkira Fujita move_extent_per_page(struct file *o_filp, struct inode *donor_inode, 779748de673SAkira Fujita pgoff_t orig_page_offset, int data_offset_in_page, 780f868a48dSAkira Fujita int block_len_in_page, int uninit, int *err) 781748de673SAkira Fujita { 782748de673SAkira Fujita struct inode *orig_inode = o_filp->f_dentry->d_inode; 783748de673SAkira Fujita struct address_space *mapping = orig_inode->i_mapping; 784748de673SAkira Fujita struct buffer_head *bh; 785748de673SAkira Fujita struct page *page = NULL; 786748de673SAkira Fujita const struct address_space_operations *a_ops = mapping->a_ops; 787748de673SAkira Fujita handle_t *handle; 788748de673SAkira Fujita ext4_lblk_t orig_blk_offset; 789748de673SAkira Fujita long long offs = orig_page_offset << PAGE_CACHE_SHIFT; 790748de673SAkira Fujita unsigned long blocksize = orig_inode->i_sb->s_blocksize; 791748de673SAkira Fujita unsigned int w_flags = 0; 792f868a48dSAkira Fujita unsigned int tmp_data_size, data_size, replaced_size; 793748de673SAkira Fujita void *fsdata; 794f868a48dSAkira Fujita int i, jblocks; 795f868a48dSAkira Fujita int err2 = 0; 796f868a48dSAkira Fujita int replaced_count = 0; 797748de673SAkira Fujita int blocks_per_page = PAGE_CACHE_SIZE >> orig_inode->i_blkbits; 798748de673SAkira Fujita 799748de673SAkira Fujita /* 800748de673SAkira Fujita * It needs twice the amount of ordinary journal buffers because 801748de673SAkira Fujita * inode and donor_inode may change each different metadata blocks. 
802748de673SAkira Fujita */ 803748de673SAkira Fujita jblocks = ext4_writepage_trans_blocks(orig_inode) * 2; 804748de673SAkira Fujita handle = ext4_journal_start(orig_inode, jblocks); 805748de673SAkira Fujita if (IS_ERR(handle)) { 806f868a48dSAkira Fujita *err = PTR_ERR(handle); 807f868a48dSAkira Fujita return 0; 808748de673SAkira Fujita } 809748de673SAkira Fujita 810748de673SAkira Fujita if (segment_eq(get_fs(), KERNEL_DS)) 811748de673SAkira Fujita w_flags |= AOP_FLAG_UNINTERRUPTIBLE; 812748de673SAkira Fujita 813748de673SAkira Fujita orig_blk_offset = orig_page_offset * blocks_per_page + 814748de673SAkira Fujita data_offset_in_page; 815748de673SAkira Fujita 816748de673SAkira Fujita /* 817748de673SAkira Fujita * If orig extent is uninitialized one, 818748de673SAkira Fujita * it's not necessary force the page into memory 819748de673SAkira Fujita * and then force it to be written out again. 820748de673SAkira Fujita * Just swap data blocks between orig and donor. 821748de673SAkira Fujita */ 822748de673SAkira Fujita if (uninit) { 823fc04cb49SAkira Fujita /* 824fc04cb49SAkira Fujita * Protect extent trees against block allocations 825fc04cb49SAkira Fujita * via delalloc 826fc04cb49SAkira Fujita */ 827fc04cb49SAkira Fujita double_down_write_data_sem(orig_inode, donor_inode); 828f868a48dSAkira Fujita replaced_count = mext_replace_branches(handle, orig_inode, 829748de673SAkira Fujita donor_inode, orig_blk_offset, 830f868a48dSAkira Fujita block_len_in_page, err); 831748de673SAkira Fujita 832748de673SAkira Fujita /* Clear the inode cache not to refer to the old data */ 833748de673SAkira Fujita ext4_ext_invalidate_cache(orig_inode); 834748de673SAkira Fujita ext4_ext_invalidate_cache(donor_inode); 835fc04cb49SAkira Fujita double_up_write_data_sem(orig_inode, donor_inode); 836748de673SAkira Fujita goto out2; 837748de673SAkira Fujita } 838748de673SAkira Fujita 839748de673SAkira Fujita offs = (long long)orig_blk_offset << orig_inode->i_blkbits; 840748de673SAkira Fujita 
841f868a48dSAkira Fujita /* Calculate data_size */ 842748de673SAkira Fujita if ((orig_blk_offset + block_len_in_page - 1) == 843748de673SAkira Fujita ((orig_inode->i_size - 1) >> orig_inode->i_blkbits)) { 844748de673SAkira Fujita /* Replace the last block */ 845f868a48dSAkira Fujita tmp_data_size = orig_inode->i_size & (blocksize - 1); 846748de673SAkira Fujita /* 847f868a48dSAkira Fujita * If data_size equal zero, it shows data_size is multiples of 848748de673SAkira Fujita * blocksize. So we set appropriate value. 849748de673SAkira Fujita */ 850f868a48dSAkira Fujita if (tmp_data_size == 0) 851f868a48dSAkira Fujita tmp_data_size = blocksize; 852748de673SAkira Fujita 853f868a48dSAkira Fujita data_size = tmp_data_size + 854748de673SAkira Fujita ((block_len_in_page - 1) << orig_inode->i_blkbits); 855f868a48dSAkira Fujita } else 856f868a48dSAkira Fujita data_size = block_len_in_page << orig_inode->i_blkbits; 857748de673SAkira Fujita 858f868a48dSAkira Fujita replaced_size = data_size; 859f868a48dSAkira Fujita 860f868a48dSAkira Fujita *err = a_ops->write_begin(o_filp, mapping, offs, data_size, w_flags, 861748de673SAkira Fujita &page, &fsdata); 862f868a48dSAkira Fujita if (unlikely(*err < 0)) 863748de673SAkira Fujita goto out; 864748de673SAkira Fujita 865748de673SAkira Fujita if (!PageUptodate(page)) { 866748de673SAkira Fujita mapping->a_ops->readpage(o_filp, page); 867748de673SAkira Fujita lock_page(page); 868748de673SAkira Fujita } 869748de673SAkira Fujita 870748de673SAkira Fujita /* 871748de673SAkira Fujita * try_to_release_page() doesn't call releasepage in writeback mode. 872748de673SAkira Fujita * We should care about the order of writing to the same file 873748de673SAkira Fujita * by multiple move extent processes. 874748de673SAkira Fujita * It needs to call wait_on_page_writeback() to wait for the 875748de673SAkira Fujita * writeback of the page. 
876748de673SAkira Fujita */ 877748de673SAkira Fujita if (PageWriteback(page)) 878748de673SAkira Fujita wait_on_page_writeback(page); 879748de673SAkira Fujita 880748de673SAkira Fujita /* Release old bh and drop refs */ 881748de673SAkira Fujita try_to_release_page(page, 0); 882748de673SAkira Fujita 883fc04cb49SAkira Fujita /* Protect extent trees against block allocations via delalloc */ 884fc04cb49SAkira Fujita double_down_write_data_sem(orig_inode, donor_inode); 885f868a48dSAkira Fujita replaced_count = mext_replace_branches(handle, orig_inode, donor_inode, 886f868a48dSAkira Fujita orig_blk_offset, block_len_in_page, 887f868a48dSAkira Fujita &err2); 888f868a48dSAkira Fujita if (err2) { 889f868a48dSAkira Fujita if (replaced_count) { 890f868a48dSAkira Fujita block_len_in_page = replaced_count; 891f868a48dSAkira Fujita replaced_size = 892f868a48dSAkira Fujita block_len_in_page << orig_inode->i_blkbits; 893fc04cb49SAkira Fujita } else { 894fc04cb49SAkira Fujita double_up_write_data_sem(orig_inode, donor_inode); 895748de673SAkira Fujita goto out; 896f868a48dSAkira Fujita } 897fc04cb49SAkira Fujita } 898748de673SAkira Fujita 899748de673SAkira Fujita /* Clear the inode cache not to refer to the old data */ 900748de673SAkira Fujita ext4_ext_invalidate_cache(orig_inode); 901748de673SAkira Fujita ext4_ext_invalidate_cache(donor_inode); 902748de673SAkira Fujita 903fc04cb49SAkira Fujita double_up_write_data_sem(orig_inode, donor_inode); 904fc04cb49SAkira Fujita 905748de673SAkira Fujita if (!page_has_buffers(page)) 906748de673SAkira Fujita create_empty_buffers(page, 1 << orig_inode->i_blkbits, 0); 907748de673SAkira Fujita 908748de673SAkira Fujita bh = page_buffers(page); 909748de673SAkira Fujita for (i = 0; i < data_offset_in_page; i++) 910748de673SAkira Fujita bh = bh->b_this_page; 911748de673SAkira Fujita 912748de673SAkira Fujita for (i = 0; i < block_len_in_page; i++) { 913f868a48dSAkira Fujita *err = ext4_get_block(orig_inode, 914748de673SAkira Fujita 
(sector_t)(orig_blk_offset + i), bh, 0); 915f868a48dSAkira Fujita if (*err < 0) 916748de673SAkira Fujita goto out; 917748de673SAkira Fujita 918748de673SAkira Fujita if (bh->b_this_page != NULL) 919748de673SAkira Fujita bh = bh->b_this_page; 920748de673SAkira Fujita } 921748de673SAkira Fujita 922f868a48dSAkira Fujita *err = a_ops->write_end(o_filp, mapping, offs, data_size, replaced_size, 923748de673SAkira Fujita page, fsdata); 924748de673SAkira Fujita page = NULL; 925748de673SAkira Fujita 926748de673SAkira Fujita out: 927748de673SAkira Fujita if (unlikely(page)) { 928748de673SAkira Fujita if (PageLocked(page)) 929748de673SAkira Fujita unlock_page(page); 930748de673SAkira Fujita page_cache_release(page); 93191cc219aSPeng Tao ext4_journal_stop(handle); 932748de673SAkira Fujita } 933748de673SAkira Fujita out2: 934748de673SAkira Fujita ext4_journal_stop(handle); 935748de673SAkira Fujita 936f868a48dSAkira Fujita if (err2) 937f868a48dSAkira Fujita *err = err2; 938f868a48dSAkira Fujita 939f868a48dSAkira Fujita return replaced_count; 940748de673SAkira Fujita } 941748de673SAkira Fujita 942748de673SAkira Fujita /** 943748de673SAkira Fujita * mext_check_argumants - Check whether move extent can be done 944748de673SAkira Fujita * 945748de673SAkira Fujita * @orig_inode: original inode 946748de673SAkira Fujita * @donor_inode: donor inode 947748de673SAkira Fujita * @orig_start: logical start offset in block for orig 948748de673SAkira Fujita * @donor_start: logical start offset in block for donor 949748de673SAkira Fujita * @len: the number of blocks to be moved 950748de673SAkira Fujita * @moved_len: moved block length 951748de673SAkira Fujita * 952748de673SAkira Fujita * Check the arguments of ext4_move_extents() whether the files can be 953748de673SAkira Fujita * exchanged with each other. 954748de673SAkira Fujita * Return 0 on success, or a negative error value on failure. 
955748de673SAkira Fujita */ 956748de673SAkira Fujita static int 957748de673SAkira Fujita mext_check_arguments(struct inode *orig_inode, 958748de673SAkira Fujita struct inode *donor_inode, __u64 orig_start, 959748de673SAkira Fujita __u64 donor_start, __u64 *len, __u64 moved_len) 960748de673SAkira Fujita { 96170d5d3dcSAkira Fujita ext4_lblk_t orig_blocks, donor_blocks; 96270d5d3dcSAkira Fujita unsigned int blkbits = orig_inode->i_blkbits; 96370d5d3dcSAkira Fujita unsigned int blocksize = 1 << blkbits; 96470d5d3dcSAkira Fujita 965748de673SAkira Fujita /* Regular file check */ 966748de673SAkira Fujita if (!S_ISREG(orig_inode->i_mode) || !S_ISREG(donor_inode->i_mode)) { 967748de673SAkira Fujita ext4_debug("ext4 move extent: The argument files should be " 968748de673SAkira Fujita "regular file [ino:orig %lu, donor %lu]\n", 969748de673SAkira Fujita orig_inode->i_ino, donor_inode->i_ino); 970748de673SAkira Fujita return -EINVAL; 971748de673SAkira Fujita } 972748de673SAkira Fujita 973748de673SAkira Fujita /* Ext4 move extent does not support swapfile */ 974748de673SAkira Fujita if (IS_SWAPFILE(orig_inode) || IS_SWAPFILE(donor_inode)) { 975748de673SAkira Fujita ext4_debug("ext4 move extent: The argument files should " 976748de673SAkira Fujita "not be swapfile [ino:orig %lu, donor %lu]\n", 977748de673SAkira Fujita orig_inode->i_ino, donor_inode->i_ino); 978748de673SAkira Fujita return -EINVAL; 979748de673SAkira Fujita } 980748de673SAkira Fujita 981748de673SAkira Fujita /* Files should be in the same ext4 FS */ 982748de673SAkira Fujita if (orig_inode->i_sb != donor_inode->i_sb) { 983748de673SAkira Fujita ext4_debug("ext4 move extent: The argument files " 984748de673SAkira Fujita "should be in same FS [ino:orig %lu, donor %lu]\n", 985748de673SAkira Fujita orig_inode->i_ino, donor_inode->i_ino); 986748de673SAkira Fujita return -EINVAL; 987748de673SAkira Fujita } 988748de673SAkira Fujita 989748de673SAkira Fujita /* Ext4 move extent supports only extent based file */ 
990748de673SAkira Fujita if (!(EXT4_I(orig_inode)->i_flags & EXT4_EXTENTS_FL)) { 991748de673SAkira Fujita ext4_debug("ext4 move extent: orig file is not extents " 992748de673SAkira Fujita "based file [ino:orig %lu]\n", orig_inode->i_ino); 993748de673SAkira Fujita return -EOPNOTSUPP; 994748de673SAkira Fujita } else if (!(EXT4_I(donor_inode)->i_flags & EXT4_EXTENTS_FL)) { 995748de673SAkira Fujita ext4_debug("ext4 move extent: donor file is not extents " 996748de673SAkira Fujita "based file [ino:donor %lu]\n", donor_inode->i_ino); 997748de673SAkira Fujita return -EOPNOTSUPP; 998748de673SAkira Fujita } 999748de673SAkira Fujita 1000748de673SAkira Fujita if ((!orig_inode->i_size) || (!donor_inode->i_size)) { 1001748de673SAkira Fujita ext4_debug("ext4 move extent: File size is 0 byte\n"); 1002748de673SAkira Fujita return -EINVAL; 1003748de673SAkira Fujita } 1004748de673SAkira Fujita 1005748de673SAkira Fujita /* Start offset should be same */ 1006748de673SAkira Fujita if (orig_start != donor_start) { 1007748de673SAkira Fujita ext4_debug("ext4 move extent: orig and donor's start " 1008748de673SAkira Fujita "offset are not same [ino:orig %lu, donor %lu]\n", 1009748de673SAkira Fujita orig_inode->i_ino, donor_inode->i_ino); 1010748de673SAkira Fujita return -EINVAL; 1011748de673SAkira Fujita } 1012748de673SAkira Fujita 1013748de673SAkira Fujita if (moved_len) { 1014748de673SAkira Fujita ext4_debug("ext4 move extent: moved_len should be 0 " 1015748de673SAkira Fujita "[ino:orig %lu, donor %lu]\n", orig_inode->i_ino, 1016748de673SAkira Fujita donor_inode->i_ino); 1017748de673SAkira Fujita return -EINVAL; 1018748de673SAkira Fujita } 1019748de673SAkira Fujita 10200a80e986SEric Sandeen if ((orig_start > EXT_MAX_BLOCK) || 10210a80e986SEric Sandeen (donor_start > EXT_MAX_BLOCK) || 10220a80e986SEric Sandeen (*len > EXT_MAX_BLOCK) || 10230a80e986SEric Sandeen (orig_start + *len > EXT_MAX_BLOCK)) { 10240a80e986SEric Sandeen ext4_debug("ext4 move extent: Can't handle over [%u] blocks " 
10250a80e986SEric Sandeen "[ino:orig %lu, donor %lu]\n", EXT_MAX_BLOCK, 1026748de673SAkira Fujita orig_inode->i_ino, donor_inode->i_ino); 1027748de673SAkira Fujita return -EINVAL; 1028748de673SAkira Fujita } 1029748de673SAkira Fujita 1030748de673SAkira Fujita if (orig_inode->i_size > donor_inode->i_size) { 103170d5d3dcSAkira Fujita donor_blocks = (donor_inode->i_size + blocksize - 1) >> blkbits; 103270d5d3dcSAkira Fujita /* TODO: eliminate this artificial restriction */ 103370d5d3dcSAkira Fujita if (orig_start >= donor_blocks) { 1034748de673SAkira Fujita ext4_debug("ext4 move extent: orig start offset " 103570d5d3dcSAkira Fujita "[%llu] should be less than donor file blocks " 103670d5d3dcSAkira Fujita "[%u] [ino:orig %lu, donor %lu]\n", 103770d5d3dcSAkira Fujita orig_start, donor_blocks, 1038748de673SAkira Fujita orig_inode->i_ino, donor_inode->i_ino); 1039748de673SAkira Fujita return -EINVAL; 1040748de673SAkira Fujita } 1041748de673SAkira Fujita 104270d5d3dcSAkira Fujita /* TODO: eliminate this artificial restriction */ 104370d5d3dcSAkira Fujita if (orig_start + *len > donor_blocks) { 1044748de673SAkira Fujita ext4_debug("ext4 move extent: End offset [%llu] should " 104570d5d3dcSAkira Fujita "be less than donor file blocks [%u]." 
104670d5d3dcSAkira Fujita "So adjust length from %llu to %llu " 1047748de673SAkira Fujita "[ino:orig %lu, donor %lu]\n", 104870d5d3dcSAkira Fujita orig_start + *len, donor_blocks, 104970d5d3dcSAkira Fujita *len, donor_blocks - orig_start, 1050748de673SAkira Fujita orig_inode->i_ino, donor_inode->i_ino); 105170d5d3dcSAkira Fujita *len = donor_blocks - orig_start; 1052748de673SAkira Fujita } 1053748de673SAkira Fujita } else { 105470d5d3dcSAkira Fujita orig_blocks = (orig_inode->i_size + blocksize - 1) >> blkbits; 105570d5d3dcSAkira Fujita if (orig_start >= orig_blocks) { 1056748de673SAkira Fujita ext4_debug("ext4 move extent: start offset [%llu] " 105770d5d3dcSAkira Fujita "should be less than original file blocks " 105870d5d3dcSAkira Fujita "[%u] [ino:orig %lu, donor %lu]\n", 105970d5d3dcSAkira Fujita orig_start, orig_blocks, 1060748de673SAkira Fujita orig_inode->i_ino, donor_inode->i_ino); 1061748de673SAkira Fujita return -EINVAL; 1062748de673SAkira Fujita } 1063748de673SAkira Fujita 106470d5d3dcSAkira Fujita if (orig_start + *len > orig_blocks) { 1065748de673SAkira Fujita ext4_debug("ext4 move extent: Adjust length " 106670d5d3dcSAkira Fujita "from %llu to %llu. 
Because it should be " 106770d5d3dcSAkira Fujita "less than original file blocks " 1068748de673SAkira Fujita "[ino:orig %lu, donor %lu]\n", 106970d5d3dcSAkira Fujita *len, orig_blocks - orig_start, 1070748de673SAkira Fujita orig_inode->i_ino, donor_inode->i_ino); 107170d5d3dcSAkira Fujita *len = orig_blocks - orig_start; 1072748de673SAkira Fujita } 1073748de673SAkira Fujita } 1074748de673SAkira Fujita 1075748de673SAkira Fujita if (!*len) { 1076748de673SAkira Fujita ext4_debug("ext4 move extent: len shoudld not be 0 " 1077748de673SAkira Fujita "[ino:orig %lu, donor %lu]\n", orig_inode->i_ino, 1078748de673SAkira Fujita donor_inode->i_ino); 1079748de673SAkira Fujita return -EINVAL; 1080748de673SAkira Fujita } 1081748de673SAkira Fujita 1082748de673SAkira Fujita return 0; 1083748de673SAkira Fujita } 1084748de673SAkira Fujita 1085748de673SAkira Fujita /** 1086748de673SAkira Fujita * mext_inode_double_lock - Lock i_mutex on both @inode1 and @inode2 1087748de673SAkira Fujita * 1088748de673SAkira Fujita * @inode1: the inode structure 1089748de673SAkira Fujita * @inode2: the inode structure 1090748de673SAkira Fujita * 10912147b1a6SAkira Fujita * Lock two inodes' i_mutex by i_ino order. 10922147b1a6SAkira Fujita * If inode1 or inode2 is NULL, return -EIO. Otherwise, return 0. 
1093748de673SAkira Fujita */ 10942147b1a6SAkira Fujita static int 1095748de673SAkira Fujita mext_inode_double_lock(struct inode *inode1, struct inode *inode2) 1096748de673SAkira Fujita { 10972147b1a6SAkira Fujita int ret = 0; 10982147b1a6SAkira Fujita 10992147b1a6SAkira Fujita BUG_ON(inode1 == NULL && inode2 == NULL); 11002147b1a6SAkira Fujita 11012147b1a6SAkira Fujita ret = mext_check_null_inode(inode1, inode2, __func__); 11022147b1a6SAkira Fujita if (ret < 0) 11032147b1a6SAkira Fujita goto out; 11042147b1a6SAkira Fujita 11052147b1a6SAkira Fujita if (inode1 == inode2) { 1106748de673SAkira Fujita mutex_lock(&inode1->i_mutex); 11072147b1a6SAkira Fujita goto out; 1108748de673SAkira Fujita } 1109748de673SAkira Fujita 1110748de673SAkira Fujita if (inode1->i_ino < inode2->i_ino) { 1111748de673SAkira Fujita mutex_lock_nested(&inode1->i_mutex, I_MUTEX_PARENT); 1112748de673SAkira Fujita mutex_lock_nested(&inode2->i_mutex, I_MUTEX_CHILD); 1113748de673SAkira Fujita } else { 1114748de673SAkira Fujita mutex_lock_nested(&inode2->i_mutex, I_MUTEX_PARENT); 1115748de673SAkira Fujita mutex_lock_nested(&inode1->i_mutex, I_MUTEX_CHILD); 1116748de673SAkira Fujita } 11172147b1a6SAkira Fujita 11182147b1a6SAkira Fujita out: 11192147b1a6SAkira Fujita return ret; 1120748de673SAkira Fujita } 1121748de673SAkira Fujita 1122748de673SAkira Fujita /** 1123748de673SAkira Fujita * mext_inode_double_unlock - Release i_mutex on both @inode1 and @inode2 1124748de673SAkira Fujita * 1125748de673SAkira Fujita * @inode1: the inode that is released first 1126748de673SAkira Fujita * @inode2: the inode that is released second 1127748de673SAkira Fujita * 11282147b1a6SAkira Fujita * If inode1 or inode2 is NULL, return -EIO. Otherwise, return 0. 
1129748de673SAkira Fujita */ 1130748de673SAkira Fujita 11312147b1a6SAkira Fujita static int 1132748de673SAkira Fujita mext_inode_double_unlock(struct inode *inode1, struct inode *inode2) 1133748de673SAkira Fujita { 11342147b1a6SAkira Fujita int ret = 0; 11352147b1a6SAkira Fujita 11362147b1a6SAkira Fujita BUG_ON(inode1 == NULL && inode2 == NULL); 11372147b1a6SAkira Fujita 11382147b1a6SAkira Fujita ret = mext_check_null_inode(inode1, inode2, __func__); 11392147b1a6SAkira Fujita if (ret < 0) 11402147b1a6SAkira Fujita goto out; 11412147b1a6SAkira Fujita 1142748de673SAkira Fujita if (inode1) 1143748de673SAkira Fujita mutex_unlock(&inode1->i_mutex); 1144748de673SAkira Fujita 1145748de673SAkira Fujita if (inode2 && inode2 != inode1) 1146748de673SAkira Fujita mutex_unlock(&inode2->i_mutex); 11472147b1a6SAkira Fujita 11482147b1a6SAkira Fujita out: 11492147b1a6SAkira Fujita return ret; 1150748de673SAkira Fujita } 1151748de673SAkira Fujita 1152748de673SAkira Fujita /** 1153748de673SAkira Fujita * ext4_move_extents - Exchange the specified range of a file 1154748de673SAkira Fujita * 1155748de673SAkira Fujita * @o_filp: file structure of the original file 1156748de673SAkira Fujita * @d_filp: file structure of the donor file 1157748de673SAkira Fujita * @orig_start: start offset in block for orig 1158748de673SAkira Fujita * @donor_start: start offset in block for donor 1159748de673SAkira Fujita * @len: the number of blocks to be moved 1160748de673SAkira Fujita * @moved_len: moved block length 1161748de673SAkira Fujita * 1162748de673SAkira Fujita * This function returns 0 and moved block length is set in moved_len 1163748de673SAkira Fujita * if succeed, otherwise returns error value. 1164748de673SAkira Fujita * 1165748de673SAkira Fujita * Note: ext4_move_extents() proceeds the following order. 
 * 1:ext4_move_extents() calculates the last block number of the range to
 *   be moved from the start block number (orig_start) and the number of
 *   blocks to be moved (len), both specified as arguments.
 *   If {orig, donor}_start points into a hole, the start offset of the
 *   extent pointed to by ext_cur (current extent), holecheck_path and
 *   orig_path is set to the first extent after the hole.
 * 2:Repeat step 3 to step 5 until holecheck_path points to the last extent
 *   or ext_cur exceeds block_end, which is the last logical block number.
 * 3:To get the length of the contiguous area, call mext_next_extent()
 *   repeatedly with ext_cur (its initial value comes from holecheck_path)
 *   until a non-contiguous extent is found, the start logical block number
 *   exceeds block_end, or the extent is the last extent.
 * 4:Exchange the original inode data with donor inode data
 *   from orig_page_offset to seq_end_page.
 *   The start indexes of the data are specified as arguments.
 *   That of the original inode is orig_page_offset,
 *   and that of the donor inode is also orig_page_offset
 *   (to easily handle the blocksize != pagesize case, the offset for the
 *   donor inode is in block units).
 * 5:Update holecheck_path and orig_path to point to the next extent to be
 *   processed, then return to step 2.
 * 6:Release holecheck_path and orig_path, and set moved_len to the length
 *   which shows the number of moved blocks.
1189748de673SAkira Fujita * The moved_len is useful for the command to calculate the file offset 1190748de673SAkira Fujita * for starting next move extent ioctl. 1191748de673SAkira Fujita * 7:Return 0 on success, or a negative error value on failure. 1192748de673SAkira Fujita */ 1193748de673SAkira Fujita int 1194748de673SAkira Fujita ext4_move_extents(struct file *o_filp, struct file *d_filp, 1195748de673SAkira Fujita __u64 orig_start, __u64 donor_start, __u64 len, 1196748de673SAkira Fujita __u64 *moved_len) 1197748de673SAkira Fujita { 1198748de673SAkira Fujita struct inode *orig_inode = o_filp->f_dentry->d_inode; 1199748de673SAkira Fujita struct inode *donor_inode = d_filp->f_dentry->d_inode; 1200748de673SAkira Fujita struct ext4_ext_path *orig_path = NULL, *holecheck_path = NULL; 1201748de673SAkira Fujita struct ext4_extent *ext_prev, *ext_cur, *ext_dummy; 1202748de673SAkira Fujita ext4_lblk_t block_start = orig_start; 1203748de673SAkira Fujita ext4_lblk_t block_end, seq_start, add_blocks, file_end, seq_blocks = 0; 1204748de673SAkira Fujita ext4_lblk_t rest_blocks; 1205748de673SAkira Fujita pgoff_t orig_page_offset = 0, seq_end_page; 12062147b1a6SAkira Fujita int ret1, ret2, depth, last_extent = 0; 1207748de673SAkira Fujita int blocks_per_page = PAGE_CACHE_SIZE >> orig_inode->i_blkbits; 1208748de673SAkira Fujita int data_offset_in_page; 1209748de673SAkira Fujita int block_len_in_page; 1210748de673SAkira Fujita int uninit; 1211748de673SAkira Fujita 1212f3ce8064STheodore Ts'o /* orig and donor should be different file */ 1213f3ce8064STheodore Ts'o if (orig_inode->i_ino == donor_inode->i_ino) { 1214f3ce8064STheodore Ts'o ext4_debug("ext4 move extent: The argument files should not " 1215f3ce8064STheodore Ts'o "be same file [ino:orig %lu, donor %lu]\n", 1216f3ce8064STheodore Ts'o orig_inode->i_ino, donor_inode->i_ino); 1217f3ce8064STheodore Ts'o return -EINVAL; 1218f3ce8064STheodore Ts'o } 1219f3ce8064STheodore Ts'o 1220fc04cb49SAkira Fujita /* Protect orig and donor 
inodes against a truncate */ 12212147b1a6SAkira Fujita ret1 = mext_inode_double_lock(orig_inode, donor_inode); 12222147b1a6SAkira Fujita if (ret1 < 0) 12232147b1a6SAkira Fujita return ret1; 1224748de673SAkira Fujita 1225fc04cb49SAkira Fujita /* Protect extent tree against block allocations via delalloc */ 1226fc04cb49SAkira Fujita double_down_write_data_sem(orig_inode, donor_inode); 1227748de673SAkira Fujita /* Check the filesystem environment whether move_extent can be done */ 12282147b1a6SAkira Fujita ret1 = mext_check_arguments(orig_inode, donor_inode, orig_start, 1229748de673SAkira Fujita donor_start, &len, *moved_len); 12302147b1a6SAkira Fujita if (ret1) 1231347fa6f1SAkira Fujita goto out; 1232748de673SAkira Fujita 1233748de673SAkira Fujita file_end = (i_size_read(orig_inode) - 1) >> orig_inode->i_blkbits; 1234748de673SAkira Fujita block_end = block_start + len - 1; 1235748de673SAkira Fujita if (file_end < block_end) 1236748de673SAkira Fujita len -= block_end - file_end; 1237748de673SAkira Fujita 12382147b1a6SAkira Fujita ret1 = get_ext_path(orig_inode, block_start, &orig_path); 1239347fa6f1SAkira Fujita if (ret1) 1240347fa6f1SAkira Fujita goto out; 1241748de673SAkira Fujita 1242748de673SAkira Fujita /* Get path structure to check the hole */ 12432147b1a6SAkira Fujita ret1 = get_ext_path(orig_inode, block_start, &holecheck_path); 1244347fa6f1SAkira Fujita if (ret1) 1245748de673SAkira Fujita goto out; 1246748de673SAkira Fujita 1247748de673SAkira Fujita depth = ext_depth(orig_inode); 1248748de673SAkira Fujita ext_cur = holecheck_path[depth].p_ext; 1249748de673SAkira Fujita 1250748de673SAkira Fujita /* 1251c40ce3c9SAkira Fujita * Get proper starting location of block replacement if block_start was 1252c40ce3c9SAkira Fujita * within the hole. 
1253748de673SAkira Fujita */ 1254748de673SAkira Fujita if (le32_to_cpu(ext_cur->ee_block) + 1255748de673SAkira Fujita ext4_ext_get_actual_len(ext_cur) - 1 < block_start) { 1256c40ce3c9SAkira Fujita /* 1257c40ce3c9SAkira Fujita * The hole exists between extents or the tail of 1258c40ce3c9SAkira Fujita * original file. 1259c40ce3c9SAkira Fujita */ 1260748de673SAkira Fujita last_extent = mext_next_extent(orig_inode, 1261748de673SAkira Fujita holecheck_path, &ext_cur); 1262748de673SAkira Fujita if (last_extent < 0) { 12632147b1a6SAkira Fujita ret1 = last_extent; 1264748de673SAkira Fujita goto out; 1265748de673SAkira Fujita } 1266748de673SAkira Fujita last_extent = mext_next_extent(orig_inode, orig_path, 1267748de673SAkira Fujita &ext_dummy); 1268748de673SAkira Fujita if (last_extent < 0) { 12692147b1a6SAkira Fujita ret1 = last_extent; 1270748de673SAkira Fujita goto out; 1271748de673SAkira Fujita } 1272c40ce3c9SAkira Fujita seq_start = le32_to_cpu(ext_cur->ee_block); 1273c40ce3c9SAkira Fujita } else if (le32_to_cpu(ext_cur->ee_block) > block_start) 1274c40ce3c9SAkira Fujita /* The hole exists at the beginning of original file. */ 1275c40ce3c9SAkira Fujita seq_start = le32_to_cpu(ext_cur->ee_block); 1276c40ce3c9SAkira Fujita else 1277748de673SAkira Fujita seq_start = block_start; 1278748de673SAkira Fujita 1279748de673SAkira Fujita /* No blocks within the specified range. 
*/ 1280748de673SAkira Fujita if (le32_to_cpu(ext_cur->ee_block) > block_end) { 1281748de673SAkira Fujita ext4_debug("ext4 move extent: The specified range of file " 1282748de673SAkira Fujita "may be the hole\n"); 12832147b1a6SAkira Fujita ret1 = -EINVAL; 1284748de673SAkira Fujita goto out; 1285748de673SAkira Fujita } 1286748de673SAkira Fujita 1287748de673SAkira Fujita /* Adjust start blocks */ 1288748de673SAkira Fujita add_blocks = min(le32_to_cpu(ext_cur->ee_block) + 1289748de673SAkira Fujita ext4_ext_get_actual_len(ext_cur), block_end + 1) - 1290748de673SAkira Fujita max(le32_to_cpu(ext_cur->ee_block), block_start); 1291748de673SAkira Fujita 1292fc04cb49SAkira Fujita /* Discard preallocations of two inodes */ 1293fc04cb49SAkira Fujita ext4_discard_preallocations(orig_inode); 1294fc04cb49SAkira Fujita ext4_discard_preallocations(donor_inode); 1295fc04cb49SAkira Fujita 1296748de673SAkira Fujita while (!last_extent && le32_to_cpu(ext_cur->ee_block) <= block_end) { 1297748de673SAkira Fujita seq_blocks += add_blocks; 1298748de673SAkira Fujita 1299748de673SAkira Fujita /* Adjust tail blocks */ 1300748de673SAkira Fujita if (seq_start + seq_blocks - 1 > block_end) 1301748de673SAkira Fujita seq_blocks = block_end - seq_start + 1; 1302748de673SAkira Fujita 1303748de673SAkira Fujita ext_prev = ext_cur; 1304748de673SAkira Fujita last_extent = mext_next_extent(orig_inode, holecheck_path, 1305748de673SAkira Fujita &ext_cur); 1306748de673SAkira Fujita if (last_extent < 0) { 13072147b1a6SAkira Fujita ret1 = last_extent; 1308748de673SAkira Fujita break; 1309748de673SAkira Fujita } 1310748de673SAkira Fujita add_blocks = ext4_ext_get_actual_len(ext_cur); 1311748de673SAkira Fujita 1312748de673SAkira Fujita /* 1313748de673SAkira Fujita * Extend the length of contiguous block (seq_blocks) 1314748de673SAkira Fujita * if extents are contiguous. 
1315748de673SAkira Fujita */ 1316748de673SAkira Fujita if (ext4_can_extents_be_merged(orig_inode, 1317748de673SAkira Fujita ext_prev, ext_cur) && 1318748de673SAkira Fujita block_end >= le32_to_cpu(ext_cur->ee_block) && 1319748de673SAkira Fujita !last_extent) 1320748de673SAkira Fujita continue; 1321748de673SAkira Fujita 1322748de673SAkira Fujita /* Is original extent is uninitialized */ 1323748de673SAkira Fujita uninit = ext4_ext_is_uninitialized(ext_prev); 1324748de673SAkira Fujita 1325748de673SAkira Fujita data_offset_in_page = seq_start % blocks_per_page; 1326748de673SAkira Fujita 1327748de673SAkira Fujita /* 1328748de673SAkira Fujita * Calculate data blocks count that should be swapped 1329748de673SAkira Fujita * at the first page. 1330748de673SAkira Fujita */ 1331748de673SAkira Fujita if (data_offset_in_page + seq_blocks > blocks_per_page) { 1332748de673SAkira Fujita /* Swapped blocks are across pages */ 1333748de673SAkira Fujita block_len_in_page = 1334748de673SAkira Fujita blocks_per_page - data_offset_in_page; 1335748de673SAkira Fujita } else { 1336748de673SAkira Fujita /* Swapped blocks are in a page */ 1337748de673SAkira Fujita block_len_in_page = seq_blocks; 1338748de673SAkira Fujita } 1339748de673SAkira Fujita 1340748de673SAkira Fujita orig_page_offset = seq_start >> 1341748de673SAkira Fujita (PAGE_CACHE_SHIFT - orig_inode->i_blkbits); 1342748de673SAkira Fujita seq_end_page = (seq_start + seq_blocks - 1) >> 1343748de673SAkira Fujita (PAGE_CACHE_SHIFT - orig_inode->i_blkbits); 1344748de673SAkira Fujita seq_start = le32_to_cpu(ext_cur->ee_block); 1345748de673SAkira Fujita rest_blocks = seq_blocks; 1346748de673SAkira Fujita 1347fc04cb49SAkira Fujita /* 1348fc04cb49SAkira Fujita * Up semaphore to avoid following problems: 1349fc04cb49SAkira Fujita * a. transaction deadlock among ext4_journal_start, 1350fc04cb49SAkira Fujita * ->write_begin via pagefault, and jbd2_journal_commit 1351fc04cb49SAkira Fujita * b. 
racing with ->readpage, ->write_begin, and ext4_get_block 1352fc04cb49SAkira Fujita * in move_extent_per_page 1353fc04cb49SAkira Fujita */ 1354fc04cb49SAkira Fujita double_up_write_data_sem(orig_inode, donor_inode); 1355748de673SAkira Fujita 1356748de673SAkira Fujita while (orig_page_offset <= seq_end_page) { 1357748de673SAkira Fujita 1358748de673SAkira Fujita /* Swap original branches with new branches */ 1359f868a48dSAkira Fujita block_len_in_page = move_extent_per_page( 1360f868a48dSAkira Fujita o_filp, donor_inode, 1361748de673SAkira Fujita orig_page_offset, 1362748de673SAkira Fujita data_offset_in_page, 1363f868a48dSAkira Fujita block_len_in_page, uninit, 1364f868a48dSAkira Fujita &ret1); 1365f868a48dSAkira Fujita 1366748de673SAkira Fujita /* Count how many blocks we have exchanged */ 1367748de673SAkira Fujita *moved_len += block_len_in_page; 1368f868a48dSAkira Fujita if (ret1 < 0) 1369fc04cb49SAkira Fujita break; 13702147b1a6SAkira Fujita if (*moved_len > len) { 13712147b1a6SAkira Fujita ext4_error(orig_inode->i_sb, __func__, 13722147b1a6SAkira Fujita "We replaced blocks too much! 
" 13732147b1a6SAkira Fujita "sum of replaced: %llu requested: %llu", 13742147b1a6SAkira Fujita *moved_len, len); 13752147b1a6SAkira Fujita ret1 = -EIO; 1376fc04cb49SAkira Fujita break; 13772147b1a6SAkira Fujita } 1378748de673SAkira Fujita 1379f868a48dSAkira Fujita orig_page_offset++; 1380748de673SAkira Fujita data_offset_in_page = 0; 1381748de673SAkira Fujita rest_blocks -= block_len_in_page; 1382748de673SAkira Fujita if (rest_blocks > blocks_per_page) 1383748de673SAkira Fujita block_len_in_page = blocks_per_page; 1384748de673SAkira Fujita else 1385748de673SAkira Fujita block_len_in_page = rest_blocks; 1386748de673SAkira Fujita } 1387748de673SAkira Fujita 1388fc04cb49SAkira Fujita double_down_write_data_sem(orig_inode, donor_inode); 1389fc04cb49SAkira Fujita if (ret1 < 0) 1390fc04cb49SAkira Fujita break; 1391fc04cb49SAkira Fujita 1392748de673SAkira Fujita /* Decrease buffer counter */ 1393748de673SAkira Fujita if (holecheck_path) 1394748de673SAkira Fujita ext4_ext_drop_refs(holecheck_path); 13952147b1a6SAkira Fujita ret1 = get_ext_path(orig_inode, seq_start, &holecheck_path); 1396347fa6f1SAkira Fujita if (ret1) 1397748de673SAkira Fujita break; 1398748de673SAkira Fujita depth = holecheck_path->p_depth; 1399748de673SAkira Fujita 1400748de673SAkira Fujita /* Decrease buffer counter */ 1401748de673SAkira Fujita if (orig_path) 1402748de673SAkira Fujita ext4_ext_drop_refs(orig_path); 14032147b1a6SAkira Fujita ret1 = get_ext_path(orig_inode, seq_start, &orig_path); 1404347fa6f1SAkira Fujita if (ret1) 1405748de673SAkira Fujita break; 1406748de673SAkira Fujita 1407748de673SAkira Fujita ext_cur = holecheck_path[depth].p_ext; 1408748de673SAkira Fujita add_blocks = ext4_ext_get_actual_len(ext_cur); 1409748de673SAkira Fujita seq_blocks = 0; 1410748de673SAkira Fujita 1411748de673SAkira Fujita } 1412748de673SAkira Fujita out: 1413748de673SAkira Fujita if (orig_path) { 1414748de673SAkira Fujita ext4_ext_drop_refs(orig_path); 1415748de673SAkira Fujita kfree(orig_path); 
1416748de673SAkira Fujita } 1417748de673SAkira Fujita if (holecheck_path) { 1418748de673SAkira Fujita ext4_ext_drop_refs(holecheck_path); 1419748de673SAkira Fujita kfree(holecheck_path); 1420748de673SAkira Fujita } 1421fc04cb49SAkira Fujita double_up_write_data_sem(orig_inode, donor_inode); 14222147b1a6SAkira Fujita ret2 = mext_inode_double_unlock(orig_inode, donor_inode); 1423748de673SAkira Fujita 14242147b1a6SAkira Fujita if (ret1) 14252147b1a6SAkira Fujita return ret1; 14262147b1a6SAkira Fujita else if (ret2) 14272147b1a6SAkira Fujita return ret2; 1428748de673SAkira Fujita 1429748de673SAkira Fujita return 0; 1430748de673SAkira Fujita } 1431