1748de673SAkira Fujita /* 2748de673SAkira Fujita * Copyright (c) 2008,2009 NEC Software Tohoku, Ltd. 3748de673SAkira Fujita * Written by Takashi Sato <t-sato@yk.jp.nec.com> 4748de673SAkira Fujita * Akira Fujita <a-fujita@rs.jp.nec.com> 5748de673SAkira Fujita * 6748de673SAkira Fujita * This program is free software; you can redistribute it and/or modify it 7748de673SAkira Fujita * under the terms of version 2.1 of the GNU Lesser General Public License 8748de673SAkira Fujita * as published by the Free Software Foundation. 9748de673SAkira Fujita * 10748de673SAkira Fujita * This program is distributed in the hope that it will be useful, 11748de673SAkira Fujita * but WITHOUT ANY WARRANTY; without even the implied warranty of 12748de673SAkira Fujita * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 13748de673SAkira Fujita * GNU General Public License for more details. 14748de673SAkira Fujita */ 15748de673SAkira Fujita 16748de673SAkira Fujita #include <linux/fs.h> 17748de673SAkira Fujita #include <linux/quotaops.h> 185a0e3ad6STejun Heo #include <linux/slab.h> 19748de673SAkira Fujita #include "ext4_jbd2.h" 20748de673SAkira Fujita #include "ext4_extents.h" 21748de673SAkira Fujita #include "ext4.h" 22748de673SAkira Fujita 23e8505970SAkira Fujita /** 24e8505970SAkira Fujita * get_ext_path - Find an extent path for designated logical block number. 25e8505970SAkira Fujita * 26e8505970SAkira Fujita * @inode: an inode which is searched 27e8505970SAkira Fujita * @lblock: logical block number to find an extent path 28e8505970SAkira Fujita * @path: pointer to an extent path pointer (for output) 29e8505970SAkira Fujita * 30e8505970SAkira Fujita * ext4_ext_find_extent wrapper. Return 0 on success, or a negative error value 31e8505970SAkira Fujita * on failure. 
32e8505970SAkira Fujita */ 33e8505970SAkira Fujita static inline int 34e8505970SAkira Fujita get_ext_path(struct inode *inode, ext4_lblk_t lblock, 35e8505970SAkira Fujita struct ext4_ext_path **path) 36e8505970SAkira Fujita { 37e8505970SAkira Fujita int ret = 0; 38e8505970SAkira Fujita 39e8505970SAkira Fujita *path = ext4_ext_find_extent(inode, lblock, *path); 40e8505970SAkira Fujita if (IS_ERR(*path)) { 41e8505970SAkira Fujita ret = PTR_ERR(*path); 42e8505970SAkira Fujita *path = NULL; 43347fa6f1SAkira Fujita } else if ((*path)[ext_depth(inode)].p_ext == NULL) 44347fa6f1SAkira Fujita ret = -ENODATA; 45347fa6f1SAkira Fujita 46e8505970SAkira Fujita return ret; 47e8505970SAkira Fujita } 48748de673SAkira Fujita 49748de673SAkira Fujita /** 50748de673SAkira Fujita * copy_extent_status - Copy the extent's initialization status 51748de673SAkira Fujita * 52748de673SAkira Fujita * @src: an extent for getting initialize status 53748de673SAkira Fujita * @dest: an extent to be set the status 54748de673SAkira Fujita */ 55748de673SAkira Fujita static void 56748de673SAkira Fujita copy_extent_status(struct ext4_extent *src, struct ext4_extent *dest) 57748de673SAkira Fujita { 58748de673SAkira Fujita if (ext4_ext_is_uninitialized(src)) 59748de673SAkira Fujita ext4_ext_mark_uninitialized(dest); 60748de673SAkira Fujita else 61748de673SAkira Fujita dest->ee_len = cpu_to_le16(ext4_ext_get_actual_len(dest)); 62748de673SAkira Fujita } 63748de673SAkira Fujita 64748de673SAkira Fujita /** 65748de673SAkira Fujita * mext_next_extent - Search for the next extent and set it to "extent" 66748de673SAkira Fujita * 67748de673SAkira Fujita * @inode: inode which is searched 68748de673SAkira Fujita * @path: this will obtain data for the next extent 69748de673SAkira Fujita * @extent: pointer to the next extent we have just gotten 70748de673SAkira Fujita * 71748de673SAkira Fujita * Search the next extent in the array of ext4_ext_path structure (@path) 72748de673SAkira Fujita * and set it to ext4_extent 
structure (@extent). In addition, the member of 73748de673SAkira Fujita * @path (->p_ext) also points the next extent. Return 0 on success, 1 if 74748de673SAkira Fujita * ext4_ext_path structure refers to the last extent, or a negative error 75748de673SAkira Fujita * value on failure. 76748de673SAkira Fujita */ 77748de673SAkira Fujita static int 78748de673SAkira Fujita mext_next_extent(struct inode *inode, struct ext4_ext_path *path, 79748de673SAkira Fujita struct ext4_extent **extent) 80748de673SAkira Fujita { 81fc04cb49SAkira Fujita struct ext4_extent_header *eh; 82748de673SAkira Fujita int ppos, leaf_ppos = path->p_depth; 83748de673SAkira Fujita 84748de673SAkira Fujita ppos = leaf_ppos; 85748de673SAkira Fujita if (EXT_LAST_EXTENT(path[ppos].p_hdr) > path[ppos].p_ext) { 86748de673SAkira Fujita /* leaf block */ 87748de673SAkira Fujita *extent = ++path[ppos].p_ext; 88bf89d16fSTheodore Ts'o path[ppos].p_block = ext4_ext_pblock(path[ppos].p_ext); 89748de673SAkira Fujita return 0; 90748de673SAkira Fujita } 91748de673SAkira Fujita 92748de673SAkira Fujita while (--ppos >= 0) { 93748de673SAkira Fujita if (EXT_LAST_INDEX(path[ppos].p_hdr) > 94748de673SAkira Fujita path[ppos].p_idx) { 95748de673SAkira Fujita int cur_ppos = ppos; 96748de673SAkira Fujita 97748de673SAkira Fujita /* index block */ 98748de673SAkira Fujita path[ppos].p_idx++; 99bf89d16fSTheodore Ts'o path[ppos].p_block = ext4_idx_pblock(path[ppos].p_idx); 100748de673SAkira Fujita if (path[ppos+1].p_bh) 101748de673SAkira Fujita brelse(path[ppos+1].p_bh); 102748de673SAkira Fujita path[ppos+1].p_bh = 103748de673SAkira Fujita sb_bread(inode->i_sb, path[ppos].p_block); 104748de673SAkira Fujita if (!path[ppos+1].p_bh) 105748de673SAkira Fujita return -EIO; 106748de673SAkira Fujita path[ppos+1].p_hdr = 107748de673SAkira Fujita ext_block_hdr(path[ppos+1].p_bh); 108748de673SAkira Fujita 109748de673SAkira Fujita /* Halfway index block */ 110748de673SAkira Fujita while (++cur_ppos < leaf_ppos) { 111748de673SAkira Fujita 
path[cur_ppos].p_idx = 112748de673SAkira Fujita EXT_FIRST_INDEX(path[cur_ppos].p_hdr); 113748de673SAkira Fujita path[cur_ppos].p_block = 114bf89d16fSTheodore Ts'o ext4_idx_pblock(path[cur_ppos].p_idx); 115748de673SAkira Fujita if (path[cur_ppos+1].p_bh) 116748de673SAkira Fujita brelse(path[cur_ppos+1].p_bh); 117748de673SAkira Fujita path[cur_ppos+1].p_bh = sb_bread(inode->i_sb, 118748de673SAkira Fujita path[cur_ppos].p_block); 119748de673SAkira Fujita if (!path[cur_ppos+1].p_bh) 120748de673SAkira Fujita return -EIO; 121748de673SAkira Fujita path[cur_ppos+1].p_hdr = 122748de673SAkira Fujita ext_block_hdr(path[cur_ppos+1].p_bh); 123748de673SAkira Fujita } 124748de673SAkira Fujita 125fc04cb49SAkira Fujita path[leaf_ppos].p_ext = *extent = NULL; 126fc04cb49SAkira Fujita 127fc04cb49SAkira Fujita eh = path[leaf_ppos].p_hdr; 128fc04cb49SAkira Fujita if (le16_to_cpu(eh->eh_entries) == 0) 129fc04cb49SAkira Fujita /* empty leaf is found */ 130fc04cb49SAkira Fujita return -ENODATA; 131fc04cb49SAkira Fujita 132748de673SAkira Fujita /* leaf block */ 133748de673SAkira Fujita path[leaf_ppos].p_ext = *extent = 134748de673SAkira Fujita EXT_FIRST_EXTENT(path[leaf_ppos].p_hdr); 135fc04cb49SAkira Fujita path[leaf_ppos].p_block = 136bf89d16fSTheodore Ts'o ext4_ext_pblock(path[leaf_ppos].p_ext); 137748de673SAkira Fujita return 0; 138748de673SAkira Fujita } 139748de673SAkira Fujita } 140748de673SAkira Fujita /* We found the last extent */ 141748de673SAkira Fujita return 1; 142748de673SAkira Fujita } 143748de673SAkira Fujita 144748de673SAkira Fujita /** 1452147b1a6SAkira Fujita * mext_check_null_inode - NULL check for two inodes 1462147b1a6SAkira Fujita * 1472147b1a6SAkira Fujita * If inode1 or inode2 is NULL, return -EIO. Otherwise, return 0. 
1482147b1a6SAkira Fujita */ 1492147b1a6SAkira Fujita static int 1502147b1a6SAkira Fujita mext_check_null_inode(struct inode *inode1, struct inode *inode2, 151c398eda0STheodore Ts'o const char *function, unsigned int line) 1522147b1a6SAkira Fujita { 1532147b1a6SAkira Fujita int ret = 0; 1542147b1a6SAkira Fujita 1552147b1a6SAkira Fujita if (inode1 == NULL) { 156c398eda0STheodore Ts'o __ext4_error(inode2->i_sb, function, line, 1572147b1a6SAkira Fujita "Both inodes should not be NULL: " 1582147b1a6SAkira Fujita "inode1 NULL inode2 %lu", inode2->i_ino); 1592147b1a6SAkira Fujita ret = -EIO; 1602147b1a6SAkira Fujita } else if (inode2 == NULL) { 161c398eda0STheodore Ts'o __ext4_error(inode1->i_sb, function, line, 1622147b1a6SAkira Fujita "Both inodes should not be NULL: " 1632147b1a6SAkira Fujita "inode1 %lu inode2 NULL", inode1->i_ino); 1642147b1a6SAkira Fujita ret = -EIO; 1652147b1a6SAkira Fujita } 1662147b1a6SAkira Fujita return ret; 1672147b1a6SAkira Fujita } 1682147b1a6SAkira Fujita 1692147b1a6SAkira Fujita /** 170fc04cb49SAkira Fujita * double_down_write_data_sem - Acquire two inodes' write lock of i_data_sem 171748de673SAkira Fujita * 172748de673SAkira Fujita * @orig_inode: original inode structure 173748de673SAkira Fujita * @donor_inode: donor inode structure 174fc04cb49SAkira Fujita * Acquire write lock of i_data_sem of the two inodes (orig and donor) by 175fc04cb49SAkira Fujita * i_ino order. 
176748de673SAkira Fujita */ 177748de673SAkira Fujita static void 178fc04cb49SAkira Fujita double_down_write_data_sem(struct inode *orig_inode, struct inode *donor_inode) 179748de673SAkira Fujita { 180748de673SAkira Fujita struct inode *first = orig_inode, *second = donor_inode; 181748de673SAkira Fujita 182748de673SAkira Fujita /* 183748de673SAkira Fujita * Use the inode number to provide the stable locking order instead 184748de673SAkira Fujita * of its address, because the C language doesn't guarantee you can 185748de673SAkira Fujita * compare pointers that don't come from the same array. 186748de673SAkira Fujita */ 187748de673SAkira Fujita if (donor_inode->i_ino < orig_inode->i_ino) { 188748de673SAkira Fujita first = donor_inode; 189748de673SAkira Fujita second = orig_inode; 190748de673SAkira Fujita } 191748de673SAkira Fujita 192748de673SAkira Fujita down_write(&EXT4_I(first)->i_data_sem); 19349bd22bcSAkira Fujita down_write_nested(&EXT4_I(second)->i_data_sem, SINGLE_DEPTH_NESTING); 194748de673SAkira Fujita } 195748de673SAkira Fujita 196748de673SAkira Fujita /** 197fc04cb49SAkira Fujita * double_up_write_data_sem - Release two inodes' write lock of i_data_sem 198748de673SAkira Fujita * 199748de673SAkira Fujita * @orig_inode: original inode structure to be released its lock first 200748de673SAkira Fujita * @donor_inode: donor inode structure to be released its lock second 201fc04cb49SAkira Fujita * Release write lock of i_data_sem of two inodes (orig and donor). 
202748de673SAkira Fujita */ 203748de673SAkira Fujita static void 204fc04cb49SAkira Fujita double_up_write_data_sem(struct inode *orig_inode, struct inode *donor_inode) 205748de673SAkira Fujita { 206748de673SAkira Fujita up_write(&EXT4_I(orig_inode)->i_data_sem); 207748de673SAkira Fujita up_write(&EXT4_I(donor_inode)->i_data_sem); 208748de673SAkira Fujita } 209748de673SAkira Fujita 210748de673SAkira Fujita /** 211748de673SAkira Fujita * mext_insert_across_blocks - Insert extents across leaf block 212748de673SAkira Fujita * 213748de673SAkira Fujita * @handle: journal handle 214748de673SAkira Fujita * @orig_inode: original inode 215748de673SAkira Fujita * @o_start: first original extent to be changed 216748de673SAkira Fujita * @o_end: last original extent to be changed 217748de673SAkira Fujita * @start_ext: first new extent to be inserted 218748de673SAkira Fujita * @new_ext: middle of new extent to be inserted 219748de673SAkira Fujita * @end_ext: last new extent to be inserted 220748de673SAkira Fujita * 221748de673SAkira Fujita * Allocate a new leaf block and insert extents into it. Return 0 on success, 222748de673SAkira Fujita * or a negative error value on failure. 
223748de673SAkira Fujita */ 224748de673SAkira Fujita static int 225748de673SAkira Fujita mext_insert_across_blocks(handle_t *handle, struct inode *orig_inode, 226748de673SAkira Fujita struct ext4_extent *o_start, struct ext4_extent *o_end, 227748de673SAkira Fujita struct ext4_extent *start_ext, struct ext4_extent *new_ext, 228748de673SAkira Fujita struct ext4_extent *end_ext) 229748de673SAkira Fujita { 230748de673SAkira Fujita struct ext4_ext_path *orig_path = NULL; 231748de673SAkira Fujita ext4_lblk_t eblock = 0; 232748de673SAkira Fujita int new_flag = 0; 233748de673SAkira Fujita int end_flag = 0; 234748de673SAkira Fujita int err = 0; 235748de673SAkira Fujita 236748de673SAkira Fujita if (start_ext->ee_len && new_ext->ee_len && end_ext->ee_len) { 237748de673SAkira Fujita if (o_start == o_end) { 238748de673SAkira Fujita 239748de673SAkira Fujita /* start_ext new_ext end_ext 240748de673SAkira Fujita * donor |---------|-----------|--------| 241748de673SAkira Fujita * orig |------------------------------| 242748de673SAkira Fujita */ 243748de673SAkira Fujita end_flag = 1; 244748de673SAkira Fujita } else { 245748de673SAkira Fujita 246748de673SAkira Fujita /* start_ext new_ext end_ext 247748de673SAkira Fujita * donor |---------|----------|---------| 248748de673SAkira Fujita * orig |---------------|--------------| 249748de673SAkira Fujita */ 250748de673SAkira Fujita o_end->ee_block = end_ext->ee_block; 251748de673SAkira Fujita o_end->ee_len = end_ext->ee_len; 252bf89d16fSTheodore Ts'o ext4_ext_store_pblock(o_end, ext4_ext_pblock(end_ext)); 253748de673SAkira Fujita } 254748de673SAkira Fujita 255748de673SAkira Fujita o_start->ee_len = start_ext->ee_len; 2565fd5249aSAkira Fujita eblock = le32_to_cpu(start_ext->ee_block); 257748de673SAkira Fujita new_flag = 1; 258748de673SAkira Fujita 259748de673SAkira Fujita } else if (start_ext->ee_len && new_ext->ee_len && 260748de673SAkira Fujita !end_ext->ee_len && o_start == o_end) { 261748de673SAkira Fujita 262748de673SAkira Fujita /* 
start_ext new_ext 263748de673SAkira Fujita * donor |--------------|---------------| 264748de673SAkira Fujita * orig |------------------------------| 265748de673SAkira Fujita */ 266748de673SAkira Fujita o_start->ee_len = start_ext->ee_len; 2675fd5249aSAkira Fujita eblock = le32_to_cpu(start_ext->ee_block); 268748de673SAkira Fujita new_flag = 1; 269748de673SAkira Fujita 270748de673SAkira Fujita } else if (!start_ext->ee_len && new_ext->ee_len && 271748de673SAkira Fujita end_ext->ee_len && o_start == o_end) { 272748de673SAkira Fujita 273748de673SAkira Fujita /* new_ext end_ext 274748de673SAkira Fujita * donor |--------------|---------------| 275748de673SAkira Fujita * orig |------------------------------| 276748de673SAkira Fujita */ 277748de673SAkira Fujita o_end->ee_block = end_ext->ee_block; 278748de673SAkira Fujita o_end->ee_len = end_ext->ee_len; 279bf89d16fSTheodore Ts'o ext4_ext_store_pblock(o_end, ext4_ext_pblock(end_ext)); 280748de673SAkira Fujita 281748de673SAkira Fujita /* 282748de673SAkira Fujita * Set 0 to the extent block if new_ext was 283748de673SAkira Fujita * the first block. 
284748de673SAkira Fujita */ 285748de673SAkira Fujita if (new_ext->ee_block) 286748de673SAkira Fujita eblock = le32_to_cpu(new_ext->ee_block); 287748de673SAkira Fujita 288748de673SAkira Fujita new_flag = 1; 289748de673SAkira Fujita } else { 290748de673SAkira Fujita ext4_debug("ext4 move extent: Unexpected insert case\n"); 291748de673SAkira Fujita return -EIO; 292748de673SAkira Fujita } 293748de673SAkira Fujita 294748de673SAkira Fujita if (new_flag) { 295e8505970SAkira Fujita err = get_ext_path(orig_inode, eblock, &orig_path); 296347fa6f1SAkira Fujita if (err) 297748de673SAkira Fujita goto out; 298748de673SAkira Fujita 299748de673SAkira Fujita if (ext4_ext_insert_extent(handle, orig_inode, 3000031462bSMingming Cao orig_path, new_ext, 0)) 301748de673SAkira Fujita goto out; 302748de673SAkira Fujita } 303748de673SAkira Fujita 304748de673SAkira Fujita if (end_flag) { 305e8505970SAkira Fujita err = get_ext_path(orig_inode, 306e8505970SAkira Fujita le32_to_cpu(end_ext->ee_block) - 1, &orig_path); 307347fa6f1SAkira Fujita if (err) 308748de673SAkira Fujita goto out; 309748de673SAkira Fujita 310748de673SAkira Fujita if (ext4_ext_insert_extent(handle, orig_inode, 3110031462bSMingming Cao orig_path, end_ext, 0)) 312748de673SAkira Fujita goto out; 313748de673SAkira Fujita } 314748de673SAkira Fujita out: 315748de673SAkira Fujita if (orig_path) { 316748de673SAkira Fujita ext4_ext_drop_refs(orig_path); 317748de673SAkira Fujita kfree(orig_path); 318748de673SAkira Fujita } 319748de673SAkira Fujita 320748de673SAkira Fujita return err; 321748de673SAkira Fujita 322748de673SAkira Fujita } 323748de673SAkira Fujita 324748de673SAkira Fujita /** 325748de673SAkira Fujita * mext_insert_inside_block - Insert new extent to the extent block 326748de673SAkira Fujita * 327748de673SAkira Fujita * @o_start: first original extent to be moved 328748de673SAkira Fujita * @o_end: last original extent to be moved 329748de673SAkira Fujita * @start_ext: first new extent to be inserted 330748de673SAkira 
Fujita * @new_ext: middle of new extent to be inserted 331748de673SAkira Fujita * @end_ext: last new extent to be inserted 332748de673SAkira Fujita * @eh: extent header of target leaf block 333748de673SAkira Fujita * @range_to_move: used to decide how to insert extent 334748de673SAkira Fujita * 335748de673SAkira Fujita * Insert extents into the leaf block. The extent (@o_start) is overwritten 336748de673SAkira Fujita * by inserted extents. 337748de673SAkira Fujita */ 338748de673SAkira Fujita static void 339748de673SAkira Fujita mext_insert_inside_block(struct ext4_extent *o_start, 340748de673SAkira Fujita struct ext4_extent *o_end, 341748de673SAkira Fujita struct ext4_extent *start_ext, 342748de673SAkira Fujita struct ext4_extent *new_ext, 343748de673SAkira Fujita struct ext4_extent *end_ext, 344748de673SAkira Fujita struct ext4_extent_header *eh, 345748de673SAkira Fujita int range_to_move) 346748de673SAkira Fujita { 347748de673SAkira Fujita int i = 0; 348748de673SAkira Fujita unsigned long len; 349748de673SAkira Fujita 350748de673SAkira Fujita /* Move the existing extents */ 351748de673SAkira Fujita if (range_to_move && o_end < EXT_LAST_EXTENT(eh)) { 352748de673SAkira Fujita len = (unsigned long)(EXT_LAST_EXTENT(eh) + 1) - 353748de673SAkira Fujita (unsigned long)(o_end + 1); 354748de673SAkira Fujita memmove(o_end + 1 + range_to_move, o_end + 1, len); 355748de673SAkira Fujita } 356748de673SAkira Fujita 357748de673SAkira Fujita /* Insert start entry */ 358748de673SAkira Fujita if (start_ext->ee_len) 359748de673SAkira Fujita o_start[i++].ee_len = start_ext->ee_len; 360748de673SAkira Fujita 361748de673SAkira Fujita /* Insert new entry */ 362748de673SAkira Fujita if (new_ext->ee_len) { 363748de673SAkira Fujita o_start[i] = *new_ext; 364bf89d16fSTheodore Ts'o ext4_ext_store_pblock(&o_start[i++], ext4_ext_pblock(new_ext)); 365748de673SAkira Fujita } 366748de673SAkira Fujita 367748de673SAkira Fujita /* Insert end entry */ 368748de673SAkira Fujita if (end_ext->ee_len) 
369748de673SAkira Fujita o_start[i] = *end_ext; 370748de673SAkira Fujita 371748de673SAkira Fujita /* Increment the total entries counter on the extent block */ 372748de673SAkira Fujita le16_add_cpu(&eh->eh_entries, range_to_move); 373748de673SAkira Fujita } 374748de673SAkira Fujita 375748de673SAkira Fujita /** 376748de673SAkira Fujita * mext_insert_extents - Insert new extent 377748de673SAkira Fujita * 378748de673SAkira Fujita * @handle: journal handle 379748de673SAkira Fujita * @orig_inode: original inode 380748de673SAkira Fujita * @orig_path: path indicates first extent to be changed 381748de673SAkira Fujita * @o_start: first original extent to be changed 382748de673SAkira Fujita * @o_end: last original extent to be changed 383748de673SAkira Fujita * @start_ext: first new extent to be inserted 384748de673SAkira Fujita * @new_ext: middle of new extent to be inserted 385748de673SAkira Fujita * @end_ext: last new extent to be inserted 386748de673SAkira Fujita * 387748de673SAkira Fujita * Call the function to insert extents. If we cannot add more extents into 388748de673SAkira Fujita * the leaf block, we call mext_insert_across_blocks() to create a 389748de673SAkira Fujita * new leaf block. Otherwise call mext_insert_inside_block(). Return 0 390748de673SAkira Fujita * on success, or a negative error value on failure. 
391748de673SAkira Fujita */ 392748de673SAkira Fujita static int 393748de673SAkira Fujita mext_insert_extents(handle_t *handle, struct inode *orig_inode, 394748de673SAkira Fujita struct ext4_ext_path *orig_path, 395748de673SAkira Fujita struct ext4_extent *o_start, 396748de673SAkira Fujita struct ext4_extent *o_end, 397748de673SAkira Fujita struct ext4_extent *start_ext, 398748de673SAkira Fujita struct ext4_extent *new_ext, 399748de673SAkira Fujita struct ext4_extent *end_ext) 400748de673SAkira Fujita { 401748de673SAkira Fujita struct ext4_extent_header *eh; 402748de673SAkira Fujita unsigned long need_slots, slots_range; 403748de673SAkira Fujita int range_to_move, depth, ret; 404748de673SAkira Fujita 405748de673SAkira Fujita /* 406748de673SAkira Fujita * The extents need to be inserted 407748de673SAkira Fujita * start_extent + new_extent + end_extent. 408748de673SAkira Fujita */ 409748de673SAkira Fujita need_slots = (start_ext->ee_len ? 1 : 0) + (end_ext->ee_len ? 1 : 0) + 410748de673SAkira Fujita (new_ext->ee_len ? 
1 : 0); 411748de673SAkira Fujita 412748de673SAkira Fujita /* The number of slots between start and end */ 413748de673SAkira Fujita slots_range = ((unsigned long)(o_end + 1) - (unsigned long)o_start + 1) 414748de673SAkira Fujita / sizeof(struct ext4_extent); 415748de673SAkira Fujita 416748de673SAkira Fujita /* Range to move the end of extent */ 417748de673SAkira Fujita range_to_move = need_slots - slots_range; 418748de673SAkira Fujita depth = orig_path->p_depth; 419748de673SAkira Fujita orig_path += depth; 420748de673SAkira Fujita eh = orig_path->p_hdr; 421748de673SAkira Fujita 422748de673SAkira Fujita if (depth) { 423748de673SAkira Fujita /* Register to journal */ 424748de673SAkira Fujita ret = ext4_journal_get_write_access(handle, orig_path->p_bh); 425748de673SAkira Fujita if (ret) 426748de673SAkira Fujita return ret; 427748de673SAkira Fujita } 428748de673SAkira Fujita 429748de673SAkira Fujita /* Expansion */ 430748de673SAkira Fujita if (range_to_move > 0 && 431748de673SAkira Fujita (range_to_move > le16_to_cpu(eh->eh_max) 432748de673SAkira Fujita - le16_to_cpu(eh->eh_entries))) { 433748de673SAkira Fujita 434748de673SAkira Fujita ret = mext_insert_across_blocks(handle, orig_inode, o_start, 435748de673SAkira Fujita o_end, start_ext, new_ext, end_ext); 436748de673SAkira Fujita if (ret < 0) 437748de673SAkira Fujita return ret; 438748de673SAkira Fujita } else 439748de673SAkira Fujita mext_insert_inside_block(o_start, o_end, start_ext, new_ext, 440748de673SAkira Fujita end_ext, eh, range_to_move); 441748de673SAkira Fujita 442748de673SAkira Fujita if (depth) { 443748de673SAkira Fujita ret = ext4_handle_dirty_metadata(handle, orig_inode, 444748de673SAkira Fujita orig_path->p_bh); 445748de673SAkira Fujita if (ret) 446748de673SAkira Fujita return ret; 447748de673SAkira Fujita } else { 448748de673SAkira Fujita ret = ext4_mark_inode_dirty(handle, orig_inode); 449748de673SAkira Fujita if (ret < 0) 450748de673SAkira Fujita return ret; 451748de673SAkira Fujita } 
452748de673SAkira Fujita 453748de673SAkira Fujita return 0; 454748de673SAkira Fujita } 455748de673SAkira Fujita 456748de673SAkira Fujita /** 457748de673SAkira Fujita * mext_leaf_block - Move one leaf extent block into the inode. 458748de673SAkira Fujita * 459748de673SAkira Fujita * @handle: journal handle 460748de673SAkira Fujita * @orig_inode: original inode 461748de673SAkira Fujita * @orig_path: path indicates first extent to be changed 462748de673SAkira Fujita * @dext: donor extent 463748de673SAkira Fujita * @from: start offset on the target file 464748de673SAkira Fujita * 465748de673SAkira Fujita * In order to insert extents into the leaf block, we must divide the extent 466748de673SAkira Fujita * in the leaf block into three extents. The one is located to be inserted 467748de673SAkira Fujita * extents, and the others are located around it. 468748de673SAkira Fujita * 469748de673SAkira Fujita * Therefore, this function creates structures to save extents of the leaf 470748de673SAkira Fujita * block, and inserts extents by calling mext_insert_extents() with 471748de673SAkira Fujita * created extents. Return 0 on success, or a negative error value on failure. 
472748de673SAkira Fujita */ 473748de673SAkira Fujita static int 474748de673SAkira Fujita mext_leaf_block(handle_t *handle, struct inode *orig_inode, 475748de673SAkira Fujita struct ext4_ext_path *orig_path, struct ext4_extent *dext, 476748de673SAkira Fujita ext4_lblk_t *from) 477748de673SAkira Fujita { 478748de673SAkira Fujita struct ext4_extent *oext, *o_start, *o_end, *prev_ext; 479748de673SAkira Fujita struct ext4_extent new_ext, start_ext, end_ext; 480748de673SAkira Fujita ext4_lblk_t new_ext_end; 481748de673SAkira Fujita int oext_alen, new_ext_alen, end_ext_alen; 482748de673SAkira Fujita int depth = ext_depth(orig_inode); 483748de673SAkira Fujita int ret; 484748de673SAkira Fujita 485c26d0badSSteven Liu start_ext.ee_block = end_ext.ee_block = 0; 486748de673SAkira Fujita o_start = o_end = oext = orig_path[depth].p_ext; 487748de673SAkira Fujita oext_alen = ext4_ext_get_actual_len(oext); 488748de673SAkira Fujita start_ext.ee_len = end_ext.ee_len = 0; 489748de673SAkira Fujita 490748de673SAkira Fujita new_ext.ee_block = cpu_to_le32(*from); 491bf89d16fSTheodore Ts'o ext4_ext_store_pblock(&new_ext, ext4_ext_pblock(dext)); 492748de673SAkira Fujita new_ext.ee_len = dext->ee_len; 493748de673SAkira Fujita new_ext_alen = ext4_ext_get_actual_len(&new_ext); 494748de673SAkira Fujita new_ext_end = le32_to_cpu(new_ext.ee_block) + new_ext_alen - 1; 495748de673SAkira Fujita 496748de673SAkira Fujita /* 497748de673SAkira Fujita * Case: original extent is first 498748de673SAkira Fujita * oext |--------| 499748de673SAkira Fujita * new_ext |--| 500748de673SAkira Fujita * start_ext |--| 501748de673SAkira Fujita */ 502748de673SAkira Fujita if (le32_to_cpu(oext->ee_block) < le32_to_cpu(new_ext.ee_block) && 503748de673SAkira Fujita le32_to_cpu(new_ext.ee_block) < 504748de673SAkira Fujita le32_to_cpu(oext->ee_block) + oext_alen) { 505748de673SAkira Fujita start_ext.ee_len = cpu_to_le16(le32_to_cpu(new_ext.ee_block) - 506748de673SAkira Fujita le32_to_cpu(oext->ee_block)); 5075fd5249aSAkira 
Fujita start_ext.ee_block = oext->ee_block; 508748de673SAkira Fujita copy_extent_status(oext, &start_ext); 509748de673SAkira Fujita } else if (oext > EXT_FIRST_EXTENT(orig_path[depth].p_hdr)) { 510748de673SAkira Fujita prev_ext = oext - 1; 511748de673SAkira Fujita /* 512748de673SAkira Fujita * We can merge new_ext into previous extent, 513748de673SAkira Fujita * if these are contiguous and same extent type. 514748de673SAkira Fujita */ 515748de673SAkira Fujita if (ext4_can_extents_be_merged(orig_inode, prev_ext, 516748de673SAkira Fujita &new_ext)) { 517748de673SAkira Fujita o_start = prev_ext; 518748de673SAkira Fujita start_ext.ee_len = cpu_to_le16( 519748de673SAkira Fujita ext4_ext_get_actual_len(prev_ext) + 520748de673SAkira Fujita new_ext_alen); 5215fd5249aSAkira Fujita start_ext.ee_block = oext->ee_block; 522748de673SAkira Fujita copy_extent_status(prev_ext, &start_ext); 523748de673SAkira Fujita new_ext.ee_len = 0; 524748de673SAkira Fujita } 525748de673SAkira Fujita } 526748de673SAkira Fujita 527748de673SAkira Fujita /* 528748de673SAkira Fujita * Case: new_ext_end must be less than oext 529748de673SAkira Fujita * oext |-----------| 530748de673SAkira Fujita * new_ext |-------| 531748de673SAkira Fujita */ 5322147b1a6SAkira Fujita if (le32_to_cpu(oext->ee_block) + oext_alen - 1 < new_ext_end) { 53324676da4STheodore Ts'o EXT4_ERROR_INODE(orig_inode, 5342147b1a6SAkira Fujita "new_ext_end(%u) should be less than or equal to " 5352147b1a6SAkira Fujita "oext->ee_block(%u) + oext_alen(%d) - 1", 5362147b1a6SAkira Fujita new_ext_end, le32_to_cpu(oext->ee_block), 5372147b1a6SAkira Fujita oext_alen); 5382147b1a6SAkira Fujita ret = -EIO; 5392147b1a6SAkira Fujita goto out; 5402147b1a6SAkira Fujita } 541748de673SAkira Fujita 542748de673SAkira Fujita /* 543748de673SAkira Fujita * Case: new_ext is smaller than original extent 544748de673SAkira Fujita * oext |---------------| 545748de673SAkira Fujita * new_ext |-----------| 546748de673SAkira Fujita * end_ext |---| 
547748de673SAkira Fujita */ 548748de673SAkira Fujita if (le32_to_cpu(oext->ee_block) <= new_ext_end && 549748de673SAkira Fujita new_ext_end < le32_to_cpu(oext->ee_block) + oext_alen - 1) { 550748de673SAkira Fujita end_ext.ee_len = 551748de673SAkira Fujita cpu_to_le16(le32_to_cpu(oext->ee_block) + 552748de673SAkira Fujita oext_alen - 1 - new_ext_end); 553748de673SAkira Fujita copy_extent_status(oext, &end_ext); 554748de673SAkira Fujita end_ext_alen = ext4_ext_get_actual_len(&end_ext); 555748de673SAkira Fujita ext4_ext_store_pblock(&end_ext, 556bf89d16fSTheodore Ts'o (ext4_ext_pblock(o_end) + oext_alen - end_ext_alen)); 557748de673SAkira Fujita end_ext.ee_block = 558748de673SAkira Fujita cpu_to_le32(le32_to_cpu(o_end->ee_block) + 559748de673SAkira Fujita oext_alen - end_ext_alen); 560748de673SAkira Fujita } 561748de673SAkira Fujita 562748de673SAkira Fujita ret = mext_insert_extents(handle, orig_inode, orig_path, o_start, 563748de673SAkira Fujita o_end, &start_ext, &new_ext, &end_ext); 5642147b1a6SAkira Fujita out: 565748de673SAkira Fujita return ret; 566748de673SAkira Fujita } 567748de673SAkira Fujita 568748de673SAkira Fujita /** 569748de673SAkira Fujita * mext_calc_swap_extents - Calculate extents for extent swapping. 570748de673SAkira Fujita * 571748de673SAkira Fujita * @tmp_dext: the extent that will belong to the original inode 572748de673SAkira Fujita * @tmp_oext: the extent that will belong to the donor inode 573748de673SAkira Fujita * @orig_off: block offset of original inode 574748de673SAkira Fujita * @donor_off: block offset of donor inode 57592c28159SAkira Fujita * @max_count: the maximum length of extents 576c40ce3c9SAkira Fujita * 577c40ce3c9SAkira Fujita * Return 0 on success, or a negative error value on failure. 
578748de673SAkira Fujita */ 579c40ce3c9SAkira Fujita static int 580748de673SAkira Fujita mext_calc_swap_extents(struct ext4_extent *tmp_dext, 581748de673SAkira Fujita struct ext4_extent *tmp_oext, 582748de673SAkira Fujita ext4_lblk_t orig_off, ext4_lblk_t donor_off, 583748de673SAkira Fujita ext4_lblk_t max_count) 584748de673SAkira Fujita { 585748de673SAkira Fujita ext4_lblk_t diff, orig_diff; 586748de673SAkira Fujita struct ext4_extent dext_old, oext_old; 587748de673SAkira Fujita 588c40ce3c9SAkira Fujita BUG_ON(orig_off != donor_off); 589c40ce3c9SAkira Fujita 590c40ce3c9SAkira Fujita /* original and donor extents have to cover the same block offset */ 591c40ce3c9SAkira Fujita if (orig_off < le32_to_cpu(tmp_oext->ee_block) || 592c40ce3c9SAkira Fujita le32_to_cpu(tmp_oext->ee_block) + 593c40ce3c9SAkira Fujita ext4_ext_get_actual_len(tmp_oext) - 1 < orig_off) 594c40ce3c9SAkira Fujita return -ENODATA; 595c40ce3c9SAkira Fujita 596c40ce3c9SAkira Fujita if (orig_off < le32_to_cpu(tmp_dext->ee_block) || 597c40ce3c9SAkira Fujita le32_to_cpu(tmp_dext->ee_block) + 598c40ce3c9SAkira Fujita ext4_ext_get_actual_len(tmp_dext) - 1 < orig_off) 599c40ce3c9SAkira Fujita return -ENODATA; 600c40ce3c9SAkira Fujita 601748de673SAkira Fujita dext_old = *tmp_dext; 602748de673SAkira Fujita oext_old = *tmp_oext; 603748de673SAkira Fujita 604748de673SAkira Fujita /* When tmp_dext is too large, pick up the target range. 
*/ 605748de673SAkira Fujita diff = donor_off - le32_to_cpu(tmp_dext->ee_block); 606748de673SAkira Fujita 607bf89d16fSTheodore Ts'o ext4_ext_store_pblock(tmp_dext, ext4_ext_pblock(tmp_dext) + diff); 608748de673SAkira Fujita tmp_dext->ee_block = 609748de673SAkira Fujita cpu_to_le32(le32_to_cpu(tmp_dext->ee_block) + diff); 610748de673SAkira Fujita tmp_dext->ee_len = cpu_to_le16(le16_to_cpu(tmp_dext->ee_len) - diff); 611748de673SAkira Fujita 612748de673SAkira Fujita if (max_count < ext4_ext_get_actual_len(tmp_dext)) 613748de673SAkira Fujita tmp_dext->ee_len = cpu_to_le16(max_count); 614748de673SAkira Fujita 615748de673SAkira Fujita orig_diff = orig_off - le32_to_cpu(tmp_oext->ee_block); 616bf89d16fSTheodore Ts'o ext4_ext_store_pblock(tmp_oext, ext4_ext_pblock(tmp_oext) + orig_diff); 617748de673SAkira Fujita 618748de673SAkira Fujita /* Adjust extent length if donor extent is larger than orig */ 619748de673SAkira Fujita if (ext4_ext_get_actual_len(tmp_dext) > 620748de673SAkira Fujita ext4_ext_get_actual_len(tmp_oext) - orig_diff) 621748de673SAkira Fujita tmp_dext->ee_len = cpu_to_le16(le16_to_cpu(tmp_oext->ee_len) - 622748de673SAkira Fujita orig_diff); 623748de673SAkira Fujita 624748de673SAkira Fujita tmp_oext->ee_len = cpu_to_le16(ext4_ext_get_actual_len(tmp_dext)); 625748de673SAkira Fujita 626748de673SAkira Fujita copy_extent_status(&oext_old, tmp_dext); 627748de673SAkira Fujita copy_extent_status(&dext_old, tmp_oext); 628c40ce3c9SAkira Fujita 629c40ce3c9SAkira Fujita return 0; 630748de673SAkira Fujita } 631748de673SAkira Fujita 632748de673SAkira Fujita /** 633748de673SAkira Fujita * mext_replace_branches - Replace original extents with new extents 634748de673SAkira Fujita * 635748de673SAkira Fujita * @handle: journal handle 636748de673SAkira Fujita * @orig_inode: original inode 637748de673SAkira Fujita * @donor_inode: donor inode 638748de673SAkira Fujita * @from: block offset of orig_inode 639748de673SAkira Fujita * @count: block count to be replaced 640f868a48dSAkira 
Fujita * @err: pointer to save return value 641748de673SAkira Fujita * 642748de673SAkira Fujita * Replace original inode extents and donor inode extents page by page. 643748de673SAkira Fujita * We implement this replacement in the following three steps: 644748de673SAkira Fujita * 1. Save the block information of original and donor inodes into 645748de673SAkira Fujita * dummy extents. 646748de673SAkira Fujita * 2. Change the block information of original inode to point at the 647748de673SAkira Fujita * donor inode blocks. 648748de673SAkira Fujita * 3. Change the block information of donor inode to point at the saved 649748de673SAkira Fujita * original inode blocks in the dummy extents. 650748de673SAkira Fujita * 651f868a48dSAkira Fujita * Return replaced block count. 652748de673SAkira Fujita */ 653748de673SAkira Fujita static int 654748de673SAkira Fujita mext_replace_branches(handle_t *handle, struct inode *orig_inode, 655748de673SAkira Fujita struct inode *donor_inode, ext4_lblk_t from, 656f868a48dSAkira Fujita ext4_lblk_t count, int *err) 657748de673SAkira Fujita { 658748de673SAkira Fujita struct ext4_ext_path *orig_path = NULL; 659748de673SAkira Fujita struct ext4_ext_path *donor_path = NULL; 660748de673SAkira Fujita struct ext4_extent *oext, *dext; 661748de673SAkira Fujita struct ext4_extent tmp_dext, tmp_oext; 662748de673SAkira Fujita ext4_lblk_t orig_off = from, donor_off = from; 663748de673SAkira Fujita int depth; 664748de673SAkira Fujita int replaced_count = 0; 665748de673SAkira Fujita int dext_alen; 666748de673SAkira Fujita 667ac48b0a1SAkira Fujita /* Protect extent trees against block allocations via delalloc */ 668ac48b0a1SAkira Fujita double_down_write_data_sem(orig_inode, donor_inode); 669ac48b0a1SAkira Fujita 670748de673SAkira Fujita /* Get the original extent for the block "orig_off" */ 671f868a48dSAkira Fujita *err = get_ext_path(orig_inode, orig_off, &orig_path); 672f868a48dSAkira Fujita if (*err) 673748de673SAkira Fujita goto out; 674748de673SAkira 
Fujita 675748de673SAkira Fujita /* Get the donor extent for the head */ 676f868a48dSAkira Fujita *err = get_ext_path(donor_inode, donor_off, &donor_path); 677f868a48dSAkira Fujita if (*err) 678748de673SAkira Fujita goto out; 679748de673SAkira Fujita depth = ext_depth(orig_inode); 680748de673SAkira Fujita oext = orig_path[depth].p_ext; 681748de673SAkira Fujita tmp_oext = *oext; 682748de673SAkira Fujita 683748de673SAkira Fujita depth = ext_depth(donor_inode); 684748de673SAkira Fujita dext = donor_path[depth].p_ext; 685748de673SAkira Fujita tmp_dext = *dext; 686748de673SAkira Fujita 687f868a48dSAkira Fujita *err = mext_calc_swap_extents(&tmp_dext, &tmp_oext, orig_off, 688748de673SAkira Fujita donor_off, count); 689f868a48dSAkira Fujita if (*err) 690c40ce3c9SAkira Fujita goto out; 691748de673SAkira Fujita 692748de673SAkira Fujita /* Loop for the donor extents */ 693748de673SAkira Fujita while (1) { 694748de673SAkira Fujita /* The extent for donor must be found. */ 6952147b1a6SAkira Fujita if (!dext) { 69624676da4STheodore Ts'o EXT4_ERROR_INODE(donor_inode, 6972147b1a6SAkira Fujita "The extent for donor must be found"); 698f868a48dSAkira Fujita *err = -EIO; 6992147b1a6SAkira Fujita goto out; 7002147b1a6SAkira Fujita } else if (donor_off != le32_to_cpu(tmp_dext.ee_block)) { 70124676da4STheodore Ts'o EXT4_ERROR_INODE(donor_inode, 7022147b1a6SAkira Fujita "Donor offset(%u) and the first block of donor " 7032147b1a6SAkira Fujita "extent(%u) should be equal", 7042147b1a6SAkira Fujita donor_off, 7052147b1a6SAkira Fujita le32_to_cpu(tmp_dext.ee_block)); 706f868a48dSAkira Fujita *err = -EIO; 7072147b1a6SAkira Fujita goto out; 7082147b1a6SAkira Fujita } 709748de673SAkira Fujita 710748de673SAkira Fujita /* Set donor extent to orig extent */ 711f868a48dSAkira Fujita *err = mext_leaf_block(handle, orig_inode, 712748de673SAkira Fujita orig_path, &tmp_dext, &orig_off); 713f868a48dSAkira Fujita if (*err) 714748de673SAkira Fujita goto out; 715748de673SAkira Fujita 716748de673SAkira 
Fujita /* Set orig extent to donor extent */ 717f868a48dSAkira Fujita *err = mext_leaf_block(handle, donor_inode, 718748de673SAkira Fujita donor_path, &tmp_oext, &donor_off); 719f868a48dSAkira Fujita if (*err) 720748de673SAkira Fujita goto out; 721748de673SAkira Fujita 722748de673SAkira Fujita dext_alen = ext4_ext_get_actual_len(&tmp_dext); 723748de673SAkira Fujita replaced_count += dext_alen; 724748de673SAkira Fujita donor_off += dext_alen; 725748de673SAkira Fujita orig_off += dext_alen; 726748de673SAkira Fujita 727748de673SAkira Fujita /* Already moved the expected blocks */ 728748de673SAkira Fujita if (replaced_count >= count) 729748de673SAkira Fujita break; 730748de673SAkira Fujita 731748de673SAkira Fujita if (orig_path) 732748de673SAkira Fujita ext4_ext_drop_refs(orig_path); 733f868a48dSAkira Fujita *err = get_ext_path(orig_inode, orig_off, &orig_path); 734f868a48dSAkira Fujita if (*err) 735748de673SAkira Fujita goto out; 736748de673SAkira Fujita depth = ext_depth(orig_inode); 737748de673SAkira Fujita oext = orig_path[depth].p_ext; 738748de673SAkira Fujita tmp_oext = *oext; 739748de673SAkira Fujita 740748de673SAkira Fujita if (donor_path) 741748de673SAkira Fujita ext4_ext_drop_refs(donor_path); 742f868a48dSAkira Fujita *err = get_ext_path(donor_inode, donor_off, &donor_path); 743f868a48dSAkira Fujita if (*err) 744748de673SAkira Fujita goto out; 745748de673SAkira Fujita depth = ext_depth(donor_inode); 746748de673SAkira Fujita dext = donor_path[depth].p_ext; 747748de673SAkira Fujita tmp_dext = *dext; 748748de673SAkira Fujita 749f868a48dSAkira Fujita *err = mext_calc_swap_extents(&tmp_dext, &tmp_oext, orig_off, 750c40ce3c9SAkira Fujita donor_off, count - replaced_count); 751f868a48dSAkira Fujita if (*err) 752c40ce3c9SAkira Fujita goto out; 753748de673SAkira Fujita } 754748de673SAkira Fujita 755748de673SAkira Fujita out: 756748de673SAkira Fujita if (orig_path) { 757748de673SAkira Fujita ext4_ext_drop_refs(orig_path); 758748de673SAkira Fujita kfree(orig_path); 
759748de673SAkira Fujita } 760748de673SAkira Fujita if (donor_path) { 761748de673SAkira Fujita ext4_ext_drop_refs(donor_path); 762748de673SAkira Fujita kfree(donor_path); 763748de673SAkira Fujita } 764748de673SAkira Fujita 765ac48b0a1SAkira Fujita ext4_ext_invalidate_cache(orig_inode); 766ac48b0a1SAkira Fujita ext4_ext_invalidate_cache(donor_inode); 767ac48b0a1SAkira Fujita 768ac48b0a1SAkira Fujita double_up_write_data_sem(orig_inode, donor_inode); 769ac48b0a1SAkira Fujita 770f868a48dSAkira Fujita return replaced_count; 771748de673SAkira Fujita } 772748de673SAkira Fujita 773748de673SAkira Fujita /** 774748de673SAkira Fujita * move_extent_per_page - Move extent data per page 775748de673SAkira Fujita * 776748de673SAkira Fujita * @o_filp: file structure of original file 777748de673SAkira Fujita * @donor_inode: donor inode 778748de673SAkira Fujita * @orig_page_offset: page index on original file 779748de673SAkira Fujita * @data_offset_in_page: block index where data swapping starts 780748de673SAkira Fujita * @block_len_in_page: the number of blocks to be swapped 781748de673SAkira Fujita * @uninit: orig extent is uninitialized or not 782f868a48dSAkira Fujita * @err: pointer to save return value 783748de673SAkira Fujita * 784748de673SAkira Fujita * Save the data in original inode blocks and replace original inode extents 785748de673SAkira Fujita * with donor inode extents by calling mext_replace_branches(). 786f868a48dSAkira Fujita * Finally, write out the saved data in new original inode blocks. Return 787f868a48dSAkira Fujita * replaced block count. 
788748de673SAkira Fujita */ 789748de673SAkira Fujita static int 79044fc48f7SAkira Fujita move_extent_per_page(struct file *o_filp, struct inode *donor_inode, 791748de673SAkira Fujita pgoff_t orig_page_offset, int data_offset_in_page, 792f868a48dSAkira Fujita int block_len_in_page, int uninit, int *err) 793748de673SAkira Fujita { 794748de673SAkira Fujita struct inode *orig_inode = o_filp->f_dentry->d_inode; 795748de673SAkira Fujita struct address_space *mapping = orig_inode->i_mapping; 796748de673SAkira Fujita struct buffer_head *bh; 797748de673SAkira Fujita struct page *page = NULL; 798748de673SAkira Fujita const struct address_space_operations *a_ops = mapping->a_ops; 799748de673SAkira Fujita handle_t *handle; 800748de673SAkira Fujita ext4_lblk_t orig_blk_offset; 801748de673SAkira Fujita long long offs = orig_page_offset << PAGE_CACHE_SHIFT; 802748de673SAkira Fujita unsigned long blocksize = orig_inode->i_sb->s_blocksize; 803748de673SAkira Fujita unsigned int w_flags = 0; 804f868a48dSAkira Fujita unsigned int tmp_data_size, data_size, replaced_size; 805748de673SAkira Fujita void *fsdata; 806f868a48dSAkira Fujita int i, jblocks; 807f868a48dSAkira Fujita int err2 = 0; 808f868a48dSAkira Fujita int replaced_count = 0; 809748de673SAkira Fujita int blocks_per_page = PAGE_CACHE_SIZE >> orig_inode->i_blkbits; 810748de673SAkira Fujita 811748de673SAkira Fujita /* 812748de673SAkira Fujita * It needs twice the amount of ordinary journal buffers because 813748de673SAkira Fujita * inode and donor_inode may change each different metadata blocks. 
814748de673SAkira Fujita */ 815748de673SAkira Fujita jblocks = ext4_writepage_trans_blocks(orig_inode) * 2; 816748de673SAkira Fujita handle = ext4_journal_start(orig_inode, jblocks); 817748de673SAkira Fujita if (IS_ERR(handle)) { 818f868a48dSAkira Fujita *err = PTR_ERR(handle); 819f868a48dSAkira Fujita return 0; 820748de673SAkira Fujita } 821748de673SAkira Fujita 822748de673SAkira Fujita if (segment_eq(get_fs(), KERNEL_DS)) 823748de673SAkira Fujita w_flags |= AOP_FLAG_UNINTERRUPTIBLE; 824748de673SAkira Fujita 825748de673SAkira Fujita orig_blk_offset = orig_page_offset * blocks_per_page + 826748de673SAkira Fujita data_offset_in_page; 827748de673SAkira Fujita 828748de673SAkira Fujita /* 829748de673SAkira Fujita * If orig extent is uninitialized one, 830748de673SAkira Fujita * it's not necessary force the page into memory 831748de673SAkira Fujita * and then force it to be written out again. 832748de673SAkira Fujita * Just swap data blocks between orig and donor. 833748de673SAkira Fujita */ 834748de673SAkira Fujita if (uninit) { 835f868a48dSAkira Fujita replaced_count = mext_replace_branches(handle, orig_inode, 836748de673SAkira Fujita donor_inode, orig_blk_offset, 837f868a48dSAkira Fujita block_len_in_page, err); 838748de673SAkira Fujita goto out2; 839748de673SAkira Fujita } 840748de673SAkira Fujita 841748de673SAkira Fujita offs = (long long)orig_blk_offset << orig_inode->i_blkbits; 842748de673SAkira Fujita 843f868a48dSAkira Fujita /* Calculate data_size */ 844748de673SAkira Fujita if ((orig_blk_offset + block_len_in_page - 1) == 845748de673SAkira Fujita ((orig_inode->i_size - 1) >> orig_inode->i_blkbits)) { 846748de673SAkira Fujita /* Replace the last block */ 847f868a48dSAkira Fujita tmp_data_size = orig_inode->i_size & (blocksize - 1); 848748de673SAkira Fujita /* 849f868a48dSAkira Fujita * If data_size equal zero, it shows data_size is multiples of 850748de673SAkira Fujita * blocksize. So we set appropriate value. 
851748de673SAkira Fujita */ 852f868a48dSAkira Fujita if (tmp_data_size == 0) 853f868a48dSAkira Fujita tmp_data_size = blocksize; 854748de673SAkira Fujita 855f868a48dSAkira Fujita data_size = tmp_data_size + 856748de673SAkira Fujita ((block_len_in_page - 1) << orig_inode->i_blkbits); 857f868a48dSAkira Fujita } else 858f868a48dSAkira Fujita data_size = block_len_in_page << orig_inode->i_blkbits; 859748de673SAkira Fujita 860f868a48dSAkira Fujita replaced_size = data_size; 861f868a48dSAkira Fujita 862f868a48dSAkira Fujita *err = a_ops->write_begin(o_filp, mapping, offs, data_size, w_flags, 863748de673SAkira Fujita &page, &fsdata); 864f868a48dSAkira Fujita if (unlikely(*err < 0)) 865748de673SAkira Fujita goto out; 866748de673SAkira Fujita 867748de673SAkira Fujita if (!PageUptodate(page)) { 868748de673SAkira Fujita mapping->a_ops->readpage(o_filp, page); 869748de673SAkira Fujita lock_page(page); 870748de673SAkira Fujita } 871748de673SAkira Fujita 872748de673SAkira Fujita /* 873748de673SAkira Fujita * try_to_release_page() doesn't call releasepage in writeback mode. 874748de673SAkira Fujita * We should care about the order of writing to the same file 875748de673SAkira Fujita * by multiple move extent processes. 876748de673SAkira Fujita * It needs to call wait_on_page_writeback() to wait for the 877748de673SAkira Fujita * writeback of the page. 
878748de673SAkira Fujita */ 879748de673SAkira Fujita wait_on_page_writeback(page); 880748de673SAkira Fujita 881748de673SAkira Fujita /* Release old bh and drop refs */ 882748de673SAkira Fujita try_to_release_page(page, 0); 883748de673SAkira Fujita 884f868a48dSAkira Fujita replaced_count = mext_replace_branches(handle, orig_inode, donor_inode, 885f868a48dSAkira Fujita orig_blk_offset, block_len_in_page, 886f868a48dSAkira Fujita &err2); 887f868a48dSAkira Fujita if (err2) { 888f868a48dSAkira Fujita if (replaced_count) { 889f868a48dSAkira Fujita block_len_in_page = replaced_count; 890f868a48dSAkira Fujita replaced_size = 891f868a48dSAkira Fujita block_len_in_page << orig_inode->i_blkbits; 892ac48b0a1SAkira Fujita } else 893748de673SAkira Fujita goto out; 894f868a48dSAkira Fujita } 895fc04cb49SAkira Fujita 896748de673SAkira Fujita if (!page_has_buffers(page)) 897748de673SAkira Fujita create_empty_buffers(page, 1 << orig_inode->i_blkbits, 0); 898748de673SAkira Fujita 899748de673SAkira Fujita bh = page_buffers(page); 900748de673SAkira Fujita for (i = 0; i < data_offset_in_page; i++) 901748de673SAkira Fujita bh = bh->b_this_page; 902748de673SAkira Fujita 903748de673SAkira Fujita for (i = 0; i < block_len_in_page; i++) { 904f868a48dSAkira Fujita *err = ext4_get_block(orig_inode, 905748de673SAkira Fujita (sector_t)(orig_blk_offset + i), bh, 0); 906f868a48dSAkira Fujita if (*err < 0) 907748de673SAkira Fujita goto out; 908748de673SAkira Fujita 909748de673SAkira Fujita if (bh->b_this_page != NULL) 910748de673SAkira Fujita bh = bh->b_this_page; 911748de673SAkira Fujita } 912748de673SAkira Fujita 913f868a48dSAkira Fujita *err = a_ops->write_end(o_filp, mapping, offs, data_size, replaced_size, 914748de673SAkira Fujita page, fsdata); 915748de673SAkira Fujita page = NULL; 916748de673SAkira Fujita 917748de673SAkira Fujita out: 918748de673SAkira Fujita if (unlikely(page)) { 919748de673SAkira Fujita if (PageLocked(page)) 920748de673SAkira Fujita unlock_page(page); 921748de673SAkira 
Fujita page_cache_release(page); 92291cc219aSPeng Tao ext4_journal_stop(handle); 923748de673SAkira Fujita } 924748de673SAkira Fujita out2: 925748de673SAkira Fujita ext4_journal_stop(handle); 926748de673SAkira Fujita 927f868a48dSAkira Fujita if (err2) 928f868a48dSAkira Fujita *err = err2; 929f868a48dSAkira Fujita 930f868a48dSAkira Fujita return replaced_count; 931748de673SAkira Fujita } 932748de673SAkira Fujita 933748de673SAkira Fujita /** 934c437b273SAkira Fujita * mext_check_arguments - Check whether move extent can be done 935748de673SAkira Fujita * 936748de673SAkira Fujita * @orig_inode: original inode 937748de673SAkira Fujita * @donor_inode: donor inode 938748de673SAkira Fujita * @orig_start: logical start offset in block for orig 939748de673SAkira Fujita * @donor_start: logical start offset in block for donor 940748de673SAkira Fujita * @len: the number of blocks to be moved 941748de673SAkira Fujita * 942748de673SAkira Fujita * Check the arguments of ext4_move_extents() whether the files can be 943748de673SAkira Fujita * exchanged with each other. 944748de673SAkira Fujita * Return 0 on success, or a negative error value on failure. 
945748de673SAkira Fujita */ 946748de673SAkira Fujita static int 947748de673SAkira Fujita mext_check_arguments(struct inode *orig_inode, 948748de673SAkira Fujita struct inode *donor_inode, __u64 orig_start, 949446aaa6eSKazuya Mio __u64 donor_start, __u64 *len) 950748de673SAkira Fujita { 95170d5d3dcSAkira Fujita ext4_lblk_t orig_blocks, donor_blocks; 95270d5d3dcSAkira Fujita unsigned int blkbits = orig_inode->i_blkbits; 95370d5d3dcSAkira Fujita unsigned int blocksize = 1 << blkbits; 95470d5d3dcSAkira Fujita 9554a58579bSAkira Fujita if (donor_inode->i_mode & (S_ISUID|S_ISGID)) { 9564a58579bSAkira Fujita ext4_debug("ext4 move extent: suid or sgid is set" 9574a58579bSAkira Fujita " to donor file [ino:orig %lu, donor %lu]\n", 9584a58579bSAkira Fujita orig_inode->i_ino, donor_inode->i_ino); 9594a58579bSAkira Fujita return -EINVAL; 9604a58579bSAkira Fujita } 9614a58579bSAkira Fujita 9621f5a81e4STheodore Ts'o if (IS_IMMUTABLE(donor_inode) || IS_APPEND(donor_inode)) 9631f5a81e4STheodore Ts'o return -EPERM; 9641f5a81e4STheodore Ts'o 965748de673SAkira Fujita /* Ext4 move extent does not support swapfile */ 966748de673SAkira Fujita if (IS_SWAPFILE(orig_inode) || IS_SWAPFILE(donor_inode)) { 967748de673SAkira Fujita ext4_debug("ext4 move extent: The argument files should " 968748de673SAkira Fujita "not be swapfile [ino:orig %lu, donor %lu]\n", 969748de673SAkira Fujita orig_inode->i_ino, donor_inode->i_ino); 970748de673SAkira Fujita return -EINVAL; 971748de673SAkira Fujita } 972748de673SAkira Fujita 973748de673SAkira Fujita /* Files should be in the same ext4 FS */ 974748de673SAkira Fujita if (orig_inode->i_sb != donor_inode->i_sb) { 975748de673SAkira Fujita ext4_debug("ext4 move extent: The argument files " 976748de673SAkira Fujita "should be in same FS [ino:orig %lu, donor %lu]\n", 977748de673SAkira Fujita orig_inode->i_ino, donor_inode->i_ino); 978748de673SAkira Fujita return -EINVAL; 979748de673SAkira Fujita } 980748de673SAkira Fujita 981748de673SAkira Fujita /* Ext4 move 
extent supports only extent based file */ 98212e9b892SDmitry Monakhov if (!(ext4_test_inode_flag(orig_inode, EXT4_INODE_EXTENTS))) { 983748de673SAkira Fujita ext4_debug("ext4 move extent: orig file is not extents " 984748de673SAkira Fujita "based file [ino:orig %lu]\n", orig_inode->i_ino); 985748de673SAkira Fujita return -EOPNOTSUPP; 98612e9b892SDmitry Monakhov } else if (!(ext4_test_inode_flag(donor_inode, EXT4_INODE_EXTENTS))) { 987748de673SAkira Fujita ext4_debug("ext4 move extent: donor file is not extents " 988748de673SAkira Fujita "based file [ino:donor %lu]\n", donor_inode->i_ino); 989748de673SAkira Fujita return -EOPNOTSUPP; 990748de673SAkira Fujita } 991748de673SAkira Fujita 992748de673SAkira Fujita if ((!orig_inode->i_size) || (!donor_inode->i_size)) { 993748de673SAkira Fujita ext4_debug("ext4 move extent: File size is 0 byte\n"); 994748de673SAkira Fujita return -EINVAL; 995748de673SAkira Fujita } 996748de673SAkira Fujita 997748de673SAkira Fujita /* Start offset should be same */ 998748de673SAkira Fujita if (orig_start != donor_start) { 999748de673SAkira Fujita ext4_debug("ext4 move extent: orig and donor's start " 1000748de673SAkira Fujita "offset are not same [ino:orig %lu, donor %lu]\n", 1001748de673SAkira Fujita orig_inode->i_ino, donor_inode->i_ino); 1002748de673SAkira Fujita return -EINVAL; 1003748de673SAkira Fujita } 1004748de673SAkira Fujita 1005f17722f9SLukas Czerner if ((orig_start >= EXT_MAX_BLOCKS) || 1006f17722f9SLukas Czerner (donor_start >= EXT_MAX_BLOCKS) || 1007f17722f9SLukas Czerner (*len > EXT_MAX_BLOCKS) || 1008f17722f9SLukas Czerner (orig_start + *len >= EXT_MAX_BLOCKS)) { 10090a80e986SEric Sandeen ext4_debug("ext4 move extent: Can't handle over [%u] blocks " 1010f17722f9SLukas Czerner "[ino:orig %lu, donor %lu]\n", EXT_MAX_BLOCKS, 1011748de673SAkira Fujita orig_inode->i_ino, donor_inode->i_ino); 1012748de673SAkira Fujita return -EINVAL; 1013748de673SAkira Fujita } 1014748de673SAkira Fujita 1015748de673SAkira Fujita if 
(orig_inode->i_size > donor_inode->i_size) { 101670d5d3dcSAkira Fujita donor_blocks = (donor_inode->i_size + blocksize - 1) >> blkbits; 101770d5d3dcSAkira Fujita /* TODO: eliminate this artificial restriction */ 101870d5d3dcSAkira Fujita if (orig_start >= donor_blocks) { 1019748de673SAkira Fujita ext4_debug("ext4 move extent: orig start offset " 102070d5d3dcSAkira Fujita "[%llu] should be less than donor file blocks " 102170d5d3dcSAkira Fujita "[%u] [ino:orig %lu, donor %lu]\n", 102270d5d3dcSAkira Fujita orig_start, donor_blocks, 1023748de673SAkira Fujita orig_inode->i_ino, donor_inode->i_ino); 1024748de673SAkira Fujita return -EINVAL; 1025748de673SAkira Fujita } 1026748de673SAkira Fujita 102770d5d3dcSAkira Fujita /* TODO: eliminate this artificial restriction */ 102870d5d3dcSAkira Fujita if (orig_start + *len > donor_blocks) { 1029748de673SAkira Fujita ext4_debug("ext4 move extent: End offset [%llu] should " 103070d5d3dcSAkira Fujita "be less than donor file blocks [%u]." 103170d5d3dcSAkira Fujita "So adjust length from %llu to %llu " 1032748de673SAkira Fujita "[ino:orig %lu, donor %lu]\n", 103370d5d3dcSAkira Fujita orig_start + *len, donor_blocks, 103470d5d3dcSAkira Fujita *len, donor_blocks - orig_start, 1035748de673SAkira Fujita orig_inode->i_ino, donor_inode->i_ino); 103670d5d3dcSAkira Fujita *len = donor_blocks - orig_start; 1037748de673SAkira Fujita } 1038748de673SAkira Fujita } else { 103970d5d3dcSAkira Fujita orig_blocks = (orig_inode->i_size + blocksize - 1) >> blkbits; 104070d5d3dcSAkira Fujita if (orig_start >= orig_blocks) { 1041748de673SAkira Fujita ext4_debug("ext4 move extent: start offset [%llu] " 104270d5d3dcSAkira Fujita "should be less than original file blocks " 104370d5d3dcSAkira Fujita "[%u] [ino:orig %lu, donor %lu]\n", 104470d5d3dcSAkira Fujita orig_start, orig_blocks, 1045748de673SAkira Fujita orig_inode->i_ino, donor_inode->i_ino); 1046748de673SAkira Fujita return -EINVAL; 1047748de673SAkira Fujita } 1048748de673SAkira Fujita 
104970d5d3dcSAkira Fujita if (orig_start + *len > orig_blocks) { 1050748de673SAkira Fujita ext4_debug("ext4 move extent: Adjust length " 105170d5d3dcSAkira Fujita "from %llu to %llu. Because it should be " 105270d5d3dcSAkira Fujita "less than original file blocks " 1053748de673SAkira Fujita "[ino:orig %lu, donor %lu]\n", 105470d5d3dcSAkira Fujita *len, orig_blocks - orig_start, 1055748de673SAkira Fujita orig_inode->i_ino, donor_inode->i_ino); 105670d5d3dcSAkira Fujita *len = orig_blocks - orig_start; 1057748de673SAkira Fujita } 1058748de673SAkira Fujita } 1059748de673SAkira Fujita 1060748de673SAkira Fujita if (!*len) { 106192c28159SAkira Fujita ext4_debug("ext4 move extent: len should not be 0 " 1062748de673SAkira Fujita "[ino:orig %lu, donor %lu]\n", orig_inode->i_ino, 1063748de673SAkira Fujita donor_inode->i_ino); 1064748de673SAkira Fujita return -EINVAL; 1065748de673SAkira Fujita } 1066748de673SAkira Fujita 1067748de673SAkira Fujita return 0; 1068748de673SAkira Fujita } 1069748de673SAkira Fujita 1070748de673SAkira Fujita /** 1071748de673SAkira Fujita * mext_inode_double_lock - Lock i_mutex on both @inode1 and @inode2 1072748de673SAkira Fujita * 1073748de673SAkira Fujita * @inode1: the inode structure 1074748de673SAkira Fujita * @inode2: the inode structure 1075748de673SAkira Fujita * 10762147b1a6SAkira Fujita * Lock two inodes' i_mutex by i_ino order. 10772147b1a6SAkira Fujita * If inode1 or inode2 is NULL, return -EIO. Otherwise, return 0. 
1078748de673SAkira Fujita */ 10792147b1a6SAkira Fujita static int 1080748de673SAkira Fujita mext_inode_double_lock(struct inode *inode1, struct inode *inode2) 1081748de673SAkira Fujita { 10822147b1a6SAkira Fujita int ret = 0; 10832147b1a6SAkira Fujita 10842147b1a6SAkira Fujita BUG_ON(inode1 == NULL && inode2 == NULL); 10852147b1a6SAkira Fujita 1086c398eda0STheodore Ts'o ret = mext_check_null_inode(inode1, inode2, __func__, __LINE__); 10872147b1a6SAkira Fujita if (ret < 0) 10882147b1a6SAkira Fujita goto out; 10892147b1a6SAkira Fujita 10902147b1a6SAkira Fujita if (inode1 == inode2) { 1091748de673SAkira Fujita mutex_lock(&inode1->i_mutex); 10922147b1a6SAkira Fujita goto out; 1093748de673SAkira Fujita } 1094748de673SAkira Fujita 1095748de673SAkira Fujita if (inode1->i_ino < inode2->i_ino) { 1096748de673SAkira Fujita mutex_lock_nested(&inode1->i_mutex, I_MUTEX_PARENT); 1097748de673SAkira Fujita mutex_lock_nested(&inode2->i_mutex, I_MUTEX_CHILD); 1098748de673SAkira Fujita } else { 1099748de673SAkira Fujita mutex_lock_nested(&inode2->i_mutex, I_MUTEX_PARENT); 1100748de673SAkira Fujita mutex_lock_nested(&inode1->i_mutex, I_MUTEX_CHILD); 1101748de673SAkira Fujita } 11022147b1a6SAkira Fujita 11032147b1a6SAkira Fujita out: 11042147b1a6SAkira Fujita return ret; 1105748de673SAkira Fujita } 1106748de673SAkira Fujita 1107748de673SAkira Fujita /** 1108748de673SAkira Fujita * mext_inode_double_unlock - Release i_mutex on both @inode1 and @inode2 1109748de673SAkira Fujita * 1110748de673SAkira Fujita * @inode1: the inode that is released first 1111748de673SAkira Fujita * @inode2: the inode that is released second 1112748de673SAkira Fujita * 11132147b1a6SAkira Fujita * If inode1 or inode2 is NULL, return -EIO. Otherwise, return 0. 
1114748de673SAkira Fujita */ 1115748de673SAkira Fujita 11162147b1a6SAkira Fujita static int 1117748de673SAkira Fujita mext_inode_double_unlock(struct inode *inode1, struct inode *inode2) 1118748de673SAkira Fujita { 11192147b1a6SAkira Fujita int ret = 0; 11202147b1a6SAkira Fujita 11212147b1a6SAkira Fujita BUG_ON(inode1 == NULL && inode2 == NULL); 11222147b1a6SAkira Fujita 1123c398eda0STheodore Ts'o ret = mext_check_null_inode(inode1, inode2, __func__, __LINE__); 11242147b1a6SAkira Fujita if (ret < 0) 11252147b1a6SAkira Fujita goto out; 11262147b1a6SAkira Fujita 1127748de673SAkira Fujita if (inode1) 1128748de673SAkira Fujita mutex_unlock(&inode1->i_mutex); 1129748de673SAkira Fujita 1130748de673SAkira Fujita if (inode2 && inode2 != inode1) 1131748de673SAkira Fujita mutex_unlock(&inode2->i_mutex); 11322147b1a6SAkira Fujita 11332147b1a6SAkira Fujita out: 11342147b1a6SAkira Fujita return ret; 1135748de673SAkira Fujita } 1136748de673SAkira Fujita 1137748de673SAkira Fujita /** 1138748de673SAkira Fujita * ext4_move_extents - Exchange the specified range of a file 1139748de673SAkira Fujita * 1140748de673SAkira Fujita * @o_filp: file structure of the original file 1141748de673SAkira Fujita * @d_filp: file structure of the donor file 1142748de673SAkira Fujita * @orig_start: start offset in block for orig 1143748de673SAkira Fujita * @donor_start: start offset in block for donor 1144748de673SAkira Fujita * @len: the number of blocks to be moved 1145748de673SAkira Fujita * @moved_len: moved block length 1146748de673SAkira Fujita * 1147748de673SAkira Fujita * This function returns 0 and moved block length is set in moved_len 1148748de673SAkira Fujita * if succeed, otherwise returns error value. 1149748de673SAkira Fujita * 1150748de673SAkira Fujita * Note: ext4_move_extents() proceeds the following order. 
 * 1: ext4_move_extents() calculates the last block number of the range to
 *    be moved from the start block number (orig_start) and the number of
 *    blocks to be moved (len) specified as arguments.
 *    If {orig, donor}_start points into a hole, the start offset of the
 *    extent pointed to by ext_cur (current extent), holecheck_path and
 *    orig_path is set to the first extent after the hole.
 * 2: Repeat steps 3 to 5 until holecheck_path points to the last extent
 *    or ext_cur exceeds block_end, which is the last logical block number.
 * 3: To get the length of the contiguous area, call mext_next_extent()
 *    repeatedly with ext_cur (initial value is holecheck_path) until a
 *    non-contiguous extent is found, the start logical block number
 *    exceeds block_end, or the extent is the last extent.
 * 4: Exchange the original inode data with the donor inode data
 *    from orig_page_offset to seq_end_page.
 *    The start indexes of the data are specified as arguments.
 *    That of the original inode is orig_page_offset,
 *    and that of the donor inode is also orig_page_offset
 *    (to easily handle the blocksize != pagesize case, the offset for the
 *    donor inode is in block units).
 * 5: Update holecheck_path and orig_path to point to the next extent to be
 *    processed, then return to step 2.
 * 6: Release holecheck_path and orig_path, and set moved_len to the number
 *    of blocks that were moved.
1174748de673SAkira Fujita * The moved_len is useful for the command to calculate the file offset 1175748de673SAkira Fujita * for starting next move extent ioctl. 1176748de673SAkira Fujita * 7:Return 0 on success, or a negative error value on failure. 1177748de673SAkira Fujita */ 1178748de673SAkira Fujita int 1179748de673SAkira Fujita ext4_move_extents(struct file *o_filp, struct file *d_filp, 1180748de673SAkira Fujita __u64 orig_start, __u64 donor_start, __u64 len, 1181748de673SAkira Fujita __u64 *moved_len) 1182748de673SAkira Fujita { 1183748de673SAkira Fujita struct inode *orig_inode = o_filp->f_dentry->d_inode; 1184748de673SAkira Fujita struct inode *donor_inode = d_filp->f_dentry->d_inode; 1185748de673SAkira Fujita struct ext4_ext_path *orig_path = NULL, *holecheck_path = NULL; 1186748de673SAkira Fujita struct ext4_extent *ext_prev, *ext_cur, *ext_dummy; 1187748de673SAkira Fujita ext4_lblk_t block_start = orig_start; 1188748de673SAkira Fujita ext4_lblk_t block_end, seq_start, add_blocks, file_end, seq_blocks = 0; 1189748de673SAkira Fujita ext4_lblk_t rest_blocks; 1190748de673SAkira Fujita pgoff_t orig_page_offset = 0, seq_end_page; 11912147b1a6SAkira Fujita int ret1, ret2, depth, last_extent = 0; 1192748de673SAkira Fujita int blocks_per_page = PAGE_CACHE_SIZE >> orig_inode->i_blkbits; 1193748de673SAkira Fujita int data_offset_in_page; 1194748de673SAkira Fujita int block_len_in_page; 1195748de673SAkira Fujita int uninit; 1196748de673SAkira Fujita 1197f3ce8064STheodore Ts'o /* orig and donor should be different file */ 1198f3ce8064STheodore Ts'o if (orig_inode->i_ino == donor_inode->i_ino) { 1199f3ce8064STheodore Ts'o ext4_debug("ext4 move extent: The argument files should not " 1200f3ce8064STheodore Ts'o "be same file [ino:orig %lu, donor %lu]\n", 1201f3ce8064STheodore Ts'o orig_inode->i_ino, donor_inode->i_ino); 1202f3ce8064STheodore Ts'o return -EINVAL; 1203f3ce8064STheodore Ts'o } 1204f3ce8064STheodore Ts'o 12057247c0caSAkira Fujita /* Regular file check */ 
12067247c0caSAkira Fujita if (!S_ISREG(orig_inode->i_mode) || !S_ISREG(donor_inode->i_mode)) { 12077247c0caSAkira Fujita ext4_debug("ext4 move extent: The argument files should be " 12087247c0caSAkira Fujita "regular file [ino:orig %lu, donor %lu]\n", 12097247c0caSAkira Fujita orig_inode->i_ino, donor_inode->i_ino); 12107247c0caSAkira Fujita return -EINVAL; 12117247c0caSAkira Fujita } 12127247c0caSAkira Fujita 1213fc04cb49SAkira Fujita /* Protect orig and donor inodes against a truncate */ 12142147b1a6SAkira Fujita ret1 = mext_inode_double_lock(orig_inode, donor_inode); 12152147b1a6SAkira Fujita if (ret1 < 0) 12162147b1a6SAkira Fujita return ret1; 1217748de673SAkira Fujita 1218fc04cb49SAkira Fujita /* Protect extent tree against block allocations via delalloc */ 1219fc04cb49SAkira Fujita double_down_write_data_sem(orig_inode, donor_inode); 1220748de673SAkira Fujita /* Check the filesystem environment whether move_extent can be done */ 12212147b1a6SAkira Fujita ret1 = mext_check_arguments(orig_inode, donor_inode, orig_start, 1222446aaa6eSKazuya Mio donor_start, &len); 12232147b1a6SAkira Fujita if (ret1) 1224347fa6f1SAkira Fujita goto out; 1225748de673SAkira Fujita 1226748de673SAkira Fujita file_end = (i_size_read(orig_inode) - 1) >> orig_inode->i_blkbits; 1227748de673SAkira Fujita block_end = block_start + len - 1; 1228748de673SAkira Fujita if (file_end < block_end) 1229748de673SAkira Fujita len -= block_end - file_end; 1230748de673SAkira Fujita 12312147b1a6SAkira Fujita ret1 = get_ext_path(orig_inode, block_start, &orig_path); 1232347fa6f1SAkira Fujita if (ret1) 1233347fa6f1SAkira Fujita goto out; 1234748de673SAkira Fujita 1235748de673SAkira Fujita /* Get path structure to check the hole */ 12362147b1a6SAkira Fujita ret1 = get_ext_path(orig_inode, block_start, &holecheck_path); 1237347fa6f1SAkira Fujita if (ret1) 1238748de673SAkira Fujita goto out; 1239748de673SAkira Fujita 1240748de673SAkira Fujita depth = ext_depth(orig_inode); 1241748de673SAkira Fujita ext_cur = 
holecheck_path[depth].p_ext; 1242748de673SAkira Fujita 1243748de673SAkira Fujita /* 1244c40ce3c9SAkira Fujita * Get proper starting location of block replacement if block_start was 1245c40ce3c9SAkira Fujita * within the hole. 1246748de673SAkira Fujita */ 1247748de673SAkira Fujita if (le32_to_cpu(ext_cur->ee_block) + 1248748de673SAkira Fujita ext4_ext_get_actual_len(ext_cur) - 1 < block_start) { 1249c40ce3c9SAkira Fujita /* 1250c40ce3c9SAkira Fujita * The hole exists between extents or the tail of 1251c40ce3c9SAkira Fujita * original file. 1252c40ce3c9SAkira Fujita */ 1253748de673SAkira Fujita last_extent = mext_next_extent(orig_inode, 1254748de673SAkira Fujita holecheck_path, &ext_cur); 1255748de673SAkira Fujita if (last_extent < 0) { 12562147b1a6SAkira Fujita ret1 = last_extent; 1257748de673SAkira Fujita goto out; 1258748de673SAkira Fujita } 1259748de673SAkira Fujita last_extent = mext_next_extent(orig_inode, orig_path, 1260748de673SAkira Fujita &ext_dummy); 1261748de673SAkira Fujita if (last_extent < 0) { 12622147b1a6SAkira Fujita ret1 = last_extent; 1263748de673SAkira Fujita goto out; 1264748de673SAkira Fujita } 1265c40ce3c9SAkira Fujita seq_start = le32_to_cpu(ext_cur->ee_block); 1266c40ce3c9SAkira Fujita } else if (le32_to_cpu(ext_cur->ee_block) > block_start) 1267c40ce3c9SAkira Fujita /* The hole exists at the beginning of original file. */ 1268c40ce3c9SAkira Fujita seq_start = le32_to_cpu(ext_cur->ee_block); 1269c40ce3c9SAkira Fujita else 1270748de673SAkira Fujita seq_start = block_start; 1271748de673SAkira Fujita 1272748de673SAkira Fujita /* No blocks within the specified range. 
*/ 1273748de673SAkira Fujita if (le32_to_cpu(ext_cur->ee_block) > block_end) { 1274748de673SAkira Fujita ext4_debug("ext4 move extent: The specified range of file " 1275748de673SAkira Fujita "may be the hole\n"); 12762147b1a6SAkira Fujita ret1 = -EINVAL; 1277748de673SAkira Fujita goto out; 1278748de673SAkira Fujita } 1279748de673SAkira Fujita 1280748de673SAkira Fujita /* Adjust start blocks */ 1281748de673SAkira Fujita add_blocks = min(le32_to_cpu(ext_cur->ee_block) + 1282748de673SAkira Fujita ext4_ext_get_actual_len(ext_cur), block_end + 1) - 1283748de673SAkira Fujita max(le32_to_cpu(ext_cur->ee_block), block_start); 1284748de673SAkira Fujita 1285748de673SAkira Fujita while (!last_extent && le32_to_cpu(ext_cur->ee_block) <= block_end) { 1286748de673SAkira Fujita seq_blocks += add_blocks; 1287748de673SAkira Fujita 1288748de673SAkira Fujita /* Adjust tail blocks */ 1289748de673SAkira Fujita if (seq_start + seq_blocks - 1 > block_end) 1290748de673SAkira Fujita seq_blocks = block_end - seq_start + 1; 1291748de673SAkira Fujita 1292748de673SAkira Fujita ext_prev = ext_cur; 1293748de673SAkira Fujita last_extent = mext_next_extent(orig_inode, holecheck_path, 1294748de673SAkira Fujita &ext_cur); 1295748de673SAkira Fujita if (last_extent < 0) { 12962147b1a6SAkira Fujita ret1 = last_extent; 1297748de673SAkira Fujita break; 1298748de673SAkira Fujita } 1299748de673SAkira Fujita add_blocks = ext4_ext_get_actual_len(ext_cur); 1300748de673SAkira Fujita 1301748de673SAkira Fujita /* 1302748de673SAkira Fujita * Extend the length of contiguous block (seq_blocks) 1303748de673SAkira Fujita * if extents are contiguous. 
1304748de673SAkira Fujita */ 1305748de673SAkira Fujita if (ext4_can_extents_be_merged(orig_inode, 1306748de673SAkira Fujita ext_prev, ext_cur) && 1307748de673SAkira Fujita block_end >= le32_to_cpu(ext_cur->ee_block) && 1308748de673SAkira Fujita !last_extent) 1309748de673SAkira Fujita continue; 1310748de673SAkira Fujita 1311748de673SAkira Fujita /* Is original extent is uninitialized */ 1312748de673SAkira Fujita uninit = ext4_ext_is_uninitialized(ext_prev); 1313748de673SAkira Fujita 1314748de673SAkira Fujita data_offset_in_page = seq_start % blocks_per_page; 1315748de673SAkira Fujita 1316748de673SAkira Fujita /* 1317748de673SAkira Fujita * Calculate data blocks count that should be swapped 1318748de673SAkira Fujita * at the first page. 1319748de673SAkira Fujita */ 1320748de673SAkira Fujita if (data_offset_in_page + seq_blocks > blocks_per_page) { 1321748de673SAkira Fujita /* Swapped blocks are across pages */ 1322748de673SAkira Fujita block_len_in_page = 1323748de673SAkira Fujita blocks_per_page - data_offset_in_page; 1324748de673SAkira Fujita } else { 1325748de673SAkira Fujita /* Swapped blocks are in a page */ 1326748de673SAkira Fujita block_len_in_page = seq_blocks; 1327748de673SAkira Fujita } 1328748de673SAkira Fujita 1329748de673SAkira Fujita orig_page_offset = seq_start >> 1330748de673SAkira Fujita (PAGE_CACHE_SHIFT - orig_inode->i_blkbits); 1331748de673SAkira Fujita seq_end_page = (seq_start + seq_blocks - 1) >> 1332748de673SAkira Fujita (PAGE_CACHE_SHIFT - orig_inode->i_blkbits); 1333748de673SAkira Fujita seq_start = le32_to_cpu(ext_cur->ee_block); 1334748de673SAkira Fujita rest_blocks = seq_blocks; 1335748de673SAkira Fujita 1336fc04cb49SAkira Fujita /* 1337fc04cb49SAkira Fujita * Up semaphore to avoid following problems: 1338fc04cb49SAkira Fujita * a. transaction deadlock among ext4_journal_start, 1339fc04cb49SAkira Fujita * ->write_begin via pagefault, and jbd2_journal_commit 1340fc04cb49SAkira Fujita * b. 
racing with ->readpage, ->write_begin, and ext4_get_block 1341fc04cb49SAkira Fujita * in move_extent_per_page 1342fc04cb49SAkira Fujita */ 1343fc04cb49SAkira Fujita double_up_write_data_sem(orig_inode, donor_inode); 1344748de673SAkira Fujita 1345748de673SAkira Fujita while (orig_page_offset <= seq_end_page) { 1346748de673SAkira Fujita 1347748de673SAkira Fujita /* Swap original branches with new branches */ 1348f868a48dSAkira Fujita block_len_in_page = move_extent_per_page( 1349f868a48dSAkira Fujita o_filp, donor_inode, 1350748de673SAkira Fujita orig_page_offset, 1351748de673SAkira Fujita data_offset_in_page, 1352f868a48dSAkira Fujita block_len_in_page, uninit, 1353f868a48dSAkira Fujita &ret1); 1354f868a48dSAkira Fujita 1355748de673SAkira Fujita /* Count how many blocks we have exchanged */ 1356748de673SAkira Fujita *moved_len += block_len_in_page; 1357f868a48dSAkira Fujita if (ret1 < 0) 1358fc04cb49SAkira Fujita break; 13592147b1a6SAkira Fujita if (*moved_len > len) { 136024676da4STheodore Ts'o EXT4_ERROR_INODE(orig_inode, 13612147b1a6SAkira Fujita "We replaced blocks too much! 
" 13622147b1a6SAkira Fujita "sum of replaced: %llu requested: %llu", 13632147b1a6SAkira Fujita *moved_len, len); 13642147b1a6SAkira Fujita ret1 = -EIO; 1365fc04cb49SAkira Fujita break; 13662147b1a6SAkira Fujita } 1367748de673SAkira Fujita 1368f868a48dSAkira Fujita orig_page_offset++; 1369748de673SAkira Fujita data_offset_in_page = 0; 1370748de673SAkira Fujita rest_blocks -= block_len_in_page; 1371748de673SAkira Fujita if (rest_blocks > blocks_per_page) 1372748de673SAkira Fujita block_len_in_page = blocks_per_page; 1373748de673SAkira Fujita else 1374748de673SAkira Fujita block_len_in_page = rest_blocks; 1375748de673SAkira Fujita } 1376748de673SAkira Fujita 1377fc04cb49SAkira Fujita double_down_write_data_sem(orig_inode, donor_inode); 1378fc04cb49SAkira Fujita if (ret1 < 0) 1379fc04cb49SAkira Fujita break; 1380fc04cb49SAkira Fujita 1381748de673SAkira Fujita /* Decrease buffer counter */ 1382748de673SAkira Fujita if (holecheck_path) 1383748de673SAkira Fujita ext4_ext_drop_refs(holecheck_path); 13842147b1a6SAkira Fujita ret1 = get_ext_path(orig_inode, seq_start, &holecheck_path); 1385347fa6f1SAkira Fujita if (ret1) 1386748de673SAkira Fujita break; 1387748de673SAkira Fujita depth = holecheck_path->p_depth; 1388748de673SAkira Fujita 1389748de673SAkira Fujita /* Decrease buffer counter */ 1390748de673SAkira Fujita if (orig_path) 1391748de673SAkira Fujita ext4_ext_drop_refs(orig_path); 13922147b1a6SAkira Fujita ret1 = get_ext_path(orig_inode, seq_start, &orig_path); 1393347fa6f1SAkira Fujita if (ret1) 1394748de673SAkira Fujita break; 1395748de673SAkira Fujita 1396748de673SAkira Fujita ext_cur = holecheck_path[depth].p_ext; 1397748de673SAkira Fujita add_blocks = ext4_ext_get_actual_len(ext_cur); 1398748de673SAkira Fujita seq_blocks = 0; 1399748de673SAkira Fujita 1400748de673SAkira Fujita } 1401748de673SAkira Fujita out: 140294d7c16cSAkira Fujita if (*moved_len) { 140394d7c16cSAkira Fujita ext4_discard_preallocations(orig_inode); 140494d7c16cSAkira Fujita 
ext4_discard_preallocations(donor_inode); 140594d7c16cSAkira Fujita } 140694d7c16cSAkira Fujita 1407748de673SAkira Fujita if (orig_path) { 1408748de673SAkira Fujita ext4_ext_drop_refs(orig_path); 1409748de673SAkira Fujita kfree(orig_path); 1410748de673SAkira Fujita } 1411748de673SAkira Fujita if (holecheck_path) { 1412748de673SAkira Fujita ext4_ext_drop_refs(holecheck_path); 1413748de673SAkira Fujita kfree(holecheck_path); 1414748de673SAkira Fujita } 1415fc04cb49SAkira Fujita double_up_write_data_sem(orig_inode, donor_inode); 14162147b1a6SAkira Fujita ret2 = mext_inode_double_unlock(orig_inode, donor_inode); 1417748de673SAkira Fujita 14182147b1a6SAkira Fujita if (ret1) 14192147b1a6SAkira Fujita return ret1; 14202147b1a6SAkira Fujita else if (ret2) 14212147b1a6SAkira Fujita return ret2; 1422748de673SAkira Fujita 1423748de673SAkira Fujita return 0; 1424748de673SAkira Fujita } 1425