1f46b5a66SChristoph Hellwig /* 2f46b5a66SChristoph Hellwig * Copyright (C) 2007 Oracle. All rights reserved. 3f46b5a66SChristoph Hellwig * 4f46b5a66SChristoph Hellwig * This program is free software; you can redistribute it and/or 5f46b5a66SChristoph Hellwig * modify it under the terms of the GNU General Public 6f46b5a66SChristoph Hellwig * License v2 as published by the Free Software Foundation. 7f46b5a66SChristoph Hellwig * 8f46b5a66SChristoph Hellwig * This program is distributed in the hope that it will be useful, 9f46b5a66SChristoph Hellwig * but WITHOUT ANY WARRANTY; without even the implied warranty of 10f46b5a66SChristoph Hellwig * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 11f46b5a66SChristoph Hellwig * General Public License for more details. 12f46b5a66SChristoph Hellwig * 13f46b5a66SChristoph Hellwig * You should have received a copy of the GNU General Public 14f46b5a66SChristoph Hellwig * License along with this program; if not, write to the 15f46b5a66SChristoph Hellwig * Free Software Foundation, Inc., 59 Temple Place - Suite 330, 16f46b5a66SChristoph Hellwig * Boston, MA 021110-1307, USA. 17f46b5a66SChristoph Hellwig */ 18f46b5a66SChristoph Hellwig 19f46b5a66SChristoph Hellwig #include <linux/kernel.h> 20f46b5a66SChristoph Hellwig #include <linux/bio.h> 21f46b5a66SChristoph Hellwig #include <linux/buffer_head.h> 22f46b5a66SChristoph Hellwig #include <linux/file.h> 23f46b5a66SChristoph Hellwig #include <linux/fs.h> 24cb8e7090SChristoph Hellwig #include <linux/fsnotify.h> 25f46b5a66SChristoph Hellwig #include <linux/pagemap.h> 26f46b5a66SChristoph Hellwig #include <linux/highmem.h> 27f46b5a66SChristoph Hellwig #include <linux/time.h> 28f46b5a66SChristoph Hellwig #include <linux/init.h> 29f46b5a66SChristoph Hellwig #include <linux/string.h> 30f46b5a66SChristoph Hellwig #include <linux/smp_lock.h> 31f46b5a66SChristoph Hellwig #include <linux/backing-dev.h> 32cb8e7090SChristoph Hellwig #include <linux/mount.h> 33f46b5a66SChristoph Hellwig #include <linux/mpage.h> 34cb8e7090SChristoph Hellwig #include <linux/namei.h> 35f46b5a66SChristoph Hellwig #include <linux/swap.h> 36f46b5a66SChristoph Hellwig #include <linux/writeback.h> 37f46b5a66SChristoph Hellwig #include <linux/statfs.h> 38f46b5a66SChristoph Hellwig #include <linux/compat.h> 39f46b5a66SChristoph Hellwig #include <linux/bit_spinlock.h> 40cb8e7090SChristoph Hellwig #include <linux/security.h> 41f46b5a66SChristoph Hellwig #include <linux/version.h> 42f46b5a66SChristoph Hellwig #include <linux/xattr.h> 437ea394f1SYan Zheng #include <linux/vmalloc.h> 44f46b5a66SChristoph Hellwig #include "ctree.h" 45f46b5a66SChristoph Hellwig #include "disk-io.h" 46f46b5a66SChristoph Hellwig #include "transaction.h" 47f46b5a66SChristoph Hellwig #include "btrfs_inode.h" 48f46b5a66SChristoph Hellwig #include "ioctl.h" 49f46b5a66SChristoph Hellwig #include "print-tree.h" 50f46b5a66SChristoph Hellwig #include "volumes.h" 51925baeddSChris Mason #include "locking.h" 52f46b5a66SChristoph Hellwig 53f46b5a66SChristoph Hellwig 54f46b5a66SChristoph Hellwig 55cb8e7090SChristoph Hellwig static noinline int create_subvol(struct btrfs_root *root, 56cb8e7090SChristoph Hellwig struct dentry *dentry, 57cb8e7090SChristoph Hellwig char *name, int namelen) 58f46b5a66SChristoph Hellwig { 59f46b5a66SChristoph Hellwig struct btrfs_trans_handle *trans; 60f46b5a66SChristoph Hellwig struct btrfs_key key; 61f46b5a66SChristoph Hellwig struct btrfs_root_item root_item; 62f46b5a66SChristoph Hellwig struct btrfs_inode_item *inode_item; 63f46b5a66SChristoph Hellwig struct extent_buffer *leaf; 64f46b5a66SChristoph Hellwig struct btrfs_root *new_root = root; 65f46b5a66SChristoph Hellwig struct inode *dir; 66f46b5a66SChristoph Hellwig int ret; 67f46b5a66SChristoph Hellwig int err; 68f46b5a66SChristoph Hellwig u64 objectid; 69f46b5a66SChristoph Hellwig u64 new_dirid = BTRFS_FIRST_FREE_OBJECTID; 70f46b5a66SChristoph Hellwig unsigned long nr = 1; 71f46b5a66SChristoph Hellwig 72f46b5a66SChristoph Hellwig ret = btrfs_check_free_space(root, 1, 0); 73f46b5a66SChristoph Hellwig if (ret) 74f46b5a66SChristoph Hellwig goto fail_commit; 75f46b5a66SChristoph Hellwig 76f46b5a66SChristoph Hellwig trans = btrfs_start_transaction(root, 1); 77f46b5a66SChristoph Hellwig BUG_ON(!trans); 78f46b5a66SChristoph Hellwig 79f46b5a66SChristoph Hellwig ret = btrfs_find_free_objectid(trans, root->fs_info->tree_root, 80f46b5a66SChristoph Hellwig 0, &objectid); 81f46b5a66SChristoph Hellwig if (ret) 82f46b5a66SChristoph Hellwig goto fail; 83f46b5a66SChristoph Hellwig 8431840ae1SZheng Yan leaf = btrfs_alloc_free_block(trans, root, root->leafsize, 0, 8531840ae1SZheng Yan objectid, trans->transid, 0, 0, 0); 868e8a1e31SJosef Bacik if (IS_ERR(leaf)) { 878e8a1e31SJosef Bacik ret = PTR_ERR(leaf); 888e8a1e31SJosef Bacik goto fail; 898e8a1e31SJosef Bacik } 90f46b5a66SChristoph Hellwig 91f46b5a66SChristoph Hellwig btrfs_set_header_nritems(leaf, 0); 92f46b5a66SChristoph Hellwig btrfs_set_header_level(leaf, 0); 93f46b5a66SChristoph Hellwig btrfs_set_header_bytenr(leaf, leaf->start); 94f46b5a66SChristoph Hellwig btrfs_set_header_generation(leaf, trans->transid); 95f46b5a66SChristoph Hellwig btrfs_set_header_owner(leaf, objectid); 96f46b5a66SChristoph Hellwig 97f46b5a66SChristoph Hellwig write_extent_buffer(leaf, root->fs_info->fsid, 98f46b5a66SChristoph Hellwig (unsigned long)btrfs_header_fsid(leaf), 99f46b5a66SChristoph Hellwig BTRFS_FSID_SIZE); 100f46b5a66SChristoph Hellwig btrfs_mark_buffer_dirty(leaf); 101f46b5a66SChristoph Hellwig 102f46b5a66SChristoph Hellwig inode_item = &root_item.inode; 103f46b5a66SChristoph Hellwig memset(inode_item, 0, sizeof(*inode_item)); 104f46b5a66SChristoph Hellwig inode_item->generation = cpu_to_le64(1); 105f46b5a66SChristoph Hellwig inode_item->size = cpu_to_le64(3); 106f46b5a66SChristoph Hellwig inode_item->nlink = cpu_to_le32(1); 107a76a3cd4SYan Zheng inode_item->nbytes = cpu_to_le64(root->leafsize); 108f46b5a66SChristoph Hellwig inode_item->mode = cpu_to_le32(S_IFDIR | 0755); 109f46b5a66SChristoph Hellwig 110f46b5a66SChristoph Hellwig btrfs_set_root_bytenr(&root_item, leaf->start); 11184234f3aSYan Zheng btrfs_set_root_generation(&root_item, trans->transid); 112f46b5a66SChristoph Hellwig btrfs_set_root_level(&root_item, 0); 113f46b5a66SChristoph Hellwig btrfs_set_root_refs(&root_item, 1); 114f46b5a66SChristoph Hellwig btrfs_set_root_used(&root_item, 0); 11580ff3856SYan Zheng btrfs_set_root_last_snapshot(&root_item, 0); 116f46b5a66SChristoph Hellwig 117f46b5a66SChristoph Hellwig memset(&root_item.drop_progress, 0, sizeof(root_item.drop_progress)); 118f46b5a66SChristoph Hellwig root_item.drop_level = 0; 119f46b5a66SChristoph Hellwig 120925baeddSChris Mason btrfs_tree_unlock(leaf); 121f46b5a66SChristoph Hellwig free_extent_buffer(leaf); 122f46b5a66SChristoph Hellwig leaf = NULL; 123f46b5a66SChristoph Hellwig 124f46b5a66SChristoph Hellwig btrfs_set_root_dirid(&root_item, new_dirid); 125f46b5a66SChristoph Hellwig 126f46b5a66SChristoph Hellwig key.objectid = objectid; 127f46b5a66SChristoph Hellwig key.offset = 1; 128f46b5a66SChristoph Hellwig btrfs_set_key_type(&key, BTRFS_ROOT_ITEM_KEY); 129f46b5a66SChristoph Hellwig ret = btrfs_insert_root(trans, root->fs_info->tree_root, &key, 130f46b5a66SChristoph Hellwig &root_item); 131f46b5a66SChristoph Hellwig if (ret) 132f46b5a66SChristoph Hellwig goto fail; 133f46b5a66SChristoph Hellwig 134f46b5a66SChristoph Hellwig /* 135f46b5a66SChristoph Hellwig * insert the directory item 136f46b5a66SChristoph Hellwig */ 137f46b5a66SChristoph Hellwig key.offset = (u64)-1; 138f46b5a66SChristoph Hellwig dir = root->fs_info->sb->s_root->d_inode; 139f46b5a66SChristoph Hellwig ret = btrfs_insert_dir_item(trans, root->fs_info->tree_root, 140f46b5a66SChristoph Hellwig name, namelen, dir->i_ino, &key, 141aec7477bSJosef Bacik BTRFS_FT_DIR, 0); 142f46b5a66SChristoph Hellwig if (ret) 143f46b5a66SChristoph Hellwig goto fail; 144f46b5a66SChristoph Hellwig 145f46b5a66SChristoph Hellwig ret = btrfs_insert_inode_ref(trans, root->fs_info->tree_root, 146f46b5a66SChristoph Hellwig name, namelen, objectid, 147aec7477bSJosef Bacik root->fs_info->sb->s_root->d_inode->i_ino, 0); 148f46b5a66SChristoph Hellwig if (ret) 149f46b5a66SChristoph Hellwig goto fail; 150f46b5a66SChristoph Hellwig 151f46b5a66SChristoph Hellwig ret = btrfs_commit_transaction(trans, root); 152f46b5a66SChristoph Hellwig if (ret) 153f46b5a66SChristoph Hellwig goto fail_commit; 154f46b5a66SChristoph Hellwig 155f46b5a66SChristoph Hellwig new_root = btrfs_read_fs_root(root->fs_info, &key, name, namelen); 156f46b5a66SChristoph Hellwig BUG_ON(!new_root); 157f46b5a66SChristoph Hellwig 158f46b5a66SChristoph Hellwig trans = btrfs_start_transaction(new_root, 1); 159f46b5a66SChristoph Hellwig BUG_ON(!trans); 160f46b5a66SChristoph Hellwig 161cb8e7090SChristoph Hellwig ret = btrfs_create_subvol_root(new_root, dentry, trans, new_dirid, 162f46b5a66SChristoph Hellwig BTRFS_I(dir)->block_group); 163f46b5a66SChristoph Hellwig if (ret) 164f46b5a66SChristoph Hellwig goto fail; 165f46b5a66SChristoph Hellwig 166f46b5a66SChristoph Hellwig fail: 167f46b5a66SChristoph Hellwig nr = trans->blocks_used; 168f46b5a66SChristoph Hellwig err = btrfs_commit_transaction(trans, new_root); 169f46b5a66SChristoph Hellwig if (err && !ret) 170f46b5a66SChristoph Hellwig ret = err; 171f46b5a66SChristoph Hellwig fail_commit: 172f46b5a66SChristoph Hellwig btrfs_btree_balance_dirty(root, nr); 173f46b5a66SChristoph Hellwig return ret; 174f46b5a66SChristoph Hellwig } 175f46b5a66SChristoph Hellwig 176f46b5a66SChristoph Hellwig static int create_snapshot(struct btrfs_root *root, char *name, int namelen) 177f46b5a66SChristoph Hellwig { 178f46b5a66SChristoph Hellwig struct btrfs_pending_snapshot *pending_snapshot; 179f46b5a66SChristoph Hellwig struct btrfs_trans_handle *trans; 180f46b5a66SChristoph Hellwig int ret; 181f46b5a66SChristoph Hellwig int err; 182f46b5a66SChristoph Hellwig unsigned long nr = 0; 183f46b5a66SChristoph Hellwig 184f46b5a66SChristoph Hellwig if (!root->ref_cows) 185f46b5a66SChristoph Hellwig return -EINVAL; 186f46b5a66SChristoph Hellwig 187f46b5a66SChristoph Hellwig ret = btrfs_check_free_space(root, 1, 0); 188f46b5a66SChristoph Hellwig if (ret) 189f46b5a66SChristoph Hellwig goto fail_unlock; 190f46b5a66SChristoph Hellwig 191f46b5a66SChristoph Hellwig pending_snapshot = kmalloc(sizeof(*pending_snapshot), GFP_NOFS); 192f46b5a66SChristoph Hellwig if (!pending_snapshot) { 193f46b5a66SChristoph Hellwig ret = -ENOMEM; 194f46b5a66SChristoph Hellwig goto fail_unlock; 195f46b5a66SChristoph Hellwig } 196f46b5a66SChristoph Hellwig pending_snapshot->name = kmalloc(namelen + 1, GFP_NOFS); 197f46b5a66SChristoph Hellwig if (!pending_snapshot->name) { 198f46b5a66SChristoph Hellwig ret = -ENOMEM; 199f46b5a66SChristoph Hellwig kfree(pending_snapshot); 200f46b5a66SChristoph Hellwig goto fail_unlock; 201f46b5a66SChristoph Hellwig } 202f46b5a66SChristoph Hellwig memcpy(pending_snapshot->name, name, namelen); 203f46b5a66SChristoph Hellwig pending_snapshot->name[namelen] = '\0'; 204f46b5a66SChristoph Hellwig trans = btrfs_start_transaction(root, 1); 205f46b5a66SChristoph Hellwig BUG_ON(!trans); 206f46b5a66SChristoph Hellwig pending_snapshot->root = root; 207f46b5a66SChristoph Hellwig list_add(&pending_snapshot->list, 208f46b5a66SChristoph Hellwig &trans->transaction->pending_snapshots); 209f46b5a66SChristoph Hellwig ret = btrfs_update_inode(trans, root, root->inode); 210f46b5a66SChristoph Hellwig err = btrfs_commit_transaction(trans, root); 211f46b5a66SChristoph Hellwig 212f46b5a66SChristoph Hellwig fail_unlock: 213f46b5a66SChristoph Hellwig btrfs_btree_balance_dirty(root, nr); 214f46b5a66SChristoph Hellwig return ret; 215f46b5a66SChristoph Hellwig } 216f46b5a66SChristoph Hellwig 217cb8e7090SChristoph Hellwig /* copy of may_create in fs/namei.c() */ 218cb8e7090SChristoph Hellwig static inline int btrfs_may_create(struct inode *dir, struct dentry *child) 219cb8e7090SChristoph Hellwig { 220cb8e7090SChristoph Hellwig if (child->d_inode) 221cb8e7090SChristoph Hellwig return -EEXIST; 222cb8e7090SChristoph Hellwig if (IS_DEADDIR(dir)) 223cb8e7090SChristoph Hellwig return -ENOENT; 224cb8e7090SChristoph Hellwig return inode_permission(dir, MAY_WRITE | MAY_EXEC); 225cb8e7090SChristoph Hellwig } 226cb8e7090SChristoph Hellwig 227cb8e7090SChristoph Hellwig /* 228cb8e7090SChristoph Hellwig * Create a new subvolume below @parent. This is largely modeled after 229cb8e7090SChristoph Hellwig * sys_mkdirat and vfs_mkdir, but we only do a single component lookup 230cb8e7090SChristoph Hellwig * inside this filesystem so it's quite a bit simpler. 231cb8e7090SChristoph Hellwig */ 232cb8e7090SChristoph Hellwig static noinline int btrfs_mksubvol(struct path *parent, char *name, 233cb8e7090SChristoph Hellwig int mode, int namelen) 234cb8e7090SChristoph Hellwig { 235cb8e7090SChristoph Hellwig struct dentry *dentry; 236cb8e7090SChristoph Hellwig int error; 237cb8e7090SChristoph Hellwig 238cb8e7090SChristoph Hellwig mutex_lock_nested(&parent->dentry->d_inode->i_mutex, I_MUTEX_PARENT); 239cb8e7090SChristoph Hellwig 240cb8e7090SChristoph Hellwig dentry = lookup_one_len(name, parent->dentry, namelen); 241cb8e7090SChristoph Hellwig error = PTR_ERR(dentry); 242cb8e7090SChristoph Hellwig if (IS_ERR(dentry)) 243cb8e7090SChristoph Hellwig goto out_unlock; 244cb8e7090SChristoph Hellwig 245cb8e7090SChristoph Hellwig error = -EEXIST; 246cb8e7090SChristoph Hellwig if (dentry->d_inode) 247cb8e7090SChristoph Hellwig goto out_dput; 248cb8e7090SChristoph Hellwig 249cb8e7090SChristoph Hellwig if (!IS_POSIXACL(parent->dentry->d_inode)) 250cb8e7090SChristoph Hellwig mode &= ~current->fs->umask; 251cb8e7090SChristoph Hellwig error = mnt_want_write(parent->mnt); 252cb8e7090SChristoph Hellwig if (error) 253cb8e7090SChristoph Hellwig goto out_dput; 254cb8e7090SChristoph Hellwig 255cb8e7090SChristoph Hellwig error = btrfs_may_create(parent->dentry->d_inode, dentry); 256cb8e7090SChristoph Hellwig if (error) 257cb8e7090SChristoph Hellwig goto out_drop_write; 258cb8e7090SChristoph Hellwig 259cb8e7090SChristoph Hellwig /* 260cb8e7090SChristoph Hellwig * Actually perform the low-level subvolume creation after all 261cb8e7090SChristoph Hellwig * this VFS fuzz. 262cb8e7090SChristoph Hellwig * 263cb8e7090SChristoph Hellwig * Eventually we want to pass in an inode under which we create this 264cb8e7090SChristoph Hellwig * subvolume, but for now all are under the filesystem root. 265cb8e7090SChristoph Hellwig * 266cb8e7090SChristoph Hellwig * Also we should pass on the mode eventually to allow creating new 267cb8e7090SChristoph Hellwig * subvolume with specific mode bits. 268cb8e7090SChristoph Hellwig */ 269cb8e7090SChristoph Hellwig error = create_subvol(BTRFS_I(parent->dentry->d_inode)->root, dentry, 270cb8e7090SChristoph Hellwig name, namelen); 271cb8e7090SChristoph Hellwig if (error) 272cb8e7090SChristoph Hellwig goto out_drop_write; 273cb8e7090SChristoph Hellwig 274cb8e7090SChristoph Hellwig fsnotify_mkdir(parent->dentry->d_inode, dentry); 275cb8e7090SChristoph Hellwig out_drop_write: 276cb8e7090SChristoph Hellwig mnt_drop_write(parent->mnt); 277cb8e7090SChristoph Hellwig out_dput: 278cb8e7090SChristoph Hellwig dput(dentry); 279cb8e7090SChristoph Hellwig out_unlock: 280cb8e7090SChristoph Hellwig mutex_unlock(&parent->dentry->d_inode->i_mutex); 281cb8e7090SChristoph Hellwig return error; 282cb8e7090SChristoph Hellwig } 283cb8e7090SChristoph Hellwig 284cb8e7090SChristoph Hellwig 285f46b5a66SChristoph Hellwig int btrfs_defrag_file(struct file *file) 286f46b5a66SChristoph Hellwig { 287f46b5a66SChristoph Hellwig struct inode *inode = fdentry(file)->d_inode; 288f46b5a66SChristoph Hellwig struct btrfs_root *root = BTRFS_I(inode)->root; 289f46b5a66SChristoph Hellwig struct extent_io_tree *io_tree = &BTRFS_I(inode)->io_tree; 2903eaa2885SChris Mason struct btrfs_ordered_extent *ordered; 291f46b5a66SChristoph Hellwig struct page *page; 292f46b5a66SChristoph Hellwig unsigned long last_index; 293f46b5a66SChristoph Hellwig unsigned long ra_pages = root->fs_info->bdi.ra_pages; 294f46b5a66SChristoph Hellwig unsigned long total_read = 0; 295f46b5a66SChristoph Hellwig u64 page_start; 296f46b5a66SChristoph Hellwig u64 page_end; 297f46b5a66SChristoph Hellwig unsigned long i; 298f46b5a66SChristoph Hellwig int ret; 299f46b5a66SChristoph Hellwig 300f46b5a66SChristoph Hellwig ret = btrfs_check_free_space(root, inode->i_size, 0); 301f46b5a66SChristoph Hellwig if (ret) 302f46b5a66SChristoph Hellwig return -ENOSPC; 303f46b5a66SChristoph Hellwig 304f46b5a66SChristoph Hellwig mutex_lock(&inode->i_mutex); 305f46b5a66SChristoph Hellwig last_index = inode->i_size >> PAGE_CACHE_SHIFT; 306f46b5a66SChristoph Hellwig for (i = 0; i <= last_index; i++) { 307f46b5a66SChristoph Hellwig if (total_read % ra_pages == 0) { 308f46b5a66SChristoph Hellwig btrfs_force_ra(inode->i_mapping, &file->f_ra, file, i, 309f46b5a66SChristoph Hellwig min(last_index, i + ra_pages - 1)); 310f46b5a66SChristoph Hellwig } 311f46b5a66SChristoph Hellwig total_read++; 3123eaa2885SChris Mason again: 313f46b5a66SChristoph Hellwig page = grab_cache_page(inode->i_mapping, i); 314f46b5a66SChristoph Hellwig if (!page) 315f46b5a66SChristoph Hellwig goto out_unlock; 316f46b5a66SChristoph Hellwig if (!PageUptodate(page)) { 317f46b5a66SChristoph Hellwig btrfs_readpage(NULL, page); 318f46b5a66SChristoph Hellwig lock_page(page); 319f46b5a66SChristoph Hellwig if (!PageUptodate(page)) { 320f46b5a66SChristoph Hellwig unlock_page(page); 321f46b5a66SChristoph Hellwig page_cache_release(page); 322f46b5a66SChristoph Hellwig goto out_unlock; 323f46b5a66SChristoph Hellwig } 324f46b5a66SChristoph Hellwig } 325f46b5a66SChristoph Hellwig 326f46b5a66SChristoph Hellwig wait_on_page_writeback(page); 327f46b5a66SChristoph Hellwig 328f46b5a66SChristoph Hellwig page_start = (u64)page->index << PAGE_CACHE_SHIFT; 329f46b5a66SChristoph Hellwig page_end = page_start + PAGE_CACHE_SIZE - 1; 330f46b5a66SChristoph Hellwig lock_extent(io_tree, page_start, page_end, GFP_NOFS); 3313eaa2885SChris Mason 3323eaa2885SChris Mason ordered = btrfs_lookup_ordered_extent(inode, page_start); 3333eaa2885SChris Mason if (ordered) { 3343eaa2885SChris Mason unlock_extent(io_tree, page_start, page_end, GFP_NOFS); 3353eaa2885SChris Mason unlock_page(page); 3363eaa2885SChris Mason page_cache_release(page); 3373eaa2885SChris Mason btrfs_start_ordered_extent(inode, ordered, 1); 3383eaa2885SChris Mason btrfs_put_ordered_extent(ordered); 3393eaa2885SChris Mason goto again; 3403eaa2885SChris Mason } 3413eaa2885SChris Mason set_page_extent_mapped(page); 3423eaa2885SChris Mason 343f87f057bSChris Mason /* 344f87f057bSChris Mason * this makes sure page_mkwrite is called on the 345f87f057bSChris Mason * page if it is dirtied again later 346f87f057bSChris Mason */ 347f87f057bSChris Mason clear_page_dirty_for_io(page); 348f87f057bSChris Mason 349ea8c2819SChris Mason btrfs_set_extent_delalloc(inode, page_start, page_end); 350f46b5a66SChristoph Hellwig 351f46b5a66SChristoph Hellwig unlock_extent(io_tree, page_start, page_end, GFP_NOFS); 352f46b5a66SChristoph Hellwig set_page_dirty(page); 353f46b5a66SChristoph Hellwig unlock_page(page); 354f46b5a66SChristoph Hellwig page_cache_release(page); 355f46b5a66SChristoph Hellwig balance_dirty_pages_ratelimited_nr(inode->i_mapping, 1); 356f46b5a66SChristoph Hellwig } 357f46b5a66SChristoph Hellwig 358f46b5a66SChristoph Hellwig out_unlock: 359f46b5a66SChristoph Hellwig mutex_unlock(&inode->i_mutex); 360f46b5a66SChristoph Hellwig return 0; 361f46b5a66SChristoph Hellwig } 362f46b5a66SChristoph Hellwig 363f46b5a66SChristoph Hellwig /* 364f46b5a66SChristoph Hellwig * Called inside transaction, so use GFP_NOFS 365f46b5a66SChristoph Hellwig */ 366f46b5a66SChristoph Hellwig 367f46b5a66SChristoph Hellwig static int btrfs_ioctl_resize(struct btrfs_root *root, void __user *arg) 368f46b5a66SChristoph Hellwig { 369f46b5a66SChristoph Hellwig u64 new_size; 370f46b5a66SChristoph Hellwig u64 old_size; 371f46b5a66SChristoph Hellwig u64 devid = 1; 372f46b5a66SChristoph Hellwig struct btrfs_ioctl_vol_args *vol_args; 373f46b5a66SChristoph Hellwig struct btrfs_trans_handle *trans; 374f46b5a66SChristoph Hellwig struct btrfs_device *device = NULL; 375f46b5a66SChristoph Hellwig char *sizestr; 376f46b5a66SChristoph Hellwig char *devstr = NULL; 377f46b5a66SChristoph Hellwig int ret = 0; 378f46b5a66SChristoph Hellwig int namelen; 379f46b5a66SChristoph Hellwig int mod = 0; 380f46b5a66SChristoph Hellwig 381*c146afadSYan Zheng if (root->fs_info->sb->s_flags & MS_RDONLY) 382*c146afadSYan Zheng return -EROFS; 383*c146afadSYan Zheng 384f46b5a66SChristoph Hellwig vol_args = kmalloc(sizeof(*vol_args), GFP_NOFS); 385f46b5a66SChristoph Hellwig 386f46b5a66SChristoph Hellwig if (!vol_args) 387f46b5a66SChristoph Hellwig return -ENOMEM; 388f46b5a66SChristoph Hellwig 389f46b5a66SChristoph Hellwig if (copy_from_user(vol_args, arg, sizeof(*vol_args))) { 390f46b5a66SChristoph Hellwig ret = -EFAULT; 391f46b5a66SChristoph Hellwig goto out; 392f46b5a66SChristoph Hellwig } 3935516e595SMark Fasheh 3945516e595SMark Fasheh vol_args->name[BTRFS_PATH_NAME_MAX] = '\0'; 395f46b5a66SChristoph Hellwig namelen = strlen(vol_args->name); 396f46b5a66SChristoph Hellwig 3977d9eb12cSChris Mason mutex_lock(&root->fs_info->volume_mutex); 398f46b5a66SChristoph Hellwig sizestr = vol_args->name; 399f46b5a66SChristoph Hellwig devstr = strchr(sizestr, ':'); 400f46b5a66SChristoph Hellwig if (devstr) { 401f46b5a66SChristoph Hellwig char *end; 402f46b5a66SChristoph Hellwig sizestr = devstr + 1; 403f46b5a66SChristoph Hellwig *devstr = '\0'; 404f46b5a66SChristoph Hellwig devstr = vol_args->name; 405f46b5a66SChristoph Hellwig devid = simple_strtoull(devstr, &end, 10); 406f46b5a66SChristoph Hellwig printk(KERN_INFO "resizing devid %llu\n", devid); 407f46b5a66SChristoph Hellwig } 408f46b5a66SChristoph Hellwig device = btrfs_find_device(root, devid, NULL); 409f46b5a66SChristoph Hellwig if (!device) { 410f46b5a66SChristoph Hellwig printk(KERN_INFO "resizer unable to find device %llu\n", devid); 411f46b5a66SChristoph Hellwig ret = -EINVAL; 412f46b5a66SChristoph Hellwig goto out_unlock; 413f46b5a66SChristoph Hellwig } 414f46b5a66SChristoph Hellwig if (!strcmp(sizestr, "max")) 415f46b5a66SChristoph Hellwig new_size = device->bdev->bd_inode->i_size; 416f46b5a66SChristoph Hellwig else { 417f46b5a66SChristoph Hellwig if (sizestr[0] == '-') { 418f46b5a66SChristoph Hellwig mod = -1; 419f46b5a66SChristoph Hellwig sizestr++; 420f46b5a66SChristoph Hellwig } else if (sizestr[0] == '+') { 421f46b5a66SChristoph Hellwig mod = 1; 422f46b5a66SChristoph Hellwig sizestr++; 423f46b5a66SChristoph Hellwig } 424f46b5a66SChristoph Hellwig new_size = btrfs_parse_size(sizestr); 425f46b5a66SChristoph Hellwig if (new_size == 0) { 426f46b5a66SChristoph Hellwig ret = -EINVAL; 427f46b5a66SChristoph Hellwig goto out_unlock; 428f46b5a66SChristoph Hellwig } 429f46b5a66SChristoph Hellwig } 430f46b5a66SChristoph Hellwig 431f46b5a66SChristoph Hellwig old_size = device->total_bytes; 432f46b5a66SChristoph Hellwig 433f46b5a66SChristoph Hellwig if (mod < 0) { 434f46b5a66SChristoph Hellwig if (new_size > old_size) { 435f46b5a66SChristoph Hellwig ret = -EINVAL; 436f46b5a66SChristoph Hellwig goto out_unlock; 437f46b5a66SChristoph Hellwig } 438f46b5a66SChristoph Hellwig new_size = old_size - new_size; 439f46b5a66SChristoph Hellwig } else if (mod > 0) { 440f46b5a66SChristoph Hellwig new_size = old_size + new_size; 441f46b5a66SChristoph Hellwig } 442f46b5a66SChristoph Hellwig 443f46b5a66SChristoph Hellwig if (new_size < 256 * 1024 * 1024) { 444f46b5a66SChristoph Hellwig ret = -EINVAL; 445f46b5a66SChristoph Hellwig goto out_unlock; 446f46b5a66SChristoph Hellwig } 447f46b5a66SChristoph Hellwig if (new_size > device->bdev->bd_inode->i_size) { 448f46b5a66SChristoph Hellwig ret = -EFBIG; 449f46b5a66SChristoph Hellwig goto out_unlock; 450f46b5a66SChristoph Hellwig } 451f46b5a66SChristoph Hellwig 452f46b5a66SChristoph Hellwig do_div(new_size, root->sectorsize); 453f46b5a66SChristoph Hellwig new_size *= root->sectorsize; 454f46b5a66SChristoph Hellwig 455f46b5a66SChristoph Hellwig printk(KERN_INFO "new size for %s is %llu\n", 456f46b5a66SChristoph Hellwig device->name, (unsigned long long)new_size); 457f46b5a66SChristoph Hellwig 458f46b5a66SChristoph Hellwig if (new_size > old_size) { 459f46b5a66SChristoph Hellwig trans = btrfs_start_transaction(root, 1); 460f46b5a66SChristoph Hellwig ret = btrfs_grow_device(trans, device, new_size); 461f46b5a66SChristoph Hellwig btrfs_commit_transaction(trans, root); 462f46b5a66SChristoph Hellwig } else { 463f46b5a66SChristoph Hellwig ret = btrfs_shrink_device(device, new_size); 464f46b5a66SChristoph Hellwig } 465f46b5a66SChristoph Hellwig 466f46b5a66SChristoph Hellwig out_unlock: 4677d9eb12cSChris Mason mutex_unlock(&root->fs_info->volume_mutex); 468f46b5a66SChristoph Hellwig out: 469f46b5a66SChristoph Hellwig kfree(vol_args); 470f46b5a66SChristoph Hellwig return ret; 471f46b5a66SChristoph Hellwig } 472f46b5a66SChristoph Hellwig 473cb8e7090SChristoph Hellwig static noinline int btrfs_ioctl_snap_create(struct file *file, 474f46b5a66SChristoph Hellwig void __user *arg) 475f46b5a66SChristoph Hellwig { 476cb8e7090SChristoph Hellwig struct btrfs_root *root = BTRFS_I(fdentry(file)->d_inode)->root; 477f46b5a66SChristoph Hellwig struct btrfs_ioctl_vol_args *vol_args; 478f46b5a66SChristoph Hellwig struct btrfs_dir_item *di; 479f46b5a66SChristoph Hellwig struct btrfs_path *path; 480f46b5a66SChristoph Hellwig u64 root_dirid; 481f46b5a66SChristoph Hellwig int namelen; 482f46b5a66SChristoph Hellwig int ret; 483f46b5a66SChristoph Hellwig 484*c146afadSYan Zheng if (root->fs_info->sb->s_flags & MS_RDONLY) 485*c146afadSYan Zheng return -EROFS; 486*c146afadSYan Zheng 487f46b5a66SChristoph Hellwig vol_args = kmalloc(sizeof(*vol_args), GFP_NOFS); 488f46b5a66SChristoph Hellwig 489f46b5a66SChristoph Hellwig if (!vol_args) 490f46b5a66SChristoph Hellwig return -ENOMEM; 491f46b5a66SChristoph Hellwig 492f46b5a66SChristoph Hellwig if (copy_from_user(vol_args, arg, sizeof(*vol_args))) { 493f46b5a66SChristoph Hellwig ret = -EFAULT; 494f46b5a66SChristoph Hellwig goto out; 495f46b5a66SChristoph Hellwig } 496f46b5a66SChristoph Hellwig 4975516e595SMark Fasheh vol_args->name[BTRFS_PATH_NAME_MAX] = '\0'; 498f46b5a66SChristoph Hellwig namelen = strlen(vol_args->name); 499f46b5a66SChristoph Hellwig if (strchr(vol_args->name, '/')) { 500f46b5a66SChristoph Hellwig ret = -EINVAL; 501f46b5a66SChristoph Hellwig goto out; 502f46b5a66SChristoph Hellwig } 503f46b5a66SChristoph Hellwig 504f46b5a66SChristoph Hellwig path = btrfs_alloc_path(); 505f46b5a66SChristoph Hellwig if (!path) { 506f46b5a66SChristoph Hellwig ret = -ENOMEM; 507f46b5a66SChristoph Hellwig goto out; 508f46b5a66SChristoph Hellwig } 509f46b5a66SChristoph Hellwig 510f46b5a66SChristoph Hellwig root_dirid = root->fs_info->sb->s_root->d_inode->i_ino, 511f46b5a66SChristoph Hellwig di = btrfs_lookup_dir_item(NULL, root->fs_info->tree_root, 512f46b5a66SChristoph Hellwig path, root_dirid, 513f46b5a66SChristoph Hellwig vol_args->name, namelen, 0); 514f46b5a66SChristoph Hellwig btrfs_free_path(path); 515f46b5a66SChristoph Hellwig 516f46b5a66SChristoph Hellwig if (di && !IS_ERR(di)) { 517f46b5a66SChristoph Hellwig ret = -EEXIST; 518f46b5a66SChristoph Hellwig goto out; 519f46b5a66SChristoph Hellwig } 520f46b5a66SChristoph Hellwig 521f46b5a66SChristoph Hellwig if (IS_ERR(di)) { 522f46b5a66SChristoph Hellwig ret = PTR_ERR(di); 523f46b5a66SChristoph Hellwig goto out; 524f46b5a66SChristoph Hellwig } 525f46b5a66SChristoph Hellwig 526cb8e7090SChristoph Hellwig if (root == root->fs_info->tree_root) { 527cb8e7090SChristoph Hellwig ret = btrfs_mksubvol(&file->f_path, vol_args->name, 528cb8e7090SChristoph Hellwig file->f_path.dentry->d_inode->i_mode, 529cb8e7090SChristoph Hellwig namelen); 530cb8e7090SChristoph Hellwig } else { 531f46b5a66SChristoph Hellwig ret = create_snapshot(root, vol_args->name, namelen); 532cb8e7090SChristoph Hellwig } 533cb8e7090SChristoph Hellwig 534f46b5a66SChristoph Hellwig out: 535f46b5a66SChristoph Hellwig kfree(vol_args); 536f46b5a66SChristoph Hellwig return ret; 537f46b5a66SChristoph Hellwig } 538f46b5a66SChristoph Hellwig 539f46b5a66SChristoph Hellwig static int btrfs_ioctl_defrag(struct file *file) 540f46b5a66SChristoph Hellwig { 541f46b5a66SChristoph Hellwig struct inode *inode = fdentry(file)->d_inode; 542f46b5a66SChristoph Hellwig struct btrfs_root *root = BTRFS_I(inode)->root; 543*c146afadSYan Zheng int ret; 544*c146afadSYan Zheng 545*c146afadSYan Zheng ret = mnt_want_write(file->f_path.mnt); 546*c146afadSYan Zheng if (ret) 547*c146afadSYan Zheng return ret; 548f46b5a66SChristoph Hellwig 549f46b5a66SChristoph Hellwig switch (inode->i_mode & S_IFMT) { 550f46b5a66SChristoph Hellwig case S_IFDIR: 551f46b5a66SChristoph Hellwig btrfs_defrag_root(root, 0); 552f46b5a66SChristoph Hellwig btrfs_defrag_root(root->fs_info->extent_root, 0); 553f46b5a66SChristoph Hellwig break; 554f46b5a66SChristoph Hellwig case S_IFREG: 555f46b5a66SChristoph Hellwig btrfs_defrag_file(file); 556f46b5a66SChristoph Hellwig break; 557f46b5a66SChristoph Hellwig } 558f46b5a66SChristoph Hellwig 559f46b5a66SChristoph Hellwig return 0; 560f46b5a66SChristoph Hellwig } 561f46b5a66SChristoph Hellwig 562f46b5a66SChristoph Hellwig long btrfs_ioctl_add_dev(struct btrfs_root *root, void __user *arg) 563f46b5a66SChristoph Hellwig { 564f46b5a66SChristoph Hellwig struct btrfs_ioctl_vol_args *vol_args; 565f46b5a66SChristoph Hellwig int ret; 566f46b5a66SChristoph Hellwig 567f46b5a66SChristoph Hellwig vol_args = kmalloc(sizeof(*vol_args), GFP_NOFS); 568f46b5a66SChristoph Hellwig 569f46b5a66SChristoph Hellwig if (!vol_args) 570f46b5a66SChristoph Hellwig return -ENOMEM; 571f46b5a66SChristoph Hellwig 572f46b5a66SChristoph Hellwig if (copy_from_user(vol_args, arg, sizeof(*vol_args))) { 573f46b5a66SChristoph Hellwig ret = -EFAULT; 574f46b5a66SChristoph Hellwig goto out; 575f46b5a66SChristoph Hellwig } 5765516e595SMark Fasheh vol_args->name[BTRFS_PATH_NAME_MAX] = '\0'; 577f46b5a66SChristoph Hellwig ret = btrfs_init_new_device(root, vol_args->name); 578f46b5a66SChristoph Hellwig 579f46b5a66SChristoph Hellwig out: 580f46b5a66SChristoph Hellwig kfree(vol_args); 581f46b5a66SChristoph Hellwig return ret; 582f46b5a66SChristoph Hellwig } 583f46b5a66SChristoph Hellwig 584f46b5a66SChristoph Hellwig long btrfs_ioctl_rm_dev(struct btrfs_root *root, void __user *arg) 585f46b5a66SChristoph Hellwig { 586f46b5a66SChristoph Hellwig struct btrfs_ioctl_vol_args *vol_args; 587f46b5a66SChristoph Hellwig int ret; 588f46b5a66SChristoph Hellwig 589*c146afadSYan Zheng if (root->fs_info->sb->s_flags & MS_RDONLY) 590*c146afadSYan Zheng return -EROFS; 591*c146afadSYan Zheng 592f46b5a66SChristoph Hellwig vol_args = kmalloc(sizeof(*vol_args), GFP_NOFS); 593f46b5a66SChristoph Hellwig 594f46b5a66SChristoph Hellwig if (!vol_args) 595f46b5a66SChristoph Hellwig return -ENOMEM; 596f46b5a66SChristoph Hellwig 597f46b5a66SChristoph Hellwig if (copy_from_user(vol_args, arg, sizeof(*vol_args))) { 598f46b5a66SChristoph Hellwig ret = -EFAULT; 599f46b5a66SChristoph Hellwig goto out; 600f46b5a66SChristoph Hellwig } 6015516e595SMark Fasheh vol_args->name[BTRFS_PATH_NAME_MAX] = '\0'; 602f46b5a66SChristoph Hellwig ret = btrfs_rm_device(root, vol_args->name); 603f46b5a66SChristoph Hellwig 604f46b5a66SChristoph Hellwig out: 605f46b5a66SChristoph Hellwig kfree(vol_args); 606f46b5a66SChristoph Hellwig return ret; 607f46b5a66SChristoph Hellwig } 608f46b5a66SChristoph Hellwig 609c5c9cd4dSSage Weil long btrfs_ioctl_clone(struct file *file, unsigned long srcfd, u64 off, 610c5c9cd4dSSage Weil u64 olen, u64 destoff) 611f46b5a66SChristoph Hellwig { 612f46b5a66SChristoph Hellwig struct inode *inode = fdentry(file)->d_inode; 613f46b5a66SChristoph Hellwig struct btrfs_root *root = BTRFS_I(inode)->root; 614f46b5a66SChristoph Hellwig struct file *src_file; 615f46b5a66SChristoph Hellwig struct inode *src; 616f46b5a66SChristoph Hellwig struct btrfs_trans_handle *trans; 617f46b5a66SChristoph Hellwig struct btrfs_path *path; 618f46b5a66SChristoph Hellwig struct extent_buffer *leaf; 619ae01a0abSYan Zheng char *buf; 620ae01a0abSYan Zheng struct btrfs_key key; 621f46b5a66SChristoph Hellwig u32 nritems; 622f46b5a66SChristoph Hellwig int slot; 623ae01a0abSYan Zheng int ret; 624c5c9cd4dSSage Weil u64 len = olen; 625c5c9cd4dSSage Weil u64 bs = root->fs_info->sb->s_blocksize; 626c5c9cd4dSSage Weil u64 hint_byte; 627f46b5a66SChristoph Hellwig 628c5c9cd4dSSage Weil /* 629c5c9cd4dSSage Weil * TODO: 630c5c9cd4dSSage Weil * - split compressed inline extents. annoying: we need to 631c5c9cd4dSSage Weil * decompress into destination's address_space (the file offset 632c5c9cd4dSSage Weil * may change, so source mapping won't do), then recompress (or 633c5c9cd4dSSage Weil * otherwise reinsert) a subrange. 634c5c9cd4dSSage Weil * - allow ranges within the same file to be cloned (provided 635c5c9cd4dSSage Weil * they don't overlap)? 636c5c9cd4dSSage Weil */ 637c5c9cd4dSSage Weil 638*c146afadSYan Zheng ret = mnt_want_write(file->f_path.mnt); 639*c146afadSYan Zheng if (ret) 640*c146afadSYan Zheng return ret; 641*c146afadSYan Zheng 642c5c9cd4dSSage Weil src_file = fget(srcfd); 643f46b5a66SChristoph Hellwig if (!src_file) 644f46b5a66SChristoph Hellwig return -EBADF; 645f46b5a66SChristoph Hellwig src = src_file->f_dentry->d_inode; 646f46b5a66SChristoph Hellwig 647c5c9cd4dSSage Weil ret = -EINVAL; 648c5c9cd4dSSage Weil if (src == inode) 649c5c9cd4dSSage Weil goto out_fput; 650c5c9cd4dSSage Weil 651ae01a0abSYan Zheng ret = -EISDIR; 652ae01a0abSYan Zheng if (S_ISDIR(src->i_mode) || S_ISDIR(inode->i_mode)) 653f46b5a66SChristoph Hellwig goto out_fput; 654f46b5a66SChristoph Hellwig 655ae01a0abSYan Zheng ret = -EXDEV; 656ae01a0abSYan Zheng if (src->i_sb != inode->i_sb || BTRFS_I(src)->root != root) 657ae01a0abSYan Zheng goto out_fput; 658ae01a0abSYan Zheng 659ae01a0abSYan Zheng ret = -ENOMEM; 660ae01a0abSYan Zheng buf = vmalloc(btrfs_level_size(root, 0)); 661ae01a0abSYan Zheng if (!buf) 662ae01a0abSYan Zheng goto out_fput; 663ae01a0abSYan Zheng 664ae01a0abSYan Zheng path = btrfs_alloc_path(); 665ae01a0abSYan Zheng if (!path) { 666ae01a0abSYan Zheng vfree(buf); 667ae01a0abSYan Zheng goto out_fput; 668ae01a0abSYan Zheng } 669ae01a0abSYan Zheng path->reada = 2; 670ae01a0abSYan Zheng 671f46b5a66SChristoph Hellwig if (inode < src) { 672f46b5a66SChristoph Hellwig mutex_lock(&inode->i_mutex); 673f46b5a66SChristoph Hellwig mutex_lock(&src->i_mutex); 674f46b5a66SChristoph Hellwig } else { 675f46b5a66SChristoph Hellwig mutex_lock(&src->i_mutex); 676f46b5a66SChristoph Hellwig mutex_lock(&inode->i_mutex); 677f46b5a66SChristoph Hellwig } 678f46b5a66SChristoph Hellwig 679c5c9cd4dSSage Weil /* determine range to clone */ 680c5c9cd4dSSage Weil ret = -EINVAL; 681c5c9cd4dSSage Weil if (off >= src->i_size || off + len > src->i_size) 682f46b5a66SChristoph Hellwig goto out_unlock; 683c5c9cd4dSSage Weil if (len == 0) 684c5c9cd4dSSage Weil olen = len = src->i_size - off; 685c5c9cd4dSSage Weil /* if we extend to eof, continue to block boundary */ 686c5c9cd4dSSage Weil if (off + len == src->i_size) 687c5c9cd4dSSage Weil len = ((src->i_size + bs-1) & ~(bs-1)) 688c5c9cd4dSSage Weil - off; 689c5c9cd4dSSage Weil 690c5c9cd4dSSage Weil /* verify the end result is block aligned */ 691c5c9cd4dSSage Weil if ((off & (bs-1)) || 692c5c9cd4dSSage Weil ((off + len) & (bs-1))) 693c5c9cd4dSSage Weil goto out_unlock; 694c5c9cd4dSSage Weil 695c5c9cd4dSSage Weil printk("final src extent is %llu~%llu\n", off, len); 696c5c9cd4dSSage Weil printk("final dst extent is %llu~%llu\n", destoff, len); 697f46b5a66SChristoph Hellwig 698f46b5a66SChristoph Hellwig /* do any pending delalloc/csum calc on src, one way or 699f46b5a66SChristoph Hellwig another, and lock file content */ 700f46b5a66SChristoph Hellwig while (1) { 70131840ae1SZheng Yan struct btrfs_ordered_extent *ordered; 702c5c9cd4dSSage Weil lock_extent(&BTRFS_I(src)->io_tree, off, off+len, GFP_NOFS); 703c5c9cd4dSSage Weil ordered = btrfs_lookup_first_ordered_extent(inode, off+len); 704ae01a0abSYan Zheng if (BTRFS_I(src)->delalloc_bytes == 0 && !ordered) 705f46b5a66SChristoph Hellwig break; 706c5c9cd4dSSage Weil unlock_extent(&BTRFS_I(src)->io_tree, off, off+len, GFP_NOFS); 707ae01a0abSYan Zheng if (ordered) 708ae01a0abSYan Zheng btrfs_put_ordered_extent(ordered); 709c5c9cd4dSSage Weil btrfs_wait_ordered_range(src, off, off+len); 710f46b5a66SChristoph Hellwig } 711f46b5a66SChristoph Hellwig 712ae01a0abSYan Zheng trans = btrfs_start_transaction(root, 1); 713ae01a0abSYan Zheng BUG_ON(!trans); 714ae01a0abSYan Zheng 715c5c9cd4dSSage Weil /* punch hole in destination first */ 716c5c9cd4dSSage Weil btrfs_drop_extents(trans, root, inode, off, off+len, 0, &hint_byte); 717c5c9cd4dSSage Weil 718c5c9cd4dSSage Weil /* clone data */ 719f46b5a66SChristoph Hellwig key.objectid = src->i_ino; 720ae01a0abSYan Zheng key.type = BTRFS_EXTENT_DATA_KEY; 721ae01a0abSYan Zheng key.offset = 0; 722f46b5a66SChristoph Hellwig 723f46b5a66SChristoph Hellwig while (1) { 724f46b5a66SChristoph Hellwig /* 725f46b5a66SChristoph Hellwig * note the key will change type as we walk through the 726f46b5a66SChristoph Hellwig * tree. 727f46b5a66SChristoph Hellwig */ 728f46b5a66SChristoph Hellwig ret = btrfs_search_slot(trans, root, &key, path, 0, 0); 729f46b5a66SChristoph Hellwig if (ret < 0) 730f46b5a66SChristoph Hellwig goto out; 731f46b5a66SChristoph Hellwig 732ae01a0abSYan Zheng nritems = btrfs_header_nritems(path->nodes[0]); 733ae01a0abSYan Zheng if (path->slots[0] >= nritems) { 734f46b5a66SChristoph Hellwig ret = btrfs_next_leaf(root, path); 735f46b5a66SChristoph Hellwig if (ret < 0) 736f46b5a66SChristoph Hellwig goto out; 737f46b5a66SChristoph Hellwig if (ret > 0) 738f46b5a66SChristoph Hellwig break; 739ae01a0abSYan Zheng nritems = btrfs_header_nritems(path->nodes[0]); 740f46b5a66SChristoph Hellwig } 741f46b5a66SChristoph Hellwig leaf = path->nodes[0]; 742f46b5a66SChristoph Hellwig slot = path->slots[0]; 743f46b5a66SChristoph Hellwig 744ae01a0abSYan Zheng btrfs_item_key_to_cpu(leaf, &key, slot); 745f46b5a66SChristoph Hellwig if (btrfs_key_type(&key) > BTRFS_CSUM_ITEM_KEY || 746f46b5a66SChristoph Hellwig key.objectid != src->i_ino) 747f46b5a66SChristoph Hellwig break; 748f46b5a66SChristoph Hellwig 749c5c9cd4dSSage Weil if (btrfs_key_type(&key) == BTRFS_EXTENT_DATA_KEY) { 750c5c9cd4dSSage Weil struct btrfs_file_extent_item *extent; 751c5c9cd4dSSage Weil int type; 75231840ae1SZheng Yan u32 size; 75331840ae1SZheng Yan struct btrfs_key new_key; 754c5c9cd4dSSage Weil u64 disko = 0, diskl = 0; 755c5c9cd4dSSage Weil u64 datao = 0, datal = 0; 756c5c9cd4dSSage Weil u8 comp; 75731840ae1SZheng Yan 75831840ae1SZheng Yan size = btrfs_item_size_nr(leaf, slot); 75931840ae1SZheng Yan read_extent_buffer(leaf, buf, 76031840ae1SZheng Yan btrfs_item_ptr_offset(leaf, slot), 76131840ae1SZheng Yan size); 762c5c9cd4dSSage Weil 763c5c9cd4dSSage Weil extent = btrfs_item_ptr(leaf, slot, 764c5c9cd4dSSage Weil struct btrfs_file_extent_item); 765c5c9cd4dSSage Weil comp = btrfs_file_extent_compression(leaf, extent); 766c5c9cd4dSSage Weil type = btrfs_file_extent_type(leaf, extent); 767c5c9cd4dSSage Weil if (type == BTRFS_FILE_EXTENT_REG) { 768c5c9cd4dSSage Weil disko = btrfs_file_extent_disk_bytenr(leaf, extent); 769c5c9cd4dSSage Weil diskl = btrfs_file_extent_disk_num_bytes(leaf, extent); 770c5c9cd4dSSage Weil datao = btrfs_file_extent_offset(leaf, extent); 771c5c9cd4dSSage Weil datal = btrfs_file_extent_num_bytes(leaf, extent); 772c5c9cd4dSSage Weil } else if (type == BTRFS_FILE_EXTENT_INLINE) { 773c5c9cd4dSSage Weil /* take upper bound, may be compressed */ 774c5c9cd4dSSage Weil datal = btrfs_file_extent_ram_bytes(leaf, 775c5c9cd4dSSage Weil extent); 776c5c9cd4dSSage Weil } 77731840ae1SZheng Yan btrfs_release_path(root, path); 77831840ae1SZheng Yan 779c5c9cd4dSSage Weil if (key.offset + datal < off || 780c5c9cd4dSSage Weil key.offset >= off+len) 781c5c9cd4dSSage Weil goto next; 782c5c9cd4dSSage Weil 78331840ae1SZheng Yan memcpy(&new_key, &key, sizeof(new_key)); 78431840ae1SZheng Yan new_key.objectid = inode->i_ino; 785c5c9cd4dSSage Weil new_key.offset = key.offset + destoff - off; 786c5c9cd4dSSage Weil 787c5c9cd4dSSage Weil if (type == BTRFS_FILE_EXTENT_REG) { 78831840ae1SZheng Yan ret = btrfs_insert_empty_item(trans, root, path, 78931840ae1SZheng Yan &new_key, size); 79031840ae1SZheng Yan if (ret) 79131840ae1SZheng Yan goto out; 79231840ae1SZheng Yan 79331840ae1SZheng Yan leaf = path->nodes[0]; 79431840ae1SZheng Yan slot = path->slots[0]; 79531840ae1SZheng Yan write_extent_buffer(leaf, buf, 79631840ae1SZheng Yan btrfs_item_ptr_offset(leaf, slot), 79731840ae1SZheng Yan size); 798ae01a0abSYan Zheng 799f46b5a66SChristoph Hellwig extent = btrfs_item_ptr(leaf, slot, 800f46b5a66SChristoph Hellwig struct btrfs_file_extent_item); 801c5c9cd4dSSage Weil printk(" orig disk %llu~%llu data %llu~%llu\n", 802c5c9cd4dSSage Weil disko, diskl, datao, datal); 803c5c9cd4dSSage Weil 804c5c9cd4dSSage Weil if (off > key.offset) { 805c5c9cd4dSSage Weil datao += off - key.offset; 806c5c9cd4dSSage Weil datal -= off - key.offset; 807c5c9cd4dSSage Weil } 808c5c9cd4dSSage Weil if (key.offset + datao + datal + key.offset > 809c5c9cd4dSSage Weil off + len) 810c5c9cd4dSSage Weil datal = off + len - key.offset - datao; 811c5c9cd4dSSage Weil /* disko == 0 means it's a hole */ 812c5c9cd4dSSage Weil if (!disko) 813c5c9cd4dSSage Weil datao = 0; 814c5c9cd4dSSage Weil printk(" final disk %llu~%llu data %llu~%llu\n", 815c5c9cd4dSSage Weil disko, diskl, datao, datal); 816c5c9cd4dSSage Weil 817c5c9cd4dSSage Weil btrfs_set_file_extent_offset(leaf, extent, 818c5c9cd4dSSage Weil datao); 819c5c9cd4dSSage Weil btrfs_set_file_extent_num_bytes(leaf, extent, 820c5c9cd4dSSage Weil datal); 821c5c9cd4dSSage Weil if (disko) { 822c5c9cd4dSSage Weil inode_add_bytes(inode, datal); 823ae01a0abSYan Zheng ret = btrfs_inc_extent_ref(trans, root, 824c5c9cd4dSSage Weil disko, diskl, leaf->start, 825f46b5a66SChristoph Hellwig root->root_key.objectid, 826f46b5a66SChristoph Hellwig trans->transid, 8273bb1a1bcSYan Zheng inode->i_ino); 828ae01a0abSYan Zheng BUG_ON(ret); 829f46b5a66SChristoph Hellwig } 830c5c9cd4dSSage Weil } else if (type == BTRFS_FILE_EXTENT_INLINE) { 831c5c9cd4dSSage Weil u64 skip = 0; 832c5c9cd4dSSage Weil u64 trim = 0; 833c5c9cd4dSSage Weil if (off > key.offset) { 834c5c9cd4dSSage Weil skip = off - key.offset; 835c5c9cd4dSSage Weil new_key.offset += skip; 83631840ae1SZheng Yan } 837c5c9cd4dSSage Weil if (key.offset + datal > off+len) 838c5c9cd4dSSage Weil trim = key.offset + datal - (off+len); 839c5c9cd4dSSage Weil printk("len %lld skip %lld trim %lld\n", 840c5c9cd4dSSage Weil datal, skip, trim); 841c5c9cd4dSSage Weil if (comp && (skip || trim)) { 842c5c9cd4dSSage Weil printk("btrfs clone_range can't split compressed inline extents yet\n"); 843c5c9cd4dSSage Weil ret = -EINVAL; 844c5c9cd4dSSage Weil goto out; 84531840ae1SZheng Yan } 846c5c9cd4dSSage Weil size -= skip + trim; 847c5c9cd4dSSage Weil datal -= skip + trim; 848c5c9cd4dSSage Weil ret = btrfs_insert_empty_item(trans, root, path, 849c5c9cd4dSSage Weil &new_key, size); 850c5c9cd4dSSage Weil if (ret) 851c5c9cd4dSSage Weil goto out; 852c5c9cd4dSSage Weil 853c5c9cd4dSSage Weil if (skip) { 854c5c9cd4dSSage Weil u32 start = btrfs_file_extent_calc_inline_size(0); 855c5c9cd4dSSage Weil memmove(buf+start, buf+start+skip, 856c5c9cd4dSSage Weil datal); 857c5c9cd4dSSage Weil } 858c5c9cd4dSSage Weil 859c5c9cd4dSSage Weil leaf = path->nodes[0]; 860c5c9cd4dSSage Weil slot = path->slots[0]; 861c5c9cd4dSSage Weil write_extent_buffer(leaf, buf, 862c5c9cd4dSSage Weil btrfs_item_ptr_offset(leaf, slot), 863c5c9cd4dSSage Weil size); 864c5c9cd4dSSage Weil inode_add_bytes(inode, datal); 865c5c9cd4dSSage Weil } 866c5c9cd4dSSage Weil 867c5c9cd4dSSage Weil btrfs_mark_buffer_dirty(leaf); 868c5c9cd4dSSage Weil } 869c5c9cd4dSSage Weil 870c5c9cd4dSSage Weil if (btrfs_key_type(&key) == BTRFS_CSUM_ITEM_KEY) { 871c5c9cd4dSSage Weil u32 size; 872c5c9cd4dSSage Weil struct btrfs_key new_key; 873c5c9cd4dSSage Weil u64 coverslen; 874c5c9cd4dSSage Weil int coff, clen; 875c5c9cd4dSSage Weil 876c5c9cd4dSSage Weil size = btrfs_item_size_nr(leaf, slot); 877c5c9cd4dSSage Weil coverslen = (size / BTRFS_CRC32_SIZE) << 878c5c9cd4dSSage Weil root->fs_info->sb->s_blocksize_bits; 879c5c9cd4dSSage Weil printk("csums for %llu~%llu\n", 880c5c9cd4dSSage Weil key.offset, coverslen); 881c5c9cd4dSSage Weil if (key.offset + coverslen < off || 882c5c9cd4dSSage Weil key.offset >= off+len) 883c5c9cd4dSSage Weil goto next; 884c5c9cd4dSSage Weil 885c5c9cd4dSSage Weil read_extent_buffer(leaf, buf, 886c5c9cd4dSSage Weil btrfs_item_ptr_offset(leaf, slot), 887c5c9cd4dSSage Weil size); 888c5c9cd4dSSage Weil btrfs_release_path(root, path); 889c5c9cd4dSSage Weil 890c5c9cd4dSSage Weil coff = 0; 891c5c9cd4dSSage Weil if (off > key.offset) 892c5c9cd4dSSage Weil coff = ((off - key.offset) >> 893c5c9cd4dSSage Weil root->fs_info->sb->s_blocksize_bits) * 894c5c9cd4dSSage Weil BTRFS_CRC32_SIZE; 895c5c9cd4dSSage Weil clen = size - coff; 896c5c9cd4dSSage Weil if (key.offset + coverslen > off+len) 897c5c9cd4dSSage Weil clen -= ((key.offset+coverslen-off-len) >> 898c5c9cd4dSSage Weil root->fs_info->sb->s_blocksize_bits) * 899c5c9cd4dSSage Weil BTRFS_CRC32_SIZE; 900c5c9cd4dSSage Weil printk(" will dup %d~%d of %d\n", 901c5c9cd4dSSage Weil coff, clen, size); 902c5c9cd4dSSage Weil 903c5c9cd4dSSage Weil memcpy(&new_key, &key, sizeof(new_key)); 904c5c9cd4dSSage Weil new_key.objectid = inode->i_ino; 905c5c9cd4dSSage Weil new_key.offset = key.offset + destoff - off; 906c5c9cd4dSSage Weil 907c5c9cd4dSSage Weil ret = btrfs_insert_empty_item(trans, root, path, 908c5c9cd4dSSage Weil &new_key, clen); 909c5c9cd4dSSage Weil if (ret) 910c5c9cd4dSSage Weil goto out; 911c5c9cd4dSSage Weil 912c5c9cd4dSSage Weil leaf = path->nodes[0]; 913c5c9cd4dSSage Weil slot = path->slots[0]; 914c5c9cd4dSSage Weil write_extent_buffer(leaf, buf + coff, 915c5c9cd4dSSage Weil btrfs_item_ptr_offset(leaf, slot), 916c5c9cd4dSSage Weil clen); 917c5c9cd4dSSage Weil btrfs_mark_buffer_dirty(leaf); 918c5c9cd4dSSage Weil } 919c5c9cd4dSSage Weil 920c5c9cd4dSSage Weil next: 92131840ae1SZheng Yan btrfs_release_path(root, path); 922ae01a0abSYan Zheng key.offset++; 923ae01a0abSYan Zheng } 924f46b5a66SChristoph Hellwig ret = 0; 925f46b5a66SChristoph Hellwig out: 926ae01a0abSYan Zheng btrfs_release_path(root, path); 927ae01a0abSYan Zheng if (ret == 0) { 928ae01a0abSYan Zheng inode->i_mtime = inode->i_ctime = CURRENT_TIME; 929c5c9cd4dSSage Weil if (destoff + olen > inode->i_size) 930c5c9cd4dSSage Weil btrfs_i_size_write(inode, destoff + olen); 931ae01a0abSYan Zheng BTRFS_I(inode)->flags = BTRFS_I(src)->flags; 932ae01a0abSYan Zheng ret = btrfs_update_inode(trans, root, inode); 933ae01a0abSYan Zheng } 934f46b5a66SChristoph Hellwig btrfs_end_transaction(trans, root); 935c5c9cd4dSSage Weil unlock_extent(&BTRFS_I(src)->io_tree, off, off+len, GFP_NOFS); 936ae01a0abSYan Zheng if (ret) 937ae01a0abSYan Zheng vmtruncate(inode, 0); 938f46b5a66SChristoph Hellwig out_unlock: 939f46b5a66SChristoph Hellwig mutex_unlock(&src->i_mutex); 940f46b5a66SChristoph Hellwig mutex_unlock(&inode->i_mutex); 941ae01a0abSYan Zheng vfree(buf); 942ae01a0abSYan Zheng btrfs_free_path(path); 943f46b5a66SChristoph Hellwig out_fput: 944f46b5a66SChristoph Hellwig fput(src_file); 945f46b5a66SChristoph Hellwig return ret; 946f46b5a66SChristoph Hellwig } 947f46b5a66SChristoph Hellwig 948c5c9cd4dSSage Weil long btrfs_ioctl_clone_range(struct file *file, unsigned long argptr) 949c5c9cd4dSSage Weil { 950c5c9cd4dSSage Weil struct btrfs_ioctl_clone_range_args args; 951c5c9cd4dSSage Weil 952c5c9cd4dSSage Weil if (copy_from_user(&args, (void *)argptr, sizeof(args))) 953c5c9cd4dSSage Weil return -EFAULT; 954c5c9cd4dSSage Weil return btrfs_ioctl_clone(file, args.src_fd, args.src_offset, 955c5c9cd4dSSage Weil args.src_length, args.dest_offset); 956c5c9cd4dSSage Weil } 957c5c9cd4dSSage Weil 958f46b5a66SChristoph Hellwig /* 959f46b5a66SChristoph Hellwig * there are many ways the trans_start and trans_end ioctls can lead 960f46b5a66SChristoph Hellwig * to deadlocks. They should only be used by applications that 961f46b5a66SChristoph Hellwig * basically own the machine, and have a very in depth understanding 962f46b5a66SChristoph Hellwig * of all the possible deadlocks and enospc problems. 963f46b5a66SChristoph Hellwig */ 964f46b5a66SChristoph Hellwig long btrfs_ioctl_trans_start(struct file *file) 965f46b5a66SChristoph Hellwig { 966f46b5a66SChristoph Hellwig struct inode *inode = fdentry(file)->d_inode; 967f46b5a66SChristoph Hellwig struct btrfs_root *root = BTRFS_I(inode)->root; 968f46b5a66SChristoph Hellwig struct btrfs_trans_handle *trans; 969f46b5a66SChristoph Hellwig int ret = 0; 970f46b5a66SChristoph Hellwig 971df5b5520SChristoph Hellwig if (!capable(CAP_SYS_ADMIN)) 972df5b5520SChristoph Hellwig return -EPERM; 973df5b5520SChristoph Hellwig 974f46b5a66SChristoph Hellwig if (file->private_data) { 975f46b5a66SChristoph Hellwig ret = -EINPROGRESS; 976f46b5a66SChristoph Hellwig goto out; 977f46b5a66SChristoph Hellwig } 9789ca9ee09SSage Weil 979*c146afadSYan Zheng ret = mnt_want_write(file->f_path.mnt); 980*c146afadSYan Zheng if (ret) 981*c146afadSYan Zheng goto out; 982*c146afadSYan Zheng 9839ca9ee09SSage Weil mutex_lock(&root->fs_info->trans_mutex); 9849ca9ee09SSage Weil root->fs_info->open_ioctl_trans++; 9859ca9ee09SSage Weil mutex_unlock(&root->fs_info->trans_mutex); 9869ca9ee09SSage Weil 9879ca9ee09SSage Weil trans = btrfs_start_ioctl_transaction(root, 0); 988f46b5a66SChristoph Hellwig if (trans) 989f46b5a66SChristoph Hellwig file->private_data = trans; 990f46b5a66SChristoph Hellwig else 991f46b5a66SChristoph Hellwig ret = -ENOMEM; 992f46b5a66SChristoph Hellwig /*printk(KERN_INFO "btrfs_ioctl_trans_start on %p\n", file);*/ 993f46b5a66SChristoph Hellwig out: 994f46b5a66SChristoph Hellwig return ret; 995f46b5a66SChristoph Hellwig } 996f46b5a66SChristoph Hellwig 997f46b5a66SChristoph Hellwig /* 998f46b5a66SChristoph Hellwig * there are many ways the trans_start and trans_end ioctls can lead 999f46b5a66SChristoph Hellwig * to deadlocks. They should only be used by applications that 1000f46b5a66SChristoph Hellwig * basically own the machine, and have a very in depth understanding 1001f46b5a66SChristoph Hellwig * of all the possible deadlocks and enospc problems. 1002f46b5a66SChristoph Hellwig */ 1003f46b5a66SChristoph Hellwig long btrfs_ioctl_trans_end(struct file *file) 1004f46b5a66SChristoph Hellwig { 1005f46b5a66SChristoph Hellwig struct inode *inode = fdentry(file)->d_inode; 1006f46b5a66SChristoph Hellwig struct btrfs_root *root = BTRFS_I(inode)->root; 1007f46b5a66SChristoph Hellwig struct btrfs_trans_handle *trans; 1008f46b5a66SChristoph Hellwig int ret = 0; 1009f46b5a66SChristoph Hellwig 1010f46b5a66SChristoph Hellwig trans = file->private_data; 1011f46b5a66SChristoph Hellwig if (!trans) { 1012f46b5a66SChristoph Hellwig ret = -EINVAL; 1013f46b5a66SChristoph Hellwig goto out; 1014f46b5a66SChristoph Hellwig } 1015f46b5a66SChristoph Hellwig btrfs_end_transaction(trans, root); 1016b214107eSChristoph Hellwig file->private_data = NULL; 10179ca9ee09SSage Weil 10189ca9ee09SSage Weil mutex_lock(&root->fs_info->trans_mutex); 10199ca9ee09SSage Weil root->fs_info->open_ioctl_trans--; 10209ca9ee09SSage Weil mutex_unlock(&root->fs_info->trans_mutex); 10219ca9ee09SSage Weil 1022f46b5a66SChristoph Hellwig out: 1023f46b5a66SChristoph Hellwig return ret; 1024f46b5a66SChristoph Hellwig } 1025f46b5a66SChristoph Hellwig 1026f46b5a66SChristoph Hellwig long btrfs_ioctl(struct file *file, unsigned int 1027f46b5a66SChristoph Hellwig cmd, unsigned long arg) 1028f46b5a66SChristoph Hellwig { 1029f46b5a66SChristoph Hellwig struct btrfs_root *root = BTRFS_I(fdentry(file)->d_inode)->root; 1030f46b5a66SChristoph Hellwig 1031f46b5a66SChristoph Hellwig switch (cmd) { 1032f46b5a66SChristoph Hellwig case BTRFS_IOC_SNAP_CREATE: 1033cb8e7090SChristoph Hellwig return btrfs_ioctl_snap_create(file, (void __user *)arg); 1034f46b5a66SChristoph Hellwig case BTRFS_IOC_DEFRAG: 1035f46b5a66SChristoph Hellwig return btrfs_ioctl_defrag(file); 1036f46b5a66SChristoph Hellwig case BTRFS_IOC_RESIZE: 1037f46b5a66SChristoph Hellwig return btrfs_ioctl_resize(root, (void __user *)arg); 1038f46b5a66SChristoph Hellwig case BTRFS_IOC_ADD_DEV: 1039f46b5a66SChristoph Hellwig return btrfs_ioctl_add_dev(root, (void __user *)arg); 1040f46b5a66SChristoph Hellwig case BTRFS_IOC_RM_DEV: 1041f46b5a66SChristoph Hellwig return btrfs_ioctl_rm_dev(root, (void __user *)arg); 1042f46b5a66SChristoph Hellwig case BTRFS_IOC_BALANCE: 1043f46b5a66SChristoph Hellwig return btrfs_balance(root->fs_info->dev_root); 1044f46b5a66SChristoph Hellwig case BTRFS_IOC_CLONE: 1045c5c9cd4dSSage Weil return btrfs_ioctl_clone(file, arg, 0, 0, 0); 1046c5c9cd4dSSage Weil case BTRFS_IOC_CLONE_RANGE: 1047c5c9cd4dSSage Weil return btrfs_ioctl_clone_range(file, arg); 1048f46b5a66SChristoph Hellwig case BTRFS_IOC_TRANS_START: 1049f46b5a66SChristoph Hellwig return btrfs_ioctl_trans_start(file); 1050f46b5a66SChristoph Hellwig case BTRFS_IOC_TRANS_END: 1051f46b5a66SChristoph Hellwig return btrfs_ioctl_trans_end(file); 1052f46b5a66SChristoph Hellwig case BTRFS_IOC_SYNC: 1053ea8c2819SChris Mason btrfs_start_delalloc_inodes(root); 1054f46b5a66SChristoph Hellwig btrfs_sync_fs(file->f_dentry->d_sb, 1); 1055f46b5a66SChristoph Hellwig return 0; 1056f46b5a66SChristoph Hellwig } 1057f46b5a66SChristoph Hellwig 1058f46b5a66SChristoph Hellwig return -ENOTTY; 1059f46b5a66SChristoph Hellwig } 1060