1f46b5a66SChristoph Hellwig /* 2f46b5a66SChristoph Hellwig * Copyright (C) 2007 Oracle. All rights reserved. 3f46b5a66SChristoph Hellwig * 4f46b5a66SChristoph Hellwig * This program is free software; you can redistribute it and/or 5f46b5a66SChristoph Hellwig * modify it under the terms of the GNU General Public 6f46b5a66SChristoph Hellwig * License v2 as published by the Free Software Foundation. 7f46b5a66SChristoph Hellwig * 8f46b5a66SChristoph Hellwig * This program is distributed in the hope that it will be useful, 9f46b5a66SChristoph Hellwig * but WITHOUT ANY WARRANTY; without even the implied warranty of 10f46b5a66SChristoph Hellwig * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 11f46b5a66SChristoph Hellwig * General Public License for more details. 12f46b5a66SChristoph Hellwig * 13f46b5a66SChristoph Hellwig * You should have received a copy of the GNU General Public 14f46b5a66SChristoph Hellwig * License along with this program; if not, write to the 15f46b5a66SChristoph Hellwig * Free Software Foundation, Inc., 59 Temple Place - Suite 330, 16f46b5a66SChristoph Hellwig * Boston, MA 021110-1307, USA. 17f46b5a66SChristoph Hellwig */ 18f46b5a66SChristoph Hellwig 19f46b5a66SChristoph Hellwig #include <linux/kernel.h> 20f46b5a66SChristoph Hellwig #include <linux/bio.h> 21f46b5a66SChristoph Hellwig #include <linux/buffer_head.h> 22f46b5a66SChristoph Hellwig #include <linux/file.h> 23f46b5a66SChristoph Hellwig #include <linux/fs.h> 24cb8e7090SChristoph Hellwig #include <linux/fsnotify.h> 25f46b5a66SChristoph Hellwig #include <linux/pagemap.h> 26f46b5a66SChristoph Hellwig #include <linux/highmem.h> 27f46b5a66SChristoph Hellwig #include <linux/time.h> 28f46b5a66SChristoph Hellwig #include <linux/init.h> 29f46b5a66SChristoph Hellwig #include <linux/string.h> 30f46b5a66SChristoph Hellwig #include <linux/backing-dev.h> 31cb8e7090SChristoph Hellwig #include <linux/mount.h> 32f46b5a66SChristoph Hellwig #include <linux/mpage.h> 33cb8e7090SChristoph Hellwig #include <linux/namei.h> 34f46b5a66SChristoph Hellwig #include <linux/swap.h> 35f46b5a66SChristoph Hellwig #include <linux/writeback.h> 36f46b5a66SChristoph Hellwig #include <linux/statfs.h> 37f46b5a66SChristoph Hellwig #include <linux/compat.h> 38f46b5a66SChristoph Hellwig #include <linux/bit_spinlock.h> 39cb8e7090SChristoph Hellwig #include <linux/security.h> 40f46b5a66SChristoph Hellwig #include <linux/xattr.h> 417ea394f1SYan Zheng #include <linux/vmalloc.h> 424b4e25f2SChris Mason #include "compat.h" 43f46b5a66SChristoph Hellwig #include "ctree.h" 44f46b5a66SChristoph Hellwig #include "disk-io.h" 45f46b5a66SChristoph Hellwig #include "transaction.h" 46f46b5a66SChristoph Hellwig #include "btrfs_inode.h" 47f46b5a66SChristoph Hellwig #include "ioctl.h" 48f46b5a66SChristoph Hellwig #include "print-tree.h" 49f46b5a66SChristoph Hellwig #include "volumes.h" 50925baeddSChris Mason #include "locking.h" 5198d377a0STARUISI Hiroaki #include "ctree.h" 52f46b5a66SChristoph Hellwig 536cbff00fSChristoph Hellwig /* Mask out flags that are inappropriate for the given type of inode. */ 546cbff00fSChristoph Hellwig static inline __u32 btrfs_mask_flags(umode_t mode, __u32 flags) 556cbff00fSChristoph Hellwig { 566cbff00fSChristoph Hellwig if (S_ISDIR(mode)) 576cbff00fSChristoph Hellwig return flags; 586cbff00fSChristoph Hellwig else if (S_ISREG(mode)) 596cbff00fSChristoph Hellwig return flags & ~FS_DIRSYNC_FL; 606cbff00fSChristoph Hellwig else 616cbff00fSChristoph Hellwig return flags & (FS_NODUMP_FL | FS_NOATIME_FL); 626cbff00fSChristoph Hellwig } 63f46b5a66SChristoph Hellwig 646cbff00fSChristoph Hellwig /* 656cbff00fSChristoph Hellwig * Export inode flags to the format expected by the FS_IOC_GETFLAGS ioctl. 666cbff00fSChristoph Hellwig */ 676cbff00fSChristoph Hellwig static unsigned int btrfs_flags_to_ioctl(unsigned int flags) 686cbff00fSChristoph Hellwig { 696cbff00fSChristoph Hellwig unsigned int iflags = 0; 706cbff00fSChristoph Hellwig 716cbff00fSChristoph Hellwig if (flags & BTRFS_INODE_SYNC) 726cbff00fSChristoph Hellwig iflags |= FS_SYNC_FL; 736cbff00fSChristoph Hellwig if (flags & BTRFS_INODE_IMMUTABLE) 746cbff00fSChristoph Hellwig iflags |= FS_IMMUTABLE_FL; 756cbff00fSChristoph Hellwig if (flags & BTRFS_INODE_APPEND) 766cbff00fSChristoph Hellwig iflags |= FS_APPEND_FL; 776cbff00fSChristoph Hellwig if (flags & BTRFS_INODE_NODUMP) 786cbff00fSChristoph Hellwig iflags |= FS_NODUMP_FL; 796cbff00fSChristoph Hellwig if (flags & BTRFS_INODE_NOATIME) 806cbff00fSChristoph Hellwig iflags |= FS_NOATIME_FL; 816cbff00fSChristoph Hellwig if (flags & BTRFS_INODE_DIRSYNC) 826cbff00fSChristoph Hellwig iflags |= FS_DIRSYNC_FL; 836cbff00fSChristoph Hellwig 846cbff00fSChristoph Hellwig return iflags; 856cbff00fSChristoph Hellwig } 866cbff00fSChristoph Hellwig 876cbff00fSChristoph Hellwig /* 886cbff00fSChristoph Hellwig * Update inode->i_flags based on the btrfs internal flags. 896cbff00fSChristoph Hellwig */ 906cbff00fSChristoph Hellwig void btrfs_update_iflags(struct inode *inode) 916cbff00fSChristoph Hellwig { 926cbff00fSChristoph Hellwig struct btrfs_inode *ip = BTRFS_I(inode); 936cbff00fSChristoph Hellwig 946cbff00fSChristoph Hellwig inode->i_flags &= ~(S_SYNC|S_APPEND|S_IMMUTABLE|S_NOATIME|S_DIRSYNC); 956cbff00fSChristoph Hellwig 966cbff00fSChristoph Hellwig if (ip->flags & BTRFS_INODE_SYNC) 976cbff00fSChristoph Hellwig inode->i_flags |= S_SYNC; 986cbff00fSChristoph Hellwig if (ip->flags & BTRFS_INODE_IMMUTABLE) 996cbff00fSChristoph Hellwig inode->i_flags |= S_IMMUTABLE; 1006cbff00fSChristoph Hellwig if (ip->flags & BTRFS_INODE_APPEND) 1016cbff00fSChristoph Hellwig inode->i_flags |= S_APPEND; 1026cbff00fSChristoph Hellwig if (ip->flags & BTRFS_INODE_NOATIME) 1036cbff00fSChristoph Hellwig inode->i_flags |= S_NOATIME; 1046cbff00fSChristoph Hellwig if (ip->flags & BTRFS_INODE_DIRSYNC) 1056cbff00fSChristoph Hellwig inode->i_flags |= S_DIRSYNC; 1066cbff00fSChristoph Hellwig } 1076cbff00fSChristoph Hellwig 1086cbff00fSChristoph Hellwig /* 1096cbff00fSChristoph Hellwig * Inherit flags from the parent inode. 1106cbff00fSChristoph Hellwig * 1116cbff00fSChristoph Hellwig * Unlike extN we don't have any flags we don't want to inherit currently. 1126cbff00fSChristoph Hellwig */ 1136cbff00fSChristoph Hellwig void btrfs_inherit_iflags(struct inode *inode, struct inode *dir) 1146cbff00fSChristoph Hellwig { 1150b4dcea5SChris Mason unsigned int flags; 1160b4dcea5SChris Mason 1170b4dcea5SChris Mason if (!dir) 1180b4dcea5SChris Mason return; 1190b4dcea5SChris Mason 1200b4dcea5SChris Mason flags = BTRFS_I(dir)->flags; 1216cbff00fSChristoph Hellwig 1226cbff00fSChristoph Hellwig if (S_ISREG(inode->i_mode)) 1236cbff00fSChristoph Hellwig flags &= ~BTRFS_INODE_DIRSYNC; 1246cbff00fSChristoph Hellwig else if (!S_ISDIR(inode->i_mode)) 1256cbff00fSChristoph Hellwig flags &= (BTRFS_INODE_NODUMP | BTRFS_INODE_NOATIME); 1266cbff00fSChristoph Hellwig 1276cbff00fSChristoph Hellwig BTRFS_I(inode)->flags = flags; 1286cbff00fSChristoph Hellwig btrfs_update_iflags(inode); 1296cbff00fSChristoph Hellwig } 1306cbff00fSChristoph Hellwig 1316cbff00fSChristoph Hellwig static int btrfs_ioctl_getflags(struct file *file, void __user *arg) 1326cbff00fSChristoph Hellwig { 1336cbff00fSChristoph Hellwig struct btrfs_inode *ip = BTRFS_I(file->f_path.dentry->d_inode); 1346cbff00fSChristoph Hellwig unsigned int flags = btrfs_flags_to_ioctl(ip->flags); 1356cbff00fSChristoph Hellwig 1366cbff00fSChristoph Hellwig if (copy_to_user(arg, &flags, sizeof(flags))) 1376cbff00fSChristoph Hellwig return -EFAULT; 1386cbff00fSChristoph Hellwig return 0; 1396cbff00fSChristoph Hellwig } 1406cbff00fSChristoph Hellwig 1416cbff00fSChristoph Hellwig static int btrfs_ioctl_setflags(struct file *file, void __user *arg) 1426cbff00fSChristoph Hellwig { 1436cbff00fSChristoph Hellwig struct inode *inode = file->f_path.dentry->d_inode; 1446cbff00fSChristoph Hellwig struct btrfs_inode *ip = BTRFS_I(inode); 1456cbff00fSChristoph Hellwig struct btrfs_root *root = ip->root; 1466cbff00fSChristoph Hellwig struct btrfs_trans_handle *trans; 1476cbff00fSChristoph Hellwig unsigned int flags, oldflags; 1486cbff00fSChristoph Hellwig int ret; 1496cbff00fSChristoph Hellwig 1506cbff00fSChristoph Hellwig if (copy_from_user(&flags, arg, sizeof(flags))) 1516cbff00fSChristoph Hellwig return -EFAULT; 1526cbff00fSChristoph Hellwig 1536cbff00fSChristoph Hellwig if (flags & ~(FS_IMMUTABLE_FL | FS_APPEND_FL | \ 1546cbff00fSChristoph Hellwig FS_NOATIME_FL | FS_NODUMP_FL | \ 1556cbff00fSChristoph Hellwig FS_SYNC_FL | FS_DIRSYNC_FL)) 1566cbff00fSChristoph Hellwig return -EOPNOTSUPP; 1576cbff00fSChristoph Hellwig 1586cbff00fSChristoph Hellwig if (!is_owner_or_cap(inode)) 1596cbff00fSChristoph Hellwig return -EACCES; 1606cbff00fSChristoph Hellwig 1616cbff00fSChristoph Hellwig mutex_lock(&inode->i_mutex); 1626cbff00fSChristoph Hellwig 1636cbff00fSChristoph Hellwig flags = btrfs_mask_flags(inode->i_mode, flags); 1646cbff00fSChristoph Hellwig oldflags = btrfs_flags_to_ioctl(ip->flags); 1656cbff00fSChristoph Hellwig if ((flags ^ oldflags) & (FS_APPEND_FL | FS_IMMUTABLE_FL)) { 1666cbff00fSChristoph Hellwig if (!capable(CAP_LINUX_IMMUTABLE)) { 1676cbff00fSChristoph Hellwig ret = -EPERM; 1686cbff00fSChristoph Hellwig goto out_unlock; 1696cbff00fSChristoph Hellwig } 1706cbff00fSChristoph Hellwig } 1716cbff00fSChristoph Hellwig 1726cbff00fSChristoph Hellwig ret = mnt_want_write(file->f_path.mnt); 1736cbff00fSChristoph Hellwig if (ret) 1746cbff00fSChristoph Hellwig goto out_unlock; 1756cbff00fSChristoph Hellwig 1766cbff00fSChristoph Hellwig if (flags & FS_SYNC_FL) 1776cbff00fSChristoph Hellwig ip->flags |= BTRFS_INODE_SYNC; 1786cbff00fSChristoph Hellwig else 1796cbff00fSChristoph Hellwig ip->flags &= ~BTRFS_INODE_SYNC; 1806cbff00fSChristoph Hellwig if (flags & FS_IMMUTABLE_FL) 1816cbff00fSChristoph Hellwig ip->flags |= BTRFS_INODE_IMMUTABLE; 1826cbff00fSChristoph Hellwig else 1836cbff00fSChristoph Hellwig ip->flags &= ~BTRFS_INODE_IMMUTABLE; 1846cbff00fSChristoph Hellwig if (flags & FS_APPEND_FL) 1856cbff00fSChristoph Hellwig ip->flags |= BTRFS_INODE_APPEND; 1866cbff00fSChristoph Hellwig else 1876cbff00fSChristoph Hellwig ip->flags &= ~BTRFS_INODE_APPEND; 1886cbff00fSChristoph Hellwig if (flags & FS_NODUMP_FL) 1896cbff00fSChristoph Hellwig ip->flags |= BTRFS_INODE_NODUMP; 1906cbff00fSChristoph Hellwig else 1916cbff00fSChristoph Hellwig ip->flags &= ~BTRFS_INODE_NODUMP; 1926cbff00fSChristoph Hellwig if (flags & FS_NOATIME_FL) 1936cbff00fSChristoph Hellwig ip->flags |= BTRFS_INODE_NOATIME; 1946cbff00fSChristoph Hellwig else 1956cbff00fSChristoph Hellwig ip->flags &= ~BTRFS_INODE_NOATIME; 1966cbff00fSChristoph Hellwig if (flags & FS_DIRSYNC_FL) 1976cbff00fSChristoph Hellwig ip->flags |= BTRFS_INODE_DIRSYNC; 1986cbff00fSChristoph Hellwig else 1996cbff00fSChristoph Hellwig ip->flags &= ~BTRFS_INODE_DIRSYNC; 2006cbff00fSChristoph Hellwig 2016cbff00fSChristoph Hellwig 2026cbff00fSChristoph Hellwig trans = btrfs_join_transaction(root, 1); 2036cbff00fSChristoph Hellwig BUG_ON(!trans); 2046cbff00fSChristoph Hellwig 2056cbff00fSChristoph Hellwig ret = btrfs_update_inode(trans, root, inode); 2066cbff00fSChristoph Hellwig BUG_ON(ret); 2076cbff00fSChristoph Hellwig 2086cbff00fSChristoph Hellwig btrfs_update_iflags(inode); 2096cbff00fSChristoph Hellwig inode->i_ctime = CURRENT_TIME; 2106cbff00fSChristoph Hellwig btrfs_end_transaction(trans, root); 2116cbff00fSChristoph Hellwig 2126cbff00fSChristoph Hellwig mnt_drop_write(file->f_path.mnt); 2136cbff00fSChristoph Hellwig out_unlock: 2146cbff00fSChristoph Hellwig mutex_unlock(&inode->i_mutex); 2156cbff00fSChristoph Hellwig return 0; 2166cbff00fSChristoph Hellwig } 2176cbff00fSChristoph Hellwig 2186cbff00fSChristoph Hellwig static int btrfs_ioctl_getversion(struct file *file, int __user *arg) 2196cbff00fSChristoph Hellwig { 2206cbff00fSChristoph Hellwig struct inode *inode = file->f_path.dentry->d_inode; 2216cbff00fSChristoph Hellwig 2226cbff00fSChristoph Hellwig return put_user(inode->i_generation, arg); 2236cbff00fSChristoph Hellwig } 224f46b5a66SChristoph Hellwig 225cb8e7090SChristoph Hellwig static noinline int create_subvol(struct btrfs_root *root, 226cb8e7090SChristoph Hellwig struct dentry *dentry, 227cb8e7090SChristoph Hellwig char *name, int namelen) 228f46b5a66SChristoph Hellwig { 229f46b5a66SChristoph Hellwig struct btrfs_trans_handle *trans; 230f46b5a66SChristoph Hellwig struct btrfs_key key; 231f46b5a66SChristoph Hellwig struct btrfs_root_item root_item; 232f46b5a66SChristoph Hellwig struct btrfs_inode_item *inode_item; 233f46b5a66SChristoph Hellwig struct extent_buffer *leaf; 23476dda93cSYan, Zheng struct btrfs_root *new_root; 23576dda93cSYan, Zheng struct inode *dir = dentry->d_parent->d_inode; 236f46b5a66SChristoph Hellwig int ret; 237f46b5a66SChristoph Hellwig int err; 238f46b5a66SChristoph Hellwig u64 objectid; 239f46b5a66SChristoph Hellwig u64 new_dirid = BTRFS_FIRST_FREE_OBJECTID; 2403de4586cSChris Mason u64 index = 0; 241f46b5a66SChristoph Hellwig 2429ed74f2dSJosef Bacik /* 2439ed74f2dSJosef Bacik * 1 - inode item 2449ed74f2dSJosef Bacik * 2 - refs 2459ed74f2dSJosef Bacik * 1 - root item 2469ed74f2dSJosef Bacik * 2 - dir items 2479ed74f2dSJosef Bacik */ 2489ed74f2dSJosef Bacik ret = btrfs_reserve_metadata_space(root, 6); 249f46b5a66SChristoph Hellwig if (ret) 25076dda93cSYan, Zheng return ret; 251f46b5a66SChristoph Hellwig 252f46b5a66SChristoph Hellwig trans = btrfs_start_transaction(root, 1); 253f46b5a66SChristoph Hellwig BUG_ON(!trans); 254f46b5a66SChristoph Hellwig 255f46b5a66SChristoph Hellwig ret = btrfs_find_free_objectid(trans, root->fs_info->tree_root, 256f46b5a66SChristoph Hellwig 0, &objectid); 257f46b5a66SChristoph Hellwig if (ret) 258f46b5a66SChristoph Hellwig goto fail; 259f46b5a66SChristoph Hellwig 2605d4f98a2SYan Zheng leaf = btrfs_alloc_free_block(trans, root, root->leafsize, 2615d4f98a2SYan Zheng 0, objectid, NULL, 0, 0, 0); 2628e8a1e31SJosef Bacik if (IS_ERR(leaf)) { 2638e8a1e31SJosef Bacik ret = PTR_ERR(leaf); 2648e8a1e31SJosef Bacik goto fail; 2658e8a1e31SJosef Bacik } 266f46b5a66SChristoph Hellwig 2675d4f98a2SYan Zheng memset_extent_buffer(leaf, 0, 0, sizeof(struct btrfs_header)); 268f46b5a66SChristoph Hellwig btrfs_set_header_bytenr(leaf, leaf->start); 269f46b5a66SChristoph Hellwig btrfs_set_header_generation(leaf, trans->transid); 2705d4f98a2SYan Zheng btrfs_set_header_backref_rev(leaf, BTRFS_MIXED_BACKREF_REV); 271f46b5a66SChristoph Hellwig btrfs_set_header_owner(leaf, objectid); 272f46b5a66SChristoph Hellwig 273f46b5a66SChristoph Hellwig write_extent_buffer(leaf, root->fs_info->fsid, 274f46b5a66SChristoph Hellwig (unsigned long)btrfs_header_fsid(leaf), 275f46b5a66SChristoph Hellwig BTRFS_FSID_SIZE); 2765d4f98a2SYan Zheng write_extent_buffer(leaf, root->fs_info->chunk_tree_uuid, 2775d4f98a2SYan Zheng (unsigned long)btrfs_header_chunk_tree_uuid(leaf), 2785d4f98a2SYan Zheng BTRFS_UUID_SIZE); 279f46b5a66SChristoph Hellwig btrfs_mark_buffer_dirty(leaf); 280f46b5a66SChristoph Hellwig 281f46b5a66SChristoph Hellwig inode_item = &root_item.inode; 282f46b5a66SChristoph Hellwig memset(inode_item, 0, sizeof(*inode_item)); 283f46b5a66SChristoph Hellwig inode_item->generation = cpu_to_le64(1); 284f46b5a66SChristoph Hellwig inode_item->size = cpu_to_le64(3); 285f46b5a66SChristoph Hellwig inode_item->nlink = cpu_to_le32(1); 286a76a3cd4SYan Zheng inode_item->nbytes = cpu_to_le64(root->leafsize); 287f46b5a66SChristoph Hellwig inode_item->mode = cpu_to_le32(S_IFDIR | 0755); 288f46b5a66SChristoph Hellwig 289f46b5a66SChristoph Hellwig btrfs_set_root_bytenr(&root_item, leaf->start); 29084234f3aSYan Zheng btrfs_set_root_generation(&root_item, trans->transid); 291f46b5a66SChristoph Hellwig btrfs_set_root_level(&root_item, 0); 292f46b5a66SChristoph Hellwig btrfs_set_root_refs(&root_item, 1); 29386b9f2ecSYan, Zheng btrfs_set_root_used(&root_item, leaf->len); 29480ff3856SYan Zheng btrfs_set_root_last_snapshot(&root_item, 0); 295f46b5a66SChristoph Hellwig 296f46b5a66SChristoph Hellwig memset(&root_item.drop_progress, 0, sizeof(root_item.drop_progress)); 297f46b5a66SChristoph Hellwig root_item.drop_level = 0; 298f46b5a66SChristoph Hellwig 299925baeddSChris Mason btrfs_tree_unlock(leaf); 300f46b5a66SChristoph Hellwig free_extent_buffer(leaf); 301f46b5a66SChristoph Hellwig leaf = NULL; 302f46b5a66SChristoph Hellwig 303f46b5a66SChristoph Hellwig btrfs_set_root_dirid(&root_item, new_dirid); 304f46b5a66SChristoph Hellwig 305f46b5a66SChristoph Hellwig key.objectid = objectid; 3065d4f98a2SYan Zheng key.offset = 0; 307f46b5a66SChristoph Hellwig btrfs_set_key_type(&key, BTRFS_ROOT_ITEM_KEY); 308f46b5a66SChristoph Hellwig ret = btrfs_insert_root(trans, root->fs_info->tree_root, &key, 309f46b5a66SChristoph Hellwig &root_item); 310f46b5a66SChristoph Hellwig if (ret) 311f46b5a66SChristoph Hellwig goto fail; 312f46b5a66SChristoph Hellwig 31376dda93cSYan, Zheng key.offset = (u64)-1; 31476dda93cSYan, Zheng new_root = btrfs_read_fs_root_no_name(root->fs_info, &key); 31576dda93cSYan, Zheng BUG_ON(IS_ERR(new_root)); 31676dda93cSYan, Zheng 31776dda93cSYan, Zheng btrfs_record_root_in_trans(trans, new_root); 31876dda93cSYan, Zheng 31976dda93cSYan, Zheng ret = btrfs_create_subvol_root(trans, new_root, new_dirid, 32076dda93cSYan, Zheng BTRFS_I(dir)->block_group); 321f46b5a66SChristoph Hellwig /* 322f46b5a66SChristoph Hellwig * insert the directory item 323f46b5a66SChristoph Hellwig */ 3243de4586cSChris Mason ret = btrfs_set_inode_index(dir, &index); 3253de4586cSChris Mason BUG_ON(ret); 3263de4586cSChris Mason 3273de4586cSChris Mason ret = btrfs_insert_dir_item(trans, root, 328f46b5a66SChristoph Hellwig name, namelen, dir->i_ino, &key, 3293de4586cSChris Mason BTRFS_FT_DIR, index); 330f46b5a66SChristoph Hellwig if (ret) 331f46b5a66SChristoph Hellwig goto fail; 3320660b5afSChris Mason 33352c26179SYan Zheng btrfs_i_size_write(dir, dir->i_size + namelen * 2); 33452c26179SYan Zheng ret = btrfs_update_inode(trans, root, dir); 33552c26179SYan Zheng BUG_ON(ret); 33652c26179SYan Zheng 3370660b5afSChris Mason ret = btrfs_add_root_ref(trans, root->fs_info->tree_root, 3384df27c4dSYan, Zheng objectid, root->root_key.objectid, 3390660b5afSChris Mason dir->i_ino, index, name, namelen); 34076dda93cSYan, Zheng 3410660b5afSChris Mason BUG_ON(ret); 3420660b5afSChris Mason 34376dda93cSYan, Zheng d_instantiate(dentry, btrfs_lookup_dentry(dir, dentry)); 344f46b5a66SChristoph Hellwig fail: 34576dda93cSYan, Zheng err = btrfs_commit_transaction(trans, root); 346f46b5a66SChristoph Hellwig if (err && !ret) 347f46b5a66SChristoph Hellwig ret = err; 3489ed74f2dSJosef Bacik 3499ed74f2dSJosef Bacik btrfs_unreserve_metadata_space(root, 6); 350f46b5a66SChristoph Hellwig return ret; 351f46b5a66SChristoph Hellwig } 352f46b5a66SChristoph Hellwig 3533de4586cSChris Mason static int create_snapshot(struct btrfs_root *root, struct dentry *dentry, 3543de4586cSChris Mason char *name, int namelen) 355f46b5a66SChristoph Hellwig { 3562e4bfab9SYan, Zheng struct inode *inode; 357f46b5a66SChristoph Hellwig struct btrfs_pending_snapshot *pending_snapshot; 358f46b5a66SChristoph Hellwig struct btrfs_trans_handle *trans; 3592e4bfab9SYan, Zheng int ret; 360f46b5a66SChristoph Hellwig 361f46b5a66SChristoph Hellwig if (!root->ref_cows) 362f46b5a66SChristoph Hellwig return -EINVAL; 363f46b5a66SChristoph Hellwig 3649ed74f2dSJosef Bacik /* 3659ed74f2dSJosef Bacik * 1 - inode item 3669ed74f2dSJosef Bacik * 2 - refs 3679ed74f2dSJosef Bacik * 1 - root item 3689ed74f2dSJosef Bacik * 2 - dir items 3699ed74f2dSJosef Bacik */ 3709ed74f2dSJosef Bacik ret = btrfs_reserve_metadata_space(root, 6); 371f46b5a66SChristoph Hellwig if (ret) 3722e4bfab9SYan, Zheng goto fail; 373f46b5a66SChristoph Hellwig 3743de4586cSChris Mason pending_snapshot = kzalloc(sizeof(*pending_snapshot), GFP_NOFS); 375f46b5a66SChristoph Hellwig if (!pending_snapshot) { 376f46b5a66SChristoph Hellwig ret = -ENOMEM; 3779ed74f2dSJosef Bacik btrfs_unreserve_metadata_space(root, 6); 3782e4bfab9SYan, Zheng goto fail; 379f46b5a66SChristoph Hellwig } 380f46b5a66SChristoph Hellwig pending_snapshot->name = kmalloc(namelen + 1, GFP_NOFS); 381f46b5a66SChristoph Hellwig if (!pending_snapshot->name) { 382f46b5a66SChristoph Hellwig ret = -ENOMEM; 383f46b5a66SChristoph Hellwig kfree(pending_snapshot); 3849ed74f2dSJosef Bacik btrfs_unreserve_metadata_space(root, 6); 3852e4bfab9SYan, Zheng goto fail; 386f46b5a66SChristoph Hellwig } 387f46b5a66SChristoph Hellwig memcpy(pending_snapshot->name, name, namelen); 388f46b5a66SChristoph Hellwig pending_snapshot->name[namelen] = '\0'; 3893de4586cSChris Mason pending_snapshot->dentry = dentry; 390f46b5a66SChristoph Hellwig trans = btrfs_start_transaction(root, 1); 391f46b5a66SChristoph Hellwig BUG_ON(!trans); 392f46b5a66SChristoph Hellwig pending_snapshot->root = root; 393f46b5a66SChristoph Hellwig list_add(&pending_snapshot->list, 394f46b5a66SChristoph Hellwig &trans->transaction->pending_snapshots); 3952e4bfab9SYan, Zheng ret = btrfs_commit_transaction(trans, root); 3962e4bfab9SYan, Zheng BUG_ON(ret); 3972e4bfab9SYan, Zheng btrfs_unreserve_metadata_space(root, 6); 398f46b5a66SChristoph Hellwig 3992e4bfab9SYan, Zheng inode = btrfs_lookup_dentry(dentry->d_parent->d_inode, dentry); 4002e4bfab9SYan, Zheng if (IS_ERR(inode)) { 4012e4bfab9SYan, Zheng ret = PTR_ERR(inode); 4022e4bfab9SYan, Zheng goto fail; 4032e4bfab9SYan, Zheng } 4042e4bfab9SYan, Zheng BUG_ON(!inode); 4052e4bfab9SYan, Zheng d_instantiate(dentry, inode); 4062e4bfab9SYan, Zheng ret = 0; 4072e4bfab9SYan, Zheng fail: 408f46b5a66SChristoph Hellwig return ret; 409f46b5a66SChristoph Hellwig } 410f46b5a66SChristoph Hellwig 411cb8e7090SChristoph Hellwig /* copy of may_create in fs/namei.c() */ 412cb8e7090SChristoph Hellwig static inline int btrfs_may_create(struct inode *dir, struct dentry *child) 413cb8e7090SChristoph Hellwig { 414cb8e7090SChristoph Hellwig if (child->d_inode) 415cb8e7090SChristoph Hellwig return -EEXIST; 416cb8e7090SChristoph Hellwig if (IS_DEADDIR(dir)) 417cb8e7090SChristoph Hellwig return -ENOENT; 418cb8e7090SChristoph Hellwig return inode_permission(dir, MAY_WRITE | MAY_EXEC); 419cb8e7090SChristoph Hellwig } 420cb8e7090SChristoph Hellwig 421cb8e7090SChristoph Hellwig /* 422cb8e7090SChristoph Hellwig * Create a new subvolume below @parent. This is largely modeled after 423cb8e7090SChristoph Hellwig * sys_mkdirat and vfs_mkdir, but we only do a single component lookup 424cb8e7090SChristoph Hellwig * inside this filesystem so it's quite a bit simpler. 425cb8e7090SChristoph Hellwig */ 42676dda93cSYan, Zheng static noinline int btrfs_mksubvol(struct path *parent, 42776dda93cSYan, Zheng char *name, int namelen, 4283de4586cSChris Mason struct btrfs_root *snap_src) 429cb8e7090SChristoph Hellwig { 43076dda93cSYan, Zheng struct inode *dir = parent->dentry->d_inode; 431cb8e7090SChristoph Hellwig struct dentry *dentry; 432cb8e7090SChristoph Hellwig int error; 433cb8e7090SChristoph Hellwig 43476dda93cSYan, Zheng mutex_lock_nested(&dir->i_mutex, I_MUTEX_PARENT); 435cb8e7090SChristoph Hellwig 436cb8e7090SChristoph Hellwig dentry = lookup_one_len(name, parent->dentry, namelen); 437cb8e7090SChristoph Hellwig error = PTR_ERR(dentry); 438cb8e7090SChristoph Hellwig if (IS_ERR(dentry)) 439cb8e7090SChristoph Hellwig goto out_unlock; 440cb8e7090SChristoph Hellwig 441cb8e7090SChristoph Hellwig error = -EEXIST; 442cb8e7090SChristoph Hellwig if (dentry->d_inode) 443cb8e7090SChristoph Hellwig goto out_dput; 444cb8e7090SChristoph Hellwig 445cb8e7090SChristoph Hellwig error = mnt_want_write(parent->mnt); 446cb8e7090SChristoph Hellwig if (error) 447cb8e7090SChristoph Hellwig goto out_dput; 448cb8e7090SChristoph Hellwig 44976dda93cSYan, Zheng error = btrfs_may_create(dir, dentry); 450cb8e7090SChristoph Hellwig if (error) 451cb8e7090SChristoph Hellwig goto out_drop_write; 452cb8e7090SChristoph Hellwig 45376dda93cSYan, Zheng down_read(&BTRFS_I(dir)->root->fs_info->subvol_sem); 45476dda93cSYan, Zheng 45576dda93cSYan, Zheng if (btrfs_root_refs(&BTRFS_I(dir)->root->root_item) == 0) 45676dda93cSYan, Zheng goto out_up_read; 45776dda93cSYan, Zheng 4583de4586cSChris Mason if (snap_src) { 45976dda93cSYan, Zheng error = create_snapshot(snap_src, dentry, 46076dda93cSYan, Zheng name, namelen); 4613de4586cSChris Mason } else { 46276dda93cSYan, Zheng error = create_subvol(BTRFS_I(dir)->root, dentry, 46376dda93cSYan, Zheng name, namelen); 4643de4586cSChris Mason } 46576dda93cSYan, Zheng if (!error) 46676dda93cSYan, Zheng fsnotify_mkdir(dir, dentry); 46776dda93cSYan, Zheng out_up_read: 46876dda93cSYan, Zheng up_read(&BTRFS_I(dir)->root->fs_info->subvol_sem); 469cb8e7090SChristoph Hellwig out_drop_write: 470cb8e7090SChristoph Hellwig mnt_drop_write(parent->mnt); 471cb8e7090SChristoph Hellwig out_dput: 472cb8e7090SChristoph Hellwig dput(dentry); 473cb8e7090SChristoph Hellwig out_unlock: 47476dda93cSYan, Zheng mutex_unlock(&dir->i_mutex); 475cb8e7090SChristoph Hellwig return error; 476cb8e7090SChristoph Hellwig } 477cb8e7090SChristoph Hellwig 478b2950863SChristoph Hellwig static int btrfs_defrag_file(struct file *file) 479f46b5a66SChristoph Hellwig { 480f46b5a66SChristoph Hellwig struct inode *inode = fdentry(file)->d_inode; 481f46b5a66SChristoph Hellwig struct btrfs_root *root = BTRFS_I(inode)->root; 482f46b5a66SChristoph Hellwig struct extent_io_tree *io_tree = &BTRFS_I(inode)->io_tree; 4833eaa2885SChris Mason struct btrfs_ordered_extent *ordered; 484f46b5a66SChristoph Hellwig struct page *page; 485f46b5a66SChristoph Hellwig unsigned long last_index; 486f46b5a66SChristoph Hellwig unsigned long ra_pages = root->fs_info->bdi.ra_pages; 487f46b5a66SChristoph Hellwig unsigned long total_read = 0; 488f46b5a66SChristoph Hellwig u64 page_start; 489f46b5a66SChristoph Hellwig u64 page_end; 490f46b5a66SChristoph Hellwig unsigned long i; 491f46b5a66SChristoph Hellwig int ret; 492f46b5a66SChristoph Hellwig 4936a63209fSJosef Bacik ret = btrfs_check_data_free_space(root, inode, inode->i_size); 494f46b5a66SChristoph Hellwig if (ret) 495f46b5a66SChristoph Hellwig return -ENOSPC; 496f46b5a66SChristoph Hellwig 497f46b5a66SChristoph Hellwig mutex_lock(&inode->i_mutex); 498f46b5a66SChristoph Hellwig last_index = inode->i_size >> PAGE_CACHE_SHIFT; 499f46b5a66SChristoph Hellwig for (i = 0; i <= last_index; i++) { 500f46b5a66SChristoph Hellwig if (total_read % ra_pages == 0) { 501f46b5a66SChristoph Hellwig btrfs_force_ra(inode->i_mapping, &file->f_ra, file, i, 502f46b5a66SChristoph Hellwig min(last_index, i + ra_pages - 1)); 503f46b5a66SChristoph Hellwig } 504f46b5a66SChristoph Hellwig total_read++; 5053eaa2885SChris Mason again: 506f46b5a66SChristoph Hellwig page = grab_cache_page(inode->i_mapping, i); 507f46b5a66SChristoph Hellwig if (!page) 508f46b5a66SChristoph Hellwig goto out_unlock; 509f46b5a66SChristoph Hellwig if (!PageUptodate(page)) { 510f46b5a66SChristoph Hellwig btrfs_readpage(NULL, page); 511f46b5a66SChristoph Hellwig lock_page(page); 512f46b5a66SChristoph Hellwig if (!PageUptodate(page)) { 513f46b5a66SChristoph Hellwig unlock_page(page); 514f46b5a66SChristoph Hellwig page_cache_release(page); 515f46b5a66SChristoph Hellwig goto out_unlock; 516f46b5a66SChristoph Hellwig } 517f46b5a66SChristoph Hellwig } 518f46b5a66SChristoph Hellwig 519f46b5a66SChristoph Hellwig wait_on_page_writeback(page); 520f46b5a66SChristoph Hellwig 521f46b5a66SChristoph Hellwig page_start = (u64)page->index << PAGE_CACHE_SHIFT; 522f46b5a66SChristoph Hellwig page_end = page_start + PAGE_CACHE_SIZE - 1; 523f46b5a66SChristoph Hellwig lock_extent(io_tree, page_start, page_end, GFP_NOFS); 5243eaa2885SChris Mason 5253eaa2885SChris Mason ordered = btrfs_lookup_ordered_extent(inode, page_start); 5263eaa2885SChris Mason if (ordered) { 5273eaa2885SChris Mason unlock_extent(io_tree, page_start, page_end, GFP_NOFS); 5283eaa2885SChris Mason unlock_page(page); 5293eaa2885SChris Mason page_cache_release(page); 5303eaa2885SChris Mason btrfs_start_ordered_extent(inode, ordered, 1); 5313eaa2885SChris Mason btrfs_put_ordered_extent(ordered); 5323eaa2885SChris Mason goto again; 5333eaa2885SChris Mason } 5343eaa2885SChris Mason set_page_extent_mapped(page); 5353eaa2885SChris Mason 536f87f057bSChris Mason /* 537f87f057bSChris Mason * this makes sure page_mkwrite is called on the 538f87f057bSChris Mason * page if it is dirtied again later 539f87f057bSChris Mason */ 540f87f057bSChris Mason clear_page_dirty_for_io(page); 541f87f057bSChris Mason 542ea8c2819SChris Mason btrfs_set_extent_delalloc(inode, page_start, page_end); 543f46b5a66SChristoph Hellwig set_page_dirty(page); 544a1ed835eSChris Mason unlock_extent(io_tree, page_start, page_end, GFP_NOFS); 545f46b5a66SChristoph Hellwig unlock_page(page); 546f46b5a66SChristoph Hellwig page_cache_release(page); 547f46b5a66SChristoph Hellwig balance_dirty_pages_ratelimited_nr(inode->i_mapping, 1); 548f46b5a66SChristoph Hellwig } 549f46b5a66SChristoph Hellwig 550f46b5a66SChristoph Hellwig out_unlock: 551f46b5a66SChristoph Hellwig mutex_unlock(&inode->i_mutex); 552f46b5a66SChristoph Hellwig return 0; 553f46b5a66SChristoph Hellwig } 554f46b5a66SChristoph Hellwig 55576dda93cSYan, Zheng static noinline int btrfs_ioctl_resize(struct btrfs_root *root, 55676dda93cSYan, Zheng void __user *arg) 557f46b5a66SChristoph Hellwig { 558f46b5a66SChristoph Hellwig u64 new_size; 559f46b5a66SChristoph Hellwig u64 old_size; 560f46b5a66SChristoph Hellwig u64 devid = 1; 561f46b5a66SChristoph Hellwig struct btrfs_ioctl_vol_args *vol_args; 562f46b5a66SChristoph Hellwig struct btrfs_trans_handle *trans; 563f46b5a66SChristoph Hellwig struct btrfs_device *device = NULL; 564f46b5a66SChristoph Hellwig char *sizestr; 565f46b5a66SChristoph Hellwig char *devstr = NULL; 566f46b5a66SChristoph Hellwig int ret = 0; 567f46b5a66SChristoph Hellwig int namelen; 568f46b5a66SChristoph Hellwig int mod = 0; 569f46b5a66SChristoph Hellwig 570c146afadSYan Zheng if (root->fs_info->sb->s_flags & MS_RDONLY) 571c146afadSYan Zheng return -EROFS; 572c146afadSYan Zheng 573e441d54dSChris Mason if (!capable(CAP_SYS_ADMIN)) 574e441d54dSChris Mason return -EPERM; 575e441d54dSChris Mason 576dae7b665SLi Zefan vol_args = memdup_user(arg, sizeof(*vol_args)); 577dae7b665SLi Zefan if (IS_ERR(vol_args)) 578dae7b665SLi Zefan return PTR_ERR(vol_args); 5795516e595SMark Fasheh 5805516e595SMark Fasheh vol_args->name[BTRFS_PATH_NAME_MAX] = '\0'; 581f46b5a66SChristoph Hellwig namelen = strlen(vol_args->name); 582f46b5a66SChristoph Hellwig 5837d9eb12cSChris Mason mutex_lock(&root->fs_info->volume_mutex); 584f46b5a66SChristoph Hellwig sizestr = vol_args->name; 585f46b5a66SChristoph Hellwig devstr = strchr(sizestr, ':'); 586f46b5a66SChristoph Hellwig if (devstr) { 587f46b5a66SChristoph Hellwig char *end; 588f46b5a66SChristoph Hellwig sizestr = devstr + 1; 589f46b5a66SChristoph Hellwig *devstr = '\0'; 590f46b5a66SChristoph Hellwig devstr = vol_args->name; 591f46b5a66SChristoph Hellwig devid = simple_strtoull(devstr, &end, 10); 59221380931SJoel Becker printk(KERN_INFO "resizing devid %llu\n", 59321380931SJoel Becker (unsigned long long)devid); 594f46b5a66SChristoph Hellwig } 5952b82032cSYan Zheng device = btrfs_find_device(root, devid, NULL, NULL); 596f46b5a66SChristoph Hellwig if (!device) { 59721380931SJoel Becker printk(KERN_INFO "resizer unable to find device %llu\n", 59821380931SJoel Becker (unsigned long long)devid); 599f46b5a66SChristoph Hellwig ret = -EINVAL; 600f46b5a66SChristoph Hellwig goto out_unlock; 601f46b5a66SChristoph Hellwig } 602f46b5a66SChristoph Hellwig if (!strcmp(sizestr, "max")) 603f46b5a66SChristoph Hellwig new_size = device->bdev->bd_inode->i_size; 604f46b5a66SChristoph Hellwig else { 605f46b5a66SChristoph Hellwig if (sizestr[0] == '-') { 606f46b5a66SChristoph Hellwig mod = -1; 607f46b5a66SChristoph Hellwig sizestr++; 608f46b5a66SChristoph Hellwig } else if (sizestr[0] == '+') { 609f46b5a66SChristoph Hellwig mod = 1; 610f46b5a66SChristoph Hellwig sizestr++; 611f46b5a66SChristoph Hellwig } 612f46b5a66SChristoph Hellwig new_size = btrfs_parse_size(sizestr); 613f46b5a66SChristoph Hellwig if (new_size == 0) { 614f46b5a66SChristoph Hellwig ret = -EINVAL; 615f46b5a66SChristoph Hellwig goto out_unlock; 616f46b5a66SChristoph Hellwig } 617f46b5a66SChristoph Hellwig } 618f46b5a66SChristoph Hellwig 619f46b5a66SChristoph Hellwig old_size = device->total_bytes; 620f46b5a66SChristoph Hellwig 621f46b5a66SChristoph Hellwig if (mod < 0) { 622f46b5a66SChristoph Hellwig if (new_size > old_size) { 623f46b5a66SChristoph Hellwig ret = -EINVAL; 624f46b5a66SChristoph Hellwig goto out_unlock; 625f46b5a66SChristoph Hellwig } 626f46b5a66SChristoph Hellwig new_size = old_size - new_size; 627f46b5a66SChristoph Hellwig } else if (mod > 0) { 628f46b5a66SChristoph Hellwig new_size = old_size + new_size; 629f46b5a66SChristoph Hellwig } 630f46b5a66SChristoph Hellwig 631f46b5a66SChristoph Hellwig if (new_size < 256 * 1024 * 1024) { 632f46b5a66SChristoph Hellwig ret = -EINVAL; 633f46b5a66SChristoph Hellwig goto out_unlock; 634f46b5a66SChristoph Hellwig } 635f46b5a66SChristoph Hellwig if (new_size > device->bdev->bd_inode->i_size) { 636f46b5a66SChristoph Hellwig ret = -EFBIG; 637f46b5a66SChristoph Hellwig goto out_unlock; 638f46b5a66SChristoph Hellwig } 639f46b5a66SChristoph Hellwig 640f46b5a66SChristoph Hellwig do_div(new_size, root->sectorsize); 641f46b5a66SChristoph Hellwig new_size *= root->sectorsize; 642f46b5a66SChristoph Hellwig 643f46b5a66SChristoph Hellwig printk(KERN_INFO "new size for %s is %llu\n", 644f46b5a66SChristoph Hellwig device->name, (unsigned long long)new_size); 645f46b5a66SChristoph Hellwig 646f46b5a66SChristoph Hellwig if (new_size > old_size) { 647f46b5a66SChristoph Hellwig trans = btrfs_start_transaction(root, 1); 648f46b5a66SChristoph Hellwig ret = btrfs_grow_device(trans, device, new_size); 649f46b5a66SChristoph Hellwig btrfs_commit_transaction(trans, root); 650f46b5a66SChristoph Hellwig } else { 651f46b5a66SChristoph Hellwig ret = btrfs_shrink_device(device, new_size); 652f46b5a66SChristoph Hellwig } 653f46b5a66SChristoph Hellwig 654f46b5a66SChristoph Hellwig out_unlock: 6557d9eb12cSChris Mason mutex_unlock(&root->fs_info->volume_mutex); 656f46b5a66SChristoph Hellwig kfree(vol_args); 657f46b5a66SChristoph Hellwig return ret; 658f46b5a66SChristoph Hellwig } 659f46b5a66SChristoph Hellwig 660cb8e7090SChristoph Hellwig static noinline int btrfs_ioctl_snap_create(struct file *file, 6613de4586cSChris Mason void __user *arg, int subvol) 662f46b5a66SChristoph Hellwig { 663cb8e7090SChristoph Hellwig struct btrfs_root *root = BTRFS_I(fdentry(file)->d_inode)->root; 664f46b5a66SChristoph Hellwig struct btrfs_ioctl_vol_args *vol_args; 6653de4586cSChris Mason struct file *src_file; 666f46b5a66SChristoph Hellwig int namelen; 6673de4586cSChris Mason int ret = 0; 668f46b5a66SChristoph Hellwig 669c146afadSYan Zheng if (root->fs_info->sb->s_flags & MS_RDONLY) 670c146afadSYan Zheng return -EROFS; 671c146afadSYan Zheng 672dae7b665SLi Zefan vol_args = memdup_user(arg, sizeof(*vol_args)); 673dae7b665SLi Zefan if (IS_ERR(vol_args)) 674dae7b665SLi Zefan return PTR_ERR(vol_args); 675f46b5a66SChristoph Hellwig 6765516e595SMark Fasheh vol_args->name[BTRFS_PATH_NAME_MAX] = '\0'; 677f46b5a66SChristoph Hellwig namelen = strlen(vol_args->name); 678f46b5a66SChristoph Hellwig if (strchr(vol_args->name, '/')) { 679f46b5a66SChristoph Hellwig ret = -EINVAL; 680f46b5a66SChristoph Hellwig goto out; 681f46b5a66SChristoph Hellwig } 682f46b5a66SChristoph Hellwig 6833de4586cSChris Mason if (subvol) { 68476dda93cSYan, Zheng ret = btrfs_mksubvol(&file->f_path, vol_args->name, namelen, 68576dda93cSYan, Zheng NULL); 686cb8e7090SChristoph Hellwig } else { 6873de4586cSChris Mason struct inode *src_inode; 6883de4586cSChris Mason src_file = fget(vol_args->fd); 6893de4586cSChris Mason if (!src_file) { 6903de4586cSChris Mason ret = -EINVAL; 6913de4586cSChris Mason goto out; 6923de4586cSChris Mason } 6933de4586cSChris Mason 6943de4586cSChris Mason src_inode = src_file->f_path.dentry->d_inode; 6953de4586cSChris Mason if (src_inode->i_sb != file->f_path.dentry->d_inode->i_sb) { 696d397712bSChris Mason printk(KERN_INFO "btrfs: Snapshot src from " 697d397712bSChris Mason "another FS\n"); 6983de4586cSChris Mason ret = -EINVAL; 6993de4586cSChris Mason fput(src_file); 7003de4586cSChris Mason goto out; 7013de4586cSChris Mason } 70276dda93cSYan, Zheng ret = btrfs_mksubvol(&file->f_path, vol_args->name, namelen, 70376dda93cSYan, Zheng BTRFS_I(src_inode)->root); 7043de4586cSChris Mason fput(src_file); 705cb8e7090SChristoph Hellwig } 706f46b5a66SChristoph Hellwig out: 707f46b5a66SChristoph Hellwig kfree(vol_args); 708f46b5a66SChristoph Hellwig return ret; 709f46b5a66SChristoph Hellwig } 710f46b5a66SChristoph Hellwig 71176dda93cSYan, Zheng /* 71276dda93cSYan, Zheng * helper to check if the subvolume references other subvolumes 71376dda93cSYan, Zheng */ 71476dda93cSYan, Zheng static noinline int may_destroy_subvol(struct btrfs_root *root) 71576dda93cSYan, Zheng { 71676dda93cSYan, Zheng struct btrfs_path *path; 71776dda93cSYan, Zheng struct btrfs_key key; 71876dda93cSYan, Zheng int ret; 71976dda93cSYan, Zheng 72076dda93cSYan, Zheng path = btrfs_alloc_path(); 72176dda93cSYan, Zheng if (!path) 72276dda93cSYan, Zheng return -ENOMEM; 72376dda93cSYan, Zheng 72476dda93cSYan, Zheng key.objectid = root->root_key.objectid; 72576dda93cSYan, Zheng key.type = BTRFS_ROOT_REF_KEY; 72676dda93cSYan, Zheng key.offset = (u64)-1; 72776dda93cSYan, Zheng 72876dda93cSYan, Zheng ret = btrfs_search_slot(NULL, root->fs_info->tree_root, 72976dda93cSYan, Zheng &key, path, 0, 0); 73076dda93cSYan, Zheng if (ret < 0) 73176dda93cSYan, Zheng goto out; 73276dda93cSYan, Zheng BUG_ON(ret == 0); 73376dda93cSYan, Zheng 73476dda93cSYan, Zheng ret = 0; 73576dda93cSYan, Zheng if (path->slots[0] > 0) { 73676dda93cSYan, Zheng path->slots[0]--; 73776dda93cSYan, Zheng btrfs_item_key_to_cpu(path->nodes[0], &key, path->slots[0]); 73876dda93cSYan, Zheng if (key.objectid == root->root_key.objectid && 73976dda93cSYan, Zheng key.type == BTRFS_ROOT_REF_KEY) 74076dda93cSYan, Zheng ret = -ENOTEMPTY; 74176dda93cSYan, Zheng } 74276dda93cSYan, Zheng out: 74376dda93cSYan, Zheng btrfs_free_path(path); 74476dda93cSYan, Zheng return ret; 74576dda93cSYan, Zheng } 74676dda93cSYan, Zheng 74798d377a0STARUISI Hiroaki /* 74898d377a0STARUISI Hiroaki Search INODE_REFs to identify path name of 'dirid' directory 74998d377a0STARUISI Hiroaki in a 'tree_id' tree. and sets path name to 'name'. 75098d377a0STARUISI Hiroaki */ 75198d377a0STARUISI Hiroaki static noinline int btrfs_search_path_in_tree(struct btrfs_fs_info *info, 75298d377a0STARUISI Hiroaki u64 tree_id, u64 dirid, char *name) 75398d377a0STARUISI Hiroaki { 75498d377a0STARUISI Hiroaki struct btrfs_root *root; 75598d377a0STARUISI Hiroaki struct btrfs_key key; 75698d377a0STARUISI Hiroaki char *name_stack, *ptr; 75798d377a0STARUISI Hiroaki int ret = -1; 75898d377a0STARUISI Hiroaki int slot; 75998d377a0STARUISI Hiroaki int len; 76098d377a0STARUISI Hiroaki int total_len = 0; 76198d377a0STARUISI Hiroaki struct btrfs_inode_ref *iref; 76298d377a0STARUISI Hiroaki struct extent_buffer *l; 76398d377a0STARUISI Hiroaki struct btrfs_path *path; 76498d377a0STARUISI Hiroaki 76598d377a0STARUISI Hiroaki if (dirid == BTRFS_FIRST_FREE_OBJECTID) { 76698d377a0STARUISI Hiroaki name[0]='\0'; 76798d377a0STARUISI Hiroaki return 0; 76898d377a0STARUISI Hiroaki } 76998d377a0STARUISI Hiroaki 77098d377a0STARUISI Hiroaki path = btrfs_alloc_path(); 77198d377a0STARUISI Hiroaki if (!path) 77298d377a0STARUISI Hiroaki return -ENOMEM; 77398d377a0STARUISI Hiroaki 77498d377a0STARUISI Hiroaki name_stack = kzalloc(BTRFS_PATH_NAME_MAX+1, GFP_NOFS); 77598d377a0STARUISI Hiroaki if (!name_stack) { 77698d377a0STARUISI Hiroaki btrfs_free_path(path); 77798d377a0STARUISI Hiroaki return -ENOMEM; 77898d377a0STARUISI Hiroaki } 77998d377a0STARUISI Hiroaki 78098d377a0STARUISI Hiroaki ptr = &name_stack[BTRFS_PATH_NAME_MAX]; 78198d377a0STARUISI Hiroaki 78298d377a0STARUISI Hiroaki key.objectid = tree_id; 78398d377a0STARUISI Hiroaki key.type = BTRFS_ROOT_ITEM_KEY; 78498d377a0STARUISI Hiroaki key.offset = (u64)-1; 78598d377a0STARUISI Hiroaki root = btrfs_read_fs_root_no_name(info, &key); 78698d377a0STARUISI Hiroaki if (IS_ERR(root)) { 78798d377a0STARUISI Hiroaki printk(KERN_ERR "could not find root %llu\n", tree_id); 78898d377a0STARUISI Hiroaki return -ENOENT; 78998d377a0STARUISI Hiroaki } 79098d377a0STARUISI Hiroaki 79198d377a0STARUISI Hiroaki key.objectid = dirid; 79298d377a0STARUISI Hiroaki key.type = BTRFS_INODE_REF_KEY; 79398d377a0STARUISI Hiroaki key.offset = 0; 79498d377a0STARUISI Hiroaki 79598d377a0STARUISI Hiroaki while(1) { 79698d377a0STARUISI Hiroaki ret = btrfs_search_slot(NULL, root, &key, path, 0, 0); 79798d377a0STARUISI Hiroaki if (ret < 0) 79898d377a0STARUISI Hiroaki goto out; 79998d377a0STARUISI Hiroaki 80098d377a0STARUISI Hiroaki l = path->nodes[0]; 80198d377a0STARUISI Hiroaki slot = path->slots[0]; 80298d377a0STARUISI Hiroaki btrfs_item_key_to_cpu(l, &key, slot); 80398d377a0STARUISI Hiroaki 80498d377a0STARUISI Hiroaki if (ret > 0 && (key.objectid != dirid || 80598d377a0STARUISI Hiroaki key.type != BTRFS_INODE_REF_KEY)) 80698d377a0STARUISI Hiroaki goto out; 80798d377a0STARUISI Hiroaki 80898d377a0STARUISI Hiroaki iref = btrfs_item_ptr(l, slot, struct btrfs_inode_ref); 80998d377a0STARUISI Hiroaki len = btrfs_inode_ref_name_len(l, iref); 81098d377a0STARUISI Hiroaki ptr -= len + 1; 81198d377a0STARUISI Hiroaki total_len += len + 1; 81298d377a0STARUISI Hiroaki if (ptr < name_stack) 81398d377a0STARUISI Hiroaki goto out; 81498d377a0STARUISI Hiroaki 81598d377a0STARUISI Hiroaki *(ptr + len) = '/'; 81698d377a0STARUISI Hiroaki read_extent_buffer(l, ptr,(unsigned long)(iref + 1), len); 81798d377a0STARUISI Hiroaki 81898d377a0STARUISI Hiroaki if (key.offset == BTRFS_FIRST_FREE_OBJECTID) 81998d377a0STARUISI Hiroaki break; 82098d377a0STARUISI Hiroaki 82198d377a0STARUISI Hiroaki btrfs_release_path(root, path); 82298d377a0STARUISI Hiroaki key.objectid = key.offset; 82398d377a0STARUISI Hiroaki key.offset = 0; 82498d377a0STARUISI Hiroaki dirid = key.objectid; 82598d377a0STARUISI Hiroaki 82698d377a0STARUISI Hiroaki } 82798d377a0STARUISI Hiroaki if (ptr < name_stack) 82898d377a0STARUISI Hiroaki goto out; 82998d377a0STARUISI Hiroaki strncpy(name, ptr, total_len); 83098d377a0STARUISI Hiroaki name[total_len]='\0'; 83198d377a0STARUISI Hiroaki ret = 0; 83298d377a0STARUISI Hiroaki out: 83398d377a0STARUISI Hiroaki btrfs_free_path(path); 83498d377a0STARUISI Hiroaki kfree(name_stack); 83598d377a0STARUISI Hiroaki return ret; 83698d377a0STARUISI Hiroaki } 83798d377a0STARUISI Hiroaki 83876dda93cSYan, Zheng static noinline int btrfs_ioctl_snap_destroy(struct file *file, 83976dda93cSYan, Zheng void __user *arg) 84076dda93cSYan, Zheng { 84176dda93cSYan, Zheng struct dentry *parent = fdentry(file); 84276dda93cSYan, Zheng struct dentry *dentry; 84376dda93cSYan, Zheng struct inode *dir = parent->d_inode; 84476dda93cSYan, Zheng struct inode *inode; 84576dda93cSYan, Zheng struct btrfs_root *root = BTRFS_I(dir)->root; 84676dda93cSYan, Zheng struct btrfs_root *dest = NULL; 84776dda93cSYan, Zheng struct btrfs_ioctl_vol_args *vol_args; 84876dda93cSYan, Zheng struct btrfs_trans_handle *trans; 84976dda93cSYan, Zheng int namelen; 85076dda93cSYan, Zheng int ret; 85176dda93cSYan, Zheng int err = 0; 85276dda93cSYan, Zheng 85376dda93cSYan, Zheng if (!capable(CAP_SYS_ADMIN)) 85476dda93cSYan, Zheng return -EPERM; 85576dda93cSYan, Zheng 85676dda93cSYan, Zheng vol_args = memdup_user(arg, sizeof(*vol_args)); 85776dda93cSYan, Zheng if (IS_ERR(vol_args)) 85876dda93cSYan, Zheng return PTR_ERR(vol_args); 85976dda93cSYan, Zheng 86076dda93cSYan, Zheng vol_args->name[BTRFS_PATH_NAME_MAX] = '\0'; 86176dda93cSYan, Zheng namelen = strlen(vol_args->name); 86276dda93cSYan, Zheng if (strchr(vol_args->name, '/') || 86376dda93cSYan, Zheng strncmp(vol_args->name, "..", namelen) == 0) { 86476dda93cSYan, Zheng err = -EINVAL; 86576dda93cSYan, Zheng goto out; 86676dda93cSYan, Zheng } 86776dda93cSYan, Zheng 86876dda93cSYan, Zheng err = mnt_want_write(file->f_path.mnt); 86976dda93cSYan, Zheng if (err) 87076dda93cSYan, Zheng goto out; 87176dda93cSYan, Zheng 87276dda93cSYan, Zheng mutex_lock_nested(&dir->i_mutex, I_MUTEX_PARENT); 87376dda93cSYan, Zheng dentry = lookup_one_len(vol_args->name, parent, namelen); 87476dda93cSYan, Zheng if (IS_ERR(dentry)) { 87576dda93cSYan, Zheng err = PTR_ERR(dentry); 87676dda93cSYan, Zheng goto out_unlock_dir; 87776dda93cSYan, Zheng } 87876dda93cSYan, Zheng 87976dda93cSYan, Zheng if (!dentry->d_inode) { 88076dda93cSYan, Zheng err = -ENOENT; 88176dda93cSYan, Zheng goto out_dput; 88276dda93cSYan, Zheng } 88376dda93cSYan, Zheng 88476dda93cSYan, Zheng inode = dentry->d_inode; 88576dda93cSYan, Zheng if (inode->i_ino != BTRFS_FIRST_FREE_OBJECTID) { 88676dda93cSYan, Zheng err = -EINVAL; 88776dda93cSYan, Zheng goto out_dput; 88876dda93cSYan, Zheng } 88976dda93cSYan, Zheng 89076dda93cSYan, Zheng dest = BTRFS_I(inode)->root; 89176dda93cSYan, Zheng 89276dda93cSYan, Zheng mutex_lock(&inode->i_mutex); 89376dda93cSYan, Zheng err = d_invalidate(dentry); 89476dda93cSYan, Zheng if (err) 89576dda93cSYan, Zheng goto out_unlock; 89676dda93cSYan, Zheng 89776dda93cSYan, Zheng down_write(&root->fs_info->subvol_sem); 89876dda93cSYan, Zheng 89976dda93cSYan, Zheng err = may_destroy_subvol(dest); 90076dda93cSYan, Zheng if (err) 90176dda93cSYan, Zheng goto out_up_write; 90276dda93cSYan, Zheng 90376dda93cSYan, Zheng trans = btrfs_start_transaction(root, 1); 90476dda93cSYan, Zheng ret = btrfs_unlink_subvol(trans, root, dir, 90576dda93cSYan, Zheng dest->root_key.objectid, 90676dda93cSYan, Zheng dentry->d_name.name, 90776dda93cSYan, Zheng dentry->d_name.len); 90876dda93cSYan, Zheng BUG_ON(ret); 90976dda93cSYan, Zheng 91076dda93cSYan, Zheng btrfs_record_root_in_trans(trans, dest); 91176dda93cSYan, Zheng 91276dda93cSYan, Zheng memset(&dest->root_item.drop_progress, 0, 91376dda93cSYan, Zheng sizeof(dest->root_item.drop_progress)); 91476dda93cSYan, Zheng dest->root_item.drop_level = 0; 91576dda93cSYan, Zheng btrfs_set_root_refs(&dest->root_item, 0); 91676dda93cSYan, Zheng 91776dda93cSYan, Zheng ret = btrfs_insert_orphan_item(trans, 91876dda93cSYan, Zheng root->fs_info->tree_root, 91976dda93cSYan, Zheng dest->root_key.objectid); 92076dda93cSYan, Zheng BUG_ON(ret); 92176dda93cSYan, Zheng 92276dda93cSYan, Zheng ret = btrfs_commit_transaction(trans, root); 92376dda93cSYan, Zheng BUG_ON(ret); 92476dda93cSYan, Zheng inode->i_flags |= S_DEAD; 92576dda93cSYan, Zheng out_up_write: 92676dda93cSYan, Zheng up_write(&root->fs_info->subvol_sem); 92776dda93cSYan, Zheng out_unlock: 92876dda93cSYan, Zheng mutex_unlock(&inode->i_mutex); 92976dda93cSYan, Zheng if (!err) { 930efefb143SYan, Zheng shrink_dcache_sb(root->fs_info->sb); 93176dda93cSYan, Zheng btrfs_invalidate_inodes(dest); 93276dda93cSYan, Zheng d_delete(dentry); 93376dda93cSYan, Zheng } 93476dda93cSYan, Zheng out_dput: 93576dda93cSYan, Zheng dput(dentry); 93676dda93cSYan, Zheng out_unlock_dir: 93776dda93cSYan, Zheng mutex_unlock(&dir->i_mutex); 93876dda93cSYan, Zheng mnt_drop_write(file->f_path.mnt); 93976dda93cSYan, Zheng out: 94076dda93cSYan, Zheng kfree(vol_args); 94176dda93cSYan, Zheng return err; 94276dda93cSYan, Zheng } 94376dda93cSYan, Zheng 944f46b5a66SChristoph Hellwig static int btrfs_ioctl_defrag(struct file *file) 945f46b5a66SChristoph Hellwig { 946f46b5a66SChristoph Hellwig struct inode *inode = fdentry(file)->d_inode; 947f46b5a66SChristoph Hellwig struct btrfs_root *root = BTRFS_I(inode)->root; 948c146afadSYan Zheng int ret; 949c146afadSYan Zheng 950c146afadSYan Zheng ret = mnt_want_write(file->f_path.mnt); 951c146afadSYan Zheng if (ret) 952c146afadSYan Zheng return ret; 953f46b5a66SChristoph Hellwig 954f46b5a66SChristoph Hellwig switch (inode->i_mode & S_IFMT) { 955f46b5a66SChristoph Hellwig case S_IFDIR: 956e441d54dSChris Mason if (!capable(CAP_SYS_ADMIN)) { 957e441d54dSChris Mason ret = -EPERM; 958e441d54dSChris Mason goto out; 959e441d54dSChris Mason } 960f46b5a66SChristoph Hellwig btrfs_defrag_root(root, 0); 961f46b5a66SChristoph Hellwig btrfs_defrag_root(root->fs_info->extent_root, 0); 962f46b5a66SChristoph Hellwig break; 963f46b5a66SChristoph Hellwig case S_IFREG: 964e441d54dSChris Mason if (!(file->f_mode & FMODE_WRITE)) { 965e441d54dSChris Mason ret = -EINVAL; 966e441d54dSChris Mason goto out; 967e441d54dSChris Mason } 968f46b5a66SChristoph Hellwig btrfs_defrag_file(file); 969f46b5a66SChristoph Hellwig break; 970f46b5a66SChristoph Hellwig } 971e441d54dSChris Mason out: 972ab67b7c1SYan Zheng mnt_drop_write(file->f_path.mnt); 973e441d54dSChris Mason return ret; 974f46b5a66SChristoph Hellwig } 975f46b5a66SChristoph Hellwig 976b2950863SChristoph Hellwig static long btrfs_ioctl_add_dev(struct btrfs_root *root, void __user *arg) 977f46b5a66SChristoph Hellwig { 978f46b5a66SChristoph Hellwig struct btrfs_ioctl_vol_args *vol_args; 979f46b5a66SChristoph Hellwig int ret; 980f46b5a66SChristoph Hellwig 981e441d54dSChris Mason if (!capable(CAP_SYS_ADMIN)) 982e441d54dSChris Mason return -EPERM; 983e441d54dSChris Mason 984dae7b665SLi Zefan vol_args = memdup_user(arg, sizeof(*vol_args)); 985dae7b665SLi Zefan if (IS_ERR(vol_args)) 986dae7b665SLi Zefan return PTR_ERR(vol_args); 987f46b5a66SChristoph Hellwig 9885516e595SMark Fasheh vol_args->name[BTRFS_PATH_NAME_MAX] = '\0'; 989f46b5a66SChristoph Hellwig ret = btrfs_init_new_device(root, vol_args->name); 990f46b5a66SChristoph Hellwig 991f46b5a66SChristoph Hellwig kfree(vol_args); 992f46b5a66SChristoph Hellwig return ret; 993f46b5a66SChristoph Hellwig } 994f46b5a66SChristoph Hellwig 995b2950863SChristoph Hellwig static long btrfs_ioctl_rm_dev(struct btrfs_root *root, void __user *arg) 996f46b5a66SChristoph Hellwig { 997f46b5a66SChristoph Hellwig struct btrfs_ioctl_vol_args *vol_args; 998f46b5a66SChristoph Hellwig int ret; 999f46b5a66SChristoph Hellwig 1000e441d54dSChris Mason if (!capable(CAP_SYS_ADMIN)) 1001e441d54dSChris Mason return -EPERM; 1002e441d54dSChris Mason 1003c146afadSYan Zheng if (root->fs_info->sb->s_flags & MS_RDONLY) 1004c146afadSYan Zheng return -EROFS; 1005c146afadSYan Zheng 1006dae7b665SLi Zefan vol_args = memdup_user(arg, sizeof(*vol_args)); 1007dae7b665SLi Zefan if (IS_ERR(vol_args)) 1008dae7b665SLi Zefan return PTR_ERR(vol_args); 1009f46b5a66SChristoph Hellwig 10105516e595SMark Fasheh vol_args->name[BTRFS_PATH_NAME_MAX] = '\0'; 1011f46b5a66SChristoph Hellwig ret = btrfs_rm_device(root, vol_args->name); 1012f46b5a66SChristoph Hellwig 1013f46b5a66SChristoph Hellwig kfree(vol_args); 1014f46b5a66SChristoph Hellwig return ret; 1015f46b5a66SChristoph Hellwig } 1016f46b5a66SChristoph Hellwig 101776dda93cSYan, Zheng static noinline long btrfs_ioctl_clone(struct file *file, unsigned long srcfd, 1018b2950863SChristoph Hellwig u64 off, u64 olen, u64 destoff) 1019f46b5a66SChristoph Hellwig { 1020f46b5a66SChristoph Hellwig struct inode *inode = fdentry(file)->d_inode; 1021f46b5a66SChristoph Hellwig struct btrfs_root *root = BTRFS_I(inode)->root; 1022f46b5a66SChristoph Hellwig struct file *src_file; 1023f46b5a66SChristoph Hellwig struct inode *src; 1024f46b5a66SChristoph Hellwig struct btrfs_trans_handle *trans; 1025f46b5a66SChristoph Hellwig struct btrfs_path *path; 1026f46b5a66SChristoph Hellwig struct extent_buffer *leaf; 1027ae01a0abSYan Zheng char *buf; 1028ae01a0abSYan Zheng struct btrfs_key key; 1029f46b5a66SChristoph Hellwig u32 nritems; 1030f46b5a66SChristoph Hellwig int slot; 1031ae01a0abSYan Zheng int ret; 1032c5c9cd4dSSage Weil u64 len = olen; 1033c5c9cd4dSSage Weil u64 bs = root->fs_info->sb->s_blocksize; 1034c5c9cd4dSSage Weil u64 hint_byte; 1035d20f7043SChris Mason 1036c5c9cd4dSSage Weil /* 1037c5c9cd4dSSage Weil * TODO: 1038c5c9cd4dSSage Weil * - split compressed inline extents. annoying: we need to 1039c5c9cd4dSSage Weil * decompress into destination's address_space (the file offset 1040c5c9cd4dSSage Weil * may change, so source mapping won't do), then recompress (or 1041c5c9cd4dSSage Weil * otherwise reinsert) a subrange. 1042c5c9cd4dSSage Weil * - allow ranges within the same file to be cloned (provided 1043c5c9cd4dSSage Weil * they don't overlap)? 1044c5c9cd4dSSage Weil */ 1045c5c9cd4dSSage Weil 1046e441d54dSChris Mason /* the destination must be opened for writing */ 1047e441d54dSChris Mason if (!(file->f_mode & FMODE_WRITE)) 1048e441d54dSChris Mason return -EINVAL; 1049e441d54dSChris Mason 1050c146afadSYan Zheng ret = mnt_want_write(file->f_path.mnt); 1051c146afadSYan Zheng if (ret) 1052c146afadSYan Zheng return ret; 1053c146afadSYan Zheng 1054c5c9cd4dSSage Weil src_file = fget(srcfd); 1055ab67b7c1SYan Zheng if (!src_file) { 1056ab67b7c1SYan Zheng ret = -EBADF; 1057ab67b7c1SYan Zheng goto out_drop_write; 1058ab67b7c1SYan Zheng } 1059f46b5a66SChristoph Hellwig src = src_file->f_dentry->d_inode; 1060f46b5a66SChristoph Hellwig 1061c5c9cd4dSSage Weil ret = -EINVAL; 1062c5c9cd4dSSage Weil if (src == inode) 1063c5c9cd4dSSage Weil goto out_fput; 1064c5c9cd4dSSage Weil 1065ae01a0abSYan Zheng ret = -EISDIR; 1066ae01a0abSYan Zheng if (S_ISDIR(src->i_mode) || S_ISDIR(inode->i_mode)) 1067f46b5a66SChristoph Hellwig goto out_fput; 1068f46b5a66SChristoph Hellwig 1069ae01a0abSYan Zheng ret = -EXDEV; 1070ae01a0abSYan Zheng if (src->i_sb != inode->i_sb || BTRFS_I(src)->root != root) 1071ae01a0abSYan Zheng goto out_fput; 1072ae01a0abSYan Zheng 1073ae01a0abSYan Zheng ret = -ENOMEM; 1074ae01a0abSYan Zheng buf = vmalloc(btrfs_level_size(root, 0)); 1075ae01a0abSYan Zheng if (!buf) 1076ae01a0abSYan Zheng goto out_fput; 1077ae01a0abSYan Zheng 1078ae01a0abSYan Zheng path = btrfs_alloc_path(); 1079ae01a0abSYan Zheng if (!path) { 1080ae01a0abSYan Zheng vfree(buf); 1081ae01a0abSYan Zheng goto out_fput; 1082ae01a0abSYan Zheng } 1083ae01a0abSYan Zheng path->reada = 2; 1084ae01a0abSYan Zheng 1085f46b5a66SChristoph Hellwig if (inode < src) { 1086f46b5a66SChristoph Hellwig mutex_lock(&inode->i_mutex); 1087f46b5a66SChristoph Hellwig mutex_lock(&src->i_mutex); 1088f46b5a66SChristoph Hellwig } else { 1089f46b5a66SChristoph Hellwig mutex_lock(&src->i_mutex); 1090f46b5a66SChristoph Hellwig mutex_lock(&inode->i_mutex); 1091f46b5a66SChristoph Hellwig } 1092f46b5a66SChristoph Hellwig 1093c5c9cd4dSSage Weil /* determine range to clone */ 1094c5c9cd4dSSage Weil ret = -EINVAL; 1095c5c9cd4dSSage Weil if (off >= src->i_size || off + len > src->i_size) 1096f46b5a66SChristoph Hellwig goto out_unlock; 1097c5c9cd4dSSage Weil if (len == 0) 1098c5c9cd4dSSage Weil olen = len = src->i_size - off; 1099c5c9cd4dSSage Weil /* if we extend to eof, continue to block boundary */ 1100c5c9cd4dSSage Weil if (off + len == src->i_size) 1101c5c9cd4dSSage Weil len = ((src->i_size + bs-1) & ~(bs-1)) 1102c5c9cd4dSSage Weil - off; 1103c5c9cd4dSSage Weil 1104c5c9cd4dSSage Weil /* verify the end result is block aligned */ 1105c5c9cd4dSSage Weil if ((off & (bs-1)) || 1106c5c9cd4dSSage Weil ((off + len) & (bs-1))) 1107c5c9cd4dSSage Weil goto out_unlock; 1108c5c9cd4dSSage Weil 1109f46b5a66SChristoph Hellwig /* do any pending delalloc/csum calc on src, one way or 1110f46b5a66SChristoph Hellwig another, and lock file content */ 1111f46b5a66SChristoph Hellwig while (1) { 111231840ae1SZheng Yan struct btrfs_ordered_extent *ordered; 1113c5c9cd4dSSage Weil lock_extent(&BTRFS_I(src)->io_tree, off, off+len, GFP_NOFS); 1114c5c9cd4dSSage Weil ordered = btrfs_lookup_first_ordered_extent(inode, off+len); 1115ae01a0abSYan Zheng if (BTRFS_I(src)->delalloc_bytes == 0 && !ordered) 1116f46b5a66SChristoph Hellwig break; 1117c5c9cd4dSSage Weil unlock_extent(&BTRFS_I(src)->io_tree, off, off+len, GFP_NOFS); 1118ae01a0abSYan Zheng if (ordered) 1119ae01a0abSYan Zheng btrfs_put_ordered_extent(ordered); 1120c5c9cd4dSSage Weil btrfs_wait_ordered_range(src, off, off+len); 1121f46b5a66SChristoph Hellwig } 1122f46b5a66SChristoph Hellwig 1123ae01a0abSYan Zheng trans = btrfs_start_transaction(root, 1); 1124ae01a0abSYan Zheng BUG_ON(!trans); 1125ae01a0abSYan Zheng 1126c5c9cd4dSSage Weil /* punch hole in destination first */ 1127920bbbfbSYan, Zheng btrfs_drop_extents(trans, inode, off, off + len, &hint_byte, 1); 1128c5c9cd4dSSage Weil 1129c5c9cd4dSSage Weil /* clone data */ 1130f46b5a66SChristoph Hellwig key.objectid = src->i_ino; 1131ae01a0abSYan Zheng key.type = BTRFS_EXTENT_DATA_KEY; 1132ae01a0abSYan Zheng key.offset = 0; 1133f46b5a66SChristoph Hellwig 1134f46b5a66SChristoph Hellwig while (1) { 1135f46b5a66SChristoph Hellwig /* 1136f46b5a66SChristoph Hellwig * note the key will change type as we walk through the 1137f46b5a66SChristoph Hellwig * tree. 1138f46b5a66SChristoph Hellwig */ 1139f46b5a66SChristoph Hellwig ret = btrfs_search_slot(trans, root, &key, path, 0, 0); 1140f46b5a66SChristoph Hellwig if (ret < 0) 1141f46b5a66SChristoph Hellwig goto out; 1142f46b5a66SChristoph Hellwig 1143ae01a0abSYan Zheng nritems = btrfs_header_nritems(path->nodes[0]); 1144ae01a0abSYan Zheng if (path->slots[0] >= nritems) { 1145f46b5a66SChristoph Hellwig ret = btrfs_next_leaf(root, path); 1146f46b5a66SChristoph Hellwig if (ret < 0) 1147f46b5a66SChristoph Hellwig goto out; 1148f46b5a66SChristoph Hellwig if (ret > 0) 1149f46b5a66SChristoph Hellwig break; 1150ae01a0abSYan Zheng nritems = btrfs_header_nritems(path->nodes[0]); 1151f46b5a66SChristoph Hellwig } 1152f46b5a66SChristoph Hellwig leaf = path->nodes[0]; 1153f46b5a66SChristoph Hellwig slot = path->slots[0]; 1154f46b5a66SChristoph Hellwig 1155ae01a0abSYan Zheng btrfs_item_key_to_cpu(leaf, &key, slot); 1156d20f7043SChris Mason if (btrfs_key_type(&key) > BTRFS_EXTENT_DATA_KEY || 1157f46b5a66SChristoph Hellwig key.objectid != src->i_ino) 1158f46b5a66SChristoph Hellwig break; 1159f46b5a66SChristoph Hellwig 1160c5c9cd4dSSage Weil if (btrfs_key_type(&key) == BTRFS_EXTENT_DATA_KEY) { 1161c5c9cd4dSSage Weil struct btrfs_file_extent_item *extent; 1162c5c9cd4dSSage Weil int type; 116331840ae1SZheng Yan u32 size; 116431840ae1SZheng Yan struct btrfs_key new_key; 1165c5c9cd4dSSage Weil u64 disko = 0, diskl = 0; 1166c5c9cd4dSSage Weil u64 datao = 0, datal = 0; 1167c5c9cd4dSSage Weil u8 comp; 116831840ae1SZheng Yan 116931840ae1SZheng Yan size = btrfs_item_size_nr(leaf, slot); 117031840ae1SZheng Yan read_extent_buffer(leaf, buf, 117131840ae1SZheng Yan btrfs_item_ptr_offset(leaf, slot), 117231840ae1SZheng Yan size); 1173c5c9cd4dSSage Weil 1174c5c9cd4dSSage Weil extent = btrfs_item_ptr(leaf, slot, 1175c5c9cd4dSSage Weil struct btrfs_file_extent_item); 1176c5c9cd4dSSage Weil comp = btrfs_file_extent_compression(leaf, extent); 1177c5c9cd4dSSage Weil type = btrfs_file_extent_type(leaf, extent); 1178c8a894d7SChris Mason if (type == BTRFS_FILE_EXTENT_REG || 1179c8a894d7SChris Mason type == BTRFS_FILE_EXTENT_PREALLOC) { 1180d397712bSChris Mason disko = btrfs_file_extent_disk_bytenr(leaf, 1181d397712bSChris Mason extent); 1182d397712bSChris Mason diskl = btrfs_file_extent_disk_num_bytes(leaf, 1183d397712bSChris Mason extent); 1184c5c9cd4dSSage Weil datao = btrfs_file_extent_offset(leaf, extent); 1185d397712bSChris Mason datal = btrfs_file_extent_num_bytes(leaf, 1186d397712bSChris Mason extent); 1187c5c9cd4dSSage Weil } else if (type == BTRFS_FILE_EXTENT_INLINE) { 1188c5c9cd4dSSage Weil /* take upper bound, may be compressed */ 1189c5c9cd4dSSage Weil datal = btrfs_file_extent_ram_bytes(leaf, 1190c5c9cd4dSSage Weil extent); 1191c5c9cd4dSSage Weil } 119231840ae1SZheng Yan btrfs_release_path(root, path); 119331840ae1SZheng Yan 1194c5c9cd4dSSage Weil if (key.offset + datal < off || 1195c5c9cd4dSSage Weil key.offset >= off+len) 1196c5c9cd4dSSage Weil goto next; 1197c5c9cd4dSSage Weil 119831840ae1SZheng Yan memcpy(&new_key, &key, sizeof(new_key)); 119931840ae1SZheng Yan new_key.objectid = inode->i_ino; 1200c5c9cd4dSSage Weil new_key.offset = key.offset + destoff - off; 1201c5c9cd4dSSage Weil 1202c8a894d7SChris Mason if (type == BTRFS_FILE_EXTENT_REG || 1203c8a894d7SChris Mason type == BTRFS_FILE_EXTENT_PREALLOC) { 120431840ae1SZheng Yan ret = btrfs_insert_empty_item(trans, root, path, 120531840ae1SZheng Yan &new_key, size); 120631840ae1SZheng Yan if (ret) 120731840ae1SZheng Yan goto out; 120831840ae1SZheng Yan 120931840ae1SZheng Yan leaf = path->nodes[0]; 121031840ae1SZheng Yan slot = path->slots[0]; 121131840ae1SZheng Yan write_extent_buffer(leaf, buf, 121231840ae1SZheng Yan btrfs_item_ptr_offset(leaf, slot), 121331840ae1SZheng Yan size); 1214ae01a0abSYan Zheng 1215f46b5a66SChristoph Hellwig extent = btrfs_item_ptr(leaf, slot, 1216f46b5a66SChristoph Hellwig struct btrfs_file_extent_item); 1217c5c9cd4dSSage Weil 1218c5c9cd4dSSage Weil if (off > key.offset) { 1219c5c9cd4dSSage Weil datao += off - key.offset; 1220c5c9cd4dSSage Weil datal -= off - key.offset; 1221c5c9cd4dSSage Weil } 1222ac6889cbSChris Mason 1223ac6889cbSChris Mason if (key.offset + datal > off + len) 1224ac6889cbSChris Mason datal = off + len - key.offset; 1225ac6889cbSChris Mason 1226c5c9cd4dSSage Weil /* disko == 0 means it's a hole */ 1227c5c9cd4dSSage Weil if (!disko) 1228c5c9cd4dSSage Weil datao = 0; 1229c5c9cd4dSSage Weil 1230c5c9cd4dSSage Weil btrfs_set_file_extent_offset(leaf, extent, 1231c5c9cd4dSSage Weil datao); 1232c5c9cd4dSSage Weil btrfs_set_file_extent_num_bytes(leaf, extent, 1233c5c9cd4dSSage Weil datal); 1234c5c9cd4dSSage Weil if (disko) { 1235c5c9cd4dSSage Weil inode_add_bytes(inode, datal); 1236ae01a0abSYan Zheng ret = btrfs_inc_extent_ref(trans, root, 12375d4f98a2SYan Zheng disko, diskl, 0, 1238f46b5a66SChristoph Hellwig root->root_key.objectid, 12395d4f98a2SYan Zheng inode->i_ino, 12405d4f98a2SYan Zheng new_key.offset - datao); 1241ae01a0abSYan Zheng BUG_ON(ret); 1242f46b5a66SChristoph Hellwig } 1243c5c9cd4dSSage Weil } else if (type == BTRFS_FILE_EXTENT_INLINE) { 1244c5c9cd4dSSage Weil u64 skip = 0; 1245c5c9cd4dSSage Weil u64 trim = 0; 1246c5c9cd4dSSage Weil if (off > key.offset) { 1247c5c9cd4dSSage Weil skip = off - key.offset; 1248c5c9cd4dSSage Weil new_key.offset += skip; 124931840ae1SZheng Yan } 1250d397712bSChris Mason 1251c5c9cd4dSSage Weil if (key.offset + datal > off+len) 1252c5c9cd4dSSage Weil trim = key.offset + datal - (off+len); 1253d397712bSChris Mason 1254c5c9cd4dSSage Weil if (comp && (skip || trim)) { 1255c5c9cd4dSSage Weil ret = -EINVAL; 1256c5c9cd4dSSage Weil goto out; 125731840ae1SZheng Yan } 1258c5c9cd4dSSage Weil size -= skip + trim; 1259c5c9cd4dSSage Weil datal -= skip + trim; 1260c5c9cd4dSSage Weil ret = btrfs_insert_empty_item(trans, root, path, 1261c5c9cd4dSSage Weil &new_key, size); 1262c5c9cd4dSSage Weil if (ret) 1263c5c9cd4dSSage Weil goto out; 1264c5c9cd4dSSage Weil 1265c5c9cd4dSSage Weil if (skip) { 1266d397712bSChris Mason u32 start = 1267d397712bSChris Mason btrfs_file_extent_calc_inline_size(0); 1268c5c9cd4dSSage Weil memmove(buf+start, buf+start+skip, 1269c5c9cd4dSSage Weil datal); 1270c5c9cd4dSSage Weil } 1271c5c9cd4dSSage Weil 1272c5c9cd4dSSage Weil leaf = path->nodes[0]; 1273c5c9cd4dSSage Weil slot = path->slots[0]; 1274c5c9cd4dSSage Weil write_extent_buffer(leaf, buf, 1275c5c9cd4dSSage Weil btrfs_item_ptr_offset(leaf, slot), 1276c5c9cd4dSSage Weil size); 1277c5c9cd4dSSage Weil inode_add_bytes(inode, datal); 1278c5c9cd4dSSage Weil } 1279c5c9cd4dSSage Weil 1280c5c9cd4dSSage Weil btrfs_mark_buffer_dirty(leaf); 1281c5c9cd4dSSage Weil } 1282c5c9cd4dSSage Weil 1283c5c9cd4dSSage Weil next: 128431840ae1SZheng Yan btrfs_release_path(root, path); 1285ae01a0abSYan Zheng key.offset++; 1286ae01a0abSYan Zheng } 1287f46b5a66SChristoph Hellwig ret = 0; 1288f46b5a66SChristoph Hellwig out: 1289ae01a0abSYan Zheng btrfs_release_path(root, path); 1290ae01a0abSYan Zheng if (ret == 0) { 1291ae01a0abSYan Zheng inode->i_mtime = inode->i_ctime = CURRENT_TIME; 1292c5c9cd4dSSage Weil if (destoff + olen > inode->i_size) 1293c5c9cd4dSSage Weil btrfs_i_size_write(inode, destoff + olen); 1294ae01a0abSYan Zheng BTRFS_I(inode)->flags = BTRFS_I(src)->flags; 1295ae01a0abSYan Zheng ret = btrfs_update_inode(trans, root, inode); 1296ae01a0abSYan Zheng } 1297f46b5a66SChristoph Hellwig btrfs_end_transaction(trans, root); 1298c5c9cd4dSSage Weil unlock_extent(&BTRFS_I(src)->io_tree, off, off+len, GFP_NOFS); 1299ae01a0abSYan Zheng if (ret) 1300ae01a0abSYan Zheng vmtruncate(inode, 0); 1301f46b5a66SChristoph Hellwig out_unlock: 1302f46b5a66SChristoph Hellwig mutex_unlock(&src->i_mutex); 1303f46b5a66SChristoph Hellwig mutex_unlock(&inode->i_mutex); 1304ae01a0abSYan Zheng vfree(buf); 1305ae01a0abSYan Zheng btrfs_free_path(path); 1306f46b5a66SChristoph Hellwig out_fput: 1307f46b5a66SChristoph Hellwig fput(src_file); 1308ab67b7c1SYan Zheng out_drop_write: 1309ab67b7c1SYan Zheng mnt_drop_write(file->f_path.mnt); 1310f46b5a66SChristoph Hellwig return ret; 1311f46b5a66SChristoph Hellwig } 1312f46b5a66SChristoph Hellwig 13137a865e8aSChristoph Hellwig static long btrfs_ioctl_clone_range(struct file *file, void __user *argp) 1314c5c9cd4dSSage Weil { 1315c5c9cd4dSSage Weil struct btrfs_ioctl_clone_range_args args; 1316c5c9cd4dSSage Weil 13177a865e8aSChristoph Hellwig if (copy_from_user(&args, argp, sizeof(args))) 1318c5c9cd4dSSage Weil return -EFAULT; 1319c5c9cd4dSSage Weil return btrfs_ioctl_clone(file, args.src_fd, args.src_offset, 1320c5c9cd4dSSage Weil args.src_length, args.dest_offset); 1321c5c9cd4dSSage Weil } 1322c5c9cd4dSSage Weil 1323f46b5a66SChristoph Hellwig /* 1324f46b5a66SChristoph Hellwig * there are many ways the trans_start and trans_end ioctls can lead 1325f46b5a66SChristoph Hellwig * to deadlocks. They should only be used by applications that 1326f46b5a66SChristoph Hellwig * basically own the machine, and have a very in depth understanding 1327f46b5a66SChristoph Hellwig * of all the possible deadlocks and enospc problems. 1328f46b5a66SChristoph Hellwig */ 1329b2950863SChristoph Hellwig static long btrfs_ioctl_trans_start(struct file *file) 1330f46b5a66SChristoph Hellwig { 1331f46b5a66SChristoph Hellwig struct inode *inode = fdentry(file)->d_inode; 1332f46b5a66SChristoph Hellwig struct btrfs_root *root = BTRFS_I(inode)->root; 1333f46b5a66SChristoph Hellwig struct btrfs_trans_handle *trans; 13341ab86aedSSage Weil int ret; 1335f46b5a66SChristoph Hellwig 13361ab86aedSSage Weil ret = -EPERM; 1337df5b5520SChristoph Hellwig if (!capable(CAP_SYS_ADMIN)) 1338f46b5a66SChristoph Hellwig goto out; 13391ab86aedSSage Weil 13401ab86aedSSage Weil ret = -EINPROGRESS; 13411ab86aedSSage Weil if (file->private_data) 13421ab86aedSSage Weil goto out; 13439ca9ee09SSage Weil 1344c146afadSYan Zheng ret = mnt_want_write(file->f_path.mnt); 1345c146afadSYan Zheng if (ret) 1346c146afadSYan Zheng goto out; 1347c146afadSYan Zheng 13489ca9ee09SSage Weil mutex_lock(&root->fs_info->trans_mutex); 13499ca9ee09SSage Weil root->fs_info->open_ioctl_trans++; 13509ca9ee09SSage Weil mutex_unlock(&root->fs_info->trans_mutex); 13519ca9ee09SSage Weil 1352f46b5a66SChristoph Hellwig ret = -ENOMEM; 13531ab86aedSSage Weil trans = btrfs_start_ioctl_transaction(root, 0); 13541ab86aedSSage Weil if (!trans) 13551ab86aedSSage Weil goto out_drop; 13561ab86aedSSage Weil 13571ab86aedSSage Weil file->private_data = trans; 13581ab86aedSSage Weil return 0; 13591ab86aedSSage Weil 13601ab86aedSSage Weil out_drop: 13611ab86aedSSage Weil mutex_lock(&root->fs_info->trans_mutex); 13621ab86aedSSage Weil root->fs_info->open_ioctl_trans--; 13631ab86aedSSage Weil mutex_unlock(&root->fs_info->trans_mutex); 13641ab86aedSSage Weil mnt_drop_write(file->f_path.mnt); 1365f46b5a66SChristoph Hellwig out: 1366f46b5a66SChristoph Hellwig return ret; 1367f46b5a66SChristoph Hellwig } 1368f46b5a66SChristoph Hellwig 1369f46b5a66SChristoph Hellwig /* 1370f46b5a66SChristoph Hellwig * there are many ways the trans_start and trans_end ioctls can lead 1371f46b5a66SChristoph Hellwig * to deadlocks. They should only be used by applications that 1372f46b5a66SChristoph Hellwig * basically own the machine, and have a very in depth understanding 1373f46b5a66SChristoph Hellwig * of all the possible deadlocks and enospc problems. 1374f46b5a66SChristoph Hellwig */ 1375f46b5a66SChristoph Hellwig long btrfs_ioctl_trans_end(struct file *file) 1376f46b5a66SChristoph Hellwig { 1377f46b5a66SChristoph Hellwig struct inode *inode = fdentry(file)->d_inode; 1378f46b5a66SChristoph Hellwig struct btrfs_root *root = BTRFS_I(inode)->root; 1379f46b5a66SChristoph Hellwig struct btrfs_trans_handle *trans; 1380f46b5a66SChristoph Hellwig 1381f46b5a66SChristoph Hellwig trans = file->private_data; 13821ab86aedSSage Weil if (!trans) 13831ab86aedSSage Weil return -EINVAL; 1384b214107eSChristoph Hellwig file->private_data = NULL; 13859ca9ee09SSage Weil 13861ab86aedSSage Weil btrfs_end_transaction(trans, root); 13871ab86aedSSage Weil 13889ca9ee09SSage Weil mutex_lock(&root->fs_info->trans_mutex); 13899ca9ee09SSage Weil root->fs_info->open_ioctl_trans--; 13909ca9ee09SSage Weil mutex_unlock(&root->fs_info->trans_mutex); 13919ca9ee09SSage Weil 1392cfc8ea87SSage Weil mnt_drop_write(file->f_path.mnt); 13931ab86aedSSage Weil return 0; 1394f46b5a66SChristoph Hellwig } 1395f46b5a66SChristoph Hellwig 1396f46b5a66SChristoph Hellwig long btrfs_ioctl(struct file *file, unsigned int 1397f46b5a66SChristoph Hellwig cmd, unsigned long arg) 1398f46b5a66SChristoph Hellwig { 1399f46b5a66SChristoph Hellwig struct btrfs_root *root = BTRFS_I(fdentry(file)->d_inode)->root; 14004bcabaa3SChristoph Hellwig void __user *argp = (void __user *)arg; 1401f46b5a66SChristoph Hellwig 1402f46b5a66SChristoph Hellwig switch (cmd) { 14036cbff00fSChristoph Hellwig case FS_IOC_GETFLAGS: 14046cbff00fSChristoph Hellwig return btrfs_ioctl_getflags(file, argp); 14056cbff00fSChristoph Hellwig case FS_IOC_SETFLAGS: 14066cbff00fSChristoph Hellwig return btrfs_ioctl_setflags(file, argp); 14076cbff00fSChristoph Hellwig case FS_IOC_GETVERSION: 14086cbff00fSChristoph Hellwig return btrfs_ioctl_getversion(file, argp); 1409f46b5a66SChristoph Hellwig case BTRFS_IOC_SNAP_CREATE: 14104bcabaa3SChristoph Hellwig return btrfs_ioctl_snap_create(file, argp, 0); 14113de4586cSChris Mason case BTRFS_IOC_SUBVOL_CREATE: 14124bcabaa3SChristoph Hellwig return btrfs_ioctl_snap_create(file, argp, 1); 141376dda93cSYan, Zheng case BTRFS_IOC_SNAP_DESTROY: 141476dda93cSYan, Zheng return btrfs_ioctl_snap_destroy(file, argp); 1415f46b5a66SChristoph Hellwig case BTRFS_IOC_DEFRAG: 1416f46b5a66SChristoph Hellwig return btrfs_ioctl_defrag(file); 1417f46b5a66SChristoph Hellwig case BTRFS_IOC_RESIZE: 14184bcabaa3SChristoph Hellwig return btrfs_ioctl_resize(root, argp); 1419f46b5a66SChristoph Hellwig case BTRFS_IOC_ADD_DEV: 14204bcabaa3SChristoph Hellwig return btrfs_ioctl_add_dev(root, argp); 1421f46b5a66SChristoph Hellwig case BTRFS_IOC_RM_DEV: 14224bcabaa3SChristoph Hellwig return btrfs_ioctl_rm_dev(root, argp); 1423f46b5a66SChristoph Hellwig case BTRFS_IOC_BALANCE: 1424f46b5a66SChristoph Hellwig return btrfs_balance(root->fs_info->dev_root); 1425f46b5a66SChristoph Hellwig case BTRFS_IOC_CLONE: 1426c5c9cd4dSSage Weil return btrfs_ioctl_clone(file, arg, 0, 0, 0); 1427c5c9cd4dSSage Weil case BTRFS_IOC_CLONE_RANGE: 14287a865e8aSChristoph Hellwig return btrfs_ioctl_clone_range(file, argp); 1429f46b5a66SChristoph Hellwig case BTRFS_IOC_TRANS_START: 1430f46b5a66SChristoph Hellwig return btrfs_ioctl_trans_start(file); 1431f46b5a66SChristoph Hellwig case BTRFS_IOC_TRANS_END: 1432f46b5a66SChristoph Hellwig return btrfs_ioctl_trans_end(file); 1433f46b5a66SChristoph Hellwig case BTRFS_IOC_SYNC: 1434f46b5a66SChristoph Hellwig btrfs_sync_fs(file->f_dentry->d_sb, 1); 1435f46b5a66SChristoph Hellwig return 0; 1436f46b5a66SChristoph Hellwig } 1437f46b5a66SChristoph Hellwig 1438f46b5a66SChristoph Hellwig return -ENOTTY; 1439f46b5a66SChristoph Hellwig } 1440