16cbd5570SChris Mason /* 26cbd5570SChris Mason * Copyright (C) 2007 Oracle. All rights reserved. 36cbd5570SChris Mason * 46cbd5570SChris Mason * This program is free software; you can redistribute it and/or 56cbd5570SChris Mason * modify it under the terms of the GNU General Public 66cbd5570SChris Mason * License v2 as published by the Free Software Foundation. 76cbd5570SChris Mason * 86cbd5570SChris Mason * This program is distributed in the hope that it will be useful, 96cbd5570SChris Mason * but WITHOUT ANY WARRANTY; without even the implied warranty of 106cbd5570SChris Mason * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 116cbd5570SChris Mason * General Public License for more details. 126cbd5570SChris Mason * 136cbd5570SChris Mason * You should have received a copy of the GNU General Public 146cbd5570SChris Mason * License along with this program; if not, write to the 156cbd5570SChris Mason * Free Software Foundation, Inc., 59 Temple Place - Suite 330, 166cbd5570SChris Mason * Boston, MA 021110-1307, USA. 
176cbd5570SChris Mason */ 186cbd5570SChris Mason 1979154b1bSChris Mason #include <linux/fs.h> 2034088780SChris Mason #include <linux/sched.h> 21d3c2fdcfSChris Mason #include <linux/writeback.h> 225f39d397SChris Mason #include <linux/pagemap.h> 2379154b1bSChris Mason #include "ctree.h" 2479154b1bSChris Mason #include "disk-io.h" 2579154b1bSChris Mason #include "transaction.h" 26925baeddSChris Mason #include "locking.h" 2779154b1bSChris Mason 2878fae27eSChris Mason static int total_trans = 0; 292c90e5d6SChris Mason extern struct kmem_cache *btrfs_trans_handle_cachep; 302c90e5d6SChris Mason extern struct kmem_cache *btrfs_transaction_cachep; 312c90e5d6SChris Mason 320f7d52f4SChris Mason #define BTRFS_ROOT_TRANS_TAG 0 330f7d52f4SChris Mason 3480b6794dSChris Mason static noinline void put_transaction(struct btrfs_transaction *transaction) 3579154b1bSChris Mason { 362c90e5d6SChris Mason WARN_ON(transaction->use_count == 0); 3779154b1bSChris Mason transaction->use_count--; 3878fae27eSChris Mason if (transaction->use_count == 0) { 3978fae27eSChris Mason WARN_ON(total_trans == 0); 4078fae27eSChris Mason total_trans--; 418fd17795SChris Mason list_del_init(&transaction->list); 422c90e5d6SChris Mason memset(transaction, 0, sizeof(*transaction)); 432c90e5d6SChris Mason kmem_cache_free(btrfs_transaction_cachep, transaction); 4479154b1bSChris Mason } 4578fae27eSChris Mason } 4679154b1bSChris Mason 4780b6794dSChris Mason static noinline int join_transaction(struct btrfs_root *root) 4879154b1bSChris Mason { 4979154b1bSChris Mason struct btrfs_transaction *cur_trans; 5079154b1bSChris Mason cur_trans = root->fs_info->running_transaction; 5179154b1bSChris Mason if (!cur_trans) { 522c90e5d6SChris Mason cur_trans = kmem_cache_alloc(btrfs_transaction_cachep, 532c90e5d6SChris Mason GFP_NOFS); 5478fae27eSChris Mason total_trans++; 5579154b1bSChris Mason BUG_ON(!cur_trans); 560f7d52f4SChris Mason root->fs_info->generation++; 57e18e4809SChris Mason root->fs_info->last_alloc = 0; 
584529ba49SChris Mason root->fs_info->last_data_alloc = 0; 5915ee9bc7SJosef Bacik cur_trans->num_writers = 1; 6015ee9bc7SJosef Bacik cur_trans->num_joined = 0; 610f7d52f4SChris Mason cur_trans->transid = root->fs_info->generation; 6279154b1bSChris Mason init_waitqueue_head(&cur_trans->writer_wait); 6379154b1bSChris Mason init_waitqueue_head(&cur_trans->commit_wait); 6479154b1bSChris Mason cur_trans->in_commit = 0; 65d5719762SChris Mason cur_trans->use_count = 1; 6679154b1bSChris Mason cur_trans->commit_done = 0; 6708607c1bSChris Mason cur_trans->start_time = get_seconds(); 683063d29fSChris Mason INIT_LIST_HEAD(&cur_trans->pending_snapshots); 698fd17795SChris Mason list_add_tail(&cur_trans->list, &root->fs_info->trans_list); 70d1310b2eSChris Mason extent_io_tree_init(&cur_trans->dirty_pages, 715f39d397SChris Mason root->fs_info->btree_inode->i_mapping, 725f39d397SChris Mason GFP_NOFS); 7348ec2cf8SChris Mason spin_lock(&root->fs_info->new_trans_lock); 7448ec2cf8SChris Mason root->fs_info->running_transaction = cur_trans; 7548ec2cf8SChris Mason spin_unlock(&root->fs_info->new_trans_lock); 7615ee9bc7SJosef Bacik } else { 7779154b1bSChris Mason cur_trans->num_writers++; 7815ee9bc7SJosef Bacik cur_trans->num_joined++; 7915ee9bc7SJosef Bacik } 8015ee9bc7SJosef Bacik 8179154b1bSChris Mason return 0; 8279154b1bSChris Mason } 8379154b1bSChris Mason 8480b6794dSChris Mason static noinline int record_root_in_trans(struct btrfs_root *root) 856702ed49SChris Mason { 866702ed49SChris Mason u64 running_trans_id = root->fs_info->running_transaction->transid; 876702ed49SChris Mason if (root->ref_cows && root->last_trans < running_trans_id) { 886702ed49SChris Mason WARN_ON(root == root->fs_info->extent_root); 896702ed49SChris Mason if (root->root_item.refs != 0) { 906702ed49SChris Mason radix_tree_tag_set(&root->fs_info->fs_roots_radix, 916702ed49SChris Mason (unsigned long)root->root_key.objectid, 926702ed49SChris Mason BTRFS_ROOT_TRANS_TAG); 93925baeddSChris Mason root->commit_root = 
btrfs_root_node(root); 946702ed49SChris Mason } else { 956702ed49SChris Mason WARN_ON(1); 966702ed49SChris Mason } 976702ed49SChris Mason root->last_trans = running_trans_id; 986702ed49SChris Mason } 996702ed49SChris Mason return 0; 1006702ed49SChris Mason } 1016702ed49SChris Mason 10279154b1bSChris Mason struct btrfs_trans_handle *btrfs_start_transaction(struct btrfs_root *root, 10379154b1bSChris Mason int num_blocks) 10479154b1bSChris Mason { 1052c90e5d6SChris Mason struct btrfs_trans_handle *h = 1062c90e5d6SChris Mason kmem_cache_alloc(btrfs_trans_handle_cachep, GFP_NOFS); 10779154b1bSChris Mason int ret; 10879154b1bSChris Mason 10979154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 11079154b1bSChris Mason ret = join_transaction(root); 11179154b1bSChris Mason BUG_ON(ret); 1120f7d52f4SChris Mason 1136702ed49SChris Mason record_root_in_trans(root); 1146702ed49SChris Mason h->transid = root->fs_info->running_transaction->transid; 11579154b1bSChris Mason h->transaction = root->fs_info->running_transaction; 11679154b1bSChris Mason h->blocks_reserved = num_blocks; 11779154b1bSChris Mason h->blocks_used = 0; 11831f3c99bSChris Mason h->block_group = NULL; 11926b8003fSChris Mason h->alloc_exclude_nr = 0; 12026b8003fSChris Mason h->alloc_exclude_start = 0; 12179154b1bSChris Mason root->fs_info->running_transaction->use_count++; 12279154b1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 12379154b1bSChris Mason return h; 12479154b1bSChris Mason } 12579154b1bSChris Mason 12689ce8a63SChris Mason static noinline int wait_for_commit(struct btrfs_root *root, 12789ce8a63SChris Mason struct btrfs_transaction *commit) 12889ce8a63SChris Mason { 12989ce8a63SChris Mason DEFINE_WAIT(wait); 13089ce8a63SChris Mason mutex_lock(&root->fs_info->trans_mutex); 13189ce8a63SChris Mason while(!commit->commit_done) { 13289ce8a63SChris Mason prepare_to_wait(&commit->commit_wait, &wait, 13389ce8a63SChris Mason TASK_UNINTERRUPTIBLE); 13489ce8a63SChris Mason if (commit->commit_done) 
13589ce8a63SChris Mason break; 13689ce8a63SChris Mason mutex_unlock(&root->fs_info->trans_mutex); 13789ce8a63SChris Mason schedule(); 13889ce8a63SChris Mason mutex_lock(&root->fs_info->trans_mutex); 13989ce8a63SChris Mason } 14089ce8a63SChris Mason mutex_unlock(&root->fs_info->trans_mutex); 14189ce8a63SChris Mason finish_wait(&commit->commit_wait, &wait); 14289ce8a63SChris Mason return 0; 14389ce8a63SChris Mason } 14489ce8a63SChris Mason 14589ce8a63SChris Mason static int __btrfs_end_transaction(struct btrfs_trans_handle *trans, 14689ce8a63SChris Mason struct btrfs_root *root, int throttle) 14779154b1bSChris Mason { 14879154b1bSChris Mason struct btrfs_transaction *cur_trans; 149d6e4a428SChris Mason 15079154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 15179154b1bSChris Mason cur_trans = root->fs_info->running_transaction; 152ccd467d6SChris Mason WARN_ON(cur_trans != trans->transaction); 153d5719762SChris Mason WARN_ON(cur_trans->num_writers < 1); 154ccd467d6SChris Mason cur_trans->num_writers--; 15589ce8a63SChris Mason 15679154b1bSChris Mason if (waitqueue_active(&cur_trans->writer_wait)) 15779154b1bSChris Mason wake_up(&cur_trans->writer_wait); 15889ce8a63SChris Mason 15989ce8a63SChris Mason if (cur_trans->in_commit && throttle) { 160e6dcd2dcSChris Mason DEFINE_WAIT(wait); 16189ce8a63SChris Mason mutex_unlock(&root->fs_info->trans_mutex); 162e6dcd2dcSChris Mason prepare_to_wait(&root->fs_info->transaction_throttle, &wait, 163e6dcd2dcSChris Mason TASK_UNINTERRUPTIBLE); 164e6dcd2dcSChris Mason schedule(); 165e6dcd2dcSChris Mason finish_wait(&root->fs_info->transaction_throttle, &wait); 16689ce8a63SChris Mason mutex_lock(&root->fs_info->trans_mutex); 16789ce8a63SChris Mason } 16889ce8a63SChris Mason 16979154b1bSChris Mason put_transaction(cur_trans); 17079154b1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 171d6025579SChris Mason memset(trans, 0, sizeof(*trans)); 1722c90e5d6SChris Mason kmem_cache_free(btrfs_trans_handle_cachep, trans); 
17379154b1bSChris Mason return 0; 17479154b1bSChris Mason } 17579154b1bSChris Mason 17689ce8a63SChris Mason int btrfs_end_transaction(struct btrfs_trans_handle *trans, 17789ce8a63SChris Mason struct btrfs_root *root) 17889ce8a63SChris Mason { 17989ce8a63SChris Mason return __btrfs_end_transaction(trans, root, 0); 18089ce8a63SChris Mason } 18189ce8a63SChris Mason 18289ce8a63SChris Mason int btrfs_end_transaction_throttle(struct btrfs_trans_handle *trans, 18389ce8a63SChris Mason struct btrfs_root *root) 18489ce8a63SChris Mason { 18589ce8a63SChris Mason return __btrfs_end_transaction(trans, root, 1); 18689ce8a63SChris Mason } 18789ce8a63SChris Mason 18879154b1bSChris Mason 18979154b1bSChris Mason int btrfs_write_and_wait_transaction(struct btrfs_trans_handle *trans, 19079154b1bSChris Mason struct btrfs_root *root) 19179154b1bSChris Mason { 1927c4452b9SChris Mason int ret; 1937c4452b9SChris Mason int err; 1947c4452b9SChris Mason int werr = 0; 195d1310b2eSChris Mason struct extent_io_tree *dirty_pages; 1967c4452b9SChris Mason struct page *page; 1977c4452b9SChris Mason struct inode *btree_inode = root->fs_info->btree_inode; 1985f39d397SChris Mason u64 start; 1995f39d397SChris Mason u64 end; 2005f39d397SChris Mason unsigned long index; 2017c4452b9SChris Mason 2027c4452b9SChris Mason if (!trans || !trans->transaction) { 2037c4452b9SChris Mason return filemap_write_and_wait(btree_inode->i_mapping); 2047c4452b9SChris Mason } 2057c4452b9SChris Mason dirty_pages = &trans->transaction->dirty_pages; 2067c4452b9SChris Mason while(1) { 2075f39d397SChris Mason ret = find_first_extent_bit(dirty_pages, 0, &start, &end, 2085f39d397SChris Mason EXTENT_DIRTY); 2095f39d397SChris Mason if (ret) 2107c4452b9SChris Mason break; 2115f39d397SChris Mason clear_extent_dirty(dirty_pages, start, end, GFP_NOFS); 2125f39d397SChris Mason while(start <= end) { 2135f39d397SChris Mason index = start >> PAGE_CACHE_SHIFT; 21435ebb934SChris Mason start = (u64)(index + 1) << PAGE_CACHE_SHIFT; 
2155f39d397SChris Mason page = find_lock_page(btree_inode->i_mapping, index); 2167c4452b9SChris Mason if (!page) 2177c4452b9SChris Mason continue; 2186702ed49SChris Mason if (PageWriteback(page)) { 2196702ed49SChris Mason if (PageDirty(page)) 2206702ed49SChris Mason wait_on_page_writeback(page); 2216702ed49SChris Mason else { 2226702ed49SChris Mason unlock_page(page); 2236702ed49SChris Mason page_cache_release(page); 2246702ed49SChris Mason continue; 2256702ed49SChris Mason } 2266702ed49SChris Mason } 2277c4452b9SChris Mason err = write_one_page(page, 0); 2287c4452b9SChris Mason if (err) 2297c4452b9SChris Mason werr = err; 2307c4452b9SChris Mason page_cache_release(page); 2317c4452b9SChris Mason } 2327c4452b9SChris Mason } 2337c4452b9SChris Mason err = filemap_fdatawait(btree_inode->i_mapping); 2347c4452b9SChris Mason if (err) 2357c4452b9SChris Mason werr = err; 2367c4452b9SChris Mason return werr; 23779154b1bSChris Mason } 23879154b1bSChris Mason 2390b86a832SChris Mason static int update_cowonly_root(struct btrfs_trans_handle *trans, 24079154b1bSChris Mason struct btrfs_root *root) 24179154b1bSChris Mason { 24279154b1bSChris Mason int ret; 2430b86a832SChris Mason u64 old_root_bytenr; 2440b86a832SChris Mason struct btrfs_root *tree_root = root->fs_info->tree_root; 24579154b1bSChris Mason 2460b86a832SChris Mason btrfs_write_dirty_block_groups(trans, root); 24779154b1bSChris Mason while(1) { 2480b86a832SChris Mason old_root_bytenr = btrfs_root_bytenr(&root->root_item); 2490b86a832SChris Mason if (old_root_bytenr == root->node->start) 25079154b1bSChris Mason break; 2510b86a832SChris Mason btrfs_set_root_bytenr(&root->root_item, 2520b86a832SChris Mason root->node->start); 2530b86a832SChris Mason btrfs_set_root_level(&root->root_item, 2540b86a832SChris Mason btrfs_header_level(root->node)); 25579154b1bSChris Mason ret = btrfs_update_root(trans, tree_root, 2560b86a832SChris Mason &root->root_key, 2570b86a832SChris Mason &root->root_item); 25879154b1bSChris Mason 
BUG_ON(ret); 2590b86a832SChris Mason btrfs_write_dirty_block_groups(trans, root); 2600b86a832SChris Mason } 2610b86a832SChris Mason return 0; 2620b86a832SChris Mason } 2630b86a832SChris Mason 2640b86a832SChris Mason int btrfs_commit_tree_roots(struct btrfs_trans_handle *trans, 2650b86a832SChris Mason struct btrfs_root *root) 2660b86a832SChris Mason { 2670b86a832SChris Mason struct btrfs_fs_info *fs_info = root->fs_info; 2680b86a832SChris Mason struct list_head *next; 2690b86a832SChris Mason 2700b86a832SChris Mason while(!list_empty(&fs_info->dirty_cowonly_roots)) { 2710b86a832SChris Mason next = fs_info->dirty_cowonly_roots.next; 2720b86a832SChris Mason list_del_init(next); 2730b86a832SChris Mason root = list_entry(next, struct btrfs_root, dirty_list); 2740b86a832SChris Mason update_cowonly_root(trans, root); 27579154b1bSChris Mason } 27679154b1bSChris Mason return 0; 27779154b1bSChris Mason } 27879154b1bSChris Mason 2790f7d52f4SChris Mason struct dirty_root { 2800f7d52f4SChris Mason struct list_head list; 2810f7d52f4SChris Mason struct btrfs_root *root; 28258176a96SJosef Bacik struct btrfs_root *latest_root; 2830f7d52f4SChris Mason }; 2840f7d52f4SChris Mason 2855ce14bbcSChris Mason int btrfs_add_dead_root(struct btrfs_root *root, 2865ce14bbcSChris Mason struct btrfs_root *latest, 2875ce14bbcSChris Mason struct list_head *dead_list) 2885eda7b5eSChris Mason { 2895eda7b5eSChris Mason struct dirty_root *dirty; 2905eda7b5eSChris Mason 2915eda7b5eSChris Mason dirty = kmalloc(sizeof(*dirty), GFP_NOFS); 2925eda7b5eSChris Mason if (!dirty) 2935eda7b5eSChris Mason return -ENOMEM; 2945eda7b5eSChris Mason dirty->root = root; 2955ce14bbcSChris Mason dirty->latest_root = latest; 2965eda7b5eSChris Mason list_add(&dirty->list, dead_list); 2975eda7b5eSChris Mason return 0; 2985eda7b5eSChris Mason } 2995eda7b5eSChris Mason 30080b6794dSChris Mason static noinline int add_dirty_roots(struct btrfs_trans_handle *trans, 30135b7e476SChris Mason struct radix_tree_root *radix, 
30235b7e476SChris Mason struct list_head *list) 3030f7d52f4SChris Mason { 3040f7d52f4SChris Mason struct dirty_root *dirty; 3050f7d52f4SChris Mason struct btrfs_root *gang[8]; 3060f7d52f4SChris Mason struct btrfs_root *root; 3070f7d52f4SChris Mason int i; 3080f7d52f4SChris Mason int ret; 30954aa1f4dSChris Mason int err = 0; 3105eda7b5eSChris Mason u32 refs; 31154aa1f4dSChris Mason 3120f7d52f4SChris Mason while(1) { 3130f7d52f4SChris Mason ret = radix_tree_gang_lookup_tag(radix, (void **)gang, 0, 3140f7d52f4SChris Mason ARRAY_SIZE(gang), 3150f7d52f4SChris Mason BTRFS_ROOT_TRANS_TAG); 3160f7d52f4SChris Mason if (ret == 0) 3170f7d52f4SChris Mason break; 3180f7d52f4SChris Mason for (i = 0; i < ret; i++) { 3190f7d52f4SChris Mason root = gang[i]; 3202619ba1fSChris Mason radix_tree_tag_clear(radix, 3212619ba1fSChris Mason (unsigned long)root->root_key.objectid, 3220f7d52f4SChris Mason BTRFS_ROOT_TRANS_TAG); 3230f7d52f4SChris Mason if (root->commit_root == root->node) { 324db94535dSChris Mason WARN_ON(root->node->start != 325db94535dSChris Mason btrfs_root_bytenr(&root->root_item)); 3265f39d397SChris Mason free_extent_buffer(root->commit_root); 3270f7d52f4SChris Mason root->commit_root = NULL; 32858176a96SJosef Bacik 32958176a96SJosef Bacik /* make sure to update the root on disk 33058176a96SJosef Bacik * so we get any updates to the block used 33158176a96SJosef Bacik * counts 33258176a96SJosef Bacik */ 33358176a96SJosef Bacik err = btrfs_update_root(trans, 33458176a96SJosef Bacik root->fs_info->tree_root, 33558176a96SJosef Bacik &root->root_key, 33658176a96SJosef Bacik &root->root_item); 3370f7d52f4SChris Mason continue; 3380f7d52f4SChris Mason } 3390f7d52f4SChris Mason dirty = kmalloc(sizeof(*dirty), GFP_NOFS); 3400f7d52f4SChris Mason BUG_ON(!dirty); 3419f3a7427SChris Mason dirty->root = kmalloc(sizeof(*dirty->root), GFP_NOFS); 3429f3a7427SChris Mason BUG_ON(!dirty->root); 3439f3a7427SChris Mason 3449f3a7427SChris Mason memset(&root->root_item.drop_progress, 0, 
3459f3a7427SChris Mason sizeof(struct btrfs_disk_key)); 3469f3a7427SChris Mason root->root_item.drop_level = 0; 3479f3a7427SChris Mason 3489f3a7427SChris Mason memcpy(dirty->root, root, sizeof(*root)); 3499f3a7427SChris Mason dirty->root->node = root->commit_root; 35058176a96SJosef Bacik dirty->latest_root = root; 3510f7d52f4SChris Mason root->commit_root = NULL; 3525eda7b5eSChris Mason 3530f7d52f4SChris Mason root->root_key.offset = root->fs_info->generation; 354db94535dSChris Mason btrfs_set_root_bytenr(&root->root_item, 355db94535dSChris Mason root->node->start); 356db94535dSChris Mason btrfs_set_root_level(&root->root_item, 357db94535dSChris Mason btrfs_header_level(root->node)); 3580f7d52f4SChris Mason err = btrfs_insert_root(trans, root->fs_info->tree_root, 3590f7d52f4SChris Mason &root->root_key, 3600f7d52f4SChris Mason &root->root_item); 36154aa1f4dSChris Mason if (err) 36254aa1f4dSChris Mason break; 3639f3a7427SChris Mason 3649f3a7427SChris Mason refs = btrfs_root_refs(&dirty->root->root_item); 3659f3a7427SChris Mason btrfs_set_root_refs(&dirty->root->root_item, refs - 1); 3665eda7b5eSChris Mason err = btrfs_update_root(trans, root->fs_info->tree_root, 3679f3a7427SChris Mason &dirty->root->root_key, 3689f3a7427SChris Mason &dirty->root->root_item); 3695eda7b5eSChris Mason 3705eda7b5eSChris Mason BUG_ON(err); 3719f3a7427SChris Mason if (refs == 1) { 3720f7d52f4SChris Mason list_add(&dirty->list, list); 3739f3a7427SChris Mason } else { 3749f3a7427SChris Mason WARN_ON(1); 3759f3a7427SChris Mason kfree(dirty->root); 3765eda7b5eSChris Mason kfree(dirty); 3770f7d52f4SChris Mason } 3780f7d52f4SChris Mason } 3799f3a7427SChris Mason } 38054aa1f4dSChris Mason return err; 3810f7d52f4SChris Mason } 3820f7d52f4SChris Mason 383e9d0b13bSChris Mason int btrfs_defrag_root(struct btrfs_root *root, int cacheonly) 384e9d0b13bSChris Mason { 385e9d0b13bSChris Mason struct btrfs_fs_info *info = root->fs_info; 386e9d0b13bSChris Mason int ret; 387e9d0b13bSChris Mason struct 
btrfs_trans_handle *trans; 388d3c2fdcfSChris Mason unsigned long nr; 389e9d0b13bSChris Mason 390a2135011SChris Mason smp_mb(); 391e9d0b13bSChris Mason if (root->defrag_running) 392e9d0b13bSChris Mason return 0; 393e9d0b13bSChris Mason trans = btrfs_start_transaction(root, 1); 3946b80053dSChris Mason while (1) { 395e9d0b13bSChris Mason root->defrag_running = 1; 396e9d0b13bSChris Mason ret = btrfs_defrag_leaves(trans, root, cacheonly); 397d3c2fdcfSChris Mason nr = trans->blocks_used; 398e9d0b13bSChris Mason btrfs_end_transaction(trans, root); 399d3c2fdcfSChris Mason btrfs_btree_balance_dirty(info->tree_root, nr); 400e9d0b13bSChris Mason cond_resched(); 401e9d0b13bSChris Mason 402e9d0b13bSChris Mason trans = btrfs_start_transaction(root, 1); 4033f157a2fSChris Mason if (root->fs_info->closing || ret != -EAGAIN) 404e9d0b13bSChris Mason break; 405e9d0b13bSChris Mason } 406e9d0b13bSChris Mason root->defrag_running = 0; 407a2135011SChris Mason smp_mb(); 408e9d0b13bSChris Mason btrfs_end_transaction(trans, root); 409e9d0b13bSChris Mason return 0; 410e9d0b13bSChris Mason } 411e9d0b13bSChris Mason 41280b6794dSChris Mason static noinline int drop_dirty_roots(struct btrfs_root *tree_root, 41335b7e476SChris Mason struct list_head *list) 4140f7d52f4SChris Mason { 4150f7d52f4SChris Mason struct dirty_root *dirty; 4160f7d52f4SChris Mason struct btrfs_trans_handle *trans; 417d3c2fdcfSChris Mason unsigned long nr; 418db94535dSChris Mason u64 num_bytes; 419db94535dSChris Mason u64 bytes_used; 42054aa1f4dSChris Mason int ret = 0; 4219f3a7427SChris Mason int err; 4229f3a7427SChris Mason 4230f7d52f4SChris Mason while(!list_empty(list)) { 42458176a96SJosef Bacik struct btrfs_root *root; 42558176a96SJosef Bacik 4260f7d52f4SChris Mason dirty = list_entry(list->next, struct dirty_root, list); 4270f7d52f4SChris Mason list_del_init(&dirty->list); 4285eda7b5eSChris Mason 429db94535dSChris Mason num_bytes = btrfs_root_used(&dirty->root->root_item); 43058176a96SJosef Bacik root = 
dirty->latest_root; 431a2135011SChris Mason atomic_inc(&root->fs_info->throttles); 43258176a96SJosef Bacik 433a2135011SChris Mason mutex_lock(&root->fs_info->drop_mutex); 4349f3a7427SChris Mason while(1) { 4350f7d52f4SChris Mason trans = btrfs_start_transaction(tree_root, 1); 4369f3a7427SChris Mason ret = btrfs_drop_snapshot(trans, dirty->root); 4379f3a7427SChris Mason if (ret != -EAGAIN) { 4389f3a7427SChris Mason break; 4399f3a7427SChris Mason } 44058176a96SJosef Bacik 4419f3a7427SChris Mason err = btrfs_update_root(trans, 4429f3a7427SChris Mason tree_root, 4439f3a7427SChris Mason &dirty->root->root_key, 4449f3a7427SChris Mason &dirty->root->root_item); 4459f3a7427SChris Mason if (err) 4469f3a7427SChris Mason ret = err; 447d3c2fdcfSChris Mason nr = trans->blocks_used; 4481b1e2135SChris Mason ret = btrfs_end_transaction_throttle(trans, tree_root); 4490f7d52f4SChris Mason BUG_ON(ret); 450a2135011SChris Mason 451a2135011SChris Mason mutex_unlock(&root->fs_info->drop_mutex); 452d3c2fdcfSChris Mason btrfs_btree_balance_dirty(tree_root, nr); 4534dc11904SChris Mason cond_resched(); 454a2135011SChris Mason mutex_lock(&root->fs_info->drop_mutex); 4559f3a7427SChris Mason } 4569f3a7427SChris Mason BUG_ON(ret); 457a2135011SChris Mason atomic_dec(&root->fs_info->throttles); 45858176a96SJosef Bacik 459a2135011SChris Mason mutex_lock(&root->fs_info->alloc_mutex); 460db94535dSChris Mason num_bytes -= btrfs_root_used(&dirty->root->root_item); 461db94535dSChris Mason bytes_used = btrfs_root_used(&root->root_item); 462db94535dSChris Mason if (num_bytes) { 46358176a96SJosef Bacik record_root_in_trans(root); 4645f39d397SChris Mason btrfs_set_root_used(&root->root_item, 465db94535dSChris Mason bytes_used - num_bytes); 46658176a96SJosef Bacik } 467a2135011SChris Mason mutex_unlock(&root->fs_info->alloc_mutex); 468a2135011SChris Mason 4699f3a7427SChris Mason ret = btrfs_del_root(trans, tree_root, &dirty->root->root_key); 47058176a96SJosef Bacik if (ret) { 47158176a96SJosef Bacik BUG(); 
47254aa1f4dSChris Mason break; 47358176a96SJosef Bacik } 474a2135011SChris Mason mutex_unlock(&root->fs_info->drop_mutex); 475a2135011SChris Mason 476d3c2fdcfSChris Mason nr = trans->blocks_used; 4770f7d52f4SChris Mason ret = btrfs_end_transaction(trans, tree_root); 4780f7d52f4SChris Mason BUG_ON(ret); 4795eda7b5eSChris Mason 480f510cfecSChris Mason free_extent_buffer(dirty->root->node); 4815eda7b5eSChris Mason kfree(dirty->root); 4820f7d52f4SChris Mason kfree(dirty); 483d3c2fdcfSChris Mason 484d3c2fdcfSChris Mason btrfs_btree_balance_dirty(tree_root, nr); 4854dc11904SChris Mason cond_resched(); 4860f7d52f4SChris Mason } 48754aa1f4dSChris Mason return ret; 4880f7d52f4SChris Mason } 4890f7d52f4SChris Mason 49080b6794dSChris Mason static noinline int create_pending_snapshot(struct btrfs_trans_handle *trans, 4913063d29fSChris Mason struct btrfs_fs_info *fs_info, 4923063d29fSChris Mason struct btrfs_pending_snapshot *pending) 4933063d29fSChris Mason { 4943063d29fSChris Mason struct btrfs_key key; 49580b6794dSChris Mason struct btrfs_root_item *new_root_item; 4963063d29fSChris Mason struct btrfs_root *tree_root = fs_info->tree_root; 4973063d29fSChris Mason struct btrfs_root *root = pending->root; 4983063d29fSChris Mason struct extent_buffer *tmp; 499925baeddSChris Mason struct extent_buffer *old; 5003063d29fSChris Mason int ret; 5013b96362cSSven Wegener int namelen; 5023063d29fSChris Mason u64 objectid; 5033063d29fSChris Mason 50480b6794dSChris Mason new_root_item = kmalloc(sizeof(*new_root_item), GFP_NOFS); 50580b6794dSChris Mason if (!new_root_item) { 50680b6794dSChris Mason ret = -ENOMEM; 50780b6794dSChris Mason goto fail; 50880b6794dSChris Mason } 5093063d29fSChris Mason ret = btrfs_find_free_objectid(trans, tree_root, 0, &objectid); 5103063d29fSChris Mason if (ret) 5113063d29fSChris Mason goto fail; 5123063d29fSChris Mason 51380b6794dSChris Mason memcpy(new_root_item, &root->root_item, sizeof(*new_root_item)); 5143063d29fSChris Mason 5153063d29fSChris Mason 
key.objectid = objectid; 5163063d29fSChris Mason key.offset = 1; 5173063d29fSChris Mason btrfs_set_key_type(&key, BTRFS_ROOT_ITEM_KEY); 5183063d29fSChris Mason 519925baeddSChris Mason old = btrfs_lock_root_node(root); 520925baeddSChris Mason btrfs_cow_block(trans, root, old, NULL, 0, &old); 5213063d29fSChris Mason 522925baeddSChris Mason btrfs_copy_root(trans, root, old, &tmp, objectid); 523925baeddSChris Mason btrfs_tree_unlock(old); 524925baeddSChris Mason free_extent_buffer(old); 5253063d29fSChris Mason 52680b6794dSChris Mason btrfs_set_root_bytenr(new_root_item, tmp->start); 52780b6794dSChris Mason btrfs_set_root_level(new_root_item, btrfs_header_level(tmp)); 5283063d29fSChris Mason ret = btrfs_insert_root(trans, root->fs_info->tree_root, &key, 52980b6794dSChris Mason new_root_item); 530925baeddSChris Mason btrfs_tree_unlock(tmp); 5313063d29fSChris Mason free_extent_buffer(tmp); 5323063d29fSChris Mason if (ret) 5333063d29fSChris Mason goto fail; 5343063d29fSChris Mason 5353063d29fSChris Mason /* 5363063d29fSChris Mason * insert the directory item 5373063d29fSChris Mason */ 5383063d29fSChris Mason key.offset = (u64)-1; 5393b96362cSSven Wegener namelen = strlen(pending->name); 5403063d29fSChris Mason ret = btrfs_insert_dir_item(trans, root->fs_info->tree_root, 5413b96362cSSven Wegener pending->name, namelen, 5423063d29fSChris Mason root->fs_info->sb->s_root->d_inode->i_ino, 5433063d29fSChris Mason &key, BTRFS_FT_DIR); 5443063d29fSChris Mason 5453063d29fSChris Mason if (ret) 5463063d29fSChris Mason goto fail; 5473063d29fSChris Mason 5483063d29fSChris Mason ret = btrfs_insert_inode_ref(trans, root->fs_info->tree_root, 5493063d29fSChris Mason pending->name, strlen(pending->name), objectid, 5503063d29fSChris Mason root->fs_info->sb->s_root->d_inode->i_ino); 5513b96362cSSven Wegener 5523b96362cSSven Wegener /* Invalidate existing dcache entry for new snapshot. 
*/ 5533b96362cSSven Wegener btrfs_invalidate_dcache_root(root, pending->name, namelen); 5543b96362cSSven Wegener 5553063d29fSChris Mason fail: 55680b6794dSChris Mason kfree(new_root_item); 5573063d29fSChris Mason return ret; 5583063d29fSChris Mason } 5593063d29fSChris Mason 56080b6794dSChris Mason static noinline int create_pending_snapshots(struct btrfs_trans_handle *trans, 5613063d29fSChris Mason struct btrfs_fs_info *fs_info) 5623063d29fSChris Mason { 5633063d29fSChris Mason struct btrfs_pending_snapshot *pending; 5643063d29fSChris Mason struct list_head *head = &trans->transaction->pending_snapshots; 5653063d29fSChris Mason int ret; 5663063d29fSChris Mason 5673063d29fSChris Mason while(!list_empty(head)) { 5683063d29fSChris Mason pending = list_entry(head->next, 5693063d29fSChris Mason struct btrfs_pending_snapshot, list); 5703063d29fSChris Mason ret = create_pending_snapshot(trans, fs_info, pending); 5713063d29fSChris Mason BUG_ON(ret); 5723063d29fSChris Mason list_del(&pending->list); 5733063d29fSChris Mason kfree(pending->name); 5743063d29fSChris Mason kfree(pending); 5753063d29fSChris Mason } 576dc17ff8fSChris Mason return 0; 577dc17ff8fSChris Mason } 578dc17ff8fSChris Mason 57979154b1bSChris Mason int btrfs_commit_transaction(struct btrfs_trans_handle *trans, 58079154b1bSChris Mason struct btrfs_root *root) 58179154b1bSChris Mason { 58215ee9bc7SJosef Bacik unsigned long joined = 0; 58315ee9bc7SJosef Bacik unsigned long timeout = 1; 58479154b1bSChris Mason struct btrfs_transaction *cur_trans; 5858fd17795SChris Mason struct btrfs_transaction *prev_trans = NULL; 5860b86a832SChris Mason struct btrfs_root *chunk_root = root->fs_info->chunk_root; 5870f7d52f4SChris Mason struct list_head dirty_fs_roots; 588d1310b2eSChris Mason struct extent_io_tree *pinned_copy; 58979154b1bSChris Mason DEFINE_WAIT(wait); 59015ee9bc7SJosef Bacik int ret; 59179154b1bSChris Mason 5920f7d52f4SChris Mason INIT_LIST_HEAD(&dirty_fs_roots); 593d6e4a428SChris Mason 59479154b1bSChris Mason 
mutex_lock(&root->fs_info->trans_mutex); 59579154b1bSChris Mason if (trans->transaction->in_commit) { 59679154b1bSChris Mason cur_trans = trans->transaction; 59779154b1bSChris Mason trans->transaction->use_count++; 598ccd467d6SChris Mason mutex_unlock(&root->fs_info->trans_mutex); 59979154b1bSChris Mason btrfs_end_transaction(trans, root); 600ccd467d6SChris Mason 60179154b1bSChris Mason ret = wait_for_commit(root, cur_trans); 60279154b1bSChris Mason BUG_ON(ret); 60315ee9bc7SJosef Bacik 60415ee9bc7SJosef Bacik mutex_lock(&root->fs_info->trans_mutex); 60579154b1bSChris Mason put_transaction(cur_trans); 60615ee9bc7SJosef Bacik mutex_unlock(&root->fs_info->trans_mutex); 60715ee9bc7SJosef Bacik 60879154b1bSChris Mason return 0; 60979154b1bSChris Mason } 6104313b399SChris Mason 6114313b399SChris Mason pinned_copy = kmalloc(sizeof(*pinned_copy), GFP_NOFS); 6124313b399SChris Mason if (!pinned_copy) 6134313b399SChris Mason return -ENOMEM; 6144313b399SChris Mason 615d1310b2eSChris Mason extent_io_tree_init(pinned_copy, 6164313b399SChris Mason root->fs_info->btree_inode->i_mapping, GFP_NOFS); 6174313b399SChris Mason 618e6dcd2dcSChris Mason printk("commit trans %Lu\n", trans->transid); 6192c90e5d6SChris Mason trans->transaction->in_commit = 1; 620ccd467d6SChris Mason cur_trans = trans->transaction; 621ccd467d6SChris Mason if (cur_trans->list.prev != &root->fs_info->trans_list) { 622ccd467d6SChris Mason prev_trans = list_entry(cur_trans->list.prev, 623ccd467d6SChris Mason struct btrfs_transaction, list); 624ccd467d6SChris Mason if (!prev_trans->commit_done) { 625ccd467d6SChris Mason prev_trans->use_count++; 626ccd467d6SChris Mason mutex_unlock(&root->fs_info->trans_mutex); 627ccd467d6SChris Mason 628ccd467d6SChris Mason wait_for_commit(root, prev_trans); 629ccd467d6SChris Mason 630ccd467d6SChris Mason mutex_lock(&root->fs_info->trans_mutex); 63115ee9bc7SJosef Bacik put_transaction(prev_trans); 632ccd467d6SChris Mason } 633ccd467d6SChris Mason } 63415ee9bc7SJosef Bacik 
63515ee9bc7SJosef Bacik do { 63615ee9bc7SJosef Bacik joined = cur_trans->num_joined; 6372c90e5d6SChris Mason WARN_ON(cur_trans != trans->transaction); 63815ee9bc7SJosef Bacik prepare_to_wait(&cur_trans->writer_wait, &wait, 63979154b1bSChris Mason TASK_UNINTERRUPTIBLE); 64015ee9bc7SJosef Bacik 64115ee9bc7SJosef Bacik if (cur_trans->num_writers > 1) 64215ee9bc7SJosef Bacik timeout = MAX_SCHEDULE_TIMEOUT; 64315ee9bc7SJosef Bacik else 64415ee9bc7SJosef Bacik timeout = 1; 64515ee9bc7SJosef Bacik 64679154b1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 64715ee9bc7SJosef Bacik 64815ee9bc7SJosef Bacik schedule_timeout(timeout); 64915ee9bc7SJosef Bacik 65079154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 65115ee9bc7SJosef Bacik finish_wait(&cur_trans->writer_wait, &wait); 65215ee9bc7SJosef Bacik } while (cur_trans->num_writers > 1 || 65315ee9bc7SJosef Bacik (cur_trans->num_joined != joined)); 65415ee9bc7SJosef Bacik 6553063d29fSChris Mason ret = create_pending_snapshots(trans, root->fs_info); 6563063d29fSChris Mason BUG_ON(ret); 6573063d29fSChris Mason 6582c90e5d6SChris Mason WARN_ON(cur_trans != trans->transaction); 659dc17ff8fSChris Mason 66054aa1f4dSChris Mason ret = add_dirty_roots(trans, &root->fs_info->fs_roots_radix, 66154aa1f4dSChris Mason &dirty_fs_roots); 66254aa1f4dSChris Mason BUG_ON(ret); 66354aa1f4dSChris Mason 66479154b1bSChris Mason ret = btrfs_commit_tree_roots(trans, root); 66579154b1bSChris Mason BUG_ON(ret); 66654aa1f4dSChris Mason 66778fae27eSChris Mason cur_trans = root->fs_info->running_transaction; 668cee36a03SChris Mason spin_lock(&root->fs_info->new_trans_lock); 66978fae27eSChris Mason root->fs_info->running_transaction = NULL; 670cee36a03SChris Mason spin_unlock(&root->fs_info->new_trans_lock); 6714b52dff6SChris Mason btrfs_set_super_generation(&root->fs_info->super_copy, 6724b52dff6SChris Mason cur_trans->transid); 6734b52dff6SChris Mason btrfs_set_super_root(&root->fs_info->super_copy, 674db94535dSChris Mason 
root->fs_info->tree_root->node->start); 675db94535dSChris Mason btrfs_set_super_root_level(&root->fs_info->super_copy, 676db94535dSChris Mason btrfs_header_level(root->fs_info->tree_root->node)); 6775f39d397SChris Mason 6780b86a832SChris Mason btrfs_set_super_chunk_root(&root->fs_info->super_copy, 6790b86a832SChris Mason chunk_root->node->start); 6800b86a832SChris Mason btrfs_set_super_chunk_root_level(&root->fs_info->super_copy, 6810b86a832SChris Mason btrfs_header_level(chunk_root->node)); 682a061fc8dSChris Mason memcpy(&root->fs_info->super_for_commit, &root->fs_info->super_copy, 6834b52dff6SChris Mason sizeof(root->fs_info->super_copy)); 684ccd467d6SChris Mason 6854313b399SChris Mason btrfs_copy_pinned(root, pinned_copy); 686ccd467d6SChris Mason 687e6dcd2dcSChris Mason wake_up(&root->fs_info->transaction_throttle); 688e6dcd2dcSChris Mason 68978fae27eSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 69079154b1bSChris Mason ret = btrfs_write_and_wait_transaction(trans, root); 69179154b1bSChris Mason BUG_ON(ret); 69279154b1bSChris Mason write_ctree_super(trans, root); 6934313b399SChris Mason 6944313b399SChris Mason btrfs_finish_extent_commit(trans, root, pinned_copy); 69578fae27eSChris Mason mutex_lock(&root->fs_info->trans_mutex); 6964313b399SChris Mason 6974313b399SChris Mason kfree(pinned_copy); 6984313b399SChris Mason 6992c90e5d6SChris Mason cur_trans->commit_done = 1; 70015ee9bc7SJosef Bacik root->fs_info->last_trans_committed = cur_trans->transid; 7012c90e5d6SChris Mason wake_up(&cur_trans->commit_wait); 70279154b1bSChris Mason put_transaction(cur_trans); 70378fae27eSChris Mason put_transaction(cur_trans); 70458176a96SJosef Bacik 705facda1e7SChris Mason if (root->fs_info->closing) 706facda1e7SChris Mason list_splice_init(&root->fs_info->dead_roots, &dirty_fs_roots); 707facda1e7SChris Mason else 708facda1e7SChris Mason list_splice_init(&dirty_fs_roots, &root->fs_info->dead_roots); 70958176a96SJosef Bacik 71078fae27eSChris Mason 
mutex_unlock(&root->fs_info->trans_mutex); 711e6dcd2dcSChris Mason printk("done commit trans %Lu\n", trans->transid); 7122c90e5d6SChris Mason kmem_cache_free(btrfs_trans_handle_cachep, trans); 71379154b1bSChris Mason 714facda1e7SChris Mason if (root->fs_info->closing) { 7150f7d52f4SChris Mason drop_dirty_roots(root->fs_info->tree_root, &dirty_fs_roots); 716facda1e7SChris Mason } 71779154b1bSChris Mason return ret; 71879154b1bSChris Mason } 71979154b1bSChris Mason 720e9d0b13bSChris Mason /*
 * btrfs_clean_old_snapshots - drain root->fs_info->dead_roots.
 *
 * Each pass moves the current contents of root->fs_info->dead_roots onto a
 * function-local list while holding fs_info->trans_mutex, then hands that
 * local list to drop_dirty_roots() after the mutex has been released.  The
 * pass is repeated until the local list is empty right after a splice, so
 * entries queued on dead_roots while a drop pass was running are picked up
 * by the next pass.
 *
 * @root: root whose fs_info owns dead_roots and trans_mutex; it is also
 *        passed unchanged to drop_dirty_roots().
 *
 * The return value of drop_dirty_roots(), if any, is not examined here.
 * Always returns 0.
 */ int btrfs_clean_old_snapshots(struct btrfs_root *root) 721e9d0b13bSChris Mason { 722e9d0b13bSChris Mason struct list_head dirty_roots; 723e9d0b13bSChris Mason INIT_LIST_HEAD(&dirty_roots); 724a74a4b97SChris Mason again: /* retry point: dead_roots is re-read after every drop pass */ 725e9d0b13bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 726e9d0b13bSChris Mason /* take the whole list in one step; list_splice_init() leaves dead_roots empty */ list_splice_init(&root->fs_info->dead_roots, &dirty_roots); 727e9d0b13bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 728e9d0b13bSChris Mason 729e9d0b13bSChris Mason if (!list_empty(&dirty_roots)) { 730e9d0b13bSChris Mason /* trans_mutex is not held across this call */ drop_dirty_roots(root, &dirty_roots); 731a74a4b97SChris Mason goto again; 732e9d0b13bSChris Mason } 733e9d0b13bSChris Mason return 0; 734e9d0b13bSChris Mason } 73508607c1bSChris Mason 736