16cbd5570SChris Mason /* 26cbd5570SChris Mason * Copyright (C) 2007 Oracle. All rights reserved. 36cbd5570SChris Mason * 46cbd5570SChris Mason * This program is free software; you can redistribute it and/or 56cbd5570SChris Mason * modify it under the terms of the GNU General Public 66cbd5570SChris Mason * License v2 as published by the Free Software Foundation. 76cbd5570SChris Mason * 86cbd5570SChris Mason * This program is distributed in the hope that it will be useful, 96cbd5570SChris Mason * but WITHOUT ANY WARRANTY; without even the implied warranty of 106cbd5570SChris Mason * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 116cbd5570SChris Mason * General Public License for more details. 126cbd5570SChris Mason * 136cbd5570SChris Mason * You should have received a copy of the GNU General Public 146cbd5570SChris Mason * License along with this program; if not, write to the 156cbd5570SChris Mason * Free Software Foundation, Inc., 59 Temple Place - Suite 330, 166cbd5570SChris Mason * Boston, MA 021110-1307, USA. 176cbd5570SChris Mason */ 186cbd5570SChris Mason 1979154b1bSChris Mason #include <linux/fs.h> 2034088780SChris Mason #include <linux/sched.h> 21d3c2fdcfSChris Mason #include <linux/writeback.h> 225f39d397SChris Mason #include <linux/pagemap.h> 2379154b1bSChris Mason #include "ctree.h" 2479154b1bSChris Mason #include "disk-io.h" 2579154b1bSChris Mason #include "transaction.h" 26925baeddSChris Mason #include "locking.h" 2779154b1bSChris Mason 2878fae27eSChris Mason static int total_trans = 0; 292c90e5d6SChris Mason extern struct kmem_cache *btrfs_trans_handle_cachep; 302c90e5d6SChris Mason extern struct kmem_cache *btrfs_transaction_cachep; 312c90e5d6SChris Mason 320f7d52f4SChris Mason #define BTRFS_ROOT_TRANS_TAG 0 330f7d52f4SChris Mason 3480b6794dSChris Mason static noinline void put_transaction(struct btrfs_transaction *transaction) 3579154b1bSChris Mason { 362c90e5d6SChris Mason WARN_ON(transaction->use_count == 0); 3779154b1bSChris Mason transaction->use_count--; 3878fae27eSChris Mason if (transaction->use_count == 0) { 3978fae27eSChris Mason WARN_ON(total_trans == 0); 4078fae27eSChris Mason total_trans--; 418fd17795SChris Mason list_del_init(&transaction->list); 422c90e5d6SChris Mason memset(transaction, 0, sizeof(*transaction)); 432c90e5d6SChris Mason kmem_cache_free(btrfs_transaction_cachep, transaction); 4479154b1bSChris Mason } 4578fae27eSChris Mason } 4679154b1bSChris Mason 4780b6794dSChris Mason static noinline int join_transaction(struct btrfs_root *root) 4879154b1bSChris Mason { 4979154b1bSChris Mason struct btrfs_transaction *cur_trans; 5079154b1bSChris Mason cur_trans = root->fs_info->running_transaction; 5179154b1bSChris Mason if (!cur_trans) { 522c90e5d6SChris Mason cur_trans = kmem_cache_alloc(btrfs_transaction_cachep, 532c90e5d6SChris Mason GFP_NOFS); 5478fae27eSChris Mason total_trans++; 5579154b1bSChris Mason BUG_ON(!cur_trans); 560f7d52f4SChris Mason root->fs_info->generation++; 57e18e4809SChris Mason root->fs_info->last_alloc = 0; 584529ba49SChris Mason root->fs_info->last_data_alloc = 0; 5915ee9bc7SJosef Bacik cur_trans->num_writers = 1; 6015ee9bc7SJosef Bacik cur_trans->num_joined = 0; 610f7d52f4SChris Mason cur_trans->transid = root->fs_info->generation; 6279154b1bSChris Mason init_waitqueue_head(&cur_trans->writer_wait); 6379154b1bSChris Mason init_waitqueue_head(&cur_trans->commit_wait); 6479154b1bSChris Mason cur_trans->in_commit = 0; 65d5719762SChris Mason cur_trans->use_count = 1; 6679154b1bSChris Mason cur_trans->commit_done = 0; 6708607c1bSChris Mason cur_trans->start_time = get_seconds(); 683063d29fSChris Mason INIT_LIST_HEAD(&cur_trans->pending_snapshots); 698fd17795SChris Mason list_add_tail(&cur_trans->list, &root->fs_info->trans_list); 70dc17ff8fSChris Mason btrfs_ordered_inode_tree_init(&cur_trans->ordered_inode_tree); 71d1310b2eSChris Mason extent_io_tree_init(&cur_trans->dirty_pages, 725f39d397SChris Mason root->fs_info->btree_inode->i_mapping, 735f39d397SChris Mason GFP_NOFS); 7448ec2cf8SChris Mason spin_lock(&root->fs_info->new_trans_lock); 7548ec2cf8SChris Mason root->fs_info->running_transaction = cur_trans; 7648ec2cf8SChris Mason spin_unlock(&root->fs_info->new_trans_lock); 7715ee9bc7SJosef Bacik } else { 7879154b1bSChris Mason cur_trans->num_writers++; 7915ee9bc7SJosef Bacik cur_trans->num_joined++; 8015ee9bc7SJosef Bacik } 8115ee9bc7SJosef Bacik 8279154b1bSChris Mason return 0; 8379154b1bSChris Mason } 8479154b1bSChris Mason 8580b6794dSChris Mason static noinline int record_root_in_trans(struct btrfs_root *root) 866702ed49SChris Mason { 876702ed49SChris Mason u64 running_trans_id = root->fs_info->running_transaction->transid; 886702ed49SChris Mason if (root->ref_cows && root->last_trans < running_trans_id) { 896702ed49SChris Mason WARN_ON(root == root->fs_info->extent_root); 906702ed49SChris Mason if (root->root_item.refs != 0) { 916702ed49SChris Mason radix_tree_tag_set(&root->fs_info->fs_roots_radix, 926702ed49SChris Mason (unsigned long)root->root_key.objectid, 936702ed49SChris Mason BTRFS_ROOT_TRANS_TAG); 94925baeddSChris Mason root->commit_root = btrfs_root_node(root); 956702ed49SChris Mason } else { 966702ed49SChris Mason WARN_ON(1); 976702ed49SChris Mason } 986702ed49SChris Mason root->last_trans = running_trans_id; 996702ed49SChris Mason } 1006702ed49SChris Mason return 0; 1016702ed49SChris Mason } 1026702ed49SChris Mason 10379154b1bSChris Mason struct btrfs_trans_handle *btrfs_start_transaction(struct btrfs_root *root, 10479154b1bSChris Mason int num_blocks) 10579154b1bSChris Mason { 1062c90e5d6SChris Mason struct btrfs_trans_handle *h = 1072c90e5d6SChris Mason kmem_cache_alloc(btrfs_trans_handle_cachep, GFP_NOFS); 10879154b1bSChris Mason int ret; 10979154b1bSChris Mason 11079154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 11179154b1bSChris Mason ret = join_transaction(root); 11279154b1bSChris Mason BUG_ON(ret); 1130f7d52f4SChris Mason 1146702ed49SChris Mason record_root_in_trans(root); 1156702ed49SChris Mason h->transid = root->fs_info->running_transaction->transid; 11679154b1bSChris Mason h->transaction = root->fs_info->running_transaction; 11779154b1bSChris Mason h->blocks_reserved = num_blocks; 11879154b1bSChris Mason h->blocks_used = 0; 11931f3c99bSChris Mason h->block_group = NULL; 12026b8003fSChris Mason h->alloc_exclude_nr = 0; 12126b8003fSChris Mason h->alloc_exclude_start = 0; 12279154b1bSChris Mason root->fs_info->running_transaction->use_count++; 12379154b1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 12479154b1bSChris Mason return h; 12579154b1bSChris Mason } 12679154b1bSChris Mason 12789ce8a63SChris Mason static noinline int wait_for_commit(struct btrfs_root *root, 12889ce8a63SChris Mason struct btrfs_transaction *commit) 12989ce8a63SChris Mason { 13089ce8a63SChris Mason DEFINE_WAIT(wait); 13189ce8a63SChris Mason mutex_lock(&root->fs_info->trans_mutex); 13289ce8a63SChris Mason while(!commit->commit_done) { 13389ce8a63SChris Mason prepare_to_wait(&commit->commit_wait, &wait, 13489ce8a63SChris Mason TASK_UNINTERRUPTIBLE); 13589ce8a63SChris Mason if (commit->commit_done) 13689ce8a63SChris Mason break; 13789ce8a63SChris Mason mutex_unlock(&root->fs_info->trans_mutex); 13889ce8a63SChris Mason schedule(); 13989ce8a63SChris Mason mutex_lock(&root->fs_info->trans_mutex); 14089ce8a63SChris Mason } 14189ce8a63SChris Mason mutex_unlock(&root->fs_info->trans_mutex); 14289ce8a63SChris Mason finish_wait(&commit->commit_wait, &wait); 14389ce8a63SChris Mason return 0; 14489ce8a63SChris Mason } 14589ce8a63SChris Mason 14689ce8a63SChris Mason static int __btrfs_end_transaction(struct btrfs_trans_handle *trans, 14789ce8a63SChris Mason struct btrfs_root *root, int throttle) 14879154b1bSChris Mason { 14979154b1bSChris Mason struct btrfs_transaction *cur_trans; 150d6e4a428SChris Mason 15179154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 15279154b1bSChris Mason cur_trans = root->fs_info->running_transaction; 153ccd467d6SChris Mason WARN_ON(cur_trans != trans->transaction); 154d5719762SChris Mason WARN_ON(cur_trans->num_writers < 1); 155ccd467d6SChris Mason cur_trans->num_writers--; 15689ce8a63SChris Mason 15779154b1bSChris Mason if (waitqueue_active(&cur_trans->writer_wait)) 15879154b1bSChris Mason wake_up(&cur_trans->writer_wait); 15989ce8a63SChris Mason 16089ce8a63SChris Mason if (cur_trans->in_commit && throttle) { 16189ce8a63SChris Mason int ret; 16289ce8a63SChris Mason mutex_unlock(&root->fs_info->trans_mutex); 16389ce8a63SChris Mason ret = wait_for_commit(root, cur_trans); 16489ce8a63SChris Mason BUG_ON(ret); 16589ce8a63SChris Mason mutex_lock(&root->fs_info->trans_mutex); 16689ce8a63SChris Mason } 16789ce8a63SChris Mason 16879154b1bSChris Mason put_transaction(cur_trans); 16979154b1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 170d6025579SChris Mason memset(trans, 0, sizeof(*trans)); 1712c90e5d6SChris Mason kmem_cache_free(btrfs_trans_handle_cachep, trans); 17279154b1bSChris Mason return 0; 17379154b1bSChris Mason } 17479154b1bSChris Mason 17589ce8a63SChris Mason int btrfs_end_transaction(struct btrfs_trans_handle *trans, 17689ce8a63SChris Mason struct btrfs_root *root) 17789ce8a63SChris Mason { 17889ce8a63SChris Mason return __btrfs_end_transaction(trans, root, 0); 17989ce8a63SChris Mason } 18089ce8a63SChris Mason 18189ce8a63SChris Mason int btrfs_end_transaction_throttle(struct btrfs_trans_handle *trans, 18289ce8a63SChris Mason struct btrfs_root *root) 18389ce8a63SChris Mason { 18489ce8a63SChris Mason return __btrfs_end_transaction(trans, root, 1); 18589ce8a63SChris Mason } 18689ce8a63SChris Mason 18779154b1bSChris Mason 18879154b1bSChris Mason int btrfs_write_and_wait_transaction(struct btrfs_trans_handle *trans, 18979154b1bSChris Mason struct btrfs_root *root) 19079154b1bSChris Mason { 1917c4452b9SChris Mason int ret; 1927c4452b9SChris Mason int err; 1937c4452b9SChris Mason int werr = 0; 194d1310b2eSChris Mason struct extent_io_tree *dirty_pages; 1957c4452b9SChris Mason struct page *page; 1967c4452b9SChris Mason struct inode *btree_inode = root->fs_info->btree_inode; 1975f39d397SChris Mason u64 start; 1985f39d397SChris Mason u64 end; 1995f39d397SChris Mason unsigned long index; 2007c4452b9SChris Mason 2017c4452b9SChris Mason if (!trans || !trans->transaction) { 2027c4452b9SChris Mason return filemap_write_and_wait(btree_inode->i_mapping); 2037c4452b9SChris Mason } 2047c4452b9SChris Mason dirty_pages = &trans->transaction->dirty_pages; 2057c4452b9SChris Mason while(1) { 2065f39d397SChris Mason ret = find_first_extent_bit(dirty_pages, 0, &start, &end, 2075f39d397SChris Mason EXTENT_DIRTY); 2085f39d397SChris Mason if (ret) 2097c4452b9SChris Mason break; 2105f39d397SChris Mason clear_extent_dirty(dirty_pages, start, end, GFP_NOFS); 2115f39d397SChris Mason while(start <= end) { 2125f39d397SChris Mason index = start >> PAGE_CACHE_SHIFT; 21335ebb934SChris Mason start = (u64)(index + 1) << PAGE_CACHE_SHIFT; 2145f39d397SChris Mason page = find_lock_page(btree_inode->i_mapping, index); 2157c4452b9SChris Mason if (!page) 2167c4452b9SChris Mason continue; 2176702ed49SChris Mason if (PageWriteback(page)) { 2186702ed49SChris Mason if (PageDirty(page)) 2196702ed49SChris Mason wait_on_page_writeback(page); 2206702ed49SChris Mason else { 2216702ed49SChris Mason unlock_page(page); 2226702ed49SChris Mason page_cache_release(page); 2236702ed49SChris Mason continue; 2246702ed49SChris Mason } 2256702ed49SChris Mason } 2267c4452b9SChris Mason err = write_one_page(page, 0); 2277c4452b9SChris Mason if (err) 2287c4452b9SChris Mason werr = err; 2297c4452b9SChris Mason page_cache_release(page); 2307c4452b9SChris Mason } 2317c4452b9SChris Mason } 2327c4452b9SChris Mason err = filemap_fdatawait(btree_inode->i_mapping); 2337c4452b9SChris Mason if (err) 2347c4452b9SChris Mason werr = err; 2357c4452b9SChris Mason return werr; 23679154b1bSChris Mason } 23779154b1bSChris Mason 2380b86a832SChris Mason static int update_cowonly_root(struct btrfs_trans_handle *trans, 23979154b1bSChris Mason struct btrfs_root *root) 24079154b1bSChris Mason { 24179154b1bSChris Mason int ret; 2420b86a832SChris Mason u64 old_root_bytenr; 2430b86a832SChris Mason struct btrfs_root *tree_root = root->fs_info->tree_root; 24479154b1bSChris Mason 2450b86a832SChris Mason btrfs_write_dirty_block_groups(trans, root); 24679154b1bSChris Mason while(1) { 2470b86a832SChris Mason old_root_bytenr = btrfs_root_bytenr(&root->root_item); 2480b86a832SChris Mason if (old_root_bytenr == root->node->start) 24979154b1bSChris Mason break; 2500b86a832SChris Mason btrfs_set_root_bytenr(&root->root_item, 2510b86a832SChris Mason root->node->start); 2520b86a832SChris Mason btrfs_set_root_level(&root->root_item, 2530b86a832SChris Mason btrfs_header_level(root->node)); 25479154b1bSChris Mason ret = btrfs_update_root(trans, tree_root, 2550b86a832SChris Mason &root->root_key, 2560b86a832SChris Mason &root->root_item); 25779154b1bSChris Mason BUG_ON(ret); 2580b86a832SChris Mason btrfs_write_dirty_block_groups(trans, root); 2590b86a832SChris Mason } 2600b86a832SChris Mason return 0; 2610b86a832SChris Mason } 2620b86a832SChris Mason 2630b86a832SChris Mason int btrfs_commit_tree_roots(struct btrfs_trans_handle *trans, 2640b86a832SChris Mason struct btrfs_root *root) 2650b86a832SChris Mason { 2660b86a832SChris Mason struct btrfs_fs_info *fs_info = root->fs_info; 2670b86a832SChris Mason struct list_head *next; 2680b86a832SChris Mason 2690b86a832SChris Mason while(!list_empty(&fs_info->dirty_cowonly_roots)) { 2700b86a832SChris Mason next = fs_info->dirty_cowonly_roots.next; 2710b86a832SChris Mason list_del_init(next); 2720b86a832SChris Mason root = list_entry(next, struct btrfs_root, dirty_list); 2730b86a832SChris Mason update_cowonly_root(trans, root); 27479154b1bSChris Mason } 27579154b1bSChris Mason return 0; 27679154b1bSChris Mason } 27779154b1bSChris Mason 2780f7d52f4SChris Mason struct dirty_root { 2790f7d52f4SChris Mason struct list_head list; 2800f7d52f4SChris Mason struct btrfs_root *root; 28158176a96SJosef Bacik struct btrfs_root *latest_root; 2820f7d52f4SChris Mason }; 2830f7d52f4SChris Mason 2845ce14bbcSChris Mason int btrfs_add_dead_root(struct btrfs_root *root, 2855ce14bbcSChris Mason struct btrfs_root *latest, 2865ce14bbcSChris Mason struct list_head *dead_list) 2875eda7b5eSChris Mason { 2885eda7b5eSChris Mason struct dirty_root *dirty; 2895eda7b5eSChris Mason 2905eda7b5eSChris Mason dirty = kmalloc(sizeof(*dirty), GFP_NOFS); 2915eda7b5eSChris Mason if (!dirty) 2925eda7b5eSChris Mason return -ENOMEM; 2935eda7b5eSChris Mason dirty->root = root; 2945ce14bbcSChris Mason dirty->latest_root = latest; 2955eda7b5eSChris Mason list_add(&dirty->list, dead_list); 2965eda7b5eSChris Mason return 0; 2975eda7b5eSChris Mason } 2985eda7b5eSChris Mason 29980b6794dSChris Mason static noinline int add_dirty_roots(struct btrfs_trans_handle *trans, 30035b7e476SChris Mason struct radix_tree_root *radix, 30135b7e476SChris Mason struct list_head *list) 3020f7d52f4SChris Mason { 3030f7d52f4SChris Mason struct dirty_root *dirty; 3040f7d52f4SChris Mason struct btrfs_root *gang[8]; 3050f7d52f4SChris Mason struct btrfs_root *root; 3060f7d52f4SChris Mason int i; 3070f7d52f4SChris Mason int ret; 30854aa1f4dSChris Mason int err = 0; 3095eda7b5eSChris Mason u32 refs; 31054aa1f4dSChris Mason 3110f7d52f4SChris Mason while(1) { 3120f7d52f4SChris Mason ret = radix_tree_gang_lookup_tag(radix, (void **)gang, 0, 3130f7d52f4SChris Mason ARRAY_SIZE(gang), 3140f7d52f4SChris Mason BTRFS_ROOT_TRANS_TAG); 3150f7d52f4SChris Mason if (ret == 0) 3160f7d52f4SChris Mason break; 3170f7d52f4SChris Mason for (i = 0; i < ret; i++) { 3180f7d52f4SChris Mason root = gang[i]; 3192619ba1fSChris Mason radix_tree_tag_clear(radix, 3202619ba1fSChris Mason (unsigned long)root->root_key.objectid, 3210f7d52f4SChris Mason BTRFS_ROOT_TRANS_TAG); 3220f7d52f4SChris Mason if (root->commit_root == root->node) { 323db94535dSChris Mason WARN_ON(root->node->start != 324db94535dSChris Mason btrfs_root_bytenr(&root->root_item)); 3255f39d397SChris Mason free_extent_buffer(root->commit_root); 3260f7d52f4SChris Mason root->commit_root = NULL; 32758176a96SJosef Bacik 32858176a96SJosef Bacik /* make sure to update the root on disk 32958176a96SJosef Bacik * so we get any updates to the block used 33058176a96SJosef Bacik * counts 33158176a96SJosef Bacik */ 33258176a96SJosef Bacik err = btrfs_update_root(trans, 33358176a96SJosef Bacik root->fs_info->tree_root, 33458176a96SJosef Bacik &root->root_key, 33558176a96SJosef Bacik &root->root_item); 3360f7d52f4SChris Mason continue; 3370f7d52f4SChris Mason } 3380f7d52f4SChris Mason dirty = kmalloc(sizeof(*dirty), GFP_NOFS); 3390f7d52f4SChris Mason BUG_ON(!dirty); 3409f3a7427SChris Mason dirty->root = kmalloc(sizeof(*dirty->root), GFP_NOFS); 3419f3a7427SChris Mason BUG_ON(!dirty->root); 3429f3a7427SChris Mason 3439f3a7427SChris Mason memset(&root->root_item.drop_progress, 0, 3449f3a7427SChris Mason sizeof(struct btrfs_disk_key)); 3459f3a7427SChris Mason root->root_item.drop_level = 0; 3469f3a7427SChris Mason 3479f3a7427SChris Mason memcpy(dirty->root, root, sizeof(*root)); 3489f3a7427SChris Mason dirty->root->node = root->commit_root; 34958176a96SJosef Bacik dirty->latest_root = root; 3500f7d52f4SChris Mason root->commit_root = NULL; 3515eda7b5eSChris Mason 3520f7d52f4SChris Mason root->root_key.offset = root->fs_info->generation; 353db94535dSChris Mason btrfs_set_root_bytenr(&root->root_item, 354db94535dSChris Mason root->node->start); 355db94535dSChris Mason btrfs_set_root_level(&root->root_item, 356db94535dSChris Mason btrfs_header_level(root->node)); 3570f7d52f4SChris Mason err = btrfs_insert_root(trans, root->fs_info->tree_root, 3580f7d52f4SChris Mason &root->root_key, 3590f7d52f4SChris Mason &root->root_item); 36054aa1f4dSChris Mason if (err) 36154aa1f4dSChris Mason break; 3629f3a7427SChris Mason 3639f3a7427SChris Mason refs = btrfs_root_refs(&dirty->root->root_item); 3649f3a7427SChris Mason btrfs_set_root_refs(&dirty->root->root_item, refs - 1); 3655eda7b5eSChris Mason err = btrfs_update_root(trans, root->fs_info->tree_root, 3669f3a7427SChris Mason &dirty->root->root_key, 3679f3a7427SChris Mason &dirty->root->root_item); 3685eda7b5eSChris Mason 3695eda7b5eSChris Mason BUG_ON(err); 3709f3a7427SChris Mason if (refs == 1) { 3710f7d52f4SChris Mason list_add(&dirty->list, list); 3729f3a7427SChris Mason } else { 3739f3a7427SChris Mason WARN_ON(1); 3749f3a7427SChris Mason kfree(dirty->root); 3755eda7b5eSChris Mason kfree(dirty); 3760f7d52f4SChris Mason } 3770f7d52f4SChris Mason } 3789f3a7427SChris Mason } 37954aa1f4dSChris Mason return err; 3800f7d52f4SChris Mason } 3810f7d52f4SChris Mason 382e9d0b13bSChris Mason int btrfs_defrag_root(struct btrfs_root *root, int cacheonly) 383e9d0b13bSChris Mason { 384e9d0b13bSChris Mason struct btrfs_fs_info *info = root->fs_info; 385e9d0b13bSChris Mason int ret; 386e9d0b13bSChris Mason struct btrfs_trans_handle *trans; 387d3c2fdcfSChris Mason unsigned long nr; 388e9d0b13bSChris Mason 389a2135011SChris Mason smp_mb(); 390e9d0b13bSChris Mason if (root->defrag_running) 391e9d0b13bSChris Mason return 0; 392e9d0b13bSChris Mason trans = btrfs_start_transaction(root, 1); 3936b80053dSChris Mason while (1) { 394e9d0b13bSChris Mason root->defrag_running = 1; 395e9d0b13bSChris Mason ret = btrfs_defrag_leaves(trans, root, cacheonly); 396d3c2fdcfSChris Mason nr = trans->blocks_used; 397e9d0b13bSChris Mason btrfs_end_transaction(trans, root); 398d3c2fdcfSChris Mason btrfs_btree_balance_dirty(info->tree_root, nr); 399e9d0b13bSChris Mason cond_resched(); 400e9d0b13bSChris Mason 401e9d0b13bSChris Mason trans = btrfs_start_transaction(root, 1); 4023f157a2fSChris Mason if (root->fs_info->closing || ret != -EAGAIN) 403e9d0b13bSChris Mason break; 404e9d0b13bSChris Mason } 405e9d0b13bSChris Mason root->defrag_running = 0; 406a2135011SChris Mason smp_mb(); 407e9d0b13bSChris Mason btrfs_end_transaction(trans, root); 408e9d0b13bSChris Mason return 0; 409e9d0b13bSChris Mason } 410e9d0b13bSChris Mason 41180b6794dSChris Mason static noinline int drop_dirty_roots(struct btrfs_root *tree_root, 41235b7e476SChris Mason struct list_head *list) 4130f7d52f4SChris Mason { 4140f7d52f4SChris Mason struct dirty_root *dirty; 4150f7d52f4SChris Mason struct btrfs_trans_handle *trans; 416d3c2fdcfSChris Mason unsigned long nr; 417db94535dSChris Mason u64 num_bytes; 418db94535dSChris Mason u64 bytes_used; 41954aa1f4dSChris Mason int ret = 0; 4209f3a7427SChris Mason int err; 4219f3a7427SChris Mason 4220f7d52f4SChris Mason while(!list_empty(list)) { 42358176a96SJosef Bacik struct btrfs_root *root; 42458176a96SJosef Bacik 4250f7d52f4SChris Mason dirty = list_entry(list->next, struct dirty_root, list); 4260f7d52f4SChris Mason list_del_init(&dirty->list); 4275eda7b5eSChris Mason 428db94535dSChris Mason num_bytes = btrfs_root_used(&dirty->root->root_item); 42958176a96SJosef Bacik root = dirty->latest_root; 430a2135011SChris Mason atomic_inc(&root->fs_info->throttles); 43158176a96SJosef Bacik 432a2135011SChris Mason mutex_lock(&root->fs_info->drop_mutex); 4339f3a7427SChris Mason while(1) { 4340f7d52f4SChris Mason trans = btrfs_start_transaction(tree_root, 1); 4359f3a7427SChris Mason ret = btrfs_drop_snapshot(trans, dirty->root); 4369f3a7427SChris Mason if (ret != -EAGAIN) { 4379f3a7427SChris Mason break; 4389f3a7427SChris Mason } 43958176a96SJosef Bacik 4409f3a7427SChris Mason err = btrfs_update_root(trans, 4419f3a7427SChris Mason tree_root, 4429f3a7427SChris Mason &dirty->root->root_key, 4439f3a7427SChris Mason &dirty->root->root_item); 4449f3a7427SChris Mason if (err) 4459f3a7427SChris Mason ret = err; 446d3c2fdcfSChris Mason nr = trans->blocks_used; 4471b1e2135SChris Mason ret = btrfs_end_transaction_throttle(trans, tree_root); 4480f7d52f4SChris Mason BUG_ON(ret); 449a2135011SChris Mason 450a2135011SChris Mason mutex_unlock(&root->fs_info->drop_mutex); 451d3c2fdcfSChris Mason btrfs_btree_balance_dirty(tree_root, nr); 4524dc11904SChris Mason cond_resched(); 453a2135011SChris Mason mutex_lock(&root->fs_info->drop_mutex); 4549f3a7427SChris Mason } 4559f3a7427SChris Mason BUG_ON(ret); 456a2135011SChris Mason atomic_dec(&root->fs_info->throttles); 45758176a96SJosef Bacik 458a2135011SChris Mason mutex_lock(&root->fs_info->alloc_mutex); 459db94535dSChris Mason num_bytes -= btrfs_root_used(&dirty->root->root_item); 460db94535dSChris Mason bytes_used = btrfs_root_used(&root->root_item); 461db94535dSChris Mason if (num_bytes) { 46258176a96SJosef Bacik record_root_in_trans(root); 4635f39d397SChris Mason btrfs_set_root_used(&root->root_item, 464db94535dSChris Mason bytes_used - num_bytes); 46558176a96SJosef Bacik } 466a2135011SChris Mason mutex_unlock(&root->fs_info->alloc_mutex); 467a2135011SChris Mason 4689f3a7427SChris Mason ret = btrfs_del_root(trans, tree_root, &dirty->root->root_key); 46958176a96SJosef Bacik if (ret) { 47058176a96SJosef Bacik BUG(); 47154aa1f4dSChris Mason break; 47258176a96SJosef Bacik } 473a2135011SChris Mason mutex_unlock(&root->fs_info->drop_mutex); 474a2135011SChris Mason 475d3c2fdcfSChris Mason nr = trans->blocks_used; 4760f7d52f4SChris Mason ret = btrfs_end_transaction(trans, tree_root); 4770f7d52f4SChris Mason BUG_ON(ret); 4785eda7b5eSChris Mason 479f510cfecSChris Mason free_extent_buffer(dirty->root->node); 4805eda7b5eSChris Mason kfree(dirty->root); 4810f7d52f4SChris Mason kfree(dirty); 482d3c2fdcfSChris Mason 483d3c2fdcfSChris Mason btrfs_btree_balance_dirty(tree_root, nr); 4844dc11904SChris Mason cond_resched(); 4850f7d52f4SChris Mason } 48654aa1f4dSChris Mason return ret; 4870f7d52f4SChris Mason } 4880f7d52f4SChris Mason 489dc17ff8fSChris Mason int btrfs_write_ordered_inodes(struct btrfs_trans_handle *trans, 490dc17ff8fSChris Mason struct btrfs_root *root) 491dc17ff8fSChris Mason { 492dc17ff8fSChris Mason struct btrfs_transaction *cur_trans = trans->transaction; 493dc17ff8fSChris Mason struct inode *inode; 494dc17ff8fSChris Mason u64 root_objectid = 0; 495dc17ff8fSChris Mason u64 objectid = 0; 496dc17ff8fSChris Mason int ret; 497dc17ff8fSChris Mason 498a2135011SChris Mason atomic_inc(&root->fs_info->throttles); 499dc17ff8fSChris Mason while(1) { 500dc17ff8fSChris Mason ret = btrfs_find_first_ordered_inode( 501dc17ff8fSChris Mason &cur_trans->ordered_inode_tree, 5024d5e74bcSChris Mason &root_objectid, &objectid, &inode); 503dc17ff8fSChris Mason if (!ret) 504dc17ff8fSChris Mason break; 505dc17ff8fSChris Mason 506dc17ff8fSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 5074d5e74bcSChris Mason 50881d7ed29SChris Mason if (S_ISREG(inode->i_mode)) { 50981d7ed29SChris Mason atomic_inc(&BTRFS_I(inode)->ordered_writeback); 510dc17ff8fSChris Mason filemap_fdatawrite(inode->i_mapping); 51181d7ed29SChris Mason atomic_dec(&BTRFS_I(inode)->ordered_writeback); 51281d7ed29SChris Mason } 513dc17ff8fSChris Mason iput(inode); 5144d5e74bcSChris Mason 515dc17ff8fSChris Mason mutex_lock(&root->fs_info->trans_mutex); 516dc17ff8fSChris Mason } 517dc17ff8fSChris Mason while(1) { 518dc17ff8fSChris Mason root_objectid = 0; 519dc17ff8fSChris Mason objectid = 0; 520dc17ff8fSChris Mason ret = btrfs_find_del_first_ordered_inode( 521dc17ff8fSChris Mason &cur_trans->ordered_inode_tree, 5224d5e74bcSChris Mason &root_objectid, &objectid, &inode); 523dc17ff8fSChris Mason if (!ret) 524dc17ff8fSChris Mason break; 525dc17ff8fSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 5264d5e74bcSChris Mason 52781d7ed29SChris Mason if (S_ISREG(inode->i_mode)) { 52881d7ed29SChris Mason atomic_inc(&BTRFS_I(inode)->ordered_writeback); 529dc17ff8fSChris Mason filemap_write_and_wait(inode->i_mapping); 53081d7ed29SChris Mason atomic_dec(&BTRFS_I(inode)->ordered_writeback); 53181d7ed29SChris Mason } 5322da98f00SChris Mason atomic_dec(&inode->i_count); 533dc17ff8fSChris Mason iput(inode); 5344d5e74bcSChris Mason 535dc17ff8fSChris Mason mutex_lock(&root->fs_info->trans_mutex); 536dc17ff8fSChris Mason } 537a2135011SChris Mason atomic_dec(&root->fs_info->throttles); 5383063d29fSChris Mason return 0; 5393063d29fSChris Mason } 5403063d29fSChris Mason 54180b6794dSChris Mason static noinline int create_pending_snapshot(struct btrfs_trans_handle *trans, 5423063d29fSChris Mason struct btrfs_fs_info *fs_info, 5433063d29fSChris Mason struct btrfs_pending_snapshot *pending) 5443063d29fSChris Mason { 5453063d29fSChris Mason struct btrfs_key key; 54680b6794dSChris Mason struct btrfs_root_item *new_root_item; 5473063d29fSChris Mason struct btrfs_root *tree_root = fs_info->tree_root; 5483063d29fSChris Mason struct btrfs_root *root = pending->root; 5493063d29fSChris Mason struct extent_buffer *tmp; 550925baeddSChris Mason struct extent_buffer *old; 5513063d29fSChris Mason int ret; 5523b96362cSSven Wegener int namelen; 5533063d29fSChris Mason u64 objectid; 5543063d29fSChris Mason 55580b6794dSChris Mason new_root_item = kmalloc(sizeof(*new_root_item), GFP_NOFS); 55680b6794dSChris Mason if (!new_root_item) { 55780b6794dSChris Mason ret = -ENOMEM; 55880b6794dSChris Mason goto fail; 55980b6794dSChris Mason } 5603063d29fSChris Mason ret = btrfs_find_free_objectid(trans, tree_root, 0, &objectid); 5613063d29fSChris Mason if (ret) 5623063d29fSChris Mason goto fail; 5633063d29fSChris Mason 56480b6794dSChris Mason memcpy(new_root_item, &root->root_item, sizeof(*new_root_item)); 5653063d29fSChris Mason 5663063d29fSChris Mason key.objectid = objectid; 5673063d29fSChris Mason key.offset = 1; 5683063d29fSChris Mason btrfs_set_key_type(&key, BTRFS_ROOT_ITEM_KEY); 5693063d29fSChris Mason 570925baeddSChris Mason old = btrfs_lock_root_node(root); 571925baeddSChris Mason btrfs_cow_block(trans, root, old, NULL, 0, &old); 5723063d29fSChris Mason 573925baeddSChris Mason btrfs_copy_root(trans, root, old, &tmp, objectid); 574925baeddSChris Mason btrfs_tree_unlock(old); 575925baeddSChris Mason free_extent_buffer(old); 5763063d29fSChris Mason 57780b6794dSChris Mason btrfs_set_root_bytenr(new_root_item, tmp->start); 57880b6794dSChris Mason btrfs_set_root_level(new_root_item, btrfs_header_level(tmp)); 5793063d29fSChris Mason ret = btrfs_insert_root(trans, root->fs_info->tree_root, &key, 58080b6794dSChris Mason new_root_item); 581925baeddSChris Mason btrfs_tree_unlock(tmp); 5823063d29fSChris Mason free_extent_buffer(tmp); 5833063d29fSChris Mason if (ret) 5843063d29fSChris Mason goto fail; 5853063d29fSChris Mason 5863063d29fSChris Mason /* 5873063d29fSChris Mason * insert the directory item 5883063d29fSChris Mason */ 5893063d29fSChris Mason key.offset = (u64)-1; 5903b96362cSSven Wegener namelen = strlen(pending->name); 5913063d29fSChris Mason ret = btrfs_insert_dir_item(trans, root->fs_info->tree_root, 5923b96362cSSven Wegener pending->name, namelen, 5933063d29fSChris Mason root->fs_info->sb->s_root->d_inode->i_ino, 5943063d29fSChris Mason &key, BTRFS_FT_DIR); 5953063d29fSChris Mason 5963063d29fSChris Mason if (ret) 5973063d29fSChris Mason goto fail; 5983063d29fSChris Mason 5993063d29fSChris Mason ret = btrfs_insert_inode_ref(trans, root->fs_info->tree_root, 6003063d29fSChris Mason pending->name, strlen(pending->name), objectid, 6013063d29fSChris Mason root->fs_info->sb->s_root->d_inode->i_ino); 6023b96362cSSven Wegener 6033b96362cSSven Wegener /* Invalidate existing dcache entry for new snapshot. */ 6043b96362cSSven Wegener btrfs_invalidate_dcache_root(root, pending->name, namelen); 6053b96362cSSven Wegener 6063063d29fSChris Mason fail: 60780b6794dSChris Mason kfree(new_root_item); 6083063d29fSChris Mason return ret; 6093063d29fSChris Mason } 6103063d29fSChris Mason 61180b6794dSChris Mason static noinline int create_pending_snapshots(struct btrfs_trans_handle *trans, 6123063d29fSChris Mason struct btrfs_fs_info *fs_info) 6133063d29fSChris Mason { 6143063d29fSChris Mason struct btrfs_pending_snapshot *pending; 6153063d29fSChris Mason struct list_head *head = &trans->transaction->pending_snapshots; 6163063d29fSChris Mason int ret; 6173063d29fSChris Mason 6183063d29fSChris Mason while(!list_empty(head)) { 6193063d29fSChris Mason pending = list_entry(head->next, 6203063d29fSChris Mason struct btrfs_pending_snapshot, list); 6213063d29fSChris Mason ret = create_pending_snapshot(trans, fs_info, pending); 6223063d29fSChris Mason BUG_ON(ret); 6233063d29fSChris Mason list_del(&pending->list); 6243063d29fSChris Mason kfree(pending->name); 6253063d29fSChris Mason kfree(pending); 6263063d29fSChris Mason } 627dc17ff8fSChris Mason return 0; 628dc17ff8fSChris Mason } 629dc17ff8fSChris Mason 63079154b1bSChris Mason int btrfs_commit_transaction(struct btrfs_trans_handle *trans, 63179154b1bSChris Mason struct btrfs_root *root) 63279154b1bSChris Mason { 63315ee9bc7SJosef Bacik unsigned long joined = 0; 63415ee9bc7SJosef Bacik unsigned long timeout = 1; 63579154b1bSChris Mason struct btrfs_transaction *cur_trans; 6368fd17795SChris Mason struct btrfs_transaction *prev_trans = NULL; 6370b86a832SChris Mason struct btrfs_root *chunk_root = root->fs_info->chunk_root; 6380f7d52f4SChris Mason struct list_head dirty_fs_roots; 639d1310b2eSChris Mason struct extent_io_tree *pinned_copy; 64079154b1bSChris Mason DEFINE_WAIT(wait); 64115ee9bc7SJosef Bacik int ret; 64279154b1bSChris Mason 6430f7d52f4SChris Mason INIT_LIST_HEAD(&dirty_fs_roots); 644d6e4a428SChris Mason 64579154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 64679154b1bSChris Mason if (trans->transaction->in_commit) { 64779154b1bSChris Mason cur_trans = trans->transaction; 64879154b1bSChris Mason trans->transaction->use_count++; 649ccd467d6SChris Mason mutex_unlock(&root->fs_info->trans_mutex); 65079154b1bSChris Mason btrfs_end_transaction(trans, root); 651ccd467d6SChris Mason 65279154b1bSChris Mason ret = wait_for_commit(root, cur_trans); 65379154b1bSChris Mason BUG_ON(ret); 65415ee9bc7SJosef Bacik 65515ee9bc7SJosef Bacik mutex_lock(&root->fs_info->trans_mutex); 65679154b1bSChris Mason put_transaction(cur_trans); 65715ee9bc7SJosef Bacik mutex_unlock(&root->fs_info->trans_mutex); 65815ee9bc7SJosef Bacik 65979154b1bSChris Mason return 0; 66079154b1bSChris Mason } 6614313b399SChris Mason 6624313b399SChris Mason pinned_copy = kmalloc(sizeof(*pinned_copy), GFP_NOFS); 6634313b399SChris Mason if (!pinned_copy) 6644313b399SChris Mason return -ENOMEM; 6654313b399SChris Mason 666d1310b2eSChris Mason extent_io_tree_init(pinned_copy, 6674313b399SChris Mason root->fs_info->btree_inode->i_mapping, GFP_NOFS); 6684313b399SChris Mason 6692c90e5d6SChris Mason trans->transaction->in_commit = 1; 67089ce8a63SChris Mason printk("trans %Lu in commit\n", trans->transid); 671ccd467d6SChris Mason cur_trans = trans->transaction; 672ccd467d6SChris Mason if (cur_trans->list.prev != &root->fs_info->trans_list) { 673ccd467d6SChris Mason prev_trans = list_entry(cur_trans->list.prev, 674ccd467d6SChris Mason struct btrfs_transaction, list); 675ccd467d6SChris Mason if (!prev_trans->commit_done) { 676ccd467d6SChris Mason prev_trans->use_count++; 677ccd467d6SChris Mason mutex_unlock(&root->fs_info->trans_mutex); 678ccd467d6SChris Mason 679ccd467d6SChris Mason wait_for_commit(root, prev_trans); 680ccd467d6SChris Mason 681ccd467d6SChris Mason mutex_lock(&root->fs_info->trans_mutex); 68215ee9bc7SJosef Bacik put_transaction(prev_trans); 683ccd467d6SChris Mason } 684ccd467d6SChris Mason } 68515ee9bc7SJosef Bacik 68615ee9bc7SJosef Bacik do { 68715ee9bc7SJosef Bacik joined = cur_trans->num_joined; 6882c90e5d6SChris Mason WARN_ON(cur_trans != trans->transaction); 68915ee9bc7SJosef Bacik prepare_to_wait(&cur_trans->writer_wait, &wait, 69079154b1bSChris Mason TASK_UNINTERRUPTIBLE); 69115ee9bc7SJosef Bacik 69215ee9bc7SJosef Bacik if (cur_trans->num_writers > 1) 69315ee9bc7SJosef Bacik timeout = MAX_SCHEDULE_TIMEOUT; 69415ee9bc7SJosef Bacik else 69515ee9bc7SJosef Bacik timeout = 1; 69615ee9bc7SJosef Bacik 69779154b1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 69815ee9bc7SJosef Bacik 69915ee9bc7SJosef Bacik schedule_timeout(timeout); 70015ee9bc7SJosef Bacik 70179154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 70215ee9bc7SJosef Bacik finish_wait(&cur_trans->writer_wait, &wait); 703dc17ff8fSChris Mason ret = btrfs_write_ordered_inodes(trans, root); 704dc17ff8fSChris Mason 70515ee9bc7SJosef Bacik } while (cur_trans->num_writers > 1 || 70615ee9bc7SJosef Bacik (cur_trans->num_joined != joined)); 70715ee9bc7SJosef Bacik 7083063d29fSChris Mason ret = create_pending_snapshots(trans, root->fs_info); 7093063d29fSChris Mason BUG_ON(ret); 7103063d29fSChris Mason 7112c90e5d6SChris Mason WARN_ON(cur_trans != trans->transaction); 712dc17ff8fSChris Mason 71354aa1f4dSChris Mason ret = add_dirty_roots(trans, &root->fs_info->fs_roots_radix, 71454aa1f4dSChris Mason &dirty_fs_roots); 71554aa1f4dSChris Mason BUG_ON(ret); 71654aa1f4dSChris Mason 71779154b1bSChris Mason ret = btrfs_commit_tree_roots(trans, root); 71879154b1bSChris Mason BUG_ON(ret); 71954aa1f4dSChris Mason 72078fae27eSChris Mason cur_trans = root->fs_info->running_transaction; 721cee36a03SChris Mason spin_lock(&root->fs_info->new_trans_lock); 72278fae27eSChris Mason root->fs_info->running_transaction = NULL; 723cee36a03SChris Mason spin_unlock(&root->fs_info->new_trans_lock); 7244b52dff6SChris Mason btrfs_set_super_generation(&root->fs_info->super_copy, 7254b52dff6SChris Mason cur_trans->transid); 7264b52dff6SChris Mason btrfs_set_super_root(&root->fs_info->super_copy, 727db94535dSChris Mason root->fs_info->tree_root->node->start); 728db94535dSChris Mason btrfs_set_super_root_level(&root->fs_info->super_copy, 729db94535dSChris Mason btrfs_header_level(root->fs_info->tree_root->node)); 7305f39d397SChris Mason 7310b86a832SChris Mason btrfs_set_super_chunk_root(&root->fs_info->super_copy, 7320b86a832SChris Mason chunk_root->node->start); 7330b86a832SChris Mason btrfs_set_super_chunk_root_level(&root->fs_info->super_copy, 7340b86a832SChris Mason btrfs_header_level(chunk_root->node)); 735a061fc8dSChris Mason memcpy(&root->fs_info->super_for_commit, &root->fs_info->super_copy, 7364b52dff6SChris Mason sizeof(root->fs_info->super_copy)); 737ccd467d6SChris Mason 7384313b399SChris Mason btrfs_copy_pinned(root, pinned_copy); 739ccd467d6SChris Mason 74078fae27eSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 74179154b1bSChris Mason ret = btrfs_write_and_wait_transaction(trans, root); 74279154b1bSChris Mason BUG_ON(ret); 74379154b1bSChris Mason write_ctree_super(trans, root); 7444313b399SChris Mason 7454313b399SChris Mason btrfs_finish_extent_commit(trans, root, pinned_copy); 74678fae27eSChris Mason mutex_lock(&root->fs_info->trans_mutex); 7474313b399SChris Mason 7484313b399SChris Mason kfree(pinned_copy); 7494313b399SChris Mason 7502c90e5d6SChris Mason cur_trans->commit_done = 1; 75189ce8a63SChris Mason printk("trans %Lu done in commit\n", cur_trans->transid); 75215ee9bc7SJosef Bacik root->fs_info->last_trans_committed = cur_trans->transid; 7532c90e5d6SChris Mason wake_up(&cur_trans->commit_wait); 75479154b1bSChris Mason put_transaction(cur_trans); 75578fae27eSChris Mason put_transaction(cur_trans); 75658176a96SJosef Bacik 757facda1e7SChris Mason if (root->fs_info->closing) 758facda1e7SChris Mason list_splice_init(&root->fs_info->dead_roots, &dirty_fs_roots); 759facda1e7SChris Mason else 760facda1e7SChris Mason list_splice_init(&dirty_fs_roots, &root->fs_info->dead_roots); 76158176a96SJosef Bacik 76278fae27eSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 7632c90e5d6SChris Mason kmem_cache_free(btrfs_trans_handle_cachep, trans); 76479154b1bSChris Mason 765facda1e7SChris Mason if (root->fs_info->closing) { 7660f7d52f4SChris Mason drop_dirty_roots(root->fs_info->tree_root, &dirty_fs_roots); 767facda1e7SChris Mason } 76879154b1bSChris Mason return ret; 76979154b1bSChris Mason } 77079154b1bSChris Mason 771e9d0b13bSChris Mason int btrfs_clean_old_snapshots(struct btrfs_root *root) 772e9d0b13bSChris Mason { 773e9d0b13bSChris Mason struct list_head dirty_roots; 774e9d0b13bSChris Mason INIT_LIST_HEAD(&dirty_roots); 775a74a4b97SChris Mason again: 776e9d0b13bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 777e9d0b13bSChris Mason list_splice_init(&root->fs_info->dead_roots, &dirty_roots); 778e9d0b13bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 779e9d0b13bSChris Mason 780e9d0b13bSChris Mason if (!list_empty(&dirty_roots)) { 781e9d0b13bSChris Mason drop_dirty_roots(root, &dirty_roots); 782a74a4b97SChris Mason goto again; 783e9d0b13bSChris Mason } 784e9d0b13bSChris Mason return 0; 785e9d0b13bSChris Mason } 78608607c1bSChris Mason 787