16cbd5570SChris Mason /* 26cbd5570SChris Mason * Copyright (C) 2007 Oracle. All rights reserved. 36cbd5570SChris Mason * 46cbd5570SChris Mason * This program is free software; you can redistribute it and/or 56cbd5570SChris Mason * modify it under the terms of the GNU General Public 66cbd5570SChris Mason * License v2 as published by the Free Software Foundation. 76cbd5570SChris Mason * 86cbd5570SChris Mason * This program is distributed in the hope that it will be useful, 96cbd5570SChris Mason * but WITHOUT ANY WARRANTY; without even the implied warranty of 106cbd5570SChris Mason * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 116cbd5570SChris Mason * General Public License for more details. 126cbd5570SChris Mason * 136cbd5570SChris Mason * You should have received a copy of the GNU General Public 146cbd5570SChris Mason * License along with this program; if not, write to the 156cbd5570SChris Mason * Free Software Foundation, Inc., 59 Temple Place - Suite 330, 166cbd5570SChris Mason * Boston, MA 021110-1307, USA. 176cbd5570SChris Mason */ 186cbd5570SChris Mason 1979154b1bSChris Mason #include <linux/fs.h> 2034088780SChris Mason #include <linux/sched.h> 2179154b1bSChris Mason #include "ctree.h" 2279154b1bSChris Mason #include "disk-io.h" 2379154b1bSChris Mason #include "transaction.h" 2479154b1bSChris Mason 2578fae27eSChris Mason static int total_trans = 0; 262c90e5d6SChris Mason extern struct kmem_cache *btrfs_trans_handle_cachep; 272c90e5d6SChris Mason extern struct kmem_cache *btrfs_transaction_cachep; 282c90e5d6SChris Mason 2908607c1bSChris Mason static struct workqueue_struct *trans_wq; 3008607c1bSChris Mason 310f7d52f4SChris Mason #define BTRFS_ROOT_TRANS_TAG 0 32*6702ed49SChris Mason #define BTRFS_ROOT_DEFRAG_TAG 1 330f7d52f4SChris Mason 3479154b1bSChris Mason static void put_transaction(struct btrfs_transaction *transaction) 3579154b1bSChris Mason { 362c90e5d6SChris Mason WARN_ON(transaction->use_count == 0); 3779154b1bSChris Mason transaction->use_count--; 3878fae27eSChris Mason if (transaction->use_count == 0) { 3978fae27eSChris Mason WARN_ON(total_trans == 0); 4078fae27eSChris Mason total_trans--; 418fd17795SChris Mason list_del_init(&transaction->list); 422c90e5d6SChris Mason memset(transaction, 0, sizeof(*transaction)); 432c90e5d6SChris Mason kmem_cache_free(btrfs_transaction_cachep, transaction); 4479154b1bSChris Mason } 4578fae27eSChris Mason } 4679154b1bSChris Mason 4779154b1bSChris Mason static int join_transaction(struct btrfs_root *root) 4879154b1bSChris Mason { 4979154b1bSChris Mason struct btrfs_transaction *cur_trans; 5079154b1bSChris Mason cur_trans = root->fs_info->running_transaction; 5179154b1bSChris Mason if (!cur_trans) { 522c90e5d6SChris Mason cur_trans = kmem_cache_alloc(btrfs_transaction_cachep, 532c90e5d6SChris Mason GFP_NOFS); 5478fae27eSChris Mason total_trans++; 5579154b1bSChris Mason BUG_ON(!cur_trans); 560f7d52f4SChris Mason root->fs_info->generation++; 5779154b1bSChris Mason root->fs_info->running_transaction = cur_trans; 5879154b1bSChris Mason cur_trans->num_writers = 0; 590f7d52f4SChris Mason cur_trans->transid = root->fs_info->generation; 6079154b1bSChris Mason init_waitqueue_head(&cur_trans->writer_wait); 6179154b1bSChris Mason init_waitqueue_head(&cur_trans->commit_wait); 6279154b1bSChris Mason cur_trans->in_commit = 0; 63d5719762SChris Mason cur_trans->use_count = 1; 6479154b1bSChris Mason cur_trans->commit_done = 0; 6508607c1bSChris Mason cur_trans->start_time = get_seconds(); 668fd17795SChris Mason list_add_tail(&cur_trans->list, &root->fs_info->trans_list); 677c4452b9SChris Mason init_bit_radix(&cur_trans->dirty_pages); 6879154b1bSChris Mason } 6979154b1bSChris Mason cur_trans->num_writers++; 7079154b1bSChris Mason return 0; 7179154b1bSChris Mason } 7279154b1bSChris Mason 73*6702ed49SChris Mason static int record_root_in_trans(struct btrfs_root *root) 74*6702ed49SChris Mason { 75*6702ed49SChris Mason u64 running_trans_id = root->fs_info->running_transaction->transid; 76*6702ed49SChris Mason if (root->ref_cows && root->last_trans < running_trans_id) { 77*6702ed49SChris Mason WARN_ON(root == root->fs_info->extent_root); 78*6702ed49SChris Mason if (root->root_item.refs != 0) { 79*6702ed49SChris Mason radix_tree_tag_set(&root->fs_info->fs_roots_radix, 80*6702ed49SChris Mason (unsigned long)root->root_key.objectid, 81*6702ed49SChris Mason BTRFS_ROOT_TRANS_TAG); 82*6702ed49SChris Mason radix_tree_tag_set(&root->fs_info->fs_roots_radix, 83*6702ed49SChris Mason (unsigned long)root->root_key.objectid, 84*6702ed49SChris Mason BTRFS_ROOT_DEFRAG_TAG); 85*6702ed49SChris Mason root->commit_root = root->node; 86*6702ed49SChris Mason get_bh(root->node); 87*6702ed49SChris Mason } else { 88*6702ed49SChris Mason WARN_ON(1); 89*6702ed49SChris Mason } 90*6702ed49SChris Mason root->last_trans = running_trans_id; 91*6702ed49SChris Mason } 92*6702ed49SChris Mason return 0; 93*6702ed49SChris Mason } 94*6702ed49SChris Mason 9579154b1bSChris Mason struct btrfs_trans_handle *btrfs_start_transaction(struct btrfs_root *root, 9679154b1bSChris Mason int num_blocks) 9779154b1bSChris Mason { 982c90e5d6SChris Mason struct btrfs_trans_handle *h = 992c90e5d6SChris Mason kmem_cache_alloc(btrfs_trans_handle_cachep, GFP_NOFS); 10079154b1bSChris Mason int ret; 10179154b1bSChris Mason 10279154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 10379154b1bSChris Mason ret = join_transaction(root); 10479154b1bSChris Mason BUG_ON(ret); 1050f7d52f4SChris Mason 106*6702ed49SChris Mason record_root_in_trans(root); 107*6702ed49SChris Mason h->transid = root->fs_info->running_transaction->transid; 10879154b1bSChris Mason h->transaction = root->fs_info->running_transaction; 10979154b1bSChris Mason h->blocks_reserved = num_blocks; 11079154b1bSChris Mason h->blocks_used = 0; 11131f3c99bSChris Mason h->block_group = NULL; 11279154b1bSChris Mason root->fs_info->running_transaction->use_count++; 11379154b1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 11479154b1bSChris Mason return h; 11579154b1bSChris Mason } 11679154b1bSChris Mason 11779154b1bSChris Mason int btrfs_end_transaction(struct btrfs_trans_handle *trans, 11879154b1bSChris Mason struct btrfs_root *root) 11979154b1bSChris Mason { 12079154b1bSChris Mason struct btrfs_transaction *cur_trans; 121d6e4a428SChris Mason 12279154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 12379154b1bSChris Mason cur_trans = root->fs_info->running_transaction; 124ccd467d6SChris Mason WARN_ON(cur_trans != trans->transaction); 125d5719762SChris Mason WARN_ON(cur_trans->num_writers < 1); 126ccd467d6SChris Mason cur_trans->num_writers--; 12779154b1bSChris Mason if (waitqueue_active(&cur_trans->writer_wait)) 12879154b1bSChris Mason wake_up(&cur_trans->writer_wait); 12979154b1bSChris Mason put_transaction(cur_trans); 13079154b1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 131d6025579SChris Mason memset(trans, 0, sizeof(*trans)); 1322c90e5d6SChris Mason kmem_cache_free(btrfs_trans_handle_cachep, trans); 13379154b1bSChris Mason return 0; 13479154b1bSChris Mason } 13579154b1bSChris Mason 13679154b1bSChris Mason 13779154b1bSChris Mason int btrfs_write_and_wait_transaction(struct btrfs_trans_handle *trans, 13879154b1bSChris Mason struct btrfs_root *root) 13979154b1bSChris Mason { 1407c4452b9SChris Mason unsigned long gang[16]; 1417c4452b9SChris Mason int ret; 1427c4452b9SChris Mason int i; 1437c4452b9SChris Mason int err; 1447c4452b9SChris Mason int werr = 0; 1457c4452b9SChris Mason struct page *page; 1467c4452b9SChris Mason struct radix_tree_root *dirty_pages; 1477c4452b9SChris Mason struct inode *btree_inode = root->fs_info->btree_inode; 1487c4452b9SChris Mason 1497c4452b9SChris Mason if (!trans || !trans->transaction) { 1507c4452b9SChris Mason return filemap_write_and_wait(btree_inode->i_mapping); 1517c4452b9SChris Mason } 1527c4452b9SChris Mason dirty_pages = &trans->transaction->dirty_pages; 1537c4452b9SChris Mason while(1) { 154e37c9e69SChris Mason ret = find_first_radix_bit(dirty_pages, gang, 155e37c9e69SChris Mason 0, ARRAY_SIZE(gang)); 1567c4452b9SChris Mason if (!ret) 1577c4452b9SChris Mason break; 1587c4452b9SChris Mason for (i = 0; i < ret; i++) { 1597c4452b9SChris Mason /* FIXME EIO */ 1607c4452b9SChris Mason clear_radix_bit(dirty_pages, gang[i]); 1617c4452b9SChris Mason page = find_lock_page(btree_inode->i_mapping, 1627c4452b9SChris Mason gang[i]); 1637c4452b9SChris Mason if (!page) 1647c4452b9SChris Mason continue; 165*6702ed49SChris Mason if (PageWriteback(page)) { 166*6702ed49SChris Mason if (PageDirty(page)) 167*6702ed49SChris Mason wait_on_page_writeback(page); 168*6702ed49SChris Mason else { 169*6702ed49SChris Mason unlock_page(page); 170*6702ed49SChris Mason page_cache_release(page); 171*6702ed49SChris Mason continue; 172*6702ed49SChris Mason } 173*6702ed49SChris Mason } 1747c4452b9SChris Mason err = write_one_page(page, 0); 1757c4452b9SChris Mason if (err) 1767c4452b9SChris Mason werr = err; 1777c4452b9SChris Mason page_cache_release(page); 1787c4452b9SChris Mason } 1797c4452b9SChris Mason } 1807c4452b9SChris Mason err = filemap_fdatawait(btree_inode->i_mapping); 1817c4452b9SChris Mason if (err) 1827c4452b9SChris Mason werr = err; 1837c4452b9SChris Mason return werr; 18479154b1bSChris Mason } 18579154b1bSChris Mason 18679154b1bSChris Mason int btrfs_commit_tree_roots(struct btrfs_trans_handle *trans, 18779154b1bSChris Mason struct btrfs_root *root) 18879154b1bSChris Mason { 18979154b1bSChris Mason int ret; 19079154b1bSChris Mason u64 old_extent_block; 19179154b1bSChris Mason struct btrfs_fs_info *fs_info = root->fs_info; 19279154b1bSChris Mason struct btrfs_root *tree_root = fs_info->tree_root; 19379154b1bSChris Mason struct btrfs_root *extent_root = fs_info->extent_root; 19479154b1bSChris Mason 1959078a3e1SChris Mason btrfs_write_dirty_block_groups(trans, extent_root); 19679154b1bSChris Mason while(1) { 19779154b1bSChris Mason old_extent_block = btrfs_root_blocknr(&extent_root->root_item); 1987eccb903SChris Mason if (old_extent_block == bh_blocknr(extent_root->node)) 19979154b1bSChris Mason break; 20079154b1bSChris Mason btrfs_set_root_blocknr(&extent_root->root_item, 2017eccb903SChris Mason bh_blocknr(extent_root->node)); 20279154b1bSChris Mason ret = btrfs_update_root(trans, tree_root, 20379154b1bSChris Mason &extent_root->root_key, 20479154b1bSChris Mason &extent_root->root_item); 20579154b1bSChris Mason BUG_ON(ret); 2069078a3e1SChris Mason btrfs_write_dirty_block_groups(trans, extent_root); 20779154b1bSChris Mason } 20879154b1bSChris Mason return 0; 20979154b1bSChris Mason } 21079154b1bSChris Mason 21179154b1bSChris Mason static int wait_for_commit(struct btrfs_root *root, 21279154b1bSChris Mason struct btrfs_transaction *commit) 21379154b1bSChris Mason { 21479154b1bSChris Mason DEFINE_WAIT(wait); 215ccd467d6SChris Mason mutex_lock(&root->fs_info->trans_mutex); 21679154b1bSChris Mason while(!commit->commit_done) { 21779154b1bSChris Mason prepare_to_wait(&commit->commit_wait, &wait, 21879154b1bSChris Mason TASK_UNINTERRUPTIBLE); 21979154b1bSChris Mason if (commit->commit_done) 22079154b1bSChris Mason break; 22179154b1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 22279154b1bSChris Mason schedule(); 22379154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 22479154b1bSChris Mason } 225ccd467d6SChris Mason mutex_unlock(&root->fs_info->trans_mutex); 22679154b1bSChris Mason finish_wait(&commit->commit_wait, &wait); 22779154b1bSChris Mason return 0; 22879154b1bSChris Mason } 22979154b1bSChris Mason 2300f7d52f4SChris Mason struct dirty_root { 2310f7d52f4SChris Mason struct list_head list; 2320f7d52f4SChris Mason struct btrfs_root *root; 2330f7d52f4SChris Mason }; 2340f7d52f4SChris Mason 2355eda7b5eSChris Mason int btrfs_add_dead_root(struct btrfs_root *root, struct list_head *dead_list) 2365eda7b5eSChris Mason { 2375eda7b5eSChris Mason struct dirty_root *dirty; 2385eda7b5eSChris Mason 2395eda7b5eSChris Mason dirty = kmalloc(sizeof(*dirty), GFP_NOFS); 2405eda7b5eSChris Mason if (!dirty) 2415eda7b5eSChris Mason return -ENOMEM; 2425eda7b5eSChris Mason dirty->root = root; 2435eda7b5eSChris Mason list_add(&dirty->list, dead_list); 2445eda7b5eSChris Mason return 0; 2455eda7b5eSChris Mason } 2465eda7b5eSChris Mason 24735b7e476SChris Mason static int add_dirty_roots(struct btrfs_trans_handle *trans, 24835b7e476SChris Mason struct radix_tree_root *radix, 24935b7e476SChris Mason struct list_head *list) 2500f7d52f4SChris Mason { 2510f7d52f4SChris Mason struct dirty_root *dirty; 2520f7d52f4SChris Mason struct btrfs_root *gang[8]; 2530f7d52f4SChris Mason struct btrfs_root *root; 2540f7d52f4SChris Mason int i; 2550f7d52f4SChris Mason int ret; 25654aa1f4dSChris Mason int err = 0; 2575eda7b5eSChris Mason u32 refs; 25854aa1f4dSChris Mason 2590f7d52f4SChris Mason while(1) { 2600f7d52f4SChris Mason ret = radix_tree_gang_lookup_tag(radix, (void **)gang, 0, 2610f7d52f4SChris Mason ARRAY_SIZE(gang), 2620f7d52f4SChris Mason BTRFS_ROOT_TRANS_TAG); 2630f7d52f4SChris Mason if (ret == 0) 2640f7d52f4SChris Mason break; 2650f7d52f4SChris Mason for (i = 0; i < ret; i++) { 2660f7d52f4SChris Mason root = gang[i]; 2672619ba1fSChris Mason radix_tree_tag_clear(radix, 2682619ba1fSChris Mason (unsigned long)root->root_key.objectid, 2690f7d52f4SChris Mason BTRFS_ROOT_TRANS_TAG); 2700f7d52f4SChris Mason if (root->commit_root == root->node) { 2717eccb903SChris Mason WARN_ON(bh_blocknr(root->node) != 2720f7d52f4SChris Mason btrfs_root_blocknr(&root->root_item)); 2730f7d52f4SChris Mason brelse(root->commit_root); 2740f7d52f4SChris Mason root->commit_root = NULL; 2750f7d52f4SChris Mason continue; 2760f7d52f4SChris Mason } 2770f7d52f4SChris Mason dirty = kmalloc(sizeof(*dirty), GFP_NOFS); 2780f7d52f4SChris Mason BUG_ON(!dirty); 2799f3a7427SChris Mason dirty->root = kmalloc(sizeof(*dirty->root), GFP_NOFS); 2809f3a7427SChris Mason BUG_ON(!dirty->root); 2819f3a7427SChris Mason 2829f3a7427SChris Mason memset(&root->root_item.drop_progress, 0, 2839f3a7427SChris Mason sizeof(struct btrfs_disk_key)); 2849f3a7427SChris Mason root->root_item.drop_level = 0; 2859f3a7427SChris Mason 2869f3a7427SChris Mason memcpy(dirty->root, root, sizeof(*root)); 2879f3a7427SChris Mason dirty->root->node = root->commit_root; 2880f7d52f4SChris Mason root->commit_root = NULL; 2895eda7b5eSChris Mason 2900f7d52f4SChris Mason root->root_key.offset = root->fs_info->generation; 2910f7d52f4SChris Mason btrfs_set_root_blocknr(&root->root_item, 2927eccb903SChris Mason bh_blocknr(root->node)); 2930f7d52f4SChris Mason err = btrfs_insert_root(trans, root->fs_info->tree_root, 2940f7d52f4SChris Mason &root->root_key, 2950f7d52f4SChris Mason &root->root_item); 29654aa1f4dSChris Mason if (err) 29754aa1f4dSChris Mason break; 2989f3a7427SChris Mason 2999f3a7427SChris Mason refs = btrfs_root_refs(&dirty->root->root_item); 3009f3a7427SChris Mason btrfs_set_root_refs(&dirty->root->root_item, refs - 1); 3015eda7b5eSChris Mason err = btrfs_update_root(trans, root->fs_info->tree_root, 3029f3a7427SChris Mason &dirty->root->root_key, 3039f3a7427SChris Mason &dirty->root->root_item); 3045eda7b5eSChris Mason 3055eda7b5eSChris Mason BUG_ON(err); 3069f3a7427SChris Mason if (refs == 1) { 3070f7d52f4SChris Mason list_add(&dirty->list, list); 3089f3a7427SChris Mason } else { 3099f3a7427SChris Mason WARN_ON(1); 3109f3a7427SChris Mason kfree(dirty->root); 3115eda7b5eSChris Mason kfree(dirty); 3120f7d52f4SChris Mason } 3130f7d52f4SChris Mason } 3149f3a7427SChris Mason } 31554aa1f4dSChris Mason return err; 3160f7d52f4SChris Mason } 3170f7d52f4SChris Mason 318*6702ed49SChris Mason int btrfs_defrag_dirty_roots(struct btrfs_fs_info *info) 319*6702ed49SChris Mason { 320*6702ed49SChris Mason struct btrfs_root *gang[1]; 321*6702ed49SChris Mason struct btrfs_root *root; 322*6702ed49SChris Mason struct btrfs_root *tree_root = info->tree_root; 323*6702ed49SChris Mason struct btrfs_trans_handle *trans; 324*6702ed49SChris Mason int i; 325*6702ed49SChris Mason int ret; 326*6702ed49SChris Mason int err = 0; 327*6702ed49SChris Mason u64 last = 0; 328*6702ed49SChris Mason 329*6702ed49SChris Mason trans = btrfs_start_transaction(tree_root, 1); 330*6702ed49SChris Mason while(1) { 331*6702ed49SChris Mason ret = radix_tree_gang_lookup_tag(&info->fs_roots_radix, 332*6702ed49SChris Mason (void **)gang, last, 333*6702ed49SChris Mason ARRAY_SIZE(gang), 334*6702ed49SChris Mason BTRFS_ROOT_DEFRAG_TAG); 335*6702ed49SChris Mason if (ret == 0) 336*6702ed49SChris Mason break; 337*6702ed49SChris Mason for (i = 0; i < ret; i++) { 338*6702ed49SChris Mason root = gang[i]; 339*6702ed49SChris Mason last = root->root_key.objectid + 1; 340*6702ed49SChris Mason radix_tree_tag_clear(&info->fs_roots_radix, 341*6702ed49SChris Mason (unsigned long)root->root_key.objectid, 342*6702ed49SChris Mason BTRFS_ROOT_DEFRAG_TAG); 343*6702ed49SChris Mason if (root->defrag_running) 344*6702ed49SChris Mason continue; 345*6702ed49SChris Mason 346*6702ed49SChris Mason while (1) { 347*6702ed49SChris Mason mutex_lock(&root->fs_info->trans_mutex); 348*6702ed49SChris Mason record_root_in_trans(root); 349*6702ed49SChris Mason mutex_unlock(&root->fs_info->trans_mutex); 350*6702ed49SChris Mason 351*6702ed49SChris Mason root->defrag_running = 1; 352*6702ed49SChris Mason err = btrfs_defrag_leaves(trans, root, 1); 353*6702ed49SChris Mason btrfs_end_transaction(trans, tree_root); 354*6702ed49SChris Mason mutex_unlock(&info->fs_mutex); 355*6702ed49SChris Mason 356*6702ed49SChris Mason btrfs_btree_balance_dirty(root); 357*6702ed49SChris Mason 358*6702ed49SChris Mason mutex_lock(&info->fs_mutex); 359*6702ed49SChris Mason trans = btrfs_start_transaction(tree_root, 1); 360*6702ed49SChris Mason if (err != -EAGAIN) 361*6702ed49SChris Mason break; 362*6702ed49SChris Mason } 363*6702ed49SChris Mason root->defrag_running = 0; 364*6702ed49SChris Mason } 365*6702ed49SChris Mason } 366*6702ed49SChris Mason btrfs_end_transaction(trans, tree_root); 367*6702ed49SChris Mason return err; 368*6702ed49SChris Mason } 369*6702ed49SChris Mason 37035b7e476SChris Mason static int drop_dirty_roots(struct btrfs_root *tree_root, 37135b7e476SChris Mason struct list_head *list) 3720f7d52f4SChris Mason { 3730f7d52f4SChris Mason struct dirty_root *dirty; 3740f7d52f4SChris Mason struct btrfs_trans_handle *trans; 37554aa1f4dSChris Mason int ret = 0; 3769f3a7427SChris Mason int err; 3779f3a7427SChris Mason 3780f7d52f4SChris Mason while(!list_empty(list)) { 379facda1e7SChris Mason mutex_lock(&tree_root->fs_info->fs_mutex); 3800f7d52f4SChris Mason dirty = list_entry(list->next, struct dirty_root, list); 3810f7d52f4SChris Mason list_del_init(&dirty->list); 3825eda7b5eSChris Mason 3839f3a7427SChris Mason while(1) { 3840f7d52f4SChris Mason trans = btrfs_start_transaction(tree_root, 1); 3859f3a7427SChris Mason ret = btrfs_drop_snapshot(trans, dirty->root); 3869f3a7427SChris Mason if (ret != -EAGAIN) { 3879f3a7427SChris Mason break; 3889f3a7427SChris Mason } 3899f3a7427SChris Mason err = btrfs_update_root(trans, 3909f3a7427SChris Mason tree_root, 3919f3a7427SChris Mason &dirty->root->root_key, 3929f3a7427SChris Mason &dirty->root->root_item); 3939f3a7427SChris Mason if (err) 3949f3a7427SChris Mason ret = err; 3959f3a7427SChris Mason ret = btrfs_end_transaction(trans, tree_root); 3960f7d52f4SChris Mason BUG_ON(ret); 3979f3a7427SChris Mason } 3989f3a7427SChris Mason BUG_ON(ret); 3999f3a7427SChris Mason ret = btrfs_del_root(trans, tree_root, &dirty->root->root_key); 40054aa1f4dSChris Mason if (ret) 40154aa1f4dSChris Mason break; 4020f7d52f4SChris Mason ret = btrfs_end_transaction(trans, tree_root); 4030f7d52f4SChris Mason BUG_ON(ret); 4045eda7b5eSChris Mason 4055eda7b5eSChris Mason kfree(dirty->root); 4060f7d52f4SChris Mason kfree(dirty); 407facda1e7SChris Mason mutex_unlock(&tree_root->fs_info->fs_mutex); 4088c2383c3SChris Mason btrfs_btree_balance_dirty(tree_root); 4090f7d52f4SChris Mason } 41054aa1f4dSChris Mason return ret; 4110f7d52f4SChris Mason } 4120f7d52f4SChris Mason 41379154b1bSChris Mason int btrfs_commit_transaction(struct btrfs_trans_handle *trans, 41479154b1bSChris Mason struct btrfs_root *root) 41579154b1bSChris Mason { 41679154b1bSChris Mason int ret = 0; 41779154b1bSChris Mason struct btrfs_transaction *cur_trans; 4188fd17795SChris Mason struct btrfs_transaction *prev_trans = NULL; 4190f7d52f4SChris Mason struct list_head dirty_fs_roots; 420ccd467d6SChris Mason struct radix_tree_root pinned_copy; 42179154b1bSChris Mason DEFINE_WAIT(wait); 42279154b1bSChris Mason 423ccd467d6SChris Mason init_bit_radix(&pinned_copy); 4240f7d52f4SChris Mason INIT_LIST_HEAD(&dirty_fs_roots); 425d6e4a428SChris Mason 42679154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 42779154b1bSChris Mason if (trans->transaction->in_commit) { 42879154b1bSChris Mason cur_trans = trans->transaction; 42979154b1bSChris Mason trans->transaction->use_count++; 430ccd467d6SChris Mason mutex_unlock(&root->fs_info->trans_mutex); 43179154b1bSChris Mason btrfs_end_transaction(trans, root); 432ccd467d6SChris Mason 433ccd467d6SChris Mason mutex_unlock(&root->fs_info->fs_mutex); 43479154b1bSChris Mason ret = wait_for_commit(root, cur_trans); 43579154b1bSChris Mason BUG_ON(ret); 43679154b1bSChris Mason put_transaction(cur_trans); 437ccd467d6SChris Mason mutex_lock(&root->fs_info->fs_mutex); 43879154b1bSChris Mason return 0; 43979154b1bSChris Mason } 4402c90e5d6SChris Mason trans->transaction->in_commit = 1; 441ccd467d6SChris Mason cur_trans = trans->transaction; 442ccd467d6SChris Mason if (cur_trans->list.prev != &root->fs_info->trans_list) { 443ccd467d6SChris Mason prev_trans = list_entry(cur_trans->list.prev, 444ccd467d6SChris Mason struct btrfs_transaction, list); 445ccd467d6SChris Mason if (!prev_trans->commit_done) { 446ccd467d6SChris Mason prev_trans->use_count++; 447ccd467d6SChris Mason mutex_unlock(&root->fs_info->fs_mutex); 448ccd467d6SChris Mason mutex_unlock(&root->fs_info->trans_mutex); 449ccd467d6SChris Mason 450ccd467d6SChris Mason wait_for_commit(root, prev_trans); 451ccd467d6SChris Mason put_transaction(prev_trans); 452ccd467d6SChris Mason 453ccd467d6SChris Mason mutex_lock(&root->fs_info->fs_mutex); 454ccd467d6SChris Mason mutex_lock(&root->fs_info->trans_mutex); 455ccd467d6SChris Mason } 456ccd467d6SChris Mason } 45779154b1bSChris Mason while (trans->transaction->num_writers > 1) { 4582c90e5d6SChris Mason WARN_ON(cur_trans != trans->transaction); 45979154b1bSChris Mason prepare_to_wait(&trans->transaction->writer_wait, &wait, 46079154b1bSChris Mason TASK_UNINTERRUPTIBLE); 46179154b1bSChris Mason if (trans->transaction->num_writers <= 1) 46279154b1bSChris Mason break; 463ccd467d6SChris Mason mutex_unlock(&root->fs_info->fs_mutex); 46479154b1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 46579154b1bSChris Mason schedule(); 466ccd467d6SChris Mason mutex_lock(&root->fs_info->fs_mutex); 46779154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 4682c90e5d6SChris Mason finish_wait(&trans->transaction->writer_wait, &wait); 46979154b1bSChris Mason } 47079154b1bSChris Mason finish_wait(&trans->transaction->writer_wait, &wait); 4712c90e5d6SChris Mason WARN_ON(cur_trans != trans->transaction); 47254aa1f4dSChris Mason ret = add_dirty_roots(trans, &root->fs_info->fs_roots_radix, 47354aa1f4dSChris Mason &dirty_fs_roots); 47454aa1f4dSChris Mason BUG_ON(ret); 47554aa1f4dSChris Mason 47679154b1bSChris Mason ret = btrfs_commit_tree_roots(trans, root); 47779154b1bSChris Mason BUG_ON(ret); 47854aa1f4dSChris Mason 47978fae27eSChris Mason cur_trans = root->fs_info->running_transaction; 48078fae27eSChris Mason root->fs_info->running_transaction = NULL; 4814b52dff6SChris Mason btrfs_set_super_generation(&root->fs_info->super_copy, 4824b52dff6SChris Mason cur_trans->transid); 4834b52dff6SChris Mason btrfs_set_super_root(&root->fs_info->super_copy, 4844b52dff6SChris Mason bh_blocknr(root->fs_info->tree_root->node)); 4854b52dff6SChris Mason memcpy(root->fs_info->disk_super, &root->fs_info->super_copy, 4864b52dff6SChris Mason sizeof(root->fs_info->super_copy)); 487ccd467d6SChris Mason 488ccd467d6SChris Mason btrfs_copy_pinned(root, &pinned_copy); 489ccd467d6SChris Mason 49078fae27eSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 4918fd17795SChris Mason mutex_unlock(&root->fs_info->fs_mutex); 49279154b1bSChris Mason ret = btrfs_write_and_wait_transaction(trans, root); 49379154b1bSChris Mason BUG_ON(ret); 49479154b1bSChris Mason write_ctree_super(trans, root); 4958fd17795SChris Mason mutex_lock(&root->fs_info->fs_mutex); 496ccd467d6SChris Mason btrfs_finish_extent_commit(trans, root, &pinned_copy); 49778fae27eSChris Mason mutex_lock(&root->fs_info->trans_mutex); 4982c90e5d6SChris Mason cur_trans->commit_done = 1; 4992c90e5d6SChris Mason wake_up(&cur_trans->commit_wait); 50079154b1bSChris Mason put_transaction(cur_trans); 50178fae27eSChris Mason put_transaction(cur_trans); 502facda1e7SChris Mason if (root->fs_info->closing) 503facda1e7SChris Mason list_splice_init(&root->fs_info->dead_roots, &dirty_fs_roots); 504facda1e7SChris Mason else 505facda1e7SChris Mason list_splice_init(&dirty_fs_roots, &root->fs_info->dead_roots); 50678fae27eSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 5072c90e5d6SChris Mason kmem_cache_free(btrfs_trans_handle_cachep, trans); 50879154b1bSChris Mason 509facda1e7SChris Mason if (root->fs_info->closing) { 510facda1e7SChris Mason mutex_unlock(&root->fs_info->fs_mutex); 5110f7d52f4SChris Mason drop_dirty_roots(root->fs_info->tree_root, &dirty_fs_roots); 512facda1e7SChris Mason mutex_lock(&root->fs_info->fs_mutex); 513facda1e7SChris Mason } 51479154b1bSChris Mason return ret; 51579154b1bSChris Mason } 51679154b1bSChris Mason 51708607c1bSChris Mason void btrfs_transaction_cleaner(struct work_struct *work) 51808607c1bSChris Mason { 51908607c1bSChris Mason struct btrfs_fs_info *fs_info = container_of(work, 52008607c1bSChris Mason struct btrfs_fs_info, 52108607c1bSChris Mason trans_work.work); 52208607c1bSChris Mason 52308607c1bSChris Mason struct btrfs_root *root = fs_info->tree_root; 52408607c1bSChris Mason struct btrfs_transaction *cur; 52508607c1bSChris Mason struct btrfs_trans_handle *trans; 526facda1e7SChris Mason struct list_head dirty_roots; 52708607c1bSChris Mason unsigned long now; 52808607c1bSChris Mason unsigned long delay = HZ * 30; 52908607c1bSChris Mason int ret; 53008607c1bSChris Mason 531facda1e7SChris Mason INIT_LIST_HEAD(&dirty_roots); 53208607c1bSChris Mason mutex_lock(&root->fs_info->fs_mutex); 53308607c1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 53408607c1bSChris Mason cur = root->fs_info->running_transaction; 53508607c1bSChris Mason if (!cur) { 53608607c1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 53708607c1bSChris Mason goto out; 53808607c1bSChris Mason } 53908607c1bSChris Mason now = get_seconds(); 54008607c1bSChris Mason if (now < cur->start_time || now - cur->start_time < 30) { 54108607c1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 54208607c1bSChris Mason delay = HZ * 5; 54308607c1bSChris Mason goto out; 54408607c1bSChris Mason } 54508607c1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 546*6702ed49SChris Mason btrfs_defrag_dirty_roots(root->fs_info); 54708607c1bSChris Mason trans = btrfs_start_transaction(root, 1); 54808607c1bSChris Mason ret = btrfs_commit_transaction(trans, root); 54908607c1bSChris Mason out: 55008607c1bSChris Mason mutex_unlock(&root->fs_info->fs_mutex); 551ad693af6SChris Mason 552ad693af6SChris Mason mutex_lock(&root->fs_info->trans_mutex); 553ad693af6SChris Mason list_splice_init(&root->fs_info->dead_roots, &dirty_roots); 554ad693af6SChris Mason mutex_unlock(&root->fs_info->trans_mutex); 555ad693af6SChris Mason 556ad693af6SChris Mason if (!list_empty(&dirty_roots)) { 557ad693af6SChris Mason drop_dirty_roots(root, &dirty_roots); 558ad693af6SChris Mason } 55908607c1bSChris Mason btrfs_transaction_queue_work(root, delay); 56008607c1bSChris Mason } 56108607c1bSChris Mason 56208607c1bSChris Mason void btrfs_transaction_queue_work(struct btrfs_root *root, int delay) 56308607c1bSChris Mason { 56408607c1bSChris Mason queue_delayed_work(trans_wq, &root->fs_info->trans_work, delay); 56508607c1bSChris Mason } 56608607c1bSChris Mason 56708607c1bSChris Mason void btrfs_transaction_flush_work(struct btrfs_root *root) 56808607c1bSChris Mason { 56908607c1bSChris Mason cancel_rearming_delayed_workqueue(trans_wq, &root->fs_info->trans_work); 57008607c1bSChris Mason flush_workqueue(trans_wq); 57108607c1bSChris Mason } 57208607c1bSChris Mason 57308607c1bSChris Mason void __init btrfs_init_transaction_sys(void) 57408607c1bSChris Mason { 57508607c1bSChris Mason trans_wq = create_workqueue("btrfs"); 57608607c1bSChris Mason } 57708607c1bSChris Mason 57808607c1bSChris Mason void __exit btrfs_exit_transaction_sys(void) 57908607c1bSChris Mason { 58008607c1bSChris Mason destroy_workqueue(trans_wq); 58108607c1bSChris Mason } 58208607c1bSChris Mason 583