16cbd5570SChris Mason /* 26cbd5570SChris Mason * Copyright (C) 2007 Oracle. All rights reserved. 36cbd5570SChris Mason * 46cbd5570SChris Mason * This program is free software; you can redistribute it and/or 56cbd5570SChris Mason * modify it under the terms of the GNU General Public 66cbd5570SChris Mason * License v2 as published by the Free Software Foundation. 76cbd5570SChris Mason * 86cbd5570SChris Mason * This program is distributed in the hope that it will be useful, 96cbd5570SChris Mason * but WITHOUT ANY WARRANTY; without even the implied warranty of 106cbd5570SChris Mason * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 116cbd5570SChris Mason * General Public License for more details. 126cbd5570SChris Mason * 136cbd5570SChris Mason * You should have received a copy of the GNU General Public 146cbd5570SChris Mason * License along with this program; if not, write to the 156cbd5570SChris Mason * Free Software Foundation, Inc., 59 Temple Place - Suite 330, 166cbd5570SChris Mason * Boston, MA 021110-1307, USA. 176cbd5570SChris Mason */ 186cbd5570SChris Mason 1979154b1bSChris Mason #include <linux/fs.h> 2034088780SChris Mason #include <linux/sched.h> 21d3c2fdcfSChris Mason #include <linux/writeback.h> 2279154b1bSChris Mason #include "ctree.h" 2379154b1bSChris Mason #include "disk-io.h" 2479154b1bSChris Mason #include "transaction.h" 2579154b1bSChris Mason 2678fae27eSChris Mason static int total_trans = 0; 272c90e5d6SChris Mason extern struct kmem_cache *btrfs_trans_handle_cachep; 282c90e5d6SChris Mason extern struct kmem_cache *btrfs_transaction_cachep; 292c90e5d6SChris Mason 3008607c1bSChris Mason static struct workqueue_struct *trans_wq; 3108607c1bSChris Mason 320f7d52f4SChris Mason #define BTRFS_ROOT_TRANS_TAG 0 336702ed49SChris Mason #define BTRFS_ROOT_DEFRAG_TAG 1 340f7d52f4SChris Mason 3579154b1bSChris Mason static void put_transaction(struct btrfs_transaction *transaction) 3679154b1bSChris Mason { 372c90e5d6SChris Mason WARN_ON(transaction->use_count == 0); 3879154b1bSChris Mason transaction->use_count--; 3978fae27eSChris Mason if (transaction->use_count == 0) { 4078fae27eSChris Mason WARN_ON(total_trans == 0); 4178fae27eSChris Mason total_trans--; 428fd17795SChris Mason list_del_init(&transaction->list); 432c90e5d6SChris Mason memset(transaction, 0, sizeof(*transaction)); 442c90e5d6SChris Mason kmem_cache_free(btrfs_transaction_cachep, transaction); 4579154b1bSChris Mason } 4678fae27eSChris Mason } 4779154b1bSChris Mason 4879154b1bSChris Mason static int join_transaction(struct btrfs_root *root) 4979154b1bSChris Mason { 5079154b1bSChris Mason struct btrfs_transaction *cur_trans; 5179154b1bSChris Mason cur_trans = root->fs_info->running_transaction; 5279154b1bSChris Mason if (!cur_trans) { 532c90e5d6SChris Mason cur_trans = kmem_cache_alloc(btrfs_transaction_cachep, 542c90e5d6SChris Mason GFP_NOFS); 5578fae27eSChris Mason total_trans++; 5679154b1bSChris Mason BUG_ON(!cur_trans); 570f7d52f4SChris Mason root->fs_info->generation++; 5879154b1bSChris Mason root->fs_info->running_transaction = cur_trans; 5915ee9bc7SJosef Bacik cur_trans->num_writers = 1; 6015ee9bc7SJosef Bacik cur_trans->num_joined = 0; 610f7d52f4SChris Mason cur_trans->transid = root->fs_info->generation; 6279154b1bSChris Mason init_waitqueue_head(&cur_trans->writer_wait); 6379154b1bSChris Mason init_waitqueue_head(&cur_trans->commit_wait); 6479154b1bSChris Mason cur_trans->in_commit = 0; 65d5719762SChris Mason cur_trans->use_count = 1; 6679154b1bSChris Mason cur_trans->commit_done = 0; 6708607c1bSChris Mason cur_trans->start_time = get_seconds(); 688fd17795SChris Mason list_add_tail(&cur_trans->list, &root->fs_info->trans_list); 697c4452b9SChris Mason init_bit_radix(&cur_trans->dirty_pages); 7015ee9bc7SJosef Bacik } else { 7179154b1bSChris Mason cur_trans->num_writers++; 7215ee9bc7SJosef Bacik cur_trans->num_joined++; 7315ee9bc7SJosef Bacik } 7415ee9bc7SJosef Bacik 7579154b1bSChris Mason return 0; 7679154b1bSChris Mason } 7779154b1bSChris Mason 786702ed49SChris Mason static int record_root_in_trans(struct btrfs_root *root) 796702ed49SChris Mason { 806702ed49SChris Mason u64 running_trans_id = root->fs_info->running_transaction->transid; 816702ed49SChris Mason if (root->ref_cows && root->last_trans < running_trans_id) { 826702ed49SChris Mason WARN_ON(root == root->fs_info->extent_root); 836702ed49SChris Mason if (root->root_item.refs != 0) { 846702ed49SChris Mason radix_tree_tag_set(&root->fs_info->fs_roots_radix, 856702ed49SChris Mason (unsigned long)root->root_key.objectid, 866702ed49SChris Mason BTRFS_ROOT_TRANS_TAG); 876702ed49SChris Mason radix_tree_tag_set(&root->fs_info->fs_roots_radix, 886702ed49SChris Mason (unsigned long)root->root_key.objectid, 896702ed49SChris Mason BTRFS_ROOT_DEFRAG_TAG); 906702ed49SChris Mason root->commit_root = root->node; 916702ed49SChris Mason get_bh(root->node); 926702ed49SChris Mason } else { 936702ed49SChris Mason WARN_ON(1); 946702ed49SChris Mason } 956702ed49SChris Mason root->last_trans = running_trans_id; 966702ed49SChris Mason } 976702ed49SChris Mason return 0; 986702ed49SChris Mason } 996702ed49SChris Mason 10079154b1bSChris Mason struct btrfs_trans_handle *btrfs_start_transaction(struct btrfs_root *root, 10179154b1bSChris Mason int num_blocks) 10279154b1bSChris Mason { 1032c90e5d6SChris Mason struct btrfs_trans_handle *h = 1042c90e5d6SChris Mason kmem_cache_alloc(btrfs_trans_handle_cachep, GFP_NOFS); 10579154b1bSChris Mason int ret; 10679154b1bSChris Mason 10779154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 10879154b1bSChris Mason ret = join_transaction(root); 10979154b1bSChris Mason BUG_ON(ret); 1100f7d52f4SChris Mason 1116702ed49SChris Mason record_root_in_trans(root); 1126702ed49SChris Mason h->transid = root->fs_info->running_transaction->transid; 11379154b1bSChris Mason h->transaction = root->fs_info->running_transaction; 11479154b1bSChris Mason h->blocks_reserved = num_blocks; 11579154b1bSChris Mason h->blocks_used = 0; 11631f3c99bSChris Mason h->block_group = NULL; 11726b8003fSChris Mason h->alloc_exclude_nr = 0; 11826b8003fSChris Mason h->alloc_exclude_start = 0; 11979154b1bSChris Mason root->fs_info->running_transaction->use_count++; 12079154b1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 12179154b1bSChris Mason return h; 12279154b1bSChris Mason } 12379154b1bSChris Mason 12479154b1bSChris Mason int btrfs_end_transaction(struct btrfs_trans_handle *trans, 12579154b1bSChris Mason struct btrfs_root *root) 12679154b1bSChris Mason { 12779154b1bSChris Mason struct btrfs_transaction *cur_trans; 128d6e4a428SChris Mason 12979154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 13079154b1bSChris Mason cur_trans = root->fs_info->running_transaction; 131ccd467d6SChris Mason WARN_ON(cur_trans != trans->transaction); 132d5719762SChris Mason WARN_ON(cur_trans->num_writers < 1); 133ccd467d6SChris Mason cur_trans->num_writers--; 13479154b1bSChris Mason if (waitqueue_active(&cur_trans->writer_wait)) 13579154b1bSChris Mason wake_up(&cur_trans->writer_wait); 13679154b1bSChris Mason put_transaction(cur_trans); 13779154b1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 138d6025579SChris Mason memset(trans, 0, sizeof(*trans)); 1392c90e5d6SChris Mason kmem_cache_free(btrfs_trans_handle_cachep, trans); 14079154b1bSChris Mason return 0; 14179154b1bSChris Mason } 14279154b1bSChris Mason 14379154b1bSChris Mason 14479154b1bSChris Mason int btrfs_write_and_wait_transaction(struct btrfs_trans_handle *trans, 14579154b1bSChris Mason struct btrfs_root *root) 14679154b1bSChris Mason { 1477c4452b9SChris Mason unsigned long gang[16]; 1487c4452b9SChris Mason int ret; 1497c4452b9SChris Mason int i; 1507c4452b9SChris Mason int err; 1517c4452b9SChris Mason int werr = 0; 1527c4452b9SChris Mason struct page *page; 1537c4452b9SChris Mason struct radix_tree_root *dirty_pages; 1547c4452b9SChris Mason struct inode *btree_inode = root->fs_info->btree_inode; 1557c4452b9SChris Mason 1567c4452b9SChris Mason if (!trans || !trans->transaction) { 1577c4452b9SChris Mason return filemap_write_and_wait(btree_inode->i_mapping); 1587c4452b9SChris Mason } 1597c4452b9SChris Mason dirty_pages = &trans->transaction->dirty_pages; 1607c4452b9SChris Mason while(1) { 161e37c9e69SChris Mason ret = find_first_radix_bit(dirty_pages, gang, 162e37c9e69SChris Mason 0, ARRAY_SIZE(gang)); 1637c4452b9SChris Mason if (!ret) 1647c4452b9SChris Mason break; 1657c4452b9SChris Mason for (i = 0; i < ret; i++) { 1667c4452b9SChris Mason /* FIXME EIO */ 1677c4452b9SChris Mason clear_radix_bit(dirty_pages, gang[i]); 1687c4452b9SChris Mason page = find_lock_page(btree_inode->i_mapping, 1697c4452b9SChris Mason gang[i]); 1707c4452b9SChris Mason if (!page) 1717c4452b9SChris Mason continue; 1726702ed49SChris Mason if (PageWriteback(page)) { 1736702ed49SChris Mason if (PageDirty(page)) 1746702ed49SChris Mason wait_on_page_writeback(page); 1756702ed49SChris Mason else { 1766702ed49SChris Mason unlock_page(page); 1776702ed49SChris Mason page_cache_release(page); 1786702ed49SChris Mason continue; 1796702ed49SChris Mason } 1806702ed49SChris Mason } 1817c4452b9SChris Mason err = write_one_page(page, 0); 1827c4452b9SChris Mason if (err) 1837c4452b9SChris Mason werr = err; 1847c4452b9SChris Mason page_cache_release(page); 1857c4452b9SChris Mason } 1867c4452b9SChris Mason } 1877c4452b9SChris Mason err = filemap_fdatawait(btree_inode->i_mapping); 1887c4452b9SChris Mason if (err) 1897c4452b9SChris Mason werr = err; 1907c4452b9SChris Mason return werr; 19179154b1bSChris Mason } 19279154b1bSChris Mason 19379154b1bSChris Mason int btrfs_commit_tree_roots(struct btrfs_trans_handle *trans, 19479154b1bSChris Mason struct btrfs_root *root) 19579154b1bSChris Mason { 19679154b1bSChris Mason int ret; 19779154b1bSChris Mason u64 old_extent_block; 19879154b1bSChris Mason struct btrfs_fs_info *fs_info = root->fs_info; 19979154b1bSChris Mason struct btrfs_root *tree_root = fs_info->tree_root; 20079154b1bSChris Mason struct btrfs_root *extent_root = fs_info->extent_root; 20179154b1bSChris Mason 2029078a3e1SChris Mason btrfs_write_dirty_block_groups(trans, extent_root); 20379154b1bSChris Mason while(1) { 20479154b1bSChris Mason old_extent_block = btrfs_root_blocknr(&extent_root->root_item); 2057eccb903SChris Mason if (old_extent_block == bh_blocknr(extent_root->node)) 20679154b1bSChris Mason break; 20779154b1bSChris Mason btrfs_set_root_blocknr(&extent_root->root_item, 2087eccb903SChris Mason bh_blocknr(extent_root->node)); 20979154b1bSChris Mason ret = btrfs_update_root(trans, tree_root, 21079154b1bSChris Mason &extent_root->root_key, 21179154b1bSChris Mason &extent_root->root_item); 21279154b1bSChris Mason BUG_ON(ret); 2139078a3e1SChris Mason btrfs_write_dirty_block_groups(trans, extent_root); 21479154b1bSChris Mason } 21579154b1bSChris Mason return 0; 21679154b1bSChris Mason } 21779154b1bSChris Mason 21879154b1bSChris Mason static int wait_for_commit(struct btrfs_root *root, 21979154b1bSChris Mason struct btrfs_transaction *commit) 22079154b1bSChris Mason { 22179154b1bSChris Mason DEFINE_WAIT(wait); 222ccd467d6SChris Mason mutex_lock(&root->fs_info->trans_mutex); 22379154b1bSChris Mason while(!commit->commit_done) { 22479154b1bSChris Mason prepare_to_wait(&commit->commit_wait, &wait, 22579154b1bSChris Mason TASK_UNINTERRUPTIBLE); 22679154b1bSChris Mason if (commit->commit_done) 22779154b1bSChris Mason break; 22879154b1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 22979154b1bSChris Mason schedule(); 23079154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 23179154b1bSChris Mason } 232ccd467d6SChris Mason mutex_unlock(&root->fs_info->trans_mutex); 23379154b1bSChris Mason finish_wait(&commit->commit_wait, &wait); 23479154b1bSChris Mason return 0; 23579154b1bSChris Mason } 23679154b1bSChris Mason 2370f7d52f4SChris Mason struct dirty_root { 2380f7d52f4SChris Mason struct list_head list; 2390f7d52f4SChris Mason struct btrfs_root *root; 24058176a96SJosef Bacik struct btrfs_root *latest_root; 2410f7d52f4SChris Mason }; 2420f7d52f4SChris Mason 2435ce14bbcSChris Mason int btrfs_add_dead_root(struct btrfs_root *root, 2445ce14bbcSChris Mason struct btrfs_root *latest, 2455ce14bbcSChris Mason struct list_head *dead_list) 2465eda7b5eSChris Mason { 2475eda7b5eSChris Mason struct dirty_root *dirty; 2485eda7b5eSChris Mason 2495eda7b5eSChris Mason dirty = kmalloc(sizeof(*dirty), GFP_NOFS); 2505eda7b5eSChris Mason if (!dirty) 2515eda7b5eSChris Mason return -ENOMEM; 2525eda7b5eSChris Mason dirty->root = root; 2535ce14bbcSChris Mason dirty->latest_root = latest; 2545eda7b5eSChris Mason list_add(&dirty->list, dead_list); 2555eda7b5eSChris Mason return 0; 2565eda7b5eSChris Mason } 2575eda7b5eSChris Mason 25835b7e476SChris Mason static int add_dirty_roots(struct btrfs_trans_handle *trans, 25935b7e476SChris Mason struct radix_tree_root *radix, 26035b7e476SChris Mason struct list_head *list) 2610f7d52f4SChris Mason { 2620f7d52f4SChris Mason struct dirty_root *dirty; 2630f7d52f4SChris Mason struct btrfs_root *gang[8]; 2640f7d52f4SChris Mason struct btrfs_root *root; 2650f7d52f4SChris Mason int i; 2660f7d52f4SChris Mason int ret; 26754aa1f4dSChris Mason int err = 0; 2685eda7b5eSChris Mason u32 refs; 26954aa1f4dSChris Mason 2700f7d52f4SChris Mason while(1) { 2710f7d52f4SChris Mason ret = radix_tree_gang_lookup_tag(radix, (void **)gang, 0, 2720f7d52f4SChris Mason ARRAY_SIZE(gang), 2730f7d52f4SChris Mason BTRFS_ROOT_TRANS_TAG); 2740f7d52f4SChris Mason if (ret == 0) 2750f7d52f4SChris Mason break; 2760f7d52f4SChris Mason for (i = 0; i < ret; i++) { 2770f7d52f4SChris Mason root = gang[i]; 2782619ba1fSChris Mason radix_tree_tag_clear(radix, 2792619ba1fSChris Mason (unsigned long)root->root_key.objectid, 2800f7d52f4SChris Mason BTRFS_ROOT_TRANS_TAG); 2810f7d52f4SChris Mason if (root->commit_root == root->node) { 2827eccb903SChris Mason WARN_ON(bh_blocknr(root->node) != 2830f7d52f4SChris Mason btrfs_root_blocknr(&root->root_item)); 2840f7d52f4SChris Mason brelse(root->commit_root); 2850f7d52f4SChris Mason root->commit_root = NULL; 28658176a96SJosef Bacik 28758176a96SJosef Bacik /* make sure to update the root on disk 28858176a96SJosef Bacik * so we get any updates to the block used 28958176a96SJosef Bacik * counts 29058176a96SJosef Bacik */ 29158176a96SJosef Bacik err = btrfs_update_root(trans, 29258176a96SJosef Bacik root->fs_info->tree_root, 29358176a96SJosef Bacik &root->root_key, 29458176a96SJosef Bacik &root->root_item); 2950f7d52f4SChris Mason continue; 2960f7d52f4SChris Mason } 2970f7d52f4SChris Mason dirty = kmalloc(sizeof(*dirty), GFP_NOFS); 2980f7d52f4SChris Mason BUG_ON(!dirty); 2999f3a7427SChris Mason dirty->root = kmalloc(sizeof(*dirty->root), GFP_NOFS); 3009f3a7427SChris Mason BUG_ON(!dirty->root); 3019f3a7427SChris Mason 3029f3a7427SChris Mason memset(&root->root_item.drop_progress, 0, 3039f3a7427SChris Mason sizeof(struct btrfs_disk_key)); 3049f3a7427SChris Mason root->root_item.drop_level = 0; 3059f3a7427SChris Mason 3069f3a7427SChris Mason memcpy(dirty->root, root, sizeof(*root)); 3079f3a7427SChris Mason dirty->root->node = root->commit_root; 30858176a96SJosef Bacik dirty->latest_root = root; 3090f7d52f4SChris Mason root->commit_root = NULL; 3105eda7b5eSChris Mason 3110f7d52f4SChris Mason root->root_key.offset = root->fs_info->generation; 3120f7d52f4SChris Mason btrfs_set_root_blocknr(&root->root_item, 3137eccb903SChris Mason bh_blocknr(root->node)); 3140f7d52f4SChris Mason err = btrfs_insert_root(trans, root->fs_info->tree_root, 3150f7d52f4SChris Mason &root->root_key, 3160f7d52f4SChris Mason &root->root_item); 31754aa1f4dSChris Mason if (err) 31854aa1f4dSChris Mason break; 3199f3a7427SChris Mason 3209f3a7427SChris Mason refs = btrfs_root_refs(&dirty->root->root_item); 3219f3a7427SChris Mason btrfs_set_root_refs(&dirty->root->root_item, refs - 1); 3225eda7b5eSChris Mason err = btrfs_update_root(trans, root->fs_info->tree_root, 3239f3a7427SChris Mason &dirty->root->root_key, 3249f3a7427SChris Mason &dirty->root->root_item); 3255eda7b5eSChris Mason 3265eda7b5eSChris Mason BUG_ON(err); 3279f3a7427SChris Mason if (refs == 1) { 3280f7d52f4SChris Mason list_add(&dirty->list, list); 3299f3a7427SChris Mason } else { 3309f3a7427SChris Mason WARN_ON(1); 3319f3a7427SChris Mason kfree(dirty->root); 3325eda7b5eSChris Mason kfree(dirty); 3330f7d52f4SChris Mason } 3340f7d52f4SChris Mason } 3359f3a7427SChris Mason } 33654aa1f4dSChris Mason return err; 3370f7d52f4SChris Mason } 3380f7d52f4SChris Mason 339e9d0b13bSChris Mason int btrfs_defrag_root(struct btrfs_root *root, int cacheonly) 340e9d0b13bSChris Mason { 341e9d0b13bSChris Mason struct btrfs_fs_info *info = root->fs_info; 342e9d0b13bSChris Mason int ret; 343e9d0b13bSChris Mason struct btrfs_trans_handle *trans; 344d3c2fdcfSChris Mason unsigned long nr; 345e9d0b13bSChris Mason 346e9d0b13bSChris Mason if (root->defrag_running) 347e9d0b13bSChris Mason return 0; 348e9d0b13bSChris Mason 349e9d0b13bSChris Mason trans = btrfs_start_transaction(root, 1); 350e9d0b13bSChris Mason while (1) { 351e9d0b13bSChris Mason root->defrag_running = 1; 352e9d0b13bSChris Mason ret = btrfs_defrag_leaves(trans, root, cacheonly); 353d3c2fdcfSChris Mason nr = trans->blocks_used; 354e9d0b13bSChris Mason btrfs_end_transaction(trans, root); 355e9d0b13bSChris Mason mutex_unlock(&info->fs_mutex); 356e9d0b13bSChris Mason 357d3c2fdcfSChris Mason btrfs_btree_balance_dirty(info->tree_root, nr); 358e9d0b13bSChris Mason cond_resched(); 359e9d0b13bSChris Mason 360e9d0b13bSChris Mason mutex_lock(&info->fs_mutex); 361e9d0b13bSChris Mason trans = btrfs_start_transaction(root, 1); 362e9d0b13bSChris Mason if (ret != -EAGAIN) 363e9d0b13bSChris Mason break; 364e9d0b13bSChris Mason } 365e9d0b13bSChris Mason root->defrag_running = 0; 366e9d0b13bSChris Mason radix_tree_tag_clear(&info->fs_roots_radix, 367e9d0b13bSChris Mason (unsigned long)root->root_key.objectid, 368e9d0b13bSChris Mason BTRFS_ROOT_DEFRAG_TAG); 369e9d0b13bSChris Mason btrfs_end_transaction(trans, root); 370e9d0b13bSChris Mason return 0; 371e9d0b13bSChris Mason } 372e9d0b13bSChris Mason 3736702ed49SChris Mason int btrfs_defrag_dirty_roots(struct btrfs_fs_info *info) 3746702ed49SChris Mason { 3756702ed49SChris Mason struct btrfs_root *gang[1]; 3766702ed49SChris Mason struct btrfs_root *root; 3776702ed49SChris Mason int i; 3786702ed49SChris Mason int ret; 3796702ed49SChris Mason int err = 0; 3806702ed49SChris Mason u64 last = 0; 3816702ed49SChris Mason 3826702ed49SChris Mason while(1) { 3836702ed49SChris Mason ret = radix_tree_gang_lookup_tag(&info->fs_roots_radix, 3846702ed49SChris Mason (void **)gang, last, 3856702ed49SChris Mason ARRAY_SIZE(gang), 3866702ed49SChris Mason BTRFS_ROOT_DEFRAG_TAG); 3876702ed49SChris Mason if (ret == 0) 3886702ed49SChris Mason break; 3896702ed49SChris Mason for (i = 0; i < ret; i++) { 3906702ed49SChris Mason root = gang[i]; 3916702ed49SChris Mason last = root->root_key.objectid + 1; 392e9d0b13bSChris Mason btrfs_defrag_root(root, 1); 3936702ed49SChris Mason } 3946702ed49SChris Mason } 395e9d0b13bSChris Mason btrfs_defrag_root(info->extent_root, 1); 3966702ed49SChris Mason return err; 3976702ed49SChris Mason } 3986702ed49SChris Mason 39935b7e476SChris Mason static int drop_dirty_roots(struct btrfs_root *tree_root, 40035b7e476SChris Mason struct list_head *list) 4010f7d52f4SChris Mason { 4020f7d52f4SChris Mason struct dirty_root *dirty; 4030f7d52f4SChris Mason struct btrfs_trans_handle *trans; 404d3c2fdcfSChris Mason unsigned long nr; 40558176a96SJosef Bacik u64 num_blocks; 40658176a96SJosef Bacik u64 blocks_used; 40754aa1f4dSChris Mason int ret = 0; 4089f3a7427SChris Mason int err; 4099f3a7427SChris Mason 4100f7d52f4SChris Mason while(!list_empty(list)) { 41158176a96SJosef Bacik struct btrfs_root *root; 41258176a96SJosef Bacik 413facda1e7SChris Mason mutex_lock(&tree_root->fs_info->fs_mutex); 4140f7d52f4SChris Mason dirty = list_entry(list->next, struct dirty_root, list); 4150f7d52f4SChris Mason list_del_init(&dirty->list); 4165eda7b5eSChris Mason 41758176a96SJosef Bacik num_blocks = btrfs_root_blocks_used(&dirty->root->root_item); 41858176a96SJosef Bacik root = dirty->latest_root; 41958176a96SJosef Bacik 4209f3a7427SChris Mason while(1) { 4210f7d52f4SChris Mason trans = btrfs_start_transaction(tree_root, 1); 4229f3a7427SChris Mason ret = btrfs_drop_snapshot(trans, dirty->root); 4239f3a7427SChris Mason if (ret != -EAGAIN) { 4249f3a7427SChris Mason break; 4259f3a7427SChris Mason } 42658176a96SJosef Bacik 4279f3a7427SChris Mason err = btrfs_update_root(trans, 4289f3a7427SChris Mason tree_root, 4299f3a7427SChris Mason &dirty->root->root_key, 4309f3a7427SChris Mason &dirty->root->root_item); 4319f3a7427SChris Mason if (err) 4329f3a7427SChris Mason ret = err; 433d3c2fdcfSChris Mason nr = trans->blocks_used; 4349f3a7427SChris Mason ret = btrfs_end_transaction(trans, tree_root); 4350f7d52f4SChris Mason BUG_ON(ret); 436f4468e94SChris Mason mutex_unlock(&tree_root->fs_info->fs_mutex); 437d3c2fdcfSChris Mason btrfs_btree_balance_dirty(tree_root, nr); 438f4468e94SChris Mason schedule(); 439f4468e94SChris Mason 440f4468e94SChris Mason mutex_lock(&tree_root->fs_info->fs_mutex); 4419f3a7427SChris Mason } 4429f3a7427SChris Mason BUG_ON(ret); 44358176a96SJosef Bacik 44458176a96SJosef Bacik num_blocks -= btrfs_root_blocks_used(&dirty->root->root_item); 44558176a96SJosef Bacik blocks_used = btrfs_root_blocks_used(&root->root_item); 44658176a96SJosef Bacik if (num_blocks) { 44758176a96SJosef Bacik record_root_in_trans(root); 44858176a96SJosef Bacik btrfs_set_root_blocks_used(&root->root_item, 44958176a96SJosef Bacik blocks_used - num_blocks); 45058176a96SJosef Bacik } 4519f3a7427SChris Mason ret = btrfs_del_root(trans, tree_root, &dirty->root->root_key); 45258176a96SJosef Bacik if (ret) { 45358176a96SJosef Bacik BUG(); 45454aa1f4dSChris Mason break; 45558176a96SJosef Bacik } 456d3c2fdcfSChris Mason nr = trans->blocks_used; 4570f7d52f4SChris Mason ret = btrfs_end_transaction(trans, tree_root); 4580f7d52f4SChris Mason BUG_ON(ret); 4595eda7b5eSChris Mason 4605eda7b5eSChris Mason kfree(dirty->root); 4610f7d52f4SChris Mason kfree(dirty); 462facda1e7SChris Mason mutex_unlock(&tree_root->fs_info->fs_mutex); 463d3c2fdcfSChris Mason 464d3c2fdcfSChris Mason btrfs_btree_balance_dirty(tree_root, nr); 465f4468e94SChris Mason schedule(); 4660f7d52f4SChris Mason } 46754aa1f4dSChris Mason return ret; 4680f7d52f4SChris Mason } 4690f7d52f4SChris Mason 47079154b1bSChris Mason int btrfs_commit_transaction(struct btrfs_trans_handle *trans, 47179154b1bSChris Mason struct btrfs_root *root) 47279154b1bSChris Mason { 47315ee9bc7SJosef Bacik unsigned long joined = 0; 47415ee9bc7SJosef Bacik unsigned long timeout = 1; 47579154b1bSChris Mason struct btrfs_transaction *cur_trans; 4768fd17795SChris Mason struct btrfs_transaction *prev_trans = NULL; 4770f7d52f4SChris Mason struct list_head dirty_fs_roots; 478ccd467d6SChris Mason struct radix_tree_root pinned_copy; 47979154b1bSChris Mason DEFINE_WAIT(wait); 48015ee9bc7SJosef Bacik int ret; 48179154b1bSChris Mason 482ccd467d6SChris Mason init_bit_radix(&pinned_copy); 4830f7d52f4SChris Mason INIT_LIST_HEAD(&dirty_fs_roots); 484d6e4a428SChris Mason 48579154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 48679154b1bSChris Mason if (trans->transaction->in_commit) { 48779154b1bSChris Mason cur_trans = trans->transaction; 48879154b1bSChris Mason trans->transaction->use_count++; 489ccd467d6SChris Mason mutex_unlock(&root->fs_info->trans_mutex); 49079154b1bSChris Mason btrfs_end_transaction(trans, root); 491ccd467d6SChris Mason 492ccd467d6SChris Mason mutex_unlock(&root->fs_info->fs_mutex); 49379154b1bSChris Mason ret = wait_for_commit(root, cur_trans); 49479154b1bSChris Mason BUG_ON(ret); 49515ee9bc7SJosef Bacik 49615ee9bc7SJosef Bacik mutex_lock(&root->fs_info->trans_mutex); 49779154b1bSChris Mason put_transaction(cur_trans); 49815ee9bc7SJosef Bacik mutex_unlock(&root->fs_info->trans_mutex); 49915ee9bc7SJosef Bacik 500ccd467d6SChris Mason mutex_lock(&root->fs_info->fs_mutex); 50179154b1bSChris Mason return 0; 50279154b1bSChris Mason } 5032c90e5d6SChris Mason trans->transaction->in_commit = 1; 504ccd467d6SChris Mason cur_trans = trans->transaction; 505ccd467d6SChris Mason if (cur_trans->list.prev != &root->fs_info->trans_list) { 506ccd467d6SChris Mason prev_trans = list_entry(cur_trans->list.prev, 507ccd467d6SChris Mason struct btrfs_transaction, list); 508ccd467d6SChris Mason if (!prev_trans->commit_done) { 509ccd467d6SChris Mason prev_trans->use_count++; 510ccd467d6SChris Mason mutex_unlock(&root->fs_info->fs_mutex); 511ccd467d6SChris Mason mutex_unlock(&root->fs_info->trans_mutex); 512ccd467d6SChris Mason 513ccd467d6SChris Mason wait_for_commit(root, prev_trans); 514ccd467d6SChris Mason 515ccd467d6SChris Mason mutex_lock(&root->fs_info->fs_mutex); 516ccd467d6SChris Mason mutex_lock(&root->fs_info->trans_mutex); 51715ee9bc7SJosef Bacik put_transaction(prev_trans); 518ccd467d6SChris Mason } 519ccd467d6SChris Mason } 52015ee9bc7SJosef Bacik 52115ee9bc7SJosef Bacik do { 52215ee9bc7SJosef Bacik joined = cur_trans->num_joined; 5232c90e5d6SChris Mason WARN_ON(cur_trans != trans->transaction); 52415ee9bc7SJosef Bacik prepare_to_wait(&cur_trans->writer_wait, &wait, 52579154b1bSChris Mason TASK_UNINTERRUPTIBLE); 52615ee9bc7SJosef Bacik 52715ee9bc7SJosef Bacik if (cur_trans->num_writers > 1) 52815ee9bc7SJosef Bacik timeout = MAX_SCHEDULE_TIMEOUT; 52915ee9bc7SJosef Bacik else 53015ee9bc7SJosef Bacik timeout = 1; 53115ee9bc7SJosef Bacik 532ccd467d6SChris Mason mutex_unlock(&root->fs_info->fs_mutex); 53379154b1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 53415ee9bc7SJosef Bacik 53515ee9bc7SJosef Bacik schedule_timeout(timeout); 53615ee9bc7SJosef Bacik 537ccd467d6SChris Mason mutex_lock(&root->fs_info->fs_mutex); 53879154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 53915ee9bc7SJosef Bacik finish_wait(&cur_trans->writer_wait, &wait); 54015ee9bc7SJosef Bacik } while (cur_trans->num_writers > 1 || 54115ee9bc7SJosef Bacik (cur_trans->num_joined != joined)); 54215ee9bc7SJosef Bacik 5432c90e5d6SChris Mason WARN_ON(cur_trans != trans->transaction); 54454aa1f4dSChris Mason ret = add_dirty_roots(trans, &root->fs_info->fs_roots_radix, 54554aa1f4dSChris Mason &dirty_fs_roots); 54654aa1f4dSChris Mason BUG_ON(ret); 54754aa1f4dSChris Mason 54879154b1bSChris Mason ret = btrfs_commit_tree_roots(trans, root); 54979154b1bSChris Mason BUG_ON(ret); 55054aa1f4dSChris Mason 55178fae27eSChris Mason cur_trans = root->fs_info->running_transaction; 55278fae27eSChris Mason root->fs_info->running_transaction = NULL; 5534b52dff6SChris Mason btrfs_set_super_generation(&root->fs_info->super_copy, 5544b52dff6SChris Mason cur_trans->transid); 5554b52dff6SChris Mason btrfs_set_super_root(&root->fs_info->super_copy, 5564b52dff6SChris Mason bh_blocknr(root->fs_info->tree_root->node)); 5574b52dff6SChris Mason memcpy(root->fs_info->disk_super, &root->fs_info->super_copy, 5584b52dff6SChris Mason sizeof(root->fs_info->super_copy)); 559ccd467d6SChris Mason 560ccd467d6SChris Mason btrfs_copy_pinned(root, &pinned_copy); 561ccd467d6SChris Mason 56278fae27eSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 5638fd17795SChris Mason mutex_unlock(&root->fs_info->fs_mutex); 56479154b1bSChris Mason ret = btrfs_write_and_wait_transaction(trans, root); 56579154b1bSChris Mason BUG_ON(ret); 56679154b1bSChris Mason write_ctree_super(trans, root); 5678fd17795SChris Mason mutex_lock(&root->fs_info->fs_mutex); 568ccd467d6SChris Mason btrfs_finish_extent_commit(trans, root, &pinned_copy); 56978fae27eSChris Mason mutex_lock(&root->fs_info->trans_mutex); 5702c90e5d6SChris Mason cur_trans->commit_done = 1; 57115ee9bc7SJosef Bacik root->fs_info->last_trans_committed = cur_trans->transid; 5722c90e5d6SChris Mason wake_up(&cur_trans->commit_wait); 57379154b1bSChris Mason put_transaction(cur_trans); 57478fae27eSChris Mason put_transaction(cur_trans); 57558176a96SJosef Bacik 576facda1e7SChris Mason if (root->fs_info->closing) 577facda1e7SChris Mason list_splice_init(&root->fs_info->dead_roots, &dirty_fs_roots); 578facda1e7SChris Mason else 579facda1e7SChris Mason list_splice_init(&dirty_fs_roots, &root->fs_info->dead_roots); 58058176a96SJosef Bacik 58178fae27eSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 5822c90e5d6SChris Mason kmem_cache_free(btrfs_trans_handle_cachep, trans); 58379154b1bSChris Mason 584facda1e7SChris Mason if (root->fs_info->closing) { 585facda1e7SChris Mason mutex_unlock(&root->fs_info->fs_mutex); 5860f7d52f4SChris Mason drop_dirty_roots(root->fs_info->tree_root, &dirty_fs_roots); 587facda1e7SChris Mason mutex_lock(&root->fs_info->fs_mutex); 588facda1e7SChris Mason } 58979154b1bSChris Mason return ret; 59079154b1bSChris Mason } 59179154b1bSChris Mason 592e9d0b13bSChris Mason int btrfs_clean_old_snapshots(struct btrfs_root *root) 593e9d0b13bSChris Mason { 594e9d0b13bSChris Mason struct list_head dirty_roots; 595e9d0b13bSChris Mason INIT_LIST_HEAD(&dirty_roots); 596e9d0b13bSChris Mason 597e9d0b13bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 598e9d0b13bSChris Mason list_splice_init(&root->fs_info->dead_roots, &dirty_roots); 599e9d0b13bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 600e9d0b13bSChris Mason 601e9d0b13bSChris Mason if (!list_empty(&dirty_roots)) { 602e9d0b13bSChris Mason drop_dirty_roots(root, &dirty_roots); 603e9d0b13bSChris Mason } 604e9d0b13bSChris Mason return 0; 605e9d0b13bSChris Mason } 60608607c1bSChris Mason void btrfs_transaction_cleaner(struct work_struct *work) 60708607c1bSChris Mason { 60808607c1bSChris Mason struct btrfs_fs_info *fs_info = container_of(work, 60908607c1bSChris Mason struct btrfs_fs_info, 61008607c1bSChris Mason trans_work.work); 61108607c1bSChris Mason 61208607c1bSChris Mason struct btrfs_root *root = fs_info->tree_root; 61308607c1bSChris Mason struct btrfs_transaction *cur; 61408607c1bSChris Mason struct btrfs_trans_handle *trans; 61508607c1bSChris Mason unsigned long now; 61608607c1bSChris Mason unsigned long delay = HZ * 30; 61708607c1bSChris Mason int ret; 61808607c1bSChris Mason 61908607c1bSChris Mason mutex_lock(&root->fs_info->fs_mutex); 62008607c1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 62108607c1bSChris Mason cur = root->fs_info->running_transaction; 62208607c1bSChris Mason if (!cur) { 62308607c1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 62408607c1bSChris Mason goto out; 62508607c1bSChris Mason } 62608607c1bSChris Mason now = get_seconds(); 62708607c1bSChris Mason if (now < cur->start_time || now - cur->start_time < 30) { 62808607c1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 62908607c1bSChris Mason delay = HZ * 5; 63008607c1bSChris Mason goto out; 63108607c1bSChris Mason } 63208607c1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 6336702ed49SChris Mason btrfs_defrag_dirty_roots(root->fs_info); 63408607c1bSChris Mason trans = btrfs_start_transaction(root, 1); 63508607c1bSChris Mason ret = btrfs_commit_transaction(trans, root); 63608607c1bSChris Mason out: 63708607c1bSChris Mason mutex_unlock(&root->fs_info->fs_mutex); 638e9d0b13bSChris Mason btrfs_clean_old_snapshots(root); 63908607c1bSChris Mason btrfs_transaction_queue_work(root, delay); 64008607c1bSChris Mason } 64108607c1bSChris Mason 64208607c1bSChris Mason void btrfs_transaction_queue_work(struct btrfs_root *root, int delay) 64308607c1bSChris Mason { 64408607c1bSChris Mason queue_delayed_work(trans_wq, &root->fs_info->trans_work, delay); 64508607c1bSChris Mason } 64608607c1bSChris Mason 64708607c1bSChris Mason void btrfs_transaction_flush_work(struct btrfs_root *root) 64808607c1bSChris Mason { 64908607c1bSChris Mason cancel_rearming_delayed_workqueue(trans_wq, &root->fs_info->trans_work); 65008607c1bSChris Mason flush_workqueue(trans_wq); 65108607c1bSChris Mason } 65208607c1bSChris Mason 65308607c1bSChris Mason void __init btrfs_init_transaction_sys(void) 65408607c1bSChris Mason { 65508607c1bSChris Mason trans_wq = create_workqueue("btrfs"); 65608607c1bSChris Mason } 65708607c1bSChris Mason 65808607c1bSChris Mason void __exit btrfs_exit_transaction_sys(void) 65908607c1bSChris Mason { 66008607c1bSChris Mason destroy_workqueue(trans_wq); 66108607c1bSChris Mason } 66208607c1bSChris Mason 663