179154b1bSChris Mason #include <linux/module.h> 279154b1bSChris Mason #include <linux/fs.h> 379154b1bSChris Mason #include "ctree.h" 479154b1bSChris Mason #include "disk-io.h" 579154b1bSChris Mason #include "transaction.h" 679154b1bSChris Mason 778fae27eSChris Mason static int total_trans = 0; 82c90e5d6SChris Mason extern struct kmem_cache *btrfs_trans_handle_cachep; 92c90e5d6SChris Mason extern struct kmem_cache *btrfs_transaction_cachep; 102c90e5d6SChris Mason 110f7d52f4SChris Mason #define BTRFS_ROOT_TRANS_TAG 0 120f7d52f4SChris Mason 132c90e5d6SChris Mason #define TRANS_MAGIC 0xE1E10E 1479154b1bSChris Mason static void put_transaction(struct btrfs_transaction *transaction) 1579154b1bSChris Mason { 162c90e5d6SChris Mason WARN_ON(transaction->use_count == 0); 1779154b1bSChris Mason transaction->use_count--; 182c90e5d6SChris Mason WARN_ON(transaction->magic != TRANS_MAGIC); 1978fae27eSChris Mason if (transaction->use_count == 0) { 2078fae27eSChris Mason WARN_ON(total_trans == 0); 2178fae27eSChris Mason total_trans--; 228fd17795SChris Mason list_del_init(&transaction->list); 232c90e5d6SChris Mason memset(transaction, 0, sizeof(*transaction)); 242c90e5d6SChris Mason kmem_cache_free(btrfs_transaction_cachep, transaction); 2579154b1bSChris Mason } 2678fae27eSChris Mason } 2779154b1bSChris Mason 2879154b1bSChris Mason static int join_transaction(struct btrfs_root *root) 2979154b1bSChris Mason { 3079154b1bSChris Mason struct btrfs_transaction *cur_trans; 3179154b1bSChris Mason cur_trans = root->fs_info->running_transaction; 3279154b1bSChris Mason if (!cur_trans) { 332c90e5d6SChris Mason cur_trans = kmem_cache_alloc(btrfs_transaction_cachep, 342c90e5d6SChris Mason GFP_NOFS); 3578fae27eSChris Mason total_trans++; 3679154b1bSChris Mason BUG_ON(!cur_trans); 370f7d52f4SChris Mason root->fs_info->generation++; 3879154b1bSChris Mason root->fs_info->running_transaction = cur_trans; 3979154b1bSChris Mason cur_trans->num_writers = 0; 400f7d52f4SChris Mason cur_trans->transid = root->fs_info->generation; 4179154b1bSChris Mason init_waitqueue_head(&cur_trans->writer_wait); 4279154b1bSChris Mason init_waitqueue_head(&cur_trans->commit_wait); 432c90e5d6SChris Mason cur_trans->magic = TRANS_MAGIC; 4479154b1bSChris Mason cur_trans->in_commit = 0; 45d5719762SChris Mason cur_trans->use_count = 1; 4679154b1bSChris Mason cur_trans->commit_done = 0; 478fd17795SChris Mason list_add_tail(&cur_trans->list, &root->fs_info->trans_list); 4879154b1bSChris Mason } 4979154b1bSChris Mason cur_trans->num_writers++; 5079154b1bSChris Mason return 0; 5179154b1bSChris Mason } 5279154b1bSChris Mason 5379154b1bSChris Mason struct btrfs_trans_handle *btrfs_start_transaction(struct btrfs_root *root, 5479154b1bSChris Mason int num_blocks) 5579154b1bSChris Mason { 562c90e5d6SChris Mason struct btrfs_trans_handle *h = 572c90e5d6SChris Mason kmem_cache_alloc(btrfs_trans_handle_cachep, GFP_NOFS); 5879154b1bSChris Mason int ret; 590f7d52f4SChris Mason u64 running_trans_id; 6079154b1bSChris Mason 6179154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 6279154b1bSChris Mason ret = join_transaction(root); 6379154b1bSChris Mason BUG_ON(ret); 640f7d52f4SChris Mason running_trans_id = root->fs_info->running_transaction->transid; 650f7d52f4SChris Mason 660f7d52f4SChris Mason if (root != root->fs_info->tree_root && root->last_trans < 670f7d52f4SChris Mason running_trans_id) { 680f7d52f4SChris Mason radix_tree_tag_set(&root->fs_info->fs_roots_radix, 692619ba1fSChris Mason (unsigned long)root->root_key.objectid, 702619ba1fSChris Mason BTRFS_ROOT_TRANS_TAG); 710f7d52f4SChris Mason root->commit_root = root->node; 720f7d52f4SChris Mason get_bh(root->node); 730f7d52f4SChris Mason } 740f7d52f4SChris Mason root->last_trans = running_trans_id; 750f7d52f4SChris Mason h->transid = running_trans_id; 7679154b1bSChris Mason h->transaction = root->fs_info->running_transaction; 7779154b1bSChris Mason h->blocks_reserved = num_blocks; 7879154b1bSChris Mason h->blocks_used = 0; 7979154b1bSChris Mason root->fs_info->running_transaction->use_count++; 8079154b1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 812c90e5d6SChris Mason h->magic = h->magic2 = TRANS_MAGIC; 8279154b1bSChris Mason return h; 8379154b1bSChris Mason } 8479154b1bSChris Mason 8579154b1bSChris Mason int btrfs_end_transaction(struct btrfs_trans_handle *trans, 8679154b1bSChris Mason struct btrfs_root *root) 8779154b1bSChris Mason { 8879154b1bSChris Mason struct btrfs_transaction *cur_trans; 89d6e4a428SChris Mason 902c90e5d6SChris Mason WARN_ON(trans->magic != TRANS_MAGIC); 912c90e5d6SChris Mason WARN_ON(trans->magic2 != TRANS_MAGIC); 9279154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 9379154b1bSChris Mason cur_trans = root->fs_info->running_transaction; 94d5719762SChris Mason WARN_ON(cur_trans->num_writers < 1); 9579154b1bSChris Mason if (waitqueue_active(&cur_trans->writer_wait)) 9679154b1bSChris Mason wake_up(&cur_trans->writer_wait); 9779154b1bSChris Mason cur_trans->num_writers--; 9879154b1bSChris Mason put_transaction(cur_trans); 9979154b1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 100d6025579SChris Mason memset(trans, 0, sizeof(*trans)); 1012c90e5d6SChris Mason kmem_cache_free(btrfs_trans_handle_cachep, trans); 10279154b1bSChris Mason return 0; 10379154b1bSChris Mason } 10479154b1bSChris Mason 10579154b1bSChris Mason 10679154b1bSChris Mason int btrfs_write_and_wait_transaction(struct btrfs_trans_handle *trans, 10779154b1bSChris Mason struct btrfs_root *root) 10879154b1bSChris Mason { 1097cfcc17eSChris Mason filemap_write_and_wait(root->fs_info->btree_inode->i_mapping); 11079154b1bSChris Mason return 0; 11179154b1bSChris Mason } 11279154b1bSChris Mason 11379154b1bSChris Mason int btrfs_commit_tree_roots(struct btrfs_trans_handle *trans, 11479154b1bSChris Mason struct btrfs_root *root) 11579154b1bSChris Mason { 11679154b1bSChris Mason int ret; 11779154b1bSChris Mason u64 old_extent_block; 11879154b1bSChris Mason struct btrfs_fs_info *fs_info = root->fs_info; 11979154b1bSChris Mason struct btrfs_root *tree_root = fs_info->tree_root; 12079154b1bSChris Mason struct btrfs_root *extent_root = fs_info->extent_root; 1218352d8a4SChris Mason struct btrfs_root *dev_root = fs_info->dev_root; 12279154b1bSChris Mason 1238352d8a4SChris Mason if (btrfs_super_device_root(fs_info->disk_super) != 1248352d8a4SChris Mason bh_blocknr(dev_root->node)) { 1258352d8a4SChris Mason btrfs_set_super_device_root(fs_info->disk_super, 1268352d8a4SChris Mason bh_blocknr(dev_root->node)); 1278352d8a4SChris Mason } 128*9078a3e1SChris Mason btrfs_write_dirty_block_groups(trans, extent_root); 12979154b1bSChris Mason while(1) { 13079154b1bSChris Mason old_extent_block = btrfs_root_blocknr(&extent_root->root_item); 1317eccb903SChris Mason if (old_extent_block == bh_blocknr(extent_root->node)) 13279154b1bSChris Mason break; 13379154b1bSChris Mason btrfs_set_root_blocknr(&extent_root->root_item, 1347eccb903SChris Mason bh_blocknr(extent_root->node)); 13579154b1bSChris Mason ret = btrfs_update_root(trans, tree_root, 13679154b1bSChris Mason &extent_root->root_key, 13779154b1bSChris Mason &extent_root->root_item); 13879154b1bSChris Mason BUG_ON(ret); 139*9078a3e1SChris Mason btrfs_write_dirty_block_groups(trans, extent_root); 14079154b1bSChris Mason } 14179154b1bSChris Mason return 0; 14279154b1bSChris Mason } 14379154b1bSChris Mason 14479154b1bSChris Mason static int wait_for_commit(struct btrfs_root *root, 14579154b1bSChris Mason struct btrfs_transaction *commit) 14679154b1bSChris Mason { 14779154b1bSChris Mason DEFINE_WAIT(wait); 14879154b1bSChris Mason while(!commit->commit_done) { 14979154b1bSChris Mason prepare_to_wait(&commit->commit_wait, &wait, 15079154b1bSChris Mason TASK_UNINTERRUPTIBLE); 15179154b1bSChris Mason if (commit->commit_done) 15279154b1bSChris Mason break; 15379154b1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 15479154b1bSChris Mason schedule(); 15579154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 15679154b1bSChris Mason } 15779154b1bSChris Mason finish_wait(&commit->commit_wait, &wait); 15879154b1bSChris Mason return 0; 15979154b1bSChris Mason } 16079154b1bSChris Mason 1610f7d52f4SChris Mason struct dirty_root { 1620f7d52f4SChris Mason struct list_head list; 1630f7d52f4SChris Mason struct btrfs_key snap_key; 1640f7d52f4SChris Mason struct buffer_head *commit_root; 1650f7d52f4SChris Mason struct btrfs_root *root; 1660f7d52f4SChris Mason }; 1670f7d52f4SChris Mason 1680f7d52f4SChris Mason int add_dirty_roots(struct btrfs_trans_handle *trans, 1690f7d52f4SChris Mason struct radix_tree_root *radix, struct list_head *list) 1700f7d52f4SChris Mason { 1710f7d52f4SChris Mason struct dirty_root *dirty; 1720f7d52f4SChris Mason struct btrfs_root *gang[8]; 1730f7d52f4SChris Mason struct btrfs_root *root; 1740f7d52f4SChris Mason int i; 1750f7d52f4SChris Mason int ret; 1760f7d52f4SChris Mason int err; 1770f7d52f4SChris Mason while(1) { 1780f7d52f4SChris Mason ret = radix_tree_gang_lookup_tag(radix, (void **)gang, 0, 1790f7d52f4SChris Mason ARRAY_SIZE(gang), 1800f7d52f4SChris Mason BTRFS_ROOT_TRANS_TAG); 1810f7d52f4SChris Mason if (ret == 0) 1820f7d52f4SChris Mason break; 1830f7d52f4SChris Mason for (i = 0; i < ret; i++) { 1840f7d52f4SChris Mason root = gang[i]; 1852619ba1fSChris Mason radix_tree_tag_clear(radix, 1862619ba1fSChris Mason (unsigned long)root->root_key.objectid, 1870f7d52f4SChris Mason BTRFS_ROOT_TRANS_TAG); 1880f7d52f4SChris Mason if (root->commit_root == root->node) { 1897eccb903SChris Mason WARN_ON(bh_blocknr(root->node) != 1900f7d52f4SChris Mason btrfs_root_blocknr(&root->root_item)); 1910f7d52f4SChris Mason brelse(root->commit_root); 1920f7d52f4SChris Mason root->commit_root = NULL; 1930f7d52f4SChris Mason continue; 1940f7d52f4SChris Mason } 1950f7d52f4SChris Mason dirty = kmalloc(sizeof(*dirty), GFP_NOFS); 1960f7d52f4SChris Mason BUG_ON(!dirty); 1970f7d52f4SChris Mason memcpy(&dirty->snap_key, &root->root_key, 1980f7d52f4SChris Mason sizeof(root->root_key)); 1990f7d52f4SChris Mason dirty->commit_root = root->commit_root; 2000f7d52f4SChris Mason root->commit_root = NULL; 2010f7d52f4SChris Mason dirty->root = root; 2020f7d52f4SChris Mason root->root_key.offset = root->fs_info->generation; 2030f7d52f4SChris Mason btrfs_set_root_blocknr(&root->root_item, 2047eccb903SChris Mason bh_blocknr(root->node)); 2050f7d52f4SChris Mason err = btrfs_insert_root(trans, root->fs_info->tree_root, 2060f7d52f4SChris Mason &root->root_key, 2070f7d52f4SChris Mason &root->root_item); 2080f7d52f4SChris Mason BUG_ON(err); 2090f7d52f4SChris Mason list_add(&dirty->list, list); 2100f7d52f4SChris Mason } 2110f7d52f4SChris Mason } 2120f7d52f4SChris Mason return 0; 2130f7d52f4SChris Mason } 2140f7d52f4SChris Mason 2150f7d52f4SChris Mason int drop_dirty_roots(struct btrfs_root *tree_root, struct list_head *list) 2160f7d52f4SChris Mason { 2170f7d52f4SChris Mason struct dirty_root *dirty; 2180f7d52f4SChris Mason struct btrfs_trans_handle *trans; 2190f7d52f4SChris Mason int ret; 2200f7d52f4SChris Mason 2210f7d52f4SChris Mason while(!list_empty(list)) { 2220f7d52f4SChris Mason dirty = list_entry(list->next, struct dirty_root, list); 2230f7d52f4SChris Mason list_del_init(&dirty->list); 2240f7d52f4SChris Mason trans = btrfs_start_transaction(tree_root, 1); 2250f7d52f4SChris Mason ret = btrfs_drop_snapshot(trans, dirty->root, 2260f7d52f4SChris Mason dirty->commit_root); 2270f7d52f4SChris Mason BUG_ON(ret); 2280f7d52f4SChris Mason 2290f7d52f4SChris Mason ret = btrfs_del_root(trans, tree_root, &dirty->snap_key); 2300f7d52f4SChris Mason BUG_ON(ret); 2310f7d52f4SChris Mason ret = btrfs_end_transaction(trans, tree_root); 2320f7d52f4SChris Mason BUG_ON(ret); 2330f7d52f4SChris Mason kfree(dirty); 2340f7d52f4SChris Mason } 2350f7d52f4SChris Mason return 0; 2360f7d52f4SChris Mason } 2370f7d52f4SChris Mason 23879154b1bSChris Mason int btrfs_commit_transaction(struct btrfs_trans_handle *trans, 23979154b1bSChris Mason struct btrfs_root *root) 24079154b1bSChris Mason { 24179154b1bSChris Mason int ret = 0; 24279154b1bSChris Mason struct btrfs_transaction *cur_trans; 2438fd17795SChris Mason struct btrfs_transaction *prev_trans = NULL; 2440f7d52f4SChris Mason struct list_head dirty_fs_roots; 24579154b1bSChris Mason DEFINE_WAIT(wait); 24679154b1bSChris Mason 2470f7d52f4SChris Mason INIT_LIST_HEAD(&dirty_fs_roots); 248d6e4a428SChris Mason 24979154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 25079154b1bSChris Mason if (trans->transaction->in_commit) { 25179154b1bSChris Mason cur_trans = trans->transaction; 25279154b1bSChris Mason trans->transaction->use_count++; 25379154b1bSChris Mason btrfs_end_transaction(trans, root); 25479154b1bSChris Mason ret = wait_for_commit(root, cur_trans); 25579154b1bSChris Mason BUG_ON(ret); 25679154b1bSChris Mason put_transaction(cur_trans); 25779154b1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 25879154b1bSChris Mason return 0; 25979154b1bSChris Mason } 2602c90e5d6SChris Mason cur_trans = trans->transaction; 2612c90e5d6SChris Mason trans->transaction->in_commit = 1; 26279154b1bSChris Mason while (trans->transaction->num_writers > 1) { 2632c90e5d6SChris Mason WARN_ON(cur_trans != trans->transaction); 26479154b1bSChris Mason prepare_to_wait(&trans->transaction->writer_wait, &wait, 26579154b1bSChris Mason TASK_UNINTERRUPTIBLE); 26679154b1bSChris Mason if (trans->transaction->num_writers <= 1) 26779154b1bSChris Mason break; 26879154b1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 26979154b1bSChris Mason schedule(); 27079154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 2712c90e5d6SChris Mason finish_wait(&trans->transaction->writer_wait, &wait); 27279154b1bSChris Mason } 27379154b1bSChris Mason finish_wait(&trans->transaction->writer_wait, &wait); 2742c90e5d6SChris Mason WARN_ON(cur_trans != trans->transaction); 2750f7d52f4SChris Mason add_dirty_roots(trans, &root->fs_info->fs_roots_radix, &dirty_fs_roots); 27679154b1bSChris Mason ret = btrfs_commit_tree_roots(trans, root); 27779154b1bSChris Mason BUG_ON(ret); 27878fae27eSChris Mason cur_trans = root->fs_info->running_transaction; 27978fae27eSChris Mason root->fs_info->running_transaction = NULL; 2808fd17795SChris Mason if (cur_trans->list.prev != &root->fs_info->trans_list) { 2818fd17795SChris Mason prev_trans = list_entry(cur_trans->list.prev, 2828fd17795SChris Mason struct btrfs_transaction, list); 2838fd17795SChris Mason if (prev_trans->commit_done) 2848fd17795SChris Mason prev_trans = NULL; 2858fd17795SChris Mason else 2868fd17795SChris Mason prev_trans->use_count++; 2878fd17795SChris Mason } 28878fae27eSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 2898fd17795SChris Mason mutex_unlock(&root->fs_info->fs_mutex); 29079154b1bSChris Mason ret = btrfs_write_and_wait_transaction(trans, root); 2918fd17795SChris Mason if (prev_trans) { 2928fd17795SChris Mason mutex_lock(&root->fs_info->trans_mutex); 2938fd17795SChris Mason wait_for_commit(root, prev_trans); 2948fd17795SChris Mason put_transaction(prev_trans); 2958fd17795SChris Mason mutex_unlock(&root->fs_info->trans_mutex); 2968fd17795SChris Mason } 2978fd17795SChris Mason btrfs_set_super_generation(root->fs_info->disk_super, 2988fd17795SChris Mason cur_trans->transid); 29979154b1bSChris Mason BUG_ON(ret); 30079154b1bSChris Mason write_ctree_super(trans, root); 3018fd17795SChris Mason 3028fd17795SChris Mason mutex_lock(&root->fs_info->fs_mutex); 30378fae27eSChris Mason btrfs_finish_extent_commit(trans, root); 30478fae27eSChris Mason mutex_lock(&root->fs_info->trans_mutex); 3052c90e5d6SChris Mason cur_trans->commit_done = 1; 3062c90e5d6SChris Mason wake_up(&cur_trans->commit_wait); 30779154b1bSChris Mason put_transaction(cur_trans); 30878fae27eSChris Mason put_transaction(cur_trans); 30978fae27eSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 3102c90e5d6SChris Mason kmem_cache_free(btrfs_trans_handle_cachep, trans); 31179154b1bSChris Mason 3120f7d52f4SChris Mason drop_dirty_roots(root->fs_info->tree_root, &dirty_fs_roots); 31379154b1bSChris Mason return ret; 31479154b1bSChris Mason } 31579154b1bSChris Mason 316