179154b1bSChris Mason #include <linux/module.h> 279154b1bSChris Mason #include <linux/fs.h> 379154b1bSChris Mason #include "ctree.h" 479154b1bSChris Mason #include "disk-io.h" 579154b1bSChris Mason #include "transaction.h" 679154b1bSChris Mason 778fae27eSChris Mason static int total_trans = 0; 82c90e5d6SChris Mason extern struct kmem_cache *btrfs_trans_handle_cachep; 92c90e5d6SChris Mason extern struct kmem_cache *btrfs_transaction_cachep; 102c90e5d6SChris Mason 11*0f7d52f4SChris Mason #define BTRFS_ROOT_TRANS_TAG 0 12*0f7d52f4SChris Mason 132c90e5d6SChris Mason #define TRANS_MAGIC 0xE1E10E 1479154b1bSChris Mason static void put_transaction(struct btrfs_transaction *transaction) 1579154b1bSChris Mason { 162c90e5d6SChris Mason WARN_ON(transaction->use_count == 0); 1779154b1bSChris Mason transaction->use_count--; 182c90e5d6SChris Mason WARN_ON(transaction->magic != TRANS_MAGIC); 1978fae27eSChris Mason if (transaction->use_count == 0) { 2078fae27eSChris Mason WARN_ON(total_trans == 0); 2178fae27eSChris Mason total_trans--; 222c90e5d6SChris Mason memset(transaction, 0, sizeof(*transaction)); 232c90e5d6SChris Mason kmem_cache_free(btrfs_transaction_cachep, transaction); 2479154b1bSChris Mason } 2578fae27eSChris Mason } 2679154b1bSChris Mason 2779154b1bSChris Mason static int join_transaction(struct btrfs_root *root) 2879154b1bSChris Mason { 2979154b1bSChris Mason struct btrfs_transaction *cur_trans; 3079154b1bSChris Mason cur_trans = root->fs_info->running_transaction; 3179154b1bSChris Mason if (!cur_trans) { 322c90e5d6SChris Mason cur_trans = kmem_cache_alloc(btrfs_transaction_cachep, 332c90e5d6SChris Mason GFP_NOFS); 3478fae27eSChris Mason total_trans++; 3579154b1bSChris Mason BUG_ON(!cur_trans); 36*0f7d52f4SChris Mason root->fs_info->generation++; 3779154b1bSChris Mason root->fs_info->running_transaction = cur_trans; 3879154b1bSChris Mason cur_trans->num_writers = 0; 39*0f7d52f4SChris Mason cur_trans->transid = root->fs_info->generation; 4079154b1bSChris Mason init_waitqueue_head(&cur_trans->writer_wait); 4179154b1bSChris Mason init_waitqueue_head(&cur_trans->commit_wait); 422c90e5d6SChris Mason cur_trans->magic = TRANS_MAGIC; 4379154b1bSChris Mason cur_trans->in_commit = 0; 44d5719762SChris Mason cur_trans->use_count = 1; 4579154b1bSChris Mason cur_trans->commit_done = 0; 4679154b1bSChris Mason } 4779154b1bSChris Mason cur_trans->num_writers++; 4879154b1bSChris Mason return 0; 4979154b1bSChris Mason } 5079154b1bSChris Mason 5179154b1bSChris Mason struct btrfs_trans_handle *btrfs_start_transaction(struct btrfs_root *root, 5279154b1bSChris Mason int num_blocks) 5379154b1bSChris Mason { 542c90e5d6SChris Mason struct btrfs_trans_handle *h = 552c90e5d6SChris Mason kmem_cache_alloc(btrfs_trans_handle_cachep, GFP_NOFS); 5679154b1bSChris Mason int ret; 57*0f7d52f4SChris Mason u64 running_trans_id; 5879154b1bSChris Mason 5979154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 6079154b1bSChris Mason ret = join_transaction(root); 6179154b1bSChris Mason BUG_ON(ret); 62*0f7d52f4SChris Mason running_trans_id = root->fs_info->running_transaction->transid; 63*0f7d52f4SChris Mason 64*0f7d52f4SChris Mason if (root != root->fs_info->tree_root && root->last_trans < 65*0f7d52f4SChris Mason running_trans_id) { 66*0f7d52f4SChris Mason radix_tree_tag_set(&root->fs_info->fs_roots_radix, 67*0f7d52f4SChris Mason (unsigned long)root, BTRFS_ROOT_TRANS_TAG); 68*0f7d52f4SChris Mason root->commit_root = root->node; 69*0f7d52f4SChris Mason get_bh(root->node); 70*0f7d52f4SChris Mason } 71*0f7d52f4SChris Mason root->last_trans = running_trans_id; 72*0f7d52f4SChris Mason h->transid = running_trans_id; 7379154b1bSChris Mason h->transaction = root->fs_info->running_transaction; 7479154b1bSChris Mason h->blocks_reserved = num_blocks; 7579154b1bSChris Mason h->blocks_used = 0; 7679154b1bSChris Mason root->fs_info->running_transaction->use_count++; 7779154b1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 782c90e5d6SChris Mason h->magic = h->magic2 = TRANS_MAGIC; 7979154b1bSChris Mason return h; 8079154b1bSChris Mason } 8179154b1bSChris Mason 8279154b1bSChris Mason int btrfs_end_transaction(struct btrfs_trans_handle *trans, 8379154b1bSChris Mason struct btrfs_root *root) 8479154b1bSChris Mason { 8579154b1bSChris Mason struct btrfs_transaction *cur_trans; 86d6e4a428SChris Mason 872c90e5d6SChris Mason WARN_ON(trans->magic != TRANS_MAGIC); 882c90e5d6SChris Mason WARN_ON(trans->magic2 != TRANS_MAGIC); 8979154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 9079154b1bSChris Mason cur_trans = root->fs_info->running_transaction; 91d5719762SChris Mason WARN_ON(cur_trans->num_writers < 1); 9279154b1bSChris Mason if (waitqueue_active(&cur_trans->writer_wait)) 9379154b1bSChris Mason wake_up(&cur_trans->writer_wait); 9479154b1bSChris Mason cur_trans->num_writers--; 9579154b1bSChris Mason put_transaction(cur_trans); 9679154b1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 97d6025579SChris Mason memset(trans, 0, sizeof(*trans)); 982c90e5d6SChris Mason kmem_cache_free(btrfs_trans_handle_cachep, trans); 9979154b1bSChris Mason return 0; 10079154b1bSChris Mason } 10179154b1bSChris Mason 10279154b1bSChris Mason 10379154b1bSChris Mason int btrfs_write_and_wait_transaction(struct btrfs_trans_handle *trans, 10479154b1bSChris Mason struct btrfs_root *root) 10579154b1bSChris Mason { 1067cfcc17eSChris Mason filemap_write_and_wait(root->fs_info->btree_inode->i_mapping); 10779154b1bSChris Mason return 0; 10879154b1bSChris Mason } 10979154b1bSChris Mason 11079154b1bSChris Mason int btrfs_commit_tree_roots(struct btrfs_trans_handle *trans, 11179154b1bSChris Mason struct btrfs_root *root) 11279154b1bSChris Mason { 11379154b1bSChris Mason int ret; 11479154b1bSChris Mason u64 old_extent_block; 11579154b1bSChris Mason struct btrfs_fs_info *fs_info = root->fs_info; 11679154b1bSChris Mason struct btrfs_root *tree_root = fs_info->tree_root; 11779154b1bSChris Mason struct btrfs_root *extent_root = fs_info->extent_root; 11879154b1bSChris Mason struct btrfs_root *inode_root = fs_info->inode_root; 11979154b1bSChris Mason 12079154b1bSChris Mason btrfs_set_root_blocknr(&inode_root->root_item, 12179154b1bSChris Mason inode_root->node->b_blocknr); 12279154b1bSChris Mason ret = btrfs_update_root(trans, tree_root, 12379154b1bSChris Mason &inode_root->root_key, 12479154b1bSChris Mason &inode_root->root_item); 12579154b1bSChris Mason BUG_ON(ret); 12679154b1bSChris Mason while(1) { 12779154b1bSChris Mason old_extent_block = btrfs_root_blocknr(&extent_root->root_item); 12879154b1bSChris Mason if (old_extent_block == extent_root->node->b_blocknr) 12979154b1bSChris Mason break; 13079154b1bSChris Mason btrfs_set_root_blocknr(&extent_root->root_item, 13179154b1bSChris Mason extent_root->node->b_blocknr); 13279154b1bSChris Mason ret = btrfs_update_root(trans, tree_root, 13379154b1bSChris Mason &extent_root->root_key, 13479154b1bSChris Mason &extent_root->root_item); 13579154b1bSChris Mason BUG_ON(ret); 13679154b1bSChris Mason } 13779154b1bSChris Mason return 0; 13879154b1bSChris Mason } 13979154b1bSChris Mason 14079154b1bSChris Mason static int wait_for_commit(struct btrfs_root *root, 14179154b1bSChris Mason struct btrfs_transaction *commit) 14279154b1bSChris Mason { 14379154b1bSChris Mason DEFINE_WAIT(wait); 14479154b1bSChris Mason while(!commit->commit_done) { 14579154b1bSChris Mason prepare_to_wait(&commit->commit_wait, &wait, 14679154b1bSChris Mason TASK_UNINTERRUPTIBLE); 14779154b1bSChris Mason if (commit->commit_done) 14879154b1bSChris Mason break; 14979154b1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 15079154b1bSChris Mason schedule(); 15179154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 15279154b1bSChris Mason } 15379154b1bSChris Mason finish_wait(&commit->commit_wait, &wait); 15479154b1bSChris Mason return 0; 15579154b1bSChris Mason } 15679154b1bSChris Mason 157*0f7d52f4SChris Mason struct dirty_root { 158*0f7d52f4SChris Mason struct list_head list; 159*0f7d52f4SChris Mason struct btrfs_key snap_key; 160*0f7d52f4SChris Mason struct buffer_head *commit_root; 161*0f7d52f4SChris Mason struct btrfs_root *root; 162*0f7d52f4SChris Mason }; 163*0f7d52f4SChris Mason 164*0f7d52f4SChris Mason int add_dirty_roots(struct btrfs_trans_handle *trans, 165*0f7d52f4SChris Mason struct radix_tree_root *radix, struct list_head *list) 166*0f7d52f4SChris Mason { 167*0f7d52f4SChris Mason struct dirty_root *dirty; 168*0f7d52f4SChris Mason struct btrfs_root *gang[8]; 169*0f7d52f4SChris Mason struct btrfs_root *root; 170*0f7d52f4SChris Mason int i; 171*0f7d52f4SChris Mason int ret; 172*0f7d52f4SChris Mason int err; 173*0f7d52f4SChris Mason printk("add dirty\n"); 174*0f7d52f4SChris Mason while(1) { 175*0f7d52f4SChris Mason ret = radix_tree_gang_lookup_tag(radix, (void **)gang, 0, 176*0f7d52f4SChris Mason ARRAY_SIZE(gang), 177*0f7d52f4SChris Mason BTRFS_ROOT_TRANS_TAG); 178*0f7d52f4SChris Mason if (ret == 0) 179*0f7d52f4SChris Mason break; 180*0f7d52f4SChris Mason for (i = 0; i < ret; i++) { 181*0f7d52f4SChris Mason root = gang[i]; 182*0f7d52f4SChris Mason radix_tree_tag_clear(radix, (unsigned long)root, 183*0f7d52f4SChris Mason BTRFS_ROOT_TRANS_TAG); 184*0f7d52f4SChris Mason if (root->commit_root == root->node) { 185*0f7d52f4SChris Mason WARN_ON(root->node->b_blocknr != 186*0f7d52f4SChris Mason btrfs_root_blocknr(&root->root_item)); 187*0f7d52f4SChris Mason brelse(root->commit_root); 188*0f7d52f4SChris Mason root->commit_root = NULL; 189*0f7d52f4SChris Mason continue; 190*0f7d52f4SChris Mason } 191*0f7d52f4SChris Mason dirty = kmalloc(sizeof(*dirty), GFP_NOFS); 192*0f7d52f4SChris Mason BUG_ON(!dirty); 193*0f7d52f4SChris Mason memcpy(&dirty->snap_key, &root->root_key, 194*0f7d52f4SChris Mason sizeof(root->root_key)); 195*0f7d52f4SChris Mason dirty->commit_root = root->commit_root; 196*0f7d52f4SChris Mason root->commit_root = NULL; 197*0f7d52f4SChris Mason dirty->root = root; 198*0f7d52f4SChris Mason printk("adding dirty root %Lu gen %Lu blocknr %Lu\n", root->root_key.objectid, root->root_key.offset, dirty->commit_root->b_blocknr); 199*0f7d52f4SChris Mason root->root_key.offset = root->fs_info->generation; 200*0f7d52f4SChris Mason btrfs_set_root_blocknr(&root->root_item, 201*0f7d52f4SChris Mason root->node->b_blocknr); 202*0f7d52f4SChris Mason err = btrfs_insert_root(trans, root->fs_info->tree_root, 203*0f7d52f4SChris Mason &root->root_key, 204*0f7d52f4SChris Mason &root->root_item); 205*0f7d52f4SChris Mason BUG_ON(err); 206*0f7d52f4SChris Mason list_add(&dirty->list, list); 207*0f7d52f4SChris Mason } 208*0f7d52f4SChris Mason } 209*0f7d52f4SChris Mason printk("add dirty done\n"); 210*0f7d52f4SChris Mason return 0; 211*0f7d52f4SChris Mason } 212*0f7d52f4SChris Mason 213*0f7d52f4SChris Mason int drop_dirty_roots(struct btrfs_root *tree_root, struct list_head *list) 214*0f7d52f4SChris Mason { 215*0f7d52f4SChris Mason struct dirty_root *dirty; 216*0f7d52f4SChris Mason struct btrfs_trans_handle *trans; 217*0f7d52f4SChris Mason int ret; 218*0f7d52f4SChris Mason 219*0f7d52f4SChris Mason while(!list_empty(list)) { 220*0f7d52f4SChris Mason dirty = list_entry(list->next, struct dirty_root, list); 221*0f7d52f4SChris Mason list_del_init(&dirty->list); 222*0f7d52f4SChris Mason trans = btrfs_start_transaction(tree_root, 1); 223*0f7d52f4SChris Mason printk("drop snapshot root %p, commit_root blocknr %Lu generation %Lu\n", dirty->root, dirty->commit_root->b_blocknr, dirty->snap_key.offset); 224*0f7d52f4SChris Mason ret = btrfs_drop_snapshot(trans, dirty->root, 225*0f7d52f4SChris Mason dirty->commit_root); 226*0f7d52f4SChris Mason BUG_ON(ret); 227*0f7d52f4SChris Mason 228*0f7d52f4SChris Mason printk("del root objectid %Lu, offset %Lu\n", dirty->snap_key.objectid, dirty->snap_key.offset); 229*0f7d52f4SChris Mason ret = btrfs_del_root(trans, tree_root, &dirty->snap_key); 230*0f7d52f4SChris Mason BUG_ON(ret); 231*0f7d52f4SChris Mason ret = btrfs_end_transaction(trans, tree_root); 232*0f7d52f4SChris Mason BUG_ON(ret); 233*0f7d52f4SChris Mason kfree(dirty); 234*0f7d52f4SChris Mason } 235*0f7d52f4SChris Mason return 0; 236*0f7d52f4SChris Mason } 237*0f7d52f4SChris Mason 23879154b1bSChris Mason int btrfs_commit_transaction(struct btrfs_trans_handle *trans, 23979154b1bSChris Mason struct btrfs_root *root) 24079154b1bSChris Mason { 24179154b1bSChris Mason int ret = 0; 24279154b1bSChris Mason struct btrfs_transaction *cur_trans; 243*0f7d52f4SChris Mason struct list_head dirty_fs_roots; 24479154b1bSChris Mason DEFINE_WAIT(wait); 24579154b1bSChris Mason 246*0f7d52f4SChris Mason INIT_LIST_HEAD(&dirty_fs_roots); 247d6e4a428SChris Mason 24879154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 24979154b1bSChris Mason if (trans->transaction->in_commit) { 2502c90e5d6SChris Mason printk("already in commit!, waiting\n"); 25179154b1bSChris Mason cur_trans = trans->transaction; 25279154b1bSChris Mason trans->transaction->use_count++; 25379154b1bSChris Mason btrfs_end_transaction(trans, root); 25479154b1bSChris Mason ret = wait_for_commit(root, cur_trans); 25579154b1bSChris Mason BUG_ON(ret); 25679154b1bSChris Mason put_transaction(cur_trans); 25779154b1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 25879154b1bSChris Mason return 0; 25979154b1bSChris Mason } 2602c90e5d6SChris Mason cur_trans = trans->transaction; 2612c90e5d6SChris Mason trans->transaction->in_commit = 1; 26279154b1bSChris Mason while (trans->transaction->num_writers > 1) { 2632c90e5d6SChris Mason WARN_ON(cur_trans != trans->transaction); 26479154b1bSChris Mason prepare_to_wait(&trans->transaction->writer_wait, &wait, 26579154b1bSChris Mason TASK_UNINTERRUPTIBLE); 26679154b1bSChris Mason if (trans->transaction->num_writers <= 1) 26779154b1bSChris Mason break; 26879154b1bSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 26979154b1bSChris Mason schedule(); 27079154b1bSChris Mason mutex_lock(&root->fs_info->trans_mutex); 2712c90e5d6SChris Mason finish_wait(&trans->transaction->writer_wait, &wait); 27279154b1bSChris Mason } 27379154b1bSChris Mason finish_wait(&trans->transaction->writer_wait, &wait); 2742c90e5d6SChris Mason WARN_ON(cur_trans != trans->transaction); 275*0f7d52f4SChris Mason add_dirty_roots(trans, &root->fs_info->fs_roots_radix, &dirty_fs_roots); 27679154b1bSChris Mason ret = btrfs_commit_tree_roots(trans, root); 27779154b1bSChris Mason BUG_ON(ret); 27878fae27eSChris Mason cur_trans = root->fs_info->running_transaction; 27978fae27eSChris Mason root->fs_info->running_transaction = NULL; 280*0f7d52f4SChris Mason btrfs_set_super_generation(root->fs_info->disk_super, 281*0f7d52f4SChris Mason root->fs_info->generation + 1); 28278fae27eSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 28379154b1bSChris Mason ret = btrfs_write_and_wait_transaction(trans, root); 28479154b1bSChris Mason BUG_ON(ret); 28579154b1bSChris Mason 28679154b1bSChris Mason write_ctree_super(trans, root); 28778fae27eSChris Mason btrfs_finish_extent_commit(trans, root); 28878fae27eSChris Mason mutex_lock(&root->fs_info->trans_mutex); 2892c90e5d6SChris Mason cur_trans->commit_done = 1; 2902c90e5d6SChris Mason wake_up(&cur_trans->commit_wait); 29179154b1bSChris Mason put_transaction(cur_trans); 29278fae27eSChris Mason put_transaction(cur_trans); 29378fae27eSChris Mason mutex_unlock(&root->fs_info->trans_mutex); 2942c90e5d6SChris Mason kmem_cache_free(btrfs_trans_handle_cachep, trans); 29579154b1bSChris Mason 296*0f7d52f4SChris Mason drop_dirty_roots(root->fs_info->tree_root, &dirty_fs_roots); 29779154b1bSChris Mason return ret; 29879154b1bSChris Mason } 29979154b1bSChris Mason 300