1c1d7c514SDavid Sterba // SPDX-License-Identifier: GPL-2.0 2a542ad1bSJan Schmidt /* 3a542ad1bSJan Schmidt * Copyright (C) 2011 STRATO. All rights reserved. 4a542ad1bSJan Schmidt */ 5a542ad1bSJan Schmidt 6f54de068SDavid Sterba #include <linux/mm.h> 7afce772eSLu Fengqi #include <linux/rbtree.h> 800142756SJeff Mahoney #include <trace/events/btrfs.h> 9a542ad1bSJan Schmidt #include "ctree.h" 10a542ad1bSJan Schmidt #include "disk-io.h" 11a542ad1bSJan Schmidt #include "backref.h" 128da6d581SJan Schmidt #include "ulist.h" 138da6d581SJan Schmidt #include "transaction.h" 148da6d581SJan Schmidt #include "delayed-ref.h" 15b916a59aSJan Schmidt #include "locking.h" 16a542ad1bSJan Schmidt 17dc046b10SJosef Bacik /* Just an arbitrary number so we can be sure this happened */ 18dc046b10SJosef Bacik #define BACKREF_FOUND_SHARED 6 19dc046b10SJosef Bacik 20976b1908SJan Schmidt struct extent_inode_elem { 21976b1908SJan Schmidt u64 inum; 22976b1908SJan Schmidt u64 offset; 23976b1908SJan Schmidt struct extent_inode_elem *next; 24976b1908SJan Schmidt }; 25976b1908SJan Schmidt 2673980becSJeff Mahoney static int check_extent_in_eb(const struct btrfs_key *key, 2773980becSJeff Mahoney const struct extent_buffer *eb, 2873980becSJeff Mahoney const struct btrfs_file_extent_item *fi, 29976b1908SJan Schmidt u64 extent_item_pos, 30c995ab3cSZygo Blaxell struct extent_inode_elem **eie, 31c995ab3cSZygo Blaxell bool ignore_offset) 32976b1908SJan Schmidt { 338ca15e05SJosef Bacik u64 offset = 0; 348ca15e05SJosef Bacik struct extent_inode_elem *e; 358ca15e05SJosef Bacik 36c995ab3cSZygo Blaxell if (!ignore_offset && 37c995ab3cSZygo Blaxell !btrfs_file_extent_compression(eb, fi) && 388ca15e05SJosef Bacik !btrfs_file_extent_encryption(eb, fi) && 398ca15e05SJosef Bacik !btrfs_file_extent_other_encoding(eb, fi)) { 40976b1908SJan Schmidt u64 data_offset; 41976b1908SJan Schmidt u64 data_len; 42976b1908SJan Schmidt 43976b1908SJan Schmidt data_offset = btrfs_file_extent_offset(eb, fi); 44976b1908SJan Schmidt data_len = btrfs_file_extent_num_bytes(eb, fi); 45976b1908SJan Schmidt 46976b1908SJan Schmidt if (extent_item_pos < data_offset || 47976b1908SJan Schmidt extent_item_pos >= data_offset + data_len) 48976b1908SJan Schmidt return 1; 498ca15e05SJosef Bacik offset = extent_item_pos - data_offset; 508ca15e05SJosef Bacik } 51976b1908SJan Schmidt 52976b1908SJan Schmidt e = kmalloc(sizeof(*e), GFP_NOFS); 53976b1908SJan Schmidt if (!e) 54976b1908SJan Schmidt return -ENOMEM; 55976b1908SJan Schmidt 56976b1908SJan Schmidt e->next = *eie; 57976b1908SJan Schmidt e->inum = key->objectid; 588ca15e05SJosef Bacik e->offset = key->offset + offset; 59976b1908SJan Schmidt *eie = e; 60976b1908SJan Schmidt 61976b1908SJan Schmidt return 0; 62976b1908SJan Schmidt } 63976b1908SJan Schmidt 64f05c4746SWang Shilong static void free_inode_elem_list(struct extent_inode_elem *eie) 65f05c4746SWang Shilong { 66f05c4746SWang Shilong struct extent_inode_elem *eie_next; 67f05c4746SWang Shilong 68f05c4746SWang Shilong for (; eie; eie = eie_next) { 69f05c4746SWang Shilong eie_next = eie->next; 70f05c4746SWang Shilong kfree(eie); 71f05c4746SWang Shilong } 72f05c4746SWang Shilong } 73f05c4746SWang Shilong 7473980becSJeff Mahoney static int find_extent_in_eb(const struct extent_buffer *eb, 7573980becSJeff Mahoney u64 wanted_disk_byte, u64 extent_item_pos, 76c995ab3cSZygo Blaxell struct extent_inode_elem **eie, 77c995ab3cSZygo Blaxell bool ignore_offset) 78976b1908SJan Schmidt { 79976b1908SJan Schmidt u64 disk_byte; 80976b1908SJan Schmidt struct btrfs_key key; 81976b1908SJan Schmidt struct btrfs_file_extent_item *fi; 82976b1908SJan Schmidt int slot; 83976b1908SJan Schmidt int nritems; 84976b1908SJan Schmidt int extent_type; 85976b1908SJan Schmidt int ret; 86976b1908SJan Schmidt 87976b1908SJan Schmidt /* 88976b1908SJan Schmidt * from the shared data ref, we only have the leaf but we need 89976b1908SJan Schmidt * the key. thus, we must look into all items and see that we 90976b1908SJan Schmidt * find one (some) with a reference to our extent item. 91976b1908SJan Schmidt */ 92976b1908SJan Schmidt nritems = btrfs_header_nritems(eb); 93976b1908SJan Schmidt for (slot = 0; slot < nritems; ++slot) { 94976b1908SJan Schmidt btrfs_item_key_to_cpu(eb, &key, slot); 95976b1908SJan Schmidt if (key.type != BTRFS_EXTENT_DATA_KEY) 96976b1908SJan Schmidt continue; 97976b1908SJan Schmidt fi = btrfs_item_ptr(eb, slot, struct btrfs_file_extent_item); 98976b1908SJan Schmidt extent_type = btrfs_file_extent_type(eb, fi); 99976b1908SJan Schmidt if (extent_type == BTRFS_FILE_EXTENT_INLINE) 100976b1908SJan Schmidt continue; 101976b1908SJan Schmidt /* don't skip BTRFS_FILE_EXTENT_PREALLOC, we can handle that */ 102976b1908SJan Schmidt disk_byte = btrfs_file_extent_disk_bytenr(eb, fi); 103976b1908SJan Schmidt if (disk_byte != wanted_disk_byte) 104976b1908SJan Schmidt continue; 105976b1908SJan Schmidt 106c995ab3cSZygo Blaxell ret = check_extent_in_eb(&key, eb, fi, extent_item_pos, eie, ignore_offset); 107976b1908SJan Schmidt if (ret < 0) 108976b1908SJan Schmidt return ret; 109976b1908SJan Schmidt } 110976b1908SJan Schmidt 111976b1908SJan Schmidt return 0; 112976b1908SJan Schmidt } 113976b1908SJan Schmidt 11486d5f994SEdmund Nadolski struct preftree { 115ecf160b4SLiu Bo struct rb_root_cached root; 1166c336b21SJeff Mahoney unsigned int count; 11786d5f994SEdmund Nadolski }; 11886d5f994SEdmund Nadolski 119ecf160b4SLiu Bo #define PREFTREE_INIT { .root = RB_ROOT_CACHED, .count = 0 } 12086d5f994SEdmund Nadolski 12186d5f994SEdmund Nadolski struct preftrees { 12286d5f994SEdmund Nadolski struct preftree direct; /* BTRFS_SHARED_[DATA|BLOCK]_REF_KEY */ 12386d5f994SEdmund Nadolski struct preftree indirect; /* BTRFS_[TREE_BLOCK|EXTENT_DATA]_REF_KEY */ 12486d5f994SEdmund Nadolski struct preftree indirect_missing_keys; 12586d5f994SEdmund Nadolski }; 12686d5f994SEdmund Nadolski 1273ec4d323SEdmund Nadolski /* 1283ec4d323SEdmund Nadolski * Checks for a shared extent during backref search. 1293ec4d323SEdmund Nadolski * 1303ec4d323SEdmund Nadolski * The share_count tracks prelim_refs (direct and indirect) having a 1313ec4d323SEdmund Nadolski * ref->count >0: 1323ec4d323SEdmund Nadolski * - incremented when a ref->count transitions to >0 1333ec4d323SEdmund Nadolski * - decremented when a ref->count transitions to <1 1343ec4d323SEdmund Nadolski */ 1353ec4d323SEdmund Nadolski struct share_check { 1363ec4d323SEdmund Nadolski u64 root_objectid; 1373ec4d323SEdmund Nadolski u64 inum; 1383ec4d323SEdmund Nadolski int share_count; 1393ec4d323SEdmund Nadolski }; 1403ec4d323SEdmund Nadolski 1413ec4d323SEdmund Nadolski static inline int extent_is_shared(struct share_check *sc) 1423ec4d323SEdmund Nadolski { 1433ec4d323SEdmund Nadolski return (sc && sc->share_count > 1) ? BACKREF_FOUND_SHARED : 0; 1443ec4d323SEdmund Nadolski } 1453ec4d323SEdmund Nadolski 146b9e9a6cbSWang Shilong static struct kmem_cache *btrfs_prelim_ref_cache; 147b9e9a6cbSWang Shilong 148b9e9a6cbSWang Shilong int __init btrfs_prelim_ref_init(void) 149b9e9a6cbSWang Shilong { 150b9e9a6cbSWang Shilong btrfs_prelim_ref_cache = kmem_cache_create("btrfs_prelim_ref", 151e0c476b1SJeff Mahoney sizeof(struct prelim_ref), 152b9e9a6cbSWang Shilong 0, 153fba4b697SNikolay Borisov SLAB_MEM_SPREAD, 154b9e9a6cbSWang Shilong NULL); 155b9e9a6cbSWang Shilong if (!btrfs_prelim_ref_cache) 156b9e9a6cbSWang Shilong return -ENOMEM; 157b9e9a6cbSWang Shilong return 0; 158b9e9a6cbSWang Shilong } 159b9e9a6cbSWang Shilong 160e67c718bSDavid Sterba void __cold btrfs_prelim_ref_exit(void) 161b9e9a6cbSWang Shilong { 162b9e9a6cbSWang Shilong kmem_cache_destroy(btrfs_prelim_ref_cache); 163b9e9a6cbSWang Shilong } 164b9e9a6cbSWang Shilong 16586d5f994SEdmund Nadolski static void free_pref(struct prelim_ref *ref) 16686d5f994SEdmund Nadolski { 16786d5f994SEdmund Nadolski kmem_cache_free(btrfs_prelim_ref_cache, ref); 16886d5f994SEdmund Nadolski } 16986d5f994SEdmund Nadolski 17086d5f994SEdmund Nadolski /* 17186d5f994SEdmund Nadolski * Return 0 when both refs are for the same block (and can be merged). 17286d5f994SEdmund Nadolski * A -1 return indicates ref1 is a 'lower' block than ref2, while 1 17386d5f994SEdmund Nadolski * indicates a 'higher' block. 17486d5f994SEdmund Nadolski */ 17586d5f994SEdmund Nadolski static int prelim_ref_compare(struct prelim_ref *ref1, 17686d5f994SEdmund Nadolski struct prelim_ref *ref2) 17786d5f994SEdmund Nadolski { 17886d5f994SEdmund Nadolski if (ref1->level < ref2->level) 17986d5f994SEdmund Nadolski return -1; 18086d5f994SEdmund Nadolski if (ref1->level > ref2->level) 18186d5f994SEdmund Nadolski return 1; 18286d5f994SEdmund Nadolski if (ref1->root_id < ref2->root_id) 18386d5f994SEdmund Nadolski return -1; 18486d5f994SEdmund Nadolski if (ref1->root_id > ref2->root_id) 18586d5f994SEdmund Nadolski return 1; 18686d5f994SEdmund Nadolski if (ref1->key_for_search.type < ref2->key_for_search.type) 18786d5f994SEdmund Nadolski return -1; 18886d5f994SEdmund Nadolski if (ref1->key_for_search.type > ref2->key_for_search.type) 18986d5f994SEdmund Nadolski return 1; 19086d5f994SEdmund Nadolski if (ref1->key_for_search.objectid < ref2->key_for_search.objectid) 19186d5f994SEdmund Nadolski return -1; 19286d5f994SEdmund Nadolski if (ref1->key_for_search.objectid > ref2->key_for_search.objectid) 19386d5f994SEdmund Nadolski return 1; 19486d5f994SEdmund Nadolski if (ref1->key_for_search.offset < ref2->key_for_search.offset) 19586d5f994SEdmund Nadolski return -1; 19686d5f994SEdmund Nadolski if (ref1->key_for_search.offset > ref2->key_for_search.offset) 19786d5f994SEdmund Nadolski return 1; 19886d5f994SEdmund Nadolski if (ref1->parent < ref2->parent) 19986d5f994SEdmund Nadolski return -1; 20086d5f994SEdmund Nadolski if (ref1->parent > ref2->parent) 20186d5f994SEdmund Nadolski return 1; 20286d5f994SEdmund Nadolski 20386d5f994SEdmund Nadolski return 0; 20486d5f994SEdmund Nadolski } 20586d5f994SEdmund Nadolski 206ccc8dc75SColin Ian King static void update_share_count(struct share_check *sc, int oldcount, 207ccc8dc75SColin Ian King int newcount) 2083ec4d323SEdmund Nadolski { 2093ec4d323SEdmund Nadolski if ((!sc) || (oldcount == 0 && newcount < 1)) 2103ec4d323SEdmund Nadolski return; 2113ec4d323SEdmund Nadolski 2123ec4d323SEdmund Nadolski if (oldcount > 0 && newcount < 1) 2133ec4d323SEdmund Nadolski sc->share_count--; 2143ec4d323SEdmund Nadolski else if (oldcount < 1 && newcount > 0) 2153ec4d323SEdmund Nadolski sc->share_count++; 2163ec4d323SEdmund Nadolski } 2173ec4d323SEdmund Nadolski 21886d5f994SEdmund Nadolski /* 21986d5f994SEdmund Nadolski * Add @newref to the @root rbtree, merging identical refs. 22086d5f994SEdmund Nadolski * 2213ec4d323SEdmund Nadolski * Callers should assume that newref has been freed after calling. 22286d5f994SEdmund Nadolski */ 22300142756SJeff Mahoney static void prelim_ref_insert(const struct btrfs_fs_info *fs_info, 22400142756SJeff Mahoney struct preftree *preftree, 2253ec4d323SEdmund Nadolski struct prelim_ref *newref, 2263ec4d323SEdmund Nadolski struct share_check *sc) 22786d5f994SEdmund Nadolski { 228ecf160b4SLiu Bo struct rb_root_cached *root; 22986d5f994SEdmund Nadolski struct rb_node **p; 23086d5f994SEdmund Nadolski struct rb_node *parent = NULL; 23186d5f994SEdmund Nadolski struct prelim_ref *ref; 23286d5f994SEdmund Nadolski int result; 233ecf160b4SLiu Bo bool leftmost = true; 23486d5f994SEdmund Nadolski 23586d5f994SEdmund Nadolski root = &preftree->root; 236ecf160b4SLiu Bo p = &root->rb_root.rb_node; 23786d5f994SEdmund Nadolski 23886d5f994SEdmund Nadolski while (*p) { 23986d5f994SEdmund Nadolski parent = *p; 24086d5f994SEdmund Nadolski ref = rb_entry(parent, struct prelim_ref, rbnode); 24186d5f994SEdmund Nadolski result = prelim_ref_compare(ref, newref); 24286d5f994SEdmund Nadolski if (result < 0) { 24386d5f994SEdmund Nadolski p = &(*p)->rb_left; 24486d5f994SEdmund Nadolski } else if (result > 0) { 24586d5f994SEdmund Nadolski p = &(*p)->rb_right; 246ecf160b4SLiu Bo leftmost = false; 24786d5f994SEdmund Nadolski } else { 24886d5f994SEdmund Nadolski /* Identical refs, merge them and free @newref */ 24986d5f994SEdmund Nadolski struct extent_inode_elem *eie = ref->inode_list; 25086d5f994SEdmund Nadolski 25186d5f994SEdmund Nadolski while (eie && eie->next) 25286d5f994SEdmund Nadolski eie = eie->next; 25386d5f994SEdmund Nadolski 25486d5f994SEdmund Nadolski if (!eie) 25586d5f994SEdmund Nadolski ref->inode_list = newref->inode_list; 25686d5f994SEdmund Nadolski else 25786d5f994SEdmund Nadolski eie->next = newref->inode_list; 25800142756SJeff Mahoney trace_btrfs_prelim_ref_merge(fs_info, ref, newref, 25900142756SJeff Mahoney preftree->count); 2603ec4d323SEdmund Nadolski /* 2613ec4d323SEdmund Nadolski * A delayed ref can have newref->count < 0. 2623ec4d323SEdmund Nadolski * The ref->count is updated to follow any 2633ec4d323SEdmund Nadolski * BTRFS_[ADD|DROP]_DELAYED_REF actions. 2643ec4d323SEdmund Nadolski */ 2653ec4d323SEdmund Nadolski update_share_count(sc, ref->count, 2663ec4d323SEdmund Nadolski ref->count + newref->count); 26786d5f994SEdmund Nadolski ref->count += newref->count; 26886d5f994SEdmund Nadolski free_pref(newref); 26986d5f994SEdmund Nadolski return; 27086d5f994SEdmund Nadolski } 27186d5f994SEdmund Nadolski } 27286d5f994SEdmund Nadolski 2733ec4d323SEdmund Nadolski update_share_count(sc, 0, newref->count); 2746c336b21SJeff Mahoney preftree->count++; 27500142756SJeff Mahoney trace_btrfs_prelim_ref_insert(fs_info, newref, NULL, preftree->count); 27686d5f994SEdmund Nadolski rb_link_node(&newref->rbnode, parent, p); 277ecf160b4SLiu Bo rb_insert_color_cached(&newref->rbnode, root, leftmost); 27886d5f994SEdmund Nadolski } 27986d5f994SEdmund Nadolski 28086d5f994SEdmund Nadolski /* 28186d5f994SEdmund Nadolski * Release the entire tree. We don't care about internal consistency so 28286d5f994SEdmund Nadolski * just free everything and then reset the tree root. 28386d5f994SEdmund Nadolski */ 28486d5f994SEdmund Nadolski static void prelim_release(struct preftree *preftree) 28586d5f994SEdmund Nadolski { 28686d5f994SEdmund Nadolski struct prelim_ref *ref, *next_ref; 28786d5f994SEdmund Nadolski 288ecf160b4SLiu Bo rbtree_postorder_for_each_entry_safe(ref, next_ref, 289ecf160b4SLiu Bo &preftree->root.rb_root, rbnode) 29086d5f994SEdmund Nadolski free_pref(ref); 29186d5f994SEdmund Nadolski 292ecf160b4SLiu Bo preftree->root = RB_ROOT_CACHED; 2936c336b21SJeff Mahoney preftree->count = 0; 29486d5f994SEdmund Nadolski } 29586d5f994SEdmund Nadolski 296d5c88b73SJan Schmidt /* 297d5c88b73SJan Schmidt * the rules for all callers of this function are: 298d5c88b73SJan Schmidt * - obtaining the parent is the goal 299d5c88b73SJan Schmidt * - if you add a key, you must know that it is a correct key 300d5c88b73SJan Schmidt * - if you cannot add the parent or a correct key, then we will look into the 301d5c88b73SJan Schmidt * block later to set a correct key 302d5c88b73SJan Schmidt * 303d5c88b73SJan Schmidt * delayed refs 304d5c88b73SJan Schmidt * ============ 305d5c88b73SJan Schmidt * backref type | shared | indirect | shared | indirect 306d5c88b73SJan Schmidt * information | tree | tree | data | data 307d5c88b73SJan Schmidt * --------------------+--------+----------+--------+---------- 308d5c88b73SJan Schmidt * parent logical | y | - | - | - 309d5c88b73SJan Schmidt * key to resolve | - | y | y | y 310d5c88b73SJan Schmidt * tree block logical | - | - | - | - 311d5c88b73SJan Schmidt * root for resolving | y | y | y | y 312d5c88b73SJan Schmidt * 313d5c88b73SJan Schmidt * - column 1: we've the parent -> done 314d5c88b73SJan Schmidt * - column 2, 3, 4: we use the key to find the parent 315d5c88b73SJan Schmidt * 316d5c88b73SJan Schmidt * on disk refs (inline or keyed) 317d5c88b73SJan Schmidt * ============================== 318d5c88b73SJan Schmidt * backref type | shared | indirect | shared | indirect 319d5c88b73SJan Schmidt * information | tree | tree | data | data 320d5c88b73SJan Schmidt * --------------------+--------+----------+--------+---------- 321d5c88b73SJan Schmidt * parent logical | y | - | y | - 322d5c88b73SJan Schmidt * key to resolve | - | - | - | y 323d5c88b73SJan Schmidt * tree block logical | y | y | y | y 324d5c88b73SJan Schmidt * root for resolving | - | y | y | y 325d5c88b73SJan Schmidt * 326d5c88b73SJan Schmidt * - column 1, 3: we've the parent -> done 327d5c88b73SJan Schmidt * - column 2: we take the first key from the block to find the parent 328e0c476b1SJeff Mahoney * (see add_missing_keys) 329d5c88b73SJan Schmidt * - column 4: we use the key to find the parent 330d5c88b73SJan Schmidt * 331d5c88b73SJan Schmidt * additional information that's available but not required to find the parent 332d5c88b73SJan Schmidt * block might help in merging entries to gain some speed. 333d5c88b73SJan Schmidt */ 33400142756SJeff Mahoney static int add_prelim_ref(const struct btrfs_fs_info *fs_info, 33500142756SJeff Mahoney struct preftree *preftree, u64 root_id, 336e0c476b1SJeff Mahoney const struct btrfs_key *key, int level, u64 parent, 3373ec4d323SEdmund Nadolski u64 wanted_disk_byte, int count, 3383ec4d323SEdmund Nadolski struct share_check *sc, gfp_t gfp_mask) 3398da6d581SJan Schmidt { 340e0c476b1SJeff Mahoney struct prelim_ref *ref; 3418da6d581SJan Schmidt 34248ec4736SLiu Bo if (root_id == BTRFS_DATA_RELOC_TREE_OBJECTID) 34348ec4736SLiu Bo return 0; 34448ec4736SLiu Bo 345b9e9a6cbSWang Shilong ref = kmem_cache_alloc(btrfs_prelim_ref_cache, gfp_mask); 3468da6d581SJan Schmidt if (!ref) 3478da6d581SJan Schmidt return -ENOMEM; 3488da6d581SJan Schmidt 3498da6d581SJan Schmidt ref->root_id = root_id; 3507ac8b88eSethanwu if (key) 351d5c88b73SJan Schmidt ref->key_for_search = *key; 3527ac8b88eSethanwu else 353d5c88b73SJan Schmidt memset(&ref->key_for_search, 0, sizeof(ref->key_for_search)); 3548da6d581SJan Schmidt 3553301958bSJan Schmidt ref->inode_list = NULL; 3568da6d581SJan Schmidt ref->level = level; 3578da6d581SJan Schmidt ref->count = count; 3588da6d581SJan Schmidt ref->parent = parent; 3598da6d581SJan Schmidt ref->wanted_disk_byte = wanted_disk_byte; 3603ec4d323SEdmund Nadolski prelim_ref_insert(fs_info, preftree, ref, sc); 3613ec4d323SEdmund Nadolski return extent_is_shared(sc); 3628da6d581SJan Schmidt } 3638da6d581SJan Schmidt 36486d5f994SEdmund Nadolski /* direct refs use root == 0, key == NULL */ 36500142756SJeff Mahoney static int add_direct_ref(const struct btrfs_fs_info *fs_info, 36600142756SJeff Mahoney struct preftrees *preftrees, int level, u64 parent, 3673ec4d323SEdmund Nadolski u64 wanted_disk_byte, int count, 3683ec4d323SEdmund Nadolski struct share_check *sc, gfp_t gfp_mask) 36986d5f994SEdmund Nadolski { 37000142756SJeff Mahoney return add_prelim_ref(fs_info, &preftrees->direct, 0, NULL, level, 3713ec4d323SEdmund Nadolski parent, wanted_disk_byte, count, sc, gfp_mask); 37286d5f994SEdmund Nadolski } 37386d5f994SEdmund Nadolski 37486d5f994SEdmund Nadolski /* indirect refs use parent == 0 */ 37500142756SJeff Mahoney static int add_indirect_ref(const struct btrfs_fs_info *fs_info, 37600142756SJeff Mahoney struct preftrees *preftrees, u64 root_id, 37786d5f994SEdmund Nadolski const struct btrfs_key *key, int level, 3783ec4d323SEdmund Nadolski u64 wanted_disk_byte, int count, 3793ec4d323SEdmund Nadolski struct share_check *sc, gfp_t gfp_mask) 38086d5f994SEdmund Nadolski { 38186d5f994SEdmund Nadolski struct preftree *tree = &preftrees->indirect; 38286d5f994SEdmund Nadolski 38386d5f994SEdmund Nadolski if (!key) 38486d5f994SEdmund Nadolski tree = &preftrees->indirect_missing_keys; 38500142756SJeff Mahoney return add_prelim_ref(fs_info, tree, root_id, key, level, 0, 3863ec4d323SEdmund Nadolski wanted_disk_byte, count, sc, gfp_mask); 38786d5f994SEdmund Nadolski } 38886d5f994SEdmund Nadolski 389ed58f2e6Sethanwu static int is_shared_data_backref(struct preftrees *preftrees, u64 bytenr) 390ed58f2e6Sethanwu { 391ed58f2e6Sethanwu struct rb_node **p = &preftrees->direct.root.rb_root.rb_node; 392ed58f2e6Sethanwu struct rb_node *parent = NULL; 393ed58f2e6Sethanwu struct prelim_ref *ref = NULL; 3949c6c723fSArnd Bergmann struct prelim_ref target = {}; 395ed58f2e6Sethanwu int result; 396ed58f2e6Sethanwu 397ed58f2e6Sethanwu target.parent = bytenr; 398ed58f2e6Sethanwu 399ed58f2e6Sethanwu while (*p) { 400ed58f2e6Sethanwu parent = *p; 401ed58f2e6Sethanwu ref = rb_entry(parent, struct prelim_ref, rbnode); 402ed58f2e6Sethanwu result = prelim_ref_compare(ref, &target); 403ed58f2e6Sethanwu 404ed58f2e6Sethanwu if (result < 0) 405ed58f2e6Sethanwu p = &(*p)->rb_left; 406ed58f2e6Sethanwu else if (result > 0) 407ed58f2e6Sethanwu p = &(*p)->rb_right; 408ed58f2e6Sethanwu else 409ed58f2e6Sethanwu return 1; 410ed58f2e6Sethanwu } 411ed58f2e6Sethanwu return 0; 412ed58f2e6Sethanwu } 413ed58f2e6Sethanwu 4148da6d581SJan Schmidt static int add_all_parents(struct btrfs_root *root, struct btrfs_path *path, 415ed58f2e6Sethanwu struct ulist *parents, 416ed58f2e6Sethanwu struct preftrees *preftrees, struct prelim_ref *ref, 41744853868SJosef Bacik int level, u64 time_seq, const u64 *extent_item_pos, 418b25b0b87Sethanwu bool ignore_offset) 4198da6d581SJan Schmidt { 42069bca40dSAlexander Block int ret = 0; 42169bca40dSAlexander Block int slot; 42269bca40dSAlexander Block struct extent_buffer *eb; 42369bca40dSAlexander Block struct btrfs_key key; 4247ef81ac8SJosef Bacik struct btrfs_key *key_for_search = &ref->key_for_search; 4258da6d581SJan Schmidt struct btrfs_file_extent_item *fi; 426ed8c4913SJosef Bacik struct extent_inode_elem *eie = NULL, *old = NULL; 4278da6d581SJan Schmidt u64 disk_byte; 4287ef81ac8SJosef Bacik u64 wanted_disk_byte = ref->wanted_disk_byte; 4297ef81ac8SJosef Bacik u64 count = 0; 4307ac8b88eSethanwu u64 data_offset; 4318da6d581SJan Schmidt 43269bca40dSAlexander Block if (level != 0) { 43369bca40dSAlexander Block eb = path->nodes[level]; 43469bca40dSAlexander Block ret = ulist_add(parents, eb->start, 0, GFP_NOFS); 4353301958bSJan Schmidt if (ret < 0) 4363301958bSJan Schmidt return ret; 4378da6d581SJan Schmidt return 0; 43869bca40dSAlexander Block } 4398da6d581SJan Schmidt 4408da6d581SJan Schmidt /* 441ed58f2e6Sethanwu * 1. We normally enter this function with the path already pointing to 44269bca40dSAlexander Block * the first item to check. But sometimes, we may enter it with 443ed58f2e6Sethanwu * slot == nritems. 444ed58f2e6Sethanwu * 2. We are searching for normal backref but bytenr of this leaf 445ed58f2e6Sethanwu * matches shared data backref 446cfc0eed0Sethanwu * 3. The leaf owner is not equal to the root we are searching 447cfc0eed0Sethanwu * 448ed58f2e6Sethanwu * For these cases, go to the next leaf before we continue. 4498da6d581SJan Schmidt */ 450ed58f2e6Sethanwu eb = path->nodes[0]; 451ed58f2e6Sethanwu if (path->slots[0] >= btrfs_header_nritems(eb) || 452cfc0eed0Sethanwu is_shared_data_backref(preftrees, eb->start) || 453cfc0eed0Sethanwu ref->root_id != btrfs_header_owner(eb)) { 454de47c9d3SEdmund Nadolski if (time_seq == SEQ_LAST) 45521633fc6SQu Wenruo ret = btrfs_next_leaf(root, path); 45621633fc6SQu Wenruo else 4573d7806ecSJan Schmidt ret = btrfs_next_old_leaf(root, path, time_seq); 45821633fc6SQu Wenruo } 4598da6d581SJan Schmidt 460b25b0b87Sethanwu while (!ret && count < ref->count) { 4618da6d581SJan Schmidt eb = path->nodes[0]; 46269bca40dSAlexander Block slot = path->slots[0]; 46369bca40dSAlexander Block 46469bca40dSAlexander Block btrfs_item_key_to_cpu(eb, &key, slot); 46569bca40dSAlexander Block 46669bca40dSAlexander Block if (key.objectid != key_for_search->objectid || 46769bca40dSAlexander Block key.type != BTRFS_EXTENT_DATA_KEY) 46869bca40dSAlexander Block break; 46969bca40dSAlexander Block 470ed58f2e6Sethanwu /* 471ed58f2e6Sethanwu * We are searching for normal backref but bytenr of this leaf 472cfc0eed0Sethanwu * matches shared data backref, OR 473cfc0eed0Sethanwu * the leaf owner is not equal to the root we are searching for 474ed58f2e6Sethanwu */ 475cfc0eed0Sethanwu if (slot == 0 && 476cfc0eed0Sethanwu (is_shared_data_backref(preftrees, eb->start) || 477cfc0eed0Sethanwu ref->root_id != btrfs_header_owner(eb))) { 478ed58f2e6Sethanwu if (time_seq == SEQ_LAST) 479ed58f2e6Sethanwu ret = btrfs_next_leaf(root, path); 480ed58f2e6Sethanwu else 481ed58f2e6Sethanwu ret = btrfs_next_old_leaf(root, path, time_seq); 482ed58f2e6Sethanwu continue; 483ed58f2e6Sethanwu } 48469bca40dSAlexander Block fi = btrfs_item_ptr(eb, slot, struct btrfs_file_extent_item); 4858da6d581SJan Schmidt disk_byte = btrfs_file_extent_disk_bytenr(eb, fi); 4867ac8b88eSethanwu data_offset = btrfs_file_extent_offset(eb, fi); 48769bca40dSAlexander Block 48869bca40dSAlexander Block if (disk_byte == wanted_disk_byte) { 48969bca40dSAlexander Block eie = NULL; 490ed8c4913SJosef Bacik old = NULL; 4917ac8b88eSethanwu if (ref->key_for_search.offset == key.offset - data_offset) 4927ef81ac8SJosef Bacik count++; 4937ac8b88eSethanwu else 4947ac8b88eSethanwu goto next; 49569bca40dSAlexander Block if (extent_item_pos) { 49669bca40dSAlexander Block ret = check_extent_in_eb(&key, eb, fi, 49769bca40dSAlexander Block *extent_item_pos, 498c995ab3cSZygo Blaxell &eie, ignore_offset); 49969bca40dSAlexander Block if (ret < 0) 50069bca40dSAlexander Block break; 5018da6d581SJan Schmidt } 502ed8c4913SJosef Bacik if (ret > 0) 503ed8c4913SJosef Bacik goto next; 5044eb1f66dSTakashi Iwai ret = ulist_add_merge_ptr(parents, eb->start, 5054eb1f66dSTakashi Iwai eie, (void **)&old, GFP_NOFS); 50669bca40dSAlexander Block if (ret < 0) 50769bca40dSAlexander Block break; 508ed8c4913SJosef Bacik if (!ret && extent_item_pos) { 509ed8c4913SJosef Bacik while (old->next) 510ed8c4913SJosef Bacik old = old->next; 511ed8c4913SJosef Bacik old->next = eie; 51269bca40dSAlexander Block } 513f05c4746SWang Shilong eie = NULL; 51469bca40dSAlexander Block } 515ed8c4913SJosef Bacik next: 516de47c9d3SEdmund Nadolski if (time_seq == SEQ_LAST) 51721633fc6SQu Wenruo ret = btrfs_next_item(root, path); 51821633fc6SQu Wenruo else 51969bca40dSAlexander Block ret = btrfs_next_old_item(root, path, time_seq); 5208da6d581SJan Schmidt } 5218da6d581SJan Schmidt 52269bca40dSAlexander Block if (ret > 0) 52369bca40dSAlexander Block ret = 0; 524f05c4746SWang Shilong else if (ret < 0) 525f05c4746SWang Shilong free_inode_elem_list(eie); 52669bca40dSAlexander Block return ret; 5278da6d581SJan Schmidt } 5288da6d581SJan Schmidt 5298da6d581SJan Schmidt /* 5308da6d581SJan Schmidt * resolve an indirect backref in the form (root_id, key, level) 5318da6d581SJan Schmidt * to a logical address 5328da6d581SJan Schmidt */ 533e0c476b1SJeff Mahoney static int resolve_indirect_ref(struct btrfs_fs_info *fs_info, 534da61d31aSJosef Bacik struct btrfs_path *path, u64 time_seq, 535ed58f2e6Sethanwu struct preftrees *preftrees, 536e0c476b1SJeff Mahoney struct prelim_ref *ref, struct ulist *parents, 537b25b0b87Sethanwu const u64 *extent_item_pos, bool ignore_offset) 5388da6d581SJan Schmidt { 5398da6d581SJan Schmidt struct btrfs_root *root; 5408da6d581SJan Schmidt struct btrfs_key root_key; 5418da6d581SJan Schmidt struct extent_buffer *eb; 5428da6d581SJan Schmidt int ret = 0; 5438da6d581SJan Schmidt int root_level; 5448da6d581SJan Schmidt int level = ref->level; 5457ac8b88eSethanwu struct btrfs_key search_key = ref->key_for_search; 5468da6d581SJan Schmidt 5478da6d581SJan Schmidt root_key.objectid = ref->root_id; 5488da6d581SJan Schmidt root_key.type = BTRFS_ROOT_ITEM_KEY; 5498da6d581SJan Schmidt root_key.offset = (u64)-1; 550538f72cdSWang Shilong 5512d9e9776SJosef Bacik root = btrfs_get_fs_root(fs_info, &root_key, false); 5528da6d581SJan Schmidt if (IS_ERR(root)) { 5538da6d581SJan Schmidt ret = PTR_ERR(root); 5549326f76fSJosef Bacik goto out_free; 5559326f76fSJosef Bacik } 5569326f76fSJosef Bacik 55739dba873SJosef Bacik if (!path->search_commit_root && 55839dba873SJosef Bacik test_bit(BTRFS_ROOT_DELETING, &root->state)) { 55939dba873SJosef Bacik ret = -ENOENT; 56039dba873SJosef Bacik goto out; 56139dba873SJosef Bacik } 56239dba873SJosef Bacik 563f5ee5c9aSJeff Mahoney if (btrfs_is_testing(fs_info)) { 564d9ee522bSJosef Bacik ret = -ENOENT; 565d9ee522bSJosef Bacik goto out; 566d9ee522bSJosef Bacik } 567d9ee522bSJosef Bacik 5689e351cc8SJosef Bacik if (path->search_commit_root) 5699e351cc8SJosef Bacik root_level = btrfs_header_level(root->commit_root); 570de47c9d3SEdmund Nadolski else if (time_seq == SEQ_LAST) 57121633fc6SQu Wenruo root_level = btrfs_header_level(root->node); 5729e351cc8SJosef Bacik else 5735b6602e7SJan Schmidt root_level = btrfs_old_root_level(root, time_seq); 5748da6d581SJan Schmidt 575c75e8394SJosef Bacik if (root_level + 1 == level) 5768da6d581SJan Schmidt goto out; 5778da6d581SJan Schmidt 5787ac8b88eSethanwu /* 5797ac8b88eSethanwu * We can often find data backrefs with an offset that is too large 5807ac8b88eSethanwu * (>= LLONG_MAX, maximum allowed file offset) due to underflows when 5817ac8b88eSethanwu * subtracting a file's offset with the data offset of its 5827ac8b88eSethanwu * corresponding extent data item. This can happen for example in the 5837ac8b88eSethanwu * clone ioctl. 5847ac8b88eSethanwu * 5857ac8b88eSethanwu * So if we detect such case we set the search key's offset to zero to 5867ac8b88eSethanwu * make sure we will find the matching file extent item at 5877ac8b88eSethanwu * add_all_parents(), otherwise we will miss it because the offset 5887ac8b88eSethanwu * taken form the backref is much larger then the offset of the file 5897ac8b88eSethanwu * extent item. This can make us scan a very large number of file 5907ac8b88eSethanwu * extent items, but at least it will not make us miss any. 5917ac8b88eSethanwu * 5927ac8b88eSethanwu * This is an ugly workaround for a behaviour that should have never 5937ac8b88eSethanwu * existed, but it does and a fix for the clone ioctl would touch a lot 5947ac8b88eSethanwu * of places, cause backwards incompatibility and would not fix the 5957ac8b88eSethanwu * problem for extents cloned with older kernels. 5967ac8b88eSethanwu */ 5977ac8b88eSethanwu if (search_key.type == BTRFS_EXTENT_DATA_KEY && 5987ac8b88eSethanwu search_key.offset >= LLONG_MAX) 5997ac8b88eSethanwu search_key.offset = 0; 6008da6d581SJan Schmidt path->lowest_level = level; 601de47c9d3SEdmund Nadolski if (time_seq == SEQ_LAST) 6027ac8b88eSethanwu ret = btrfs_search_slot(NULL, root, &search_key, path, 0, 0); 60321633fc6SQu Wenruo else 6047ac8b88eSethanwu ret = btrfs_search_old_slot(root, &search_key, path, time_seq); 605538f72cdSWang Shilong 606ab8d0fc4SJeff Mahoney btrfs_debug(fs_info, 607ab8d0fc4SJeff Mahoney "search slot in root %llu (level %d, ref count %d) returned %d for key (%llu %u %llu)", 608c1c9ff7cSGeert Uytterhoeven ref->root_id, level, ref->count, ret, 609c1c9ff7cSGeert Uytterhoeven ref->key_for_search.objectid, ref->key_for_search.type, 610c1c9ff7cSGeert Uytterhoeven ref->key_for_search.offset); 6118da6d581SJan Schmidt if (ret < 0) 6128da6d581SJan Schmidt goto out; 6138da6d581SJan Schmidt 6148da6d581SJan Schmidt eb = path->nodes[level]; 6159345457fSJan Schmidt while (!eb) { 616fae7f21cSDulshani Gunawardhana if (WARN_ON(!level)) { 6178da6d581SJan Schmidt ret = 1; 6188da6d581SJan Schmidt goto out; 6198da6d581SJan Schmidt } 6209345457fSJan Schmidt level--; 6219345457fSJan Schmidt eb = path->nodes[level]; 6229345457fSJan Schmidt } 6238da6d581SJan Schmidt 624ed58f2e6Sethanwu ret = add_all_parents(root, path, parents, preftrees, ref, level, 625b25b0b87Sethanwu time_seq, extent_item_pos, ignore_offset); 6268da6d581SJan Schmidt out: 62700246528SJosef Bacik btrfs_put_root(root); 6289326f76fSJosef Bacik out_free: 629da61d31aSJosef Bacik path->lowest_level = 0; 630da61d31aSJosef Bacik btrfs_release_path(path); 6318da6d581SJan Schmidt return ret; 6328da6d581SJan Schmidt } 6338da6d581SJan Schmidt 6344dae077aSJeff Mahoney static struct extent_inode_elem * 6354dae077aSJeff Mahoney unode_aux_to_inode_list(struct ulist_node *node) 6364dae077aSJeff Mahoney { 6374dae077aSJeff Mahoney if (!node) 6384dae077aSJeff Mahoney return NULL; 6394dae077aSJeff Mahoney return (struct extent_inode_elem *)(uintptr_t)node->aux; 6404dae077aSJeff Mahoney } 6414dae077aSJeff Mahoney 6428da6d581SJan Schmidt /* 64352042d8eSAndrea Gelmini * We maintain three separate rbtrees: one for direct refs, one for 64486d5f994SEdmund Nadolski * indirect refs which have a key, and one for indirect refs which do not 64586d5f994SEdmund Nadolski * have a key. Each tree does merge on insertion. 64686d5f994SEdmund Nadolski * 64786d5f994SEdmund Nadolski * Once all of the references are located, we iterate over the tree of 64886d5f994SEdmund Nadolski * indirect refs with missing keys. An appropriate key is located and 64986d5f994SEdmund Nadolski * the ref is moved onto the tree for indirect refs. After all missing 65086d5f994SEdmund Nadolski * keys are thus located, we iterate over the indirect ref tree, resolve 65186d5f994SEdmund Nadolski * each reference, and then insert the resolved reference onto the 65286d5f994SEdmund Nadolski * direct tree (merging there too). 65386d5f994SEdmund Nadolski * 65486d5f994SEdmund Nadolski * New backrefs (i.e., for parent nodes) are added to the appropriate 65586d5f994SEdmund Nadolski * rbtree as they are encountered. The new backrefs are subsequently 65686d5f994SEdmund Nadolski * resolved as above. 6578da6d581SJan Schmidt */ 658e0c476b1SJeff Mahoney static int resolve_indirect_refs(struct btrfs_fs_info *fs_info, 659da61d31aSJosef Bacik struct btrfs_path *path, u64 time_seq, 66086d5f994SEdmund Nadolski struct preftrees *preftrees, 661b25b0b87Sethanwu const u64 *extent_item_pos, 662c995ab3cSZygo Blaxell struct share_check *sc, bool ignore_offset) 6638da6d581SJan Schmidt { 6648da6d581SJan Schmidt int err; 6658da6d581SJan Schmidt int ret = 0; 6668da6d581SJan Schmidt struct ulist *parents; 6678da6d581SJan Schmidt struct ulist_node *node; 668cd1b413cSJan Schmidt struct ulist_iterator uiter; 66986d5f994SEdmund Nadolski struct rb_node *rnode; 6708da6d581SJan Schmidt 6718da6d581SJan Schmidt parents = ulist_alloc(GFP_NOFS); 6728da6d581SJan Schmidt if (!parents) 6738da6d581SJan Schmidt return -ENOMEM; 6748da6d581SJan Schmidt 6758da6d581SJan Schmidt /* 67686d5f994SEdmund Nadolski * We could trade memory usage for performance here by iterating 67786d5f994SEdmund Nadolski * the tree, allocating new refs for each insertion, and then 67886d5f994SEdmund Nadolski * freeing the entire indirect tree when we're done. In some test 67986d5f994SEdmund Nadolski * cases, the tree can grow quite large (~200k objects). 6808da6d581SJan Schmidt */ 681ecf160b4SLiu Bo while ((rnode = rb_first_cached(&preftrees->indirect.root))) { 68286d5f994SEdmund Nadolski struct prelim_ref *ref; 68386d5f994SEdmund Nadolski 68486d5f994SEdmund Nadolski ref = rb_entry(rnode, struct prelim_ref, rbnode); 68586d5f994SEdmund Nadolski if (WARN(ref->parent, 68686d5f994SEdmund Nadolski "BUG: direct ref found in indirect tree")) { 68786d5f994SEdmund Nadolski ret = -EINVAL; 68886d5f994SEdmund Nadolski goto out; 68986d5f994SEdmund Nadolski } 69086d5f994SEdmund Nadolski 691ecf160b4SLiu Bo rb_erase_cached(&ref->rbnode, &preftrees->indirect.root); 6926c336b21SJeff Mahoney preftrees->indirect.count--; 69386d5f994SEdmund Nadolski 69486d5f994SEdmund Nadolski if (ref->count == 0) { 69586d5f994SEdmund Nadolski free_pref(ref); 6968da6d581SJan Schmidt continue; 69786d5f994SEdmund Nadolski } 69886d5f994SEdmund Nadolski 6993ec4d323SEdmund Nadolski if (sc && sc->root_objectid && 7003ec4d323SEdmund Nadolski ref->root_id != sc->root_objectid) { 70186d5f994SEdmund Nadolski free_pref(ref); 702dc046b10SJosef Bacik ret = BACKREF_FOUND_SHARED; 703dc046b10SJosef Bacik goto out; 704dc046b10SJosef Bacik } 705ed58f2e6Sethanwu err = resolve_indirect_ref(fs_info, path, time_seq, preftrees, 706ed58f2e6Sethanwu ref, parents, extent_item_pos, 707b25b0b87Sethanwu ignore_offset); 70895def2edSWang Shilong /* 70995def2edSWang Shilong * we can only tolerate ENOENT,otherwise,we should catch error 71095def2edSWang Shilong * and return directly. 71195def2edSWang Shilong */ 71295def2edSWang Shilong if (err == -ENOENT) { 7133ec4d323SEdmund Nadolski prelim_ref_insert(fs_info, &preftrees->direct, ref, 7143ec4d323SEdmund Nadolski NULL); 7158da6d581SJan Schmidt continue; 71695def2edSWang Shilong } else if (err) { 71786d5f994SEdmund Nadolski free_pref(ref); 71895def2edSWang Shilong ret = err; 71995def2edSWang Shilong goto out; 72095def2edSWang Shilong } 7218da6d581SJan Schmidt 7228da6d581SJan Schmidt /* we put the first parent into the ref at hand */ 723cd1b413cSJan Schmidt ULIST_ITER_INIT(&uiter); 724cd1b413cSJan Schmidt node = ulist_next(parents, &uiter); 7258da6d581SJan Schmidt ref->parent = node ? node->val : 0; 7264dae077aSJeff Mahoney ref->inode_list = unode_aux_to_inode_list(node); 7278da6d581SJan Schmidt 72886d5f994SEdmund Nadolski /* Add a prelim_ref(s) for any other parent(s). */ 729cd1b413cSJan Schmidt while ((node = ulist_next(parents, &uiter))) { 73086d5f994SEdmund Nadolski struct prelim_ref *new_ref; 73186d5f994SEdmund Nadolski 732b9e9a6cbSWang Shilong new_ref = kmem_cache_alloc(btrfs_prelim_ref_cache, 733b9e9a6cbSWang Shilong GFP_NOFS); 7348da6d581SJan Schmidt if (!new_ref) { 73586d5f994SEdmund Nadolski free_pref(ref); 7368da6d581SJan Schmidt ret = -ENOMEM; 737e36902d4SWang Shilong goto out; 7388da6d581SJan Schmidt } 7398da6d581SJan Schmidt memcpy(new_ref, ref, sizeof(*ref)); 7408da6d581SJan Schmidt new_ref->parent = node->val; 7414dae077aSJeff Mahoney new_ref->inode_list = unode_aux_to_inode_list(node); 7423ec4d323SEdmund Nadolski prelim_ref_insert(fs_info, &preftrees->direct, 7433ec4d323SEdmund Nadolski new_ref, NULL); 7448da6d581SJan Schmidt } 74586d5f994SEdmund Nadolski 7463ec4d323SEdmund Nadolski /* 74752042d8eSAndrea Gelmini * Now it's a direct ref, put it in the direct tree. We must 7483ec4d323SEdmund Nadolski * do this last because the ref could be merged/freed here. 7493ec4d323SEdmund Nadolski */ 7503ec4d323SEdmund Nadolski prelim_ref_insert(fs_info, &preftrees->direct, ref, NULL); 75186d5f994SEdmund Nadolski 7528da6d581SJan Schmidt ulist_reinit(parents); 7539dd14fd6SEdmund Nadolski cond_resched(); 7548da6d581SJan Schmidt } 755e36902d4SWang Shilong out: 7568da6d581SJan Schmidt ulist_free(parents); 7578da6d581SJan Schmidt return ret; 7588da6d581SJan Schmidt } 7598da6d581SJan Schmidt 760d5c88b73SJan Schmidt /* 761d5c88b73SJan Schmidt * read tree blocks and add keys where required. 762d5c88b73SJan Schmidt */ 763e0c476b1SJeff Mahoney static int add_missing_keys(struct btrfs_fs_info *fs_info, 76438e3eebfSJosef Bacik struct preftrees *preftrees, bool lock) 765d5c88b73SJan Schmidt { 766e0c476b1SJeff Mahoney struct prelim_ref *ref; 767d5c88b73SJan Schmidt struct extent_buffer *eb; 76886d5f994SEdmund Nadolski struct preftree *tree = &preftrees->indirect_missing_keys; 76986d5f994SEdmund Nadolski struct rb_node *node; 770d5c88b73SJan Schmidt 771ecf160b4SLiu Bo while ((node = rb_first_cached(&tree->root))) { 77286d5f994SEdmund Nadolski ref = rb_entry(node, struct prelim_ref, rbnode); 773ecf160b4SLiu Bo rb_erase_cached(node, &tree->root); 77486d5f994SEdmund Nadolski 77586d5f994SEdmund Nadolski BUG_ON(ref->parent); /* should not be a direct ref */ 77686d5f994SEdmund Nadolski BUG_ON(ref->key_for_search.type); 777d5c88b73SJan Schmidt BUG_ON(!ref->wanted_disk_byte); 77886d5f994SEdmund Nadolski 779581c1760SQu Wenruo eb = read_tree_block(fs_info, ref->wanted_disk_byte, 0, 780581c1760SQu Wenruo ref->level - 1, NULL); 78164c043deSLiu Bo if (IS_ERR(eb)) { 78286d5f994SEdmund Nadolski free_pref(ref); 78364c043deSLiu Bo return PTR_ERR(eb); 78464c043deSLiu Bo } else if (!extent_buffer_uptodate(eb)) { 78586d5f994SEdmund Nadolski free_pref(ref); 786416bc658SJosef Bacik free_extent_buffer(eb); 787416bc658SJosef Bacik return -EIO; 788416bc658SJosef Bacik } 78938e3eebfSJosef Bacik if (lock) 790d5c88b73SJan Schmidt btrfs_tree_read_lock(eb); 791d5c88b73SJan Schmidt if (btrfs_header_level(eb) == 0) 792d5c88b73SJan Schmidt btrfs_item_key_to_cpu(eb, &ref->key_for_search, 0); 793d5c88b73SJan Schmidt else 794d5c88b73SJan Schmidt btrfs_node_key_to_cpu(eb, &ref->key_for_search, 0); 79538e3eebfSJosef Bacik if (lock) 796d5c88b73SJan Schmidt btrfs_tree_read_unlock(eb); 797d5c88b73SJan Schmidt free_extent_buffer(eb); 7983ec4d323SEdmund Nadolski prelim_ref_insert(fs_info, &preftrees->indirect, ref, NULL); 7999dd14fd6SEdmund Nadolski cond_resched(); 800d5c88b73SJan Schmidt } 801d5c88b73SJan Schmidt return 0; 802d5c88b73SJan Schmidt } 803d5c88b73SJan Schmidt 8048da6d581SJan Schmidt /* 8058da6d581SJan Schmidt * add all currently queued delayed refs from this head whose seq nr is 8068da6d581SJan Schmidt * smaller or equal that seq to the list 8078da6d581SJan Schmidt */ 80800142756SJeff Mahoney static int add_delayed_refs(const struct btrfs_fs_info *fs_info, 80900142756SJeff Mahoney struct btrfs_delayed_ref_head *head, u64 seq, 810b25b0b87Sethanwu struct preftrees *preftrees, struct share_check *sc) 8118da6d581SJan Schmidt { 812c6fc2454SQu Wenruo struct btrfs_delayed_ref_node *node; 8138da6d581SJan Schmidt struct btrfs_delayed_extent_op *extent_op = head->extent_op; 814d5c88b73SJan Schmidt struct btrfs_key key; 81586d5f994SEdmund Nadolski struct btrfs_key tmp_op_key; 8160e0adbcfSJosef Bacik struct rb_node *n; 81701747e92SEdmund Nadolski int count; 818b1375d64SJan Schmidt int ret = 0; 8198da6d581SJan Schmidt 820a6dbceafSNikolay Borisov if (extent_op && extent_op->update_key) 82186d5f994SEdmund Nadolski btrfs_disk_key_to_cpu(&tmp_op_key, &extent_op->key); 8228da6d581SJan Schmidt 823d7df2c79SJosef Bacik spin_lock(&head->lock); 824e3d03965SLiu Bo for (n = rb_first_cached(&head->ref_tree); n; n = rb_next(n)) { 8250e0adbcfSJosef Bacik node = rb_entry(n, struct btrfs_delayed_ref_node, 8260e0adbcfSJosef Bacik ref_node); 8278da6d581SJan Schmidt if (node->seq > seq) 8288da6d581SJan Schmidt continue; 8298da6d581SJan Schmidt 8308da6d581SJan Schmidt switch (node->action) { 8318da6d581SJan Schmidt case BTRFS_ADD_DELAYED_EXTENT: 8328da6d581SJan Schmidt case BTRFS_UPDATE_DELAYED_HEAD: 8338da6d581SJan Schmidt WARN_ON(1); 8348da6d581SJan Schmidt continue; 8358da6d581SJan Schmidt case BTRFS_ADD_DELAYED_REF: 83601747e92SEdmund Nadolski count = node->ref_mod; 8378da6d581SJan Schmidt break; 8388da6d581SJan Schmidt case BTRFS_DROP_DELAYED_REF: 83901747e92SEdmund Nadolski count = node->ref_mod * -1; 8408da6d581SJan Schmidt break; 8418da6d581SJan Schmidt default: 842290342f6SArnd Bergmann BUG(); 8438da6d581SJan Schmidt } 8448da6d581SJan Schmidt switch (node->type) { 8458da6d581SJan Schmidt case BTRFS_TREE_BLOCK_REF_KEY: { 84686d5f994SEdmund Nadolski /* NORMAL INDIRECT METADATA backref */ 8478da6d581SJan Schmidt struct btrfs_delayed_tree_ref *ref; 8488da6d581SJan Schmidt 8498da6d581SJan Schmidt ref = btrfs_delayed_node_to_tree_ref(node); 85000142756SJeff Mahoney ret = add_indirect_ref(fs_info, preftrees, ref->root, 85100142756SJeff Mahoney &tmp_op_key, ref->level + 1, 85201747e92SEdmund Nadolski node->bytenr, count, sc, 85301747e92SEdmund Nadolski GFP_ATOMIC); 8548da6d581SJan Schmidt break; 8558da6d581SJan Schmidt } 8568da6d581SJan Schmidt case BTRFS_SHARED_BLOCK_REF_KEY: { 85786d5f994SEdmund Nadolski /* SHARED DIRECT METADATA backref */ 8588da6d581SJan Schmidt struct btrfs_delayed_tree_ref *ref; 8598da6d581SJan Schmidt 8608da6d581SJan Schmidt ref = btrfs_delayed_node_to_tree_ref(node); 86186d5f994SEdmund Nadolski 86201747e92SEdmund Nadolski ret = add_direct_ref(fs_info, preftrees, ref->level + 1, 86301747e92SEdmund Nadolski ref->parent, node->bytenr, count, 8643ec4d323SEdmund Nadolski sc, GFP_ATOMIC); 8658da6d581SJan Schmidt break; 8668da6d581SJan Schmidt } 8678da6d581SJan Schmidt case BTRFS_EXTENT_DATA_REF_KEY: { 86886d5f994SEdmund Nadolski /* NORMAL INDIRECT DATA backref */ 8698da6d581SJan Schmidt struct btrfs_delayed_data_ref *ref; 8708da6d581SJan Schmidt ref = btrfs_delayed_node_to_data_ref(node); 8718da6d581SJan Schmidt 8728da6d581SJan Schmidt key.objectid = ref->objectid; 8738da6d581SJan Schmidt key.type = BTRFS_EXTENT_DATA_KEY; 8748da6d581SJan Schmidt key.offset = ref->offset; 875dc046b10SJosef Bacik 876dc046b10SJosef Bacik /* 877dc046b10SJosef Bacik * Found a inum that doesn't match our known inum, we 878dc046b10SJosef Bacik * know it's shared. 879dc046b10SJosef Bacik */ 8803ec4d323SEdmund Nadolski if (sc && sc->inum && ref->objectid != sc->inum) { 881dc046b10SJosef Bacik ret = BACKREF_FOUND_SHARED; 8823ec4d323SEdmund Nadolski goto out; 883dc046b10SJosef Bacik } 884dc046b10SJosef Bacik 88500142756SJeff Mahoney ret = add_indirect_ref(fs_info, preftrees, ref->root, 88601747e92SEdmund Nadolski &key, 0, node->bytenr, count, sc, 88701747e92SEdmund Nadolski GFP_ATOMIC); 8888da6d581SJan Schmidt break; 8898da6d581SJan Schmidt } 8908da6d581SJan Schmidt case BTRFS_SHARED_DATA_REF_KEY: { 89186d5f994SEdmund Nadolski /* SHARED DIRECT FULL backref */ 8928da6d581SJan Schmidt struct btrfs_delayed_data_ref *ref; 8938da6d581SJan Schmidt 8948da6d581SJan Schmidt ref = btrfs_delayed_node_to_data_ref(node); 89586d5f994SEdmund Nadolski 89601747e92SEdmund Nadolski ret = add_direct_ref(fs_info, preftrees, 0, ref->parent, 89701747e92SEdmund Nadolski node->bytenr, count, sc, 89801747e92SEdmund Nadolski GFP_ATOMIC); 8998da6d581SJan Schmidt break; 9008da6d581SJan Schmidt } 9018da6d581SJan Schmidt default: 9028da6d581SJan Schmidt WARN_ON(1); 9038da6d581SJan Schmidt } 9043ec4d323SEdmund Nadolski /* 9053ec4d323SEdmund Nadolski * We must ignore BACKREF_FOUND_SHARED until all delayed 9063ec4d323SEdmund Nadolski * refs have been checked. 9073ec4d323SEdmund Nadolski */ 9083ec4d323SEdmund Nadolski if (ret && (ret != BACKREF_FOUND_SHARED)) 909d7df2c79SJosef Bacik break; 9108da6d581SJan Schmidt } 9113ec4d323SEdmund Nadolski if (!ret) 9123ec4d323SEdmund Nadolski ret = extent_is_shared(sc); 9133ec4d323SEdmund Nadolski out: 914d7df2c79SJosef Bacik spin_unlock(&head->lock); 915d7df2c79SJosef Bacik return ret; 9168da6d581SJan Schmidt } 9178da6d581SJan Schmidt 9188da6d581SJan Schmidt /* 9198da6d581SJan Schmidt * add all inline backrefs for bytenr to the list 9203ec4d323SEdmund Nadolski * 9213ec4d323SEdmund Nadolski * Returns 0 on success, <0 on error, or BACKREF_FOUND_SHARED. 9228da6d581SJan Schmidt */ 92300142756SJeff Mahoney static int add_inline_refs(const struct btrfs_fs_info *fs_info, 92400142756SJeff Mahoney struct btrfs_path *path, u64 bytenr, 92586d5f994SEdmund Nadolski int *info_level, struct preftrees *preftrees, 926b25b0b87Sethanwu struct share_check *sc) 9278da6d581SJan Schmidt { 928b1375d64SJan Schmidt int ret = 0; 9298da6d581SJan Schmidt int slot; 9308da6d581SJan Schmidt struct extent_buffer *leaf; 9318da6d581SJan Schmidt struct btrfs_key key; 932261c84b6SJosef Bacik struct btrfs_key found_key; 9338da6d581SJan Schmidt unsigned long ptr; 9348da6d581SJan Schmidt unsigned long end; 9358da6d581SJan Schmidt struct btrfs_extent_item *ei; 9368da6d581SJan Schmidt u64 flags; 9378da6d581SJan Schmidt u64 item_size; 9388da6d581SJan Schmidt 9398da6d581SJan Schmidt /* 9408da6d581SJan Schmidt * enumerate all inline refs 9418da6d581SJan Schmidt */ 9428da6d581SJan Schmidt leaf = path->nodes[0]; 943dadcaf78SJan Schmidt slot = path->slots[0]; 9448da6d581SJan Schmidt 9458da6d581SJan Schmidt item_size = btrfs_item_size_nr(leaf, slot); 9468da6d581SJan Schmidt BUG_ON(item_size < sizeof(*ei)); 9478da6d581SJan Schmidt 9488da6d581SJan Schmidt ei = btrfs_item_ptr(leaf, slot, struct btrfs_extent_item); 9498da6d581SJan Schmidt flags = btrfs_extent_flags(leaf, ei); 950261c84b6SJosef Bacik btrfs_item_key_to_cpu(leaf, &found_key, slot); 9518da6d581SJan Schmidt 9528da6d581SJan Schmidt ptr = (unsigned long)(ei + 1); 9538da6d581SJan Schmidt end = (unsigned long)ei + item_size; 9548da6d581SJan Schmidt 955261c84b6SJosef Bacik if (found_key.type == BTRFS_EXTENT_ITEM_KEY && 956261c84b6SJosef Bacik flags & BTRFS_EXTENT_FLAG_TREE_BLOCK) { 9578da6d581SJan Schmidt struct btrfs_tree_block_info *info; 9588da6d581SJan Schmidt 9598da6d581SJan Schmidt info = (struct btrfs_tree_block_info *)ptr; 9608da6d581SJan Schmidt *info_level = btrfs_tree_block_level(leaf, info); 9618da6d581SJan Schmidt ptr += sizeof(struct btrfs_tree_block_info); 9628da6d581SJan Schmidt BUG_ON(ptr > end); 963261c84b6SJosef Bacik } else if (found_key.type == BTRFS_METADATA_ITEM_KEY) { 964261c84b6SJosef Bacik *info_level = found_key.offset; 9658da6d581SJan Schmidt } else { 9668da6d581SJan Schmidt BUG_ON(!(flags & BTRFS_EXTENT_FLAG_DATA)); 9678da6d581SJan Schmidt } 9688da6d581SJan Schmidt 9698da6d581SJan Schmidt while (ptr < end) { 9708da6d581SJan Schmidt struct btrfs_extent_inline_ref *iref; 9718da6d581SJan Schmidt u64 offset; 9728da6d581SJan Schmidt int type; 9738da6d581SJan Schmidt 9748da6d581SJan Schmidt iref = (struct btrfs_extent_inline_ref *)ptr; 9753de28d57SLiu Bo type = btrfs_get_extent_inline_ref_type(leaf, iref, 9763de28d57SLiu Bo BTRFS_REF_TYPE_ANY); 9773de28d57SLiu Bo if (type == BTRFS_REF_TYPE_INVALID) 978af431dcbSSu Yue return -EUCLEAN; 9793de28d57SLiu Bo 9808da6d581SJan Schmidt offset = btrfs_extent_inline_ref_offset(leaf, iref); 9818da6d581SJan Schmidt 9828da6d581SJan Schmidt switch (type) { 9838da6d581SJan Schmidt case BTRFS_SHARED_BLOCK_REF_KEY: 98400142756SJeff Mahoney ret = add_direct_ref(fs_info, preftrees, 98500142756SJeff Mahoney *info_level + 1, offset, 9863ec4d323SEdmund Nadolski bytenr, 1, NULL, GFP_NOFS); 9878da6d581SJan Schmidt break; 9888da6d581SJan Schmidt case BTRFS_SHARED_DATA_REF_KEY: { 9898da6d581SJan Schmidt struct btrfs_shared_data_ref *sdref; 9908da6d581SJan Schmidt int count; 9918da6d581SJan Schmidt 9928da6d581SJan Schmidt sdref = (struct btrfs_shared_data_ref *)(iref + 1); 9938da6d581SJan Schmidt count = btrfs_shared_data_ref_count(leaf, sdref); 99486d5f994SEdmund Nadolski 99500142756SJeff Mahoney ret = add_direct_ref(fs_info, preftrees, 0, offset, 9963ec4d323SEdmund Nadolski bytenr, count, sc, GFP_NOFS); 9978da6d581SJan Schmidt break; 9988da6d581SJan Schmidt } 9998da6d581SJan Schmidt case BTRFS_TREE_BLOCK_REF_KEY: 100000142756SJeff Mahoney ret = add_indirect_ref(fs_info, preftrees, offset, 100100142756SJeff Mahoney NULL, *info_level + 1, 10023ec4d323SEdmund Nadolski bytenr, 1, NULL, GFP_NOFS); 10038da6d581SJan Schmidt break; 10048da6d581SJan Schmidt case BTRFS_EXTENT_DATA_REF_KEY: { 10058da6d581SJan Schmidt struct btrfs_extent_data_ref *dref; 10068da6d581SJan Schmidt int count; 10078da6d581SJan Schmidt u64 root; 10088da6d581SJan Schmidt 10098da6d581SJan Schmidt dref = (struct btrfs_extent_data_ref *)(&iref->offset); 10108da6d581SJan Schmidt count = btrfs_extent_data_ref_count(leaf, dref); 10118da6d581SJan Schmidt key.objectid = btrfs_extent_data_ref_objectid(leaf, 10128da6d581SJan Schmidt dref); 10138da6d581SJan Schmidt key.type = BTRFS_EXTENT_DATA_KEY; 10148da6d581SJan Schmidt key.offset = btrfs_extent_data_ref_offset(leaf, dref); 1015dc046b10SJosef Bacik 10163ec4d323SEdmund Nadolski if (sc && sc->inum && key.objectid != sc->inum) { 1017dc046b10SJosef Bacik ret = BACKREF_FOUND_SHARED; 1018dc046b10SJosef Bacik break; 1019dc046b10SJosef Bacik } 1020dc046b10SJosef Bacik 10218da6d581SJan Schmidt root = btrfs_extent_data_ref_root(leaf, dref); 102286d5f994SEdmund Nadolski 102300142756SJeff Mahoney ret = add_indirect_ref(fs_info, preftrees, root, 102400142756SJeff Mahoney &key, 0, bytenr, count, 10253ec4d323SEdmund Nadolski sc, GFP_NOFS); 10268da6d581SJan Schmidt break; 10278da6d581SJan Schmidt } 10288da6d581SJan Schmidt default: 10298da6d581SJan Schmidt WARN_ON(1); 10308da6d581SJan Schmidt } 10311149ab6bSWang Shilong if (ret) 10321149ab6bSWang Shilong return ret; 10338da6d581SJan Schmidt ptr += btrfs_extent_inline_ref_size(type); 10348da6d581SJan Schmidt } 10358da6d581SJan Schmidt 10368da6d581SJan Schmidt return 0; 10378da6d581SJan Schmidt } 10388da6d581SJan Schmidt 10398da6d581SJan Schmidt /* 10408da6d581SJan Schmidt * add all non-inline backrefs for bytenr to the list 10413ec4d323SEdmund Nadolski * 10423ec4d323SEdmund Nadolski * Returns 0 on success, <0 on error, or BACKREF_FOUND_SHARED. 10438da6d581SJan Schmidt */ 1044e0c476b1SJeff Mahoney static int add_keyed_refs(struct btrfs_fs_info *fs_info, 10458da6d581SJan Schmidt struct btrfs_path *path, u64 bytenr, 104686d5f994SEdmund Nadolski int info_level, struct preftrees *preftrees, 10473ec4d323SEdmund Nadolski struct share_check *sc) 10488da6d581SJan Schmidt { 10498da6d581SJan Schmidt struct btrfs_root *extent_root = fs_info->extent_root; 10508da6d581SJan Schmidt int ret; 10518da6d581SJan Schmidt int slot; 10528da6d581SJan Schmidt struct extent_buffer *leaf; 10538da6d581SJan Schmidt struct btrfs_key key; 10548da6d581SJan Schmidt 10558da6d581SJan Schmidt while (1) { 10568da6d581SJan Schmidt ret = btrfs_next_item(extent_root, path); 10578da6d581SJan Schmidt if (ret < 0) 10588da6d581SJan Schmidt break; 10598da6d581SJan Schmidt if (ret) { 10608da6d581SJan Schmidt ret = 0; 10618da6d581SJan Schmidt break; 10628da6d581SJan Schmidt } 10638da6d581SJan Schmidt 10648da6d581SJan Schmidt slot = path->slots[0]; 10658da6d581SJan Schmidt leaf = path->nodes[0]; 10668da6d581SJan Schmidt btrfs_item_key_to_cpu(leaf, &key, slot); 10678da6d581SJan Schmidt 10688da6d581SJan Schmidt if (key.objectid != bytenr) 10698da6d581SJan Schmidt break; 10708da6d581SJan Schmidt if (key.type < BTRFS_TREE_BLOCK_REF_KEY) 10718da6d581SJan Schmidt continue; 10728da6d581SJan Schmidt if (key.type > BTRFS_SHARED_DATA_REF_KEY) 10738da6d581SJan Schmidt break; 10748da6d581SJan Schmidt 10758da6d581SJan Schmidt switch (key.type) { 10768da6d581SJan Schmidt case BTRFS_SHARED_BLOCK_REF_KEY: 107786d5f994SEdmund Nadolski /* SHARED DIRECT METADATA backref */ 107800142756SJeff Mahoney ret = add_direct_ref(fs_info, preftrees, 107900142756SJeff Mahoney info_level + 1, key.offset, 10803ec4d323SEdmund Nadolski bytenr, 1, NULL, GFP_NOFS); 10818da6d581SJan Schmidt break; 10828da6d581SJan Schmidt case BTRFS_SHARED_DATA_REF_KEY: { 108386d5f994SEdmund Nadolski /* SHARED DIRECT FULL backref */ 10848da6d581SJan Schmidt struct btrfs_shared_data_ref *sdref; 10858da6d581SJan Schmidt int count; 10868da6d581SJan Schmidt 10878da6d581SJan Schmidt sdref = btrfs_item_ptr(leaf, slot, 10888da6d581SJan Schmidt struct btrfs_shared_data_ref); 10898da6d581SJan Schmidt count = btrfs_shared_data_ref_count(leaf, sdref); 109000142756SJeff Mahoney ret = add_direct_ref(fs_info, preftrees, 0, 109100142756SJeff Mahoney key.offset, bytenr, count, 10923ec4d323SEdmund Nadolski sc, GFP_NOFS); 10938da6d581SJan Schmidt break; 10948da6d581SJan Schmidt } 10958da6d581SJan Schmidt case BTRFS_TREE_BLOCK_REF_KEY: 109686d5f994SEdmund Nadolski /* NORMAL INDIRECT METADATA backref */ 109700142756SJeff Mahoney ret = add_indirect_ref(fs_info, preftrees, key.offset, 109800142756SJeff Mahoney NULL, info_level + 1, bytenr, 10993ec4d323SEdmund Nadolski 1, NULL, GFP_NOFS); 11008da6d581SJan Schmidt break; 11018da6d581SJan Schmidt case BTRFS_EXTENT_DATA_REF_KEY: { 110286d5f994SEdmund Nadolski /* NORMAL INDIRECT DATA backref */ 11038da6d581SJan Schmidt struct btrfs_extent_data_ref *dref; 11048da6d581SJan Schmidt int count; 11058da6d581SJan Schmidt u64 root; 11068da6d581SJan Schmidt 11078da6d581SJan Schmidt dref = btrfs_item_ptr(leaf, slot, 11088da6d581SJan Schmidt struct btrfs_extent_data_ref); 11098da6d581SJan Schmidt count = btrfs_extent_data_ref_count(leaf, dref); 11108da6d581SJan Schmidt key.objectid = btrfs_extent_data_ref_objectid(leaf, 11118da6d581SJan Schmidt dref); 11128da6d581SJan Schmidt key.type = BTRFS_EXTENT_DATA_KEY; 11138da6d581SJan Schmidt key.offset = btrfs_extent_data_ref_offset(leaf, dref); 1114dc046b10SJosef Bacik 11153ec4d323SEdmund Nadolski if (sc && sc->inum && key.objectid != sc->inum) { 1116dc046b10SJosef Bacik ret = BACKREF_FOUND_SHARED; 1117dc046b10SJosef Bacik break; 1118dc046b10SJosef Bacik } 1119dc046b10SJosef Bacik 11208da6d581SJan Schmidt root = btrfs_extent_data_ref_root(leaf, dref); 112100142756SJeff Mahoney ret = add_indirect_ref(fs_info, preftrees, root, 112200142756SJeff Mahoney &key, 0, bytenr, count, 11233ec4d323SEdmund Nadolski sc, GFP_NOFS); 11248da6d581SJan Schmidt break; 11258da6d581SJan Schmidt } 11268da6d581SJan Schmidt default: 11278da6d581SJan Schmidt WARN_ON(1); 11288da6d581SJan Schmidt } 11291149ab6bSWang Shilong if (ret) 11301149ab6bSWang Shilong return ret; 11311149ab6bSWang Shilong 11328da6d581SJan Schmidt } 11338da6d581SJan Schmidt 11348da6d581SJan Schmidt return ret; 11358da6d581SJan Schmidt } 11368da6d581SJan Schmidt 11378da6d581SJan Schmidt /* 11388da6d581SJan Schmidt * this adds all existing backrefs (inline backrefs, backrefs and delayed 11398da6d581SJan Schmidt * refs) for the given bytenr to the refs list, merges duplicates and resolves 11408da6d581SJan Schmidt * indirect refs to their parent bytenr. 11418da6d581SJan Schmidt * When roots are found, they're added to the roots list 11428da6d581SJan Schmidt * 1143de47c9d3SEdmund Nadolski * If time_seq is set to SEQ_LAST, it will not search delayed_refs, and behave 114421633fc6SQu Wenruo * much like trans == NULL case, the difference only lies in it will not 114521633fc6SQu Wenruo * commit root. 114621633fc6SQu Wenruo * The special case is for qgroup to search roots in commit_transaction(). 114721633fc6SQu Wenruo * 11483ec4d323SEdmund Nadolski * @sc - if !NULL, then immediately return BACKREF_FOUND_SHARED when a 11493ec4d323SEdmund Nadolski * shared extent is detected. 11503ec4d323SEdmund Nadolski * 11513ec4d323SEdmund Nadolski * Otherwise this returns 0 for success and <0 for an error. 11523ec4d323SEdmund Nadolski * 1153c995ab3cSZygo Blaxell * If ignore_offset is set to false, only extent refs whose offsets match 1154c995ab3cSZygo Blaxell * extent_item_pos are returned. If true, every extent ref is returned 1155c995ab3cSZygo Blaxell * and extent_item_pos is ignored. 1156c995ab3cSZygo Blaxell * 11578da6d581SJan Schmidt * FIXME some caching might speed things up 11588da6d581SJan Schmidt */ 11598da6d581SJan Schmidt static int find_parent_nodes(struct btrfs_trans_handle *trans, 11608da6d581SJan Schmidt struct btrfs_fs_info *fs_info, u64 bytenr, 1161097b8a7cSJan Schmidt u64 time_seq, struct ulist *refs, 1162dc046b10SJosef Bacik struct ulist *roots, const u64 *extent_item_pos, 1163c995ab3cSZygo Blaxell struct share_check *sc, bool ignore_offset) 11648da6d581SJan Schmidt { 11658da6d581SJan Schmidt struct btrfs_key key; 11668da6d581SJan Schmidt struct btrfs_path *path; 11678da6d581SJan Schmidt struct btrfs_delayed_ref_root *delayed_refs = NULL; 1168d3b01064SLi Zefan struct btrfs_delayed_ref_head *head; 11698da6d581SJan Schmidt int info_level = 0; 11708da6d581SJan Schmidt int ret; 1171e0c476b1SJeff Mahoney struct prelim_ref *ref; 117286d5f994SEdmund Nadolski struct rb_node *node; 1173f05c4746SWang Shilong struct extent_inode_elem *eie = NULL; 117486d5f994SEdmund Nadolski struct preftrees preftrees = { 117586d5f994SEdmund Nadolski .direct = PREFTREE_INIT, 117686d5f994SEdmund Nadolski .indirect = PREFTREE_INIT, 117786d5f994SEdmund Nadolski .indirect_missing_keys = PREFTREE_INIT 117886d5f994SEdmund Nadolski }; 11798da6d581SJan Schmidt 11808da6d581SJan Schmidt key.objectid = bytenr; 11818da6d581SJan Schmidt key.offset = (u64)-1; 1182261c84b6SJosef Bacik if (btrfs_fs_incompat(fs_info, SKINNY_METADATA)) 1183261c84b6SJosef Bacik key.type = BTRFS_METADATA_ITEM_KEY; 1184261c84b6SJosef Bacik else 1185261c84b6SJosef Bacik key.type = BTRFS_EXTENT_ITEM_KEY; 11868da6d581SJan Schmidt 11878da6d581SJan Schmidt path = btrfs_alloc_path(); 11888da6d581SJan Schmidt if (!path) 11898da6d581SJan Schmidt return -ENOMEM; 1190e84752d4SWang Shilong if (!trans) { 1191da61d31aSJosef Bacik path->search_commit_root = 1; 1192e84752d4SWang Shilong path->skip_locking = 1; 1193e84752d4SWang Shilong } 11948da6d581SJan Schmidt 1195de47c9d3SEdmund Nadolski if (time_seq == SEQ_LAST) 119621633fc6SQu Wenruo path->skip_locking = 1; 119721633fc6SQu Wenruo 11988da6d581SJan Schmidt /* 11998da6d581SJan Schmidt * grab both a lock on the path and a lock on the delayed ref head. 12008da6d581SJan Schmidt * We need both to get a consistent picture of how the refs look 12018da6d581SJan Schmidt * at a specified point in time 12028da6d581SJan Schmidt */ 12038da6d581SJan Schmidt again: 1204d3b01064SLi Zefan head = NULL; 1205d3b01064SLi Zefan 12068da6d581SJan Schmidt ret = btrfs_search_slot(trans, fs_info->extent_root, &key, path, 0, 0); 12078da6d581SJan Schmidt if (ret < 0) 12088da6d581SJan Schmidt goto out; 12098da6d581SJan Schmidt BUG_ON(ret == 0); 12108da6d581SJan Schmidt 1211faa2dbf0SJosef Bacik #ifdef CONFIG_BTRFS_FS_RUN_SANITY_TESTS 121221633fc6SQu Wenruo if (trans && likely(trans->type != __TRANS_DUMMY) && 1213de47c9d3SEdmund Nadolski time_seq != SEQ_LAST) { 1214faa2dbf0SJosef Bacik #else 1215de47c9d3SEdmund Nadolski if (trans && time_seq != SEQ_LAST) { 1216faa2dbf0SJosef Bacik #endif 12178da6d581SJan Schmidt /* 12187a3ae2f8SJan Schmidt * look if there are updates for this ref queued and lock the 12197a3ae2f8SJan Schmidt * head 12208da6d581SJan Schmidt */ 12218da6d581SJan Schmidt delayed_refs = &trans->transaction->delayed_refs; 12228da6d581SJan Schmidt spin_lock(&delayed_refs->lock); 1223f72ad18eSLiu Bo head = btrfs_find_delayed_ref_head(delayed_refs, bytenr); 12248da6d581SJan Schmidt if (head) { 12258da6d581SJan Schmidt if (!mutex_trylock(&head->mutex)) { 1226d278850eSJosef Bacik refcount_inc(&head->refs); 12278da6d581SJan Schmidt spin_unlock(&delayed_refs->lock); 12288da6d581SJan Schmidt 12298da6d581SJan Schmidt btrfs_release_path(path); 12308da6d581SJan Schmidt 12318da6d581SJan Schmidt /* 12328da6d581SJan Schmidt * Mutex was contended, block until it's 12338da6d581SJan Schmidt * released and try again 12348da6d581SJan Schmidt */ 12358da6d581SJan Schmidt mutex_lock(&head->mutex); 12368da6d581SJan Schmidt mutex_unlock(&head->mutex); 1237d278850eSJosef Bacik btrfs_put_delayed_ref_head(head); 12388da6d581SJan Schmidt goto again; 12398da6d581SJan Schmidt } 1240d7df2c79SJosef Bacik spin_unlock(&delayed_refs->lock); 124100142756SJeff Mahoney ret = add_delayed_refs(fs_info, head, time_seq, 1242b25b0b87Sethanwu &preftrees, sc); 1243155725c9SJan Schmidt mutex_unlock(&head->mutex); 1244d7df2c79SJosef Bacik if (ret) 12458da6d581SJan Schmidt goto out; 1246d7df2c79SJosef Bacik } else { 12478da6d581SJan Schmidt spin_unlock(&delayed_refs->lock); 12487a3ae2f8SJan Schmidt } 1249d7df2c79SJosef Bacik } 12508da6d581SJan Schmidt 12518da6d581SJan Schmidt if (path->slots[0]) { 12528da6d581SJan Schmidt struct extent_buffer *leaf; 12538da6d581SJan Schmidt int slot; 12548da6d581SJan Schmidt 1255dadcaf78SJan Schmidt path->slots[0]--; 12568da6d581SJan Schmidt leaf = path->nodes[0]; 1257dadcaf78SJan Schmidt slot = path->slots[0]; 12588da6d581SJan Schmidt btrfs_item_key_to_cpu(leaf, &key, slot); 12598da6d581SJan Schmidt if (key.objectid == bytenr && 1260261c84b6SJosef Bacik (key.type == BTRFS_EXTENT_ITEM_KEY || 1261261c84b6SJosef Bacik key.type == BTRFS_METADATA_ITEM_KEY)) { 126200142756SJeff Mahoney ret = add_inline_refs(fs_info, path, bytenr, 1263b25b0b87Sethanwu &info_level, &preftrees, sc); 12648da6d581SJan Schmidt if (ret) 12658da6d581SJan Schmidt goto out; 1266e0c476b1SJeff Mahoney ret = add_keyed_refs(fs_info, path, bytenr, info_level, 12673ec4d323SEdmund Nadolski &preftrees, sc); 12688da6d581SJan Schmidt if (ret) 12698da6d581SJan Schmidt goto out; 12708da6d581SJan Schmidt } 12718da6d581SJan Schmidt } 127286d5f994SEdmund Nadolski 12738da6d581SJan Schmidt btrfs_release_path(path); 12748da6d581SJan Schmidt 127538e3eebfSJosef Bacik ret = add_missing_keys(fs_info, &preftrees, path->skip_locking == 0); 1276d5c88b73SJan Schmidt if (ret) 1277d5c88b73SJan Schmidt goto out; 1278d5c88b73SJan Schmidt 1279ecf160b4SLiu Bo WARN_ON(!RB_EMPTY_ROOT(&preftrees.indirect_missing_keys.root.rb_root)); 12808da6d581SJan Schmidt 128186d5f994SEdmund Nadolski ret = resolve_indirect_refs(fs_info, path, time_seq, &preftrees, 1282b25b0b87Sethanwu extent_item_pos, sc, ignore_offset); 12838da6d581SJan Schmidt if (ret) 12848da6d581SJan Schmidt goto out; 12858da6d581SJan Schmidt 1286ecf160b4SLiu Bo WARN_ON(!RB_EMPTY_ROOT(&preftrees.indirect.root.rb_root)); 12878da6d581SJan Schmidt 128886d5f994SEdmund Nadolski /* 128986d5f994SEdmund Nadolski * This walks the tree of merged and resolved refs. Tree blocks are 129086d5f994SEdmund Nadolski * read in as needed. Unique entries are added to the ulist, and 129186d5f994SEdmund Nadolski * the list of found roots is updated. 129286d5f994SEdmund Nadolski * 129386d5f994SEdmund Nadolski * We release the entire tree in one go before returning. 129486d5f994SEdmund Nadolski */ 1295ecf160b4SLiu Bo node = rb_first_cached(&preftrees.direct.root); 129686d5f994SEdmund Nadolski while (node) { 129786d5f994SEdmund Nadolski ref = rb_entry(node, struct prelim_ref, rbnode); 129886d5f994SEdmund Nadolski node = rb_next(&ref->rbnode); 1299c8195a7bSZygo Blaxell /* 1300c8195a7bSZygo Blaxell * ref->count < 0 can happen here if there are delayed 1301c8195a7bSZygo Blaxell * refs with a node->action of BTRFS_DROP_DELAYED_REF. 1302c8195a7bSZygo Blaxell * prelim_ref_insert() relies on this when merging 1303c8195a7bSZygo Blaxell * identical refs to keep the overall count correct. 1304c8195a7bSZygo Blaxell * prelim_ref_insert() will merge only those refs 1305c8195a7bSZygo Blaxell * which compare identically. Any refs having 1306c8195a7bSZygo Blaxell * e.g. different offsets would not be merged, 1307c8195a7bSZygo Blaxell * and would retain their original ref->count < 0. 1308c8195a7bSZygo Blaxell */ 130998cfee21SWang Shilong if (roots && ref->count && ref->root_id && ref->parent == 0) { 13103ec4d323SEdmund Nadolski if (sc && sc->root_objectid && 13113ec4d323SEdmund Nadolski ref->root_id != sc->root_objectid) { 1312dc046b10SJosef Bacik ret = BACKREF_FOUND_SHARED; 1313dc046b10SJosef Bacik goto out; 1314dc046b10SJosef Bacik } 1315dc046b10SJosef Bacik 13168da6d581SJan Schmidt /* no parent == root of tree */ 13178da6d581SJan Schmidt ret = ulist_add(roots, ref->root_id, 0, GFP_NOFS); 1318f1723939SWang Shilong if (ret < 0) 1319f1723939SWang Shilong goto out; 13208da6d581SJan Schmidt } 13218da6d581SJan Schmidt if (ref->count && ref->parent) { 13228a56457fSJosef Bacik if (extent_item_pos && !ref->inode_list && 13238a56457fSJosef Bacik ref->level == 0) { 1324976b1908SJan Schmidt struct extent_buffer *eb; 1325707e8a07SDavid Sterba 1326581c1760SQu Wenruo eb = read_tree_block(fs_info, ref->parent, 0, 1327581c1760SQu Wenruo ref->level, NULL); 132864c043deSLiu Bo if (IS_ERR(eb)) { 132964c043deSLiu Bo ret = PTR_ERR(eb); 133064c043deSLiu Bo goto out; 133164c043deSLiu Bo } else if (!extent_buffer_uptodate(eb)) { 1332416bc658SJosef Bacik free_extent_buffer(eb); 1333c16c2e2eSWang Shilong ret = -EIO; 1334c16c2e2eSWang Shilong goto out; 1335416bc658SJosef Bacik } 133638e3eebfSJosef Bacik 133738e3eebfSJosef Bacik if (!path->skip_locking) { 13386f7ff6d7SFilipe Manana btrfs_tree_read_lock(eb); 1339300aa896SDavid Sterba btrfs_set_lock_blocking_read(eb); 134038e3eebfSJosef Bacik } 1341976b1908SJan Schmidt ret = find_extent_in_eb(eb, bytenr, 1342c995ab3cSZygo Blaxell *extent_item_pos, &eie, ignore_offset); 134338e3eebfSJosef Bacik if (!path->skip_locking) 13446f7ff6d7SFilipe Manana btrfs_tree_read_unlock_blocking(eb); 1345976b1908SJan Schmidt free_extent_buffer(eb); 1346f5929cd8SFilipe David Borba Manana if (ret < 0) 1347f5929cd8SFilipe David Borba Manana goto out; 1348f5929cd8SFilipe David Borba Manana ref->inode_list = eie; 1349976b1908SJan Schmidt } 13504eb1f66dSTakashi Iwai ret = ulist_add_merge_ptr(refs, ref->parent, 13514eb1f66dSTakashi Iwai ref->inode_list, 13524eb1f66dSTakashi Iwai (void **)&eie, GFP_NOFS); 1353f1723939SWang Shilong if (ret < 0) 1354f1723939SWang Shilong goto out; 13553301958bSJan Schmidt if (!ret && extent_item_pos) { 13563301958bSJan Schmidt /* 13573301958bSJan Schmidt * we've recorded that parent, so we must extend 13583301958bSJan Schmidt * its inode list here 13593301958bSJan Schmidt */ 13603301958bSJan Schmidt BUG_ON(!eie); 13613301958bSJan Schmidt while (eie->next) 13623301958bSJan Schmidt eie = eie->next; 13633301958bSJan Schmidt eie->next = ref->inode_list; 13643301958bSJan Schmidt } 1365f05c4746SWang Shilong eie = NULL; 13668da6d581SJan Schmidt } 13679dd14fd6SEdmund Nadolski cond_resched(); 13688da6d581SJan Schmidt } 13698da6d581SJan Schmidt 13708da6d581SJan Schmidt out: 13718da6d581SJan Schmidt btrfs_free_path(path); 137286d5f994SEdmund Nadolski 137386d5f994SEdmund Nadolski prelim_release(&preftrees.direct); 137486d5f994SEdmund Nadolski prelim_release(&preftrees.indirect); 137586d5f994SEdmund Nadolski prelim_release(&preftrees.indirect_missing_keys); 137686d5f994SEdmund Nadolski 1377f05c4746SWang Shilong if (ret < 0) 1378f05c4746SWang Shilong free_inode_elem_list(eie); 13798da6d581SJan Schmidt return ret; 13808da6d581SJan Schmidt } 13818da6d581SJan Schmidt 1382976b1908SJan Schmidt static void free_leaf_list(struct ulist *blocks) 1383976b1908SJan Schmidt { 1384976b1908SJan Schmidt struct ulist_node *node = NULL; 1385976b1908SJan Schmidt struct extent_inode_elem *eie; 1386976b1908SJan Schmidt struct ulist_iterator uiter; 1387976b1908SJan Schmidt 1388976b1908SJan Schmidt ULIST_ITER_INIT(&uiter); 1389976b1908SJan Schmidt while ((node = ulist_next(blocks, &uiter))) { 1390976b1908SJan Schmidt if (!node->aux) 1391976b1908SJan Schmidt continue; 13924dae077aSJeff Mahoney eie = unode_aux_to_inode_list(node); 1393f05c4746SWang Shilong free_inode_elem_list(eie); 1394976b1908SJan Schmidt node->aux = 0; 1395976b1908SJan Schmidt } 1396976b1908SJan Schmidt 1397976b1908SJan Schmidt ulist_free(blocks); 1398976b1908SJan Schmidt } 1399976b1908SJan Schmidt 14008da6d581SJan Schmidt /* 14018da6d581SJan Schmidt * Finds all leafs with a reference to the specified combination of bytenr and 14028da6d581SJan Schmidt * offset. key_list_head will point to a list of corresponding keys (caller must 14038da6d581SJan Schmidt * free each list element). The leafs will be stored in the leafs ulist, which 14048da6d581SJan Schmidt * must be freed with ulist_free. 14058da6d581SJan Schmidt * 14068da6d581SJan Schmidt * returns 0 on success, <0 on error 14078da6d581SJan Schmidt */ 140819b546d7SQu Wenruo int btrfs_find_all_leafs(struct btrfs_trans_handle *trans, 14098da6d581SJan Schmidt struct btrfs_fs_info *fs_info, u64 bytenr, 1410097b8a7cSJan Schmidt u64 time_seq, struct ulist **leafs, 1411c995ab3cSZygo Blaxell const u64 *extent_item_pos, bool ignore_offset) 14128da6d581SJan Schmidt { 14138da6d581SJan Schmidt int ret; 14148da6d581SJan Schmidt 14158da6d581SJan Schmidt *leafs = ulist_alloc(GFP_NOFS); 141698cfee21SWang Shilong if (!*leafs) 14178da6d581SJan Schmidt return -ENOMEM; 14188da6d581SJan Schmidt 1419afce772eSLu Fengqi ret = find_parent_nodes(trans, fs_info, bytenr, time_seq, 1420c995ab3cSZygo Blaxell *leafs, NULL, extent_item_pos, NULL, ignore_offset); 14218da6d581SJan Schmidt if (ret < 0 && ret != -ENOENT) { 1422976b1908SJan Schmidt free_leaf_list(*leafs); 14238da6d581SJan Schmidt return ret; 14248da6d581SJan Schmidt } 14258da6d581SJan Schmidt 14268da6d581SJan Schmidt return 0; 14278da6d581SJan Schmidt } 14288da6d581SJan Schmidt 14298da6d581SJan Schmidt /* 14308da6d581SJan Schmidt * walk all backrefs for a given extent to find all roots that reference this 14318da6d581SJan Schmidt * extent. Walking a backref means finding all extents that reference this 14328da6d581SJan Schmidt * extent and in turn walk the backrefs of those, too. Naturally this is a 14338da6d581SJan Schmidt * recursive process, but here it is implemented in an iterative fashion: We 14348da6d581SJan Schmidt * find all referencing extents for the extent in question and put them on a 14358da6d581SJan Schmidt * list. In turn, we find all referencing extents for those, further appending 14368da6d581SJan Schmidt * to the list. The way we iterate the list allows adding more elements after 14378da6d581SJan Schmidt * the current while iterating. The process stops when we reach the end of the 14388da6d581SJan Schmidt * list. Found roots are added to the roots list. 14398da6d581SJan Schmidt * 14408da6d581SJan Schmidt * returns 0 on success, < 0 on error. 14418da6d581SJan Schmidt */ 1442e0c476b1SJeff Mahoney static int btrfs_find_all_roots_safe(struct btrfs_trans_handle *trans, 14438da6d581SJan Schmidt struct btrfs_fs_info *fs_info, u64 bytenr, 1444c995ab3cSZygo Blaxell u64 time_seq, struct ulist **roots, 1445c995ab3cSZygo Blaxell bool ignore_offset) 14468da6d581SJan Schmidt { 14478da6d581SJan Schmidt struct ulist *tmp; 14488da6d581SJan Schmidt struct ulist_node *node = NULL; 1449cd1b413cSJan Schmidt struct ulist_iterator uiter; 14508da6d581SJan Schmidt int ret; 14518da6d581SJan Schmidt 14528da6d581SJan Schmidt tmp = ulist_alloc(GFP_NOFS); 14538da6d581SJan Schmidt if (!tmp) 14548da6d581SJan Schmidt return -ENOMEM; 14558da6d581SJan Schmidt *roots = ulist_alloc(GFP_NOFS); 14568da6d581SJan Schmidt if (!*roots) { 14578da6d581SJan Schmidt ulist_free(tmp); 14588da6d581SJan Schmidt return -ENOMEM; 14598da6d581SJan Schmidt } 14608da6d581SJan Schmidt 1461cd1b413cSJan Schmidt ULIST_ITER_INIT(&uiter); 14628da6d581SJan Schmidt while (1) { 1463afce772eSLu Fengqi ret = find_parent_nodes(trans, fs_info, bytenr, time_seq, 1464c995ab3cSZygo Blaxell tmp, *roots, NULL, NULL, ignore_offset); 14658da6d581SJan Schmidt if (ret < 0 && ret != -ENOENT) { 14668da6d581SJan Schmidt ulist_free(tmp); 14678da6d581SJan Schmidt ulist_free(*roots); 14688da6d581SJan Schmidt return ret; 14698da6d581SJan Schmidt } 1470cd1b413cSJan Schmidt node = ulist_next(tmp, &uiter); 14718da6d581SJan Schmidt if (!node) 14728da6d581SJan Schmidt break; 14738da6d581SJan Schmidt bytenr = node->val; 1474bca1a290SWang Shilong cond_resched(); 14758da6d581SJan Schmidt } 14768da6d581SJan Schmidt 14778da6d581SJan Schmidt ulist_free(tmp); 14788da6d581SJan Schmidt return 0; 14798da6d581SJan Schmidt } 14808da6d581SJan Schmidt 14819e351cc8SJosef Bacik int btrfs_find_all_roots(struct btrfs_trans_handle *trans, 14829e351cc8SJosef Bacik struct btrfs_fs_info *fs_info, u64 bytenr, 1483c995ab3cSZygo Blaxell u64 time_seq, struct ulist **roots, 1484c995ab3cSZygo Blaxell bool ignore_offset) 14859e351cc8SJosef Bacik { 14869e351cc8SJosef Bacik int ret; 14879e351cc8SJosef Bacik 14889e351cc8SJosef Bacik if (!trans) 14899e351cc8SJosef Bacik down_read(&fs_info->commit_root_sem); 1490e0c476b1SJeff Mahoney ret = btrfs_find_all_roots_safe(trans, fs_info, bytenr, 1491c995ab3cSZygo Blaxell time_seq, roots, ignore_offset); 14929e351cc8SJosef Bacik if (!trans) 14939e351cc8SJosef Bacik up_read(&fs_info->commit_root_sem); 14949e351cc8SJosef Bacik return ret; 14959e351cc8SJosef Bacik } 14969e351cc8SJosef Bacik 14972c2ed5aaSMark Fasheh /** 14982c2ed5aaSMark Fasheh * btrfs_check_shared - tell us whether an extent is shared 14992c2ed5aaSMark Fasheh * 15002c2ed5aaSMark Fasheh * btrfs_check_shared uses the backref walking code but will short 15012c2ed5aaSMark Fasheh * circuit as soon as it finds a root or inode that doesn't match the 15022c2ed5aaSMark Fasheh * one passed in. This provides a significant performance benefit for 15032c2ed5aaSMark Fasheh * callers (such as fiemap) which want to know whether the extent is 15042c2ed5aaSMark Fasheh * shared but do not need a ref count. 15052c2ed5aaSMark Fasheh * 150603628cdbSFilipe Manana * This attempts to attach to the running transaction in order to account for 150703628cdbSFilipe Manana * delayed refs, but continues on even when no running transaction exists. 1508bb739cf0SEdmund Nadolski * 15092c2ed5aaSMark Fasheh * Return: 0 if extent is not shared, 1 if it is shared, < 0 on error. 15102c2ed5aaSMark Fasheh */ 15115911c8feSDavid Sterba int btrfs_check_shared(struct btrfs_root *root, u64 inum, u64 bytenr, 15125911c8feSDavid Sterba struct ulist *roots, struct ulist *tmp) 1513dc046b10SJosef Bacik { 1514bb739cf0SEdmund Nadolski struct btrfs_fs_info *fs_info = root->fs_info; 1515bb739cf0SEdmund Nadolski struct btrfs_trans_handle *trans; 1516dc046b10SJosef Bacik struct ulist_iterator uiter; 1517dc046b10SJosef Bacik struct ulist_node *node; 15183284da7bSDavid Sterba struct seq_list elem = SEQ_LIST_INIT(elem); 1519dc046b10SJosef Bacik int ret = 0; 15203ec4d323SEdmund Nadolski struct share_check shared = { 15214fd786e6SMisono Tomohiro .root_objectid = root->root_key.objectid, 15223ec4d323SEdmund Nadolski .inum = inum, 15233ec4d323SEdmund Nadolski .share_count = 0, 15243ec4d323SEdmund Nadolski }; 1525dc046b10SJosef Bacik 15265911c8feSDavid Sterba ulist_init(roots); 15275911c8feSDavid Sterba ulist_init(tmp); 1528dc046b10SJosef Bacik 1529a6d155d2SFilipe Manana trans = btrfs_join_transaction_nostart(root); 1530bb739cf0SEdmund Nadolski if (IS_ERR(trans)) { 153103628cdbSFilipe Manana if (PTR_ERR(trans) != -ENOENT && PTR_ERR(trans) != -EROFS) { 153203628cdbSFilipe Manana ret = PTR_ERR(trans); 153303628cdbSFilipe Manana goto out; 153403628cdbSFilipe Manana } 1535bb739cf0SEdmund Nadolski trans = NULL; 1536dc046b10SJosef Bacik down_read(&fs_info->commit_root_sem); 1537bb739cf0SEdmund Nadolski } else { 1538bb739cf0SEdmund Nadolski btrfs_get_tree_mod_seq(fs_info, &elem); 1539bb739cf0SEdmund Nadolski } 1540bb739cf0SEdmund Nadolski 1541dc046b10SJosef Bacik ULIST_ITER_INIT(&uiter); 1542dc046b10SJosef Bacik while (1) { 1543dc046b10SJosef Bacik ret = find_parent_nodes(trans, fs_info, bytenr, elem.seq, tmp, 1544c995ab3cSZygo Blaxell roots, NULL, &shared, false); 1545dc046b10SJosef Bacik if (ret == BACKREF_FOUND_SHARED) { 15462c2ed5aaSMark Fasheh /* this is the only condition under which we return 1 */ 1547dc046b10SJosef Bacik ret = 1; 1548dc046b10SJosef Bacik break; 1549dc046b10SJosef Bacik } 1550dc046b10SJosef Bacik if (ret < 0 && ret != -ENOENT) 1551dc046b10SJosef Bacik break; 15522c2ed5aaSMark Fasheh ret = 0; 1553dc046b10SJosef Bacik node = ulist_next(tmp, &uiter); 1554dc046b10SJosef Bacik if (!node) 1555dc046b10SJosef Bacik break; 1556dc046b10SJosef Bacik bytenr = node->val; 155718bf591bSEdmund Nadolski shared.share_count = 0; 1558dc046b10SJosef Bacik cond_resched(); 1559dc046b10SJosef Bacik } 1560bb739cf0SEdmund Nadolski 1561bb739cf0SEdmund Nadolski if (trans) { 1562dc046b10SJosef Bacik btrfs_put_tree_mod_seq(fs_info, &elem); 1563bb739cf0SEdmund Nadolski btrfs_end_transaction(trans); 1564bb739cf0SEdmund Nadolski } else { 1565dc046b10SJosef Bacik up_read(&fs_info->commit_root_sem); 1566bb739cf0SEdmund Nadolski } 156703628cdbSFilipe Manana out: 15685911c8feSDavid Sterba ulist_release(roots); 15695911c8feSDavid Sterba ulist_release(tmp); 1570dc046b10SJosef Bacik return ret; 1571dc046b10SJosef Bacik } 1572dc046b10SJosef Bacik 1573f186373fSMark Fasheh int btrfs_find_one_extref(struct btrfs_root *root, u64 inode_objectid, 1574f186373fSMark Fasheh u64 start_off, struct btrfs_path *path, 1575f186373fSMark Fasheh struct btrfs_inode_extref **ret_extref, 1576f186373fSMark Fasheh u64 *found_off) 1577f186373fSMark Fasheh { 1578f186373fSMark Fasheh int ret, slot; 1579f186373fSMark Fasheh struct btrfs_key key; 1580f186373fSMark Fasheh struct btrfs_key found_key; 1581f186373fSMark Fasheh struct btrfs_inode_extref *extref; 158273980becSJeff Mahoney const struct extent_buffer *leaf; 1583f186373fSMark Fasheh unsigned long ptr; 1584f186373fSMark Fasheh 1585f186373fSMark Fasheh key.objectid = inode_objectid; 1586962a298fSDavid Sterba key.type = BTRFS_INODE_EXTREF_KEY; 1587f186373fSMark Fasheh key.offset = start_off; 1588f186373fSMark Fasheh 1589f186373fSMark Fasheh ret = btrfs_search_slot(NULL, root, &key, path, 0, 0); 1590f186373fSMark Fasheh if (ret < 0) 1591f186373fSMark Fasheh return ret; 1592f186373fSMark Fasheh 1593f186373fSMark Fasheh while (1) { 1594f186373fSMark Fasheh leaf = path->nodes[0]; 1595f186373fSMark Fasheh slot = path->slots[0]; 1596f186373fSMark Fasheh if (slot >= btrfs_header_nritems(leaf)) { 1597f186373fSMark Fasheh /* 1598f186373fSMark Fasheh * If the item at offset is not found, 1599f186373fSMark Fasheh * btrfs_search_slot will point us to the slot 1600f186373fSMark Fasheh * where it should be inserted. In our case 1601f186373fSMark Fasheh * that will be the slot directly before the 1602f186373fSMark Fasheh * next INODE_REF_KEY_V2 item. In the case 1603f186373fSMark Fasheh * that we're pointing to the last slot in a 1604f186373fSMark Fasheh * leaf, we must move one leaf over. 1605f186373fSMark Fasheh */ 1606f186373fSMark Fasheh ret = btrfs_next_leaf(root, path); 1607f186373fSMark Fasheh if (ret) { 1608f186373fSMark Fasheh if (ret >= 1) 1609f186373fSMark Fasheh ret = -ENOENT; 1610f186373fSMark Fasheh break; 1611f186373fSMark Fasheh } 1612f186373fSMark Fasheh continue; 1613f186373fSMark Fasheh } 1614f186373fSMark Fasheh 1615f186373fSMark Fasheh btrfs_item_key_to_cpu(leaf, &found_key, slot); 1616f186373fSMark Fasheh 1617f186373fSMark Fasheh /* 1618f186373fSMark Fasheh * Check that we're still looking at an extended ref key for 1619f186373fSMark Fasheh * this particular objectid. If we have different 1620f186373fSMark Fasheh * objectid or type then there are no more to be found 1621f186373fSMark Fasheh * in the tree and we can exit. 1622f186373fSMark Fasheh */ 1623f186373fSMark Fasheh ret = -ENOENT; 1624f186373fSMark Fasheh if (found_key.objectid != inode_objectid) 1625f186373fSMark Fasheh break; 1626962a298fSDavid Sterba if (found_key.type != BTRFS_INODE_EXTREF_KEY) 1627f186373fSMark Fasheh break; 1628f186373fSMark Fasheh 1629f186373fSMark Fasheh ret = 0; 1630f186373fSMark Fasheh ptr = btrfs_item_ptr_offset(leaf, path->slots[0]); 1631f186373fSMark Fasheh extref = (struct btrfs_inode_extref *)ptr; 1632f186373fSMark Fasheh *ret_extref = extref; 1633f186373fSMark Fasheh if (found_off) 1634f186373fSMark Fasheh *found_off = found_key.offset; 1635f186373fSMark Fasheh break; 1636f186373fSMark Fasheh } 1637f186373fSMark Fasheh 1638f186373fSMark Fasheh return ret; 1639f186373fSMark Fasheh } 1640f186373fSMark Fasheh 164148a3b636SEric Sandeen /* 164248a3b636SEric Sandeen * this iterates to turn a name (from iref/extref) into a full filesystem path. 164348a3b636SEric Sandeen * Elements of the path are separated by '/' and the path is guaranteed to be 164448a3b636SEric Sandeen * 0-terminated. the path is only given within the current file system. 164548a3b636SEric Sandeen * Therefore, it never starts with a '/'. the caller is responsible to provide 164648a3b636SEric Sandeen * "size" bytes in "dest". the dest buffer will be filled backwards. finally, 164748a3b636SEric Sandeen * the start point of the resulting string is returned. this pointer is within 164848a3b636SEric Sandeen * dest, normally. 164948a3b636SEric Sandeen * in case the path buffer would overflow, the pointer is decremented further 165048a3b636SEric Sandeen * as if output was written to the buffer, though no more output is actually 165148a3b636SEric Sandeen * generated. that way, the caller can determine how much space would be 165248a3b636SEric Sandeen * required for the path to fit into the buffer. in that case, the returned 165348a3b636SEric Sandeen * value will be smaller than dest. callers must check this! 165448a3b636SEric Sandeen */ 165596b5bd77SJan Schmidt char *btrfs_ref_to_path(struct btrfs_root *fs_root, struct btrfs_path *path, 1656d24bec3aSMark Fasheh u32 name_len, unsigned long name_off, 1657a542ad1bSJan Schmidt struct extent_buffer *eb_in, u64 parent, 1658a542ad1bSJan Schmidt char *dest, u32 size) 1659a542ad1bSJan Schmidt { 1660a542ad1bSJan Schmidt int slot; 1661a542ad1bSJan Schmidt u64 next_inum; 1662a542ad1bSJan Schmidt int ret; 1663661bec6bSGabriel de Perthuis s64 bytes_left = ((s64)size) - 1; 1664a542ad1bSJan Schmidt struct extent_buffer *eb = eb_in; 1665a542ad1bSJan Schmidt struct btrfs_key found_key; 1666b916a59aSJan Schmidt int leave_spinning = path->leave_spinning; 1667d24bec3aSMark Fasheh struct btrfs_inode_ref *iref; 1668a542ad1bSJan Schmidt 1669a542ad1bSJan Schmidt if (bytes_left >= 0) 1670a542ad1bSJan Schmidt dest[bytes_left] = '\0'; 1671a542ad1bSJan Schmidt 1672b916a59aSJan Schmidt path->leave_spinning = 1; 1673a542ad1bSJan Schmidt while (1) { 1674d24bec3aSMark Fasheh bytes_left -= name_len; 1675a542ad1bSJan Schmidt if (bytes_left >= 0) 1676a542ad1bSJan Schmidt read_extent_buffer(eb, dest + bytes_left, 1677d24bec3aSMark Fasheh name_off, name_len); 1678b916a59aSJan Schmidt if (eb != eb_in) { 16790c0fe3b0SFilipe Manana if (!path->skip_locking) 1680b916a59aSJan Schmidt btrfs_tree_read_unlock_blocking(eb); 1681a542ad1bSJan Schmidt free_extent_buffer(eb); 1682b916a59aSJan Schmidt } 1683c234a24dSDavid Sterba ret = btrfs_find_item(fs_root, path, parent, 0, 1684c234a24dSDavid Sterba BTRFS_INODE_REF_KEY, &found_key); 16858f24b496SJan Schmidt if (ret > 0) 16868f24b496SJan Schmidt ret = -ENOENT; 1687a542ad1bSJan Schmidt if (ret) 1688a542ad1bSJan Schmidt break; 1689d24bec3aSMark Fasheh 1690a542ad1bSJan Schmidt next_inum = found_key.offset; 1691a542ad1bSJan Schmidt 1692a542ad1bSJan Schmidt /* regular exit ahead */ 1693a542ad1bSJan Schmidt if (parent == next_inum) 1694a542ad1bSJan Schmidt break; 1695a542ad1bSJan Schmidt 1696a542ad1bSJan Schmidt slot = path->slots[0]; 1697a542ad1bSJan Schmidt eb = path->nodes[0]; 1698a542ad1bSJan Schmidt /* make sure we can use eb after releasing the path */ 1699b916a59aSJan Schmidt if (eb != eb_in) { 17000c0fe3b0SFilipe Manana if (!path->skip_locking) 1701300aa896SDavid Sterba btrfs_set_lock_blocking_read(eb); 17020c0fe3b0SFilipe Manana path->nodes[0] = NULL; 17030c0fe3b0SFilipe Manana path->locks[0] = 0; 1704b916a59aSJan Schmidt } 1705a542ad1bSJan Schmidt btrfs_release_path(path); 1706a542ad1bSJan Schmidt iref = btrfs_item_ptr(eb, slot, struct btrfs_inode_ref); 1707d24bec3aSMark Fasheh 1708d24bec3aSMark Fasheh name_len = btrfs_inode_ref_name_len(eb, iref); 1709d24bec3aSMark Fasheh name_off = (unsigned long)(iref + 1); 1710d24bec3aSMark Fasheh 1711a542ad1bSJan Schmidt parent = next_inum; 1712a542ad1bSJan Schmidt --bytes_left; 1713a542ad1bSJan Schmidt if (bytes_left >= 0) 1714a542ad1bSJan Schmidt dest[bytes_left] = '/'; 1715a542ad1bSJan Schmidt } 1716a542ad1bSJan Schmidt 1717a542ad1bSJan Schmidt btrfs_release_path(path); 1718b916a59aSJan Schmidt path->leave_spinning = leave_spinning; 1719a542ad1bSJan Schmidt 1720a542ad1bSJan Schmidt if (ret) 1721a542ad1bSJan Schmidt return ERR_PTR(ret); 1722a542ad1bSJan Schmidt 1723a542ad1bSJan Schmidt return dest + bytes_left; 1724a542ad1bSJan Schmidt } 1725a542ad1bSJan Schmidt 1726a542ad1bSJan Schmidt /* 1727a542ad1bSJan Schmidt * this makes the path point to (logical EXTENT_ITEM *) 1728a542ad1bSJan Schmidt * returns BTRFS_EXTENT_FLAG_DATA for data, BTRFS_EXTENT_FLAG_TREE_BLOCK for 1729a542ad1bSJan Schmidt * tree blocks and <0 on error. 1730a542ad1bSJan Schmidt */ 1731a542ad1bSJan Schmidt int extent_from_logical(struct btrfs_fs_info *fs_info, u64 logical, 173269917e43SLiu Bo struct btrfs_path *path, struct btrfs_key *found_key, 173369917e43SLiu Bo u64 *flags_ret) 1734a542ad1bSJan Schmidt { 1735a542ad1bSJan Schmidt int ret; 1736a542ad1bSJan Schmidt u64 flags; 1737261c84b6SJosef Bacik u64 size = 0; 1738a542ad1bSJan Schmidt u32 item_size; 173973980becSJeff Mahoney const struct extent_buffer *eb; 1740a542ad1bSJan Schmidt struct btrfs_extent_item *ei; 1741a542ad1bSJan Schmidt struct btrfs_key key; 1742a542ad1bSJan Schmidt 1743261c84b6SJosef Bacik if (btrfs_fs_incompat(fs_info, SKINNY_METADATA)) 1744261c84b6SJosef Bacik key.type = BTRFS_METADATA_ITEM_KEY; 1745261c84b6SJosef Bacik else 1746a542ad1bSJan Schmidt key.type = BTRFS_EXTENT_ITEM_KEY; 1747a542ad1bSJan Schmidt key.objectid = logical; 1748a542ad1bSJan Schmidt key.offset = (u64)-1; 1749a542ad1bSJan Schmidt 1750a542ad1bSJan Schmidt ret = btrfs_search_slot(NULL, fs_info->extent_root, &key, path, 0, 0); 1751a542ad1bSJan Schmidt if (ret < 0) 1752a542ad1bSJan Schmidt return ret; 1753a542ad1bSJan Schmidt 1754850a8cdfSWang Shilong ret = btrfs_previous_extent_item(fs_info->extent_root, path, 0); 1755850a8cdfSWang Shilong if (ret) { 1756850a8cdfSWang Shilong if (ret > 0) 1757580f0a67SJosef Bacik ret = -ENOENT; 1758580f0a67SJosef Bacik return ret; 1759580f0a67SJosef Bacik } 1760850a8cdfSWang Shilong btrfs_item_key_to_cpu(path->nodes[0], found_key, path->slots[0]); 1761261c84b6SJosef Bacik if (found_key->type == BTRFS_METADATA_ITEM_KEY) 1762da17066cSJeff Mahoney size = fs_info->nodesize; 1763261c84b6SJosef Bacik else if (found_key->type == BTRFS_EXTENT_ITEM_KEY) 1764261c84b6SJosef Bacik size = found_key->offset; 1765261c84b6SJosef Bacik 1766580f0a67SJosef Bacik if (found_key->objectid > logical || 1767261c84b6SJosef Bacik found_key->objectid + size <= logical) { 1768ab8d0fc4SJeff Mahoney btrfs_debug(fs_info, 1769ab8d0fc4SJeff Mahoney "logical %llu is not within any extent", logical); 1770a542ad1bSJan Schmidt return -ENOENT; 17714692cf58SJan Schmidt } 1772a542ad1bSJan Schmidt 1773a542ad1bSJan Schmidt eb = path->nodes[0]; 1774a542ad1bSJan Schmidt item_size = btrfs_item_size_nr(eb, path->slots[0]); 1775a542ad1bSJan Schmidt BUG_ON(item_size < sizeof(*ei)); 1776a542ad1bSJan Schmidt 1777a542ad1bSJan Schmidt ei = btrfs_item_ptr(eb, path->slots[0], struct btrfs_extent_item); 1778a542ad1bSJan Schmidt flags = btrfs_extent_flags(eb, ei); 1779a542ad1bSJan Schmidt 1780ab8d0fc4SJeff Mahoney btrfs_debug(fs_info, 1781ab8d0fc4SJeff Mahoney "logical %llu is at position %llu within the extent (%llu EXTENT_ITEM %llu) flags %#llx size %u", 1782c1c9ff7cSGeert Uytterhoeven logical, logical - found_key->objectid, found_key->objectid, 1783c1c9ff7cSGeert Uytterhoeven found_key->offset, flags, item_size); 178469917e43SLiu Bo 178569917e43SLiu Bo WARN_ON(!flags_ret); 178669917e43SLiu Bo if (flags_ret) { 1787a542ad1bSJan Schmidt if (flags & BTRFS_EXTENT_FLAG_TREE_BLOCK) 178869917e43SLiu Bo *flags_ret = BTRFS_EXTENT_FLAG_TREE_BLOCK; 178969917e43SLiu Bo else if (flags & BTRFS_EXTENT_FLAG_DATA) 179069917e43SLiu Bo *flags_ret = BTRFS_EXTENT_FLAG_DATA; 179169917e43SLiu Bo else 1792290342f6SArnd Bergmann BUG(); 179369917e43SLiu Bo return 0; 179469917e43SLiu Bo } 1795a542ad1bSJan Schmidt 1796a542ad1bSJan Schmidt return -EIO; 1797a542ad1bSJan Schmidt } 1798a542ad1bSJan Schmidt 1799a542ad1bSJan Schmidt /* 1800a542ad1bSJan Schmidt * helper function to iterate extent inline refs. ptr must point to a 0 value 1801a542ad1bSJan Schmidt * for the first call and may be modified. it is used to track state. 1802a542ad1bSJan Schmidt * if more refs exist, 0 is returned and the next call to 1803e0c476b1SJeff Mahoney * get_extent_inline_ref must pass the modified ptr parameter to get the 1804a542ad1bSJan Schmidt * next ref. after the last ref was processed, 1 is returned. 1805a542ad1bSJan Schmidt * returns <0 on error 1806a542ad1bSJan Schmidt */ 1807e0c476b1SJeff Mahoney static int get_extent_inline_ref(unsigned long *ptr, 180873980becSJeff Mahoney const struct extent_buffer *eb, 180973980becSJeff Mahoney const struct btrfs_key *key, 181073980becSJeff Mahoney const struct btrfs_extent_item *ei, 181173980becSJeff Mahoney u32 item_size, 1812a542ad1bSJan Schmidt struct btrfs_extent_inline_ref **out_eiref, 1813a542ad1bSJan Schmidt int *out_type) 1814a542ad1bSJan Schmidt { 1815a542ad1bSJan Schmidt unsigned long end; 1816a542ad1bSJan Schmidt u64 flags; 1817a542ad1bSJan Schmidt struct btrfs_tree_block_info *info; 1818a542ad1bSJan Schmidt 1819a542ad1bSJan Schmidt if (!*ptr) { 1820a542ad1bSJan Schmidt /* first call */ 1821a542ad1bSJan Schmidt flags = btrfs_extent_flags(eb, ei); 1822a542ad1bSJan Schmidt if (flags & BTRFS_EXTENT_FLAG_TREE_BLOCK) { 18236eda71d0SLiu Bo if (key->type == BTRFS_METADATA_ITEM_KEY) { 18246eda71d0SLiu Bo /* a skinny metadata extent */ 18256eda71d0SLiu Bo *out_eiref = 18266eda71d0SLiu Bo (struct btrfs_extent_inline_ref *)(ei + 1); 18276eda71d0SLiu Bo } else { 18286eda71d0SLiu Bo WARN_ON(key->type != BTRFS_EXTENT_ITEM_KEY); 1829a542ad1bSJan Schmidt info = (struct btrfs_tree_block_info *)(ei + 1); 1830a542ad1bSJan Schmidt *out_eiref = 1831a542ad1bSJan Schmidt (struct btrfs_extent_inline_ref *)(info + 1); 18326eda71d0SLiu Bo } 1833a542ad1bSJan Schmidt } else { 1834a542ad1bSJan Schmidt *out_eiref = (struct btrfs_extent_inline_ref *)(ei + 1); 1835a542ad1bSJan Schmidt } 1836a542ad1bSJan Schmidt *ptr = (unsigned long)*out_eiref; 1837cd857dd6SLiu Bo if ((unsigned long)(*ptr) >= (unsigned long)ei + item_size) 1838a542ad1bSJan Schmidt return -ENOENT; 1839a542ad1bSJan Schmidt } 1840a542ad1bSJan Schmidt 1841a542ad1bSJan Schmidt end = (unsigned long)ei + item_size; 18426eda71d0SLiu Bo *out_eiref = (struct btrfs_extent_inline_ref *)(*ptr); 18433de28d57SLiu Bo *out_type = btrfs_get_extent_inline_ref_type(eb, *out_eiref, 18443de28d57SLiu Bo BTRFS_REF_TYPE_ANY); 18453de28d57SLiu Bo if (*out_type == BTRFS_REF_TYPE_INVALID) 1846af431dcbSSu Yue return -EUCLEAN; 1847a542ad1bSJan Schmidt 1848a542ad1bSJan Schmidt *ptr += btrfs_extent_inline_ref_size(*out_type); 1849a542ad1bSJan Schmidt WARN_ON(*ptr > end); 1850a542ad1bSJan Schmidt if (*ptr == end) 1851a542ad1bSJan Schmidt return 1; /* last */ 1852a542ad1bSJan Schmidt 1853a542ad1bSJan Schmidt return 0; 1854a542ad1bSJan Schmidt } 1855a542ad1bSJan Schmidt 1856a542ad1bSJan Schmidt /* 1857a542ad1bSJan Schmidt * reads the tree block backref for an extent. tree level and root are returned 1858a542ad1bSJan Schmidt * through out_level and out_root. ptr must point to a 0 value for the first 1859e0c476b1SJeff Mahoney * call and may be modified (see get_extent_inline_ref comment). 1860a542ad1bSJan Schmidt * returns 0 if data was provided, 1 if there was no more data to provide or 1861a542ad1bSJan Schmidt * <0 on error. 1862a542ad1bSJan Schmidt */ 1863a542ad1bSJan Schmidt int tree_backref_for_extent(unsigned long *ptr, struct extent_buffer *eb, 18646eda71d0SLiu Bo struct btrfs_key *key, struct btrfs_extent_item *ei, 18656eda71d0SLiu Bo u32 item_size, u64 *out_root, u8 *out_level) 1866a542ad1bSJan Schmidt { 1867a542ad1bSJan Schmidt int ret; 1868a542ad1bSJan Schmidt int type; 1869a542ad1bSJan Schmidt struct btrfs_extent_inline_ref *eiref; 1870a542ad1bSJan Schmidt 1871a542ad1bSJan Schmidt if (*ptr == (unsigned long)-1) 1872a542ad1bSJan Schmidt return 1; 1873a542ad1bSJan Schmidt 1874a542ad1bSJan Schmidt while (1) { 1875e0c476b1SJeff Mahoney ret = get_extent_inline_ref(ptr, eb, key, ei, item_size, 1876a542ad1bSJan Schmidt &eiref, &type); 1877a542ad1bSJan Schmidt if (ret < 0) 1878a542ad1bSJan Schmidt return ret; 1879a542ad1bSJan Schmidt 1880a542ad1bSJan Schmidt if (type == BTRFS_TREE_BLOCK_REF_KEY || 1881a542ad1bSJan Schmidt type == BTRFS_SHARED_BLOCK_REF_KEY) 1882a542ad1bSJan Schmidt break; 1883a542ad1bSJan Schmidt 1884a542ad1bSJan Schmidt if (ret == 1) 1885a542ad1bSJan Schmidt return 1; 1886a542ad1bSJan Schmidt } 1887a542ad1bSJan Schmidt 1888a542ad1bSJan Schmidt /* we can treat both ref types equally here */ 1889a542ad1bSJan Schmidt *out_root = btrfs_extent_inline_ref_offset(eb, eiref); 1890a1317f45SFilipe Manana 1891a1317f45SFilipe Manana if (key->type == BTRFS_EXTENT_ITEM_KEY) { 1892a1317f45SFilipe Manana struct btrfs_tree_block_info *info; 1893a1317f45SFilipe Manana 1894a1317f45SFilipe Manana info = (struct btrfs_tree_block_info *)(ei + 1); 1895a542ad1bSJan Schmidt *out_level = btrfs_tree_block_level(eb, info); 1896a1317f45SFilipe Manana } else { 1897a1317f45SFilipe Manana ASSERT(key->type == BTRFS_METADATA_ITEM_KEY); 1898a1317f45SFilipe Manana *out_level = (u8)key->offset; 1899a1317f45SFilipe Manana } 1900a542ad1bSJan Schmidt 1901a542ad1bSJan Schmidt if (ret == 1) 1902a542ad1bSJan Schmidt *ptr = (unsigned long)-1; 1903a542ad1bSJan Schmidt 1904a542ad1bSJan Schmidt return 0; 1905a542ad1bSJan Schmidt } 1906a542ad1bSJan Schmidt 1907ab8d0fc4SJeff Mahoney static int iterate_leaf_refs(struct btrfs_fs_info *fs_info, 1908ab8d0fc4SJeff Mahoney struct extent_inode_elem *inode_list, 1909976b1908SJan Schmidt u64 root, u64 extent_item_objectid, 19104692cf58SJan Schmidt iterate_extent_inodes_t *iterate, void *ctx) 1911a542ad1bSJan Schmidt { 1912976b1908SJan Schmidt struct extent_inode_elem *eie; 19134692cf58SJan Schmidt int ret = 0; 1914a542ad1bSJan Schmidt 1915976b1908SJan Schmidt for (eie = inode_list; eie; eie = eie->next) { 1916ab8d0fc4SJeff Mahoney btrfs_debug(fs_info, 1917ab8d0fc4SJeff Mahoney "ref for %llu resolved, key (%llu EXTEND_DATA %llu), root %llu", 1918ab8d0fc4SJeff Mahoney extent_item_objectid, eie->inum, 1919ab8d0fc4SJeff Mahoney eie->offset, root); 1920976b1908SJan Schmidt ret = iterate(eie->inum, eie->offset, root, ctx); 19214692cf58SJan Schmidt if (ret) { 1922ab8d0fc4SJeff Mahoney btrfs_debug(fs_info, 1923ab8d0fc4SJeff Mahoney "stopping iteration for %llu due to ret=%d", 1924976b1908SJan Schmidt extent_item_objectid, ret); 1925a542ad1bSJan Schmidt break; 1926a542ad1bSJan Schmidt } 1927a542ad1bSJan Schmidt } 1928a542ad1bSJan Schmidt 1929a542ad1bSJan Schmidt return ret; 1930a542ad1bSJan Schmidt } 1931a542ad1bSJan Schmidt 1932a542ad1bSJan Schmidt /* 1933a542ad1bSJan Schmidt * calls iterate() for every inode that references the extent identified by 19344692cf58SJan Schmidt * the given parameters. 1935a542ad1bSJan Schmidt * when the iterator function returns a non-zero value, iteration stops. 1936a542ad1bSJan Schmidt */ 1937a542ad1bSJan Schmidt int iterate_extent_inodes(struct btrfs_fs_info *fs_info, 19384692cf58SJan Schmidt u64 extent_item_objectid, u64 extent_item_pos, 19397a3ae2f8SJan Schmidt int search_commit_root, 1940c995ab3cSZygo Blaxell iterate_extent_inodes_t *iterate, void *ctx, 1941c995ab3cSZygo Blaxell bool ignore_offset) 1942a542ad1bSJan Schmidt { 1943a542ad1bSJan Schmidt int ret; 1944da61d31aSJosef Bacik struct btrfs_trans_handle *trans = NULL; 19457a3ae2f8SJan Schmidt struct ulist *refs = NULL; 19467a3ae2f8SJan Schmidt struct ulist *roots = NULL; 19474692cf58SJan Schmidt struct ulist_node *ref_node = NULL; 19484692cf58SJan Schmidt struct ulist_node *root_node = NULL; 19493284da7bSDavid Sterba struct seq_list tree_mod_seq_elem = SEQ_LIST_INIT(tree_mod_seq_elem); 1950cd1b413cSJan Schmidt struct ulist_iterator ref_uiter; 1951cd1b413cSJan Schmidt struct ulist_iterator root_uiter; 1952a542ad1bSJan Schmidt 1953ab8d0fc4SJeff Mahoney btrfs_debug(fs_info, "resolving all inodes for extent %llu", 19544692cf58SJan Schmidt extent_item_objectid); 19554692cf58SJan Schmidt 1956da61d31aSJosef Bacik if (!search_commit_root) { 1957bfc61c36SFilipe Manana trans = btrfs_attach_transaction(fs_info->extent_root); 1958bfc61c36SFilipe Manana if (IS_ERR(trans)) { 1959bfc61c36SFilipe Manana if (PTR_ERR(trans) != -ENOENT && 1960bfc61c36SFilipe Manana PTR_ERR(trans) != -EROFS) 19617a3ae2f8SJan Schmidt return PTR_ERR(trans); 1962bfc61c36SFilipe Manana trans = NULL; 19637a3ae2f8SJan Schmidt } 1964bfc61c36SFilipe Manana } 1965bfc61c36SFilipe Manana 1966bfc61c36SFilipe Manana if (trans) 1967bfc61c36SFilipe Manana btrfs_get_tree_mod_seq(fs_info, &tree_mod_seq_elem); 1968bfc61c36SFilipe Manana else 1969bfc61c36SFilipe Manana down_read(&fs_info->commit_root_sem); 19704692cf58SJan Schmidt 19714692cf58SJan Schmidt ret = btrfs_find_all_leafs(trans, fs_info, extent_item_objectid, 1972097b8a7cSJan Schmidt tree_mod_seq_elem.seq, &refs, 1973c995ab3cSZygo Blaxell &extent_item_pos, ignore_offset); 19744692cf58SJan Schmidt if (ret) 19754692cf58SJan Schmidt goto out; 19764692cf58SJan Schmidt 1977cd1b413cSJan Schmidt ULIST_ITER_INIT(&ref_uiter); 1978cd1b413cSJan Schmidt while (!ret && (ref_node = ulist_next(refs, &ref_uiter))) { 1979e0c476b1SJeff Mahoney ret = btrfs_find_all_roots_safe(trans, fs_info, ref_node->val, 1980c995ab3cSZygo Blaxell tree_mod_seq_elem.seq, &roots, 1981c995ab3cSZygo Blaxell ignore_offset); 19824692cf58SJan Schmidt if (ret) 1983a542ad1bSJan Schmidt break; 1984cd1b413cSJan Schmidt ULIST_ITER_INIT(&root_uiter); 1985cd1b413cSJan Schmidt while (!ret && (root_node = ulist_next(roots, &root_uiter))) { 1986ab8d0fc4SJeff Mahoney btrfs_debug(fs_info, 1987ab8d0fc4SJeff Mahoney "root %llu references leaf %llu, data list %#llx", 1988ab8d0fc4SJeff Mahoney root_node->val, ref_node->val, 1989c1c9ff7cSGeert Uytterhoeven ref_node->aux); 1990ab8d0fc4SJeff Mahoney ret = iterate_leaf_refs(fs_info, 1991ab8d0fc4SJeff Mahoney (struct extent_inode_elem *) 1992995e01b7SJan Schmidt (uintptr_t)ref_node->aux, 1993995e01b7SJan Schmidt root_node->val, 1994995e01b7SJan Schmidt extent_item_objectid, 1995a542ad1bSJan Schmidt iterate, ctx); 19964692cf58SJan Schmidt } 1997976b1908SJan Schmidt ulist_free(roots); 1998a542ad1bSJan Schmidt } 1999a542ad1bSJan Schmidt 2000976b1908SJan Schmidt free_leaf_list(refs); 20014692cf58SJan Schmidt out: 2002bfc61c36SFilipe Manana if (trans) { 20038445f61cSJan Schmidt btrfs_put_tree_mod_seq(fs_info, &tree_mod_seq_elem); 20043a45bb20SJeff Mahoney btrfs_end_transaction(trans); 20059e351cc8SJosef Bacik } else { 20069e351cc8SJosef Bacik up_read(&fs_info->commit_root_sem); 20077a3ae2f8SJan Schmidt } 20087a3ae2f8SJan Schmidt 2009a542ad1bSJan Schmidt return ret; 2010a542ad1bSJan Schmidt } 2011a542ad1bSJan Schmidt 2012a542ad1bSJan Schmidt int iterate_inodes_from_logical(u64 logical, struct btrfs_fs_info *fs_info, 2013a542ad1bSJan Schmidt struct btrfs_path *path, 2014c995ab3cSZygo Blaxell iterate_extent_inodes_t *iterate, void *ctx, 2015c995ab3cSZygo Blaxell bool ignore_offset) 2016a542ad1bSJan Schmidt { 2017a542ad1bSJan Schmidt int ret; 20184692cf58SJan Schmidt u64 extent_item_pos; 201969917e43SLiu Bo u64 flags = 0; 2020a542ad1bSJan Schmidt struct btrfs_key found_key; 20217a3ae2f8SJan Schmidt int search_commit_root = path->search_commit_root; 2022a542ad1bSJan Schmidt 202369917e43SLiu Bo ret = extent_from_logical(fs_info, logical, path, &found_key, &flags); 20244692cf58SJan Schmidt btrfs_release_path(path); 2025a542ad1bSJan Schmidt if (ret < 0) 2026a542ad1bSJan Schmidt return ret; 202769917e43SLiu Bo if (flags & BTRFS_EXTENT_FLAG_TREE_BLOCK) 20283627bf45SStefan Behrens return -EINVAL; 2029a542ad1bSJan Schmidt 20304692cf58SJan Schmidt extent_item_pos = logical - found_key.objectid; 20317a3ae2f8SJan Schmidt ret = iterate_extent_inodes(fs_info, found_key.objectid, 20327a3ae2f8SJan Schmidt extent_item_pos, search_commit_root, 2033c995ab3cSZygo Blaxell iterate, ctx, ignore_offset); 2034a542ad1bSJan Schmidt 2035a542ad1bSJan Schmidt return ret; 2036a542ad1bSJan Schmidt } 2037a542ad1bSJan Schmidt 2038d24bec3aSMark Fasheh typedef int (iterate_irefs_t)(u64 parent, u32 name_len, unsigned long name_off, 2039d24bec3aSMark Fasheh struct extent_buffer *eb, void *ctx); 2040d24bec3aSMark Fasheh 2041d24bec3aSMark Fasheh static int iterate_inode_refs(u64 inum, struct btrfs_root *fs_root, 2042a542ad1bSJan Schmidt struct btrfs_path *path, 2043a542ad1bSJan Schmidt iterate_irefs_t *iterate, void *ctx) 2044a542ad1bSJan Schmidt { 2045aefc1eb1SJan Schmidt int ret = 0; 2046a542ad1bSJan Schmidt int slot; 2047a542ad1bSJan Schmidt u32 cur; 2048a542ad1bSJan Schmidt u32 len; 2049a542ad1bSJan Schmidt u32 name_len; 2050a542ad1bSJan Schmidt u64 parent = 0; 2051a542ad1bSJan Schmidt int found = 0; 2052a542ad1bSJan Schmidt struct extent_buffer *eb; 2053a542ad1bSJan Schmidt struct btrfs_item *item; 2054a542ad1bSJan Schmidt struct btrfs_inode_ref *iref; 2055a542ad1bSJan Schmidt struct btrfs_key found_key; 2056a542ad1bSJan Schmidt 2057aefc1eb1SJan Schmidt while (!ret) { 2058c234a24dSDavid Sterba ret = btrfs_find_item(fs_root, path, inum, 2059c234a24dSDavid Sterba parent ? parent + 1 : 0, BTRFS_INODE_REF_KEY, 2060a542ad1bSJan Schmidt &found_key); 2061c234a24dSDavid Sterba 2062a542ad1bSJan Schmidt if (ret < 0) 2063a542ad1bSJan Schmidt break; 2064a542ad1bSJan Schmidt if (ret) { 2065a542ad1bSJan Schmidt ret = found ? 0 : -ENOENT; 2066a542ad1bSJan Schmidt break; 2067a542ad1bSJan Schmidt } 2068a542ad1bSJan Schmidt ++found; 2069a542ad1bSJan Schmidt 2070a542ad1bSJan Schmidt parent = found_key.offset; 2071a542ad1bSJan Schmidt slot = path->slots[0]; 20723fe81ce2SFilipe David Borba Manana eb = btrfs_clone_extent_buffer(path->nodes[0]); 20733fe81ce2SFilipe David Borba Manana if (!eb) { 20743fe81ce2SFilipe David Borba Manana ret = -ENOMEM; 20753fe81ce2SFilipe David Borba Manana break; 20763fe81ce2SFilipe David Borba Manana } 2077a542ad1bSJan Schmidt btrfs_release_path(path); 2078a542ad1bSJan Schmidt 2079dd3cc16bSRoss Kirk item = btrfs_item_nr(slot); 2080a542ad1bSJan Schmidt iref = btrfs_item_ptr(eb, slot, struct btrfs_inode_ref); 2081a542ad1bSJan Schmidt 2082a542ad1bSJan Schmidt for (cur = 0; cur < btrfs_item_size(eb, item); cur += len) { 2083a542ad1bSJan Schmidt name_len = btrfs_inode_ref_name_len(eb, iref); 2084a542ad1bSJan Schmidt /* path must be released before calling iterate()! */ 2085ab8d0fc4SJeff Mahoney btrfs_debug(fs_root->fs_info, 2086ab8d0fc4SJeff Mahoney "following ref at offset %u for inode %llu in tree %llu", 20874fd786e6SMisono Tomohiro cur, found_key.objectid, 20884fd786e6SMisono Tomohiro fs_root->root_key.objectid); 2089d24bec3aSMark Fasheh ret = iterate(parent, name_len, 2090d24bec3aSMark Fasheh (unsigned long)(iref + 1), eb, ctx); 2091aefc1eb1SJan Schmidt if (ret) 2092a542ad1bSJan Schmidt break; 2093a542ad1bSJan Schmidt len = sizeof(*iref) + name_len; 2094a542ad1bSJan Schmidt iref = (struct btrfs_inode_ref *)((char *)iref + len); 2095a542ad1bSJan Schmidt } 2096a542ad1bSJan Schmidt free_extent_buffer(eb); 2097a542ad1bSJan Schmidt } 2098a542ad1bSJan Schmidt 2099a542ad1bSJan Schmidt btrfs_release_path(path); 2100a542ad1bSJan Schmidt 2101a542ad1bSJan Schmidt return ret; 2102a542ad1bSJan Schmidt } 2103a542ad1bSJan Schmidt 2104d24bec3aSMark Fasheh static int iterate_inode_extrefs(u64 inum, struct btrfs_root *fs_root, 2105d24bec3aSMark Fasheh struct btrfs_path *path, 2106d24bec3aSMark Fasheh iterate_irefs_t *iterate, void *ctx) 2107d24bec3aSMark Fasheh { 2108d24bec3aSMark Fasheh int ret; 2109d24bec3aSMark Fasheh int slot; 2110d24bec3aSMark Fasheh u64 offset = 0; 2111d24bec3aSMark Fasheh u64 parent; 2112d24bec3aSMark Fasheh int found = 0; 2113d24bec3aSMark Fasheh struct extent_buffer *eb; 2114d24bec3aSMark Fasheh struct btrfs_inode_extref *extref; 2115d24bec3aSMark Fasheh u32 item_size; 2116d24bec3aSMark Fasheh u32 cur_offset; 2117d24bec3aSMark Fasheh unsigned long ptr; 2118d24bec3aSMark Fasheh 2119d24bec3aSMark Fasheh while (1) { 2120d24bec3aSMark Fasheh ret = btrfs_find_one_extref(fs_root, inum, offset, path, &extref, 2121d24bec3aSMark Fasheh &offset); 2122d24bec3aSMark Fasheh if (ret < 0) 2123d24bec3aSMark Fasheh break; 2124d24bec3aSMark Fasheh if (ret) { 2125d24bec3aSMark Fasheh ret = found ? 0 : -ENOENT; 2126d24bec3aSMark Fasheh break; 2127d24bec3aSMark Fasheh } 2128d24bec3aSMark Fasheh ++found; 2129d24bec3aSMark Fasheh 2130d24bec3aSMark Fasheh slot = path->slots[0]; 21313fe81ce2SFilipe David Borba Manana eb = btrfs_clone_extent_buffer(path->nodes[0]); 21323fe81ce2SFilipe David Borba Manana if (!eb) { 21333fe81ce2SFilipe David Borba Manana ret = -ENOMEM; 21343fe81ce2SFilipe David Borba Manana break; 21353fe81ce2SFilipe David Borba Manana } 2136d24bec3aSMark Fasheh btrfs_release_path(path); 2137d24bec3aSMark Fasheh 21382849a854SChris Mason item_size = btrfs_item_size_nr(eb, slot); 21392849a854SChris Mason ptr = btrfs_item_ptr_offset(eb, slot); 2140d24bec3aSMark Fasheh cur_offset = 0; 2141d24bec3aSMark Fasheh 2142d24bec3aSMark Fasheh while (cur_offset < item_size) { 2143d24bec3aSMark Fasheh u32 name_len; 2144d24bec3aSMark Fasheh 2145d24bec3aSMark Fasheh extref = (struct btrfs_inode_extref *)(ptr + cur_offset); 2146d24bec3aSMark Fasheh parent = btrfs_inode_extref_parent(eb, extref); 2147d24bec3aSMark Fasheh name_len = btrfs_inode_extref_name_len(eb, extref); 2148d24bec3aSMark Fasheh ret = iterate(parent, name_len, 2149d24bec3aSMark Fasheh (unsigned long)&extref->name, eb, ctx); 2150d24bec3aSMark Fasheh if (ret) 2151d24bec3aSMark Fasheh break; 2152d24bec3aSMark Fasheh 21532849a854SChris Mason cur_offset += btrfs_inode_extref_name_len(eb, extref); 2154d24bec3aSMark Fasheh cur_offset += sizeof(*extref); 2155d24bec3aSMark Fasheh } 2156d24bec3aSMark Fasheh free_extent_buffer(eb); 2157d24bec3aSMark Fasheh 2158d24bec3aSMark Fasheh offset++; 2159d24bec3aSMark Fasheh } 2160d24bec3aSMark Fasheh 2161d24bec3aSMark Fasheh btrfs_release_path(path); 2162d24bec3aSMark Fasheh 2163d24bec3aSMark Fasheh return ret; 2164d24bec3aSMark Fasheh } 2165d24bec3aSMark Fasheh 2166d24bec3aSMark Fasheh static int iterate_irefs(u64 inum, struct btrfs_root *fs_root, 2167d24bec3aSMark Fasheh struct btrfs_path *path, iterate_irefs_t *iterate, 2168d24bec3aSMark Fasheh void *ctx) 2169d24bec3aSMark Fasheh { 2170d24bec3aSMark Fasheh int ret; 2171d24bec3aSMark Fasheh int found_refs = 0; 2172d24bec3aSMark Fasheh 2173d24bec3aSMark Fasheh ret = iterate_inode_refs(inum, fs_root, path, iterate, ctx); 2174d24bec3aSMark Fasheh if (!ret) 2175d24bec3aSMark Fasheh ++found_refs; 2176d24bec3aSMark Fasheh else if (ret != -ENOENT) 2177d24bec3aSMark Fasheh return ret; 2178d24bec3aSMark Fasheh 2179d24bec3aSMark Fasheh ret = iterate_inode_extrefs(inum, fs_root, path, iterate, ctx); 2180d24bec3aSMark Fasheh if (ret == -ENOENT && found_refs) 2181d24bec3aSMark Fasheh return 0; 2182d24bec3aSMark Fasheh 2183d24bec3aSMark Fasheh return ret; 2184d24bec3aSMark Fasheh } 2185d24bec3aSMark Fasheh 2186a542ad1bSJan Schmidt /* 2187a542ad1bSJan Schmidt * returns 0 if the path could be dumped (probably truncated) 2188a542ad1bSJan Schmidt * returns <0 in case of an error 2189a542ad1bSJan Schmidt */ 2190d24bec3aSMark Fasheh static int inode_to_path(u64 inum, u32 name_len, unsigned long name_off, 2191a542ad1bSJan Schmidt struct extent_buffer *eb, void *ctx) 2192a542ad1bSJan Schmidt { 2193a542ad1bSJan Schmidt struct inode_fs_paths *ipath = ctx; 2194a542ad1bSJan Schmidt char *fspath; 2195a542ad1bSJan Schmidt char *fspath_min; 2196a542ad1bSJan Schmidt int i = ipath->fspath->elem_cnt; 2197a542ad1bSJan Schmidt const int s_ptr = sizeof(char *); 2198a542ad1bSJan Schmidt u32 bytes_left; 2199a542ad1bSJan Schmidt 2200a542ad1bSJan Schmidt bytes_left = ipath->fspath->bytes_left > s_ptr ? 2201a542ad1bSJan Schmidt ipath->fspath->bytes_left - s_ptr : 0; 2202a542ad1bSJan Schmidt 2203740c3d22SChris Mason fspath_min = (char *)ipath->fspath->val + (i + 1) * s_ptr; 220496b5bd77SJan Schmidt fspath = btrfs_ref_to_path(ipath->fs_root, ipath->btrfs_path, name_len, 220596b5bd77SJan Schmidt name_off, eb, inum, fspath_min, bytes_left); 2206a542ad1bSJan Schmidt if (IS_ERR(fspath)) 2207a542ad1bSJan Schmidt return PTR_ERR(fspath); 2208a542ad1bSJan Schmidt 2209a542ad1bSJan Schmidt if (fspath > fspath_min) { 2210745c4d8eSJeff Mahoney ipath->fspath->val[i] = (u64)(unsigned long)fspath; 2211a542ad1bSJan Schmidt ++ipath->fspath->elem_cnt; 2212a542ad1bSJan Schmidt ipath->fspath->bytes_left = fspath - fspath_min; 2213a542ad1bSJan Schmidt } else { 2214a542ad1bSJan Schmidt ++ipath->fspath->elem_missed; 2215a542ad1bSJan Schmidt ipath->fspath->bytes_missing += fspath_min - fspath; 2216a542ad1bSJan Schmidt ipath->fspath->bytes_left = 0; 2217a542ad1bSJan Schmidt } 2218a542ad1bSJan Schmidt 2219a542ad1bSJan Schmidt return 0; 2220a542ad1bSJan Schmidt } 2221a542ad1bSJan Schmidt 2222a542ad1bSJan Schmidt /* 2223a542ad1bSJan Schmidt * this dumps all file system paths to the inode into the ipath struct, provided 2224a542ad1bSJan Schmidt * is has been created large enough. each path is zero-terminated and accessed 2225740c3d22SChris Mason * from ipath->fspath->val[i]. 2226a542ad1bSJan Schmidt * when it returns, there are ipath->fspath->elem_cnt number of paths available 2227740c3d22SChris Mason * in ipath->fspath->val[]. when the allocated space wasn't sufficient, the 222801327610SNicholas D Steeves * number of missed paths is recorded in ipath->fspath->elem_missed, otherwise, 2229a542ad1bSJan Schmidt * it's zero. ipath->fspath->bytes_missing holds the number of bytes that would 2230a542ad1bSJan Schmidt * have been needed to return all paths. 2231a542ad1bSJan Schmidt */ 2232a542ad1bSJan Schmidt int paths_from_inode(u64 inum, struct inode_fs_paths *ipath) 2233a542ad1bSJan Schmidt { 2234a542ad1bSJan Schmidt return iterate_irefs(inum, ipath->fs_root, ipath->btrfs_path, 2235a542ad1bSJan Schmidt inode_to_path, ipath); 2236a542ad1bSJan Schmidt } 2237a542ad1bSJan Schmidt 2238a542ad1bSJan Schmidt struct btrfs_data_container *init_data_container(u32 total_bytes) 2239a542ad1bSJan Schmidt { 2240a542ad1bSJan Schmidt struct btrfs_data_container *data; 2241a542ad1bSJan Schmidt size_t alloc_bytes; 2242a542ad1bSJan Schmidt 2243a542ad1bSJan Schmidt alloc_bytes = max_t(size_t, total_bytes, sizeof(*data)); 2244f54de068SDavid Sterba data = kvmalloc(alloc_bytes, GFP_KERNEL); 2245a542ad1bSJan Schmidt if (!data) 2246a542ad1bSJan Schmidt return ERR_PTR(-ENOMEM); 2247a542ad1bSJan Schmidt 2248a542ad1bSJan Schmidt if (total_bytes >= sizeof(*data)) { 2249a542ad1bSJan Schmidt data->bytes_left = total_bytes - sizeof(*data); 2250a542ad1bSJan Schmidt data->bytes_missing = 0; 2251a542ad1bSJan Schmidt } else { 2252a542ad1bSJan Schmidt data->bytes_missing = sizeof(*data) - total_bytes; 2253a542ad1bSJan Schmidt data->bytes_left = 0; 2254a542ad1bSJan Schmidt } 2255a542ad1bSJan Schmidt 2256a542ad1bSJan Schmidt data->elem_cnt = 0; 2257a542ad1bSJan Schmidt data->elem_missed = 0; 2258a542ad1bSJan Schmidt 2259a542ad1bSJan Schmidt return data; 2260a542ad1bSJan Schmidt } 2261a542ad1bSJan Schmidt 2262a542ad1bSJan Schmidt /* 2263a542ad1bSJan Schmidt * allocates space to return multiple file system paths for an inode. 2264a542ad1bSJan Schmidt * total_bytes to allocate are passed, note that space usable for actual path 2265a542ad1bSJan Schmidt * information will be total_bytes - sizeof(struct inode_fs_paths). 2266a542ad1bSJan Schmidt * the returned pointer must be freed with free_ipath() in the end. 2267a542ad1bSJan Schmidt */ 2268a542ad1bSJan Schmidt struct inode_fs_paths *init_ipath(s32 total_bytes, struct btrfs_root *fs_root, 2269a542ad1bSJan Schmidt struct btrfs_path *path) 2270a542ad1bSJan Schmidt { 2271a542ad1bSJan Schmidt struct inode_fs_paths *ifp; 2272a542ad1bSJan Schmidt struct btrfs_data_container *fspath; 2273a542ad1bSJan Schmidt 2274a542ad1bSJan Schmidt fspath = init_data_container(total_bytes); 2275a542ad1bSJan Schmidt if (IS_ERR(fspath)) 2276afc6961fSMisono Tomohiro return ERR_CAST(fspath); 2277a542ad1bSJan Schmidt 2278f54de068SDavid Sterba ifp = kmalloc(sizeof(*ifp), GFP_KERNEL); 2279a542ad1bSJan Schmidt if (!ifp) { 2280f54de068SDavid Sterba kvfree(fspath); 2281a542ad1bSJan Schmidt return ERR_PTR(-ENOMEM); 2282a542ad1bSJan Schmidt } 2283a542ad1bSJan Schmidt 2284a542ad1bSJan Schmidt ifp->btrfs_path = path; 2285a542ad1bSJan Schmidt ifp->fspath = fspath; 2286a542ad1bSJan Schmidt ifp->fs_root = fs_root; 2287a542ad1bSJan Schmidt 2288a542ad1bSJan Schmidt return ifp; 2289a542ad1bSJan Schmidt } 2290a542ad1bSJan Schmidt 2291a542ad1bSJan Schmidt void free_ipath(struct inode_fs_paths *ipath) 2292a542ad1bSJan Schmidt { 22934735fb28SJesper Juhl if (!ipath) 22944735fb28SJesper Juhl return; 2295f54de068SDavid Sterba kvfree(ipath->fspath); 2296a542ad1bSJan Schmidt kfree(ipath); 2297a542ad1bSJan Schmidt } 2298a37f232bSQu Wenruo 2299a37f232bSQu Wenruo struct btrfs_backref_iter *btrfs_backref_iter_alloc( 2300a37f232bSQu Wenruo struct btrfs_fs_info *fs_info, gfp_t gfp_flag) 2301a37f232bSQu Wenruo { 2302a37f232bSQu Wenruo struct btrfs_backref_iter *ret; 2303a37f232bSQu Wenruo 2304a37f232bSQu Wenruo ret = kzalloc(sizeof(*ret), gfp_flag); 2305a37f232bSQu Wenruo if (!ret) 2306a37f232bSQu Wenruo return NULL; 2307a37f232bSQu Wenruo 2308a37f232bSQu Wenruo ret->path = btrfs_alloc_path(); 2309a37f232bSQu Wenruo if (!ret) { 2310a37f232bSQu Wenruo kfree(ret); 2311a37f232bSQu Wenruo return NULL; 2312a37f232bSQu Wenruo } 2313a37f232bSQu Wenruo 2314a37f232bSQu Wenruo /* Current backref iterator only supports iteration in commit root */ 2315a37f232bSQu Wenruo ret->path->search_commit_root = 1; 2316a37f232bSQu Wenruo ret->path->skip_locking = 1; 2317a37f232bSQu Wenruo ret->fs_info = fs_info; 2318a37f232bSQu Wenruo 2319a37f232bSQu Wenruo return ret; 2320a37f232bSQu Wenruo } 2321a37f232bSQu Wenruo 2322a37f232bSQu Wenruo int btrfs_backref_iter_start(struct btrfs_backref_iter *iter, u64 bytenr) 2323a37f232bSQu Wenruo { 2324a37f232bSQu Wenruo struct btrfs_fs_info *fs_info = iter->fs_info; 2325a37f232bSQu Wenruo struct btrfs_path *path = iter->path; 2326a37f232bSQu Wenruo struct btrfs_extent_item *ei; 2327a37f232bSQu Wenruo struct btrfs_key key; 2328a37f232bSQu Wenruo int ret; 2329a37f232bSQu Wenruo 2330a37f232bSQu Wenruo key.objectid = bytenr; 2331a37f232bSQu Wenruo key.type = BTRFS_METADATA_ITEM_KEY; 2332a37f232bSQu Wenruo key.offset = (u64)-1; 2333a37f232bSQu Wenruo iter->bytenr = bytenr; 2334a37f232bSQu Wenruo 2335a37f232bSQu Wenruo ret = btrfs_search_slot(NULL, fs_info->extent_root, &key, path, 0, 0); 2336a37f232bSQu Wenruo if (ret < 0) 2337a37f232bSQu Wenruo return ret; 2338a37f232bSQu Wenruo if (ret == 0) { 2339a37f232bSQu Wenruo ret = -EUCLEAN; 2340a37f232bSQu Wenruo goto release; 2341a37f232bSQu Wenruo } 2342a37f232bSQu Wenruo if (path->slots[0] == 0) { 2343a37f232bSQu Wenruo WARN_ON(IS_ENABLED(CONFIG_BTRFS_DEBUG)); 2344a37f232bSQu Wenruo ret = -EUCLEAN; 2345a37f232bSQu Wenruo goto release; 2346a37f232bSQu Wenruo } 2347a37f232bSQu Wenruo path->slots[0]--; 2348a37f232bSQu Wenruo 2349a37f232bSQu Wenruo btrfs_item_key_to_cpu(path->nodes[0], &key, path->slots[0]); 2350a37f232bSQu Wenruo if ((key.type != BTRFS_EXTENT_ITEM_KEY && 2351a37f232bSQu Wenruo key.type != BTRFS_METADATA_ITEM_KEY) || key.objectid != bytenr) { 2352a37f232bSQu Wenruo ret = -ENOENT; 2353a37f232bSQu Wenruo goto release; 2354a37f232bSQu Wenruo } 2355a37f232bSQu Wenruo memcpy(&iter->cur_key, &key, sizeof(key)); 2356a37f232bSQu Wenruo iter->item_ptr = (u32)btrfs_item_ptr_offset(path->nodes[0], 2357a37f232bSQu Wenruo path->slots[0]); 2358a37f232bSQu Wenruo iter->end_ptr = (u32)(iter->item_ptr + 2359a37f232bSQu Wenruo btrfs_item_size_nr(path->nodes[0], path->slots[0])); 2360a37f232bSQu Wenruo ei = btrfs_item_ptr(path->nodes[0], path->slots[0], 2361a37f232bSQu Wenruo struct btrfs_extent_item); 2362a37f232bSQu Wenruo 2363a37f232bSQu Wenruo /* 2364a37f232bSQu Wenruo * Only support iteration on tree backref yet. 2365a37f232bSQu Wenruo * 2366a37f232bSQu Wenruo * This is an extra precaution for non skinny-metadata, where 2367a37f232bSQu Wenruo * EXTENT_ITEM is also used for tree blocks, that we can only use 2368a37f232bSQu Wenruo * extent flags to determine if it's a tree block. 2369a37f232bSQu Wenruo */ 2370a37f232bSQu Wenruo if (btrfs_extent_flags(path->nodes[0], ei) & BTRFS_EXTENT_FLAG_DATA) { 2371a37f232bSQu Wenruo ret = -ENOTSUPP; 2372a37f232bSQu Wenruo goto release; 2373a37f232bSQu Wenruo } 2374a37f232bSQu Wenruo iter->cur_ptr = (u32)(iter->item_ptr + sizeof(*ei)); 2375a37f232bSQu Wenruo 2376a37f232bSQu Wenruo /* If there is no inline backref, go search for keyed backref */ 2377a37f232bSQu Wenruo if (iter->cur_ptr >= iter->end_ptr) { 2378a37f232bSQu Wenruo ret = btrfs_next_item(fs_info->extent_root, path); 2379a37f232bSQu Wenruo 2380a37f232bSQu Wenruo /* No inline nor keyed ref */ 2381a37f232bSQu Wenruo if (ret > 0) { 2382a37f232bSQu Wenruo ret = -ENOENT; 2383a37f232bSQu Wenruo goto release; 2384a37f232bSQu Wenruo } 2385a37f232bSQu Wenruo if (ret < 0) 2386a37f232bSQu Wenruo goto release; 2387a37f232bSQu Wenruo 2388a37f232bSQu Wenruo btrfs_item_key_to_cpu(path->nodes[0], &iter->cur_key, 2389a37f232bSQu Wenruo path->slots[0]); 2390a37f232bSQu Wenruo if (iter->cur_key.objectid != bytenr || 2391a37f232bSQu Wenruo (iter->cur_key.type != BTRFS_SHARED_BLOCK_REF_KEY && 2392a37f232bSQu Wenruo iter->cur_key.type != BTRFS_TREE_BLOCK_REF_KEY)) { 2393a37f232bSQu Wenruo ret = -ENOENT; 2394a37f232bSQu Wenruo goto release; 2395a37f232bSQu Wenruo } 2396a37f232bSQu Wenruo iter->cur_ptr = (u32)btrfs_item_ptr_offset(path->nodes[0], 2397a37f232bSQu Wenruo path->slots[0]); 2398a37f232bSQu Wenruo iter->item_ptr = iter->cur_ptr; 2399a37f232bSQu Wenruo iter->end_ptr = (u32)(iter->item_ptr + btrfs_item_size_nr( 2400a37f232bSQu Wenruo path->nodes[0], path->slots[0])); 2401a37f232bSQu Wenruo } 2402a37f232bSQu Wenruo 2403a37f232bSQu Wenruo return 0; 2404a37f232bSQu Wenruo release: 2405a37f232bSQu Wenruo btrfs_backref_iter_release(iter); 2406a37f232bSQu Wenruo return ret; 2407a37f232bSQu Wenruo } 2408c39c2ddcSQu Wenruo 2409c39c2ddcSQu Wenruo /* 2410c39c2ddcSQu Wenruo * Go to the next backref item of current bytenr, can be either inlined or 2411c39c2ddcSQu Wenruo * keyed. 2412c39c2ddcSQu Wenruo * 2413c39c2ddcSQu Wenruo * Caller needs to check whether it's inline ref or not by iter->cur_key. 2414c39c2ddcSQu Wenruo * 2415c39c2ddcSQu Wenruo * Return 0 if we get next backref without problem. 2416c39c2ddcSQu Wenruo * Return >0 if there is no extra backref for this bytenr. 2417c39c2ddcSQu Wenruo * Return <0 if there is something wrong happened. 2418c39c2ddcSQu Wenruo */ 2419c39c2ddcSQu Wenruo int btrfs_backref_iter_next(struct btrfs_backref_iter *iter) 2420c39c2ddcSQu Wenruo { 2421c39c2ddcSQu Wenruo struct extent_buffer *eb = btrfs_backref_get_eb(iter); 2422c39c2ddcSQu Wenruo struct btrfs_path *path = iter->path; 2423c39c2ddcSQu Wenruo struct btrfs_extent_inline_ref *iref; 2424c39c2ddcSQu Wenruo int ret; 2425c39c2ddcSQu Wenruo u32 size; 2426c39c2ddcSQu Wenruo 2427c39c2ddcSQu Wenruo if (btrfs_backref_iter_is_inline_ref(iter)) { 2428c39c2ddcSQu Wenruo /* We're still inside the inline refs */ 2429c39c2ddcSQu Wenruo ASSERT(iter->cur_ptr < iter->end_ptr); 2430c39c2ddcSQu Wenruo 2431c39c2ddcSQu Wenruo if (btrfs_backref_has_tree_block_info(iter)) { 2432c39c2ddcSQu Wenruo /* First tree block info */ 2433c39c2ddcSQu Wenruo size = sizeof(struct btrfs_tree_block_info); 2434c39c2ddcSQu Wenruo } else { 2435c39c2ddcSQu Wenruo /* Use inline ref type to determine the size */ 2436c39c2ddcSQu Wenruo int type; 2437c39c2ddcSQu Wenruo 2438c39c2ddcSQu Wenruo iref = (struct btrfs_extent_inline_ref *) 2439c39c2ddcSQu Wenruo ((unsigned long)iter->cur_ptr); 2440c39c2ddcSQu Wenruo type = btrfs_extent_inline_ref_type(eb, iref); 2441c39c2ddcSQu Wenruo 2442c39c2ddcSQu Wenruo size = btrfs_extent_inline_ref_size(type); 2443c39c2ddcSQu Wenruo } 2444c39c2ddcSQu Wenruo iter->cur_ptr += size; 2445c39c2ddcSQu Wenruo if (iter->cur_ptr < iter->end_ptr) 2446c39c2ddcSQu Wenruo return 0; 2447c39c2ddcSQu Wenruo 2448c39c2ddcSQu Wenruo /* All inline items iterated, fall through */ 2449c39c2ddcSQu Wenruo } 2450c39c2ddcSQu Wenruo 2451c39c2ddcSQu Wenruo /* We're at keyed items, there is no inline item, go to the next one */ 2452c39c2ddcSQu Wenruo ret = btrfs_next_item(iter->fs_info->extent_root, iter->path); 2453c39c2ddcSQu Wenruo if (ret) 2454c39c2ddcSQu Wenruo return ret; 2455c39c2ddcSQu Wenruo 2456c39c2ddcSQu Wenruo btrfs_item_key_to_cpu(path->nodes[0], &iter->cur_key, path->slots[0]); 2457c39c2ddcSQu Wenruo if (iter->cur_key.objectid != iter->bytenr || 2458c39c2ddcSQu Wenruo (iter->cur_key.type != BTRFS_TREE_BLOCK_REF_KEY && 2459c39c2ddcSQu Wenruo iter->cur_key.type != BTRFS_SHARED_BLOCK_REF_KEY)) 2460c39c2ddcSQu Wenruo return 1; 2461c39c2ddcSQu Wenruo iter->item_ptr = (u32)btrfs_item_ptr_offset(path->nodes[0], 2462c39c2ddcSQu Wenruo path->slots[0]); 2463c39c2ddcSQu Wenruo iter->cur_ptr = iter->item_ptr; 2464c39c2ddcSQu Wenruo iter->end_ptr = iter->item_ptr + (u32)btrfs_item_size_nr(path->nodes[0], 2465c39c2ddcSQu Wenruo path->slots[0]); 2466c39c2ddcSQu Wenruo return 0; 2467c39c2ddcSQu Wenruo } 2468584fb121SQu Wenruo 2469584fb121SQu Wenruo void btrfs_backref_init_cache(struct btrfs_fs_info *fs_info, 2470584fb121SQu Wenruo struct btrfs_backref_cache *cache, int is_reloc) 2471584fb121SQu Wenruo { 2472584fb121SQu Wenruo int i; 2473584fb121SQu Wenruo 2474584fb121SQu Wenruo cache->rb_root = RB_ROOT; 2475584fb121SQu Wenruo for (i = 0; i < BTRFS_MAX_LEVEL; i++) 2476584fb121SQu Wenruo INIT_LIST_HEAD(&cache->pending[i]); 2477584fb121SQu Wenruo INIT_LIST_HEAD(&cache->changed); 2478584fb121SQu Wenruo INIT_LIST_HEAD(&cache->detached); 2479584fb121SQu Wenruo INIT_LIST_HEAD(&cache->leaves); 2480584fb121SQu Wenruo INIT_LIST_HEAD(&cache->pending_edge); 2481584fb121SQu Wenruo INIT_LIST_HEAD(&cache->useless_node); 2482584fb121SQu Wenruo cache->fs_info = fs_info; 2483584fb121SQu Wenruo cache->is_reloc = is_reloc; 2484584fb121SQu Wenruo } 2485*b1818dabSQu Wenruo 2486*b1818dabSQu Wenruo struct btrfs_backref_node *btrfs_backref_alloc_node( 2487*b1818dabSQu Wenruo struct btrfs_backref_cache *cache, u64 bytenr, int level) 2488*b1818dabSQu Wenruo { 2489*b1818dabSQu Wenruo struct btrfs_backref_node *node; 2490*b1818dabSQu Wenruo 2491*b1818dabSQu Wenruo ASSERT(level >= 0 && level < BTRFS_MAX_LEVEL); 2492*b1818dabSQu Wenruo node = kzalloc(sizeof(*node), GFP_NOFS); 2493*b1818dabSQu Wenruo if (!node) 2494*b1818dabSQu Wenruo return node; 2495*b1818dabSQu Wenruo 2496*b1818dabSQu Wenruo INIT_LIST_HEAD(&node->list); 2497*b1818dabSQu Wenruo INIT_LIST_HEAD(&node->upper); 2498*b1818dabSQu Wenruo INIT_LIST_HEAD(&node->lower); 2499*b1818dabSQu Wenruo RB_CLEAR_NODE(&node->rb_node); 2500*b1818dabSQu Wenruo cache->nr_nodes++; 2501*b1818dabSQu Wenruo node->level = level; 2502*b1818dabSQu Wenruo node->bytenr = bytenr; 2503*b1818dabSQu Wenruo 2504*b1818dabSQu Wenruo return node; 2505*b1818dabSQu Wenruo } 2506