10a8165d7SJaegeuk Kim /* 2e05df3b1SJaegeuk Kim * fs/f2fs/node.c 3e05df3b1SJaegeuk Kim * 4e05df3b1SJaegeuk Kim * Copyright (c) 2012 Samsung Electronics Co., Ltd. 5e05df3b1SJaegeuk Kim * http://www.samsung.com/ 6e05df3b1SJaegeuk Kim * 7e05df3b1SJaegeuk Kim * This program is free software; you can redistribute it and/or modify 8e05df3b1SJaegeuk Kim * it under the terms of the GNU General Public License version 2 as 9e05df3b1SJaegeuk Kim * published by the Free Software Foundation. 10e05df3b1SJaegeuk Kim */ 11e05df3b1SJaegeuk Kim #include <linux/fs.h> 12e05df3b1SJaegeuk Kim #include <linux/f2fs_fs.h> 13e05df3b1SJaegeuk Kim #include <linux/mpage.h> 14e05df3b1SJaegeuk Kim #include <linux/backing-dev.h> 15e05df3b1SJaegeuk Kim #include <linux/blkdev.h> 16e05df3b1SJaegeuk Kim #include <linux/pagevec.h> 17e05df3b1SJaegeuk Kim #include <linux/swap.h> 18e05df3b1SJaegeuk Kim 19e05df3b1SJaegeuk Kim #include "f2fs.h" 20e05df3b1SJaegeuk Kim #include "node.h" 21e05df3b1SJaegeuk Kim #include "segment.h" 229e4ded3fSJaegeuk Kim #include "trace.h" 2351dd6249SNamjae Jeon #include <trace/events/f2fs.h> 24e05df3b1SJaegeuk Kim 2568afcf2dSTomohiro Kusumi #define on_build_free_nids(nmi) mutex_is_locked(&(nm_i)->build_lock) 26f978f5a0SGu Zheng 27e05df3b1SJaegeuk Kim static struct kmem_cache *nat_entry_slab; 28e05df3b1SJaegeuk Kim static struct kmem_cache *free_nid_slab; 29aec71382SChao Yu static struct kmem_cache *nat_entry_set_slab; 30e05df3b1SJaegeuk Kim 316fb03f3aSJaegeuk Kim bool available_free_memory(struct f2fs_sb_info *sbi, int type) 32cdfc41c1SJaegeuk Kim { 336fb03f3aSJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 34cdfc41c1SJaegeuk Kim struct sysinfo val; 35e5e7ea3cSJaegeuk Kim unsigned long avail_ram; 36cdfc41c1SJaegeuk Kim unsigned long mem_size = 0; 376fb03f3aSJaegeuk Kim bool res = false; 38cdfc41c1SJaegeuk Kim 39cdfc41c1SJaegeuk Kim si_meminfo(&val); 40e5e7ea3cSJaegeuk Kim 41e5e7ea3cSJaegeuk Kim /* only uses low memory */ 42e5e7ea3cSJaegeuk Kim avail_ram = val.totalram - val.totalhigh; 43e5e7ea3cSJaegeuk Kim 44429511cdSChao Yu /* 45429511cdSChao Yu * give 25%, 25%, 50%, 50%, 50% memory for each components respectively 46429511cdSChao Yu */ 476fb03f3aSJaegeuk Kim if (type == FREE_NIDS) { 48b8559dc2SChao Yu mem_size = (nm_i->nid_cnt[FREE_NID_LIST] * 49b8559dc2SChao Yu sizeof(struct free_nid)) >> PAGE_SHIFT; 50e5e7ea3cSJaegeuk Kim res = mem_size < ((avail_ram * nm_i->ram_thresh / 100) >> 2); 516fb03f3aSJaegeuk Kim } else if (type == NAT_ENTRIES) { 52e5e7ea3cSJaegeuk Kim mem_size = (nm_i->nat_cnt * sizeof(struct nat_entry)) >> 5309cbfeafSKirill A. Shutemov PAGE_SHIFT; 54e5e7ea3cSJaegeuk Kim res = mem_size < ((avail_ram * nm_i->ram_thresh / 100) >> 2); 55e589c2c4SJaegeuk Kim if (excess_cached_nats(sbi)) 56e589c2c4SJaegeuk Kim res = false; 57a1257023SJaegeuk Kim } else if (type == DIRTY_DENTS) { 58a1257023SJaegeuk Kim if (sbi->sb->s_bdi->wb.dirty_exceeded) 59a1257023SJaegeuk Kim return false; 60a1257023SJaegeuk Kim mem_size = get_pages(sbi, F2FS_DIRTY_DENTS); 61a1257023SJaegeuk Kim res = mem_size < ((avail_ram * nm_i->ram_thresh / 100) >> 1); 62e5e7ea3cSJaegeuk Kim } else if (type == INO_ENTRIES) { 63e5e7ea3cSJaegeuk Kim int i; 64e5e7ea3cSJaegeuk Kim 65e5e7ea3cSJaegeuk Kim for (i = 0; i <= UPDATE_INO; i++) 668f73cbb7SKinglong Mee mem_size += sbi->im[i].ino_num * 678f73cbb7SKinglong Mee sizeof(struct ino_entry); 688f73cbb7SKinglong Mee mem_size >>= PAGE_SHIFT; 69e5e7ea3cSJaegeuk Kim res = mem_size < ((avail_ram * nm_i->ram_thresh / 100) >> 1); 70429511cdSChao Yu } else if (type == EXTENT_CACHE) { 717441ccefSJaegeuk Kim mem_size = (atomic_read(&sbi->total_ext_tree) * 727441ccefSJaegeuk Kim sizeof(struct extent_tree) + 73429511cdSChao Yu atomic_read(&sbi->total_ext_node) * 7409cbfeafSKirill A. Shutemov sizeof(struct extent_node)) >> PAGE_SHIFT; 75429511cdSChao Yu res = mem_size < ((avail_ram * nm_i->ram_thresh / 100) >> 1); 761e84371fSJaegeuk Kim } else { 771663cae4SJaegeuk Kim if (!sbi->sb->s_bdi->wb.dirty_exceeded) 781663cae4SJaegeuk Kim return true; 796fb03f3aSJaegeuk Kim } 806fb03f3aSJaegeuk Kim return res; 81cdfc41c1SJaegeuk Kim } 82cdfc41c1SJaegeuk Kim 83e05df3b1SJaegeuk Kim static void clear_node_page_dirty(struct page *page) 84e05df3b1SJaegeuk Kim { 85e05df3b1SJaegeuk Kim struct address_space *mapping = page->mapping; 86e05df3b1SJaegeuk Kim unsigned int long flags; 87e05df3b1SJaegeuk Kim 88e05df3b1SJaegeuk Kim if (PageDirty(page)) { 89e05df3b1SJaegeuk Kim spin_lock_irqsave(&mapping->tree_lock, flags); 90e05df3b1SJaegeuk Kim radix_tree_tag_clear(&mapping->page_tree, 91e05df3b1SJaegeuk Kim page_index(page), 92e05df3b1SJaegeuk Kim PAGECACHE_TAG_DIRTY); 93e05df3b1SJaegeuk Kim spin_unlock_irqrestore(&mapping->tree_lock, flags); 94e05df3b1SJaegeuk Kim 95e05df3b1SJaegeuk Kim clear_page_dirty_for_io(page); 964081363fSJaegeuk Kim dec_page_count(F2FS_M_SB(mapping), F2FS_DIRTY_NODES); 97e05df3b1SJaegeuk Kim } 98e05df3b1SJaegeuk Kim ClearPageUptodate(page); 99e05df3b1SJaegeuk Kim } 100e05df3b1SJaegeuk Kim 101e05df3b1SJaegeuk Kim static struct page *get_current_nat_page(struct f2fs_sb_info *sbi, nid_t nid) 102e05df3b1SJaegeuk Kim { 103e05df3b1SJaegeuk Kim pgoff_t index = current_nat_addr(sbi, nid); 104e05df3b1SJaegeuk Kim return get_meta_page(sbi, index); 105e05df3b1SJaegeuk Kim } 106e05df3b1SJaegeuk Kim 107e05df3b1SJaegeuk Kim static struct page *get_next_nat_page(struct f2fs_sb_info *sbi, nid_t nid) 108e05df3b1SJaegeuk Kim { 109e05df3b1SJaegeuk Kim struct page *src_page; 110e05df3b1SJaegeuk Kim struct page *dst_page; 111e05df3b1SJaegeuk Kim pgoff_t src_off; 112e05df3b1SJaegeuk Kim pgoff_t dst_off; 113e05df3b1SJaegeuk Kim void *src_addr; 114e05df3b1SJaegeuk Kim void *dst_addr; 115e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 116e05df3b1SJaegeuk Kim 117e05df3b1SJaegeuk Kim src_off = current_nat_addr(sbi, nid); 118e05df3b1SJaegeuk Kim dst_off = next_nat_addr(sbi, src_off); 119e05df3b1SJaegeuk Kim 120e05df3b1SJaegeuk Kim /* get current nat block page with lock */ 121e05df3b1SJaegeuk Kim src_page = get_meta_page(sbi, src_off); 122e05df3b1SJaegeuk Kim dst_page = grab_meta_page(sbi, dst_off); 1239850cf4aSJaegeuk Kim f2fs_bug_on(sbi, PageDirty(src_page)); 124e05df3b1SJaegeuk Kim 125e05df3b1SJaegeuk Kim src_addr = page_address(src_page); 126e05df3b1SJaegeuk Kim dst_addr = page_address(dst_page); 12709cbfeafSKirill A. Shutemov memcpy(dst_addr, src_addr, PAGE_SIZE); 128e05df3b1SJaegeuk Kim set_page_dirty(dst_page); 129e05df3b1SJaegeuk Kim f2fs_put_page(src_page, 1); 130e05df3b1SJaegeuk Kim 131e05df3b1SJaegeuk Kim set_to_next_nat(nm_i, nid); 132e05df3b1SJaegeuk Kim 133e05df3b1SJaegeuk Kim return dst_page; 134e05df3b1SJaegeuk Kim } 135e05df3b1SJaegeuk Kim 136e05df3b1SJaegeuk Kim static struct nat_entry *__lookup_nat_cache(struct f2fs_nm_info *nm_i, nid_t n) 137e05df3b1SJaegeuk Kim { 138e05df3b1SJaegeuk Kim return radix_tree_lookup(&nm_i->nat_root, n); 139e05df3b1SJaegeuk Kim } 140e05df3b1SJaegeuk Kim 141e05df3b1SJaegeuk Kim static unsigned int __gang_lookup_nat_cache(struct f2fs_nm_info *nm_i, 142e05df3b1SJaegeuk Kim nid_t start, unsigned int nr, struct nat_entry **ep) 143e05df3b1SJaegeuk Kim { 144e05df3b1SJaegeuk Kim return radix_tree_gang_lookup(&nm_i->nat_root, (void **)ep, start, nr); 145e05df3b1SJaegeuk Kim } 146e05df3b1SJaegeuk Kim 147e05df3b1SJaegeuk Kim static void __del_from_nat_cache(struct f2fs_nm_info *nm_i, struct nat_entry *e) 148e05df3b1SJaegeuk Kim { 149e05df3b1SJaegeuk Kim list_del(&e->list); 150e05df3b1SJaegeuk Kim radix_tree_delete(&nm_i->nat_root, nat_get_nid(e)); 151e05df3b1SJaegeuk Kim nm_i->nat_cnt--; 152e05df3b1SJaegeuk Kim kmem_cache_free(nat_entry_slab, e); 153e05df3b1SJaegeuk Kim } 154e05df3b1SJaegeuk Kim 155309cc2b6SJaegeuk Kim static void __set_nat_cache_dirty(struct f2fs_nm_info *nm_i, 156309cc2b6SJaegeuk Kim struct nat_entry *ne) 157309cc2b6SJaegeuk Kim { 158309cc2b6SJaegeuk Kim nid_t set = NAT_BLOCK_OFFSET(ne->ni.nid); 159309cc2b6SJaegeuk Kim struct nat_entry_set *head; 160309cc2b6SJaegeuk Kim 161309cc2b6SJaegeuk Kim head = radix_tree_lookup(&nm_i->nat_set_root, set); 162309cc2b6SJaegeuk Kim if (!head) { 16380c54505SJaegeuk Kim head = f2fs_kmem_cache_alloc(nat_entry_set_slab, GFP_NOFS); 164309cc2b6SJaegeuk Kim 165309cc2b6SJaegeuk Kim INIT_LIST_HEAD(&head->entry_list); 166309cc2b6SJaegeuk Kim INIT_LIST_HEAD(&head->set_list); 167309cc2b6SJaegeuk Kim head->set = set; 168309cc2b6SJaegeuk Kim head->entry_cnt = 0; 1699be32d72SJaegeuk Kim f2fs_radix_tree_insert(&nm_i->nat_set_root, set, head); 170309cc2b6SJaegeuk Kim } 171febeca6dSChao Yu 172febeca6dSChao Yu if (get_nat_flag(ne, IS_DIRTY)) 173febeca6dSChao Yu goto refresh_list; 174febeca6dSChao Yu 175309cc2b6SJaegeuk Kim nm_i->dirty_nat_cnt++; 176309cc2b6SJaegeuk Kim head->entry_cnt++; 177309cc2b6SJaegeuk Kim set_nat_flag(ne, IS_DIRTY, true); 178febeca6dSChao Yu refresh_list: 179febeca6dSChao Yu if (nat_get_blkaddr(ne) == NEW_ADDR) 180febeca6dSChao Yu list_del_init(&ne->list); 181febeca6dSChao Yu else 182febeca6dSChao Yu list_move_tail(&ne->list, &head->entry_list); 183309cc2b6SJaegeuk Kim } 184309cc2b6SJaegeuk Kim 185309cc2b6SJaegeuk Kim static void __clear_nat_cache_dirty(struct f2fs_nm_info *nm_i, 1860b28b71eSKinglong Mee struct nat_entry_set *set, struct nat_entry *ne) 187309cc2b6SJaegeuk Kim { 188309cc2b6SJaegeuk Kim list_move_tail(&ne->list, &nm_i->nat_entries); 189309cc2b6SJaegeuk Kim set_nat_flag(ne, IS_DIRTY, false); 1900b28b71eSKinglong Mee set->entry_cnt--; 191309cc2b6SJaegeuk Kim nm_i->dirty_nat_cnt--; 192309cc2b6SJaegeuk Kim } 193309cc2b6SJaegeuk Kim 194309cc2b6SJaegeuk Kim static unsigned int __gang_lookup_nat_set(struct f2fs_nm_info *nm_i, 195309cc2b6SJaegeuk Kim nid_t start, unsigned int nr, struct nat_entry_set **ep) 196309cc2b6SJaegeuk Kim { 197309cc2b6SJaegeuk Kim return radix_tree_gang_lookup(&nm_i->nat_set_root, (void **)ep, 198309cc2b6SJaegeuk Kim start, nr); 199309cc2b6SJaegeuk Kim } 200309cc2b6SJaegeuk Kim 2012dcf51abSJaegeuk Kim int need_dentry_mark(struct f2fs_sb_info *sbi, nid_t nid) 2022dcf51abSJaegeuk Kim { 2032dcf51abSJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 2042dcf51abSJaegeuk Kim struct nat_entry *e; 2052dcf51abSJaegeuk Kim bool need = false; 2062dcf51abSJaegeuk Kim 207b873b798SJaegeuk Kim down_read(&nm_i->nat_tree_lock); 2082dcf51abSJaegeuk Kim e = __lookup_nat_cache(nm_i, nid); 2092dcf51abSJaegeuk Kim if (e) { 2102dcf51abSJaegeuk Kim if (!get_nat_flag(e, IS_CHECKPOINTED) && 2112dcf51abSJaegeuk Kim !get_nat_flag(e, HAS_FSYNCED_INODE)) 2122dcf51abSJaegeuk Kim need = true; 2132dcf51abSJaegeuk Kim } 214b873b798SJaegeuk Kim up_read(&nm_i->nat_tree_lock); 2152dcf51abSJaegeuk Kim return need; 2162dcf51abSJaegeuk Kim } 2172dcf51abSJaegeuk Kim 21888bd02c9SJaegeuk Kim bool is_checkpointed_node(struct f2fs_sb_info *sbi, nid_t nid) 219e05df3b1SJaegeuk Kim { 220e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 221e05df3b1SJaegeuk Kim struct nat_entry *e; 22288bd02c9SJaegeuk Kim bool is_cp = true; 223e05df3b1SJaegeuk Kim 224b873b798SJaegeuk Kim down_read(&nm_i->nat_tree_lock); 225e05df3b1SJaegeuk Kim e = __lookup_nat_cache(nm_i, nid); 2267ef35e3bSJaegeuk Kim if (e && !get_nat_flag(e, IS_CHECKPOINTED)) 22788bd02c9SJaegeuk Kim is_cp = false; 228b873b798SJaegeuk Kim up_read(&nm_i->nat_tree_lock); 229e05df3b1SJaegeuk Kim return is_cp; 230e05df3b1SJaegeuk Kim } 231e05df3b1SJaegeuk Kim 23288bd02c9SJaegeuk Kim bool need_inode_block_update(struct f2fs_sb_info *sbi, nid_t ino) 233b6fe5873SJaegeuk Kim { 234b6fe5873SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 235b6fe5873SJaegeuk Kim struct nat_entry *e; 23688bd02c9SJaegeuk Kim bool need_update = true; 237b6fe5873SJaegeuk Kim 238b873b798SJaegeuk Kim down_read(&nm_i->nat_tree_lock); 23988bd02c9SJaegeuk Kim e = __lookup_nat_cache(nm_i, ino); 24088bd02c9SJaegeuk Kim if (e && get_nat_flag(e, HAS_LAST_FSYNC) && 24188bd02c9SJaegeuk Kim (get_nat_flag(e, IS_CHECKPOINTED) || 24288bd02c9SJaegeuk Kim get_nat_flag(e, HAS_FSYNCED_INODE))) 24388bd02c9SJaegeuk Kim need_update = false; 244b873b798SJaegeuk Kim up_read(&nm_i->nat_tree_lock); 24588bd02c9SJaegeuk Kim return need_update; 246b6fe5873SJaegeuk Kim } 247b6fe5873SJaegeuk Kim 2485c9e4184SChao Yu static struct nat_entry *grab_nat_entry(struct f2fs_nm_info *nm_i, nid_t nid, 2495c9e4184SChao Yu bool no_fail) 250e05df3b1SJaegeuk Kim { 251e05df3b1SJaegeuk Kim struct nat_entry *new; 252e05df3b1SJaegeuk Kim 2535c9e4184SChao Yu if (no_fail) { 25480c54505SJaegeuk Kim new = f2fs_kmem_cache_alloc(nat_entry_slab, GFP_NOFS); 2559be32d72SJaegeuk Kim f2fs_radix_tree_insert(&nm_i->nat_root, nid, new); 2565c9e4184SChao Yu } else { 2575c9e4184SChao Yu new = kmem_cache_alloc(nat_entry_slab, GFP_NOFS); 2585c9e4184SChao Yu if (!new) 2595c9e4184SChao Yu return NULL; 2605c9e4184SChao Yu if (radix_tree_insert(&nm_i->nat_root, nid, new)) { 2615c9e4184SChao Yu kmem_cache_free(nat_entry_slab, new); 2625c9e4184SChao Yu return NULL; 2635c9e4184SChao Yu } 2645c9e4184SChao Yu } 2655c9e4184SChao Yu 266e05df3b1SJaegeuk Kim memset(new, 0, sizeof(struct nat_entry)); 267e05df3b1SJaegeuk Kim nat_set_nid(new, nid); 26888bd02c9SJaegeuk Kim nat_reset_flag(new); 269e05df3b1SJaegeuk Kim list_add_tail(&new->list, &nm_i->nat_entries); 270e05df3b1SJaegeuk Kim nm_i->nat_cnt++; 271e05df3b1SJaegeuk Kim return new; 272e05df3b1SJaegeuk Kim } 273e05df3b1SJaegeuk Kim 2741515aef0SChao Yu static void cache_nat_entry(struct f2fs_sb_info *sbi, nid_t nid, 275e05df3b1SJaegeuk Kim struct f2fs_nat_entry *ne) 276e05df3b1SJaegeuk Kim { 2771515aef0SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 278e05df3b1SJaegeuk Kim struct nat_entry *e; 2799be32d72SJaegeuk Kim 280e05df3b1SJaegeuk Kim e = __lookup_nat_cache(nm_i, nid); 281e05df3b1SJaegeuk Kim if (!e) { 2825c9e4184SChao Yu e = grab_nat_entry(nm_i, nid, false); 2835c9e4184SChao Yu if (e) 28494dac22eSChao Yu node_info_from_raw_nat(&e->ni, ne); 2851515aef0SChao Yu } else { 2860c0b471eSEric Biggers f2fs_bug_on(sbi, nat_get_ino(e) != le32_to_cpu(ne->ino) || 2870c0b471eSEric Biggers nat_get_blkaddr(e) != 2880c0b471eSEric Biggers le32_to_cpu(ne->block_addr) || 2891515aef0SChao Yu nat_get_version(e) != ne->version); 290e05df3b1SJaegeuk Kim } 291e05df3b1SJaegeuk Kim } 292e05df3b1SJaegeuk Kim 293e05df3b1SJaegeuk Kim static void set_node_addr(struct f2fs_sb_info *sbi, struct node_info *ni, 294479f40c4SJaegeuk Kim block_t new_blkaddr, bool fsync_done) 295e05df3b1SJaegeuk Kim { 296e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 297e05df3b1SJaegeuk Kim struct nat_entry *e; 2989be32d72SJaegeuk Kim 299b873b798SJaegeuk Kim down_write(&nm_i->nat_tree_lock); 300e05df3b1SJaegeuk Kim e = __lookup_nat_cache(nm_i, ni->nid); 301e05df3b1SJaegeuk Kim if (!e) { 3025c9e4184SChao Yu e = grab_nat_entry(nm_i, ni->nid, true); 3035c27f4eeSChao Yu copy_node_info(&e->ni, ni); 3049850cf4aSJaegeuk Kim f2fs_bug_on(sbi, ni->blk_addr == NEW_ADDR); 305e05df3b1SJaegeuk Kim } else if (new_blkaddr == NEW_ADDR) { 306e05df3b1SJaegeuk Kim /* 307e05df3b1SJaegeuk Kim * when nid is reallocated, 308e05df3b1SJaegeuk Kim * previous nat entry can be remained in nat cache. 309e05df3b1SJaegeuk Kim * So, reinitialize it with new information. 310e05df3b1SJaegeuk Kim */ 3115c27f4eeSChao Yu copy_node_info(&e->ni, ni); 3129850cf4aSJaegeuk Kim f2fs_bug_on(sbi, ni->blk_addr != NULL_ADDR); 313e05df3b1SJaegeuk Kim } 314e05df3b1SJaegeuk Kim 315e05df3b1SJaegeuk Kim /* sanity check */ 3169850cf4aSJaegeuk Kim f2fs_bug_on(sbi, nat_get_blkaddr(e) != ni->blk_addr); 3179850cf4aSJaegeuk Kim f2fs_bug_on(sbi, nat_get_blkaddr(e) == NULL_ADDR && 318e05df3b1SJaegeuk Kim new_blkaddr == NULL_ADDR); 3199850cf4aSJaegeuk Kim f2fs_bug_on(sbi, nat_get_blkaddr(e) == NEW_ADDR && 320e05df3b1SJaegeuk Kim new_blkaddr == NEW_ADDR); 3219850cf4aSJaegeuk Kim f2fs_bug_on(sbi, nat_get_blkaddr(e) != NEW_ADDR && 322e05df3b1SJaegeuk Kim nat_get_blkaddr(e) != NULL_ADDR && 323e05df3b1SJaegeuk Kim new_blkaddr == NEW_ADDR); 324e05df3b1SJaegeuk Kim 325e1c42045Sarter97 /* increment version no as node is removed */ 326e05df3b1SJaegeuk Kim if (nat_get_blkaddr(e) != NEW_ADDR && new_blkaddr == NULL_ADDR) { 327e05df3b1SJaegeuk Kim unsigned char version = nat_get_version(e); 328e05df3b1SJaegeuk Kim nat_set_version(e, inc_node_version(version)); 32926834466SJaegeuk Kim 33026834466SJaegeuk Kim /* in order to reuse the nid */ 33126834466SJaegeuk Kim if (nm_i->next_scan_nid > ni->nid) 33226834466SJaegeuk Kim nm_i->next_scan_nid = ni->nid; 333e05df3b1SJaegeuk Kim } 334e05df3b1SJaegeuk Kim 335e05df3b1SJaegeuk Kim /* change address */ 336e05df3b1SJaegeuk Kim nat_set_blkaddr(e, new_blkaddr); 33788bd02c9SJaegeuk Kim if (new_blkaddr == NEW_ADDR || new_blkaddr == NULL_ADDR) 33888bd02c9SJaegeuk Kim set_nat_flag(e, IS_CHECKPOINTED, false); 339e05df3b1SJaegeuk Kim __set_nat_cache_dirty(nm_i, e); 340479f40c4SJaegeuk Kim 341479f40c4SJaegeuk Kim /* update fsync_mark if its inode nat entry is still alive */ 342d5b692b7SChao Yu if (ni->nid != ni->ino) 343479f40c4SJaegeuk Kim e = __lookup_nat_cache(nm_i, ni->ino); 34488bd02c9SJaegeuk Kim if (e) { 34588bd02c9SJaegeuk Kim if (fsync_done && ni->nid == ni->ino) 34688bd02c9SJaegeuk Kim set_nat_flag(e, HAS_FSYNCED_INODE, true); 34788bd02c9SJaegeuk Kim set_nat_flag(e, HAS_LAST_FSYNC, fsync_done); 34888bd02c9SJaegeuk Kim } 349b873b798SJaegeuk Kim up_write(&nm_i->nat_tree_lock); 350e05df3b1SJaegeuk Kim } 351e05df3b1SJaegeuk Kim 3524660f9c0SJaegeuk Kim int try_to_free_nats(struct f2fs_sb_info *sbi, int nr_shrink) 353e05df3b1SJaegeuk Kim { 354e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 3551b38dc8eSJaegeuk Kim int nr = nr_shrink; 356e05df3b1SJaegeuk Kim 357b873b798SJaegeuk Kim if (!down_write_trylock(&nm_i->nat_tree_lock)) 358b873b798SJaegeuk Kim return 0; 359e05df3b1SJaegeuk Kim 360e05df3b1SJaegeuk Kim while (nr_shrink && !list_empty(&nm_i->nat_entries)) { 361e05df3b1SJaegeuk Kim struct nat_entry *ne; 362e05df3b1SJaegeuk Kim ne = list_first_entry(&nm_i->nat_entries, 363e05df3b1SJaegeuk Kim struct nat_entry, list); 364e05df3b1SJaegeuk Kim __del_from_nat_cache(nm_i, ne); 365e05df3b1SJaegeuk Kim nr_shrink--; 366e05df3b1SJaegeuk Kim } 367b873b798SJaegeuk Kim up_write(&nm_i->nat_tree_lock); 3681b38dc8eSJaegeuk Kim return nr - nr_shrink; 369e05df3b1SJaegeuk Kim } 370e05df3b1SJaegeuk Kim 3710a8165d7SJaegeuk Kim /* 372e1c42045Sarter97 * This function always returns success 373e05df3b1SJaegeuk Kim */ 374e05df3b1SJaegeuk Kim void get_node_info(struct f2fs_sb_info *sbi, nid_t nid, struct node_info *ni) 375e05df3b1SJaegeuk Kim { 376e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 377e05df3b1SJaegeuk Kim struct curseg_info *curseg = CURSEG_I(sbi, CURSEG_HOT_DATA); 378b7ad7512SChao Yu struct f2fs_journal *journal = curseg->journal; 379e05df3b1SJaegeuk Kim nid_t start_nid = START_NID(nid); 380e05df3b1SJaegeuk Kim struct f2fs_nat_block *nat_blk; 381e05df3b1SJaegeuk Kim struct page *page = NULL; 382e05df3b1SJaegeuk Kim struct f2fs_nat_entry ne; 383e05df3b1SJaegeuk Kim struct nat_entry *e; 38466a82d1fSYunlei He pgoff_t index; 385e05df3b1SJaegeuk Kim int i; 386e05df3b1SJaegeuk Kim 387e05df3b1SJaegeuk Kim ni->nid = nid; 388e05df3b1SJaegeuk Kim 389e05df3b1SJaegeuk Kim /* Check nat cache */ 390b873b798SJaegeuk Kim down_read(&nm_i->nat_tree_lock); 391e05df3b1SJaegeuk Kim e = __lookup_nat_cache(nm_i, nid); 392e05df3b1SJaegeuk Kim if (e) { 393e05df3b1SJaegeuk Kim ni->ino = nat_get_ino(e); 394e05df3b1SJaegeuk Kim ni->blk_addr = nat_get_blkaddr(e); 395e05df3b1SJaegeuk Kim ni->version = nat_get_version(e); 396b873b798SJaegeuk Kim up_read(&nm_i->nat_tree_lock); 397e05df3b1SJaegeuk Kim return; 3981515aef0SChao Yu } 399e05df3b1SJaegeuk Kim 4003547ea96SJaegeuk Kim memset(&ne, 0, sizeof(struct f2fs_nat_entry)); 4013547ea96SJaegeuk Kim 402e05df3b1SJaegeuk Kim /* Check current segment summary */ 403b7ad7512SChao Yu down_read(&curseg->journal_rwsem); 404dfc08a12SChao Yu i = lookup_journal_in_cursum(journal, NAT_JOURNAL, nid, 0); 405e05df3b1SJaegeuk Kim if (i >= 0) { 406dfc08a12SChao Yu ne = nat_in_journal(journal, i); 407e05df3b1SJaegeuk Kim node_info_from_raw_nat(ni, &ne); 408e05df3b1SJaegeuk Kim } 409b7ad7512SChao Yu up_read(&curseg->journal_rwsem); 41066a82d1fSYunlei He if (i >= 0) { 41166a82d1fSYunlei He up_read(&nm_i->nat_tree_lock); 412e05df3b1SJaegeuk Kim goto cache; 41366a82d1fSYunlei He } 414e05df3b1SJaegeuk Kim 415e05df3b1SJaegeuk Kim /* Fill node_info from nat page */ 41666a82d1fSYunlei He index = current_nat_addr(sbi, nid); 41766a82d1fSYunlei He up_read(&nm_i->nat_tree_lock); 41866a82d1fSYunlei He 41966a82d1fSYunlei He page = get_meta_page(sbi, index); 420e05df3b1SJaegeuk Kim nat_blk = (struct f2fs_nat_block *)page_address(page); 421e05df3b1SJaegeuk Kim ne = nat_blk->entries[nid - start_nid]; 422e05df3b1SJaegeuk Kim node_info_from_raw_nat(ni, &ne); 423e05df3b1SJaegeuk Kim f2fs_put_page(page, 1); 424e05df3b1SJaegeuk Kim cache: 425e05df3b1SJaegeuk Kim /* cache nat entry */ 426b873b798SJaegeuk Kim down_write(&nm_i->nat_tree_lock); 4271515aef0SChao Yu cache_nat_entry(sbi, nid, &ne); 428b873b798SJaegeuk Kim up_write(&nm_i->nat_tree_lock); 429e05df3b1SJaegeuk Kim } 430e05df3b1SJaegeuk Kim 43179344efbSJaegeuk Kim /* 43279344efbSJaegeuk Kim * readahead MAX_RA_NODE number of node pages. 43379344efbSJaegeuk Kim */ 43479344efbSJaegeuk Kim static void ra_node_pages(struct page *parent, int start, int n) 43579344efbSJaegeuk Kim { 43679344efbSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_P_SB(parent); 43779344efbSJaegeuk Kim struct blk_plug plug; 43879344efbSJaegeuk Kim int i, end; 43979344efbSJaegeuk Kim nid_t nid; 44079344efbSJaegeuk Kim 44179344efbSJaegeuk Kim blk_start_plug(&plug); 44279344efbSJaegeuk Kim 44379344efbSJaegeuk Kim /* Then, try readahead for siblings of the desired node */ 44479344efbSJaegeuk Kim end = start + n; 44579344efbSJaegeuk Kim end = min(end, NIDS_PER_BLOCK); 44679344efbSJaegeuk Kim for (i = start; i < end; i++) { 44779344efbSJaegeuk Kim nid = get_nid(parent, i, false); 44879344efbSJaegeuk Kim ra_node_page(sbi, nid); 44979344efbSJaegeuk Kim } 45079344efbSJaegeuk Kim 45179344efbSJaegeuk Kim blk_finish_plug(&plug); 45279344efbSJaegeuk Kim } 45379344efbSJaegeuk Kim 4543cf45747SChao Yu pgoff_t get_next_page_offset(struct dnode_of_data *dn, pgoff_t pgofs) 4553cf45747SChao Yu { 4563cf45747SChao Yu const long direct_index = ADDRS_PER_INODE(dn->inode); 4573cf45747SChao Yu const long direct_blks = ADDRS_PER_BLOCK; 4583cf45747SChao Yu const long indirect_blks = ADDRS_PER_BLOCK * NIDS_PER_BLOCK; 4593cf45747SChao Yu unsigned int skipped_unit = ADDRS_PER_BLOCK; 4603cf45747SChao Yu int cur_level = dn->cur_level; 4613cf45747SChao Yu int max_level = dn->max_level; 4623cf45747SChao Yu pgoff_t base = 0; 4633cf45747SChao Yu 4643cf45747SChao Yu if (!dn->max_level) 4653cf45747SChao Yu return pgofs + 1; 4663cf45747SChao Yu 4673cf45747SChao Yu while (max_level-- > cur_level) 4683cf45747SChao Yu skipped_unit *= NIDS_PER_BLOCK; 4693cf45747SChao Yu 4703cf45747SChao Yu switch (dn->max_level) { 4713cf45747SChao Yu case 3: 4723cf45747SChao Yu base += 2 * indirect_blks; 4733cf45747SChao Yu case 2: 4743cf45747SChao Yu base += 2 * direct_blks; 4753cf45747SChao Yu case 1: 4763cf45747SChao Yu base += direct_index; 4773cf45747SChao Yu break; 4783cf45747SChao Yu default: 4793cf45747SChao Yu f2fs_bug_on(F2FS_I_SB(dn->inode), 1); 4803cf45747SChao Yu } 4813cf45747SChao Yu 4823cf45747SChao Yu return ((pgofs - base) / skipped_unit + 1) * skipped_unit + base; 4833cf45747SChao Yu } 4843cf45747SChao Yu 4850a8165d7SJaegeuk Kim /* 486e05df3b1SJaegeuk Kim * The maximum depth is four. 487e05df3b1SJaegeuk Kim * Offset[0] will have raw inode offset. 488e05df3b1SJaegeuk Kim */ 48981ca7350SChao Yu static int get_node_path(struct inode *inode, long block, 490de93653fSJaegeuk Kim int offset[4], unsigned int noffset[4]) 491e05df3b1SJaegeuk Kim { 49281ca7350SChao Yu const long direct_index = ADDRS_PER_INODE(inode); 493e05df3b1SJaegeuk Kim const long direct_blks = ADDRS_PER_BLOCK; 494e05df3b1SJaegeuk Kim const long dptrs_per_blk = NIDS_PER_BLOCK; 495e05df3b1SJaegeuk Kim const long indirect_blks = ADDRS_PER_BLOCK * NIDS_PER_BLOCK; 496e05df3b1SJaegeuk Kim const long dindirect_blks = indirect_blks * NIDS_PER_BLOCK; 497e05df3b1SJaegeuk Kim int n = 0; 498e05df3b1SJaegeuk Kim int level = 0; 499e05df3b1SJaegeuk Kim 500e05df3b1SJaegeuk Kim noffset[0] = 0; 501e05df3b1SJaegeuk Kim 502e05df3b1SJaegeuk Kim if (block < direct_index) { 50325c0a6e5SNamjae Jeon offset[n] = block; 504e05df3b1SJaegeuk Kim goto got; 505e05df3b1SJaegeuk Kim } 506e05df3b1SJaegeuk Kim block -= direct_index; 507e05df3b1SJaegeuk Kim if (block < direct_blks) { 508e05df3b1SJaegeuk Kim offset[n++] = NODE_DIR1_BLOCK; 509e05df3b1SJaegeuk Kim noffset[n] = 1; 51025c0a6e5SNamjae Jeon offset[n] = block; 511e05df3b1SJaegeuk Kim level = 1; 512e05df3b1SJaegeuk Kim goto got; 513e05df3b1SJaegeuk Kim } 514e05df3b1SJaegeuk Kim block -= direct_blks; 515e05df3b1SJaegeuk Kim if (block < direct_blks) { 516e05df3b1SJaegeuk Kim offset[n++] = NODE_DIR2_BLOCK; 517e05df3b1SJaegeuk Kim noffset[n] = 2; 51825c0a6e5SNamjae Jeon offset[n] = block; 519e05df3b1SJaegeuk Kim level = 1; 520e05df3b1SJaegeuk Kim goto got; 521e05df3b1SJaegeuk Kim } 522e05df3b1SJaegeuk Kim block -= direct_blks; 523e05df3b1SJaegeuk Kim if (block < indirect_blks) { 524e05df3b1SJaegeuk Kim offset[n++] = NODE_IND1_BLOCK; 525e05df3b1SJaegeuk Kim noffset[n] = 3; 526e05df3b1SJaegeuk Kim offset[n++] = block / direct_blks; 527e05df3b1SJaegeuk Kim noffset[n] = 4 + offset[n - 1]; 52825c0a6e5SNamjae Jeon offset[n] = block % direct_blks; 529e05df3b1SJaegeuk Kim level = 2; 530e05df3b1SJaegeuk Kim goto got; 531e05df3b1SJaegeuk Kim } 532e05df3b1SJaegeuk Kim block -= indirect_blks; 533e05df3b1SJaegeuk Kim if (block < indirect_blks) { 534e05df3b1SJaegeuk Kim offset[n++] = NODE_IND2_BLOCK; 535e05df3b1SJaegeuk Kim noffset[n] = 4 + dptrs_per_blk; 536e05df3b1SJaegeuk Kim offset[n++] = block / direct_blks; 537e05df3b1SJaegeuk Kim noffset[n] = 5 + dptrs_per_blk + offset[n - 1]; 53825c0a6e5SNamjae Jeon offset[n] = block % direct_blks; 539e05df3b1SJaegeuk Kim level = 2; 540e05df3b1SJaegeuk Kim goto got; 541e05df3b1SJaegeuk Kim } 542e05df3b1SJaegeuk Kim block -= indirect_blks; 543e05df3b1SJaegeuk Kim if (block < dindirect_blks) { 544e05df3b1SJaegeuk Kim offset[n++] = NODE_DIND_BLOCK; 545e05df3b1SJaegeuk Kim noffset[n] = 5 + (dptrs_per_blk * 2); 546e05df3b1SJaegeuk Kim offset[n++] = block / indirect_blks; 547e05df3b1SJaegeuk Kim noffset[n] = 6 + (dptrs_per_blk * 2) + 548e05df3b1SJaegeuk Kim offset[n - 1] * (dptrs_per_blk + 1); 549e05df3b1SJaegeuk Kim offset[n++] = (block / direct_blks) % dptrs_per_blk; 550e05df3b1SJaegeuk Kim noffset[n] = 7 + (dptrs_per_blk * 2) + 551e05df3b1SJaegeuk Kim offset[n - 2] * (dptrs_per_blk + 1) + 552e05df3b1SJaegeuk Kim offset[n - 1]; 55325c0a6e5SNamjae Jeon offset[n] = block % direct_blks; 554e05df3b1SJaegeuk Kim level = 3; 555e05df3b1SJaegeuk Kim goto got; 556e05df3b1SJaegeuk Kim } else { 557e05df3b1SJaegeuk Kim BUG(); 558e05df3b1SJaegeuk Kim } 559e05df3b1SJaegeuk Kim got: 560e05df3b1SJaegeuk Kim return level; 561e05df3b1SJaegeuk Kim } 562e05df3b1SJaegeuk Kim 563e05df3b1SJaegeuk Kim /* 564e05df3b1SJaegeuk Kim * Caller should call f2fs_put_dnode(dn). 5654f4124d0SChao Yu * Also, it should grab and release a rwsem by calling f2fs_lock_op() and 5664f4124d0SChao Yu * f2fs_unlock_op() only if ro is not set RDONLY_NODE. 56739936837SJaegeuk Kim * In the case of RDONLY_NODE, we don't need to care about mutex. 568e05df3b1SJaegeuk Kim */ 569266e97a8SJaegeuk Kim int get_dnode_of_data(struct dnode_of_data *dn, pgoff_t index, int mode) 570e05df3b1SJaegeuk Kim { 5714081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode); 572e05df3b1SJaegeuk Kim struct page *npage[4]; 573f1a3b98eSJaegeuk Kim struct page *parent = NULL; 574e05df3b1SJaegeuk Kim int offset[4]; 575e05df3b1SJaegeuk Kim unsigned int noffset[4]; 576e05df3b1SJaegeuk Kim nid_t nids[4]; 5773cf45747SChao Yu int level, i = 0; 578e05df3b1SJaegeuk Kim int err = 0; 579e05df3b1SJaegeuk Kim 58081ca7350SChao Yu level = get_node_path(dn->inode, index, offset, noffset); 581e05df3b1SJaegeuk Kim 582e05df3b1SJaegeuk Kim nids[0] = dn->inode->i_ino; 5831646cfacSJaegeuk Kim npage[0] = dn->inode_page; 5841646cfacSJaegeuk Kim 5851646cfacSJaegeuk Kim if (!npage[0]) { 586e05df3b1SJaegeuk Kim npage[0] = get_node_page(sbi, nids[0]); 587e05df3b1SJaegeuk Kim if (IS_ERR(npage[0])) 588e05df3b1SJaegeuk Kim return PTR_ERR(npage[0]); 5891646cfacSJaegeuk Kim } 590f1a3b98eSJaegeuk Kim 591f1a3b98eSJaegeuk Kim /* if inline_data is set, should not report any block indices */ 592f1a3b98eSJaegeuk Kim if (f2fs_has_inline_data(dn->inode) && index) { 59376629165SJaegeuk Kim err = -ENOENT; 594f1a3b98eSJaegeuk Kim f2fs_put_page(npage[0], 1); 595f1a3b98eSJaegeuk Kim goto release_out; 596f1a3b98eSJaegeuk Kim } 597f1a3b98eSJaegeuk Kim 598e05df3b1SJaegeuk Kim parent = npage[0]; 59952c2db3fSChangman Lee if (level != 0) 600e05df3b1SJaegeuk Kim nids[1] = get_nid(parent, offset[0], true); 601e05df3b1SJaegeuk Kim dn->inode_page = npage[0]; 602e05df3b1SJaegeuk Kim dn->inode_page_locked = true; 603e05df3b1SJaegeuk Kim 604e05df3b1SJaegeuk Kim /* get indirect or direct nodes */ 605e05df3b1SJaegeuk Kim for (i = 1; i <= level; i++) { 606e05df3b1SJaegeuk Kim bool done = false; 607e05df3b1SJaegeuk Kim 608266e97a8SJaegeuk Kim if (!nids[i] && mode == ALLOC_NODE) { 609e05df3b1SJaegeuk Kim /* alloc new node */ 610e05df3b1SJaegeuk Kim if (!alloc_nid(sbi, &(nids[i]))) { 611e05df3b1SJaegeuk Kim err = -ENOSPC; 612e05df3b1SJaegeuk Kim goto release_pages; 613e05df3b1SJaegeuk Kim } 614e05df3b1SJaegeuk Kim 615e05df3b1SJaegeuk Kim dn->nid = nids[i]; 6168ae8f162SJaegeuk Kim npage[i] = new_node_page(dn, noffset[i], NULL); 617e05df3b1SJaegeuk Kim if (IS_ERR(npage[i])) { 618e05df3b1SJaegeuk Kim alloc_nid_failed(sbi, nids[i]); 619e05df3b1SJaegeuk Kim err = PTR_ERR(npage[i]); 620e05df3b1SJaegeuk Kim goto release_pages; 621e05df3b1SJaegeuk Kim } 622e05df3b1SJaegeuk Kim 623e05df3b1SJaegeuk Kim set_nid(parent, offset[i - 1], nids[i], i == 1); 624e05df3b1SJaegeuk Kim alloc_nid_done(sbi, nids[i]); 625e05df3b1SJaegeuk Kim done = true; 626266e97a8SJaegeuk Kim } else if (mode == LOOKUP_NODE_RA && i == level && level > 1) { 627e05df3b1SJaegeuk Kim npage[i] = get_node_page_ra(parent, offset[i - 1]); 628e05df3b1SJaegeuk Kim if (IS_ERR(npage[i])) { 629e05df3b1SJaegeuk Kim err = PTR_ERR(npage[i]); 630e05df3b1SJaegeuk Kim goto release_pages; 631e05df3b1SJaegeuk Kim } 632e05df3b1SJaegeuk Kim done = true; 633e05df3b1SJaegeuk Kim } 634e05df3b1SJaegeuk Kim if (i == 1) { 635e05df3b1SJaegeuk Kim dn->inode_page_locked = false; 636e05df3b1SJaegeuk Kim unlock_page(parent); 637e05df3b1SJaegeuk Kim } else { 638e05df3b1SJaegeuk Kim f2fs_put_page(parent, 1); 639e05df3b1SJaegeuk Kim } 640e05df3b1SJaegeuk Kim 641e05df3b1SJaegeuk Kim if (!done) { 642e05df3b1SJaegeuk Kim npage[i] = get_node_page(sbi, nids[i]); 643e05df3b1SJaegeuk Kim if (IS_ERR(npage[i])) { 644e05df3b1SJaegeuk Kim err = PTR_ERR(npage[i]); 645e05df3b1SJaegeuk Kim f2fs_put_page(npage[0], 0); 646e05df3b1SJaegeuk Kim goto release_out; 647e05df3b1SJaegeuk Kim } 648e05df3b1SJaegeuk Kim } 649e05df3b1SJaegeuk Kim if (i < level) { 650e05df3b1SJaegeuk Kim parent = npage[i]; 651e05df3b1SJaegeuk Kim nids[i + 1] = get_nid(parent, offset[i], false); 652e05df3b1SJaegeuk Kim } 653e05df3b1SJaegeuk Kim } 654e05df3b1SJaegeuk Kim dn->nid = nids[level]; 655e05df3b1SJaegeuk Kim dn->ofs_in_node = offset[level]; 656e05df3b1SJaegeuk Kim dn->node_page = npage[level]; 657e05df3b1SJaegeuk Kim dn->data_blkaddr = datablock_addr(dn->node_page, dn->ofs_in_node); 658e05df3b1SJaegeuk Kim return 0; 659e05df3b1SJaegeuk Kim 660e05df3b1SJaegeuk Kim release_pages: 661e05df3b1SJaegeuk Kim f2fs_put_page(parent, 1); 662e05df3b1SJaegeuk Kim if (i > 1) 663e05df3b1SJaegeuk Kim f2fs_put_page(npage[0], 0); 664e05df3b1SJaegeuk Kim release_out: 665e05df3b1SJaegeuk Kim dn->inode_page = NULL; 666e05df3b1SJaegeuk Kim dn->node_page = NULL; 6673cf45747SChao Yu if (err == -ENOENT) { 6683cf45747SChao Yu dn->cur_level = i; 6693cf45747SChao Yu dn->max_level = level; 6700a2aa8fbSJaegeuk Kim dn->ofs_in_node = offset[level]; 6713cf45747SChao Yu } 672e05df3b1SJaegeuk Kim return err; 673e05df3b1SJaegeuk Kim } 674e05df3b1SJaegeuk Kim 675e05df3b1SJaegeuk Kim static void truncate_node(struct dnode_of_data *dn) 676e05df3b1SJaegeuk Kim { 6774081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode); 678e05df3b1SJaegeuk Kim struct node_info ni; 679e05df3b1SJaegeuk Kim 680e05df3b1SJaegeuk Kim get_node_info(sbi, dn->nid, &ni); 68171e9fec5SJaegeuk Kim if (dn->inode->i_blocks == 0) { 6829850cf4aSJaegeuk Kim f2fs_bug_on(sbi, ni.blk_addr != NULL_ADDR); 68371e9fec5SJaegeuk Kim goto invalidate; 68471e9fec5SJaegeuk Kim } 6859850cf4aSJaegeuk Kim f2fs_bug_on(sbi, ni.blk_addr == NULL_ADDR); 686e05df3b1SJaegeuk Kim 687e05df3b1SJaegeuk Kim /* Deallocate node address */ 68871e9fec5SJaegeuk Kim invalidate_blocks(sbi, ni.blk_addr); 689ef86d709SGu Zheng dec_valid_node_count(sbi, dn->inode); 690479f40c4SJaegeuk Kim set_node_addr(sbi, &ni, NULL_ADDR, false); 691e05df3b1SJaegeuk Kim 692e05df3b1SJaegeuk Kim if (dn->nid == dn->inode->i_ino) { 693e05df3b1SJaegeuk Kim remove_orphan_inode(sbi, dn->nid); 694e05df3b1SJaegeuk Kim dec_valid_inode_count(sbi); 6950f18b462SJaegeuk Kim f2fs_inode_synced(dn->inode); 696e05df3b1SJaegeuk Kim } 69771e9fec5SJaegeuk Kim invalidate: 698e05df3b1SJaegeuk Kim clear_node_page_dirty(dn->node_page); 699caf0047eSChao Yu set_sbi_flag(sbi, SBI_IS_DIRTY); 700e05df3b1SJaegeuk Kim 701e05df3b1SJaegeuk Kim f2fs_put_page(dn->node_page, 1); 702bf39c00aSJaegeuk Kim 703bf39c00aSJaegeuk Kim invalidate_mapping_pages(NODE_MAPPING(sbi), 704bf39c00aSJaegeuk Kim dn->node_page->index, dn->node_page->index); 705bf39c00aSJaegeuk Kim 706e05df3b1SJaegeuk Kim dn->node_page = NULL; 70751dd6249SNamjae Jeon trace_f2fs_truncate_node(dn->inode, dn->nid, ni.blk_addr); 708e05df3b1SJaegeuk Kim } 709e05df3b1SJaegeuk Kim 710e05df3b1SJaegeuk Kim static int truncate_dnode(struct dnode_of_data *dn) 711e05df3b1SJaegeuk Kim { 712e05df3b1SJaegeuk Kim struct page *page; 713e05df3b1SJaegeuk Kim 714e05df3b1SJaegeuk Kim if (dn->nid == 0) 715e05df3b1SJaegeuk Kim return 1; 716e05df3b1SJaegeuk Kim 717e05df3b1SJaegeuk Kim /* get direct node */ 7184081363fSJaegeuk Kim page = get_node_page(F2FS_I_SB(dn->inode), dn->nid); 719e05df3b1SJaegeuk Kim if (IS_ERR(page) && PTR_ERR(page) == -ENOENT) 720e05df3b1SJaegeuk Kim return 1; 721e05df3b1SJaegeuk Kim else if (IS_ERR(page)) 722e05df3b1SJaegeuk Kim return PTR_ERR(page); 723e05df3b1SJaegeuk Kim 724e05df3b1SJaegeuk Kim /* Make dnode_of_data for parameter */ 725e05df3b1SJaegeuk Kim dn->node_page = page; 726e05df3b1SJaegeuk Kim dn->ofs_in_node = 0; 727e05df3b1SJaegeuk Kim truncate_data_blocks(dn); 728e05df3b1SJaegeuk Kim truncate_node(dn); 729e05df3b1SJaegeuk Kim return 1; 730e05df3b1SJaegeuk Kim } 731e05df3b1SJaegeuk Kim 732e05df3b1SJaegeuk Kim static int truncate_nodes(struct dnode_of_data *dn, unsigned int nofs, 733e05df3b1SJaegeuk Kim int ofs, int depth) 734e05df3b1SJaegeuk Kim { 735e05df3b1SJaegeuk Kim struct dnode_of_data rdn = *dn; 736e05df3b1SJaegeuk Kim struct page *page; 737e05df3b1SJaegeuk Kim struct f2fs_node *rn; 738e05df3b1SJaegeuk Kim nid_t child_nid; 739e05df3b1SJaegeuk Kim unsigned int child_nofs; 740e05df3b1SJaegeuk Kim int freed = 0; 741e05df3b1SJaegeuk Kim int i, ret; 742e05df3b1SJaegeuk Kim 743e05df3b1SJaegeuk Kim if (dn->nid == 0) 744e05df3b1SJaegeuk Kim return NIDS_PER_BLOCK + 1; 745e05df3b1SJaegeuk Kim 74651dd6249SNamjae Jeon trace_f2fs_truncate_nodes_enter(dn->inode, dn->nid, dn->data_blkaddr); 74751dd6249SNamjae Jeon 7484081363fSJaegeuk Kim page = get_node_page(F2FS_I_SB(dn->inode), dn->nid); 74951dd6249SNamjae Jeon if (IS_ERR(page)) { 75051dd6249SNamjae Jeon trace_f2fs_truncate_nodes_exit(dn->inode, PTR_ERR(page)); 751e05df3b1SJaegeuk Kim return PTR_ERR(page); 75251dd6249SNamjae Jeon } 753e05df3b1SJaegeuk Kim 75479344efbSJaegeuk Kim ra_node_pages(page, ofs, NIDS_PER_BLOCK); 75579344efbSJaegeuk Kim 75645590710SGu Zheng rn = F2FS_NODE(page); 757e05df3b1SJaegeuk Kim if (depth < 3) { 758e05df3b1SJaegeuk Kim for (i = ofs; i < NIDS_PER_BLOCK; i++, freed++) { 759e05df3b1SJaegeuk Kim child_nid = le32_to_cpu(rn->in.nid[i]); 760e05df3b1SJaegeuk Kim if (child_nid == 0) 761e05df3b1SJaegeuk Kim continue; 762e05df3b1SJaegeuk Kim rdn.nid = child_nid; 763e05df3b1SJaegeuk Kim ret = truncate_dnode(&rdn); 764e05df3b1SJaegeuk Kim if (ret < 0) 765e05df3b1SJaegeuk Kim goto out_err; 76612719ae1SJaegeuk Kim if (set_nid(page, i, 0, false)) 76793bae099SJaegeuk Kim dn->node_changed = true; 768e05df3b1SJaegeuk Kim } 769e05df3b1SJaegeuk Kim } else { 770e05df3b1SJaegeuk Kim child_nofs = nofs + ofs * (NIDS_PER_BLOCK + 1) + 1; 771e05df3b1SJaegeuk Kim for (i = ofs; i < NIDS_PER_BLOCK; i++) { 772e05df3b1SJaegeuk Kim child_nid = le32_to_cpu(rn->in.nid[i]); 773e05df3b1SJaegeuk Kim if (child_nid == 0) { 774e05df3b1SJaegeuk Kim child_nofs += NIDS_PER_BLOCK + 1; 775e05df3b1SJaegeuk Kim continue; 776e05df3b1SJaegeuk Kim } 777e05df3b1SJaegeuk Kim rdn.nid = child_nid; 778e05df3b1SJaegeuk Kim ret = truncate_nodes(&rdn, child_nofs, 0, depth - 1); 779e05df3b1SJaegeuk Kim if (ret == (NIDS_PER_BLOCK + 1)) { 78012719ae1SJaegeuk Kim if (set_nid(page, i, 0, false)) 78193bae099SJaegeuk Kim dn->node_changed = true; 782e05df3b1SJaegeuk Kim child_nofs += ret; 783e05df3b1SJaegeuk Kim } else if (ret < 0 && ret != -ENOENT) { 784e05df3b1SJaegeuk Kim goto out_err; 785e05df3b1SJaegeuk Kim } 786e05df3b1SJaegeuk Kim } 787e05df3b1SJaegeuk Kim freed = child_nofs; 788e05df3b1SJaegeuk Kim } 789e05df3b1SJaegeuk Kim 790e05df3b1SJaegeuk Kim if (!ofs) { 791e05df3b1SJaegeuk Kim /* remove current indirect node */ 792e05df3b1SJaegeuk Kim dn->node_page = page; 793e05df3b1SJaegeuk Kim truncate_node(dn); 794e05df3b1SJaegeuk Kim freed++; 795e05df3b1SJaegeuk Kim } else { 796e05df3b1SJaegeuk Kim f2fs_put_page(page, 1); 797e05df3b1SJaegeuk Kim } 79851dd6249SNamjae Jeon trace_f2fs_truncate_nodes_exit(dn->inode, freed); 799e05df3b1SJaegeuk Kim return freed; 800e05df3b1SJaegeuk Kim 801e05df3b1SJaegeuk Kim out_err: 802e05df3b1SJaegeuk Kim f2fs_put_page(page, 1); 80351dd6249SNamjae Jeon trace_f2fs_truncate_nodes_exit(dn->inode, ret); 804e05df3b1SJaegeuk Kim return ret; 805e05df3b1SJaegeuk Kim } 806e05df3b1SJaegeuk Kim 807e05df3b1SJaegeuk Kim static int truncate_partial_nodes(struct dnode_of_data *dn, 808e05df3b1SJaegeuk Kim struct f2fs_inode *ri, int *offset, int depth) 809e05df3b1SJaegeuk Kim { 810e05df3b1SJaegeuk Kim struct page *pages[2]; 811e05df3b1SJaegeuk Kim nid_t nid[3]; 812e05df3b1SJaegeuk Kim nid_t child_nid; 813e05df3b1SJaegeuk Kim int err = 0; 814e05df3b1SJaegeuk Kim int i; 815e05df3b1SJaegeuk Kim int idx = depth - 2; 816e05df3b1SJaegeuk Kim 817e05df3b1SJaegeuk Kim nid[0] = le32_to_cpu(ri->i_nid[offset[0] - NODE_DIR1_BLOCK]); 818e05df3b1SJaegeuk Kim if (!nid[0]) 819e05df3b1SJaegeuk Kim return 0; 820e05df3b1SJaegeuk Kim 821e05df3b1SJaegeuk Kim /* get indirect nodes in the path */ 822a225dca3Sshifei10.ge for (i = 0; i < idx + 1; i++) { 823e1c42045Sarter97 /* reference count'll be increased */ 8244081363fSJaegeuk Kim pages[i] = get_node_page(F2FS_I_SB(dn->inode), nid[i]); 825e05df3b1SJaegeuk Kim if (IS_ERR(pages[i])) { 826e05df3b1SJaegeuk Kim err = PTR_ERR(pages[i]); 827a225dca3Sshifei10.ge idx = i - 1; 828e05df3b1SJaegeuk Kim goto fail; 829e05df3b1SJaegeuk Kim } 830e05df3b1SJaegeuk Kim nid[i + 1] = get_nid(pages[i], offset[i + 1], false); 831e05df3b1SJaegeuk Kim } 832e05df3b1SJaegeuk Kim 83379344efbSJaegeuk Kim ra_node_pages(pages[idx], offset[idx + 1], NIDS_PER_BLOCK); 83479344efbSJaegeuk Kim 835e05df3b1SJaegeuk Kim /* free direct nodes linked to a partial indirect node */ 836a225dca3Sshifei10.ge for (i = offset[idx + 1]; i < NIDS_PER_BLOCK; i++) { 837e05df3b1SJaegeuk Kim child_nid = get_nid(pages[idx], i, false); 838e05df3b1SJaegeuk Kim if (!child_nid) 839e05df3b1SJaegeuk Kim continue; 840e05df3b1SJaegeuk Kim dn->nid = child_nid; 841e05df3b1SJaegeuk Kim err = truncate_dnode(dn); 842e05df3b1SJaegeuk Kim if (err < 0) 843e05df3b1SJaegeuk Kim goto fail; 84412719ae1SJaegeuk Kim if (set_nid(pages[idx], i, 0, false)) 84593bae099SJaegeuk Kim dn->node_changed = true; 846e05df3b1SJaegeuk Kim } 847e05df3b1SJaegeuk Kim 848a225dca3Sshifei10.ge if (offset[idx + 1] == 0) { 849e05df3b1SJaegeuk Kim dn->node_page = pages[idx]; 850e05df3b1SJaegeuk Kim dn->nid = nid[idx]; 851e05df3b1SJaegeuk Kim truncate_node(dn); 852e05df3b1SJaegeuk Kim } else { 853e05df3b1SJaegeuk Kim f2fs_put_page(pages[idx], 1); 854e05df3b1SJaegeuk Kim } 855e05df3b1SJaegeuk Kim offset[idx]++; 856a225dca3Sshifei10.ge offset[idx + 1] = 0; 857a225dca3Sshifei10.ge idx--; 858e05df3b1SJaegeuk Kim fail: 859a225dca3Sshifei10.ge for (i = idx; i >= 0; i--) 860e05df3b1SJaegeuk Kim f2fs_put_page(pages[i], 1); 86151dd6249SNamjae Jeon 86251dd6249SNamjae Jeon trace_f2fs_truncate_partial_nodes(dn->inode, nid, depth, err); 86351dd6249SNamjae Jeon 864e05df3b1SJaegeuk Kim return err; 865e05df3b1SJaegeuk Kim } 866e05df3b1SJaegeuk Kim 8670a8165d7SJaegeuk Kim /* 868e05df3b1SJaegeuk Kim * All the block addresses of data and nodes should be nullified. 869e05df3b1SJaegeuk Kim */ 870e05df3b1SJaegeuk Kim int truncate_inode_blocks(struct inode *inode, pgoff_t from) 871e05df3b1SJaegeuk Kim { 8724081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_I_SB(inode); 873e05df3b1SJaegeuk Kim int err = 0, cont = 1; 874e05df3b1SJaegeuk Kim int level, offset[4], noffset[4]; 8757dd690c8SJaegeuk Kim unsigned int nofs = 0; 87658bfaf44SJaegeuk Kim struct f2fs_inode *ri; 877e05df3b1SJaegeuk Kim struct dnode_of_data dn; 878e05df3b1SJaegeuk Kim struct page *page; 879e05df3b1SJaegeuk Kim 88051dd6249SNamjae Jeon trace_f2fs_truncate_inode_blocks_enter(inode, from); 88151dd6249SNamjae Jeon 88281ca7350SChao Yu level = get_node_path(inode, from, offset, noffset); 883ff373558SJaegeuk Kim 884e05df3b1SJaegeuk Kim page = get_node_page(sbi, inode->i_ino); 88551dd6249SNamjae Jeon if (IS_ERR(page)) { 88651dd6249SNamjae Jeon trace_f2fs_truncate_inode_blocks_exit(inode, PTR_ERR(page)); 887e05df3b1SJaegeuk Kim return PTR_ERR(page); 88851dd6249SNamjae Jeon } 889e05df3b1SJaegeuk Kim 890e05df3b1SJaegeuk Kim set_new_dnode(&dn, inode, page, NULL, 0); 891e05df3b1SJaegeuk Kim unlock_page(page); 892e05df3b1SJaegeuk Kim 89358bfaf44SJaegeuk Kim ri = F2FS_INODE(page); 894e05df3b1SJaegeuk Kim switch (level) { 895e05df3b1SJaegeuk Kim case 0: 896e05df3b1SJaegeuk Kim case 1: 897e05df3b1SJaegeuk Kim nofs = noffset[1]; 898e05df3b1SJaegeuk Kim break; 899e05df3b1SJaegeuk Kim case 2: 900e05df3b1SJaegeuk Kim nofs = noffset[1]; 901e05df3b1SJaegeuk Kim if (!offset[level - 1]) 902e05df3b1SJaegeuk Kim goto skip_partial; 90358bfaf44SJaegeuk Kim err = truncate_partial_nodes(&dn, ri, offset, level); 904e05df3b1SJaegeuk Kim if (err < 0 && err != -ENOENT) 905e05df3b1SJaegeuk Kim goto fail; 906e05df3b1SJaegeuk Kim nofs += 1 + NIDS_PER_BLOCK; 907e05df3b1SJaegeuk Kim break; 908e05df3b1SJaegeuk Kim case 3: 909e05df3b1SJaegeuk Kim nofs = 5 + 2 * NIDS_PER_BLOCK; 910e05df3b1SJaegeuk Kim if (!offset[level - 1]) 911e05df3b1SJaegeuk Kim goto skip_partial; 91258bfaf44SJaegeuk Kim err = truncate_partial_nodes(&dn, ri, offset, level); 913e05df3b1SJaegeuk Kim if (err < 0 && err != -ENOENT) 914e05df3b1SJaegeuk Kim goto fail; 915e05df3b1SJaegeuk Kim break; 916e05df3b1SJaegeuk Kim default: 917e05df3b1SJaegeuk Kim BUG(); 918e05df3b1SJaegeuk Kim } 919e05df3b1SJaegeuk Kim 920e05df3b1SJaegeuk Kim skip_partial: 921e05df3b1SJaegeuk Kim while (cont) { 92258bfaf44SJaegeuk Kim dn.nid = le32_to_cpu(ri->i_nid[offset[0] - NODE_DIR1_BLOCK]); 923e05df3b1SJaegeuk Kim switch (offset[0]) { 924e05df3b1SJaegeuk Kim case NODE_DIR1_BLOCK: 925e05df3b1SJaegeuk Kim case NODE_DIR2_BLOCK: 926e05df3b1SJaegeuk Kim err = truncate_dnode(&dn); 927e05df3b1SJaegeuk Kim break; 928e05df3b1SJaegeuk Kim 929e05df3b1SJaegeuk Kim case NODE_IND1_BLOCK: 930e05df3b1SJaegeuk Kim case NODE_IND2_BLOCK: 931e05df3b1SJaegeuk Kim err = truncate_nodes(&dn, nofs, offset[1], 2); 932e05df3b1SJaegeuk Kim break; 933e05df3b1SJaegeuk Kim 934e05df3b1SJaegeuk Kim case NODE_DIND_BLOCK: 935e05df3b1SJaegeuk Kim err = truncate_nodes(&dn, nofs, offset[1], 3); 936e05df3b1SJaegeuk Kim cont = 0; 937e05df3b1SJaegeuk Kim break; 938e05df3b1SJaegeuk Kim 939e05df3b1SJaegeuk Kim default: 940e05df3b1SJaegeuk Kim BUG(); 941e05df3b1SJaegeuk Kim } 942e05df3b1SJaegeuk Kim if (err < 0 && err != -ENOENT) 943e05df3b1SJaegeuk Kim goto fail; 944e05df3b1SJaegeuk Kim if (offset[1] == 0 && 94558bfaf44SJaegeuk Kim ri->i_nid[offset[0] - NODE_DIR1_BLOCK]) { 946e05df3b1SJaegeuk Kim lock_page(page); 947ff373558SJaegeuk Kim BUG_ON(page->mapping != NODE_MAPPING(sbi)); 948fec1d657SJaegeuk Kim f2fs_wait_on_page_writeback(page, NODE, true); 94958bfaf44SJaegeuk Kim ri->i_nid[offset[0] - NODE_DIR1_BLOCK] = 0; 950e05df3b1SJaegeuk Kim set_page_dirty(page); 951e05df3b1SJaegeuk Kim unlock_page(page); 952e05df3b1SJaegeuk Kim } 953e05df3b1SJaegeuk Kim offset[1] = 0; 954e05df3b1SJaegeuk Kim offset[0]++; 955e05df3b1SJaegeuk Kim nofs += err; 956e05df3b1SJaegeuk Kim } 957e05df3b1SJaegeuk Kim fail: 958e05df3b1SJaegeuk Kim f2fs_put_page(page, 0); 95951dd6249SNamjae Jeon trace_f2fs_truncate_inode_blocks_exit(inode, err); 960e05df3b1SJaegeuk Kim return err > 0 ? 0 : err; 961e05df3b1SJaegeuk Kim } 962e05df3b1SJaegeuk Kim 9634f16fb0fSJaegeuk Kim int truncate_xattr_node(struct inode *inode, struct page *page) 9644f16fb0fSJaegeuk Kim { 9654081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_I_SB(inode); 9664f16fb0fSJaegeuk Kim nid_t nid = F2FS_I(inode)->i_xattr_nid; 9674f16fb0fSJaegeuk Kim struct dnode_of_data dn; 9684f16fb0fSJaegeuk Kim struct page *npage; 9694f16fb0fSJaegeuk Kim 9704f16fb0fSJaegeuk Kim if (!nid) 9714f16fb0fSJaegeuk Kim return 0; 9724f16fb0fSJaegeuk Kim 9734f16fb0fSJaegeuk Kim npage = get_node_page(sbi, nid); 9744f16fb0fSJaegeuk Kim if (IS_ERR(npage)) 9754f16fb0fSJaegeuk Kim return PTR_ERR(npage); 9764f16fb0fSJaegeuk Kim 977205b9822SJaegeuk Kim f2fs_i_xnid_write(inode, 0); 97865985d93SJaegeuk Kim 9794f16fb0fSJaegeuk Kim set_new_dnode(&dn, inode, page, npage, nid); 9804f16fb0fSJaegeuk Kim 9814f16fb0fSJaegeuk Kim if (page) 98201d2d1aaSChao Yu dn.inode_page_locked = true; 9834f16fb0fSJaegeuk Kim truncate_node(&dn); 9844f16fb0fSJaegeuk Kim return 0; 9854f16fb0fSJaegeuk Kim } 9864f16fb0fSJaegeuk Kim 98739936837SJaegeuk Kim /* 9884f4124d0SChao Yu * Caller should grab and release a rwsem by calling f2fs_lock_op() and 9894f4124d0SChao Yu * f2fs_unlock_op(). 99039936837SJaegeuk Kim */ 99113ec7297SChao Yu int remove_inode_page(struct inode *inode) 992e05df3b1SJaegeuk Kim { 993e05df3b1SJaegeuk Kim struct dnode_of_data dn; 99413ec7297SChao Yu int err; 995e05df3b1SJaegeuk Kim 996c2e69583SJaegeuk Kim set_new_dnode(&dn, inode, NULL, NULL, inode->i_ino); 99713ec7297SChao Yu err = get_dnode_of_data(&dn, 0, LOOKUP_NODE); 99813ec7297SChao Yu if (err) 99913ec7297SChao Yu return err; 1000e05df3b1SJaegeuk Kim 100113ec7297SChao Yu err = truncate_xattr_node(inode, dn.inode_page); 100213ec7297SChao Yu if (err) { 1003c2e69583SJaegeuk Kim f2fs_put_dnode(&dn); 100413ec7297SChao Yu return err; 1005e05df3b1SJaegeuk Kim } 1006c2e69583SJaegeuk Kim 1007c2e69583SJaegeuk Kim /* remove potential inline_data blocks */ 1008c2e69583SJaegeuk Kim if (S_ISREG(inode->i_mode) || S_ISDIR(inode->i_mode) || 1009c2e69583SJaegeuk Kim S_ISLNK(inode->i_mode)) 1010c2e69583SJaegeuk Kim truncate_data_blocks_range(&dn, 1); 1011c2e69583SJaegeuk Kim 1012e1c42045Sarter97 /* 0 is possible, after f2fs_new_inode() has failed */ 10139850cf4aSJaegeuk Kim f2fs_bug_on(F2FS_I_SB(inode), 10149850cf4aSJaegeuk Kim inode->i_blocks != 0 && inode->i_blocks != 1); 1015c2e69583SJaegeuk Kim 1016c2e69583SJaegeuk Kim /* will put inode & node pages */ 1017e05df3b1SJaegeuk Kim truncate_node(&dn); 101813ec7297SChao Yu return 0; 1019e05df3b1SJaegeuk Kim } 1020e05df3b1SJaegeuk Kim 1021a014e037SJaegeuk Kim struct page *new_inode_page(struct inode *inode) 1022e05df3b1SJaegeuk Kim { 1023e05df3b1SJaegeuk Kim struct dnode_of_data dn; 1024e05df3b1SJaegeuk Kim 1025e05df3b1SJaegeuk Kim /* allocate inode page for new inode */ 1026e05df3b1SJaegeuk Kim set_new_dnode(&dn, inode, NULL, NULL, inode->i_ino); 102744a83ff6SJaegeuk Kim 102844a83ff6SJaegeuk Kim /* caller should f2fs_put_page(page, 1); */ 10298ae8f162SJaegeuk Kim return new_node_page(&dn, 0, NULL); 1030e05df3b1SJaegeuk Kim } 1031e05df3b1SJaegeuk Kim 10328ae8f162SJaegeuk Kim struct page *new_node_page(struct dnode_of_data *dn, 10338ae8f162SJaegeuk Kim unsigned int ofs, struct page *ipage) 1034e05df3b1SJaegeuk Kim { 10354081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode); 103625cc5d3bSJaegeuk Kim struct node_info new_ni; 1037e05df3b1SJaegeuk Kim struct page *page; 1038e05df3b1SJaegeuk Kim int err; 1039e05df3b1SJaegeuk Kim 104091942321SJaegeuk Kim if (unlikely(is_inode_flag_set(dn->inode, FI_NO_ALLOC))) 1041e05df3b1SJaegeuk Kim return ERR_PTR(-EPERM); 1042e05df3b1SJaegeuk Kim 1043300e129cSJaegeuk Kim page = f2fs_grab_cache_page(NODE_MAPPING(sbi), dn->nid, false); 1044e05df3b1SJaegeuk Kim if (!page) 1045e05df3b1SJaegeuk Kim return ERR_PTR(-ENOMEM); 1046e05df3b1SJaegeuk Kim 10476bacf52fSJaegeuk Kim if (unlikely(!inc_valid_node_count(sbi, dn->inode))) { 10489c02740cSJaegeuk Kim err = -ENOSPC; 10499c02740cSJaegeuk Kim goto fail; 10509c02740cSJaegeuk Kim } 105125cc5d3bSJaegeuk Kim #ifdef CONFIG_F2FS_CHECK_FS 105225cc5d3bSJaegeuk Kim get_node_info(sbi, dn->nid, &new_ni); 105325cc5d3bSJaegeuk Kim f2fs_bug_on(sbi, new_ni.blk_addr != NULL_ADDR); 105425cc5d3bSJaegeuk Kim #endif 105525cc5d3bSJaegeuk Kim new_ni.nid = dn->nid; 1056e05df3b1SJaegeuk Kim new_ni.ino = dn->inode->i_ino; 105725cc5d3bSJaegeuk Kim new_ni.blk_addr = NULL_ADDR; 105825cc5d3bSJaegeuk Kim new_ni.flag = 0; 105925cc5d3bSJaegeuk Kim new_ni.version = 0; 1060479f40c4SJaegeuk Kim set_node_addr(sbi, &new_ni, NEW_ADDR, false); 10619c02740cSJaegeuk Kim 1062fec1d657SJaegeuk Kim f2fs_wait_on_page_writeback(page, NODE, true); 10639c02740cSJaegeuk Kim fill_node_footer(page, dn->nid, dn->inode->i_ino, ofs, true); 1064398b1ac5SJaegeuk Kim set_cold_node(dn->inode, page); 1065237c0790SJaegeuk Kim if (!PageUptodate(page)) 10669c02740cSJaegeuk Kim SetPageUptodate(page); 106712719ae1SJaegeuk Kim if (set_page_dirty(page)) 106812719ae1SJaegeuk Kim dn->node_changed = true; 1069e05df3b1SJaegeuk Kim 10704bc8e9bcSChao Yu if (f2fs_has_xattr_block(ofs)) 1071205b9822SJaegeuk Kim f2fs_i_xnid_write(dn->inode, dn->nid); 1072479bd73aSJaegeuk Kim 1073e05df3b1SJaegeuk Kim if (ofs == 0) 1074e05df3b1SJaegeuk Kim inc_valid_inode_count(sbi); 1075e05df3b1SJaegeuk Kim return page; 1076e05df3b1SJaegeuk Kim 1077e05df3b1SJaegeuk Kim fail: 107871e9fec5SJaegeuk Kim clear_node_page_dirty(page); 1079e05df3b1SJaegeuk Kim f2fs_put_page(page, 1); 1080e05df3b1SJaegeuk Kim return ERR_PTR(err); 1081e05df3b1SJaegeuk Kim } 1082e05df3b1SJaegeuk Kim 108356ae674cSJaegeuk Kim /* 108456ae674cSJaegeuk Kim * Caller should do after getting the following values. 108556ae674cSJaegeuk Kim * 0: f2fs_put_page(page, 0) 108686531d6bSJaegeuk Kim * LOCKED_PAGE or error: f2fs_put_page(page, 1) 108756ae674cSJaegeuk Kim */ 108804d328deSMike Christie static int read_node_page(struct page *page, int op_flags) 1089e05df3b1SJaegeuk Kim { 10904081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_P_SB(page); 1091e05df3b1SJaegeuk Kim struct node_info ni; 1092cf04e8ebSJaegeuk Kim struct f2fs_io_info fio = { 109305ca3632SJaegeuk Kim .sbi = sbi, 1094cf04e8ebSJaegeuk Kim .type = NODE, 109504d328deSMike Christie .op = REQ_OP_READ, 109604d328deSMike Christie .op_flags = op_flags, 109705ca3632SJaegeuk Kim .page = page, 10984375a336SJaegeuk Kim .encrypted_page = NULL, 1099cf04e8ebSJaegeuk Kim }; 1100e05df3b1SJaegeuk Kim 11013bdad3c7SJaegeuk Kim if (PageUptodate(page)) 11023bdad3c7SJaegeuk Kim return LOCKED_PAGE; 11033bdad3c7SJaegeuk Kim 1104e05df3b1SJaegeuk Kim get_node_info(sbi, page->index, &ni); 1105e05df3b1SJaegeuk Kim 11066bacf52fSJaegeuk Kim if (unlikely(ni.blk_addr == NULL_ADDR)) { 11072bca1e23SJaegeuk Kim ClearPageUptodate(page); 1108e05df3b1SJaegeuk Kim return -ENOENT; 1109393ff91fSJaegeuk Kim } 1110393ff91fSJaegeuk Kim 11117a9d7548SChao Yu fio.new_blkaddr = fio.old_blkaddr = ni.blk_addr; 111205ca3632SJaegeuk Kim return f2fs_submit_page_bio(&fio); 1113e05df3b1SJaegeuk Kim } 1114e05df3b1SJaegeuk Kim 11150a8165d7SJaegeuk Kim /* 1116e05df3b1SJaegeuk Kim * Readahead a node page 1117e05df3b1SJaegeuk Kim */ 1118e05df3b1SJaegeuk Kim void ra_node_page(struct f2fs_sb_info *sbi, nid_t nid) 1119e05df3b1SJaegeuk Kim { 1120e05df3b1SJaegeuk Kim struct page *apage; 112156ae674cSJaegeuk Kim int err; 1122e05df3b1SJaegeuk Kim 1123e8458725SChao Yu if (!nid) 1124e8458725SChao Yu return; 1125e8458725SChao Yu f2fs_bug_on(sbi, check_nid_range(sbi, nid)); 1126e8458725SChao Yu 1127999270deSFan Li rcu_read_lock(); 1128999270deSFan Li apage = radix_tree_lookup(&NODE_MAPPING(sbi)->page_tree, nid); 1129999270deSFan Li rcu_read_unlock(); 1130999270deSFan Li if (apage) 1131393ff91fSJaegeuk Kim return; 1132e05df3b1SJaegeuk Kim 1133300e129cSJaegeuk Kim apage = f2fs_grab_cache_page(NODE_MAPPING(sbi), nid, false); 1134e05df3b1SJaegeuk Kim if (!apage) 1135e05df3b1SJaegeuk Kim return; 1136e05df3b1SJaegeuk Kim 113770246286SChristoph Hellwig err = read_node_page(apage, REQ_RAHEAD); 113886531d6bSJaegeuk Kim f2fs_put_page(apage, err ? 1 : 0); 1139e05df3b1SJaegeuk Kim } 1140e05df3b1SJaegeuk Kim 114117a0ee55SJaegeuk Kim static struct page *__get_node_page(struct f2fs_sb_info *sbi, pgoff_t nid, 11420e022ea8SChao Yu struct page *parent, int start) 1143e05df3b1SJaegeuk Kim { 114456ae674cSJaegeuk Kim struct page *page; 114556ae674cSJaegeuk Kim int err; 11464aa69d56SJaegeuk Kim 11474aa69d56SJaegeuk Kim if (!nid) 11484aa69d56SJaegeuk Kim return ERR_PTR(-ENOENT); 11494aa69d56SJaegeuk Kim f2fs_bug_on(sbi, check_nid_range(sbi, nid)); 1150afcb7ca0SJaegeuk Kim repeat: 1151300e129cSJaegeuk Kim page = f2fs_grab_cache_page(NODE_MAPPING(sbi), nid, false); 1152e05df3b1SJaegeuk Kim if (!page) 1153e05df3b1SJaegeuk Kim return ERR_PTR(-ENOMEM); 1154e05df3b1SJaegeuk Kim 115570fd7614SChristoph Hellwig err = read_node_page(page, 0); 115686531d6bSJaegeuk Kim if (err < 0) { 115786531d6bSJaegeuk Kim f2fs_put_page(page, 1); 1158e05df3b1SJaegeuk Kim return ERR_PTR(err); 1159e1c51b9fSChao Yu } else if (err == LOCKED_PAGE) { 11601f258ec1SChao Yu err = 0; 1161e1c51b9fSChao Yu goto page_hit; 116286531d6bSJaegeuk Kim } 1163aaf96075SJaegeuk Kim 11640e022ea8SChao Yu if (parent) 116579344efbSJaegeuk Kim ra_node_pages(parent, start + 1, MAX_RA_NODE); 11660e022ea8SChao Yu 1167e1c51b9fSChao Yu lock_page(page); 1168e1c51b9fSChao Yu 11694ef51a8fSJaegeuk Kim if (unlikely(page->mapping != NODE_MAPPING(sbi))) { 1170afcb7ca0SJaegeuk Kim f2fs_put_page(page, 1); 1171afcb7ca0SJaegeuk Kim goto repeat; 1172afcb7ca0SJaegeuk Kim } 11731563ac75SChao Yu 11741f258ec1SChao Yu if (unlikely(!PageUptodate(page))) { 11751f258ec1SChao Yu err = -EIO; 11761563ac75SChao Yu goto out_err; 11771f258ec1SChao Yu } 1178e1c51b9fSChao Yu page_hit: 11790c9df7fbSYunlong Song if(unlikely(nid != nid_of_node(page))) { 11801f258ec1SChao Yu f2fs_msg(sbi->sb, KERN_WARNING, "inconsistent node block, " 11811f258ec1SChao Yu "nid:%lu, node_footer[nid:%u,ino:%u,ofs:%u,cpver:%llu,blkaddr:%u]", 11821f258ec1SChao Yu nid, nid_of_node(page), ino_of_node(page), 11831f258ec1SChao Yu ofs_of_node(page), cpver_of_node(page), 11841f258ec1SChao Yu next_blkaddr_of_node(page)); 11850c9df7fbSYunlong Song ClearPageUptodate(page); 11861f258ec1SChao Yu err = -EINVAL; 11870c9df7fbSYunlong Song out_err: 11880c9df7fbSYunlong Song f2fs_put_page(page, 1); 11891f258ec1SChao Yu return ERR_PTR(err); 11900c9df7fbSYunlong Song } 1191e05df3b1SJaegeuk Kim return page; 1192e05df3b1SJaegeuk Kim } 1193e05df3b1SJaegeuk Kim 11940e022ea8SChao Yu struct page *get_node_page(struct f2fs_sb_info *sbi, pgoff_t nid) 11950e022ea8SChao Yu { 11960e022ea8SChao Yu return __get_node_page(sbi, nid, NULL, 0); 11970e022ea8SChao Yu } 11980e022ea8SChao Yu 1199e05df3b1SJaegeuk Kim struct page *get_node_page_ra(struct page *parent, int start) 1200e05df3b1SJaegeuk Kim { 12014081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_P_SB(parent); 12020e022ea8SChao Yu nid_t nid = get_nid(parent, start, false); 1203e05df3b1SJaegeuk Kim 12040e022ea8SChao Yu return __get_node_page(sbi, nid, parent, start); 1205e05df3b1SJaegeuk Kim } 1206e05df3b1SJaegeuk Kim 12072049d4fcSJaegeuk Kim static void flush_inline_data(struct f2fs_sb_info *sbi, nid_t ino) 12082049d4fcSJaegeuk Kim { 12092049d4fcSJaegeuk Kim struct inode *inode; 12102049d4fcSJaegeuk Kim struct page *page; 12110f3311a8SChao Yu int ret; 12122049d4fcSJaegeuk Kim 12132049d4fcSJaegeuk Kim /* should flush inline_data before evict_inode */ 12142049d4fcSJaegeuk Kim inode = ilookup(sbi->sb, ino); 12152049d4fcSJaegeuk Kim if (!inode) 12162049d4fcSJaegeuk Kim return; 12172049d4fcSJaegeuk Kim 12184a6de50dSJaegeuk Kim page = pagecache_get_page(inode->i_mapping, 0, FGP_LOCK|FGP_NOWAIT, 0); 12192049d4fcSJaegeuk Kim if (!page) 12202049d4fcSJaegeuk Kim goto iput_out; 12212049d4fcSJaegeuk Kim 12222049d4fcSJaegeuk Kim if (!PageUptodate(page)) 12232049d4fcSJaegeuk Kim goto page_out; 12242049d4fcSJaegeuk Kim 12252049d4fcSJaegeuk Kim if (!PageDirty(page)) 12262049d4fcSJaegeuk Kim goto page_out; 12272049d4fcSJaegeuk Kim 12282049d4fcSJaegeuk Kim if (!clear_page_dirty_for_io(page)) 12292049d4fcSJaegeuk Kim goto page_out; 12302049d4fcSJaegeuk Kim 12310f3311a8SChao Yu ret = f2fs_write_inline_data(inode, page); 12322049d4fcSJaegeuk Kim inode_dec_dirty_pages(inode); 1233933439c8SChao Yu remove_dirty_inode(inode); 12340f3311a8SChao Yu if (ret) 12352049d4fcSJaegeuk Kim set_page_dirty(page); 12362049d4fcSJaegeuk Kim page_out: 12374a6de50dSJaegeuk Kim f2fs_put_page(page, 1); 12382049d4fcSJaegeuk Kim iput_out: 12392049d4fcSJaegeuk Kim iput(inode); 12402049d4fcSJaegeuk Kim } 12412049d4fcSJaegeuk Kim 1242da011cc0SChao Yu void move_node_page(struct page *node_page, int gc_type) 1243da011cc0SChao Yu { 1244da011cc0SChao Yu if (gc_type == FG_GC) { 1245da011cc0SChao Yu struct f2fs_sb_info *sbi = F2FS_P_SB(node_page); 1246da011cc0SChao Yu struct writeback_control wbc = { 1247da011cc0SChao Yu .sync_mode = WB_SYNC_ALL, 1248da011cc0SChao Yu .nr_to_write = 1, 1249da011cc0SChao Yu .for_reclaim = 0, 1250da011cc0SChao Yu }; 1251da011cc0SChao Yu 1252da011cc0SChao Yu set_page_dirty(node_page); 1253da011cc0SChao Yu f2fs_wait_on_page_writeback(node_page, NODE, true); 1254da011cc0SChao Yu 1255da011cc0SChao Yu f2fs_bug_on(sbi, PageWriteback(node_page)); 1256da011cc0SChao Yu if (!clear_page_dirty_for_io(node_page)) 1257da011cc0SChao Yu goto out_page; 1258da011cc0SChao Yu 1259da011cc0SChao Yu if (NODE_MAPPING(sbi)->a_ops->writepage(node_page, &wbc)) 1260da011cc0SChao Yu unlock_page(node_page); 1261da011cc0SChao Yu goto release_page; 1262da011cc0SChao Yu } else { 1263da011cc0SChao Yu /* set page dirty and write it */ 1264da011cc0SChao Yu if (!PageWriteback(node_page)) 1265da011cc0SChao Yu set_page_dirty(node_page); 1266da011cc0SChao Yu } 1267da011cc0SChao Yu out_page: 1268da011cc0SChao Yu unlock_page(node_page); 1269da011cc0SChao Yu release_page: 1270da011cc0SChao Yu f2fs_put_page(node_page, 0); 1271da011cc0SChao Yu } 1272da011cc0SChao Yu 1273608514deSJaegeuk Kim static struct page *last_fsync_dnode(struct f2fs_sb_info *sbi, nid_t ino) 1274e05df3b1SJaegeuk Kim { 1275e05df3b1SJaegeuk Kim pgoff_t index, end; 1276e05df3b1SJaegeuk Kim struct pagevec pvec; 1277608514deSJaegeuk Kim struct page *last_page = NULL; 127852681375SJaegeuk Kim 127952681375SJaegeuk Kim pagevec_init(&pvec, 0); 128052681375SJaegeuk Kim index = 0; 128152681375SJaegeuk Kim end = ULONG_MAX; 128252681375SJaegeuk Kim 128352681375SJaegeuk Kim while (index <= end) { 128452681375SJaegeuk Kim int i, nr_pages; 128552681375SJaegeuk Kim nr_pages = pagevec_lookup_tag(&pvec, NODE_MAPPING(sbi), &index, 128652681375SJaegeuk Kim PAGECACHE_TAG_DIRTY, 128752681375SJaegeuk Kim min(end - index, (pgoff_t)PAGEVEC_SIZE-1) + 1); 128852681375SJaegeuk Kim if (nr_pages == 0) 128952681375SJaegeuk Kim break; 129052681375SJaegeuk Kim 129152681375SJaegeuk Kim for (i = 0; i < nr_pages; i++) { 129252681375SJaegeuk Kim struct page *page = pvec.pages[i]; 129352681375SJaegeuk Kim 129452681375SJaegeuk Kim if (unlikely(f2fs_cp_error(sbi))) { 1295608514deSJaegeuk Kim f2fs_put_page(last_page, 0); 129652681375SJaegeuk Kim pagevec_release(&pvec); 1297608514deSJaegeuk Kim return ERR_PTR(-EIO); 129852681375SJaegeuk Kim } 129952681375SJaegeuk Kim 130052681375SJaegeuk Kim if (!IS_DNODE(page) || !is_cold_node(page)) 130152681375SJaegeuk Kim continue; 130252681375SJaegeuk Kim if (ino_of_node(page) != ino) 130352681375SJaegeuk Kim continue; 130452681375SJaegeuk Kim 130552681375SJaegeuk Kim lock_page(page); 130652681375SJaegeuk Kim 130752681375SJaegeuk Kim if (unlikely(page->mapping != NODE_MAPPING(sbi))) { 130852681375SJaegeuk Kim continue_unlock: 130952681375SJaegeuk Kim unlock_page(page); 131052681375SJaegeuk Kim continue; 131152681375SJaegeuk Kim } 131252681375SJaegeuk Kim if (ino_of_node(page) != ino) 131352681375SJaegeuk Kim goto continue_unlock; 131452681375SJaegeuk Kim 131552681375SJaegeuk Kim if (!PageDirty(page)) { 131652681375SJaegeuk Kim /* someone wrote it for us */ 131752681375SJaegeuk Kim goto continue_unlock; 131852681375SJaegeuk Kim } 131952681375SJaegeuk Kim 1320608514deSJaegeuk Kim if (last_page) 1321608514deSJaegeuk Kim f2fs_put_page(last_page, 0); 1322608514deSJaegeuk Kim 1323608514deSJaegeuk Kim get_page(page); 1324608514deSJaegeuk Kim last_page = page; 1325608514deSJaegeuk Kim unlock_page(page); 1326608514deSJaegeuk Kim } 1327608514deSJaegeuk Kim pagevec_release(&pvec); 1328608514deSJaegeuk Kim cond_resched(); 1329608514deSJaegeuk Kim } 1330608514deSJaegeuk Kim return last_page; 1331608514deSJaegeuk Kim } 1332608514deSJaegeuk Kim 1333d68f735bSJaegeuk Kim static int __write_node_page(struct page *page, bool atomic, bool *submitted, 1334faa24895SJaegeuk Kim struct writeback_control *wbc) 1335faa24895SJaegeuk Kim { 1336faa24895SJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_P_SB(page); 1337faa24895SJaegeuk Kim nid_t nid; 1338faa24895SJaegeuk Kim struct node_info ni; 1339faa24895SJaegeuk Kim struct f2fs_io_info fio = { 1340faa24895SJaegeuk Kim .sbi = sbi, 1341faa24895SJaegeuk Kim .type = NODE, 1342faa24895SJaegeuk Kim .op = REQ_OP_WRITE, 1343faa24895SJaegeuk Kim .op_flags = wbc_to_write_flags(wbc), 1344faa24895SJaegeuk Kim .page = page, 1345faa24895SJaegeuk Kim .encrypted_page = NULL, 1346d68f735bSJaegeuk Kim .submitted = false, 1347faa24895SJaegeuk Kim }; 1348faa24895SJaegeuk Kim 1349faa24895SJaegeuk Kim trace_f2fs_writepage(page, NODE); 1350faa24895SJaegeuk Kim 1351faa24895SJaegeuk Kim if (unlikely(is_sbi_flag_set(sbi, SBI_POR_DOING))) 1352faa24895SJaegeuk Kim goto redirty_out; 1353faa24895SJaegeuk Kim if (unlikely(f2fs_cp_error(sbi))) 1354faa24895SJaegeuk Kim goto redirty_out; 1355faa24895SJaegeuk Kim 1356faa24895SJaegeuk Kim /* get old block addr of this node page */ 1357faa24895SJaegeuk Kim nid = nid_of_node(page); 1358faa24895SJaegeuk Kim f2fs_bug_on(sbi, page->index != nid); 1359faa24895SJaegeuk Kim 1360faa24895SJaegeuk Kim if (wbc->for_reclaim) { 1361faa24895SJaegeuk Kim if (!down_read_trylock(&sbi->node_write)) 1362faa24895SJaegeuk Kim goto redirty_out; 1363faa24895SJaegeuk Kim } else { 1364faa24895SJaegeuk Kim down_read(&sbi->node_write); 1365faa24895SJaegeuk Kim } 1366faa24895SJaegeuk Kim 1367faa24895SJaegeuk Kim get_node_info(sbi, nid, &ni); 1368faa24895SJaegeuk Kim 1369faa24895SJaegeuk Kim /* This page is already truncated */ 1370faa24895SJaegeuk Kim if (unlikely(ni.blk_addr == NULL_ADDR)) { 1371faa24895SJaegeuk Kim ClearPageUptodate(page); 1372faa24895SJaegeuk Kim dec_page_count(sbi, F2FS_DIRTY_NODES); 1373faa24895SJaegeuk Kim up_read(&sbi->node_write); 1374faa24895SJaegeuk Kim unlock_page(page); 1375faa24895SJaegeuk Kim return 0; 1376faa24895SJaegeuk Kim } 1377faa24895SJaegeuk Kim 1378e7c75ab0SJaegeuk Kim if (atomic && !test_opt(sbi, NOBARRIER)) 1379e7c75ab0SJaegeuk Kim fio.op_flags |= REQ_PREFLUSH | REQ_FUA; 1380e7c75ab0SJaegeuk Kim 1381faa24895SJaegeuk Kim set_page_writeback(page); 1382faa24895SJaegeuk Kim fio.old_blkaddr = ni.blk_addr; 1383faa24895SJaegeuk Kim write_node_page(nid, &fio); 1384faa24895SJaegeuk Kim set_node_addr(sbi, &ni, fio.new_blkaddr, is_fsync_dnode(page)); 1385faa24895SJaegeuk Kim dec_page_count(sbi, F2FS_DIRTY_NODES); 1386faa24895SJaegeuk Kim up_read(&sbi->node_write); 1387faa24895SJaegeuk Kim 1388d68f735bSJaegeuk Kim if (wbc->for_reclaim) { 1389b9109b0eSJaegeuk Kim f2fs_submit_merged_write_cond(sbi, page->mapping->host, 0, 1390b9109b0eSJaegeuk Kim page->index, NODE); 1391d68f735bSJaegeuk Kim submitted = NULL; 1392d68f735bSJaegeuk Kim } 1393faa24895SJaegeuk Kim 1394faa24895SJaegeuk Kim unlock_page(page); 1395faa24895SJaegeuk Kim 1396d68f735bSJaegeuk Kim if (unlikely(f2fs_cp_error(sbi))) { 1397b9109b0eSJaegeuk Kim f2fs_submit_merged_write(sbi, NODE); 1398d68f735bSJaegeuk Kim submitted = NULL; 1399d68f735bSJaegeuk Kim } 1400d68f735bSJaegeuk Kim if (submitted) 1401d68f735bSJaegeuk Kim *submitted = fio.submitted; 1402faa24895SJaegeuk Kim 1403faa24895SJaegeuk Kim return 0; 1404faa24895SJaegeuk Kim 1405faa24895SJaegeuk Kim redirty_out: 1406faa24895SJaegeuk Kim redirty_page_for_writepage(wbc, page); 1407faa24895SJaegeuk Kim return AOP_WRITEPAGE_ACTIVATE; 1408faa24895SJaegeuk Kim } 1409faa24895SJaegeuk Kim 1410faa24895SJaegeuk Kim static int f2fs_write_node_page(struct page *page, 1411faa24895SJaegeuk Kim struct writeback_control *wbc) 1412faa24895SJaegeuk Kim { 1413d68f735bSJaegeuk Kim return __write_node_page(page, false, NULL, wbc); 1414faa24895SJaegeuk Kim } 1415faa24895SJaegeuk Kim 141626de9b11SJaegeuk Kim int fsync_node_pages(struct f2fs_sb_info *sbi, struct inode *inode, 1417608514deSJaegeuk Kim struct writeback_control *wbc, bool atomic) 1418608514deSJaegeuk Kim { 1419608514deSJaegeuk Kim pgoff_t index, end; 1420942fd319SJaegeuk Kim pgoff_t last_idx = ULONG_MAX; 1421608514deSJaegeuk Kim struct pagevec pvec; 1422608514deSJaegeuk Kim int ret = 0; 1423608514deSJaegeuk Kim struct page *last_page = NULL; 1424608514deSJaegeuk Kim bool marked = false; 142526de9b11SJaegeuk Kim nid_t ino = inode->i_ino; 1426608514deSJaegeuk Kim 1427608514deSJaegeuk Kim if (atomic) { 1428608514deSJaegeuk Kim last_page = last_fsync_dnode(sbi, ino); 1429608514deSJaegeuk Kim if (IS_ERR_OR_NULL(last_page)) 1430608514deSJaegeuk Kim return PTR_ERR_OR_ZERO(last_page); 1431608514deSJaegeuk Kim } 1432608514deSJaegeuk Kim retry: 1433608514deSJaegeuk Kim pagevec_init(&pvec, 0); 1434608514deSJaegeuk Kim index = 0; 1435608514deSJaegeuk Kim end = ULONG_MAX; 1436608514deSJaegeuk Kim 1437608514deSJaegeuk Kim while (index <= end) { 1438608514deSJaegeuk Kim int i, nr_pages; 1439608514deSJaegeuk Kim nr_pages = pagevec_lookup_tag(&pvec, NODE_MAPPING(sbi), &index, 1440608514deSJaegeuk Kim PAGECACHE_TAG_DIRTY, 1441608514deSJaegeuk Kim min(end - index, (pgoff_t)PAGEVEC_SIZE-1) + 1); 1442608514deSJaegeuk Kim if (nr_pages == 0) 1443608514deSJaegeuk Kim break; 1444608514deSJaegeuk Kim 1445608514deSJaegeuk Kim for (i = 0; i < nr_pages; i++) { 1446608514deSJaegeuk Kim struct page *page = pvec.pages[i]; 1447d68f735bSJaegeuk Kim bool submitted = false; 1448608514deSJaegeuk Kim 1449608514deSJaegeuk Kim if (unlikely(f2fs_cp_error(sbi))) { 1450608514deSJaegeuk Kim f2fs_put_page(last_page, 0); 1451608514deSJaegeuk Kim pagevec_release(&pvec); 14529de69279SChao Yu ret = -EIO; 14539de69279SChao Yu goto out; 1454608514deSJaegeuk Kim } 1455608514deSJaegeuk Kim 1456608514deSJaegeuk Kim if (!IS_DNODE(page) || !is_cold_node(page)) 1457608514deSJaegeuk Kim continue; 1458608514deSJaegeuk Kim if (ino_of_node(page) != ino) 1459608514deSJaegeuk Kim continue; 1460608514deSJaegeuk Kim 1461608514deSJaegeuk Kim lock_page(page); 1462608514deSJaegeuk Kim 1463608514deSJaegeuk Kim if (unlikely(page->mapping != NODE_MAPPING(sbi))) { 1464608514deSJaegeuk Kim continue_unlock: 1465608514deSJaegeuk Kim unlock_page(page); 1466608514deSJaegeuk Kim continue; 1467608514deSJaegeuk Kim } 1468608514deSJaegeuk Kim if (ino_of_node(page) != ino) 146952681375SJaegeuk Kim goto continue_unlock; 147052681375SJaegeuk Kim 1471608514deSJaegeuk Kim if (!PageDirty(page) && page != last_page) { 1472608514deSJaegeuk Kim /* someone wrote it for us */ 1473608514deSJaegeuk Kim goto continue_unlock; 1474608514deSJaegeuk Kim } 1475608514deSJaegeuk Kim 1476608514deSJaegeuk Kim f2fs_wait_on_page_writeback(page, NODE, true); 1477608514deSJaegeuk Kim BUG_ON(PageWriteback(page)); 1478608514deSJaegeuk Kim 1479d29fd172SJaegeuk Kim set_fsync_mark(page, 0); 1480d29fd172SJaegeuk Kim set_dentry_mark(page, 0); 1481d29fd172SJaegeuk Kim 1482608514deSJaegeuk Kim if (!atomic || page == last_page) { 148352681375SJaegeuk Kim set_fsync_mark(page, 1); 148426de9b11SJaegeuk Kim if (IS_INODE(page)) { 148526de9b11SJaegeuk Kim if (is_inode_flag_set(inode, 148626de9b11SJaegeuk Kim FI_DIRTY_INODE)) 148726de9b11SJaegeuk Kim update_inode(inode, page); 148852681375SJaegeuk Kim set_dentry_mark(page, 148952681375SJaegeuk Kim need_dentry_mark(sbi, ino)); 149026de9b11SJaegeuk Kim } 1491608514deSJaegeuk Kim /* may be written by other thread */ 1492608514deSJaegeuk Kim if (!PageDirty(page)) 1493608514deSJaegeuk Kim set_page_dirty(page); 1494608514deSJaegeuk Kim } 1495608514deSJaegeuk Kim 1496608514deSJaegeuk Kim if (!clear_page_dirty_for_io(page)) 1497608514deSJaegeuk Kim goto continue_unlock; 149852681375SJaegeuk Kim 1499e7c75ab0SJaegeuk Kim ret = __write_node_page(page, atomic && 1500d68f735bSJaegeuk Kim page == last_page, 1501d68f735bSJaegeuk Kim &submitted, wbc); 1502c267ec15SJaegeuk Kim if (ret) { 150352681375SJaegeuk Kim unlock_page(page); 1504608514deSJaegeuk Kim f2fs_put_page(last_page, 0); 1505608514deSJaegeuk Kim break; 1506d68f735bSJaegeuk Kim } else if (submitted) { 1507942fd319SJaegeuk Kim last_idx = page->index; 1508608514deSJaegeuk Kim } 15093f5f4959SChao Yu 1510608514deSJaegeuk Kim if (page == last_page) { 1511608514deSJaegeuk Kim f2fs_put_page(page, 0); 1512608514deSJaegeuk Kim marked = true; 151352681375SJaegeuk Kim break; 151452681375SJaegeuk Kim } 1515c267ec15SJaegeuk Kim } 151652681375SJaegeuk Kim pagevec_release(&pvec); 151752681375SJaegeuk Kim cond_resched(); 151852681375SJaegeuk Kim 1519608514deSJaegeuk Kim if (ret || marked) 152052681375SJaegeuk Kim break; 152152681375SJaegeuk Kim } 1522608514deSJaegeuk Kim if (!ret && atomic && !marked) { 1523608514deSJaegeuk Kim f2fs_msg(sbi->sb, KERN_DEBUG, 1524608514deSJaegeuk Kim "Retry to write fsync mark: ino=%u, idx=%lx", 1525608514deSJaegeuk Kim ino, last_page->index); 1526608514deSJaegeuk Kim lock_page(last_page); 1527d40a43afSYunlei He f2fs_wait_on_page_writeback(last_page, NODE, true); 1528608514deSJaegeuk Kim set_page_dirty(last_page); 1529608514deSJaegeuk Kim unlock_page(last_page); 1530608514deSJaegeuk Kim goto retry; 1531608514deSJaegeuk Kim } 15329de69279SChao Yu out: 1533942fd319SJaegeuk Kim if (last_idx != ULONG_MAX) 1534b9109b0eSJaegeuk Kim f2fs_submit_merged_write_cond(sbi, NULL, ino, last_idx, NODE); 1535c267ec15SJaegeuk Kim return ret ? -EIO: 0; 153652681375SJaegeuk Kim } 153752681375SJaegeuk Kim 153852681375SJaegeuk Kim int sync_node_pages(struct f2fs_sb_info *sbi, struct writeback_control *wbc) 153952681375SJaegeuk Kim { 154052681375SJaegeuk Kim pgoff_t index, end; 154152681375SJaegeuk Kim struct pagevec pvec; 154252681375SJaegeuk Kim int step = 0; 154312bb0a8fSJaegeuk Kim int nwritten = 0; 15443f5f4959SChao Yu int ret = 0; 1545e05df3b1SJaegeuk Kim 1546e05df3b1SJaegeuk Kim pagevec_init(&pvec, 0); 1547e05df3b1SJaegeuk Kim 1548e05df3b1SJaegeuk Kim next_step: 1549e05df3b1SJaegeuk Kim index = 0; 155080dd9c0eSChao Yu end = ULONG_MAX; 1551e05df3b1SJaegeuk Kim 1552e05df3b1SJaegeuk Kim while (index <= end) { 1553e05df3b1SJaegeuk Kim int i, nr_pages; 15544ef51a8fSJaegeuk Kim nr_pages = pagevec_lookup_tag(&pvec, NODE_MAPPING(sbi), &index, 1555e05df3b1SJaegeuk Kim PAGECACHE_TAG_DIRTY, 1556e05df3b1SJaegeuk Kim min(end - index, (pgoff_t)PAGEVEC_SIZE-1) + 1); 1557e05df3b1SJaegeuk Kim if (nr_pages == 0) 1558e05df3b1SJaegeuk Kim break; 1559e05df3b1SJaegeuk Kim 1560e05df3b1SJaegeuk Kim for (i = 0; i < nr_pages; i++) { 1561e05df3b1SJaegeuk Kim struct page *page = pvec.pages[i]; 1562d68f735bSJaegeuk Kim bool submitted = false; 1563e05df3b1SJaegeuk Kim 15646d5a1495SChao Yu if (unlikely(f2fs_cp_error(sbi))) { 15656d5a1495SChao Yu pagevec_release(&pvec); 15663f5f4959SChao Yu ret = -EIO; 15673f5f4959SChao Yu goto out; 15686d5a1495SChao Yu } 15696d5a1495SChao Yu 1570e05df3b1SJaegeuk Kim /* 1571e05df3b1SJaegeuk Kim * flushing sequence with step: 1572e05df3b1SJaegeuk Kim * 0. indirect nodes 1573e05df3b1SJaegeuk Kim * 1. dentry dnodes 1574e05df3b1SJaegeuk Kim * 2. file dnodes 1575e05df3b1SJaegeuk Kim */ 1576e05df3b1SJaegeuk Kim if (step == 0 && IS_DNODE(page)) 1577e05df3b1SJaegeuk Kim continue; 1578e05df3b1SJaegeuk Kim if (step == 1 && (!IS_DNODE(page) || 1579e05df3b1SJaegeuk Kim is_cold_node(page))) 1580e05df3b1SJaegeuk Kim continue; 1581e05df3b1SJaegeuk Kim if (step == 2 && (!IS_DNODE(page) || 1582e05df3b1SJaegeuk Kim !is_cold_node(page))) 1583e05df3b1SJaegeuk Kim continue; 15849a4cbc9eSChao Yu lock_node: 158552681375SJaegeuk Kim if (!trylock_page(page)) 1586e05df3b1SJaegeuk Kim continue; 1587e05df3b1SJaegeuk Kim 15884ef51a8fSJaegeuk Kim if (unlikely(page->mapping != NODE_MAPPING(sbi))) { 1589e05df3b1SJaegeuk Kim continue_unlock: 1590e05df3b1SJaegeuk Kim unlock_page(page); 1591e05df3b1SJaegeuk Kim continue; 1592e05df3b1SJaegeuk Kim } 1593e05df3b1SJaegeuk Kim 1594e05df3b1SJaegeuk Kim if (!PageDirty(page)) { 1595e05df3b1SJaegeuk Kim /* someone wrote it for us */ 1596e05df3b1SJaegeuk Kim goto continue_unlock; 1597e05df3b1SJaegeuk Kim } 1598e05df3b1SJaegeuk Kim 15992049d4fcSJaegeuk Kim /* flush inline_data */ 160052681375SJaegeuk Kim if (is_inline_node(page)) { 16012049d4fcSJaegeuk Kim clear_inline_node(page); 16022049d4fcSJaegeuk Kim unlock_page(page); 16032049d4fcSJaegeuk Kim flush_inline_data(sbi, ino_of_node(page)); 16049a4cbc9eSChao Yu goto lock_node; 16052049d4fcSJaegeuk Kim } 16062049d4fcSJaegeuk Kim 1607fa3d2bdfSJaegeuk Kim f2fs_wait_on_page_writeback(page, NODE, true); 1608fa3d2bdfSJaegeuk Kim 1609fa3d2bdfSJaegeuk Kim BUG_ON(PageWriteback(page)); 1610e05df3b1SJaegeuk Kim if (!clear_page_dirty_for_io(page)) 1611e05df3b1SJaegeuk Kim goto continue_unlock; 1612e05df3b1SJaegeuk Kim 1613e05df3b1SJaegeuk Kim set_fsync_mark(page, 0); 1614e05df3b1SJaegeuk Kim set_dentry_mark(page, 0); 161552746519SJaegeuk Kim 1616d68f735bSJaegeuk Kim ret = __write_node_page(page, false, &submitted, wbc); 1617d68f735bSJaegeuk Kim if (ret) 161852746519SJaegeuk Kim unlock_page(page); 1619d68f735bSJaegeuk Kim else if (submitted) 16203f5f4959SChao Yu nwritten++; 1621e05df3b1SJaegeuk Kim 1622e05df3b1SJaegeuk Kim if (--wbc->nr_to_write == 0) 1623e05df3b1SJaegeuk Kim break; 1624e05df3b1SJaegeuk Kim } 1625e05df3b1SJaegeuk Kim pagevec_release(&pvec); 1626e05df3b1SJaegeuk Kim cond_resched(); 1627e05df3b1SJaegeuk Kim 1628e05df3b1SJaegeuk Kim if (wbc->nr_to_write == 0) { 1629e05df3b1SJaegeuk Kim step = 2; 1630e05df3b1SJaegeuk Kim break; 1631e05df3b1SJaegeuk Kim } 1632e05df3b1SJaegeuk Kim } 1633e05df3b1SJaegeuk Kim 1634e05df3b1SJaegeuk Kim if (step < 2) { 1635e05df3b1SJaegeuk Kim step++; 1636e05df3b1SJaegeuk Kim goto next_step; 1637e05df3b1SJaegeuk Kim } 16383f5f4959SChao Yu out: 16393f5f4959SChao Yu if (nwritten) 1640b9109b0eSJaegeuk Kim f2fs_submit_merged_write(sbi, NODE); 16413f5f4959SChao Yu return ret; 1642e05df3b1SJaegeuk Kim } 1643e05df3b1SJaegeuk Kim 1644cfe58f9dSJaegeuk Kim int wait_on_node_pages_writeback(struct f2fs_sb_info *sbi, nid_t ino) 1645cfe58f9dSJaegeuk Kim { 164680dd9c0eSChao Yu pgoff_t index = 0, end = ULONG_MAX; 1647cfe58f9dSJaegeuk Kim struct pagevec pvec; 1648280db3c8SMiklos Szeredi int ret2, ret = 0; 1649cfe58f9dSJaegeuk Kim 1650cfe58f9dSJaegeuk Kim pagevec_init(&pvec, 0); 16514ef51a8fSJaegeuk Kim 16524ef51a8fSJaegeuk Kim while (index <= end) { 16534ef51a8fSJaegeuk Kim int i, nr_pages; 16544ef51a8fSJaegeuk Kim nr_pages = pagevec_lookup_tag(&pvec, NODE_MAPPING(sbi), &index, 1655cfe58f9dSJaegeuk Kim PAGECACHE_TAG_WRITEBACK, 16564ef51a8fSJaegeuk Kim min(end - index, (pgoff_t)PAGEVEC_SIZE-1) + 1); 16574ef51a8fSJaegeuk Kim if (nr_pages == 0) 16584ef51a8fSJaegeuk Kim break; 1659cfe58f9dSJaegeuk Kim 1660cfe58f9dSJaegeuk Kim for (i = 0; i < nr_pages; i++) { 1661cfe58f9dSJaegeuk Kim struct page *page = pvec.pages[i]; 1662cfe58f9dSJaegeuk Kim 1663cfe58f9dSJaegeuk Kim /* until radix tree lookup accepts end_index */ 1664cfb271d4SChao Yu if (unlikely(page->index > end)) 1665cfe58f9dSJaegeuk Kim continue; 1666cfe58f9dSJaegeuk Kim 16674bf08ff6SChao Yu if (ino && ino_of_node(page) == ino) { 1668fec1d657SJaegeuk Kim f2fs_wait_on_page_writeback(page, NODE, true); 1669cfe58f9dSJaegeuk Kim if (TestClearPageError(page)) 1670cfe58f9dSJaegeuk Kim ret = -EIO; 1671cfe58f9dSJaegeuk Kim } 16724bf08ff6SChao Yu } 1673cfe58f9dSJaegeuk Kim pagevec_release(&pvec); 1674cfe58f9dSJaegeuk Kim cond_resched(); 1675cfe58f9dSJaegeuk Kim } 1676cfe58f9dSJaegeuk Kim 1677280db3c8SMiklos Szeredi ret2 = filemap_check_errors(NODE_MAPPING(sbi)); 1678cfe58f9dSJaegeuk Kim if (!ret) 1679cfe58f9dSJaegeuk Kim ret = ret2; 1680cfe58f9dSJaegeuk Kim return ret; 1681cfe58f9dSJaegeuk Kim } 1682cfe58f9dSJaegeuk Kim 1683e05df3b1SJaegeuk Kim static int f2fs_write_node_pages(struct address_space *mapping, 1684e05df3b1SJaegeuk Kim struct writeback_control *wbc) 1685e05df3b1SJaegeuk Kim { 16864081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_M_SB(mapping); 16879dfa1bafSJaegeuk Kim struct blk_plug plug; 168850c8cdb3SJaegeuk Kim long diff; 1689e05df3b1SJaegeuk Kim 16904660f9c0SJaegeuk Kim /* balancing f2fs's metadata in background */ 16914660f9c0SJaegeuk Kim f2fs_balance_fs_bg(sbi); 1692e05df3b1SJaegeuk Kim 1693a7fdffbdSJaegeuk Kim /* collect a number of dirty node pages and write together */ 169487d6f890SJaegeuk Kim if (get_pages(sbi, F2FS_DIRTY_NODES) < nr_pages_to_skip(sbi, NODE)) 1695d3baf95dSJaegeuk Kim goto skip_write; 1696a7fdffbdSJaegeuk Kim 1697d31c7c3fSYunlei He trace_f2fs_writepages(mapping->host, wbc, NODE); 1698d31c7c3fSYunlei He 169950c8cdb3SJaegeuk Kim diff = nr_pages_to_write(sbi, NODE, wbc); 1700fb5566daSJaegeuk Kim wbc->sync_mode = WB_SYNC_NONE; 17019dfa1bafSJaegeuk Kim blk_start_plug(&plug); 170252681375SJaegeuk Kim sync_node_pages(sbi, wbc); 17039dfa1bafSJaegeuk Kim blk_finish_plug(&plug); 170450c8cdb3SJaegeuk Kim wbc->nr_to_write = max((long)0, wbc->nr_to_write - diff); 1705e05df3b1SJaegeuk Kim return 0; 1706d3baf95dSJaegeuk Kim 1707d3baf95dSJaegeuk Kim skip_write: 1708d3baf95dSJaegeuk Kim wbc->pages_skipped += get_pages(sbi, F2FS_DIRTY_NODES); 1709d31c7c3fSYunlei He trace_f2fs_writepages(mapping->host, wbc, NODE); 1710d3baf95dSJaegeuk Kim return 0; 1711e05df3b1SJaegeuk Kim } 1712e05df3b1SJaegeuk Kim 1713e05df3b1SJaegeuk Kim static int f2fs_set_node_page_dirty(struct page *page) 1714e05df3b1SJaegeuk Kim { 171526c6b887SJaegeuk Kim trace_f2fs_set_page_dirty(page, NODE); 171626c6b887SJaegeuk Kim 1717237c0790SJaegeuk Kim if (!PageUptodate(page)) 1718e05df3b1SJaegeuk Kim SetPageUptodate(page); 1719e05df3b1SJaegeuk Kim if (!PageDirty(page)) { 1720fe76b796SJaegeuk Kim f2fs_set_page_dirty_nobuffers(page); 17214081363fSJaegeuk Kim inc_page_count(F2FS_P_SB(page), F2FS_DIRTY_NODES); 1722e05df3b1SJaegeuk Kim SetPagePrivate(page); 17239e4ded3fSJaegeuk Kim f2fs_trace_pid(page); 1724e05df3b1SJaegeuk Kim return 1; 1725e05df3b1SJaegeuk Kim } 1726e05df3b1SJaegeuk Kim return 0; 1727e05df3b1SJaegeuk Kim } 1728e05df3b1SJaegeuk Kim 17290a8165d7SJaegeuk Kim /* 1730e05df3b1SJaegeuk Kim * Structure of the f2fs node operations 1731e05df3b1SJaegeuk Kim */ 1732e05df3b1SJaegeuk Kim const struct address_space_operations f2fs_node_aops = { 1733e05df3b1SJaegeuk Kim .writepage = f2fs_write_node_page, 1734e05df3b1SJaegeuk Kim .writepages = f2fs_write_node_pages, 1735e05df3b1SJaegeuk Kim .set_page_dirty = f2fs_set_node_page_dirty, 1736487261f3SChao Yu .invalidatepage = f2fs_invalidate_page, 1737487261f3SChao Yu .releasepage = f2fs_release_page, 17385b7a487cSWeichao Guo #ifdef CONFIG_MIGRATION 17395b7a487cSWeichao Guo .migratepage = f2fs_migrate_page, 17405b7a487cSWeichao Guo #endif 1741e05df3b1SJaegeuk Kim }; 1742e05df3b1SJaegeuk Kim 17438a7ed66aSJaegeuk Kim static struct free_nid *__lookup_free_nid_list(struct f2fs_nm_info *nm_i, 17448a7ed66aSJaegeuk Kim nid_t n) 1745e05df3b1SJaegeuk Kim { 17468a7ed66aSJaegeuk Kim return radix_tree_lookup(&nm_i->free_nid_root, n); 17473aa770a9SNamjae Jeon } 1748e05df3b1SJaegeuk Kim 1749eb0aa4b8SJaegeuk Kim static int __insert_nid_to_list(struct f2fs_sb_info *sbi, 1750eb0aa4b8SJaegeuk Kim struct free_nid *i, enum nid_list list, bool new) 1751e05df3b1SJaegeuk Kim { 1752b8559dc2SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 1753b8559dc2SChao Yu 1754eb0aa4b8SJaegeuk Kim if (new) { 1755eb0aa4b8SJaegeuk Kim int err = radix_tree_insert(&nm_i->free_nid_root, i->nid, i); 1756eb0aa4b8SJaegeuk Kim if (err) 1757eb0aa4b8SJaegeuk Kim return err; 1758eb0aa4b8SJaegeuk Kim } 1759eb0aa4b8SJaegeuk Kim 1760b8559dc2SChao Yu f2fs_bug_on(sbi, list == FREE_NID_LIST ? i->state != NID_NEW : 1761b8559dc2SChao Yu i->state != NID_ALLOC); 1762b8559dc2SChao Yu nm_i->nid_cnt[list]++; 1763b8559dc2SChao Yu list_add_tail(&i->list, &nm_i->nid_list[list]); 1764eb0aa4b8SJaegeuk Kim return 0; 1765b8559dc2SChao Yu } 1766b8559dc2SChao Yu 1767b8559dc2SChao Yu static void __remove_nid_from_list(struct f2fs_sb_info *sbi, 1768eb0aa4b8SJaegeuk Kim struct free_nid *i, enum nid_list list, bool reuse) 1769b8559dc2SChao Yu { 1770b8559dc2SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 1771b8559dc2SChao Yu 1772b8559dc2SChao Yu f2fs_bug_on(sbi, list == FREE_NID_LIST ? i->state != NID_NEW : 1773b8559dc2SChao Yu i->state != NID_ALLOC); 1774b8559dc2SChao Yu nm_i->nid_cnt[list]--; 1775e05df3b1SJaegeuk Kim list_del(&i->list); 1776eb0aa4b8SJaegeuk Kim if (!reuse) 17778a7ed66aSJaegeuk Kim radix_tree_delete(&nm_i->free_nid_root, i->nid); 1778e05df3b1SJaegeuk Kim } 1779e05df3b1SJaegeuk Kim 17804ac91242SChao Yu /* return if the nid is recognized as free */ 17814ac91242SChao Yu static bool add_free_nid(struct f2fs_sb_info *sbi, nid_t nid, bool build) 1782e05df3b1SJaegeuk Kim { 17836fb03f3aSJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 178430a61ddfSChao Yu struct free_nid *i, *e; 178559bbd474SJaegeuk Kim struct nat_entry *ne; 178630a61ddfSChao Yu int err = -EINVAL; 178730a61ddfSChao Yu bool ret = false; 17889198acebSJaegeuk Kim 17899198acebSJaegeuk Kim /* 0 nid should not be used */ 1790cfb271d4SChao Yu if (unlikely(nid == 0)) 17914ac91242SChao Yu return false; 179259bbd474SJaegeuk Kim 17937bd59381SGu Zheng i = f2fs_kmem_cache_alloc(free_nid_slab, GFP_NOFS); 1794e05df3b1SJaegeuk Kim i->nid = nid; 1795e05df3b1SJaegeuk Kim i->state = NID_NEW; 1796e05df3b1SJaegeuk Kim 179730a61ddfSChao Yu if (radix_tree_preload(GFP_NOFS)) 179830a61ddfSChao Yu goto err; 1799769ec6e5SJaegeuk Kim 1800b8559dc2SChao Yu spin_lock(&nm_i->nid_list_lock); 180130a61ddfSChao Yu 180230a61ddfSChao Yu if (build) { 180330a61ddfSChao Yu /* 180430a61ddfSChao Yu * Thread A Thread B 180530a61ddfSChao Yu * - f2fs_create 180630a61ddfSChao Yu * - f2fs_new_inode 180730a61ddfSChao Yu * - alloc_nid 180830a61ddfSChao Yu * - __insert_nid_to_list(ALLOC_NID_LIST) 180930a61ddfSChao Yu * - f2fs_balance_fs_bg 181030a61ddfSChao Yu * - build_free_nids 181130a61ddfSChao Yu * - __build_free_nids 181230a61ddfSChao Yu * - scan_nat_page 181330a61ddfSChao Yu * - add_free_nid 181430a61ddfSChao Yu * - __lookup_nat_cache 181530a61ddfSChao Yu * - f2fs_add_link 181630a61ddfSChao Yu * - init_inode_metadata 181730a61ddfSChao Yu * - new_inode_page 181830a61ddfSChao Yu * - new_node_page 181930a61ddfSChao Yu * - set_node_addr 182030a61ddfSChao Yu * - alloc_nid_done 182130a61ddfSChao Yu * - __remove_nid_from_list(ALLOC_NID_LIST) 182230a61ddfSChao Yu * - __insert_nid_to_list(FREE_NID_LIST) 182330a61ddfSChao Yu */ 182430a61ddfSChao Yu ne = __lookup_nat_cache(nm_i, nid); 182530a61ddfSChao Yu if (ne && (!get_nat_flag(ne, IS_CHECKPOINTED) || 182630a61ddfSChao Yu nat_get_blkaddr(ne) != NULL_ADDR)) 182730a61ddfSChao Yu goto err_out; 182830a61ddfSChao Yu 182930a61ddfSChao Yu e = __lookup_free_nid_list(nm_i, nid); 183030a61ddfSChao Yu if (e) { 183130a61ddfSChao Yu if (e->state == NID_NEW) 183230a61ddfSChao Yu ret = true; 183330a61ddfSChao Yu goto err_out; 183430a61ddfSChao Yu } 183530a61ddfSChao Yu } 183630a61ddfSChao Yu ret = true; 1837eb0aa4b8SJaegeuk Kim err = __insert_nid_to_list(sbi, i, FREE_NID_LIST, true); 183830a61ddfSChao Yu err_out: 1839b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 1840769ec6e5SJaegeuk Kim radix_tree_preload_end(); 184130a61ddfSChao Yu err: 184230a61ddfSChao Yu if (err) 1843e05df3b1SJaegeuk Kim kmem_cache_free(free_nid_slab, i); 184430a61ddfSChao Yu return ret; 1845e05df3b1SJaegeuk Kim } 1846e05df3b1SJaegeuk Kim 1847b8559dc2SChao Yu static void remove_free_nid(struct f2fs_sb_info *sbi, nid_t nid) 1848e05df3b1SJaegeuk Kim { 1849b8559dc2SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 1850e05df3b1SJaegeuk Kim struct free_nid *i; 1851cf0ee0f0SChao Yu bool need_free = false; 1852cf0ee0f0SChao Yu 1853b8559dc2SChao Yu spin_lock(&nm_i->nid_list_lock); 18548a7ed66aSJaegeuk Kim i = __lookup_free_nid_list(nm_i, nid); 1855e05df3b1SJaegeuk Kim if (i && i->state == NID_NEW) { 1856eb0aa4b8SJaegeuk Kim __remove_nid_from_list(sbi, i, FREE_NID_LIST, false); 1857cf0ee0f0SChao Yu need_free = true; 1858e05df3b1SJaegeuk Kim } 1859b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 1860cf0ee0f0SChao Yu 1861cf0ee0f0SChao Yu if (need_free) 1862cf0ee0f0SChao Yu kmem_cache_free(free_nid_slab, i); 1863e05df3b1SJaegeuk Kim } 1864e05df3b1SJaegeuk Kim 18659f7e4a2cSJaegeuk Kim static void update_free_nid_bitmap(struct f2fs_sb_info *sbi, nid_t nid, 1866346fe752SChao Yu bool set, bool build) 18674ac91242SChao Yu { 18684ac91242SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 18694ac91242SChao Yu unsigned int nat_ofs = NAT_BLOCK_OFFSET(nid); 18704ac91242SChao Yu unsigned int nid_ofs = nid - START_NID(nid); 18714ac91242SChao Yu 18724ac91242SChao Yu if (!test_bit_le(nat_ofs, nm_i->nat_block_bitmap)) 18734ac91242SChao Yu return; 18744ac91242SChao Yu 18754ac91242SChao Yu if (set) 187623380b85SJaegeuk Kim __set_bit_le(nid_ofs, nm_i->free_nid_bitmap[nat_ofs]); 18774ac91242SChao Yu else 187823380b85SJaegeuk Kim __clear_bit_le(nid_ofs, nm_i->free_nid_bitmap[nat_ofs]); 1879586d1492SChao Yu 1880586d1492SChao Yu if (set) 1881586d1492SChao Yu nm_i->free_nid_count[nat_ofs]++; 1882586d1492SChao Yu else if (!build) 1883586d1492SChao Yu nm_i->free_nid_count[nat_ofs]--; 18844ac91242SChao Yu } 18854ac91242SChao Yu 18866fb03f3aSJaegeuk Kim static void scan_nat_page(struct f2fs_sb_info *sbi, 1887e05df3b1SJaegeuk Kim struct page *nat_page, nid_t start_nid) 1888e05df3b1SJaegeuk Kim { 18896fb03f3aSJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 1890e05df3b1SJaegeuk Kim struct f2fs_nat_block *nat_blk = page_address(nat_page); 1891e05df3b1SJaegeuk Kim block_t blk_addr; 18924ac91242SChao Yu unsigned int nat_ofs = NAT_BLOCK_OFFSET(start_nid); 1893e05df3b1SJaegeuk Kim int i; 1894e05df3b1SJaegeuk Kim 1895586d1492SChao Yu if (test_bit_le(nat_ofs, nm_i->nat_block_bitmap)) 1896586d1492SChao Yu return; 1897586d1492SChao Yu 189823380b85SJaegeuk Kim __set_bit_le(nat_ofs, nm_i->nat_block_bitmap); 18994ac91242SChao Yu 1900e05df3b1SJaegeuk Kim i = start_nid % NAT_ENTRY_PER_BLOCK; 1901e05df3b1SJaegeuk Kim 1902e05df3b1SJaegeuk Kim for (; i < NAT_ENTRY_PER_BLOCK; i++, start_nid++) { 19034ac91242SChao Yu bool freed = false; 190423d38844SHaicheng Li 1905cfb271d4SChao Yu if (unlikely(start_nid >= nm_i->max_nid)) 190604431c44SJaegeuk Kim break; 190723d38844SHaicheng Li 1908e05df3b1SJaegeuk Kim blk_addr = le32_to_cpu(nat_blk->entries[i].block_addr); 19099850cf4aSJaegeuk Kim f2fs_bug_on(sbi, blk_addr == NEW_ADDR); 19103a2ad567SChao Yu if (blk_addr == NULL_ADDR) 19114ac91242SChao Yu freed = add_free_nid(sbi, start_nid, true); 1912346fe752SChao Yu spin_lock(&NM_I(sbi)->nid_list_lock); 1913346fe752SChao Yu update_free_nid_bitmap(sbi, start_nid, freed, true); 1914346fe752SChao Yu spin_unlock(&NM_I(sbi)->nid_list_lock); 1915e05df3b1SJaegeuk Kim } 1916e05df3b1SJaegeuk Kim } 1917e05df3b1SJaegeuk Kim 19184ac91242SChao Yu static void scan_free_nid_bits(struct f2fs_sb_info *sbi) 19194ac91242SChao Yu { 19204ac91242SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 19214ac91242SChao Yu struct curseg_info *curseg = CURSEG_I(sbi, CURSEG_HOT_DATA); 19224ac91242SChao Yu struct f2fs_journal *journal = curseg->journal; 19234ac91242SChao Yu unsigned int i, idx; 19244ac91242SChao Yu 19254ac91242SChao Yu down_read(&nm_i->nat_tree_lock); 19264ac91242SChao Yu 19274ac91242SChao Yu for (i = 0; i < nm_i->nat_blocks; i++) { 19284ac91242SChao Yu if (!test_bit_le(i, nm_i->nat_block_bitmap)) 19294ac91242SChao Yu continue; 1930586d1492SChao Yu if (!nm_i->free_nid_count[i]) 1931586d1492SChao Yu continue; 19324ac91242SChao Yu for (idx = 0; idx < NAT_ENTRY_PER_BLOCK; idx++) { 19334ac91242SChao Yu nid_t nid; 19344ac91242SChao Yu 19354ac91242SChao Yu if (!test_bit_le(idx, nm_i->free_nid_bitmap[i])) 19364ac91242SChao Yu continue; 19374ac91242SChao Yu 19384ac91242SChao Yu nid = i * NAT_ENTRY_PER_BLOCK + idx; 19394ac91242SChao Yu add_free_nid(sbi, nid, true); 19404ac91242SChao Yu 1941f0cdbfe6SKinglong Mee if (nm_i->nid_cnt[FREE_NID_LIST] >= MAX_FREE_NIDS) 19424ac91242SChao Yu goto out; 19434ac91242SChao Yu } 19444ac91242SChao Yu } 19454ac91242SChao Yu out: 19464ac91242SChao Yu down_read(&curseg->journal_rwsem); 19474ac91242SChao Yu for (i = 0; i < nats_in_cursum(journal); i++) { 19484ac91242SChao Yu block_t addr; 19494ac91242SChao Yu nid_t nid; 19504ac91242SChao Yu 19514ac91242SChao Yu addr = le32_to_cpu(nat_in_journal(journal, i).block_addr); 19524ac91242SChao Yu nid = le32_to_cpu(nid_in_journal(journal, i)); 19534ac91242SChao Yu if (addr == NULL_ADDR) 19544ac91242SChao Yu add_free_nid(sbi, nid, true); 19554ac91242SChao Yu else 19564ac91242SChao Yu remove_free_nid(sbi, nid); 19574ac91242SChao Yu } 19584ac91242SChao Yu up_read(&curseg->journal_rwsem); 19594ac91242SChao Yu up_read(&nm_i->nat_tree_lock); 19604ac91242SChao Yu } 19614ac91242SChao Yu 196222ad0b6aSJaegeuk Kim static void __build_free_nids(struct f2fs_sb_info *sbi, bool sync, bool mount) 1963e05df3b1SJaegeuk Kim { 1964e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 1965e05df3b1SJaegeuk Kim struct curseg_info *curseg = CURSEG_I(sbi, CURSEG_HOT_DATA); 1966b7ad7512SChao Yu struct f2fs_journal *journal = curseg->journal; 19678760952dSHaicheng Li int i = 0; 196855008d84SJaegeuk Kim nid_t nid = nm_i->next_scan_nid; 1969e05df3b1SJaegeuk Kim 1970e9cdd307SYunlei He if (unlikely(nid >= nm_i->max_nid)) 1971e9cdd307SYunlei He nid = 0; 1972e9cdd307SYunlei He 197355008d84SJaegeuk Kim /* Enough entries */ 1974b8559dc2SChao Yu if (nm_i->nid_cnt[FREE_NID_LIST] >= NAT_ENTRY_PER_BLOCK) 197555008d84SJaegeuk Kim return; 1976e05df3b1SJaegeuk Kim 19773a2ad567SChao Yu if (!sync && !available_free_memory(sbi, FREE_NIDS)) 1978e05df3b1SJaegeuk Kim return; 1979e05df3b1SJaegeuk Kim 19804ac91242SChao Yu if (!mount) { 19814ac91242SChao Yu /* try to find free nids in free_nid_bitmap */ 19824ac91242SChao Yu scan_free_nid_bits(sbi); 19834ac91242SChao Yu 19844ac91242SChao Yu if (nm_i->nid_cnt[FREE_NID_LIST]) 198522ad0b6aSJaegeuk Kim return; 198622ad0b6aSJaegeuk Kim } 198722ad0b6aSJaegeuk Kim 198855008d84SJaegeuk Kim /* readahead nat pages to be scanned */ 198926879fb1SChao Yu ra_meta_pages(sbi, NAT_BLOCK_OFFSET(nid), FREE_NID_PAGES, 199026879fb1SChao Yu META_NAT, true); 1991e05df3b1SJaegeuk Kim 1992b873b798SJaegeuk Kim down_read(&nm_i->nat_tree_lock); 1993a5131193SJaegeuk Kim 1994e05df3b1SJaegeuk Kim while (1) { 1995e05df3b1SJaegeuk Kim struct page *page = get_current_nat_page(sbi, nid); 1996e05df3b1SJaegeuk Kim 19976fb03f3aSJaegeuk Kim scan_nat_page(sbi, page, nid); 1998e05df3b1SJaegeuk Kim f2fs_put_page(page, 1); 1999e05df3b1SJaegeuk Kim 2000e05df3b1SJaegeuk Kim nid += (NAT_ENTRY_PER_BLOCK - (nid % NAT_ENTRY_PER_BLOCK)); 2001cfb271d4SChao Yu if (unlikely(nid >= nm_i->max_nid)) 2002e05df3b1SJaegeuk Kim nid = 0; 200355008d84SJaegeuk Kim 2004a6d494b6SChao Yu if (++i >= FREE_NID_PAGES) 2005e05df3b1SJaegeuk Kim break; 2006e05df3b1SJaegeuk Kim } 2007e05df3b1SJaegeuk Kim 200855008d84SJaegeuk Kim /* go to the next free nat pages to find free nids abundantly */ 200955008d84SJaegeuk Kim nm_i->next_scan_nid = nid; 2010e05df3b1SJaegeuk Kim 2011e05df3b1SJaegeuk Kim /* find free nids from current sum_pages */ 2012b7ad7512SChao Yu down_read(&curseg->journal_rwsem); 2013dfc08a12SChao Yu for (i = 0; i < nats_in_cursum(journal); i++) { 2014dfc08a12SChao Yu block_t addr; 2015dfc08a12SChao Yu 2016dfc08a12SChao Yu addr = le32_to_cpu(nat_in_journal(journal, i).block_addr); 2017dfc08a12SChao Yu nid = le32_to_cpu(nid_in_journal(journal, i)); 2018e05df3b1SJaegeuk Kim if (addr == NULL_ADDR) 20196fb03f3aSJaegeuk Kim add_free_nid(sbi, nid, true); 2020e05df3b1SJaegeuk Kim else 2021b8559dc2SChao Yu remove_free_nid(sbi, nid); 2022e05df3b1SJaegeuk Kim } 2023b7ad7512SChao Yu up_read(&curseg->journal_rwsem); 2024b873b798SJaegeuk Kim up_read(&nm_i->nat_tree_lock); 20252db2388fSChao Yu 20262db2388fSChao Yu ra_meta_pages(sbi, NAT_BLOCK_OFFSET(nm_i->next_scan_nid), 2027ea1a29a0SChao Yu nm_i->ra_nid_pages, META_NAT, false); 2028e05df3b1SJaegeuk Kim } 2029e05df3b1SJaegeuk Kim 203022ad0b6aSJaegeuk Kim void build_free_nids(struct f2fs_sb_info *sbi, bool sync, bool mount) 20312411cf5bSChao Yu { 20322411cf5bSChao Yu mutex_lock(&NM_I(sbi)->build_lock); 203322ad0b6aSJaegeuk Kim __build_free_nids(sbi, sync, mount); 20342411cf5bSChao Yu mutex_unlock(&NM_I(sbi)->build_lock); 20352411cf5bSChao Yu } 20362411cf5bSChao Yu 2037e05df3b1SJaegeuk Kim /* 2038e05df3b1SJaegeuk Kim * If this function returns success, caller can obtain a new nid 2039e05df3b1SJaegeuk Kim * from second parameter of this function. 2040e05df3b1SJaegeuk Kim * The returned nid could be used ino as well as nid when inode is created. 2041e05df3b1SJaegeuk Kim */ 2042e05df3b1SJaegeuk Kim bool alloc_nid(struct f2fs_sb_info *sbi, nid_t *nid) 2043e05df3b1SJaegeuk Kim { 2044e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 2045e05df3b1SJaegeuk Kim struct free_nid *i = NULL; 2046e05df3b1SJaegeuk Kim retry: 2047cb78942bSJaegeuk Kim #ifdef CONFIG_F2FS_FAULT_INJECTION 204855523519SChao Yu if (time_to_inject(sbi, FAULT_ALLOC_NID)) { 204955523519SChao Yu f2fs_show_injection_info(FAULT_ALLOC_NID); 2050cb78942bSJaegeuk Kim return false; 205155523519SChao Yu } 2052cb78942bSJaegeuk Kim #endif 2053b8559dc2SChao Yu spin_lock(&nm_i->nid_list_lock); 2054e05df3b1SJaegeuk Kim 205504d47e67SChao Yu if (unlikely(nm_i->available_nids == 0)) { 205604d47e67SChao Yu spin_unlock(&nm_i->nid_list_lock); 205704d47e67SChao Yu return false; 205804d47e67SChao Yu } 2059e05df3b1SJaegeuk Kim 206055008d84SJaegeuk Kim /* We should not use stale free nids created by build_free_nids */ 2061b8559dc2SChao Yu if (nm_i->nid_cnt[FREE_NID_LIST] && !on_build_free_nids(nm_i)) { 2062b8559dc2SChao Yu f2fs_bug_on(sbi, list_empty(&nm_i->nid_list[FREE_NID_LIST])); 2063b8559dc2SChao Yu i = list_first_entry(&nm_i->nid_list[FREE_NID_LIST], 2064b8559dc2SChao Yu struct free_nid, list); 2065e05df3b1SJaegeuk Kim *nid = i->nid; 2066b8559dc2SChao Yu 2067eb0aa4b8SJaegeuk Kim __remove_nid_from_list(sbi, i, FREE_NID_LIST, true); 2068e05df3b1SJaegeuk Kim i->state = NID_ALLOC; 2069eb0aa4b8SJaegeuk Kim __insert_nid_to_list(sbi, i, ALLOC_NID_LIST, false); 207004d47e67SChao Yu nm_i->available_nids--; 20714ac91242SChao Yu 2072346fe752SChao Yu update_free_nid_bitmap(sbi, *nid, false, false); 20734ac91242SChao Yu 2074b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 2075e05df3b1SJaegeuk Kim return true; 2076e05df3b1SJaegeuk Kim } 2077b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 207855008d84SJaegeuk Kim 207955008d84SJaegeuk Kim /* Let's scan nat pages and its caches to get free nids */ 208022ad0b6aSJaegeuk Kim build_free_nids(sbi, true, false); 208155008d84SJaegeuk Kim goto retry; 208255008d84SJaegeuk Kim } 2083e05df3b1SJaegeuk Kim 20840a8165d7SJaegeuk Kim /* 2085e05df3b1SJaegeuk Kim * alloc_nid() should be called prior to this function. 2086e05df3b1SJaegeuk Kim */ 2087e05df3b1SJaegeuk Kim void alloc_nid_done(struct f2fs_sb_info *sbi, nid_t nid) 2088e05df3b1SJaegeuk Kim { 2089e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 2090e05df3b1SJaegeuk Kim struct free_nid *i; 2091e05df3b1SJaegeuk Kim 2092b8559dc2SChao Yu spin_lock(&nm_i->nid_list_lock); 20938a7ed66aSJaegeuk Kim i = __lookup_free_nid_list(nm_i, nid); 2094b8559dc2SChao Yu f2fs_bug_on(sbi, !i); 2095eb0aa4b8SJaegeuk Kim __remove_nid_from_list(sbi, i, ALLOC_NID_LIST, false); 2096b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 2097cf0ee0f0SChao Yu 2098cf0ee0f0SChao Yu kmem_cache_free(free_nid_slab, i); 2099e05df3b1SJaegeuk Kim } 2100e05df3b1SJaegeuk Kim 21010a8165d7SJaegeuk Kim /* 2102e05df3b1SJaegeuk Kim * alloc_nid() should be called prior to this function. 2103e05df3b1SJaegeuk Kim */ 2104e05df3b1SJaegeuk Kim void alloc_nid_failed(struct f2fs_sb_info *sbi, nid_t nid) 2105e05df3b1SJaegeuk Kim { 210649952fa1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 210749952fa1SJaegeuk Kim struct free_nid *i; 2108cf0ee0f0SChao Yu bool need_free = false; 210949952fa1SJaegeuk Kim 211065985d93SJaegeuk Kim if (!nid) 211165985d93SJaegeuk Kim return; 211265985d93SJaegeuk Kim 2113b8559dc2SChao Yu spin_lock(&nm_i->nid_list_lock); 21148a7ed66aSJaegeuk Kim i = __lookup_free_nid_list(nm_i, nid); 2115b8559dc2SChao Yu f2fs_bug_on(sbi, !i); 2116b8559dc2SChao Yu 21176fb03f3aSJaegeuk Kim if (!available_free_memory(sbi, FREE_NIDS)) { 2118eb0aa4b8SJaegeuk Kim __remove_nid_from_list(sbi, i, ALLOC_NID_LIST, false); 2119cf0ee0f0SChao Yu need_free = true; 212095630cbaSHaicheng Li } else { 2121eb0aa4b8SJaegeuk Kim __remove_nid_from_list(sbi, i, ALLOC_NID_LIST, true); 212249952fa1SJaegeuk Kim i->state = NID_NEW; 2123eb0aa4b8SJaegeuk Kim __insert_nid_to_list(sbi, i, FREE_NID_LIST, false); 212495630cbaSHaicheng Li } 212504d47e67SChao Yu 212604d47e67SChao Yu nm_i->available_nids++; 212704d47e67SChao Yu 2128346fe752SChao Yu update_free_nid_bitmap(sbi, nid, true, false); 21294ac91242SChao Yu 2130b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 2131cf0ee0f0SChao Yu 2132cf0ee0f0SChao Yu if (need_free) 2133cf0ee0f0SChao Yu kmem_cache_free(free_nid_slab, i); 2134e05df3b1SJaegeuk Kim } 2135e05df3b1SJaegeuk Kim 213631696580SChao Yu int try_to_free_nids(struct f2fs_sb_info *sbi, int nr_shrink) 213731696580SChao Yu { 213831696580SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 213931696580SChao Yu struct free_nid *i, *next; 214031696580SChao Yu int nr = nr_shrink; 214131696580SChao Yu 2142b8559dc2SChao Yu if (nm_i->nid_cnt[FREE_NID_LIST] <= MAX_FREE_NIDS) 2143ad4edb83SJaegeuk Kim return 0; 2144ad4edb83SJaegeuk Kim 214531696580SChao Yu if (!mutex_trylock(&nm_i->build_lock)) 214631696580SChao Yu return 0; 214731696580SChao Yu 2148b8559dc2SChao Yu spin_lock(&nm_i->nid_list_lock); 2149b8559dc2SChao Yu list_for_each_entry_safe(i, next, &nm_i->nid_list[FREE_NID_LIST], 2150b8559dc2SChao Yu list) { 2151b8559dc2SChao Yu if (nr_shrink <= 0 || 2152b8559dc2SChao Yu nm_i->nid_cnt[FREE_NID_LIST] <= MAX_FREE_NIDS) 215331696580SChao Yu break; 2154b8559dc2SChao Yu 2155eb0aa4b8SJaegeuk Kim __remove_nid_from_list(sbi, i, FREE_NID_LIST, false); 215631696580SChao Yu kmem_cache_free(free_nid_slab, i); 215731696580SChao Yu nr_shrink--; 215831696580SChao Yu } 2159b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 216031696580SChao Yu mutex_unlock(&nm_i->build_lock); 216131696580SChao Yu 216231696580SChao Yu return nr - nr_shrink; 216331696580SChao Yu } 216431696580SChao Yu 216570cfed88SChao Yu void recover_inline_xattr(struct inode *inode, struct page *page) 216628cdce04SChao Yu { 216728cdce04SChao Yu void *src_addr, *dst_addr; 216828cdce04SChao Yu size_t inline_size; 216928cdce04SChao Yu struct page *ipage; 217028cdce04SChao Yu struct f2fs_inode *ri; 217128cdce04SChao Yu 21724081363fSJaegeuk Kim ipage = get_node_page(F2FS_I_SB(inode), inode->i_ino); 21739850cf4aSJaegeuk Kim f2fs_bug_on(F2FS_I_SB(inode), IS_ERR(ipage)); 217428cdce04SChao Yu 2175e3b4d43fSJaegeuk Kim ri = F2FS_INODE(page); 2176e3b4d43fSJaegeuk Kim if (!(ri->i_inline & F2FS_INLINE_XATTR)) { 217791942321SJaegeuk Kim clear_inode_flag(inode, FI_INLINE_XATTR); 2178e3b4d43fSJaegeuk Kim goto update_inode; 2179e3b4d43fSJaegeuk Kim } 2180e3b4d43fSJaegeuk Kim 218128cdce04SChao Yu dst_addr = inline_xattr_addr(ipage); 218228cdce04SChao Yu src_addr = inline_xattr_addr(page); 218328cdce04SChao Yu inline_size = inline_xattr_size(inode); 218428cdce04SChao Yu 2185fec1d657SJaegeuk Kim f2fs_wait_on_page_writeback(ipage, NODE, true); 218628cdce04SChao Yu memcpy(dst_addr, src_addr, inline_size); 2187e3b4d43fSJaegeuk Kim update_inode: 218828cdce04SChao Yu update_inode(inode, ipage); 218928cdce04SChao Yu f2fs_put_page(ipage, 1); 219028cdce04SChao Yu } 219128cdce04SChao Yu 2192d260081cSChao Yu int recover_xattr_data(struct inode *inode, struct page *page, block_t blkaddr) 2193abb2366cSJaegeuk Kim { 21944081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_I_SB(inode); 2195abb2366cSJaegeuk Kim nid_t prev_xnid = F2FS_I(inode)->i_xattr_nid; 2196abb2366cSJaegeuk Kim nid_t new_xnid = nid_of_node(page); 2197abb2366cSJaegeuk Kim struct node_info ni; 2198d260081cSChao Yu struct page *xpage; 2199abb2366cSJaegeuk Kim 2200abb2366cSJaegeuk Kim if (!prev_xnid) 2201abb2366cSJaegeuk Kim goto recover_xnid; 2202abb2366cSJaegeuk Kim 2203d260081cSChao Yu /* 1: invalidate the previous xattr nid */ 2204abb2366cSJaegeuk Kim get_node_info(sbi, prev_xnid, &ni); 22059850cf4aSJaegeuk Kim f2fs_bug_on(sbi, ni.blk_addr == NULL_ADDR); 2206abb2366cSJaegeuk Kim invalidate_blocks(sbi, ni.blk_addr); 2207abb2366cSJaegeuk Kim dec_valid_node_count(sbi, inode); 2208479f40c4SJaegeuk Kim set_node_addr(sbi, &ni, NULL_ADDR, false); 2209abb2366cSJaegeuk Kim 2210abb2366cSJaegeuk Kim recover_xnid: 2211d260081cSChao Yu /* 2: update xattr nid in inode */ 2212d260081cSChao Yu remove_free_nid(sbi, new_xnid); 2213d260081cSChao Yu f2fs_i_xnid_write(inode, new_xnid); 2214abb2366cSJaegeuk Kim if (unlikely(!inc_valid_node_count(sbi, inode))) 22159850cf4aSJaegeuk Kim f2fs_bug_on(sbi, 1); 2216d260081cSChao Yu update_inode_page(inode); 2217abb2366cSJaegeuk Kim 2218d260081cSChao Yu /* 3: update and set xattr node page dirty */ 2219d260081cSChao Yu xpage = grab_cache_page(NODE_MAPPING(sbi), new_xnid); 2220d260081cSChao Yu if (!xpage) 2221d260081cSChao Yu return -ENOMEM; 2222d260081cSChao Yu 2223d260081cSChao Yu memcpy(F2FS_NODE(xpage), F2FS_NODE(page), PAGE_SIZE); 2224d260081cSChao Yu 2225abb2366cSJaegeuk Kim get_node_info(sbi, new_xnid, &ni); 2226abb2366cSJaegeuk Kim ni.ino = inode->i_ino; 2227479f40c4SJaegeuk Kim set_node_addr(sbi, &ni, NEW_ADDR, false); 2228d260081cSChao Yu set_page_dirty(xpage); 2229d260081cSChao Yu f2fs_put_page(xpage, 1); 2230abb2366cSJaegeuk Kim 2231d260081cSChao Yu return 0; 2232abb2366cSJaegeuk Kim } 2233abb2366cSJaegeuk Kim 2234e05df3b1SJaegeuk Kim int recover_inode_page(struct f2fs_sb_info *sbi, struct page *page) 2235e05df3b1SJaegeuk Kim { 223658bfaf44SJaegeuk Kim struct f2fs_inode *src, *dst; 2237e05df3b1SJaegeuk Kim nid_t ino = ino_of_node(page); 2238e05df3b1SJaegeuk Kim struct node_info old_ni, new_ni; 2239e05df3b1SJaegeuk Kim struct page *ipage; 2240e05df3b1SJaegeuk Kim 2241e8271fa3SJaegeuk Kim get_node_info(sbi, ino, &old_ni); 2242e8271fa3SJaegeuk Kim 2243e8271fa3SJaegeuk Kim if (unlikely(old_ni.blk_addr != NULL_ADDR)) 2244e8271fa3SJaegeuk Kim return -EINVAL; 2245e8ea9b3dSJaegeuk Kim retry: 2246300e129cSJaegeuk Kim ipage = f2fs_grab_cache_page(NODE_MAPPING(sbi), ino, false); 2247e8ea9b3dSJaegeuk Kim if (!ipage) { 2248e8ea9b3dSJaegeuk Kim congestion_wait(BLK_RW_ASYNC, HZ/50); 2249e8ea9b3dSJaegeuk Kim goto retry; 2250e8ea9b3dSJaegeuk Kim } 2251e05df3b1SJaegeuk Kim 2252e05df3b1SJaegeuk Kim /* Should not use this inode from free nid list */ 2253b8559dc2SChao Yu remove_free_nid(sbi, ino); 2254e05df3b1SJaegeuk Kim 2255237c0790SJaegeuk Kim if (!PageUptodate(ipage)) 2256e05df3b1SJaegeuk Kim SetPageUptodate(ipage); 2257e05df3b1SJaegeuk Kim fill_node_footer(ipage, ino, ino, 0, true); 2258e05df3b1SJaegeuk Kim 225958bfaf44SJaegeuk Kim src = F2FS_INODE(page); 226058bfaf44SJaegeuk Kim dst = F2FS_INODE(ipage); 2261e05df3b1SJaegeuk Kim 226258bfaf44SJaegeuk Kim memcpy(dst, src, (unsigned long)&src->i_ext - (unsigned long)src); 226358bfaf44SJaegeuk Kim dst->i_size = 0; 226458bfaf44SJaegeuk Kim dst->i_blocks = cpu_to_le64(1); 226558bfaf44SJaegeuk Kim dst->i_links = cpu_to_le32(1); 226658bfaf44SJaegeuk Kim dst->i_xattr_nid = 0; 2267617deb8cSJaegeuk Kim dst->i_inline = src->i_inline & F2FS_INLINE_XATTR; 2268e05df3b1SJaegeuk Kim 2269e05df3b1SJaegeuk Kim new_ni = old_ni; 2270e05df3b1SJaegeuk Kim new_ni.ino = ino; 2271e05df3b1SJaegeuk Kim 2272cfb271d4SChao Yu if (unlikely(!inc_valid_node_count(sbi, NULL))) 227365e5cd0aSJaegeuk Kim WARN_ON(1); 2274479f40c4SJaegeuk Kim set_node_addr(sbi, &new_ni, NEW_ADDR, false); 2275e05df3b1SJaegeuk Kim inc_valid_inode_count(sbi); 2276617deb8cSJaegeuk Kim set_page_dirty(ipage); 2277e05df3b1SJaegeuk Kim f2fs_put_page(ipage, 1); 2278e05df3b1SJaegeuk Kim return 0; 2279e05df3b1SJaegeuk Kim } 2280e05df3b1SJaegeuk Kim 2281e05df3b1SJaegeuk Kim int restore_node_summary(struct f2fs_sb_info *sbi, 2282e05df3b1SJaegeuk Kim unsigned int segno, struct f2fs_summary_block *sum) 2283e05df3b1SJaegeuk Kim { 2284e05df3b1SJaegeuk Kim struct f2fs_node *rn; 2285e05df3b1SJaegeuk Kim struct f2fs_summary *sum_entry; 2286e05df3b1SJaegeuk Kim block_t addr; 22879ecf4b80SChao Yu int i, idx, last_offset, nrpages; 2288e05df3b1SJaegeuk Kim 2289e05df3b1SJaegeuk Kim /* scan the node segment */ 2290e05df3b1SJaegeuk Kim last_offset = sbi->blocks_per_seg; 2291e05df3b1SJaegeuk Kim addr = START_BLOCK(sbi, segno); 2292e05df3b1SJaegeuk Kim sum_entry = &sum->entries[0]; 2293e05df3b1SJaegeuk Kim 22949ecf4b80SChao Yu for (i = 0; i < last_offset; i += nrpages, addr += nrpages) { 2295664ba972SJaegeuk Kim nrpages = min(last_offset - i, BIO_MAX_PAGES); 2296393ff91fSJaegeuk Kim 22979af0ff1cSChao Yu /* readahead node pages */ 229826879fb1SChao Yu ra_meta_pages(sbi, addr, nrpages, META_POR, true); 22999af0ff1cSChao Yu 23009ecf4b80SChao Yu for (idx = addr; idx < addr + nrpages; idx++) { 23012b947003SChao Yu struct page *page = get_tmp_page(sbi, idx); 2302393ff91fSJaegeuk Kim 23039ecf4b80SChao Yu rn = F2FS_NODE(page); 2304393ff91fSJaegeuk Kim sum_entry->nid = rn->footer.nid; 2305393ff91fSJaegeuk Kim sum_entry->version = 0; 2306393ff91fSJaegeuk Kim sum_entry->ofs_in_node = 0; 23079af0ff1cSChao Yu sum_entry++; 23089ecf4b80SChao Yu f2fs_put_page(page, 1); 23099af0ff1cSChao Yu } 2310bac4eef6SChao Yu 23119ecf4b80SChao Yu invalidate_mapping_pages(META_MAPPING(sbi), addr, 2312bac4eef6SChao Yu addr + nrpages); 23139af0ff1cSChao Yu } 23149ecf4b80SChao Yu return 0; 2315e05df3b1SJaegeuk Kim } 2316e05df3b1SJaegeuk Kim 2317aec71382SChao Yu static void remove_nats_in_journal(struct f2fs_sb_info *sbi) 2318e05df3b1SJaegeuk Kim { 2319e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 2320e05df3b1SJaegeuk Kim struct curseg_info *curseg = CURSEG_I(sbi, CURSEG_HOT_DATA); 2321b7ad7512SChao Yu struct f2fs_journal *journal = curseg->journal; 2322e05df3b1SJaegeuk Kim int i; 2323e05df3b1SJaegeuk Kim 2324b7ad7512SChao Yu down_write(&curseg->journal_rwsem); 2325dfc08a12SChao Yu for (i = 0; i < nats_in_cursum(journal); i++) { 2326e05df3b1SJaegeuk Kim struct nat_entry *ne; 2327e05df3b1SJaegeuk Kim struct f2fs_nat_entry raw_ne; 2328dfc08a12SChao Yu nid_t nid = le32_to_cpu(nid_in_journal(journal, i)); 2329e05df3b1SJaegeuk Kim 2330dfc08a12SChao Yu raw_ne = nat_in_journal(journal, i); 23319be32d72SJaegeuk Kim 2332e05df3b1SJaegeuk Kim ne = __lookup_nat_cache(nm_i, nid); 2333e05df3b1SJaegeuk Kim if (!ne) { 23345c9e4184SChao Yu ne = grab_nat_entry(nm_i, nid, true); 233594dac22eSChao Yu node_info_from_raw_nat(&ne->ni, &raw_ne); 23369be32d72SJaegeuk Kim } 233704d47e67SChao Yu 233804d47e67SChao Yu /* 233904d47e67SChao Yu * if a free nat in journal has not been used after last 234004d47e67SChao Yu * checkpoint, we should remove it from available nids, 234104d47e67SChao Yu * since later we will add it again. 234204d47e67SChao Yu */ 234304d47e67SChao Yu if (!get_nat_flag(ne, IS_DIRTY) && 234404d47e67SChao Yu le32_to_cpu(raw_ne.block_addr) == NULL_ADDR) { 234504d47e67SChao Yu spin_lock(&nm_i->nid_list_lock); 234604d47e67SChao Yu nm_i->available_nids--; 234704d47e67SChao Yu spin_unlock(&nm_i->nid_list_lock); 234804d47e67SChao Yu } 234904d47e67SChao Yu 2350e05df3b1SJaegeuk Kim __set_nat_cache_dirty(nm_i, ne); 2351e05df3b1SJaegeuk Kim } 2352dfc08a12SChao Yu update_nats_in_cursum(journal, -i); 2353b7ad7512SChao Yu up_write(&curseg->journal_rwsem); 2354e05df3b1SJaegeuk Kim } 2355e05df3b1SJaegeuk Kim 2356309cc2b6SJaegeuk Kim static void __adjust_nat_entry_set(struct nat_entry_set *nes, 2357309cc2b6SJaegeuk Kim struct list_head *head, int max) 2358e05df3b1SJaegeuk Kim { 2359309cc2b6SJaegeuk Kim struct nat_entry_set *cur; 2360e05df3b1SJaegeuk Kim 2361309cc2b6SJaegeuk Kim if (nes->entry_cnt >= max) 2362309cc2b6SJaegeuk Kim goto add_out; 2363e05df3b1SJaegeuk Kim 2364309cc2b6SJaegeuk Kim list_for_each_entry(cur, head, set_list) { 2365309cc2b6SJaegeuk Kim if (cur->entry_cnt >= nes->entry_cnt) { 2366309cc2b6SJaegeuk Kim list_add(&nes->set_list, cur->set_list.prev); 2367309cc2b6SJaegeuk Kim return; 2368309cc2b6SJaegeuk Kim } 2369309cc2b6SJaegeuk Kim } 2370309cc2b6SJaegeuk Kim add_out: 2371309cc2b6SJaegeuk Kim list_add_tail(&nes->set_list, head); 2372aec71382SChao Yu } 2373aec71382SChao Yu 23749f7e4a2cSJaegeuk Kim static void __update_nat_bits(struct f2fs_sb_info *sbi, nid_t start_nid, 237522ad0b6aSJaegeuk Kim struct page *page) 237622ad0b6aSJaegeuk Kim { 237722ad0b6aSJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 237822ad0b6aSJaegeuk Kim unsigned int nat_index = start_nid / NAT_ENTRY_PER_BLOCK; 237922ad0b6aSJaegeuk Kim struct f2fs_nat_block *nat_blk = page_address(page); 238022ad0b6aSJaegeuk Kim int valid = 0; 238122ad0b6aSJaegeuk Kim int i; 238222ad0b6aSJaegeuk Kim 238322ad0b6aSJaegeuk Kim if (!enabled_nat_bits(sbi, NULL)) 238422ad0b6aSJaegeuk Kim return; 238522ad0b6aSJaegeuk Kim 238622ad0b6aSJaegeuk Kim for (i = 0; i < NAT_ENTRY_PER_BLOCK; i++) { 238722ad0b6aSJaegeuk Kim if (start_nid == 0 && i == 0) 238822ad0b6aSJaegeuk Kim valid++; 238922ad0b6aSJaegeuk Kim if (nat_blk->entries[i].block_addr) 239022ad0b6aSJaegeuk Kim valid++; 239122ad0b6aSJaegeuk Kim } 239222ad0b6aSJaegeuk Kim if (valid == 0) { 239323380b85SJaegeuk Kim __set_bit_le(nat_index, nm_i->empty_nat_bits); 239423380b85SJaegeuk Kim __clear_bit_le(nat_index, nm_i->full_nat_bits); 239522ad0b6aSJaegeuk Kim return; 239622ad0b6aSJaegeuk Kim } 239722ad0b6aSJaegeuk Kim 239823380b85SJaegeuk Kim __clear_bit_le(nat_index, nm_i->empty_nat_bits); 239922ad0b6aSJaegeuk Kim if (valid == NAT_ENTRY_PER_BLOCK) 240023380b85SJaegeuk Kim __set_bit_le(nat_index, nm_i->full_nat_bits); 240122ad0b6aSJaegeuk Kim else 240223380b85SJaegeuk Kim __clear_bit_le(nat_index, nm_i->full_nat_bits); 240322ad0b6aSJaegeuk Kim } 240422ad0b6aSJaegeuk Kim 2405309cc2b6SJaegeuk Kim static void __flush_nat_entry_set(struct f2fs_sb_info *sbi, 240622ad0b6aSJaegeuk Kim struct nat_entry_set *set, struct cp_control *cpc) 2407309cc2b6SJaegeuk Kim { 2408309cc2b6SJaegeuk Kim struct curseg_info *curseg = CURSEG_I(sbi, CURSEG_HOT_DATA); 2409b7ad7512SChao Yu struct f2fs_journal *journal = curseg->journal; 2410309cc2b6SJaegeuk Kim nid_t start_nid = set->set * NAT_ENTRY_PER_BLOCK; 2411309cc2b6SJaegeuk Kim bool to_journal = true; 2412309cc2b6SJaegeuk Kim struct f2fs_nat_block *nat_blk; 2413309cc2b6SJaegeuk Kim struct nat_entry *ne, *cur; 2414309cc2b6SJaegeuk Kim struct page *page = NULL; 2415aec71382SChao Yu 2416aec71382SChao Yu /* 2417aec71382SChao Yu * there are two steps to flush nat entries: 2418aec71382SChao Yu * #1, flush nat entries to journal in current hot data summary block. 2419aec71382SChao Yu * #2, flush nat entries to nat page. 2420aec71382SChao Yu */ 242122ad0b6aSJaegeuk Kim if (enabled_nat_bits(sbi, cpc) || 242222ad0b6aSJaegeuk Kim !__has_cursum_space(journal, set->entry_cnt, NAT_JOURNAL)) 2423aec71382SChao Yu to_journal = false; 2424aec71382SChao Yu 2425aec71382SChao Yu if (to_journal) { 2426b7ad7512SChao Yu down_write(&curseg->journal_rwsem); 2427aec71382SChao Yu } else { 2428e05df3b1SJaegeuk Kim page = get_next_nat_page(sbi, start_nid); 2429e05df3b1SJaegeuk Kim nat_blk = page_address(page); 24309850cf4aSJaegeuk Kim f2fs_bug_on(sbi, !nat_blk); 2431e05df3b1SJaegeuk Kim } 2432e05df3b1SJaegeuk Kim 2433aec71382SChao Yu /* flush dirty nats in nat entry set */ 2434309cc2b6SJaegeuk Kim list_for_each_entry_safe(ne, cur, &set->entry_list, list) { 2435aec71382SChao Yu struct f2fs_nat_entry *raw_ne; 2436aec71382SChao Yu nid_t nid = nat_get_nid(ne); 2437aec71382SChao Yu int offset; 2438aec71382SChao Yu 2439febeca6dSChao Yu f2fs_bug_on(sbi, nat_get_blkaddr(ne) == NEW_ADDR); 2440309cc2b6SJaegeuk Kim 2441aec71382SChao Yu if (to_journal) { 2442dfc08a12SChao Yu offset = lookup_journal_in_cursum(journal, 2443aec71382SChao Yu NAT_JOURNAL, nid, 1); 24449850cf4aSJaegeuk Kim f2fs_bug_on(sbi, offset < 0); 2445dfc08a12SChao Yu raw_ne = &nat_in_journal(journal, offset); 2446dfc08a12SChao Yu nid_in_journal(journal, offset) = cpu_to_le32(nid); 2447aec71382SChao Yu } else { 2448aec71382SChao Yu raw_ne = &nat_blk->entries[nid - start_nid]; 2449aec71382SChao Yu } 2450aec71382SChao Yu raw_nat_from_node_info(raw_ne, &ne->ni); 245188bd02c9SJaegeuk Kim nat_reset_flag(ne); 24520b28b71eSKinglong Mee __clear_nat_cache_dirty(NM_I(sbi), set, ne); 245304d47e67SChao Yu if (nat_get_blkaddr(ne) == NULL_ADDR) { 2454309cc2b6SJaegeuk Kim add_free_nid(sbi, nid, false); 245504d47e67SChao Yu spin_lock(&NM_I(sbi)->nid_list_lock); 245604d47e67SChao Yu NM_I(sbi)->available_nids++; 2457346fe752SChao Yu update_free_nid_bitmap(sbi, nid, true, false); 24584ac91242SChao Yu spin_unlock(&NM_I(sbi)->nid_list_lock); 24594ac91242SChao Yu } else { 24604ac91242SChao Yu spin_lock(&NM_I(sbi)->nid_list_lock); 2461346fe752SChao Yu update_free_nid_bitmap(sbi, nid, false, false); 246204d47e67SChao Yu spin_unlock(&NM_I(sbi)->nid_list_lock); 246304d47e67SChao Yu } 2464e05df3b1SJaegeuk Kim } 2465aec71382SChao Yu 246622ad0b6aSJaegeuk Kim if (to_journal) { 2467b7ad7512SChao Yu up_write(&curseg->journal_rwsem); 246822ad0b6aSJaegeuk Kim } else { 246922ad0b6aSJaegeuk Kim __update_nat_bits(sbi, start_nid, page); 2470e05df3b1SJaegeuk Kim f2fs_put_page(page, 1); 247122ad0b6aSJaegeuk Kim } 2472aec71382SChao Yu 247359c9081bSYunlei He /* Allow dirty nats by node block allocation in write_begin */ 247459c9081bSYunlei He if (!set->entry_cnt) { 2475309cc2b6SJaegeuk Kim radix_tree_delete(&NM_I(sbi)->nat_set_root, set->set); 2476309cc2b6SJaegeuk Kim kmem_cache_free(nat_entry_set_slab, set); 2477309cc2b6SJaegeuk Kim } 247859c9081bSYunlei He } 2479aec71382SChao Yu 2480309cc2b6SJaegeuk Kim /* 2481309cc2b6SJaegeuk Kim * This function is called during the checkpointing process. 2482309cc2b6SJaegeuk Kim */ 248322ad0b6aSJaegeuk Kim void flush_nat_entries(struct f2fs_sb_info *sbi, struct cp_control *cpc) 2484309cc2b6SJaegeuk Kim { 2485309cc2b6SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 2486309cc2b6SJaegeuk Kim struct curseg_info *curseg = CURSEG_I(sbi, CURSEG_HOT_DATA); 2487b7ad7512SChao Yu struct f2fs_journal *journal = curseg->journal; 24887aed0d45SJaegeuk Kim struct nat_entry_set *setvec[SETVEC_SIZE]; 2489309cc2b6SJaegeuk Kim struct nat_entry_set *set, *tmp; 2490309cc2b6SJaegeuk Kim unsigned int found; 2491309cc2b6SJaegeuk Kim nid_t set_idx = 0; 2492309cc2b6SJaegeuk Kim LIST_HEAD(sets); 2493309cc2b6SJaegeuk Kim 249420d047c8SChangman Lee if (!nm_i->dirty_nat_cnt) 249520d047c8SChangman Lee return; 2496a5131193SJaegeuk Kim 2497b873b798SJaegeuk Kim down_write(&nm_i->nat_tree_lock); 2498a5131193SJaegeuk Kim 2499309cc2b6SJaegeuk Kim /* 2500309cc2b6SJaegeuk Kim * if there are no enough space in journal to store dirty nat 2501309cc2b6SJaegeuk Kim * entries, remove all entries from journal and merge them 2502309cc2b6SJaegeuk Kim * into nat entry set. 2503309cc2b6SJaegeuk Kim */ 2504900f7362SJaegeuk Kim if (enabled_nat_bits(sbi, cpc) || 250522ad0b6aSJaegeuk Kim !__has_cursum_space(journal, nm_i->dirty_nat_cnt, NAT_JOURNAL)) 2506309cc2b6SJaegeuk Kim remove_nats_in_journal(sbi); 2507309cc2b6SJaegeuk Kim 2508309cc2b6SJaegeuk Kim while ((found = __gang_lookup_nat_set(nm_i, 25097aed0d45SJaegeuk Kim set_idx, SETVEC_SIZE, setvec))) { 2510309cc2b6SJaegeuk Kim unsigned idx; 2511309cc2b6SJaegeuk Kim set_idx = setvec[found - 1]->set + 1; 2512309cc2b6SJaegeuk Kim for (idx = 0; idx < found; idx++) 2513309cc2b6SJaegeuk Kim __adjust_nat_entry_set(setvec[idx], &sets, 2514dfc08a12SChao Yu MAX_NAT_JENTRIES(journal)); 2515309cc2b6SJaegeuk Kim } 2516309cc2b6SJaegeuk Kim 2517309cc2b6SJaegeuk Kim /* flush dirty nats in nat entry set */ 2518309cc2b6SJaegeuk Kim list_for_each_entry_safe(set, tmp, &sets, set_list) 251922ad0b6aSJaegeuk Kim __flush_nat_entry_set(sbi, set, cpc); 2520309cc2b6SJaegeuk Kim 2521b873b798SJaegeuk Kim up_write(&nm_i->nat_tree_lock); 252259c9081bSYunlei He /* Allow dirty nats by node block allocation in write_begin */ 2523e05df3b1SJaegeuk Kim } 2524e05df3b1SJaegeuk Kim 252522ad0b6aSJaegeuk Kim static int __get_nat_bitmaps(struct f2fs_sb_info *sbi) 252622ad0b6aSJaegeuk Kim { 252722ad0b6aSJaegeuk Kim struct f2fs_checkpoint *ckpt = F2FS_CKPT(sbi); 252822ad0b6aSJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 252922ad0b6aSJaegeuk Kim unsigned int nat_bits_bytes = nm_i->nat_blocks / BITS_PER_BYTE; 253022ad0b6aSJaegeuk Kim unsigned int i; 253122ad0b6aSJaegeuk Kim __u64 cp_ver = cur_cp_version(ckpt); 253222ad0b6aSJaegeuk Kim block_t nat_bits_addr; 253322ad0b6aSJaegeuk Kim 253422ad0b6aSJaegeuk Kim if (!enabled_nat_bits(sbi, NULL)) 253522ad0b6aSJaegeuk Kim return 0; 253622ad0b6aSJaegeuk Kim 253722ad0b6aSJaegeuk Kim nm_i->nat_bits_blocks = F2FS_BYTES_TO_BLK((nat_bits_bytes << 1) + 8 + 253822ad0b6aSJaegeuk Kim F2FS_BLKSIZE - 1); 253922ad0b6aSJaegeuk Kim nm_i->nat_bits = kzalloc(nm_i->nat_bits_blocks << F2FS_BLKSIZE_BITS, 254022ad0b6aSJaegeuk Kim GFP_KERNEL); 254122ad0b6aSJaegeuk Kim if (!nm_i->nat_bits) 254222ad0b6aSJaegeuk Kim return -ENOMEM; 254322ad0b6aSJaegeuk Kim 254422ad0b6aSJaegeuk Kim nat_bits_addr = __start_cp_addr(sbi) + sbi->blocks_per_seg - 254522ad0b6aSJaegeuk Kim nm_i->nat_bits_blocks; 254622ad0b6aSJaegeuk Kim for (i = 0; i < nm_i->nat_bits_blocks; i++) { 254722ad0b6aSJaegeuk Kim struct page *page = get_meta_page(sbi, nat_bits_addr++); 254822ad0b6aSJaegeuk Kim 254922ad0b6aSJaegeuk Kim memcpy(nm_i->nat_bits + (i << F2FS_BLKSIZE_BITS), 255022ad0b6aSJaegeuk Kim page_address(page), F2FS_BLKSIZE); 255122ad0b6aSJaegeuk Kim f2fs_put_page(page, 1); 255222ad0b6aSJaegeuk Kim } 255322ad0b6aSJaegeuk Kim 2554ced2c7eaSKinglong Mee cp_ver |= (cur_cp_crc(ckpt) << 32); 255522ad0b6aSJaegeuk Kim if (cpu_to_le64(cp_ver) != *(__le64 *)nm_i->nat_bits) { 255622ad0b6aSJaegeuk Kim disable_nat_bits(sbi, true); 255722ad0b6aSJaegeuk Kim return 0; 255822ad0b6aSJaegeuk Kim } 255922ad0b6aSJaegeuk Kim 256022ad0b6aSJaegeuk Kim nm_i->full_nat_bits = nm_i->nat_bits + 8; 256122ad0b6aSJaegeuk Kim nm_i->empty_nat_bits = nm_i->full_nat_bits + nat_bits_bytes; 256222ad0b6aSJaegeuk Kim 256322ad0b6aSJaegeuk Kim f2fs_msg(sbi->sb, KERN_NOTICE, "Found nat_bits in checkpoint"); 256422ad0b6aSJaegeuk Kim return 0; 256522ad0b6aSJaegeuk Kim } 256622ad0b6aSJaegeuk Kim 2567bd80a4b9SHou Pengyang static inline void load_free_nid_bitmap(struct f2fs_sb_info *sbi) 25687041d5d2SChao Yu { 25697041d5d2SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 25707041d5d2SChao Yu unsigned int i = 0; 25717041d5d2SChao Yu nid_t nid, last_nid; 25727041d5d2SChao Yu 25737041d5d2SChao Yu if (!enabled_nat_bits(sbi, NULL)) 25747041d5d2SChao Yu return; 25757041d5d2SChao Yu 25767041d5d2SChao Yu for (i = 0; i < nm_i->nat_blocks; i++) { 25777041d5d2SChao Yu i = find_next_bit_le(nm_i->empty_nat_bits, nm_i->nat_blocks, i); 25787041d5d2SChao Yu if (i >= nm_i->nat_blocks) 25797041d5d2SChao Yu break; 25807041d5d2SChao Yu 25817041d5d2SChao Yu __set_bit_le(i, nm_i->nat_block_bitmap); 25827041d5d2SChao Yu 25837041d5d2SChao Yu nid = i * NAT_ENTRY_PER_BLOCK; 25847041d5d2SChao Yu last_nid = (i + 1) * NAT_ENTRY_PER_BLOCK; 25857041d5d2SChao Yu 2586346fe752SChao Yu spin_lock(&NM_I(sbi)->nid_list_lock); 25877041d5d2SChao Yu for (; nid < last_nid; nid++) 2588346fe752SChao Yu update_free_nid_bitmap(sbi, nid, true, true); 2589346fe752SChao Yu spin_unlock(&NM_I(sbi)->nid_list_lock); 25907041d5d2SChao Yu } 25917041d5d2SChao Yu 25927041d5d2SChao Yu for (i = 0; i < nm_i->nat_blocks; i++) { 25937041d5d2SChao Yu i = find_next_bit_le(nm_i->full_nat_bits, nm_i->nat_blocks, i); 25947041d5d2SChao Yu if (i >= nm_i->nat_blocks) 25957041d5d2SChao Yu break; 25967041d5d2SChao Yu 25977041d5d2SChao Yu __set_bit_le(i, nm_i->nat_block_bitmap); 25987041d5d2SChao Yu } 25997041d5d2SChao Yu } 26007041d5d2SChao Yu 2601e05df3b1SJaegeuk Kim static int init_node_manager(struct f2fs_sb_info *sbi) 2602e05df3b1SJaegeuk Kim { 2603e05df3b1SJaegeuk Kim struct f2fs_super_block *sb_raw = F2FS_RAW_SUPER(sbi); 2604e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 2605e05df3b1SJaegeuk Kim unsigned char *version_bitmap; 260622ad0b6aSJaegeuk Kim unsigned int nat_segs; 260722ad0b6aSJaegeuk Kim int err; 2608e05df3b1SJaegeuk Kim 2609e05df3b1SJaegeuk Kim nm_i->nat_blkaddr = le32_to_cpu(sb_raw->nat_blkaddr); 2610e05df3b1SJaegeuk Kim 2611e05df3b1SJaegeuk Kim /* segment_count_nat includes pair segment so divide to 2. */ 2612e05df3b1SJaegeuk Kim nat_segs = le32_to_cpu(sb_raw->segment_count_nat) >> 1; 261322ad0b6aSJaegeuk Kim nm_i->nat_blocks = nat_segs << le32_to_cpu(sb_raw->log_blocks_per_seg); 261422ad0b6aSJaegeuk Kim nm_i->max_nid = NAT_ENTRY_PER_BLOCK * nm_i->nat_blocks; 26157ee0eeabSJaegeuk Kim 2616b63da15eSJaegeuk Kim /* not used nids: 0, node, meta, (and root counted as valid node) */ 261704d47e67SChao Yu nm_i->available_nids = nm_i->max_nid - sbi->total_valid_node_count - 261804d47e67SChao Yu F2FS_RESERVED_NODE_NUM; 2619b8559dc2SChao Yu nm_i->nid_cnt[FREE_NID_LIST] = 0; 2620b8559dc2SChao Yu nm_i->nid_cnt[ALLOC_NID_LIST] = 0; 2621e05df3b1SJaegeuk Kim nm_i->nat_cnt = 0; 2622cdfc41c1SJaegeuk Kim nm_i->ram_thresh = DEF_RAM_THRESHOLD; 2623ea1a29a0SChao Yu nm_i->ra_nid_pages = DEF_RA_NID_PAGES; 26242304cb0cSChao Yu nm_i->dirty_nats_ratio = DEF_DIRTY_NAT_RATIO_THRESHOLD; 2625e05df3b1SJaegeuk Kim 26268a7ed66aSJaegeuk Kim INIT_RADIX_TREE(&nm_i->free_nid_root, GFP_ATOMIC); 2627b8559dc2SChao Yu INIT_LIST_HEAD(&nm_i->nid_list[FREE_NID_LIST]); 2628b8559dc2SChao Yu INIT_LIST_HEAD(&nm_i->nid_list[ALLOC_NID_LIST]); 2629769ec6e5SJaegeuk Kim INIT_RADIX_TREE(&nm_i->nat_root, GFP_NOIO); 2630769ec6e5SJaegeuk Kim INIT_RADIX_TREE(&nm_i->nat_set_root, GFP_NOIO); 2631e05df3b1SJaegeuk Kim INIT_LIST_HEAD(&nm_i->nat_entries); 2632e05df3b1SJaegeuk Kim 2633e05df3b1SJaegeuk Kim mutex_init(&nm_i->build_lock); 2634b8559dc2SChao Yu spin_lock_init(&nm_i->nid_list_lock); 2635b873b798SJaegeuk Kim init_rwsem(&nm_i->nat_tree_lock); 2636e05df3b1SJaegeuk Kim 2637e05df3b1SJaegeuk Kim nm_i->next_scan_nid = le32_to_cpu(sbi->ckpt->next_free_nid); 263879b5793bSAlexandru Gheorghiu nm_i->bitmap_size = __bitmap_size(sbi, NAT_BITMAP); 2639e05df3b1SJaegeuk Kim version_bitmap = __bitmap_ptr(sbi, NAT_BITMAP); 2640e05df3b1SJaegeuk Kim if (!version_bitmap) 2641e05df3b1SJaegeuk Kim return -EFAULT; 2642e05df3b1SJaegeuk Kim 264379b5793bSAlexandru Gheorghiu nm_i->nat_bitmap = kmemdup(version_bitmap, nm_i->bitmap_size, 264479b5793bSAlexandru Gheorghiu GFP_KERNEL); 264579b5793bSAlexandru Gheorghiu if (!nm_i->nat_bitmap) 264679b5793bSAlexandru Gheorghiu return -ENOMEM; 2647599a09b2SChao Yu 264822ad0b6aSJaegeuk Kim err = __get_nat_bitmaps(sbi); 264922ad0b6aSJaegeuk Kim if (err) 265022ad0b6aSJaegeuk Kim return err; 265122ad0b6aSJaegeuk Kim 2652599a09b2SChao Yu #ifdef CONFIG_F2FS_CHECK_FS 2653599a09b2SChao Yu nm_i->nat_bitmap_mir = kmemdup(version_bitmap, nm_i->bitmap_size, 2654599a09b2SChao Yu GFP_KERNEL); 2655599a09b2SChao Yu if (!nm_i->nat_bitmap_mir) 2656599a09b2SChao Yu return -ENOMEM; 2657599a09b2SChao Yu #endif 2658599a09b2SChao Yu 2659e05df3b1SJaegeuk Kim return 0; 2660e05df3b1SJaegeuk Kim } 2661e05df3b1SJaegeuk Kim 26629f7e4a2cSJaegeuk Kim static int init_free_nid_cache(struct f2fs_sb_info *sbi) 26634ac91242SChao Yu { 26644ac91242SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 26654ac91242SChao Yu 26664ac91242SChao Yu nm_i->free_nid_bitmap = f2fs_kvzalloc(nm_i->nat_blocks * 26674ac91242SChao Yu NAT_ENTRY_BITMAP_SIZE, GFP_KERNEL); 26684ac91242SChao Yu if (!nm_i->free_nid_bitmap) 26694ac91242SChao Yu return -ENOMEM; 26704ac91242SChao Yu 26714ac91242SChao Yu nm_i->nat_block_bitmap = f2fs_kvzalloc(nm_i->nat_blocks / 8, 26724ac91242SChao Yu GFP_KERNEL); 26734ac91242SChao Yu if (!nm_i->nat_block_bitmap) 26744ac91242SChao Yu return -ENOMEM; 2675586d1492SChao Yu 2676586d1492SChao Yu nm_i->free_nid_count = f2fs_kvzalloc(nm_i->nat_blocks * 2677586d1492SChao Yu sizeof(unsigned short), GFP_KERNEL); 2678586d1492SChao Yu if (!nm_i->free_nid_count) 2679586d1492SChao Yu return -ENOMEM; 26804ac91242SChao Yu return 0; 26814ac91242SChao Yu } 26824ac91242SChao Yu 2683e05df3b1SJaegeuk Kim int build_node_manager(struct f2fs_sb_info *sbi) 2684e05df3b1SJaegeuk Kim { 2685e05df3b1SJaegeuk Kim int err; 2686e05df3b1SJaegeuk Kim 2687e05df3b1SJaegeuk Kim sbi->nm_info = kzalloc(sizeof(struct f2fs_nm_info), GFP_KERNEL); 2688e05df3b1SJaegeuk Kim if (!sbi->nm_info) 2689e05df3b1SJaegeuk Kim return -ENOMEM; 2690e05df3b1SJaegeuk Kim 2691e05df3b1SJaegeuk Kim err = init_node_manager(sbi); 2692e05df3b1SJaegeuk Kim if (err) 2693e05df3b1SJaegeuk Kim return err; 2694e05df3b1SJaegeuk Kim 26954ac91242SChao Yu err = init_free_nid_cache(sbi); 26964ac91242SChao Yu if (err) 26974ac91242SChao Yu return err; 26984ac91242SChao Yu 26997041d5d2SChao Yu /* load free nid status from nat_bits table */ 27007041d5d2SChao Yu load_free_nid_bitmap(sbi); 27017041d5d2SChao Yu 270222ad0b6aSJaegeuk Kim build_free_nids(sbi, true, true); 2703e05df3b1SJaegeuk Kim return 0; 2704e05df3b1SJaegeuk Kim } 2705e05df3b1SJaegeuk Kim 2706e05df3b1SJaegeuk Kim void destroy_node_manager(struct f2fs_sb_info *sbi) 2707e05df3b1SJaegeuk Kim { 2708e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 2709e05df3b1SJaegeuk Kim struct free_nid *i, *next_i; 2710e05df3b1SJaegeuk Kim struct nat_entry *natvec[NATVEC_SIZE]; 27117aed0d45SJaegeuk Kim struct nat_entry_set *setvec[SETVEC_SIZE]; 2712e05df3b1SJaegeuk Kim nid_t nid = 0; 2713e05df3b1SJaegeuk Kim unsigned int found; 2714e05df3b1SJaegeuk Kim 2715e05df3b1SJaegeuk Kim if (!nm_i) 2716e05df3b1SJaegeuk Kim return; 2717e05df3b1SJaegeuk Kim 2718e05df3b1SJaegeuk Kim /* destroy free nid list */ 2719b8559dc2SChao Yu spin_lock(&nm_i->nid_list_lock); 2720b8559dc2SChao Yu list_for_each_entry_safe(i, next_i, &nm_i->nid_list[FREE_NID_LIST], 2721b8559dc2SChao Yu list) { 2722eb0aa4b8SJaegeuk Kim __remove_nid_from_list(sbi, i, FREE_NID_LIST, false); 2723b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 2724cf0ee0f0SChao Yu kmem_cache_free(free_nid_slab, i); 2725b8559dc2SChao Yu spin_lock(&nm_i->nid_list_lock); 2726e05df3b1SJaegeuk Kim } 2727b8559dc2SChao Yu f2fs_bug_on(sbi, nm_i->nid_cnt[FREE_NID_LIST]); 2728b8559dc2SChao Yu f2fs_bug_on(sbi, nm_i->nid_cnt[ALLOC_NID_LIST]); 2729b8559dc2SChao Yu f2fs_bug_on(sbi, !list_empty(&nm_i->nid_list[ALLOC_NID_LIST])); 2730b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 2731e05df3b1SJaegeuk Kim 2732e05df3b1SJaegeuk Kim /* destroy nat cache */ 2733b873b798SJaegeuk Kim down_write(&nm_i->nat_tree_lock); 2734e05df3b1SJaegeuk Kim while ((found = __gang_lookup_nat_cache(nm_i, 2735e05df3b1SJaegeuk Kim nid, NATVEC_SIZE, natvec))) { 2736e05df3b1SJaegeuk Kim unsigned idx; 27377aed0d45SJaegeuk Kim 2738b6ce391eSGu Zheng nid = nat_get_nid(natvec[found - 1]) + 1; 2739b6ce391eSGu Zheng for (idx = 0; idx < found; idx++) 2740b6ce391eSGu Zheng __del_from_nat_cache(nm_i, natvec[idx]); 2741e05df3b1SJaegeuk Kim } 27429850cf4aSJaegeuk Kim f2fs_bug_on(sbi, nm_i->nat_cnt); 27437aed0d45SJaegeuk Kim 27447aed0d45SJaegeuk Kim /* destroy nat set cache */ 27457aed0d45SJaegeuk Kim nid = 0; 27467aed0d45SJaegeuk Kim while ((found = __gang_lookup_nat_set(nm_i, 27477aed0d45SJaegeuk Kim nid, SETVEC_SIZE, setvec))) { 27487aed0d45SJaegeuk Kim unsigned idx; 27497aed0d45SJaegeuk Kim 27507aed0d45SJaegeuk Kim nid = setvec[found - 1]->set + 1; 27517aed0d45SJaegeuk Kim for (idx = 0; idx < found; idx++) { 27527aed0d45SJaegeuk Kim /* entry_cnt is not zero, when cp_error was occurred */ 27537aed0d45SJaegeuk Kim f2fs_bug_on(sbi, !list_empty(&setvec[idx]->entry_list)); 27547aed0d45SJaegeuk Kim radix_tree_delete(&nm_i->nat_set_root, setvec[idx]->set); 27557aed0d45SJaegeuk Kim kmem_cache_free(nat_entry_set_slab, setvec[idx]); 27567aed0d45SJaegeuk Kim } 27577aed0d45SJaegeuk Kim } 2758b873b798SJaegeuk Kim up_write(&nm_i->nat_tree_lock); 2759e05df3b1SJaegeuk Kim 27604ac91242SChao Yu kvfree(nm_i->nat_block_bitmap); 27614ac91242SChao Yu kvfree(nm_i->free_nid_bitmap); 2762586d1492SChao Yu kvfree(nm_i->free_nid_count); 27634ac91242SChao Yu 2764e05df3b1SJaegeuk Kim kfree(nm_i->nat_bitmap); 276522ad0b6aSJaegeuk Kim kfree(nm_i->nat_bits); 2766599a09b2SChao Yu #ifdef CONFIG_F2FS_CHECK_FS 2767599a09b2SChao Yu kfree(nm_i->nat_bitmap_mir); 2768599a09b2SChao Yu #endif 2769e05df3b1SJaegeuk Kim sbi->nm_info = NULL; 2770e05df3b1SJaegeuk Kim kfree(nm_i); 2771e05df3b1SJaegeuk Kim } 2772e05df3b1SJaegeuk Kim 27736e6093a8SNamjae Jeon int __init create_node_manager_caches(void) 2774e05df3b1SJaegeuk Kim { 2775e05df3b1SJaegeuk Kim nat_entry_slab = f2fs_kmem_cache_create("nat_entry", 2776e8512d2eSGu Zheng sizeof(struct nat_entry)); 2777e05df3b1SJaegeuk Kim if (!nat_entry_slab) 2778aec71382SChao Yu goto fail; 2779e05df3b1SJaegeuk Kim 2780e05df3b1SJaegeuk Kim free_nid_slab = f2fs_kmem_cache_create("free_nid", 2781e8512d2eSGu Zheng sizeof(struct free_nid)); 2782aec71382SChao Yu if (!free_nid_slab) 2783ce3e6d25SMarkus Elfring goto destroy_nat_entry; 2784aec71382SChao Yu 2785aec71382SChao Yu nat_entry_set_slab = f2fs_kmem_cache_create("nat_entry_set", 2786aec71382SChao Yu sizeof(struct nat_entry_set)); 2787aec71382SChao Yu if (!nat_entry_set_slab) 2788ce3e6d25SMarkus Elfring goto destroy_free_nid; 2789e05df3b1SJaegeuk Kim return 0; 2790aec71382SChao Yu 2791ce3e6d25SMarkus Elfring destroy_free_nid: 2792aec71382SChao Yu kmem_cache_destroy(free_nid_slab); 2793ce3e6d25SMarkus Elfring destroy_nat_entry: 2794aec71382SChao Yu kmem_cache_destroy(nat_entry_slab); 2795aec71382SChao Yu fail: 2796aec71382SChao Yu return -ENOMEM; 2797e05df3b1SJaegeuk Kim } 2798e05df3b1SJaegeuk Kim 2799e05df3b1SJaegeuk Kim void destroy_node_manager_caches(void) 2800e05df3b1SJaegeuk Kim { 2801aec71382SChao Yu kmem_cache_destroy(nat_entry_set_slab); 2802e05df3b1SJaegeuk Kim kmem_cache_destroy(free_nid_slab); 2803e05df3b1SJaegeuk Kim kmem_cache_destroy(nat_entry_slab); 2804e05df3b1SJaegeuk Kim } 2805