10a8165d7SJaegeuk Kim /* 2e05df3b1SJaegeuk Kim * fs/f2fs/node.c 3e05df3b1SJaegeuk Kim * 4e05df3b1SJaegeuk Kim * Copyright (c) 2012 Samsung Electronics Co., Ltd. 5e05df3b1SJaegeuk Kim * http://www.samsung.com/ 6e05df3b1SJaegeuk Kim * 7e05df3b1SJaegeuk Kim * This program is free software; you can redistribute it and/or modify 8e05df3b1SJaegeuk Kim * it under the terms of the GNU General Public License version 2 as 9e05df3b1SJaegeuk Kim * published by the Free Software Foundation. 10e05df3b1SJaegeuk Kim */ 11e05df3b1SJaegeuk Kim #include <linux/fs.h> 12e05df3b1SJaegeuk Kim #include <linux/f2fs_fs.h> 13e05df3b1SJaegeuk Kim #include <linux/mpage.h> 14e05df3b1SJaegeuk Kim #include <linux/backing-dev.h> 15e05df3b1SJaegeuk Kim #include <linux/blkdev.h> 16e05df3b1SJaegeuk Kim #include <linux/pagevec.h> 17e05df3b1SJaegeuk Kim #include <linux/swap.h> 18e05df3b1SJaegeuk Kim 19e05df3b1SJaegeuk Kim #include "f2fs.h" 20e05df3b1SJaegeuk Kim #include "node.h" 21e05df3b1SJaegeuk Kim #include "segment.h" 2287905682SYunlei He #include "xattr.h" 239e4ded3fSJaegeuk Kim #include "trace.h" 2451dd6249SNamjae Jeon #include <trace/events/f2fs.h> 25e05df3b1SJaegeuk Kim 2668afcf2dSTomohiro Kusumi #define on_build_free_nids(nmi) mutex_is_locked(&(nm_i)->build_lock) 27f978f5a0SGu Zheng 28e05df3b1SJaegeuk Kim static struct kmem_cache *nat_entry_slab; 29e05df3b1SJaegeuk Kim static struct kmem_cache *free_nid_slab; 30aec71382SChao Yu static struct kmem_cache *nat_entry_set_slab; 31e05df3b1SJaegeuk Kim 326fb03f3aSJaegeuk Kim bool available_free_memory(struct f2fs_sb_info *sbi, int type) 33cdfc41c1SJaegeuk Kim { 346fb03f3aSJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 35cdfc41c1SJaegeuk Kim struct sysinfo val; 36e5e7ea3cSJaegeuk Kim unsigned long avail_ram; 37cdfc41c1SJaegeuk Kim unsigned long mem_size = 0; 386fb03f3aSJaegeuk Kim bool res = false; 39cdfc41c1SJaegeuk Kim 40cdfc41c1SJaegeuk Kim si_meminfo(&val); 41e5e7ea3cSJaegeuk Kim 42e5e7ea3cSJaegeuk Kim /* only uses low memory */ 43e5e7ea3cSJaegeuk Kim avail_ram = val.totalram - val.totalhigh; 44e5e7ea3cSJaegeuk Kim 45429511cdSChao Yu /* 46429511cdSChao Yu * give 25%, 25%, 50%, 50%, 50% memory for each components respectively 47429511cdSChao Yu */ 486fb03f3aSJaegeuk Kim if (type == FREE_NIDS) { 49b8559dc2SChao Yu mem_size = (nm_i->nid_cnt[FREE_NID_LIST] * 50b8559dc2SChao Yu sizeof(struct free_nid)) >> PAGE_SHIFT; 51e5e7ea3cSJaegeuk Kim res = mem_size < ((avail_ram * nm_i->ram_thresh / 100) >> 2); 526fb03f3aSJaegeuk Kim } else if (type == NAT_ENTRIES) { 53e5e7ea3cSJaegeuk Kim mem_size = (nm_i->nat_cnt * sizeof(struct nat_entry)) >> 5409cbfeafSKirill A. Shutemov PAGE_SHIFT; 55e5e7ea3cSJaegeuk Kim res = mem_size < ((avail_ram * nm_i->ram_thresh / 100) >> 2); 56e589c2c4SJaegeuk Kim if (excess_cached_nats(sbi)) 57e589c2c4SJaegeuk Kim res = false; 58a1257023SJaegeuk Kim } else if (type == DIRTY_DENTS) { 59a1257023SJaegeuk Kim if (sbi->sb->s_bdi->wb.dirty_exceeded) 60a1257023SJaegeuk Kim return false; 61a1257023SJaegeuk Kim mem_size = get_pages(sbi, F2FS_DIRTY_DENTS); 62a1257023SJaegeuk Kim res = mem_size < ((avail_ram * nm_i->ram_thresh / 100) >> 1); 63e5e7ea3cSJaegeuk Kim } else if (type == INO_ENTRIES) { 64e5e7ea3cSJaegeuk Kim int i; 65e5e7ea3cSJaegeuk Kim 66e5e7ea3cSJaegeuk Kim for (i = 0; i <= UPDATE_INO; i++) 678f73cbb7SKinglong Mee mem_size += sbi->im[i].ino_num * 688f73cbb7SKinglong Mee sizeof(struct ino_entry); 698f73cbb7SKinglong Mee mem_size >>= PAGE_SHIFT; 70e5e7ea3cSJaegeuk Kim res = mem_size < ((avail_ram * nm_i->ram_thresh / 100) >> 1); 71429511cdSChao Yu } else if (type == EXTENT_CACHE) { 727441ccefSJaegeuk Kim mem_size = (atomic_read(&sbi->total_ext_tree) * 737441ccefSJaegeuk Kim sizeof(struct extent_tree) + 74429511cdSChao Yu atomic_read(&sbi->total_ext_node) * 7509cbfeafSKirill A. Shutemov sizeof(struct extent_node)) >> PAGE_SHIFT; 76429511cdSChao Yu res = mem_size < ((avail_ram * nm_i->ram_thresh / 100) >> 1); 771e84371fSJaegeuk Kim } else { 781663cae4SJaegeuk Kim if (!sbi->sb->s_bdi->wb.dirty_exceeded) 791663cae4SJaegeuk Kim return true; 806fb03f3aSJaegeuk Kim } 816fb03f3aSJaegeuk Kim return res; 82cdfc41c1SJaegeuk Kim } 83cdfc41c1SJaegeuk Kim 84e05df3b1SJaegeuk Kim static void clear_node_page_dirty(struct page *page) 85e05df3b1SJaegeuk Kim { 86e05df3b1SJaegeuk Kim struct address_space *mapping = page->mapping; 87e05df3b1SJaegeuk Kim unsigned int long flags; 88e05df3b1SJaegeuk Kim 89e05df3b1SJaegeuk Kim if (PageDirty(page)) { 90e05df3b1SJaegeuk Kim spin_lock_irqsave(&mapping->tree_lock, flags); 91e05df3b1SJaegeuk Kim radix_tree_tag_clear(&mapping->page_tree, 92e05df3b1SJaegeuk Kim page_index(page), 93e05df3b1SJaegeuk Kim PAGECACHE_TAG_DIRTY); 94e05df3b1SJaegeuk Kim spin_unlock_irqrestore(&mapping->tree_lock, flags); 95e05df3b1SJaegeuk Kim 96e05df3b1SJaegeuk Kim clear_page_dirty_for_io(page); 974081363fSJaegeuk Kim dec_page_count(F2FS_M_SB(mapping), F2FS_DIRTY_NODES); 98e05df3b1SJaegeuk Kim } 99e05df3b1SJaegeuk Kim ClearPageUptodate(page); 100e05df3b1SJaegeuk Kim } 101e05df3b1SJaegeuk Kim 102e05df3b1SJaegeuk Kim static struct page *get_current_nat_page(struct f2fs_sb_info *sbi, nid_t nid) 103e05df3b1SJaegeuk Kim { 104e05df3b1SJaegeuk Kim pgoff_t index = current_nat_addr(sbi, nid); 105e05df3b1SJaegeuk Kim return get_meta_page(sbi, index); 106e05df3b1SJaegeuk Kim } 107e05df3b1SJaegeuk Kim 108e05df3b1SJaegeuk Kim static struct page *get_next_nat_page(struct f2fs_sb_info *sbi, nid_t nid) 109e05df3b1SJaegeuk Kim { 110e05df3b1SJaegeuk Kim struct page *src_page; 111e05df3b1SJaegeuk Kim struct page *dst_page; 112e05df3b1SJaegeuk Kim pgoff_t src_off; 113e05df3b1SJaegeuk Kim pgoff_t dst_off; 114e05df3b1SJaegeuk Kim void *src_addr; 115e05df3b1SJaegeuk Kim void *dst_addr; 116e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 117e05df3b1SJaegeuk Kim 118e05df3b1SJaegeuk Kim src_off = current_nat_addr(sbi, nid); 119e05df3b1SJaegeuk Kim dst_off = next_nat_addr(sbi, src_off); 120e05df3b1SJaegeuk Kim 121e05df3b1SJaegeuk Kim /* get current nat block page with lock */ 122e05df3b1SJaegeuk Kim src_page = get_meta_page(sbi, src_off); 123e05df3b1SJaegeuk Kim dst_page = grab_meta_page(sbi, dst_off); 1249850cf4aSJaegeuk Kim f2fs_bug_on(sbi, PageDirty(src_page)); 125e05df3b1SJaegeuk Kim 126e05df3b1SJaegeuk Kim src_addr = page_address(src_page); 127e05df3b1SJaegeuk Kim dst_addr = page_address(dst_page); 12809cbfeafSKirill A. Shutemov memcpy(dst_addr, src_addr, PAGE_SIZE); 129e05df3b1SJaegeuk Kim set_page_dirty(dst_page); 130e05df3b1SJaegeuk Kim f2fs_put_page(src_page, 1); 131e05df3b1SJaegeuk Kim 132e05df3b1SJaegeuk Kim set_to_next_nat(nm_i, nid); 133e05df3b1SJaegeuk Kim 134e05df3b1SJaegeuk Kim return dst_page; 135e05df3b1SJaegeuk Kim } 136e05df3b1SJaegeuk Kim 137e05df3b1SJaegeuk Kim static struct nat_entry *__lookup_nat_cache(struct f2fs_nm_info *nm_i, nid_t n) 138e05df3b1SJaegeuk Kim { 139e05df3b1SJaegeuk Kim return radix_tree_lookup(&nm_i->nat_root, n); 140e05df3b1SJaegeuk Kim } 141e05df3b1SJaegeuk Kim 142e05df3b1SJaegeuk Kim static unsigned int __gang_lookup_nat_cache(struct f2fs_nm_info *nm_i, 143e05df3b1SJaegeuk Kim nid_t start, unsigned int nr, struct nat_entry **ep) 144e05df3b1SJaegeuk Kim { 145e05df3b1SJaegeuk Kim return radix_tree_gang_lookup(&nm_i->nat_root, (void **)ep, start, nr); 146e05df3b1SJaegeuk Kim } 147e05df3b1SJaegeuk Kim 148e05df3b1SJaegeuk Kim static void __del_from_nat_cache(struct f2fs_nm_info *nm_i, struct nat_entry *e) 149e05df3b1SJaegeuk Kim { 150e05df3b1SJaegeuk Kim list_del(&e->list); 151e05df3b1SJaegeuk Kim radix_tree_delete(&nm_i->nat_root, nat_get_nid(e)); 152e05df3b1SJaegeuk Kim nm_i->nat_cnt--; 153e05df3b1SJaegeuk Kim kmem_cache_free(nat_entry_slab, e); 154e05df3b1SJaegeuk Kim } 155e05df3b1SJaegeuk Kim 156309cc2b6SJaegeuk Kim static void __set_nat_cache_dirty(struct f2fs_nm_info *nm_i, 157309cc2b6SJaegeuk Kim struct nat_entry *ne) 158309cc2b6SJaegeuk Kim { 159309cc2b6SJaegeuk Kim nid_t set = NAT_BLOCK_OFFSET(ne->ni.nid); 160309cc2b6SJaegeuk Kim struct nat_entry_set *head; 161309cc2b6SJaegeuk Kim 162309cc2b6SJaegeuk Kim head = radix_tree_lookup(&nm_i->nat_set_root, set); 163309cc2b6SJaegeuk Kim if (!head) { 16480c54505SJaegeuk Kim head = f2fs_kmem_cache_alloc(nat_entry_set_slab, GFP_NOFS); 165309cc2b6SJaegeuk Kim 166309cc2b6SJaegeuk Kim INIT_LIST_HEAD(&head->entry_list); 167309cc2b6SJaegeuk Kim INIT_LIST_HEAD(&head->set_list); 168309cc2b6SJaegeuk Kim head->set = set; 169309cc2b6SJaegeuk Kim head->entry_cnt = 0; 1709be32d72SJaegeuk Kim f2fs_radix_tree_insert(&nm_i->nat_set_root, set, head); 171309cc2b6SJaegeuk Kim } 172febeca6dSChao Yu 173febeca6dSChao Yu if (get_nat_flag(ne, IS_DIRTY)) 174febeca6dSChao Yu goto refresh_list; 175febeca6dSChao Yu 176309cc2b6SJaegeuk Kim nm_i->dirty_nat_cnt++; 177309cc2b6SJaegeuk Kim head->entry_cnt++; 178309cc2b6SJaegeuk Kim set_nat_flag(ne, IS_DIRTY, true); 179febeca6dSChao Yu refresh_list: 180febeca6dSChao Yu if (nat_get_blkaddr(ne) == NEW_ADDR) 181febeca6dSChao Yu list_del_init(&ne->list); 182febeca6dSChao Yu else 183febeca6dSChao Yu list_move_tail(&ne->list, &head->entry_list); 184309cc2b6SJaegeuk Kim } 185309cc2b6SJaegeuk Kim 186309cc2b6SJaegeuk Kim static void __clear_nat_cache_dirty(struct f2fs_nm_info *nm_i, 1870b28b71eSKinglong Mee struct nat_entry_set *set, struct nat_entry *ne) 188309cc2b6SJaegeuk Kim { 189309cc2b6SJaegeuk Kim list_move_tail(&ne->list, &nm_i->nat_entries); 190309cc2b6SJaegeuk Kim set_nat_flag(ne, IS_DIRTY, false); 1910b28b71eSKinglong Mee set->entry_cnt--; 192309cc2b6SJaegeuk Kim nm_i->dirty_nat_cnt--; 193309cc2b6SJaegeuk Kim } 194309cc2b6SJaegeuk Kim 195309cc2b6SJaegeuk Kim static unsigned int __gang_lookup_nat_set(struct f2fs_nm_info *nm_i, 196309cc2b6SJaegeuk Kim nid_t start, unsigned int nr, struct nat_entry_set **ep) 197309cc2b6SJaegeuk Kim { 198309cc2b6SJaegeuk Kim return radix_tree_gang_lookup(&nm_i->nat_set_root, (void **)ep, 199309cc2b6SJaegeuk Kim start, nr); 200309cc2b6SJaegeuk Kim } 201309cc2b6SJaegeuk Kim 2022dcf51abSJaegeuk Kim int need_dentry_mark(struct f2fs_sb_info *sbi, nid_t nid) 2032dcf51abSJaegeuk Kim { 2042dcf51abSJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 2052dcf51abSJaegeuk Kim struct nat_entry *e; 2062dcf51abSJaegeuk Kim bool need = false; 2072dcf51abSJaegeuk Kim 208b873b798SJaegeuk Kim down_read(&nm_i->nat_tree_lock); 2092dcf51abSJaegeuk Kim e = __lookup_nat_cache(nm_i, nid); 2102dcf51abSJaegeuk Kim if (e) { 2112dcf51abSJaegeuk Kim if (!get_nat_flag(e, IS_CHECKPOINTED) && 2122dcf51abSJaegeuk Kim !get_nat_flag(e, HAS_FSYNCED_INODE)) 2132dcf51abSJaegeuk Kim need = true; 2142dcf51abSJaegeuk Kim } 215b873b798SJaegeuk Kim up_read(&nm_i->nat_tree_lock); 2162dcf51abSJaegeuk Kim return need; 2172dcf51abSJaegeuk Kim } 2182dcf51abSJaegeuk Kim 21988bd02c9SJaegeuk Kim bool is_checkpointed_node(struct f2fs_sb_info *sbi, nid_t nid) 220e05df3b1SJaegeuk Kim { 221e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 222e05df3b1SJaegeuk Kim struct nat_entry *e; 22388bd02c9SJaegeuk Kim bool is_cp = true; 224e05df3b1SJaegeuk Kim 225b873b798SJaegeuk Kim down_read(&nm_i->nat_tree_lock); 226e05df3b1SJaegeuk Kim e = __lookup_nat_cache(nm_i, nid); 2277ef35e3bSJaegeuk Kim if (e && !get_nat_flag(e, IS_CHECKPOINTED)) 22888bd02c9SJaegeuk Kim is_cp = false; 229b873b798SJaegeuk Kim up_read(&nm_i->nat_tree_lock); 230e05df3b1SJaegeuk Kim return is_cp; 231e05df3b1SJaegeuk Kim } 232e05df3b1SJaegeuk Kim 23388bd02c9SJaegeuk Kim bool need_inode_block_update(struct f2fs_sb_info *sbi, nid_t ino) 234b6fe5873SJaegeuk Kim { 235b6fe5873SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 236b6fe5873SJaegeuk Kim struct nat_entry *e; 23788bd02c9SJaegeuk Kim bool need_update = true; 238b6fe5873SJaegeuk Kim 239b873b798SJaegeuk Kim down_read(&nm_i->nat_tree_lock); 24088bd02c9SJaegeuk Kim e = __lookup_nat_cache(nm_i, ino); 24188bd02c9SJaegeuk Kim if (e && get_nat_flag(e, HAS_LAST_FSYNC) && 24288bd02c9SJaegeuk Kim (get_nat_flag(e, IS_CHECKPOINTED) || 24388bd02c9SJaegeuk Kim get_nat_flag(e, HAS_FSYNCED_INODE))) 24488bd02c9SJaegeuk Kim need_update = false; 245b873b798SJaegeuk Kim up_read(&nm_i->nat_tree_lock); 24688bd02c9SJaegeuk Kim return need_update; 247b6fe5873SJaegeuk Kim } 248b6fe5873SJaegeuk Kim 2495c9e4184SChao Yu static struct nat_entry *grab_nat_entry(struct f2fs_nm_info *nm_i, nid_t nid, 2505c9e4184SChao Yu bool no_fail) 251e05df3b1SJaegeuk Kim { 252e05df3b1SJaegeuk Kim struct nat_entry *new; 253e05df3b1SJaegeuk Kim 2545c9e4184SChao Yu if (no_fail) { 25580c54505SJaegeuk Kim new = f2fs_kmem_cache_alloc(nat_entry_slab, GFP_NOFS); 2569be32d72SJaegeuk Kim f2fs_radix_tree_insert(&nm_i->nat_root, nid, new); 2575c9e4184SChao Yu } else { 2585c9e4184SChao Yu new = kmem_cache_alloc(nat_entry_slab, GFP_NOFS); 2595c9e4184SChao Yu if (!new) 2605c9e4184SChao Yu return NULL; 2615c9e4184SChao Yu if (radix_tree_insert(&nm_i->nat_root, nid, new)) { 2625c9e4184SChao Yu kmem_cache_free(nat_entry_slab, new); 2635c9e4184SChao Yu return NULL; 2645c9e4184SChao Yu } 2655c9e4184SChao Yu } 2665c9e4184SChao Yu 267e05df3b1SJaegeuk Kim memset(new, 0, sizeof(struct nat_entry)); 268e05df3b1SJaegeuk Kim nat_set_nid(new, nid); 26988bd02c9SJaegeuk Kim nat_reset_flag(new); 270e05df3b1SJaegeuk Kim list_add_tail(&new->list, &nm_i->nat_entries); 271e05df3b1SJaegeuk Kim nm_i->nat_cnt++; 272e05df3b1SJaegeuk Kim return new; 273e05df3b1SJaegeuk Kim } 274e05df3b1SJaegeuk Kim 2751515aef0SChao Yu static void cache_nat_entry(struct f2fs_sb_info *sbi, nid_t nid, 276e05df3b1SJaegeuk Kim struct f2fs_nat_entry *ne) 277e05df3b1SJaegeuk Kim { 2781515aef0SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 279e05df3b1SJaegeuk Kim struct nat_entry *e; 2809be32d72SJaegeuk Kim 281e05df3b1SJaegeuk Kim e = __lookup_nat_cache(nm_i, nid); 282e05df3b1SJaegeuk Kim if (!e) { 2835c9e4184SChao Yu e = grab_nat_entry(nm_i, nid, false); 2845c9e4184SChao Yu if (e) 28594dac22eSChao Yu node_info_from_raw_nat(&e->ni, ne); 2861515aef0SChao Yu } else { 2870c0b471eSEric Biggers f2fs_bug_on(sbi, nat_get_ino(e) != le32_to_cpu(ne->ino) || 2880c0b471eSEric Biggers nat_get_blkaddr(e) != 2890c0b471eSEric Biggers le32_to_cpu(ne->block_addr) || 2901515aef0SChao Yu nat_get_version(e) != ne->version); 291e05df3b1SJaegeuk Kim } 292e05df3b1SJaegeuk Kim } 293e05df3b1SJaegeuk Kim 294e05df3b1SJaegeuk Kim static void set_node_addr(struct f2fs_sb_info *sbi, struct node_info *ni, 295479f40c4SJaegeuk Kim block_t new_blkaddr, bool fsync_done) 296e05df3b1SJaegeuk Kim { 297e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 298e05df3b1SJaegeuk Kim struct nat_entry *e; 2999be32d72SJaegeuk Kim 300b873b798SJaegeuk Kim down_write(&nm_i->nat_tree_lock); 301e05df3b1SJaegeuk Kim e = __lookup_nat_cache(nm_i, ni->nid); 302e05df3b1SJaegeuk Kim if (!e) { 3035c9e4184SChao Yu e = grab_nat_entry(nm_i, ni->nid, true); 3045c27f4eeSChao Yu copy_node_info(&e->ni, ni); 3059850cf4aSJaegeuk Kim f2fs_bug_on(sbi, ni->blk_addr == NEW_ADDR); 306e05df3b1SJaegeuk Kim } else if (new_blkaddr == NEW_ADDR) { 307e05df3b1SJaegeuk Kim /* 308e05df3b1SJaegeuk Kim * when nid is reallocated, 309e05df3b1SJaegeuk Kim * previous nat entry can be remained in nat cache. 310e05df3b1SJaegeuk Kim * So, reinitialize it with new information. 311e05df3b1SJaegeuk Kim */ 3125c27f4eeSChao Yu copy_node_info(&e->ni, ni); 3139850cf4aSJaegeuk Kim f2fs_bug_on(sbi, ni->blk_addr != NULL_ADDR); 314e05df3b1SJaegeuk Kim } 315e05df3b1SJaegeuk Kim 316e05df3b1SJaegeuk Kim /* sanity check */ 3179850cf4aSJaegeuk Kim f2fs_bug_on(sbi, nat_get_blkaddr(e) != ni->blk_addr); 3189850cf4aSJaegeuk Kim f2fs_bug_on(sbi, nat_get_blkaddr(e) == NULL_ADDR && 319e05df3b1SJaegeuk Kim new_blkaddr == NULL_ADDR); 3209850cf4aSJaegeuk Kim f2fs_bug_on(sbi, nat_get_blkaddr(e) == NEW_ADDR && 321e05df3b1SJaegeuk Kim new_blkaddr == NEW_ADDR); 3229850cf4aSJaegeuk Kim f2fs_bug_on(sbi, nat_get_blkaddr(e) != NEW_ADDR && 323e05df3b1SJaegeuk Kim nat_get_blkaddr(e) != NULL_ADDR && 324e05df3b1SJaegeuk Kim new_blkaddr == NEW_ADDR); 325e05df3b1SJaegeuk Kim 326e1c42045Sarter97 /* increment version no as node is removed */ 327e05df3b1SJaegeuk Kim if (nat_get_blkaddr(e) != NEW_ADDR && new_blkaddr == NULL_ADDR) { 328e05df3b1SJaegeuk Kim unsigned char version = nat_get_version(e); 329e05df3b1SJaegeuk Kim nat_set_version(e, inc_node_version(version)); 33026834466SJaegeuk Kim 33126834466SJaegeuk Kim /* in order to reuse the nid */ 33226834466SJaegeuk Kim if (nm_i->next_scan_nid > ni->nid) 33326834466SJaegeuk Kim nm_i->next_scan_nid = ni->nid; 334e05df3b1SJaegeuk Kim } 335e05df3b1SJaegeuk Kim 336e05df3b1SJaegeuk Kim /* change address */ 337e05df3b1SJaegeuk Kim nat_set_blkaddr(e, new_blkaddr); 33888bd02c9SJaegeuk Kim if (new_blkaddr == NEW_ADDR || new_blkaddr == NULL_ADDR) 33988bd02c9SJaegeuk Kim set_nat_flag(e, IS_CHECKPOINTED, false); 340e05df3b1SJaegeuk Kim __set_nat_cache_dirty(nm_i, e); 341479f40c4SJaegeuk Kim 342479f40c4SJaegeuk Kim /* update fsync_mark if its inode nat entry is still alive */ 343d5b692b7SChao Yu if (ni->nid != ni->ino) 344479f40c4SJaegeuk Kim e = __lookup_nat_cache(nm_i, ni->ino); 34588bd02c9SJaegeuk Kim if (e) { 34688bd02c9SJaegeuk Kim if (fsync_done && ni->nid == ni->ino) 34788bd02c9SJaegeuk Kim set_nat_flag(e, HAS_FSYNCED_INODE, true); 34888bd02c9SJaegeuk Kim set_nat_flag(e, HAS_LAST_FSYNC, fsync_done); 34988bd02c9SJaegeuk Kim } 350b873b798SJaegeuk Kim up_write(&nm_i->nat_tree_lock); 351e05df3b1SJaegeuk Kim } 352e05df3b1SJaegeuk Kim 3534660f9c0SJaegeuk Kim int try_to_free_nats(struct f2fs_sb_info *sbi, int nr_shrink) 354e05df3b1SJaegeuk Kim { 355e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 3561b38dc8eSJaegeuk Kim int nr = nr_shrink; 357e05df3b1SJaegeuk Kim 358b873b798SJaegeuk Kim if (!down_write_trylock(&nm_i->nat_tree_lock)) 359b873b798SJaegeuk Kim return 0; 360e05df3b1SJaegeuk Kim 361e05df3b1SJaegeuk Kim while (nr_shrink && !list_empty(&nm_i->nat_entries)) { 362e05df3b1SJaegeuk Kim struct nat_entry *ne; 363e05df3b1SJaegeuk Kim ne = list_first_entry(&nm_i->nat_entries, 364e05df3b1SJaegeuk Kim struct nat_entry, list); 365e05df3b1SJaegeuk Kim __del_from_nat_cache(nm_i, ne); 366e05df3b1SJaegeuk Kim nr_shrink--; 367e05df3b1SJaegeuk Kim } 368b873b798SJaegeuk Kim up_write(&nm_i->nat_tree_lock); 3691b38dc8eSJaegeuk Kim return nr - nr_shrink; 370e05df3b1SJaegeuk Kim } 371e05df3b1SJaegeuk Kim 3720a8165d7SJaegeuk Kim /* 373e1c42045Sarter97 * This function always returns success 374e05df3b1SJaegeuk Kim */ 375e05df3b1SJaegeuk Kim void get_node_info(struct f2fs_sb_info *sbi, nid_t nid, struct node_info *ni) 376e05df3b1SJaegeuk Kim { 377e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 378e05df3b1SJaegeuk Kim struct curseg_info *curseg = CURSEG_I(sbi, CURSEG_HOT_DATA); 379b7ad7512SChao Yu struct f2fs_journal *journal = curseg->journal; 380e05df3b1SJaegeuk Kim nid_t start_nid = START_NID(nid); 381e05df3b1SJaegeuk Kim struct f2fs_nat_block *nat_blk; 382e05df3b1SJaegeuk Kim struct page *page = NULL; 383e05df3b1SJaegeuk Kim struct f2fs_nat_entry ne; 384e05df3b1SJaegeuk Kim struct nat_entry *e; 38566a82d1fSYunlei He pgoff_t index; 386e05df3b1SJaegeuk Kim int i; 387e05df3b1SJaegeuk Kim 388e05df3b1SJaegeuk Kim ni->nid = nid; 389e05df3b1SJaegeuk Kim 390e05df3b1SJaegeuk Kim /* Check nat cache */ 391b873b798SJaegeuk Kim down_read(&nm_i->nat_tree_lock); 392e05df3b1SJaegeuk Kim e = __lookup_nat_cache(nm_i, nid); 393e05df3b1SJaegeuk Kim if (e) { 394e05df3b1SJaegeuk Kim ni->ino = nat_get_ino(e); 395e05df3b1SJaegeuk Kim ni->blk_addr = nat_get_blkaddr(e); 396e05df3b1SJaegeuk Kim ni->version = nat_get_version(e); 397b873b798SJaegeuk Kim up_read(&nm_i->nat_tree_lock); 398e05df3b1SJaegeuk Kim return; 3991515aef0SChao Yu } 400e05df3b1SJaegeuk Kim 4013547ea96SJaegeuk Kim memset(&ne, 0, sizeof(struct f2fs_nat_entry)); 4023547ea96SJaegeuk Kim 403e05df3b1SJaegeuk Kim /* Check current segment summary */ 404b7ad7512SChao Yu down_read(&curseg->journal_rwsem); 405dfc08a12SChao Yu i = lookup_journal_in_cursum(journal, NAT_JOURNAL, nid, 0); 406e05df3b1SJaegeuk Kim if (i >= 0) { 407dfc08a12SChao Yu ne = nat_in_journal(journal, i); 408e05df3b1SJaegeuk Kim node_info_from_raw_nat(ni, &ne); 409e05df3b1SJaegeuk Kim } 410b7ad7512SChao Yu up_read(&curseg->journal_rwsem); 41166a82d1fSYunlei He if (i >= 0) { 41266a82d1fSYunlei He up_read(&nm_i->nat_tree_lock); 413e05df3b1SJaegeuk Kim goto cache; 41466a82d1fSYunlei He } 415e05df3b1SJaegeuk Kim 416e05df3b1SJaegeuk Kim /* Fill node_info from nat page */ 41766a82d1fSYunlei He index = current_nat_addr(sbi, nid); 41866a82d1fSYunlei He up_read(&nm_i->nat_tree_lock); 41966a82d1fSYunlei He 42066a82d1fSYunlei He page = get_meta_page(sbi, index); 421e05df3b1SJaegeuk Kim nat_blk = (struct f2fs_nat_block *)page_address(page); 422e05df3b1SJaegeuk Kim ne = nat_blk->entries[nid - start_nid]; 423e05df3b1SJaegeuk Kim node_info_from_raw_nat(ni, &ne); 424e05df3b1SJaegeuk Kim f2fs_put_page(page, 1); 425e05df3b1SJaegeuk Kim cache: 426e05df3b1SJaegeuk Kim /* cache nat entry */ 427b873b798SJaegeuk Kim down_write(&nm_i->nat_tree_lock); 4281515aef0SChao Yu cache_nat_entry(sbi, nid, &ne); 429b873b798SJaegeuk Kim up_write(&nm_i->nat_tree_lock); 430e05df3b1SJaegeuk Kim } 431e05df3b1SJaegeuk Kim 43279344efbSJaegeuk Kim /* 43379344efbSJaegeuk Kim * readahead MAX_RA_NODE number of node pages. 43479344efbSJaegeuk Kim */ 43579344efbSJaegeuk Kim static void ra_node_pages(struct page *parent, int start, int n) 43679344efbSJaegeuk Kim { 43779344efbSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_P_SB(parent); 43879344efbSJaegeuk Kim struct blk_plug plug; 43979344efbSJaegeuk Kim int i, end; 44079344efbSJaegeuk Kim nid_t nid; 44179344efbSJaegeuk Kim 44279344efbSJaegeuk Kim blk_start_plug(&plug); 44379344efbSJaegeuk Kim 44479344efbSJaegeuk Kim /* Then, try readahead for siblings of the desired node */ 44579344efbSJaegeuk Kim end = start + n; 44679344efbSJaegeuk Kim end = min(end, NIDS_PER_BLOCK); 44779344efbSJaegeuk Kim for (i = start; i < end; i++) { 44879344efbSJaegeuk Kim nid = get_nid(parent, i, false); 44979344efbSJaegeuk Kim ra_node_page(sbi, nid); 45079344efbSJaegeuk Kim } 45179344efbSJaegeuk Kim 45279344efbSJaegeuk Kim blk_finish_plug(&plug); 45379344efbSJaegeuk Kim } 45479344efbSJaegeuk Kim 4553cf45747SChao Yu pgoff_t get_next_page_offset(struct dnode_of_data *dn, pgoff_t pgofs) 4563cf45747SChao Yu { 4573cf45747SChao Yu const long direct_index = ADDRS_PER_INODE(dn->inode); 4583cf45747SChao Yu const long direct_blks = ADDRS_PER_BLOCK; 4593cf45747SChao Yu const long indirect_blks = ADDRS_PER_BLOCK * NIDS_PER_BLOCK; 4603cf45747SChao Yu unsigned int skipped_unit = ADDRS_PER_BLOCK; 4613cf45747SChao Yu int cur_level = dn->cur_level; 4623cf45747SChao Yu int max_level = dn->max_level; 4633cf45747SChao Yu pgoff_t base = 0; 4643cf45747SChao Yu 4653cf45747SChao Yu if (!dn->max_level) 4663cf45747SChao Yu return pgofs + 1; 4673cf45747SChao Yu 4683cf45747SChao Yu while (max_level-- > cur_level) 4693cf45747SChao Yu skipped_unit *= NIDS_PER_BLOCK; 4703cf45747SChao Yu 4713cf45747SChao Yu switch (dn->max_level) { 4723cf45747SChao Yu case 3: 4733cf45747SChao Yu base += 2 * indirect_blks; 4743cf45747SChao Yu case 2: 4753cf45747SChao Yu base += 2 * direct_blks; 4763cf45747SChao Yu case 1: 4773cf45747SChao Yu base += direct_index; 4783cf45747SChao Yu break; 4793cf45747SChao Yu default: 4803cf45747SChao Yu f2fs_bug_on(F2FS_I_SB(dn->inode), 1); 4813cf45747SChao Yu } 4823cf45747SChao Yu 4833cf45747SChao Yu return ((pgofs - base) / skipped_unit + 1) * skipped_unit + base; 4843cf45747SChao Yu } 4853cf45747SChao Yu 4860a8165d7SJaegeuk Kim /* 487e05df3b1SJaegeuk Kim * The maximum depth is four. 488e05df3b1SJaegeuk Kim * Offset[0] will have raw inode offset. 489e05df3b1SJaegeuk Kim */ 49081ca7350SChao Yu static int get_node_path(struct inode *inode, long block, 491de93653fSJaegeuk Kim int offset[4], unsigned int noffset[4]) 492e05df3b1SJaegeuk Kim { 49381ca7350SChao Yu const long direct_index = ADDRS_PER_INODE(inode); 494e05df3b1SJaegeuk Kim const long direct_blks = ADDRS_PER_BLOCK; 495e05df3b1SJaegeuk Kim const long dptrs_per_blk = NIDS_PER_BLOCK; 496e05df3b1SJaegeuk Kim const long indirect_blks = ADDRS_PER_BLOCK * NIDS_PER_BLOCK; 497e05df3b1SJaegeuk Kim const long dindirect_blks = indirect_blks * NIDS_PER_BLOCK; 498e05df3b1SJaegeuk Kim int n = 0; 499e05df3b1SJaegeuk Kim int level = 0; 500e05df3b1SJaegeuk Kim 501e05df3b1SJaegeuk Kim noffset[0] = 0; 502e05df3b1SJaegeuk Kim 503e05df3b1SJaegeuk Kim if (block < direct_index) { 50425c0a6e5SNamjae Jeon offset[n] = block; 505e05df3b1SJaegeuk Kim goto got; 506e05df3b1SJaegeuk Kim } 507e05df3b1SJaegeuk Kim block -= direct_index; 508e05df3b1SJaegeuk Kim if (block < direct_blks) { 509e05df3b1SJaegeuk Kim offset[n++] = NODE_DIR1_BLOCK; 510e05df3b1SJaegeuk Kim noffset[n] = 1; 51125c0a6e5SNamjae Jeon offset[n] = block; 512e05df3b1SJaegeuk Kim level = 1; 513e05df3b1SJaegeuk Kim goto got; 514e05df3b1SJaegeuk Kim } 515e05df3b1SJaegeuk Kim block -= direct_blks; 516e05df3b1SJaegeuk Kim if (block < direct_blks) { 517e05df3b1SJaegeuk Kim offset[n++] = NODE_DIR2_BLOCK; 518e05df3b1SJaegeuk Kim noffset[n] = 2; 51925c0a6e5SNamjae Jeon offset[n] = block; 520e05df3b1SJaegeuk Kim level = 1; 521e05df3b1SJaegeuk Kim goto got; 522e05df3b1SJaegeuk Kim } 523e05df3b1SJaegeuk Kim block -= direct_blks; 524e05df3b1SJaegeuk Kim if (block < indirect_blks) { 525e05df3b1SJaegeuk Kim offset[n++] = NODE_IND1_BLOCK; 526e05df3b1SJaegeuk Kim noffset[n] = 3; 527e05df3b1SJaegeuk Kim offset[n++] = block / direct_blks; 528e05df3b1SJaegeuk Kim noffset[n] = 4 + offset[n - 1]; 52925c0a6e5SNamjae Jeon offset[n] = block % direct_blks; 530e05df3b1SJaegeuk Kim level = 2; 531e05df3b1SJaegeuk Kim goto got; 532e05df3b1SJaegeuk Kim } 533e05df3b1SJaegeuk Kim block -= indirect_blks; 534e05df3b1SJaegeuk Kim if (block < indirect_blks) { 535e05df3b1SJaegeuk Kim offset[n++] = NODE_IND2_BLOCK; 536e05df3b1SJaegeuk Kim noffset[n] = 4 + dptrs_per_blk; 537e05df3b1SJaegeuk Kim offset[n++] = block / direct_blks; 538e05df3b1SJaegeuk Kim noffset[n] = 5 + dptrs_per_blk + offset[n - 1]; 53925c0a6e5SNamjae Jeon offset[n] = block % direct_blks; 540e05df3b1SJaegeuk Kim level = 2; 541e05df3b1SJaegeuk Kim goto got; 542e05df3b1SJaegeuk Kim } 543e05df3b1SJaegeuk Kim block -= indirect_blks; 544e05df3b1SJaegeuk Kim if (block < dindirect_blks) { 545e05df3b1SJaegeuk Kim offset[n++] = NODE_DIND_BLOCK; 546e05df3b1SJaegeuk Kim noffset[n] = 5 + (dptrs_per_blk * 2); 547e05df3b1SJaegeuk Kim offset[n++] = block / indirect_blks; 548e05df3b1SJaegeuk Kim noffset[n] = 6 + (dptrs_per_blk * 2) + 549e05df3b1SJaegeuk Kim offset[n - 1] * (dptrs_per_blk + 1); 550e05df3b1SJaegeuk Kim offset[n++] = (block / direct_blks) % dptrs_per_blk; 551e05df3b1SJaegeuk Kim noffset[n] = 7 + (dptrs_per_blk * 2) + 552e05df3b1SJaegeuk Kim offset[n - 2] * (dptrs_per_blk + 1) + 553e05df3b1SJaegeuk Kim offset[n - 1]; 55425c0a6e5SNamjae Jeon offset[n] = block % direct_blks; 555e05df3b1SJaegeuk Kim level = 3; 556e05df3b1SJaegeuk Kim goto got; 557e05df3b1SJaegeuk Kim } else { 558e05df3b1SJaegeuk Kim BUG(); 559e05df3b1SJaegeuk Kim } 560e05df3b1SJaegeuk Kim got: 561e05df3b1SJaegeuk Kim return level; 562e05df3b1SJaegeuk Kim } 563e05df3b1SJaegeuk Kim 564e05df3b1SJaegeuk Kim /* 565e05df3b1SJaegeuk Kim * Caller should call f2fs_put_dnode(dn). 5664f4124d0SChao Yu * Also, it should grab and release a rwsem by calling f2fs_lock_op() and 5674f4124d0SChao Yu * f2fs_unlock_op() only if ro is not set RDONLY_NODE. 56839936837SJaegeuk Kim * In the case of RDONLY_NODE, we don't need to care about mutex. 569e05df3b1SJaegeuk Kim */ 570266e97a8SJaegeuk Kim int get_dnode_of_data(struct dnode_of_data *dn, pgoff_t index, int mode) 571e05df3b1SJaegeuk Kim { 5724081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode); 573e05df3b1SJaegeuk Kim struct page *npage[4]; 574f1a3b98eSJaegeuk Kim struct page *parent = NULL; 575e05df3b1SJaegeuk Kim int offset[4]; 576e05df3b1SJaegeuk Kim unsigned int noffset[4]; 577e05df3b1SJaegeuk Kim nid_t nids[4]; 5783cf45747SChao Yu int level, i = 0; 579e05df3b1SJaegeuk Kim int err = 0; 580e05df3b1SJaegeuk Kim 58181ca7350SChao Yu level = get_node_path(dn->inode, index, offset, noffset); 582e05df3b1SJaegeuk Kim 583e05df3b1SJaegeuk Kim nids[0] = dn->inode->i_ino; 5841646cfacSJaegeuk Kim npage[0] = dn->inode_page; 5851646cfacSJaegeuk Kim 5861646cfacSJaegeuk Kim if (!npage[0]) { 587e05df3b1SJaegeuk Kim npage[0] = get_node_page(sbi, nids[0]); 588e05df3b1SJaegeuk Kim if (IS_ERR(npage[0])) 589e05df3b1SJaegeuk Kim return PTR_ERR(npage[0]); 5901646cfacSJaegeuk Kim } 591f1a3b98eSJaegeuk Kim 592f1a3b98eSJaegeuk Kim /* if inline_data is set, should not report any block indices */ 593f1a3b98eSJaegeuk Kim if (f2fs_has_inline_data(dn->inode) && index) { 59476629165SJaegeuk Kim err = -ENOENT; 595f1a3b98eSJaegeuk Kim f2fs_put_page(npage[0], 1); 596f1a3b98eSJaegeuk Kim goto release_out; 597f1a3b98eSJaegeuk Kim } 598f1a3b98eSJaegeuk Kim 599e05df3b1SJaegeuk Kim parent = npage[0]; 60052c2db3fSChangman Lee if (level != 0) 601e05df3b1SJaegeuk Kim nids[1] = get_nid(parent, offset[0], true); 602e05df3b1SJaegeuk Kim dn->inode_page = npage[0]; 603e05df3b1SJaegeuk Kim dn->inode_page_locked = true; 604e05df3b1SJaegeuk Kim 605e05df3b1SJaegeuk Kim /* get indirect or direct nodes */ 606e05df3b1SJaegeuk Kim for (i = 1; i <= level; i++) { 607e05df3b1SJaegeuk Kim bool done = false; 608e05df3b1SJaegeuk Kim 609266e97a8SJaegeuk Kim if (!nids[i] && mode == ALLOC_NODE) { 610e05df3b1SJaegeuk Kim /* alloc new node */ 611e05df3b1SJaegeuk Kim if (!alloc_nid(sbi, &(nids[i]))) { 612e05df3b1SJaegeuk Kim err = -ENOSPC; 613e05df3b1SJaegeuk Kim goto release_pages; 614e05df3b1SJaegeuk Kim } 615e05df3b1SJaegeuk Kim 616e05df3b1SJaegeuk Kim dn->nid = nids[i]; 6175f4ce6abSYunlei He npage[i] = new_node_page(dn, noffset[i]); 618e05df3b1SJaegeuk Kim if (IS_ERR(npage[i])) { 619e05df3b1SJaegeuk Kim alloc_nid_failed(sbi, nids[i]); 620e05df3b1SJaegeuk Kim err = PTR_ERR(npage[i]); 621e05df3b1SJaegeuk Kim goto release_pages; 622e05df3b1SJaegeuk Kim } 623e05df3b1SJaegeuk Kim 624e05df3b1SJaegeuk Kim set_nid(parent, offset[i - 1], nids[i], i == 1); 625e05df3b1SJaegeuk Kim alloc_nid_done(sbi, nids[i]); 626e05df3b1SJaegeuk Kim done = true; 627266e97a8SJaegeuk Kim } else if (mode == LOOKUP_NODE_RA && i == level && level > 1) { 628e05df3b1SJaegeuk Kim npage[i] = get_node_page_ra(parent, offset[i - 1]); 629e05df3b1SJaegeuk Kim if (IS_ERR(npage[i])) { 630e05df3b1SJaegeuk Kim err = PTR_ERR(npage[i]); 631e05df3b1SJaegeuk Kim goto release_pages; 632e05df3b1SJaegeuk Kim } 633e05df3b1SJaegeuk Kim done = true; 634e05df3b1SJaegeuk Kim } 635e05df3b1SJaegeuk Kim if (i == 1) { 636e05df3b1SJaegeuk Kim dn->inode_page_locked = false; 637e05df3b1SJaegeuk Kim unlock_page(parent); 638e05df3b1SJaegeuk Kim } else { 639e05df3b1SJaegeuk Kim f2fs_put_page(parent, 1); 640e05df3b1SJaegeuk Kim } 641e05df3b1SJaegeuk Kim 642e05df3b1SJaegeuk Kim if (!done) { 643e05df3b1SJaegeuk Kim npage[i] = get_node_page(sbi, nids[i]); 644e05df3b1SJaegeuk Kim if (IS_ERR(npage[i])) { 645e05df3b1SJaegeuk Kim err = PTR_ERR(npage[i]); 646e05df3b1SJaegeuk Kim f2fs_put_page(npage[0], 0); 647e05df3b1SJaegeuk Kim goto release_out; 648e05df3b1SJaegeuk Kim } 649e05df3b1SJaegeuk Kim } 650e05df3b1SJaegeuk Kim if (i < level) { 651e05df3b1SJaegeuk Kim parent = npage[i]; 652e05df3b1SJaegeuk Kim nids[i + 1] = get_nid(parent, offset[i], false); 653e05df3b1SJaegeuk Kim } 654e05df3b1SJaegeuk Kim } 655e05df3b1SJaegeuk Kim dn->nid = nids[level]; 656e05df3b1SJaegeuk Kim dn->ofs_in_node = offset[level]; 657e05df3b1SJaegeuk Kim dn->node_page = npage[level]; 658e05df3b1SJaegeuk Kim dn->data_blkaddr = datablock_addr(dn->node_page, dn->ofs_in_node); 659e05df3b1SJaegeuk Kim return 0; 660e05df3b1SJaegeuk Kim 661e05df3b1SJaegeuk Kim release_pages: 662e05df3b1SJaegeuk Kim f2fs_put_page(parent, 1); 663e05df3b1SJaegeuk Kim if (i > 1) 664e05df3b1SJaegeuk Kim f2fs_put_page(npage[0], 0); 665e05df3b1SJaegeuk Kim release_out: 666e05df3b1SJaegeuk Kim dn->inode_page = NULL; 667e05df3b1SJaegeuk Kim dn->node_page = NULL; 6683cf45747SChao Yu if (err == -ENOENT) { 6693cf45747SChao Yu dn->cur_level = i; 6703cf45747SChao Yu dn->max_level = level; 6710a2aa8fbSJaegeuk Kim dn->ofs_in_node = offset[level]; 6723cf45747SChao Yu } 673e05df3b1SJaegeuk Kim return err; 674e05df3b1SJaegeuk Kim } 675e05df3b1SJaegeuk Kim 676e05df3b1SJaegeuk Kim static void truncate_node(struct dnode_of_data *dn) 677e05df3b1SJaegeuk Kim { 6784081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode); 679e05df3b1SJaegeuk Kim struct node_info ni; 680e05df3b1SJaegeuk Kim 681e05df3b1SJaegeuk Kim get_node_info(sbi, dn->nid, &ni); 6829850cf4aSJaegeuk Kim f2fs_bug_on(sbi, ni.blk_addr == NULL_ADDR); 683e05df3b1SJaegeuk Kim 684e05df3b1SJaegeuk Kim /* Deallocate node address */ 68571e9fec5SJaegeuk Kim invalidate_blocks(sbi, ni.blk_addr); 686000519f2SChao Yu dec_valid_node_count(sbi, dn->inode, dn->nid == dn->inode->i_ino); 687479f40c4SJaegeuk Kim set_node_addr(sbi, &ni, NULL_ADDR, false); 688e05df3b1SJaegeuk Kim 689e05df3b1SJaegeuk Kim if (dn->nid == dn->inode->i_ino) { 690e05df3b1SJaegeuk Kim remove_orphan_inode(sbi, dn->nid); 691e05df3b1SJaegeuk Kim dec_valid_inode_count(sbi); 6920f18b462SJaegeuk Kim f2fs_inode_synced(dn->inode); 693e05df3b1SJaegeuk Kim } 694000519f2SChao Yu 695e05df3b1SJaegeuk Kim clear_node_page_dirty(dn->node_page); 696caf0047eSChao Yu set_sbi_flag(sbi, SBI_IS_DIRTY); 697e05df3b1SJaegeuk Kim 698e05df3b1SJaegeuk Kim f2fs_put_page(dn->node_page, 1); 699bf39c00aSJaegeuk Kim 700bf39c00aSJaegeuk Kim invalidate_mapping_pages(NODE_MAPPING(sbi), 701bf39c00aSJaegeuk Kim dn->node_page->index, dn->node_page->index); 702bf39c00aSJaegeuk Kim 703e05df3b1SJaegeuk Kim dn->node_page = NULL; 70451dd6249SNamjae Jeon trace_f2fs_truncate_node(dn->inode, dn->nid, ni.blk_addr); 705e05df3b1SJaegeuk Kim } 706e05df3b1SJaegeuk Kim 707e05df3b1SJaegeuk Kim static int truncate_dnode(struct dnode_of_data *dn) 708e05df3b1SJaegeuk Kim { 709e05df3b1SJaegeuk Kim struct page *page; 710e05df3b1SJaegeuk Kim 711e05df3b1SJaegeuk Kim if (dn->nid == 0) 712e05df3b1SJaegeuk Kim return 1; 713e05df3b1SJaegeuk Kim 714e05df3b1SJaegeuk Kim /* get direct node */ 7154081363fSJaegeuk Kim page = get_node_page(F2FS_I_SB(dn->inode), dn->nid); 716e05df3b1SJaegeuk Kim if (IS_ERR(page) && PTR_ERR(page) == -ENOENT) 717e05df3b1SJaegeuk Kim return 1; 718e05df3b1SJaegeuk Kim else if (IS_ERR(page)) 719e05df3b1SJaegeuk Kim return PTR_ERR(page); 720e05df3b1SJaegeuk Kim 721e05df3b1SJaegeuk Kim /* Make dnode_of_data for parameter */ 722e05df3b1SJaegeuk Kim dn->node_page = page; 723e05df3b1SJaegeuk Kim dn->ofs_in_node = 0; 724e05df3b1SJaegeuk Kim truncate_data_blocks(dn); 725e05df3b1SJaegeuk Kim truncate_node(dn); 726e05df3b1SJaegeuk Kim return 1; 727e05df3b1SJaegeuk Kim } 728e05df3b1SJaegeuk Kim 729e05df3b1SJaegeuk Kim static int truncate_nodes(struct dnode_of_data *dn, unsigned int nofs, 730e05df3b1SJaegeuk Kim int ofs, int depth) 731e05df3b1SJaegeuk Kim { 732e05df3b1SJaegeuk Kim struct dnode_of_data rdn = *dn; 733e05df3b1SJaegeuk Kim struct page *page; 734e05df3b1SJaegeuk Kim struct f2fs_node *rn; 735e05df3b1SJaegeuk Kim nid_t child_nid; 736e05df3b1SJaegeuk Kim unsigned int child_nofs; 737e05df3b1SJaegeuk Kim int freed = 0; 738e05df3b1SJaegeuk Kim int i, ret; 739e05df3b1SJaegeuk Kim 740e05df3b1SJaegeuk Kim if (dn->nid == 0) 741e05df3b1SJaegeuk Kim return NIDS_PER_BLOCK + 1; 742e05df3b1SJaegeuk Kim 74351dd6249SNamjae Jeon trace_f2fs_truncate_nodes_enter(dn->inode, dn->nid, dn->data_blkaddr); 74451dd6249SNamjae Jeon 7454081363fSJaegeuk Kim page = get_node_page(F2FS_I_SB(dn->inode), dn->nid); 74651dd6249SNamjae Jeon if (IS_ERR(page)) { 74751dd6249SNamjae Jeon trace_f2fs_truncate_nodes_exit(dn->inode, PTR_ERR(page)); 748e05df3b1SJaegeuk Kim return PTR_ERR(page); 74951dd6249SNamjae Jeon } 750e05df3b1SJaegeuk Kim 75179344efbSJaegeuk Kim ra_node_pages(page, ofs, NIDS_PER_BLOCK); 75279344efbSJaegeuk Kim 75345590710SGu Zheng rn = F2FS_NODE(page); 754e05df3b1SJaegeuk Kim if (depth < 3) { 755e05df3b1SJaegeuk Kim for (i = ofs; i < NIDS_PER_BLOCK; i++, freed++) { 756e05df3b1SJaegeuk Kim child_nid = le32_to_cpu(rn->in.nid[i]); 757e05df3b1SJaegeuk Kim if (child_nid == 0) 758e05df3b1SJaegeuk Kim continue; 759e05df3b1SJaegeuk Kim rdn.nid = child_nid; 760e05df3b1SJaegeuk Kim ret = truncate_dnode(&rdn); 761e05df3b1SJaegeuk Kim if (ret < 0) 762e05df3b1SJaegeuk Kim goto out_err; 76312719ae1SJaegeuk Kim if (set_nid(page, i, 0, false)) 76493bae099SJaegeuk Kim dn->node_changed = true; 765e05df3b1SJaegeuk Kim } 766e05df3b1SJaegeuk Kim } else { 767e05df3b1SJaegeuk Kim child_nofs = nofs + ofs * (NIDS_PER_BLOCK + 1) + 1; 768e05df3b1SJaegeuk Kim for (i = ofs; i < NIDS_PER_BLOCK; i++) { 769e05df3b1SJaegeuk Kim child_nid = le32_to_cpu(rn->in.nid[i]); 770e05df3b1SJaegeuk Kim if (child_nid == 0) { 771e05df3b1SJaegeuk Kim child_nofs += NIDS_PER_BLOCK + 1; 772e05df3b1SJaegeuk Kim continue; 773e05df3b1SJaegeuk Kim } 774e05df3b1SJaegeuk Kim rdn.nid = child_nid; 775e05df3b1SJaegeuk Kim ret = truncate_nodes(&rdn, child_nofs, 0, depth - 1); 776e05df3b1SJaegeuk Kim if (ret == (NIDS_PER_BLOCK + 1)) { 77712719ae1SJaegeuk Kim if (set_nid(page, i, 0, false)) 77893bae099SJaegeuk Kim dn->node_changed = true; 779e05df3b1SJaegeuk Kim child_nofs += ret; 780e05df3b1SJaegeuk Kim } else if (ret < 0 && ret != -ENOENT) { 781e05df3b1SJaegeuk Kim goto out_err; 782e05df3b1SJaegeuk Kim } 783e05df3b1SJaegeuk Kim } 784e05df3b1SJaegeuk Kim freed = child_nofs; 785e05df3b1SJaegeuk Kim } 786e05df3b1SJaegeuk Kim 787e05df3b1SJaegeuk Kim if (!ofs) { 788e05df3b1SJaegeuk Kim /* remove current indirect node */ 789e05df3b1SJaegeuk Kim dn->node_page = page; 790e05df3b1SJaegeuk Kim truncate_node(dn); 791e05df3b1SJaegeuk Kim freed++; 792e05df3b1SJaegeuk Kim } else { 793e05df3b1SJaegeuk Kim f2fs_put_page(page, 1); 794e05df3b1SJaegeuk Kim } 79551dd6249SNamjae Jeon trace_f2fs_truncate_nodes_exit(dn->inode, freed); 796e05df3b1SJaegeuk Kim return freed; 797e05df3b1SJaegeuk Kim 798e05df3b1SJaegeuk Kim out_err: 799e05df3b1SJaegeuk Kim f2fs_put_page(page, 1); 80051dd6249SNamjae Jeon trace_f2fs_truncate_nodes_exit(dn->inode, ret); 801e05df3b1SJaegeuk Kim return ret; 802e05df3b1SJaegeuk Kim } 803e05df3b1SJaegeuk Kim 804e05df3b1SJaegeuk Kim static int truncate_partial_nodes(struct dnode_of_data *dn, 805e05df3b1SJaegeuk Kim struct f2fs_inode *ri, int *offset, int depth) 806e05df3b1SJaegeuk Kim { 807e05df3b1SJaegeuk Kim struct page *pages[2]; 808e05df3b1SJaegeuk Kim nid_t nid[3]; 809e05df3b1SJaegeuk Kim nid_t child_nid; 810e05df3b1SJaegeuk Kim int err = 0; 811e05df3b1SJaegeuk Kim int i; 812e05df3b1SJaegeuk Kim int idx = depth - 2; 813e05df3b1SJaegeuk Kim 814e05df3b1SJaegeuk Kim nid[0] = le32_to_cpu(ri->i_nid[offset[0] - NODE_DIR1_BLOCK]); 815e05df3b1SJaegeuk Kim if (!nid[0]) 816e05df3b1SJaegeuk Kim return 0; 817e05df3b1SJaegeuk Kim 818e05df3b1SJaegeuk Kim /* get indirect nodes in the path */ 819a225dca3Sshifei10.ge for (i = 0; i < idx + 1; i++) { 820e1c42045Sarter97 /* reference count'll be increased */ 8214081363fSJaegeuk Kim pages[i] = get_node_page(F2FS_I_SB(dn->inode), nid[i]); 822e05df3b1SJaegeuk Kim if (IS_ERR(pages[i])) { 823e05df3b1SJaegeuk Kim err = PTR_ERR(pages[i]); 824a225dca3Sshifei10.ge idx = i - 1; 825e05df3b1SJaegeuk Kim goto fail; 826e05df3b1SJaegeuk Kim } 827e05df3b1SJaegeuk Kim nid[i + 1] = get_nid(pages[i], offset[i + 1], false); 828e05df3b1SJaegeuk Kim } 829e05df3b1SJaegeuk Kim 83079344efbSJaegeuk Kim ra_node_pages(pages[idx], offset[idx + 1], NIDS_PER_BLOCK); 83179344efbSJaegeuk Kim 832e05df3b1SJaegeuk Kim /* free direct nodes linked to a partial indirect node */ 833a225dca3Sshifei10.ge for (i = offset[idx + 1]; i < NIDS_PER_BLOCK; i++) { 834e05df3b1SJaegeuk Kim child_nid = get_nid(pages[idx], i, false); 835e05df3b1SJaegeuk Kim if (!child_nid) 836e05df3b1SJaegeuk Kim continue; 837e05df3b1SJaegeuk Kim dn->nid = child_nid; 838e05df3b1SJaegeuk Kim err = truncate_dnode(dn); 839e05df3b1SJaegeuk Kim if (err < 0) 840e05df3b1SJaegeuk Kim goto fail; 84112719ae1SJaegeuk Kim if (set_nid(pages[idx], i, 0, false)) 84293bae099SJaegeuk Kim dn->node_changed = true; 843e05df3b1SJaegeuk Kim } 844e05df3b1SJaegeuk Kim 845a225dca3Sshifei10.ge if (offset[idx + 1] == 0) { 846e05df3b1SJaegeuk Kim dn->node_page = pages[idx]; 847e05df3b1SJaegeuk Kim dn->nid = nid[idx]; 848e05df3b1SJaegeuk Kim truncate_node(dn); 849e05df3b1SJaegeuk Kim } else { 850e05df3b1SJaegeuk Kim f2fs_put_page(pages[idx], 1); 851e05df3b1SJaegeuk Kim } 852e05df3b1SJaegeuk Kim offset[idx]++; 853a225dca3Sshifei10.ge offset[idx + 1] = 0; 854a225dca3Sshifei10.ge idx--; 855e05df3b1SJaegeuk Kim fail: 856a225dca3Sshifei10.ge for (i = idx; i >= 0; i--) 857e05df3b1SJaegeuk Kim f2fs_put_page(pages[i], 1); 85851dd6249SNamjae Jeon 85951dd6249SNamjae Jeon trace_f2fs_truncate_partial_nodes(dn->inode, nid, depth, err); 86051dd6249SNamjae Jeon 861e05df3b1SJaegeuk Kim return err; 862e05df3b1SJaegeuk Kim } 863e05df3b1SJaegeuk Kim 8640a8165d7SJaegeuk Kim /* 865e05df3b1SJaegeuk Kim * All the block addresses of data and nodes should be nullified. 866e05df3b1SJaegeuk Kim */ 867e05df3b1SJaegeuk Kim int truncate_inode_blocks(struct inode *inode, pgoff_t from) 868e05df3b1SJaegeuk Kim { 8694081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_I_SB(inode); 870e05df3b1SJaegeuk Kim int err = 0, cont = 1; 871e05df3b1SJaegeuk Kim int level, offset[4], noffset[4]; 8727dd690c8SJaegeuk Kim unsigned int nofs = 0; 87358bfaf44SJaegeuk Kim struct f2fs_inode *ri; 874e05df3b1SJaegeuk Kim struct dnode_of_data dn; 875e05df3b1SJaegeuk Kim struct page *page; 876e05df3b1SJaegeuk Kim 87751dd6249SNamjae Jeon trace_f2fs_truncate_inode_blocks_enter(inode, from); 87851dd6249SNamjae Jeon 87981ca7350SChao Yu level = get_node_path(inode, from, offset, noffset); 880ff373558SJaegeuk Kim 881e05df3b1SJaegeuk Kim page = get_node_page(sbi, inode->i_ino); 88251dd6249SNamjae Jeon if (IS_ERR(page)) { 88351dd6249SNamjae Jeon trace_f2fs_truncate_inode_blocks_exit(inode, PTR_ERR(page)); 884e05df3b1SJaegeuk Kim return PTR_ERR(page); 88551dd6249SNamjae Jeon } 886e05df3b1SJaegeuk Kim 887e05df3b1SJaegeuk Kim set_new_dnode(&dn, inode, page, NULL, 0); 888e05df3b1SJaegeuk Kim unlock_page(page); 889e05df3b1SJaegeuk Kim 89058bfaf44SJaegeuk Kim ri = F2FS_INODE(page); 891e05df3b1SJaegeuk Kim switch (level) { 892e05df3b1SJaegeuk Kim case 0: 893e05df3b1SJaegeuk Kim case 1: 894e05df3b1SJaegeuk Kim nofs = noffset[1]; 895e05df3b1SJaegeuk Kim break; 896e05df3b1SJaegeuk Kim case 2: 897e05df3b1SJaegeuk Kim nofs = noffset[1]; 898e05df3b1SJaegeuk Kim if (!offset[level - 1]) 899e05df3b1SJaegeuk Kim goto skip_partial; 90058bfaf44SJaegeuk Kim err = truncate_partial_nodes(&dn, ri, offset, level); 901e05df3b1SJaegeuk Kim if (err < 0 && err != -ENOENT) 902e05df3b1SJaegeuk Kim goto fail; 903e05df3b1SJaegeuk Kim nofs += 1 + NIDS_PER_BLOCK; 904e05df3b1SJaegeuk Kim break; 905e05df3b1SJaegeuk Kim case 3: 906e05df3b1SJaegeuk Kim nofs = 5 + 2 * NIDS_PER_BLOCK; 907e05df3b1SJaegeuk Kim if (!offset[level - 1]) 908e05df3b1SJaegeuk Kim goto skip_partial; 90958bfaf44SJaegeuk Kim err = truncate_partial_nodes(&dn, ri, offset, level); 910e05df3b1SJaegeuk Kim if (err < 0 && err != -ENOENT) 911e05df3b1SJaegeuk Kim goto fail; 912e05df3b1SJaegeuk Kim break; 913e05df3b1SJaegeuk Kim default: 914e05df3b1SJaegeuk Kim BUG(); 915e05df3b1SJaegeuk Kim } 916e05df3b1SJaegeuk Kim 917e05df3b1SJaegeuk Kim skip_partial: 918e05df3b1SJaegeuk Kim while (cont) { 91958bfaf44SJaegeuk Kim dn.nid = le32_to_cpu(ri->i_nid[offset[0] - NODE_DIR1_BLOCK]); 920e05df3b1SJaegeuk Kim switch (offset[0]) { 921e05df3b1SJaegeuk Kim case NODE_DIR1_BLOCK: 922e05df3b1SJaegeuk Kim case NODE_DIR2_BLOCK: 923e05df3b1SJaegeuk Kim err = truncate_dnode(&dn); 924e05df3b1SJaegeuk Kim break; 925e05df3b1SJaegeuk Kim 926e05df3b1SJaegeuk Kim case NODE_IND1_BLOCK: 927e05df3b1SJaegeuk Kim case NODE_IND2_BLOCK: 928e05df3b1SJaegeuk Kim err = truncate_nodes(&dn, nofs, offset[1], 2); 929e05df3b1SJaegeuk Kim break; 930e05df3b1SJaegeuk Kim 931e05df3b1SJaegeuk Kim case NODE_DIND_BLOCK: 932e05df3b1SJaegeuk Kim err = truncate_nodes(&dn, nofs, offset[1], 3); 933e05df3b1SJaegeuk Kim cont = 0; 934e05df3b1SJaegeuk Kim break; 935e05df3b1SJaegeuk Kim 936e05df3b1SJaegeuk Kim default: 937e05df3b1SJaegeuk Kim BUG(); 938e05df3b1SJaegeuk Kim } 939e05df3b1SJaegeuk Kim if (err < 0 && err != -ENOENT) 940e05df3b1SJaegeuk Kim goto fail; 941e05df3b1SJaegeuk Kim if (offset[1] == 0 && 94258bfaf44SJaegeuk Kim ri->i_nid[offset[0] - NODE_DIR1_BLOCK]) { 943e05df3b1SJaegeuk Kim lock_page(page); 944ff373558SJaegeuk Kim BUG_ON(page->mapping != NODE_MAPPING(sbi)); 945fec1d657SJaegeuk Kim f2fs_wait_on_page_writeback(page, NODE, true); 94658bfaf44SJaegeuk Kim ri->i_nid[offset[0] - NODE_DIR1_BLOCK] = 0; 947e05df3b1SJaegeuk Kim set_page_dirty(page); 948e05df3b1SJaegeuk Kim unlock_page(page); 949e05df3b1SJaegeuk Kim } 950e05df3b1SJaegeuk Kim offset[1] = 0; 951e05df3b1SJaegeuk Kim offset[0]++; 952e05df3b1SJaegeuk Kim nofs += err; 953e05df3b1SJaegeuk Kim } 954e05df3b1SJaegeuk Kim fail: 955e05df3b1SJaegeuk Kim f2fs_put_page(page, 0); 95651dd6249SNamjae Jeon trace_f2fs_truncate_inode_blocks_exit(inode, err); 957e05df3b1SJaegeuk Kim return err > 0 ? 0 : err; 958e05df3b1SJaegeuk Kim } 959e05df3b1SJaegeuk Kim 9604f16fb0fSJaegeuk Kim int truncate_xattr_node(struct inode *inode, struct page *page) 9614f16fb0fSJaegeuk Kim { 9624081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_I_SB(inode); 9634f16fb0fSJaegeuk Kim nid_t nid = F2FS_I(inode)->i_xattr_nid; 9644f16fb0fSJaegeuk Kim struct dnode_of_data dn; 9654f16fb0fSJaegeuk Kim struct page *npage; 9664f16fb0fSJaegeuk Kim 9674f16fb0fSJaegeuk Kim if (!nid) 9684f16fb0fSJaegeuk Kim return 0; 9694f16fb0fSJaegeuk Kim 9704f16fb0fSJaegeuk Kim npage = get_node_page(sbi, nid); 9714f16fb0fSJaegeuk Kim if (IS_ERR(npage)) 9724f16fb0fSJaegeuk Kim return PTR_ERR(npage); 9734f16fb0fSJaegeuk Kim 974205b9822SJaegeuk Kim f2fs_i_xnid_write(inode, 0); 97565985d93SJaegeuk Kim 9764f16fb0fSJaegeuk Kim set_new_dnode(&dn, inode, page, npage, nid); 9774f16fb0fSJaegeuk Kim 9784f16fb0fSJaegeuk Kim if (page) 97901d2d1aaSChao Yu dn.inode_page_locked = true; 9804f16fb0fSJaegeuk Kim truncate_node(&dn); 9814f16fb0fSJaegeuk Kim return 0; 9824f16fb0fSJaegeuk Kim } 9834f16fb0fSJaegeuk Kim 98439936837SJaegeuk Kim /* 9854f4124d0SChao Yu * Caller should grab and release a rwsem by calling f2fs_lock_op() and 9864f4124d0SChao Yu * f2fs_unlock_op(). 98739936837SJaegeuk Kim */ 98813ec7297SChao Yu int remove_inode_page(struct inode *inode) 989e05df3b1SJaegeuk Kim { 990e05df3b1SJaegeuk Kim struct dnode_of_data dn; 99113ec7297SChao Yu int err; 992e05df3b1SJaegeuk Kim 993c2e69583SJaegeuk Kim set_new_dnode(&dn, inode, NULL, NULL, inode->i_ino); 99413ec7297SChao Yu err = get_dnode_of_data(&dn, 0, LOOKUP_NODE); 99513ec7297SChao Yu if (err) 99613ec7297SChao Yu return err; 997e05df3b1SJaegeuk Kim 99813ec7297SChao Yu err = truncate_xattr_node(inode, dn.inode_page); 99913ec7297SChao Yu if (err) { 1000c2e69583SJaegeuk Kim f2fs_put_dnode(&dn); 100113ec7297SChao Yu return err; 1002e05df3b1SJaegeuk Kim } 1003c2e69583SJaegeuk Kim 1004c2e69583SJaegeuk Kim /* remove potential inline_data blocks */ 1005c2e69583SJaegeuk Kim if (S_ISREG(inode->i_mode) || S_ISDIR(inode->i_mode) || 1006c2e69583SJaegeuk Kim S_ISLNK(inode->i_mode)) 1007c2e69583SJaegeuk Kim truncate_data_blocks_range(&dn, 1); 1008c2e69583SJaegeuk Kim 1009e1c42045Sarter97 /* 0 is possible, after f2fs_new_inode() has failed */ 10109850cf4aSJaegeuk Kim f2fs_bug_on(F2FS_I_SB(inode), 10110eb0adadSChao Yu inode->i_blocks != 0 && inode->i_blocks != 8); 1012c2e69583SJaegeuk Kim 1013c2e69583SJaegeuk Kim /* will put inode & node pages */ 1014e05df3b1SJaegeuk Kim truncate_node(&dn); 101513ec7297SChao Yu return 0; 1016e05df3b1SJaegeuk Kim } 1017e05df3b1SJaegeuk Kim 1018a014e037SJaegeuk Kim struct page *new_inode_page(struct inode *inode) 1019e05df3b1SJaegeuk Kim { 1020e05df3b1SJaegeuk Kim struct dnode_of_data dn; 1021e05df3b1SJaegeuk Kim 1022e05df3b1SJaegeuk Kim /* allocate inode page for new inode */ 1023e05df3b1SJaegeuk Kim set_new_dnode(&dn, inode, NULL, NULL, inode->i_ino); 102444a83ff6SJaegeuk Kim 102544a83ff6SJaegeuk Kim /* caller should f2fs_put_page(page, 1); */ 10265f4ce6abSYunlei He return new_node_page(&dn, 0); 1027e05df3b1SJaegeuk Kim } 1028e05df3b1SJaegeuk Kim 10295f4ce6abSYunlei He struct page *new_node_page(struct dnode_of_data *dn, unsigned int ofs) 1030e05df3b1SJaegeuk Kim { 10314081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode); 103225cc5d3bSJaegeuk Kim struct node_info new_ni; 1033e05df3b1SJaegeuk Kim struct page *page; 1034e05df3b1SJaegeuk Kim int err; 1035e05df3b1SJaegeuk Kim 103691942321SJaegeuk Kim if (unlikely(is_inode_flag_set(dn->inode, FI_NO_ALLOC))) 1037e05df3b1SJaegeuk Kim return ERR_PTR(-EPERM); 1038e05df3b1SJaegeuk Kim 1039300e129cSJaegeuk Kim page = f2fs_grab_cache_page(NODE_MAPPING(sbi), dn->nid, false); 1040e05df3b1SJaegeuk Kim if (!page) 1041e05df3b1SJaegeuk Kim return ERR_PTR(-ENOMEM); 1042e05df3b1SJaegeuk Kim 10430abd675eSChao Yu if (unlikely((err = inc_valid_node_count(sbi, dn->inode, !ofs)))) 10449c02740cSJaegeuk Kim goto fail; 10450abd675eSChao Yu 104625cc5d3bSJaegeuk Kim #ifdef CONFIG_F2FS_CHECK_FS 104725cc5d3bSJaegeuk Kim get_node_info(sbi, dn->nid, &new_ni); 104825cc5d3bSJaegeuk Kim f2fs_bug_on(sbi, new_ni.blk_addr != NULL_ADDR); 104925cc5d3bSJaegeuk Kim #endif 105025cc5d3bSJaegeuk Kim new_ni.nid = dn->nid; 1051e05df3b1SJaegeuk Kim new_ni.ino = dn->inode->i_ino; 105225cc5d3bSJaegeuk Kim new_ni.blk_addr = NULL_ADDR; 105325cc5d3bSJaegeuk Kim new_ni.flag = 0; 105425cc5d3bSJaegeuk Kim new_ni.version = 0; 1055479f40c4SJaegeuk Kim set_node_addr(sbi, &new_ni, NEW_ADDR, false); 10569c02740cSJaegeuk Kim 1057fec1d657SJaegeuk Kim f2fs_wait_on_page_writeback(page, NODE, true); 10589c02740cSJaegeuk Kim fill_node_footer(page, dn->nid, dn->inode->i_ino, ofs, true); 1059398b1ac5SJaegeuk Kim set_cold_node(dn->inode, page); 1060237c0790SJaegeuk Kim if (!PageUptodate(page)) 10619c02740cSJaegeuk Kim SetPageUptodate(page); 106212719ae1SJaegeuk Kim if (set_page_dirty(page)) 106312719ae1SJaegeuk Kim dn->node_changed = true; 1064e05df3b1SJaegeuk Kim 10654bc8e9bcSChao Yu if (f2fs_has_xattr_block(ofs)) 1066205b9822SJaegeuk Kim f2fs_i_xnid_write(dn->inode, dn->nid); 1067479bd73aSJaegeuk Kim 1068e05df3b1SJaegeuk Kim if (ofs == 0) 1069e05df3b1SJaegeuk Kim inc_valid_inode_count(sbi); 1070e05df3b1SJaegeuk Kim return page; 1071e05df3b1SJaegeuk Kim 1072e05df3b1SJaegeuk Kim fail: 107371e9fec5SJaegeuk Kim clear_node_page_dirty(page); 1074e05df3b1SJaegeuk Kim f2fs_put_page(page, 1); 1075e05df3b1SJaegeuk Kim return ERR_PTR(err); 1076e05df3b1SJaegeuk Kim } 1077e05df3b1SJaegeuk Kim 107856ae674cSJaegeuk Kim /* 107956ae674cSJaegeuk Kim * Caller should do after getting the following values. 108056ae674cSJaegeuk Kim * 0: f2fs_put_page(page, 0) 108186531d6bSJaegeuk Kim * LOCKED_PAGE or error: f2fs_put_page(page, 1) 108256ae674cSJaegeuk Kim */ 108304d328deSMike Christie static int read_node_page(struct page *page, int op_flags) 1084e05df3b1SJaegeuk Kim { 10854081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_P_SB(page); 1086e05df3b1SJaegeuk Kim struct node_info ni; 1087cf04e8ebSJaegeuk Kim struct f2fs_io_info fio = { 108805ca3632SJaegeuk Kim .sbi = sbi, 1089cf04e8ebSJaegeuk Kim .type = NODE, 109004d328deSMike Christie .op = REQ_OP_READ, 109104d328deSMike Christie .op_flags = op_flags, 109205ca3632SJaegeuk Kim .page = page, 10934375a336SJaegeuk Kim .encrypted_page = NULL, 1094cf04e8ebSJaegeuk Kim }; 1095e05df3b1SJaegeuk Kim 10963bdad3c7SJaegeuk Kim if (PageUptodate(page)) 10973bdad3c7SJaegeuk Kim return LOCKED_PAGE; 10983bdad3c7SJaegeuk Kim 1099e05df3b1SJaegeuk Kim get_node_info(sbi, page->index, &ni); 1100e05df3b1SJaegeuk Kim 11016bacf52fSJaegeuk Kim if (unlikely(ni.blk_addr == NULL_ADDR)) { 11022bca1e23SJaegeuk Kim ClearPageUptodate(page); 1103e05df3b1SJaegeuk Kim return -ENOENT; 1104393ff91fSJaegeuk Kim } 1105393ff91fSJaegeuk Kim 11067a9d7548SChao Yu fio.new_blkaddr = fio.old_blkaddr = ni.blk_addr; 110705ca3632SJaegeuk Kim return f2fs_submit_page_bio(&fio); 1108e05df3b1SJaegeuk Kim } 1109e05df3b1SJaegeuk Kim 11100a8165d7SJaegeuk Kim /* 1111e05df3b1SJaegeuk Kim * Readahead a node page 1112e05df3b1SJaegeuk Kim */ 1113e05df3b1SJaegeuk Kim void ra_node_page(struct f2fs_sb_info *sbi, nid_t nid) 1114e05df3b1SJaegeuk Kim { 1115e05df3b1SJaegeuk Kim struct page *apage; 111656ae674cSJaegeuk Kim int err; 1117e05df3b1SJaegeuk Kim 1118e8458725SChao Yu if (!nid) 1119e8458725SChao Yu return; 1120e8458725SChao Yu f2fs_bug_on(sbi, check_nid_range(sbi, nid)); 1121e8458725SChao Yu 1122999270deSFan Li rcu_read_lock(); 1123999270deSFan Li apage = radix_tree_lookup(&NODE_MAPPING(sbi)->page_tree, nid); 1124999270deSFan Li rcu_read_unlock(); 1125999270deSFan Li if (apage) 1126393ff91fSJaegeuk Kim return; 1127e05df3b1SJaegeuk Kim 1128300e129cSJaegeuk Kim apage = f2fs_grab_cache_page(NODE_MAPPING(sbi), nid, false); 1129e05df3b1SJaegeuk Kim if (!apage) 1130e05df3b1SJaegeuk Kim return; 1131e05df3b1SJaegeuk Kim 113270246286SChristoph Hellwig err = read_node_page(apage, REQ_RAHEAD); 113386531d6bSJaegeuk Kim f2fs_put_page(apage, err ? 1 : 0); 1134e05df3b1SJaegeuk Kim } 1135e05df3b1SJaegeuk Kim 113617a0ee55SJaegeuk Kim static struct page *__get_node_page(struct f2fs_sb_info *sbi, pgoff_t nid, 11370e022ea8SChao Yu struct page *parent, int start) 1138e05df3b1SJaegeuk Kim { 113956ae674cSJaegeuk Kim struct page *page; 114056ae674cSJaegeuk Kim int err; 11414aa69d56SJaegeuk Kim 11424aa69d56SJaegeuk Kim if (!nid) 11434aa69d56SJaegeuk Kim return ERR_PTR(-ENOENT); 11444aa69d56SJaegeuk Kim f2fs_bug_on(sbi, check_nid_range(sbi, nid)); 1145afcb7ca0SJaegeuk Kim repeat: 1146300e129cSJaegeuk Kim page = f2fs_grab_cache_page(NODE_MAPPING(sbi), nid, false); 1147e05df3b1SJaegeuk Kim if (!page) 1148e05df3b1SJaegeuk Kim return ERR_PTR(-ENOMEM); 1149e05df3b1SJaegeuk Kim 115070fd7614SChristoph Hellwig err = read_node_page(page, 0); 115186531d6bSJaegeuk Kim if (err < 0) { 115286531d6bSJaegeuk Kim f2fs_put_page(page, 1); 1153e05df3b1SJaegeuk Kim return ERR_PTR(err); 1154e1c51b9fSChao Yu } else if (err == LOCKED_PAGE) { 11551f258ec1SChao Yu err = 0; 1156e1c51b9fSChao Yu goto page_hit; 115786531d6bSJaegeuk Kim } 1158aaf96075SJaegeuk Kim 11590e022ea8SChao Yu if (parent) 116079344efbSJaegeuk Kim ra_node_pages(parent, start + 1, MAX_RA_NODE); 11610e022ea8SChao Yu 1162e1c51b9fSChao Yu lock_page(page); 1163e1c51b9fSChao Yu 11644ef51a8fSJaegeuk Kim if (unlikely(page->mapping != NODE_MAPPING(sbi))) { 1165afcb7ca0SJaegeuk Kim f2fs_put_page(page, 1); 1166afcb7ca0SJaegeuk Kim goto repeat; 1167afcb7ca0SJaegeuk Kim } 11681563ac75SChao Yu 11691f258ec1SChao Yu if (unlikely(!PageUptodate(page))) { 11701f258ec1SChao Yu err = -EIO; 11711563ac75SChao Yu goto out_err; 11721f258ec1SChao Yu } 1173e1c51b9fSChao Yu page_hit: 11740c9df7fbSYunlong Song if(unlikely(nid != nid_of_node(page))) { 11751f258ec1SChao Yu f2fs_msg(sbi->sb, KERN_WARNING, "inconsistent node block, " 11761f258ec1SChao Yu "nid:%lu, node_footer[nid:%u,ino:%u,ofs:%u,cpver:%llu,blkaddr:%u]", 11771f258ec1SChao Yu nid, nid_of_node(page), ino_of_node(page), 11781f258ec1SChao Yu ofs_of_node(page), cpver_of_node(page), 11791f258ec1SChao Yu next_blkaddr_of_node(page)); 11800c9df7fbSYunlong Song ClearPageUptodate(page); 11811f258ec1SChao Yu err = -EINVAL; 11820c9df7fbSYunlong Song out_err: 11830c9df7fbSYunlong Song f2fs_put_page(page, 1); 11841f258ec1SChao Yu return ERR_PTR(err); 11850c9df7fbSYunlong Song } 1186e05df3b1SJaegeuk Kim return page; 1187e05df3b1SJaegeuk Kim } 1188e05df3b1SJaegeuk Kim 11890e022ea8SChao Yu struct page *get_node_page(struct f2fs_sb_info *sbi, pgoff_t nid) 11900e022ea8SChao Yu { 11910e022ea8SChao Yu return __get_node_page(sbi, nid, NULL, 0); 11920e022ea8SChao Yu } 11930e022ea8SChao Yu 1194e05df3b1SJaegeuk Kim struct page *get_node_page_ra(struct page *parent, int start) 1195e05df3b1SJaegeuk Kim { 11964081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_P_SB(parent); 11970e022ea8SChao Yu nid_t nid = get_nid(parent, start, false); 1198e05df3b1SJaegeuk Kim 11990e022ea8SChao Yu return __get_node_page(sbi, nid, parent, start); 1200e05df3b1SJaegeuk Kim } 1201e05df3b1SJaegeuk Kim 12022049d4fcSJaegeuk Kim static void flush_inline_data(struct f2fs_sb_info *sbi, nid_t ino) 12032049d4fcSJaegeuk Kim { 12042049d4fcSJaegeuk Kim struct inode *inode; 12052049d4fcSJaegeuk Kim struct page *page; 12060f3311a8SChao Yu int ret; 12072049d4fcSJaegeuk Kim 12082049d4fcSJaegeuk Kim /* should flush inline_data before evict_inode */ 12092049d4fcSJaegeuk Kim inode = ilookup(sbi->sb, ino); 12102049d4fcSJaegeuk Kim if (!inode) 12112049d4fcSJaegeuk Kim return; 12122049d4fcSJaegeuk Kim 12134a6de50dSJaegeuk Kim page = pagecache_get_page(inode->i_mapping, 0, FGP_LOCK|FGP_NOWAIT, 0); 12142049d4fcSJaegeuk Kim if (!page) 12152049d4fcSJaegeuk Kim goto iput_out; 12162049d4fcSJaegeuk Kim 12172049d4fcSJaegeuk Kim if (!PageUptodate(page)) 12182049d4fcSJaegeuk Kim goto page_out; 12192049d4fcSJaegeuk Kim 12202049d4fcSJaegeuk Kim if (!PageDirty(page)) 12212049d4fcSJaegeuk Kim goto page_out; 12222049d4fcSJaegeuk Kim 12232049d4fcSJaegeuk Kim if (!clear_page_dirty_for_io(page)) 12242049d4fcSJaegeuk Kim goto page_out; 12252049d4fcSJaegeuk Kim 12260f3311a8SChao Yu ret = f2fs_write_inline_data(inode, page); 12272049d4fcSJaegeuk Kim inode_dec_dirty_pages(inode); 1228933439c8SChao Yu remove_dirty_inode(inode); 12290f3311a8SChao Yu if (ret) 12302049d4fcSJaegeuk Kim set_page_dirty(page); 12312049d4fcSJaegeuk Kim page_out: 12324a6de50dSJaegeuk Kim f2fs_put_page(page, 1); 12332049d4fcSJaegeuk Kim iput_out: 12342049d4fcSJaegeuk Kim iput(inode); 12352049d4fcSJaegeuk Kim } 12362049d4fcSJaegeuk Kim 1237da011cc0SChao Yu void move_node_page(struct page *node_page, int gc_type) 1238da011cc0SChao Yu { 1239da011cc0SChao Yu if (gc_type == FG_GC) { 1240da011cc0SChao Yu struct f2fs_sb_info *sbi = F2FS_P_SB(node_page); 1241da011cc0SChao Yu struct writeback_control wbc = { 1242da011cc0SChao Yu .sync_mode = WB_SYNC_ALL, 1243da011cc0SChao Yu .nr_to_write = 1, 1244da011cc0SChao Yu .for_reclaim = 0, 1245da011cc0SChao Yu }; 1246da011cc0SChao Yu 1247da011cc0SChao Yu set_page_dirty(node_page); 1248da011cc0SChao Yu f2fs_wait_on_page_writeback(node_page, NODE, true); 1249da011cc0SChao Yu 1250da011cc0SChao Yu f2fs_bug_on(sbi, PageWriteback(node_page)); 1251da011cc0SChao Yu if (!clear_page_dirty_for_io(node_page)) 1252da011cc0SChao Yu goto out_page; 1253da011cc0SChao Yu 1254da011cc0SChao Yu if (NODE_MAPPING(sbi)->a_ops->writepage(node_page, &wbc)) 1255da011cc0SChao Yu unlock_page(node_page); 1256da011cc0SChao Yu goto release_page; 1257da011cc0SChao Yu } else { 1258da011cc0SChao Yu /* set page dirty and write it */ 1259da011cc0SChao Yu if (!PageWriteback(node_page)) 1260da011cc0SChao Yu set_page_dirty(node_page); 1261da011cc0SChao Yu } 1262da011cc0SChao Yu out_page: 1263da011cc0SChao Yu unlock_page(node_page); 1264da011cc0SChao Yu release_page: 1265da011cc0SChao Yu f2fs_put_page(node_page, 0); 1266da011cc0SChao Yu } 1267da011cc0SChao Yu 1268608514deSJaegeuk Kim static struct page *last_fsync_dnode(struct f2fs_sb_info *sbi, nid_t ino) 1269e05df3b1SJaegeuk Kim { 1270e05df3b1SJaegeuk Kim pgoff_t index, end; 1271e05df3b1SJaegeuk Kim struct pagevec pvec; 1272608514deSJaegeuk Kim struct page *last_page = NULL; 127352681375SJaegeuk Kim 127452681375SJaegeuk Kim pagevec_init(&pvec, 0); 127552681375SJaegeuk Kim index = 0; 127652681375SJaegeuk Kim end = ULONG_MAX; 127752681375SJaegeuk Kim 127852681375SJaegeuk Kim while (index <= end) { 127952681375SJaegeuk Kim int i, nr_pages; 128052681375SJaegeuk Kim nr_pages = pagevec_lookup_tag(&pvec, NODE_MAPPING(sbi), &index, 128152681375SJaegeuk Kim PAGECACHE_TAG_DIRTY, 128252681375SJaegeuk Kim min(end - index, (pgoff_t)PAGEVEC_SIZE-1) + 1); 128352681375SJaegeuk Kim if (nr_pages == 0) 128452681375SJaegeuk Kim break; 128552681375SJaegeuk Kim 128652681375SJaegeuk Kim for (i = 0; i < nr_pages; i++) { 128752681375SJaegeuk Kim struct page *page = pvec.pages[i]; 128852681375SJaegeuk Kim 128952681375SJaegeuk Kim if (unlikely(f2fs_cp_error(sbi))) { 1290608514deSJaegeuk Kim f2fs_put_page(last_page, 0); 129152681375SJaegeuk Kim pagevec_release(&pvec); 1292608514deSJaegeuk Kim return ERR_PTR(-EIO); 129352681375SJaegeuk Kim } 129452681375SJaegeuk Kim 129552681375SJaegeuk Kim if (!IS_DNODE(page) || !is_cold_node(page)) 129652681375SJaegeuk Kim continue; 129752681375SJaegeuk Kim if (ino_of_node(page) != ino) 129852681375SJaegeuk Kim continue; 129952681375SJaegeuk Kim 130052681375SJaegeuk Kim lock_page(page); 130152681375SJaegeuk Kim 130252681375SJaegeuk Kim if (unlikely(page->mapping != NODE_MAPPING(sbi))) { 130352681375SJaegeuk Kim continue_unlock: 130452681375SJaegeuk Kim unlock_page(page); 130552681375SJaegeuk Kim continue; 130652681375SJaegeuk Kim } 130752681375SJaegeuk Kim if (ino_of_node(page) != ino) 130852681375SJaegeuk Kim goto continue_unlock; 130952681375SJaegeuk Kim 131052681375SJaegeuk Kim if (!PageDirty(page)) { 131152681375SJaegeuk Kim /* someone wrote it for us */ 131252681375SJaegeuk Kim goto continue_unlock; 131352681375SJaegeuk Kim } 131452681375SJaegeuk Kim 1315608514deSJaegeuk Kim if (last_page) 1316608514deSJaegeuk Kim f2fs_put_page(last_page, 0); 1317608514deSJaegeuk Kim 1318608514deSJaegeuk Kim get_page(page); 1319608514deSJaegeuk Kim last_page = page; 1320608514deSJaegeuk Kim unlock_page(page); 1321608514deSJaegeuk Kim } 1322608514deSJaegeuk Kim pagevec_release(&pvec); 1323608514deSJaegeuk Kim cond_resched(); 1324608514deSJaegeuk Kim } 1325608514deSJaegeuk Kim return last_page; 1326608514deSJaegeuk Kim } 1327608514deSJaegeuk Kim 1328d68f735bSJaegeuk Kim static int __write_node_page(struct page *page, bool atomic, bool *submitted, 1329faa24895SJaegeuk Kim struct writeback_control *wbc) 1330faa24895SJaegeuk Kim { 1331faa24895SJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_P_SB(page); 1332faa24895SJaegeuk Kim nid_t nid; 1333faa24895SJaegeuk Kim struct node_info ni; 1334faa24895SJaegeuk Kim struct f2fs_io_info fio = { 1335faa24895SJaegeuk Kim .sbi = sbi, 1336faa24895SJaegeuk Kim .type = NODE, 1337faa24895SJaegeuk Kim .op = REQ_OP_WRITE, 1338faa24895SJaegeuk Kim .op_flags = wbc_to_write_flags(wbc), 1339faa24895SJaegeuk Kim .page = page, 1340faa24895SJaegeuk Kim .encrypted_page = NULL, 1341d68f735bSJaegeuk Kim .submitted = false, 1342faa24895SJaegeuk Kim }; 1343faa24895SJaegeuk Kim 1344faa24895SJaegeuk Kim trace_f2fs_writepage(page, NODE); 1345faa24895SJaegeuk Kim 1346faa24895SJaegeuk Kim if (unlikely(is_sbi_flag_set(sbi, SBI_POR_DOING))) 1347faa24895SJaegeuk Kim goto redirty_out; 1348faa24895SJaegeuk Kim if (unlikely(f2fs_cp_error(sbi))) 1349faa24895SJaegeuk Kim goto redirty_out; 1350faa24895SJaegeuk Kim 1351faa24895SJaegeuk Kim /* get old block addr of this node page */ 1352faa24895SJaegeuk Kim nid = nid_of_node(page); 1353faa24895SJaegeuk Kim f2fs_bug_on(sbi, page->index != nid); 1354faa24895SJaegeuk Kim 1355faa24895SJaegeuk Kim if (wbc->for_reclaim) { 1356faa24895SJaegeuk Kim if (!down_read_trylock(&sbi->node_write)) 1357faa24895SJaegeuk Kim goto redirty_out; 1358faa24895SJaegeuk Kim } else { 1359faa24895SJaegeuk Kim down_read(&sbi->node_write); 1360faa24895SJaegeuk Kim } 1361faa24895SJaegeuk Kim 1362faa24895SJaegeuk Kim get_node_info(sbi, nid, &ni); 1363faa24895SJaegeuk Kim 1364faa24895SJaegeuk Kim /* This page is already truncated */ 1365faa24895SJaegeuk Kim if (unlikely(ni.blk_addr == NULL_ADDR)) { 1366faa24895SJaegeuk Kim ClearPageUptodate(page); 1367faa24895SJaegeuk Kim dec_page_count(sbi, F2FS_DIRTY_NODES); 1368faa24895SJaegeuk Kim up_read(&sbi->node_write); 1369faa24895SJaegeuk Kim unlock_page(page); 1370faa24895SJaegeuk Kim return 0; 1371faa24895SJaegeuk Kim } 1372faa24895SJaegeuk Kim 1373e7c75ab0SJaegeuk Kim if (atomic && !test_opt(sbi, NOBARRIER)) 1374e7c75ab0SJaegeuk Kim fio.op_flags |= REQ_PREFLUSH | REQ_FUA; 1375e7c75ab0SJaegeuk Kim 1376faa24895SJaegeuk Kim set_page_writeback(page); 1377faa24895SJaegeuk Kim fio.old_blkaddr = ni.blk_addr; 1378faa24895SJaegeuk Kim write_node_page(nid, &fio); 1379faa24895SJaegeuk Kim set_node_addr(sbi, &ni, fio.new_blkaddr, is_fsync_dnode(page)); 1380faa24895SJaegeuk Kim dec_page_count(sbi, F2FS_DIRTY_NODES); 1381faa24895SJaegeuk Kim up_read(&sbi->node_write); 1382faa24895SJaegeuk Kim 1383d68f735bSJaegeuk Kim if (wbc->for_reclaim) { 1384b9109b0eSJaegeuk Kim f2fs_submit_merged_write_cond(sbi, page->mapping->host, 0, 1385b9109b0eSJaegeuk Kim page->index, NODE); 1386d68f735bSJaegeuk Kim submitted = NULL; 1387d68f735bSJaegeuk Kim } 1388faa24895SJaegeuk Kim 1389faa24895SJaegeuk Kim unlock_page(page); 1390faa24895SJaegeuk Kim 1391d68f735bSJaegeuk Kim if (unlikely(f2fs_cp_error(sbi))) { 1392b9109b0eSJaegeuk Kim f2fs_submit_merged_write(sbi, NODE); 1393d68f735bSJaegeuk Kim submitted = NULL; 1394d68f735bSJaegeuk Kim } 1395d68f735bSJaegeuk Kim if (submitted) 1396d68f735bSJaegeuk Kim *submitted = fio.submitted; 1397faa24895SJaegeuk Kim 1398faa24895SJaegeuk Kim return 0; 1399faa24895SJaegeuk Kim 1400faa24895SJaegeuk Kim redirty_out: 1401faa24895SJaegeuk Kim redirty_page_for_writepage(wbc, page); 1402faa24895SJaegeuk Kim return AOP_WRITEPAGE_ACTIVATE; 1403faa24895SJaegeuk Kim } 1404faa24895SJaegeuk Kim 1405faa24895SJaegeuk Kim static int f2fs_write_node_page(struct page *page, 1406faa24895SJaegeuk Kim struct writeback_control *wbc) 1407faa24895SJaegeuk Kim { 1408d68f735bSJaegeuk Kim return __write_node_page(page, false, NULL, wbc); 1409faa24895SJaegeuk Kim } 1410faa24895SJaegeuk Kim 141126de9b11SJaegeuk Kim int fsync_node_pages(struct f2fs_sb_info *sbi, struct inode *inode, 1412608514deSJaegeuk Kim struct writeback_control *wbc, bool atomic) 1413608514deSJaegeuk Kim { 1414608514deSJaegeuk Kim pgoff_t index, end; 1415942fd319SJaegeuk Kim pgoff_t last_idx = ULONG_MAX; 1416608514deSJaegeuk Kim struct pagevec pvec; 1417608514deSJaegeuk Kim int ret = 0; 1418608514deSJaegeuk Kim struct page *last_page = NULL; 1419608514deSJaegeuk Kim bool marked = false; 142026de9b11SJaegeuk Kim nid_t ino = inode->i_ino; 1421608514deSJaegeuk Kim 1422608514deSJaegeuk Kim if (atomic) { 1423608514deSJaegeuk Kim last_page = last_fsync_dnode(sbi, ino); 1424608514deSJaegeuk Kim if (IS_ERR_OR_NULL(last_page)) 1425608514deSJaegeuk Kim return PTR_ERR_OR_ZERO(last_page); 1426608514deSJaegeuk Kim } 1427608514deSJaegeuk Kim retry: 1428608514deSJaegeuk Kim pagevec_init(&pvec, 0); 1429608514deSJaegeuk Kim index = 0; 1430608514deSJaegeuk Kim end = ULONG_MAX; 1431608514deSJaegeuk Kim 1432608514deSJaegeuk Kim while (index <= end) { 1433608514deSJaegeuk Kim int i, nr_pages; 1434608514deSJaegeuk Kim nr_pages = pagevec_lookup_tag(&pvec, NODE_MAPPING(sbi), &index, 1435608514deSJaegeuk Kim PAGECACHE_TAG_DIRTY, 1436608514deSJaegeuk Kim min(end - index, (pgoff_t)PAGEVEC_SIZE-1) + 1); 1437608514deSJaegeuk Kim if (nr_pages == 0) 1438608514deSJaegeuk Kim break; 1439608514deSJaegeuk Kim 1440608514deSJaegeuk Kim for (i = 0; i < nr_pages; i++) { 1441608514deSJaegeuk Kim struct page *page = pvec.pages[i]; 1442d68f735bSJaegeuk Kim bool submitted = false; 1443608514deSJaegeuk Kim 1444608514deSJaegeuk Kim if (unlikely(f2fs_cp_error(sbi))) { 1445608514deSJaegeuk Kim f2fs_put_page(last_page, 0); 1446608514deSJaegeuk Kim pagevec_release(&pvec); 14479de69279SChao Yu ret = -EIO; 14489de69279SChao Yu goto out; 1449608514deSJaegeuk Kim } 1450608514deSJaegeuk Kim 1451608514deSJaegeuk Kim if (!IS_DNODE(page) || !is_cold_node(page)) 1452608514deSJaegeuk Kim continue; 1453608514deSJaegeuk Kim if (ino_of_node(page) != ino) 1454608514deSJaegeuk Kim continue; 1455608514deSJaegeuk Kim 1456608514deSJaegeuk Kim lock_page(page); 1457608514deSJaegeuk Kim 1458608514deSJaegeuk Kim if (unlikely(page->mapping != NODE_MAPPING(sbi))) { 1459608514deSJaegeuk Kim continue_unlock: 1460608514deSJaegeuk Kim unlock_page(page); 1461608514deSJaegeuk Kim continue; 1462608514deSJaegeuk Kim } 1463608514deSJaegeuk Kim if (ino_of_node(page) != ino) 146452681375SJaegeuk Kim goto continue_unlock; 146552681375SJaegeuk Kim 1466608514deSJaegeuk Kim if (!PageDirty(page) && page != last_page) { 1467608514deSJaegeuk Kim /* someone wrote it for us */ 1468608514deSJaegeuk Kim goto continue_unlock; 1469608514deSJaegeuk Kim } 1470608514deSJaegeuk Kim 1471608514deSJaegeuk Kim f2fs_wait_on_page_writeback(page, NODE, true); 1472608514deSJaegeuk Kim BUG_ON(PageWriteback(page)); 1473608514deSJaegeuk Kim 1474d29fd172SJaegeuk Kim set_fsync_mark(page, 0); 1475d29fd172SJaegeuk Kim set_dentry_mark(page, 0); 1476d29fd172SJaegeuk Kim 1477608514deSJaegeuk Kim if (!atomic || page == last_page) { 147852681375SJaegeuk Kim set_fsync_mark(page, 1); 147926de9b11SJaegeuk Kim if (IS_INODE(page)) { 148026de9b11SJaegeuk Kim if (is_inode_flag_set(inode, 148126de9b11SJaegeuk Kim FI_DIRTY_INODE)) 148226de9b11SJaegeuk Kim update_inode(inode, page); 148352681375SJaegeuk Kim set_dentry_mark(page, 148452681375SJaegeuk Kim need_dentry_mark(sbi, ino)); 148526de9b11SJaegeuk Kim } 1486608514deSJaegeuk Kim /* may be written by other thread */ 1487608514deSJaegeuk Kim if (!PageDirty(page)) 1488608514deSJaegeuk Kim set_page_dirty(page); 1489608514deSJaegeuk Kim } 1490608514deSJaegeuk Kim 1491608514deSJaegeuk Kim if (!clear_page_dirty_for_io(page)) 1492608514deSJaegeuk Kim goto continue_unlock; 149352681375SJaegeuk Kim 1494e7c75ab0SJaegeuk Kim ret = __write_node_page(page, atomic && 1495d68f735bSJaegeuk Kim page == last_page, 1496d68f735bSJaegeuk Kim &submitted, wbc); 1497c267ec15SJaegeuk Kim if (ret) { 149852681375SJaegeuk Kim unlock_page(page); 1499608514deSJaegeuk Kim f2fs_put_page(last_page, 0); 1500608514deSJaegeuk Kim break; 1501d68f735bSJaegeuk Kim } else if (submitted) { 1502942fd319SJaegeuk Kim last_idx = page->index; 1503608514deSJaegeuk Kim } 15043f5f4959SChao Yu 1505608514deSJaegeuk Kim if (page == last_page) { 1506608514deSJaegeuk Kim f2fs_put_page(page, 0); 1507608514deSJaegeuk Kim marked = true; 150852681375SJaegeuk Kim break; 150952681375SJaegeuk Kim } 1510c267ec15SJaegeuk Kim } 151152681375SJaegeuk Kim pagevec_release(&pvec); 151252681375SJaegeuk Kim cond_resched(); 151352681375SJaegeuk Kim 1514608514deSJaegeuk Kim if (ret || marked) 151552681375SJaegeuk Kim break; 151652681375SJaegeuk Kim } 1517608514deSJaegeuk Kim if (!ret && atomic && !marked) { 1518608514deSJaegeuk Kim f2fs_msg(sbi->sb, KERN_DEBUG, 1519608514deSJaegeuk Kim "Retry to write fsync mark: ino=%u, idx=%lx", 1520608514deSJaegeuk Kim ino, last_page->index); 1521608514deSJaegeuk Kim lock_page(last_page); 1522d40a43afSYunlei He f2fs_wait_on_page_writeback(last_page, NODE, true); 1523608514deSJaegeuk Kim set_page_dirty(last_page); 1524608514deSJaegeuk Kim unlock_page(last_page); 1525608514deSJaegeuk Kim goto retry; 1526608514deSJaegeuk Kim } 15279de69279SChao Yu out: 1528942fd319SJaegeuk Kim if (last_idx != ULONG_MAX) 1529b9109b0eSJaegeuk Kim f2fs_submit_merged_write_cond(sbi, NULL, ino, last_idx, NODE); 1530c267ec15SJaegeuk Kim return ret ? -EIO: 0; 153152681375SJaegeuk Kim } 153252681375SJaegeuk Kim 153352681375SJaegeuk Kim int sync_node_pages(struct f2fs_sb_info *sbi, struct writeback_control *wbc) 153452681375SJaegeuk Kim { 153552681375SJaegeuk Kim pgoff_t index, end; 153652681375SJaegeuk Kim struct pagevec pvec; 153752681375SJaegeuk Kim int step = 0; 153812bb0a8fSJaegeuk Kim int nwritten = 0; 15393f5f4959SChao Yu int ret = 0; 1540e05df3b1SJaegeuk Kim 1541e05df3b1SJaegeuk Kim pagevec_init(&pvec, 0); 1542e05df3b1SJaegeuk Kim 1543e05df3b1SJaegeuk Kim next_step: 1544e05df3b1SJaegeuk Kim index = 0; 154580dd9c0eSChao Yu end = ULONG_MAX; 1546e05df3b1SJaegeuk Kim 1547e05df3b1SJaegeuk Kim while (index <= end) { 1548e05df3b1SJaegeuk Kim int i, nr_pages; 15494ef51a8fSJaegeuk Kim nr_pages = pagevec_lookup_tag(&pvec, NODE_MAPPING(sbi), &index, 1550e05df3b1SJaegeuk Kim PAGECACHE_TAG_DIRTY, 1551e05df3b1SJaegeuk Kim min(end - index, (pgoff_t)PAGEVEC_SIZE-1) + 1); 1552e05df3b1SJaegeuk Kim if (nr_pages == 0) 1553e05df3b1SJaegeuk Kim break; 1554e05df3b1SJaegeuk Kim 1555e05df3b1SJaegeuk Kim for (i = 0; i < nr_pages; i++) { 1556e05df3b1SJaegeuk Kim struct page *page = pvec.pages[i]; 1557d68f735bSJaegeuk Kim bool submitted = false; 1558e05df3b1SJaegeuk Kim 15596d5a1495SChao Yu if (unlikely(f2fs_cp_error(sbi))) { 15606d5a1495SChao Yu pagevec_release(&pvec); 15613f5f4959SChao Yu ret = -EIO; 15623f5f4959SChao Yu goto out; 15636d5a1495SChao Yu } 15646d5a1495SChao Yu 1565e05df3b1SJaegeuk Kim /* 1566e05df3b1SJaegeuk Kim * flushing sequence with step: 1567e05df3b1SJaegeuk Kim * 0. indirect nodes 1568e05df3b1SJaegeuk Kim * 1. dentry dnodes 1569e05df3b1SJaegeuk Kim * 2. file dnodes 1570e05df3b1SJaegeuk Kim */ 1571e05df3b1SJaegeuk Kim if (step == 0 && IS_DNODE(page)) 1572e05df3b1SJaegeuk Kim continue; 1573e05df3b1SJaegeuk Kim if (step == 1 && (!IS_DNODE(page) || 1574e05df3b1SJaegeuk Kim is_cold_node(page))) 1575e05df3b1SJaegeuk Kim continue; 1576e05df3b1SJaegeuk Kim if (step == 2 && (!IS_DNODE(page) || 1577e05df3b1SJaegeuk Kim !is_cold_node(page))) 1578e05df3b1SJaegeuk Kim continue; 15799a4cbc9eSChao Yu lock_node: 158052681375SJaegeuk Kim if (!trylock_page(page)) 1581e05df3b1SJaegeuk Kim continue; 1582e05df3b1SJaegeuk Kim 15834ef51a8fSJaegeuk Kim if (unlikely(page->mapping != NODE_MAPPING(sbi))) { 1584e05df3b1SJaegeuk Kim continue_unlock: 1585e05df3b1SJaegeuk Kim unlock_page(page); 1586e05df3b1SJaegeuk Kim continue; 1587e05df3b1SJaegeuk Kim } 1588e05df3b1SJaegeuk Kim 1589e05df3b1SJaegeuk Kim if (!PageDirty(page)) { 1590e05df3b1SJaegeuk Kim /* someone wrote it for us */ 1591e05df3b1SJaegeuk Kim goto continue_unlock; 1592e05df3b1SJaegeuk Kim } 1593e05df3b1SJaegeuk Kim 15942049d4fcSJaegeuk Kim /* flush inline_data */ 159552681375SJaegeuk Kim if (is_inline_node(page)) { 15962049d4fcSJaegeuk Kim clear_inline_node(page); 15972049d4fcSJaegeuk Kim unlock_page(page); 15982049d4fcSJaegeuk Kim flush_inline_data(sbi, ino_of_node(page)); 15999a4cbc9eSChao Yu goto lock_node; 16002049d4fcSJaegeuk Kim } 16012049d4fcSJaegeuk Kim 1602fa3d2bdfSJaegeuk Kim f2fs_wait_on_page_writeback(page, NODE, true); 1603fa3d2bdfSJaegeuk Kim 1604fa3d2bdfSJaegeuk Kim BUG_ON(PageWriteback(page)); 1605e05df3b1SJaegeuk Kim if (!clear_page_dirty_for_io(page)) 1606e05df3b1SJaegeuk Kim goto continue_unlock; 1607e05df3b1SJaegeuk Kim 1608e05df3b1SJaegeuk Kim set_fsync_mark(page, 0); 1609e05df3b1SJaegeuk Kim set_dentry_mark(page, 0); 161052746519SJaegeuk Kim 1611d68f735bSJaegeuk Kim ret = __write_node_page(page, false, &submitted, wbc); 1612d68f735bSJaegeuk Kim if (ret) 161352746519SJaegeuk Kim unlock_page(page); 1614d68f735bSJaegeuk Kim else if (submitted) 16153f5f4959SChao Yu nwritten++; 1616e05df3b1SJaegeuk Kim 1617e05df3b1SJaegeuk Kim if (--wbc->nr_to_write == 0) 1618e05df3b1SJaegeuk Kim break; 1619e05df3b1SJaegeuk Kim } 1620e05df3b1SJaegeuk Kim pagevec_release(&pvec); 1621e05df3b1SJaegeuk Kim cond_resched(); 1622e05df3b1SJaegeuk Kim 1623e05df3b1SJaegeuk Kim if (wbc->nr_to_write == 0) { 1624e05df3b1SJaegeuk Kim step = 2; 1625e05df3b1SJaegeuk Kim break; 1626e05df3b1SJaegeuk Kim } 1627e05df3b1SJaegeuk Kim } 1628e05df3b1SJaegeuk Kim 1629e05df3b1SJaegeuk Kim if (step < 2) { 1630e05df3b1SJaegeuk Kim step++; 1631e05df3b1SJaegeuk Kim goto next_step; 1632e05df3b1SJaegeuk Kim } 16333f5f4959SChao Yu out: 16343f5f4959SChao Yu if (nwritten) 1635b9109b0eSJaegeuk Kim f2fs_submit_merged_write(sbi, NODE); 16363f5f4959SChao Yu return ret; 1637e05df3b1SJaegeuk Kim } 1638e05df3b1SJaegeuk Kim 1639cfe58f9dSJaegeuk Kim int wait_on_node_pages_writeback(struct f2fs_sb_info *sbi, nid_t ino) 1640cfe58f9dSJaegeuk Kim { 164180dd9c0eSChao Yu pgoff_t index = 0, end = ULONG_MAX; 1642cfe58f9dSJaegeuk Kim struct pagevec pvec; 1643280db3c8SMiklos Szeredi int ret2, ret = 0; 1644cfe58f9dSJaegeuk Kim 1645cfe58f9dSJaegeuk Kim pagevec_init(&pvec, 0); 16464ef51a8fSJaegeuk Kim 16474ef51a8fSJaegeuk Kim while (index <= end) { 16484ef51a8fSJaegeuk Kim int i, nr_pages; 16494ef51a8fSJaegeuk Kim nr_pages = pagevec_lookup_tag(&pvec, NODE_MAPPING(sbi), &index, 1650cfe58f9dSJaegeuk Kim PAGECACHE_TAG_WRITEBACK, 16514ef51a8fSJaegeuk Kim min(end - index, (pgoff_t)PAGEVEC_SIZE-1) + 1); 16524ef51a8fSJaegeuk Kim if (nr_pages == 0) 16534ef51a8fSJaegeuk Kim break; 1654cfe58f9dSJaegeuk Kim 1655cfe58f9dSJaegeuk Kim for (i = 0; i < nr_pages; i++) { 1656cfe58f9dSJaegeuk Kim struct page *page = pvec.pages[i]; 1657cfe58f9dSJaegeuk Kim 1658cfe58f9dSJaegeuk Kim /* until radix tree lookup accepts end_index */ 1659cfb271d4SChao Yu if (unlikely(page->index > end)) 1660cfe58f9dSJaegeuk Kim continue; 1661cfe58f9dSJaegeuk Kim 16624bf08ff6SChao Yu if (ino && ino_of_node(page) == ino) { 1663fec1d657SJaegeuk Kim f2fs_wait_on_page_writeback(page, NODE, true); 1664cfe58f9dSJaegeuk Kim if (TestClearPageError(page)) 1665cfe58f9dSJaegeuk Kim ret = -EIO; 1666cfe58f9dSJaegeuk Kim } 16674bf08ff6SChao Yu } 1668cfe58f9dSJaegeuk Kim pagevec_release(&pvec); 1669cfe58f9dSJaegeuk Kim cond_resched(); 1670cfe58f9dSJaegeuk Kim } 1671cfe58f9dSJaegeuk Kim 1672280db3c8SMiklos Szeredi ret2 = filemap_check_errors(NODE_MAPPING(sbi)); 1673cfe58f9dSJaegeuk Kim if (!ret) 1674cfe58f9dSJaegeuk Kim ret = ret2; 1675cfe58f9dSJaegeuk Kim return ret; 1676cfe58f9dSJaegeuk Kim } 1677cfe58f9dSJaegeuk Kim 1678e05df3b1SJaegeuk Kim static int f2fs_write_node_pages(struct address_space *mapping, 1679e05df3b1SJaegeuk Kim struct writeback_control *wbc) 1680e05df3b1SJaegeuk Kim { 16814081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_M_SB(mapping); 16829dfa1bafSJaegeuk Kim struct blk_plug plug; 168350c8cdb3SJaegeuk Kim long diff; 1684e05df3b1SJaegeuk Kim 16850771fcc7SChao Yu if (unlikely(is_sbi_flag_set(sbi, SBI_POR_DOING))) 16860771fcc7SChao Yu goto skip_write; 16870771fcc7SChao Yu 16884660f9c0SJaegeuk Kim /* balancing f2fs's metadata in background */ 16894660f9c0SJaegeuk Kim f2fs_balance_fs_bg(sbi); 1690e05df3b1SJaegeuk Kim 1691a7fdffbdSJaegeuk Kim /* collect a number of dirty node pages and write together */ 169287d6f890SJaegeuk Kim if (get_pages(sbi, F2FS_DIRTY_NODES) < nr_pages_to_skip(sbi, NODE)) 1693d3baf95dSJaegeuk Kim goto skip_write; 1694a7fdffbdSJaegeuk Kim 1695d31c7c3fSYunlei He trace_f2fs_writepages(mapping->host, wbc, NODE); 1696d31c7c3fSYunlei He 169750c8cdb3SJaegeuk Kim diff = nr_pages_to_write(sbi, NODE, wbc); 1698fb5566daSJaegeuk Kim wbc->sync_mode = WB_SYNC_NONE; 16999dfa1bafSJaegeuk Kim blk_start_plug(&plug); 170052681375SJaegeuk Kim sync_node_pages(sbi, wbc); 17019dfa1bafSJaegeuk Kim blk_finish_plug(&plug); 170250c8cdb3SJaegeuk Kim wbc->nr_to_write = max((long)0, wbc->nr_to_write - diff); 1703e05df3b1SJaegeuk Kim return 0; 1704d3baf95dSJaegeuk Kim 1705d3baf95dSJaegeuk Kim skip_write: 1706d3baf95dSJaegeuk Kim wbc->pages_skipped += get_pages(sbi, F2FS_DIRTY_NODES); 1707d31c7c3fSYunlei He trace_f2fs_writepages(mapping->host, wbc, NODE); 1708d3baf95dSJaegeuk Kim return 0; 1709e05df3b1SJaegeuk Kim } 1710e05df3b1SJaegeuk Kim 1711e05df3b1SJaegeuk Kim static int f2fs_set_node_page_dirty(struct page *page) 1712e05df3b1SJaegeuk Kim { 171326c6b887SJaegeuk Kim trace_f2fs_set_page_dirty(page, NODE); 171426c6b887SJaegeuk Kim 1715237c0790SJaegeuk Kim if (!PageUptodate(page)) 1716e05df3b1SJaegeuk Kim SetPageUptodate(page); 1717e05df3b1SJaegeuk Kim if (!PageDirty(page)) { 1718fe76b796SJaegeuk Kim f2fs_set_page_dirty_nobuffers(page); 17194081363fSJaegeuk Kim inc_page_count(F2FS_P_SB(page), F2FS_DIRTY_NODES); 1720e05df3b1SJaegeuk Kim SetPagePrivate(page); 17219e4ded3fSJaegeuk Kim f2fs_trace_pid(page); 1722e05df3b1SJaegeuk Kim return 1; 1723e05df3b1SJaegeuk Kim } 1724e05df3b1SJaegeuk Kim return 0; 1725e05df3b1SJaegeuk Kim } 1726e05df3b1SJaegeuk Kim 17270a8165d7SJaegeuk Kim /* 1728e05df3b1SJaegeuk Kim * Structure of the f2fs node operations 1729e05df3b1SJaegeuk Kim */ 1730e05df3b1SJaegeuk Kim const struct address_space_operations f2fs_node_aops = { 1731e05df3b1SJaegeuk Kim .writepage = f2fs_write_node_page, 1732e05df3b1SJaegeuk Kim .writepages = f2fs_write_node_pages, 1733e05df3b1SJaegeuk Kim .set_page_dirty = f2fs_set_node_page_dirty, 1734487261f3SChao Yu .invalidatepage = f2fs_invalidate_page, 1735487261f3SChao Yu .releasepage = f2fs_release_page, 17365b7a487cSWeichao Guo #ifdef CONFIG_MIGRATION 17375b7a487cSWeichao Guo .migratepage = f2fs_migrate_page, 17385b7a487cSWeichao Guo #endif 1739e05df3b1SJaegeuk Kim }; 1740e05df3b1SJaegeuk Kim 17418a7ed66aSJaegeuk Kim static struct free_nid *__lookup_free_nid_list(struct f2fs_nm_info *nm_i, 17428a7ed66aSJaegeuk Kim nid_t n) 1743e05df3b1SJaegeuk Kim { 17448a7ed66aSJaegeuk Kim return radix_tree_lookup(&nm_i->free_nid_root, n); 17453aa770a9SNamjae Jeon } 1746e05df3b1SJaegeuk Kim 1747eb0aa4b8SJaegeuk Kim static int __insert_nid_to_list(struct f2fs_sb_info *sbi, 1748eb0aa4b8SJaegeuk Kim struct free_nid *i, enum nid_list list, bool new) 1749e05df3b1SJaegeuk Kim { 1750b8559dc2SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 1751b8559dc2SChao Yu 1752eb0aa4b8SJaegeuk Kim if (new) { 1753eb0aa4b8SJaegeuk Kim int err = radix_tree_insert(&nm_i->free_nid_root, i->nid, i); 1754eb0aa4b8SJaegeuk Kim if (err) 1755eb0aa4b8SJaegeuk Kim return err; 1756eb0aa4b8SJaegeuk Kim } 1757eb0aa4b8SJaegeuk Kim 1758b8559dc2SChao Yu f2fs_bug_on(sbi, list == FREE_NID_LIST ? i->state != NID_NEW : 1759b8559dc2SChao Yu i->state != NID_ALLOC); 1760b8559dc2SChao Yu nm_i->nid_cnt[list]++; 1761b8559dc2SChao Yu list_add_tail(&i->list, &nm_i->nid_list[list]); 1762eb0aa4b8SJaegeuk Kim return 0; 1763b8559dc2SChao Yu } 1764b8559dc2SChao Yu 1765b8559dc2SChao Yu static void __remove_nid_from_list(struct f2fs_sb_info *sbi, 1766eb0aa4b8SJaegeuk Kim struct free_nid *i, enum nid_list list, bool reuse) 1767b8559dc2SChao Yu { 1768b8559dc2SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 1769b8559dc2SChao Yu 1770b8559dc2SChao Yu f2fs_bug_on(sbi, list == FREE_NID_LIST ? i->state != NID_NEW : 1771b8559dc2SChao Yu i->state != NID_ALLOC); 1772b8559dc2SChao Yu nm_i->nid_cnt[list]--; 1773e05df3b1SJaegeuk Kim list_del(&i->list); 1774eb0aa4b8SJaegeuk Kim if (!reuse) 17758a7ed66aSJaegeuk Kim radix_tree_delete(&nm_i->free_nid_root, i->nid); 1776e05df3b1SJaegeuk Kim } 1777e05df3b1SJaegeuk Kim 17784ac91242SChao Yu /* return if the nid is recognized as free */ 17794ac91242SChao Yu static bool add_free_nid(struct f2fs_sb_info *sbi, nid_t nid, bool build) 1780e05df3b1SJaegeuk Kim { 17816fb03f3aSJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 178230a61ddfSChao Yu struct free_nid *i, *e; 178359bbd474SJaegeuk Kim struct nat_entry *ne; 178430a61ddfSChao Yu int err = -EINVAL; 178530a61ddfSChao Yu bool ret = false; 17869198acebSJaegeuk Kim 17879198acebSJaegeuk Kim /* 0 nid should not be used */ 1788cfb271d4SChao Yu if (unlikely(nid == 0)) 17894ac91242SChao Yu return false; 179059bbd474SJaegeuk Kim 17917bd59381SGu Zheng i = f2fs_kmem_cache_alloc(free_nid_slab, GFP_NOFS); 1792e05df3b1SJaegeuk Kim i->nid = nid; 1793e05df3b1SJaegeuk Kim i->state = NID_NEW; 1794e05df3b1SJaegeuk Kim 179530a61ddfSChao Yu if (radix_tree_preload(GFP_NOFS)) 179630a61ddfSChao Yu goto err; 1797769ec6e5SJaegeuk Kim 1798b8559dc2SChao Yu spin_lock(&nm_i->nid_list_lock); 179930a61ddfSChao Yu 180030a61ddfSChao Yu if (build) { 180130a61ddfSChao Yu /* 180230a61ddfSChao Yu * Thread A Thread B 180330a61ddfSChao Yu * - f2fs_create 180430a61ddfSChao Yu * - f2fs_new_inode 180530a61ddfSChao Yu * - alloc_nid 180630a61ddfSChao Yu * - __insert_nid_to_list(ALLOC_NID_LIST) 180730a61ddfSChao Yu * - f2fs_balance_fs_bg 180830a61ddfSChao Yu * - build_free_nids 180930a61ddfSChao Yu * - __build_free_nids 181030a61ddfSChao Yu * - scan_nat_page 181130a61ddfSChao Yu * - add_free_nid 181230a61ddfSChao Yu * - __lookup_nat_cache 181330a61ddfSChao Yu * - f2fs_add_link 181430a61ddfSChao Yu * - init_inode_metadata 181530a61ddfSChao Yu * - new_inode_page 181630a61ddfSChao Yu * - new_node_page 181730a61ddfSChao Yu * - set_node_addr 181830a61ddfSChao Yu * - alloc_nid_done 181930a61ddfSChao Yu * - __remove_nid_from_list(ALLOC_NID_LIST) 182030a61ddfSChao Yu * - __insert_nid_to_list(FREE_NID_LIST) 182130a61ddfSChao Yu */ 182230a61ddfSChao Yu ne = __lookup_nat_cache(nm_i, nid); 182330a61ddfSChao Yu if (ne && (!get_nat_flag(ne, IS_CHECKPOINTED) || 182430a61ddfSChao Yu nat_get_blkaddr(ne) != NULL_ADDR)) 182530a61ddfSChao Yu goto err_out; 182630a61ddfSChao Yu 182730a61ddfSChao Yu e = __lookup_free_nid_list(nm_i, nid); 182830a61ddfSChao Yu if (e) { 182930a61ddfSChao Yu if (e->state == NID_NEW) 183030a61ddfSChao Yu ret = true; 183130a61ddfSChao Yu goto err_out; 183230a61ddfSChao Yu } 183330a61ddfSChao Yu } 183430a61ddfSChao Yu ret = true; 1835eb0aa4b8SJaegeuk Kim err = __insert_nid_to_list(sbi, i, FREE_NID_LIST, true); 183630a61ddfSChao Yu err_out: 1837b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 1838769ec6e5SJaegeuk Kim radix_tree_preload_end(); 183930a61ddfSChao Yu err: 184030a61ddfSChao Yu if (err) 1841e05df3b1SJaegeuk Kim kmem_cache_free(free_nid_slab, i); 184230a61ddfSChao Yu return ret; 1843e05df3b1SJaegeuk Kim } 1844e05df3b1SJaegeuk Kim 1845b8559dc2SChao Yu static void remove_free_nid(struct f2fs_sb_info *sbi, nid_t nid) 1846e05df3b1SJaegeuk Kim { 1847b8559dc2SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 1848e05df3b1SJaegeuk Kim struct free_nid *i; 1849cf0ee0f0SChao Yu bool need_free = false; 1850cf0ee0f0SChao Yu 1851b8559dc2SChao Yu spin_lock(&nm_i->nid_list_lock); 18528a7ed66aSJaegeuk Kim i = __lookup_free_nid_list(nm_i, nid); 1853e05df3b1SJaegeuk Kim if (i && i->state == NID_NEW) { 1854eb0aa4b8SJaegeuk Kim __remove_nid_from_list(sbi, i, FREE_NID_LIST, false); 1855cf0ee0f0SChao Yu need_free = true; 1856e05df3b1SJaegeuk Kim } 1857b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 1858cf0ee0f0SChao Yu 1859cf0ee0f0SChao Yu if (need_free) 1860cf0ee0f0SChao Yu kmem_cache_free(free_nid_slab, i); 1861e05df3b1SJaegeuk Kim } 1862e05df3b1SJaegeuk Kim 18639f7e4a2cSJaegeuk Kim static void update_free_nid_bitmap(struct f2fs_sb_info *sbi, nid_t nid, 1864346fe752SChao Yu bool set, bool build) 18654ac91242SChao Yu { 18664ac91242SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 18674ac91242SChao Yu unsigned int nat_ofs = NAT_BLOCK_OFFSET(nid); 18684ac91242SChao Yu unsigned int nid_ofs = nid - START_NID(nid); 18694ac91242SChao Yu 18704ac91242SChao Yu if (!test_bit_le(nat_ofs, nm_i->nat_block_bitmap)) 18714ac91242SChao Yu return; 18724ac91242SChao Yu 18734ac91242SChao Yu if (set) 187423380b85SJaegeuk Kim __set_bit_le(nid_ofs, nm_i->free_nid_bitmap[nat_ofs]); 18754ac91242SChao Yu else 187623380b85SJaegeuk Kim __clear_bit_le(nid_ofs, nm_i->free_nid_bitmap[nat_ofs]); 1877586d1492SChao Yu 1878586d1492SChao Yu if (set) 1879586d1492SChao Yu nm_i->free_nid_count[nat_ofs]++; 1880586d1492SChao Yu else if (!build) 1881586d1492SChao Yu nm_i->free_nid_count[nat_ofs]--; 18824ac91242SChao Yu } 18834ac91242SChao Yu 18846fb03f3aSJaegeuk Kim static void scan_nat_page(struct f2fs_sb_info *sbi, 1885e05df3b1SJaegeuk Kim struct page *nat_page, nid_t start_nid) 1886e05df3b1SJaegeuk Kim { 18876fb03f3aSJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 1888e05df3b1SJaegeuk Kim struct f2fs_nat_block *nat_blk = page_address(nat_page); 1889e05df3b1SJaegeuk Kim block_t blk_addr; 18904ac91242SChao Yu unsigned int nat_ofs = NAT_BLOCK_OFFSET(start_nid); 1891e05df3b1SJaegeuk Kim int i; 1892e05df3b1SJaegeuk Kim 1893586d1492SChao Yu if (test_bit_le(nat_ofs, nm_i->nat_block_bitmap)) 1894586d1492SChao Yu return; 1895586d1492SChao Yu 189623380b85SJaegeuk Kim __set_bit_le(nat_ofs, nm_i->nat_block_bitmap); 18974ac91242SChao Yu 1898e05df3b1SJaegeuk Kim i = start_nid % NAT_ENTRY_PER_BLOCK; 1899e05df3b1SJaegeuk Kim 1900e05df3b1SJaegeuk Kim for (; i < NAT_ENTRY_PER_BLOCK; i++, start_nid++) { 19014ac91242SChao Yu bool freed = false; 190223d38844SHaicheng Li 1903cfb271d4SChao Yu if (unlikely(start_nid >= nm_i->max_nid)) 190404431c44SJaegeuk Kim break; 190523d38844SHaicheng Li 1906e05df3b1SJaegeuk Kim blk_addr = le32_to_cpu(nat_blk->entries[i].block_addr); 19079850cf4aSJaegeuk Kim f2fs_bug_on(sbi, blk_addr == NEW_ADDR); 19083a2ad567SChao Yu if (blk_addr == NULL_ADDR) 19094ac91242SChao Yu freed = add_free_nid(sbi, start_nid, true); 1910346fe752SChao Yu spin_lock(&NM_I(sbi)->nid_list_lock); 1911346fe752SChao Yu update_free_nid_bitmap(sbi, start_nid, freed, true); 1912346fe752SChao Yu spin_unlock(&NM_I(sbi)->nid_list_lock); 1913e05df3b1SJaegeuk Kim } 1914e05df3b1SJaegeuk Kim } 1915e05df3b1SJaegeuk Kim 19164ac91242SChao Yu static void scan_free_nid_bits(struct f2fs_sb_info *sbi) 19174ac91242SChao Yu { 19184ac91242SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 19194ac91242SChao Yu struct curseg_info *curseg = CURSEG_I(sbi, CURSEG_HOT_DATA); 19204ac91242SChao Yu struct f2fs_journal *journal = curseg->journal; 19214ac91242SChao Yu unsigned int i, idx; 19224ac91242SChao Yu 19234ac91242SChao Yu down_read(&nm_i->nat_tree_lock); 19244ac91242SChao Yu 19254ac91242SChao Yu for (i = 0; i < nm_i->nat_blocks; i++) { 19264ac91242SChao Yu if (!test_bit_le(i, nm_i->nat_block_bitmap)) 19274ac91242SChao Yu continue; 1928586d1492SChao Yu if (!nm_i->free_nid_count[i]) 1929586d1492SChao Yu continue; 19304ac91242SChao Yu for (idx = 0; idx < NAT_ENTRY_PER_BLOCK; idx++) { 19314ac91242SChao Yu nid_t nid; 19324ac91242SChao Yu 19334ac91242SChao Yu if (!test_bit_le(idx, nm_i->free_nid_bitmap[i])) 19344ac91242SChao Yu continue; 19354ac91242SChao Yu 19364ac91242SChao Yu nid = i * NAT_ENTRY_PER_BLOCK + idx; 19374ac91242SChao Yu add_free_nid(sbi, nid, true); 19384ac91242SChao Yu 1939f0cdbfe6SKinglong Mee if (nm_i->nid_cnt[FREE_NID_LIST] >= MAX_FREE_NIDS) 19404ac91242SChao Yu goto out; 19414ac91242SChao Yu } 19424ac91242SChao Yu } 19434ac91242SChao Yu out: 19444ac91242SChao Yu down_read(&curseg->journal_rwsem); 19454ac91242SChao Yu for (i = 0; i < nats_in_cursum(journal); i++) { 19464ac91242SChao Yu block_t addr; 19474ac91242SChao Yu nid_t nid; 19484ac91242SChao Yu 19494ac91242SChao Yu addr = le32_to_cpu(nat_in_journal(journal, i).block_addr); 19504ac91242SChao Yu nid = le32_to_cpu(nid_in_journal(journal, i)); 19514ac91242SChao Yu if (addr == NULL_ADDR) 19524ac91242SChao Yu add_free_nid(sbi, nid, true); 19534ac91242SChao Yu else 19544ac91242SChao Yu remove_free_nid(sbi, nid); 19554ac91242SChao Yu } 19564ac91242SChao Yu up_read(&curseg->journal_rwsem); 19574ac91242SChao Yu up_read(&nm_i->nat_tree_lock); 19584ac91242SChao Yu } 19594ac91242SChao Yu 196022ad0b6aSJaegeuk Kim static void __build_free_nids(struct f2fs_sb_info *sbi, bool sync, bool mount) 1961e05df3b1SJaegeuk Kim { 1962e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 1963e05df3b1SJaegeuk Kim struct curseg_info *curseg = CURSEG_I(sbi, CURSEG_HOT_DATA); 1964b7ad7512SChao Yu struct f2fs_journal *journal = curseg->journal; 19658760952dSHaicheng Li int i = 0; 196655008d84SJaegeuk Kim nid_t nid = nm_i->next_scan_nid; 1967e05df3b1SJaegeuk Kim 1968e9cdd307SYunlei He if (unlikely(nid >= nm_i->max_nid)) 1969e9cdd307SYunlei He nid = 0; 1970e9cdd307SYunlei He 197155008d84SJaegeuk Kim /* Enough entries */ 1972b8559dc2SChao Yu if (nm_i->nid_cnt[FREE_NID_LIST] >= NAT_ENTRY_PER_BLOCK) 197355008d84SJaegeuk Kim return; 1974e05df3b1SJaegeuk Kim 19753a2ad567SChao Yu if (!sync && !available_free_memory(sbi, FREE_NIDS)) 1976e05df3b1SJaegeuk Kim return; 1977e05df3b1SJaegeuk Kim 19784ac91242SChao Yu if (!mount) { 19794ac91242SChao Yu /* try to find free nids in free_nid_bitmap */ 19804ac91242SChao Yu scan_free_nid_bits(sbi); 19814ac91242SChao Yu 19824ac91242SChao Yu if (nm_i->nid_cnt[FREE_NID_LIST]) 198322ad0b6aSJaegeuk Kim return; 198422ad0b6aSJaegeuk Kim } 198522ad0b6aSJaegeuk Kim 198655008d84SJaegeuk Kim /* readahead nat pages to be scanned */ 198726879fb1SChao Yu ra_meta_pages(sbi, NAT_BLOCK_OFFSET(nid), FREE_NID_PAGES, 198826879fb1SChao Yu META_NAT, true); 1989e05df3b1SJaegeuk Kim 1990b873b798SJaegeuk Kim down_read(&nm_i->nat_tree_lock); 1991a5131193SJaegeuk Kim 1992e05df3b1SJaegeuk Kim while (1) { 1993e05df3b1SJaegeuk Kim struct page *page = get_current_nat_page(sbi, nid); 1994e05df3b1SJaegeuk Kim 19956fb03f3aSJaegeuk Kim scan_nat_page(sbi, page, nid); 1996e05df3b1SJaegeuk Kim f2fs_put_page(page, 1); 1997e05df3b1SJaegeuk Kim 1998e05df3b1SJaegeuk Kim nid += (NAT_ENTRY_PER_BLOCK - (nid % NAT_ENTRY_PER_BLOCK)); 1999cfb271d4SChao Yu if (unlikely(nid >= nm_i->max_nid)) 2000e05df3b1SJaegeuk Kim nid = 0; 200155008d84SJaegeuk Kim 2002a6d494b6SChao Yu if (++i >= FREE_NID_PAGES) 2003e05df3b1SJaegeuk Kim break; 2004e05df3b1SJaegeuk Kim } 2005e05df3b1SJaegeuk Kim 200655008d84SJaegeuk Kim /* go to the next free nat pages to find free nids abundantly */ 200755008d84SJaegeuk Kim nm_i->next_scan_nid = nid; 2008e05df3b1SJaegeuk Kim 2009e05df3b1SJaegeuk Kim /* find free nids from current sum_pages */ 2010b7ad7512SChao Yu down_read(&curseg->journal_rwsem); 2011dfc08a12SChao Yu for (i = 0; i < nats_in_cursum(journal); i++) { 2012dfc08a12SChao Yu block_t addr; 2013dfc08a12SChao Yu 2014dfc08a12SChao Yu addr = le32_to_cpu(nat_in_journal(journal, i).block_addr); 2015dfc08a12SChao Yu nid = le32_to_cpu(nid_in_journal(journal, i)); 2016e05df3b1SJaegeuk Kim if (addr == NULL_ADDR) 20176fb03f3aSJaegeuk Kim add_free_nid(sbi, nid, true); 2018e05df3b1SJaegeuk Kim else 2019b8559dc2SChao Yu remove_free_nid(sbi, nid); 2020e05df3b1SJaegeuk Kim } 2021b7ad7512SChao Yu up_read(&curseg->journal_rwsem); 2022b873b798SJaegeuk Kim up_read(&nm_i->nat_tree_lock); 20232db2388fSChao Yu 20242db2388fSChao Yu ra_meta_pages(sbi, NAT_BLOCK_OFFSET(nm_i->next_scan_nid), 2025ea1a29a0SChao Yu nm_i->ra_nid_pages, META_NAT, false); 2026e05df3b1SJaegeuk Kim } 2027e05df3b1SJaegeuk Kim 202822ad0b6aSJaegeuk Kim void build_free_nids(struct f2fs_sb_info *sbi, bool sync, bool mount) 20292411cf5bSChao Yu { 20302411cf5bSChao Yu mutex_lock(&NM_I(sbi)->build_lock); 203122ad0b6aSJaegeuk Kim __build_free_nids(sbi, sync, mount); 20322411cf5bSChao Yu mutex_unlock(&NM_I(sbi)->build_lock); 20332411cf5bSChao Yu } 20342411cf5bSChao Yu 2035e05df3b1SJaegeuk Kim /* 2036e05df3b1SJaegeuk Kim * If this function returns success, caller can obtain a new nid 2037e05df3b1SJaegeuk Kim * from second parameter of this function. 2038e05df3b1SJaegeuk Kim * The returned nid could be used ino as well as nid when inode is created. 2039e05df3b1SJaegeuk Kim */ 2040e05df3b1SJaegeuk Kim bool alloc_nid(struct f2fs_sb_info *sbi, nid_t *nid) 2041e05df3b1SJaegeuk Kim { 2042e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 2043e05df3b1SJaegeuk Kim struct free_nid *i = NULL; 2044e05df3b1SJaegeuk Kim retry: 2045cb78942bSJaegeuk Kim #ifdef CONFIG_F2FS_FAULT_INJECTION 204655523519SChao Yu if (time_to_inject(sbi, FAULT_ALLOC_NID)) { 204755523519SChao Yu f2fs_show_injection_info(FAULT_ALLOC_NID); 2048cb78942bSJaegeuk Kim return false; 204955523519SChao Yu } 2050cb78942bSJaegeuk Kim #endif 2051b8559dc2SChao Yu spin_lock(&nm_i->nid_list_lock); 2052e05df3b1SJaegeuk Kim 205304d47e67SChao Yu if (unlikely(nm_i->available_nids == 0)) { 205404d47e67SChao Yu spin_unlock(&nm_i->nid_list_lock); 205504d47e67SChao Yu return false; 205604d47e67SChao Yu } 2057e05df3b1SJaegeuk Kim 205855008d84SJaegeuk Kim /* We should not use stale free nids created by build_free_nids */ 2059b8559dc2SChao Yu if (nm_i->nid_cnt[FREE_NID_LIST] && !on_build_free_nids(nm_i)) { 2060b8559dc2SChao Yu f2fs_bug_on(sbi, list_empty(&nm_i->nid_list[FREE_NID_LIST])); 2061b8559dc2SChao Yu i = list_first_entry(&nm_i->nid_list[FREE_NID_LIST], 2062b8559dc2SChao Yu struct free_nid, list); 2063e05df3b1SJaegeuk Kim *nid = i->nid; 2064b8559dc2SChao Yu 2065eb0aa4b8SJaegeuk Kim __remove_nid_from_list(sbi, i, FREE_NID_LIST, true); 2066e05df3b1SJaegeuk Kim i->state = NID_ALLOC; 2067eb0aa4b8SJaegeuk Kim __insert_nid_to_list(sbi, i, ALLOC_NID_LIST, false); 206804d47e67SChao Yu nm_i->available_nids--; 20694ac91242SChao Yu 2070346fe752SChao Yu update_free_nid_bitmap(sbi, *nid, false, false); 20714ac91242SChao Yu 2072b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 2073e05df3b1SJaegeuk Kim return true; 2074e05df3b1SJaegeuk Kim } 2075b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 207655008d84SJaegeuk Kim 207755008d84SJaegeuk Kim /* Let's scan nat pages and its caches to get free nids */ 207822ad0b6aSJaegeuk Kim build_free_nids(sbi, true, false); 207955008d84SJaegeuk Kim goto retry; 208055008d84SJaegeuk Kim } 2081e05df3b1SJaegeuk Kim 20820a8165d7SJaegeuk Kim /* 2083e05df3b1SJaegeuk Kim * alloc_nid() should be called prior to this function. 2084e05df3b1SJaegeuk Kim */ 2085e05df3b1SJaegeuk Kim void alloc_nid_done(struct f2fs_sb_info *sbi, nid_t nid) 2086e05df3b1SJaegeuk Kim { 2087e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 2088e05df3b1SJaegeuk Kim struct free_nid *i; 2089e05df3b1SJaegeuk Kim 2090b8559dc2SChao Yu spin_lock(&nm_i->nid_list_lock); 20918a7ed66aSJaegeuk Kim i = __lookup_free_nid_list(nm_i, nid); 2092b8559dc2SChao Yu f2fs_bug_on(sbi, !i); 2093eb0aa4b8SJaegeuk Kim __remove_nid_from_list(sbi, i, ALLOC_NID_LIST, false); 2094b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 2095cf0ee0f0SChao Yu 2096cf0ee0f0SChao Yu kmem_cache_free(free_nid_slab, i); 2097e05df3b1SJaegeuk Kim } 2098e05df3b1SJaegeuk Kim 20990a8165d7SJaegeuk Kim /* 2100e05df3b1SJaegeuk Kim * alloc_nid() should be called prior to this function. 2101e05df3b1SJaegeuk Kim */ 2102e05df3b1SJaegeuk Kim void alloc_nid_failed(struct f2fs_sb_info *sbi, nid_t nid) 2103e05df3b1SJaegeuk Kim { 210449952fa1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 210549952fa1SJaegeuk Kim struct free_nid *i; 2106cf0ee0f0SChao Yu bool need_free = false; 210749952fa1SJaegeuk Kim 210865985d93SJaegeuk Kim if (!nid) 210965985d93SJaegeuk Kim return; 211065985d93SJaegeuk Kim 2111b8559dc2SChao Yu spin_lock(&nm_i->nid_list_lock); 21128a7ed66aSJaegeuk Kim i = __lookup_free_nid_list(nm_i, nid); 2113b8559dc2SChao Yu f2fs_bug_on(sbi, !i); 2114b8559dc2SChao Yu 21156fb03f3aSJaegeuk Kim if (!available_free_memory(sbi, FREE_NIDS)) { 2116eb0aa4b8SJaegeuk Kim __remove_nid_from_list(sbi, i, ALLOC_NID_LIST, false); 2117cf0ee0f0SChao Yu need_free = true; 211895630cbaSHaicheng Li } else { 2119eb0aa4b8SJaegeuk Kim __remove_nid_from_list(sbi, i, ALLOC_NID_LIST, true); 212049952fa1SJaegeuk Kim i->state = NID_NEW; 2121eb0aa4b8SJaegeuk Kim __insert_nid_to_list(sbi, i, FREE_NID_LIST, false); 212295630cbaSHaicheng Li } 212304d47e67SChao Yu 212404d47e67SChao Yu nm_i->available_nids++; 212504d47e67SChao Yu 2126346fe752SChao Yu update_free_nid_bitmap(sbi, nid, true, false); 21274ac91242SChao Yu 2128b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 2129cf0ee0f0SChao Yu 2130cf0ee0f0SChao Yu if (need_free) 2131cf0ee0f0SChao Yu kmem_cache_free(free_nid_slab, i); 2132e05df3b1SJaegeuk Kim } 2133e05df3b1SJaegeuk Kim 213431696580SChao Yu int try_to_free_nids(struct f2fs_sb_info *sbi, int nr_shrink) 213531696580SChao Yu { 213631696580SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 213731696580SChao Yu struct free_nid *i, *next; 213831696580SChao Yu int nr = nr_shrink; 213931696580SChao Yu 2140b8559dc2SChao Yu if (nm_i->nid_cnt[FREE_NID_LIST] <= MAX_FREE_NIDS) 2141ad4edb83SJaegeuk Kim return 0; 2142ad4edb83SJaegeuk Kim 214331696580SChao Yu if (!mutex_trylock(&nm_i->build_lock)) 214431696580SChao Yu return 0; 214531696580SChao Yu 2146b8559dc2SChao Yu spin_lock(&nm_i->nid_list_lock); 2147b8559dc2SChao Yu list_for_each_entry_safe(i, next, &nm_i->nid_list[FREE_NID_LIST], 2148b8559dc2SChao Yu list) { 2149b8559dc2SChao Yu if (nr_shrink <= 0 || 2150b8559dc2SChao Yu nm_i->nid_cnt[FREE_NID_LIST] <= MAX_FREE_NIDS) 215131696580SChao Yu break; 2152b8559dc2SChao Yu 2153eb0aa4b8SJaegeuk Kim __remove_nid_from_list(sbi, i, FREE_NID_LIST, false); 215431696580SChao Yu kmem_cache_free(free_nid_slab, i); 215531696580SChao Yu nr_shrink--; 215631696580SChao Yu } 2157b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 215831696580SChao Yu mutex_unlock(&nm_i->build_lock); 215931696580SChao Yu 216031696580SChao Yu return nr - nr_shrink; 216131696580SChao Yu } 216231696580SChao Yu 216370cfed88SChao Yu void recover_inline_xattr(struct inode *inode, struct page *page) 216428cdce04SChao Yu { 216528cdce04SChao Yu void *src_addr, *dst_addr; 216628cdce04SChao Yu size_t inline_size; 216728cdce04SChao Yu struct page *ipage; 216828cdce04SChao Yu struct f2fs_inode *ri; 216928cdce04SChao Yu 21704081363fSJaegeuk Kim ipage = get_node_page(F2FS_I_SB(inode), inode->i_ino); 21719850cf4aSJaegeuk Kim f2fs_bug_on(F2FS_I_SB(inode), IS_ERR(ipage)); 217228cdce04SChao Yu 2173e3b4d43fSJaegeuk Kim ri = F2FS_INODE(page); 2174e3b4d43fSJaegeuk Kim if (!(ri->i_inline & F2FS_INLINE_XATTR)) { 217591942321SJaegeuk Kim clear_inode_flag(inode, FI_INLINE_XATTR); 2176e3b4d43fSJaegeuk Kim goto update_inode; 2177e3b4d43fSJaegeuk Kim } 2178e3b4d43fSJaegeuk Kim 217928cdce04SChao Yu dst_addr = inline_xattr_addr(ipage); 218028cdce04SChao Yu src_addr = inline_xattr_addr(page); 218128cdce04SChao Yu inline_size = inline_xattr_size(inode); 218228cdce04SChao Yu 2183fec1d657SJaegeuk Kim f2fs_wait_on_page_writeback(ipage, NODE, true); 218428cdce04SChao Yu memcpy(dst_addr, src_addr, inline_size); 2185e3b4d43fSJaegeuk Kim update_inode: 218628cdce04SChao Yu update_inode(inode, ipage); 218728cdce04SChao Yu f2fs_put_page(ipage, 1); 218828cdce04SChao Yu } 218928cdce04SChao Yu 2190d260081cSChao Yu int recover_xattr_data(struct inode *inode, struct page *page, block_t blkaddr) 2191abb2366cSJaegeuk Kim { 21924081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_I_SB(inode); 2193abb2366cSJaegeuk Kim nid_t prev_xnid = F2FS_I(inode)->i_xattr_nid; 219487905682SYunlei He nid_t new_xnid; 219587905682SYunlei He struct dnode_of_data dn; 2196abb2366cSJaegeuk Kim struct node_info ni; 2197d260081cSChao Yu struct page *xpage; 2198abb2366cSJaegeuk Kim 2199abb2366cSJaegeuk Kim if (!prev_xnid) 2200abb2366cSJaegeuk Kim goto recover_xnid; 2201abb2366cSJaegeuk Kim 2202d260081cSChao Yu /* 1: invalidate the previous xattr nid */ 2203abb2366cSJaegeuk Kim get_node_info(sbi, prev_xnid, &ni); 22049850cf4aSJaegeuk Kim f2fs_bug_on(sbi, ni.blk_addr == NULL_ADDR); 2205abb2366cSJaegeuk Kim invalidate_blocks(sbi, ni.blk_addr); 2206000519f2SChao Yu dec_valid_node_count(sbi, inode, false); 2207479f40c4SJaegeuk Kim set_node_addr(sbi, &ni, NULL_ADDR, false); 2208abb2366cSJaegeuk Kim 2209abb2366cSJaegeuk Kim recover_xnid: 2210d260081cSChao Yu /* 2: update xattr nid in inode */ 221187905682SYunlei He if (!alloc_nid(sbi, &new_xnid)) 221287905682SYunlei He return -ENOSPC; 221387905682SYunlei He 221487905682SYunlei He set_new_dnode(&dn, inode, NULL, NULL, new_xnid); 221587905682SYunlei He xpage = new_node_page(&dn, XATTR_NODE_OFFSET); 221687905682SYunlei He if (IS_ERR(xpage)) { 221787905682SYunlei He alloc_nid_failed(sbi, new_xnid); 221887905682SYunlei He return PTR_ERR(xpage); 221987905682SYunlei He } 222087905682SYunlei He 222187905682SYunlei He alloc_nid_done(sbi, new_xnid); 2222d260081cSChao Yu update_inode_page(inode); 2223abb2366cSJaegeuk Kim 2224d260081cSChao Yu /* 3: update and set xattr node page dirty */ 222587905682SYunlei He memcpy(F2FS_NODE(xpage), F2FS_NODE(page), VALID_XATTR_BLOCK_SIZE); 2226d260081cSChao Yu 2227d260081cSChao Yu set_page_dirty(xpage); 2228d260081cSChao Yu f2fs_put_page(xpage, 1); 2229abb2366cSJaegeuk Kim 2230d260081cSChao Yu return 0; 2231abb2366cSJaegeuk Kim } 2232abb2366cSJaegeuk Kim 2233e05df3b1SJaegeuk Kim int recover_inode_page(struct f2fs_sb_info *sbi, struct page *page) 2234e05df3b1SJaegeuk Kim { 223558bfaf44SJaegeuk Kim struct f2fs_inode *src, *dst; 2236e05df3b1SJaegeuk Kim nid_t ino = ino_of_node(page); 2237e05df3b1SJaegeuk Kim struct node_info old_ni, new_ni; 2238e05df3b1SJaegeuk Kim struct page *ipage; 2239e05df3b1SJaegeuk Kim 2240e8271fa3SJaegeuk Kim get_node_info(sbi, ino, &old_ni); 2241e8271fa3SJaegeuk Kim 2242e8271fa3SJaegeuk Kim if (unlikely(old_ni.blk_addr != NULL_ADDR)) 2243e8271fa3SJaegeuk Kim return -EINVAL; 2244e8ea9b3dSJaegeuk Kim retry: 2245300e129cSJaegeuk Kim ipage = f2fs_grab_cache_page(NODE_MAPPING(sbi), ino, false); 2246e8ea9b3dSJaegeuk Kim if (!ipage) { 2247e8ea9b3dSJaegeuk Kim congestion_wait(BLK_RW_ASYNC, HZ/50); 2248e8ea9b3dSJaegeuk Kim goto retry; 2249e8ea9b3dSJaegeuk Kim } 2250e05df3b1SJaegeuk Kim 2251e05df3b1SJaegeuk Kim /* Should not use this inode from free nid list */ 2252b8559dc2SChao Yu remove_free_nid(sbi, ino); 2253e05df3b1SJaegeuk Kim 2254237c0790SJaegeuk Kim if (!PageUptodate(ipage)) 2255e05df3b1SJaegeuk Kim SetPageUptodate(ipage); 2256e05df3b1SJaegeuk Kim fill_node_footer(ipage, ino, ino, 0, true); 2257e05df3b1SJaegeuk Kim 225858bfaf44SJaegeuk Kim src = F2FS_INODE(page); 225958bfaf44SJaegeuk Kim dst = F2FS_INODE(ipage); 2260e05df3b1SJaegeuk Kim 226158bfaf44SJaegeuk Kim memcpy(dst, src, (unsigned long)&src->i_ext - (unsigned long)src); 226258bfaf44SJaegeuk Kim dst->i_size = 0; 226358bfaf44SJaegeuk Kim dst->i_blocks = cpu_to_le64(1); 226458bfaf44SJaegeuk Kim dst->i_links = cpu_to_le32(1); 226558bfaf44SJaegeuk Kim dst->i_xattr_nid = 0; 2266617deb8cSJaegeuk Kim dst->i_inline = src->i_inline & F2FS_INLINE_XATTR; 2267e05df3b1SJaegeuk Kim 2268e05df3b1SJaegeuk Kim new_ni = old_ni; 2269e05df3b1SJaegeuk Kim new_ni.ino = ino; 2270e05df3b1SJaegeuk Kim 22710abd675eSChao Yu if (unlikely(inc_valid_node_count(sbi, NULL, true))) 227265e5cd0aSJaegeuk Kim WARN_ON(1); 2273479f40c4SJaegeuk Kim set_node_addr(sbi, &new_ni, NEW_ADDR, false); 2274e05df3b1SJaegeuk Kim inc_valid_inode_count(sbi); 2275617deb8cSJaegeuk Kim set_page_dirty(ipage); 2276e05df3b1SJaegeuk Kim f2fs_put_page(ipage, 1); 2277e05df3b1SJaegeuk Kim return 0; 2278e05df3b1SJaegeuk Kim } 2279e05df3b1SJaegeuk Kim 2280e05df3b1SJaegeuk Kim int restore_node_summary(struct f2fs_sb_info *sbi, 2281e05df3b1SJaegeuk Kim unsigned int segno, struct f2fs_summary_block *sum) 2282e05df3b1SJaegeuk Kim { 2283e05df3b1SJaegeuk Kim struct f2fs_node *rn; 2284e05df3b1SJaegeuk Kim struct f2fs_summary *sum_entry; 2285e05df3b1SJaegeuk Kim block_t addr; 22869ecf4b80SChao Yu int i, idx, last_offset, nrpages; 2287e05df3b1SJaegeuk Kim 2288e05df3b1SJaegeuk Kim /* scan the node segment */ 2289e05df3b1SJaegeuk Kim last_offset = sbi->blocks_per_seg; 2290e05df3b1SJaegeuk Kim addr = START_BLOCK(sbi, segno); 2291e05df3b1SJaegeuk Kim sum_entry = &sum->entries[0]; 2292e05df3b1SJaegeuk Kim 22939ecf4b80SChao Yu for (i = 0; i < last_offset; i += nrpages, addr += nrpages) { 2294664ba972SJaegeuk Kim nrpages = min(last_offset - i, BIO_MAX_PAGES); 2295393ff91fSJaegeuk Kim 22969af0ff1cSChao Yu /* readahead node pages */ 229726879fb1SChao Yu ra_meta_pages(sbi, addr, nrpages, META_POR, true); 22989af0ff1cSChao Yu 22999ecf4b80SChao Yu for (idx = addr; idx < addr + nrpages; idx++) { 23002b947003SChao Yu struct page *page = get_tmp_page(sbi, idx); 2301393ff91fSJaegeuk Kim 23029ecf4b80SChao Yu rn = F2FS_NODE(page); 2303393ff91fSJaegeuk Kim sum_entry->nid = rn->footer.nid; 2304393ff91fSJaegeuk Kim sum_entry->version = 0; 2305393ff91fSJaegeuk Kim sum_entry->ofs_in_node = 0; 23069af0ff1cSChao Yu sum_entry++; 23079ecf4b80SChao Yu f2fs_put_page(page, 1); 23089af0ff1cSChao Yu } 2309bac4eef6SChao Yu 23109ecf4b80SChao Yu invalidate_mapping_pages(META_MAPPING(sbi), addr, 2311bac4eef6SChao Yu addr + nrpages); 23129af0ff1cSChao Yu } 23139ecf4b80SChao Yu return 0; 2314e05df3b1SJaegeuk Kim } 2315e05df3b1SJaegeuk Kim 2316aec71382SChao Yu static void remove_nats_in_journal(struct f2fs_sb_info *sbi) 2317e05df3b1SJaegeuk Kim { 2318e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 2319e05df3b1SJaegeuk Kim struct curseg_info *curseg = CURSEG_I(sbi, CURSEG_HOT_DATA); 2320b7ad7512SChao Yu struct f2fs_journal *journal = curseg->journal; 2321e05df3b1SJaegeuk Kim int i; 2322e05df3b1SJaegeuk Kim 2323b7ad7512SChao Yu down_write(&curseg->journal_rwsem); 2324dfc08a12SChao Yu for (i = 0; i < nats_in_cursum(journal); i++) { 2325e05df3b1SJaegeuk Kim struct nat_entry *ne; 2326e05df3b1SJaegeuk Kim struct f2fs_nat_entry raw_ne; 2327dfc08a12SChao Yu nid_t nid = le32_to_cpu(nid_in_journal(journal, i)); 2328e05df3b1SJaegeuk Kim 2329dfc08a12SChao Yu raw_ne = nat_in_journal(journal, i); 23309be32d72SJaegeuk Kim 2331e05df3b1SJaegeuk Kim ne = __lookup_nat_cache(nm_i, nid); 2332e05df3b1SJaegeuk Kim if (!ne) { 23335c9e4184SChao Yu ne = grab_nat_entry(nm_i, nid, true); 233494dac22eSChao Yu node_info_from_raw_nat(&ne->ni, &raw_ne); 23359be32d72SJaegeuk Kim } 233604d47e67SChao Yu 233704d47e67SChao Yu /* 233804d47e67SChao Yu * if a free nat in journal has not been used after last 233904d47e67SChao Yu * checkpoint, we should remove it from available nids, 234004d47e67SChao Yu * since later we will add it again. 234104d47e67SChao Yu */ 234204d47e67SChao Yu if (!get_nat_flag(ne, IS_DIRTY) && 234304d47e67SChao Yu le32_to_cpu(raw_ne.block_addr) == NULL_ADDR) { 234404d47e67SChao Yu spin_lock(&nm_i->nid_list_lock); 234504d47e67SChao Yu nm_i->available_nids--; 234604d47e67SChao Yu spin_unlock(&nm_i->nid_list_lock); 234704d47e67SChao Yu } 234804d47e67SChao Yu 2349e05df3b1SJaegeuk Kim __set_nat_cache_dirty(nm_i, ne); 2350e05df3b1SJaegeuk Kim } 2351dfc08a12SChao Yu update_nats_in_cursum(journal, -i); 2352b7ad7512SChao Yu up_write(&curseg->journal_rwsem); 2353e05df3b1SJaegeuk Kim } 2354e05df3b1SJaegeuk Kim 2355309cc2b6SJaegeuk Kim static void __adjust_nat_entry_set(struct nat_entry_set *nes, 2356309cc2b6SJaegeuk Kim struct list_head *head, int max) 2357e05df3b1SJaegeuk Kim { 2358309cc2b6SJaegeuk Kim struct nat_entry_set *cur; 2359e05df3b1SJaegeuk Kim 2360309cc2b6SJaegeuk Kim if (nes->entry_cnt >= max) 2361309cc2b6SJaegeuk Kim goto add_out; 2362e05df3b1SJaegeuk Kim 2363309cc2b6SJaegeuk Kim list_for_each_entry(cur, head, set_list) { 2364309cc2b6SJaegeuk Kim if (cur->entry_cnt >= nes->entry_cnt) { 2365309cc2b6SJaegeuk Kim list_add(&nes->set_list, cur->set_list.prev); 2366309cc2b6SJaegeuk Kim return; 2367309cc2b6SJaegeuk Kim } 2368309cc2b6SJaegeuk Kim } 2369309cc2b6SJaegeuk Kim add_out: 2370309cc2b6SJaegeuk Kim list_add_tail(&nes->set_list, head); 2371aec71382SChao Yu } 2372aec71382SChao Yu 23739f7e4a2cSJaegeuk Kim static void __update_nat_bits(struct f2fs_sb_info *sbi, nid_t start_nid, 237422ad0b6aSJaegeuk Kim struct page *page) 237522ad0b6aSJaegeuk Kim { 237622ad0b6aSJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 237722ad0b6aSJaegeuk Kim unsigned int nat_index = start_nid / NAT_ENTRY_PER_BLOCK; 237822ad0b6aSJaegeuk Kim struct f2fs_nat_block *nat_blk = page_address(page); 237922ad0b6aSJaegeuk Kim int valid = 0; 238022ad0b6aSJaegeuk Kim int i; 238122ad0b6aSJaegeuk Kim 238222ad0b6aSJaegeuk Kim if (!enabled_nat_bits(sbi, NULL)) 238322ad0b6aSJaegeuk Kim return; 238422ad0b6aSJaegeuk Kim 238522ad0b6aSJaegeuk Kim for (i = 0; i < NAT_ENTRY_PER_BLOCK; i++) { 238622ad0b6aSJaegeuk Kim if (start_nid == 0 && i == 0) 238722ad0b6aSJaegeuk Kim valid++; 238822ad0b6aSJaegeuk Kim if (nat_blk->entries[i].block_addr) 238922ad0b6aSJaegeuk Kim valid++; 239022ad0b6aSJaegeuk Kim } 239122ad0b6aSJaegeuk Kim if (valid == 0) { 239223380b85SJaegeuk Kim __set_bit_le(nat_index, nm_i->empty_nat_bits); 239323380b85SJaegeuk Kim __clear_bit_le(nat_index, nm_i->full_nat_bits); 239422ad0b6aSJaegeuk Kim return; 239522ad0b6aSJaegeuk Kim } 239622ad0b6aSJaegeuk Kim 239723380b85SJaegeuk Kim __clear_bit_le(nat_index, nm_i->empty_nat_bits); 239822ad0b6aSJaegeuk Kim if (valid == NAT_ENTRY_PER_BLOCK) 239923380b85SJaegeuk Kim __set_bit_le(nat_index, nm_i->full_nat_bits); 240022ad0b6aSJaegeuk Kim else 240123380b85SJaegeuk Kim __clear_bit_le(nat_index, nm_i->full_nat_bits); 240222ad0b6aSJaegeuk Kim } 240322ad0b6aSJaegeuk Kim 2404309cc2b6SJaegeuk Kim static void __flush_nat_entry_set(struct f2fs_sb_info *sbi, 240522ad0b6aSJaegeuk Kim struct nat_entry_set *set, struct cp_control *cpc) 2406309cc2b6SJaegeuk Kim { 2407309cc2b6SJaegeuk Kim struct curseg_info *curseg = CURSEG_I(sbi, CURSEG_HOT_DATA); 2408b7ad7512SChao Yu struct f2fs_journal *journal = curseg->journal; 2409309cc2b6SJaegeuk Kim nid_t start_nid = set->set * NAT_ENTRY_PER_BLOCK; 2410309cc2b6SJaegeuk Kim bool to_journal = true; 2411309cc2b6SJaegeuk Kim struct f2fs_nat_block *nat_blk; 2412309cc2b6SJaegeuk Kim struct nat_entry *ne, *cur; 2413309cc2b6SJaegeuk Kim struct page *page = NULL; 2414aec71382SChao Yu 2415aec71382SChao Yu /* 2416aec71382SChao Yu * there are two steps to flush nat entries: 2417aec71382SChao Yu * #1, flush nat entries to journal in current hot data summary block. 2418aec71382SChao Yu * #2, flush nat entries to nat page. 2419aec71382SChao Yu */ 242022ad0b6aSJaegeuk Kim if (enabled_nat_bits(sbi, cpc) || 242122ad0b6aSJaegeuk Kim !__has_cursum_space(journal, set->entry_cnt, NAT_JOURNAL)) 2422aec71382SChao Yu to_journal = false; 2423aec71382SChao Yu 2424aec71382SChao Yu if (to_journal) { 2425b7ad7512SChao Yu down_write(&curseg->journal_rwsem); 2426aec71382SChao Yu } else { 2427e05df3b1SJaegeuk Kim page = get_next_nat_page(sbi, start_nid); 2428e05df3b1SJaegeuk Kim nat_blk = page_address(page); 24299850cf4aSJaegeuk Kim f2fs_bug_on(sbi, !nat_blk); 2430e05df3b1SJaegeuk Kim } 2431e05df3b1SJaegeuk Kim 2432aec71382SChao Yu /* flush dirty nats in nat entry set */ 2433309cc2b6SJaegeuk Kim list_for_each_entry_safe(ne, cur, &set->entry_list, list) { 2434aec71382SChao Yu struct f2fs_nat_entry *raw_ne; 2435aec71382SChao Yu nid_t nid = nat_get_nid(ne); 2436aec71382SChao Yu int offset; 2437aec71382SChao Yu 2438febeca6dSChao Yu f2fs_bug_on(sbi, nat_get_blkaddr(ne) == NEW_ADDR); 2439309cc2b6SJaegeuk Kim 2440aec71382SChao Yu if (to_journal) { 2441dfc08a12SChao Yu offset = lookup_journal_in_cursum(journal, 2442aec71382SChao Yu NAT_JOURNAL, nid, 1); 24439850cf4aSJaegeuk Kim f2fs_bug_on(sbi, offset < 0); 2444dfc08a12SChao Yu raw_ne = &nat_in_journal(journal, offset); 2445dfc08a12SChao Yu nid_in_journal(journal, offset) = cpu_to_le32(nid); 2446aec71382SChao Yu } else { 2447aec71382SChao Yu raw_ne = &nat_blk->entries[nid - start_nid]; 2448aec71382SChao Yu } 2449aec71382SChao Yu raw_nat_from_node_info(raw_ne, &ne->ni); 245088bd02c9SJaegeuk Kim nat_reset_flag(ne); 24510b28b71eSKinglong Mee __clear_nat_cache_dirty(NM_I(sbi), set, ne); 245204d47e67SChao Yu if (nat_get_blkaddr(ne) == NULL_ADDR) { 2453309cc2b6SJaegeuk Kim add_free_nid(sbi, nid, false); 245404d47e67SChao Yu spin_lock(&NM_I(sbi)->nid_list_lock); 245504d47e67SChao Yu NM_I(sbi)->available_nids++; 2456346fe752SChao Yu update_free_nid_bitmap(sbi, nid, true, false); 24574ac91242SChao Yu spin_unlock(&NM_I(sbi)->nid_list_lock); 24584ac91242SChao Yu } else { 24594ac91242SChao Yu spin_lock(&NM_I(sbi)->nid_list_lock); 2460346fe752SChao Yu update_free_nid_bitmap(sbi, nid, false, false); 246104d47e67SChao Yu spin_unlock(&NM_I(sbi)->nid_list_lock); 246204d47e67SChao Yu } 2463e05df3b1SJaegeuk Kim } 2464aec71382SChao Yu 246522ad0b6aSJaegeuk Kim if (to_journal) { 2466b7ad7512SChao Yu up_write(&curseg->journal_rwsem); 246722ad0b6aSJaegeuk Kim } else { 246822ad0b6aSJaegeuk Kim __update_nat_bits(sbi, start_nid, page); 2469e05df3b1SJaegeuk Kim f2fs_put_page(page, 1); 247022ad0b6aSJaegeuk Kim } 2471aec71382SChao Yu 247259c9081bSYunlei He /* Allow dirty nats by node block allocation in write_begin */ 247359c9081bSYunlei He if (!set->entry_cnt) { 2474309cc2b6SJaegeuk Kim radix_tree_delete(&NM_I(sbi)->nat_set_root, set->set); 2475309cc2b6SJaegeuk Kim kmem_cache_free(nat_entry_set_slab, set); 2476309cc2b6SJaegeuk Kim } 247759c9081bSYunlei He } 2478aec71382SChao Yu 2479309cc2b6SJaegeuk Kim /* 2480309cc2b6SJaegeuk Kim * This function is called during the checkpointing process. 2481309cc2b6SJaegeuk Kim */ 248222ad0b6aSJaegeuk Kim void flush_nat_entries(struct f2fs_sb_info *sbi, struct cp_control *cpc) 2483309cc2b6SJaegeuk Kim { 2484309cc2b6SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 2485309cc2b6SJaegeuk Kim struct curseg_info *curseg = CURSEG_I(sbi, CURSEG_HOT_DATA); 2486b7ad7512SChao Yu struct f2fs_journal *journal = curseg->journal; 24877aed0d45SJaegeuk Kim struct nat_entry_set *setvec[SETVEC_SIZE]; 2488309cc2b6SJaegeuk Kim struct nat_entry_set *set, *tmp; 2489309cc2b6SJaegeuk Kim unsigned int found; 2490309cc2b6SJaegeuk Kim nid_t set_idx = 0; 2491309cc2b6SJaegeuk Kim LIST_HEAD(sets); 2492309cc2b6SJaegeuk Kim 249320d047c8SChangman Lee if (!nm_i->dirty_nat_cnt) 249420d047c8SChangman Lee return; 2495a5131193SJaegeuk Kim 2496b873b798SJaegeuk Kim down_write(&nm_i->nat_tree_lock); 2497a5131193SJaegeuk Kim 2498309cc2b6SJaegeuk Kim /* 2499309cc2b6SJaegeuk Kim * if there are no enough space in journal to store dirty nat 2500309cc2b6SJaegeuk Kim * entries, remove all entries from journal and merge them 2501309cc2b6SJaegeuk Kim * into nat entry set. 2502309cc2b6SJaegeuk Kim */ 2503900f7362SJaegeuk Kim if (enabled_nat_bits(sbi, cpc) || 250422ad0b6aSJaegeuk Kim !__has_cursum_space(journal, nm_i->dirty_nat_cnt, NAT_JOURNAL)) 2505309cc2b6SJaegeuk Kim remove_nats_in_journal(sbi); 2506309cc2b6SJaegeuk Kim 2507309cc2b6SJaegeuk Kim while ((found = __gang_lookup_nat_set(nm_i, 25087aed0d45SJaegeuk Kim set_idx, SETVEC_SIZE, setvec))) { 2509309cc2b6SJaegeuk Kim unsigned idx; 2510309cc2b6SJaegeuk Kim set_idx = setvec[found - 1]->set + 1; 2511309cc2b6SJaegeuk Kim for (idx = 0; idx < found; idx++) 2512309cc2b6SJaegeuk Kim __adjust_nat_entry_set(setvec[idx], &sets, 2513dfc08a12SChao Yu MAX_NAT_JENTRIES(journal)); 2514309cc2b6SJaegeuk Kim } 2515309cc2b6SJaegeuk Kim 2516309cc2b6SJaegeuk Kim /* flush dirty nats in nat entry set */ 2517309cc2b6SJaegeuk Kim list_for_each_entry_safe(set, tmp, &sets, set_list) 251822ad0b6aSJaegeuk Kim __flush_nat_entry_set(sbi, set, cpc); 2519309cc2b6SJaegeuk Kim 2520b873b798SJaegeuk Kim up_write(&nm_i->nat_tree_lock); 252159c9081bSYunlei He /* Allow dirty nats by node block allocation in write_begin */ 2522e05df3b1SJaegeuk Kim } 2523e05df3b1SJaegeuk Kim 252422ad0b6aSJaegeuk Kim static int __get_nat_bitmaps(struct f2fs_sb_info *sbi) 252522ad0b6aSJaegeuk Kim { 252622ad0b6aSJaegeuk Kim struct f2fs_checkpoint *ckpt = F2FS_CKPT(sbi); 252722ad0b6aSJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 252822ad0b6aSJaegeuk Kim unsigned int nat_bits_bytes = nm_i->nat_blocks / BITS_PER_BYTE; 252922ad0b6aSJaegeuk Kim unsigned int i; 253022ad0b6aSJaegeuk Kim __u64 cp_ver = cur_cp_version(ckpt); 253122ad0b6aSJaegeuk Kim block_t nat_bits_addr; 253222ad0b6aSJaegeuk Kim 253322ad0b6aSJaegeuk Kim if (!enabled_nat_bits(sbi, NULL)) 253422ad0b6aSJaegeuk Kim return 0; 253522ad0b6aSJaegeuk Kim 253622ad0b6aSJaegeuk Kim nm_i->nat_bits_blocks = F2FS_BYTES_TO_BLK((nat_bits_bytes << 1) + 8 + 253722ad0b6aSJaegeuk Kim F2FS_BLKSIZE - 1); 253822ad0b6aSJaegeuk Kim nm_i->nat_bits = kzalloc(nm_i->nat_bits_blocks << F2FS_BLKSIZE_BITS, 253922ad0b6aSJaegeuk Kim GFP_KERNEL); 254022ad0b6aSJaegeuk Kim if (!nm_i->nat_bits) 254122ad0b6aSJaegeuk Kim return -ENOMEM; 254222ad0b6aSJaegeuk Kim 254322ad0b6aSJaegeuk Kim nat_bits_addr = __start_cp_addr(sbi) + sbi->blocks_per_seg - 254422ad0b6aSJaegeuk Kim nm_i->nat_bits_blocks; 254522ad0b6aSJaegeuk Kim for (i = 0; i < nm_i->nat_bits_blocks; i++) { 254622ad0b6aSJaegeuk Kim struct page *page = get_meta_page(sbi, nat_bits_addr++); 254722ad0b6aSJaegeuk Kim 254822ad0b6aSJaegeuk Kim memcpy(nm_i->nat_bits + (i << F2FS_BLKSIZE_BITS), 254922ad0b6aSJaegeuk Kim page_address(page), F2FS_BLKSIZE); 255022ad0b6aSJaegeuk Kim f2fs_put_page(page, 1); 255122ad0b6aSJaegeuk Kim } 255222ad0b6aSJaegeuk Kim 2553ced2c7eaSKinglong Mee cp_ver |= (cur_cp_crc(ckpt) << 32); 255422ad0b6aSJaegeuk Kim if (cpu_to_le64(cp_ver) != *(__le64 *)nm_i->nat_bits) { 255522ad0b6aSJaegeuk Kim disable_nat_bits(sbi, true); 255622ad0b6aSJaegeuk Kim return 0; 255722ad0b6aSJaegeuk Kim } 255822ad0b6aSJaegeuk Kim 255922ad0b6aSJaegeuk Kim nm_i->full_nat_bits = nm_i->nat_bits + 8; 256022ad0b6aSJaegeuk Kim nm_i->empty_nat_bits = nm_i->full_nat_bits + nat_bits_bytes; 256122ad0b6aSJaegeuk Kim 256222ad0b6aSJaegeuk Kim f2fs_msg(sbi->sb, KERN_NOTICE, "Found nat_bits in checkpoint"); 256322ad0b6aSJaegeuk Kim return 0; 256422ad0b6aSJaegeuk Kim } 256522ad0b6aSJaegeuk Kim 2566bd80a4b9SHou Pengyang static inline void load_free_nid_bitmap(struct f2fs_sb_info *sbi) 25677041d5d2SChao Yu { 25687041d5d2SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 25697041d5d2SChao Yu unsigned int i = 0; 25707041d5d2SChao Yu nid_t nid, last_nid; 25717041d5d2SChao Yu 25727041d5d2SChao Yu if (!enabled_nat_bits(sbi, NULL)) 25737041d5d2SChao Yu return; 25747041d5d2SChao Yu 25757041d5d2SChao Yu for (i = 0; i < nm_i->nat_blocks; i++) { 25767041d5d2SChao Yu i = find_next_bit_le(nm_i->empty_nat_bits, nm_i->nat_blocks, i); 25777041d5d2SChao Yu if (i >= nm_i->nat_blocks) 25787041d5d2SChao Yu break; 25797041d5d2SChao Yu 25807041d5d2SChao Yu __set_bit_le(i, nm_i->nat_block_bitmap); 25817041d5d2SChao Yu 25827041d5d2SChao Yu nid = i * NAT_ENTRY_PER_BLOCK; 25837041d5d2SChao Yu last_nid = (i + 1) * NAT_ENTRY_PER_BLOCK; 25847041d5d2SChao Yu 2585346fe752SChao Yu spin_lock(&NM_I(sbi)->nid_list_lock); 25867041d5d2SChao Yu for (; nid < last_nid; nid++) 2587346fe752SChao Yu update_free_nid_bitmap(sbi, nid, true, true); 2588346fe752SChao Yu spin_unlock(&NM_I(sbi)->nid_list_lock); 25897041d5d2SChao Yu } 25907041d5d2SChao Yu 25917041d5d2SChao Yu for (i = 0; i < nm_i->nat_blocks; i++) { 25927041d5d2SChao Yu i = find_next_bit_le(nm_i->full_nat_bits, nm_i->nat_blocks, i); 25937041d5d2SChao Yu if (i >= nm_i->nat_blocks) 25947041d5d2SChao Yu break; 25957041d5d2SChao Yu 25967041d5d2SChao Yu __set_bit_le(i, nm_i->nat_block_bitmap); 25977041d5d2SChao Yu } 25987041d5d2SChao Yu } 25997041d5d2SChao Yu 2600e05df3b1SJaegeuk Kim static int init_node_manager(struct f2fs_sb_info *sbi) 2601e05df3b1SJaegeuk Kim { 2602e05df3b1SJaegeuk Kim struct f2fs_super_block *sb_raw = F2FS_RAW_SUPER(sbi); 2603e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 2604e05df3b1SJaegeuk Kim unsigned char *version_bitmap; 260522ad0b6aSJaegeuk Kim unsigned int nat_segs; 260622ad0b6aSJaegeuk Kim int err; 2607e05df3b1SJaegeuk Kim 2608e05df3b1SJaegeuk Kim nm_i->nat_blkaddr = le32_to_cpu(sb_raw->nat_blkaddr); 2609e05df3b1SJaegeuk Kim 2610e05df3b1SJaegeuk Kim /* segment_count_nat includes pair segment so divide to 2. */ 2611e05df3b1SJaegeuk Kim nat_segs = le32_to_cpu(sb_raw->segment_count_nat) >> 1; 261222ad0b6aSJaegeuk Kim nm_i->nat_blocks = nat_segs << le32_to_cpu(sb_raw->log_blocks_per_seg); 261322ad0b6aSJaegeuk Kim nm_i->max_nid = NAT_ENTRY_PER_BLOCK * nm_i->nat_blocks; 26147ee0eeabSJaegeuk Kim 2615b63da15eSJaegeuk Kim /* not used nids: 0, node, meta, (and root counted as valid node) */ 261604d47e67SChao Yu nm_i->available_nids = nm_i->max_nid - sbi->total_valid_node_count - 261704d47e67SChao Yu F2FS_RESERVED_NODE_NUM; 2618b8559dc2SChao Yu nm_i->nid_cnt[FREE_NID_LIST] = 0; 2619b8559dc2SChao Yu nm_i->nid_cnt[ALLOC_NID_LIST] = 0; 2620e05df3b1SJaegeuk Kim nm_i->nat_cnt = 0; 2621cdfc41c1SJaegeuk Kim nm_i->ram_thresh = DEF_RAM_THRESHOLD; 2622ea1a29a0SChao Yu nm_i->ra_nid_pages = DEF_RA_NID_PAGES; 26232304cb0cSChao Yu nm_i->dirty_nats_ratio = DEF_DIRTY_NAT_RATIO_THRESHOLD; 2624e05df3b1SJaegeuk Kim 26258a7ed66aSJaegeuk Kim INIT_RADIX_TREE(&nm_i->free_nid_root, GFP_ATOMIC); 2626b8559dc2SChao Yu INIT_LIST_HEAD(&nm_i->nid_list[FREE_NID_LIST]); 2627b8559dc2SChao Yu INIT_LIST_HEAD(&nm_i->nid_list[ALLOC_NID_LIST]); 2628769ec6e5SJaegeuk Kim INIT_RADIX_TREE(&nm_i->nat_root, GFP_NOIO); 2629769ec6e5SJaegeuk Kim INIT_RADIX_TREE(&nm_i->nat_set_root, GFP_NOIO); 2630e05df3b1SJaegeuk Kim INIT_LIST_HEAD(&nm_i->nat_entries); 2631e05df3b1SJaegeuk Kim 2632e05df3b1SJaegeuk Kim mutex_init(&nm_i->build_lock); 2633b8559dc2SChao Yu spin_lock_init(&nm_i->nid_list_lock); 2634b873b798SJaegeuk Kim init_rwsem(&nm_i->nat_tree_lock); 2635e05df3b1SJaegeuk Kim 2636e05df3b1SJaegeuk Kim nm_i->next_scan_nid = le32_to_cpu(sbi->ckpt->next_free_nid); 263779b5793bSAlexandru Gheorghiu nm_i->bitmap_size = __bitmap_size(sbi, NAT_BITMAP); 2638e05df3b1SJaegeuk Kim version_bitmap = __bitmap_ptr(sbi, NAT_BITMAP); 2639e05df3b1SJaegeuk Kim if (!version_bitmap) 2640e05df3b1SJaegeuk Kim return -EFAULT; 2641e05df3b1SJaegeuk Kim 264279b5793bSAlexandru Gheorghiu nm_i->nat_bitmap = kmemdup(version_bitmap, nm_i->bitmap_size, 264379b5793bSAlexandru Gheorghiu GFP_KERNEL); 264479b5793bSAlexandru Gheorghiu if (!nm_i->nat_bitmap) 264579b5793bSAlexandru Gheorghiu return -ENOMEM; 2646599a09b2SChao Yu 264722ad0b6aSJaegeuk Kim err = __get_nat_bitmaps(sbi); 264822ad0b6aSJaegeuk Kim if (err) 264922ad0b6aSJaegeuk Kim return err; 265022ad0b6aSJaegeuk Kim 2651599a09b2SChao Yu #ifdef CONFIG_F2FS_CHECK_FS 2652599a09b2SChao Yu nm_i->nat_bitmap_mir = kmemdup(version_bitmap, nm_i->bitmap_size, 2653599a09b2SChao Yu GFP_KERNEL); 2654599a09b2SChao Yu if (!nm_i->nat_bitmap_mir) 2655599a09b2SChao Yu return -ENOMEM; 2656599a09b2SChao Yu #endif 2657599a09b2SChao Yu 2658e05df3b1SJaegeuk Kim return 0; 2659e05df3b1SJaegeuk Kim } 2660e05df3b1SJaegeuk Kim 26619f7e4a2cSJaegeuk Kim static int init_free_nid_cache(struct f2fs_sb_info *sbi) 26624ac91242SChao Yu { 26634ac91242SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 26644ac91242SChao Yu 2665a7c3e901SMichal Hocko nm_i->free_nid_bitmap = kvzalloc(nm_i->nat_blocks * 26664ac91242SChao Yu NAT_ENTRY_BITMAP_SIZE, GFP_KERNEL); 26674ac91242SChao Yu if (!nm_i->free_nid_bitmap) 26684ac91242SChao Yu return -ENOMEM; 26694ac91242SChao Yu 2670a7c3e901SMichal Hocko nm_i->nat_block_bitmap = kvzalloc(nm_i->nat_blocks / 8, 26714ac91242SChao Yu GFP_KERNEL); 26724ac91242SChao Yu if (!nm_i->nat_block_bitmap) 26734ac91242SChao Yu return -ENOMEM; 2674586d1492SChao Yu 2675a7c3e901SMichal Hocko nm_i->free_nid_count = kvzalloc(nm_i->nat_blocks * 2676586d1492SChao Yu sizeof(unsigned short), GFP_KERNEL); 2677586d1492SChao Yu if (!nm_i->free_nid_count) 2678586d1492SChao Yu return -ENOMEM; 26794ac91242SChao Yu return 0; 26804ac91242SChao Yu } 26814ac91242SChao Yu 2682e05df3b1SJaegeuk Kim int build_node_manager(struct f2fs_sb_info *sbi) 2683e05df3b1SJaegeuk Kim { 2684e05df3b1SJaegeuk Kim int err; 2685e05df3b1SJaegeuk Kim 2686e05df3b1SJaegeuk Kim sbi->nm_info = kzalloc(sizeof(struct f2fs_nm_info), GFP_KERNEL); 2687e05df3b1SJaegeuk Kim if (!sbi->nm_info) 2688e05df3b1SJaegeuk Kim return -ENOMEM; 2689e05df3b1SJaegeuk Kim 2690e05df3b1SJaegeuk Kim err = init_node_manager(sbi); 2691e05df3b1SJaegeuk Kim if (err) 2692e05df3b1SJaegeuk Kim return err; 2693e05df3b1SJaegeuk Kim 26944ac91242SChao Yu err = init_free_nid_cache(sbi); 26954ac91242SChao Yu if (err) 26964ac91242SChao Yu return err; 26974ac91242SChao Yu 26987041d5d2SChao Yu /* load free nid status from nat_bits table */ 26997041d5d2SChao Yu load_free_nid_bitmap(sbi); 27007041d5d2SChao Yu 270122ad0b6aSJaegeuk Kim build_free_nids(sbi, true, true); 2702e05df3b1SJaegeuk Kim return 0; 2703e05df3b1SJaegeuk Kim } 2704e05df3b1SJaegeuk Kim 2705e05df3b1SJaegeuk Kim void destroy_node_manager(struct f2fs_sb_info *sbi) 2706e05df3b1SJaegeuk Kim { 2707e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 2708e05df3b1SJaegeuk Kim struct free_nid *i, *next_i; 2709e05df3b1SJaegeuk Kim struct nat_entry *natvec[NATVEC_SIZE]; 27107aed0d45SJaegeuk Kim struct nat_entry_set *setvec[SETVEC_SIZE]; 2711e05df3b1SJaegeuk Kim nid_t nid = 0; 2712e05df3b1SJaegeuk Kim unsigned int found; 2713e05df3b1SJaegeuk Kim 2714e05df3b1SJaegeuk Kim if (!nm_i) 2715e05df3b1SJaegeuk Kim return; 2716e05df3b1SJaegeuk Kim 2717e05df3b1SJaegeuk Kim /* destroy free nid list */ 2718b8559dc2SChao Yu spin_lock(&nm_i->nid_list_lock); 2719b8559dc2SChao Yu list_for_each_entry_safe(i, next_i, &nm_i->nid_list[FREE_NID_LIST], 2720b8559dc2SChao Yu list) { 2721eb0aa4b8SJaegeuk Kim __remove_nid_from_list(sbi, i, FREE_NID_LIST, false); 2722b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 2723cf0ee0f0SChao Yu kmem_cache_free(free_nid_slab, i); 2724b8559dc2SChao Yu spin_lock(&nm_i->nid_list_lock); 2725e05df3b1SJaegeuk Kim } 2726b8559dc2SChao Yu f2fs_bug_on(sbi, nm_i->nid_cnt[FREE_NID_LIST]); 2727b8559dc2SChao Yu f2fs_bug_on(sbi, nm_i->nid_cnt[ALLOC_NID_LIST]); 2728b8559dc2SChao Yu f2fs_bug_on(sbi, !list_empty(&nm_i->nid_list[ALLOC_NID_LIST])); 2729b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 2730e05df3b1SJaegeuk Kim 2731e05df3b1SJaegeuk Kim /* destroy nat cache */ 2732b873b798SJaegeuk Kim down_write(&nm_i->nat_tree_lock); 2733e05df3b1SJaegeuk Kim while ((found = __gang_lookup_nat_cache(nm_i, 2734e05df3b1SJaegeuk Kim nid, NATVEC_SIZE, natvec))) { 2735e05df3b1SJaegeuk Kim unsigned idx; 27367aed0d45SJaegeuk Kim 2737b6ce391eSGu Zheng nid = nat_get_nid(natvec[found - 1]) + 1; 2738b6ce391eSGu Zheng for (idx = 0; idx < found; idx++) 2739b6ce391eSGu Zheng __del_from_nat_cache(nm_i, natvec[idx]); 2740e05df3b1SJaegeuk Kim } 27419850cf4aSJaegeuk Kim f2fs_bug_on(sbi, nm_i->nat_cnt); 27427aed0d45SJaegeuk Kim 27437aed0d45SJaegeuk Kim /* destroy nat set cache */ 27447aed0d45SJaegeuk Kim nid = 0; 27457aed0d45SJaegeuk Kim while ((found = __gang_lookup_nat_set(nm_i, 27467aed0d45SJaegeuk Kim nid, SETVEC_SIZE, setvec))) { 27477aed0d45SJaegeuk Kim unsigned idx; 27487aed0d45SJaegeuk Kim 27497aed0d45SJaegeuk Kim nid = setvec[found - 1]->set + 1; 27507aed0d45SJaegeuk Kim for (idx = 0; idx < found; idx++) { 27517aed0d45SJaegeuk Kim /* entry_cnt is not zero, when cp_error was occurred */ 27527aed0d45SJaegeuk Kim f2fs_bug_on(sbi, !list_empty(&setvec[idx]->entry_list)); 27537aed0d45SJaegeuk Kim radix_tree_delete(&nm_i->nat_set_root, setvec[idx]->set); 27547aed0d45SJaegeuk Kim kmem_cache_free(nat_entry_set_slab, setvec[idx]); 27557aed0d45SJaegeuk Kim } 27567aed0d45SJaegeuk Kim } 2757b873b798SJaegeuk Kim up_write(&nm_i->nat_tree_lock); 2758e05df3b1SJaegeuk Kim 27594ac91242SChao Yu kvfree(nm_i->nat_block_bitmap); 27604ac91242SChao Yu kvfree(nm_i->free_nid_bitmap); 2761586d1492SChao Yu kvfree(nm_i->free_nid_count); 27624ac91242SChao Yu 2763e05df3b1SJaegeuk Kim kfree(nm_i->nat_bitmap); 276422ad0b6aSJaegeuk Kim kfree(nm_i->nat_bits); 2765599a09b2SChao Yu #ifdef CONFIG_F2FS_CHECK_FS 2766599a09b2SChao Yu kfree(nm_i->nat_bitmap_mir); 2767599a09b2SChao Yu #endif 2768e05df3b1SJaegeuk Kim sbi->nm_info = NULL; 2769e05df3b1SJaegeuk Kim kfree(nm_i); 2770e05df3b1SJaegeuk Kim } 2771e05df3b1SJaegeuk Kim 27726e6093a8SNamjae Jeon int __init create_node_manager_caches(void) 2773e05df3b1SJaegeuk Kim { 2774e05df3b1SJaegeuk Kim nat_entry_slab = f2fs_kmem_cache_create("nat_entry", 2775e8512d2eSGu Zheng sizeof(struct nat_entry)); 2776e05df3b1SJaegeuk Kim if (!nat_entry_slab) 2777aec71382SChao Yu goto fail; 2778e05df3b1SJaegeuk Kim 2779e05df3b1SJaegeuk Kim free_nid_slab = f2fs_kmem_cache_create("free_nid", 2780e8512d2eSGu Zheng sizeof(struct free_nid)); 2781aec71382SChao Yu if (!free_nid_slab) 2782ce3e6d25SMarkus Elfring goto destroy_nat_entry; 2783aec71382SChao Yu 2784aec71382SChao Yu nat_entry_set_slab = f2fs_kmem_cache_create("nat_entry_set", 2785aec71382SChao Yu sizeof(struct nat_entry_set)); 2786aec71382SChao Yu if (!nat_entry_set_slab) 2787ce3e6d25SMarkus Elfring goto destroy_free_nid; 2788e05df3b1SJaegeuk Kim return 0; 2789aec71382SChao Yu 2790ce3e6d25SMarkus Elfring destroy_free_nid: 2791aec71382SChao Yu kmem_cache_destroy(free_nid_slab); 2792ce3e6d25SMarkus Elfring destroy_nat_entry: 2793aec71382SChao Yu kmem_cache_destroy(nat_entry_slab); 2794aec71382SChao Yu fail: 2795aec71382SChao Yu return -ENOMEM; 2796e05df3b1SJaegeuk Kim } 2797e05df3b1SJaegeuk Kim 2798e05df3b1SJaegeuk Kim void destroy_node_manager_caches(void) 2799e05df3b1SJaegeuk Kim { 2800aec71382SChao Yu kmem_cache_destroy(nat_entry_set_slab); 2801e05df3b1SJaegeuk Kim kmem_cache_destroy(free_nid_slab); 2802e05df3b1SJaegeuk Kim kmem_cache_destroy(nat_entry_slab); 2803e05df3b1SJaegeuk Kim } 2804