10a8165d7SJaegeuk Kim /* 2e05df3b1SJaegeuk Kim * fs/f2fs/node.c 3e05df3b1SJaegeuk Kim * 4e05df3b1SJaegeuk Kim * Copyright (c) 2012 Samsung Electronics Co., Ltd. 5e05df3b1SJaegeuk Kim * http://www.samsung.com/ 6e05df3b1SJaegeuk Kim * 7e05df3b1SJaegeuk Kim * This program is free software; you can redistribute it and/or modify 8e05df3b1SJaegeuk Kim * it under the terms of the GNU General Public License version 2 as 9e05df3b1SJaegeuk Kim * published by the Free Software Foundation. 10e05df3b1SJaegeuk Kim */ 11e05df3b1SJaegeuk Kim #include <linux/fs.h> 12e05df3b1SJaegeuk Kim #include <linux/f2fs_fs.h> 13e05df3b1SJaegeuk Kim #include <linux/mpage.h> 14e05df3b1SJaegeuk Kim #include <linux/backing-dev.h> 15e05df3b1SJaegeuk Kim #include <linux/blkdev.h> 16e05df3b1SJaegeuk Kim #include <linux/pagevec.h> 17e05df3b1SJaegeuk Kim #include <linux/swap.h> 18e05df3b1SJaegeuk Kim 19e05df3b1SJaegeuk Kim #include "f2fs.h" 20e05df3b1SJaegeuk Kim #include "node.h" 21e05df3b1SJaegeuk Kim #include "segment.h" 229e4ded3fSJaegeuk Kim #include "trace.h" 2351dd6249SNamjae Jeon #include <trace/events/f2fs.h> 24e05df3b1SJaegeuk Kim 2568afcf2dSTomohiro Kusumi #define on_build_free_nids(nmi) mutex_is_locked(&(nm_i)->build_lock) 26f978f5a0SGu Zheng 27e05df3b1SJaegeuk Kim static struct kmem_cache *nat_entry_slab; 28e05df3b1SJaegeuk Kim static struct kmem_cache *free_nid_slab; 29aec71382SChao Yu static struct kmem_cache *nat_entry_set_slab; 30e05df3b1SJaegeuk Kim 316fb03f3aSJaegeuk Kim bool available_free_memory(struct f2fs_sb_info *sbi, int type) 32cdfc41c1SJaegeuk Kim { 336fb03f3aSJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 34cdfc41c1SJaegeuk Kim struct sysinfo val; 35e5e7ea3cSJaegeuk Kim unsigned long avail_ram; 36cdfc41c1SJaegeuk Kim unsigned long mem_size = 0; 376fb03f3aSJaegeuk Kim bool res = false; 38cdfc41c1SJaegeuk Kim 39cdfc41c1SJaegeuk Kim si_meminfo(&val); 40e5e7ea3cSJaegeuk Kim 41e5e7ea3cSJaegeuk Kim /* only uses low memory */ 42e5e7ea3cSJaegeuk Kim avail_ram = val.totalram - val.totalhigh; 43e5e7ea3cSJaegeuk Kim 44429511cdSChao Yu /* 45429511cdSChao Yu * give 25%, 25%, 50%, 50%, 50% memory for each components respectively 46429511cdSChao Yu */ 476fb03f3aSJaegeuk Kim if (type == FREE_NIDS) { 48b8559dc2SChao Yu mem_size = (nm_i->nid_cnt[FREE_NID_LIST] * 49b8559dc2SChao Yu sizeof(struct free_nid)) >> PAGE_SHIFT; 50e5e7ea3cSJaegeuk Kim res = mem_size < ((avail_ram * nm_i->ram_thresh / 100) >> 2); 516fb03f3aSJaegeuk Kim } else if (type == NAT_ENTRIES) { 52e5e7ea3cSJaegeuk Kim mem_size = (nm_i->nat_cnt * sizeof(struct nat_entry)) >> 5309cbfeafSKirill A. Shutemov PAGE_SHIFT; 54e5e7ea3cSJaegeuk Kim res = mem_size < ((avail_ram * nm_i->ram_thresh / 100) >> 2); 55e589c2c4SJaegeuk Kim if (excess_cached_nats(sbi)) 56e589c2c4SJaegeuk Kim res = false; 57a1257023SJaegeuk Kim } else if (type == DIRTY_DENTS) { 58a1257023SJaegeuk Kim if (sbi->sb->s_bdi->wb.dirty_exceeded) 59a1257023SJaegeuk Kim return false; 60a1257023SJaegeuk Kim mem_size = get_pages(sbi, F2FS_DIRTY_DENTS); 61a1257023SJaegeuk Kim res = mem_size < ((avail_ram * nm_i->ram_thresh / 100) >> 1); 62e5e7ea3cSJaegeuk Kim } else if (type == INO_ENTRIES) { 63e5e7ea3cSJaegeuk Kim int i; 64e5e7ea3cSJaegeuk Kim 65e5e7ea3cSJaegeuk Kim for (i = 0; i <= UPDATE_INO; i++) 668f73cbb7SKinglong Mee mem_size += sbi->im[i].ino_num * 678f73cbb7SKinglong Mee sizeof(struct ino_entry); 688f73cbb7SKinglong Mee mem_size >>= PAGE_SHIFT; 69e5e7ea3cSJaegeuk Kim res = mem_size < ((avail_ram * nm_i->ram_thresh / 100) >> 1); 70429511cdSChao Yu } else if (type == EXTENT_CACHE) { 717441ccefSJaegeuk Kim mem_size = (atomic_read(&sbi->total_ext_tree) * 727441ccefSJaegeuk Kim sizeof(struct extent_tree) + 73429511cdSChao Yu atomic_read(&sbi->total_ext_node) * 7409cbfeafSKirill A. Shutemov sizeof(struct extent_node)) >> PAGE_SHIFT; 75429511cdSChao Yu res = mem_size < ((avail_ram * nm_i->ram_thresh / 100) >> 1); 761e84371fSJaegeuk Kim } else { 771663cae4SJaegeuk Kim if (!sbi->sb->s_bdi->wb.dirty_exceeded) 781663cae4SJaegeuk Kim return true; 796fb03f3aSJaegeuk Kim } 806fb03f3aSJaegeuk Kim return res; 81cdfc41c1SJaegeuk Kim } 82cdfc41c1SJaegeuk Kim 83e05df3b1SJaegeuk Kim static void clear_node_page_dirty(struct page *page) 84e05df3b1SJaegeuk Kim { 85e05df3b1SJaegeuk Kim struct address_space *mapping = page->mapping; 86e05df3b1SJaegeuk Kim unsigned int long flags; 87e05df3b1SJaegeuk Kim 88e05df3b1SJaegeuk Kim if (PageDirty(page)) { 89e05df3b1SJaegeuk Kim spin_lock_irqsave(&mapping->tree_lock, flags); 90e05df3b1SJaegeuk Kim radix_tree_tag_clear(&mapping->page_tree, 91e05df3b1SJaegeuk Kim page_index(page), 92e05df3b1SJaegeuk Kim PAGECACHE_TAG_DIRTY); 93e05df3b1SJaegeuk Kim spin_unlock_irqrestore(&mapping->tree_lock, flags); 94e05df3b1SJaegeuk Kim 95e05df3b1SJaegeuk Kim clear_page_dirty_for_io(page); 964081363fSJaegeuk Kim dec_page_count(F2FS_M_SB(mapping), F2FS_DIRTY_NODES); 97e05df3b1SJaegeuk Kim } 98e05df3b1SJaegeuk Kim ClearPageUptodate(page); 99e05df3b1SJaegeuk Kim } 100e05df3b1SJaegeuk Kim 101e05df3b1SJaegeuk Kim static struct page *get_current_nat_page(struct f2fs_sb_info *sbi, nid_t nid) 102e05df3b1SJaegeuk Kim { 103e05df3b1SJaegeuk Kim pgoff_t index = current_nat_addr(sbi, nid); 104e05df3b1SJaegeuk Kim return get_meta_page(sbi, index); 105e05df3b1SJaegeuk Kim } 106e05df3b1SJaegeuk Kim 107e05df3b1SJaegeuk Kim static struct page *get_next_nat_page(struct f2fs_sb_info *sbi, nid_t nid) 108e05df3b1SJaegeuk Kim { 109e05df3b1SJaegeuk Kim struct page *src_page; 110e05df3b1SJaegeuk Kim struct page *dst_page; 111e05df3b1SJaegeuk Kim pgoff_t src_off; 112e05df3b1SJaegeuk Kim pgoff_t dst_off; 113e05df3b1SJaegeuk Kim void *src_addr; 114e05df3b1SJaegeuk Kim void *dst_addr; 115e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 116e05df3b1SJaegeuk Kim 117e05df3b1SJaegeuk Kim src_off = current_nat_addr(sbi, nid); 118e05df3b1SJaegeuk Kim dst_off = next_nat_addr(sbi, src_off); 119e05df3b1SJaegeuk Kim 120e05df3b1SJaegeuk Kim /* get current nat block page with lock */ 121e05df3b1SJaegeuk Kim src_page = get_meta_page(sbi, src_off); 122e05df3b1SJaegeuk Kim dst_page = grab_meta_page(sbi, dst_off); 1239850cf4aSJaegeuk Kim f2fs_bug_on(sbi, PageDirty(src_page)); 124e05df3b1SJaegeuk Kim 125e05df3b1SJaegeuk Kim src_addr = page_address(src_page); 126e05df3b1SJaegeuk Kim dst_addr = page_address(dst_page); 12709cbfeafSKirill A. Shutemov memcpy(dst_addr, src_addr, PAGE_SIZE); 128e05df3b1SJaegeuk Kim set_page_dirty(dst_page); 129e05df3b1SJaegeuk Kim f2fs_put_page(src_page, 1); 130e05df3b1SJaegeuk Kim 131e05df3b1SJaegeuk Kim set_to_next_nat(nm_i, nid); 132e05df3b1SJaegeuk Kim 133e05df3b1SJaegeuk Kim return dst_page; 134e05df3b1SJaegeuk Kim } 135e05df3b1SJaegeuk Kim 136e05df3b1SJaegeuk Kim static struct nat_entry *__lookup_nat_cache(struct f2fs_nm_info *nm_i, nid_t n) 137e05df3b1SJaegeuk Kim { 138e05df3b1SJaegeuk Kim return radix_tree_lookup(&nm_i->nat_root, n); 139e05df3b1SJaegeuk Kim } 140e05df3b1SJaegeuk Kim 141e05df3b1SJaegeuk Kim static unsigned int __gang_lookup_nat_cache(struct f2fs_nm_info *nm_i, 142e05df3b1SJaegeuk Kim nid_t start, unsigned int nr, struct nat_entry **ep) 143e05df3b1SJaegeuk Kim { 144e05df3b1SJaegeuk Kim return radix_tree_gang_lookup(&nm_i->nat_root, (void **)ep, start, nr); 145e05df3b1SJaegeuk Kim } 146e05df3b1SJaegeuk Kim 147e05df3b1SJaegeuk Kim static void __del_from_nat_cache(struct f2fs_nm_info *nm_i, struct nat_entry *e) 148e05df3b1SJaegeuk Kim { 149e05df3b1SJaegeuk Kim list_del(&e->list); 150e05df3b1SJaegeuk Kim radix_tree_delete(&nm_i->nat_root, nat_get_nid(e)); 151e05df3b1SJaegeuk Kim nm_i->nat_cnt--; 152e05df3b1SJaegeuk Kim kmem_cache_free(nat_entry_slab, e); 153e05df3b1SJaegeuk Kim } 154e05df3b1SJaegeuk Kim 155309cc2b6SJaegeuk Kim static void __set_nat_cache_dirty(struct f2fs_nm_info *nm_i, 156309cc2b6SJaegeuk Kim struct nat_entry *ne) 157309cc2b6SJaegeuk Kim { 158309cc2b6SJaegeuk Kim nid_t set = NAT_BLOCK_OFFSET(ne->ni.nid); 159309cc2b6SJaegeuk Kim struct nat_entry_set *head; 160309cc2b6SJaegeuk Kim 161309cc2b6SJaegeuk Kim if (get_nat_flag(ne, IS_DIRTY)) 162309cc2b6SJaegeuk Kim return; 1639be32d72SJaegeuk Kim 164309cc2b6SJaegeuk Kim head = radix_tree_lookup(&nm_i->nat_set_root, set); 165309cc2b6SJaegeuk Kim if (!head) { 16680c54505SJaegeuk Kim head = f2fs_kmem_cache_alloc(nat_entry_set_slab, GFP_NOFS); 167309cc2b6SJaegeuk Kim 168309cc2b6SJaegeuk Kim INIT_LIST_HEAD(&head->entry_list); 169309cc2b6SJaegeuk Kim INIT_LIST_HEAD(&head->set_list); 170309cc2b6SJaegeuk Kim head->set = set; 171309cc2b6SJaegeuk Kim head->entry_cnt = 0; 1729be32d72SJaegeuk Kim f2fs_radix_tree_insert(&nm_i->nat_set_root, set, head); 173309cc2b6SJaegeuk Kim } 174309cc2b6SJaegeuk Kim list_move_tail(&ne->list, &head->entry_list); 175309cc2b6SJaegeuk Kim nm_i->dirty_nat_cnt++; 176309cc2b6SJaegeuk Kim head->entry_cnt++; 177309cc2b6SJaegeuk Kim set_nat_flag(ne, IS_DIRTY, true); 178309cc2b6SJaegeuk Kim } 179309cc2b6SJaegeuk Kim 180309cc2b6SJaegeuk Kim static void __clear_nat_cache_dirty(struct f2fs_nm_info *nm_i, 1810b28b71eSKinglong Mee struct nat_entry_set *set, struct nat_entry *ne) 182309cc2b6SJaegeuk Kim { 183309cc2b6SJaegeuk Kim list_move_tail(&ne->list, &nm_i->nat_entries); 184309cc2b6SJaegeuk Kim set_nat_flag(ne, IS_DIRTY, false); 1850b28b71eSKinglong Mee set->entry_cnt--; 186309cc2b6SJaegeuk Kim nm_i->dirty_nat_cnt--; 187309cc2b6SJaegeuk Kim } 188309cc2b6SJaegeuk Kim 189309cc2b6SJaegeuk Kim static unsigned int __gang_lookup_nat_set(struct f2fs_nm_info *nm_i, 190309cc2b6SJaegeuk Kim nid_t start, unsigned int nr, struct nat_entry_set **ep) 191309cc2b6SJaegeuk Kim { 192309cc2b6SJaegeuk Kim return radix_tree_gang_lookup(&nm_i->nat_set_root, (void **)ep, 193309cc2b6SJaegeuk Kim start, nr); 194309cc2b6SJaegeuk Kim } 195309cc2b6SJaegeuk Kim 1962dcf51abSJaegeuk Kim int need_dentry_mark(struct f2fs_sb_info *sbi, nid_t nid) 1972dcf51abSJaegeuk Kim { 1982dcf51abSJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 1992dcf51abSJaegeuk Kim struct nat_entry *e; 2002dcf51abSJaegeuk Kim bool need = false; 2012dcf51abSJaegeuk Kim 202b873b798SJaegeuk Kim down_read(&nm_i->nat_tree_lock); 2032dcf51abSJaegeuk Kim e = __lookup_nat_cache(nm_i, nid); 2042dcf51abSJaegeuk Kim if (e) { 2052dcf51abSJaegeuk Kim if (!get_nat_flag(e, IS_CHECKPOINTED) && 2062dcf51abSJaegeuk Kim !get_nat_flag(e, HAS_FSYNCED_INODE)) 2072dcf51abSJaegeuk Kim need = true; 2082dcf51abSJaegeuk Kim } 209b873b798SJaegeuk Kim up_read(&nm_i->nat_tree_lock); 2102dcf51abSJaegeuk Kim return need; 2112dcf51abSJaegeuk Kim } 2122dcf51abSJaegeuk Kim 21388bd02c9SJaegeuk Kim bool is_checkpointed_node(struct f2fs_sb_info *sbi, nid_t nid) 214e05df3b1SJaegeuk Kim { 215e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 216e05df3b1SJaegeuk Kim struct nat_entry *e; 21788bd02c9SJaegeuk Kim bool is_cp = true; 218e05df3b1SJaegeuk Kim 219b873b798SJaegeuk Kim down_read(&nm_i->nat_tree_lock); 220e05df3b1SJaegeuk Kim e = __lookup_nat_cache(nm_i, nid); 2217ef35e3bSJaegeuk Kim if (e && !get_nat_flag(e, IS_CHECKPOINTED)) 22288bd02c9SJaegeuk Kim is_cp = false; 223b873b798SJaegeuk Kim up_read(&nm_i->nat_tree_lock); 224e05df3b1SJaegeuk Kim return is_cp; 225e05df3b1SJaegeuk Kim } 226e05df3b1SJaegeuk Kim 22788bd02c9SJaegeuk Kim bool need_inode_block_update(struct f2fs_sb_info *sbi, nid_t ino) 228b6fe5873SJaegeuk Kim { 229b6fe5873SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 230b6fe5873SJaegeuk Kim struct nat_entry *e; 23188bd02c9SJaegeuk Kim bool need_update = true; 232b6fe5873SJaegeuk Kim 233b873b798SJaegeuk Kim down_read(&nm_i->nat_tree_lock); 23488bd02c9SJaegeuk Kim e = __lookup_nat_cache(nm_i, ino); 23588bd02c9SJaegeuk Kim if (e && get_nat_flag(e, HAS_LAST_FSYNC) && 23688bd02c9SJaegeuk Kim (get_nat_flag(e, IS_CHECKPOINTED) || 23788bd02c9SJaegeuk Kim get_nat_flag(e, HAS_FSYNCED_INODE))) 23888bd02c9SJaegeuk Kim need_update = false; 239b873b798SJaegeuk Kim up_read(&nm_i->nat_tree_lock); 24088bd02c9SJaegeuk Kim return need_update; 241b6fe5873SJaegeuk Kim } 242b6fe5873SJaegeuk Kim 2435c9e4184SChao Yu static struct nat_entry *grab_nat_entry(struct f2fs_nm_info *nm_i, nid_t nid, 2445c9e4184SChao Yu bool no_fail) 245e05df3b1SJaegeuk Kim { 246e05df3b1SJaegeuk Kim struct nat_entry *new; 247e05df3b1SJaegeuk Kim 2485c9e4184SChao Yu if (no_fail) { 24980c54505SJaegeuk Kim new = f2fs_kmem_cache_alloc(nat_entry_slab, GFP_NOFS); 2509be32d72SJaegeuk Kim f2fs_radix_tree_insert(&nm_i->nat_root, nid, new); 2515c9e4184SChao Yu } else { 2525c9e4184SChao Yu new = kmem_cache_alloc(nat_entry_slab, GFP_NOFS); 2535c9e4184SChao Yu if (!new) 2545c9e4184SChao Yu return NULL; 2555c9e4184SChao Yu if (radix_tree_insert(&nm_i->nat_root, nid, new)) { 2565c9e4184SChao Yu kmem_cache_free(nat_entry_slab, new); 2575c9e4184SChao Yu return NULL; 2585c9e4184SChao Yu } 2595c9e4184SChao Yu } 2605c9e4184SChao Yu 261e05df3b1SJaegeuk Kim memset(new, 0, sizeof(struct nat_entry)); 262e05df3b1SJaegeuk Kim nat_set_nid(new, nid); 26388bd02c9SJaegeuk Kim nat_reset_flag(new); 264e05df3b1SJaegeuk Kim list_add_tail(&new->list, &nm_i->nat_entries); 265e05df3b1SJaegeuk Kim nm_i->nat_cnt++; 266e05df3b1SJaegeuk Kim return new; 267e05df3b1SJaegeuk Kim } 268e05df3b1SJaegeuk Kim 2691515aef0SChao Yu static void cache_nat_entry(struct f2fs_sb_info *sbi, nid_t nid, 270e05df3b1SJaegeuk Kim struct f2fs_nat_entry *ne) 271e05df3b1SJaegeuk Kim { 2721515aef0SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 273e05df3b1SJaegeuk Kim struct nat_entry *e; 2749be32d72SJaegeuk Kim 275e05df3b1SJaegeuk Kim e = __lookup_nat_cache(nm_i, nid); 276e05df3b1SJaegeuk Kim if (!e) { 2775c9e4184SChao Yu e = grab_nat_entry(nm_i, nid, false); 2785c9e4184SChao Yu if (e) 27994dac22eSChao Yu node_info_from_raw_nat(&e->ni, ne); 2801515aef0SChao Yu } else { 2810c0b471eSEric Biggers f2fs_bug_on(sbi, nat_get_ino(e) != le32_to_cpu(ne->ino) || 2820c0b471eSEric Biggers nat_get_blkaddr(e) != 2830c0b471eSEric Biggers le32_to_cpu(ne->block_addr) || 2841515aef0SChao Yu nat_get_version(e) != ne->version); 285e05df3b1SJaegeuk Kim } 286e05df3b1SJaegeuk Kim } 287e05df3b1SJaegeuk Kim 288e05df3b1SJaegeuk Kim static void set_node_addr(struct f2fs_sb_info *sbi, struct node_info *ni, 289479f40c4SJaegeuk Kim block_t new_blkaddr, bool fsync_done) 290e05df3b1SJaegeuk Kim { 291e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 292e05df3b1SJaegeuk Kim struct nat_entry *e; 2939be32d72SJaegeuk Kim 294b873b798SJaegeuk Kim down_write(&nm_i->nat_tree_lock); 295e05df3b1SJaegeuk Kim e = __lookup_nat_cache(nm_i, ni->nid); 296e05df3b1SJaegeuk Kim if (!e) { 2975c9e4184SChao Yu e = grab_nat_entry(nm_i, ni->nid, true); 2985c27f4eeSChao Yu copy_node_info(&e->ni, ni); 2999850cf4aSJaegeuk Kim f2fs_bug_on(sbi, ni->blk_addr == NEW_ADDR); 300e05df3b1SJaegeuk Kim } else if (new_blkaddr == NEW_ADDR) { 301e05df3b1SJaegeuk Kim /* 302e05df3b1SJaegeuk Kim * when nid is reallocated, 303e05df3b1SJaegeuk Kim * previous nat entry can be remained in nat cache. 304e05df3b1SJaegeuk Kim * So, reinitialize it with new information. 305e05df3b1SJaegeuk Kim */ 3065c27f4eeSChao Yu copy_node_info(&e->ni, ni); 3079850cf4aSJaegeuk Kim f2fs_bug_on(sbi, ni->blk_addr != NULL_ADDR); 308e05df3b1SJaegeuk Kim } 309e05df3b1SJaegeuk Kim 310e05df3b1SJaegeuk Kim /* sanity check */ 3119850cf4aSJaegeuk Kim f2fs_bug_on(sbi, nat_get_blkaddr(e) != ni->blk_addr); 3129850cf4aSJaegeuk Kim f2fs_bug_on(sbi, nat_get_blkaddr(e) == NULL_ADDR && 313e05df3b1SJaegeuk Kim new_blkaddr == NULL_ADDR); 3149850cf4aSJaegeuk Kim f2fs_bug_on(sbi, nat_get_blkaddr(e) == NEW_ADDR && 315e05df3b1SJaegeuk Kim new_blkaddr == NEW_ADDR); 3169850cf4aSJaegeuk Kim f2fs_bug_on(sbi, nat_get_blkaddr(e) != NEW_ADDR && 317e05df3b1SJaegeuk Kim nat_get_blkaddr(e) != NULL_ADDR && 318e05df3b1SJaegeuk Kim new_blkaddr == NEW_ADDR); 319e05df3b1SJaegeuk Kim 320e1c42045Sarter97 /* increment version no as node is removed */ 321e05df3b1SJaegeuk Kim if (nat_get_blkaddr(e) != NEW_ADDR && new_blkaddr == NULL_ADDR) { 322e05df3b1SJaegeuk Kim unsigned char version = nat_get_version(e); 323e05df3b1SJaegeuk Kim nat_set_version(e, inc_node_version(version)); 32426834466SJaegeuk Kim 32526834466SJaegeuk Kim /* in order to reuse the nid */ 32626834466SJaegeuk Kim if (nm_i->next_scan_nid > ni->nid) 32726834466SJaegeuk Kim nm_i->next_scan_nid = ni->nid; 328e05df3b1SJaegeuk Kim } 329e05df3b1SJaegeuk Kim 330e05df3b1SJaegeuk Kim /* change address */ 331e05df3b1SJaegeuk Kim nat_set_blkaddr(e, new_blkaddr); 33288bd02c9SJaegeuk Kim if (new_blkaddr == NEW_ADDR || new_blkaddr == NULL_ADDR) 33388bd02c9SJaegeuk Kim set_nat_flag(e, IS_CHECKPOINTED, false); 334e05df3b1SJaegeuk Kim __set_nat_cache_dirty(nm_i, e); 335479f40c4SJaegeuk Kim 336479f40c4SJaegeuk Kim /* update fsync_mark if its inode nat entry is still alive */ 337d5b692b7SChao Yu if (ni->nid != ni->ino) 338479f40c4SJaegeuk Kim e = __lookup_nat_cache(nm_i, ni->ino); 33988bd02c9SJaegeuk Kim if (e) { 34088bd02c9SJaegeuk Kim if (fsync_done && ni->nid == ni->ino) 34188bd02c9SJaegeuk Kim set_nat_flag(e, HAS_FSYNCED_INODE, true); 34288bd02c9SJaegeuk Kim set_nat_flag(e, HAS_LAST_FSYNC, fsync_done); 34388bd02c9SJaegeuk Kim } 344b873b798SJaegeuk Kim up_write(&nm_i->nat_tree_lock); 345e05df3b1SJaegeuk Kim } 346e05df3b1SJaegeuk Kim 3474660f9c0SJaegeuk Kim int try_to_free_nats(struct f2fs_sb_info *sbi, int nr_shrink) 348e05df3b1SJaegeuk Kim { 349e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 3501b38dc8eSJaegeuk Kim int nr = nr_shrink; 351e05df3b1SJaegeuk Kim 352b873b798SJaegeuk Kim if (!down_write_trylock(&nm_i->nat_tree_lock)) 353b873b798SJaegeuk Kim return 0; 354e05df3b1SJaegeuk Kim 355e05df3b1SJaegeuk Kim while (nr_shrink && !list_empty(&nm_i->nat_entries)) { 356e05df3b1SJaegeuk Kim struct nat_entry *ne; 357e05df3b1SJaegeuk Kim ne = list_first_entry(&nm_i->nat_entries, 358e05df3b1SJaegeuk Kim struct nat_entry, list); 359e05df3b1SJaegeuk Kim __del_from_nat_cache(nm_i, ne); 360e05df3b1SJaegeuk Kim nr_shrink--; 361e05df3b1SJaegeuk Kim } 362b873b798SJaegeuk Kim up_write(&nm_i->nat_tree_lock); 3631b38dc8eSJaegeuk Kim return nr - nr_shrink; 364e05df3b1SJaegeuk Kim } 365e05df3b1SJaegeuk Kim 3660a8165d7SJaegeuk Kim /* 367e1c42045Sarter97 * This function always returns success 368e05df3b1SJaegeuk Kim */ 369e05df3b1SJaegeuk Kim void get_node_info(struct f2fs_sb_info *sbi, nid_t nid, struct node_info *ni) 370e05df3b1SJaegeuk Kim { 371e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 372e05df3b1SJaegeuk Kim struct curseg_info *curseg = CURSEG_I(sbi, CURSEG_HOT_DATA); 373b7ad7512SChao Yu struct f2fs_journal *journal = curseg->journal; 374e05df3b1SJaegeuk Kim nid_t start_nid = START_NID(nid); 375e05df3b1SJaegeuk Kim struct f2fs_nat_block *nat_blk; 376e05df3b1SJaegeuk Kim struct page *page = NULL; 377e05df3b1SJaegeuk Kim struct f2fs_nat_entry ne; 378e05df3b1SJaegeuk Kim struct nat_entry *e; 37966a82d1fSYunlei He pgoff_t index; 380e05df3b1SJaegeuk Kim int i; 381e05df3b1SJaegeuk Kim 382e05df3b1SJaegeuk Kim ni->nid = nid; 383e05df3b1SJaegeuk Kim 384e05df3b1SJaegeuk Kim /* Check nat cache */ 385b873b798SJaegeuk Kim down_read(&nm_i->nat_tree_lock); 386e05df3b1SJaegeuk Kim e = __lookup_nat_cache(nm_i, nid); 387e05df3b1SJaegeuk Kim if (e) { 388e05df3b1SJaegeuk Kim ni->ino = nat_get_ino(e); 389e05df3b1SJaegeuk Kim ni->blk_addr = nat_get_blkaddr(e); 390e05df3b1SJaegeuk Kim ni->version = nat_get_version(e); 391b873b798SJaegeuk Kim up_read(&nm_i->nat_tree_lock); 392e05df3b1SJaegeuk Kim return; 3931515aef0SChao Yu } 394e05df3b1SJaegeuk Kim 3953547ea96SJaegeuk Kim memset(&ne, 0, sizeof(struct f2fs_nat_entry)); 3963547ea96SJaegeuk Kim 397e05df3b1SJaegeuk Kim /* Check current segment summary */ 398b7ad7512SChao Yu down_read(&curseg->journal_rwsem); 399dfc08a12SChao Yu i = lookup_journal_in_cursum(journal, NAT_JOURNAL, nid, 0); 400e05df3b1SJaegeuk Kim if (i >= 0) { 401dfc08a12SChao Yu ne = nat_in_journal(journal, i); 402e05df3b1SJaegeuk Kim node_info_from_raw_nat(ni, &ne); 403e05df3b1SJaegeuk Kim } 404b7ad7512SChao Yu up_read(&curseg->journal_rwsem); 40566a82d1fSYunlei He if (i >= 0) { 40666a82d1fSYunlei He up_read(&nm_i->nat_tree_lock); 407e05df3b1SJaegeuk Kim goto cache; 40866a82d1fSYunlei He } 409e05df3b1SJaegeuk Kim 410e05df3b1SJaegeuk Kim /* Fill node_info from nat page */ 41166a82d1fSYunlei He index = current_nat_addr(sbi, nid); 41266a82d1fSYunlei He up_read(&nm_i->nat_tree_lock); 41366a82d1fSYunlei He 41466a82d1fSYunlei He page = get_meta_page(sbi, index); 415e05df3b1SJaegeuk Kim nat_blk = (struct f2fs_nat_block *)page_address(page); 416e05df3b1SJaegeuk Kim ne = nat_blk->entries[nid - start_nid]; 417e05df3b1SJaegeuk Kim node_info_from_raw_nat(ni, &ne); 418e05df3b1SJaegeuk Kim f2fs_put_page(page, 1); 419e05df3b1SJaegeuk Kim cache: 420e05df3b1SJaegeuk Kim /* cache nat entry */ 421b873b798SJaegeuk Kim down_write(&nm_i->nat_tree_lock); 4221515aef0SChao Yu cache_nat_entry(sbi, nid, &ne); 423b873b798SJaegeuk Kim up_write(&nm_i->nat_tree_lock); 424e05df3b1SJaegeuk Kim } 425e05df3b1SJaegeuk Kim 42679344efbSJaegeuk Kim /* 42779344efbSJaegeuk Kim * readahead MAX_RA_NODE number of node pages. 42879344efbSJaegeuk Kim */ 42979344efbSJaegeuk Kim static void ra_node_pages(struct page *parent, int start, int n) 43079344efbSJaegeuk Kim { 43179344efbSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_P_SB(parent); 43279344efbSJaegeuk Kim struct blk_plug plug; 43379344efbSJaegeuk Kim int i, end; 43479344efbSJaegeuk Kim nid_t nid; 43579344efbSJaegeuk Kim 43679344efbSJaegeuk Kim blk_start_plug(&plug); 43779344efbSJaegeuk Kim 43879344efbSJaegeuk Kim /* Then, try readahead for siblings of the desired node */ 43979344efbSJaegeuk Kim end = start + n; 44079344efbSJaegeuk Kim end = min(end, NIDS_PER_BLOCK); 44179344efbSJaegeuk Kim for (i = start; i < end; i++) { 44279344efbSJaegeuk Kim nid = get_nid(parent, i, false); 44379344efbSJaegeuk Kim ra_node_page(sbi, nid); 44479344efbSJaegeuk Kim } 44579344efbSJaegeuk Kim 44679344efbSJaegeuk Kim blk_finish_plug(&plug); 44779344efbSJaegeuk Kim } 44879344efbSJaegeuk Kim 4493cf45747SChao Yu pgoff_t get_next_page_offset(struct dnode_of_data *dn, pgoff_t pgofs) 4503cf45747SChao Yu { 4513cf45747SChao Yu const long direct_index = ADDRS_PER_INODE(dn->inode); 4523cf45747SChao Yu const long direct_blks = ADDRS_PER_BLOCK; 4533cf45747SChao Yu const long indirect_blks = ADDRS_PER_BLOCK * NIDS_PER_BLOCK; 4543cf45747SChao Yu unsigned int skipped_unit = ADDRS_PER_BLOCK; 4553cf45747SChao Yu int cur_level = dn->cur_level; 4563cf45747SChao Yu int max_level = dn->max_level; 4573cf45747SChao Yu pgoff_t base = 0; 4583cf45747SChao Yu 4593cf45747SChao Yu if (!dn->max_level) 4603cf45747SChao Yu return pgofs + 1; 4613cf45747SChao Yu 4623cf45747SChao Yu while (max_level-- > cur_level) 4633cf45747SChao Yu skipped_unit *= NIDS_PER_BLOCK; 4643cf45747SChao Yu 4653cf45747SChao Yu switch (dn->max_level) { 4663cf45747SChao Yu case 3: 4673cf45747SChao Yu base += 2 * indirect_blks; 4683cf45747SChao Yu case 2: 4693cf45747SChao Yu base += 2 * direct_blks; 4703cf45747SChao Yu case 1: 4713cf45747SChao Yu base += direct_index; 4723cf45747SChao Yu break; 4733cf45747SChao Yu default: 4743cf45747SChao Yu f2fs_bug_on(F2FS_I_SB(dn->inode), 1); 4753cf45747SChao Yu } 4763cf45747SChao Yu 4773cf45747SChao Yu return ((pgofs - base) / skipped_unit + 1) * skipped_unit + base; 4783cf45747SChao Yu } 4793cf45747SChao Yu 4800a8165d7SJaegeuk Kim /* 481e05df3b1SJaegeuk Kim * The maximum depth is four. 482e05df3b1SJaegeuk Kim * Offset[0] will have raw inode offset. 483e05df3b1SJaegeuk Kim */ 48481ca7350SChao Yu static int get_node_path(struct inode *inode, long block, 485de93653fSJaegeuk Kim int offset[4], unsigned int noffset[4]) 486e05df3b1SJaegeuk Kim { 48781ca7350SChao Yu const long direct_index = ADDRS_PER_INODE(inode); 488e05df3b1SJaegeuk Kim const long direct_blks = ADDRS_PER_BLOCK; 489e05df3b1SJaegeuk Kim const long dptrs_per_blk = NIDS_PER_BLOCK; 490e05df3b1SJaegeuk Kim const long indirect_blks = ADDRS_PER_BLOCK * NIDS_PER_BLOCK; 491e05df3b1SJaegeuk Kim const long dindirect_blks = indirect_blks * NIDS_PER_BLOCK; 492e05df3b1SJaegeuk Kim int n = 0; 493e05df3b1SJaegeuk Kim int level = 0; 494e05df3b1SJaegeuk Kim 495e05df3b1SJaegeuk Kim noffset[0] = 0; 496e05df3b1SJaegeuk Kim 497e05df3b1SJaegeuk Kim if (block < direct_index) { 49825c0a6e5SNamjae Jeon offset[n] = block; 499e05df3b1SJaegeuk Kim goto got; 500e05df3b1SJaegeuk Kim } 501e05df3b1SJaegeuk Kim block -= direct_index; 502e05df3b1SJaegeuk Kim if (block < direct_blks) { 503e05df3b1SJaegeuk Kim offset[n++] = NODE_DIR1_BLOCK; 504e05df3b1SJaegeuk Kim noffset[n] = 1; 50525c0a6e5SNamjae Jeon offset[n] = block; 506e05df3b1SJaegeuk Kim level = 1; 507e05df3b1SJaegeuk Kim goto got; 508e05df3b1SJaegeuk Kim } 509e05df3b1SJaegeuk Kim block -= direct_blks; 510e05df3b1SJaegeuk Kim if (block < direct_blks) { 511e05df3b1SJaegeuk Kim offset[n++] = NODE_DIR2_BLOCK; 512e05df3b1SJaegeuk Kim noffset[n] = 2; 51325c0a6e5SNamjae Jeon offset[n] = block; 514e05df3b1SJaegeuk Kim level = 1; 515e05df3b1SJaegeuk Kim goto got; 516e05df3b1SJaegeuk Kim } 517e05df3b1SJaegeuk Kim block -= direct_blks; 518e05df3b1SJaegeuk Kim if (block < indirect_blks) { 519e05df3b1SJaegeuk Kim offset[n++] = NODE_IND1_BLOCK; 520e05df3b1SJaegeuk Kim noffset[n] = 3; 521e05df3b1SJaegeuk Kim offset[n++] = block / direct_blks; 522e05df3b1SJaegeuk Kim noffset[n] = 4 + offset[n - 1]; 52325c0a6e5SNamjae Jeon offset[n] = block % direct_blks; 524e05df3b1SJaegeuk Kim level = 2; 525e05df3b1SJaegeuk Kim goto got; 526e05df3b1SJaegeuk Kim } 527e05df3b1SJaegeuk Kim block -= indirect_blks; 528e05df3b1SJaegeuk Kim if (block < indirect_blks) { 529e05df3b1SJaegeuk Kim offset[n++] = NODE_IND2_BLOCK; 530e05df3b1SJaegeuk Kim noffset[n] = 4 + dptrs_per_blk; 531e05df3b1SJaegeuk Kim offset[n++] = block / direct_blks; 532e05df3b1SJaegeuk Kim noffset[n] = 5 + dptrs_per_blk + offset[n - 1]; 53325c0a6e5SNamjae Jeon offset[n] = block % direct_blks; 534e05df3b1SJaegeuk Kim level = 2; 535e05df3b1SJaegeuk Kim goto got; 536e05df3b1SJaegeuk Kim } 537e05df3b1SJaegeuk Kim block -= indirect_blks; 538e05df3b1SJaegeuk Kim if (block < dindirect_blks) { 539e05df3b1SJaegeuk Kim offset[n++] = NODE_DIND_BLOCK; 540e05df3b1SJaegeuk Kim noffset[n] = 5 + (dptrs_per_blk * 2); 541e05df3b1SJaegeuk Kim offset[n++] = block / indirect_blks; 542e05df3b1SJaegeuk Kim noffset[n] = 6 + (dptrs_per_blk * 2) + 543e05df3b1SJaegeuk Kim offset[n - 1] * (dptrs_per_blk + 1); 544e05df3b1SJaegeuk Kim offset[n++] = (block / direct_blks) % dptrs_per_blk; 545e05df3b1SJaegeuk Kim noffset[n] = 7 + (dptrs_per_blk * 2) + 546e05df3b1SJaegeuk Kim offset[n - 2] * (dptrs_per_blk + 1) + 547e05df3b1SJaegeuk Kim offset[n - 1]; 54825c0a6e5SNamjae Jeon offset[n] = block % direct_blks; 549e05df3b1SJaegeuk Kim level = 3; 550e05df3b1SJaegeuk Kim goto got; 551e05df3b1SJaegeuk Kim } else { 552e05df3b1SJaegeuk Kim BUG(); 553e05df3b1SJaegeuk Kim } 554e05df3b1SJaegeuk Kim got: 555e05df3b1SJaegeuk Kim return level; 556e05df3b1SJaegeuk Kim } 557e05df3b1SJaegeuk Kim 558e05df3b1SJaegeuk Kim /* 559e05df3b1SJaegeuk Kim * Caller should call f2fs_put_dnode(dn). 5604f4124d0SChao Yu * Also, it should grab and release a rwsem by calling f2fs_lock_op() and 5614f4124d0SChao Yu * f2fs_unlock_op() only if ro is not set RDONLY_NODE. 56239936837SJaegeuk Kim * In the case of RDONLY_NODE, we don't need to care about mutex. 563e05df3b1SJaegeuk Kim */ 564266e97a8SJaegeuk Kim int get_dnode_of_data(struct dnode_of_data *dn, pgoff_t index, int mode) 565e05df3b1SJaegeuk Kim { 5664081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode); 567e05df3b1SJaegeuk Kim struct page *npage[4]; 568f1a3b98eSJaegeuk Kim struct page *parent = NULL; 569e05df3b1SJaegeuk Kim int offset[4]; 570e05df3b1SJaegeuk Kim unsigned int noffset[4]; 571e05df3b1SJaegeuk Kim nid_t nids[4]; 5723cf45747SChao Yu int level, i = 0; 573e05df3b1SJaegeuk Kim int err = 0; 574e05df3b1SJaegeuk Kim 57581ca7350SChao Yu level = get_node_path(dn->inode, index, offset, noffset); 576e05df3b1SJaegeuk Kim 577e05df3b1SJaegeuk Kim nids[0] = dn->inode->i_ino; 5781646cfacSJaegeuk Kim npage[0] = dn->inode_page; 5791646cfacSJaegeuk Kim 5801646cfacSJaegeuk Kim if (!npage[0]) { 581e05df3b1SJaegeuk Kim npage[0] = get_node_page(sbi, nids[0]); 582e05df3b1SJaegeuk Kim if (IS_ERR(npage[0])) 583e05df3b1SJaegeuk Kim return PTR_ERR(npage[0]); 5841646cfacSJaegeuk Kim } 585f1a3b98eSJaegeuk Kim 586f1a3b98eSJaegeuk Kim /* if inline_data is set, should not report any block indices */ 587f1a3b98eSJaegeuk Kim if (f2fs_has_inline_data(dn->inode) && index) { 58876629165SJaegeuk Kim err = -ENOENT; 589f1a3b98eSJaegeuk Kim f2fs_put_page(npage[0], 1); 590f1a3b98eSJaegeuk Kim goto release_out; 591f1a3b98eSJaegeuk Kim } 592f1a3b98eSJaegeuk Kim 593e05df3b1SJaegeuk Kim parent = npage[0]; 59452c2db3fSChangman Lee if (level != 0) 595e05df3b1SJaegeuk Kim nids[1] = get_nid(parent, offset[0], true); 596e05df3b1SJaegeuk Kim dn->inode_page = npage[0]; 597e05df3b1SJaegeuk Kim dn->inode_page_locked = true; 598e05df3b1SJaegeuk Kim 599e05df3b1SJaegeuk Kim /* get indirect or direct nodes */ 600e05df3b1SJaegeuk Kim for (i = 1; i <= level; i++) { 601e05df3b1SJaegeuk Kim bool done = false; 602e05df3b1SJaegeuk Kim 603266e97a8SJaegeuk Kim if (!nids[i] && mode == ALLOC_NODE) { 604e05df3b1SJaegeuk Kim /* alloc new node */ 605e05df3b1SJaegeuk Kim if (!alloc_nid(sbi, &(nids[i]))) { 606e05df3b1SJaegeuk Kim err = -ENOSPC; 607e05df3b1SJaegeuk Kim goto release_pages; 608e05df3b1SJaegeuk Kim } 609e05df3b1SJaegeuk Kim 610e05df3b1SJaegeuk Kim dn->nid = nids[i]; 6118ae8f162SJaegeuk Kim npage[i] = new_node_page(dn, noffset[i], NULL); 612e05df3b1SJaegeuk Kim if (IS_ERR(npage[i])) { 613e05df3b1SJaegeuk Kim alloc_nid_failed(sbi, nids[i]); 614e05df3b1SJaegeuk Kim err = PTR_ERR(npage[i]); 615e05df3b1SJaegeuk Kim goto release_pages; 616e05df3b1SJaegeuk Kim } 617e05df3b1SJaegeuk Kim 618e05df3b1SJaegeuk Kim set_nid(parent, offset[i - 1], nids[i], i == 1); 619e05df3b1SJaegeuk Kim alloc_nid_done(sbi, nids[i]); 620e05df3b1SJaegeuk Kim done = true; 621266e97a8SJaegeuk Kim } else if (mode == LOOKUP_NODE_RA && i == level && level > 1) { 622e05df3b1SJaegeuk Kim npage[i] = get_node_page_ra(parent, offset[i - 1]); 623e05df3b1SJaegeuk Kim if (IS_ERR(npage[i])) { 624e05df3b1SJaegeuk Kim err = PTR_ERR(npage[i]); 625e05df3b1SJaegeuk Kim goto release_pages; 626e05df3b1SJaegeuk Kim } 627e05df3b1SJaegeuk Kim done = true; 628e05df3b1SJaegeuk Kim } 629e05df3b1SJaegeuk Kim if (i == 1) { 630e05df3b1SJaegeuk Kim dn->inode_page_locked = false; 631e05df3b1SJaegeuk Kim unlock_page(parent); 632e05df3b1SJaegeuk Kim } else { 633e05df3b1SJaegeuk Kim f2fs_put_page(parent, 1); 634e05df3b1SJaegeuk Kim } 635e05df3b1SJaegeuk Kim 636e05df3b1SJaegeuk Kim if (!done) { 637e05df3b1SJaegeuk Kim npage[i] = get_node_page(sbi, nids[i]); 638e05df3b1SJaegeuk Kim if (IS_ERR(npage[i])) { 639e05df3b1SJaegeuk Kim err = PTR_ERR(npage[i]); 640e05df3b1SJaegeuk Kim f2fs_put_page(npage[0], 0); 641e05df3b1SJaegeuk Kim goto release_out; 642e05df3b1SJaegeuk Kim } 643e05df3b1SJaegeuk Kim } 644e05df3b1SJaegeuk Kim if (i < level) { 645e05df3b1SJaegeuk Kim parent = npage[i]; 646e05df3b1SJaegeuk Kim nids[i + 1] = get_nid(parent, offset[i], false); 647e05df3b1SJaegeuk Kim } 648e05df3b1SJaegeuk Kim } 649e05df3b1SJaegeuk Kim dn->nid = nids[level]; 650e05df3b1SJaegeuk Kim dn->ofs_in_node = offset[level]; 651e05df3b1SJaegeuk Kim dn->node_page = npage[level]; 652e05df3b1SJaegeuk Kim dn->data_blkaddr = datablock_addr(dn->node_page, dn->ofs_in_node); 653e05df3b1SJaegeuk Kim return 0; 654e05df3b1SJaegeuk Kim 655e05df3b1SJaegeuk Kim release_pages: 656e05df3b1SJaegeuk Kim f2fs_put_page(parent, 1); 657e05df3b1SJaegeuk Kim if (i > 1) 658e05df3b1SJaegeuk Kim f2fs_put_page(npage[0], 0); 659e05df3b1SJaegeuk Kim release_out: 660e05df3b1SJaegeuk Kim dn->inode_page = NULL; 661e05df3b1SJaegeuk Kim dn->node_page = NULL; 6623cf45747SChao Yu if (err == -ENOENT) { 6633cf45747SChao Yu dn->cur_level = i; 6643cf45747SChao Yu dn->max_level = level; 6650a2aa8fbSJaegeuk Kim dn->ofs_in_node = offset[level]; 6663cf45747SChao Yu } 667e05df3b1SJaegeuk Kim return err; 668e05df3b1SJaegeuk Kim } 669e05df3b1SJaegeuk Kim 670e05df3b1SJaegeuk Kim static void truncate_node(struct dnode_of_data *dn) 671e05df3b1SJaegeuk Kim { 6724081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode); 673e05df3b1SJaegeuk Kim struct node_info ni; 674e05df3b1SJaegeuk Kim 675e05df3b1SJaegeuk Kim get_node_info(sbi, dn->nid, &ni); 67671e9fec5SJaegeuk Kim if (dn->inode->i_blocks == 0) { 6779850cf4aSJaegeuk Kim f2fs_bug_on(sbi, ni.blk_addr != NULL_ADDR); 67871e9fec5SJaegeuk Kim goto invalidate; 67971e9fec5SJaegeuk Kim } 6809850cf4aSJaegeuk Kim f2fs_bug_on(sbi, ni.blk_addr == NULL_ADDR); 681e05df3b1SJaegeuk Kim 682e05df3b1SJaegeuk Kim /* Deallocate node address */ 68371e9fec5SJaegeuk Kim invalidate_blocks(sbi, ni.blk_addr); 684ef86d709SGu Zheng dec_valid_node_count(sbi, dn->inode); 685479f40c4SJaegeuk Kim set_node_addr(sbi, &ni, NULL_ADDR, false); 686e05df3b1SJaegeuk Kim 687e05df3b1SJaegeuk Kim if (dn->nid == dn->inode->i_ino) { 688e05df3b1SJaegeuk Kim remove_orphan_inode(sbi, dn->nid); 689e05df3b1SJaegeuk Kim dec_valid_inode_count(sbi); 6900f18b462SJaegeuk Kim f2fs_inode_synced(dn->inode); 691e05df3b1SJaegeuk Kim } 69271e9fec5SJaegeuk Kim invalidate: 693e05df3b1SJaegeuk Kim clear_node_page_dirty(dn->node_page); 694caf0047eSChao Yu set_sbi_flag(sbi, SBI_IS_DIRTY); 695e05df3b1SJaegeuk Kim 696e05df3b1SJaegeuk Kim f2fs_put_page(dn->node_page, 1); 697bf39c00aSJaegeuk Kim 698bf39c00aSJaegeuk Kim invalidate_mapping_pages(NODE_MAPPING(sbi), 699bf39c00aSJaegeuk Kim dn->node_page->index, dn->node_page->index); 700bf39c00aSJaegeuk Kim 701e05df3b1SJaegeuk Kim dn->node_page = NULL; 70251dd6249SNamjae Jeon trace_f2fs_truncate_node(dn->inode, dn->nid, ni.blk_addr); 703e05df3b1SJaegeuk Kim } 704e05df3b1SJaegeuk Kim 705e05df3b1SJaegeuk Kim static int truncate_dnode(struct dnode_of_data *dn) 706e05df3b1SJaegeuk Kim { 707e05df3b1SJaegeuk Kim struct page *page; 708e05df3b1SJaegeuk Kim 709e05df3b1SJaegeuk Kim if (dn->nid == 0) 710e05df3b1SJaegeuk Kim return 1; 711e05df3b1SJaegeuk Kim 712e05df3b1SJaegeuk Kim /* get direct node */ 7134081363fSJaegeuk Kim page = get_node_page(F2FS_I_SB(dn->inode), dn->nid); 714e05df3b1SJaegeuk Kim if (IS_ERR(page) && PTR_ERR(page) == -ENOENT) 715e05df3b1SJaegeuk Kim return 1; 716e05df3b1SJaegeuk Kim else if (IS_ERR(page)) 717e05df3b1SJaegeuk Kim return PTR_ERR(page); 718e05df3b1SJaegeuk Kim 719e05df3b1SJaegeuk Kim /* Make dnode_of_data for parameter */ 720e05df3b1SJaegeuk Kim dn->node_page = page; 721e05df3b1SJaegeuk Kim dn->ofs_in_node = 0; 722e05df3b1SJaegeuk Kim truncate_data_blocks(dn); 723e05df3b1SJaegeuk Kim truncate_node(dn); 724e05df3b1SJaegeuk Kim return 1; 725e05df3b1SJaegeuk Kim } 726e05df3b1SJaegeuk Kim 727e05df3b1SJaegeuk Kim static int truncate_nodes(struct dnode_of_data *dn, unsigned int nofs, 728e05df3b1SJaegeuk Kim int ofs, int depth) 729e05df3b1SJaegeuk Kim { 730e05df3b1SJaegeuk Kim struct dnode_of_data rdn = *dn; 731e05df3b1SJaegeuk Kim struct page *page; 732e05df3b1SJaegeuk Kim struct f2fs_node *rn; 733e05df3b1SJaegeuk Kim nid_t child_nid; 734e05df3b1SJaegeuk Kim unsigned int child_nofs; 735e05df3b1SJaegeuk Kim int freed = 0; 736e05df3b1SJaegeuk Kim int i, ret; 737e05df3b1SJaegeuk Kim 738e05df3b1SJaegeuk Kim if (dn->nid == 0) 739e05df3b1SJaegeuk Kim return NIDS_PER_BLOCK + 1; 740e05df3b1SJaegeuk Kim 74151dd6249SNamjae Jeon trace_f2fs_truncate_nodes_enter(dn->inode, dn->nid, dn->data_blkaddr); 74251dd6249SNamjae Jeon 7434081363fSJaegeuk Kim page = get_node_page(F2FS_I_SB(dn->inode), dn->nid); 74451dd6249SNamjae Jeon if (IS_ERR(page)) { 74551dd6249SNamjae Jeon trace_f2fs_truncate_nodes_exit(dn->inode, PTR_ERR(page)); 746e05df3b1SJaegeuk Kim return PTR_ERR(page); 74751dd6249SNamjae Jeon } 748e05df3b1SJaegeuk Kim 74979344efbSJaegeuk Kim ra_node_pages(page, ofs, NIDS_PER_BLOCK); 75079344efbSJaegeuk Kim 75145590710SGu Zheng rn = F2FS_NODE(page); 752e05df3b1SJaegeuk Kim if (depth < 3) { 753e05df3b1SJaegeuk Kim for (i = ofs; i < NIDS_PER_BLOCK; i++, freed++) { 754e05df3b1SJaegeuk Kim child_nid = le32_to_cpu(rn->in.nid[i]); 755e05df3b1SJaegeuk Kim if (child_nid == 0) 756e05df3b1SJaegeuk Kim continue; 757e05df3b1SJaegeuk Kim rdn.nid = child_nid; 758e05df3b1SJaegeuk Kim ret = truncate_dnode(&rdn); 759e05df3b1SJaegeuk Kim if (ret < 0) 760e05df3b1SJaegeuk Kim goto out_err; 76112719ae1SJaegeuk Kim if (set_nid(page, i, 0, false)) 76293bae099SJaegeuk Kim dn->node_changed = true; 763e05df3b1SJaegeuk Kim } 764e05df3b1SJaegeuk Kim } else { 765e05df3b1SJaegeuk Kim child_nofs = nofs + ofs * (NIDS_PER_BLOCK + 1) + 1; 766e05df3b1SJaegeuk Kim for (i = ofs; i < NIDS_PER_BLOCK; i++) { 767e05df3b1SJaegeuk Kim child_nid = le32_to_cpu(rn->in.nid[i]); 768e05df3b1SJaegeuk Kim if (child_nid == 0) { 769e05df3b1SJaegeuk Kim child_nofs += NIDS_PER_BLOCK + 1; 770e05df3b1SJaegeuk Kim continue; 771e05df3b1SJaegeuk Kim } 772e05df3b1SJaegeuk Kim rdn.nid = child_nid; 773e05df3b1SJaegeuk Kim ret = truncate_nodes(&rdn, child_nofs, 0, depth - 1); 774e05df3b1SJaegeuk Kim if (ret == (NIDS_PER_BLOCK + 1)) { 77512719ae1SJaegeuk Kim if (set_nid(page, i, 0, false)) 77693bae099SJaegeuk Kim dn->node_changed = true; 777e05df3b1SJaegeuk Kim child_nofs += ret; 778e05df3b1SJaegeuk Kim } else if (ret < 0 && ret != -ENOENT) { 779e05df3b1SJaegeuk Kim goto out_err; 780e05df3b1SJaegeuk Kim } 781e05df3b1SJaegeuk Kim } 782e05df3b1SJaegeuk Kim freed = child_nofs; 783e05df3b1SJaegeuk Kim } 784e05df3b1SJaegeuk Kim 785e05df3b1SJaegeuk Kim if (!ofs) { 786e05df3b1SJaegeuk Kim /* remove current indirect node */ 787e05df3b1SJaegeuk Kim dn->node_page = page; 788e05df3b1SJaegeuk Kim truncate_node(dn); 789e05df3b1SJaegeuk Kim freed++; 790e05df3b1SJaegeuk Kim } else { 791e05df3b1SJaegeuk Kim f2fs_put_page(page, 1); 792e05df3b1SJaegeuk Kim } 79351dd6249SNamjae Jeon trace_f2fs_truncate_nodes_exit(dn->inode, freed); 794e05df3b1SJaegeuk Kim return freed; 795e05df3b1SJaegeuk Kim 796e05df3b1SJaegeuk Kim out_err: 797e05df3b1SJaegeuk Kim f2fs_put_page(page, 1); 79851dd6249SNamjae Jeon trace_f2fs_truncate_nodes_exit(dn->inode, ret); 799e05df3b1SJaegeuk Kim return ret; 800e05df3b1SJaegeuk Kim } 801e05df3b1SJaegeuk Kim 802e05df3b1SJaegeuk Kim static int truncate_partial_nodes(struct dnode_of_data *dn, 803e05df3b1SJaegeuk Kim struct f2fs_inode *ri, int *offset, int depth) 804e05df3b1SJaegeuk Kim { 805e05df3b1SJaegeuk Kim struct page *pages[2]; 806e05df3b1SJaegeuk Kim nid_t nid[3]; 807e05df3b1SJaegeuk Kim nid_t child_nid; 808e05df3b1SJaegeuk Kim int err = 0; 809e05df3b1SJaegeuk Kim int i; 810e05df3b1SJaegeuk Kim int idx = depth - 2; 811e05df3b1SJaegeuk Kim 812e05df3b1SJaegeuk Kim nid[0] = le32_to_cpu(ri->i_nid[offset[0] - NODE_DIR1_BLOCK]); 813e05df3b1SJaegeuk Kim if (!nid[0]) 814e05df3b1SJaegeuk Kim return 0; 815e05df3b1SJaegeuk Kim 816e05df3b1SJaegeuk Kim /* get indirect nodes in the path */ 817a225dca3Sshifei10.ge for (i = 0; i < idx + 1; i++) { 818e1c42045Sarter97 /* reference count'll be increased */ 8194081363fSJaegeuk Kim pages[i] = get_node_page(F2FS_I_SB(dn->inode), nid[i]); 820e05df3b1SJaegeuk Kim if (IS_ERR(pages[i])) { 821e05df3b1SJaegeuk Kim err = PTR_ERR(pages[i]); 822a225dca3Sshifei10.ge idx = i - 1; 823e05df3b1SJaegeuk Kim goto fail; 824e05df3b1SJaegeuk Kim } 825e05df3b1SJaegeuk Kim nid[i + 1] = get_nid(pages[i], offset[i + 1], false); 826e05df3b1SJaegeuk Kim } 827e05df3b1SJaegeuk Kim 82879344efbSJaegeuk Kim ra_node_pages(pages[idx], offset[idx + 1], NIDS_PER_BLOCK); 82979344efbSJaegeuk Kim 830e05df3b1SJaegeuk Kim /* free direct nodes linked to a partial indirect node */ 831a225dca3Sshifei10.ge for (i = offset[idx + 1]; i < NIDS_PER_BLOCK; i++) { 832e05df3b1SJaegeuk Kim child_nid = get_nid(pages[idx], i, false); 833e05df3b1SJaegeuk Kim if (!child_nid) 834e05df3b1SJaegeuk Kim continue; 835e05df3b1SJaegeuk Kim dn->nid = child_nid; 836e05df3b1SJaegeuk Kim err = truncate_dnode(dn); 837e05df3b1SJaegeuk Kim if (err < 0) 838e05df3b1SJaegeuk Kim goto fail; 83912719ae1SJaegeuk Kim if (set_nid(pages[idx], i, 0, false)) 84093bae099SJaegeuk Kim dn->node_changed = true; 841e05df3b1SJaegeuk Kim } 842e05df3b1SJaegeuk Kim 843a225dca3Sshifei10.ge if (offset[idx + 1] == 0) { 844e05df3b1SJaegeuk Kim dn->node_page = pages[idx]; 845e05df3b1SJaegeuk Kim dn->nid = nid[idx]; 846e05df3b1SJaegeuk Kim truncate_node(dn); 847e05df3b1SJaegeuk Kim } else { 848e05df3b1SJaegeuk Kim f2fs_put_page(pages[idx], 1); 849e05df3b1SJaegeuk Kim } 850e05df3b1SJaegeuk Kim offset[idx]++; 851a225dca3Sshifei10.ge offset[idx + 1] = 0; 852a225dca3Sshifei10.ge idx--; 853e05df3b1SJaegeuk Kim fail: 854a225dca3Sshifei10.ge for (i = idx; i >= 0; i--) 855e05df3b1SJaegeuk Kim f2fs_put_page(pages[i], 1); 85651dd6249SNamjae Jeon 85751dd6249SNamjae Jeon trace_f2fs_truncate_partial_nodes(dn->inode, nid, depth, err); 85851dd6249SNamjae Jeon 859e05df3b1SJaegeuk Kim return err; 860e05df3b1SJaegeuk Kim } 861e05df3b1SJaegeuk Kim 8620a8165d7SJaegeuk Kim /* 863e05df3b1SJaegeuk Kim * All the block addresses of data and nodes should be nullified. 864e05df3b1SJaegeuk Kim */ 865e05df3b1SJaegeuk Kim int truncate_inode_blocks(struct inode *inode, pgoff_t from) 866e05df3b1SJaegeuk Kim { 8674081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_I_SB(inode); 868e05df3b1SJaegeuk Kim int err = 0, cont = 1; 869e05df3b1SJaegeuk Kim int level, offset[4], noffset[4]; 8707dd690c8SJaegeuk Kim unsigned int nofs = 0; 87158bfaf44SJaegeuk Kim struct f2fs_inode *ri; 872e05df3b1SJaegeuk Kim struct dnode_of_data dn; 873e05df3b1SJaegeuk Kim struct page *page; 874e05df3b1SJaegeuk Kim 87551dd6249SNamjae Jeon trace_f2fs_truncate_inode_blocks_enter(inode, from); 87651dd6249SNamjae Jeon 87781ca7350SChao Yu level = get_node_path(inode, from, offset, noffset); 878ff373558SJaegeuk Kim 879e05df3b1SJaegeuk Kim page = get_node_page(sbi, inode->i_ino); 88051dd6249SNamjae Jeon if (IS_ERR(page)) { 88151dd6249SNamjae Jeon trace_f2fs_truncate_inode_blocks_exit(inode, PTR_ERR(page)); 882e05df3b1SJaegeuk Kim return PTR_ERR(page); 88351dd6249SNamjae Jeon } 884e05df3b1SJaegeuk Kim 885e05df3b1SJaegeuk Kim set_new_dnode(&dn, inode, page, NULL, 0); 886e05df3b1SJaegeuk Kim unlock_page(page); 887e05df3b1SJaegeuk Kim 88858bfaf44SJaegeuk Kim ri = F2FS_INODE(page); 889e05df3b1SJaegeuk Kim switch (level) { 890e05df3b1SJaegeuk Kim case 0: 891e05df3b1SJaegeuk Kim case 1: 892e05df3b1SJaegeuk Kim nofs = noffset[1]; 893e05df3b1SJaegeuk Kim break; 894e05df3b1SJaegeuk Kim case 2: 895e05df3b1SJaegeuk Kim nofs = noffset[1]; 896e05df3b1SJaegeuk Kim if (!offset[level - 1]) 897e05df3b1SJaegeuk Kim goto skip_partial; 89858bfaf44SJaegeuk Kim err = truncate_partial_nodes(&dn, ri, offset, level); 899e05df3b1SJaegeuk Kim if (err < 0 && err != -ENOENT) 900e05df3b1SJaegeuk Kim goto fail; 901e05df3b1SJaegeuk Kim nofs += 1 + NIDS_PER_BLOCK; 902e05df3b1SJaegeuk Kim break; 903e05df3b1SJaegeuk Kim case 3: 904e05df3b1SJaegeuk Kim nofs = 5 + 2 * NIDS_PER_BLOCK; 905e05df3b1SJaegeuk Kim if (!offset[level - 1]) 906e05df3b1SJaegeuk Kim goto skip_partial; 90758bfaf44SJaegeuk Kim err = truncate_partial_nodes(&dn, ri, offset, level); 908e05df3b1SJaegeuk Kim if (err < 0 && err != -ENOENT) 909e05df3b1SJaegeuk Kim goto fail; 910e05df3b1SJaegeuk Kim break; 911e05df3b1SJaegeuk Kim default: 912e05df3b1SJaegeuk Kim BUG(); 913e05df3b1SJaegeuk Kim } 914e05df3b1SJaegeuk Kim 915e05df3b1SJaegeuk Kim skip_partial: 916e05df3b1SJaegeuk Kim while (cont) { 91758bfaf44SJaegeuk Kim dn.nid = le32_to_cpu(ri->i_nid[offset[0] - NODE_DIR1_BLOCK]); 918e05df3b1SJaegeuk Kim switch (offset[0]) { 919e05df3b1SJaegeuk Kim case NODE_DIR1_BLOCK: 920e05df3b1SJaegeuk Kim case NODE_DIR2_BLOCK: 921e05df3b1SJaegeuk Kim err = truncate_dnode(&dn); 922e05df3b1SJaegeuk Kim break; 923e05df3b1SJaegeuk Kim 924e05df3b1SJaegeuk Kim case NODE_IND1_BLOCK: 925e05df3b1SJaegeuk Kim case NODE_IND2_BLOCK: 926e05df3b1SJaegeuk Kim err = truncate_nodes(&dn, nofs, offset[1], 2); 927e05df3b1SJaegeuk Kim break; 928e05df3b1SJaegeuk Kim 929e05df3b1SJaegeuk Kim case NODE_DIND_BLOCK: 930e05df3b1SJaegeuk Kim err = truncate_nodes(&dn, nofs, offset[1], 3); 931e05df3b1SJaegeuk Kim cont = 0; 932e05df3b1SJaegeuk Kim break; 933e05df3b1SJaegeuk Kim 934e05df3b1SJaegeuk Kim default: 935e05df3b1SJaegeuk Kim BUG(); 936e05df3b1SJaegeuk Kim } 937e05df3b1SJaegeuk Kim if (err < 0 && err != -ENOENT) 938e05df3b1SJaegeuk Kim goto fail; 939e05df3b1SJaegeuk Kim if (offset[1] == 0 && 94058bfaf44SJaegeuk Kim ri->i_nid[offset[0] - NODE_DIR1_BLOCK]) { 941e05df3b1SJaegeuk Kim lock_page(page); 942ff373558SJaegeuk Kim BUG_ON(page->mapping != NODE_MAPPING(sbi)); 943fec1d657SJaegeuk Kim f2fs_wait_on_page_writeback(page, NODE, true); 94458bfaf44SJaegeuk Kim ri->i_nid[offset[0] - NODE_DIR1_BLOCK] = 0; 945e05df3b1SJaegeuk Kim set_page_dirty(page); 946e05df3b1SJaegeuk Kim unlock_page(page); 947e05df3b1SJaegeuk Kim } 948e05df3b1SJaegeuk Kim offset[1] = 0; 949e05df3b1SJaegeuk Kim offset[0]++; 950e05df3b1SJaegeuk Kim nofs += err; 951e05df3b1SJaegeuk Kim } 952e05df3b1SJaegeuk Kim fail: 953e05df3b1SJaegeuk Kim f2fs_put_page(page, 0); 95451dd6249SNamjae Jeon trace_f2fs_truncate_inode_blocks_exit(inode, err); 955e05df3b1SJaegeuk Kim return err > 0 ? 0 : err; 956e05df3b1SJaegeuk Kim } 957e05df3b1SJaegeuk Kim 9584f16fb0fSJaegeuk Kim int truncate_xattr_node(struct inode *inode, struct page *page) 9594f16fb0fSJaegeuk Kim { 9604081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_I_SB(inode); 9614f16fb0fSJaegeuk Kim nid_t nid = F2FS_I(inode)->i_xattr_nid; 9624f16fb0fSJaegeuk Kim struct dnode_of_data dn; 9634f16fb0fSJaegeuk Kim struct page *npage; 9644f16fb0fSJaegeuk Kim 9654f16fb0fSJaegeuk Kim if (!nid) 9664f16fb0fSJaegeuk Kim return 0; 9674f16fb0fSJaegeuk Kim 9684f16fb0fSJaegeuk Kim npage = get_node_page(sbi, nid); 9694f16fb0fSJaegeuk Kim if (IS_ERR(npage)) 9704f16fb0fSJaegeuk Kim return PTR_ERR(npage); 9714f16fb0fSJaegeuk Kim 972205b9822SJaegeuk Kim f2fs_i_xnid_write(inode, 0); 97365985d93SJaegeuk Kim 9744f16fb0fSJaegeuk Kim set_new_dnode(&dn, inode, page, npage, nid); 9754f16fb0fSJaegeuk Kim 9764f16fb0fSJaegeuk Kim if (page) 97701d2d1aaSChao Yu dn.inode_page_locked = true; 9784f16fb0fSJaegeuk Kim truncate_node(&dn); 9794f16fb0fSJaegeuk Kim return 0; 9804f16fb0fSJaegeuk Kim } 9814f16fb0fSJaegeuk Kim 98239936837SJaegeuk Kim /* 9834f4124d0SChao Yu * Caller should grab and release a rwsem by calling f2fs_lock_op() and 9844f4124d0SChao Yu * f2fs_unlock_op(). 98539936837SJaegeuk Kim */ 98613ec7297SChao Yu int remove_inode_page(struct inode *inode) 987e05df3b1SJaegeuk Kim { 988e05df3b1SJaegeuk Kim struct dnode_of_data dn; 98913ec7297SChao Yu int err; 990e05df3b1SJaegeuk Kim 991c2e69583SJaegeuk Kim set_new_dnode(&dn, inode, NULL, NULL, inode->i_ino); 99213ec7297SChao Yu err = get_dnode_of_data(&dn, 0, LOOKUP_NODE); 99313ec7297SChao Yu if (err) 99413ec7297SChao Yu return err; 995e05df3b1SJaegeuk Kim 99613ec7297SChao Yu err = truncate_xattr_node(inode, dn.inode_page); 99713ec7297SChao Yu if (err) { 998c2e69583SJaegeuk Kim f2fs_put_dnode(&dn); 99913ec7297SChao Yu return err; 1000e05df3b1SJaegeuk Kim } 1001c2e69583SJaegeuk Kim 1002c2e69583SJaegeuk Kim /* remove potential inline_data blocks */ 1003c2e69583SJaegeuk Kim if (S_ISREG(inode->i_mode) || S_ISDIR(inode->i_mode) || 1004c2e69583SJaegeuk Kim S_ISLNK(inode->i_mode)) 1005c2e69583SJaegeuk Kim truncate_data_blocks_range(&dn, 1); 1006c2e69583SJaegeuk Kim 1007e1c42045Sarter97 /* 0 is possible, after f2fs_new_inode() has failed */ 10089850cf4aSJaegeuk Kim f2fs_bug_on(F2FS_I_SB(inode), 10099850cf4aSJaegeuk Kim inode->i_blocks != 0 && inode->i_blocks != 1); 1010c2e69583SJaegeuk Kim 1011c2e69583SJaegeuk Kim /* will put inode & node pages */ 1012e05df3b1SJaegeuk Kim truncate_node(&dn); 101313ec7297SChao Yu return 0; 1014e05df3b1SJaegeuk Kim } 1015e05df3b1SJaegeuk Kim 1016a014e037SJaegeuk Kim struct page *new_inode_page(struct inode *inode) 1017e05df3b1SJaegeuk Kim { 1018e05df3b1SJaegeuk Kim struct dnode_of_data dn; 1019e05df3b1SJaegeuk Kim 1020e05df3b1SJaegeuk Kim /* allocate inode page for new inode */ 1021e05df3b1SJaegeuk Kim set_new_dnode(&dn, inode, NULL, NULL, inode->i_ino); 102244a83ff6SJaegeuk Kim 102344a83ff6SJaegeuk Kim /* caller should f2fs_put_page(page, 1); */ 10248ae8f162SJaegeuk Kim return new_node_page(&dn, 0, NULL); 1025e05df3b1SJaegeuk Kim } 1026e05df3b1SJaegeuk Kim 10278ae8f162SJaegeuk Kim struct page *new_node_page(struct dnode_of_data *dn, 10288ae8f162SJaegeuk Kim unsigned int ofs, struct page *ipage) 1029e05df3b1SJaegeuk Kim { 10304081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode); 103125cc5d3bSJaegeuk Kim struct node_info new_ni; 1032e05df3b1SJaegeuk Kim struct page *page; 1033e05df3b1SJaegeuk Kim int err; 1034e05df3b1SJaegeuk Kim 103591942321SJaegeuk Kim if (unlikely(is_inode_flag_set(dn->inode, FI_NO_ALLOC))) 1036e05df3b1SJaegeuk Kim return ERR_PTR(-EPERM); 1037e05df3b1SJaegeuk Kim 1038300e129cSJaegeuk Kim page = f2fs_grab_cache_page(NODE_MAPPING(sbi), dn->nid, false); 1039e05df3b1SJaegeuk Kim if (!page) 1040e05df3b1SJaegeuk Kim return ERR_PTR(-ENOMEM); 1041e05df3b1SJaegeuk Kim 10426bacf52fSJaegeuk Kim if (unlikely(!inc_valid_node_count(sbi, dn->inode))) { 10439c02740cSJaegeuk Kim err = -ENOSPC; 10449c02740cSJaegeuk Kim goto fail; 10459c02740cSJaegeuk Kim } 104625cc5d3bSJaegeuk Kim #ifdef CONFIG_F2FS_CHECK_FS 104725cc5d3bSJaegeuk Kim get_node_info(sbi, dn->nid, &new_ni); 104825cc5d3bSJaegeuk Kim f2fs_bug_on(sbi, new_ni.blk_addr != NULL_ADDR); 104925cc5d3bSJaegeuk Kim #endif 105025cc5d3bSJaegeuk Kim new_ni.nid = dn->nid; 1051e05df3b1SJaegeuk Kim new_ni.ino = dn->inode->i_ino; 105225cc5d3bSJaegeuk Kim new_ni.blk_addr = NULL_ADDR; 105325cc5d3bSJaegeuk Kim new_ni.flag = 0; 105425cc5d3bSJaegeuk Kim new_ni.version = 0; 1055479f40c4SJaegeuk Kim set_node_addr(sbi, &new_ni, NEW_ADDR, false); 10569c02740cSJaegeuk Kim 1057fec1d657SJaegeuk Kim f2fs_wait_on_page_writeback(page, NODE, true); 10589c02740cSJaegeuk Kim fill_node_footer(page, dn->nid, dn->inode->i_ino, ofs, true); 1059398b1ac5SJaegeuk Kim set_cold_node(dn->inode, page); 1060237c0790SJaegeuk Kim if (!PageUptodate(page)) 10619c02740cSJaegeuk Kim SetPageUptodate(page); 106212719ae1SJaegeuk Kim if (set_page_dirty(page)) 106312719ae1SJaegeuk Kim dn->node_changed = true; 1064e05df3b1SJaegeuk Kim 10654bc8e9bcSChao Yu if (f2fs_has_xattr_block(ofs)) 1066205b9822SJaegeuk Kim f2fs_i_xnid_write(dn->inode, dn->nid); 1067479bd73aSJaegeuk Kim 1068e05df3b1SJaegeuk Kim if (ofs == 0) 1069e05df3b1SJaegeuk Kim inc_valid_inode_count(sbi); 1070e05df3b1SJaegeuk Kim return page; 1071e05df3b1SJaegeuk Kim 1072e05df3b1SJaegeuk Kim fail: 107371e9fec5SJaegeuk Kim clear_node_page_dirty(page); 1074e05df3b1SJaegeuk Kim f2fs_put_page(page, 1); 1075e05df3b1SJaegeuk Kim return ERR_PTR(err); 1076e05df3b1SJaegeuk Kim } 1077e05df3b1SJaegeuk Kim 107856ae674cSJaegeuk Kim /* 107956ae674cSJaegeuk Kim * Caller should do after getting the following values. 108056ae674cSJaegeuk Kim * 0: f2fs_put_page(page, 0) 108186531d6bSJaegeuk Kim * LOCKED_PAGE or error: f2fs_put_page(page, 1) 108256ae674cSJaegeuk Kim */ 108304d328deSMike Christie static int read_node_page(struct page *page, int op_flags) 1084e05df3b1SJaegeuk Kim { 10854081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_P_SB(page); 1086e05df3b1SJaegeuk Kim struct node_info ni; 1087cf04e8ebSJaegeuk Kim struct f2fs_io_info fio = { 108805ca3632SJaegeuk Kim .sbi = sbi, 1089cf04e8ebSJaegeuk Kim .type = NODE, 109004d328deSMike Christie .op = REQ_OP_READ, 109104d328deSMike Christie .op_flags = op_flags, 109205ca3632SJaegeuk Kim .page = page, 10934375a336SJaegeuk Kim .encrypted_page = NULL, 1094cf04e8ebSJaegeuk Kim }; 1095e05df3b1SJaegeuk Kim 10963bdad3c7SJaegeuk Kim if (PageUptodate(page)) 10973bdad3c7SJaegeuk Kim return LOCKED_PAGE; 10983bdad3c7SJaegeuk Kim 1099e05df3b1SJaegeuk Kim get_node_info(sbi, page->index, &ni); 1100e05df3b1SJaegeuk Kim 11016bacf52fSJaegeuk Kim if (unlikely(ni.blk_addr == NULL_ADDR)) { 11022bca1e23SJaegeuk Kim ClearPageUptodate(page); 1103e05df3b1SJaegeuk Kim return -ENOENT; 1104393ff91fSJaegeuk Kim } 1105393ff91fSJaegeuk Kim 11067a9d7548SChao Yu fio.new_blkaddr = fio.old_blkaddr = ni.blk_addr; 110705ca3632SJaegeuk Kim return f2fs_submit_page_bio(&fio); 1108e05df3b1SJaegeuk Kim } 1109e05df3b1SJaegeuk Kim 11100a8165d7SJaegeuk Kim /* 1111e05df3b1SJaegeuk Kim * Readahead a node page 1112e05df3b1SJaegeuk Kim */ 1113e05df3b1SJaegeuk Kim void ra_node_page(struct f2fs_sb_info *sbi, nid_t nid) 1114e05df3b1SJaegeuk Kim { 1115e05df3b1SJaegeuk Kim struct page *apage; 111656ae674cSJaegeuk Kim int err; 1117e05df3b1SJaegeuk Kim 1118e8458725SChao Yu if (!nid) 1119e8458725SChao Yu return; 1120e8458725SChao Yu f2fs_bug_on(sbi, check_nid_range(sbi, nid)); 1121e8458725SChao Yu 1122999270deSFan Li rcu_read_lock(); 1123999270deSFan Li apage = radix_tree_lookup(&NODE_MAPPING(sbi)->page_tree, nid); 1124999270deSFan Li rcu_read_unlock(); 1125999270deSFan Li if (apage) 1126393ff91fSJaegeuk Kim return; 1127e05df3b1SJaegeuk Kim 1128300e129cSJaegeuk Kim apage = f2fs_grab_cache_page(NODE_MAPPING(sbi), nid, false); 1129e05df3b1SJaegeuk Kim if (!apage) 1130e05df3b1SJaegeuk Kim return; 1131e05df3b1SJaegeuk Kim 113270246286SChristoph Hellwig err = read_node_page(apage, REQ_RAHEAD); 113386531d6bSJaegeuk Kim f2fs_put_page(apage, err ? 1 : 0); 1134e05df3b1SJaegeuk Kim } 1135e05df3b1SJaegeuk Kim 113617a0ee55SJaegeuk Kim static struct page *__get_node_page(struct f2fs_sb_info *sbi, pgoff_t nid, 11370e022ea8SChao Yu struct page *parent, int start) 1138e05df3b1SJaegeuk Kim { 113956ae674cSJaegeuk Kim struct page *page; 114056ae674cSJaegeuk Kim int err; 11414aa69d56SJaegeuk Kim 11424aa69d56SJaegeuk Kim if (!nid) 11434aa69d56SJaegeuk Kim return ERR_PTR(-ENOENT); 11444aa69d56SJaegeuk Kim f2fs_bug_on(sbi, check_nid_range(sbi, nid)); 1145afcb7ca0SJaegeuk Kim repeat: 1146300e129cSJaegeuk Kim page = f2fs_grab_cache_page(NODE_MAPPING(sbi), nid, false); 1147e05df3b1SJaegeuk Kim if (!page) 1148e05df3b1SJaegeuk Kim return ERR_PTR(-ENOMEM); 1149e05df3b1SJaegeuk Kim 115070fd7614SChristoph Hellwig err = read_node_page(page, 0); 115186531d6bSJaegeuk Kim if (err < 0) { 115286531d6bSJaegeuk Kim f2fs_put_page(page, 1); 1153e05df3b1SJaegeuk Kim return ERR_PTR(err); 1154e1c51b9fSChao Yu } else if (err == LOCKED_PAGE) { 1155e1c51b9fSChao Yu goto page_hit; 115686531d6bSJaegeuk Kim } 1157aaf96075SJaegeuk Kim 11580e022ea8SChao Yu if (parent) 115979344efbSJaegeuk Kim ra_node_pages(parent, start + 1, MAX_RA_NODE); 11600e022ea8SChao Yu 1161e1c51b9fSChao Yu lock_page(page); 1162e1c51b9fSChao Yu 11634ef51a8fSJaegeuk Kim if (unlikely(page->mapping != NODE_MAPPING(sbi))) { 1164afcb7ca0SJaegeuk Kim f2fs_put_page(page, 1); 1165afcb7ca0SJaegeuk Kim goto repeat; 1166afcb7ca0SJaegeuk Kim } 11671563ac75SChao Yu 11681563ac75SChao Yu if (unlikely(!PageUptodate(page))) 11691563ac75SChao Yu goto out_err; 1170e1c51b9fSChao Yu page_hit: 11710c9df7fbSYunlong Song if(unlikely(nid != nid_of_node(page))) { 11720c9df7fbSYunlong Song f2fs_bug_on(sbi, 1); 11730c9df7fbSYunlong Song ClearPageUptodate(page); 11740c9df7fbSYunlong Song out_err: 11750c9df7fbSYunlong Song f2fs_put_page(page, 1); 11760c9df7fbSYunlong Song return ERR_PTR(-EIO); 11770c9df7fbSYunlong Song } 1178e05df3b1SJaegeuk Kim return page; 1179e05df3b1SJaegeuk Kim } 1180e05df3b1SJaegeuk Kim 11810e022ea8SChao Yu struct page *get_node_page(struct f2fs_sb_info *sbi, pgoff_t nid) 11820e022ea8SChao Yu { 11830e022ea8SChao Yu return __get_node_page(sbi, nid, NULL, 0); 11840e022ea8SChao Yu } 11850e022ea8SChao Yu 1186e05df3b1SJaegeuk Kim struct page *get_node_page_ra(struct page *parent, int start) 1187e05df3b1SJaegeuk Kim { 11884081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_P_SB(parent); 11890e022ea8SChao Yu nid_t nid = get_nid(parent, start, false); 1190e05df3b1SJaegeuk Kim 11910e022ea8SChao Yu return __get_node_page(sbi, nid, parent, start); 1192e05df3b1SJaegeuk Kim } 1193e05df3b1SJaegeuk Kim 11942049d4fcSJaegeuk Kim static void flush_inline_data(struct f2fs_sb_info *sbi, nid_t ino) 11952049d4fcSJaegeuk Kim { 11962049d4fcSJaegeuk Kim struct inode *inode; 11972049d4fcSJaegeuk Kim struct page *page; 11980f3311a8SChao Yu int ret; 11992049d4fcSJaegeuk Kim 12002049d4fcSJaegeuk Kim /* should flush inline_data before evict_inode */ 12012049d4fcSJaegeuk Kim inode = ilookup(sbi->sb, ino); 12022049d4fcSJaegeuk Kim if (!inode) 12032049d4fcSJaegeuk Kim return; 12042049d4fcSJaegeuk Kim 12054a6de50dSJaegeuk Kim page = pagecache_get_page(inode->i_mapping, 0, FGP_LOCK|FGP_NOWAIT, 0); 12062049d4fcSJaegeuk Kim if (!page) 12072049d4fcSJaegeuk Kim goto iput_out; 12082049d4fcSJaegeuk Kim 12092049d4fcSJaegeuk Kim if (!PageUptodate(page)) 12102049d4fcSJaegeuk Kim goto page_out; 12112049d4fcSJaegeuk Kim 12122049d4fcSJaegeuk Kim if (!PageDirty(page)) 12132049d4fcSJaegeuk Kim goto page_out; 12142049d4fcSJaegeuk Kim 12152049d4fcSJaegeuk Kim if (!clear_page_dirty_for_io(page)) 12162049d4fcSJaegeuk Kim goto page_out; 12172049d4fcSJaegeuk Kim 12180f3311a8SChao Yu ret = f2fs_write_inline_data(inode, page); 12192049d4fcSJaegeuk Kim inode_dec_dirty_pages(inode); 1220933439c8SChao Yu remove_dirty_inode(inode); 12210f3311a8SChao Yu if (ret) 12222049d4fcSJaegeuk Kim set_page_dirty(page); 12232049d4fcSJaegeuk Kim page_out: 12244a6de50dSJaegeuk Kim f2fs_put_page(page, 1); 12252049d4fcSJaegeuk Kim iput_out: 12262049d4fcSJaegeuk Kim iput(inode); 12272049d4fcSJaegeuk Kim } 12282049d4fcSJaegeuk Kim 1229da011cc0SChao Yu void move_node_page(struct page *node_page, int gc_type) 1230da011cc0SChao Yu { 1231da011cc0SChao Yu if (gc_type == FG_GC) { 1232da011cc0SChao Yu struct f2fs_sb_info *sbi = F2FS_P_SB(node_page); 1233da011cc0SChao Yu struct writeback_control wbc = { 1234da011cc0SChao Yu .sync_mode = WB_SYNC_ALL, 1235da011cc0SChao Yu .nr_to_write = 1, 1236da011cc0SChao Yu .for_reclaim = 0, 1237da011cc0SChao Yu }; 1238da011cc0SChao Yu 1239da011cc0SChao Yu set_page_dirty(node_page); 1240da011cc0SChao Yu f2fs_wait_on_page_writeback(node_page, NODE, true); 1241da011cc0SChao Yu 1242da011cc0SChao Yu f2fs_bug_on(sbi, PageWriteback(node_page)); 1243da011cc0SChao Yu if (!clear_page_dirty_for_io(node_page)) 1244da011cc0SChao Yu goto out_page; 1245da011cc0SChao Yu 1246da011cc0SChao Yu if (NODE_MAPPING(sbi)->a_ops->writepage(node_page, &wbc)) 1247da011cc0SChao Yu unlock_page(node_page); 1248da011cc0SChao Yu goto release_page; 1249da011cc0SChao Yu } else { 1250da011cc0SChao Yu /* set page dirty and write it */ 1251da011cc0SChao Yu if (!PageWriteback(node_page)) 1252da011cc0SChao Yu set_page_dirty(node_page); 1253da011cc0SChao Yu } 1254da011cc0SChao Yu out_page: 1255da011cc0SChao Yu unlock_page(node_page); 1256da011cc0SChao Yu release_page: 1257da011cc0SChao Yu f2fs_put_page(node_page, 0); 1258da011cc0SChao Yu } 1259da011cc0SChao Yu 1260608514deSJaegeuk Kim static struct page *last_fsync_dnode(struct f2fs_sb_info *sbi, nid_t ino) 1261e05df3b1SJaegeuk Kim { 1262e05df3b1SJaegeuk Kim pgoff_t index, end; 1263e05df3b1SJaegeuk Kim struct pagevec pvec; 1264608514deSJaegeuk Kim struct page *last_page = NULL; 126552681375SJaegeuk Kim 126652681375SJaegeuk Kim pagevec_init(&pvec, 0); 126752681375SJaegeuk Kim index = 0; 126852681375SJaegeuk Kim end = ULONG_MAX; 126952681375SJaegeuk Kim 127052681375SJaegeuk Kim while (index <= end) { 127152681375SJaegeuk Kim int i, nr_pages; 127252681375SJaegeuk Kim nr_pages = pagevec_lookup_tag(&pvec, NODE_MAPPING(sbi), &index, 127352681375SJaegeuk Kim PAGECACHE_TAG_DIRTY, 127452681375SJaegeuk Kim min(end - index, (pgoff_t)PAGEVEC_SIZE-1) + 1); 127552681375SJaegeuk Kim if (nr_pages == 0) 127652681375SJaegeuk Kim break; 127752681375SJaegeuk Kim 127852681375SJaegeuk Kim for (i = 0; i < nr_pages; i++) { 127952681375SJaegeuk Kim struct page *page = pvec.pages[i]; 128052681375SJaegeuk Kim 128152681375SJaegeuk Kim if (unlikely(f2fs_cp_error(sbi))) { 1282608514deSJaegeuk Kim f2fs_put_page(last_page, 0); 128352681375SJaegeuk Kim pagevec_release(&pvec); 1284608514deSJaegeuk Kim return ERR_PTR(-EIO); 128552681375SJaegeuk Kim } 128652681375SJaegeuk Kim 128752681375SJaegeuk Kim if (!IS_DNODE(page) || !is_cold_node(page)) 128852681375SJaegeuk Kim continue; 128952681375SJaegeuk Kim if (ino_of_node(page) != ino) 129052681375SJaegeuk Kim continue; 129152681375SJaegeuk Kim 129252681375SJaegeuk Kim lock_page(page); 129352681375SJaegeuk Kim 129452681375SJaegeuk Kim if (unlikely(page->mapping != NODE_MAPPING(sbi))) { 129552681375SJaegeuk Kim continue_unlock: 129652681375SJaegeuk Kim unlock_page(page); 129752681375SJaegeuk Kim continue; 129852681375SJaegeuk Kim } 129952681375SJaegeuk Kim if (ino_of_node(page) != ino) 130052681375SJaegeuk Kim goto continue_unlock; 130152681375SJaegeuk Kim 130252681375SJaegeuk Kim if (!PageDirty(page)) { 130352681375SJaegeuk Kim /* someone wrote it for us */ 130452681375SJaegeuk Kim goto continue_unlock; 130552681375SJaegeuk Kim } 130652681375SJaegeuk Kim 1307608514deSJaegeuk Kim if (last_page) 1308608514deSJaegeuk Kim f2fs_put_page(last_page, 0); 1309608514deSJaegeuk Kim 1310608514deSJaegeuk Kim get_page(page); 1311608514deSJaegeuk Kim last_page = page; 1312608514deSJaegeuk Kim unlock_page(page); 1313608514deSJaegeuk Kim } 1314608514deSJaegeuk Kim pagevec_release(&pvec); 1315608514deSJaegeuk Kim cond_resched(); 1316608514deSJaegeuk Kim } 1317608514deSJaegeuk Kim return last_page; 1318608514deSJaegeuk Kim } 1319608514deSJaegeuk Kim 1320d68f735bSJaegeuk Kim static int __write_node_page(struct page *page, bool atomic, bool *submitted, 1321faa24895SJaegeuk Kim struct writeback_control *wbc) 1322faa24895SJaegeuk Kim { 1323faa24895SJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_P_SB(page); 1324faa24895SJaegeuk Kim nid_t nid; 1325faa24895SJaegeuk Kim struct node_info ni; 1326faa24895SJaegeuk Kim struct f2fs_io_info fio = { 1327faa24895SJaegeuk Kim .sbi = sbi, 1328faa24895SJaegeuk Kim .type = NODE, 1329faa24895SJaegeuk Kim .op = REQ_OP_WRITE, 1330faa24895SJaegeuk Kim .op_flags = wbc_to_write_flags(wbc), 1331faa24895SJaegeuk Kim .page = page, 1332faa24895SJaegeuk Kim .encrypted_page = NULL, 1333d68f735bSJaegeuk Kim .submitted = false, 1334faa24895SJaegeuk Kim }; 1335faa24895SJaegeuk Kim 1336faa24895SJaegeuk Kim trace_f2fs_writepage(page, NODE); 1337faa24895SJaegeuk Kim 1338faa24895SJaegeuk Kim if (unlikely(is_sbi_flag_set(sbi, SBI_POR_DOING))) 1339faa24895SJaegeuk Kim goto redirty_out; 1340faa24895SJaegeuk Kim if (unlikely(f2fs_cp_error(sbi))) 1341faa24895SJaegeuk Kim goto redirty_out; 1342faa24895SJaegeuk Kim 1343faa24895SJaegeuk Kim /* get old block addr of this node page */ 1344faa24895SJaegeuk Kim nid = nid_of_node(page); 1345faa24895SJaegeuk Kim f2fs_bug_on(sbi, page->index != nid); 1346faa24895SJaegeuk Kim 1347faa24895SJaegeuk Kim if (wbc->for_reclaim) { 1348faa24895SJaegeuk Kim if (!down_read_trylock(&sbi->node_write)) 1349faa24895SJaegeuk Kim goto redirty_out; 1350faa24895SJaegeuk Kim } else { 1351faa24895SJaegeuk Kim down_read(&sbi->node_write); 1352faa24895SJaegeuk Kim } 1353faa24895SJaegeuk Kim 1354faa24895SJaegeuk Kim get_node_info(sbi, nid, &ni); 1355faa24895SJaegeuk Kim 1356faa24895SJaegeuk Kim /* This page is already truncated */ 1357faa24895SJaegeuk Kim if (unlikely(ni.blk_addr == NULL_ADDR)) { 1358faa24895SJaegeuk Kim ClearPageUptodate(page); 1359faa24895SJaegeuk Kim dec_page_count(sbi, F2FS_DIRTY_NODES); 1360faa24895SJaegeuk Kim up_read(&sbi->node_write); 1361faa24895SJaegeuk Kim unlock_page(page); 1362faa24895SJaegeuk Kim return 0; 1363faa24895SJaegeuk Kim } 1364faa24895SJaegeuk Kim 1365e7c75ab0SJaegeuk Kim if (atomic && !test_opt(sbi, NOBARRIER)) 1366e7c75ab0SJaegeuk Kim fio.op_flags |= REQ_PREFLUSH | REQ_FUA; 1367e7c75ab0SJaegeuk Kim 1368faa24895SJaegeuk Kim set_page_writeback(page); 1369faa24895SJaegeuk Kim fio.old_blkaddr = ni.blk_addr; 1370faa24895SJaegeuk Kim write_node_page(nid, &fio); 1371faa24895SJaegeuk Kim set_node_addr(sbi, &ni, fio.new_blkaddr, is_fsync_dnode(page)); 1372faa24895SJaegeuk Kim dec_page_count(sbi, F2FS_DIRTY_NODES); 1373faa24895SJaegeuk Kim up_read(&sbi->node_write); 1374faa24895SJaegeuk Kim 1375d68f735bSJaegeuk Kim if (wbc->for_reclaim) { 1376b9109b0eSJaegeuk Kim f2fs_submit_merged_write_cond(sbi, page->mapping->host, 0, 1377b9109b0eSJaegeuk Kim page->index, NODE); 1378d68f735bSJaegeuk Kim submitted = NULL; 1379d68f735bSJaegeuk Kim } 1380faa24895SJaegeuk Kim 1381faa24895SJaegeuk Kim unlock_page(page); 1382faa24895SJaegeuk Kim 1383d68f735bSJaegeuk Kim if (unlikely(f2fs_cp_error(sbi))) { 1384b9109b0eSJaegeuk Kim f2fs_submit_merged_write(sbi, NODE); 1385d68f735bSJaegeuk Kim submitted = NULL; 1386d68f735bSJaegeuk Kim } 1387d68f735bSJaegeuk Kim if (submitted) 1388d68f735bSJaegeuk Kim *submitted = fio.submitted; 1389faa24895SJaegeuk Kim 1390faa24895SJaegeuk Kim return 0; 1391faa24895SJaegeuk Kim 1392faa24895SJaegeuk Kim redirty_out: 1393faa24895SJaegeuk Kim redirty_page_for_writepage(wbc, page); 1394faa24895SJaegeuk Kim return AOP_WRITEPAGE_ACTIVATE; 1395faa24895SJaegeuk Kim } 1396faa24895SJaegeuk Kim 1397faa24895SJaegeuk Kim static int f2fs_write_node_page(struct page *page, 1398faa24895SJaegeuk Kim struct writeback_control *wbc) 1399faa24895SJaegeuk Kim { 1400d68f735bSJaegeuk Kim return __write_node_page(page, false, NULL, wbc); 1401faa24895SJaegeuk Kim } 1402faa24895SJaegeuk Kim 140326de9b11SJaegeuk Kim int fsync_node_pages(struct f2fs_sb_info *sbi, struct inode *inode, 1404608514deSJaegeuk Kim struct writeback_control *wbc, bool atomic) 1405608514deSJaegeuk Kim { 1406608514deSJaegeuk Kim pgoff_t index, end; 1407942fd319SJaegeuk Kim pgoff_t last_idx = ULONG_MAX; 1408608514deSJaegeuk Kim struct pagevec pvec; 1409608514deSJaegeuk Kim int ret = 0; 1410608514deSJaegeuk Kim struct page *last_page = NULL; 1411608514deSJaegeuk Kim bool marked = false; 141226de9b11SJaegeuk Kim nid_t ino = inode->i_ino; 1413608514deSJaegeuk Kim 1414608514deSJaegeuk Kim if (atomic) { 1415608514deSJaegeuk Kim last_page = last_fsync_dnode(sbi, ino); 1416608514deSJaegeuk Kim if (IS_ERR_OR_NULL(last_page)) 1417608514deSJaegeuk Kim return PTR_ERR_OR_ZERO(last_page); 1418608514deSJaegeuk Kim } 1419608514deSJaegeuk Kim retry: 1420608514deSJaegeuk Kim pagevec_init(&pvec, 0); 1421608514deSJaegeuk Kim index = 0; 1422608514deSJaegeuk Kim end = ULONG_MAX; 1423608514deSJaegeuk Kim 1424608514deSJaegeuk Kim while (index <= end) { 1425608514deSJaegeuk Kim int i, nr_pages; 1426608514deSJaegeuk Kim nr_pages = pagevec_lookup_tag(&pvec, NODE_MAPPING(sbi), &index, 1427608514deSJaegeuk Kim PAGECACHE_TAG_DIRTY, 1428608514deSJaegeuk Kim min(end - index, (pgoff_t)PAGEVEC_SIZE-1) + 1); 1429608514deSJaegeuk Kim if (nr_pages == 0) 1430608514deSJaegeuk Kim break; 1431608514deSJaegeuk Kim 1432608514deSJaegeuk Kim for (i = 0; i < nr_pages; i++) { 1433608514deSJaegeuk Kim struct page *page = pvec.pages[i]; 1434d68f735bSJaegeuk Kim bool submitted = false; 1435608514deSJaegeuk Kim 1436608514deSJaegeuk Kim if (unlikely(f2fs_cp_error(sbi))) { 1437608514deSJaegeuk Kim f2fs_put_page(last_page, 0); 1438608514deSJaegeuk Kim pagevec_release(&pvec); 14399de69279SChao Yu ret = -EIO; 14409de69279SChao Yu goto out; 1441608514deSJaegeuk Kim } 1442608514deSJaegeuk Kim 1443608514deSJaegeuk Kim if (!IS_DNODE(page) || !is_cold_node(page)) 1444608514deSJaegeuk Kim continue; 1445608514deSJaegeuk Kim if (ino_of_node(page) != ino) 1446608514deSJaegeuk Kim continue; 1447608514deSJaegeuk Kim 1448608514deSJaegeuk Kim lock_page(page); 1449608514deSJaegeuk Kim 1450608514deSJaegeuk Kim if (unlikely(page->mapping != NODE_MAPPING(sbi))) { 1451608514deSJaegeuk Kim continue_unlock: 1452608514deSJaegeuk Kim unlock_page(page); 1453608514deSJaegeuk Kim continue; 1454608514deSJaegeuk Kim } 1455608514deSJaegeuk Kim if (ino_of_node(page) != ino) 145652681375SJaegeuk Kim goto continue_unlock; 145752681375SJaegeuk Kim 1458608514deSJaegeuk Kim if (!PageDirty(page) && page != last_page) { 1459608514deSJaegeuk Kim /* someone wrote it for us */ 1460608514deSJaegeuk Kim goto continue_unlock; 1461608514deSJaegeuk Kim } 1462608514deSJaegeuk Kim 1463608514deSJaegeuk Kim f2fs_wait_on_page_writeback(page, NODE, true); 1464608514deSJaegeuk Kim BUG_ON(PageWriteback(page)); 1465608514deSJaegeuk Kim 1466d29fd172SJaegeuk Kim set_fsync_mark(page, 0); 1467d29fd172SJaegeuk Kim set_dentry_mark(page, 0); 1468d29fd172SJaegeuk Kim 1469608514deSJaegeuk Kim if (!atomic || page == last_page) { 147052681375SJaegeuk Kim set_fsync_mark(page, 1); 147126de9b11SJaegeuk Kim if (IS_INODE(page)) { 147226de9b11SJaegeuk Kim if (is_inode_flag_set(inode, 147326de9b11SJaegeuk Kim FI_DIRTY_INODE)) 147426de9b11SJaegeuk Kim update_inode(inode, page); 147552681375SJaegeuk Kim set_dentry_mark(page, 147652681375SJaegeuk Kim need_dentry_mark(sbi, ino)); 147726de9b11SJaegeuk Kim } 1478608514deSJaegeuk Kim /* may be written by other thread */ 1479608514deSJaegeuk Kim if (!PageDirty(page)) 1480608514deSJaegeuk Kim set_page_dirty(page); 1481608514deSJaegeuk Kim } 1482608514deSJaegeuk Kim 1483608514deSJaegeuk Kim if (!clear_page_dirty_for_io(page)) 1484608514deSJaegeuk Kim goto continue_unlock; 148552681375SJaegeuk Kim 1486e7c75ab0SJaegeuk Kim ret = __write_node_page(page, atomic && 1487d68f735bSJaegeuk Kim page == last_page, 1488d68f735bSJaegeuk Kim &submitted, wbc); 1489c267ec15SJaegeuk Kim if (ret) { 149052681375SJaegeuk Kim unlock_page(page); 1491608514deSJaegeuk Kim f2fs_put_page(last_page, 0); 1492608514deSJaegeuk Kim break; 1493d68f735bSJaegeuk Kim } else if (submitted) { 1494942fd319SJaegeuk Kim last_idx = page->index; 1495608514deSJaegeuk Kim } 14963f5f4959SChao Yu 1497608514deSJaegeuk Kim if (page == last_page) { 1498608514deSJaegeuk Kim f2fs_put_page(page, 0); 1499608514deSJaegeuk Kim marked = true; 150052681375SJaegeuk Kim break; 150152681375SJaegeuk Kim } 1502c267ec15SJaegeuk Kim } 150352681375SJaegeuk Kim pagevec_release(&pvec); 150452681375SJaegeuk Kim cond_resched(); 150552681375SJaegeuk Kim 1506608514deSJaegeuk Kim if (ret || marked) 150752681375SJaegeuk Kim break; 150852681375SJaegeuk Kim } 1509608514deSJaegeuk Kim if (!ret && atomic && !marked) { 1510608514deSJaegeuk Kim f2fs_msg(sbi->sb, KERN_DEBUG, 1511608514deSJaegeuk Kim "Retry to write fsync mark: ino=%u, idx=%lx", 1512608514deSJaegeuk Kim ino, last_page->index); 1513608514deSJaegeuk Kim lock_page(last_page); 1514d40a43afSYunlei He f2fs_wait_on_page_writeback(last_page, NODE, true); 1515608514deSJaegeuk Kim set_page_dirty(last_page); 1516608514deSJaegeuk Kim unlock_page(last_page); 1517608514deSJaegeuk Kim goto retry; 1518608514deSJaegeuk Kim } 15199de69279SChao Yu out: 1520942fd319SJaegeuk Kim if (last_idx != ULONG_MAX) 1521b9109b0eSJaegeuk Kim f2fs_submit_merged_write_cond(sbi, NULL, ino, last_idx, NODE); 1522c267ec15SJaegeuk Kim return ret ? -EIO: 0; 152352681375SJaegeuk Kim } 152452681375SJaegeuk Kim 152552681375SJaegeuk Kim int sync_node_pages(struct f2fs_sb_info *sbi, struct writeback_control *wbc) 152652681375SJaegeuk Kim { 152752681375SJaegeuk Kim pgoff_t index, end; 152852681375SJaegeuk Kim struct pagevec pvec; 152952681375SJaegeuk Kim int step = 0; 153012bb0a8fSJaegeuk Kim int nwritten = 0; 15313f5f4959SChao Yu int ret = 0; 1532e05df3b1SJaegeuk Kim 1533e05df3b1SJaegeuk Kim pagevec_init(&pvec, 0); 1534e05df3b1SJaegeuk Kim 1535e05df3b1SJaegeuk Kim next_step: 1536e05df3b1SJaegeuk Kim index = 0; 153780dd9c0eSChao Yu end = ULONG_MAX; 1538e05df3b1SJaegeuk Kim 1539e05df3b1SJaegeuk Kim while (index <= end) { 1540e05df3b1SJaegeuk Kim int i, nr_pages; 15414ef51a8fSJaegeuk Kim nr_pages = pagevec_lookup_tag(&pvec, NODE_MAPPING(sbi), &index, 1542e05df3b1SJaegeuk Kim PAGECACHE_TAG_DIRTY, 1543e05df3b1SJaegeuk Kim min(end - index, (pgoff_t)PAGEVEC_SIZE-1) + 1); 1544e05df3b1SJaegeuk Kim if (nr_pages == 0) 1545e05df3b1SJaegeuk Kim break; 1546e05df3b1SJaegeuk Kim 1547e05df3b1SJaegeuk Kim for (i = 0; i < nr_pages; i++) { 1548e05df3b1SJaegeuk Kim struct page *page = pvec.pages[i]; 1549d68f735bSJaegeuk Kim bool submitted = false; 1550e05df3b1SJaegeuk Kim 15516d5a1495SChao Yu if (unlikely(f2fs_cp_error(sbi))) { 15526d5a1495SChao Yu pagevec_release(&pvec); 15533f5f4959SChao Yu ret = -EIO; 15543f5f4959SChao Yu goto out; 15556d5a1495SChao Yu } 15566d5a1495SChao Yu 1557e05df3b1SJaegeuk Kim /* 1558e05df3b1SJaegeuk Kim * flushing sequence with step: 1559e05df3b1SJaegeuk Kim * 0. indirect nodes 1560e05df3b1SJaegeuk Kim * 1. dentry dnodes 1561e05df3b1SJaegeuk Kim * 2. file dnodes 1562e05df3b1SJaegeuk Kim */ 1563e05df3b1SJaegeuk Kim if (step == 0 && IS_DNODE(page)) 1564e05df3b1SJaegeuk Kim continue; 1565e05df3b1SJaegeuk Kim if (step == 1 && (!IS_DNODE(page) || 1566e05df3b1SJaegeuk Kim is_cold_node(page))) 1567e05df3b1SJaegeuk Kim continue; 1568e05df3b1SJaegeuk Kim if (step == 2 && (!IS_DNODE(page) || 1569e05df3b1SJaegeuk Kim !is_cold_node(page))) 1570e05df3b1SJaegeuk Kim continue; 15719a4cbc9eSChao Yu lock_node: 157252681375SJaegeuk Kim if (!trylock_page(page)) 1573e05df3b1SJaegeuk Kim continue; 1574e05df3b1SJaegeuk Kim 15754ef51a8fSJaegeuk Kim if (unlikely(page->mapping != NODE_MAPPING(sbi))) { 1576e05df3b1SJaegeuk Kim continue_unlock: 1577e05df3b1SJaegeuk Kim unlock_page(page); 1578e05df3b1SJaegeuk Kim continue; 1579e05df3b1SJaegeuk Kim } 1580e05df3b1SJaegeuk Kim 1581e05df3b1SJaegeuk Kim if (!PageDirty(page)) { 1582e05df3b1SJaegeuk Kim /* someone wrote it for us */ 1583e05df3b1SJaegeuk Kim goto continue_unlock; 1584e05df3b1SJaegeuk Kim } 1585e05df3b1SJaegeuk Kim 15862049d4fcSJaegeuk Kim /* flush inline_data */ 158752681375SJaegeuk Kim if (is_inline_node(page)) { 15882049d4fcSJaegeuk Kim clear_inline_node(page); 15892049d4fcSJaegeuk Kim unlock_page(page); 15902049d4fcSJaegeuk Kim flush_inline_data(sbi, ino_of_node(page)); 15919a4cbc9eSChao Yu goto lock_node; 15922049d4fcSJaegeuk Kim } 15932049d4fcSJaegeuk Kim 1594fa3d2bdfSJaegeuk Kim f2fs_wait_on_page_writeback(page, NODE, true); 1595fa3d2bdfSJaegeuk Kim 1596fa3d2bdfSJaegeuk Kim BUG_ON(PageWriteback(page)); 1597e05df3b1SJaegeuk Kim if (!clear_page_dirty_for_io(page)) 1598e05df3b1SJaegeuk Kim goto continue_unlock; 1599e05df3b1SJaegeuk Kim 1600e05df3b1SJaegeuk Kim set_fsync_mark(page, 0); 1601e05df3b1SJaegeuk Kim set_dentry_mark(page, 0); 160252746519SJaegeuk Kim 1603d68f735bSJaegeuk Kim ret = __write_node_page(page, false, &submitted, wbc); 1604d68f735bSJaegeuk Kim if (ret) 160552746519SJaegeuk Kim unlock_page(page); 1606d68f735bSJaegeuk Kim else if (submitted) 16073f5f4959SChao Yu nwritten++; 1608e05df3b1SJaegeuk Kim 1609e05df3b1SJaegeuk Kim if (--wbc->nr_to_write == 0) 1610e05df3b1SJaegeuk Kim break; 1611e05df3b1SJaegeuk Kim } 1612e05df3b1SJaegeuk Kim pagevec_release(&pvec); 1613e05df3b1SJaegeuk Kim cond_resched(); 1614e05df3b1SJaegeuk Kim 1615e05df3b1SJaegeuk Kim if (wbc->nr_to_write == 0) { 1616e05df3b1SJaegeuk Kim step = 2; 1617e05df3b1SJaegeuk Kim break; 1618e05df3b1SJaegeuk Kim } 1619e05df3b1SJaegeuk Kim } 1620e05df3b1SJaegeuk Kim 1621e05df3b1SJaegeuk Kim if (step < 2) { 1622e05df3b1SJaegeuk Kim step++; 1623e05df3b1SJaegeuk Kim goto next_step; 1624e05df3b1SJaegeuk Kim } 16253f5f4959SChao Yu out: 16263f5f4959SChao Yu if (nwritten) 1627b9109b0eSJaegeuk Kim f2fs_submit_merged_write(sbi, NODE); 16283f5f4959SChao Yu return ret; 1629e05df3b1SJaegeuk Kim } 1630e05df3b1SJaegeuk Kim 1631cfe58f9dSJaegeuk Kim int wait_on_node_pages_writeback(struct f2fs_sb_info *sbi, nid_t ino) 1632cfe58f9dSJaegeuk Kim { 163380dd9c0eSChao Yu pgoff_t index = 0, end = ULONG_MAX; 1634cfe58f9dSJaegeuk Kim struct pagevec pvec; 1635280db3c8SMiklos Szeredi int ret2, ret = 0; 1636cfe58f9dSJaegeuk Kim 1637cfe58f9dSJaegeuk Kim pagevec_init(&pvec, 0); 16384ef51a8fSJaegeuk Kim 16394ef51a8fSJaegeuk Kim while (index <= end) { 16404ef51a8fSJaegeuk Kim int i, nr_pages; 16414ef51a8fSJaegeuk Kim nr_pages = pagevec_lookup_tag(&pvec, NODE_MAPPING(sbi), &index, 1642cfe58f9dSJaegeuk Kim PAGECACHE_TAG_WRITEBACK, 16434ef51a8fSJaegeuk Kim min(end - index, (pgoff_t)PAGEVEC_SIZE-1) + 1); 16444ef51a8fSJaegeuk Kim if (nr_pages == 0) 16454ef51a8fSJaegeuk Kim break; 1646cfe58f9dSJaegeuk Kim 1647cfe58f9dSJaegeuk Kim for (i = 0; i < nr_pages; i++) { 1648cfe58f9dSJaegeuk Kim struct page *page = pvec.pages[i]; 1649cfe58f9dSJaegeuk Kim 1650cfe58f9dSJaegeuk Kim /* until radix tree lookup accepts end_index */ 1651cfb271d4SChao Yu if (unlikely(page->index > end)) 1652cfe58f9dSJaegeuk Kim continue; 1653cfe58f9dSJaegeuk Kim 16544bf08ff6SChao Yu if (ino && ino_of_node(page) == ino) { 1655fec1d657SJaegeuk Kim f2fs_wait_on_page_writeback(page, NODE, true); 1656cfe58f9dSJaegeuk Kim if (TestClearPageError(page)) 1657cfe58f9dSJaegeuk Kim ret = -EIO; 1658cfe58f9dSJaegeuk Kim } 16594bf08ff6SChao Yu } 1660cfe58f9dSJaegeuk Kim pagevec_release(&pvec); 1661cfe58f9dSJaegeuk Kim cond_resched(); 1662cfe58f9dSJaegeuk Kim } 1663cfe58f9dSJaegeuk Kim 1664280db3c8SMiklos Szeredi ret2 = filemap_check_errors(NODE_MAPPING(sbi)); 1665cfe58f9dSJaegeuk Kim if (!ret) 1666cfe58f9dSJaegeuk Kim ret = ret2; 1667cfe58f9dSJaegeuk Kim return ret; 1668cfe58f9dSJaegeuk Kim } 1669cfe58f9dSJaegeuk Kim 1670e05df3b1SJaegeuk Kim static int f2fs_write_node_pages(struct address_space *mapping, 1671e05df3b1SJaegeuk Kim struct writeback_control *wbc) 1672e05df3b1SJaegeuk Kim { 16734081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_M_SB(mapping); 16749dfa1bafSJaegeuk Kim struct blk_plug plug; 167550c8cdb3SJaegeuk Kim long diff; 1676e05df3b1SJaegeuk Kim 16774660f9c0SJaegeuk Kim /* balancing f2fs's metadata in background */ 16784660f9c0SJaegeuk Kim f2fs_balance_fs_bg(sbi); 1679e05df3b1SJaegeuk Kim 1680a7fdffbdSJaegeuk Kim /* collect a number of dirty node pages and write together */ 168187d6f890SJaegeuk Kim if (get_pages(sbi, F2FS_DIRTY_NODES) < nr_pages_to_skip(sbi, NODE)) 1682d3baf95dSJaegeuk Kim goto skip_write; 1683a7fdffbdSJaegeuk Kim 1684d31c7c3fSYunlei He trace_f2fs_writepages(mapping->host, wbc, NODE); 1685d31c7c3fSYunlei He 168650c8cdb3SJaegeuk Kim diff = nr_pages_to_write(sbi, NODE, wbc); 1687fb5566daSJaegeuk Kim wbc->sync_mode = WB_SYNC_NONE; 16889dfa1bafSJaegeuk Kim blk_start_plug(&plug); 168952681375SJaegeuk Kim sync_node_pages(sbi, wbc); 16909dfa1bafSJaegeuk Kim blk_finish_plug(&plug); 169150c8cdb3SJaegeuk Kim wbc->nr_to_write = max((long)0, wbc->nr_to_write - diff); 1692e05df3b1SJaegeuk Kim return 0; 1693d3baf95dSJaegeuk Kim 1694d3baf95dSJaegeuk Kim skip_write: 1695d3baf95dSJaegeuk Kim wbc->pages_skipped += get_pages(sbi, F2FS_DIRTY_NODES); 1696d31c7c3fSYunlei He trace_f2fs_writepages(mapping->host, wbc, NODE); 1697d3baf95dSJaegeuk Kim return 0; 1698e05df3b1SJaegeuk Kim } 1699e05df3b1SJaegeuk Kim 1700e05df3b1SJaegeuk Kim static int f2fs_set_node_page_dirty(struct page *page) 1701e05df3b1SJaegeuk Kim { 170226c6b887SJaegeuk Kim trace_f2fs_set_page_dirty(page, NODE); 170326c6b887SJaegeuk Kim 1704237c0790SJaegeuk Kim if (!PageUptodate(page)) 1705e05df3b1SJaegeuk Kim SetPageUptodate(page); 1706e05df3b1SJaegeuk Kim if (!PageDirty(page)) { 1707fe76b796SJaegeuk Kim f2fs_set_page_dirty_nobuffers(page); 17084081363fSJaegeuk Kim inc_page_count(F2FS_P_SB(page), F2FS_DIRTY_NODES); 1709e05df3b1SJaegeuk Kim SetPagePrivate(page); 17109e4ded3fSJaegeuk Kim f2fs_trace_pid(page); 1711e05df3b1SJaegeuk Kim return 1; 1712e05df3b1SJaegeuk Kim } 1713e05df3b1SJaegeuk Kim return 0; 1714e05df3b1SJaegeuk Kim } 1715e05df3b1SJaegeuk Kim 17160a8165d7SJaegeuk Kim /* 1717e05df3b1SJaegeuk Kim * Structure of the f2fs node operations 1718e05df3b1SJaegeuk Kim */ 1719e05df3b1SJaegeuk Kim const struct address_space_operations f2fs_node_aops = { 1720e05df3b1SJaegeuk Kim .writepage = f2fs_write_node_page, 1721e05df3b1SJaegeuk Kim .writepages = f2fs_write_node_pages, 1722e05df3b1SJaegeuk Kim .set_page_dirty = f2fs_set_node_page_dirty, 1723487261f3SChao Yu .invalidatepage = f2fs_invalidate_page, 1724487261f3SChao Yu .releasepage = f2fs_release_page, 17255b7a487cSWeichao Guo #ifdef CONFIG_MIGRATION 17265b7a487cSWeichao Guo .migratepage = f2fs_migrate_page, 17275b7a487cSWeichao Guo #endif 1728e05df3b1SJaegeuk Kim }; 1729e05df3b1SJaegeuk Kim 17308a7ed66aSJaegeuk Kim static struct free_nid *__lookup_free_nid_list(struct f2fs_nm_info *nm_i, 17318a7ed66aSJaegeuk Kim nid_t n) 1732e05df3b1SJaegeuk Kim { 17338a7ed66aSJaegeuk Kim return radix_tree_lookup(&nm_i->free_nid_root, n); 17343aa770a9SNamjae Jeon } 1735e05df3b1SJaegeuk Kim 1736eb0aa4b8SJaegeuk Kim static int __insert_nid_to_list(struct f2fs_sb_info *sbi, 1737eb0aa4b8SJaegeuk Kim struct free_nid *i, enum nid_list list, bool new) 1738e05df3b1SJaegeuk Kim { 1739b8559dc2SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 1740b8559dc2SChao Yu 1741eb0aa4b8SJaegeuk Kim if (new) { 1742eb0aa4b8SJaegeuk Kim int err = radix_tree_insert(&nm_i->free_nid_root, i->nid, i); 1743eb0aa4b8SJaegeuk Kim if (err) 1744eb0aa4b8SJaegeuk Kim return err; 1745eb0aa4b8SJaegeuk Kim } 1746eb0aa4b8SJaegeuk Kim 1747b8559dc2SChao Yu f2fs_bug_on(sbi, list == FREE_NID_LIST ? i->state != NID_NEW : 1748b8559dc2SChao Yu i->state != NID_ALLOC); 1749b8559dc2SChao Yu nm_i->nid_cnt[list]++; 1750b8559dc2SChao Yu list_add_tail(&i->list, &nm_i->nid_list[list]); 1751eb0aa4b8SJaegeuk Kim return 0; 1752b8559dc2SChao Yu } 1753b8559dc2SChao Yu 1754b8559dc2SChao Yu static void __remove_nid_from_list(struct f2fs_sb_info *sbi, 1755eb0aa4b8SJaegeuk Kim struct free_nid *i, enum nid_list list, bool reuse) 1756b8559dc2SChao Yu { 1757b8559dc2SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 1758b8559dc2SChao Yu 1759b8559dc2SChao Yu f2fs_bug_on(sbi, list == FREE_NID_LIST ? i->state != NID_NEW : 1760b8559dc2SChao Yu i->state != NID_ALLOC); 1761b8559dc2SChao Yu nm_i->nid_cnt[list]--; 1762e05df3b1SJaegeuk Kim list_del(&i->list); 1763eb0aa4b8SJaegeuk Kim if (!reuse) 17648a7ed66aSJaegeuk Kim radix_tree_delete(&nm_i->free_nid_root, i->nid); 1765e05df3b1SJaegeuk Kim } 1766e05df3b1SJaegeuk Kim 17674ac91242SChao Yu /* return if the nid is recognized as free */ 17684ac91242SChao Yu static bool add_free_nid(struct f2fs_sb_info *sbi, nid_t nid, bool build) 1769e05df3b1SJaegeuk Kim { 17706fb03f3aSJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 177130a61ddfSChao Yu struct free_nid *i, *e; 177259bbd474SJaegeuk Kim struct nat_entry *ne; 177330a61ddfSChao Yu int err = -EINVAL; 177430a61ddfSChao Yu bool ret = false; 17759198acebSJaegeuk Kim 17769198acebSJaegeuk Kim /* 0 nid should not be used */ 1777cfb271d4SChao Yu if (unlikely(nid == 0)) 17784ac91242SChao Yu return false; 177959bbd474SJaegeuk Kim 17807bd59381SGu Zheng i = f2fs_kmem_cache_alloc(free_nid_slab, GFP_NOFS); 1781e05df3b1SJaegeuk Kim i->nid = nid; 1782e05df3b1SJaegeuk Kim i->state = NID_NEW; 1783e05df3b1SJaegeuk Kim 178430a61ddfSChao Yu if (radix_tree_preload(GFP_NOFS)) 178530a61ddfSChao Yu goto err; 1786769ec6e5SJaegeuk Kim 1787b8559dc2SChao Yu spin_lock(&nm_i->nid_list_lock); 178830a61ddfSChao Yu 178930a61ddfSChao Yu if (build) { 179030a61ddfSChao Yu /* 179130a61ddfSChao Yu * Thread A Thread B 179230a61ddfSChao Yu * - f2fs_create 179330a61ddfSChao Yu * - f2fs_new_inode 179430a61ddfSChao Yu * - alloc_nid 179530a61ddfSChao Yu * - __insert_nid_to_list(ALLOC_NID_LIST) 179630a61ddfSChao Yu * - f2fs_balance_fs_bg 179730a61ddfSChao Yu * - build_free_nids 179830a61ddfSChao Yu * - __build_free_nids 179930a61ddfSChao Yu * - scan_nat_page 180030a61ddfSChao Yu * - add_free_nid 180130a61ddfSChao Yu * - __lookup_nat_cache 180230a61ddfSChao Yu * - f2fs_add_link 180330a61ddfSChao Yu * - init_inode_metadata 180430a61ddfSChao Yu * - new_inode_page 180530a61ddfSChao Yu * - new_node_page 180630a61ddfSChao Yu * - set_node_addr 180730a61ddfSChao Yu * - alloc_nid_done 180830a61ddfSChao Yu * - __remove_nid_from_list(ALLOC_NID_LIST) 180930a61ddfSChao Yu * - __insert_nid_to_list(FREE_NID_LIST) 181030a61ddfSChao Yu */ 181130a61ddfSChao Yu ne = __lookup_nat_cache(nm_i, nid); 181230a61ddfSChao Yu if (ne && (!get_nat_flag(ne, IS_CHECKPOINTED) || 181330a61ddfSChao Yu nat_get_blkaddr(ne) != NULL_ADDR)) 181430a61ddfSChao Yu goto err_out; 181530a61ddfSChao Yu 181630a61ddfSChao Yu e = __lookup_free_nid_list(nm_i, nid); 181730a61ddfSChao Yu if (e) { 181830a61ddfSChao Yu if (e->state == NID_NEW) 181930a61ddfSChao Yu ret = true; 182030a61ddfSChao Yu goto err_out; 182130a61ddfSChao Yu } 182230a61ddfSChao Yu } 182330a61ddfSChao Yu ret = true; 1824eb0aa4b8SJaegeuk Kim err = __insert_nid_to_list(sbi, i, FREE_NID_LIST, true); 182530a61ddfSChao Yu err_out: 1826b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 1827769ec6e5SJaegeuk Kim radix_tree_preload_end(); 182830a61ddfSChao Yu err: 182930a61ddfSChao Yu if (err) 1830e05df3b1SJaegeuk Kim kmem_cache_free(free_nid_slab, i); 183130a61ddfSChao Yu return ret; 1832e05df3b1SJaegeuk Kim } 1833e05df3b1SJaegeuk Kim 1834b8559dc2SChao Yu static void remove_free_nid(struct f2fs_sb_info *sbi, nid_t nid) 1835e05df3b1SJaegeuk Kim { 1836b8559dc2SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 1837e05df3b1SJaegeuk Kim struct free_nid *i; 1838cf0ee0f0SChao Yu bool need_free = false; 1839cf0ee0f0SChao Yu 1840b8559dc2SChao Yu spin_lock(&nm_i->nid_list_lock); 18418a7ed66aSJaegeuk Kim i = __lookup_free_nid_list(nm_i, nid); 1842e05df3b1SJaegeuk Kim if (i && i->state == NID_NEW) { 1843eb0aa4b8SJaegeuk Kim __remove_nid_from_list(sbi, i, FREE_NID_LIST, false); 1844cf0ee0f0SChao Yu need_free = true; 1845e05df3b1SJaegeuk Kim } 1846b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 1847cf0ee0f0SChao Yu 1848cf0ee0f0SChao Yu if (need_free) 1849cf0ee0f0SChao Yu kmem_cache_free(free_nid_slab, i); 1850e05df3b1SJaegeuk Kim } 1851e05df3b1SJaegeuk Kim 18529f7e4a2cSJaegeuk Kim static void update_free_nid_bitmap(struct f2fs_sb_info *sbi, nid_t nid, 1853346fe752SChao Yu bool set, bool build) 18544ac91242SChao Yu { 18554ac91242SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 18564ac91242SChao Yu unsigned int nat_ofs = NAT_BLOCK_OFFSET(nid); 18574ac91242SChao Yu unsigned int nid_ofs = nid - START_NID(nid); 18584ac91242SChao Yu 18594ac91242SChao Yu if (!test_bit_le(nat_ofs, nm_i->nat_block_bitmap)) 18604ac91242SChao Yu return; 18614ac91242SChao Yu 18624ac91242SChao Yu if (set) 186323380b85SJaegeuk Kim __set_bit_le(nid_ofs, nm_i->free_nid_bitmap[nat_ofs]); 18644ac91242SChao Yu else 186523380b85SJaegeuk Kim __clear_bit_le(nid_ofs, nm_i->free_nid_bitmap[nat_ofs]); 1866586d1492SChao Yu 1867586d1492SChao Yu if (set) 1868586d1492SChao Yu nm_i->free_nid_count[nat_ofs]++; 1869586d1492SChao Yu else if (!build) 1870586d1492SChao Yu nm_i->free_nid_count[nat_ofs]--; 18714ac91242SChao Yu } 18724ac91242SChao Yu 18736fb03f3aSJaegeuk Kim static void scan_nat_page(struct f2fs_sb_info *sbi, 1874e05df3b1SJaegeuk Kim struct page *nat_page, nid_t start_nid) 1875e05df3b1SJaegeuk Kim { 18766fb03f3aSJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 1877e05df3b1SJaegeuk Kim struct f2fs_nat_block *nat_blk = page_address(nat_page); 1878e05df3b1SJaegeuk Kim block_t blk_addr; 18794ac91242SChao Yu unsigned int nat_ofs = NAT_BLOCK_OFFSET(start_nid); 1880e05df3b1SJaegeuk Kim int i; 1881e05df3b1SJaegeuk Kim 1882586d1492SChao Yu if (test_bit_le(nat_ofs, nm_i->nat_block_bitmap)) 1883586d1492SChao Yu return; 1884586d1492SChao Yu 188523380b85SJaegeuk Kim __set_bit_le(nat_ofs, nm_i->nat_block_bitmap); 18864ac91242SChao Yu 1887e05df3b1SJaegeuk Kim i = start_nid % NAT_ENTRY_PER_BLOCK; 1888e05df3b1SJaegeuk Kim 1889e05df3b1SJaegeuk Kim for (; i < NAT_ENTRY_PER_BLOCK; i++, start_nid++) { 18904ac91242SChao Yu bool freed = false; 189123d38844SHaicheng Li 1892cfb271d4SChao Yu if (unlikely(start_nid >= nm_i->max_nid)) 189304431c44SJaegeuk Kim break; 189423d38844SHaicheng Li 1895e05df3b1SJaegeuk Kim blk_addr = le32_to_cpu(nat_blk->entries[i].block_addr); 18969850cf4aSJaegeuk Kim f2fs_bug_on(sbi, blk_addr == NEW_ADDR); 18973a2ad567SChao Yu if (blk_addr == NULL_ADDR) 18984ac91242SChao Yu freed = add_free_nid(sbi, start_nid, true); 1899346fe752SChao Yu spin_lock(&NM_I(sbi)->nid_list_lock); 1900346fe752SChao Yu update_free_nid_bitmap(sbi, start_nid, freed, true); 1901346fe752SChao Yu spin_unlock(&NM_I(sbi)->nid_list_lock); 1902e05df3b1SJaegeuk Kim } 1903e05df3b1SJaegeuk Kim } 1904e05df3b1SJaegeuk Kim 19054ac91242SChao Yu static void scan_free_nid_bits(struct f2fs_sb_info *sbi) 19064ac91242SChao Yu { 19074ac91242SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 19084ac91242SChao Yu struct curseg_info *curseg = CURSEG_I(sbi, CURSEG_HOT_DATA); 19094ac91242SChao Yu struct f2fs_journal *journal = curseg->journal; 19104ac91242SChao Yu unsigned int i, idx; 19114ac91242SChao Yu 19124ac91242SChao Yu down_read(&nm_i->nat_tree_lock); 19134ac91242SChao Yu 19144ac91242SChao Yu for (i = 0; i < nm_i->nat_blocks; i++) { 19154ac91242SChao Yu if (!test_bit_le(i, nm_i->nat_block_bitmap)) 19164ac91242SChao Yu continue; 1917586d1492SChao Yu if (!nm_i->free_nid_count[i]) 1918586d1492SChao Yu continue; 19194ac91242SChao Yu for (idx = 0; idx < NAT_ENTRY_PER_BLOCK; idx++) { 19204ac91242SChao Yu nid_t nid; 19214ac91242SChao Yu 19224ac91242SChao Yu if (!test_bit_le(idx, nm_i->free_nid_bitmap[i])) 19234ac91242SChao Yu continue; 19244ac91242SChao Yu 19254ac91242SChao Yu nid = i * NAT_ENTRY_PER_BLOCK + idx; 19264ac91242SChao Yu add_free_nid(sbi, nid, true); 19274ac91242SChao Yu 1928f0cdbfe6SKinglong Mee if (nm_i->nid_cnt[FREE_NID_LIST] >= MAX_FREE_NIDS) 19294ac91242SChao Yu goto out; 19304ac91242SChao Yu } 19314ac91242SChao Yu } 19324ac91242SChao Yu out: 19334ac91242SChao Yu down_read(&curseg->journal_rwsem); 19344ac91242SChao Yu for (i = 0; i < nats_in_cursum(journal); i++) { 19354ac91242SChao Yu block_t addr; 19364ac91242SChao Yu nid_t nid; 19374ac91242SChao Yu 19384ac91242SChao Yu addr = le32_to_cpu(nat_in_journal(journal, i).block_addr); 19394ac91242SChao Yu nid = le32_to_cpu(nid_in_journal(journal, i)); 19404ac91242SChao Yu if (addr == NULL_ADDR) 19414ac91242SChao Yu add_free_nid(sbi, nid, true); 19424ac91242SChao Yu else 19434ac91242SChao Yu remove_free_nid(sbi, nid); 19444ac91242SChao Yu } 19454ac91242SChao Yu up_read(&curseg->journal_rwsem); 19464ac91242SChao Yu up_read(&nm_i->nat_tree_lock); 19474ac91242SChao Yu } 19484ac91242SChao Yu 194922ad0b6aSJaegeuk Kim static void __build_free_nids(struct f2fs_sb_info *sbi, bool sync, bool mount) 1950e05df3b1SJaegeuk Kim { 1951e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 1952e05df3b1SJaegeuk Kim struct curseg_info *curseg = CURSEG_I(sbi, CURSEG_HOT_DATA); 1953b7ad7512SChao Yu struct f2fs_journal *journal = curseg->journal; 19548760952dSHaicheng Li int i = 0; 195555008d84SJaegeuk Kim nid_t nid = nm_i->next_scan_nid; 1956e05df3b1SJaegeuk Kim 1957e9cdd307SYunlei He if (unlikely(nid >= nm_i->max_nid)) 1958e9cdd307SYunlei He nid = 0; 1959e9cdd307SYunlei He 196055008d84SJaegeuk Kim /* Enough entries */ 1961b8559dc2SChao Yu if (nm_i->nid_cnt[FREE_NID_LIST] >= NAT_ENTRY_PER_BLOCK) 196255008d84SJaegeuk Kim return; 1963e05df3b1SJaegeuk Kim 19643a2ad567SChao Yu if (!sync && !available_free_memory(sbi, FREE_NIDS)) 1965e05df3b1SJaegeuk Kim return; 1966e05df3b1SJaegeuk Kim 19674ac91242SChao Yu if (!mount) { 19684ac91242SChao Yu /* try to find free nids in free_nid_bitmap */ 19694ac91242SChao Yu scan_free_nid_bits(sbi); 19704ac91242SChao Yu 19714ac91242SChao Yu if (nm_i->nid_cnt[FREE_NID_LIST]) 197222ad0b6aSJaegeuk Kim return; 197322ad0b6aSJaegeuk Kim } 197422ad0b6aSJaegeuk Kim 197555008d84SJaegeuk Kim /* readahead nat pages to be scanned */ 197626879fb1SChao Yu ra_meta_pages(sbi, NAT_BLOCK_OFFSET(nid), FREE_NID_PAGES, 197726879fb1SChao Yu META_NAT, true); 1978e05df3b1SJaegeuk Kim 1979b873b798SJaegeuk Kim down_read(&nm_i->nat_tree_lock); 1980a5131193SJaegeuk Kim 1981e05df3b1SJaegeuk Kim while (1) { 1982e05df3b1SJaegeuk Kim struct page *page = get_current_nat_page(sbi, nid); 1983e05df3b1SJaegeuk Kim 19846fb03f3aSJaegeuk Kim scan_nat_page(sbi, page, nid); 1985e05df3b1SJaegeuk Kim f2fs_put_page(page, 1); 1986e05df3b1SJaegeuk Kim 1987e05df3b1SJaegeuk Kim nid += (NAT_ENTRY_PER_BLOCK - (nid % NAT_ENTRY_PER_BLOCK)); 1988cfb271d4SChao Yu if (unlikely(nid >= nm_i->max_nid)) 1989e05df3b1SJaegeuk Kim nid = 0; 199055008d84SJaegeuk Kim 1991a6d494b6SChao Yu if (++i >= FREE_NID_PAGES) 1992e05df3b1SJaegeuk Kim break; 1993e05df3b1SJaegeuk Kim } 1994e05df3b1SJaegeuk Kim 199555008d84SJaegeuk Kim /* go to the next free nat pages to find free nids abundantly */ 199655008d84SJaegeuk Kim nm_i->next_scan_nid = nid; 1997e05df3b1SJaegeuk Kim 1998e05df3b1SJaegeuk Kim /* find free nids from current sum_pages */ 1999b7ad7512SChao Yu down_read(&curseg->journal_rwsem); 2000dfc08a12SChao Yu for (i = 0; i < nats_in_cursum(journal); i++) { 2001dfc08a12SChao Yu block_t addr; 2002dfc08a12SChao Yu 2003dfc08a12SChao Yu addr = le32_to_cpu(nat_in_journal(journal, i).block_addr); 2004dfc08a12SChao Yu nid = le32_to_cpu(nid_in_journal(journal, i)); 2005e05df3b1SJaegeuk Kim if (addr == NULL_ADDR) 20066fb03f3aSJaegeuk Kim add_free_nid(sbi, nid, true); 2007e05df3b1SJaegeuk Kim else 2008b8559dc2SChao Yu remove_free_nid(sbi, nid); 2009e05df3b1SJaegeuk Kim } 2010b7ad7512SChao Yu up_read(&curseg->journal_rwsem); 2011b873b798SJaegeuk Kim up_read(&nm_i->nat_tree_lock); 20122db2388fSChao Yu 20132db2388fSChao Yu ra_meta_pages(sbi, NAT_BLOCK_OFFSET(nm_i->next_scan_nid), 2014ea1a29a0SChao Yu nm_i->ra_nid_pages, META_NAT, false); 2015e05df3b1SJaegeuk Kim } 2016e05df3b1SJaegeuk Kim 201722ad0b6aSJaegeuk Kim void build_free_nids(struct f2fs_sb_info *sbi, bool sync, bool mount) 20182411cf5bSChao Yu { 20192411cf5bSChao Yu mutex_lock(&NM_I(sbi)->build_lock); 202022ad0b6aSJaegeuk Kim __build_free_nids(sbi, sync, mount); 20212411cf5bSChao Yu mutex_unlock(&NM_I(sbi)->build_lock); 20222411cf5bSChao Yu } 20232411cf5bSChao Yu 2024e05df3b1SJaegeuk Kim /* 2025e05df3b1SJaegeuk Kim * If this function returns success, caller can obtain a new nid 2026e05df3b1SJaegeuk Kim * from second parameter of this function. 2027e05df3b1SJaegeuk Kim * The returned nid could be used ino as well as nid when inode is created. 2028e05df3b1SJaegeuk Kim */ 2029e05df3b1SJaegeuk Kim bool alloc_nid(struct f2fs_sb_info *sbi, nid_t *nid) 2030e05df3b1SJaegeuk Kim { 2031e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 2032e05df3b1SJaegeuk Kim struct free_nid *i = NULL; 2033e05df3b1SJaegeuk Kim retry: 2034cb78942bSJaegeuk Kim #ifdef CONFIG_F2FS_FAULT_INJECTION 203555523519SChao Yu if (time_to_inject(sbi, FAULT_ALLOC_NID)) { 203655523519SChao Yu f2fs_show_injection_info(FAULT_ALLOC_NID); 2037cb78942bSJaegeuk Kim return false; 203855523519SChao Yu } 2039cb78942bSJaegeuk Kim #endif 2040b8559dc2SChao Yu spin_lock(&nm_i->nid_list_lock); 2041e05df3b1SJaegeuk Kim 204204d47e67SChao Yu if (unlikely(nm_i->available_nids == 0)) { 204304d47e67SChao Yu spin_unlock(&nm_i->nid_list_lock); 204404d47e67SChao Yu return false; 204504d47e67SChao Yu } 2046e05df3b1SJaegeuk Kim 204755008d84SJaegeuk Kim /* We should not use stale free nids created by build_free_nids */ 2048b8559dc2SChao Yu if (nm_i->nid_cnt[FREE_NID_LIST] && !on_build_free_nids(nm_i)) { 2049b8559dc2SChao Yu f2fs_bug_on(sbi, list_empty(&nm_i->nid_list[FREE_NID_LIST])); 2050b8559dc2SChao Yu i = list_first_entry(&nm_i->nid_list[FREE_NID_LIST], 2051b8559dc2SChao Yu struct free_nid, list); 2052e05df3b1SJaegeuk Kim *nid = i->nid; 2053b8559dc2SChao Yu 2054eb0aa4b8SJaegeuk Kim __remove_nid_from_list(sbi, i, FREE_NID_LIST, true); 2055e05df3b1SJaegeuk Kim i->state = NID_ALLOC; 2056eb0aa4b8SJaegeuk Kim __insert_nid_to_list(sbi, i, ALLOC_NID_LIST, false); 205704d47e67SChao Yu nm_i->available_nids--; 20584ac91242SChao Yu 2059346fe752SChao Yu update_free_nid_bitmap(sbi, *nid, false, false); 20604ac91242SChao Yu 2061b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 2062e05df3b1SJaegeuk Kim return true; 2063e05df3b1SJaegeuk Kim } 2064b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 206555008d84SJaegeuk Kim 206655008d84SJaegeuk Kim /* Let's scan nat pages and its caches to get free nids */ 206722ad0b6aSJaegeuk Kim build_free_nids(sbi, true, false); 206855008d84SJaegeuk Kim goto retry; 206955008d84SJaegeuk Kim } 2070e05df3b1SJaegeuk Kim 20710a8165d7SJaegeuk Kim /* 2072e05df3b1SJaegeuk Kim * alloc_nid() should be called prior to this function. 2073e05df3b1SJaegeuk Kim */ 2074e05df3b1SJaegeuk Kim void alloc_nid_done(struct f2fs_sb_info *sbi, nid_t nid) 2075e05df3b1SJaegeuk Kim { 2076e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 2077e05df3b1SJaegeuk Kim struct free_nid *i; 2078e05df3b1SJaegeuk Kim 2079b8559dc2SChao Yu spin_lock(&nm_i->nid_list_lock); 20808a7ed66aSJaegeuk Kim i = __lookup_free_nid_list(nm_i, nid); 2081b8559dc2SChao Yu f2fs_bug_on(sbi, !i); 2082eb0aa4b8SJaegeuk Kim __remove_nid_from_list(sbi, i, ALLOC_NID_LIST, false); 2083b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 2084cf0ee0f0SChao Yu 2085cf0ee0f0SChao Yu kmem_cache_free(free_nid_slab, i); 2086e05df3b1SJaegeuk Kim } 2087e05df3b1SJaegeuk Kim 20880a8165d7SJaegeuk Kim /* 2089e05df3b1SJaegeuk Kim * alloc_nid() should be called prior to this function. 2090e05df3b1SJaegeuk Kim */ 2091e05df3b1SJaegeuk Kim void alloc_nid_failed(struct f2fs_sb_info *sbi, nid_t nid) 2092e05df3b1SJaegeuk Kim { 209349952fa1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 209449952fa1SJaegeuk Kim struct free_nid *i; 2095cf0ee0f0SChao Yu bool need_free = false; 209649952fa1SJaegeuk Kim 209765985d93SJaegeuk Kim if (!nid) 209865985d93SJaegeuk Kim return; 209965985d93SJaegeuk Kim 2100b8559dc2SChao Yu spin_lock(&nm_i->nid_list_lock); 21018a7ed66aSJaegeuk Kim i = __lookup_free_nid_list(nm_i, nid); 2102b8559dc2SChao Yu f2fs_bug_on(sbi, !i); 2103b8559dc2SChao Yu 21046fb03f3aSJaegeuk Kim if (!available_free_memory(sbi, FREE_NIDS)) { 2105eb0aa4b8SJaegeuk Kim __remove_nid_from_list(sbi, i, ALLOC_NID_LIST, false); 2106cf0ee0f0SChao Yu need_free = true; 210795630cbaSHaicheng Li } else { 2108eb0aa4b8SJaegeuk Kim __remove_nid_from_list(sbi, i, ALLOC_NID_LIST, true); 210949952fa1SJaegeuk Kim i->state = NID_NEW; 2110eb0aa4b8SJaegeuk Kim __insert_nid_to_list(sbi, i, FREE_NID_LIST, false); 211195630cbaSHaicheng Li } 211204d47e67SChao Yu 211304d47e67SChao Yu nm_i->available_nids++; 211404d47e67SChao Yu 2115346fe752SChao Yu update_free_nid_bitmap(sbi, nid, true, false); 21164ac91242SChao Yu 2117b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 2118cf0ee0f0SChao Yu 2119cf0ee0f0SChao Yu if (need_free) 2120cf0ee0f0SChao Yu kmem_cache_free(free_nid_slab, i); 2121e05df3b1SJaegeuk Kim } 2122e05df3b1SJaegeuk Kim 212331696580SChao Yu int try_to_free_nids(struct f2fs_sb_info *sbi, int nr_shrink) 212431696580SChao Yu { 212531696580SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 212631696580SChao Yu struct free_nid *i, *next; 212731696580SChao Yu int nr = nr_shrink; 212831696580SChao Yu 2129b8559dc2SChao Yu if (nm_i->nid_cnt[FREE_NID_LIST] <= MAX_FREE_NIDS) 2130ad4edb83SJaegeuk Kim return 0; 2131ad4edb83SJaegeuk Kim 213231696580SChao Yu if (!mutex_trylock(&nm_i->build_lock)) 213331696580SChao Yu return 0; 213431696580SChao Yu 2135b8559dc2SChao Yu spin_lock(&nm_i->nid_list_lock); 2136b8559dc2SChao Yu list_for_each_entry_safe(i, next, &nm_i->nid_list[FREE_NID_LIST], 2137b8559dc2SChao Yu list) { 2138b8559dc2SChao Yu if (nr_shrink <= 0 || 2139b8559dc2SChao Yu nm_i->nid_cnt[FREE_NID_LIST] <= MAX_FREE_NIDS) 214031696580SChao Yu break; 2141b8559dc2SChao Yu 2142eb0aa4b8SJaegeuk Kim __remove_nid_from_list(sbi, i, FREE_NID_LIST, false); 214331696580SChao Yu kmem_cache_free(free_nid_slab, i); 214431696580SChao Yu nr_shrink--; 214531696580SChao Yu } 2146b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 214731696580SChao Yu mutex_unlock(&nm_i->build_lock); 214831696580SChao Yu 214931696580SChao Yu return nr - nr_shrink; 215031696580SChao Yu } 215131696580SChao Yu 215270cfed88SChao Yu void recover_inline_xattr(struct inode *inode, struct page *page) 215328cdce04SChao Yu { 215428cdce04SChao Yu void *src_addr, *dst_addr; 215528cdce04SChao Yu size_t inline_size; 215628cdce04SChao Yu struct page *ipage; 215728cdce04SChao Yu struct f2fs_inode *ri; 215828cdce04SChao Yu 21594081363fSJaegeuk Kim ipage = get_node_page(F2FS_I_SB(inode), inode->i_ino); 21609850cf4aSJaegeuk Kim f2fs_bug_on(F2FS_I_SB(inode), IS_ERR(ipage)); 216128cdce04SChao Yu 2162e3b4d43fSJaegeuk Kim ri = F2FS_INODE(page); 2163e3b4d43fSJaegeuk Kim if (!(ri->i_inline & F2FS_INLINE_XATTR)) { 216491942321SJaegeuk Kim clear_inode_flag(inode, FI_INLINE_XATTR); 2165e3b4d43fSJaegeuk Kim goto update_inode; 2166e3b4d43fSJaegeuk Kim } 2167e3b4d43fSJaegeuk Kim 216828cdce04SChao Yu dst_addr = inline_xattr_addr(ipage); 216928cdce04SChao Yu src_addr = inline_xattr_addr(page); 217028cdce04SChao Yu inline_size = inline_xattr_size(inode); 217128cdce04SChao Yu 2172fec1d657SJaegeuk Kim f2fs_wait_on_page_writeback(ipage, NODE, true); 217328cdce04SChao Yu memcpy(dst_addr, src_addr, inline_size); 2174e3b4d43fSJaegeuk Kim update_inode: 217528cdce04SChao Yu update_inode(inode, ipage); 217628cdce04SChao Yu f2fs_put_page(ipage, 1); 217728cdce04SChao Yu } 217828cdce04SChao Yu 2179d260081cSChao Yu int recover_xattr_data(struct inode *inode, struct page *page, block_t blkaddr) 2180abb2366cSJaegeuk Kim { 21814081363fSJaegeuk Kim struct f2fs_sb_info *sbi = F2FS_I_SB(inode); 2182abb2366cSJaegeuk Kim nid_t prev_xnid = F2FS_I(inode)->i_xattr_nid; 2183abb2366cSJaegeuk Kim nid_t new_xnid = nid_of_node(page); 2184abb2366cSJaegeuk Kim struct node_info ni; 2185d260081cSChao Yu struct page *xpage; 2186abb2366cSJaegeuk Kim 2187abb2366cSJaegeuk Kim if (!prev_xnid) 2188abb2366cSJaegeuk Kim goto recover_xnid; 2189abb2366cSJaegeuk Kim 2190d260081cSChao Yu /* 1: invalidate the previous xattr nid */ 2191abb2366cSJaegeuk Kim get_node_info(sbi, prev_xnid, &ni); 21929850cf4aSJaegeuk Kim f2fs_bug_on(sbi, ni.blk_addr == NULL_ADDR); 2193abb2366cSJaegeuk Kim invalidate_blocks(sbi, ni.blk_addr); 2194abb2366cSJaegeuk Kim dec_valid_node_count(sbi, inode); 2195479f40c4SJaegeuk Kim set_node_addr(sbi, &ni, NULL_ADDR, false); 2196abb2366cSJaegeuk Kim 2197abb2366cSJaegeuk Kim recover_xnid: 2198d260081cSChao Yu /* 2: update xattr nid in inode */ 2199d260081cSChao Yu remove_free_nid(sbi, new_xnid); 2200d260081cSChao Yu f2fs_i_xnid_write(inode, new_xnid); 2201abb2366cSJaegeuk Kim if (unlikely(!inc_valid_node_count(sbi, inode))) 22029850cf4aSJaegeuk Kim f2fs_bug_on(sbi, 1); 2203d260081cSChao Yu update_inode_page(inode); 2204abb2366cSJaegeuk Kim 2205d260081cSChao Yu /* 3: update and set xattr node page dirty */ 2206d260081cSChao Yu xpage = grab_cache_page(NODE_MAPPING(sbi), new_xnid); 2207d260081cSChao Yu if (!xpage) 2208d260081cSChao Yu return -ENOMEM; 2209d260081cSChao Yu 2210d260081cSChao Yu memcpy(F2FS_NODE(xpage), F2FS_NODE(page), PAGE_SIZE); 2211d260081cSChao Yu 2212abb2366cSJaegeuk Kim get_node_info(sbi, new_xnid, &ni); 2213abb2366cSJaegeuk Kim ni.ino = inode->i_ino; 2214479f40c4SJaegeuk Kim set_node_addr(sbi, &ni, NEW_ADDR, false); 2215d260081cSChao Yu set_page_dirty(xpage); 2216d260081cSChao Yu f2fs_put_page(xpage, 1); 2217abb2366cSJaegeuk Kim 2218d260081cSChao Yu return 0; 2219abb2366cSJaegeuk Kim } 2220abb2366cSJaegeuk Kim 2221e05df3b1SJaegeuk Kim int recover_inode_page(struct f2fs_sb_info *sbi, struct page *page) 2222e05df3b1SJaegeuk Kim { 222358bfaf44SJaegeuk Kim struct f2fs_inode *src, *dst; 2224e05df3b1SJaegeuk Kim nid_t ino = ino_of_node(page); 2225e05df3b1SJaegeuk Kim struct node_info old_ni, new_ni; 2226e05df3b1SJaegeuk Kim struct page *ipage; 2227e05df3b1SJaegeuk Kim 2228e8271fa3SJaegeuk Kim get_node_info(sbi, ino, &old_ni); 2229e8271fa3SJaegeuk Kim 2230e8271fa3SJaegeuk Kim if (unlikely(old_ni.blk_addr != NULL_ADDR)) 2231e8271fa3SJaegeuk Kim return -EINVAL; 2232e8ea9b3dSJaegeuk Kim retry: 2233300e129cSJaegeuk Kim ipage = f2fs_grab_cache_page(NODE_MAPPING(sbi), ino, false); 2234e8ea9b3dSJaegeuk Kim if (!ipage) { 2235e8ea9b3dSJaegeuk Kim congestion_wait(BLK_RW_ASYNC, HZ/50); 2236e8ea9b3dSJaegeuk Kim goto retry; 2237e8ea9b3dSJaegeuk Kim } 2238e05df3b1SJaegeuk Kim 2239e05df3b1SJaegeuk Kim /* Should not use this inode from free nid list */ 2240b8559dc2SChao Yu remove_free_nid(sbi, ino); 2241e05df3b1SJaegeuk Kim 2242237c0790SJaegeuk Kim if (!PageUptodate(ipage)) 2243e05df3b1SJaegeuk Kim SetPageUptodate(ipage); 2244e05df3b1SJaegeuk Kim fill_node_footer(ipage, ino, ino, 0, true); 2245e05df3b1SJaegeuk Kim 224658bfaf44SJaegeuk Kim src = F2FS_INODE(page); 224758bfaf44SJaegeuk Kim dst = F2FS_INODE(ipage); 2248e05df3b1SJaegeuk Kim 224958bfaf44SJaegeuk Kim memcpy(dst, src, (unsigned long)&src->i_ext - (unsigned long)src); 225058bfaf44SJaegeuk Kim dst->i_size = 0; 225158bfaf44SJaegeuk Kim dst->i_blocks = cpu_to_le64(1); 225258bfaf44SJaegeuk Kim dst->i_links = cpu_to_le32(1); 225358bfaf44SJaegeuk Kim dst->i_xattr_nid = 0; 2254617deb8cSJaegeuk Kim dst->i_inline = src->i_inline & F2FS_INLINE_XATTR; 2255e05df3b1SJaegeuk Kim 2256e05df3b1SJaegeuk Kim new_ni = old_ni; 2257e05df3b1SJaegeuk Kim new_ni.ino = ino; 2258e05df3b1SJaegeuk Kim 2259cfb271d4SChao Yu if (unlikely(!inc_valid_node_count(sbi, NULL))) 226065e5cd0aSJaegeuk Kim WARN_ON(1); 2261479f40c4SJaegeuk Kim set_node_addr(sbi, &new_ni, NEW_ADDR, false); 2262e05df3b1SJaegeuk Kim inc_valid_inode_count(sbi); 2263617deb8cSJaegeuk Kim set_page_dirty(ipage); 2264e05df3b1SJaegeuk Kim f2fs_put_page(ipage, 1); 2265e05df3b1SJaegeuk Kim return 0; 2266e05df3b1SJaegeuk Kim } 2267e05df3b1SJaegeuk Kim 2268e05df3b1SJaegeuk Kim int restore_node_summary(struct f2fs_sb_info *sbi, 2269e05df3b1SJaegeuk Kim unsigned int segno, struct f2fs_summary_block *sum) 2270e05df3b1SJaegeuk Kim { 2271e05df3b1SJaegeuk Kim struct f2fs_node *rn; 2272e05df3b1SJaegeuk Kim struct f2fs_summary *sum_entry; 2273e05df3b1SJaegeuk Kim block_t addr; 22749ecf4b80SChao Yu int i, idx, last_offset, nrpages; 2275e05df3b1SJaegeuk Kim 2276e05df3b1SJaegeuk Kim /* scan the node segment */ 2277e05df3b1SJaegeuk Kim last_offset = sbi->blocks_per_seg; 2278e05df3b1SJaegeuk Kim addr = START_BLOCK(sbi, segno); 2279e05df3b1SJaegeuk Kim sum_entry = &sum->entries[0]; 2280e05df3b1SJaegeuk Kim 22819ecf4b80SChao Yu for (i = 0; i < last_offset; i += nrpages, addr += nrpages) { 2282664ba972SJaegeuk Kim nrpages = min(last_offset - i, BIO_MAX_PAGES); 2283393ff91fSJaegeuk Kim 22849af0ff1cSChao Yu /* readahead node pages */ 228526879fb1SChao Yu ra_meta_pages(sbi, addr, nrpages, META_POR, true); 22869af0ff1cSChao Yu 22879ecf4b80SChao Yu for (idx = addr; idx < addr + nrpages; idx++) { 22882b947003SChao Yu struct page *page = get_tmp_page(sbi, idx); 2289393ff91fSJaegeuk Kim 22909ecf4b80SChao Yu rn = F2FS_NODE(page); 2291393ff91fSJaegeuk Kim sum_entry->nid = rn->footer.nid; 2292393ff91fSJaegeuk Kim sum_entry->version = 0; 2293393ff91fSJaegeuk Kim sum_entry->ofs_in_node = 0; 22949af0ff1cSChao Yu sum_entry++; 22959ecf4b80SChao Yu f2fs_put_page(page, 1); 22969af0ff1cSChao Yu } 2297bac4eef6SChao Yu 22989ecf4b80SChao Yu invalidate_mapping_pages(META_MAPPING(sbi), addr, 2299bac4eef6SChao Yu addr + nrpages); 23009af0ff1cSChao Yu } 23019ecf4b80SChao Yu return 0; 2302e05df3b1SJaegeuk Kim } 2303e05df3b1SJaegeuk Kim 2304aec71382SChao Yu static void remove_nats_in_journal(struct f2fs_sb_info *sbi) 2305e05df3b1SJaegeuk Kim { 2306e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 2307e05df3b1SJaegeuk Kim struct curseg_info *curseg = CURSEG_I(sbi, CURSEG_HOT_DATA); 2308b7ad7512SChao Yu struct f2fs_journal *journal = curseg->journal; 2309e05df3b1SJaegeuk Kim int i; 2310e05df3b1SJaegeuk Kim 2311b7ad7512SChao Yu down_write(&curseg->journal_rwsem); 2312dfc08a12SChao Yu for (i = 0; i < nats_in_cursum(journal); i++) { 2313e05df3b1SJaegeuk Kim struct nat_entry *ne; 2314e05df3b1SJaegeuk Kim struct f2fs_nat_entry raw_ne; 2315dfc08a12SChao Yu nid_t nid = le32_to_cpu(nid_in_journal(journal, i)); 2316e05df3b1SJaegeuk Kim 2317dfc08a12SChao Yu raw_ne = nat_in_journal(journal, i); 23189be32d72SJaegeuk Kim 2319e05df3b1SJaegeuk Kim ne = __lookup_nat_cache(nm_i, nid); 2320e05df3b1SJaegeuk Kim if (!ne) { 23215c9e4184SChao Yu ne = grab_nat_entry(nm_i, nid, true); 232294dac22eSChao Yu node_info_from_raw_nat(&ne->ni, &raw_ne); 23239be32d72SJaegeuk Kim } 232404d47e67SChao Yu 232504d47e67SChao Yu /* 232604d47e67SChao Yu * if a free nat in journal has not been used after last 232704d47e67SChao Yu * checkpoint, we should remove it from available nids, 232804d47e67SChao Yu * since later we will add it again. 232904d47e67SChao Yu */ 233004d47e67SChao Yu if (!get_nat_flag(ne, IS_DIRTY) && 233104d47e67SChao Yu le32_to_cpu(raw_ne.block_addr) == NULL_ADDR) { 233204d47e67SChao Yu spin_lock(&nm_i->nid_list_lock); 233304d47e67SChao Yu nm_i->available_nids--; 233404d47e67SChao Yu spin_unlock(&nm_i->nid_list_lock); 233504d47e67SChao Yu } 233604d47e67SChao Yu 2337e05df3b1SJaegeuk Kim __set_nat_cache_dirty(nm_i, ne); 2338e05df3b1SJaegeuk Kim } 2339dfc08a12SChao Yu update_nats_in_cursum(journal, -i); 2340b7ad7512SChao Yu up_write(&curseg->journal_rwsem); 2341e05df3b1SJaegeuk Kim } 2342e05df3b1SJaegeuk Kim 2343309cc2b6SJaegeuk Kim static void __adjust_nat_entry_set(struct nat_entry_set *nes, 2344309cc2b6SJaegeuk Kim struct list_head *head, int max) 2345e05df3b1SJaegeuk Kim { 2346309cc2b6SJaegeuk Kim struct nat_entry_set *cur; 2347e05df3b1SJaegeuk Kim 2348309cc2b6SJaegeuk Kim if (nes->entry_cnt >= max) 2349309cc2b6SJaegeuk Kim goto add_out; 2350e05df3b1SJaegeuk Kim 2351309cc2b6SJaegeuk Kim list_for_each_entry(cur, head, set_list) { 2352309cc2b6SJaegeuk Kim if (cur->entry_cnt >= nes->entry_cnt) { 2353309cc2b6SJaegeuk Kim list_add(&nes->set_list, cur->set_list.prev); 2354309cc2b6SJaegeuk Kim return; 2355309cc2b6SJaegeuk Kim } 2356309cc2b6SJaegeuk Kim } 2357309cc2b6SJaegeuk Kim add_out: 2358309cc2b6SJaegeuk Kim list_add_tail(&nes->set_list, head); 2359aec71382SChao Yu } 2360aec71382SChao Yu 23619f7e4a2cSJaegeuk Kim static void __update_nat_bits(struct f2fs_sb_info *sbi, nid_t start_nid, 236222ad0b6aSJaegeuk Kim struct page *page) 236322ad0b6aSJaegeuk Kim { 236422ad0b6aSJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 236522ad0b6aSJaegeuk Kim unsigned int nat_index = start_nid / NAT_ENTRY_PER_BLOCK; 236622ad0b6aSJaegeuk Kim struct f2fs_nat_block *nat_blk = page_address(page); 236722ad0b6aSJaegeuk Kim int valid = 0; 236822ad0b6aSJaegeuk Kim int i; 236922ad0b6aSJaegeuk Kim 237022ad0b6aSJaegeuk Kim if (!enabled_nat_bits(sbi, NULL)) 237122ad0b6aSJaegeuk Kim return; 237222ad0b6aSJaegeuk Kim 237322ad0b6aSJaegeuk Kim for (i = 0; i < NAT_ENTRY_PER_BLOCK; i++) { 237422ad0b6aSJaegeuk Kim if (start_nid == 0 && i == 0) 237522ad0b6aSJaegeuk Kim valid++; 237622ad0b6aSJaegeuk Kim if (nat_blk->entries[i].block_addr) 237722ad0b6aSJaegeuk Kim valid++; 237822ad0b6aSJaegeuk Kim } 237922ad0b6aSJaegeuk Kim if (valid == 0) { 238023380b85SJaegeuk Kim __set_bit_le(nat_index, nm_i->empty_nat_bits); 238123380b85SJaegeuk Kim __clear_bit_le(nat_index, nm_i->full_nat_bits); 238222ad0b6aSJaegeuk Kim return; 238322ad0b6aSJaegeuk Kim } 238422ad0b6aSJaegeuk Kim 238523380b85SJaegeuk Kim __clear_bit_le(nat_index, nm_i->empty_nat_bits); 238622ad0b6aSJaegeuk Kim if (valid == NAT_ENTRY_PER_BLOCK) 238723380b85SJaegeuk Kim __set_bit_le(nat_index, nm_i->full_nat_bits); 238822ad0b6aSJaegeuk Kim else 238923380b85SJaegeuk Kim __clear_bit_le(nat_index, nm_i->full_nat_bits); 239022ad0b6aSJaegeuk Kim } 239122ad0b6aSJaegeuk Kim 2392309cc2b6SJaegeuk Kim static void __flush_nat_entry_set(struct f2fs_sb_info *sbi, 239322ad0b6aSJaegeuk Kim struct nat_entry_set *set, struct cp_control *cpc) 2394309cc2b6SJaegeuk Kim { 2395309cc2b6SJaegeuk Kim struct curseg_info *curseg = CURSEG_I(sbi, CURSEG_HOT_DATA); 2396b7ad7512SChao Yu struct f2fs_journal *journal = curseg->journal; 2397309cc2b6SJaegeuk Kim nid_t start_nid = set->set * NAT_ENTRY_PER_BLOCK; 2398309cc2b6SJaegeuk Kim bool to_journal = true; 2399309cc2b6SJaegeuk Kim struct f2fs_nat_block *nat_blk; 2400309cc2b6SJaegeuk Kim struct nat_entry *ne, *cur; 2401309cc2b6SJaegeuk Kim struct page *page = NULL; 2402aec71382SChao Yu 2403aec71382SChao Yu /* 2404aec71382SChao Yu * there are two steps to flush nat entries: 2405aec71382SChao Yu * #1, flush nat entries to journal in current hot data summary block. 2406aec71382SChao Yu * #2, flush nat entries to nat page. 2407aec71382SChao Yu */ 240822ad0b6aSJaegeuk Kim if (enabled_nat_bits(sbi, cpc) || 240922ad0b6aSJaegeuk Kim !__has_cursum_space(journal, set->entry_cnt, NAT_JOURNAL)) 2410aec71382SChao Yu to_journal = false; 2411aec71382SChao Yu 2412aec71382SChao Yu if (to_journal) { 2413b7ad7512SChao Yu down_write(&curseg->journal_rwsem); 2414aec71382SChao Yu } else { 2415e05df3b1SJaegeuk Kim page = get_next_nat_page(sbi, start_nid); 2416e05df3b1SJaegeuk Kim nat_blk = page_address(page); 24179850cf4aSJaegeuk Kim f2fs_bug_on(sbi, !nat_blk); 2418e05df3b1SJaegeuk Kim } 2419e05df3b1SJaegeuk Kim 2420aec71382SChao Yu /* flush dirty nats in nat entry set */ 2421309cc2b6SJaegeuk Kim list_for_each_entry_safe(ne, cur, &set->entry_list, list) { 2422aec71382SChao Yu struct f2fs_nat_entry *raw_ne; 2423aec71382SChao Yu nid_t nid = nat_get_nid(ne); 2424aec71382SChao Yu int offset; 2425aec71382SChao Yu 2426309cc2b6SJaegeuk Kim if (nat_get_blkaddr(ne) == NEW_ADDR) 2427309cc2b6SJaegeuk Kim continue; 2428309cc2b6SJaegeuk Kim 2429aec71382SChao Yu if (to_journal) { 2430dfc08a12SChao Yu offset = lookup_journal_in_cursum(journal, 2431aec71382SChao Yu NAT_JOURNAL, nid, 1); 24329850cf4aSJaegeuk Kim f2fs_bug_on(sbi, offset < 0); 2433dfc08a12SChao Yu raw_ne = &nat_in_journal(journal, offset); 2434dfc08a12SChao Yu nid_in_journal(journal, offset) = cpu_to_le32(nid); 2435aec71382SChao Yu } else { 2436aec71382SChao Yu raw_ne = &nat_blk->entries[nid - start_nid]; 2437aec71382SChao Yu } 2438aec71382SChao Yu raw_nat_from_node_info(raw_ne, &ne->ni); 243988bd02c9SJaegeuk Kim nat_reset_flag(ne); 24400b28b71eSKinglong Mee __clear_nat_cache_dirty(NM_I(sbi), set, ne); 244104d47e67SChao Yu if (nat_get_blkaddr(ne) == NULL_ADDR) { 2442309cc2b6SJaegeuk Kim add_free_nid(sbi, nid, false); 244304d47e67SChao Yu spin_lock(&NM_I(sbi)->nid_list_lock); 244404d47e67SChao Yu NM_I(sbi)->available_nids++; 2445346fe752SChao Yu update_free_nid_bitmap(sbi, nid, true, false); 24464ac91242SChao Yu spin_unlock(&NM_I(sbi)->nid_list_lock); 24474ac91242SChao Yu } else { 24484ac91242SChao Yu spin_lock(&NM_I(sbi)->nid_list_lock); 2449346fe752SChao Yu update_free_nid_bitmap(sbi, nid, false, false); 245004d47e67SChao Yu spin_unlock(&NM_I(sbi)->nid_list_lock); 245104d47e67SChao Yu } 2452e05df3b1SJaegeuk Kim } 2453aec71382SChao Yu 245422ad0b6aSJaegeuk Kim if (to_journal) { 2455b7ad7512SChao Yu up_write(&curseg->journal_rwsem); 245622ad0b6aSJaegeuk Kim } else { 245722ad0b6aSJaegeuk Kim __update_nat_bits(sbi, start_nid, page); 2458e05df3b1SJaegeuk Kim f2fs_put_page(page, 1); 245922ad0b6aSJaegeuk Kim } 2460aec71382SChao Yu 246159c9081bSYunlei He /* Allow dirty nats by node block allocation in write_begin */ 246259c9081bSYunlei He if (!set->entry_cnt) { 2463309cc2b6SJaegeuk Kim radix_tree_delete(&NM_I(sbi)->nat_set_root, set->set); 2464309cc2b6SJaegeuk Kim kmem_cache_free(nat_entry_set_slab, set); 2465309cc2b6SJaegeuk Kim } 246659c9081bSYunlei He } 2467aec71382SChao Yu 2468309cc2b6SJaegeuk Kim /* 2469309cc2b6SJaegeuk Kim * This function is called during the checkpointing process. 2470309cc2b6SJaegeuk Kim */ 247122ad0b6aSJaegeuk Kim void flush_nat_entries(struct f2fs_sb_info *sbi, struct cp_control *cpc) 2472309cc2b6SJaegeuk Kim { 2473309cc2b6SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 2474309cc2b6SJaegeuk Kim struct curseg_info *curseg = CURSEG_I(sbi, CURSEG_HOT_DATA); 2475b7ad7512SChao Yu struct f2fs_journal *journal = curseg->journal; 24767aed0d45SJaegeuk Kim struct nat_entry_set *setvec[SETVEC_SIZE]; 2477309cc2b6SJaegeuk Kim struct nat_entry_set *set, *tmp; 2478309cc2b6SJaegeuk Kim unsigned int found; 2479309cc2b6SJaegeuk Kim nid_t set_idx = 0; 2480309cc2b6SJaegeuk Kim LIST_HEAD(sets); 2481309cc2b6SJaegeuk Kim 248220d047c8SChangman Lee if (!nm_i->dirty_nat_cnt) 248320d047c8SChangman Lee return; 2484a5131193SJaegeuk Kim 2485b873b798SJaegeuk Kim down_write(&nm_i->nat_tree_lock); 2486a5131193SJaegeuk Kim 2487309cc2b6SJaegeuk Kim /* 2488309cc2b6SJaegeuk Kim * if there are no enough space in journal to store dirty nat 2489309cc2b6SJaegeuk Kim * entries, remove all entries from journal and merge them 2490309cc2b6SJaegeuk Kim * into nat entry set. 2491309cc2b6SJaegeuk Kim */ 2492900f7362SJaegeuk Kim if (enabled_nat_bits(sbi, cpc) || 249322ad0b6aSJaegeuk Kim !__has_cursum_space(journal, nm_i->dirty_nat_cnt, NAT_JOURNAL)) 2494309cc2b6SJaegeuk Kim remove_nats_in_journal(sbi); 2495309cc2b6SJaegeuk Kim 2496309cc2b6SJaegeuk Kim while ((found = __gang_lookup_nat_set(nm_i, 24977aed0d45SJaegeuk Kim set_idx, SETVEC_SIZE, setvec))) { 2498309cc2b6SJaegeuk Kim unsigned idx; 2499309cc2b6SJaegeuk Kim set_idx = setvec[found - 1]->set + 1; 2500309cc2b6SJaegeuk Kim for (idx = 0; idx < found; idx++) 2501309cc2b6SJaegeuk Kim __adjust_nat_entry_set(setvec[idx], &sets, 2502dfc08a12SChao Yu MAX_NAT_JENTRIES(journal)); 2503309cc2b6SJaegeuk Kim } 2504309cc2b6SJaegeuk Kim 2505309cc2b6SJaegeuk Kim /* flush dirty nats in nat entry set */ 2506309cc2b6SJaegeuk Kim list_for_each_entry_safe(set, tmp, &sets, set_list) 250722ad0b6aSJaegeuk Kim __flush_nat_entry_set(sbi, set, cpc); 2508309cc2b6SJaegeuk Kim 2509b873b798SJaegeuk Kim up_write(&nm_i->nat_tree_lock); 251059c9081bSYunlei He /* Allow dirty nats by node block allocation in write_begin */ 2511e05df3b1SJaegeuk Kim } 2512e05df3b1SJaegeuk Kim 251322ad0b6aSJaegeuk Kim static int __get_nat_bitmaps(struct f2fs_sb_info *sbi) 251422ad0b6aSJaegeuk Kim { 251522ad0b6aSJaegeuk Kim struct f2fs_checkpoint *ckpt = F2FS_CKPT(sbi); 251622ad0b6aSJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 251722ad0b6aSJaegeuk Kim unsigned int nat_bits_bytes = nm_i->nat_blocks / BITS_PER_BYTE; 251822ad0b6aSJaegeuk Kim unsigned int i; 251922ad0b6aSJaegeuk Kim __u64 cp_ver = cur_cp_version(ckpt); 252022ad0b6aSJaegeuk Kim block_t nat_bits_addr; 252122ad0b6aSJaegeuk Kim 252222ad0b6aSJaegeuk Kim if (!enabled_nat_bits(sbi, NULL)) 252322ad0b6aSJaegeuk Kim return 0; 252422ad0b6aSJaegeuk Kim 252522ad0b6aSJaegeuk Kim nm_i->nat_bits_blocks = F2FS_BYTES_TO_BLK((nat_bits_bytes << 1) + 8 + 252622ad0b6aSJaegeuk Kim F2FS_BLKSIZE - 1); 252722ad0b6aSJaegeuk Kim nm_i->nat_bits = kzalloc(nm_i->nat_bits_blocks << F2FS_BLKSIZE_BITS, 252822ad0b6aSJaegeuk Kim GFP_KERNEL); 252922ad0b6aSJaegeuk Kim if (!nm_i->nat_bits) 253022ad0b6aSJaegeuk Kim return -ENOMEM; 253122ad0b6aSJaegeuk Kim 253222ad0b6aSJaegeuk Kim nat_bits_addr = __start_cp_addr(sbi) + sbi->blocks_per_seg - 253322ad0b6aSJaegeuk Kim nm_i->nat_bits_blocks; 253422ad0b6aSJaegeuk Kim for (i = 0; i < nm_i->nat_bits_blocks; i++) { 253522ad0b6aSJaegeuk Kim struct page *page = get_meta_page(sbi, nat_bits_addr++); 253622ad0b6aSJaegeuk Kim 253722ad0b6aSJaegeuk Kim memcpy(nm_i->nat_bits + (i << F2FS_BLKSIZE_BITS), 253822ad0b6aSJaegeuk Kim page_address(page), F2FS_BLKSIZE); 253922ad0b6aSJaegeuk Kim f2fs_put_page(page, 1); 254022ad0b6aSJaegeuk Kim } 254122ad0b6aSJaegeuk Kim 2542ced2c7eaSKinglong Mee cp_ver |= (cur_cp_crc(ckpt) << 32); 254322ad0b6aSJaegeuk Kim if (cpu_to_le64(cp_ver) != *(__le64 *)nm_i->nat_bits) { 254422ad0b6aSJaegeuk Kim disable_nat_bits(sbi, true); 254522ad0b6aSJaegeuk Kim return 0; 254622ad0b6aSJaegeuk Kim } 254722ad0b6aSJaegeuk Kim 254822ad0b6aSJaegeuk Kim nm_i->full_nat_bits = nm_i->nat_bits + 8; 254922ad0b6aSJaegeuk Kim nm_i->empty_nat_bits = nm_i->full_nat_bits + nat_bits_bytes; 255022ad0b6aSJaegeuk Kim 255122ad0b6aSJaegeuk Kim f2fs_msg(sbi->sb, KERN_NOTICE, "Found nat_bits in checkpoint"); 255222ad0b6aSJaegeuk Kim return 0; 255322ad0b6aSJaegeuk Kim } 255422ad0b6aSJaegeuk Kim 25557041d5d2SChao Yu inline void load_free_nid_bitmap(struct f2fs_sb_info *sbi) 25567041d5d2SChao Yu { 25577041d5d2SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 25587041d5d2SChao Yu unsigned int i = 0; 25597041d5d2SChao Yu nid_t nid, last_nid; 25607041d5d2SChao Yu 25617041d5d2SChao Yu if (!enabled_nat_bits(sbi, NULL)) 25627041d5d2SChao Yu return; 25637041d5d2SChao Yu 25647041d5d2SChao Yu for (i = 0; i < nm_i->nat_blocks; i++) { 25657041d5d2SChao Yu i = find_next_bit_le(nm_i->empty_nat_bits, nm_i->nat_blocks, i); 25667041d5d2SChao Yu if (i >= nm_i->nat_blocks) 25677041d5d2SChao Yu break; 25687041d5d2SChao Yu 25697041d5d2SChao Yu __set_bit_le(i, nm_i->nat_block_bitmap); 25707041d5d2SChao Yu 25717041d5d2SChao Yu nid = i * NAT_ENTRY_PER_BLOCK; 25727041d5d2SChao Yu last_nid = (i + 1) * NAT_ENTRY_PER_BLOCK; 25737041d5d2SChao Yu 2574346fe752SChao Yu spin_lock(&NM_I(sbi)->nid_list_lock); 25757041d5d2SChao Yu for (; nid < last_nid; nid++) 2576346fe752SChao Yu update_free_nid_bitmap(sbi, nid, true, true); 2577346fe752SChao Yu spin_unlock(&NM_I(sbi)->nid_list_lock); 25787041d5d2SChao Yu } 25797041d5d2SChao Yu 25807041d5d2SChao Yu for (i = 0; i < nm_i->nat_blocks; i++) { 25817041d5d2SChao Yu i = find_next_bit_le(nm_i->full_nat_bits, nm_i->nat_blocks, i); 25827041d5d2SChao Yu if (i >= nm_i->nat_blocks) 25837041d5d2SChao Yu break; 25847041d5d2SChao Yu 25857041d5d2SChao Yu __set_bit_le(i, nm_i->nat_block_bitmap); 25867041d5d2SChao Yu } 25877041d5d2SChao Yu } 25887041d5d2SChao Yu 2589e05df3b1SJaegeuk Kim static int init_node_manager(struct f2fs_sb_info *sbi) 2590e05df3b1SJaegeuk Kim { 2591e05df3b1SJaegeuk Kim struct f2fs_super_block *sb_raw = F2FS_RAW_SUPER(sbi); 2592e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 2593e05df3b1SJaegeuk Kim unsigned char *version_bitmap; 259422ad0b6aSJaegeuk Kim unsigned int nat_segs; 259522ad0b6aSJaegeuk Kim int err; 2596e05df3b1SJaegeuk Kim 2597e05df3b1SJaegeuk Kim nm_i->nat_blkaddr = le32_to_cpu(sb_raw->nat_blkaddr); 2598e05df3b1SJaegeuk Kim 2599e05df3b1SJaegeuk Kim /* segment_count_nat includes pair segment so divide to 2. */ 2600e05df3b1SJaegeuk Kim nat_segs = le32_to_cpu(sb_raw->segment_count_nat) >> 1; 260122ad0b6aSJaegeuk Kim nm_i->nat_blocks = nat_segs << le32_to_cpu(sb_raw->log_blocks_per_seg); 260222ad0b6aSJaegeuk Kim nm_i->max_nid = NAT_ENTRY_PER_BLOCK * nm_i->nat_blocks; 26037ee0eeabSJaegeuk Kim 2604b63da15eSJaegeuk Kim /* not used nids: 0, node, meta, (and root counted as valid node) */ 260504d47e67SChao Yu nm_i->available_nids = nm_i->max_nid - sbi->total_valid_node_count - 260604d47e67SChao Yu F2FS_RESERVED_NODE_NUM; 2607b8559dc2SChao Yu nm_i->nid_cnt[FREE_NID_LIST] = 0; 2608b8559dc2SChao Yu nm_i->nid_cnt[ALLOC_NID_LIST] = 0; 2609e05df3b1SJaegeuk Kim nm_i->nat_cnt = 0; 2610cdfc41c1SJaegeuk Kim nm_i->ram_thresh = DEF_RAM_THRESHOLD; 2611ea1a29a0SChao Yu nm_i->ra_nid_pages = DEF_RA_NID_PAGES; 26122304cb0cSChao Yu nm_i->dirty_nats_ratio = DEF_DIRTY_NAT_RATIO_THRESHOLD; 2613e05df3b1SJaegeuk Kim 26148a7ed66aSJaegeuk Kim INIT_RADIX_TREE(&nm_i->free_nid_root, GFP_ATOMIC); 2615b8559dc2SChao Yu INIT_LIST_HEAD(&nm_i->nid_list[FREE_NID_LIST]); 2616b8559dc2SChao Yu INIT_LIST_HEAD(&nm_i->nid_list[ALLOC_NID_LIST]); 2617769ec6e5SJaegeuk Kim INIT_RADIX_TREE(&nm_i->nat_root, GFP_NOIO); 2618769ec6e5SJaegeuk Kim INIT_RADIX_TREE(&nm_i->nat_set_root, GFP_NOIO); 2619e05df3b1SJaegeuk Kim INIT_LIST_HEAD(&nm_i->nat_entries); 2620e05df3b1SJaegeuk Kim 2621e05df3b1SJaegeuk Kim mutex_init(&nm_i->build_lock); 2622b8559dc2SChao Yu spin_lock_init(&nm_i->nid_list_lock); 2623b873b798SJaegeuk Kim init_rwsem(&nm_i->nat_tree_lock); 2624e05df3b1SJaegeuk Kim 2625e05df3b1SJaegeuk Kim nm_i->next_scan_nid = le32_to_cpu(sbi->ckpt->next_free_nid); 262679b5793bSAlexandru Gheorghiu nm_i->bitmap_size = __bitmap_size(sbi, NAT_BITMAP); 2627e05df3b1SJaegeuk Kim version_bitmap = __bitmap_ptr(sbi, NAT_BITMAP); 2628e05df3b1SJaegeuk Kim if (!version_bitmap) 2629e05df3b1SJaegeuk Kim return -EFAULT; 2630e05df3b1SJaegeuk Kim 263179b5793bSAlexandru Gheorghiu nm_i->nat_bitmap = kmemdup(version_bitmap, nm_i->bitmap_size, 263279b5793bSAlexandru Gheorghiu GFP_KERNEL); 263379b5793bSAlexandru Gheorghiu if (!nm_i->nat_bitmap) 263479b5793bSAlexandru Gheorghiu return -ENOMEM; 2635599a09b2SChao Yu 263622ad0b6aSJaegeuk Kim err = __get_nat_bitmaps(sbi); 263722ad0b6aSJaegeuk Kim if (err) 263822ad0b6aSJaegeuk Kim return err; 263922ad0b6aSJaegeuk Kim 2640599a09b2SChao Yu #ifdef CONFIG_F2FS_CHECK_FS 2641599a09b2SChao Yu nm_i->nat_bitmap_mir = kmemdup(version_bitmap, nm_i->bitmap_size, 2642599a09b2SChao Yu GFP_KERNEL); 2643599a09b2SChao Yu if (!nm_i->nat_bitmap_mir) 2644599a09b2SChao Yu return -ENOMEM; 2645599a09b2SChao Yu #endif 2646599a09b2SChao Yu 2647e05df3b1SJaegeuk Kim return 0; 2648e05df3b1SJaegeuk Kim } 2649e05df3b1SJaegeuk Kim 26509f7e4a2cSJaegeuk Kim static int init_free_nid_cache(struct f2fs_sb_info *sbi) 26514ac91242SChao Yu { 26524ac91242SChao Yu struct f2fs_nm_info *nm_i = NM_I(sbi); 26534ac91242SChao Yu 26544ac91242SChao Yu nm_i->free_nid_bitmap = f2fs_kvzalloc(nm_i->nat_blocks * 26554ac91242SChao Yu NAT_ENTRY_BITMAP_SIZE, GFP_KERNEL); 26564ac91242SChao Yu if (!nm_i->free_nid_bitmap) 26574ac91242SChao Yu return -ENOMEM; 26584ac91242SChao Yu 26594ac91242SChao Yu nm_i->nat_block_bitmap = f2fs_kvzalloc(nm_i->nat_blocks / 8, 26604ac91242SChao Yu GFP_KERNEL); 26614ac91242SChao Yu if (!nm_i->nat_block_bitmap) 26624ac91242SChao Yu return -ENOMEM; 2663586d1492SChao Yu 2664586d1492SChao Yu nm_i->free_nid_count = f2fs_kvzalloc(nm_i->nat_blocks * 2665586d1492SChao Yu sizeof(unsigned short), GFP_KERNEL); 2666586d1492SChao Yu if (!nm_i->free_nid_count) 2667586d1492SChao Yu return -ENOMEM; 26684ac91242SChao Yu return 0; 26694ac91242SChao Yu } 26704ac91242SChao Yu 2671e05df3b1SJaegeuk Kim int build_node_manager(struct f2fs_sb_info *sbi) 2672e05df3b1SJaegeuk Kim { 2673e05df3b1SJaegeuk Kim int err; 2674e05df3b1SJaegeuk Kim 2675e05df3b1SJaegeuk Kim sbi->nm_info = kzalloc(sizeof(struct f2fs_nm_info), GFP_KERNEL); 2676e05df3b1SJaegeuk Kim if (!sbi->nm_info) 2677e05df3b1SJaegeuk Kim return -ENOMEM; 2678e05df3b1SJaegeuk Kim 2679e05df3b1SJaegeuk Kim err = init_node_manager(sbi); 2680e05df3b1SJaegeuk Kim if (err) 2681e05df3b1SJaegeuk Kim return err; 2682e05df3b1SJaegeuk Kim 26834ac91242SChao Yu err = init_free_nid_cache(sbi); 26844ac91242SChao Yu if (err) 26854ac91242SChao Yu return err; 26864ac91242SChao Yu 26877041d5d2SChao Yu /* load free nid status from nat_bits table */ 26887041d5d2SChao Yu load_free_nid_bitmap(sbi); 26897041d5d2SChao Yu 269022ad0b6aSJaegeuk Kim build_free_nids(sbi, true, true); 2691e05df3b1SJaegeuk Kim return 0; 2692e05df3b1SJaegeuk Kim } 2693e05df3b1SJaegeuk Kim 2694e05df3b1SJaegeuk Kim void destroy_node_manager(struct f2fs_sb_info *sbi) 2695e05df3b1SJaegeuk Kim { 2696e05df3b1SJaegeuk Kim struct f2fs_nm_info *nm_i = NM_I(sbi); 2697e05df3b1SJaegeuk Kim struct free_nid *i, *next_i; 2698e05df3b1SJaegeuk Kim struct nat_entry *natvec[NATVEC_SIZE]; 26997aed0d45SJaegeuk Kim struct nat_entry_set *setvec[SETVEC_SIZE]; 2700e05df3b1SJaegeuk Kim nid_t nid = 0; 2701e05df3b1SJaegeuk Kim unsigned int found; 2702e05df3b1SJaegeuk Kim 2703e05df3b1SJaegeuk Kim if (!nm_i) 2704e05df3b1SJaegeuk Kim return; 2705e05df3b1SJaegeuk Kim 2706e05df3b1SJaegeuk Kim /* destroy free nid list */ 2707b8559dc2SChao Yu spin_lock(&nm_i->nid_list_lock); 2708b8559dc2SChao Yu list_for_each_entry_safe(i, next_i, &nm_i->nid_list[FREE_NID_LIST], 2709b8559dc2SChao Yu list) { 2710eb0aa4b8SJaegeuk Kim __remove_nid_from_list(sbi, i, FREE_NID_LIST, false); 2711b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 2712cf0ee0f0SChao Yu kmem_cache_free(free_nid_slab, i); 2713b8559dc2SChao Yu spin_lock(&nm_i->nid_list_lock); 2714e05df3b1SJaegeuk Kim } 2715b8559dc2SChao Yu f2fs_bug_on(sbi, nm_i->nid_cnt[FREE_NID_LIST]); 2716b8559dc2SChao Yu f2fs_bug_on(sbi, nm_i->nid_cnt[ALLOC_NID_LIST]); 2717b8559dc2SChao Yu f2fs_bug_on(sbi, !list_empty(&nm_i->nid_list[ALLOC_NID_LIST])); 2718b8559dc2SChao Yu spin_unlock(&nm_i->nid_list_lock); 2719e05df3b1SJaegeuk Kim 2720e05df3b1SJaegeuk Kim /* destroy nat cache */ 2721b873b798SJaegeuk Kim down_write(&nm_i->nat_tree_lock); 2722e05df3b1SJaegeuk Kim while ((found = __gang_lookup_nat_cache(nm_i, 2723e05df3b1SJaegeuk Kim nid, NATVEC_SIZE, natvec))) { 2724e05df3b1SJaegeuk Kim unsigned idx; 27257aed0d45SJaegeuk Kim 2726b6ce391eSGu Zheng nid = nat_get_nid(natvec[found - 1]) + 1; 2727b6ce391eSGu Zheng for (idx = 0; idx < found; idx++) 2728b6ce391eSGu Zheng __del_from_nat_cache(nm_i, natvec[idx]); 2729e05df3b1SJaegeuk Kim } 27309850cf4aSJaegeuk Kim f2fs_bug_on(sbi, nm_i->nat_cnt); 27317aed0d45SJaegeuk Kim 27327aed0d45SJaegeuk Kim /* destroy nat set cache */ 27337aed0d45SJaegeuk Kim nid = 0; 27347aed0d45SJaegeuk Kim while ((found = __gang_lookup_nat_set(nm_i, 27357aed0d45SJaegeuk Kim nid, SETVEC_SIZE, setvec))) { 27367aed0d45SJaegeuk Kim unsigned idx; 27377aed0d45SJaegeuk Kim 27387aed0d45SJaegeuk Kim nid = setvec[found - 1]->set + 1; 27397aed0d45SJaegeuk Kim for (idx = 0; idx < found; idx++) { 27407aed0d45SJaegeuk Kim /* entry_cnt is not zero, when cp_error was occurred */ 27417aed0d45SJaegeuk Kim f2fs_bug_on(sbi, !list_empty(&setvec[idx]->entry_list)); 27427aed0d45SJaegeuk Kim radix_tree_delete(&nm_i->nat_set_root, setvec[idx]->set); 27437aed0d45SJaegeuk Kim kmem_cache_free(nat_entry_set_slab, setvec[idx]); 27447aed0d45SJaegeuk Kim } 27457aed0d45SJaegeuk Kim } 2746b873b798SJaegeuk Kim up_write(&nm_i->nat_tree_lock); 2747e05df3b1SJaegeuk Kim 27484ac91242SChao Yu kvfree(nm_i->nat_block_bitmap); 27494ac91242SChao Yu kvfree(nm_i->free_nid_bitmap); 2750586d1492SChao Yu kvfree(nm_i->free_nid_count); 27514ac91242SChao Yu 2752e05df3b1SJaegeuk Kim kfree(nm_i->nat_bitmap); 275322ad0b6aSJaegeuk Kim kfree(nm_i->nat_bits); 2754599a09b2SChao Yu #ifdef CONFIG_F2FS_CHECK_FS 2755599a09b2SChao Yu kfree(nm_i->nat_bitmap_mir); 2756599a09b2SChao Yu #endif 2757e05df3b1SJaegeuk Kim sbi->nm_info = NULL; 2758e05df3b1SJaegeuk Kim kfree(nm_i); 2759e05df3b1SJaegeuk Kim } 2760e05df3b1SJaegeuk Kim 27616e6093a8SNamjae Jeon int __init create_node_manager_caches(void) 2762e05df3b1SJaegeuk Kim { 2763e05df3b1SJaegeuk Kim nat_entry_slab = f2fs_kmem_cache_create("nat_entry", 2764e8512d2eSGu Zheng sizeof(struct nat_entry)); 2765e05df3b1SJaegeuk Kim if (!nat_entry_slab) 2766aec71382SChao Yu goto fail; 2767e05df3b1SJaegeuk Kim 2768e05df3b1SJaegeuk Kim free_nid_slab = f2fs_kmem_cache_create("free_nid", 2769e8512d2eSGu Zheng sizeof(struct free_nid)); 2770aec71382SChao Yu if (!free_nid_slab) 2771ce3e6d25SMarkus Elfring goto destroy_nat_entry; 2772aec71382SChao Yu 2773aec71382SChao Yu nat_entry_set_slab = f2fs_kmem_cache_create("nat_entry_set", 2774aec71382SChao Yu sizeof(struct nat_entry_set)); 2775aec71382SChao Yu if (!nat_entry_set_slab) 2776ce3e6d25SMarkus Elfring goto destroy_free_nid; 2777e05df3b1SJaegeuk Kim return 0; 2778aec71382SChao Yu 2779ce3e6d25SMarkus Elfring destroy_free_nid: 2780aec71382SChao Yu kmem_cache_destroy(free_nid_slab); 2781ce3e6d25SMarkus Elfring destroy_nat_entry: 2782aec71382SChao Yu kmem_cache_destroy(nat_entry_slab); 2783aec71382SChao Yu fail: 2784aec71382SChao Yu return -ENOMEM; 2785e05df3b1SJaegeuk Kim } 2786e05df3b1SJaegeuk Kim 2787e05df3b1SJaegeuk Kim void destroy_node_manager_caches(void) 2788e05df3b1SJaegeuk Kim { 2789aec71382SChao Yu kmem_cache_destroy(nat_entry_set_slab); 2790e05df3b1SJaegeuk Kim kmem_cache_destroy(free_nid_slab); 2791e05df3b1SJaegeuk Kim kmem_cache_destroy(nat_entry_slab); 2792e05df3b1SJaegeuk Kim } 2793