xref: /openbmc/linux/fs/f2fs/node.c (revision 1f258ec1)
10a8165d7SJaegeuk Kim /*
2e05df3b1SJaegeuk Kim  * fs/f2fs/node.c
3e05df3b1SJaegeuk Kim  *
4e05df3b1SJaegeuk Kim  * Copyright (c) 2012 Samsung Electronics Co., Ltd.
5e05df3b1SJaegeuk Kim  *             http://www.samsung.com/
6e05df3b1SJaegeuk Kim  *
7e05df3b1SJaegeuk Kim  * This program is free software; you can redistribute it and/or modify
8e05df3b1SJaegeuk Kim  * it under the terms of the GNU General Public License version 2 as
9e05df3b1SJaegeuk Kim  * published by the Free Software Foundation.
10e05df3b1SJaegeuk Kim  */
11e05df3b1SJaegeuk Kim #include <linux/fs.h>
12e05df3b1SJaegeuk Kim #include <linux/f2fs_fs.h>
13e05df3b1SJaegeuk Kim #include <linux/mpage.h>
14e05df3b1SJaegeuk Kim #include <linux/backing-dev.h>
15e05df3b1SJaegeuk Kim #include <linux/blkdev.h>
16e05df3b1SJaegeuk Kim #include <linux/pagevec.h>
17e05df3b1SJaegeuk Kim #include <linux/swap.h>
18e05df3b1SJaegeuk Kim 
19e05df3b1SJaegeuk Kim #include "f2fs.h"
20e05df3b1SJaegeuk Kim #include "node.h"
21e05df3b1SJaegeuk Kim #include "segment.h"
229e4ded3fSJaegeuk Kim #include "trace.h"
2351dd6249SNamjae Jeon #include <trace/events/f2fs.h>
24e05df3b1SJaegeuk Kim 
/*
 * Evaluates to non-zero while the build_lock mutex of the node manager
 * passed as @nmi is held.
 *
 * The expansion refers to the macro argument itself, so it works with any
 * pointer expression and does not depend on a variable called "nm_i"
 * happening to exist in the caller's scope.
 */
#define on_build_free_nids(nmi) mutex_is_locked(&(nmi)->build_lock)

/*
 * Slab caches used by the node manager.
 * nat_entry_slab backs struct nat_entry and nat_entry_set_slab backs
 * struct nat_entry_set; free_nid_slab presumably backs struct free_nid
 * (its users are not in this part of the file - confirm).
 */
static struct kmem_cache *nat_entry_slab;
static struct kmem_cache *free_nid_slab;
static struct kmem_cache *nat_entry_set_slab;
30e05df3b1SJaegeuk Kim 
316fb03f3aSJaegeuk Kim bool available_free_memory(struct f2fs_sb_info *sbi, int type)
32cdfc41c1SJaegeuk Kim {
336fb03f3aSJaegeuk Kim 	struct f2fs_nm_info *nm_i = NM_I(sbi);
34cdfc41c1SJaegeuk Kim 	struct sysinfo val;
35e5e7ea3cSJaegeuk Kim 	unsigned long avail_ram;
36cdfc41c1SJaegeuk Kim 	unsigned long mem_size = 0;
376fb03f3aSJaegeuk Kim 	bool res = false;
38cdfc41c1SJaegeuk Kim 
39cdfc41c1SJaegeuk Kim 	si_meminfo(&val);
40e5e7ea3cSJaegeuk Kim 
41e5e7ea3cSJaegeuk Kim 	/* only uses low memory */
42e5e7ea3cSJaegeuk Kim 	avail_ram = val.totalram - val.totalhigh;
43e5e7ea3cSJaegeuk Kim 
44429511cdSChao Yu 	/*
45429511cdSChao Yu 	 * give 25%, 25%, 50%, 50%, 50% memory for each components respectively
46429511cdSChao Yu 	 */
476fb03f3aSJaegeuk Kim 	if (type == FREE_NIDS) {
48b8559dc2SChao Yu 		mem_size = (nm_i->nid_cnt[FREE_NID_LIST] *
49b8559dc2SChao Yu 				sizeof(struct free_nid)) >> PAGE_SHIFT;
50e5e7ea3cSJaegeuk Kim 		res = mem_size < ((avail_ram * nm_i->ram_thresh / 100) >> 2);
516fb03f3aSJaegeuk Kim 	} else if (type == NAT_ENTRIES) {
52e5e7ea3cSJaegeuk Kim 		mem_size = (nm_i->nat_cnt * sizeof(struct nat_entry)) >>
5309cbfeafSKirill A. Shutemov 							PAGE_SHIFT;
54e5e7ea3cSJaegeuk Kim 		res = mem_size < ((avail_ram * nm_i->ram_thresh / 100) >> 2);
55e589c2c4SJaegeuk Kim 		if (excess_cached_nats(sbi))
56e589c2c4SJaegeuk Kim 			res = false;
57a1257023SJaegeuk Kim 	} else if (type == DIRTY_DENTS) {
58a1257023SJaegeuk Kim 		if (sbi->sb->s_bdi->wb.dirty_exceeded)
59a1257023SJaegeuk Kim 			return false;
60a1257023SJaegeuk Kim 		mem_size = get_pages(sbi, F2FS_DIRTY_DENTS);
61a1257023SJaegeuk Kim 		res = mem_size < ((avail_ram * nm_i->ram_thresh / 100) >> 1);
62e5e7ea3cSJaegeuk Kim 	} else if (type == INO_ENTRIES) {
63e5e7ea3cSJaegeuk Kim 		int i;
64e5e7ea3cSJaegeuk Kim 
65e5e7ea3cSJaegeuk Kim 		for (i = 0; i <= UPDATE_INO; i++)
668f73cbb7SKinglong Mee 			mem_size += sbi->im[i].ino_num *
678f73cbb7SKinglong Mee 						sizeof(struct ino_entry);
688f73cbb7SKinglong Mee 		mem_size >>= PAGE_SHIFT;
69e5e7ea3cSJaegeuk Kim 		res = mem_size < ((avail_ram * nm_i->ram_thresh / 100) >> 1);
70429511cdSChao Yu 	} else if (type == EXTENT_CACHE) {
717441ccefSJaegeuk Kim 		mem_size = (atomic_read(&sbi->total_ext_tree) *
727441ccefSJaegeuk Kim 				sizeof(struct extent_tree) +
73429511cdSChao Yu 				atomic_read(&sbi->total_ext_node) *
7409cbfeafSKirill A. Shutemov 				sizeof(struct extent_node)) >> PAGE_SHIFT;
75429511cdSChao Yu 		res = mem_size < ((avail_ram * nm_i->ram_thresh / 100) >> 1);
761e84371fSJaegeuk Kim 	} else {
771663cae4SJaegeuk Kim 		if (!sbi->sb->s_bdi->wb.dirty_exceeded)
781663cae4SJaegeuk Kim 			return true;
796fb03f3aSJaegeuk Kim 	}
806fb03f3aSJaegeuk Kim 	return res;
81cdfc41c1SJaegeuk Kim }
82cdfc41c1SJaegeuk Kim 
83e05df3b1SJaegeuk Kim static void clear_node_page_dirty(struct page *page)
84e05df3b1SJaegeuk Kim {
85e05df3b1SJaegeuk Kim 	struct address_space *mapping = page->mapping;
86e05df3b1SJaegeuk Kim 	unsigned int long flags;
87e05df3b1SJaegeuk Kim 
88e05df3b1SJaegeuk Kim 	if (PageDirty(page)) {
89e05df3b1SJaegeuk Kim 		spin_lock_irqsave(&mapping->tree_lock, flags);
90e05df3b1SJaegeuk Kim 		radix_tree_tag_clear(&mapping->page_tree,
91e05df3b1SJaegeuk Kim 				page_index(page),
92e05df3b1SJaegeuk Kim 				PAGECACHE_TAG_DIRTY);
93e05df3b1SJaegeuk Kim 		spin_unlock_irqrestore(&mapping->tree_lock, flags);
94e05df3b1SJaegeuk Kim 
95e05df3b1SJaegeuk Kim 		clear_page_dirty_for_io(page);
964081363fSJaegeuk Kim 		dec_page_count(F2FS_M_SB(mapping), F2FS_DIRTY_NODES);
97e05df3b1SJaegeuk Kim 	}
98e05df3b1SJaegeuk Kim 	ClearPageUptodate(page);
99e05df3b1SJaegeuk Kim }
100e05df3b1SJaegeuk Kim 
101e05df3b1SJaegeuk Kim static struct page *get_current_nat_page(struct f2fs_sb_info *sbi, nid_t nid)
102e05df3b1SJaegeuk Kim {
103e05df3b1SJaegeuk Kim 	pgoff_t index = current_nat_addr(sbi, nid);
104e05df3b1SJaegeuk Kim 	return get_meta_page(sbi, index);
105e05df3b1SJaegeuk Kim }
106e05df3b1SJaegeuk Kim 
107e05df3b1SJaegeuk Kim static struct page *get_next_nat_page(struct f2fs_sb_info *sbi, nid_t nid)
108e05df3b1SJaegeuk Kim {
109e05df3b1SJaegeuk Kim 	struct page *src_page;
110e05df3b1SJaegeuk Kim 	struct page *dst_page;
111e05df3b1SJaegeuk Kim 	pgoff_t src_off;
112e05df3b1SJaegeuk Kim 	pgoff_t dst_off;
113e05df3b1SJaegeuk Kim 	void *src_addr;
114e05df3b1SJaegeuk Kim 	void *dst_addr;
115e05df3b1SJaegeuk Kim 	struct f2fs_nm_info *nm_i = NM_I(sbi);
116e05df3b1SJaegeuk Kim 
117e05df3b1SJaegeuk Kim 	src_off = current_nat_addr(sbi, nid);
118e05df3b1SJaegeuk Kim 	dst_off = next_nat_addr(sbi, src_off);
119e05df3b1SJaegeuk Kim 
120e05df3b1SJaegeuk Kim 	/* get current nat block page with lock */
121e05df3b1SJaegeuk Kim 	src_page = get_meta_page(sbi, src_off);
122e05df3b1SJaegeuk Kim 	dst_page = grab_meta_page(sbi, dst_off);
1239850cf4aSJaegeuk Kim 	f2fs_bug_on(sbi, PageDirty(src_page));
124e05df3b1SJaegeuk Kim 
125e05df3b1SJaegeuk Kim 	src_addr = page_address(src_page);
126e05df3b1SJaegeuk Kim 	dst_addr = page_address(dst_page);
12709cbfeafSKirill A. Shutemov 	memcpy(dst_addr, src_addr, PAGE_SIZE);
128e05df3b1SJaegeuk Kim 	set_page_dirty(dst_page);
129e05df3b1SJaegeuk Kim 	f2fs_put_page(src_page, 1);
130e05df3b1SJaegeuk Kim 
131e05df3b1SJaegeuk Kim 	set_to_next_nat(nm_i, nid);
132e05df3b1SJaegeuk Kim 
133e05df3b1SJaegeuk Kim 	return dst_page;
134e05df3b1SJaegeuk Kim }
135e05df3b1SJaegeuk Kim 
136e05df3b1SJaegeuk Kim static struct nat_entry *__lookup_nat_cache(struct f2fs_nm_info *nm_i, nid_t n)
137e05df3b1SJaegeuk Kim {
138e05df3b1SJaegeuk Kim 	return radix_tree_lookup(&nm_i->nat_root, n);
139e05df3b1SJaegeuk Kim }
140e05df3b1SJaegeuk Kim 
141e05df3b1SJaegeuk Kim static unsigned int __gang_lookup_nat_cache(struct f2fs_nm_info *nm_i,
142e05df3b1SJaegeuk Kim 		nid_t start, unsigned int nr, struct nat_entry **ep)
143e05df3b1SJaegeuk Kim {
144e05df3b1SJaegeuk Kim 	return radix_tree_gang_lookup(&nm_i->nat_root, (void **)ep, start, nr);
145e05df3b1SJaegeuk Kim }
146e05df3b1SJaegeuk Kim 
147e05df3b1SJaegeuk Kim static void __del_from_nat_cache(struct f2fs_nm_info *nm_i, struct nat_entry *e)
148e05df3b1SJaegeuk Kim {
149e05df3b1SJaegeuk Kim 	list_del(&e->list);
150e05df3b1SJaegeuk Kim 	radix_tree_delete(&nm_i->nat_root, nat_get_nid(e));
151e05df3b1SJaegeuk Kim 	nm_i->nat_cnt--;
152e05df3b1SJaegeuk Kim 	kmem_cache_free(nat_entry_slab, e);
153e05df3b1SJaegeuk Kim }
154e05df3b1SJaegeuk Kim 
155309cc2b6SJaegeuk Kim static void __set_nat_cache_dirty(struct f2fs_nm_info *nm_i,
156309cc2b6SJaegeuk Kim 						struct nat_entry *ne)
157309cc2b6SJaegeuk Kim {
158309cc2b6SJaegeuk Kim 	nid_t set = NAT_BLOCK_OFFSET(ne->ni.nid);
159309cc2b6SJaegeuk Kim 	struct nat_entry_set *head;
160309cc2b6SJaegeuk Kim 
161309cc2b6SJaegeuk Kim 	head = radix_tree_lookup(&nm_i->nat_set_root, set);
162309cc2b6SJaegeuk Kim 	if (!head) {
16380c54505SJaegeuk Kim 		head = f2fs_kmem_cache_alloc(nat_entry_set_slab, GFP_NOFS);
164309cc2b6SJaegeuk Kim 
165309cc2b6SJaegeuk Kim 		INIT_LIST_HEAD(&head->entry_list);
166309cc2b6SJaegeuk Kim 		INIT_LIST_HEAD(&head->set_list);
167309cc2b6SJaegeuk Kim 		head->set = set;
168309cc2b6SJaegeuk Kim 		head->entry_cnt = 0;
1699be32d72SJaegeuk Kim 		f2fs_radix_tree_insert(&nm_i->nat_set_root, set, head);
170309cc2b6SJaegeuk Kim 	}
171febeca6dSChao Yu 
172febeca6dSChao Yu 	if (get_nat_flag(ne, IS_DIRTY))
173febeca6dSChao Yu 		goto refresh_list;
174febeca6dSChao Yu 
175309cc2b6SJaegeuk Kim 	nm_i->dirty_nat_cnt++;
176309cc2b6SJaegeuk Kim 	head->entry_cnt++;
177309cc2b6SJaegeuk Kim 	set_nat_flag(ne, IS_DIRTY, true);
178febeca6dSChao Yu refresh_list:
179febeca6dSChao Yu 	if (nat_get_blkaddr(ne) == NEW_ADDR)
180febeca6dSChao Yu 		list_del_init(&ne->list);
181febeca6dSChao Yu 	else
182febeca6dSChao Yu 		list_move_tail(&ne->list, &head->entry_list);
183309cc2b6SJaegeuk Kim }
184309cc2b6SJaegeuk Kim 
185309cc2b6SJaegeuk Kim static void __clear_nat_cache_dirty(struct f2fs_nm_info *nm_i,
1860b28b71eSKinglong Mee 		struct nat_entry_set *set, struct nat_entry *ne)
187309cc2b6SJaegeuk Kim {
188309cc2b6SJaegeuk Kim 	list_move_tail(&ne->list, &nm_i->nat_entries);
189309cc2b6SJaegeuk Kim 	set_nat_flag(ne, IS_DIRTY, false);
1900b28b71eSKinglong Mee 	set->entry_cnt--;
191309cc2b6SJaegeuk Kim 	nm_i->dirty_nat_cnt--;
192309cc2b6SJaegeuk Kim }
193309cc2b6SJaegeuk Kim 
194309cc2b6SJaegeuk Kim static unsigned int __gang_lookup_nat_set(struct f2fs_nm_info *nm_i,
195309cc2b6SJaegeuk Kim 		nid_t start, unsigned int nr, struct nat_entry_set **ep)
196309cc2b6SJaegeuk Kim {
197309cc2b6SJaegeuk Kim 	return radix_tree_gang_lookup(&nm_i->nat_set_root, (void **)ep,
198309cc2b6SJaegeuk Kim 							start, nr);
199309cc2b6SJaegeuk Kim }
200309cc2b6SJaegeuk Kim 
2012dcf51abSJaegeuk Kim int need_dentry_mark(struct f2fs_sb_info *sbi, nid_t nid)
2022dcf51abSJaegeuk Kim {
2032dcf51abSJaegeuk Kim 	struct f2fs_nm_info *nm_i = NM_I(sbi);
2042dcf51abSJaegeuk Kim 	struct nat_entry *e;
2052dcf51abSJaegeuk Kim 	bool need = false;
2062dcf51abSJaegeuk Kim 
207b873b798SJaegeuk Kim 	down_read(&nm_i->nat_tree_lock);
2082dcf51abSJaegeuk Kim 	e = __lookup_nat_cache(nm_i, nid);
2092dcf51abSJaegeuk Kim 	if (e) {
2102dcf51abSJaegeuk Kim 		if (!get_nat_flag(e, IS_CHECKPOINTED) &&
2112dcf51abSJaegeuk Kim 				!get_nat_flag(e, HAS_FSYNCED_INODE))
2122dcf51abSJaegeuk Kim 			need = true;
2132dcf51abSJaegeuk Kim 	}
214b873b798SJaegeuk Kim 	up_read(&nm_i->nat_tree_lock);
2152dcf51abSJaegeuk Kim 	return need;
2162dcf51abSJaegeuk Kim }
2172dcf51abSJaegeuk Kim 
21888bd02c9SJaegeuk Kim bool is_checkpointed_node(struct f2fs_sb_info *sbi, nid_t nid)
219e05df3b1SJaegeuk Kim {
220e05df3b1SJaegeuk Kim 	struct f2fs_nm_info *nm_i = NM_I(sbi);
221e05df3b1SJaegeuk Kim 	struct nat_entry *e;
22288bd02c9SJaegeuk Kim 	bool is_cp = true;
223e05df3b1SJaegeuk Kim 
224b873b798SJaegeuk Kim 	down_read(&nm_i->nat_tree_lock);
225e05df3b1SJaegeuk Kim 	e = __lookup_nat_cache(nm_i, nid);
2267ef35e3bSJaegeuk Kim 	if (e && !get_nat_flag(e, IS_CHECKPOINTED))
22788bd02c9SJaegeuk Kim 		is_cp = false;
228b873b798SJaegeuk Kim 	up_read(&nm_i->nat_tree_lock);
229e05df3b1SJaegeuk Kim 	return is_cp;
230e05df3b1SJaegeuk Kim }
231e05df3b1SJaegeuk Kim 
23288bd02c9SJaegeuk Kim bool need_inode_block_update(struct f2fs_sb_info *sbi, nid_t ino)
233b6fe5873SJaegeuk Kim {
234b6fe5873SJaegeuk Kim 	struct f2fs_nm_info *nm_i = NM_I(sbi);
235b6fe5873SJaegeuk Kim 	struct nat_entry *e;
23688bd02c9SJaegeuk Kim 	bool need_update = true;
237b6fe5873SJaegeuk Kim 
238b873b798SJaegeuk Kim 	down_read(&nm_i->nat_tree_lock);
23988bd02c9SJaegeuk Kim 	e = __lookup_nat_cache(nm_i, ino);
24088bd02c9SJaegeuk Kim 	if (e && get_nat_flag(e, HAS_LAST_FSYNC) &&
24188bd02c9SJaegeuk Kim 			(get_nat_flag(e, IS_CHECKPOINTED) ||
24288bd02c9SJaegeuk Kim 			 get_nat_flag(e, HAS_FSYNCED_INODE)))
24388bd02c9SJaegeuk Kim 		need_update = false;
244b873b798SJaegeuk Kim 	up_read(&nm_i->nat_tree_lock);
24588bd02c9SJaegeuk Kim 	return need_update;
246b6fe5873SJaegeuk Kim }
247b6fe5873SJaegeuk Kim 
2485c9e4184SChao Yu static struct nat_entry *grab_nat_entry(struct f2fs_nm_info *nm_i, nid_t nid,
2495c9e4184SChao Yu 								bool no_fail)
250e05df3b1SJaegeuk Kim {
251e05df3b1SJaegeuk Kim 	struct nat_entry *new;
252e05df3b1SJaegeuk Kim 
2535c9e4184SChao Yu 	if (no_fail) {
25480c54505SJaegeuk Kim 		new = f2fs_kmem_cache_alloc(nat_entry_slab, GFP_NOFS);
2559be32d72SJaegeuk Kim 		f2fs_radix_tree_insert(&nm_i->nat_root, nid, new);
2565c9e4184SChao Yu 	} else {
2575c9e4184SChao Yu 		new = kmem_cache_alloc(nat_entry_slab, GFP_NOFS);
2585c9e4184SChao Yu 		if (!new)
2595c9e4184SChao Yu 			return NULL;
2605c9e4184SChao Yu 		if (radix_tree_insert(&nm_i->nat_root, nid, new)) {
2615c9e4184SChao Yu 			kmem_cache_free(nat_entry_slab, new);
2625c9e4184SChao Yu 			return NULL;
2635c9e4184SChao Yu 		}
2645c9e4184SChao Yu 	}
2655c9e4184SChao Yu 
266e05df3b1SJaegeuk Kim 	memset(new, 0, sizeof(struct nat_entry));
267e05df3b1SJaegeuk Kim 	nat_set_nid(new, nid);
26888bd02c9SJaegeuk Kim 	nat_reset_flag(new);
269e05df3b1SJaegeuk Kim 	list_add_tail(&new->list, &nm_i->nat_entries);
270e05df3b1SJaegeuk Kim 	nm_i->nat_cnt++;
271e05df3b1SJaegeuk Kim 	return new;
272e05df3b1SJaegeuk Kim }
273e05df3b1SJaegeuk Kim 
2741515aef0SChao Yu static void cache_nat_entry(struct f2fs_sb_info *sbi, nid_t nid,
275e05df3b1SJaegeuk Kim 						struct f2fs_nat_entry *ne)
276e05df3b1SJaegeuk Kim {
2771515aef0SChao Yu 	struct f2fs_nm_info *nm_i = NM_I(sbi);
278e05df3b1SJaegeuk Kim 	struct nat_entry *e;
2799be32d72SJaegeuk Kim 
280e05df3b1SJaegeuk Kim 	e = __lookup_nat_cache(nm_i, nid);
281e05df3b1SJaegeuk Kim 	if (!e) {
2825c9e4184SChao Yu 		e = grab_nat_entry(nm_i, nid, false);
2835c9e4184SChao Yu 		if (e)
28494dac22eSChao Yu 			node_info_from_raw_nat(&e->ni, ne);
2851515aef0SChao Yu 	} else {
2860c0b471eSEric Biggers 		f2fs_bug_on(sbi, nat_get_ino(e) != le32_to_cpu(ne->ino) ||
2870c0b471eSEric Biggers 				nat_get_blkaddr(e) !=
2880c0b471eSEric Biggers 					le32_to_cpu(ne->block_addr) ||
2891515aef0SChao Yu 				nat_get_version(e) != ne->version);
290e05df3b1SJaegeuk Kim 	}
291e05df3b1SJaegeuk Kim }
292e05df3b1SJaegeuk Kim 
293e05df3b1SJaegeuk Kim static void set_node_addr(struct f2fs_sb_info *sbi, struct node_info *ni,
294479f40c4SJaegeuk Kim 			block_t new_blkaddr, bool fsync_done)
295e05df3b1SJaegeuk Kim {
296e05df3b1SJaegeuk Kim 	struct f2fs_nm_info *nm_i = NM_I(sbi);
297e05df3b1SJaegeuk Kim 	struct nat_entry *e;
2989be32d72SJaegeuk Kim 
299b873b798SJaegeuk Kim 	down_write(&nm_i->nat_tree_lock);
300e05df3b1SJaegeuk Kim 	e = __lookup_nat_cache(nm_i, ni->nid);
301e05df3b1SJaegeuk Kim 	if (!e) {
3025c9e4184SChao Yu 		e = grab_nat_entry(nm_i, ni->nid, true);
3035c27f4eeSChao Yu 		copy_node_info(&e->ni, ni);
3049850cf4aSJaegeuk Kim 		f2fs_bug_on(sbi, ni->blk_addr == NEW_ADDR);
305e05df3b1SJaegeuk Kim 	} else if (new_blkaddr == NEW_ADDR) {
306e05df3b1SJaegeuk Kim 		/*
307e05df3b1SJaegeuk Kim 		 * when nid is reallocated,
308e05df3b1SJaegeuk Kim 		 * previous nat entry can be remained in nat cache.
309e05df3b1SJaegeuk Kim 		 * So, reinitialize it with new information.
310e05df3b1SJaegeuk Kim 		 */
3115c27f4eeSChao Yu 		copy_node_info(&e->ni, ni);
3129850cf4aSJaegeuk Kim 		f2fs_bug_on(sbi, ni->blk_addr != NULL_ADDR);
313e05df3b1SJaegeuk Kim 	}
314e05df3b1SJaegeuk Kim 
315e05df3b1SJaegeuk Kim 	/* sanity check */
3169850cf4aSJaegeuk Kim 	f2fs_bug_on(sbi, nat_get_blkaddr(e) != ni->blk_addr);
3179850cf4aSJaegeuk Kim 	f2fs_bug_on(sbi, nat_get_blkaddr(e) == NULL_ADDR &&
318e05df3b1SJaegeuk Kim 			new_blkaddr == NULL_ADDR);
3199850cf4aSJaegeuk Kim 	f2fs_bug_on(sbi, nat_get_blkaddr(e) == NEW_ADDR &&
320e05df3b1SJaegeuk Kim 			new_blkaddr == NEW_ADDR);
3219850cf4aSJaegeuk Kim 	f2fs_bug_on(sbi, nat_get_blkaddr(e) != NEW_ADDR &&
322e05df3b1SJaegeuk Kim 			nat_get_blkaddr(e) != NULL_ADDR &&
323e05df3b1SJaegeuk Kim 			new_blkaddr == NEW_ADDR);
324e05df3b1SJaegeuk Kim 
325e1c42045Sarter97 	/* increment version no as node is removed */
326e05df3b1SJaegeuk Kim 	if (nat_get_blkaddr(e) != NEW_ADDR && new_blkaddr == NULL_ADDR) {
327e05df3b1SJaegeuk Kim 		unsigned char version = nat_get_version(e);
328e05df3b1SJaegeuk Kim 		nat_set_version(e, inc_node_version(version));
32926834466SJaegeuk Kim 
33026834466SJaegeuk Kim 		/* in order to reuse the nid */
33126834466SJaegeuk Kim 		if (nm_i->next_scan_nid > ni->nid)
33226834466SJaegeuk Kim 			nm_i->next_scan_nid = ni->nid;
333e05df3b1SJaegeuk Kim 	}
334e05df3b1SJaegeuk Kim 
335e05df3b1SJaegeuk Kim 	/* change address */
336e05df3b1SJaegeuk Kim 	nat_set_blkaddr(e, new_blkaddr);
33788bd02c9SJaegeuk Kim 	if (new_blkaddr == NEW_ADDR || new_blkaddr == NULL_ADDR)
33888bd02c9SJaegeuk Kim 		set_nat_flag(e, IS_CHECKPOINTED, false);
339e05df3b1SJaegeuk Kim 	__set_nat_cache_dirty(nm_i, e);
340479f40c4SJaegeuk Kim 
341479f40c4SJaegeuk Kim 	/* update fsync_mark if its inode nat entry is still alive */
342d5b692b7SChao Yu 	if (ni->nid != ni->ino)
343479f40c4SJaegeuk Kim 		e = __lookup_nat_cache(nm_i, ni->ino);
34488bd02c9SJaegeuk Kim 	if (e) {
34588bd02c9SJaegeuk Kim 		if (fsync_done && ni->nid == ni->ino)
34688bd02c9SJaegeuk Kim 			set_nat_flag(e, HAS_FSYNCED_INODE, true);
34788bd02c9SJaegeuk Kim 		set_nat_flag(e, HAS_LAST_FSYNC, fsync_done);
34888bd02c9SJaegeuk Kim 	}
349b873b798SJaegeuk Kim 	up_write(&nm_i->nat_tree_lock);
350e05df3b1SJaegeuk Kim }
351e05df3b1SJaegeuk Kim 
3524660f9c0SJaegeuk Kim int try_to_free_nats(struct f2fs_sb_info *sbi, int nr_shrink)
353e05df3b1SJaegeuk Kim {
354e05df3b1SJaegeuk Kim 	struct f2fs_nm_info *nm_i = NM_I(sbi);
3551b38dc8eSJaegeuk Kim 	int nr = nr_shrink;
356e05df3b1SJaegeuk Kim 
357b873b798SJaegeuk Kim 	if (!down_write_trylock(&nm_i->nat_tree_lock))
358b873b798SJaegeuk Kim 		return 0;
359e05df3b1SJaegeuk Kim 
360e05df3b1SJaegeuk Kim 	while (nr_shrink && !list_empty(&nm_i->nat_entries)) {
361e05df3b1SJaegeuk Kim 		struct nat_entry *ne;
362e05df3b1SJaegeuk Kim 		ne = list_first_entry(&nm_i->nat_entries,
363e05df3b1SJaegeuk Kim 					struct nat_entry, list);
364e05df3b1SJaegeuk Kim 		__del_from_nat_cache(nm_i, ne);
365e05df3b1SJaegeuk Kim 		nr_shrink--;
366e05df3b1SJaegeuk Kim 	}
367b873b798SJaegeuk Kim 	up_write(&nm_i->nat_tree_lock);
3681b38dc8eSJaegeuk Kim 	return nr - nr_shrink;
369e05df3b1SJaegeuk Kim }
370e05df3b1SJaegeuk Kim 
3710a8165d7SJaegeuk Kim /*
372e1c42045Sarter97  * This function always returns success
373e05df3b1SJaegeuk Kim  */
374e05df3b1SJaegeuk Kim void get_node_info(struct f2fs_sb_info *sbi, nid_t nid, struct node_info *ni)
375e05df3b1SJaegeuk Kim {
376e05df3b1SJaegeuk Kim 	struct f2fs_nm_info *nm_i = NM_I(sbi);
377e05df3b1SJaegeuk Kim 	struct curseg_info *curseg = CURSEG_I(sbi, CURSEG_HOT_DATA);
378b7ad7512SChao Yu 	struct f2fs_journal *journal = curseg->journal;
379e05df3b1SJaegeuk Kim 	nid_t start_nid = START_NID(nid);
380e05df3b1SJaegeuk Kim 	struct f2fs_nat_block *nat_blk;
381e05df3b1SJaegeuk Kim 	struct page *page = NULL;
382e05df3b1SJaegeuk Kim 	struct f2fs_nat_entry ne;
383e05df3b1SJaegeuk Kim 	struct nat_entry *e;
38466a82d1fSYunlei He 	pgoff_t index;
385e05df3b1SJaegeuk Kim 	int i;
386e05df3b1SJaegeuk Kim 
387e05df3b1SJaegeuk Kim 	ni->nid = nid;
388e05df3b1SJaegeuk Kim 
389e05df3b1SJaegeuk Kim 	/* Check nat cache */
390b873b798SJaegeuk Kim 	down_read(&nm_i->nat_tree_lock);
391e05df3b1SJaegeuk Kim 	e = __lookup_nat_cache(nm_i, nid);
392e05df3b1SJaegeuk Kim 	if (e) {
393e05df3b1SJaegeuk Kim 		ni->ino = nat_get_ino(e);
394e05df3b1SJaegeuk Kim 		ni->blk_addr = nat_get_blkaddr(e);
395e05df3b1SJaegeuk Kim 		ni->version = nat_get_version(e);
396b873b798SJaegeuk Kim 		up_read(&nm_i->nat_tree_lock);
397e05df3b1SJaegeuk Kim 		return;
3981515aef0SChao Yu 	}
399e05df3b1SJaegeuk Kim 
4003547ea96SJaegeuk Kim 	memset(&ne, 0, sizeof(struct f2fs_nat_entry));
4013547ea96SJaegeuk Kim 
402e05df3b1SJaegeuk Kim 	/* Check current segment summary */
403b7ad7512SChao Yu 	down_read(&curseg->journal_rwsem);
404dfc08a12SChao Yu 	i = lookup_journal_in_cursum(journal, NAT_JOURNAL, nid, 0);
405e05df3b1SJaegeuk Kim 	if (i >= 0) {
406dfc08a12SChao Yu 		ne = nat_in_journal(journal, i);
407e05df3b1SJaegeuk Kim 		node_info_from_raw_nat(ni, &ne);
408e05df3b1SJaegeuk Kim 	}
409b7ad7512SChao Yu 	up_read(&curseg->journal_rwsem);
41066a82d1fSYunlei He 	if (i >= 0) {
41166a82d1fSYunlei He 		up_read(&nm_i->nat_tree_lock);
412e05df3b1SJaegeuk Kim 		goto cache;
41366a82d1fSYunlei He 	}
414e05df3b1SJaegeuk Kim 
415e05df3b1SJaegeuk Kim 	/* Fill node_info from nat page */
41666a82d1fSYunlei He 	index = current_nat_addr(sbi, nid);
41766a82d1fSYunlei He 	up_read(&nm_i->nat_tree_lock);
41866a82d1fSYunlei He 
41966a82d1fSYunlei He 	page = get_meta_page(sbi, index);
420e05df3b1SJaegeuk Kim 	nat_blk = (struct f2fs_nat_block *)page_address(page);
421e05df3b1SJaegeuk Kim 	ne = nat_blk->entries[nid - start_nid];
422e05df3b1SJaegeuk Kim 	node_info_from_raw_nat(ni, &ne);
423e05df3b1SJaegeuk Kim 	f2fs_put_page(page, 1);
424e05df3b1SJaegeuk Kim cache:
425e05df3b1SJaegeuk Kim 	/* cache nat entry */
426b873b798SJaegeuk Kim 	down_write(&nm_i->nat_tree_lock);
4271515aef0SChao Yu 	cache_nat_entry(sbi, nid, &ne);
428b873b798SJaegeuk Kim 	up_write(&nm_i->nat_tree_lock);
429e05df3b1SJaegeuk Kim }
430e05df3b1SJaegeuk Kim 
43179344efbSJaegeuk Kim /*
43279344efbSJaegeuk Kim  * readahead MAX_RA_NODE number of node pages.
43379344efbSJaegeuk Kim  */
43479344efbSJaegeuk Kim static void ra_node_pages(struct page *parent, int start, int n)
43579344efbSJaegeuk Kim {
43679344efbSJaegeuk Kim 	struct f2fs_sb_info *sbi = F2FS_P_SB(parent);
43779344efbSJaegeuk Kim 	struct blk_plug plug;
43879344efbSJaegeuk Kim 	int i, end;
43979344efbSJaegeuk Kim 	nid_t nid;
44079344efbSJaegeuk Kim 
44179344efbSJaegeuk Kim 	blk_start_plug(&plug);
44279344efbSJaegeuk Kim 
44379344efbSJaegeuk Kim 	/* Then, try readahead for siblings of the desired node */
44479344efbSJaegeuk Kim 	end = start + n;
44579344efbSJaegeuk Kim 	end = min(end, NIDS_PER_BLOCK);
44679344efbSJaegeuk Kim 	for (i = start; i < end; i++) {
44779344efbSJaegeuk Kim 		nid = get_nid(parent, i, false);
44879344efbSJaegeuk Kim 		ra_node_page(sbi, nid);
44979344efbSJaegeuk Kim 	}
45079344efbSJaegeuk Kim 
45179344efbSJaegeuk Kim 	blk_finish_plug(&plug);
45279344efbSJaegeuk Kim }
45379344efbSJaegeuk Kim 
4543cf45747SChao Yu pgoff_t get_next_page_offset(struct dnode_of_data *dn, pgoff_t pgofs)
4553cf45747SChao Yu {
4563cf45747SChao Yu 	const long direct_index = ADDRS_PER_INODE(dn->inode);
4573cf45747SChao Yu 	const long direct_blks = ADDRS_PER_BLOCK;
4583cf45747SChao Yu 	const long indirect_blks = ADDRS_PER_BLOCK * NIDS_PER_BLOCK;
4593cf45747SChao Yu 	unsigned int skipped_unit = ADDRS_PER_BLOCK;
4603cf45747SChao Yu 	int cur_level = dn->cur_level;
4613cf45747SChao Yu 	int max_level = dn->max_level;
4623cf45747SChao Yu 	pgoff_t base = 0;
4633cf45747SChao Yu 
4643cf45747SChao Yu 	if (!dn->max_level)
4653cf45747SChao Yu 		return pgofs + 1;
4663cf45747SChao Yu 
4673cf45747SChao Yu 	while (max_level-- > cur_level)
4683cf45747SChao Yu 		skipped_unit *= NIDS_PER_BLOCK;
4693cf45747SChao Yu 
4703cf45747SChao Yu 	switch (dn->max_level) {
4713cf45747SChao Yu 	case 3:
4723cf45747SChao Yu 		base += 2 * indirect_blks;
4733cf45747SChao Yu 	case 2:
4743cf45747SChao Yu 		base += 2 * direct_blks;
4753cf45747SChao Yu 	case 1:
4763cf45747SChao Yu 		base += direct_index;
4773cf45747SChao Yu 		break;
4783cf45747SChao Yu 	default:
4793cf45747SChao Yu 		f2fs_bug_on(F2FS_I_SB(dn->inode), 1);
4803cf45747SChao Yu 	}
4813cf45747SChao Yu 
4823cf45747SChao Yu 	return ((pgofs - base) / skipped_unit + 1) * skipped_unit + base;
4833cf45747SChao Yu }
4843cf45747SChao Yu 
4850a8165d7SJaegeuk Kim /*
486e05df3b1SJaegeuk Kim  * The maximum depth is four.
487e05df3b1SJaegeuk Kim  * Offset[0] will have raw inode offset.
488e05df3b1SJaegeuk Kim  */
48981ca7350SChao Yu static int get_node_path(struct inode *inode, long block,
490de93653fSJaegeuk Kim 				int offset[4], unsigned int noffset[4])
491e05df3b1SJaegeuk Kim {
49281ca7350SChao Yu 	const long direct_index = ADDRS_PER_INODE(inode);
493e05df3b1SJaegeuk Kim 	const long direct_blks = ADDRS_PER_BLOCK;
494e05df3b1SJaegeuk Kim 	const long dptrs_per_blk = NIDS_PER_BLOCK;
495e05df3b1SJaegeuk Kim 	const long indirect_blks = ADDRS_PER_BLOCK * NIDS_PER_BLOCK;
496e05df3b1SJaegeuk Kim 	const long dindirect_blks = indirect_blks * NIDS_PER_BLOCK;
497e05df3b1SJaegeuk Kim 	int n = 0;
498e05df3b1SJaegeuk Kim 	int level = 0;
499e05df3b1SJaegeuk Kim 
500e05df3b1SJaegeuk Kim 	noffset[0] = 0;
501e05df3b1SJaegeuk Kim 
502e05df3b1SJaegeuk Kim 	if (block < direct_index) {
50325c0a6e5SNamjae Jeon 		offset[n] = block;
504e05df3b1SJaegeuk Kim 		goto got;
505e05df3b1SJaegeuk Kim 	}
506e05df3b1SJaegeuk Kim 	block -= direct_index;
507e05df3b1SJaegeuk Kim 	if (block < direct_blks) {
508e05df3b1SJaegeuk Kim 		offset[n++] = NODE_DIR1_BLOCK;
509e05df3b1SJaegeuk Kim 		noffset[n] = 1;
51025c0a6e5SNamjae Jeon 		offset[n] = block;
511e05df3b1SJaegeuk Kim 		level = 1;
512e05df3b1SJaegeuk Kim 		goto got;
513e05df3b1SJaegeuk Kim 	}
514e05df3b1SJaegeuk Kim 	block -= direct_blks;
515e05df3b1SJaegeuk Kim 	if (block < direct_blks) {
516e05df3b1SJaegeuk Kim 		offset[n++] = NODE_DIR2_BLOCK;
517e05df3b1SJaegeuk Kim 		noffset[n] = 2;
51825c0a6e5SNamjae Jeon 		offset[n] = block;
519e05df3b1SJaegeuk Kim 		level = 1;
520e05df3b1SJaegeuk Kim 		goto got;
521e05df3b1SJaegeuk Kim 	}
522e05df3b1SJaegeuk Kim 	block -= direct_blks;
523e05df3b1SJaegeuk Kim 	if (block < indirect_blks) {
524e05df3b1SJaegeuk Kim 		offset[n++] = NODE_IND1_BLOCK;
525e05df3b1SJaegeuk Kim 		noffset[n] = 3;
526e05df3b1SJaegeuk Kim 		offset[n++] = block / direct_blks;
527e05df3b1SJaegeuk Kim 		noffset[n] = 4 + offset[n - 1];
52825c0a6e5SNamjae Jeon 		offset[n] = block % direct_blks;
529e05df3b1SJaegeuk Kim 		level = 2;
530e05df3b1SJaegeuk Kim 		goto got;
531e05df3b1SJaegeuk Kim 	}
532e05df3b1SJaegeuk Kim 	block -= indirect_blks;
533e05df3b1SJaegeuk Kim 	if (block < indirect_blks) {
534e05df3b1SJaegeuk Kim 		offset[n++] = NODE_IND2_BLOCK;
535e05df3b1SJaegeuk Kim 		noffset[n] = 4 + dptrs_per_blk;
536e05df3b1SJaegeuk Kim 		offset[n++] = block / direct_blks;
537e05df3b1SJaegeuk Kim 		noffset[n] = 5 + dptrs_per_blk + offset[n - 1];
53825c0a6e5SNamjae Jeon 		offset[n] = block % direct_blks;
539e05df3b1SJaegeuk Kim 		level = 2;
540e05df3b1SJaegeuk Kim 		goto got;
541e05df3b1SJaegeuk Kim 	}
542e05df3b1SJaegeuk Kim 	block -= indirect_blks;
543e05df3b1SJaegeuk Kim 	if (block < dindirect_blks) {
544e05df3b1SJaegeuk Kim 		offset[n++] = NODE_DIND_BLOCK;
545e05df3b1SJaegeuk Kim 		noffset[n] = 5 + (dptrs_per_blk * 2);
546e05df3b1SJaegeuk Kim 		offset[n++] = block / indirect_blks;
547e05df3b1SJaegeuk Kim 		noffset[n] = 6 + (dptrs_per_blk * 2) +
548e05df3b1SJaegeuk Kim 			      offset[n - 1] * (dptrs_per_blk + 1);
549e05df3b1SJaegeuk Kim 		offset[n++] = (block / direct_blks) % dptrs_per_blk;
550e05df3b1SJaegeuk Kim 		noffset[n] = 7 + (dptrs_per_blk * 2) +
551e05df3b1SJaegeuk Kim 			      offset[n - 2] * (dptrs_per_blk + 1) +
552e05df3b1SJaegeuk Kim 			      offset[n - 1];
55325c0a6e5SNamjae Jeon 		offset[n] = block % direct_blks;
554e05df3b1SJaegeuk Kim 		level = 3;
555e05df3b1SJaegeuk Kim 		goto got;
556e05df3b1SJaegeuk Kim 	} else {
557e05df3b1SJaegeuk Kim 		BUG();
558e05df3b1SJaegeuk Kim 	}
559e05df3b1SJaegeuk Kim got:
560e05df3b1SJaegeuk Kim 	return level;
561e05df3b1SJaegeuk Kim }
562e05df3b1SJaegeuk Kim 
563e05df3b1SJaegeuk Kim /*
564e05df3b1SJaegeuk Kim  * Caller should call f2fs_put_dnode(dn).
5654f4124d0SChao Yu  * Also, it should grab and release a rwsem by calling f2fs_lock_op() and
5664f4124d0SChao Yu  * f2fs_unlock_op() only if ro is not set RDONLY_NODE.
56739936837SJaegeuk Kim  * In the case of RDONLY_NODE, we don't need to care about mutex.
568e05df3b1SJaegeuk Kim  */
569266e97a8SJaegeuk Kim int get_dnode_of_data(struct dnode_of_data *dn, pgoff_t index, int mode)
570e05df3b1SJaegeuk Kim {
5714081363fSJaegeuk Kim 	struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode);
572e05df3b1SJaegeuk Kim 	struct page *npage[4];
573f1a3b98eSJaegeuk Kim 	struct page *parent = NULL;
574e05df3b1SJaegeuk Kim 	int offset[4];
575e05df3b1SJaegeuk Kim 	unsigned int noffset[4];
576e05df3b1SJaegeuk Kim 	nid_t nids[4];
5773cf45747SChao Yu 	int level, i = 0;
578e05df3b1SJaegeuk Kim 	int err = 0;
579e05df3b1SJaegeuk Kim 
58081ca7350SChao Yu 	level = get_node_path(dn->inode, index, offset, noffset);
581e05df3b1SJaegeuk Kim 
582e05df3b1SJaegeuk Kim 	nids[0] = dn->inode->i_ino;
5831646cfacSJaegeuk Kim 	npage[0] = dn->inode_page;
5841646cfacSJaegeuk Kim 
5851646cfacSJaegeuk Kim 	if (!npage[0]) {
586e05df3b1SJaegeuk Kim 		npage[0] = get_node_page(sbi, nids[0]);
587e05df3b1SJaegeuk Kim 		if (IS_ERR(npage[0]))
588e05df3b1SJaegeuk Kim 			return PTR_ERR(npage[0]);
5891646cfacSJaegeuk Kim 	}
590f1a3b98eSJaegeuk Kim 
591f1a3b98eSJaegeuk Kim 	/* if inline_data is set, should not report any block indices */
592f1a3b98eSJaegeuk Kim 	if (f2fs_has_inline_data(dn->inode) && index) {
59376629165SJaegeuk Kim 		err = -ENOENT;
594f1a3b98eSJaegeuk Kim 		f2fs_put_page(npage[0], 1);
595f1a3b98eSJaegeuk Kim 		goto release_out;
596f1a3b98eSJaegeuk Kim 	}
597f1a3b98eSJaegeuk Kim 
598e05df3b1SJaegeuk Kim 	parent = npage[0];
59952c2db3fSChangman Lee 	if (level != 0)
600e05df3b1SJaegeuk Kim 		nids[1] = get_nid(parent, offset[0], true);
601e05df3b1SJaegeuk Kim 	dn->inode_page = npage[0];
602e05df3b1SJaegeuk Kim 	dn->inode_page_locked = true;
603e05df3b1SJaegeuk Kim 
604e05df3b1SJaegeuk Kim 	/* get indirect or direct nodes */
605e05df3b1SJaegeuk Kim 	for (i = 1; i <= level; i++) {
606e05df3b1SJaegeuk Kim 		bool done = false;
607e05df3b1SJaegeuk Kim 
608266e97a8SJaegeuk Kim 		if (!nids[i] && mode == ALLOC_NODE) {
609e05df3b1SJaegeuk Kim 			/* alloc new node */
610e05df3b1SJaegeuk Kim 			if (!alloc_nid(sbi, &(nids[i]))) {
611e05df3b1SJaegeuk Kim 				err = -ENOSPC;
612e05df3b1SJaegeuk Kim 				goto release_pages;
613e05df3b1SJaegeuk Kim 			}
614e05df3b1SJaegeuk Kim 
615e05df3b1SJaegeuk Kim 			dn->nid = nids[i];
6168ae8f162SJaegeuk Kim 			npage[i] = new_node_page(dn, noffset[i], NULL);
617e05df3b1SJaegeuk Kim 			if (IS_ERR(npage[i])) {
618e05df3b1SJaegeuk Kim 				alloc_nid_failed(sbi, nids[i]);
619e05df3b1SJaegeuk Kim 				err = PTR_ERR(npage[i]);
620e05df3b1SJaegeuk Kim 				goto release_pages;
621e05df3b1SJaegeuk Kim 			}
622e05df3b1SJaegeuk Kim 
623e05df3b1SJaegeuk Kim 			set_nid(parent, offset[i - 1], nids[i], i == 1);
624e05df3b1SJaegeuk Kim 			alloc_nid_done(sbi, nids[i]);
625e05df3b1SJaegeuk Kim 			done = true;
626266e97a8SJaegeuk Kim 		} else if (mode == LOOKUP_NODE_RA && i == level && level > 1) {
627e05df3b1SJaegeuk Kim 			npage[i] = get_node_page_ra(parent, offset[i - 1]);
628e05df3b1SJaegeuk Kim 			if (IS_ERR(npage[i])) {
629e05df3b1SJaegeuk Kim 				err = PTR_ERR(npage[i]);
630e05df3b1SJaegeuk Kim 				goto release_pages;
631e05df3b1SJaegeuk Kim 			}
632e05df3b1SJaegeuk Kim 			done = true;
633e05df3b1SJaegeuk Kim 		}
634e05df3b1SJaegeuk Kim 		if (i == 1) {
635e05df3b1SJaegeuk Kim 			dn->inode_page_locked = false;
636e05df3b1SJaegeuk Kim 			unlock_page(parent);
637e05df3b1SJaegeuk Kim 		} else {
638e05df3b1SJaegeuk Kim 			f2fs_put_page(parent, 1);
639e05df3b1SJaegeuk Kim 		}
640e05df3b1SJaegeuk Kim 
641e05df3b1SJaegeuk Kim 		if (!done) {
642e05df3b1SJaegeuk Kim 			npage[i] = get_node_page(sbi, nids[i]);
643e05df3b1SJaegeuk Kim 			if (IS_ERR(npage[i])) {
644e05df3b1SJaegeuk Kim 				err = PTR_ERR(npage[i]);
645e05df3b1SJaegeuk Kim 				f2fs_put_page(npage[0], 0);
646e05df3b1SJaegeuk Kim 				goto release_out;
647e05df3b1SJaegeuk Kim 			}
648e05df3b1SJaegeuk Kim 		}
649e05df3b1SJaegeuk Kim 		if (i < level) {
650e05df3b1SJaegeuk Kim 			parent = npage[i];
651e05df3b1SJaegeuk Kim 			nids[i + 1] = get_nid(parent, offset[i], false);
652e05df3b1SJaegeuk Kim 		}
653e05df3b1SJaegeuk Kim 	}
654e05df3b1SJaegeuk Kim 	dn->nid = nids[level];
655e05df3b1SJaegeuk Kim 	dn->ofs_in_node = offset[level];
656e05df3b1SJaegeuk Kim 	dn->node_page = npage[level];
657e05df3b1SJaegeuk Kim 	dn->data_blkaddr = datablock_addr(dn->node_page, dn->ofs_in_node);
658e05df3b1SJaegeuk Kim 	return 0;
659e05df3b1SJaegeuk Kim 
660e05df3b1SJaegeuk Kim release_pages:
661e05df3b1SJaegeuk Kim 	f2fs_put_page(parent, 1);
662e05df3b1SJaegeuk Kim 	if (i > 1)
663e05df3b1SJaegeuk Kim 		f2fs_put_page(npage[0], 0);
664e05df3b1SJaegeuk Kim release_out:
665e05df3b1SJaegeuk Kim 	dn->inode_page = NULL;
666e05df3b1SJaegeuk Kim 	dn->node_page = NULL;
6673cf45747SChao Yu 	if (err == -ENOENT) {
6683cf45747SChao Yu 		dn->cur_level = i;
6693cf45747SChao Yu 		dn->max_level = level;
6700a2aa8fbSJaegeuk Kim 		dn->ofs_in_node = offset[level];
6713cf45747SChao Yu 	}
672e05df3b1SJaegeuk Kim 	return err;
673e05df3b1SJaegeuk Kim }
674e05df3b1SJaegeuk Kim 
675e05df3b1SJaegeuk Kim static void truncate_node(struct dnode_of_data *dn)
676e05df3b1SJaegeuk Kim {
6774081363fSJaegeuk Kim 	struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode);
678e05df3b1SJaegeuk Kim 	struct node_info ni;
679e05df3b1SJaegeuk Kim 
680e05df3b1SJaegeuk Kim 	get_node_info(sbi, dn->nid, &ni);
68171e9fec5SJaegeuk Kim 	if (dn->inode->i_blocks == 0) {
6829850cf4aSJaegeuk Kim 		f2fs_bug_on(sbi, ni.blk_addr != NULL_ADDR);
68371e9fec5SJaegeuk Kim 		goto invalidate;
68471e9fec5SJaegeuk Kim 	}
6859850cf4aSJaegeuk Kim 	f2fs_bug_on(sbi, ni.blk_addr == NULL_ADDR);
686e05df3b1SJaegeuk Kim 
687e05df3b1SJaegeuk Kim 	/* Deallocate node address */
68871e9fec5SJaegeuk Kim 	invalidate_blocks(sbi, ni.blk_addr);
689ef86d709SGu Zheng 	dec_valid_node_count(sbi, dn->inode);
690479f40c4SJaegeuk Kim 	set_node_addr(sbi, &ni, NULL_ADDR, false);
691e05df3b1SJaegeuk Kim 
692e05df3b1SJaegeuk Kim 	if (dn->nid == dn->inode->i_ino) {
693e05df3b1SJaegeuk Kim 		remove_orphan_inode(sbi, dn->nid);
694e05df3b1SJaegeuk Kim 		dec_valid_inode_count(sbi);
6950f18b462SJaegeuk Kim 		f2fs_inode_synced(dn->inode);
696e05df3b1SJaegeuk Kim 	}
69771e9fec5SJaegeuk Kim invalidate:
698e05df3b1SJaegeuk Kim 	clear_node_page_dirty(dn->node_page);
699caf0047eSChao Yu 	set_sbi_flag(sbi, SBI_IS_DIRTY);
700e05df3b1SJaegeuk Kim 
701e05df3b1SJaegeuk Kim 	f2fs_put_page(dn->node_page, 1);
702bf39c00aSJaegeuk Kim 
703bf39c00aSJaegeuk Kim 	invalidate_mapping_pages(NODE_MAPPING(sbi),
704bf39c00aSJaegeuk Kim 			dn->node_page->index, dn->node_page->index);
705bf39c00aSJaegeuk Kim 
706e05df3b1SJaegeuk Kim 	dn->node_page = NULL;
70751dd6249SNamjae Jeon 	trace_f2fs_truncate_node(dn->inode, dn->nid, ni.blk_addr);
708e05df3b1SJaegeuk Kim }
709e05df3b1SJaegeuk Kim 
710e05df3b1SJaegeuk Kim static int truncate_dnode(struct dnode_of_data *dn)
711e05df3b1SJaegeuk Kim {
712e05df3b1SJaegeuk Kim 	struct page *page;
713e05df3b1SJaegeuk Kim 
714e05df3b1SJaegeuk Kim 	if (dn->nid == 0)
715e05df3b1SJaegeuk Kim 		return 1;
716e05df3b1SJaegeuk Kim 
717e05df3b1SJaegeuk Kim 	/* get direct node */
7184081363fSJaegeuk Kim 	page = get_node_page(F2FS_I_SB(dn->inode), dn->nid);
719e05df3b1SJaegeuk Kim 	if (IS_ERR(page) && PTR_ERR(page) == -ENOENT)
720e05df3b1SJaegeuk Kim 		return 1;
721e05df3b1SJaegeuk Kim 	else if (IS_ERR(page))
722e05df3b1SJaegeuk Kim 		return PTR_ERR(page);
723e05df3b1SJaegeuk Kim 
724e05df3b1SJaegeuk Kim 	/* Make dnode_of_data for parameter */
725e05df3b1SJaegeuk Kim 	dn->node_page = page;
726e05df3b1SJaegeuk Kim 	dn->ofs_in_node = 0;
727e05df3b1SJaegeuk Kim 	truncate_data_blocks(dn);
728e05df3b1SJaegeuk Kim 	truncate_node(dn);
729e05df3b1SJaegeuk Kim 	return 1;
730e05df3b1SJaegeuk Kim }
731e05df3b1SJaegeuk Kim 
732e05df3b1SJaegeuk Kim static int truncate_nodes(struct dnode_of_data *dn, unsigned int nofs,
733e05df3b1SJaegeuk Kim 						int ofs, int depth)
734e05df3b1SJaegeuk Kim {
735e05df3b1SJaegeuk Kim 	struct dnode_of_data rdn = *dn;
736e05df3b1SJaegeuk Kim 	struct page *page;
737e05df3b1SJaegeuk Kim 	struct f2fs_node *rn;
738e05df3b1SJaegeuk Kim 	nid_t child_nid;
739e05df3b1SJaegeuk Kim 	unsigned int child_nofs;
740e05df3b1SJaegeuk Kim 	int freed = 0;
741e05df3b1SJaegeuk Kim 	int i, ret;
742e05df3b1SJaegeuk Kim 
743e05df3b1SJaegeuk Kim 	if (dn->nid == 0)
744e05df3b1SJaegeuk Kim 		return NIDS_PER_BLOCK + 1;
745e05df3b1SJaegeuk Kim 
74651dd6249SNamjae Jeon 	trace_f2fs_truncate_nodes_enter(dn->inode, dn->nid, dn->data_blkaddr);
74751dd6249SNamjae Jeon 
7484081363fSJaegeuk Kim 	page = get_node_page(F2FS_I_SB(dn->inode), dn->nid);
74951dd6249SNamjae Jeon 	if (IS_ERR(page)) {
75051dd6249SNamjae Jeon 		trace_f2fs_truncate_nodes_exit(dn->inode, PTR_ERR(page));
751e05df3b1SJaegeuk Kim 		return PTR_ERR(page);
75251dd6249SNamjae Jeon 	}
753e05df3b1SJaegeuk Kim 
75479344efbSJaegeuk Kim 	ra_node_pages(page, ofs, NIDS_PER_BLOCK);
75579344efbSJaegeuk Kim 
75645590710SGu Zheng 	rn = F2FS_NODE(page);
757e05df3b1SJaegeuk Kim 	if (depth < 3) {
758e05df3b1SJaegeuk Kim 		for (i = ofs; i < NIDS_PER_BLOCK; i++, freed++) {
759e05df3b1SJaegeuk Kim 			child_nid = le32_to_cpu(rn->in.nid[i]);
760e05df3b1SJaegeuk Kim 			if (child_nid == 0)
761e05df3b1SJaegeuk Kim 				continue;
762e05df3b1SJaegeuk Kim 			rdn.nid = child_nid;
763e05df3b1SJaegeuk Kim 			ret = truncate_dnode(&rdn);
764e05df3b1SJaegeuk Kim 			if (ret < 0)
765e05df3b1SJaegeuk Kim 				goto out_err;
76612719ae1SJaegeuk Kim 			if (set_nid(page, i, 0, false))
76793bae099SJaegeuk Kim 				dn->node_changed = true;
768e05df3b1SJaegeuk Kim 		}
769e05df3b1SJaegeuk Kim 	} else {
770e05df3b1SJaegeuk Kim 		child_nofs = nofs + ofs * (NIDS_PER_BLOCK + 1) + 1;
771e05df3b1SJaegeuk Kim 		for (i = ofs; i < NIDS_PER_BLOCK; i++) {
772e05df3b1SJaegeuk Kim 			child_nid = le32_to_cpu(rn->in.nid[i]);
773e05df3b1SJaegeuk Kim 			if (child_nid == 0) {
774e05df3b1SJaegeuk Kim 				child_nofs += NIDS_PER_BLOCK + 1;
775e05df3b1SJaegeuk Kim 				continue;
776e05df3b1SJaegeuk Kim 			}
777e05df3b1SJaegeuk Kim 			rdn.nid = child_nid;
778e05df3b1SJaegeuk Kim 			ret = truncate_nodes(&rdn, child_nofs, 0, depth - 1);
779e05df3b1SJaegeuk Kim 			if (ret == (NIDS_PER_BLOCK + 1)) {
78012719ae1SJaegeuk Kim 				if (set_nid(page, i, 0, false))
78193bae099SJaegeuk Kim 					dn->node_changed = true;
782e05df3b1SJaegeuk Kim 				child_nofs += ret;
783e05df3b1SJaegeuk Kim 			} else if (ret < 0 && ret != -ENOENT) {
784e05df3b1SJaegeuk Kim 				goto out_err;
785e05df3b1SJaegeuk Kim 			}
786e05df3b1SJaegeuk Kim 		}
787e05df3b1SJaegeuk Kim 		freed = child_nofs;
788e05df3b1SJaegeuk Kim 	}
789e05df3b1SJaegeuk Kim 
790e05df3b1SJaegeuk Kim 	if (!ofs) {
791e05df3b1SJaegeuk Kim 		/* remove current indirect node */
792e05df3b1SJaegeuk Kim 		dn->node_page = page;
793e05df3b1SJaegeuk Kim 		truncate_node(dn);
794e05df3b1SJaegeuk Kim 		freed++;
795e05df3b1SJaegeuk Kim 	} else {
796e05df3b1SJaegeuk Kim 		f2fs_put_page(page, 1);
797e05df3b1SJaegeuk Kim 	}
79851dd6249SNamjae Jeon 	trace_f2fs_truncate_nodes_exit(dn->inode, freed);
799e05df3b1SJaegeuk Kim 	return freed;
800e05df3b1SJaegeuk Kim 
801e05df3b1SJaegeuk Kim out_err:
802e05df3b1SJaegeuk Kim 	f2fs_put_page(page, 1);
80351dd6249SNamjae Jeon 	trace_f2fs_truncate_nodes_exit(dn->inode, ret);
804e05df3b1SJaegeuk Kim 	return ret;
805e05df3b1SJaegeuk Kim }
806e05df3b1SJaegeuk Kim 
807e05df3b1SJaegeuk Kim static int truncate_partial_nodes(struct dnode_of_data *dn,
808e05df3b1SJaegeuk Kim 			struct f2fs_inode *ri, int *offset, int depth)
809e05df3b1SJaegeuk Kim {
810e05df3b1SJaegeuk Kim 	struct page *pages[2];
811e05df3b1SJaegeuk Kim 	nid_t nid[3];
812e05df3b1SJaegeuk Kim 	nid_t child_nid;
813e05df3b1SJaegeuk Kim 	int err = 0;
814e05df3b1SJaegeuk Kim 	int i;
815e05df3b1SJaegeuk Kim 	int idx = depth - 2;
816e05df3b1SJaegeuk Kim 
817e05df3b1SJaegeuk Kim 	nid[0] = le32_to_cpu(ri->i_nid[offset[0] - NODE_DIR1_BLOCK]);
818e05df3b1SJaegeuk Kim 	if (!nid[0])
819e05df3b1SJaegeuk Kim 		return 0;
820e05df3b1SJaegeuk Kim 
821e05df3b1SJaegeuk Kim 	/* get indirect nodes in the path */
822a225dca3Sshifei10.ge 	for (i = 0; i < idx + 1; i++) {
823e1c42045Sarter97 		/* reference count'll be increased */
8244081363fSJaegeuk Kim 		pages[i] = get_node_page(F2FS_I_SB(dn->inode), nid[i]);
825e05df3b1SJaegeuk Kim 		if (IS_ERR(pages[i])) {
826e05df3b1SJaegeuk Kim 			err = PTR_ERR(pages[i]);
827a225dca3Sshifei10.ge 			idx = i - 1;
828e05df3b1SJaegeuk Kim 			goto fail;
829e05df3b1SJaegeuk Kim 		}
830e05df3b1SJaegeuk Kim 		nid[i + 1] = get_nid(pages[i], offset[i + 1], false);
831e05df3b1SJaegeuk Kim 	}
832e05df3b1SJaegeuk Kim 
83379344efbSJaegeuk Kim 	ra_node_pages(pages[idx], offset[idx + 1], NIDS_PER_BLOCK);
83479344efbSJaegeuk Kim 
835e05df3b1SJaegeuk Kim 	/* free direct nodes linked to a partial indirect node */
836a225dca3Sshifei10.ge 	for (i = offset[idx + 1]; i < NIDS_PER_BLOCK; i++) {
837e05df3b1SJaegeuk Kim 		child_nid = get_nid(pages[idx], i, false);
838e05df3b1SJaegeuk Kim 		if (!child_nid)
839e05df3b1SJaegeuk Kim 			continue;
840e05df3b1SJaegeuk Kim 		dn->nid = child_nid;
841e05df3b1SJaegeuk Kim 		err = truncate_dnode(dn);
842e05df3b1SJaegeuk Kim 		if (err < 0)
843e05df3b1SJaegeuk Kim 			goto fail;
84412719ae1SJaegeuk Kim 		if (set_nid(pages[idx], i, 0, false))
84593bae099SJaegeuk Kim 			dn->node_changed = true;
846e05df3b1SJaegeuk Kim 	}
847e05df3b1SJaegeuk Kim 
848a225dca3Sshifei10.ge 	if (offset[idx + 1] == 0) {
849e05df3b1SJaegeuk Kim 		dn->node_page = pages[idx];
850e05df3b1SJaegeuk Kim 		dn->nid = nid[idx];
851e05df3b1SJaegeuk Kim 		truncate_node(dn);
852e05df3b1SJaegeuk Kim 	} else {
853e05df3b1SJaegeuk Kim 		f2fs_put_page(pages[idx], 1);
854e05df3b1SJaegeuk Kim 	}
855e05df3b1SJaegeuk Kim 	offset[idx]++;
856a225dca3Sshifei10.ge 	offset[idx + 1] = 0;
857a225dca3Sshifei10.ge 	idx--;
858e05df3b1SJaegeuk Kim fail:
859a225dca3Sshifei10.ge 	for (i = idx; i >= 0; i--)
860e05df3b1SJaegeuk Kim 		f2fs_put_page(pages[i], 1);
86151dd6249SNamjae Jeon 
86251dd6249SNamjae Jeon 	trace_f2fs_truncate_partial_nodes(dn->inode, nid, depth, err);
86351dd6249SNamjae Jeon 
864e05df3b1SJaegeuk Kim 	return err;
865e05df3b1SJaegeuk Kim }
866e05df3b1SJaegeuk Kim 
8670a8165d7SJaegeuk Kim /*
868e05df3b1SJaegeuk Kim  * All the block addresses of data and nodes should be nullified.
869e05df3b1SJaegeuk Kim  */
870e05df3b1SJaegeuk Kim int truncate_inode_blocks(struct inode *inode, pgoff_t from)
871e05df3b1SJaegeuk Kim {
8724081363fSJaegeuk Kim 	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
873e05df3b1SJaegeuk Kim 	int err = 0, cont = 1;
874e05df3b1SJaegeuk Kim 	int level, offset[4], noffset[4];
8757dd690c8SJaegeuk Kim 	unsigned int nofs = 0;
87658bfaf44SJaegeuk Kim 	struct f2fs_inode *ri;
877e05df3b1SJaegeuk Kim 	struct dnode_of_data dn;
878e05df3b1SJaegeuk Kim 	struct page *page;
879e05df3b1SJaegeuk Kim 
88051dd6249SNamjae Jeon 	trace_f2fs_truncate_inode_blocks_enter(inode, from);
88151dd6249SNamjae Jeon 
88281ca7350SChao Yu 	level = get_node_path(inode, from, offset, noffset);
883ff373558SJaegeuk Kim 
884e05df3b1SJaegeuk Kim 	page = get_node_page(sbi, inode->i_ino);
88551dd6249SNamjae Jeon 	if (IS_ERR(page)) {
88651dd6249SNamjae Jeon 		trace_f2fs_truncate_inode_blocks_exit(inode, PTR_ERR(page));
887e05df3b1SJaegeuk Kim 		return PTR_ERR(page);
88851dd6249SNamjae Jeon 	}
889e05df3b1SJaegeuk Kim 
890e05df3b1SJaegeuk Kim 	set_new_dnode(&dn, inode, page, NULL, 0);
891e05df3b1SJaegeuk Kim 	unlock_page(page);
892e05df3b1SJaegeuk Kim 
89358bfaf44SJaegeuk Kim 	ri = F2FS_INODE(page);
894e05df3b1SJaegeuk Kim 	switch (level) {
895e05df3b1SJaegeuk Kim 	case 0:
896e05df3b1SJaegeuk Kim 	case 1:
897e05df3b1SJaegeuk Kim 		nofs = noffset[1];
898e05df3b1SJaegeuk Kim 		break;
899e05df3b1SJaegeuk Kim 	case 2:
900e05df3b1SJaegeuk Kim 		nofs = noffset[1];
901e05df3b1SJaegeuk Kim 		if (!offset[level - 1])
902e05df3b1SJaegeuk Kim 			goto skip_partial;
90358bfaf44SJaegeuk Kim 		err = truncate_partial_nodes(&dn, ri, offset, level);
904e05df3b1SJaegeuk Kim 		if (err < 0 && err != -ENOENT)
905e05df3b1SJaegeuk Kim 			goto fail;
906e05df3b1SJaegeuk Kim 		nofs += 1 + NIDS_PER_BLOCK;
907e05df3b1SJaegeuk Kim 		break;
908e05df3b1SJaegeuk Kim 	case 3:
909e05df3b1SJaegeuk Kim 		nofs = 5 + 2 * NIDS_PER_BLOCK;
910e05df3b1SJaegeuk Kim 		if (!offset[level - 1])
911e05df3b1SJaegeuk Kim 			goto skip_partial;
91258bfaf44SJaegeuk Kim 		err = truncate_partial_nodes(&dn, ri, offset, level);
913e05df3b1SJaegeuk Kim 		if (err < 0 && err != -ENOENT)
914e05df3b1SJaegeuk Kim 			goto fail;
915e05df3b1SJaegeuk Kim 		break;
916e05df3b1SJaegeuk Kim 	default:
917e05df3b1SJaegeuk Kim 		BUG();
918e05df3b1SJaegeuk Kim 	}
919e05df3b1SJaegeuk Kim 
920e05df3b1SJaegeuk Kim skip_partial:
921e05df3b1SJaegeuk Kim 	while (cont) {
92258bfaf44SJaegeuk Kim 		dn.nid = le32_to_cpu(ri->i_nid[offset[0] - NODE_DIR1_BLOCK]);
923e05df3b1SJaegeuk Kim 		switch (offset[0]) {
924e05df3b1SJaegeuk Kim 		case NODE_DIR1_BLOCK:
925e05df3b1SJaegeuk Kim 		case NODE_DIR2_BLOCK:
926e05df3b1SJaegeuk Kim 			err = truncate_dnode(&dn);
927e05df3b1SJaegeuk Kim 			break;
928e05df3b1SJaegeuk Kim 
929e05df3b1SJaegeuk Kim 		case NODE_IND1_BLOCK:
930e05df3b1SJaegeuk Kim 		case NODE_IND2_BLOCK:
931e05df3b1SJaegeuk Kim 			err = truncate_nodes(&dn, nofs, offset[1], 2);
932e05df3b1SJaegeuk Kim 			break;
933e05df3b1SJaegeuk Kim 
934e05df3b1SJaegeuk Kim 		case NODE_DIND_BLOCK:
935e05df3b1SJaegeuk Kim 			err = truncate_nodes(&dn, nofs, offset[1], 3);
936e05df3b1SJaegeuk Kim 			cont = 0;
937e05df3b1SJaegeuk Kim 			break;
938e05df3b1SJaegeuk Kim 
939e05df3b1SJaegeuk Kim 		default:
940e05df3b1SJaegeuk Kim 			BUG();
941e05df3b1SJaegeuk Kim 		}
942e05df3b1SJaegeuk Kim 		if (err < 0 && err != -ENOENT)
943e05df3b1SJaegeuk Kim 			goto fail;
944e05df3b1SJaegeuk Kim 		if (offset[1] == 0 &&
94558bfaf44SJaegeuk Kim 				ri->i_nid[offset[0] - NODE_DIR1_BLOCK]) {
946e05df3b1SJaegeuk Kim 			lock_page(page);
947ff373558SJaegeuk Kim 			BUG_ON(page->mapping != NODE_MAPPING(sbi));
948fec1d657SJaegeuk Kim 			f2fs_wait_on_page_writeback(page, NODE, true);
94958bfaf44SJaegeuk Kim 			ri->i_nid[offset[0] - NODE_DIR1_BLOCK] = 0;
950e05df3b1SJaegeuk Kim 			set_page_dirty(page);
951e05df3b1SJaegeuk Kim 			unlock_page(page);
952e05df3b1SJaegeuk Kim 		}
953e05df3b1SJaegeuk Kim 		offset[1] = 0;
954e05df3b1SJaegeuk Kim 		offset[0]++;
955e05df3b1SJaegeuk Kim 		nofs += err;
956e05df3b1SJaegeuk Kim 	}
957e05df3b1SJaegeuk Kim fail:
958e05df3b1SJaegeuk Kim 	f2fs_put_page(page, 0);
95951dd6249SNamjae Jeon 	trace_f2fs_truncate_inode_blocks_exit(inode, err);
960e05df3b1SJaegeuk Kim 	return err > 0 ? 0 : err;
961e05df3b1SJaegeuk Kim }
962e05df3b1SJaegeuk Kim 
9634f16fb0fSJaegeuk Kim int truncate_xattr_node(struct inode *inode, struct page *page)
9644f16fb0fSJaegeuk Kim {
9654081363fSJaegeuk Kim 	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
9664f16fb0fSJaegeuk Kim 	nid_t nid = F2FS_I(inode)->i_xattr_nid;
9674f16fb0fSJaegeuk Kim 	struct dnode_of_data dn;
9684f16fb0fSJaegeuk Kim 	struct page *npage;
9694f16fb0fSJaegeuk Kim 
9704f16fb0fSJaegeuk Kim 	if (!nid)
9714f16fb0fSJaegeuk Kim 		return 0;
9724f16fb0fSJaegeuk Kim 
9734f16fb0fSJaegeuk Kim 	npage = get_node_page(sbi, nid);
9744f16fb0fSJaegeuk Kim 	if (IS_ERR(npage))
9754f16fb0fSJaegeuk Kim 		return PTR_ERR(npage);
9764f16fb0fSJaegeuk Kim 
977205b9822SJaegeuk Kim 	f2fs_i_xnid_write(inode, 0);
97865985d93SJaegeuk Kim 
9794f16fb0fSJaegeuk Kim 	set_new_dnode(&dn, inode, page, npage, nid);
9804f16fb0fSJaegeuk Kim 
9814f16fb0fSJaegeuk Kim 	if (page)
98201d2d1aaSChao Yu 		dn.inode_page_locked = true;
9834f16fb0fSJaegeuk Kim 	truncate_node(&dn);
9844f16fb0fSJaegeuk Kim 	return 0;
9854f16fb0fSJaegeuk Kim }
9864f16fb0fSJaegeuk Kim 
98739936837SJaegeuk Kim /*
9884f4124d0SChao Yu  * Caller should grab and release a rwsem by calling f2fs_lock_op() and
9894f4124d0SChao Yu  * f2fs_unlock_op().
99039936837SJaegeuk Kim  */
99113ec7297SChao Yu int remove_inode_page(struct inode *inode)
992e05df3b1SJaegeuk Kim {
993e05df3b1SJaegeuk Kim 	struct dnode_of_data dn;
99413ec7297SChao Yu 	int err;
995e05df3b1SJaegeuk Kim 
996c2e69583SJaegeuk Kim 	set_new_dnode(&dn, inode, NULL, NULL, inode->i_ino);
99713ec7297SChao Yu 	err = get_dnode_of_data(&dn, 0, LOOKUP_NODE);
99813ec7297SChao Yu 	if (err)
99913ec7297SChao Yu 		return err;
1000e05df3b1SJaegeuk Kim 
100113ec7297SChao Yu 	err = truncate_xattr_node(inode, dn.inode_page);
100213ec7297SChao Yu 	if (err) {
1003c2e69583SJaegeuk Kim 		f2fs_put_dnode(&dn);
100413ec7297SChao Yu 		return err;
1005e05df3b1SJaegeuk Kim 	}
1006c2e69583SJaegeuk Kim 
1007c2e69583SJaegeuk Kim 	/* remove potential inline_data blocks */
1008c2e69583SJaegeuk Kim 	if (S_ISREG(inode->i_mode) || S_ISDIR(inode->i_mode) ||
1009c2e69583SJaegeuk Kim 				S_ISLNK(inode->i_mode))
1010c2e69583SJaegeuk Kim 		truncate_data_blocks_range(&dn, 1);
1011c2e69583SJaegeuk Kim 
1012e1c42045Sarter97 	/* 0 is possible, after f2fs_new_inode() has failed */
10139850cf4aSJaegeuk Kim 	f2fs_bug_on(F2FS_I_SB(inode),
10149850cf4aSJaegeuk Kim 			inode->i_blocks != 0 && inode->i_blocks != 1);
1015c2e69583SJaegeuk Kim 
1016c2e69583SJaegeuk Kim 	/* will put inode & node pages */
1017e05df3b1SJaegeuk Kim 	truncate_node(&dn);
101813ec7297SChao Yu 	return 0;
1019e05df3b1SJaegeuk Kim }
1020e05df3b1SJaegeuk Kim 
1021a014e037SJaegeuk Kim struct page *new_inode_page(struct inode *inode)
1022e05df3b1SJaegeuk Kim {
1023e05df3b1SJaegeuk Kim 	struct dnode_of_data dn;
1024e05df3b1SJaegeuk Kim 
1025e05df3b1SJaegeuk Kim 	/* allocate inode page for new inode */
1026e05df3b1SJaegeuk Kim 	set_new_dnode(&dn, inode, NULL, NULL, inode->i_ino);
102744a83ff6SJaegeuk Kim 
102844a83ff6SJaegeuk Kim 	/* caller should f2fs_put_page(page, 1); */
10298ae8f162SJaegeuk Kim 	return new_node_page(&dn, 0, NULL);
1030e05df3b1SJaegeuk Kim }
1031e05df3b1SJaegeuk Kim 
10328ae8f162SJaegeuk Kim struct page *new_node_page(struct dnode_of_data *dn,
10338ae8f162SJaegeuk Kim 				unsigned int ofs, struct page *ipage)
1034e05df3b1SJaegeuk Kim {
10354081363fSJaegeuk Kim 	struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode);
103625cc5d3bSJaegeuk Kim 	struct node_info new_ni;
1037e05df3b1SJaegeuk Kim 	struct page *page;
1038e05df3b1SJaegeuk Kim 	int err;
1039e05df3b1SJaegeuk Kim 
104091942321SJaegeuk Kim 	if (unlikely(is_inode_flag_set(dn->inode, FI_NO_ALLOC)))
1041e05df3b1SJaegeuk Kim 		return ERR_PTR(-EPERM);
1042e05df3b1SJaegeuk Kim 
1043300e129cSJaegeuk Kim 	page = f2fs_grab_cache_page(NODE_MAPPING(sbi), dn->nid, false);
1044e05df3b1SJaegeuk Kim 	if (!page)
1045e05df3b1SJaegeuk Kim 		return ERR_PTR(-ENOMEM);
1046e05df3b1SJaegeuk Kim 
10476bacf52fSJaegeuk Kim 	if (unlikely(!inc_valid_node_count(sbi, dn->inode))) {
10489c02740cSJaegeuk Kim 		err = -ENOSPC;
10499c02740cSJaegeuk Kim 		goto fail;
10509c02740cSJaegeuk Kim 	}
105125cc5d3bSJaegeuk Kim #ifdef CONFIG_F2FS_CHECK_FS
105225cc5d3bSJaegeuk Kim 	get_node_info(sbi, dn->nid, &new_ni);
105325cc5d3bSJaegeuk Kim 	f2fs_bug_on(sbi, new_ni.blk_addr != NULL_ADDR);
105425cc5d3bSJaegeuk Kim #endif
105525cc5d3bSJaegeuk Kim 	new_ni.nid = dn->nid;
1056e05df3b1SJaegeuk Kim 	new_ni.ino = dn->inode->i_ino;
105725cc5d3bSJaegeuk Kim 	new_ni.blk_addr = NULL_ADDR;
105825cc5d3bSJaegeuk Kim 	new_ni.flag = 0;
105925cc5d3bSJaegeuk Kim 	new_ni.version = 0;
1060479f40c4SJaegeuk Kim 	set_node_addr(sbi, &new_ni, NEW_ADDR, false);
10619c02740cSJaegeuk Kim 
1062fec1d657SJaegeuk Kim 	f2fs_wait_on_page_writeback(page, NODE, true);
10639c02740cSJaegeuk Kim 	fill_node_footer(page, dn->nid, dn->inode->i_ino, ofs, true);
1064398b1ac5SJaegeuk Kim 	set_cold_node(dn->inode, page);
1065237c0790SJaegeuk Kim 	if (!PageUptodate(page))
10669c02740cSJaegeuk Kim 		SetPageUptodate(page);
106712719ae1SJaegeuk Kim 	if (set_page_dirty(page))
106812719ae1SJaegeuk Kim 		dn->node_changed = true;
1069e05df3b1SJaegeuk Kim 
10704bc8e9bcSChao Yu 	if (f2fs_has_xattr_block(ofs))
1071205b9822SJaegeuk Kim 		f2fs_i_xnid_write(dn->inode, dn->nid);
1072479bd73aSJaegeuk Kim 
1073e05df3b1SJaegeuk Kim 	if (ofs == 0)
1074e05df3b1SJaegeuk Kim 		inc_valid_inode_count(sbi);
1075e05df3b1SJaegeuk Kim 	return page;
1076e05df3b1SJaegeuk Kim 
1077e05df3b1SJaegeuk Kim fail:
107871e9fec5SJaegeuk Kim 	clear_node_page_dirty(page);
1079e05df3b1SJaegeuk Kim 	f2fs_put_page(page, 1);
1080e05df3b1SJaegeuk Kim 	return ERR_PTR(err);
1081e05df3b1SJaegeuk Kim }
1082e05df3b1SJaegeuk Kim 
108356ae674cSJaegeuk Kim /*
108456ae674cSJaegeuk Kim  * Caller should do after getting the following values.
108556ae674cSJaegeuk Kim  * 0: f2fs_put_page(page, 0)
108686531d6bSJaegeuk Kim  * LOCKED_PAGE or error: f2fs_put_page(page, 1)
108756ae674cSJaegeuk Kim  */
108804d328deSMike Christie static int read_node_page(struct page *page, int op_flags)
1089e05df3b1SJaegeuk Kim {
10904081363fSJaegeuk Kim 	struct f2fs_sb_info *sbi = F2FS_P_SB(page);
1091e05df3b1SJaegeuk Kim 	struct node_info ni;
1092cf04e8ebSJaegeuk Kim 	struct f2fs_io_info fio = {
109305ca3632SJaegeuk Kim 		.sbi = sbi,
1094cf04e8ebSJaegeuk Kim 		.type = NODE,
109504d328deSMike Christie 		.op = REQ_OP_READ,
109604d328deSMike Christie 		.op_flags = op_flags,
109705ca3632SJaegeuk Kim 		.page = page,
10984375a336SJaegeuk Kim 		.encrypted_page = NULL,
1099cf04e8ebSJaegeuk Kim 	};
1100e05df3b1SJaegeuk Kim 
11013bdad3c7SJaegeuk Kim 	if (PageUptodate(page))
11023bdad3c7SJaegeuk Kim 		return LOCKED_PAGE;
11033bdad3c7SJaegeuk Kim 
1104e05df3b1SJaegeuk Kim 	get_node_info(sbi, page->index, &ni);
1105e05df3b1SJaegeuk Kim 
11066bacf52fSJaegeuk Kim 	if (unlikely(ni.blk_addr == NULL_ADDR)) {
11072bca1e23SJaegeuk Kim 		ClearPageUptodate(page);
1108e05df3b1SJaegeuk Kim 		return -ENOENT;
1109393ff91fSJaegeuk Kim 	}
1110393ff91fSJaegeuk Kim 
11117a9d7548SChao Yu 	fio.new_blkaddr = fio.old_blkaddr = ni.blk_addr;
111205ca3632SJaegeuk Kim 	return f2fs_submit_page_bio(&fio);
1113e05df3b1SJaegeuk Kim }
1114e05df3b1SJaegeuk Kim 
11150a8165d7SJaegeuk Kim /*
1116e05df3b1SJaegeuk Kim  * Readahead a node page
1117e05df3b1SJaegeuk Kim  */
1118e05df3b1SJaegeuk Kim void ra_node_page(struct f2fs_sb_info *sbi, nid_t nid)
1119e05df3b1SJaegeuk Kim {
1120e05df3b1SJaegeuk Kim 	struct page *apage;
112156ae674cSJaegeuk Kim 	int err;
1122e05df3b1SJaegeuk Kim 
1123e8458725SChao Yu 	if (!nid)
1124e8458725SChao Yu 		return;
1125e8458725SChao Yu 	f2fs_bug_on(sbi, check_nid_range(sbi, nid));
1126e8458725SChao Yu 
1127999270deSFan Li 	rcu_read_lock();
1128999270deSFan Li 	apage = radix_tree_lookup(&NODE_MAPPING(sbi)->page_tree, nid);
1129999270deSFan Li 	rcu_read_unlock();
1130999270deSFan Li 	if (apage)
1131393ff91fSJaegeuk Kim 		return;
1132e05df3b1SJaegeuk Kim 
1133300e129cSJaegeuk Kim 	apage = f2fs_grab_cache_page(NODE_MAPPING(sbi), nid, false);
1134e05df3b1SJaegeuk Kim 	if (!apage)
1135e05df3b1SJaegeuk Kim 		return;
1136e05df3b1SJaegeuk Kim 
113770246286SChristoph Hellwig 	err = read_node_page(apage, REQ_RAHEAD);
113886531d6bSJaegeuk Kim 	f2fs_put_page(apage, err ? 1 : 0);
1139e05df3b1SJaegeuk Kim }
1140e05df3b1SJaegeuk Kim 
114117a0ee55SJaegeuk Kim static struct page *__get_node_page(struct f2fs_sb_info *sbi, pgoff_t nid,
11420e022ea8SChao Yu 					struct page *parent, int start)
1143e05df3b1SJaegeuk Kim {
114456ae674cSJaegeuk Kim 	struct page *page;
114556ae674cSJaegeuk Kim 	int err;
11464aa69d56SJaegeuk Kim 
11474aa69d56SJaegeuk Kim 	if (!nid)
11484aa69d56SJaegeuk Kim 		return ERR_PTR(-ENOENT);
11494aa69d56SJaegeuk Kim 	f2fs_bug_on(sbi, check_nid_range(sbi, nid));
1150afcb7ca0SJaegeuk Kim repeat:
1151300e129cSJaegeuk Kim 	page = f2fs_grab_cache_page(NODE_MAPPING(sbi), nid, false);
1152e05df3b1SJaegeuk Kim 	if (!page)
1153e05df3b1SJaegeuk Kim 		return ERR_PTR(-ENOMEM);
1154e05df3b1SJaegeuk Kim 
115570fd7614SChristoph Hellwig 	err = read_node_page(page, 0);
115686531d6bSJaegeuk Kim 	if (err < 0) {
115786531d6bSJaegeuk Kim 		f2fs_put_page(page, 1);
1158e05df3b1SJaegeuk Kim 		return ERR_PTR(err);
1159e1c51b9fSChao Yu 	} else if (err == LOCKED_PAGE) {
11601f258ec1SChao Yu 		err = 0;
1161e1c51b9fSChao Yu 		goto page_hit;
116286531d6bSJaegeuk Kim 	}
1163aaf96075SJaegeuk Kim 
11640e022ea8SChao Yu 	if (parent)
116579344efbSJaegeuk Kim 		ra_node_pages(parent, start + 1, MAX_RA_NODE);
11660e022ea8SChao Yu 
1167e1c51b9fSChao Yu 	lock_page(page);
1168e1c51b9fSChao Yu 
11694ef51a8fSJaegeuk Kim 	if (unlikely(page->mapping != NODE_MAPPING(sbi))) {
1170afcb7ca0SJaegeuk Kim 		f2fs_put_page(page, 1);
1171afcb7ca0SJaegeuk Kim 		goto repeat;
1172afcb7ca0SJaegeuk Kim 	}
11731563ac75SChao Yu 
11741f258ec1SChao Yu 	if (unlikely(!PageUptodate(page))) {
11751f258ec1SChao Yu 		err = -EIO;
11761563ac75SChao Yu 		goto out_err;
11771f258ec1SChao Yu 	}
1178e1c51b9fSChao Yu page_hit:
11790c9df7fbSYunlong Song 	if(unlikely(nid != nid_of_node(page))) {
11801f258ec1SChao Yu 		f2fs_msg(sbi->sb, KERN_WARNING, "inconsistent node block, "
11811f258ec1SChao Yu 			"nid:%lu, node_footer[nid:%u,ino:%u,ofs:%u,cpver:%llu,blkaddr:%u]",
11821f258ec1SChao Yu 			nid, nid_of_node(page), ino_of_node(page),
11831f258ec1SChao Yu 			ofs_of_node(page), cpver_of_node(page),
11841f258ec1SChao Yu 			next_blkaddr_of_node(page));
11850c9df7fbSYunlong Song 		ClearPageUptodate(page);
11861f258ec1SChao Yu 		err = -EINVAL;
11870c9df7fbSYunlong Song out_err:
11880c9df7fbSYunlong Song 		f2fs_put_page(page, 1);
11891f258ec1SChao Yu 		return ERR_PTR(err);
11900c9df7fbSYunlong Song 	}
1191e05df3b1SJaegeuk Kim 	return page;
1192e05df3b1SJaegeuk Kim }
1193e05df3b1SJaegeuk Kim 
11940e022ea8SChao Yu struct page *get_node_page(struct f2fs_sb_info *sbi, pgoff_t nid)
11950e022ea8SChao Yu {
11960e022ea8SChao Yu 	return __get_node_page(sbi, nid, NULL, 0);
11970e022ea8SChao Yu }
11980e022ea8SChao Yu 
1199e05df3b1SJaegeuk Kim struct page *get_node_page_ra(struct page *parent, int start)
1200e05df3b1SJaegeuk Kim {
12014081363fSJaegeuk Kim 	struct f2fs_sb_info *sbi = F2FS_P_SB(parent);
12020e022ea8SChao Yu 	nid_t nid = get_nid(parent, start, false);
1203e05df3b1SJaegeuk Kim 
12040e022ea8SChao Yu 	return __get_node_page(sbi, nid, parent, start);
1205e05df3b1SJaegeuk Kim }
1206e05df3b1SJaegeuk Kim 
12072049d4fcSJaegeuk Kim static void flush_inline_data(struct f2fs_sb_info *sbi, nid_t ino)
12082049d4fcSJaegeuk Kim {
12092049d4fcSJaegeuk Kim 	struct inode *inode;
12102049d4fcSJaegeuk Kim 	struct page *page;
12110f3311a8SChao Yu 	int ret;
12122049d4fcSJaegeuk Kim 
12132049d4fcSJaegeuk Kim 	/* should flush inline_data before evict_inode */
12142049d4fcSJaegeuk Kim 	inode = ilookup(sbi->sb, ino);
12152049d4fcSJaegeuk Kim 	if (!inode)
12162049d4fcSJaegeuk Kim 		return;
12172049d4fcSJaegeuk Kim 
12184a6de50dSJaegeuk Kim 	page = pagecache_get_page(inode->i_mapping, 0, FGP_LOCK|FGP_NOWAIT, 0);
12192049d4fcSJaegeuk Kim 	if (!page)
12202049d4fcSJaegeuk Kim 		goto iput_out;
12212049d4fcSJaegeuk Kim 
12222049d4fcSJaegeuk Kim 	if (!PageUptodate(page))
12232049d4fcSJaegeuk Kim 		goto page_out;
12242049d4fcSJaegeuk Kim 
12252049d4fcSJaegeuk Kim 	if (!PageDirty(page))
12262049d4fcSJaegeuk Kim 		goto page_out;
12272049d4fcSJaegeuk Kim 
12282049d4fcSJaegeuk Kim 	if (!clear_page_dirty_for_io(page))
12292049d4fcSJaegeuk Kim 		goto page_out;
12302049d4fcSJaegeuk Kim 
12310f3311a8SChao Yu 	ret = f2fs_write_inline_data(inode, page);
12322049d4fcSJaegeuk Kim 	inode_dec_dirty_pages(inode);
1233933439c8SChao Yu 	remove_dirty_inode(inode);
12340f3311a8SChao Yu 	if (ret)
12352049d4fcSJaegeuk Kim 		set_page_dirty(page);
12362049d4fcSJaegeuk Kim page_out:
12374a6de50dSJaegeuk Kim 	f2fs_put_page(page, 1);
12382049d4fcSJaegeuk Kim iput_out:
12392049d4fcSJaegeuk Kim 	iput(inode);
12402049d4fcSJaegeuk Kim }
12412049d4fcSJaegeuk Kim 
1242da011cc0SChao Yu void move_node_page(struct page *node_page, int gc_type)
1243da011cc0SChao Yu {
1244da011cc0SChao Yu 	if (gc_type == FG_GC) {
1245da011cc0SChao Yu 		struct f2fs_sb_info *sbi = F2FS_P_SB(node_page);
1246da011cc0SChao Yu 		struct writeback_control wbc = {
1247da011cc0SChao Yu 			.sync_mode = WB_SYNC_ALL,
1248da011cc0SChao Yu 			.nr_to_write = 1,
1249da011cc0SChao Yu 			.for_reclaim = 0,
1250da011cc0SChao Yu 		};
1251da011cc0SChao Yu 
1252da011cc0SChao Yu 		set_page_dirty(node_page);
1253da011cc0SChao Yu 		f2fs_wait_on_page_writeback(node_page, NODE, true);
1254da011cc0SChao Yu 
1255da011cc0SChao Yu 		f2fs_bug_on(sbi, PageWriteback(node_page));
1256da011cc0SChao Yu 		if (!clear_page_dirty_for_io(node_page))
1257da011cc0SChao Yu 			goto out_page;
1258da011cc0SChao Yu 
1259da011cc0SChao Yu 		if (NODE_MAPPING(sbi)->a_ops->writepage(node_page, &wbc))
1260da011cc0SChao Yu 			unlock_page(node_page);
1261da011cc0SChao Yu 		goto release_page;
1262da011cc0SChao Yu 	} else {
1263da011cc0SChao Yu 		/* set page dirty and write it */
1264da011cc0SChao Yu 		if (!PageWriteback(node_page))
1265da011cc0SChao Yu 			set_page_dirty(node_page);
1266da011cc0SChao Yu 	}
1267da011cc0SChao Yu out_page:
1268da011cc0SChao Yu 	unlock_page(node_page);
1269da011cc0SChao Yu release_page:
1270da011cc0SChao Yu 	f2fs_put_page(node_page, 0);
1271da011cc0SChao Yu }
1272da011cc0SChao Yu 
1273608514deSJaegeuk Kim static struct page *last_fsync_dnode(struct f2fs_sb_info *sbi, nid_t ino)
1274e05df3b1SJaegeuk Kim {
1275e05df3b1SJaegeuk Kim 	pgoff_t index, end;
1276e05df3b1SJaegeuk Kim 	struct pagevec pvec;
1277608514deSJaegeuk Kim 	struct page *last_page = NULL;
127852681375SJaegeuk Kim 
127952681375SJaegeuk Kim 	pagevec_init(&pvec, 0);
128052681375SJaegeuk Kim 	index = 0;
128152681375SJaegeuk Kim 	end = ULONG_MAX;
128252681375SJaegeuk Kim 
128352681375SJaegeuk Kim 	while (index <= end) {
128452681375SJaegeuk Kim 		int i, nr_pages;
128552681375SJaegeuk Kim 		nr_pages = pagevec_lookup_tag(&pvec, NODE_MAPPING(sbi), &index,
128652681375SJaegeuk Kim 				PAGECACHE_TAG_DIRTY,
128752681375SJaegeuk Kim 				min(end - index, (pgoff_t)PAGEVEC_SIZE-1) + 1);
128852681375SJaegeuk Kim 		if (nr_pages == 0)
128952681375SJaegeuk Kim 			break;
129052681375SJaegeuk Kim 
129152681375SJaegeuk Kim 		for (i = 0; i < nr_pages; i++) {
129252681375SJaegeuk Kim 			struct page *page = pvec.pages[i];
129352681375SJaegeuk Kim 
129452681375SJaegeuk Kim 			if (unlikely(f2fs_cp_error(sbi))) {
1295608514deSJaegeuk Kim 				f2fs_put_page(last_page, 0);
129652681375SJaegeuk Kim 				pagevec_release(&pvec);
1297608514deSJaegeuk Kim 				return ERR_PTR(-EIO);
129852681375SJaegeuk Kim 			}
129952681375SJaegeuk Kim 
130052681375SJaegeuk Kim 			if (!IS_DNODE(page) || !is_cold_node(page))
130152681375SJaegeuk Kim 				continue;
130252681375SJaegeuk Kim 			if (ino_of_node(page) != ino)
130352681375SJaegeuk Kim 				continue;
130452681375SJaegeuk Kim 
130552681375SJaegeuk Kim 			lock_page(page);
130652681375SJaegeuk Kim 
130752681375SJaegeuk Kim 			if (unlikely(page->mapping != NODE_MAPPING(sbi))) {
130852681375SJaegeuk Kim continue_unlock:
130952681375SJaegeuk Kim 				unlock_page(page);
131052681375SJaegeuk Kim 				continue;
131152681375SJaegeuk Kim 			}
131252681375SJaegeuk Kim 			if (ino_of_node(page) != ino)
131352681375SJaegeuk Kim 				goto continue_unlock;
131452681375SJaegeuk Kim 
131552681375SJaegeuk Kim 			if (!PageDirty(page)) {
131652681375SJaegeuk Kim 				/* someone wrote it for us */
131752681375SJaegeuk Kim 				goto continue_unlock;
131852681375SJaegeuk Kim 			}
131952681375SJaegeuk Kim 
1320608514deSJaegeuk Kim 			if (last_page)
1321608514deSJaegeuk Kim 				f2fs_put_page(last_page, 0);
1322608514deSJaegeuk Kim 
1323608514deSJaegeuk Kim 			get_page(page);
1324608514deSJaegeuk Kim 			last_page = page;
1325608514deSJaegeuk Kim 			unlock_page(page);
1326608514deSJaegeuk Kim 		}
1327608514deSJaegeuk Kim 		pagevec_release(&pvec);
1328608514deSJaegeuk Kim 		cond_resched();
1329608514deSJaegeuk Kim 	}
1330608514deSJaegeuk Kim 	return last_page;
1331608514deSJaegeuk Kim }
1332608514deSJaegeuk Kim 
1333d68f735bSJaegeuk Kim static int __write_node_page(struct page *page, bool atomic, bool *submitted,
1334faa24895SJaegeuk Kim 				struct writeback_control *wbc)
1335faa24895SJaegeuk Kim {
1336faa24895SJaegeuk Kim 	struct f2fs_sb_info *sbi = F2FS_P_SB(page);
1337faa24895SJaegeuk Kim 	nid_t nid;
1338faa24895SJaegeuk Kim 	struct node_info ni;
1339faa24895SJaegeuk Kim 	struct f2fs_io_info fio = {
1340faa24895SJaegeuk Kim 		.sbi = sbi,
1341faa24895SJaegeuk Kim 		.type = NODE,
1342faa24895SJaegeuk Kim 		.op = REQ_OP_WRITE,
1343faa24895SJaegeuk Kim 		.op_flags = wbc_to_write_flags(wbc),
1344faa24895SJaegeuk Kim 		.page = page,
1345faa24895SJaegeuk Kim 		.encrypted_page = NULL,
1346d68f735bSJaegeuk Kim 		.submitted = false,
1347faa24895SJaegeuk Kim 	};
1348faa24895SJaegeuk Kim 
1349faa24895SJaegeuk Kim 	trace_f2fs_writepage(page, NODE);
1350faa24895SJaegeuk Kim 
1351faa24895SJaegeuk Kim 	if (unlikely(is_sbi_flag_set(sbi, SBI_POR_DOING)))
1352faa24895SJaegeuk Kim 		goto redirty_out;
1353faa24895SJaegeuk Kim 	if (unlikely(f2fs_cp_error(sbi)))
1354faa24895SJaegeuk Kim 		goto redirty_out;
1355faa24895SJaegeuk Kim 
1356faa24895SJaegeuk Kim 	/* get old block addr of this node page */
1357faa24895SJaegeuk Kim 	nid = nid_of_node(page);
1358faa24895SJaegeuk Kim 	f2fs_bug_on(sbi, page->index != nid);
1359faa24895SJaegeuk Kim 
1360faa24895SJaegeuk Kim 	if (wbc->for_reclaim) {
1361faa24895SJaegeuk Kim 		if (!down_read_trylock(&sbi->node_write))
1362faa24895SJaegeuk Kim 			goto redirty_out;
1363faa24895SJaegeuk Kim 	} else {
1364faa24895SJaegeuk Kim 		down_read(&sbi->node_write);
1365faa24895SJaegeuk Kim 	}
1366faa24895SJaegeuk Kim 
1367faa24895SJaegeuk Kim 	get_node_info(sbi, nid, &ni);
1368faa24895SJaegeuk Kim 
1369faa24895SJaegeuk Kim 	/* This page is already truncated */
1370faa24895SJaegeuk Kim 	if (unlikely(ni.blk_addr == NULL_ADDR)) {
1371faa24895SJaegeuk Kim 		ClearPageUptodate(page);
1372faa24895SJaegeuk Kim 		dec_page_count(sbi, F2FS_DIRTY_NODES);
1373faa24895SJaegeuk Kim 		up_read(&sbi->node_write);
1374faa24895SJaegeuk Kim 		unlock_page(page);
1375faa24895SJaegeuk Kim 		return 0;
1376faa24895SJaegeuk Kim 	}
1377faa24895SJaegeuk Kim 
1378e7c75ab0SJaegeuk Kim 	if (atomic && !test_opt(sbi, NOBARRIER))
1379e7c75ab0SJaegeuk Kim 		fio.op_flags |= REQ_PREFLUSH | REQ_FUA;
1380e7c75ab0SJaegeuk Kim 
1381faa24895SJaegeuk Kim 	set_page_writeback(page);
1382faa24895SJaegeuk Kim 	fio.old_blkaddr = ni.blk_addr;
1383faa24895SJaegeuk Kim 	write_node_page(nid, &fio);
1384faa24895SJaegeuk Kim 	set_node_addr(sbi, &ni, fio.new_blkaddr, is_fsync_dnode(page));
1385faa24895SJaegeuk Kim 	dec_page_count(sbi, F2FS_DIRTY_NODES);
1386faa24895SJaegeuk Kim 	up_read(&sbi->node_write);
1387faa24895SJaegeuk Kim 
1388d68f735bSJaegeuk Kim 	if (wbc->for_reclaim) {
1389b9109b0eSJaegeuk Kim 		f2fs_submit_merged_write_cond(sbi, page->mapping->host, 0,
1390b9109b0eSJaegeuk Kim 						page->index, NODE);
1391d68f735bSJaegeuk Kim 		submitted = NULL;
1392d68f735bSJaegeuk Kim 	}
1393faa24895SJaegeuk Kim 
1394faa24895SJaegeuk Kim 	unlock_page(page);
1395faa24895SJaegeuk Kim 
1396d68f735bSJaegeuk Kim 	if (unlikely(f2fs_cp_error(sbi))) {
1397b9109b0eSJaegeuk Kim 		f2fs_submit_merged_write(sbi, NODE);
1398d68f735bSJaegeuk Kim 		submitted = NULL;
1399d68f735bSJaegeuk Kim 	}
1400d68f735bSJaegeuk Kim 	if (submitted)
1401d68f735bSJaegeuk Kim 		*submitted = fio.submitted;
1402faa24895SJaegeuk Kim 
1403faa24895SJaegeuk Kim 	return 0;
1404faa24895SJaegeuk Kim 
1405faa24895SJaegeuk Kim redirty_out:
1406faa24895SJaegeuk Kim 	redirty_page_for_writepage(wbc, page);
1407faa24895SJaegeuk Kim 	return AOP_WRITEPAGE_ACTIVATE;
1408faa24895SJaegeuk Kim }
1409faa24895SJaegeuk Kim 
1410faa24895SJaegeuk Kim static int f2fs_write_node_page(struct page *page,
1411faa24895SJaegeuk Kim 				struct writeback_control *wbc)
1412faa24895SJaegeuk Kim {
1413d68f735bSJaegeuk Kim 	return __write_node_page(page, false, NULL, wbc);
1414faa24895SJaegeuk Kim }
1415faa24895SJaegeuk Kim 
141626de9b11SJaegeuk Kim int fsync_node_pages(struct f2fs_sb_info *sbi, struct inode *inode,
1417608514deSJaegeuk Kim 			struct writeback_control *wbc, bool atomic)
1418608514deSJaegeuk Kim {
1419608514deSJaegeuk Kim 	pgoff_t index, end;
1420942fd319SJaegeuk Kim 	pgoff_t last_idx = ULONG_MAX;
1421608514deSJaegeuk Kim 	struct pagevec pvec;
1422608514deSJaegeuk Kim 	int ret = 0;
1423608514deSJaegeuk Kim 	struct page *last_page = NULL;
1424608514deSJaegeuk Kim 	bool marked = false;
142526de9b11SJaegeuk Kim 	nid_t ino = inode->i_ino;
1426608514deSJaegeuk Kim 
1427608514deSJaegeuk Kim 	if (atomic) {
1428608514deSJaegeuk Kim 		last_page = last_fsync_dnode(sbi, ino);
1429608514deSJaegeuk Kim 		if (IS_ERR_OR_NULL(last_page))
1430608514deSJaegeuk Kim 			return PTR_ERR_OR_ZERO(last_page);
1431608514deSJaegeuk Kim 	}
1432608514deSJaegeuk Kim retry:
1433608514deSJaegeuk Kim 	pagevec_init(&pvec, 0);
1434608514deSJaegeuk Kim 	index = 0;
1435608514deSJaegeuk Kim 	end = ULONG_MAX;
1436608514deSJaegeuk Kim 
1437608514deSJaegeuk Kim 	while (index <= end) {
1438608514deSJaegeuk Kim 		int i, nr_pages;
1439608514deSJaegeuk Kim 		nr_pages = pagevec_lookup_tag(&pvec, NODE_MAPPING(sbi), &index,
1440608514deSJaegeuk Kim 				PAGECACHE_TAG_DIRTY,
1441608514deSJaegeuk Kim 				min(end - index, (pgoff_t)PAGEVEC_SIZE-1) + 1);
1442608514deSJaegeuk Kim 		if (nr_pages == 0)
1443608514deSJaegeuk Kim 			break;
1444608514deSJaegeuk Kim 
1445608514deSJaegeuk Kim 		for (i = 0; i < nr_pages; i++) {
1446608514deSJaegeuk Kim 			struct page *page = pvec.pages[i];
1447d68f735bSJaegeuk Kim 			bool submitted = false;
1448608514deSJaegeuk Kim 
1449608514deSJaegeuk Kim 			if (unlikely(f2fs_cp_error(sbi))) {
1450608514deSJaegeuk Kim 				f2fs_put_page(last_page, 0);
1451608514deSJaegeuk Kim 				pagevec_release(&pvec);
14529de69279SChao Yu 				ret = -EIO;
14539de69279SChao Yu 				goto out;
1454608514deSJaegeuk Kim 			}
1455608514deSJaegeuk Kim 
1456608514deSJaegeuk Kim 			if (!IS_DNODE(page) || !is_cold_node(page))
1457608514deSJaegeuk Kim 				continue;
1458608514deSJaegeuk Kim 			if (ino_of_node(page) != ino)
1459608514deSJaegeuk Kim 				continue;
1460608514deSJaegeuk Kim 
1461608514deSJaegeuk Kim 			lock_page(page);
1462608514deSJaegeuk Kim 
1463608514deSJaegeuk Kim 			if (unlikely(page->mapping != NODE_MAPPING(sbi))) {
1464608514deSJaegeuk Kim continue_unlock:
1465608514deSJaegeuk Kim 				unlock_page(page);
1466608514deSJaegeuk Kim 				continue;
1467608514deSJaegeuk Kim 			}
1468608514deSJaegeuk Kim 			if (ino_of_node(page) != ino)
146952681375SJaegeuk Kim 				goto continue_unlock;
147052681375SJaegeuk Kim 
1471608514deSJaegeuk Kim 			if (!PageDirty(page) && page != last_page) {
1472608514deSJaegeuk Kim 				/* someone wrote it for us */
1473608514deSJaegeuk Kim 				goto continue_unlock;
1474608514deSJaegeuk Kim 			}
1475608514deSJaegeuk Kim 
1476608514deSJaegeuk Kim 			f2fs_wait_on_page_writeback(page, NODE, true);
1477608514deSJaegeuk Kim 			BUG_ON(PageWriteback(page));
1478608514deSJaegeuk Kim 
1479d29fd172SJaegeuk Kim 			set_fsync_mark(page, 0);
1480d29fd172SJaegeuk Kim 			set_dentry_mark(page, 0);
1481d29fd172SJaegeuk Kim 
1482608514deSJaegeuk Kim 			if (!atomic || page == last_page) {
148352681375SJaegeuk Kim 				set_fsync_mark(page, 1);
148426de9b11SJaegeuk Kim 				if (IS_INODE(page)) {
148526de9b11SJaegeuk Kim 					if (is_inode_flag_set(inode,
148626de9b11SJaegeuk Kim 								FI_DIRTY_INODE))
148726de9b11SJaegeuk Kim 						update_inode(inode, page);
148852681375SJaegeuk Kim 					set_dentry_mark(page,
148952681375SJaegeuk Kim 						need_dentry_mark(sbi, ino));
149026de9b11SJaegeuk Kim 				}
1491608514deSJaegeuk Kim 				/*  may be written by other thread */
1492608514deSJaegeuk Kim 				if (!PageDirty(page))
1493608514deSJaegeuk Kim 					set_page_dirty(page);
1494608514deSJaegeuk Kim 			}
1495608514deSJaegeuk Kim 
1496608514deSJaegeuk Kim 			if (!clear_page_dirty_for_io(page))
1497608514deSJaegeuk Kim 				goto continue_unlock;
149852681375SJaegeuk Kim 
1499e7c75ab0SJaegeuk Kim 			ret = __write_node_page(page, atomic &&
1500d68f735bSJaegeuk Kim 						page == last_page,
1501d68f735bSJaegeuk Kim 						&submitted, wbc);
1502c267ec15SJaegeuk Kim 			if (ret) {
150352681375SJaegeuk Kim 				unlock_page(page);
1504608514deSJaegeuk Kim 				f2fs_put_page(last_page, 0);
1505608514deSJaegeuk Kim 				break;
1506d68f735bSJaegeuk Kim 			} else if (submitted) {
1507942fd319SJaegeuk Kim 				last_idx = page->index;
1508608514deSJaegeuk Kim 			}
15093f5f4959SChao Yu 
1510608514deSJaegeuk Kim 			if (page == last_page) {
1511608514deSJaegeuk Kim 				f2fs_put_page(page, 0);
1512608514deSJaegeuk Kim 				marked = true;
151352681375SJaegeuk Kim 				break;
151452681375SJaegeuk Kim 			}
1515c267ec15SJaegeuk Kim 		}
151652681375SJaegeuk Kim 		pagevec_release(&pvec);
151752681375SJaegeuk Kim 		cond_resched();
151852681375SJaegeuk Kim 
1519608514deSJaegeuk Kim 		if (ret || marked)
152052681375SJaegeuk Kim 			break;
152152681375SJaegeuk Kim 	}
1522608514deSJaegeuk Kim 	if (!ret && atomic && !marked) {
1523608514deSJaegeuk Kim 		f2fs_msg(sbi->sb, KERN_DEBUG,
1524608514deSJaegeuk Kim 			"Retry to write fsync mark: ino=%u, idx=%lx",
1525608514deSJaegeuk Kim 					ino, last_page->index);
1526608514deSJaegeuk Kim 		lock_page(last_page);
1527d40a43afSYunlei He 		f2fs_wait_on_page_writeback(last_page, NODE, true);
1528608514deSJaegeuk Kim 		set_page_dirty(last_page);
1529608514deSJaegeuk Kim 		unlock_page(last_page);
1530608514deSJaegeuk Kim 		goto retry;
1531608514deSJaegeuk Kim 	}
15329de69279SChao Yu out:
1533942fd319SJaegeuk Kim 	if (last_idx != ULONG_MAX)
1534b9109b0eSJaegeuk Kim 		f2fs_submit_merged_write_cond(sbi, NULL, ino, last_idx, NODE);
1535c267ec15SJaegeuk Kim 	return ret ? -EIO: 0;
153652681375SJaegeuk Kim }
153752681375SJaegeuk Kim 
153852681375SJaegeuk Kim int sync_node_pages(struct f2fs_sb_info *sbi, struct writeback_control *wbc)
153952681375SJaegeuk Kim {
154052681375SJaegeuk Kim 	pgoff_t index, end;
154152681375SJaegeuk Kim 	struct pagevec pvec;
154252681375SJaegeuk Kim 	int step = 0;
154312bb0a8fSJaegeuk Kim 	int nwritten = 0;
15443f5f4959SChao Yu 	int ret = 0;
1545e05df3b1SJaegeuk Kim 
1546e05df3b1SJaegeuk Kim 	pagevec_init(&pvec, 0);
1547e05df3b1SJaegeuk Kim 
1548e05df3b1SJaegeuk Kim next_step:
1549e05df3b1SJaegeuk Kim 	index = 0;
155080dd9c0eSChao Yu 	end = ULONG_MAX;
1551e05df3b1SJaegeuk Kim 
1552e05df3b1SJaegeuk Kim 	while (index <= end) {
1553e05df3b1SJaegeuk Kim 		int i, nr_pages;
15544ef51a8fSJaegeuk Kim 		nr_pages = pagevec_lookup_tag(&pvec, NODE_MAPPING(sbi), &index,
1555e05df3b1SJaegeuk Kim 				PAGECACHE_TAG_DIRTY,
1556e05df3b1SJaegeuk Kim 				min(end - index, (pgoff_t)PAGEVEC_SIZE-1) + 1);
1557e05df3b1SJaegeuk Kim 		if (nr_pages == 0)
1558e05df3b1SJaegeuk Kim 			break;
1559e05df3b1SJaegeuk Kim 
1560e05df3b1SJaegeuk Kim 		for (i = 0; i < nr_pages; i++) {
1561e05df3b1SJaegeuk Kim 			struct page *page = pvec.pages[i];
1562d68f735bSJaegeuk Kim 			bool submitted = false;
1563e05df3b1SJaegeuk Kim 
15646d5a1495SChao Yu 			if (unlikely(f2fs_cp_error(sbi))) {
15656d5a1495SChao Yu 				pagevec_release(&pvec);
15663f5f4959SChao Yu 				ret = -EIO;
15673f5f4959SChao Yu 				goto out;
15686d5a1495SChao Yu 			}
15696d5a1495SChao Yu 
1570e05df3b1SJaegeuk Kim 			/*
1571e05df3b1SJaegeuk Kim 			 * flushing sequence with step:
1572e05df3b1SJaegeuk Kim 			 * 0. indirect nodes
1573e05df3b1SJaegeuk Kim 			 * 1. dentry dnodes
1574e05df3b1SJaegeuk Kim 			 * 2. file dnodes
1575e05df3b1SJaegeuk Kim 			 */
1576e05df3b1SJaegeuk Kim 			if (step == 0 && IS_DNODE(page))
1577e05df3b1SJaegeuk Kim 				continue;
1578e05df3b1SJaegeuk Kim 			if (step == 1 && (!IS_DNODE(page) ||
1579e05df3b1SJaegeuk Kim 						is_cold_node(page)))
1580e05df3b1SJaegeuk Kim 				continue;
1581e05df3b1SJaegeuk Kim 			if (step == 2 && (!IS_DNODE(page) ||
1582e05df3b1SJaegeuk Kim 						!is_cold_node(page)))
1583e05df3b1SJaegeuk Kim 				continue;
15849a4cbc9eSChao Yu lock_node:
158552681375SJaegeuk Kim 			if (!trylock_page(page))
1586e05df3b1SJaegeuk Kim 				continue;
1587e05df3b1SJaegeuk Kim 
15884ef51a8fSJaegeuk Kim 			if (unlikely(page->mapping != NODE_MAPPING(sbi))) {
1589e05df3b1SJaegeuk Kim continue_unlock:
1590e05df3b1SJaegeuk Kim 				unlock_page(page);
1591e05df3b1SJaegeuk Kim 				continue;
1592e05df3b1SJaegeuk Kim 			}
1593e05df3b1SJaegeuk Kim 
1594e05df3b1SJaegeuk Kim 			if (!PageDirty(page)) {
1595e05df3b1SJaegeuk Kim 				/* someone wrote it for us */
1596e05df3b1SJaegeuk Kim 				goto continue_unlock;
1597e05df3b1SJaegeuk Kim 			}
1598e05df3b1SJaegeuk Kim 
15992049d4fcSJaegeuk Kim 			/* flush inline_data */
160052681375SJaegeuk Kim 			if (is_inline_node(page)) {
16012049d4fcSJaegeuk Kim 				clear_inline_node(page);
16022049d4fcSJaegeuk Kim 				unlock_page(page);
16032049d4fcSJaegeuk Kim 				flush_inline_data(sbi, ino_of_node(page));
16049a4cbc9eSChao Yu 				goto lock_node;
16052049d4fcSJaegeuk Kim 			}
16062049d4fcSJaegeuk Kim 
1607fa3d2bdfSJaegeuk Kim 			f2fs_wait_on_page_writeback(page, NODE, true);
1608fa3d2bdfSJaegeuk Kim 
1609fa3d2bdfSJaegeuk Kim 			BUG_ON(PageWriteback(page));
1610e05df3b1SJaegeuk Kim 			if (!clear_page_dirty_for_io(page))
1611e05df3b1SJaegeuk Kim 				goto continue_unlock;
1612e05df3b1SJaegeuk Kim 
1613e05df3b1SJaegeuk Kim 			set_fsync_mark(page, 0);
1614e05df3b1SJaegeuk Kim 			set_dentry_mark(page, 0);
161552746519SJaegeuk Kim 
1616d68f735bSJaegeuk Kim 			ret = __write_node_page(page, false, &submitted, wbc);
1617d68f735bSJaegeuk Kim 			if (ret)
161852746519SJaegeuk Kim 				unlock_page(page);
1619d68f735bSJaegeuk Kim 			else if (submitted)
16203f5f4959SChao Yu 				nwritten++;
1621e05df3b1SJaegeuk Kim 
1622e05df3b1SJaegeuk Kim 			if (--wbc->nr_to_write == 0)
1623e05df3b1SJaegeuk Kim 				break;
1624e05df3b1SJaegeuk Kim 		}
1625e05df3b1SJaegeuk Kim 		pagevec_release(&pvec);
1626e05df3b1SJaegeuk Kim 		cond_resched();
1627e05df3b1SJaegeuk Kim 
1628e05df3b1SJaegeuk Kim 		if (wbc->nr_to_write == 0) {
1629e05df3b1SJaegeuk Kim 			step = 2;
1630e05df3b1SJaegeuk Kim 			break;
1631e05df3b1SJaegeuk Kim 		}
1632e05df3b1SJaegeuk Kim 	}
1633e05df3b1SJaegeuk Kim 
1634e05df3b1SJaegeuk Kim 	if (step < 2) {
1635e05df3b1SJaegeuk Kim 		step++;
1636e05df3b1SJaegeuk Kim 		goto next_step;
1637e05df3b1SJaegeuk Kim 	}
16383f5f4959SChao Yu out:
16393f5f4959SChao Yu 	if (nwritten)
1640b9109b0eSJaegeuk Kim 		f2fs_submit_merged_write(sbi, NODE);
16413f5f4959SChao Yu 	return ret;
1642e05df3b1SJaegeuk Kim }
1643e05df3b1SJaegeuk Kim 
1644cfe58f9dSJaegeuk Kim int wait_on_node_pages_writeback(struct f2fs_sb_info *sbi, nid_t ino)
1645cfe58f9dSJaegeuk Kim {
164680dd9c0eSChao Yu 	pgoff_t index = 0, end = ULONG_MAX;
1647cfe58f9dSJaegeuk Kim 	struct pagevec pvec;
1648280db3c8SMiklos Szeredi 	int ret2, ret = 0;
1649cfe58f9dSJaegeuk Kim 
1650cfe58f9dSJaegeuk Kim 	pagevec_init(&pvec, 0);
16514ef51a8fSJaegeuk Kim 
16524ef51a8fSJaegeuk Kim 	while (index <= end) {
16534ef51a8fSJaegeuk Kim 		int i, nr_pages;
16544ef51a8fSJaegeuk Kim 		nr_pages = pagevec_lookup_tag(&pvec, NODE_MAPPING(sbi), &index,
1655cfe58f9dSJaegeuk Kim 				PAGECACHE_TAG_WRITEBACK,
16564ef51a8fSJaegeuk Kim 				min(end - index, (pgoff_t)PAGEVEC_SIZE-1) + 1);
16574ef51a8fSJaegeuk Kim 		if (nr_pages == 0)
16584ef51a8fSJaegeuk Kim 			break;
1659cfe58f9dSJaegeuk Kim 
1660cfe58f9dSJaegeuk Kim 		for (i = 0; i < nr_pages; i++) {
1661cfe58f9dSJaegeuk Kim 			struct page *page = pvec.pages[i];
1662cfe58f9dSJaegeuk Kim 
1663cfe58f9dSJaegeuk Kim 			/* until radix tree lookup accepts end_index */
1664cfb271d4SChao Yu 			if (unlikely(page->index > end))
1665cfe58f9dSJaegeuk Kim 				continue;
1666cfe58f9dSJaegeuk Kim 
16674bf08ff6SChao Yu 			if (ino && ino_of_node(page) == ino) {
1668fec1d657SJaegeuk Kim 				f2fs_wait_on_page_writeback(page, NODE, true);
1669cfe58f9dSJaegeuk Kim 				if (TestClearPageError(page))
1670cfe58f9dSJaegeuk Kim 					ret = -EIO;
1671cfe58f9dSJaegeuk Kim 			}
16724bf08ff6SChao Yu 		}
1673cfe58f9dSJaegeuk Kim 		pagevec_release(&pvec);
1674cfe58f9dSJaegeuk Kim 		cond_resched();
1675cfe58f9dSJaegeuk Kim 	}
1676cfe58f9dSJaegeuk Kim 
1677280db3c8SMiklos Szeredi 	ret2 = filemap_check_errors(NODE_MAPPING(sbi));
1678cfe58f9dSJaegeuk Kim 	if (!ret)
1679cfe58f9dSJaegeuk Kim 		ret = ret2;
1680cfe58f9dSJaegeuk Kim 	return ret;
1681cfe58f9dSJaegeuk Kim }
1682cfe58f9dSJaegeuk Kim 
1683e05df3b1SJaegeuk Kim static int f2fs_write_node_pages(struct address_space *mapping,
1684e05df3b1SJaegeuk Kim 			    struct writeback_control *wbc)
1685e05df3b1SJaegeuk Kim {
16864081363fSJaegeuk Kim 	struct f2fs_sb_info *sbi = F2FS_M_SB(mapping);
16879dfa1bafSJaegeuk Kim 	struct blk_plug plug;
168850c8cdb3SJaegeuk Kim 	long diff;
1689e05df3b1SJaegeuk Kim 
16904660f9c0SJaegeuk Kim 	/* balancing f2fs's metadata in background */
16914660f9c0SJaegeuk Kim 	f2fs_balance_fs_bg(sbi);
1692e05df3b1SJaegeuk Kim 
1693a7fdffbdSJaegeuk Kim 	/* collect a number of dirty node pages and write together */
169487d6f890SJaegeuk Kim 	if (get_pages(sbi, F2FS_DIRTY_NODES) < nr_pages_to_skip(sbi, NODE))
1695d3baf95dSJaegeuk Kim 		goto skip_write;
1696a7fdffbdSJaegeuk Kim 
1697d31c7c3fSYunlei He 	trace_f2fs_writepages(mapping->host, wbc, NODE);
1698d31c7c3fSYunlei He 
169950c8cdb3SJaegeuk Kim 	diff = nr_pages_to_write(sbi, NODE, wbc);
1700fb5566daSJaegeuk Kim 	wbc->sync_mode = WB_SYNC_NONE;
17019dfa1bafSJaegeuk Kim 	blk_start_plug(&plug);
170252681375SJaegeuk Kim 	sync_node_pages(sbi, wbc);
17039dfa1bafSJaegeuk Kim 	blk_finish_plug(&plug);
170450c8cdb3SJaegeuk Kim 	wbc->nr_to_write = max((long)0, wbc->nr_to_write - diff);
1705e05df3b1SJaegeuk Kim 	return 0;
1706d3baf95dSJaegeuk Kim 
1707d3baf95dSJaegeuk Kim skip_write:
1708d3baf95dSJaegeuk Kim 	wbc->pages_skipped += get_pages(sbi, F2FS_DIRTY_NODES);
1709d31c7c3fSYunlei He 	trace_f2fs_writepages(mapping->host, wbc, NODE);
1710d3baf95dSJaegeuk Kim 	return 0;
1711e05df3b1SJaegeuk Kim }
1712e05df3b1SJaegeuk Kim 
1713e05df3b1SJaegeuk Kim static int f2fs_set_node_page_dirty(struct page *page)
1714e05df3b1SJaegeuk Kim {
171526c6b887SJaegeuk Kim 	trace_f2fs_set_page_dirty(page, NODE);
171626c6b887SJaegeuk Kim 
1717237c0790SJaegeuk Kim 	if (!PageUptodate(page))
1718e05df3b1SJaegeuk Kim 		SetPageUptodate(page);
1719e05df3b1SJaegeuk Kim 	if (!PageDirty(page)) {
1720fe76b796SJaegeuk Kim 		f2fs_set_page_dirty_nobuffers(page);
17214081363fSJaegeuk Kim 		inc_page_count(F2FS_P_SB(page), F2FS_DIRTY_NODES);
1722e05df3b1SJaegeuk Kim 		SetPagePrivate(page);
17239e4ded3fSJaegeuk Kim 		f2fs_trace_pid(page);
1724e05df3b1SJaegeuk Kim 		return 1;
1725e05df3b1SJaegeuk Kim 	}
1726e05df3b1SJaegeuk Kim 	return 0;
1727e05df3b1SJaegeuk Kim }
1728e05df3b1SJaegeuk Kim 
17290a8165d7SJaegeuk Kim /*
1730e05df3b1SJaegeuk Kim  * Structure of the f2fs node operations
1731e05df3b1SJaegeuk Kim  */
1732e05df3b1SJaegeuk Kim const struct address_space_operations f2fs_node_aops = {
1733e05df3b1SJaegeuk Kim 	.writepage	= f2fs_write_node_page,
1734e05df3b1SJaegeuk Kim 	.writepages	= f2fs_write_node_pages,
1735e05df3b1SJaegeuk Kim 	.set_page_dirty	= f2fs_set_node_page_dirty,
1736487261f3SChao Yu 	.invalidatepage	= f2fs_invalidate_page,
1737487261f3SChao Yu 	.releasepage	= f2fs_release_page,
17385b7a487cSWeichao Guo #ifdef CONFIG_MIGRATION
17395b7a487cSWeichao Guo 	.migratepage    = f2fs_migrate_page,
17405b7a487cSWeichao Guo #endif
1741e05df3b1SJaegeuk Kim };
1742e05df3b1SJaegeuk Kim 
17438a7ed66aSJaegeuk Kim static struct free_nid *__lookup_free_nid_list(struct f2fs_nm_info *nm_i,
17448a7ed66aSJaegeuk Kim 						nid_t n)
1745e05df3b1SJaegeuk Kim {
17468a7ed66aSJaegeuk Kim 	return radix_tree_lookup(&nm_i->free_nid_root, n);
17473aa770a9SNamjae Jeon }
1748e05df3b1SJaegeuk Kim 
1749eb0aa4b8SJaegeuk Kim static int __insert_nid_to_list(struct f2fs_sb_info *sbi,
1750eb0aa4b8SJaegeuk Kim 			struct free_nid *i, enum nid_list list, bool new)
1751e05df3b1SJaegeuk Kim {
1752b8559dc2SChao Yu 	struct f2fs_nm_info *nm_i = NM_I(sbi);
1753b8559dc2SChao Yu 
1754eb0aa4b8SJaegeuk Kim 	if (new) {
1755eb0aa4b8SJaegeuk Kim 		int err = radix_tree_insert(&nm_i->free_nid_root, i->nid, i);
1756eb0aa4b8SJaegeuk Kim 		if (err)
1757eb0aa4b8SJaegeuk Kim 			return err;
1758eb0aa4b8SJaegeuk Kim 	}
1759eb0aa4b8SJaegeuk Kim 
1760b8559dc2SChao Yu 	f2fs_bug_on(sbi, list == FREE_NID_LIST ? i->state != NID_NEW :
1761b8559dc2SChao Yu 						i->state != NID_ALLOC);
1762b8559dc2SChao Yu 	nm_i->nid_cnt[list]++;
1763b8559dc2SChao Yu 	list_add_tail(&i->list, &nm_i->nid_list[list]);
1764eb0aa4b8SJaegeuk Kim 	return 0;
1765b8559dc2SChao Yu }
1766b8559dc2SChao Yu 
1767b8559dc2SChao Yu static void __remove_nid_from_list(struct f2fs_sb_info *sbi,
1768eb0aa4b8SJaegeuk Kim 			struct free_nid *i, enum nid_list list, bool reuse)
1769b8559dc2SChao Yu {
1770b8559dc2SChao Yu 	struct f2fs_nm_info *nm_i = NM_I(sbi);
1771b8559dc2SChao Yu 
1772b8559dc2SChao Yu 	f2fs_bug_on(sbi, list == FREE_NID_LIST ? i->state != NID_NEW :
1773b8559dc2SChao Yu 						i->state != NID_ALLOC);
1774b8559dc2SChao Yu 	nm_i->nid_cnt[list]--;
1775e05df3b1SJaegeuk Kim 	list_del(&i->list);
1776eb0aa4b8SJaegeuk Kim 	if (!reuse)
17778a7ed66aSJaegeuk Kim 		radix_tree_delete(&nm_i->free_nid_root, i->nid);
1778e05df3b1SJaegeuk Kim }
1779e05df3b1SJaegeuk Kim 
17804ac91242SChao Yu /* return if the nid is recognized as free */
17814ac91242SChao Yu static bool add_free_nid(struct f2fs_sb_info *sbi, nid_t nid, bool build)
1782e05df3b1SJaegeuk Kim {
17836fb03f3aSJaegeuk Kim 	struct f2fs_nm_info *nm_i = NM_I(sbi);
178430a61ddfSChao Yu 	struct free_nid *i, *e;
178559bbd474SJaegeuk Kim 	struct nat_entry *ne;
178630a61ddfSChao Yu 	int err = -EINVAL;
178730a61ddfSChao Yu 	bool ret = false;
17889198acebSJaegeuk Kim 
17899198acebSJaegeuk Kim 	/* 0 nid should not be used */
1790cfb271d4SChao Yu 	if (unlikely(nid == 0))
17914ac91242SChao Yu 		return false;
179259bbd474SJaegeuk Kim 
17937bd59381SGu Zheng 	i = f2fs_kmem_cache_alloc(free_nid_slab, GFP_NOFS);
1794e05df3b1SJaegeuk Kim 	i->nid = nid;
1795e05df3b1SJaegeuk Kim 	i->state = NID_NEW;
1796e05df3b1SJaegeuk Kim 
179730a61ddfSChao Yu 	if (radix_tree_preload(GFP_NOFS))
179830a61ddfSChao Yu 		goto err;
1799769ec6e5SJaegeuk Kim 
1800b8559dc2SChao Yu 	spin_lock(&nm_i->nid_list_lock);
180130a61ddfSChao Yu 
180230a61ddfSChao Yu 	if (build) {
180330a61ddfSChao Yu 		/*
180430a61ddfSChao Yu 		 *   Thread A             Thread B
180530a61ddfSChao Yu 		 *  - f2fs_create
180630a61ddfSChao Yu 		 *   - f2fs_new_inode
180730a61ddfSChao Yu 		 *    - alloc_nid
180830a61ddfSChao Yu 		 *     - __insert_nid_to_list(ALLOC_NID_LIST)
180930a61ddfSChao Yu 		 *                     - f2fs_balance_fs_bg
181030a61ddfSChao Yu 		 *                      - build_free_nids
181130a61ddfSChao Yu 		 *                       - __build_free_nids
181230a61ddfSChao Yu 		 *                        - scan_nat_page
181330a61ddfSChao Yu 		 *                         - add_free_nid
181430a61ddfSChao Yu 		 *                          - __lookup_nat_cache
181530a61ddfSChao Yu 		 *  - f2fs_add_link
181630a61ddfSChao Yu 		 *   - init_inode_metadata
181730a61ddfSChao Yu 		 *    - new_inode_page
181830a61ddfSChao Yu 		 *     - new_node_page
181930a61ddfSChao Yu 		 *      - set_node_addr
182030a61ddfSChao Yu 		 *  - alloc_nid_done
182130a61ddfSChao Yu 		 *   - __remove_nid_from_list(ALLOC_NID_LIST)
182230a61ddfSChao Yu 		 *                         - __insert_nid_to_list(FREE_NID_LIST)
182330a61ddfSChao Yu 		 */
182430a61ddfSChao Yu 		ne = __lookup_nat_cache(nm_i, nid);
182530a61ddfSChao Yu 		if (ne && (!get_nat_flag(ne, IS_CHECKPOINTED) ||
182630a61ddfSChao Yu 				nat_get_blkaddr(ne) != NULL_ADDR))
182730a61ddfSChao Yu 			goto err_out;
182830a61ddfSChao Yu 
182930a61ddfSChao Yu 		e = __lookup_free_nid_list(nm_i, nid);
183030a61ddfSChao Yu 		if (e) {
183130a61ddfSChao Yu 			if (e->state == NID_NEW)
183230a61ddfSChao Yu 				ret = true;
183330a61ddfSChao Yu 			goto err_out;
183430a61ddfSChao Yu 		}
183530a61ddfSChao Yu 	}
183630a61ddfSChao Yu 	ret = true;
1837eb0aa4b8SJaegeuk Kim 	err = __insert_nid_to_list(sbi, i, FREE_NID_LIST, true);
183830a61ddfSChao Yu err_out:
1839b8559dc2SChao Yu 	spin_unlock(&nm_i->nid_list_lock);
1840769ec6e5SJaegeuk Kim 	radix_tree_preload_end();
184130a61ddfSChao Yu err:
184230a61ddfSChao Yu 	if (err)
1843e05df3b1SJaegeuk Kim 		kmem_cache_free(free_nid_slab, i);
184430a61ddfSChao Yu 	return ret;
1845e05df3b1SJaegeuk Kim }
1846e05df3b1SJaegeuk Kim 
1847b8559dc2SChao Yu static void remove_free_nid(struct f2fs_sb_info *sbi, nid_t nid)
1848e05df3b1SJaegeuk Kim {
1849b8559dc2SChao Yu 	struct f2fs_nm_info *nm_i = NM_I(sbi);
1850e05df3b1SJaegeuk Kim 	struct free_nid *i;
1851cf0ee0f0SChao Yu 	bool need_free = false;
1852cf0ee0f0SChao Yu 
1853b8559dc2SChao Yu 	spin_lock(&nm_i->nid_list_lock);
18548a7ed66aSJaegeuk Kim 	i = __lookup_free_nid_list(nm_i, nid);
1855e05df3b1SJaegeuk Kim 	if (i && i->state == NID_NEW) {
1856eb0aa4b8SJaegeuk Kim 		__remove_nid_from_list(sbi, i, FREE_NID_LIST, false);
1857cf0ee0f0SChao Yu 		need_free = true;
1858e05df3b1SJaegeuk Kim 	}
1859b8559dc2SChao Yu 	spin_unlock(&nm_i->nid_list_lock);
1860cf0ee0f0SChao Yu 
1861cf0ee0f0SChao Yu 	if (need_free)
1862cf0ee0f0SChao Yu 		kmem_cache_free(free_nid_slab, i);
1863e05df3b1SJaegeuk Kim }
1864e05df3b1SJaegeuk Kim 
18659f7e4a2cSJaegeuk Kim static void update_free_nid_bitmap(struct f2fs_sb_info *sbi, nid_t nid,
1866346fe752SChao Yu 							bool set, bool build)
18674ac91242SChao Yu {
18684ac91242SChao Yu 	struct f2fs_nm_info *nm_i = NM_I(sbi);
18694ac91242SChao Yu 	unsigned int nat_ofs = NAT_BLOCK_OFFSET(nid);
18704ac91242SChao Yu 	unsigned int nid_ofs = nid - START_NID(nid);
18714ac91242SChao Yu 
18724ac91242SChao Yu 	if (!test_bit_le(nat_ofs, nm_i->nat_block_bitmap))
18734ac91242SChao Yu 		return;
18744ac91242SChao Yu 
18754ac91242SChao Yu 	if (set)
187623380b85SJaegeuk Kim 		__set_bit_le(nid_ofs, nm_i->free_nid_bitmap[nat_ofs]);
18774ac91242SChao Yu 	else
187823380b85SJaegeuk Kim 		__clear_bit_le(nid_ofs, nm_i->free_nid_bitmap[nat_ofs]);
1879586d1492SChao Yu 
1880586d1492SChao Yu 	if (set)
1881586d1492SChao Yu 		nm_i->free_nid_count[nat_ofs]++;
1882586d1492SChao Yu 	else if (!build)
1883586d1492SChao Yu 		nm_i->free_nid_count[nat_ofs]--;
18844ac91242SChao Yu }
18854ac91242SChao Yu 
18866fb03f3aSJaegeuk Kim static void scan_nat_page(struct f2fs_sb_info *sbi,
1887e05df3b1SJaegeuk Kim 			struct page *nat_page, nid_t start_nid)
1888e05df3b1SJaegeuk Kim {
18896fb03f3aSJaegeuk Kim 	struct f2fs_nm_info *nm_i = NM_I(sbi);
1890e05df3b1SJaegeuk Kim 	struct f2fs_nat_block *nat_blk = page_address(nat_page);
1891e05df3b1SJaegeuk Kim 	block_t blk_addr;
18924ac91242SChao Yu 	unsigned int nat_ofs = NAT_BLOCK_OFFSET(start_nid);
1893e05df3b1SJaegeuk Kim 	int i;
1894e05df3b1SJaegeuk Kim 
1895586d1492SChao Yu 	if (test_bit_le(nat_ofs, nm_i->nat_block_bitmap))
1896586d1492SChao Yu 		return;
1897586d1492SChao Yu 
189823380b85SJaegeuk Kim 	__set_bit_le(nat_ofs, nm_i->nat_block_bitmap);
18994ac91242SChao Yu 
1900e05df3b1SJaegeuk Kim 	i = start_nid % NAT_ENTRY_PER_BLOCK;
1901e05df3b1SJaegeuk Kim 
1902e05df3b1SJaegeuk Kim 	for (; i < NAT_ENTRY_PER_BLOCK; i++, start_nid++) {
19034ac91242SChao Yu 		bool freed = false;
190423d38844SHaicheng Li 
1905cfb271d4SChao Yu 		if (unlikely(start_nid >= nm_i->max_nid))
190604431c44SJaegeuk Kim 			break;
190723d38844SHaicheng Li 
1908e05df3b1SJaegeuk Kim 		blk_addr = le32_to_cpu(nat_blk->entries[i].block_addr);
19099850cf4aSJaegeuk Kim 		f2fs_bug_on(sbi, blk_addr == NEW_ADDR);
19103a2ad567SChao Yu 		if (blk_addr == NULL_ADDR)
19114ac91242SChao Yu 			freed = add_free_nid(sbi, start_nid, true);
1912346fe752SChao Yu 		spin_lock(&NM_I(sbi)->nid_list_lock);
1913346fe752SChao Yu 		update_free_nid_bitmap(sbi, start_nid, freed, true);
1914346fe752SChao Yu 		spin_unlock(&NM_I(sbi)->nid_list_lock);
1915e05df3b1SJaegeuk Kim 	}
1916e05df3b1SJaegeuk Kim }
1917e05df3b1SJaegeuk Kim 
19184ac91242SChao Yu static void scan_free_nid_bits(struct f2fs_sb_info *sbi)
19194ac91242SChao Yu {
19204ac91242SChao Yu 	struct f2fs_nm_info *nm_i = NM_I(sbi);
19214ac91242SChao Yu 	struct curseg_info *curseg = CURSEG_I(sbi, CURSEG_HOT_DATA);
19224ac91242SChao Yu 	struct f2fs_journal *journal = curseg->journal;
19234ac91242SChao Yu 	unsigned int i, idx;
19244ac91242SChao Yu 
19254ac91242SChao Yu 	down_read(&nm_i->nat_tree_lock);
19264ac91242SChao Yu 
19274ac91242SChao Yu 	for (i = 0; i < nm_i->nat_blocks; i++) {
19284ac91242SChao Yu 		if (!test_bit_le(i, nm_i->nat_block_bitmap))
19294ac91242SChao Yu 			continue;
1930586d1492SChao Yu 		if (!nm_i->free_nid_count[i])
1931586d1492SChao Yu 			continue;
19324ac91242SChao Yu 		for (idx = 0; idx < NAT_ENTRY_PER_BLOCK; idx++) {
19334ac91242SChao Yu 			nid_t nid;
19344ac91242SChao Yu 
19354ac91242SChao Yu 			if (!test_bit_le(idx, nm_i->free_nid_bitmap[i]))
19364ac91242SChao Yu 				continue;
19374ac91242SChao Yu 
19384ac91242SChao Yu 			nid = i * NAT_ENTRY_PER_BLOCK + idx;
19394ac91242SChao Yu 			add_free_nid(sbi, nid, true);
19404ac91242SChao Yu 
1941f0cdbfe6SKinglong Mee 			if (nm_i->nid_cnt[FREE_NID_LIST] >= MAX_FREE_NIDS)
19424ac91242SChao Yu 				goto out;
19434ac91242SChao Yu 		}
19444ac91242SChao Yu 	}
19454ac91242SChao Yu out:
19464ac91242SChao Yu 	down_read(&curseg->journal_rwsem);
19474ac91242SChao Yu 	for (i = 0; i < nats_in_cursum(journal); i++) {
19484ac91242SChao Yu 		block_t addr;
19494ac91242SChao Yu 		nid_t nid;
19504ac91242SChao Yu 
19514ac91242SChao Yu 		addr = le32_to_cpu(nat_in_journal(journal, i).block_addr);
19524ac91242SChao Yu 		nid = le32_to_cpu(nid_in_journal(journal, i));
19534ac91242SChao Yu 		if (addr == NULL_ADDR)
19544ac91242SChao Yu 			add_free_nid(sbi, nid, true);
19554ac91242SChao Yu 		else
19564ac91242SChao Yu 			remove_free_nid(sbi, nid);
19574ac91242SChao Yu 	}
19584ac91242SChao Yu 	up_read(&curseg->journal_rwsem);
19594ac91242SChao Yu 	up_read(&nm_i->nat_tree_lock);
19604ac91242SChao Yu }
19614ac91242SChao Yu 
196222ad0b6aSJaegeuk Kim static void __build_free_nids(struct f2fs_sb_info *sbi, bool sync, bool mount)
1963e05df3b1SJaegeuk Kim {
1964e05df3b1SJaegeuk Kim 	struct f2fs_nm_info *nm_i = NM_I(sbi);
1965e05df3b1SJaegeuk Kim 	struct curseg_info *curseg = CURSEG_I(sbi, CURSEG_HOT_DATA);
1966b7ad7512SChao Yu 	struct f2fs_journal *journal = curseg->journal;
19678760952dSHaicheng Li 	int i = 0;
196855008d84SJaegeuk Kim 	nid_t nid = nm_i->next_scan_nid;
1969e05df3b1SJaegeuk Kim 
1970e9cdd307SYunlei He 	if (unlikely(nid >= nm_i->max_nid))
1971e9cdd307SYunlei He 		nid = 0;
1972e9cdd307SYunlei He 
197355008d84SJaegeuk Kim 	/* Enough entries */
1974b8559dc2SChao Yu 	if (nm_i->nid_cnt[FREE_NID_LIST] >= NAT_ENTRY_PER_BLOCK)
197555008d84SJaegeuk Kim 		return;
1976e05df3b1SJaegeuk Kim 
19773a2ad567SChao Yu 	if (!sync && !available_free_memory(sbi, FREE_NIDS))
1978e05df3b1SJaegeuk Kim 		return;
1979e05df3b1SJaegeuk Kim 
19804ac91242SChao Yu 	if (!mount) {
19814ac91242SChao Yu 		/* try to find free nids in free_nid_bitmap */
19824ac91242SChao Yu 		scan_free_nid_bits(sbi);
19834ac91242SChao Yu 
19844ac91242SChao Yu 		if (nm_i->nid_cnt[FREE_NID_LIST])
198522ad0b6aSJaegeuk Kim 			return;
198622ad0b6aSJaegeuk Kim 	}
198722ad0b6aSJaegeuk Kim 
198855008d84SJaegeuk Kim 	/* readahead nat pages to be scanned */
198926879fb1SChao Yu 	ra_meta_pages(sbi, NAT_BLOCK_OFFSET(nid), FREE_NID_PAGES,
199026879fb1SChao Yu 							META_NAT, true);
1991e05df3b1SJaegeuk Kim 
1992b873b798SJaegeuk Kim 	down_read(&nm_i->nat_tree_lock);
1993a5131193SJaegeuk Kim 
1994e05df3b1SJaegeuk Kim 	while (1) {
1995e05df3b1SJaegeuk Kim 		struct page *page = get_current_nat_page(sbi, nid);
1996e05df3b1SJaegeuk Kim 
19976fb03f3aSJaegeuk Kim 		scan_nat_page(sbi, page, nid);
1998e05df3b1SJaegeuk Kim 		f2fs_put_page(page, 1);
1999e05df3b1SJaegeuk Kim 
2000e05df3b1SJaegeuk Kim 		nid += (NAT_ENTRY_PER_BLOCK - (nid % NAT_ENTRY_PER_BLOCK));
2001cfb271d4SChao Yu 		if (unlikely(nid >= nm_i->max_nid))
2002e05df3b1SJaegeuk Kim 			nid = 0;
200355008d84SJaegeuk Kim 
2004a6d494b6SChao Yu 		if (++i >= FREE_NID_PAGES)
2005e05df3b1SJaegeuk Kim 			break;
2006e05df3b1SJaegeuk Kim 	}
2007e05df3b1SJaegeuk Kim 
200855008d84SJaegeuk Kim 	/* go to the next free nat pages to find free nids abundantly */
200955008d84SJaegeuk Kim 	nm_i->next_scan_nid = nid;
2010e05df3b1SJaegeuk Kim 
2011e05df3b1SJaegeuk Kim 	/* find free nids from current sum_pages */
2012b7ad7512SChao Yu 	down_read(&curseg->journal_rwsem);
2013dfc08a12SChao Yu 	for (i = 0; i < nats_in_cursum(journal); i++) {
2014dfc08a12SChao Yu 		block_t addr;
2015dfc08a12SChao Yu 
2016dfc08a12SChao Yu 		addr = le32_to_cpu(nat_in_journal(journal, i).block_addr);
2017dfc08a12SChao Yu 		nid = le32_to_cpu(nid_in_journal(journal, i));
2018e05df3b1SJaegeuk Kim 		if (addr == NULL_ADDR)
20196fb03f3aSJaegeuk Kim 			add_free_nid(sbi, nid, true);
2020e05df3b1SJaegeuk Kim 		else
2021b8559dc2SChao Yu 			remove_free_nid(sbi, nid);
2022e05df3b1SJaegeuk Kim 	}
2023b7ad7512SChao Yu 	up_read(&curseg->journal_rwsem);
2024b873b798SJaegeuk Kim 	up_read(&nm_i->nat_tree_lock);
20252db2388fSChao Yu 
20262db2388fSChao Yu 	ra_meta_pages(sbi, NAT_BLOCK_OFFSET(nm_i->next_scan_nid),
2027ea1a29a0SChao Yu 					nm_i->ra_nid_pages, META_NAT, false);
2028e05df3b1SJaegeuk Kim }
2029e05df3b1SJaegeuk Kim 
203022ad0b6aSJaegeuk Kim void build_free_nids(struct f2fs_sb_info *sbi, bool sync, bool mount)
20312411cf5bSChao Yu {
20322411cf5bSChao Yu 	mutex_lock(&NM_I(sbi)->build_lock);
203322ad0b6aSJaegeuk Kim 	__build_free_nids(sbi, sync, mount);
20342411cf5bSChao Yu 	mutex_unlock(&NM_I(sbi)->build_lock);
20352411cf5bSChao Yu }
20362411cf5bSChao Yu 
2037e05df3b1SJaegeuk Kim /*
2038e05df3b1SJaegeuk Kim  * If this function returns success, caller can obtain a new nid
2039e05df3b1SJaegeuk Kim  * from second parameter of this function.
2040e05df3b1SJaegeuk Kim  * The returned nid could be used ino as well as nid when inode is created.
2041e05df3b1SJaegeuk Kim  */
2042e05df3b1SJaegeuk Kim bool alloc_nid(struct f2fs_sb_info *sbi, nid_t *nid)
2043e05df3b1SJaegeuk Kim {
2044e05df3b1SJaegeuk Kim 	struct f2fs_nm_info *nm_i = NM_I(sbi);
2045e05df3b1SJaegeuk Kim 	struct free_nid *i = NULL;
2046e05df3b1SJaegeuk Kim retry:
2047cb78942bSJaegeuk Kim #ifdef CONFIG_F2FS_FAULT_INJECTION
204855523519SChao Yu 	if (time_to_inject(sbi, FAULT_ALLOC_NID)) {
204955523519SChao Yu 		f2fs_show_injection_info(FAULT_ALLOC_NID);
2050cb78942bSJaegeuk Kim 		return false;
205155523519SChao Yu 	}
2052cb78942bSJaegeuk Kim #endif
2053b8559dc2SChao Yu 	spin_lock(&nm_i->nid_list_lock);
2054e05df3b1SJaegeuk Kim 
205504d47e67SChao Yu 	if (unlikely(nm_i->available_nids == 0)) {
205604d47e67SChao Yu 		spin_unlock(&nm_i->nid_list_lock);
205704d47e67SChao Yu 		return false;
205804d47e67SChao Yu 	}
2059e05df3b1SJaegeuk Kim 
206055008d84SJaegeuk Kim 	/* We should not use stale free nids created by build_free_nids */
2061b8559dc2SChao Yu 	if (nm_i->nid_cnt[FREE_NID_LIST] && !on_build_free_nids(nm_i)) {
2062b8559dc2SChao Yu 		f2fs_bug_on(sbi, list_empty(&nm_i->nid_list[FREE_NID_LIST]));
2063b8559dc2SChao Yu 		i = list_first_entry(&nm_i->nid_list[FREE_NID_LIST],
2064b8559dc2SChao Yu 					struct free_nid, list);
2065e05df3b1SJaegeuk Kim 		*nid = i->nid;
2066b8559dc2SChao Yu 
2067eb0aa4b8SJaegeuk Kim 		__remove_nid_from_list(sbi, i, FREE_NID_LIST, true);
2068e05df3b1SJaegeuk Kim 		i->state = NID_ALLOC;
2069eb0aa4b8SJaegeuk Kim 		__insert_nid_to_list(sbi, i, ALLOC_NID_LIST, false);
207004d47e67SChao Yu 		nm_i->available_nids--;
20714ac91242SChao Yu 
2072346fe752SChao Yu 		update_free_nid_bitmap(sbi, *nid, false, false);
20734ac91242SChao Yu 
2074b8559dc2SChao Yu 		spin_unlock(&nm_i->nid_list_lock);
2075e05df3b1SJaegeuk Kim 		return true;
2076e05df3b1SJaegeuk Kim 	}
2077b8559dc2SChao Yu 	spin_unlock(&nm_i->nid_list_lock);
207855008d84SJaegeuk Kim 
207955008d84SJaegeuk Kim 	/* Let's scan nat pages and its caches to get free nids */
208022ad0b6aSJaegeuk Kim 	build_free_nids(sbi, true, false);
208155008d84SJaegeuk Kim 	goto retry;
208255008d84SJaegeuk Kim }
2083e05df3b1SJaegeuk Kim 
20840a8165d7SJaegeuk Kim /*
2085e05df3b1SJaegeuk Kim  * alloc_nid() should be called prior to this function.
2086e05df3b1SJaegeuk Kim  */
2087e05df3b1SJaegeuk Kim void alloc_nid_done(struct f2fs_sb_info *sbi, nid_t nid)
2088e05df3b1SJaegeuk Kim {
2089e05df3b1SJaegeuk Kim 	struct f2fs_nm_info *nm_i = NM_I(sbi);
2090e05df3b1SJaegeuk Kim 	struct free_nid *i;
2091e05df3b1SJaegeuk Kim 
2092b8559dc2SChao Yu 	spin_lock(&nm_i->nid_list_lock);
20938a7ed66aSJaegeuk Kim 	i = __lookup_free_nid_list(nm_i, nid);
2094b8559dc2SChao Yu 	f2fs_bug_on(sbi, !i);
2095eb0aa4b8SJaegeuk Kim 	__remove_nid_from_list(sbi, i, ALLOC_NID_LIST, false);
2096b8559dc2SChao Yu 	spin_unlock(&nm_i->nid_list_lock);
2097cf0ee0f0SChao Yu 
2098cf0ee0f0SChao Yu 	kmem_cache_free(free_nid_slab, i);
2099e05df3b1SJaegeuk Kim }
2100e05df3b1SJaegeuk Kim 
21010a8165d7SJaegeuk Kim /*
2102e05df3b1SJaegeuk Kim  * alloc_nid() should be called prior to this function.
2103e05df3b1SJaegeuk Kim  */
2104e05df3b1SJaegeuk Kim void alloc_nid_failed(struct f2fs_sb_info *sbi, nid_t nid)
2105e05df3b1SJaegeuk Kim {
210649952fa1SJaegeuk Kim 	struct f2fs_nm_info *nm_i = NM_I(sbi);
210749952fa1SJaegeuk Kim 	struct free_nid *i;
2108cf0ee0f0SChao Yu 	bool need_free = false;
210949952fa1SJaegeuk Kim 
211065985d93SJaegeuk Kim 	if (!nid)
211165985d93SJaegeuk Kim 		return;
211265985d93SJaegeuk Kim 
2113b8559dc2SChao Yu 	spin_lock(&nm_i->nid_list_lock);
21148a7ed66aSJaegeuk Kim 	i = __lookup_free_nid_list(nm_i, nid);
2115b8559dc2SChao Yu 	f2fs_bug_on(sbi, !i);
2116b8559dc2SChao Yu 
21176fb03f3aSJaegeuk Kim 	if (!available_free_memory(sbi, FREE_NIDS)) {
2118eb0aa4b8SJaegeuk Kim 		__remove_nid_from_list(sbi, i, ALLOC_NID_LIST, false);
2119cf0ee0f0SChao Yu 		need_free = true;
212095630cbaSHaicheng Li 	} else {
2121eb0aa4b8SJaegeuk Kim 		__remove_nid_from_list(sbi, i, ALLOC_NID_LIST, true);
212249952fa1SJaegeuk Kim 		i->state = NID_NEW;
2123eb0aa4b8SJaegeuk Kim 		__insert_nid_to_list(sbi, i, FREE_NID_LIST, false);
212495630cbaSHaicheng Li 	}
212504d47e67SChao Yu 
212604d47e67SChao Yu 	nm_i->available_nids++;
212704d47e67SChao Yu 
2128346fe752SChao Yu 	update_free_nid_bitmap(sbi, nid, true, false);
21294ac91242SChao Yu 
2130b8559dc2SChao Yu 	spin_unlock(&nm_i->nid_list_lock);
2131cf0ee0f0SChao Yu 
2132cf0ee0f0SChao Yu 	if (need_free)
2133cf0ee0f0SChao Yu 		kmem_cache_free(free_nid_slab, i);
2134e05df3b1SJaegeuk Kim }
2135e05df3b1SJaegeuk Kim 
213631696580SChao Yu int try_to_free_nids(struct f2fs_sb_info *sbi, int nr_shrink)
213731696580SChao Yu {
213831696580SChao Yu 	struct f2fs_nm_info *nm_i = NM_I(sbi);
213931696580SChao Yu 	struct free_nid *i, *next;
214031696580SChao Yu 	int nr = nr_shrink;
214131696580SChao Yu 
2142b8559dc2SChao Yu 	if (nm_i->nid_cnt[FREE_NID_LIST] <= MAX_FREE_NIDS)
2143ad4edb83SJaegeuk Kim 		return 0;
2144ad4edb83SJaegeuk Kim 
214531696580SChao Yu 	if (!mutex_trylock(&nm_i->build_lock))
214631696580SChao Yu 		return 0;
214731696580SChao Yu 
2148b8559dc2SChao Yu 	spin_lock(&nm_i->nid_list_lock);
2149b8559dc2SChao Yu 	list_for_each_entry_safe(i, next, &nm_i->nid_list[FREE_NID_LIST],
2150b8559dc2SChao Yu 									list) {
2151b8559dc2SChao Yu 		if (nr_shrink <= 0 ||
2152b8559dc2SChao Yu 				nm_i->nid_cnt[FREE_NID_LIST] <= MAX_FREE_NIDS)
215331696580SChao Yu 			break;
2154b8559dc2SChao Yu 
2155eb0aa4b8SJaegeuk Kim 		__remove_nid_from_list(sbi, i, FREE_NID_LIST, false);
215631696580SChao Yu 		kmem_cache_free(free_nid_slab, i);
215731696580SChao Yu 		nr_shrink--;
215831696580SChao Yu 	}
2159b8559dc2SChao Yu 	spin_unlock(&nm_i->nid_list_lock);
216031696580SChao Yu 	mutex_unlock(&nm_i->build_lock);
216131696580SChao Yu 
216231696580SChao Yu 	return nr - nr_shrink;
216331696580SChao Yu }
216431696580SChao Yu 
216570cfed88SChao Yu void recover_inline_xattr(struct inode *inode, struct page *page)
216628cdce04SChao Yu {
216728cdce04SChao Yu 	void *src_addr, *dst_addr;
216828cdce04SChao Yu 	size_t inline_size;
216928cdce04SChao Yu 	struct page *ipage;
217028cdce04SChao Yu 	struct f2fs_inode *ri;
217128cdce04SChao Yu 
21724081363fSJaegeuk Kim 	ipage = get_node_page(F2FS_I_SB(inode), inode->i_ino);
21739850cf4aSJaegeuk Kim 	f2fs_bug_on(F2FS_I_SB(inode), IS_ERR(ipage));
217428cdce04SChao Yu 
2175e3b4d43fSJaegeuk Kim 	ri = F2FS_INODE(page);
2176e3b4d43fSJaegeuk Kim 	if (!(ri->i_inline & F2FS_INLINE_XATTR)) {
217791942321SJaegeuk Kim 		clear_inode_flag(inode, FI_INLINE_XATTR);
2178e3b4d43fSJaegeuk Kim 		goto update_inode;
2179e3b4d43fSJaegeuk Kim 	}
2180e3b4d43fSJaegeuk Kim 
218128cdce04SChao Yu 	dst_addr = inline_xattr_addr(ipage);
218228cdce04SChao Yu 	src_addr = inline_xattr_addr(page);
218328cdce04SChao Yu 	inline_size = inline_xattr_size(inode);
218428cdce04SChao Yu 
2185fec1d657SJaegeuk Kim 	f2fs_wait_on_page_writeback(ipage, NODE, true);
218628cdce04SChao Yu 	memcpy(dst_addr, src_addr, inline_size);
2187e3b4d43fSJaegeuk Kim update_inode:
218828cdce04SChao Yu 	update_inode(inode, ipage);
218928cdce04SChao Yu 	f2fs_put_page(ipage, 1);
219028cdce04SChao Yu }
219128cdce04SChao Yu 
2192d260081cSChao Yu int recover_xattr_data(struct inode *inode, struct page *page, block_t blkaddr)
2193abb2366cSJaegeuk Kim {
21944081363fSJaegeuk Kim 	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
2195abb2366cSJaegeuk Kim 	nid_t prev_xnid = F2FS_I(inode)->i_xattr_nid;
2196abb2366cSJaegeuk Kim 	nid_t new_xnid = nid_of_node(page);
2197abb2366cSJaegeuk Kim 	struct node_info ni;
2198d260081cSChao Yu 	struct page *xpage;
2199abb2366cSJaegeuk Kim 
2200abb2366cSJaegeuk Kim 	if (!prev_xnid)
2201abb2366cSJaegeuk Kim 		goto recover_xnid;
2202abb2366cSJaegeuk Kim 
2203d260081cSChao Yu 	/* 1: invalidate the previous xattr nid */
2204abb2366cSJaegeuk Kim 	get_node_info(sbi, prev_xnid, &ni);
22059850cf4aSJaegeuk Kim 	f2fs_bug_on(sbi, ni.blk_addr == NULL_ADDR);
2206abb2366cSJaegeuk Kim 	invalidate_blocks(sbi, ni.blk_addr);
2207abb2366cSJaegeuk Kim 	dec_valid_node_count(sbi, inode);
2208479f40c4SJaegeuk Kim 	set_node_addr(sbi, &ni, NULL_ADDR, false);
2209abb2366cSJaegeuk Kim 
2210abb2366cSJaegeuk Kim recover_xnid:
2211d260081cSChao Yu 	/* 2: update xattr nid in inode */
2212d260081cSChao Yu 	remove_free_nid(sbi, new_xnid);
2213d260081cSChao Yu 	f2fs_i_xnid_write(inode, new_xnid);
2214abb2366cSJaegeuk Kim 	if (unlikely(!inc_valid_node_count(sbi, inode)))
22159850cf4aSJaegeuk Kim 		f2fs_bug_on(sbi, 1);
2216d260081cSChao Yu 	update_inode_page(inode);
2217abb2366cSJaegeuk Kim 
2218d260081cSChao Yu 	/* 3: update and set xattr node page dirty */
2219d260081cSChao Yu 	xpage = grab_cache_page(NODE_MAPPING(sbi), new_xnid);
2220d260081cSChao Yu 	if (!xpage)
2221d260081cSChao Yu 		return -ENOMEM;
2222d260081cSChao Yu 
2223d260081cSChao Yu 	memcpy(F2FS_NODE(xpage), F2FS_NODE(page), PAGE_SIZE);
2224d260081cSChao Yu 
2225abb2366cSJaegeuk Kim 	get_node_info(sbi, new_xnid, &ni);
2226abb2366cSJaegeuk Kim 	ni.ino = inode->i_ino;
2227479f40c4SJaegeuk Kim 	set_node_addr(sbi, &ni, NEW_ADDR, false);
2228d260081cSChao Yu 	set_page_dirty(xpage);
2229d260081cSChao Yu 	f2fs_put_page(xpage, 1);
2230abb2366cSJaegeuk Kim 
2231d260081cSChao Yu 	return 0;
2232abb2366cSJaegeuk Kim }
2233abb2366cSJaegeuk Kim 
2234e05df3b1SJaegeuk Kim int recover_inode_page(struct f2fs_sb_info *sbi, struct page *page)
2235e05df3b1SJaegeuk Kim {
223658bfaf44SJaegeuk Kim 	struct f2fs_inode *src, *dst;
2237e05df3b1SJaegeuk Kim 	nid_t ino = ino_of_node(page);
2238e05df3b1SJaegeuk Kim 	struct node_info old_ni, new_ni;
2239e05df3b1SJaegeuk Kim 	struct page *ipage;
2240e05df3b1SJaegeuk Kim 
2241e8271fa3SJaegeuk Kim 	get_node_info(sbi, ino, &old_ni);
2242e8271fa3SJaegeuk Kim 
2243e8271fa3SJaegeuk Kim 	if (unlikely(old_ni.blk_addr != NULL_ADDR))
2244e8271fa3SJaegeuk Kim 		return -EINVAL;
2245e8ea9b3dSJaegeuk Kim retry:
2246300e129cSJaegeuk Kim 	ipage = f2fs_grab_cache_page(NODE_MAPPING(sbi), ino, false);
2247e8ea9b3dSJaegeuk Kim 	if (!ipage) {
2248e8ea9b3dSJaegeuk Kim 		congestion_wait(BLK_RW_ASYNC, HZ/50);
2249e8ea9b3dSJaegeuk Kim 		goto retry;
2250e8ea9b3dSJaegeuk Kim 	}
2251e05df3b1SJaegeuk Kim 
2252e05df3b1SJaegeuk Kim 	/* Should not use this inode from free nid list */
2253b8559dc2SChao Yu 	remove_free_nid(sbi, ino);
2254e05df3b1SJaegeuk Kim 
2255237c0790SJaegeuk Kim 	if (!PageUptodate(ipage))
2256e05df3b1SJaegeuk Kim 		SetPageUptodate(ipage);
2257e05df3b1SJaegeuk Kim 	fill_node_footer(ipage, ino, ino, 0, true);
2258e05df3b1SJaegeuk Kim 
225958bfaf44SJaegeuk Kim 	src = F2FS_INODE(page);
226058bfaf44SJaegeuk Kim 	dst = F2FS_INODE(ipage);
2261e05df3b1SJaegeuk Kim 
226258bfaf44SJaegeuk Kim 	memcpy(dst, src, (unsigned long)&src->i_ext - (unsigned long)src);
226358bfaf44SJaegeuk Kim 	dst->i_size = 0;
226458bfaf44SJaegeuk Kim 	dst->i_blocks = cpu_to_le64(1);
226558bfaf44SJaegeuk Kim 	dst->i_links = cpu_to_le32(1);
226658bfaf44SJaegeuk Kim 	dst->i_xattr_nid = 0;
2267617deb8cSJaegeuk Kim 	dst->i_inline = src->i_inline & F2FS_INLINE_XATTR;
2268e05df3b1SJaegeuk Kim 
2269e05df3b1SJaegeuk Kim 	new_ni = old_ni;
2270e05df3b1SJaegeuk Kim 	new_ni.ino = ino;
2271e05df3b1SJaegeuk Kim 
2272cfb271d4SChao Yu 	if (unlikely(!inc_valid_node_count(sbi, NULL)))
227365e5cd0aSJaegeuk Kim 		WARN_ON(1);
2274479f40c4SJaegeuk Kim 	set_node_addr(sbi, &new_ni, NEW_ADDR, false);
2275e05df3b1SJaegeuk Kim 	inc_valid_inode_count(sbi);
2276617deb8cSJaegeuk Kim 	set_page_dirty(ipage);
2277e05df3b1SJaegeuk Kim 	f2fs_put_page(ipage, 1);
2278e05df3b1SJaegeuk Kim 	return 0;
2279e05df3b1SJaegeuk Kim }
2280e05df3b1SJaegeuk Kim 
2281e05df3b1SJaegeuk Kim int restore_node_summary(struct f2fs_sb_info *sbi,
2282e05df3b1SJaegeuk Kim 			unsigned int segno, struct f2fs_summary_block *sum)
2283e05df3b1SJaegeuk Kim {
2284e05df3b1SJaegeuk Kim 	struct f2fs_node *rn;
2285e05df3b1SJaegeuk Kim 	struct f2fs_summary *sum_entry;
2286e05df3b1SJaegeuk Kim 	block_t addr;
22879ecf4b80SChao Yu 	int i, idx, last_offset, nrpages;
2288e05df3b1SJaegeuk Kim 
2289e05df3b1SJaegeuk Kim 	/* scan the node segment */
2290e05df3b1SJaegeuk Kim 	last_offset = sbi->blocks_per_seg;
2291e05df3b1SJaegeuk Kim 	addr = START_BLOCK(sbi, segno);
2292e05df3b1SJaegeuk Kim 	sum_entry = &sum->entries[0];
2293e05df3b1SJaegeuk Kim 
22949ecf4b80SChao Yu 	for (i = 0; i < last_offset; i += nrpages, addr += nrpages) {
2295664ba972SJaegeuk Kim 		nrpages = min(last_offset - i, BIO_MAX_PAGES);
2296393ff91fSJaegeuk Kim 
22979af0ff1cSChao Yu 		/* readahead node pages */
229826879fb1SChao Yu 		ra_meta_pages(sbi, addr, nrpages, META_POR, true);
22999af0ff1cSChao Yu 
23009ecf4b80SChao Yu 		for (idx = addr; idx < addr + nrpages; idx++) {
23012b947003SChao Yu 			struct page *page = get_tmp_page(sbi, idx);
2302393ff91fSJaegeuk Kim 
23039ecf4b80SChao Yu 			rn = F2FS_NODE(page);
2304393ff91fSJaegeuk Kim 			sum_entry->nid = rn->footer.nid;
2305393ff91fSJaegeuk Kim 			sum_entry->version = 0;
2306393ff91fSJaegeuk Kim 			sum_entry->ofs_in_node = 0;
23079af0ff1cSChao Yu 			sum_entry++;
23089ecf4b80SChao Yu 			f2fs_put_page(page, 1);
23099af0ff1cSChao Yu 		}
2310bac4eef6SChao Yu 
23119ecf4b80SChao Yu 		invalidate_mapping_pages(META_MAPPING(sbi), addr,
2312bac4eef6SChao Yu 							addr + nrpages);
23139af0ff1cSChao Yu 	}
23149ecf4b80SChao Yu 	return 0;
2315e05df3b1SJaegeuk Kim }
2316e05df3b1SJaegeuk Kim 
2317aec71382SChao Yu static void remove_nats_in_journal(struct f2fs_sb_info *sbi)
2318e05df3b1SJaegeuk Kim {
2319e05df3b1SJaegeuk Kim 	struct f2fs_nm_info *nm_i = NM_I(sbi);
2320e05df3b1SJaegeuk Kim 	struct curseg_info *curseg = CURSEG_I(sbi, CURSEG_HOT_DATA);
2321b7ad7512SChao Yu 	struct f2fs_journal *journal = curseg->journal;
2322e05df3b1SJaegeuk Kim 	int i;
2323e05df3b1SJaegeuk Kim 
2324b7ad7512SChao Yu 	down_write(&curseg->journal_rwsem);
2325dfc08a12SChao Yu 	for (i = 0; i < nats_in_cursum(journal); i++) {
2326e05df3b1SJaegeuk Kim 		struct nat_entry *ne;
2327e05df3b1SJaegeuk Kim 		struct f2fs_nat_entry raw_ne;
2328dfc08a12SChao Yu 		nid_t nid = le32_to_cpu(nid_in_journal(journal, i));
2329e05df3b1SJaegeuk Kim 
2330dfc08a12SChao Yu 		raw_ne = nat_in_journal(journal, i);
23319be32d72SJaegeuk Kim 
2332e05df3b1SJaegeuk Kim 		ne = __lookup_nat_cache(nm_i, nid);
2333e05df3b1SJaegeuk Kim 		if (!ne) {
23345c9e4184SChao Yu 			ne = grab_nat_entry(nm_i, nid, true);
233594dac22eSChao Yu 			node_info_from_raw_nat(&ne->ni, &raw_ne);
23369be32d72SJaegeuk Kim 		}
233704d47e67SChao Yu 
233804d47e67SChao Yu 		/*
233904d47e67SChao Yu 		 * if a free nat in journal has not been used after last
234004d47e67SChao Yu 		 * checkpoint, we should remove it from available nids,
234104d47e67SChao Yu 		 * since later we will add it again.
234204d47e67SChao Yu 		 */
234304d47e67SChao Yu 		if (!get_nat_flag(ne, IS_DIRTY) &&
234404d47e67SChao Yu 				le32_to_cpu(raw_ne.block_addr) == NULL_ADDR) {
234504d47e67SChao Yu 			spin_lock(&nm_i->nid_list_lock);
234604d47e67SChao Yu 			nm_i->available_nids--;
234704d47e67SChao Yu 			spin_unlock(&nm_i->nid_list_lock);
234804d47e67SChao Yu 		}
234904d47e67SChao Yu 
2350e05df3b1SJaegeuk Kim 		__set_nat_cache_dirty(nm_i, ne);
2351e05df3b1SJaegeuk Kim 	}
2352dfc08a12SChao Yu 	update_nats_in_cursum(journal, -i);
2353b7ad7512SChao Yu 	up_write(&curseg->journal_rwsem);
2354e05df3b1SJaegeuk Kim }
2355e05df3b1SJaegeuk Kim 
2356309cc2b6SJaegeuk Kim static void __adjust_nat_entry_set(struct nat_entry_set *nes,
2357309cc2b6SJaegeuk Kim 						struct list_head *head, int max)
2358e05df3b1SJaegeuk Kim {
2359309cc2b6SJaegeuk Kim 	struct nat_entry_set *cur;
2360e05df3b1SJaegeuk Kim 
2361309cc2b6SJaegeuk Kim 	if (nes->entry_cnt >= max)
2362309cc2b6SJaegeuk Kim 		goto add_out;
2363e05df3b1SJaegeuk Kim 
2364309cc2b6SJaegeuk Kim 	list_for_each_entry(cur, head, set_list) {
2365309cc2b6SJaegeuk Kim 		if (cur->entry_cnt >= nes->entry_cnt) {
2366309cc2b6SJaegeuk Kim 			list_add(&nes->set_list, cur->set_list.prev);
2367309cc2b6SJaegeuk Kim 			return;
2368309cc2b6SJaegeuk Kim 		}
2369309cc2b6SJaegeuk Kim 	}
2370309cc2b6SJaegeuk Kim add_out:
2371309cc2b6SJaegeuk Kim 	list_add_tail(&nes->set_list, head);
2372aec71382SChao Yu }
2373aec71382SChao Yu 
23749f7e4a2cSJaegeuk Kim static void __update_nat_bits(struct f2fs_sb_info *sbi, nid_t start_nid,
237522ad0b6aSJaegeuk Kim 						struct page *page)
237622ad0b6aSJaegeuk Kim {
237722ad0b6aSJaegeuk Kim 	struct f2fs_nm_info *nm_i = NM_I(sbi);
237822ad0b6aSJaegeuk Kim 	unsigned int nat_index = start_nid / NAT_ENTRY_PER_BLOCK;
237922ad0b6aSJaegeuk Kim 	struct f2fs_nat_block *nat_blk = page_address(page);
238022ad0b6aSJaegeuk Kim 	int valid = 0;
238122ad0b6aSJaegeuk Kim 	int i;
238222ad0b6aSJaegeuk Kim 
238322ad0b6aSJaegeuk Kim 	if (!enabled_nat_bits(sbi, NULL))
238422ad0b6aSJaegeuk Kim 		return;
238522ad0b6aSJaegeuk Kim 
238622ad0b6aSJaegeuk Kim 	for (i = 0; i < NAT_ENTRY_PER_BLOCK; i++) {
238722ad0b6aSJaegeuk Kim 		if (start_nid == 0 && i == 0)
238822ad0b6aSJaegeuk Kim 			valid++;
238922ad0b6aSJaegeuk Kim 		if (nat_blk->entries[i].block_addr)
239022ad0b6aSJaegeuk Kim 			valid++;
239122ad0b6aSJaegeuk Kim 	}
239222ad0b6aSJaegeuk Kim 	if (valid == 0) {
239323380b85SJaegeuk Kim 		__set_bit_le(nat_index, nm_i->empty_nat_bits);
239423380b85SJaegeuk Kim 		__clear_bit_le(nat_index, nm_i->full_nat_bits);
239522ad0b6aSJaegeuk Kim 		return;
239622ad0b6aSJaegeuk Kim 	}
239722ad0b6aSJaegeuk Kim 
239823380b85SJaegeuk Kim 	__clear_bit_le(nat_index, nm_i->empty_nat_bits);
239922ad0b6aSJaegeuk Kim 	if (valid == NAT_ENTRY_PER_BLOCK)
240023380b85SJaegeuk Kim 		__set_bit_le(nat_index, nm_i->full_nat_bits);
240122ad0b6aSJaegeuk Kim 	else
240223380b85SJaegeuk Kim 		__clear_bit_le(nat_index, nm_i->full_nat_bits);
240322ad0b6aSJaegeuk Kim }
240422ad0b6aSJaegeuk Kim 
2405309cc2b6SJaegeuk Kim static void __flush_nat_entry_set(struct f2fs_sb_info *sbi,
240622ad0b6aSJaegeuk Kim 		struct nat_entry_set *set, struct cp_control *cpc)
2407309cc2b6SJaegeuk Kim {
2408309cc2b6SJaegeuk Kim 	struct curseg_info *curseg = CURSEG_I(sbi, CURSEG_HOT_DATA);
2409b7ad7512SChao Yu 	struct f2fs_journal *journal = curseg->journal;
2410309cc2b6SJaegeuk Kim 	nid_t start_nid = set->set * NAT_ENTRY_PER_BLOCK;
2411309cc2b6SJaegeuk Kim 	bool to_journal = true;
2412309cc2b6SJaegeuk Kim 	struct f2fs_nat_block *nat_blk;
2413309cc2b6SJaegeuk Kim 	struct nat_entry *ne, *cur;
2414309cc2b6SJaegeuk Kim 	struct page *page = NULL;
2415aec71382SChao Yu 
2416aec71382SChao Yu 	/*
2417aec71382SChao Yu 	 * there are two steps to flush nat entries:
2418aec71382SChao Yu 	 * #1, flush nat entries to journal in current hot data summary block.
2419aec71382SChao Yu 	 * #2, flush nat entries to nat page.
2420aec71382SChao Yu 	 */
242122ad0b6aSJaegeuk Kim 	if (enabled_nat_bits(sbi, cpc) ||
242222ad0b6aSJaegeuk Kim 		!__has_cursum_space(journal, set->entry_cnt, NAT_JOURNAL))
2423aec71382SChao Yu 		to_journal = false;
2424aec71382SChao Yu 
2425aec71382SChao Yu 	if (to_journal) {
2426b7ad7512SChao Yu 		down_write(&curseg->journal_rwsem);
2427aec71382SChao Yu 	} else {
2428e05df3b1SJaegeuk Kim 		page = get_next_nat_page(sbi, start_nid);
2429e05df3b1SJaegeuk Kim 		nat_blk = page_address(page);
24309850cf4aSJaegeuk Kim 		f2fs_bug_on(sbi, !nat_blk);
2431e05df3b1SJaegeuk Kim 	}
2432e05df3b1SJaegeuk Kim 
2433aec71382SChao Yu 	/* flush dirty nats in nat entry set */
2434309cc2b6SJaegeuk Kim 	list_for_each_entry_safe(ne, cur, &set->entry_list, list) {
2435aec71382SChao Yu 		struct f2fs_nat_entry *raw_ne;
2436aec71382SChao Yu 		nid_t nid = nat_get_nid(ne);
2437aec71382SChao Yu 		int offset;
2438aec71382SChao Yu 
2439febeca6dSChao Yu 		f2fs_bug_on(sbi, nat_get_blkaddr(ne) == NEW_ADDR);
2440309cc2b6SJaegeuk Kim 
2441aec71382SChao Yu 		if (to_journal) {
2442dfc08a12SChao Yu 			offset = lookup_journal_in_cursum(journal,
2443aec71382SChao Yu 							NAT_JOURNAL, nid, 1);
24449850cf4aSJaegeuk Kim 			f2fs_bug_on(sbi, offset < 0);
2445dfc08a12SChao Yu 			raw_ne = &nat_in_journal(journal, offset);
2446dfc08a12SChao Yu 			nid_in_journal(journal, offset) = cpu_to_le32(nid);
2447aec71382SChao Yu 		} else {
2448aec71382SChao Yu 			raw_ne = &nat_blk->entries[nid - start_nid];
2449aec71382SChao Yu 		}
2450aec71382SChao Yu 		raw_nat_from_node_info(raw_ne, &ne->ni);
245188bd02c9SJaegeuk Kim 		nat_reset_flag(ne);
24520b28b71eSKinglong Mee 		__clear_nat_cache_dirty(NM_I(sbi), set, ne);
245304d47e67SChao Yu 		if (nat_get_blkaddr(ne) == NULL_ADDR) {
2454309cc2b6SJaegeuk Kim 			add_free_nid(sbi, nid, false);
245504d47e67SChao Yu 			spin_lock(&NM_I(sbi)->nid_list_lock);
245604d47e67SChao Yu 			NM_I(sbi)->available_nids++;
2457346fe752SChao Yu 			update_free_nid_bitmap(sbi, nid, true, false);
24584ac91242SChao Yu 			spin_unlock(&NM_I(sbi)->nid_list_lock);
24594ac91242SChao Yu 		} else {
24604ac91242SChao Yu 			spin_lock(&NM_I(sbi)->nid_list_lock);
2461346fe752SChao Yu 			update_free_nid_bitmap(sbi, nid, false, false);
246204d47e67SChao Yu 			spin_unlock(&NM_I(sbi)->nid_list_lock);
246304d47e67SChao Yu 		}
2464e05df3b1SJaegeuk Kim 	}
2465aec71382SChao Yu 
246622ad0b6aSJaegeuk Kim 	if (to_journal) {
2467b7ad7512SChao Yu 		up_write(&curseg->journal_rwsem);
246822ad0b6aSJaegeuk Kim 	} else {
246922ad0b6aSJaegeuk Kim 		__update_nat_bits(sbi, start_nid, page);
2470e05df3b1SJaegeuk Kim 		f2fs_put_page(page, 1);
247122ad0b6aSJaegeuk Kim 	}
2472aec71382SChao Yu 
247359c9081bSYunlei He 	/* Allow dirty nats by node block allocation in write_begin */
247459c9081bSYunlei He 	if (!set->entry_cnt) {
2475309cc2b6SJaegeuk Kim 		radix_tree_delete(&NM_I(sbi)->nat_set_root, set->set);
2476309cc2b6SJaegeuk Kim 		kmem_cache_free(nat_entry_set_slab, set);
2477309cc2b6SJaegeuk Kim 	}
247859c9081bSYunlei He }
2479aec71382SChao Yu 
2480309cc2b6SJaegeuk Kim /*
2481309cc2b6SJaegeuk Kim  * This function is called during the checkpointing process.
2482309cc2b6SJaegeuk Kim  */
248322ad0b6aSJaegeuk Kim void flush_nat_entries(struct f2fs_sb_info *sbi, struct cp_control *cpc)
2484309cc2b6SJaegeuk Kim {
2485309cc2b6SJaegeuk Kim 	struct f2fs_nm_info *nm_i = NM_I(sbi);
2486309cc2b6SJaegeuk Kim 	struct curseg_info *curseg = CURSEG_I(sbi, CURSEG_HOT_DATA);
2487b7ad7512SChao Yu 	struct f2fs_journal *journal = curseg->journal;
24887aed0d45SJaegeuk Kim 	struct nat_entry_set *setvec[SETVEC_SIZE];
2489309cc2b6SJaegeuk Kim 	struct nat_entry_set *set, *tmp;
2490309cc2b6SJaegeuk Kim 	unsigned int found;
2491309cc2b6SJaegeuk Kim 	nid_t set_idx = 0;
2492309cc2b6SJaegeuk Kim 	LIST_HEAD(sets);
2493309cc2b6SJaegeuk Kim 
249420d047c8SChangman Lee 	if (!nm_i->dirty_nat_cnt)
249520d047c8SChangman Lee 		return;
2496a5131193SJaegeuk Kim 
2497b873b798SJaegeuk Kim 	down_write(&nm_i->nat_tree_lock);
2498a5131193SJaegeuk Kim 
2499309cc2b6SJaegeuk Kim 	/*
2500309cc2b6SJaegeuk Kim 	 * if there are no enough space in journal to store dirty nat
2501309cc2b6SJaegeuk Kim 	 * entries, remove all entries from journal and merge them
2502309cc2b6SJaegeuk Kim 	 * into nat entry set.
2503309cc2b6SJaegeuk Kim 	 */
2504900f7362SJaegeuk Kim 	if (enabled_nat_bits(sbi, cpc) ||
250522ad0b6aSJaegeuk Kim 		!__has_cursum_space(journal, nm_i->dirty_nat_cnt, NAT_JOURNAL))
2506309cc2b6SJaegeuk Kim 		remove_nats_in_journal(sbi);
2507309cc2b6SJaegeuk Kim 
2508309cc2b6SJaegeuk Kim 	while ((found = __gang_lookup_nat_set(nm_i,
25097aed0d45SJaegeuk Kim 					set_idx, SETVEC_SIZE, setvec))) {
2510309cc2b6SJaegeuk Kim 		unsigned idx;
2511309cc2b6SJaegeuk Kim 		set_idx = setvec[found - 1]->set + 1;
2512309cc2b6SJaegeuk Kim 		for (idx = 0; idx < found; idx++)
2513309cc2b6SJaegeuk Kim 			__adjust_nat_entry_set(setvec[idx], &sets,
2514dfc08a12SChao Yu 						MAX_NAT_JENTRIES(journal));
2515309cc2b6SJaegeuk Kim 	}
2516309cc2b6SJaegeuk Kim 
2517309cc2b6SJaegeuk Kim 	/* flush dirty nats in nat entry set */
2518309cc2b6SJaegeuk Kim 	list_for_each_entry_safe(set, tmp, &sets, set_list)
251922ad0b6aSJaegeuk Kim 		__flush_nat_entry_set(sbi, set, cpc);
2520309cc2b6SJaegeuk Kim 
2521b873b798SJaegeuk Kim 	up_write(&nm_i->nat_tree_lock);
252259c9081bSYunlei He 	/* Allow dirty nats by node block allocation in write_begin */
2523e05df3b1SJaegeuk Kim }
2524e05df3b1SJaegeuk Kim 
252522ad0b6aSJaegeuk Kim static int __get_nat_bitmaps(struct f2fs_sb_info *sbi)
252622ad0b6aSJaegeuk Kim {
252722ad0b6aSJaegeuk Kim 	struct f2fs_checkpoint *ckpt = F2FS_CKPT(sbi);
252822ad0b6aSJaegeuk Kim 	struct f2fs_nm_info *nm_i = NM_I(sbi);
252922ad0b6aSJaegeuk Kim 	unsigned int nat_bits_bytes = nm_i->nat_blocks / BITS_PER_BYTE;
253022ad0b6aSJaegeuk Kim 	unsigned int i;
253122ad0b6aSJaegeuk Kim 	__u64 cp_ver = cur_cp_version(ckpt);
253222ad0b6aSJaegeuk Kim 	block_t nat_bits_addr;
253322ad0b6aSJaegeuk Kim 
253422ad0b6aSJaegeuk Kim 	if (!enabled_nat_bits(sbi, NULL))
253522ad0b6aSJaegeuk Kim 		return 0;
253622ad0b6aSJaegeuk Kim 
253722ad0b6aSJaegeuk Kim 	nm_i->nat_bits_blocks = F2FS_BYTES_TO_BLK((nat_bits_bytes << 1) + 8 +
253822ad0b6aSJaegeuk Kim 						F2FS_BLKSIZE - 1);
253922ad0b6aSJaegeuk Kim 	nm_i->nat_bits = kzalloc(nm_i->nat_bits_blocks << F2FS_BLKSIZE_BITS,
254022ad0b6aSJaegeuk Kim 						GFP_KERNEL);
254122ad0b6aSJaegeuk Kim 	if (!nm_i->nat_bits)
254222ad0b6aSJaegeuk Kim 		return -ENOMEM;
254322ad0b6aSJaegeuk Kim 
254422ad0b6aSJaegeuk Kim 	nat_bits_addr = __start_cp_addr(sbi) + sbi->blocks_per_seg -
254522ad0b6aSJaegeuk Kim 						nm_i->nat_bits_blocks;
254622ad0b6aSJaegeuk Kim 	for (i = 0; i < nm_i->nat_bits_blocks; i++) {
254722ad0b6aSJaegeuk Kim 		struct page *page = get_meta_page(sbi, nat_bits_addr++);
254822ad0b6aSJaegeuk Kim 
254922ad0b6aSJaegeuk Kim 		memcpy(nm_i->nat_bits + (i << F2FS_BLKSIZE_BITS),
255022ad0b6aSJaegeuk Kim 					page_address(page), F2FS_BLKSIZE);
255122ad0b6aSJaegeuk Kim 		f2fs_put_page(page, 1);
255222ad0b6aSJaegeuk Kim 	}
255322ad0b6aSJaegeuk Kim 
2554ced2c7eaSKinglong Mee 	cp_ver |= (cur_cp_crc(ckpt) << 32);
255522ad0b6aSJaegeuk Kim 	if (cpu_to_le64(cp_ver) != *(__le64 *)nm_i->nat_bits) {
255622ad0b6aSJaegeuk Kim 		disable_nat_bits(sbi, true);
255722ad0b6aSJaegeuk Kim 		return 0;
255822ad0b6aSJaegeuk Kim 	}
255922ad0b6aSJaegeuk Kim 
256022ad0b6aSJaegeuk Kim 	nm_i->full_nat_bits = nm_i->nat_bits + 8;
256122ad0b6aSJaegeuk Kim 	nm_i->empty_nat_bits = nm_i->full_nat_bits + nat_bits_bytes;
256222ad0b6aSJaegeuk Kim 
256322ad0b6aSJaegeuk Kim 	f2fs_msg(sbi->sb, KERN_NOTICE, "Found nat_bits in checkpoint");
256422ad0b6aSJaegeuk Kim 	return 0;
256522ad0b6aSJaegeuk Kim }
256622ad0b6aSJaegeuk Kim 
2567bd80a4b9SHou Pengyang static inline void load_free_nid_bitmap(struct f2fs_sb_info *sbi)
25687041d5d2SChao Yu {
25697041d5d2SChao Yu 	struct f2fs_nm_info *nm_i = NM_I(sbi);
25707041d5d2SChao Yu 	unsigned int i = 0;
25717041d5d2SChao Yu 	nid_t nid, last_nid;
25727041d5d2SChao Yu 
25737041d5d2SChao Yu 	if (!enabled_nat_bits(sbi, NULL))
25747041d5d2SChao Yu 		return;
25757041d5d2SChao Yu 
25767041d5d2SChao Yu 	for (i = 0; i < nm_i->nat_blocks; i++) {
25777041d5d2SChao Yu 		i = find_next_bit_le(nm_i->empty_nat_bits, nm_i->nat_blocks, i);
25787041d5d2SChao Yu 		if (i >= nm_i->nat_blocks)
25797041d5d2SChao Yu 			break;
25807041d5d2SChao Yu 
25817041d5d2SChao Yu 		__set_bit_le(i, nm_i->nat_block_bitmap);
25827041d5d2SChao Yu 
25837041d5d2SChao Yu 		nid = i * NAT_ENTRY_PER_BLOCK;
25847041d5d2SChao Yu 		last_nid = (i + 1) * NAT_ENTRY_PER_BLOCK;
25857041d5d2SChao Yu 
2586346fe752SChao Yu 		spin_lock(&NM_I(sbi)->nid_list_lock);
25877041d5d2SChao Yu 		for (; nid < last_nid; nid++)
2588346fe752SChao Yu 			update_free_nid_bitmap(sbi, nid, true, true);
2589346fe752SChao Yu 		spin_unlock(&NM_I(sbi)->nid_list_lock);
25907041d5d2SChao Yu 	}
25917041d5d2SChao Yu 
25927041d5d2SChao Yu 	for (i = 0; i < nm_i->nat_blocks; i++) {
25937041d5d2SChao Yu 		i = find_next_bit_le(nm_i->full_nat_bits, nm_i->nat_blocks, i);
25947041d5d2SChao Yu 		if (i >= nm_i->nat_blocks)
25957041d5d2SChao Yu 			break;
25967041d5d2SChao Yu 
25977041d5d2SChao Yu 		__set_bit_le(i, nm_i->nat_block_bitmap);
25987041d5d2SChao Yu 	}
25997041d5d2SChao Yu }
26007041d5d2SChao Yu 
2601e05df3b1SJaegeuk Kim static int init_node_manager(struct f2fs_sb_info *sbi)
2602e05df3b1SJaegeuk Kim {
2603e05df3b1SJaegeuk Kim 	struct f2fs_super_block *sb_raw = F2FS_RAW_SUPER(sbi);
2604e05df3b1SJaegeuk Kim 	struct f2fs_nm_info *nm_i = NM_I(sbi);
2605e05df3b1SJaegeuk Kim 	unsigned char *version_bitmap;
260622ad0b6aSJaegeuk Kim 	unsigned int nat_segs;
260722ad0b6aSJaegeuk Kim 	int err;
2608e05df3b1SJaegeuk Kim 
2609e05df3b1SJaegeuk Kim 	nm_i->nat_blkaddr = le32_to_cpu(sb_raw->nat_blkaddr);
2610e05df3b1SJaegeuk Kim 
2611e05df3b1SJaegeuk Kim 	/* segment_count_nat includes pair segment so divide to 2. */
2612e05df3b1SJaegeuk Kim 	nat_segs = le32_to_cpu(sb_raw->segment_count_nat) >> 1;
261322ad0b6aSJaegeuk Kim 	nm_i->nat_blocks = nat_segs << le32_to_cpu(sb_raw->log_blocks_per_seg);
261422ad0b6aSJaegeuk Kim 	nm_i->max_nid = NAT_ENTRY_PER_BLOCK * nm_i->nat_blocks;
26157ee0eeabSJaegeuk Kim 
2616b63da15eSJaegeuk Kim 	/* not used nids: 0, node, meta, (and root counted as valid node) */
261704d47e67SChao Yu 	nm_i->available_nids = nm_i->max_nid - sbi->total_valid_node_count -
261804d47e67SChao Yu 							F2FS_RESERVED_NODE_NUM;
2619b8559dc2SChao Yu 	nm_i->nid_cnt[FREE_NID_LIST] = 0;
2620b8559dc2SChao Yu 	nm_i->nid_cnt[ALLOC_NID_LIST] = 0;
2621e05df3b1SJaegeuk Kim 	nm_i->nat_cnt = 0;
2622cdfc41c1SJaegeuk Kim 	nm_i->ram_thresh = DEF_RAM_THRESHOLD;
2623ea1a29a0SChao Yu 	nm_i->ra_nid_pages = DEF_RA_NID_PAGES;
26242304cb0cSChao Yu 	nm_i->dirty_nats_ratio = DEF_DIRTY_NAT_RATIO_THRESHOLD;
2625e05df3b1SJaegeuk Kim 
26268a7ed66aSJaegeuk Kim 	INIT_RADIX_TREE(&nm_i->free_nid_root, GFP_ATOMIC);
2627b8559dc2SChao Yu 	INIT_LIST_HEAD(&nm_i->nid_list[FREE_NID_LIST]);
2628b8559dc2SChao Yu 	INIT_LIST_HEAD(&nm_i->nid_list[ALLOC_NID_LIST]);
2629769ec6e5SJaegeuk Kim 	INIT_RADIX_TREE(&nm_i->nat_root, GFP_NOIO);
2630769ec6e5SJaegeuk Kim 	INIT_RADIX_TREE(&nm_i->nat_set_root, GFP_NOIO);
2631e05df3b1SJaegeuk Kim 	INIT_LIST_HEAD(&nm_i->nat_entries);
2632e05df3b1SJaegeuk Kim 
2633e05df3b1SJaegeuk Kim 	mutex_init(&nm_i->build_lock);
2634b8559dc2SChao Yu 	spin_lock_init(&nm_i->nid_list_lock);
2635b873b798SJaegeuk Kim 	init_rwsem(&nm_i->nat_tree_lock);
2636e05df3b1SJaegeuk Kim 
2637e05df3b1SJaegeuk Kim 	nm_i->next_scan_nid = le32_to_cpu(sbi->ckpt->next_free_nid);
263879b5793bSAlexandru Gheorghiu 	nm_i->bitmap_size = __bitmap_size(sbi, NAT_BITMAP);
2639e05df3b1SJaegeuk Kim 	version_bitmap = __bitmap_ptr(sbi, NAT_BITMAP);
2640e05df3b1SJaegeuk Kim 	if (!version_bitmap)
2641e05df3b1SJaegeuk Kim 		return -EFAULT;
2642e05df3b1SJaegeuk Kim 
264379b5793bSAlexandru Gheorghiu 	nm_i->nat_bitmap = kmemdup(version_bitmap, nm_i->bitmap_size,
264479b5793bSAlexandru Gheorghiu 					GFP_KERNEL);
264579b5793bSAlexandru Gheorghiu 	if (!nm_i->nat_bitmap)
264679b5793bSAlexandru Gheorghiu 		return -ENOMEM;
2647599a09b2SChao Yu 
264822ad0b6aSJaegeuk Kim 	err = __get_nat_bitmaps(sbi);
264922ad0b6aSJaegeuk Kim 	if (err)
265022ad0b6aSJaegeuk Kim 		return err;
265122ad0b6aSJaegeuk Kim 
2652599a09b2SChao Yu #ifdef CONFIG_F2FS_CHECK_FS
2653599a09b2SChao Yu 	nm_i->nat_bitmap_mir = kmemdup(version_bitmap, nm_i->bitmap_size,
2654599a09b2SChao Yu 					GFP_KERNEL);
2655599a09b2SChao Yu 	if (!nm_i->nat_bitmap_mir)
2656599a09b2SChao Yu 		return -ENOMEM;
2657599a09b2SChao Yu #endif
2658599a09b2SChao Yu 
2659e05df3b1SJaegeuk Kim 	return 0;
2660e05df3b1SJaegeuk Kim }
2661e05df3b1SJaegeuk Kim 
26629f7e4a2cSJaegeuk Kim static int init_free_nid_cache(struct f2fs_sb_info *sbi)
26634ac91242SChao Yu {
26644ac91242SChao Yu 	struct f2fs_nm_info *nm_i = NM_I(sbi);
26654ac91242SChao Yu 
26664ac91242SChao Yu 	nm_i->free_nid_bitmap = f2fs_kvzalloc(nm_i->nat_blocks *
26674ac91242SChao Yu 					NAT_ENTRY_BITMAP_SIZE, GFP_KERNEL);
26684ac91242SChao Yu 	if (!nm_i->free_nid_bitmap)
26694ac91242SChao Yu 		return -ENOMEM;
26704ac91242SChao Yu 
26714ac91242SChao Yu 	nm_i->nat_block_bitmap = f2fs_kvzalloc(nm_i->nat_blocks / 8,
26724ac91242SChao Yu 								GFP_KERNEL);
26734ac91242SChao Yu 	if (!nm_i->nat_block_bitmap)
26744ac91242SChao Yu 		return -ENOMEM;
2675586d1492SChao Yu 
2676586d1492SChao Yu 	nm_i->free_nid_count = f2fs_kvzalloc(nm_i->nat_blocks *
2677586d1492SChao Yu 					sizeof(unsigned short), GFP_KERNEL);
2678586d1492SChao Yu 	if (!nm_i->free_nid_count)
2679586d1492SChao Yu 		return -ENOMEM;
26804ac91242SChao Yu 	return 0;
26814ac91242SChao Yu }
26824ac91242SChao Yu 
2683e05df3b1SJaegeuk Kim int build_node_manager(struct f2fs_sb_info *sbi)
2684e05df3b1SJaegeuk Kim {
2685e05df3b1SJaegeuk Kim 	int err;
2686e05df3b1SJaegeuk Kim 
2687e05df3b1SJaegeuk Kim 	sbi->nm_info = kzalloc(sizeof(struct f2fs_nm_info), GFP_KERNEL);
2688e05df3b1SJaegeuk Kim 	if (!sbi->nm_info)
2689e05df3b1SJaegeuk Kim 		return -ENOMEM;
2690e05df3b1SJaegeuk Kim 
2691e05df3b1SJaegeuk Kim 	err = init_node_manager(sbi);
2692e05df3b1SJaegeuk Kim 	if (err)
2693e05df3b1SJaegeuk Kim 		return err;
2694e05df3b1SJaegeuk Kim 
26954ac91242SChao Yu 	err = init_free_nid_cache(sbi);
26964ac91242SChao Yu 	if (err)
26974ac91242SChao Yu 		return err;
26984ac91242SChao Yu 
26997041d5d2SChao Yu 	/* load free nid status from nat_bits table */
27007041d5d2SChao Yu 	load_free_nid_bitmap(sbi);
27017041d5d2SChao Yu 
270222ad0b6aSJaegeuk Kim 	build_free_nids(sbi, true, true);
2703e05df3b1SJaegeuk Kim 	return 0;
2704e05df3b1SJaegeuk Kim }
2705e05df3b1SJaegeuk Kim 
2706e05df3b1SJaegeuk Kim void destroy_node_manager(struct f2fs_sb_info *sbi)
2707e05df3b1SJaegeuk Kim {
2708e05df3b1SJaegeuk Kim 	struct f2fs_nm_info *nm_i = NM_I(sbi);
2709e05df3b1SJaegeuk Kim 	struct free_nid *i, *next_i;
2710e05df3b1SJaegeuk Kim 	struct nat_entry *natvec[NATVEC_SIZE];
27117aed0d45SJaegeuk Kim 	struct nat_entry_set *setvec[SETVEC_SIZE];
2712e05df3b1SJaegeuk Kim 	nid_t nid = 0;
2713e05df3b1SJaegeuk Kim 	unsigned int found;
2714e05df3b1SJaegeuk Kim 
2715e05df3b1SJaegeuk Kim 	if (!nm_i)
2716e05df3b1SJaegeuk Kim 		return;
2717e05df3b1SJaegeuk Kim 
2718e05df3b1SJaegeuk Kim 	/* destroy free nid list */
2719b8559dc2SChao Yu 	spin_lock(&nm_i->nid_list_lock);
2720b8559dc2SChao Yu 	list_for_each_entry_safe(i, next_i, &nm_i->nid_list[FREE_NID_LIST],
2721b8559dc2SChao Yu 									list) {
2722eb0aa4b8SJaegeuk Kim 		__remove_nid_from_list(sbi, i, FREE_NID_LIST, false);
2723b8559dc2SChao Yu 		spin_unlock(&nm_i->nid_list_lock);
2724cf0ee0f0SChao Yu 		kmem_cache_free(free_nid_slab, i);
2725b8559dc2SChao Yu 		spin_lock(&nm_i->nid_list_lock);
2726e05df3b1SJaegeuk Kim 	}
2727b8559dc2SChao Yu 	f2fs_bug_on(sbi, nm_i->nid_cnt[FREE_NID_LIST]);
2728b8559dc2SChao Yu 	f2fs_bug_on(sbi, nm_i->nid_cnt[ALLOC_NID_LIST]);
2729b8559dc2SChao Yu 	f2fs_bug_on(sbi, !list_empty(&nm_i->nid_list[ALLOC_NID_LIST]));
2730b8559dc2SChao Yu 	spin_unlock(&nm_i->nid_list_lock);
2731e05df3b1SJaegeuk Kim 
2732e05df3b1SJaegeuk Kim 	/* destroy nat cache */
2733b873b798SJaegeuk Kim 	down_write(&nm_i->nat_tree_lock);
2734e05df3b1SJaegeuk Kim 	while ((found = __gang_lookup_nat_cache(nm_i,
2735e05df3b1SJaegeuk Kim 					nid, NATVEC_SIZE, natvec))) {
2736e05df3b1SJaegeuk Kim 		unsigned idx;
27377aed0d45SJaegeuk Kim 
2738b6ce391eSGu Zheng 		nid = nat_get_nid(natvec[found - 1]) + 1;
2739b6ce391eSGu Zheng 		for (idx = 0; idx < found; idx++)
2740b6ce391eSGu Zheng 			__del_from_nat_cache(nm_i, natvec[idx]);
2741e05df3b1SJaegeuk Kim 	}
27429850cf4aSJaegeuk Kim 	f2fs_bug_on(sbi, nm_i->nat_cnt);
27437aed0d45SJaegeuk Kim 
27447aed0d45SJaegeuk Kim 	/* destroy nat set cache */
27457aed0d45SJaegeuk Kim 	nid = 0;
27467aed0d45SJaegeuk Kim 	while ((found = __gang_lookup_nat_set(nm_i,
27477aed0d45SJaegeuk Kim 					nid, SETVEC_SIZE, setvec))) {
27487aed0d45SJaegeuk Kim 		unsigned idx;
27497aed0d45SJaegeuk Kim 
27507aed0d45SJaegeuk Kim 		nid = setvec[found - 1]->set + 1;
27517aed0d45SJaegeuk Kim 		for (idx = 0; idx < found; idx++) {
27527aed0d45SJaegeuk Kim 			/* entry_cnt is not zero, when cp_error was occurred */
27537aed0d45SJaegeuk Kim 			f2fs_bug_on(sbi, !list_empty(&setvec[idx]->entry_list));
27547aed0d45SJaegeuk Kim 			radix_tree_delete(&nm_i->nat_set_root, setvec[idx]->set);
27557aed0d45SJaegeuk Kim 			kmem_cache_free(nat_entry_set_slab, setvec[idx]);
27567aed0d45SJaegeuk Kim 		}
27577aed0d45SJaegeuk Kim 	}
2758b873b798SJaegeuk Kim 	up_write(&nm_i->nat_tree_lock);
2759e05df3b1SJaegeuk Kim 
27604ac91242SChao Yu 	kvfree(nm_i->nat_block_bitmap);
27614ac91242SChao Yu 	kvfree(nm_i->free_nid_bitmap);
2762586d1492SChao Yu 	kvfree(nm_i->free_nid_count);
27634ac91242SChao Yu 
2764e05df3b1SJaegeuk Kim 	kfree(nm_i->nat_bitmap);
276522ad0b6aSJaegeuk Kim 	kfree(nm_i->nat_bits);
2766599a09b2SChao Yu #ifdef CONFIG_F2FS_CHECK_FS
2767599a09b2SChao Yu 	kfree(nm_i->nat_bitmap_mir);
2768599a09b2SChao Yu #endif
2769e05df3b1SJaegeuk Kim 	sbi->nm_info = NULL;
2770e05df3b1SJaegeuk Kim 	kfree(nm_i);
2771e05df3b1SJaegeuk Kim }
2772e05df3b1SJaegeuk Kim 
27736e6093a8SNamjae Jeon int __init create_node_manager_caches(void)
2774e05df3b1SJaegeuk Kim {
2775e05df3b1SJaegeuk Kim 	nat_entry_slab = f2fs_kmem_cache_create("nat_entry",
2776e8512d2eSGu Zheng 			sizeof(struct nat_entry));
2777e05df3b1SJaegeuk Kim 	if (!nat_entry_slab)
2778aec71382SChao Yu 		goto fail;
2779e05df3b1SJaegeuk Kim 
2780e05df3b1SJaegeuk Kim 	free_nid_slab = f2fs_kmem_cache_create("free_nid",
2781e8512d2eSGu Zheng 			sizeof(struct free_nid));
2782aec71382SChao Yu 	if (!free_nid_slab)
2783ce3e6d25SMarkus Elfring 		goto destroy_nat_entry;
2784aec71382SChao Yu 
2785aec71382SChao Yu 	nat_entry_set_slab = f2fs_kmem_cache_create("nat_entry_set",
2786aec71382SChao Yu 			sizeof(struct nat_entry_set));
2787aec71382SChao Yu 	if (!nat_entry_set_slab)
2788ce3e6d25SMarkus Elfring 		goto destroy_free_nid;
2789e05df3b1SJaegeuk Kim 	return 0;
2790aec71382SChao Yu 
2791ce3e6d25SMarkus Elfring destroy_free_nid:
2792aec71382SChao Yu 	kmem_cache_destroy(free_nid_slab);
2793ce3e6d25SMarkus Elfring destroy_nat_entry:
2794aec71382SChao Yu 	kmem_cache_destroy(nat_entry_slab);
2795aec71382SChao Yu fail:
2796aec71382SChao Yu 	return -ENOMEM;
2797e05df3b1SJaegeuk Kim }
2798e05df3b1SJaegeuk Kim 
2799e05df3b1SJaegeuk Kim void destroy_node_manager_caches(void)
2800e05df3b1SJaegeuk Kim {
2801aec71382SChao Yu 	kmem_cache_destroy(nat_entry_set_slab);
2802e05df3b1SJaegeuk Kim 	kmem_cache_destroy(free_nid_slab);
2803e05df3b1SJaegeuk Kim 	kmem_cache_destroy(nat_entry_slab);
2804e05df3b1SJaegeuk Kim }
2805