xref: /openbmc/linux/fs/nfsd/filecache.c (revision b3276c1f5b268ff56622e9e125b792b4c3dc03ac)
165294c1fSJeff Layton /*
265294c1fSJeff Layton  * Open file cache.
365294c1fSJeff Layton  *
465294c1fSJeff Layton  * (c) 2015 - Jeff Layton <jeff.layton@primarydata.com>
5*b3276c1fSChuck Lever  *
6*b3276c1fSChuck Lever  * An nfsd_file object is a per-file collection of open state that binds
7*b3276c1fSChuck Lever  * together:
8*b3276c1fSChuck Lever  *   - a struct file *
9*b3276c1fSChuck Lever  *   - a user credential
10*b3276c1fSChuck Lever  *   - a network namespace
11*b3276c1fSChuck Lever  *   - a read-ahead context
12*b3276c1fSChuck Lever  *   - monitoring for writeback errors
13*b3276c1fSChuck Lever  *
14*b3276c1fSChuck Lever  * nfsd_file objects are reference-counted. Consumers acquire a new
15*b3276c1fSChuck Lever  * object via the nfsd_file_acquire API. They manage their interest in
16*b3276c1fSChuck Lever  * the acquired object, and hence the object's reference count, via
17*b3276c1fSChuck Lever  * nfsd_file_get and nfsd_file_put. There are two varieties of nfsd_file
18*b3276c1fSChuck Lever  * object:
19*b3276c1fSChuck Lever  *
20*b3276c1fSChuck Lever  *  * non-garbage-collected: When a consumer wants to precisely control
21*b3276c1fSChuck Lever  *    the lifetime of a file's open state, it acquires a non-garbage-
22*b3276c1fSChuck Lever  *    collected nfsd_file. The final nfsd_file_put releases the open
23*b3276c1fSChuck Lever  *    state immediately.
24*b3276c1fSChuck Lever  *
25*b3276c1fSChuck Lever  *  * garbage-collected: When a consumer does not control the lifetime
26*b3276c1fSChuck Lever  *    of open state, it acquires a garbage-collected nfsd_file. The
27*b3276c1fSChuck Lever  *    final nfsd_file_put allows the open state to linger for a period
28*b3276c1fSChuck Lever  *    during which it may be re-used.
2965294c1fSJeff Layton  */
3065294c1fSJeff Layton 
3165294c1fSJeff Layton #include <linux/hash.h>
3265294c1fSJeff Layton #include <linux/slab.h>
3365294c1fSJeff Layton #include <linux/file.h>
34cbcc268bSMatthew Wilcox (Oracle) #include <linux/pagemap.h>
3565294c1fSJeff Layton #include <linux/sched.h>
3665294c1fSJeff Layton #include <linux/list_lru.h>
3765294c1fSJeff Layton #include <linux/fsnotify_backend.h>
3865294c1fSJeff Layton #include <linux/fsnotify.h>
3965294c1fSJeff Layton #include <linux/seq_file.h>
40fc22945eSChuck Lever #include <linux/rhashtable.h>
4165294c1fSJeff Layton 
4265294c1fSJeff Layton #include "vfs.h"
4365294c1fSJeff Layton #include "nfsd.h"
4465294c1fSJeff Layton #include "nfsfh.h"
455e113224STrond Myklebust #include "netns.h"
4665294c1fSJeff Layton #include "filecache.h"
4765294c1fSJeff Layton #include "trace.h"
4865294c1fSJeff Layton 
/* Delay passed to queue_delayed_work() when scheduling the laundrette */
#define NFSD_LAUNDRETTE_DELAY	(2 * HZ)

/* Bit number within nfsd_file_flags; tested before scheduling the laundrette */
#define NFSD_FILE_CACHE_UP	(0)

/* Only the NFSD_MAY_READ and NFSD_MAY_WRITE bits matter to this cache */
#define NFSD_FILE_MAY_MASK	(NFSD_MAY_READ | NFSD_MAY_WRITE)
5565294c1fSJeff Layton 
5665294c1fSJeff Layton static DEFINE_PER_CPU(unsigned long, nfsd_file_cache_hits);
5729d4bdbbSChuck Lever static DEFINE_PER_CPU(unsigned long, nfsd_file_acquisitions);
58d6329327SChuck Lever static DEFINE_PER_CPU(unsigned long, nfsd_file_releases);
59904940e9SChuck Lever static DEFINE_PER_CPU(unsigned long, nfsd_file_total_age);
60df2aff52SChuck Lever static DEFINE_PER_CPU(unsigned long, nfsd_file_pages_flushed);
6194660cc1SChuck Lever static DEFINE_PER_CPU(unsigned long, nfsd_file_evictions);
6265294c1fSJeff Layton 
639542e6a6STrond Myklebust struct nfsd_fcache_disposal {
649542e6a6STrond Myklebust 	struct work_struct work;
659542e6a6STrond Myklebust 	spinlock_t lock;
669542e6a6STrond Myklebust 	struct list_head freeme;
679542e6a6STrond Myklebust };
689542e6a6STrond Myklebust 
6950d0def9SChen Zhou static struct workqueue_struct *nfsd_filecache_wq __read_mostly;
709542e6a6STrond Myklebust 
7165294c1fSJeff Layton static struct kmem_cache		*nfsd_file_slab;
7265294c1fSJeff Layton static struct kmem_cache		*nfsd_file_mark_slab;
7365294c1fSJeff Layton static struct list_lru			nfsd_file_lru;
74c7b824c3SChuck Lever static unsigned long			nfsd_file_flags;
7565294c1fSJeff Layton static struct fsnotify_group		*nfsd_file_fsnotify_group;
7665294c1fSJeff Layton static struct delayed_work		nfsd_filecache_laundrette;
77fc22945eSChuck Lever static struct rhashtable		nfsd_file_rhash_tbl
78fc22945eSChuck Lever 						____cacheline_aligned_in_smp;
7965294c1fSJeff Layton 
/* Selects how nfsd_file_obj_cmpfn() compares a key against a cache item */
enum nfsd_file_lookup_type {
	NFSD_FILE_KEY_INODE,	/* compare the inode only */
	NFSD_FILE_KEY_FULL,	/* compare inode, access, net, cred, gc, hashed */
};
84fc22945eSChuck Lever 
85fc22945eSChuck Lever struct nfsd_file_lookup_key {
86fc22945eSChuck Lever 	struct inode			*inode;
87fc22945eSChuck Lever 	struct net			*net;
88fc22945eSChuck Lever 	const struct cred		*cred;
89fc22945eSChuck Lever 	unsigned char			need;
904d1ea845SChuck Lever 	bool				gc;
91fc22945eSChuck Lever 	enum nfsd_file_lookup_type	type;
92fc22945eSChuck Lever };
93fc22945eSChuck Lever 
94fc22945eSChuck Lever /*
95fc22945eSChuck Lever  * The returned hash value is based solely on the address of an in-code
96fc22945eSChuck Lever  * inode, a pointer to a slab-allocated object. The entropy in such a
97fc22945eSChuck Lever  * pointer is concentrated in its middle bits.
98fc22945eSChuck Lever  */
99fc22945eSChuck Lever static u32 nfsd_file_inode_hash(const struct inode *inode, u32 seed)
100fc22945eSChuck Lever {
101fc22945eSChuck Lever 	unsigned long ptr = (unsigned long)inode;
102fc22945eSChuck Lever 	u32 k;
103fc22945eSChuck Lever 
104fc22945eSChuck Lever 	k = ptr >> L1_CACHE_SHIFT;
105fc22945eSChuck Lever 	k &= 0x00ffffff;
106fc22945eSChuck Lever 	return jhash2(&k, 1, seed);
107fc22945eSChuck Lever }
108fc22945eSChuck Lever 
109fc22945eSChuck Lever /**
110fc22945eSChuck Lever  * nfsd_file_key_hashfn - Compute the hash value of a lookup key
111fc22945eSChuck Lever  * @data: key on which to compute the hash value
112fc22945eSChuck Lever  * @len: rhash table's key_len parameter (unused)
113fc22945eSChuck Lever  * @seed: rhash table's random seed of the day
114fc22945eSChuck Lever  *
115fc22945eSChuck Lever  * Return value:
116fc22945eSChuck Lever  *   Computed 32-bit hash value
117fc22945eSChuck Lever  */
118fc22945eSChuck Lever static u32 nfsd_file_key_hashfn(const void *data, u32 len, u32 seed)
119fc22945eSChuck Lever {
120fc22945eSChuck Lever 	const struct nfsd_file_lookup_key *key = data;
121fc22945eSChuck Lever 
122fc22945eSChuck Lever 	return nfsd_file_inode_hash(key->inode, seed);
123fc22945eSChuck Lever }
124fc22945eSChuck Lever 
125fc22945eSChuck Lever /**
126fc22945eSChuck Lever  * nfsd_file_obj_hashfn - Compute the hash value of an nfsd_file
127fc22945eSChuck Lever  * @data: object on which to compute the hash value
128fc22945eSChuck Lever  * @len: rhash table's key_len parameter (unused)
129fc22945eSChuck Lever  * @seed: rhash table's random seed of the day
130fc22945eSChuck Lever  *
131fc22945eSChuck Lever  * Return value:
132fc22945eSChuck Lever  *   Computed 32-bit hash value
133fc22945eSChuck Lever  */
134fc22945eSChuck Lever static u32 nfsd_file_obj_hashfn(const void *data, u32 len, u32 seed)
135fc22945eSChuck Lever {
136fc22945eSChuck Lever 	const struct nfsd_file *nf = data;
137fc22945eSChuck Lever 
138fc22945eSChuck Lever 	return nfsd_file_inode_hash(nf->nf_inode, seed);
139fc22945eSChuck Lever }
140fc22945eSChuck Lever 
141fc22945eSChuck Lever static bool
142fc22945eSChuck Lever nfsd_match_cred(const struct cred *c1, const struct cred *c2)
143fc22945eSChuck Lever {
144fc22945eSChuck Lever 	int i;
145fc22945eSChuck Lever 
146fc22945eSChuck Lever 	if (!uid_eq(c1->fsuid, c2->fsuid))
147fc22945eSChuck Lever 		return false;
148fc22945eSChuck Lever 	if (!gid_eq(c1->fsgid, c2->fsgid))
149fc22945eSChuck Lever 		return false;
150fc22945eSChuck Lever 	if (c1->group_info == NULL || c2->group_info == NULL)
151fc22945eSChuck Lever 		return c1->group_info == c2->group_info;
152fc22945eSChuck Lever 	if (c1->group_info->ngroups != c2->group_info->ngroups)
153fc22945eSChuck Lever 		return false;
154fc22945eSChuck Lever 	for (i = 0; i < c1->group_info->ngroups; i++) {
155fc22945eSChuck Lever 		if (!gid_eq(c1->group_info->gid[i], c2->group_info->gid[i]))
156fc22945eSChuck Lever 			return false;
157fc22945eSChuck Lever 	}
158fc22945eSChuck Lever 	return true;
159fc22945eSChuck Lever }
160fc22945eSChuck Lever 
161fc22945eSChuck Lever /**
162fc22945eSChuck Lever  * nfsd_file_obj_cmpfn - Match a cache item against search criteria
163fc22945eSChuck Lever  * @arg: search criteria
164fc22945eSChuck Lever  * @ptr: cache item to check
165fc22945eSChuck Lever  *
166fc22945eSChuck Lever  * Return values:
167fc22945eSChuck Lever  *   %0 - Item matches search criteria
168fc22945eSChuck Lever  *   %1 - Item does not match search criteria
169fc22945eSChuck Lever  */
170fc22945eSChuck Lever static int nfsd_file_obj_cmpfn(struct rhashtable_compare_arg *arg,
171fc22945eSChuck Lever 			       const void *ptr)
172fc22945eSChuck Lever {
173fc22945eSChuck Lever 	const struct nfsd_file_lookup_key *key = arg->key;
174fc22945eSChuck Lever 	const struct nfsd_file *nf = ptr;
175fc22945eSChuck Lever 
176fc22945eSChuck Lever 	switch (key->type) {
177fc22945eSChuck Lever 	case NFSD_FILE_KEY_INODE:
178fc22945eSChuck Lever 		if (nf->nf_inode != key->inode)
179fc22945eSChuck Lever 			return 1;
180fc22945eSChuck Lever 		break;
181fc22945eSChuck Lever 	case NFSD_FILE_KEY_FULL:
182fc22945eSChuck Lever 		if (nf->nf_inode != key->inode)
183fc22945eSChuck Lever 			return 1;
184fc22945eSChuck Lever 		if (nf->nf_may != key->need)
185fc22945eSChuck Lever 			return 1;
186fc22945eSChuck Lever 		if (nf->nf_net != key->net)
187fc22945eSChuck Lever 			return 1;
188fc22945eSChuck Lever 		if (!nfsd_match_cred(nf->nf_cred, key->cred))
189fc22945eSChuck Lever 			return 1;
1904d1ea845SChuck Lever 		if (!!test_bit(NFSD_FILE_GC, &nf->nf_flags) != key->gc)
1914d1ea845SChuck Lever 			return 1;
192fc22945eSChuck Lever 		if (test_bit(NFSD_FILE_HASHED, &nf->nf_flags) == 0)
193fc22945eSChuck Lever 			return 1;
194fc22945eSChuck Lever 		break;
195fc22945eSChuck Lever 	}
196fc22945eSChuck Lever 	return 0;
197fc22945eSChuck Lever }
198fc22945eSChuck Lever 
199fc22945eSChuck Lever static const struct rhashtable_params nfsd_file_rhash_params = {
200fc22945eSChuck Lever 	.key_len		= sizeof_field(struct nfsd_file, nf_inode),
201fc22945eSChuck Lever 	.key_offset		= offsetof(struct nfsd_file, nf_inode),
202fc22945eSChuck Lever 	.head_offset		= offsetof(struct nfsd_file, nf_rhash),
203fc22945eSChuck Lever 	.hashfn			= nfsd_file_key_hashfn,
204fc22945eSChuck Lever 	.obj_hashfn		= nfsd_file_obj_hashfn,
205fc22945eSChuck Lever 	.obj_cmpfn		= nfsd_file_obj_cmpfn,
206fc22945eSChuck Lever 	/* Reduce resizing churn on light workloads */
207fc22945eSChuck Lever 	.min_size		= 512,		/* buckets */
208fc22945eSChuck Lever 	.automatic_shrinking	= true,
209fc22945eSChuck Lever };
21065294c1fSJeff Layton 
21165294c1fSJeff Layton static void
2129542e6a6STrond Myklebust nfsd_file_schedule_laundrette(void)
21365294c1fSJeff Layton {
214ce502f81SChuck Lever 	if ((atomic_read(&nfsd_file_rhash_tbl.nelems) == 0) ||
215c7b824c3SChuck Lever 	    test_bit(NFSD_FILE_CACHE_UP, &nfsd_file_flags) == 0)
21665294c1fSJeff Layton 		return;
21765294c1fSJeff Layton 
2189542e6a6STrond Myklebust 	queue_delayed_work(system_wq, &nfsd_filecache_laundrette,
2199542e6a6STrond Myklebust 			NFSD_LAUNDRETTE_DELAY);
22065294c1fSJeff Layton }
22165294c1fSJeff Layton 
22265294c1fSJeff Layton static void
22365294c1fSJeff Layton nfsd_file_slab_free(struct rcu_head *rcu)
22465294c1fSJeff Layton {
22565294c1fSJeff Layton 	struct nfsd_file *nf = container_of(rcu, struct nfsd_file, nf_rcu);
22665294c1fSJeff Layton 
22765294c1fSJeff Layton 	put_cred(nf->nf_cred);
22865294c1fSJeff Layton 	kmem_cache_free(nfsd_file_slab, nf);
22965294c1fSJeff Layton }
23065294c1fSJeff Layton 
23165294c1fSJeff Layton static void
23265294c1fSJeff Layton nfsd_file_mark_free(struct fsnotify_mark *mark)
23365294c1fSJeff Layton {
23465294c1fSJeff Layton 	struct nfsd_file_mark *nfm = container_of(mark, struct nfsd_file_mark,
23565294c1fSJeff Layton 						  nfm_mark);
23665294c1fSJeff Layton 
23765294c1fSJeff Layton 	kmem_cache_free(nfsd_file_mark_slab, nfm);
23865294c1fSJeff Layton }
23965294c1fSJeff Layton 
24065294c1fSJeff Layton static struct nfsd_file_mark *
24165294c1fSJeff Layton nfsd_file_mark_get(struct nfsd_file_mark *nfm)
24265294c1fSJeff Layton {
243689827cdSTrond Myklebust 	if (!refcount_inc_not_zero(&nfm->nfm_ref))
24465294c1fSJeff Layton 		return NULL;
24565294c1fSJeff Layton 	return nfm;
24665294c1fSJeff Layton }
24765294c1fSJeff Layton 
24865294c1fSJeff Layton static void
24965294c1fSJeff Layton nfsd_file_mark_put(struct nfsd_file_mark *nfm)
25065294c1fSJeff Layton {
251689827cdSTrond Myklebust 	if (refcount_dec_and_test(&nfm->nfm_ref)) {
25265294c1fSJeff Layton 		fsnotify_destroy_mark(&nfm->nfm_mark, nfsd_file_fsnotify_group);
25365294c1fSJeff Layton 		fsnotify_put_mark(&nfm->nfm_mark);
25465294c1fSJeff Layton 	}
25565294c1fSJeff Layton }
25665294c1fSJeff Layton 
25765294c1fSJeff Layton static struct nfsd_file_mark *
258427f5f83SChuck Lever nfsd_file_mark_find_or_create(struct nfsd_file *nf, struct inode *inode)
25965294c1fSJeff Layton {
26065294c1fSJeff Layton 	int			err;
26165294c1fSJeff Layton 	struct fsnotify_mark	*mark;
26265294c1fSJeff Layton 	struct nfsd_file_mark	*nfm = NULL, *new;
26365294c1fSJeff Layton 
26465294c1fSJeff Layton 	do {
265b8962a9dSAmir Goldstein 		fsnotify_group_lock(nfsd_file_fsnotify_group);
26665294c1fSJeff Layton 		mark = fsnotify_find_mark(&inode->i_fsnotify_marks,
26765294c1fSJeff Layton 					  nfsd_file_fsnotify_group);
26865294c1fSJeff Layton 		if (mark) {
26965294c1fSJeff Layton 			nfm = nfsd_file_mark_get(container_of(mark,
27065294c1fSJeff Layton 						 struct nfsd_file_mark,
27165294c1fSJeff Layton 						 nfm_mark));
272b8962a9dSAmir Goldstein 			fsnotify_group_unlock(nfsd_file_fsnotify_group);
27390d2f1daSTrond Myklebust 			if (nfm) {
27465294c1fSJeff Layton 				fsnotify_put_mark(mark);
27565294c1fSJeff Layton 				break;
27690d2f1daSTrond Myklebust 			}
27790d2f1daSTrond Myklebust 			/* Avoid soft lockup race with nfsd_file_mark_put() */
27890d2f1daSTrond Myklebust 			fsnotify_destroy_mark(mark, nfsd_file_fsnotify_group);
27990d2f1daSTrond Myklebust 			fsnotify_put_mark(mark);
280b8962a9dSAmir Goldstein 		} else {
281b8962a9dSAmir Goldstein 			fsnotify_group_unlock(nfsd_file_fsnotify_group);
282b8962a9dSAmir Goldstein 		}
28365294c1fSJeff Layton 
28465294c1fSJeff Layton 		/* allocate a new nfm */
28565294c1fSJeff Layton 		new = kmem_cache_alloc(nfsd_file_mark_slab, GFP_KERNEL);
28665294c1fSJeff Layton 		if (!new)
28765294c1fSJeff Layton 			return NULL;
28865294c1fSJeff Layton 		fsnotify_init_mark(&new->nfm_mark, nfsd_file_fsnotify_group);
28965294c1fSJeff Layton 		new->nfm_mark.mask = FS_ATTRIB|FS_DELETE_SELF;
290689827cdSTrond Myklebust 		refcount_set(&new->nfm_ref, 1);
29165294c1fSJeff Layton 
29265294c1fSJeff Layton 		err = fsnotify_add_inode_mark(&new->nfm_mark, inode, 0);
29365294c1fSJeff Layton 
29465294c1fSJeff Layton 		/*
29565294c1fSJeff Layton 		 * If the add was successful, then return the object.
29665294c1fSJeff Layton 		 * Otherwise, we need to put the reference we hold on the
29765294c1fSJeff Layton 		 * nfm_mark. The fsnotify code will take a reference and put
29865294c1fSJeff Layton 		 * it on failure, so we can't just free it directly. It's also
29965294c1fSJeff Layton 		 * not safe to call fsnotify_destroy_mark on it as the
30065294c1fSJeff Layton 		 * mark->group will be NULL. Thus, we can't let the nfm_ref
30165294c1fSJeff Layton 		 * counter drive the destruction at this point.
30265294c1fSJeff Layton 		 */
30365294c1fSJeff Layton 		if (likely(!err))
30465294c1fSJeff Layton 			nfm = new;
30565294c1fSJeff Layton 		else
30665294c1fSJeff Layton 			fsnotify_put_mark(&new->nfm_mark);
30765294c1fSJeff Layton 	} while (unlikely(err == -EEXIST));
30865294c1fSJeff Layton 
30965294c1fSJeff Layton 	return nfm;
31065294c1fSJeff Layton }
31165294c1fSJeff Layton 
31265294c1fSJeff Layton static struct nfsd_file *
313ce502f81SChuck Lever nfsd_file_alloc(struct nfsd_file_lookup_key *key, unsigned int may)
31465294c1fSJeff Layton {
31565294c1fSJeff Layton 	struct nfsd_file *nf;
31665294c1fSJeff Layton 
31765294c1fSJeff Layton 	nf = kmem_cache_alloc(nfsd_file_slab, GFP_KERNEL);
31865294c1fSJeff Layton 	if (nf) {
31965294c1fSJeff Layton 		INIT_LIST_HEAD(&nf->nf_lru);
320904940e9SChuck Lever 		nf->nf_birthtime = ktime_get();
32165294c1fSJeff Layton 		nf->nf_file = NULL;
32265294c1fSJeff Layton 		nf->nf_cred = get_current_cred();
323ce502f81SChuck Lever 		nf->nf_net = key->net;
32465294c1fSJeff Layton 		nf->nf_flags = 0;
325ce502f81SChuck Lever 		__set_bit(NFSD_FILE_HASHED, &nf->nf_flags);
326ce502f81SChuck Lever 		__set_bit(NFSD_FILE_PENDING, &nf->nf_flags);
3274d1ea845SChuck Lever 		if (key->gc)
3284d1ea845SChuck Lever 			__set_bit(NFSD_FILE_GC, &nf->nf_flags);
329ce502f81SChuck Lever 		nf->nf_inode = key->inode;
330ce502f81SChuck Lever 		/* nf_ref is pre-incremented for hash table */
331ce502f81SChuck Lever 		refcount_set(&nf->nf_ref, 2);
332ce502f81SChuck Lever 		nf->nf_may = key->need;
33365294c1fSJeff Layton 		nf->nf_mark = NULL;
33465294c1fSJeff Layton 	}
33565294c1fSJeff Layton 	return nf;
33665294c1fSJeff Layton }
33765294c1fSJeff Layton 
33865294c1fSJeff Layton static bool
33965294c1fSJeff Layton nfsd_file_free(struct nfsd_file *nf)
34065294c1fSJeff Layton {
341904940e9SChuck Lever 	s64 age = ktime_to_ms(ktime_sub(ktime_get(), nf->nf_birthtime));
34265294c1fSJeff Layton 	bool flush = false;
34365294c1fSJeff Layton 
344d6329327SChuck Lever 	this_cpu_inc(nfsd_file_releases);
345904940e9SChuck Lever 	this_cpu_add(nfsd_file_total_age, age);
346d6329327SChuck Lever 
34765294c1fSJeff Layton 	trace_nfsd_file_put_final(nf);
34865294c1fSJeff Layton 	if (nf->nf_mark)
34965294c1fSJeff Layton 		nfsd_file_mark_put(nf->nf_mark);
35065294c1fSJeff Layton 	if (nf->nf_file) {
35165294c1fSJeff Layton 		get_file(nf->nf_file);
35265294c1fSJeff Layton 		filp_close(nf->nf_file, NULL);
35365294c1fSJeff Layton 		fput(nf->nf_file);
35465294c1fSJeff Layton 		flush = true;
35565294c1fSJeff Layton 	}
356668ed92eSChuck Lever 
357668ed92eSChuck Lever 	/*
358668ed92eSChuck Lever 	 * If this item is still linked via nf_lru, that's a bug.
359668ed92eSChuck Lever 	 * WARN and leak it to preserve system stability.
360668ed92eSChuck Lever 	 */
361668ed92eSChuck Lever 	if (WARN_ON_ONCE(!list_empty(&nf->nf_lru)))
362668ed92eSChuck Lever 		return flush;
363668ed92eSChuck Lever 
36465294c1fSJeff Layton 	call_rcu(&nf->nf_rcu, nfsd_file_slab_free);
36565294c1fSJeff Layton 	return flush;
36665294c1fSJeff Layton }
36765294c1fSJeff Layton 
368055b24a8STrond Myklebust static bool
369055b24a8STrond Myklebust nfsd_file_check_writeback(struct nfsd_file *nf)
370055b24a8STrond Myklebust {
371055b24a8STrond Myklebust 	struct file *file = nf->nf_file;
372055b24a8STrond Myklebust 	struct address_space *mapping;
373055b24a8STrond Myklebust 
374055b24a8STrond Myklebust 	if (!file || !(file->f_mode & FMODE_WRITE))
375055b24a8STrond Myklebust 		return false;
376055b24a8STrond Myklebust 	mapping = file->f_mapping;
377055b24a8STrond Myklebust 	return mapping_tagged(mapping, PAGECACHE_TAG_DIRTY) ||
378055b24a8STrond Myklebust 		mapping_tagged(mapping, PAGECACHE_TAG_WRITEBACK);
379055b24a8STrond Myklebust }
380055b24a8STrond Myklebust 
381055b24a8STrond Myklebust static int
382055b24a8STrond Myklebust nfsd_file_check_write_error(struct nfsd_file *nf)
383055b24a8STrond Myklebust {
384055b24a8STrond Myklebust 	struct file *file = nf->nf_file;
385055b24a8STrond Myklebust 
386055b24a8STrond Myklebust 	if (!file || !(file->f_mode & FMODE_WRITE))
387055b24a8STrond Myklebust 		return 0;
388055b24a8STrond Myklebust 	return filemap_check_wb_err(file->f_mapping, READ_ONCE(file->f_wb_err));
389055b24a8STrond Myklebust }
390055b24a8STrond Myklebust 
39165294c1fSJeff Layton static void
3926b8a9433STrond Myklebust nfsd_file_flush(struct nfsd_file *nf)
3936b8a9433STrond Myklebust {
394df2aff52SChuck Lever 	struct file *file = nf->nf_file;
395df2aff52SChuck Lever 
396df2aff52SChuck Lever 	if (!file || !(file->f_mode & FMODE_WRITE))
397df2aff52SChuck Lever 		return;
398df2aff52SChuck Lever 	this_cpu_add(nfsd_file_pages_flushed, file->f_mapping->nrpages);
399df2aff52SChuck Lever 	if (vfs_fsync(file, 1) != 0)
4006b8a9433STrond Myklebust 		nfsd_reset_write_verifier(net_generic(nf->nf_net, nfsd_net_id));
4016b8a9433STrond Myklebust }
4026b8a9433STrond Myklebust 
403c46203acSChuck Lever static void nfsd_file_lru_add(struct nfsd_file *nf)
40465294c1fSJeff Layton {
4054a0e73e6SChuck Lever 	set_bit(NFSD_FILE_REFERENCED, &nf->nf_flags);
406c46203acSChuck Lever 	if (list_lru_add(&nfsd_file_lru, &nf->nf_lru))
407c46203acSChuck Lever 		trace_nfsd_file_lru_add(nf);
408c46203acSChuck Lever }
40965294c1fSJeff Layton 
410c46203acSChuck Lever static void nfsd_file_lru_remove(struct nfsd_file *nf)
411c46203acSChuck Lever {
412c46203acSChuck Lever 	if (list_lru_del(&nfsd_file_lru, &nf->nf_lru))
413c46203acSChuck Lever 		trace_nfsd_file_lru_del(nf);
414c46203acSChuck Lever }
415c46203acSChuck Lever 
41665294c1fSJeff Layton static void
417ce502f81SChuck Lever nfsd_file_hash_remove(struct nfsd_file *nf)
41865294c1fSJeff Layton {
41965294c1fSJeff Layton 	trace_nfsd_file_unhash(nf);
42065294c1fSJeff Layton 
421055b24a8STrond Myklebust 	if (nfsd_file_check_write_error(nf))
4223988a578SChuck Lever 		nfsd_reset_write_verifier(net_generic(nf->nf_net, nfsd_net_id));
423ce502f81SChuck Lever 	rhashtable_remove_fast(&nfsd_file_rhash_tbl, &nf->nf_rhash,
424ce502f81SChuck Lever 			       nfsd_file_rhash_params);
42565294c1fSJeff Layton }
42665294c1fSJeff Layton 
42765294c1fSJeff Layton static bool
42865294c1fSJeff Layton nfsd_file_unhash(struct nfsd_file *nf)
42965294c1fSJeff Layton {
43065294c1fSJeff Layton 	if (test_and_clear_bit(NFSD_FILE_HASHED, &nf->nf_flags)) {
431ce502f81SChuck Lever 		nfsd_file_hash_remove(nf);
43265294c1fSJeff Layton 		return true;
43365294c1fSJeff Layton 	}
43465294c1fSJeff Layton 	return false;
43565294c1fSJeff Layton }
43665294c1fSJeff Layton 
4378d0d254bSJeff Layton static void
438ce502f81SChuck Lever nfsd_file_unhash_and_dispose(struct nfsd_file *nf, struct list_head *dispose)
43965294c1fSJeff Layton {
440ce502f81SChuck Lever 	trace_nfsd_file_unhash_and_dispose(nf);
4418d0d254bSJeff Layton 	if (nfsd_file_unhash(nf)) {
4428d0d254bSJeff Layton 		/* caller must call nfsd_file_dispose_list() later */
4434a0e73e6SChuck Lever 		nfsd_file_lru_remove(nf);
44465294c1fSJeff Layton 		list_add(&nf->nf_lru, dispose);
4458d0d254bSJeff Layton 	}
44665294c1fSJeff Layton }
44765294c1fSJeff Layton 
448b6669305STrond Myklebust static void
44965294c1fSJeff Layton nfsd_file_put_noref(struct nfsd_file *nf)
45065294c1fSJeff Layton {
45165294c1fSJeff Layton 	trace_nfsd_file_put(nf);
45265294c1fSJeff Layton 
453689827cdSTrond Myklebust 	if (refcount_dec_and_test(&nf->nf_ref)) {
45465294c1fSJeff Layton 		WARN_ON(test_bit(NFSD_FILE_HASHED, &nf->nf_flags));
4554a0e73e6SChuck Lever 		nfsd_file_lru_remove(nf);
45665294c1fSJeff Layton 		nfsd_file_free(nf);
45765294c1fSJeff Layton 	}
45865294c1fSJeff Layton }
45965294c1fSJeff Layton 
/*
 * Unhash @nf; if this call did the unhashing, also drop one reference.
 */
static void
nfsd_file_unhash_and_put(struct nfsd_file *nf)
{
	if (!nfsd_file_unhash(nf))
		return;
	nfsd_file_put_noref(nf);
}
4664d1ea845SChuck Lever 
46765294c1fSJeff Layton void
46865294c1fSJeff Layton nfsd_file_put(struct nfsd_file *nf)
46965294c1fSJeff Layton {
47008af54b3SChuck Lever 	might_sleep();
47108af54b3SChuck Lever 
4724d1ea845SChuck Lever 	if (test_bit(NFSD_FILE_GC, &nf->nf_flags))
4734a0e73e6SChuck Lever 		nfsd_file_lru_add(nf);
4744d1ea845SChuck Lever 	else if (refcount_read(&nf->nf_ref) == 2)
4754d1ea845SChuck Lever 		nfsd_file_unhash_and_put(nf);
4764d1ea845SChuck Lever 
4774d1ea845SChuck Lever 	if (!test_bit(NFSD_FILE_HASHED, &nf->nf_flags)) {
4786b8a9433STrond Myklebust 		nfsd_file_flush(nf);
479b6669305STrond Myklebust 		nfsd_file_put_noref(nf);
4804d1ea845SChuck Lever 	} else if (nf->nf_file && test_bit(NFSD_FILE_GC, &nf->nf_flags)) {
481b6669305STrond Myklebust 		nfsd_file_put_noref(nf);
4829542e6a6STrond Myklebust 		nfsd_file_schedule_laundrette();
483b6c71c66SChuck Lever 	} else
484b6c71c66SChuck Lever 		nfsd_file_put_noref(nf);
48565294c1fSJeff Layton }
48665294c1fSJeff Layton 
48765294c1fSJeff Layton struct nfsd_file *
48865294c1fSJeff Layton nfsd_file_get(struct nfsd_file *nf)
48965294c1fSJeff Layton {
490689827cdSTrond Myklebust 	if (likely(refcount_inc_not_zero(&nf->nf_ref)))
49165294c1fSJeff Layton 		return nf;
49265294c1fSJeff Layton 	return NULL;
49365294c1fSJeff Layton }
49465294c1fSJeff Layton 
49565294c1fSJeff Layton static void
49665294c1fSJeff Layton nfsd_file_dispose_list(struct list_head *dispose)
49765294c1fSJeff Layton {
49865294c1fSJeff Layton 	struct nfsd_file *nf;
49965294c1fSJeff Layton 
50065294c1fSJeff Layton 	while(!list_empty(dispose)) {
50165294c1fSJeff Layton 		nf = list_first_entry(dispose, struct nfsd_file, nf_lru);
502668ed92eSChuck Lever 		list_del_init(&nf->nf_lru);
5036b8a9433STrond Myklebust 		nfsd_file_flush(nf);
50465294c1fSJeff Layton 		nfsd_file_put_noref(nf);
50565294c1fSJeff Layton 	}
50665294c1fSJeff Layton }
50765294c1fSJeff Layton 
50865294c1fSJeff Layton static void
50965294c1fSJeff Layton nfsd_file_dispose_list_sync(struct list_head *dispose)
51065294c1fSJeff Layton {
51165294c1fSJeff Layton 	bool flush = false;
51265294c1fSJeff Layton 	struct nfsd_file *nf;
51365294c1fSJeff Layton 
51465294c1fSJeff Layton 	while(!list_empty(dispose)) {
51565294c1fSJeff Layton 		nf = list_first_entry(dispose, struct nfsd_file, nf_lru);
516668ed92eSChuck Lever 		list_del_init(&nf->nf_lru);
5176b8a9433STrond Myklebust 		nfsd_file_flush(nf);
518689827cdSTrond Myklebust 		if (!refcount_dec_and_test(&nf->nf_ref))
51965294c1fSJeff Layton 			continue;
52065294c1fSJeff Layton 		if (nfsd_file_free(nf))
52165294c1fSJeff Layton 			flush = true;
52265294c1fSJeff Layton 	}
52365294c1fSJeff Layton 	if (flush)
52465294c1fSJeff Layton 		flush_delayed_fput();
52565294c1fSJeff Layton }
52665294c1fSJeff Layton 
5279542e6a6STrond Myklebust static void
5289542e6a6STrond Myklebust nfsd_file_list_remove_disposal(struct list_head *dst,
5299542e6a6STrond Myklebust 		struct nfsd_fcache_disposal *l)
5309542e6a6STrond Myklebust {
5319542e6a6STrond Myklebust 	spin_lock(&l->lock);
5329542e6a6STrond Myklebust 	list_splice_init(&l->freeme, dst);
5339542e6a6STrond Myklebust 	spin_unlock(&l->lock);
5349542e6a6STrond Myklebust }
5359542e6a6STrond Myklebust 
5369542e6a6STrond Myklebust static void
5379542e6a6STrond Myklebust nfsd_file_list_add_disposal(struct list_head *files, struct net *net)
5389542e6a6STrond Myklebust {
5391463b38eSNeilBrown 	struct nfsd_net *nn = net_generic(net, nfsd_net_id);
5401463b38eSNeilBrown 	struct nfsd_fcache_disposal *l = nn->fcache_disposal;
5419542e6a6STrond Myklebust 
5429542e6a6STrond Myklebust 	spin_lock(&l->lock);
5439542e6a6STrond Myklebust 	list_splice_tail_init(files, &l->freeme);
5449542e6a6STrond Myklebust 	spin_unlock(&l->lock);
5459542e6a6STrond Myklebust 	queue_work(nfsd_filecache_wq, &l->work);
5469542e6a6STrond Myklebust }
5479542e6a6STrond Myklebust 
5489542e6a6STrond Myklebust static void
5499542e6a6STrond Myklebust nfsd_file_list_add_pernet(struct list_head *dst, struct list_head *src,
5509542e6a6STrond Myklebust 		struct net *net)
5519542e6a6STrond Myklebust {
5529542e6a6STrond Myklebust 	struct nfsd_file *nf, *tmp;
5539542e6a6STrond Myklebust 
5549542e6a6STrond Myklebust 	list_for_each_entry_safe(nf, tmp, src, nf_lru) {
5559542e6a6STrond Myklebust 		if (nf->nf_net == net)
5569542e6a6STrond Myklebust 			list_move_tail(&nf->nf_lru, dst);
5579542e6a6STrond Myklebust 	}
5589542e6a6STrond Myklebust }
5599542e6a6STrond Myklebust 
5609542e6a6STrond Myklebust static void
5619542e6a6STrond Myklebust nfsd_file_dispose_list_delayed(struct list_head *dispose)
5629542e6a6STrond Myklebust {
5639542e6a6STrond Myklebust 	LIST_HEAD(list);
5649542e6a6STrond Myklebust 	struct nfsd_file *nf;
5659542e6a6STrond Myklebust 
5669542e6a6STrond Myklebust 	while(!list_empty(dispose)) {
5679542e6a6STrond Myklebust 		nf = list_first_entry(dispose, struct nfsd_file, nf_lru);
5689542e6a6STrond Myklebust 		nfsd_file_list_add_pernet(&list, dispose, nf->nf_net);
5699542e6a6STrond Myklebust 		nfsd_file_list_add_disposal(&list, nf->nf_net);
5709542e6a6STrond Myklebust 	}
5719542e6a6STrond Myklebust }
5729542e6a6STrond Myklebust 
5734a0e73e6SChuck Lever /**
5744a0e73e6SChuck Lever  * nfsd_file_lru_cb - Examine an entry on the LRU list
5754a0e73e6SChuck Lever  * @item: LRU entry to examine
5764a0e73e6SChuck Lever  * @lru: controlling LRU
5774a0e73e6SChuck Lever  * @lock: LRU list lock (unused)
5784a0e73e6SChuck Lever  * @arg: dispose list
5794a0e73e6SChuck Lever  *
5804a0e73e6SChuck Lever  * Return values:
5814a0e73e6SChuck Lever  *   %LRU_REMOVED: @item was removed from the LRU
582edead3a5SChuck Lever  *   %LRU_ROTATE: @item is to be moved to the LRU tail
5834a0e73e6SChuck Lever  *   %LRU_SKIP: @item cannot be evicted
58465294c1fSJeff Layton  */
58565294c1fSJeff Layton static enum lru_status
58665294c1fSJeff Layton nfsd_file_lru_cb(struct list_head *item, struct list_lru_one *lru,
58765294c1fSJeff Layton 		 spinlock_t *lock, void *arg)
58865294c1fSJeff Layton 	__releases(lock)
58965294c1fSJeff Layton 	__acquires(lock)
59065294c1fSJeff Layton {
59165294c1fSJeff Layton 	struct list_head *head = arg;
59265294c1fSJeff Layton 	struct nfsd_file *nf = list_entry(item, struct nfsd_file, nf_lru);
59365294c1fSJeff Layton 
59465294c1fSJeff Layton 	/*
59565294c1fSJeff Layton 	 * Do a lockless refcount check. The hashtable holds one reference, so
59665294c1fSJeff Layton 	 * we look to see if anything else has a reference, or if any have
59765294c1fSJeff Layton 	 * been put since the shrinker last ran. Those don't get unhashed and
59865294c1fSJeff Layton 	 * released.
59965294c1fSJeff Layton 	 *
60065294c1fSJeff Layton 	 * Note that in the put path, we set the flag and then decrement the
60165294c1fSJeff Layton 	 * counter. Here we check the counter and then test and clear the flag.
60265294c1fSJeff Layton 	 * That order is deliberate to ensure that we can do this locklessly.
60365294c1fSJeff Layton 	 */
604c46203acSChuck Lever 	if (refcount_read(&nf->nf_ref) > 1) {
6054a0e73e6SChuck Lever 		list_lru_isolate(lru, &nf->nf_lru);
606c46203acSChuck Lever 		trace_nfsd_file_gc_in_use(nf);
6074a0e73e6SChuck Lever 		return LRU_REMOVED;
608c46203acSChuck Lever 	}
609055b24a8STrond Myklebust 
610055b24a8STrond Myklebust 	/*
611055b24a8STrond Myklebust 	 * Don't throw out files that are still undergoing I/O or
612055b24a8STrond Myklebust 	 * that have uncleared errors pending.
613055b24a8STrond Myklebust 	 */
614c46203acSChuck Lever 	if (nfsd_file_check_writeback(nf)) {
615c46203acSChuck Lever 		trace_nfsd_file_gc_writeback(nf);
61665294c1fSJeff Layton 		return LRU_SKIP;
61765294c1fSJeff Layton 	}
61865294c1fSJeff Layton 
619c46203acSChuck Lever 	if (test_and_clear_bit(NFSD_FILE_REFERENCED, &nf->nf_flags)) {
620c46203acSChuck Lever 		trace_nfsd_file_gc_referenced(nf);
621edead3a5SChuck Lever 		return LRU_ROTATE;
62265294c1fSJeff Layton 	}
62365294c1fSJeff Layton 
624c46203acSChuck Lever 	if (!test_and_clear_bit(NFSD_FILE_HASHED, &nf->nf_flags)) {
625c46203acSChuck Lever 		trace_nfsd_file_gc_hashed(nf);
626c46203acSChuck Lever 		return LRU_SKIP;
627c46203acSChuck Lever 	}
62865294c1fSJeff Layton 
62965294c1fSJeff Layton 	list_lru_isolate_move(lru, &nf->nf_lru, head);
63094660cc1SChuck Lever 	this_cpu_inc(nfsd_file_evictions);
631c46203acSChuck Lever 	trace_nfsd_file_gc_disposed(nf);
63265294c1fSJeff Layton 	return LRU_REMOVED;
63365294c1fSJeff Layton }
63465294c1fSJeff Layton 
6350bac5a26SChuck Lever /*
6360bac5a26SChuck Lever  * Unhash items on @dispose immediately, then queue them on the
6370bac5a26SChuck Lever  * disposal workqueue to finish releasing them in the background.
6380bac5a26SChuck Lever  *
6390bac5a26SChuck Lever  * cel: Note that between the time list_lru_shrink_walk runs and
6400bac5a26SChuck Lever  * now, these items are in the hash table but marked unhashed.
6410bac5a26SChuck Lever  * Why release these outside of lru_cb ? There's no lock ordering
6420bac5a26SChuck Lever  * problem since lru_cb currently takes no lock.
6430bac5a26SChuck Lever  */
6440bac5a26SChuck Lever static void nfsd_file_gc_dispose_list(struct list_head *dispose)
6450bac5a26SChuck Lever {
6460bac5a26SChuck Lever 	struct nfsd_file *nf;
6470bac5a26SChuck Lever 
648cb7ec76eSChuck Lever 	list_for_each_entry(nf, dispose, nf_lru)
649cb7ec76eSChuck Lever 		nfsd_file_hash_remove(nf);
6500bac5a26SChuck Lever 	nfsd_file_dispose_list_delayed(dispose);
6519542e6a6STrond Myklebust }
6529542e6a6STrond Myklebust 
6539542e6a6STrond Myklebust static void
6549542e6a6STrond Myklebust nfsd_file_gc(void)
6559542e6a6STrond Myklebust {
6563bc6d347SChuck Lever 	LIST_HEAD(dispose);
65794660cc1SChuck Lever 	unsigned long ret;
6583bc6d347SChuck Lever 
65994660cc1SChuck Lever 	ret = list_lru_walk(&nfsd_file_lru, nfsd_file_lru_cb,
660edead3a5SChuck Lever 			    &dispose, list_lru_count(&nfsd_file_lru));
66194660cc1SChuck Lever 	trace_nfsd_file_gc_removed(ret, list_lru_count(&nfsd_file_lru));
6623bc6d347SChuck Lever 	nfsd_file_gc_dispose_list(&dispose);
6639542e6a6STrond Myklebust }
6649542e6a6STrond Myklebust 
/*
 * Delayed-work handler for the laundrette: perform one GC pass, then
 * ask for the laundrette to be scheduled again. @work is not examined.
 */
static void
nfsd_file_gc_worker(struct work_struct *work)
{
	nfsd_file_gc();

	nfsd_file_schedule_laundrette();
}
67165294c1fSJeff Layton 
67265294c1fSJeff Layton static unsigned long
67365294c1fSJeff Layton nfsd_file_lru_count(struct shrinker *s, struct shrink_control *sc)
67465294c1fSJeff Layton {
67565294c1fSJeff Layton 	return list_lru_count(&nfsd_file_lru);
67665294c1fSJeff Layton }
67765294c1fSJeff Layton 
67865294c1fSJeff Layton static unsigned long
67965294c1fSJeff Layton nfsd_file_lru_scan(struct shrinker *s, struct shrink_control *sc)
68065294c1fSJeff Layton {
68139f1d1ffSChuck Lever 	LIST_HEAD(dispose);
68239f1d1ffSChuck Lever 	unsigned long ret;
68339f1d1ffSChuck Lever 
68439f1d1ffSChuck Lever 	ret = list_lru_shrink_walk(&nfsd_file_lru, sc,
68539f1d1ffSChuck Lever 				   nfsd_file_lru_cb, &dispose);
68694660cc1SChuck Lever 	trace_nfsd_file_shrinker_removed(ret, list_lru_count(&nfsd_file_lru));
68739f1d1ffSChuck Lever 	nfsd_file_gc_dispose_list(&dispose);
68839f1d1ffSChuck Lever 	return ret;
68965294c1fSJeff Layton }
69065294c1fSJeff Layton 
69165294c1fSJeff Layton static struct shrinker	nfsd_file_shrinker = {
69265294c1fSJeff Layton 	.scan_objects = nfsd_file_lru_scan,
69365294c1fSJeff Layton 	.count_objects = nfsd_file_lru_count,
69465294c1fSJeff Layton 	.seeks = 1,
69565294c1fSJeff Layton };
69665294c1fSJeff Layton 
697a8455110SChuck Lever /*
698a8455110SChuck Lever  * Find all cache items across all net namespaces that match @inode and
699a8455110SChuck Lever  * move them to @dispose. The lookup is atomic wrt nfsd_file_acquire().
700a8455110SChuck Lever  */
701a8455110SChuck Lever static unsigned int
702a8455110SChuck Lever __nfsd_file_close_inode(struct inode *inode, struct list_head *dispose)
70365294c1fSJeff Layton {
704ce502f81SChuck Lever 	struct nfsd_file_lookup_key key = {
705ce502f81SChuck Lever 		.type	= NFSD_FILE_KEY_INODE,
706ce502f81SChuck Lever 		.inode	= inode,
707ce502f81SChuck Lever 	};
708a8455110SChuck Lever 	unsigned int count = 0;
70965294c1fSJeff Layton 	struct nfsd_file *nf;
71065294c1fSJeff Layton 
711ce502f81SChuck Lever 	rcu_read_lock();
712ce502f81SChuck Lever 	do {
713ce502f81SChuck Lever 		nf = rhashtable_lookup(&nfsd_file_rhash_tbl, &key,
714ce502f81SChuck Lever 				       nfsd_file_rhash_params);
715ce502f81SChuck Lever 		if (!nf)
716ce502f81SChuck Lever 			break;
717ce502f81SChuck Lever 		nfsd_file_unhash_and_dispose(nf, dispose);
718a8455110SChuck Lever 		count++;
719ce502f81SChuck Lever 	} while (1);
720ce502f81SChuck Lever 	rcu_read_unlock();
721a8455110SChuck Lever 	return count;
72265294c1fSJeff Layton }
72365294c1fSJeff Layton 
72465294c1fSJeff Layton /**
72565294c1fSJeff Layton  * nfsd_file_close_inode_sync - attempt to forcibly close a nfsd_file
72665294c1fSJeff Layton  * @inode: inode of the file to attempt to remove
72765294c1fSJeff Layton  *
728a8455110SChuck Lever  * Unhash and put, then flush and fput all cache items associated with @inode.
72965294c1fSJeff Layton  */
73065294c1fSJeff Layton void
73165294c1fSJeff Layton nfsd_file_close_inode_sync(struct inode *inode)
73265294c1fSJeff Layton {
73365294c1fSJeff Layton 	LIST_HEAD(dispose);
734a8455110SChuck Lever 	unsigned int count;
73565294c1fSJeff Layton 
736a8455110SChuck Lever 	count = __nfsd_file_close_inode(inode, &dispose);
737a8455110SChuck Lever 	trace_nfsd_file_close_inode_sync(inode, count);
73865294c1fSJeff Layton 	nfsd_file_dispose_list_sync(&dispose);
73965294c1fSJeff Layton }
74065294c1fSJeff Layton 
74165294c1fSJeff Layton /**
74219598141STrond Myklebust  * nfsd_file_close_inode - attempt a delayed close of a nfsd_file
74365294c1fSJeff Layton  * @inode: inode of the file to attempt to remove
74465294c1fSJeff Layton  *
745a8455110SChuck Lever  * Unhash and put all cache item associated with @inode.
74665294c1fSJeff Layton  */
74765294c1fSJeff Layton static void
74865294c1fSJeff Layton nfsd_file_close_inode(struct inode *inode)
74965294c1fSJeff Layton {
75065294c1fSJeff Layton 	LIST_HEAD(dispose);
751a8455110SChuck Lever 	unsigned int count;
75265294c1fSJeff Layton 
753a8455110SChuck Lever 	count = __nfsd_file_close_inode(inode, &dispose);
754a8455110SChuck Lever 	trace_nfsd_file_close_inode(inode, count);
7559542e6a6STrond Myklebust 	nfsd_file_dispose_list_delayed(&dispose);
75665294c1fSJeff Layton }
75765294c1fSJeff Layton 
75865294c1fSJeff Layton /**
75965294c1fSJeff Layton  * nfsd_file_delayed_close - close unused nfsd_files
76065294c1fSJeff Layton  * @work: dummy
76165294c1fSJeff Layton  *
76265294c1fSJeff Layton  * Walk the LRU list and close any entries that have not been used since
76365294c1fSJeff Layton  * the last scan.
76465294c1fSJeff Layton  */
76565294c1fSJeff Layton static void
76665294c1fSJeff Layton nfsd_file_delayed_close(struct work_struct *work)
76765294c1fSJeff Layton {
76865294c1fSJeff Layton 	LIST_HEAD(head);
7699542e6a6STrond Myklebust 	struct nfsd_fcache_disposal *l = container_of(work,
7709542e6a6STrond Myklebust 			struct nfsd_fcache_disposal, work);
77165294c1fSJeff Layton 
7729542e6a6STrond Myklebust 	nfsd_file_list_remove_disposal(&head, l);
7739542e6a6STrond Myklebust 	nfsd_file_dispose_list(&head);
77465294c1fSJeff Layton }
77565294c1fSJeff Layton 
77665294c1fSJeff Layton static int
77765294c1fSJeff Layton nfsd_file_lease_notifier_call(struct notifier_block *nb, unsigned long arg,
77865294c1fSJeff Layton 			    void *data)
77965294c1fSJeff Layton {
78065294c1fSJeff Layton 	struct file_lock *fl = data;
78165294c1fSJeff Layton 
78265294c1fSJeff Layton 	/* Only close files for F_SETLEASE leases */
78365294c1fSJeff Layton 	if (fl->fl_flags & FL_LEASE)
78465294c1fSJeff Layton 		nfsd_file_close_inode_sync(file_inode(fl->fl_file));
78565294c1fSJeff Layton 	return 0;
78665294c1fSJeff Layton }
78765294c1fSJeff Layton 
78865294c1fSJeff Layton static struct notifier_block nfsd_file_lease_notifier = {
78965294c1fSJeff Layton 	.notifier_call = nfsd_file_lease_notifier_call,
79065294c1fSJeff Layton };
79165294c1fSJeff Layton 
79265294c1fSJeff Layton static int
793b9a1b977SAmir Goldstein nfsd_file_fsnotify_handle_event(struct fsnotify_mark *mark, u32 mask,
794b9a1b977SAmir Goldstein 				struct inode *inode, struct inode *dir,
795950cc0d2SAmir Goldstein 				const struct qstr *name, u32 cookie)
79665294c1fSJeff Layton {
79724dca905SGabriel Krisman Bertazi 	if (WARN_ON_ONCE(!inode))
79824dca905SGabriel Krisman Bertazi 		return 0;
79924dca905SGabriel Krisman Bertazi 
80065294c1fSJeff Layton 	trace_nfsd_file_fsnotify_handle_event(inode, mask);
80165294c1fSJeff Layton 
80265294c1fSJeff Layton 	/* Should be no marks on non-regular files */
80365294c1fSJeff Layton 	if (!S_ISREG(inode->i_mode)) {
80465294c1fSJeff Layton 		WARN_ON_ONCE(1);
80565294c1fSJeff Layton 		return 0;
80665294c1fSJeff Layton 	}
80765294c1fSJeff Layton 
80865294c1fSJeff Layton 	/* don't close files if this was not the last link */
80965294c1fSJeff Layton 	if (mask & FS_ATTRIB) {
81065294c1fSJeff Layton 		if (inode->i_nlink)
81165294c1fSJeff Layton 			return 0;
81265294c1fSJeff Layton 	}
81365294c1fSJeff Layton 
81465294c1fSJeff Layton 	nfsd_file_close_inode(inode);
81565294c1fSJeff Layton 	return 0;
81665294c1fSJeff Layton }
81765294c1fSJeff Layton 
81865294c1fSJeff Layton 
81965294c1fSJeff Layton static const struct fsnotify_ops nfsd_file_fsnotify_ops = {
820b9a1b977SAmir Goldstein 	.handle_inode_event = nfsd_file_fsnotify_handle_event,
82165294c1fSJeff Layton 	.free_mark = nfsd_file_mark_free,
82265294c1fSJeff Layton };
82365294c1fSJeff Layton 
82465294c1fSJeff Layton int
82565294c1fSJeff Layton nfsd_file_cache_init(void)
82665294c1fSJeff Layton {
827fc22945eSChuck Lever 	int ret;
82865294c1fSJeff Layton 
829c7b824c3SChuck Lever 	lockdep_assert_held(&nfsd_mutex);
830c7b824c3SChuck Lever 	if (test_and_set_bit(NFSD_FILE_CACHE_UP, &nfsd_file_flags) == 1)
83165294c1fSJeff Layton 		return 0;
83265294c1fSJeff Layton 
833fc22945eSChuck Lever 	ret = rhashtable_init(&nfsd_file_rhash_tbl, &nfsd_file_rhash_params);
834fc22945eSChuck Lever 	if (ret)
835fc22945eSChuck Lever 		return ret;
836fc22945eSChuck Lever 
837fc22945eSChuck Lever 	ret = -ENOMEM;
8389542e6a6STrond Myklebust 	nfsd_filecache_wq = alloc_workqueue("nfsd_filecache", 0, 0);
8399542e6a6STrond Myklebust 	if (!nfsd_filecache_wq)
8409542e6a6STrond Myklebust 		goto out;
8419542e6a6STrond Myklebust 
84265294c1fSJeff Layton 	nfsd_file_slab = kmem_cache_create("nfsd_file",
84365294c1fSJeff Layton 				sizeof(struct nfsd_file), 0, 0, NULL);
84465294c1fSJeff Layton 	if (!nfsd_file_slab) {
84565294c1fSJeff Layton 		pr_err("nfsd: unable to create nfsd_file_slab\n");
84665294c1fSJeff Layton 		goto out_err;
84765294c1fSJeff Layton 	}
84865294c1fSJeff Layton 
84965294c1fSJeff Layton 	nfsd_file_mark_slab = kmem_cache_create("nfsd_file_mark",
85065294c1fSJeff Layton 					sizeof(struct nfsd_file_mark), 0, 0, NULL);
85165294c1fSJeff Layton 	if (!nfsd_file_mark_slab) {
85265294c1fSJeff Layton 		pr_err("nfsd: unable to create nfsd_file_mark_slab\n");
85365294c1fSJeff Layton 		goto out_err;
85465294c1fSJeff Layton 	}
85565294c1fSJeff Layton 
85665294c1fSJeff Layton 
85765294c1fSJeff Layton 	ret = list_lru_init(&nfsd_file_lru);
85865294c1fSJeff Layton 	if (ret) {
85965294c1fSJeff Layton 		pr_err("nfsd: failed to init nfsd_file_lru: %d\n", ret);
86065294c1fSJeff Layton 		goto out_err;
86165294c1fSJeff Layton 	}
86265294c1fSJeff Layton 
863e33c267aSRoman Gushchin 	ret = register_shrinker(&nfsd_file_shrinker, "nfsd-filecache");
86465294c1fSJeff Layton 	if (ret) {
86565294c1fSJeff Layton 		pr_err("nfsd: failed to register nfsd_file_shrinker: %d\n", ret);
86665294c1fSJeff Layton 		goto out_lru;
86765294c1fSJeff Layton 	}
86865294c1fSJeff Layton 
86965294c1fSJeff Layton 	ret = lease_register_notifier(&nfsd_file_lease_notifier);
87065294c1fSJeff Layton 	if (ret) {
87165294c1fSJeff Layton 		pr_err("nfsd: unable to register lease notifier: %d\n", ret);
87265294c1fSJeff Layton 		goto out_shrinker;
87365294c1fSJeff Layton 	}
87465294c1fSJeff Layton 
875867a448dSAmir Goldstein 	nfsd_file_fsnotify_group = fsnotify_alloc_group(&nfsd_file_fsnotify_ops,
876b8962a9dSAmir Goldstein 							FSNOTIFY_GROUP_NOFS);
87765294c1fSJeff Layton 	if (IS_ERR(nfsd_file_fsnotify_group)) {
87865294c1fSJeff Layton 		pr_err("nfsd: unable to create fsnotify group: %ld\n",
87965294c1fSJeff Layton 			PTR_ERR(nfsd_file_fsnotify_group));
880231307dfSHuang Guobin 		ret = PTR_ERR(nfsd_file_fsnotify_group);
88165294c1fSJeff Layton 		nfsd_file_fsnotify_group = NULL;
88265294c1fSJeff Layton 		goto out_notifier;
88365294c1fSJeff Layton 	}
88465294c1fSJeff Layton 
8859542e6a6STrond Myklebust 	INIT_DELAYED_WORK(&nfsd_filecache_laundrette, nfsd_file_gc_worker);
88665294c1fSJeff Layton out:
88765294c1fSJeff Layton 	return ret;
88865294c1fSJeff Layton out_notifier:
88965294c1fSJeff Layton 	lease_unregister_notifier(&nfsd_file_lease_notifier);
89065294c1fSJeff Layton out_shrinker:
89165294c1fSJeff Layton 	unregister_shrinker(&nfsd_file_shrinker);
89265294c1fSJeff Layton out_lru:
89365294c1fSJeff Layton 	list_lru_destroy(&nfsd_file_lru);
89465294c1fSJeff Layton out_err:
89565294c1fSJeff Layton 	kmem_cache_destroy(nfsd_file_slab);
89665294c1fSJeff Layton 	nfsd_file_slab = NULL;
89765294c1fSJeff Layton 	kmem_cache_destroy(nfsd_file_mark_slab);
89865294c1fSJeff Layton 	nfsd_file_mark_slab = NULL;
8999542e6a6STrond Myklebust 	destroy_workqueue(nfsd_filecache_wq);
9009542e6a6STrond Myklebust 	nfsd_filecache_wq = NULL;
901fc22945eSChuck Lever 	rhashtable_destroy(&nfsd_file_rhash_tbl);
90265294c1fSJeff Layton 	goto out;
90365294c1fSJeff Layton }
90465294c1fSJeff Layton 
905c7b824c3SChuck Lever static void
906c7b824c3SChuck Lever __nfsd_file_cache_purge(struct net *net)
90765294c1fSJeff Layton {
908ce502f81SChuck Lever 	struct rhashtable_iter iter;
90965294c1fSJeff Layton 	struct nfsd_file *nf;
91065294c1fSJeff Layton 	LIST_HEAD(dispose);
91165294c1fSJeff Layton 
912ce502f81SChuck Lever 	rhashtable_walk_enter(&nfsd_file_rhash_tbl, &iter);
913ce502f81SChuck Lever 	do {
914ce502f81SChuck Lever 		rhashtable_walk_start(&iter);
91565294c1fSJeff Layton 
916ce502f81SChuck Lever 		nf = rhashtable_walk_next(&iter);
917ce502f81SChuck Lever 		while (!IS_ERR_OR_NULL(nf)) {
918d3aefd2bSJeff Layton 			if (!net || nf->nf_net == net)
9198d0d254bSJeff Layton 				nfsd_file_unhash_and_dispose(nf, &dispose);
920ce502f81SChuck Lever 			nf = rhashtable_walk_next(&iter);
92165294c1fSJeff Layton 		}
922ce502f81SChuck Lever 
923ce502f81SChuck Lever 		rhashtable_walk_stop(&iter);
924ce502f81SChuck Lever 	} while (nf == ERR_PTR(-EAGAIN));
925ce502f81SChuck Lever 	rhashtable_walk_exit(&iter);
926ce502f81SChuck Lever 
92765294c1fSJeff Layton 	nfsd_file_dispose_list(&dispose);
92865294c1fSJeff Layton }
92965294c1fSJeff Layton 
9309542e6a6STrond Myklebust static struct nfsd_fcache_disposal *
9311463b38eSNeilBrown nfsd_alloc_fcache_disposal(void)
9329542e6a6STrond Myklebust {
9339542e6a6STrond Myklebust 	struct nfsd_fcache_disposal *l;
9349542e6a6STrond Myklebust 
9359542e6a6STrond Myklebust 	l = kmalloc(sizeof(*l), GFP_KERNEL);
9369542e6a6STrond Myklebust 	if (!l)
9379542e6a6STrond Myklebust 		return NULL;
9389542e6a6STrond Myklebust 	INIT_WORK(&l->work, nfsd_file_delayed_close);
9399542e6a6STrond Myklebust 	spin_lock_init(&l->lock);
9409542e6a6STrond Myklebust 	INIT_LIST_HEAD(&l->freeme);
9419542e6a6STrond Myklebust 	return l;
9429542e6a6STrond Myklebust }
9439542e6a6STrond Myklebust 
9449542e6a6STrond Myklebust static void
9459542e6a6STrond Myklebust nfsd_free_fcache_disposal(struct nfsd_fcache_disposal *l)
9469542e6a6STrond Myklebust {
9479542e6a6STrond Myklebust 	cancel_work_sync(&l->work);
9489542e6a6STrond Myklebust 	nfsd_file_dispose_list(&l->freeme);
9491463b38eSNeilBrown 	kfree(l);
9509542e6a6STrond Myklebust }
9519542e6a6STrond Myklebust 
9529542e6a6STrond Myklebust static void
9539542e6a6STrond Myklebust nfsd_free_fcache_disposal_net(struct net *net)
9549542e6a6STrond Myklebust {
9551463b38eSNeilBrown 	struct nfsd_net *nn = net_generic(net, nfsd_net_id);
9561463b38eSNeilBrown 	struct nfsd_fcache_disposal *l = nn->fcache_disposal;
9579542e6a6STrond Myklebust 
9589542e6a6STrond Myklebust 	nfsd_free_fcache_disposal(l);
9599542e6a6STrond Myklebust }
9609542e6a6STrond Myklebust 
9619542e6a6STrond Myklebust int
9629542e6a6STrond Myklebust nfsd_file_cache_start_net(struct net *net)
9639542e6a6STrond Myklebust {
9641463b38eSNeilBrown 	struct nfsd_net *nn = net_generic(net, nfsd_net_id);
9651463b38eSNeilBrown 
9661463b38eSNeilBrown 	nn->fcache_disposal = nfsd_alloc_fcache_disposal();
9671463b38eSNeilBrown 	return nn->fcache_disposal ? 0 : -ENOMEM;
9689542e6a6STrond Myklebust }
9699542e6a6STrond Myklebust 
970c7b824c3SChuck Lever /**
971c7b824c3SChuck Lever  * nfsd_file_cache_purge - Remove all cache items associated with @net
972c7b824c3SChuck Lever  * @net: target net namespace
973c7b824c3SChuck Lever  *
974c7b824c3SChuck Lever  */
975c7b824c3SChuck Lever void
976c7b824c3SChuck Lever nfsd_file_cache_purge(struct net *net)
977c7b824c3SChuck Lever {
978c7b824c3SChuck Lever 	lockdep_assert_held(&nfsd_mutex);
979c7b824c3SChuck Lever 	if (test_bit(NFSD_FILE_CACHE_UP, &nfsd_file_flags) == 1)
980c7b824c3SChuck Lever 		__nfsd_file_cache_purge(net);
981c7b824c3SChuck Lever }
982c7b824c3SChuck Lever 
/*
 * Per-net shutdown: purge the cache items that belong to @net, then
 * free that namespace's disposal context.
 */
void
nfsd_file_cache_shutdown_net(struct net *net)
{
	nfsd_file_cache_purge(net);

	nfsd_free_fcache_disposal_net(net);
}
9899542e6a6STrond Myklebust 
99065294c1fSJeff Layton void
99165294c1fSJeff Layton nfsd_file_cache_shutdown(void)
99265294c1fSJeff Layton {
9938b330f78SChuck Lever 	int i;
9948b330f78SChuck Lever 
995c7b824c3SChuck Lever 	lockdep_assert_held(&nfsd_mutex);
996c7b824c3SChuck Lever 	if (test_and_clear_bit(NFSD_FILE_CACHE_UP, &nfsd_file_flags) == 0)
997c7b824c3SChuck Lever 		return;
99865294c1fSJeff Layton 
99965294c1fSJeff Layton 	lease_unregister_notifier(&nfsd_file_lease_notifier);
100065294c1fSJeff Layton 	unregister_shrinker(&nfsd_file_shrinker);
100165294c1fSJeff Layton 	/*
100265294c1fSJeff Layton 	 * make sure all callers of nfsd_file_lru_cb are done before
100365294c1fSJeff Layton 	 * calling nfsd_file_cache_purge
100465294c1fSJeff Layton 	 */
100565294c1fSJeff Layton 	cancel_delayed_work_sync(&nfsd_filecache_laundrette);
1006c7b824c3SChuck Lever 	__nfsd_file_cache_purge(NULL);
100765294c1fSJeff Layton 	list_lru_destroy(&nfsd_file_lru);
100865294c1fSJeff Layton 	rcu_barrier();
100965294c1fSJeff Layton 	fsnotify_put_group(nfsd_file_fsnotify_group);
101065294c1fSJeff Layton 	nfsd_file_fsnotify_group = NULL;
101165294c1fSJeff Layton 	kmem_cache_destroy(nfsd_file_slab);
101265294c1fSJeff Layton 	nfsd_file_slab = NULL;
101365294c1fSJeff Layton 	fsnotify_wait_marks_destroyed();
101465294c1fSJeff Layton 	kmem_cache_destroy(nfsd_file_mark_slab);
101565294c1fSJeff Layton 	nfsd_file_mark_slab = NULL;
10169542e6a6STrond Myklebust 	destroy_workqueue(nfsd_filecache_wq);
10179542e6a6STrond Myklebust 	nfsd_filecache_wq = NULL;
1018fc22945eSChuck Lever 	rhashtable_destroy(&nfsd_file_rhash_tbl);
101965294c1fSJeff Layton 
10208b330f78SChuck Lever 	for_each_possible_cpu(i) {
10218b330f78SChuck Lever 		per_cpu(nfsd_file_cache_hits, i) = 0;
10228b330f78SChuck Lever 		per_cpu(nfsd_file_acquisitions, i) = 0;
10238b330f78SChuck Lever 		per_cpu(nfsd_file_releases, i) = 0;
10248b330f78SChuck Lever 		per_cpu(nfsd_file_total_age, i) = 0;
10258b330f78SChuck Lever 		per_cpu(nfsd_file_pages_flushed, i) = 0;
10268b330f78SChuck Lever 		per_cpu(nfsd_file_evictions, i) = 0;
102765294c1fSJeff Layton 	}
102865294c1fSJeff Layton }
102965294c1fSJeff Layton 
103065294c1fSJeff Layton /**
1031ce502f81SChuck Lever  * nfsd_file_is_cached - are there any cached open files for this inode?
1032ce502f81SChuck Lever  * @inode: inode to check
103365294c1fSJeff Layton  *
1034ce502f81SChuck Lever  * The lookup matches inodes in all net namespaces and is atomic wrt
1035ce502f81SChuck Lever  * nfsd_file_acquire().
1036ce502f81SChuck Lever  *
1037ce502f81SChuck Lever  * Return values:
1038ce502f81SChuck Lever  *   %true: filecache contains at least one file matching this inode
1039ce502f81SChuck Lever  *   %false: filecache contains no files matching this inode
104065294c1fSJeff Layton  */
104165294c1fSJeff Layton bool
104265294c1fSJeff Layton nfsd_file_is_cached(struct inode *inode)
104365294c1fSJeff Layton {
1044ce502f81SChuck Lever 	struct nfsd_file_lookup_key key = {
1045ce502f81SChuck Lever 		.type	= NFSD_FILE_KEY_INODE,
1046ce502f81SChuck Lever 		.inode	= inode,
1047ce502f81SChuck Lever 	};
104865294c1fSJeff Layton 	bool ret = false;
104965294c1fSJeff Layton 
1050ce502f81SChuck Lever 	if (rhashtable_lookup_fast(&nfsd_file_rhash_tbl, &key,
1051ce502f81SChuck Lever 				   nfsd_file_rhash_params) != NULL)
105265294c1fSJeff Layton 		ret = true;
105354f7df70SChuck Lever 	trace_nfsd_file_is_cached(inode, (int)ret);
105465294c1fSJeff Layton 	return ret;
105565294c1fSJeff Layton }
105665294c1fSJeff Layton 
1057fb70bf12SChuck Lever static __be32
1058be023006SChuck Lever nfsd_file_do_acquire(struct svc_rqst *rqstp, struct svc_fh *fhp,
10594d1ea845SChuck Lever 		     unsigned int may_flags, struct nfsd_file **pnf,
10604d1ea845SChuck Lever 		     bool open, bool want_gc)
106165294c1fSJeff Layton {
1062ce502f81SChuck Lever 	struct nfsd_file_lookup_key key = {
1063ce502f81SChuck Lever 		.type	= NFSD_FILE_KEY_FULL,
1064ce502f81SChuck Lever 		.need	= may_flags & NFSD_FILE_MAY_MASK,
1065ce502f81SChuck Lever 		.net	= SVC_NET(rqstp),
10664d1ea845SChuck Lever 		.gc	= want_gc,
1067ce502f81SChuck Lever 	};
1068243a5263SJeff Layton 	bool open_retry = true;
1069243a5263SJeff Layton 	struct nfsd_file *nf;
1070ce502f81SChuck Lever 	__be32 status;
1071243a5263SJeff Layton 	int ret;
107265294c1fSJeff Layton 
107365294c1fSJeff Layton 	status = fh_verify(rqstp, fhp, S_IFREG,
107465294c1fSJeff Layton 				may_flags|NFSD_MAY_OWNER_OVERRIDE);
107565294c1fSJeff Layton 	if (status != nfs_ok)
107665294c1fSJeff Layton 		return status;
1077ce502f81SChuck Lever 	key.inode = d_inode(fhp->fh_dentry);
1078ce502f81SChuck Lever 	key.cred = get_current_cred();
107965294c1fSJeff Layton 
108065294c1fSJeff Layton retry:
1081243a5263SJeff Layton 	rcu_read_lock();
1082243a5263SJeff Layton 	nf = rhashtable_lookup(&nfsd_file_rhash_tbl, &key,
1083ce502f81SChuck Lever 			       nfsd_file_rhash_params);
1084ce502f81SChuck Lever 	if (nf)
1085ce502f81SChuck Lever 		nf = nfsd_file_get(nf);
1086243a5263SJeff Layton 	rcu_read_unlock();
108765294c1fSJeff Layton 	if (nf)
108865294c1fSJeff Layton 		goto wait_for_construction;
108965294c1fSJeff Layton 
1090243a5263SJeff Layton 	nf = nfsd_file_alloc(&key, may_flags);
1091243a5263SJeff Layton 	if (!nf) {
109254f7df70SChuck Lever 		status = nfserr_jukebox;
109354f7df70SChuck Lever 		goto out_status;
109465294c1fSJeff Layton 	}
109565294c1fSJeff Layton 
1096243a5263SJeff Layton 	ret = rhashtable_lookup_insert_key(&nfsd_file_rhash_tbl,
1097243a5263SJeff Layton 					   &key, &nf->nf_rhash,
1098ce502f81SChuck Lever 					   nfsd_file_rhash_params);
1099243a5263SJeff Layton 	if (likely(ret == 0))
110065294c1fSJeff Layton 		goto open_file;
1101243a5263SJeff Layton 
1102243a5263SJeff Layton 	nfsd_file_slab_free(&nf->nf_rcu);
1103bdd6b562SJeff Layton 	nf = NULL;
1104243a5263SJeff Layton 	if (ret == -EEXIST)
1105243a5263SJeff Layton 		goto retry;
1106243a5263SJeff Layton 	trace_nfsd_file_insert_err(rqstp, key.inode, may_flags, ret);
1107243a5263SJeff Layton 	status = nfserr_jukebox;
1108243a5263SJeff Layton 	goto out_status;
110965294c1fSJeff Layton 
111065294c1fSJeff Layton wait_for_construction:
111165294c1fSJeff Layton 	wait_on_bit(&nf->nf_flags, NFSD_FILE_PENDING, TASK_UNINTERRUPTIBLE);
111265294c1fSJeff Layton 
111365294c1fSJeff Layton 	/* Did construction of this file fail? */
111465294c1fSJeff Layton 	if (!test_bit(NFSD_FILE_HASHED, &nf->nf_flags)) {
1115ce502f81SChuck Lever 		trace_nfsd_file_cons_err(rqstp, key.inode, may_flags, nf);
1116243a5263SJeff Layton 		if (!open_retry) {
111728c7d86bSTrond Myklebust 			status = nfserr_jukebox;
111828c7d86bSTrond Myklebust 			goto out;
111928c7d86bSTrond Myklebust 		}
1120243a5263SJeff Layton 		open_retry = false;
112165294c1fSJeff Layton 		nfsd_file_put_noref(nf);
112265294c1fSJeff Layton 		goto retry;
112365294c1fSJeff Layton 	}
112465294c1fSJeff Layton 
11254a0e73e6SChuck Lever 	nfsd_file_lru_remove(nf);
112665294c1fSJeff Layton 	this_cpu_inc(nfsd_file_cache_hits);
112765294c1fSJeff Layton 
112823ba98deSJeff Layton 	status = nfserrno(nfsd_open_break_lease(file_inode(nf->nf_file), may_flags));
112965294c1fSJeff Layton out:
113065294c1fSJeff Layton 	if (status == nfs_ok) {
113129d4bdbbSChuck Lever 		if (open)
113229d4bdbbSChuck Lever 			this_cpu_inc(nfsd_file_acquisitions);
113365294c1fSJeff Layton 		*pnf = nf;
113465294c1fSJeff Layton 	} else {
113565294c1fSJeff Layton 		nfsd_file_put(nf);
113665294c1fSJeff Layton 		nf = NULL;
113765294c1fSJeff Layton 	}
113865294c1fSJeff Layton 
113954f7df70SChuck Lever out_status:
1140ce502f81SChuck Lever 	put_cred(key.cred);
1141be023006SChuck Lever 	if (open)
1142ce502f81SChuck Lever 		trace_nfsd_file_acquire(rqstp, key.inode, may_flags, nf, status);
114365294c1fSJeff Layton 	return status;
114465294c1fSJeff Layton 
114565294c1fSJeff Layton open_file:
1146b40a2839SChuck Lever 	trace_nfsd_file_alloc(nf);
1147427f5f83SChuck Lever 	nf->nf_mark = nfsd_file_mark_find_or_create(nf, key.inode);
1148fb70bf12SChuck Lever 	if (nf->nf_mark) {
11490122e882SChuck Lever 		if (open) {
1150f4d84c52SChuck Lever 			status = nfsd_open_verified(rqstp, fhp, may_flags,
1151f4d84c52SChuck Lever 						    &nf->nf_file);
11520122e882SChuck Lever 			trace_nfsd_file_open(nf, status);
11530122e882SChuck Lever 		} else
1154fb70bf12SChuck Lever 			status = nfs_ok;
1155fb70bf12SChuck Lever 	} else
115665294c1fSJeff Layton 		status = nfserr_jukebox;
115765294c1fSJeff Layton 	/*
115865294c1fSJeff Layton 	 * If construction failed, or we raced with a call to unlink()
115965294c1fSJeff Layton 	 * then unhash.
116065294c1fSJeff Layton 	 */
1161ce502f81SChuck Lever 	if (status != nfs_ok || key.inode->i_nlink == 0)
11624d1ea845SChuck Lever 		nfsd_file_unhash_and_put(nf);
116365294c1fSJeff Layton 	clear_bit_unlock(NFSD_FILE_PENDING, &nf->nf_flags);
116465294c1fSJeff Layton 	smp_mb__after_atomic();
116565294c1fSJeff Layton 	wake_up_bit(&nf->nf_flags, NFSD_FILE_PENDING);
116665294c1fSJeff Layton 	goto out;
116765294c1fSJeff Layton }
116865294c1fSJeff Layton 
1169fb70bf12SChuck Lever /**
11704d1ea845SChuck Lever  * nfsd_file_acquire_gc - Get a struct nfsd_file with an open file
11714d1ea845SChuck Lever  * @rqstp: the RPC transaction being executed
11724d1ea845SChuck Lever  * @fhp: the NFS filehandle of the file to be opened
11734d1ea845SChuck Lever  * @may_flags: NFSD_MAY_ settings for the file
11744d1ea845SChuck Lever  * @pnf: OUT: new or found "struct nfsd_file" object
11754d1ea845SChuck Lever  *
11764d1ea845SChuck Lever  * The nfsd_file object returned by this API is reference-counted
11774d1ea845SChuck Lever  * and garbage-collected. The object is retained for a few
11784d1ea845SChuck Lever  * seconds after the final nfsd_file_put() in case the caller
11794d1ea845SChuck Lever  * wants to re-use it.
11804d1ea845SChuck Lever  *
11814d1ea845SChuck Lever  * Returns nfs_ok and sets @pnf on success; otherwise an nfsstat in
11824d1ea845SChuck Lever  * network byte order is returned.
11834d1ea845SChuck Lever  */
11844d1ea845SChuck Lever __be32
11854d1ea845SChuck Lever nfsd_file_acquire_gc(struct svc_rqst *rqstp, struct svc_fh *fhp,
11864d1ea845SChuck Lever 		     unsigned int may_flags, struct nfsd_file **pnf)
11874d1ea845SChuck Lever {
11884d1ea845SChuck Lever 	return nfsd_file_do_acquire(rqstp, fhp, may_flags, pnf, true, true);
11894d1ea845SChuck Lever }
11904d1ea845SChuck Lever 
11914d1ea845SChuck Lever /**
1192fb70bf12SChuck Lever  * nfsd_file_acquire - Get a struct nfsd_file with an open file
1193fb70bf12SChuck Lever  * @rqstp: the RPC transaction being executed
1194fb70bf12SChuck Lever  * @fhp: the NFS filehandle of the file to be opened
1195fb70bf12SChuck Lever  * @may_flags: NFSD_MAY_ settings for the file
1196fb70bf12SChuck Lever  * @pnf: OUT: new or found "struct nfsd_file" object
1197fb70bf12SChuck Lever  *
11984d1ea845SChuck Lever  * The nfsd_file_object returned by this API is reference-counted
11994d1ea845SChuck Lever  * but not garbage-collected. The object is unhashed after the
12004d1ea845SChuck Lever  * final nfsd_file_put().
12014d1ea845SChuck Lever  *
1202fb70bf12SChuck Lever  * Returns nfs_ok and sets @pnf on success; otherwise an nfsstat in
1203fb70bf12SChuck Lever  * network byte order is returned.
1204fb70bf12SChuck Lever  */
1205fb70bf12SChuck Lever __be32
1206fb70bf12SChuck Lever nfsd_file_acquire(struct svc_rqst *rqstp, struct svc_fh *fhp,
1207fb70bf12SChuck Lever 		  unsigned int may_flags, struct nfsd_file **pnf)
1208fb70bf12SChuck Lever {
12094d1ea845SChuck Lever 	return nfsd_file_do_acquire(rqstp, fhp, may_flags, pnf, true, false);
1210fb70bf12SChuck Lever }
1211fb70bf12SChuck Lever 
1212fb70bf12SChuck Lever /**
1213fb70bf12SChuck Lever  * nfsd_file_create - Get a struct nfsd_file, do not open
1214fb70bf12SChuck Lever  * @rqstp: the RPC transaction being executed
1215fb70bf12SChuck Lever  * @fhp: the NFS filehandle of the file just created
1216fb70bf12SChuck Lever  * @may_flags: NFSD_MAY_ settings for the file
1217fb70bf12SChuck Lever  * @pnf: OUT: new or found "struct nfsd_file" object
1218fb70bf12SChuck Lever  *
12194d1ea845SChuck Lever  * The nfsd_file_object returned by this API is reference-counted
12204d1ea845SChuck Lever  * but not garbage-collected. The object is released immediately
12214d1ea845SChuck Lever  * one RCU grace period after the final nfsd_file_put().
12224d1ea845SChuck Lever  *
1223fb70bf12SChuck Lever  * Returns nfs_ok and sets @pnf on success; otherwise an nfsstat in
1224fb70bf12SChuck Lever  * network byte order is returned.
1225fb70bf12SChuck Lever  */
1226fb70bf12SChuck Lever __be32
1227fb70bf12SChuck Lever nfsd_file_create(struct svc_rqst *rqstp, struct svc_fh *fhp,
1228fb70bf12SChuck Lever 		 unsigned int may_flags, struct nfsd_file **pnf)
1229fb70bf12SChuck Lever {
12304d1ea845SChuck Lever 	return nfsd_file_do_acquire(rqstp, fhp, may_flags, pnf, false, false);
1231fb70bf12SChuck Lever }
1232fb70bf12SChuck Lever 
123365294c1fSJeff Layton /*
123465294c1fSJeff Layton  * Note that fields may be added, removed or reordered in the future. Programs
123565294c1fSJeff Layton  * scraping this file for info should test the labels to ensure they're
123665294c1fSJeff Layton  * getting the correct field.
123765294c1fSJeff Layton  */
12381342f9ddSChenXiaoSong int nfsd_file_cache_stats_show(struct seq_file *m, void *v)
123965294c1fSJeff Layton {
1240df2aff52SChuck Lever 	unsigned long releases = 0, pages_flushed = 0, evictions = 0;
1241df2aff52SChuck Lever 	unsigned long hits = 0, acquisitions = 0;
1242ce502f81SChuck Lever 	unsigned int i, count = 0, buckets = 0;
1243904940e9SChuck Lever 	unsigned long lru = 0, total_age = 0;
124465294c1fSJeff Layton 
1245ce502f81SChuck Lever 	/* Serialize with server shutdown */
124665294c1fSJeff Layton 	mutex_lock(&nfsd_mutex);
1247c7b824c3SChuck Lever 	if (test_bit(NFSD_FILE_CACHE_UP, &nfsd_file_flags) == 1) {
1248ce502f81SChuck Lever 		struct bucket_table *tbl;
1249ce502f81SChuck Lever 		struct rhashtable *ht;
1250ce502f81SChuck Lever 
12510fd244c1SChuck Lever 		lru = list_lru_count(&nfsd_file_lru);
1252ce502f81SChuck Lever 
1253ce502f81SChuck Lever 		rcu_read_lock();
1254ce502f81SChuck Lever 		ht = &nfsd_file_rhash_tbl;
1255ce502f81SChuck Lever 		count = atomic_read(&ht->nelems);
1256ce502f81SChuck Lever 		tbl = rht_dereference_rcu(ht->tbl, ht);
1257ce502f81SChuck Lever 		buckets = tbl->size;
1258ce502f81SChuck Lever 		rcu_read_unlock();
125965294c1fSJeff Layton 	}
126065294c1fSJeff Layton 	mutex_unlock(&nfsd_mutex);
126165294c1fSJeff Layton 
126229d4bdbbSChuck Lever 	for_each_possible_cpu(i) {
126365294c1fSJeff Layton 		hits += per_cpu(nfsd_file_cache_hits, i);
126429d4bdbbSChuck Lever 		acquisitions += per_cpu(nfsd_file_acquisitions, i);
1265d6329327SChuck Lever 		releases += per_cpu(nfsd_file_releases, i);
1266904940e9SChuck Lever 		total_age += per_cpu(nfsd_file_total_age, i);
126794660cc1SChuck Lever 		evictions += per_cpu(nfsd_file_evictions, i);
1268df2aff52SChuck Lever 		pages_flushed += per_cpu(nfsd_file_pages_flushed, i);
126929d4bdbbSChuck Lever 	}
127065294c1fSJeff Layton 
127165294c1fSJeff Layton 	seq_printf(m, "total entries: %u\n", count);
1272ce502f81SChuck Lever 	seq_printf(m, "hash buckets:  %u\n", buckets);
12730fd244c1SChuck Lever 	seq_printf(m, "lru entries:   %lu\n", lru);
127465294c1fSJeff Layton 	seq_printf(m, "cache hits:    %lu\n", hits);
127529d4bdbbSChuck Lever 	seq_printf(m, "acquisitions:  %lu\n", acquisitions);
1276d6329327SChuck Lever 	seq_printf(m, "releases:      %lu\n", releases);
127794660cc1SChuck Lever 	seq_printf(m, "evictions:     %lu\n", evictions);
1278904940e9SChuck Lever 	if (releases)
1279904940e9SChuck Lever 		seq_printf(m, "mean age (ms): %ld\n", total_age / releases);
1280904940e9SChuck Lever 	else
1281904940e9SChuck Lever 		seq_printf(m, "mean age (ms): -\n");
1282df2aff52SChuck Lever 	seq_printf(m, "pages flushed: %lu\n", pages_flushed);
128365294c1fSJeff Layton 	return 0;
128465294c1fSJeff Layton }
1285