xref: /openbmc/linux/fs/nfsd/filecache.c (revision ae3c57b5ca47665dc3416447a5534a9796096d86)
/*
 * Open file cache.
 *
 * (c) 2015 - Jeff Layton <jeff.layton@primarydata.com>
 */
665294c1fSJeff Layton 
765294c1fSJeff Layton #include <linux/hash.h>
865294c1fSJeff Layton #include <linux/slab.h>
965294c1fSJeff Layton #include <linux/file.h>
1065294c1fSJeff Layton #include <linux/sched.h>
1165294c1fSJeff Layton #include <linux/list_lru.h>
1265294c1fSJeff Layton #include <linux/fsnotify_backend.h>
1365294c1fSJeff Layton #include <linux/fsnotify.h>
1465294c1fSJeff Layton #include <linux/seq_file.h>
1565294c1fSJeff Layton 
1665294c1fSJeff Layton #include "vfs.h"
1765294c1fSJeff Layton #include "nfsd.h"
1865294c1fSJeff Layton #include "nfsfh.h"
195e113224STrond Myklebust #include "netns.h"
2065294c1fSJeff Layton #include "filecache.h"
2165294c1fSJeff Layton #include "trace.h"
2265294c1fSJeff Layton 
#define NFSDDBG_FACILITY	NFSDDBG_FH

/* FIXME: dynamically size this for the machine somehow? */
/* Number of hash bits, and the hash table size derived from it. */
#define NFSD_FILE_HASH_BITS		12
#define NFSD_FILE_HASH_SIZE		(1 << NFSD_FILE_HASH_BITS)
/* Delay passed to queue_delayed_work() for the laundrette. */
#define NFSD_LAUNDRETTE_DELAY		(2 * HZ)

/*
 * Bit number within nfsd_file_lru_flags; while it is set,
 * nfsd_file_schedule_laundrette() does not queue any work.
 */
#define NFSD_FILE_SHUTDOWN		(1)
#define NFSD_FILE_LRU_THRESHOLD		(4096UL)
/*
 * Once nfsd_filecache_count reaches this value, nfsd_file_put() runs a
 * garbage-collection pass directly.
 */
#define NFSD_FILE_LRU_LIMIT		(NFSD_FILE_LRU_THRESHOLD << 2)

/* We only care about NFSD_MAY_READ/WRITE for this cache */
#define NFSD_FILE_MAY_MASK	(NFSD_MAY_READ|NFSD_MAY_WRITE)
3665294c1fSJeff Layton 
3765294c1fSJeff Layton struct nfsd_fcache_bucket {
3865294c1fSJeff Layton 	struct hlist_head	nfb_head;
3965294c1fSJeff Layton 	spinlock_t		nfb_lock;
4065294c1fSJeff Layton 	unsigned int		nfb_count;
4165294c1fSJeff Layton 	unsigned int		nfb_maxcount;
4265294c1fSJeff Layton };
4365294c1fSJeff Layton 
4465294c1fSJeff Layton static DEFINE_PER_CPU(unsigned long, nfsd_file_cache_hits);
4565294c1fSJeff Layton 
469542e6a6STrond Myklebust struct nfsd_fcache_disposal {
479542e6a6STrond Myklebust 	struct list_head list;
489542e6a6STrond Myklebust 	struct work_struct work;
499542e6a6STrond Myklebust 	struct net *net;
509542e6a6STrond Myklebust 	spinlock_t lock;
519542e6a6STrond Myklebust 	struct list_head freeme;
529542e6a6STrond Myklebust 	struct rcu_head rcu;
539542e6a6STrond Myklebust };
549542e6a6STrond Myklebust 
5550d0def9SChen Zhou static struct workqueue_struct *nfsd_filecache_wq __read_mostly;
569542e6a6STrond Myklebust 
5765294c1fSJeff Layton static struct kmem_cache		*nfsd_file_slab;
5865294c1fSJeff Layton static struct kmem_cache		*nfsd_file_mark_slab;
5965294c1fSJeff Layton static struct nfsd_fcache_bucket	*nfsd_file_hashtbl;
6065294c1fSJeff Layton static struct list_lru			nfsd_file_lru;
6165294c1fSJeff Layton static long				nfsd_file_lru_flags;
6265294c1fSJeff Layton static struct fsnotify_group		*nfsd_file_fsnotify_group;
6365294c1fSJeff Layton static atomic_long_t			nfsd_filecache_count;
6465294c1fSJeff Layton static struct delayed_work		nfsd_filecache_laundrette;
659542e6a6STrond Myklebust static DEFINE_SPINLOCK(laundrette_lock);
669542e6a6STrond Myklebust static LIST_HEAD(laundrettes);
6765294c1fSJeff Layton 
689542e6a6STrond Myklebust static void nfsd_file_gc(void);
6965294c1fSJeff Layton 
7065294c1fSJeff Layton static void
719542e6a6STrond Myklebust nfsd_file_schedule_laundrette(void)
7265294c1fSJeff Layton {
7365294c1fSJeff Layton 	long count = atomic_long_read(&nfsd_filecache_count);
7465294c1fSJeff Layton 
7565294c1fSJeff Layton 	if (count == 0 || test_bit(NFSD_FILE_SHUTDOWN, &nfsd_file_lru_flags))
7665294c1fSJeff Layton 		return;
7765294c1fSJeff Layton 
789542e6a6STrond Myklebust 	queue_delayed_work(system_wq, &nfsd_filecache_laundrette,
799542e6a6STrond Myklebust 			NFSD_LAUNDRETTE_DELAY);
8065294c1fSJeff Layton }
8165294c1fSJeff Layton 
8265294c1fSJeff Layton static void
8365294c1fSJeff Layton nfsd_file_slab_free(struct rcu_head *rcu)
8465294c1fSJeff Layton {
8565294c1fSJeff Layton 	struct nfsd_file *nf = container_of(rcu, struct nfsd_file, nf_rcu);
8665294c1fSJeff Layton 
8765294c1fSJeff Layton 	put_cred(nf->nf_cred);
8865294c1fSJeff Layton 	kmem_cache_free(nfsd_file_slab, nf);
8965294c1fSJeff Layton }
9065294c1fSJeff Layton 
9165294c1fSJeff Layton static void
9265294c1fSJeff Layton nfsd_file_mark_free(struct fsnotify_mark *mark)
9365294c1fSJeff Layton {
9465294c1fSJeff Layton 	struct nfsd_file_mark *nfm = container_of(mark, struct nfsd_file_mark,
9565294c1fSJeff Layton 						  nfm_mark);
9665294c1fSJeff Layton 
9765294c1fSJeff Layton 	kmem_cache_free(nfsd_file_mark_slab, nfm);
9865294c1fSJeff Layton }
9965294c1fSJeff Layton 
10065294c1fSJeff Layton static struct nfsd_file_mark *
10165294c1fSJeff Layton nfsd_file_mark_get(struct nfsd_file_mark *nfm)
10265294c1fSJeff Layton {
103689827cdSTrond Myklebust 	if (!refcount_inc_not_zero(&nfm->nfm_ref))
10465294c1fSJeff Layton 		return NULL;
10565294c1fSJeff Layton 	return nfm;
10665294c1fSJeff Layton }
10765294c1fSJeff Layton 
10865294c1fSJeff Layton static void
10965294c1fSJeff Layton nfsd_file_mark_put(struct nfsd_file_mark *nfm)
11065294c1fSJeff Layton {
111689827cdSTrond Myklebust 	if (refcount_dec_and_test(&nfm->nfm_ref)) {
11265294c1fSJeff Layton 		fsnotify_destroy_mark(&nfm->nfm_mark, nfsd_file_fsnotify_group);
11365294c1fSJeff Layton 		fsnotify_put_mark(&nfm->nfm_mark);
11465294c1fSJeff Layton 	}
11565294c1fSJeff Layton }
11665294c1fSJeff Layton 
11765294c1fSJeff Layton static struct nfsd_file_mark *
11865294c1fSJeff Layton nfsd_file_mark_find_or_create(struct nfsd_file *nf)
11965294c1fSJeff Layton {
12065294c1fSJeff Layton 	int			err;
12165294c1fSJeff Layton 	struct fsnotify_mark	*mark;
12265294c1fSJeff Layton 	struct nfsd_file_mark	*nfm = NULL, *new;
12365294c1fSJeff Layton 	struct inode *inode = nf->nf_inode;
12465294c1fSJeff Layton 
12565294c1fSJeff Layton 	do {
12665294c1fSJeff Layton 		mutex_lock(&nfsd_file_fsnotify_group->mark_mutex);
12765294c1fSJeff Layton 		mark = fsnotify_find_mark(&inode->i_fsnotify_marks,
12865294c1fSJeff Layton 				nfsd_file_fsnotify_group);
12965294c1fSJeff Layton 		if (mark) {
13065294c1fSJeff Layton 			nfm = nfsd_file_mark_get(container_of(mark,
13165294c1fSJeff Layton 						 struct nfsd_file_mark,
13265294c1fSJeff Layton 						 nfm_mark));
13365294c1fSJeff Layton 			mutex_unlock(&nfsd_file_fsnotify_group->mark_mutex);
13490d2f1daSTrond Myklebust 			if (nfm) {
13565294c1fSJeff Layton 				fsnotify_put_mark(mark);
13665294c1fSJeff Layton 				break;
13790d2f1daSTrond Myklebust 			}
13890d2f1daSTrond Myklebust 			/* Avoid soft lockup race with nfsd_file_mark_put() */
13990d2f1daSTrond Myklebust 			fsnotify_destroy_mark(mark, nfsd_file_fsnotify_group);
14090d2f1daSTrond Myklebust 			fsnotify_put_mark(mark);
14165294c1fSJeff Layton 		} else
14265294c1fSJeff Layton 			mutex_unlock(&nfsd_file_fsnotify_group->mark_mutex);
14365294c1fSJeff Layton 
14465294c1fSJeff Layton 		/* allocate a new nfm */
14565294c1fSJeff Layton 		new = kmem_cache_alloc(nfsd_file_mark_slab, GFP_KERNEL);
14665294c1fSJeff Layton 		if (!new)
14765294c1fSJeff Layton 			return NULL;
14865294c1fSJeff Layton 		fsnotify_init_mark(&new->nfm_mark, nfsd_file_fsnotify_group);
14965294c1fSJeff Layton 		new->nfm_mark.mask = FS_ATTRIB|FS_DELETE_SELF;
150689827cdSTrond Myklebust 		refcount_set(&new->nfm_ref, 1);
15165294c1fSJeff Layton 
15265294c1fSJeff Layton 		err = fsnotify_add_inode_mark(&new->nfm_mark, inode, 0);
15365294c1fSJeff Layton 
15465294c1fSJeff Layton 		/*
15565294c1fSJeff Layton 		 * If the add was successful, then return the object.
15665294c1fSJeff Layton 		 * Otherwise, we need to put the reference we hold on the
15765294c1fSJeff Layton 		 * nfm_mark. The fsnotify code will take a reference and put
15865294c1fSJeff Layton 		 * it on failure, so we can't just free it directly. It's also
15965294c1fSJeff Layton 		 * not safe to call fsnotify_destroy_mark on it as the
16065294c1fSJeff Layton 		 * mark->group will be NULL. Thus, we can't let the nfm_ref
16165294c1fSJeff Layton 		 * counter drive the destruction at this point.
16265294c1fSJeff Layton 		 */
16365294c1fSJeff Layton 		if (likely(!err))
16465294c1fSJeff Layton 			nfm = new;
16565294c1fSJeff Layton 		else
16665294c1fSJeff Layton 			fsnotify_put_mark(&new->nfm_mark);
16765294c1fSJeff Layton 	} while (unlikely(err == -EEXIST));
16865294c1fSJeff Layton 
16965294c1fSJeff Layton 	return nfm;
17065294c1fSJeff Layton }
17165294c1fSJeff Layton 
17265294c1fSJeff Layton static struct nfsd_file *
1735e113224STrond Myklebust nfsd_file_alloc(struct inode *inode, unsigned int may, unsigned int hashval,
1745e113224STrond Myklebust 		struct net *net)
17565294c1fSJeff Layton {
17665294c1fSJeff Layton 	struct nfsd_file *nf;
17765294c1fSJeff Layton 
17865294c1fSJeff Layton 	nf = kmem_cache_alloc(nfsd_file_slab, GFP_KERNEL);
17965294c1fSJeff Layton 	if (nf) {
18065294c1fSJeff Layton 		INIT_HLIST_NODE(&nf->nf_node);
18165294c1fSJeff Layton 		INIT_LIST_HEAD(&nf->nf_lru);
18265294c1fSJeff Layton 		nf->nf_file = NULL;
18365294c1fSJeff Layton 		nf->nf_cred = get_current_cred();
1845e113224STrond Myklebust 		nf->nf_net = net;
18565294c1fSJeff Layton 		nf->nf_flags = 0;
18665294c1fSJeff Layton 		nf->nf_inode = inode;
18765294c1fSJeff Layton 		nf->nf_hashval = hashval;
188689827cdSTrond Myklebust 		refcount_set(&nf->nf_ref, 1);
18965294c1fSJeff Layton 		nf->nf_may = may & NFSD_FILE_MAY_MASK;
19065294c1fSJeff Layton 		if (may & NFSD_MAY_NOT_BREAK_LEASE) {
19165294c1fSJeff Layton 			if (may & NFSD_MAY_WRITE)
19265294c1fSJeff Layton 				__set_bit(NFSD_FILE_BREAK_WRITE, &nf->nf_flags);
19365294c1fSJeff Layton 			if (may & NFSD_MAY_READ)
19465294c1fSJeff Layton 				__set_bit(NFSD_FILE_BREAK_READ, &nf->nf_flags);
19565294c1fSJeff Layton 		}
19665294c1fSJeff Layton 		nf->nf_mark = NULL;
1975011af4cSTrond Myklebust 		init_rwsem(&nf->nf_rwsem);
19865294c1fSJeff Layton 		trace_nfsd_file_alloc(nf);
19965294c1fSJeff Layton 	}
20065294c1fSJeff Layton 	return nf;
20165294c1fSJeff Layton }
20265294c1fSJeff Layton 
20365294c1fSJeff Layton static bool
20465294c1fSJeff Layton nfsd_file_free(struct nfsd_file *nf)
20565294c1fSJeff Layton {
20665294c1fSJeff Layton 	bool flush = false;
20765294c1fSJeff Layton 
20865294c1fSJeff Layton 	trace_nfsd_file_put_final(nf);
20965294c1fSJeff Layton 	if (nf->nf_mark)
21065294c1fSJeff Layton 		nfsd_file_mark_put(nf->nf_mark);
21165294c1fSJeff Layton 	if (nf->nf_file) {
21265294c1fSJeff Layton 		get_file(nf->nf_file);
21365294c1fSJeff Layton 		filp_close(nf->nf_file, NULL);
21465294c1fSJeff Layton 		fput(nf->nf_file);
21565294c1fSJeff Layton 		flush = true;
21665294c1fSJeff Layton 	}
21765294c1fSJeff Layton 	call_rcu(&nf->nf_rcu, nfsd_file_slab_free);
21865294c1fSJeff Layton 	return flush;
21965294c1fSJeff Layton }
22065294c1fSJeff Layton 
221055b24a8STrond Myklebust static bool
222055b24a8STrond Myklebust nfsd_file_check_writeback(struct nfsd_file *nf)
223055b24a8STrond Myklebust {
224055b24a8STrond Myklebust 	struct file *file = nf->nf_file;
225055b24a8STrond Myklebust 	struct address_space *mapping;
226055b24a8STrond Myklebust 
227055b24a8STrond Myklebust 	if (!file || !(file->f_mode & FMODE_WRITE))
228055b24a8STrond Myklebust 		return false;
229055b24a8STrond Myklebust 	mapping = file->f_mapping;
230055b24a8STrond Myklebust 	return mapping_tagged(mapping, PAGECACHE_TAG_DIRTY) ||
231055b24a8STrond Myklebust 		mapping_tagged(mapping, PAGECACHE_TAG_WRITEBACK);
232055b24a8STrond Myklebust }
233055b24a8STrond Myklebust 
234055b24a8STrond Myklebust static int
235055b24a8STrond Myklebust nfsd_file_check_write_error(struct nfsd_file *nf)
236055b24a8STrond Myklebust {
237055b24a8STrond Myklebust 	struct file *file = nf->nf_file;
238055b24a8STrond Myklebust 
239055b24a8STrond Myklebust 	if (!file || !(file->f_mode & FMODE_WRITE))
240055b24a8STrond Myklebust 		return 0;
241055b24a8STrond Myklebust 	return filemap_check_wb_err(file->f_mapping, READ_ONCE(file->f_wb_err));
242055b24a8STrond Myklebust }
243055b24a8STrond Myklebust 
24465294c1fSJeff Layton static void
24565294c1fSJeff Layton nfsd_file_do_unhash(struct nfsd_file *nf)
24665294c1fSJeff Layton {
24765294c1fSJeff Layton 	lockdep_assert_held(&nfsd_file_hashtbl[nf->nf_hashval].nfb_lock);
24865294c1fSJeff Layton 
24965294c1fSJeff Layton 	trace_nfsd_file_unhash(nf);
25065294c1fSJeff Layton 
251055b24a8STrond Myklebust 	if (nfsd_file_check_write_error(nf))
252055b24a8STrond Myklebust 		nfsd_reset_boot_verifier(net_generic(nf->nf_net, nfsd_net_id));
25365294c1fSJeff Layton 	--nfsd_file_hashtbl[nf->nf_hashval].nfb_count;
25465294c1fSJeff Layton 	hlist_del_rcu(&nf->nf_node);
25565294c1fSJeff Layton 	atomic_long_dec(&nfsd_filecache_count);
25665294c1fSJeff Layton }
25765294c1fSJeff Layton 
25865294c1fSJeff Layton static bool
25965294c1fSJeff Layton nfsd_file_unhash(struct nfsd_file *nf)
26065294c1fSJeff Layton {
26165294c1fSJeff Layton 	if (test_and_clear_bit(NFSD_FILE_HASHED, &nf->nf_flags)) {
26265294c1fSJeff Layton 		nfsd_file_do_unhash(nf);
26336ebbdb9STrond Myklebust 		if (!list_empty(&nf->nf_lru))
26436ebbdb9STrond Myklebust 			list_lru_del(&nfsd_file_lru, &nf->nf_lru);
26565294c1fSJeff Layton 		return true;
26665294c1fSJeff Layton 	}
26765294c1fSJeff Layton 	return false;
26865294c1fSJeff Layton }
26965294c1fSJeff Layton 
27065294c1fSJeff Layton /*
27165294c1fSJeff Layton  * Return true if the file was unhashed.
27265294c1fSJeff Layton  */
27365294c1fSJeff Layton static bool
27465294c1fSJeff Layton nfsd_file_unhash_and_release_locked(struct nfsd_file *nf, struct list_head *dispose)
27565294c1fSJeff Layton {
27665294c1fSJeff Layton 	lockdep_assert_held(&nfsd_file_hashtbl[nf->nf_hashval].nfb_lock);
27765294c1fSJeff Layton 
27865294c1fSJeff Layton 	trace_nfsd_file_unhash_and_release_locked(nf);
27965294c1fSJeff Layton 	if (!nfsd_file_unhash(nf))
28065294c1fSJeff Layton 		return false;
28165294c1fSJeff Layton 	/* keep final reference for nfsd_file_lru_dispose */
282689827cdSTrond Myklebust 	if (refcount_dec_not_one(&nf->nf_ref))
28365294c1fSJeff Layton 		return true;
28465294c1fSJeff Layton 
28565294c1fSJeff Layton 	list_add(&nf->nf_lru, dispose);
28665294c1fSJeff Layton 	return true;
28765294c1fSJeff Layton }
28865294c1fSJeff Layton 
289b6669305STrond Myklebust static void
29065294c1fSJeff Layton nfsd_file_put_noref(struct nfsd_file *nf)
29165294c1fSJeff Layton {
29265294c1fSJeff Layton 	trace_nfsd_file_put(nf);
29365294c1fSJeff Layton 
294689827cdSTrond Myklebust 	if (refcount_dec_and_test(&nf->nf_ref)) {
29565294c1fSJeff Layton 		WARN_ON(test_bit(NFSD_FILE_HASHED, &nf->nf_flags));
29665294c1fSJeff Layton 		nfsd_file_free(nf);
29765294c1fSJeff Layton 	}
29865294c1fSJeff Layton }
29965294c1fSJeff Layton 
30065294c1fSJeff Layton void
30165294c1fSJeff Layton nfsd_file_put(struct nfsd_file *nf)
30265294c1fSJeff Layton {
303b6669305STrond Myklebust 	bool is_hashed;
30465294c1fSJeff Layton 
30565294c1fSJeff Layton 	set_bit(NFSD_FILE_REFERENCED, &nf->nf_flags);
306689827cdSTrond Myklebust 	if (refcount_read(&nf->nf_ref) > 2 || !nf->nf_file) {
307b6669305STrond Myklebust 		nfsd_file_put_noref(nf);
308b6669305STrond Myklebust 		return;
309b6669305STrond Myklebust 	}
310b6669305STrond Myklebust 
311b6669305STrond Myklebust 	filemap_flush(nf->nf_file->f_mapping);
312b6669305STrond Myklebust 	is_hashed = test_bit(NFSD_FILE_HASHED, &nf->nf_flags) != 0;
313b6669305STrond Myklebust 	nfsd_file_put_noref(nf);
314b6669305STrond Myklebust 	if (is_hashed)
3159542e6a6STrond Myklebust 		nfsd_file_schedule_laundrette();
3169542e6a6STrond Myklebust 	if (atomic_long_read(&nfsd_filecache_count) >= NFSD_FILE_LRU_LIMIT)
3179542e6a6STrond Myklebust 		nfsd_file_gc();
31865294c1fSJeff Layton }
31965294c1fSJeff Layton 
32065294c1fSJeff Layton struct nfsd_file *
32165294c1fSJeff Layton nfsd_file_get(struct nfsd_file *nf)
32265294c1fSJeff Layton {
323689827cdSTrond Myklebust 	if (likely(refcount_inc_not_zero(&nf->nf_ref)))
32465294c1fSJeff Layton 		return nf;
32565294c1fSJeff Layton 	return NULL;
32665294c1fSJeff Layton }
32765294c1fSJeff Layton 
32865294c1fSJeff Layton static void
32965294c1fSJeff Layton nfsd_file_dispose_list(struct list_head *dispose)
33065294c1fSJeff Layton {
33165294c1fSJeff Layton 	struct nfsd_file *nf;
33265294c1fSJeff Layton 
33365294c1fSJeff Layton 	while(!list_empty(dispose)) {
33465294c1fSJeff Layton 		nf = list_first_entry(dispose, struct nfsd_file, nf_lru);
33565294c1fSJeff Layton 		list_del(&nf->nf_lru);
33665294c1fSJeff Layton 		nfsd_file_put_noref(nf);
33765294c1fSJeff Layton 	}
33865294c1fSJeff Layton }
33965294c1fSJeff Layton 
34065294c1fSJeff Layton static void
34165294c1fSJeff Layton nfsd_file_dispose_list_sync(struct list_head *dispose)
34265294c1fSJeff Layton {
34365294c1fSJeff Layton 	bool flush = false;
34465294c1fSJeff Layton 	struct nfsd_file *nf;
34565294c1fSJeff Layton 
34665294c1fSJeff Layton 	while(!list_empty(dispose)) {
34765294c1fSJeff Layton 		nf = list_first_entry(dispose, struct nfsd_file, nf_lru);
34865294c1fSJeff Layton 		list_del(&nf->nf_lru);
349689827cdSTrond Myklebust 		if (!refcount_dec_and_test(&nf->nf_ref))
35065294c1fSJeff Layton 			continue;
35165294c1fSJeff Layton 		if (nfsd_file_free(nf))
35265294c1fSJeff Layton 			flush = true;
35365294c1fSJeff Layton 	}
35465294c1fSJeff Layton 	if (flush)
35565294c1fSJeff Layton 		flush_delayed_fput();
35665294c1fSJeff Layton }
35765294c1fSJeff Layton 
3589542e6a6STrond Myklebust static void
3599542e6a6STrond Myklebust nfsd_file_list_remove_disposal(struct list_head *dst,
3609542e6a6STrond Myklebust 		struct nfsd_fcache_disposal *l)
3619542e6a6STrond Myklebust {
3629542e6a6STrond Myklebust 	spin_lock(&l->lock);
3639542e6a6STrond Myklebust 	list_splice_init(&l->freeme, dst);
3649542e6a6STrond Myklebust 	spin_unlock(&l->lock);
3659542e6a6STrond Myklebust }
3669542e6a6STrond Myklebust 
3679542e6a6STrond Myklebust static void
3689542e6a6STrond Myklebust nfsd_file_list_add_disposal(struct list_head *files, struct net *net)
3699542e6a6STrond Myklebust {
3709542e6a6STrond Myklebust 	struct nfsd_fcache_disposal *l;
3719542e6a6STrond Myklebust 
3729542e6a6STrond Myklebust 	rcu_read_lock();
3739542e6a6STrond Myklebust 	list_for_each_entry_rcu(l, &laundrettes, list) {
3749542e6a6STrond Myklebust 		if (l->net == net) {
3759542e6a6STrond Myklebust 			spin_lock(&l->lock);
3769542e6a6STrond Myklebust 			list_splice_tail_init(files, &l->freeme);
3779542e6a6STrond Myklebust 			spin_unlock(&l->lock);
3789542e6a6STrond Myklebust 			queue_work(nfsd_filecache_wq, &l->work);
3799542e6a6STrond Myklebust 			break;
3809542e6a6STrond Myklebust 		}
3819542e6a6STrond Myklebust 	}
3829542e6a6STrond Myklebust 	rcu_read_unlock();
3839542e6a6STrond Myklebust }
3849542e6a6STrond Myklebust 
3859542e6a6STrond Myklebust static void
3869542e6a6STrond Myklebust nfsd_file_list_add_pernet(struct list_head *dst, struct list_head *src,
3879542e6a6STrond Myklebust 		struct net *net)
3889542e6a6STrond Myklebust {
3899542e6a6STrond Myklebust 	struct nfsd_file *nf, *tmp;
3909542e6a6STrond Myklebust 
3919542e6a6STrond Myklebust 	list_for_each_entry_safe(nf, tmp, src, nf_lru) {
3929542e6a6STrond Myklebust 		if (nf->nf_net == net)
3939542e6a6STrond Myklebust 			list_move_tail(&nf->nf_lru, dst);
3949542e6a6STrond Myklebust 	}
3959542e6a6STrond Myklebust }
3969542e6a6STrond Myklebust 
3979542e6a6STrond Myklebust static void
3989542e6a6STrond Myklebust nfsd_file_dispose_list_delayed(struct list_head *dispose)
3999542e6a6STrond Myklebust {
4009542e6a6STrond Myklebust 	LIST_HEAD(list);
4019542e6a6STrond Myklebust 	struct nfsd_file *nf;
4029542e6a6STrond Myklebust 
4039542e6a6STrond Myklebust 	while(!list_empty(dispose)) {
4049542e6a6STrond Myklebust 		nf = list_first_entry(dispose, struct nfsd_file, nf_lru);
4059542e6a6STrond Myklebust 		nfsd_file_list_add_pernet(&list, dispose, nf->nf_net);
4069542e6a6STrond Myklebust 		nfsd_file_list_add_disposal(&list, nf->nf_net);
4079542e6a6STrond Myklebust 	}
4089542e6a6STrond Myklebust }
4099542e6a6STrond Myklebust 
41065294c1fSJeff Layton /*
41165294c1fSJeff Layton  * Note this can deadlock with nfsd_file_cache_purge.
41265294c1fSJeff Layton  */
41365294c1fSJeff Layton static enum lru_status
41465294c1fSJeff Layton nfsd_file_lru_cb(struct list_head *item, struct list_lru_one *lru,
41565294c1fSJeff Layton 		 spinlock_t *lock, void *arg)
41665294c1fSJeff Layton 	__releases(lock)
41765294c1fSJeff Layton 	__acquires(lock)
41865294c1fSJeff Layton {
41965294c1fSJeff Layton 	struct list_head *head = arg;
42065294c1fSJeff Layton 	struct nfsd_file *nf = list_entry(item, struct nfsd_file, nf_lru);
42165294c1fSJeff Layton 
42265294c1fSJeff Layton 	/*
42365294c1fSJeff Layton 	 * Do a lockless refcount check. The hashtable holds one reference, so
42465294c1fSJeff Layton 	 * we look to see if anything else has a reference, or if any have
42565294c1fSJeff Layton 	 * been put since the shrinker last ran. Those don't get unhashed and
42665294c1fSJeff Layton 	 * released.
42765294c1fSJeff Layton 	 *
42865294c1fSJeff Layton 	 * Note that in the put path, we set the flag and then decrement the
42965294c1fSJeff Layton 	 * counter. Here we check the counter and then test and clear the flag.
43065294c1fSJeff Layton 	 * That order is deliberate to ensure that we can do this locklessly.
43165294c1fSJeff Layton 	 */
432689827cdSTrond Myklebust 	if (refcount_read(&nf->nf_ref) > 1)
43365294c1fSJeff Layton 		goto out_skip;
434055b24a8STrond Myklebust 
435055b24a8STrond Myklebust 	/*
436055b24a8STrond Myklebust 	 * Don't throw out files that are still undergoing I/O or
437055b24a8STrond Myklebust 	 * that have uncleared errors pending.
438055b24a8STrond Myklebust 	 */
439055b24a8STrond Myklebust 	if (nfsd_file_check_writeback(nf))
440055b24a8STrond Myklebust 		goto out_skip;
441055b24a8STrond Myklebust 
44265294c1fSJeff Layton 	if (test_and_clear_bit(NFSD_FILE_REFERENCED, &nf->nf_flags))
443bd6e1cecSTrond Myklebust 		goto out_skip;
44465294c1fSJeff Layton 
44565294c1fSJeff Layton 	if (!test_and_clear_bit(NFSD_FILE_HASHED, &nf->nf_flags))
44665294c1fSJeff Layton 		goto out_skip;
44765294c1fSJeff Layton 
44865294c1fSJeff Layton 	list_lru_isolate_move(lru, &nf->nf_lru, head);
44965294c1fSJeff Layton 	return LRU_REMOVED;
45065294c1fSJeff Layton out_skip:
45165294c1fSJeff Layton 	return LRU_SKIP;
45265294c1fSJeff Layton }
45365294c1fSJeff Layton 
4549542e6a6STrond Myklebust static unsigned long
4559542e6a6STrond Myklebust nfsd_file_lru_walk_list(struct shrink_control *sc)
45665294c1fSJeff Layton {
4579542e6a6STrond Myklebust 	LIST_HEAD(head);
45836ebbdb9STrond Myklebust 	struct nfsd_file *nf;
4599542e6a6STrond Myklebust 	unsigned long ret;
46036ebbdb9STrond Myklebust 
4619542e6a6STrond Myklebust 	if (sc)
4629542e6a6STrond Myklebust 		ret = list_lru_shrink_walk(&nfsd_file_lru, sc,
4639542e6a6STrond Myklebust 				nfsd_file_lru_cb, &head);
4649542e6a6STrond Myklebust 	else
4659542e6a6STrond Myklebust 		ret = list_lru_walk(&nfsd_file_lru,
4669542e6a6STrond Myklebust 				nfsd_file_lru_cb,
4679542e6a6STrond Myklebust 				&head, LONG_MAX);
4689542e6a6STrond Myklebust 	list_for_each_entry(nf, &head, nf_lru) {
46965294c1fSJeff Layton 		spin_lock(&nfsd_file_hashtbl[nf->nf_hashval].nfb_lock);
47065294c1fSJeff Layton 		nfsd_file_do_unhash(nf);
47165294c1fSJeff Layton 		spin_unlock(&nfsd_file_hashtbl[nf->nf_hashval].nfb_lock);
47265294c1fSJeff Layton 	}
4739542e6a6STrond Myklebust 	nfsd_file_dispose_list_delayed(&head);
4749542e6a6STrond Myklebust 	return ret;
4759542e6a6STrond Myklebust }
4769542e6a6STrond Myklebust 
4779542e6a6STrond Myklebust static void
4789542e6a6STrond Myklebust nfsd_file_gc(void)
4799542e6a6STrond Myklebust {
4809542e6a6STrond Myklebust 	nfsd_file_lru_walk_list(NULL);
4819542e6a6STrond Myklebust }
4829542e6a6STrond Myklebust 
/*
 * Work handler: run a garbage-collection pass, then try to reschedule the
 * laundrette. @work is not used.
 */
static void
nfsd_file_gc_worker(struct work_struct *work)
{
	nfsd_file_gc();
	nfsd_file_schedule_laundrette();
}
48965294c1fSJeff Layton 
49065294c1fSJeff Layton static unsigned long
49165294c1fSJeff Layton nfsd_file_lru_count(struct shrinker *s, struct shrink_control *sc)
49265294c1fSJeff Layton {
49365294c1fSJeff Layton 	return list_lru_count(&nfsd_file_lru);
49465294c1fSJeff Layton }
49565294c1fSJeff Layton 
/*
 * Shrinker ->scan_objects callback: walk the LRU as bounded by @sc and
 * return the walk's result. @s is not used.
 */
static unsigned long
nfsd_file_lru_scan(struct shrinker *s, struct shrink_control *sc)
{
	return nfsd_file_lru_walk_list(sc);
}
50165294c1fSJeff Layton 
50265294c1fSJeff Layton static struct shrinker	nfsd_file_shrinker = {
50365294c1fSJeff Layton 	.scan_objects = nfsd_file_lru_scan,
50465294c1fSJeff Layton 	.count_objects = nfsd_file_lru_count,
50565294c1fSJeff Layton 	.seeks = 1,
50665294c1fSJeff Layton };
50765294c1fSJeff Layton 
50865294c1fSJeff Layton static void
50965294c1fSJeff Layton __nfsd_file_close_inode(struct inode *inode, unsigned int hashval,
51065294c1fSJeff Layton 			struct list_head *dispose)
51165294c1fSJeff Layton {
51265294c1fSJeff Layton 	struct nfsd_file	*nf;
51365294c1fSJeff Layton 	struct hlist_node	*tmp;
51465294c1fSJeff Layton 
51565294c1fSJeff Layton 	spin_lock(&nfsd_file_hashtbl[hashval].nfb_lock);
51665294c1fSJeff Layton 	hlist_for_each_entry_safe(nf, tmp, &nfsd_file_hashtbl[hashval].nfb_head, nf_node) {
51765294c1fSJeff Layton 		if (inode == nf->nf_inode)
51865294c1fSJeff Layton 			nfsd_file_unhash_and_release_locked(nf, dispose);
51965294c1fSJeff Layton 	}
52065294c1fSJeff Layton 	spin_unlock(&nfsd_file_hashtbl[hashval].nfb_lock);
52165294c1fSJeff Layton }
52265294c1fSJeff Layton 
52365294c1fSJeff Layton /**
52465294c1fSJeff Layton  * nfsd_file_close_inode_sync - attempt to forcibly close a nfsd_file
52565294c1fSJeff Layton  * @inode: inode of the file to attempt to remove
52665294c1fSJeff Layton  *
52765294c1fSJeff Layton  * Walk the whole hash bucket, looking for any files that correspond to "inode".
52865294c1fSJeff Layton  * If any do, then unhash them and put the hashtable reference to them and
52965294c1fSJeff Layton  * destroy any that had their last reference put. Also ensure that any of the
53065294c1fSJeff Layton  * fputs also have their final __fput done as well.
53165294c1fSJeff Layton  */
53265294c1fSJeff Layton void
53365294c1fSJeff Layton nfsd_file_close_inode_sync(struct inode *inode)
53465294c1fSJeff Layton {
53565294c1fSJeff Layton 	unsigned int		hashval = (unsigned int)hash_long(inode->i_ino,
53665294c1fSJeff Layton 						NFSD_FILE_HASH_BITS);
53765294c1fSJeff Layton 	LIST_HEAD(dispose);
53865294c1fSJeff Layton 
53965294c1fSJeff Layton 	__nfsd_file_close_inode(inode, hashval, &dispose);
54065294c1fSJeff Layton 	trace_nfsd_file_close_inode_sync(inode, hashval, !list_empty(&dispose));
54165294c1fSJeff Layton 	nfsd_file_dispose_list_sync(&dispose);
54265294c1fSJeff Layton }
54365294c1fSJeff Layton 
54465294c1fSJeff Layton /**
54565294c1fSJeff Layton  * nfsd_file_close_inode_sync - attempt to forcibly close a nfsd_file
54665294c1fSJeff Layton  * @inode: inode of the file to attempt to remove
54765294c1fSJeff Layton  *
54865294c1fSJeff Layton  * Walk the whole hash bucket, looking for any files that correspond to "inode".
54965294c1fSJeff Layton  * If any do, then unhash them and put the hashtable reference to them and
55065294c1fSJeff Layton  * destroy any that had their last reference put.
55165294c1fSJeff Layton  */
55265294c1fSJeff Layton static void
55365294c1fSJeff Layton nfsd_file_close_inode(struct inode *inode)
55465294c1fSJeff Layton {
55565294c1fSJeff Layton 	unsigned int		hashval = (unsigned int)hash_long(inode->i_ino,
55665294c1fSJeff Layton 						NFSD_FILE_HASH_BITS);
55765294c1fSJeff Layton 	LIST_HEAD(dispose);
55865294c1fSJeff Layton 
55965294c1fSJeff Layton 	__nfsd_file_close_inode(inode, hashval, &dispose);
56065294c1fSJeff Layton 	trace_nfsd_file_close_inode(inode, hashval, !list_empty(&dispose));
5619542e6a6STrond Myklebust 	nfsd_file_dispose_list_delayed(&dispose);
56265294c1fSJeff Layton }
56365294c1fSJeff Layton 
56465294c1fSJeff Layton /**
56565294c1fSJeff Layton  * nfsd_file_delayed_close - close unused nfsd_files
56665294c1fSJeff Layton  * @work: dummy
56765294c1fSJeff Layton  *
56865294c1fSJeff Layton  * Walk the LRU list and close any entries that have not been used since
56965294c1fSJeff Layton  * the last scan.
57065294c1fSJeff Layton  *
57165294c1fSJeff Layton  * Note this can deadlock with nfsd_file_cache_purge.
57265294c1fSJeff Layton  */
57365294c1fSJeff Layton static void
57465294c1fSJeff Layton nfsd_file_delayed_close(struct work_struct *work)
57565294c1fSJeff Layton {
57665294c1fSJeff Layton 	LIST_HEAD(head);
5779542e6a6STrond Myklebust 	struct nfsd_fcache_disposal *l = container_of(work,
5789542e6a6STrond Myklebust 			struct nfsd_fcache_disposal, work);
57965294c1fSJeff Layton 
5809542e6a6STrond Myklebust 	nfsd_file_list_remove_disposal(&head, l);
5819542e6a6STrond Myklebust 	nfsd_file_dispose_list(&head);
58265294c1fSJeff Layton }
58365294c1fSJeff Layton 
58465294c1fSJeff Layton static int
58565294c1fSJeff Layton nfsd_file_lease_notifier_call(struct notifier_block *nb, unsigned long arg,
58665294c1fSJeff Layton 			    void *data)
58765294c1fSJeff Layton {
58865294c1fSJeff Layton 	struct file_lock *fl = data;
58965294c1fSJeff Layton 
59065294c1fSJeff Layton 	/* Only close files for F_SETLEASE leases */
59165294c1fSJeff Layton 	if (fl->fl_flags & FL_LEASE)
59265294c1fSJeff Layton 		nfsd_file_close_inode_sync(file_inode(fl->fl_file));
59365294c1fSJeff Layton 	return 0;
59465294c1fSJeff Layton }
59565294c1fSJeff Layton 
59665294c1fSJeff Layton static struct notifier_block nfsd_file_lease_notifier = {
59765294c1fSJeff Layton 	.notifier_call = nfsd_file_lease_notifier_call,
59865294c1fSJeff Layton };
59965294c1fSJeff Layton 
60065294c1fSJeff Layton static int
601b9a1b977SAmir Goldstein nfsd_file_fsnotify_handle_event(struct fsnotify_mark *mark, u32 mask,
602b9a1b977SAmir Goldstein 				struct inode *inode, struct inode *dir,
603b9a1b977SAmir Goldstein 				const struct qstr *name)
60465294c1fSJeff Layton {
60565294c1fSJeff Layton 	trace_nfsd_file_fsnotify_handle_event(inode, mask);
60665294c1fSJeff Layton 
60765294c1fSJeff Layton 	/* Should be no marks on non-regular files */
60865294c1fSJeff Layton 	if (!S_ISREG(inode->i_mode)) {
60965294c1fSJeff Layton 		WARN_ON_ONCE(1);
61065294c1fSJeff Layton 		return 0;
61165294c1fSJeff Layton 	}
61265294c1fSJeff Layton 
61365294c1fSJeff Layton 	/* don't close files if this was not the last link */
61465294c1fSJeff Layton 	if (mask & FS_ATTRIB) {
61565294c1fSJeff Layton 		if (inode->i_nlink)
61665294c1fSJeff Layton 			return 0;
61765294c1fSJeff Layton 	}
61865294c1fSJeff Layton 
61965294c1fSJeff Layton 	nfsd_file_close_inode(inode);
62065294c1fSJeff Layton 	return 0;
62165294c1fSJeff Layton }
62265294c1fSJeff Layton 
62365294c1fSJeff Layton 
62465294c1fSJeff Layton static const struct fsnotify_ops nfsd_file_fsnotify_ops = {
625b9a1b977SAmir Goldstein 	.handle_inode_event = nfsd_file_fsnotify_handle_event,
62665294c1fSJeff Layton 	.free_mark = nfsd_file_mark_free,
62765294c1fSJeff Layton };
62865294c1fSJeff Layton 
62965294c1fSJeff Layton int
63065294c1fSJeff Layton nfsd_file_cache_init(void)
63165294c1fSJeff Layton {
63265294c1fSJeff Layton 	int		ret = -ENOMEM;
63365294c1fSJeff Layton 	unsigned int	i;
63465294c1fSJeff Layton 
63565294c1fSJeff Layton 	clear_bit(NFSD_FILE_SHUTDOWN, &nfsd_file_lru_flags);
63665294c1fSJeff Layton 
63765294c1fSJeff Layton 	if (nfsd_file_hashtbl)
63865294c1fSJeff Layton 		return 0;
63965294c1fSJeff Layton 
6409542e6a6STrond Myklebust 	nfsd_filecache_wq = alloc_workqueue("nfsd_filecache", 0, 0);
6419542e6a6STrond Myklebust 	if (!nfsd_filecache_wq)
6429542e6a6STrond Myklebust 		goto out;
6439542e6a6STrond Myklebust 
64465294c1fSJeff Layton 	nfsd_file_hashtbl = kcalloc(NFSD_FILE_HASH_SIZE,
64565294c1fSJeff Layton 				sizeof(*nfsd_file_hashtbl), GFP_KERNEL);
64665294c1fSJeff Layton 	if (!nfsd_file_hashtbl) {
64765294c1fSJeff Layton 		pr_err("nfsd: unable to allocate nfsd_file_hashtbl\n");
64865294c1fSJeff Layton 		goto out_err;
64965294c1fSJeff Layton 	}
65065294c1fSJeff Layton 
65165294c1fSJeff Layton 	nfsd_file_slab = kmem_cache_create("nfsd_file",
65265294c1fSJeff Layton 				sizeof(struct nfsd_file), 0, 0, NULL);
65365294c1fSJeff Layton 	if (!nfsd_file_slab) {
65465294c1fSJeff Layton 		pr_err("nfsd: unable to create nfsd_file_slab\n");
65565294c1fSJeff Layton 		goto out_err;
65665294c1fSJeff Layton 	}
65765294c1fSJeff Layton 
65865294c1fSJeff Layton 	nfsd_file_mark_slab = kmem_cache_create("nfsd_file_mark",
65965294c1fSJeff Layton 					sizeof(struct nfsd_file_mark), 0, 0, NULL);
66065294c1fSJeff Layton 	if (!nfsd_file_mark_slab) {
66165294c1fSJeff Layton 		pr_err("nfsd: unable to create nfsd_file_mark_slab\n");
66265294c1fSJeff Layton 		goto out_err;
66365294c1fSJeff Layton 	}
66465294c1fSJeff Layton 
66565294c1fSJeff Layton 
66665294c1fSJeff Layton 	ret = list_lru_init(&nfsd_file_lru);
66765294c1fSJeff Layton 	if (ret) {
66865294c1fSJeff Layton 		pr_err("nfsd: failed to init nfsd_file_lru: %d\n", ret);
66965294c1fSJeff Layton 		goto out_err;
67065294c1fSJeff Layton 	}
67165294c1fSJeff Layton 
67265294c1fSJeff Layton 	ret = register_shrinker(&nfsd_file_shrinker);
67365294c1fSJeff Layton 	if (ret) {
67465294c1fSJeff Layton 		pr_err("nfsd: failed to register nfsd_file_shrinker: %d\n", ret);
67565294c1fSJeff Layton 		goto out_lru;
67665294c1fSJeff Layton 	}
67765294c1fSJeff Layton 
67865294c1fSJeff Layton 	ret = lease_register_notifier(&nfsd_file_lease_notifier);
67965294c1fSJeff Layton 	if (ret) {
68065294c1fSJeff Layton 		pr_err("nfsd: unable to register lease notifier: %d\n", ret);
68165294c1fSJeff Layton 		goto out_shrinker;
68265294c1fSJeff Layton 	}
68365294c1fSJeff Layton 
68465294c1fSJeff Layton 	nfsd_file_fsnotify_group = fsnotify_alloc_group(&nfsd_file_fsnotify_ops);
68565294c1fSJeff Layton 	if (IS_ERR(nfsd_file_fsnotify_group)) {
68665294c1fSJeff Layton 		pr_err("nfsd: unable to create fsnotify group: %ld\n",
68765294c1fSJeff Layton 			PTR_ERR(nfsd_file_fsnotify_group));
68865294c1fSJeff Layton 		nfsd_file_fsnotify_group = NULL;
68965294c1fSJeff Layton 		goto out_notifier;
69065294c1fSJeff Layton 	}
69165294c1fSJeff Layton 
69265294c1fSJeff Layton 	for (i = 0; i < NFSD_FILE_HASH_SIZE; i++) {
69365294c1fSJeff Layton 		INIT_HLIST_HEAD(&nfsd_file_hashtbl[i].nfb_head);
69465294c1fSJeff Layton 		spin_lock_init(&nfsd_file_hashtbl[i].nfb_lock);
69565294c1fSJeff Layton 	}
69665294c1fSJeff Layton 
6979542e6a6STrond Myklebust 	INIT_DELAYED_WORK(&nfsd_filecache_laundrette, nfsd_file_gc_worker);
69865294c1fSJeff Layton out:
69965294c1fSJeff Layton 	return ret;
70065294c1fSJeff Layton out_notifier:
70165294c1fSJeff Layton 	lease_unregister_notifier(&nfsd_file_lease_notifier);
70265294c1fSJeff Layton out_shrinker:
70365294c1fSJeff Layton 	unregister_shrinker(&nfsd_file_shrinker);
70465294c1fSJeff Layton out_lru:
70565294c1fSJeff Layton 	list_lru_destroy(&nfsd_file_lru);
70665294c1fSJeff Layton out_err:
70765294c1fSJeff Layton 	kmem_cache_destroy(nfsd_file_slab);
70865294c1fSJeff Layton 	nfsd_file_slab = NULL;
70965294c1fSJeff Layton 	kmem_cache_destroy(nfsd_file_mark_slab);
71065294c1fSJeff Layton 	nfsd_file_mark_slab = NULL;
71165294c1fSJeff Layton 	kfree(nfsd_file_hashtbl);
71265294c1fSJeff Layton 	nfsd_file_hashtbl = NULL;
7139542e6a6STrond Myklebust 	destroy_workqueue(nfsd_filecache_wq);
7149542e6a6STrond Myklebust 	nfsd_filecache_wq = NULL;
71565294c1fSJeff Layton 	goto out;
71665294c1fSJeff Layton }
71765294c1fSJeff Layton 
71865294c1fSJeff Layton /*
71965294c1fSJeff Layton  * Note this can deadlock with nfsd_file_lru_cb.
72065294c1fSJeff Layton  */
72165294c1fSJeff Layton void
7225e113224STrond Myklebust nfsd_file_cache_purge(struct net *net)
72365294c1fSJeff Layton {
72465294c1fSJeff Layton 	unsigned int		i;
72565294c1fSJeff Layton 	struct nfsd_file	*nf;
7265e113224STrond Myklebust 	struct hlist_node	*next;
72765294c1fSJeff Layton 	LIST_HEAD(dispose);
72865294c1fSJeff Layton 	bool del;
72965294c1fSJeff Layton 
73065294c1fSJeff Layton 	if (!nfsd_file_hashtbl)
73165294c1fSJeff Layton 		return;
73265294c1fSJeff Layton 
73365294c1fSJeff Layton 	for (i = 0; i < NFSD_FILE_HASH_SIZE; i++) {
7345e113224STrond Myklebust 		struct nfsd_fcache_bucket *nfb = &nfsd_file_hashtbl[i];
7355e113224STrond Myklebust 
7365e113224STrond Myklebust 		spin_lock(&nfb->nfb_lock);
7375e113224STrond Myklebust 		hlist_for_each_entry_safe(nf, next, &nfb->nfb_head, nf_node) {
7385e113224STrond Myklebust 			if (net && nf->nf_net != net)
7395e113224STrond Myklebust 				continue;
74065294c1fSJeff Layton 			del = nfsd_file_unhash_and_release_locked(nf, &dispose);
74165294c1fSJeff Layton 
74265294c1fSJeff Layton 			/*
74365294c1fSJeff Layton 			 * Deadlock detected! Something marked this entry as
74465294c1fSJeff Layton 			 * unhased, but hasn't removed it from the hash list.
74565294c1fSJeff Layton 			 */
74665294c1fSJeff Layton 			WARN_ON_ONCE(!del);
74765294c1fSJeff Layton 		}
7485e113224STrond Myklebust 		spin_unlock(&nfb->nfb_lock);
74965294c1fSJeff Layton 		nfsd_file_dispose_list(&dispose);
75065294c1fSJeff Layton 	}
75165294c1fSJeff Layton }
75265294c1fSJeff Layton 
7539542e6a6STrond Myklebust static struct nfsd_fcache_disposal *
7549542e6a6STrond Myklebust nfsd_alloc_fcache_disposal(struct net *net)
7559542e6a6STrond Myklebust {
7569542e6a6STrond Myklebust 	struct nfsd_fcache_disposal *l;
7579542e6a6STrond Myklebust 
7589542e6a6STrond Myklebust 	l = kmalloc(sizeof(*l), GFP_KERNEL);
7599542e6a6STrond Myklebust 	if (!l)
7609542e6a6STrond Myklebust 		return NULL;
7619542e6a6STrond Myklebust 	INIT_WORK(&l->work, nfsd_file_delayed_close);
7629542e6a6STrond Myklebust 	l->net = net;
7639542e6a6STrond Myklebust 	spin_lock_init(&l->lock);
7649542e6a6STrond Myklebust 	INIT_LIST_HEAD(&l->freeme);
7659542e6a6STrond Myklebust 	return l;
7669542e6a6STrond Myklebust }
7679542e6a6STrond Myklebust 
7689542e6a6STrond Myklebust static void
7699542e6a6STrond Myklebust nfsd_free_fcache_disposal(struct nfsd_fcache_disposal *l)
7709542e6a6STrond Myklebust {
7719542e6a6STrond Myklebust 	rcu_assign_pointer(l->net, NULL);
7729542e6a6STrond Myklebust 	cancel_work_sync(&l->work);
7739542e6a6STrond Myklebust 	nfsd_file_dispose_list(&l->freeme);
7749542e6a6STrond Myklebust 	kfree_rcu(l, rcu);
7759542e6a6STrond Myklebust }
7769542e6a6STrond Myklebust 
7779542e6a6STrond Myklebust static void
7789542e6a6STrond Myklebust nfsd_add_fcache_disposal(struct nfsd_fcache_disposal *l)
7799542e6a6STrond Myklebust {
7809542e6a6STrond Myklebust 	spin_lock(&laundrette_lock);
7819542e6a6STrond Myklebust 	list_add_tail_rcu(&l->list, &laundrettes);
7829542e6a6STrond Myklebust 	spin_unlock(&laundrette_lock);
7839542e6a6STrond Myklebust }
7849542e6a6STrond Myklebust 
7859542e6a6STrond Myklebust static void
7869542e6a6STrond Myklebust nfsd_del_fcache_disposal(struct nfsd_fcache_disposal *l)
7879542e6a6STrond Myklebust {
7889542e6a6STrond Myklebust 	spin_lock(&laundrette_lock);
7899542e6a6STrond Myklebust 	list_del_rcu(&l->list);
7909542e6a6STrond Myklebust 	spin_unlock(&laundrette_lock);
7919542e6a6STrond Myklebust }
7929542e6a6STrond Myklebust 
7939542e6a6STrond Myklebust static int
7949542e6a6STrond Myklebust nfsd_alloc_fcache_disposal_net(struct net *net)
7959542e6a6STrond Myklebust {
7969542e6a6STrond Myklebust 	struct nfsd_fcache_disposal *l;
7979542e6a6STrond Myklebust 
7989542e6a6STrond Myklebust 	l = nfsd_alloc_fcache_disposal(net);
7999542e6a6STrond Myklebust 	if (!l)
8009542e6a6STrond Myklebust 		return -ENOMEM;
8019542e6a6STrond Myklebust 	nfsd_add_fcache_disposal(l);
8029542e6a6STrond Myklebust 	return 0;
8039542e6a6STrond Myklebust }
8049542e6a6STrond Myklebust 
8059542e6a6STrond Myklebust static void
8069542e6a6STrond Myklebust nfsd_free_fcache_disposal_net(struct net *net)
8079542e6a6STrond Myklebust {
8089542e6a6STrond Myklebust 	struct nfsd_fcache_disposal *l;
8099542e6a6STrond Myklebust 
8109542e6a6STrond Myklebust 	rcu_read_lock();
8119542e6a6STrond Myklebust 	list_for_each_entry_rcu(l, &laundrettes, list) {
8129542e6a6STrond Myklebust 		if (l->net != net)
8139542e6a6STrond Myklebust 			continue;
8149542e6a6STrond Myklebust 		nfsd_del_fcache_disposal(l);
8159542e6a6STrond Myklebust 		rcu_read_unlock();
8169542e6a6STrond Myklebust 		nfsd_free_fcache_disposal(l);
8179542e6a6STrond Myklebust 		return;
8189542e6a6STrond Myklebust 	}
8199542e6a6STrond Myklebust 	rcu_read_unlock();
8209542e6a6STrond Myklebust }
8219542e6a6STrond Myklebust 
/*
 * Per-namespace start-up of the file cache: sets up the disposal
 * context for @net. Returns 0 on success or -ENOMEM.
 */
int
nfsd_file_cache_start_net(struct net *net)
{
	int err = nfsd_alloc_fcache_disposal_net(net);

	return err;
}
8279542e6a6STrond Myklebust 
/*
 * Per-namespace shutdown of the file cache: purge the cache entries
 * that belong to @net, then release the namespace's disposal context.
 */
void
nfsd_file_cache_shutdown_net(struct net *net)
{
	/* Purge first, then drop the disposal context. */
	nfsd_file_cache_purge(net);
	nfsd_free_fcache_disposal_net(net);
}
8349542e6a6STrond Myklebust 
83565294c1fSJeff Layton void
83665294c1fSJeff Layton nfsd_file_cache_shutdown(void)
83765294c1fSJeff Layton {
83865294c1fSJeff Layton 	set_bit(NFSD_FILE_SHUTDOWN, &nfsd_file_lru_flags);
83965294c1fSJeff Layton 
84065294c1fSJeff Layton 	lease_unregister_notifier(&nfsd_file_lease_notifier);
84165294c1fSJeff Layton 	unregister_shrinker(&nfsd_file_shrinker);
84265294c1fSJeff Layton 	/*
84365294c1fSJeff Layton 	 * make sure all callers of nfsd_file_lru_cb are done before
84465294c1fSJeff Layton 	 * calling nfsd_file_cache_purge
84565294c1fSJeff Layton 	 */
84665294c1fSJeff Layton 	cancel_delayed_work_sync(&nfsd_filecache_laundrette);
8475e113224STrond Myklebust 	nfsd_file_cache_purge(NULL);
84865294c1fSJeff Layton 	list_lru_destroy(&nfsd_file_lru);
84965294c1fSJeff Layton 	rcu_barrier();
85065294c1fSJeff Layton 	fsnotify_put_group(nfsd_file_fsnotify_group);
85165294c1fSJeff Layton 	nfsd_file_fsnotify_group = NULL;
85265294c1fSJeff Layton 	kmem_cache_destroy(nfsd_file_slab);
85365294c1fSJeff Layton 	nfsd_file_slab = NULL;
85465294c1fSJeff Layton 	fsnotify_wait_marks_destroyed();
85565294c1fSJeff Layton 	kmem_cache_destroy(nfsd_file_mark_slab);
85665294c1fSJeff Layton 	nfsd_file_mark_slab = NULL;
85765294c1fSJeff Layton 	kfree(nfsd_file_hashtbl);
85865294c1fSJeff Layton 	nfsd_file_hashtbl = NULL;
8599542e6a6STrond Myklebust 	destroy_workqueue(nfsd_filecache_wq);
8609542e6a6STrond Myklebust 	nfsd_filecache_wq = NULL;
86165294c1fSJeff Layton }
86265294c1fSJeff Layton 
86365294c1fSJeff Layton static bool
86465294c1fSJeff Layton nfsd_match_cred(const struct cred *c1, const struct cred *c2)
86565294c1fSJeff Layton {
86665294c1fSJeff Layton 	int i;
86765294c1fSJeff Layton 
86865294c1fSJeff Layton 	if (!uid_eq(c1->fsuid, c2->fsuid))
86965294c1fSJeff Layton 		return false;
87065294c1fSJeff Layton 	if (!gid_eq(c1->fsgid, c2->fsgid))
87165294c1fSJeff Layton 		return false;
87265294c1fSJeff Layton 	if (c1->group_info == NULL || c2->group_info == NULL)
87365294c1fSJeff Layton 		return c1->group_info == c2->group_info;
87465294c1fSJeff Layton 	if (c1->group_info->ngroups != c2->group_info->ngroups)
87565294c1fSJeff Layton 		return false;
87665294c1fSJeff Layton 	for (i = 0; i < c1->group_info->ngroups; i++) {
87765294c1fSJeff Layton 		if (!gid_eq(c1->group_info->gid[i], c2->group_info->gid[i]))
87865294c1fSJeff Layton 			return false;
87965294c1fSJeff Layton 	}
88065294c1fSJeff Layton 	return true;
88165294c1fSJeff Layton }
88265294c1fSJeff Layton 
88365294c1fSJeff Layton static struct nfsd_file *
88465294c1fSJeff Layton nfsd_file_find_locked(struct inode *inode, unsigned int may_flags,
8855e113224STrond Myklebust 			unsigned int hashval, struct net *net)
88665294c1fSJeff Layton {
88765294c1fSJeff Layton 	struct nfsd_file *nf;
88865294c1fSJeff Layton 	unsigned char need = may_flags & NFSD_FILE_MAY_MASK;
88965294c1fSJeff Layton 
89065294c1fSJeff Layton 	hlist_for_each_entry_rcu(nf, &nfsd_file_hashtbl[hashval].nfb_head,
891057a2274SMadhuparna Bhowmik 				 nf_node, lockdep_is_held(&nfsd_file_hashtbl[hashval].nfb_lock)) {
892*ae3c57b5SJ. Bruce Fields 		if (nf->nf_may != need)
89365294c1fSJeff Layton 			continue;
89465294c1fSJeff Layton 		if (nf->nf_inode != inode)
89565294c1fSJeff Layton 			continue;
8965e113224STrond Myklebust 		if (nf->nf_net != net)
8975e113224STrond Myklebust 			continue;
89865294c1fSJeff Layton 		if (!nfsd_match_cred(nf->nf_cred, current_cred()))
89965294c1fSJeff Layton 			continue;
90065294c1fSJeff Layton 		if (nfsd_file_get(nf) != NULL)
90165294c1fSJeff Layton 			return nf;
90265294c1fSJeff Layton 	}
90365294c1fSJeff Layton 	return NULL;
90465294c1fSJeff Layton }
90565294c1fSJeff Layton 
90665294c1fSJeff Layton /**
90765294c1fSJeff Layton  * nfsd_file_is_cached - are there any cached open files for this fh?
90865294c1fSJeff Layton  * @inode: inode of the file to check
90965294c1fSJeff Layton  *
91065294c1fSJeff Layton  * Scan the hashtable for open files that match this fh. Returns true if there
91165294c1fSJeff Layton  * are any, and false if not.
91265294c1fSJeff Layton  */
91365294c1fSJeff Layton bool
91465294c1fSJeff Layton nfsd_file_is_cached(struct inode *inode)
91565294c1fSJeff Layton {
91665294c1fSJeff Layton 	bool			ret = false;
91765294c1fSJeff Layton 	struct nfsd_file	*nf;
91865294c1fSJeff Layton 	unsigned int		hashval;
91965294c1fSJeff Layton 
92065294c1fSJeff Layton         hashval = (unsigned int)hash_long(inode->i_ino, NFSD_FILE_HASH_BITS);
92165294c1fSJeff Layton 
92265294c1fSJeff Layton 	rcu_read_lock();
92365294c1fSJeff Layton 	hlist_for_each_entry_rcu(nf, &nfsd_file_hashtbl[hashval].nfb_head,
92465294c1fSJeff Layton 				 nf_node) {
92565294c1fSJeff Layton 		if (inode == nf->nf_inode) {
92665294c1fSJeff Layton 			ret = true;
92765294c1fSJeff Layton 			break;
92865294c1fSJeff Layton 		}
92965294c1fSJeff Layton 	}
93065294c1fSJeff Layton 	rcu_read_unlock();
93165294c1fSJeff Layton 	trace_nfsd_file_is_cached(inode, hashval, (int)ret);
93265294c1fSJeff Layton 	return ret;
93365294c1fSJeff Layton }
93465294c1fSJeff Layton 
93565294c1fSJeff Layton __be32
93665294c1fSJeff Layton nfsd_file_acquire(struct svc_rqst *rqstp, struct svc_fh *fhp,
93765294c1fSJeff Layton 		  unsigned int may_flags, struct nfsd_file **pnf)
93865294c1fSJeff Layton {
93965294c1fSJeff Layton 	__be32	status;
9405e113224STrond Myklebust 	struct net *net = SVC_NET(rqstp);
94165294c1fSJeff Layton 	struct nfsd_file *nf, *new;
94265294c1fSJeff Layton 	struct inode *inode;
94365294c1fSJeff Layton 	unsigned int hashval;
94428c7d86bSTrond Myklebust 	bool retry = true;
94565294c1fSJeff Layton 
94665294c1fSJeff Layton 	/* FIXME: skip this if fh_dentry is already set? */
94765294c1fSJeff Layton 	status = fh_verify(rqstp, fhp, S_IFREG,
94865294c1fSJeff Layton 				may_flags|NFSD_MAY_OWNER_OVERRIDE);
94965294c1fSJeff Layton 	if (status != nfs_ok)
95065294c1fSJeff Layton 		return status;
95165294c1fSJeff Layton 
95265294c1fSJeff Layton 	inode = d_inode(fhp->fh_dentry);
95365294c1fSJeff Layton 	hashval = (unsigned int)hash_long(inode->i_ino, NFSD_FILE_HASH_BITS);
95465294c1fSJeff Layton retry:
95565294c1fSJeff Layton 	rcu_read_lock();
9565e113224STrond Myklebust 	nf = nfsd_file_find_locked(inode, may_flags, hashval, net);
95765294c1fSJeff Layton 	rcu_read_unlock();
95865294c1fSJeff Layton 	if (nf)
95965294c1fSJeff Layton 		goto wait_for_construction;
96065294c1fSJeff Layton 
9615e113224STrond Myklebust 	new = nfsd_file_alloc(inode, may_flags, hashval, net);
96265294c1fSJeff Layton 	if (!new) {
96365294c1fSJeff Layton 		trace_nfsd_file_acquire(rqstp, hashval, inode, may_flags,
96465294c1fSJeff Layton 					NULL, nfserr_jukebox);
96565294c1fSJeff Layton 		return nfserr_jukebox;
96665294c1fSJeff Layton 	}
96765294c1fSJeff Layton 
96865294c1fSJeff Layton 	spin_lock(&nfsd_file_hashtbl[hashval].nfb_lock);
9695e113224STrond Myklebust 	nf = nfsd_file_find_locked(inode, may_flags, hashval, net);
97065294c1fSJeff Layton 	if (nf == NULL)
97165294c1fSJeff Layton 		goto open_file;
97265294c1fSJeff Layton 	spin_unlock(&nfsd_file_hashtbl[hashval].nfb_lock);
97365294c1fSJeff Layton 	nfsd_file_slab_free(&new->nf_rcu);
97465294c1fSJeff Layton 
97565294c1fSJeff Layton wait_for_construction:
97665294c1fSJeff Layton 	wait_on_bit(&nf->nf_flags, NFSD_FILE_PENDING, TASK_UNINTERRUPTIBLE);
97765294c1fSJeff Layton 
97865294c1fSJeff Layton 	/* Did construction of this file fail? */
97965294c1fSJeff Layton 	if (!test_bit(NFSD_FILE_HASHED, &nf->nf_flags)) {
98028c7d86bSTrond Myklebust 		if (!retry) {
98128c7d86bSTrond Myklebust 			status = nfserr_jukebox;
98228c7d86bSTrond Myklebust 			goto out;
98328c7d86bSTrond Myklebust 		}
98428c7d86bSTrond Myklebust 		retry = false;
98565294c1fSJeff Layton 		nfsd_file_put_noref(nf);
98665294c1fSJeff Layton 		goto retry;
98765294c1fSJeff Layton 	}
98865294c1fSJeff Layton 
98965294c1fSJeff Layton 	this_cpu_inc(nfsd_file_cache_hits);
99065294c1fSJeff Layton 
99165294c1fSJeff Layton 	if (!(may_flags & NFSD_MAY_NOT_BREAK_LEASE)) {
99265294c1fSJeff Layton 		bool write = (may_flags & NFSD_MAY_WRITE);
99365294c1fSJeff Layton 
99465294c1fSJeff Layton 		if (test_bit(NFSD_FILE_BREAK_READ, &nf->nf_flags) ||
99565294c1fSJeff Layton 		    (test_bit(NFSD_FILE_BREAK_WRITE, &nf->nf_flags) && write)) {
99665294c1fSJeff Layton 			status = nfserrno(nfsd_open_break_lease(
99765294c1fSJeff Layton 					file_inode(nf->nf_file), may_flags));
99865294c1fSJeff Layton 			if (status == nfs_ok) {
99965294c1fSJeff Layton 				clear_bit(NFSD_FILE_BREAK_READ, &nf->nf_flags);
100065294c1fSJeff Layton 				if (write)
100165294c1fSJeff Layton 					clear_bit(NFSD_FILE_BREAK_WRITE,
100265294c1fSJeff Layton 						  &nf->nf_flags);
100365294c1fSJeff Layton 			}
100465294c1fSJeff Layton 		}
100565294c1fSJeff Layton 	}
100665294c1fSJeff Layton out:
100765294c1fSJeff Layton 	if (status == nfs_ok) {
100865294c1fSJeff Layton 		*pnf = nf;
100965294c1fSJeff Layton 	} else {
101065294c1fSJeff Layton 		nfsd_file_put(nf);
101165294c1fSJeff Layton 		nf = NULL;
101265294c1fSJeff Layton 	}
101365294c1fSJeff Layton 
101465294c1fSJeff Layton 	trace_nfsd_file_acquire(rqstp, hashval, inode, may_flags, nf, status);
101565294c1fSJeff Layton 	return status;
101665294c1fSJeff Layton open_file:
101765294c1fSJeff Layton 	nf = new;
101865294c1fSJeff Layton 	/* Take reference for the hashtable */
1019689827cdSTrond Myklebust 	refcount_inc(&nf->nf_ref);
102065294c1fSJeff Layton 	__set_bit(NFSD_FILE_HASHED, &nf->nf_flags);
102165294c1fSJeff Layton 	__set_bit(NFSD_FILE_PENDING, &nf->nf_flags);
102265294c1fSJeff Layton 	list_lru_add(&nfsd_file_lru, &nf->nf_lru);
102365294c1fSJeff Layton 	hlist_add_head_rcu(&nf->nf_node, &nfsd_file_hashtbl[hashval].nfb_head);
102465294c1fSJeff Layton 	++nfsd_file_hashtbl[hashval].nfb_count;
102565294c1fSJeff Layton 	nfsd_file_hashtbl[hashval].nfb_maxcount = max(nfsd_file_hashtbl[hashval].nfb_maxcount,
102665294c1fSJeff Layton 			nfsd_file_hashtbl[hashval].nfb_count);
102765294c1fSJeff Layton 	spin_unlock(&nfsd_file_hashtbl[hashval].nfb_lock);
10289542e6a6STrond Myklebust 	if (atomic_long_inc_return(&nfsd_filecache_count) >= NFSD_FILE_LRU_THRESHOLD)
10299542e6a6STrond Myklebust 		nfsd_file_gc();
103065294c1fSJeff Layton 
103165294c1fSJeff Layton 	nf->nf_mark = nfsd_file_mark_find_or_create(nf);
103265294c1fSJeff Layton 	if (nf->nf_mark)
103365294c1fSJeff Layton 		status = nfsd_open_verified(rqstp, fhp, S_IFREG,
103465294c1fSJeff Layton 				may_flags, &nf->nf_file);
103565294c1fSJeff Layton 	else
103665294c1fSJeff Layton 		status = nfserr_jukebox;
103765294c1fSJeff Layton 	/*
103865294c1fSJeff Layton 	 * If construction failed, or we raced with a call to unlink()
103965294c1fSJeff Layton 	 * then unhash.
104065294c1fSJeff Layton 	 */
104165294c1fSJeff Layton 	if (status != nfs_ok || inode->i_nlink == 0) {
104265294c1fSJeff Layton 		bool do_free;
104365294c1fSJeff Layton 		spin_lock(&nfsd_file_hashtbl[hashval].nfb_lock);
104465294c1fSJeff Layton 		do_free = nfsd_file_unhash(nf);
104565294c1fSJeff Layton 		spin_unlock(&nfsd_file_hashtbl[hashval].nfb_lock);
104665294c1fSJeff Layton 		if (do_free)
104765294c1fSJeff Layton 			nfsd_file_put_noref(nf);
104865294c1fSJeff Layton 	}
104965294c1fSJeff Layton 	clear_bit_unlock(NFSD_FILE_PENDING, &nf->nf_flags);
105065294c1fSJeff Layton 	smp_mb__after_atomic();
105165294c1fSJeff Layton 	wake_up_bit(&nf->nf_flags, NFSD_FILE_PENDING);
105265294c1fSJeff Layton 	goto out;
105365294c1fSJeff Layton }
105465294c1fSJeff Layton 
105565294c1fSJeff Layton /*
105665294c1fSJeff Layton  * Note that fields may be added, removed or reordered in the future. Programs
105765294c1fSJeff Layton  * scraping this file for info should test the labels to ensure they're
105865294c1fSJeff Layton  * getting the correct field.
105965294c1fSJeff Layton  */
106065294c1fSJeff Layton static int nfsd_file_cache_stats_show(struct seq_file *m, void *v)
106165294c1fSJeff Layton {
106265294c1fSJeff Layton 	unsigned int i, count = 0, longest = 0;
106365294c1fSJeff Layton 	unsigned long hits = 0;
106465294c1fSJeff Layton 
106565294c1fSJeff Layton 	/*
106665294c1fSJeff Layton 	 * No need for spinlocks here since we're not terribly interested in
106765294c1fSJeff Layton 	 * accuracy. We do take the nfsd_mutex simply to ensure that we
106865294c1fSJeff Layton 	 * don't end up racing with server shutdown
106965294c1fSJeff Layton 	 */
107065294c1fSJeff Layton 	mutex_lock(&nfsd_mutex);
107165294c1fSJeff Layton 	if (nfsd_file_hashtbl) {
107265294c1fSJeff Layton 		for (i = 0; i < NFSD_FILE_HASH_SIZE; i++) {
107365294c1fSJeff Layton 			count += nfsd_file_hashtbl[i].nfb_count;
107465294c1fSJeff Layton 			longest = max(longest, nfsd_file_hashtbl[i].nfb_count);
107565294c1fSJeff Layton 		}
107665294c1fSJeff Layton 	}
107765294c1fSJeff Layton 	mutex_unlock(&nfsd_mutex);
107865294c1fSJeff Layton 
107965294c1fSJeff Layton 	for_each_possible_cpu(i)
108065294c1fSJeff Layton 		hits += per_cpu(nfsd_file_cache_hits, i);
108165294c1fSJeff Layton 
108265294c1fSJeff Layton 	seq_printf(m, "total entries: %u\n", count);
108365294c1fSJeff Layton 	seq_printf(m, "longest chain: %u\n", longest);
108465294c1fSJeff Layton 	seq_printf(m, "cache hits:    %lu\n", hits);
108565294c1fSJeff Layton 	return 0;
108665294c1fSJeff Layton }
108765294c1fSJeff Layton 
108865294c1fSJeff Layton int nfsd_file_cache_stats_open(struct inode *inode, struct file *file)
108965294c1fSJeff Layton {
109065294c1fSJeff Layton 	return single_open(file, nfsd_file_cache_stats_show, NULL);
109165294c1fSJeff Layton }
1092