165294c1fSJeff Layton /* 265294c1fSJeff Layton * Open file cache. 365294c1fSJeff Layton * 465294c1fSJeff Layton * (c) 2015 - Jeff Layton <jeff.layton@primarydata.com> 565294c1fSJeff Layton */ 665294c1fSJeff Layton 765294c1fSJeff Layton #include <linux/hash.h> 865294c1fSJeff Layton #include <linux/slab.h> 965294c1fSJeff Layton #include <linux/file.h> 10cbcc268bSMatthew Wilcox (Oracle) #include <linux/pagemap.h> 1165294c1fSJeff Layton #include <linux/sched.h> 1265294c1fSJeff Layton #include <linux/list_lru.h> 1365294c1fSJeff Layton #include <linux/fsnotify_backend.h> 1465294c1fSJeff Layton #include <linux/fsnotify.h> 1565294c1fSJeff Layton #include <linux/seq_file.h> 1665294c1fSJeff Layton 1765294c1fSJeff Layton #include "vfs.h" 1865294c1fSJeff Layton #include "nfsd.h" 1965294c1fSJeff Layton #include "nfsfh.h" 205e113224STrond Myklebust #include "netns.h" 2165294c1fSJeff Layton #include "filecache.h" 2265294c1fSJeff Layton #include "trace.h" 2365294c1fSJeff Layton 2465294c1fSJeff Layton #define NFSDDBG_FACILITY NFSDDBG_FH 2565294c1fSJeff Layton 2665294c1fSJeff Layton /* FIXME: dynamically size this for the machine somehow? */ 2765294c1fSJeff Layton #define NFSD_FILE_HASH_BITS 12 2865294c1fSJeff Layton #define NFSD_FILE_HASH_SIZE (1 << NFSD_FILE_HASH_BITS) 2965294c1fSJeff Layton #define NFSD_LAUNDRETTE_DELAY (2 * HZ) 3065294c1fSJeff Layton 3165294c1fSJeff Layton #define NFSD_FILE_SHUTDOWN (1) 3265294c1fSJeff Layton #define NFSD_FILE_LRU_THRESHOLD (4096UL) 3365294c1fSJeff Layton #define NFSD_FILE_LRU_LIMIT (NFSD_FILE_LRU_THRESHOLD << 2) 3465294c1fSJeff Layton 3565294c1fSJeff Layton /* We only care about NFSD_MAY_READ/WRITE for this cache */ 3665294c1fSJeff Layton #define NFSD_FILE_MAY_MASK (NFSD_MAY_READ|NFSD_MAY_WRITE) 3765294c1fSJeff Layton 3865294c1fSJeff Layton struct nfsd_fcache_bucket { 3965294c1fSJeff Layton struct hlist_head nfb_head; 4065294c1fSJeff Layton spinlock_t nfb_lock; 4165294c1fSJeff Layton unsigned int nfb_count; 4265294c1fSJeff Layton unsigned int nfb_maxcount; 4365294c1fSJeff Layton }; 4465294c1fSJeff Layton 4565294c1fSJeff Layton static DEFINE_PER_CPU(unsigned long, nfsd_file_cache_hits); 4629d4bdbbSChuck Lever static DEFINE_PER_CPU(unsigned long, nfsd_file_acquisitions); 47d6329327SChuck Lever static DEFINE_PER_CPU(unsigned long, nfsd_file_releases); 48904940e9SChuck Lever static DEFINE_PER_CPU(unsigned long, nfsd_file_total_age); 4965294c1fSJeff Layton 509542e6a6STrond Myklebust struct nfsd_fcache_disposal { 519542e6a6STrond Myklebust struct work_struct work; 529542e6a6STrond Myklebust spinlock_t lock; 539542e6a6STrond Myklebust struct list_head freeme; 549542e6a6STrond Myklebust }; 559542e6a6STrond Myklebust 5650d0def9SChen Zhou static struct workqueue_struct *nfsd_filecache_wq __read_mostly; 579542e6a6STrond Myklebust 5865294c1fSJeff Layton static struct kmem_cache *nfsd_file_slab; 5965294c1fSJeff Layton static struct kmem_cache *nfsd_file_mark_slab; 6065294c1fSJeff Layton static struct nfsd_fcache_bucket *nfsd_file_hashtbl; 6165294c1fSJeff Layton static struct list_lru nfsd_file_lru; 6265294c1fSJeff Layton static long nfsd_file_lru_flags; 6365294c1fSJeff Layton static struct fsnotify_group *nfsd_file_fsnotify_group; 6465294c1fSJeff Layton static atomic_long_t nfsd_filecache_count; 6565294c1fSJeff Layton static struct delayed_work nfsd_filecache_laundrette; 6665294c1fSJeff Layton 679542e6a6STrond Myklebust static void nfsd_file_gc(void); 6865294c1fSJeff Layton 6965294c1fSJeff Layton static void 709542e6a6STrond Myklebust nfsd_file_schedule_laundrette(void) 7165294c1fSJeff Layton { 7265294c1fSJeff Layton long count = atomic_long_read(&nfsd_filecache_count); 7365294c1fSJeff Layton 7465294c1fSJeff Layton if (count == 0 || test_bit(NFSD_FILE_SHUTDOWN, &nfsd_file_lru_flags)) 7565294c1fSJeff Layton return; 7665294c1fSJeff Layton 779542e6a6STrond Myklebust queue_delayed_work(system_wq, &nfsd_filecache_laundrette, 789542e6a6STrond Myklebust NFSD_LAUNDRETTE_DELAY); 7965294c1fSJeff Layton } 8065294c1fSJeff Layton 8165294c1fSJeff Layton static void 8265294c1fSJeff Layton nfsd_file_slab_free(struct rcu_head *rcu) 8365294c1fSJeff Layton { 8465294c1fSJeff Layton struct nfsd_file *nf = container_of(rcu, struct nfsd_file, nf_rcu); 8565294c1fSJeff Layton 8665294c1fSJeff Layton put_cred(nf->nf_cred); 8765294c1fSJeff Layton kmem_cache_free(nfsd_file_slab, nf); 8865294c1fSJeff Layton } 8965294c1fSJeff Layton 9065294c1fSJeff Layton static void 9165294c1fSJeff Layton nfsd_file_mark_free(struct fsnotify_mark *mark) 9265294c1fSJeff Layton { 9365294c1fSJeff Layton struct nfsd_file_mark *nfm = container_of(mark, struct nfsd_file_mark, 9465294c1fSJeff Layton nfm_mark); 9565294c1fSJeff Layton 9665294c1fSJeff Layton kmem_cache_free(nfsd_file_mark_slab, nfm); 9765294c1fSJeff Layton } 9865294c1fSJeff Layton 9965294c1fSJeff Layton static struct nfsd_file_mark * 10065294c1fSJeff Layton nfsd_file_mark_get(struct nfsd_file_mark *nfm) 10165294c1fSJeff Layton { 102689827cdSTrond Myklebust if (!refcount_inc_not_zero(&nfm->nfm_ref)) 10365294c1fSJeff Layton return NULL; 10465294c1fSJeff Layton return nfm; 10565294c1fSJeff Layton } 10665294c1fSJeff Layton 10765294c1fSJeff Layton static void 10865294c1fSJeff Layton nfsd_file_mark_put(struct nfsd_file_mark *nfm) 10965294c1fSJeff Layton { 110689827cdSTrond Myklebust if (refcount_dec_and_test(&nfm->nfm_ref)) { 11165294c1fSJeff Layton fsnotify_destroy_mark(&nfm->nfm_mark, nfsd_file_fsnotify_group); 11265294c1fSJeff Layton fsnotify_put_mark(&nfm->nfm_mark); 11365294c1fSJeff Layton } 11465294c1fSJeff Layton } 11565294c1fSJeff Layton 11665294c1fSJeff Layton static struct nfsd_file_mark * 11765294c1fSJeff Layton nfsd_file_mark_find_or_create(struct nfsd_file *nf) 11865294c1fSJeff Layton { 11965294c1fSJeff Layton int err; 12065294c1fSJeff Layton struct fsnotify_mark *mark; 12165294c1fSJeff Layton struct nfsd_file_mark *nfm = NULL, *new; 12265294c1fSJeff Layton struct inode *inode = nf->nf_inode; 12365294c1fSJeff Layton 12465294c1fSJeff Layton do { 125b8962a9dSAmir Goldstein fsnotify_group_lock(nfsd_file_fsnotify_group); 12665294c1fSJeff Layton mark = fsnotify_find_mark(&inode->i_fsnotify_marks, 12765294c1fSJeff Layton nfsd_file_fsnotify_group); 12865294c1fSJeff Layton if (mark) { 12965294c1fSJeff Layton nfm = nfsd_file_mark_get(container_of(mark, 13065294c1fSJeff Layton struct nfsd_file_mark, 13165294c1fSJeff Layton nfm_mark)); 132b8962a9dSAmir Goldstein fsnotify_group_unlock(nfsd_file_fsnotify_group); 13390d2f1daSTrond Myklebust if (nfm) { 13465294c1fSJeff Layton fsnotify_put_mark(mark); 13565294c1fSJeff Layton break; 13690d2f1daSTrond Myklebust } 13790d2f1daSTrond Myklebust /* Avoid soft lockup race with nfsd_file_mark_put() */ 13890d2f1daSTrond Myklebust fsnotify_destroy_mark(mark, nfsd_file_fsnotify_group); 13990d2f1daSTrond Myklebust fsnotify_put_mark(mark); 140b8962a9dSAmir Goldstein } else { 141b8962a9dSAmir Goldstein fsnotify_group_unlock(nfsd_file_fsnotify_group); 142b8962a9dSAmir Goldstein } 14365294c1fSJeff Layton 14465294c1fSJeff Layton /* allocate a new nfm */ 14565294c1fSJeff Layton new = kmem_cache_alloc(nfsd_file_mark_slab, GFP_KERNEL); 14665294c1fSJeff Layton if (!new) 14765294c1fSJeff Layton return NULL; 14865294c1fSJeff Layton fsnotify_init_mark(&new->nfm_mark, nfsd_file_fsnotify_group); 14965294c1fSJeff Layton new->nfm_mark.mask = FS_ATTRIB|FS_DELETE_SELF; 150689827cdSTrond Myklebust refcount_set(&new->nfm_ref, 1); 15165294c1fSJeff Layton 15265294c1fSJeff Layton err = fsnotify_add_inode_mark(&new->nfm_mark, inode, 0); 15365294c1fSJeff Layton 15465294c1fSJeff Layton /* 15565294c1fSJeff Layton * If the add was successful, then return the object. 15665294c1fSJeff Layton * Otherwise, we need to put the reference we hold on the 15765294c1fSJeff Layton * nfm_mark. The fsnotify code will take a reference and put 15865294c1fSJeff Layton * it on failure, so we can't just free it directly. It's also 15965294c1fSJeff Layton * not safe to call fsnotify_destroy_mark on it as the 16065294c1fSJeff Layton * mark->group will be NULL. Thus, we can't let the nfm_ref 16165294c1fSJeff Layton * counter drive the destruction at this point. 16265294c1fSJeff Layton */ 16365294c1fSJeff Layton if (likely(!err)) 16465294c1fSJeff Layton nfm = new; 16565294c1fSJeff Layton else 16665294c1fSJeff Layton fsnotify_put_mark(&new->nfm_mark); 16765294c1fSJeff Layton } while (unlikely(err == -EEXIST)); 16865294c1fSJeff Layton 16965294c1fSJeff Layton return nfm; 17065294c1fSJeff Layton } 17165294c1fSJeff Layton 17265294c1fSJeff Layton static struct nfsd_file * 1735e113224STrond Myklebust nfsd_file_alloc(struct inode *inode, unsigned int may, unsigned int hashval, 1745e113224STrond Myklebust struct net *net) 17565294c1fSJeff Layton { 17665294c1fSJeff Layton struct nfsd_file *nf; 17765294c1fSJeff Layton 17865294c1fSJeff Layton nf = kmem_cache_alloc(nfsd_file_slab, GFP_KERNEL); 17965294c1fSJeff Layton if (nf) { 18065294c1fSJeff Layton INIT_HLIST_NODE(&nf->nf_node); 18165294c1fSJeff Layton INIT_LIST_HEAD(&nf->nf_lru); 182904940e9SChuck Lever nf->nf_birthtime = ktime_get(); 18365294c1fSJeff Layton nf->nf_file = NULL; 18465294c1fSJeff Layton nf->nf_cred = get_current_cred(); 1855e113224STrond Myklebust nf->nf_net = net; 18665294c1fSJeff Layton nf->nf_flags = 0; 18765294c1fSJeff Layton nf->nf_inode = inode; 18865294c1fSJeff Layton nf->nf_hashval = hashval; 189689827cdSTrond Myklebust refcount_set(&nf->nf_ref, 1); 19065294c1fSJeff Layton nf->nf_may = may & NFSD_FILE_MAY_MASK; 19165294c1fSJeff Layton nf->nf_mark = NULL; 19265294c1fSJeff Layton trace_nfsd_file_alloc(nf); 19365294c1fSJeff Layton } 19465294c1fSJeff Layton return nf; 19565294c1fSJeff Layton } 19665294c1fSJeff Layton 19765294c1fSJeff Layton static bool 19865294c1fSJeff Layton nfsd_file_free(struct nfsd_file *nf) 19965294c1fSJeff Layton { 200904940e9SChuck Lever s64 age = ktime_to_ms(ktime_sub(ktime_get(), nf->nf_birthtime)); 20165294c1fSJeff Layton bool flush = false; 20265294c1fSJeff Layton 203d6329327SChuck Lever this_cpu_inc(nfsd_file_releases); 204904940e9SChuck Lever this_cpu_add(nfsd_file_total_age, age); 205d6329327SChuck Lever 20665294c1fSJeff Layton trace_nfsd_file_put_final(nf); 20765294c1fSJeff Layton if (nf->nf_mark) 20865294c1fSJeff Layton nfsd_file_mark_put(nf->nf_mark); 20965294c1fSJeff Layton if (nf->nf_file) { 21065294c1fSJeff Layton get_file(nf->nf_file); 21165294c1fSJeff Layton filp_close(nf->nf_file, NULL); 21265294c1fSJeff Layton fput(nf->nf_file); 21365294c1fSJeff Layton flush = true; 21465294c1fSJeff Layton } 21565294c1fSJeff Layton call_rcu(&nf->nf_rcu, nfsd_file_slab_free); 21665294c1fSJeff Layton return flush; 21765294c1fSJeff Layton } 21865294c1fSJeff Layton 219055b24a8STrond Myklebust static bool 220055b24a8STrond Myklebust nfsd_file_check_writeback(struct nfsd_file *nf) 221055b24a8STrond Myklebust { 222055b24a8STrond Myklebust struct file *file = nf->nf_file; 223055b24a8STrond Myklebust struct address_space *mapping; 224055b24a8STrond Myklebust 225055b24a8STrond Myklebust if (!file || !(file->f_mode & FMODE_WRITE)) 226055b24a8STrond Myklebust return false; 227055b24a8STrond Myklebust mapping = file->f_mapping; 228055b24a8STrond Myklebust return mapping_tagged(mapping, PAGECACHE_TAG_DIRTY) || 229055b24a8STrond Myklebust mapping_tagged(mapping, PAGECACHE_TAG_WRITEBACK); 230055b24a8STrond Myklebust } 231055b24a8STrond Myklebust 232055b24a8STrond Myklebust static int 233055b24a8STrond Myklebust nfsd_file_check_write_error(struct nfsd_file *nf) 234055b24a8STrond Myklebust { 235055b24a8STrond Myklebust struct file *file = nf->nf_file; 236055b24a8STrond Myklebust 237055b24a8STrond Myklebust if (!file || !(file->f_mode & FMODE_WRITE)) 238055b24a8STrond Myklebust return 0; 239055b24a8STrond Myklebust return filemap_check_wb_err(file->f_mapping, READ_ONCE(file->f_wb_err)); 240055b24a8STrond Myklebust } 241055b24a8STrond Myklebust 24265294c1fSJeff Layton static void 2436b8a9433STrond Myklebust nfsd_file_flush(struct nfsd_file *nf) 2446b8a9433STrond Myklebust { 2456b8a9433STrond Myklebust if (nf->nf_file && vfs_fsync(nf->nf_file, 1) != 0) 2466b8a9433STrond Myklebust nfsd_reset_write_verifier(net_generic(nf->nf_net, nfsd_net_id)); 2476b8a9433STrond Myklebust } 2486b8a9433STrond Myklebust 2496b8a9433STrond Myklebust static void 25065294c1fSJeff Layton nfsd_file_do_unhash(struct nfsd_file *nf) 25165294c1fSJeff Layton { 25265294c1fSJeff Layton lockdep_assert_held(&nfsd_file_hashtbl[nf->nf_hashval].nfb_lock); 25365294c1fSJeff Layton 25465294c1fSJeff Layton trace_nfsd_file_unhash(nf); 25565294c1fSJeff Layton 256055b24a8STrond Myklebust if (nfsd_file_check_write_error(nf)) 2573988a578SChuck Lever nfsd_reset_write_verifier(net_generic(nf->nf_net, nfsd_net_id)); 25865294c1fSJeff Layton --nfsd_file_hashtbl[nf->nf_hashval].nfb_count; 25965294c1fSJeff Layton hlist_del_rcu(&nf->nf_node); 26065294c1fSJeff Layton atomic_long_dec(&nfsd_filecache_count); 26165294c1fSJeff Layton } 26265294c1fSJeff Layton 26365294c1fSJeff Layton static bool 26465294c1fSJeff Layton nfsd_file_unhash(struct nfsd_file *nf) 26565294c1fSJeff Layton { 26665294c1fSJeff Layton if (test_and_clear_bit(NFSD_FILE_HASHED, &nf->nf_flags)) { 26765294c1fSJeff Layton nfsd_file_do_unhash(nf); 26836ebbdb9STrond Myklebust if (!list_empty(&nf->nf_lru)) 26936ebbdb9STrond Myklebust list_lru_del(&nfsd_file_lru, &nf->nf_lru); 27065294c1fSJeff Layton return true; 27165294c1fSJeff Layton } 27265294c1fSJeff Layton return false; 27365294c1fSJeff Layton } 27465294c1fSJeff Layton 27565294c1fSJeff Layton /* 27665294c1fSJeff Layton * Return true if the file was unhashed. 27765294c1fSJeff Layton */ 27865294c1fSJeff Layton static bool 27965294c1fSJeff Layton nfsd_file_unhash_and_release_locked(struct nfsd_file *nf, struct list_head *dispose) 28065294c1fSJeff Layton { 28165294c1fSJeff Layton lockdep_assert_held(&nfsd_file_hashtbl[nf->nf_hashval].nfb_lock); 28265294c1fSJeff Layton 28365294c1fSJeff Layton trace_nfsd_file_unhash_and_release_locked(nf); 28465294c1fSJeff Layton if (!nfsd_file_unhash(nf)) 28565294c1fSJeff Layton return false; 28665294c1fSJeff Layton /* keep final reference for nfsd_file_lru_dispose */ 287689827cdSTrond Myklebust if (refcount_dec_not_one(&nf->nf_ref)) 28865294c1fSJeff Layton return true; 28965294c1fSJeff Layton 29065294c1fSJeff Layton list_add(&nf->nf_lru, dispose); 29165294c1fSJeff Layton return true; 29265294c1fSJeff Layton } 29365294c1fSJeff Layton 294b6669305STrond Myklebust static void 29565294c1fSJeff Layton nfsd_file_put_noref(struct nfsd_file *nf) 29665294c1fSJeff Layton { 29765294c1fSJeff Layton trace_nfsd_file_put(nf); 29865294c1fSJeff Layton 299689827cdSTrond Myklebust if (refcount_dec_and_test(&nf->nf_ref)) { 30065294c1fSJeff Layton WARN_ON(test_bit(NFSD_FILE_HASHED, &nf->nf_flags)); 30165294c1fSJeff Layton nfsd_file_free(nf); 30265294c1fSJeff Layton } 30365294c1fSJeff Layton } 30465294c1fSJeff Layton 30565294c1fSJeff Layton void 30665294c1fSJeff Layton nfsd_file_put(struct nfsd_file *nf) 30765294c1fSJeff Layton { 30808af54b3SChuck Lever might_sleep(); 30908af54b3SChuck Lever 31065294c1fSJeff Layton set_bit(NFSD_FILE_REFERENCED, &nf->nf_flags); 31199939792STrond Myklebust if (test_bit(NFSD_FILE_HASHED, &nf->nf_flags) == 0) { 3126b8a9433STrond Myklebust nfsd_file_flush(nf); 313b6669305STrond Myklebust nfsd_file_put_noref(nf); 314b6c71c66SChuck Lever } else if (nf->nf_file) { 315b6669305STrond Myklebust nfsd_file_put_noref(nf); 3169542e6a6STrond Myklebust nfsd_file_schedule_laundrette(); 317b6c71c66SChuck Lever } else 318b6c71c66SChuck Lever nfsd_file_put_noref(nf); 319b6c71c66SChuck Lever 3209542e6a6STrond Myklebust if (atomic_long_read(&nfsd_filecache_count) >= NFSD_FILE_LRU_LIMIT) 3219542e6a6STrond Myklebust nfsd_file_gc(); 32265294c1fSJeff Layton } 32365294c1fSJeff Layton 32465294c1fSJeff Layton struct nfsd_file * 32565294c1fSJeff Layton nfsd_file_get(struct nfsd_file *nf) 32665294c1fSJeff Layton { 327689827cdSTrond Myklebust if (likely(refcount_inc_not_zero(&nf->nf_ref))) 32865294c1fSJeff Layton return nf; 32965294c1fSJeff Layton return NULL; 33065294c1fSJeff Layton } 33165294c1fSJeff Layton 33265294c1fSJeff Layton static void 33365294c1fSJeff Layton nfsd_file_dispose_list(struct list_head *dispose) 33465294c1fSJeff Layton { 33565294c1fSJeff Layton struct nfsd_file *nf; 33665294c1fSJeff Layton 33765294c1fSJeff Layton while(!list_empty(dispose)) { 33865294c1fSJeff Layton nf = list_first_entry(dispose, struct nfsd_file, nf_lru); 33965294c1fSJeff Layton list_del(&nf->nf_lru); 3406b8a9433STrond Myklebust nfsd_file_flush(nf); 34165294c1fSJeff Layton nfsd_file_put_noref(nf); 34265294c1fSJeff Layton } 34365294c1fSJeff Layton } 34465294c1fSJeff Layton 34565294c1fSJeff Layton static void 34665294c1fSJeff Layton nfsd_file_dispose_list_sync(struct list_head *dispose) 34765294c1fSJeff Layton { 34865294c1fSJeff Layton bool flush = false; 34965294c1fSJeff Layton struct nfsd_file *nf; 35065294c1fSJeff Layton 35165294c1fSJeff Layton while(!list_empty(dispose)) { 35265294c1fSJeff Layton nf = list_first_entry(dispose, struct nfsd_file, nf_lru); 35365294c1fSJeff Layton list_del(&nf->nf_lru); 3546b8a9433STrond Myklebust nfsd_file_flush(nf); 355689827cdSTrond Myklebust if (!refcount_dec_and_test(&nf->nf_ref)) 35665294c1fSJeff Layton continue; 35765294c1fSJeff Layton if (nfsd_file_free(nf)) 35865294c1fSJeff Layton flush = true; 35965294c1fSJeff Layton } 36065294c1fSJeff Layton if (flush) 36165294c1fSJeff Layton flush_delayed_fput(); 36265294c1fSJeff Layton } 36365294c1fSJeff Layton 3649542e6a6STrond Myklebust static void 3659542e6a6STrond Myklebust nfsd_file_list_remove_disposal(struct list_head *dst, 3669542e6a6STrond Myklebust struct nfsd_fcache_disposal *l) 3679542e6a6STrond Myklebust { 3689542e6a6STrond Myklebust spin_lock(&l->lock); 3699542e6a6STrond Myklebust list_splice_init(&l->freeme, dst); 3709542e6a6STrond Myklebust spin_unlock(&l->lock); 3719542e6a6STrond Myklebust } 3729542e6a6STrond Myklebust 3739542e6a6STrond Myklebust static void 3749542e6a6STrond Myklebust nfsd_file_list_add_disposal(struct list_head *files, struct net *net) 3759542e6a6STrond Myklebust { 3761463b38eSNeilBrown struct nfsd_net *nn = net_generic(net, nfsd_net_id); 3771463b38eSNeilBrown struct nfsd_fcache_disposal *l = nn->fcache_disposal; 3789542e6a6STrond Myklebust 3799542e6a6STrond Myklebust spin_lock(&l->lock); 3809542e6a6STrond Myklebust list_splice_tail_init(files, &l->freeme); 3819542e6a6STrond Myklebust spin_unlock(&l->lock); 3829542e6a6STrond Myklebust queue_work(nfsd_filecache_wq, &l->work); 3839542e6a6STrond Myklebust } 3849542e6a6STrond Myklebust 3859542e6a6STrond Myklebust static void 3869542e6a6STrond Myklebust nfsd_file_list_add_pernet(struct list_head *dst, struct list_head *src, 3879542e6a6STrond Myklebust struct net *net) 3889542e6a6STrond Myklebust { 3899542e6a6STrond Myklebust struct nfsd_file *nf, *tmp; 3909542e6a6STrond Myklebust 3919542e6a6STrond Myklebust list_for_each_entry_safe(nf, tmp, src, nf_lru) { 3929542e6a6STrond Myklebust if (nf->nf_net == net) 3939542e6a6STrond Myklebust list_move_tail(&nf->nf_lru, dst); 3949542e6a6STrond Myklebust } 3959542e6a6STrond Myklebust } 3969542e6a6STrond Myklebust 3979542e6a6STrond Myklebust static void 3989542e6a6STrond Myklebust nfsd_file_dispose_list_delayed(struct list_head *dispose) 3999542e6a6STrond Myklebust { 4009542e6a6STrond Myklebust LIST_HEAD(list); 4019542e6a6STrond Myklebust struct nfsd_file *nf; 4029542e6a6STrond Myklebust 4039542e6a6STrond Myklebust while(!list_empty(dispose)) { 4049542e6a6STrond Myklebust nf = list_first_entry(dispose, struct nfsd_file, nf_lru); 4059542e6a6STrond Myklebust nfsd_file_list_add_pernet(&list, dispose, nf->nf_net); 4069542e6a6STrond Myklebust nfsd_file_list_add_disposal(&list, nf->nf_net); 4079542e6a6STrond Myklebust } 4089542e6a6STrond Myklebust } 4099542e6a6STrond Myklebust 41065294c1fSJeff Layton /* 41165294c1fSJeff Layton * Note this can deadlock with nfsd_file_cache_purge. 41265294c1fSJeff Layton */ 41365294c1fSJeff Layton static enum lru_status 41465294c1fSJeff Layton nfsd_file_lru_cb(struct list_head *item, struct list_lru_one *lru, 41565294c1fSJeff Layton spinlock_t *lock, void *arg) 41665294c1fSJeff Layton __releases(lock) 41765294c1fSJeff Layton __acquires(lock) 41865294c1fSJeff Layton { 41965294c1fSJeff Layton struct list_head *head = arg; 42065294c1fSJeff Layton struct nfsd_file *nf = list_entry(item, struct nfsd_file, nf_lru); 42165294c1fSJeff Layton 42265294c1fSJeff Layton /* 42365294c1fSJeff Layton * Do a lockless refcount check. The hashtable holds one reference, so 42465294c1fSJeff Layton * we look to see if anything else has a reference, or if any have 42565294c1fSJeff Layton * been put since the shrinker last ran. Those don't get unhashed and 42665294c1fSJeff Layton * released. 42765294c1fSJeff Layton * 42865294c1fSJeff Layton * Note that in the put path, we set the flag and then decrement the 42965294c1fSJeff Layton * counter. Here we check the counter and then test and clear the flag. 43065294c1fSJeff Layton * That order is deliberate to ensure that we can do this locklessly. 43165294c1fSJeff Layton */ 432689827cdSTrond Myklebust if (refcount_read(&nf->nf_ref) > 1) 43365294c1fSJeff Layton goto out_skip; 434055b24a8STrond Myklebust 435055b24a8STrond Myklebust /* 436055b24a8STrond Myklebust * Don't throw out files that are still undergoing I/O or 437055b24a8STrond Myklebust * that have uncleared errors pending. 438055b24a8STrond Myklebust */ 439055b24a8STrond Myklebust if (nfsd_file_check_writeback(nf)) 440055b24a8STrond Myklebust goto out_skip; 441055b24a8STrond Myklebust 44265294c1fSJeff Layton if (test_and_clear_bit(NFSD_FILE_REFERENCED, &nf->nf_flags)) 443bd6e1cecSTrond Myklebust goto out_skip; 44465294c1fSJeff Layton 44565294c1fSJeff Layton if (!test_and_clear_bit(NFSD_FILE_HASHED, &nf->nf_flags)) 44665294c1fSJeff Layton goto out_skip; 44765294c1fSJeff Layton 44865294c1fSJeff Layton list_lru_isolate_move(lru, &nf->nf_lru, head); 44965294c1fSJeff Layton return LRU_REMOVED; 45065294c1fSJeff Layton out_skip: 45165294c1fSJeff Layton return LRU_SKIP; 45265294c1fSJeff Layton } 45365294c1fSJeff Layton 4540bac5a26SChuck Lever /* 4550bac5a26SChuck Lever * Unhash items on @dispose immediately, then queue them on the 4560bac5a26SChuck Lever * disposal workqueue to finish releasing them in the background. 4570bac5a26SChuck Lever * 4580bac5a26SChuck Lever * cel: Note that between the time list_lru_shrink_walk runs and 4590bac5a26SChuck Lever * now, these items are in the hash table but marked unhashed. 4600bac5a26SChuck Lever * Why release these outside of lru_cb ? There's no lock ordering 4610bac5a26SChuck Lever * problem since lru_cb currently takes no lock. 4620bac5a26SChuck Lever */ 4630bac5a26SChuck Lever static void nfsd_file_gc_dispose_list(struct list_head *dispose) 4640bac5a26SChuck Lever { 4650bac5a26SChuck Lever struct nfsd_file *nf; 4660bac5a26SChuck Lever 4670bac5a26SChuck Lever list_for_each_entry(nf, dispose, nf_lru) { 4680bac5a26SChuck Lever spin_lock(&nfsd_file_hashtbl[nf->nf_hashval].nfb_lock); 4690bac5a26SChuck Lever nfsd_file_do_unhash(nf); 4700bac5a26SChuck Lever spin_unlock(&nfsd_file_hashtbl[nf->nf_hashval].nfb_lock); 4710bac5a26SChuck Lever } 4720bac5a26SChuck Lever nfsd_file_dispose_list_delayed(dispose); 4730bac5a26SChuck Lever } 4740bac5a26SChuck Lever 4759542e6a6STrond Myklebust static void 4769542e6a6STrond Myklebust nfsd_file_gc(void) 4779542e6a6STrond Myklebust { 4783bc6d347SChuck Lever LIST_HEAD(dispose); 4793bc6d347SChuck Lever 4803bc6d347SChuck Lever list_lru_walk(&nfsd_file_lru, nfsd_file_lru_cb, 4813bc6d347SChuck Lever &dispose, LONG_MAX); 4823bc6d347SChuck Lever nfsd_file_gc_dispose_list(&dispose); 4839542e6a6STrond Myklebust } 4849542e6a6STrond Myklebust 4859542e6a6STrond Myklebust static void 4869542e6a6STrond Myklebust nfsd_file_gc_worker(struct work_struct *work) 4879542e6a6STrond Myklebust { 4889542e6a6STrond Myklebust nfsd_file_gc(); 4899542e6a6STrond Myklebust nfsd_file_schedule_laundrette(); 49065294c1fSJeff Layton } 49165294c1fSJeff Layton 49265294c1fSJeff Layton static unsigned long 49365294c1fSJeff Layton nfsd_file_lru_count(struct shrinker *s, struct shrink_control *sc) 49465294c1fSJeff Layton { 49565294c1fSJeff Layton return list_lru_count(&nfsd_file_lru); 49665294c1fSJeff Layton } 49765294c1fSJeff Layton 49865294c1fSJeff Layton static unsigned long 49965294c1fSJeff Layton nfsd_file_lru_scan(struct shrinker *s, struct shrink_control *sc) 50065294c1fSJeff Layton { 501*39f1d1ffSChuck Lever LIST_HEAD(dispose); 502*39f1d1ffSChuck Lever unsigned long ret; 503*39f1d1ffSChuck Lever 504*39f1d1ffSChuck Lever ret = list_lru_shrink_walk(&nfsd_file_lru, sc, 505*39f1d1ffSChuck Lever nfsd_file_lru_cb, &dispose); 506*39f1d1ffSChuck Lever nfsd_file_gc_dispose_list(&dispose); 507*39f1d1ffSChuck Lever return ret; 50865294c1fSJeff Layton } 50965294c1fSJeff Layton 51065294c1fSJeff Layton static struct shrinker nfsd_file_shrinker = { 51165294c1fSJeff Layton .scan_objects = nfsd_file_lru_scan, 51265294c1fSJeff Layton .count_objects = nfsd_file_lru_count, 51365294c1fSJeff Layton .seeks = 1, 51465294c1fSJeff Layton }; 51565294c1fSJeff Layton 51665294c1fSJeff Layton static void 51765294c1fSJeff Layton __nfsd_file_close_inode(struct inode *inode, unsigned int hashval, 51865294c1fSJeff Layton struct list_head *dispose) 51965294c1fSJeff Layton { 52065294c1fSJeff Layton struct nfsd_file *nf; 52165294c1fSJeff Layton struct hlist_node *tmp; 52265294c1fSJeff Layton 52365294c1fSJeff Layton spin_lock(&nfsd_file_hashtbl[hashval].nfb_lock); 52465294c1fSJeff Layton hlist_for_each_entry_safe(nf, tmp, &nfsd_file_hashtbl[hashval].nfb_head, nf_node) { 52565294c1fSJeff Layton if (inode == nf->nf_inode) 52665294c1fSJeff Layton nfsd_file_unhash_and_release_locked(nf, dispose); 52765294c1fSJeff Layton } 52865294c1fSJeff Layton spin_unlock(&nfsd_file_hashtbl[hashval].nfb_lock); 52965294c1fSJeff Layton } 53065294c1fSJeff Layton 53165294c1fSJeff Layton /** 53265294c1fSJeff Layton * nfsd_file_close_inode_sync - attempt to forcibly close a nfsd_file 53365294c1fSJeff Layton * @inode: inode of the file to attempt to remove 53465294c1fSJeff Layton * 53565294c1fSJeff Layton * Walk the whole hash bucket, looking for any files that correspond to "inode". 53665294c1fSJeff Layton * If any do, then unhash them and put the hashtable reference to them and 53765294c1fSJeff Layton * destroy any that had their last reference put. Also ensure that any of the 53865294c1fSJeff Layton * fputs also have their final __fput done as well. 53965294c1fSJeff Layton */ 54065294c1fSJeff Layton void 54165294c1fSJeff Layton nfsd_file_close_inode_sync(struct inode *inode) 54265294c1fSJeff Layton { 54365294c1fSJeff Layton unsigned int hashval = (unsigned int)hash_long(inode->i_ino, 54465294c1fSJeff Layton NFSD_FILE_HASH_BITS); 54565294c1fSJeff Layton LIST_HEAD(dispose); 54665294c1fSJeff Layton 54765294c1fSJeff Layton __nfsd_file_close_inode(inode, hashval, &dispose); 54865294c1fSJeff Layton trace_nfsd_file_close_inode_sync(inode, hashval, !list_empty(&dispose)); 54965294c1fSJeff Layton nfsd_file_dispose_list_sync(&dispose); 55065294c1fSJeff Layton } 55165294c1fSJeff Layton 55265294c1fSJeff Layton /** 55319598141STrond Myklebust * nfsd_file_close_inode - attempt a delayed close of a nfsd_file 55465294c1fSJeff Layton * @inode: inode of the file to attempt to remove 55565294c1fSJeff Layton * 55665294c1fSJeff Layton * Walk the whole hash bucket, looking for any files that correspond to "inode". 55765294c1fSJeff Layton * If any do, then unhash them and put the hashtable reference to them and 55865294c1fSJeff Layton * destroy any that had their last reference put. 55965294c1fSJeff Layton */ 56065294c1fSJeff Layton static void 56165294c1fSJeff Layton nfsd_file_close_inode(struct inode *inode) 56265294c1fSJeff Layton { 56365294c1fSJeff Layton unsigned int hashval = (unsigned int)hash_long(inode->i_ino, 56465294c1fSJeff Layton NFSD_FILE_HASH_BITS); 56565294c1fSJeff Layton LIST_HEAD(dispose); 56665294c1fSJeff Layton 56765294c1fSJeff Layton __nfsd_file_close_inode(inode, hashval, &dispose); 56865294c1fSJeff Layton trace_nfsd_file_close_inode(inode, hashval, !list_empty(&dispose)); 5699542e6a6STrond Myklebust nfsd_file_dispose_list_delayed(&dispose); 57065294c1fSJeff Layton } 57165294c1fSJeff Layton 57265294c1fSJeff Layton /** 57365294c1fSJeff Layton * nfsd_file_delayed_close - close unused nfsd_files 57465294c1fSJeff Layton * @work: dummy 57565294c1fSJeff Layton * 57665294c1fSJeff Layton * Walk the LRU list and close any entries that have not been used since 57765294c1fSJeff Layton * the last scan. 57865294c1fSJeff Layton * 57965294c1fSJeff Layton * Note this can deadlock with nfsd_file_cache_purge. 58065294c1fSJeff Layton */ 58165294c1fSJeff Layton static void 58265294c1fSJeff Layton nfsd_file_delayed_close(struct work_struct *work) 58365294c1fSJeff Layton { 58465294c1fSJeff Layton LIST_HEAD(head); 5859542e6a6STrond Myklebust struct nfsd_fcache_disposal *l = container_of(work, 5869542e6a6STrond Myklebust struct nfsd_fcache_disposal, work); 58765294c1fSJeff Layton 5889542e6a6STrond Myklebust nfsd_file_list_remove_disposal(&head, l); 5899542e6a6STrond Myklebust nfsd_file_dispose_list(&head); 59065294c1fSJeff Layton } 59165294c1fSJeff Layton 59265294c1fSJeff Layton static int 59365294c1fSJeff Layton nfsd_file_lease_notifier_call(struct notifier_block *nb, unsigned long arg, 59465294c1fSJeff Layton void *data) 59565294c1fSJeff Layton { 59665294c1fSJeff Layton struct file_lock *fl = data; 59765294c1fSJeff Layton 59865294c1fSJeff Layton /* Only close files for F_SETLEASE leases */ 59965294c1fSJeff Layton if (fl->fl_flags & FL_LEASE) 60065294c1fSJeff Layton nfsd_file_close_inode_sync(file_inode(fl->fl_file)); 60165294c1fSJeff Layton return 0; 60265294c1fSJeff Layton } 60365294c1fSJeff Layton 60465294c1fSJeff Layton static struct notifier_block nfsd_file_lease_notifier = { 60565294c1fSJeff Layton .notifier_call = nfsd_file_lease_notifier_call, 60665294c1fSJeff Layton }; 60765294c1fSJeff Layton 60865294c1fSJeff Layton static int 609b9a1b977SAmir Goldstein nfsd_file_fsnotify_handle_event(struct fsnotify_mark *mark, u32 mask, 610b9a1b977SAmir Goldstein struct inode *inode, struct inode *dir, 611950cc0d2SAmir Goldstein const struct qstr *name, u32 cookie) 61265294c1fSJeff Layton { 61324dca905SGabriel Krisman Bertazi if (WARN_ON_ONCE(!inode)) 61424dca905SGabriel Krisman Bertazi return 0; 61524dca905SGabriel Krisman Bertazi 61665294c1fSJeff Layton trace_nfsd_file_fsnotify_handle_event(inode, mask); 61765294c1fSJeff Layton 61865294c1fSJeff Layton /* Should be no marks on non-regular files */ 61965294c1fSJeff Layton if (!S_ISREG(inode->i_mode)) { 62065294c1fSJeff Layton WARN_ON_ONCE(1); 62165294c1fSJeff Layton return 0; 62265294c1fSJeff Layton } 62365294c1fSJeff Layton 62465294c1fSJeff Layton /* don't close files if this was not the last link */ 62565294c1fSJeff Layton if (mask & FS_ATTRIB) { 62665294c1fSJeff Layton if (inode->i_nlink) 62765294c1fSJeff Layton return 0; 62865294c1fSJeff Layton } 62965294c1fSJeff Layton 63065294c1fSJeff Layton nfsd_file_close_inode(inode); 63165294c1fSJeff Layton return 0; 63265294c1fSJeff Layton } 63365294c1fSJeff Layton 63465294c1fSJeff Layton 63565294c1fSJeff Layton static const struct fsnotify_ops nfsd_file_fsnotify_ops = { 636b9a1b977SAmir Goldstein .handle_inode_event = nfsd_file_fsnotify_handle_event, 63765294c1fSJeff Layton .free_mark = nfsd_file_mark_free, 63865294c1fSJeff Layton }; 63965294c1fSJeff Layton 64065294c1fSJeff Layton int 64165294c1fSJeff Layton nfsd_file_cache_init(void) 64265294c1fSJeff Layton { 64365294c1fSJeff Layton int ret = -ENOMEM; 64465294c1fSJeff Layton unsigned int i; 64565294c1fSJeff Layton 64665294c1fSJeff Layton clear_bit(NFSD_FILE_SHUTDOWN, &nfsd_file_lru_flags); 64765294c1fSJeff Layton 64865294c1fSJeff Layton if (nfsd_file_hashtbl) 64965294c1fSJeff Layton return 0; 65065294c1fSJeff Layton 6519542e6a6STrond Myklebust nfsd_filecache_wq = alloc_workqueue("nfsd_filecache", 0, 0); 6529542e6a6STrond Myklebust if (!nfsd_filecache_wq) 6539542e6a6STrond Myklebust goto out; 6549542e6a6STrond Myklebust 6554d2eeafeSAmir Goldstein nfsd_file_hashtbl = kvcalloc(NFSD_FILE_HASH_SIZE, 65665294c1fSJeff Layton sizeof(*nfsd_file_hashtbl), GFP_KERNEL); 65765294c1fSJeff Layton if (!nfsd_file_hashtbl) { 65865294c1fSJeff Layton pr_err("nfsd: unable to allocate nfsd_file_hashtbl\n"); 65965294c1fSJeff Layton goto out_err; 66065294c1fSJeff Layton } 66165294c1fSJeff Layton 66265294c1fSJeff Layton nfsd_file_slab = kmem_cache_create("nfsd_file", 66365294c1fSJeff Layton sizeof(struct nfsd_file), 0, 0, NULL); 66465294c1fSJeff Layton if (!nfsd_file_slab) { 66565294c1fSJeff Layton pr_err("nfsd: unable to create nfsd_file_slab\n"); 66665294c1fSJeff Layton goto out_err; 66765294c1fSJeff Layton } 66865294c1fSJeff Layton 66965294c1fSJeff Layton nfsd_file_mark_slab = kmem_cache_create("nfsd_file_mark", 67065294c1fSJeff Layton sizeof(struct nfsd_file_mark), 0, 0, NULL); 67165294c1fSJeff Layton if (!nfsd_file_mark_slab) { 67265294c1fSJeff Layton pr_err("nfsd: unable to create nfsd_file_mark_slab\n"); 67365294c1fSJeff Layton goto out_err; 67465294c1fSJeff Layton } 67565294c1fSJeff Layton 67665294c1fSJeff Layton 67765294c1fSJeff Layton ret = list_lru_init(&nfsd_file_lru); 67865294c1fSJeff Layton if (ret) { 67965294c1fSJeff Layton pr_err("nfsd: failed to init nfsd_file_lru: %d\n", ret); 68065294c1fSJeff Layton goto out_err; 68165294c1fSJeff Layton } 68265294c1fSJeff Layton 68365294c1fSJeff Layton ret = register_shrinker(&nfsd_file_shrinker); 68465294c1fSJeff Layton if (ret) { 68565294c1fSJeff Layton pr_err("nfsd: failed to register nfsd_file_shrinker: %d\n", ret); 68665294c1fSJeff Layton goto out_lru; 68765294c1fSJeff Layton } 68865294c1fSJeff Layton 68965294c1fSJeff Layton ret = lease_register_notifier(&nfsd_file_lease_notifier); 69065294c1fSJeff Layton if (ret) { 69165294c1fSJeff Layton pr_err("nfsd: unable to register lease notifier: %d\n", ret); 69265294c1fSJeff Layton goto out_shrinker; 69365294c1fSJeff Layton } 69465294c1fSJeff Layton 695867a448dSAmir Goldstein nfsd_file_fsnotify_group = fsnotify_alloc_group(&nfsd_file_fsnotify_ops, 696b8962a9dSAmir Goldstein FSNOTIFY_GROUP_NOFS); 69765294c1fSJeff Layton if (IS_ERR(nfsd_file_fsnotify_group)) { 69865294c1fSJeff Layton pr_err("nfsd: unable to create fsnotify group: %ld\n", 69965294c1fSJeff Layton PTR_ERR(nfsd_file_fsnotify_group)); 700231307dfSHuang Guobin ret = PTR_ERR(nfsd_file_fsnotify_group); 70165294c1fSJeff Layton nfsd_file_fsnotify_group = NULL; 70265294c1fSJeff Layton goto out_notifier; 70365294c1fSJeff Layton } 70465294c1fSJeff Layton 70565294c1fSJeff Layton for (i = 0; i < NFSD_FILE_HASH_SIZE; i++) { 70665294c1fSJeff Layton INIT_HLIST_HEAD(&nfsd_file_hashtbl[i].nfb_head); 70765294c1fSJeff Layton spin_lock_init(&nfsd_file_hashtbl[i].nfb_lock); 70865294c1fSJeff Layton } 70965294c1fSJeff Layton 7109542e6a6STrond Myklebust INIT_DELAYED_WORK(&nfsd_filecache_laundrette, nfsd_file_gc_worker); 71165294c1fSJeff Layton out: 71265294c1fSJeff Layton return ret; 71365294c1fSJeff Layton out_notifier: 71465294c1fSJeff Layton lease_unregister_notifier(&nfsd_file_lease_notifier); 71565294c1fSJeff Layton out_shrinker: 71665294c1fSJeff Layton unregister_shrinker(&nfsd_file_shrinker); 71765294c1fSJeff Layton out_lru: 71865294c1fSJeff Layton list_lru_destroy(&nfsd_file_lru); 71965294c1fSJeff Layton out_err: 72065294c1fSJeff Layton kmem_cache_destroy(nfsd_file_slab); 72165294c1fSJeff Layton nfsd_file_slab = NULL; 72265294c1fSJeff Layton kmem_cache_destroy(nfsd_file_mark_slab); 72365294c1fSJeff Layton nfsd_file_mark_slab = NULL; 7244d2eeafeSAmir Goldstein kvfree(nfsd_file_hashtbl); 72565294c1fSJeff Layton nfsd_file_hashtbl = NULL; 7269542e6a6STrond Myklebust destroy_workqueue(nfsd_filecache_wq); 7279542e6a6STrond Myklebust nfsd_filecache_wq = NULL; 72865294c1fSJeff Layton goto out; 72965294c1fSJeff Layton } 73065294c1fSJeff Layton 73165294c1fSJeff Layton /* 73265294c1fSJeff Layton * Note this can deadlock with nfsd_file_lru_cb. 73365294c1fSJeff Layton */ 73465294c1fSJeff Layton void 7355e113224STrond Myklebust nfsd_file_cache_purge(struct net *net) 73665294c1fSJeff Layton { 73765294c1fSJeff Layton unsigned int i; 73865294c1fSJeff Layton struct nfsd_file *nf; 7395e113224STrond Myklebust struct hlist_node *next; 74065294c1fSJeff Layton LIST_HEAD(dispose); 74165294c1fSJeff Layton bool del; 74265294c1fSJeff Layton 74365294c1fSJeff Layton if (!nfsd_file_hashtbl) 74465294c1fSJeff Layton return; 74565294c1fSJeff Layton 74665294c1fSJeff Layton for (i = 0; i < NFSD_FILE_HASH_SIZE; i++) { 7475e113224STrond Myklebust struct nfsd_fcache_bucket *nfb = &nfsd_file_hashtbl[i]; 7485e113224STrond Myklebust 7495e113224STrond Myklebust spin_lock(&nfb->nfb_lock); 7505e113224STrond Myklebust hlist_for_each_entry_safe(nf, next, &nfb->nfb_head, nf_node) { 7515e113224STrond Myklebust if (net && nf->nf_net != net) 7525e113224STrond Myklebust continue; 75365294c1fSJeff Layton del = nfsd_file_unhash_and_release_locked(nf, &dispose); 75465294c1fSJeff Layton 75565294c1fSJeff Layton /* 75665294c1fSJeff Layton * Deadlock detected! Something marked this entry as 75765294c1fSJeff Layton * unhased, but hasn't removed it from the hash list. 75865294c1fSJeff Layton */ 75965294c1fSJeff Layton WARN_ON_ONCE(!del); 76065294c1fSJeff Layton } 7615e113224STrond Myklebust spin_unlock(&nfb->nfb_lock); 76265294c1fSJeff Layton nfsd_file_dispose_list(&dispose); 76365294c1fSJeff Layton } 76465294c1fSJeff Layton } 76565294c1fSJeff Layton 7669542e6a6STrond Myklebust static struct nfsd_fcache_disposal * 7671463b38eSNeilBrown nfsd_alloc_fcache_disposal(void) 7689542e6a6STrond Myklebust { 7699542e6a6STrond Myklebust struct nfsd_fcache_disposal *l; 7709542e6a6STrond Myklebust 7719542e6a6STrond Myklebust l = kmalloc(sizeof(*l), GFP_KERNEL); 7729542e6a6STrond Myklebust if (!l) 7739542e6a6STrond Myklebust return NULL; 7749542e6a6STrond Myklebust INIT_WORK(&l->work, nfsd_file_delayed_close); 7759542e6a6STrond Myklebust spin_lock_init(&l->lock); 7769542e6a6STrond Myklebust INIT_LIST_HEAD(&l->freeme); 7779542e6a6STrond Myklebust return l; 7789542e6a6STrond Myklebust } 7799542e6a6STrond Myklebust 7809542e6a6STrond Myklebust static void 7819542e6a6STrond Myklebust nfsd_free_fcache_disposal(struct nfsd_fcache_disposal *l) 7829542e6a6STrond Myklebust { 7839542e6a6STrond Myklebust cancel_work_sync(&l->work); 7849542e6a6STrond Myklebust nfsd_file_dispose_list(&l->freeme); 7851463b38eSNeilBrown kfree(l); 7869542e6a6STrond Myklebust } 7879542e6a6STrond Myklebust 7889542e6a6STrond Myklebust static void 7899542e6a6STrond Myklebust nfsd_free_fcache_disposal_net(struct net *net) 7909542e6a6STrond Myklebust { 7911463b38eSNeilBrown struct nfsd_net *nn = net_generic(net, nfsd_net_id); 7921463b38eSNeilBrown struct nfsd_fcache_disposal *l = nn->fcache_disposal; 7939542e6a6STrond Myklebust 7949542e6a6STrond Myklebust nfsd_free_fcache_disposal(l); 7959542e6a6STrond Myklebust } 7969542e6a6STrond Myklebust 7979542e6a6STrond Myklebust int 7989542e6a6STrond Myklebust nfsd_file_cache_start_net(struct net *net) 7999542e6a6STrond Myklebust { 8001463b38eSNeilBrown struct nfsd_net *nn = net_generic(net, nfsd_net_id); 8011463b38eSNeilBrown 8021463b38eSNeilBrown nn->fcache_disposal = nfsd_alloc_fcache_disposal(); 8031463b38eSNeilBrown return nn->fcache_disposal ? 0 : -ENOMEM; 8049542e6a6STrond Myklebust } 8059542e6a6STrond Myklebust 8069542e6a6STrond Myklebust void 8079542e6a6STrond Myklebust nfsd_file_cache_shutdown_net(struct net *net) 8089542e6a6STrond Myklebust { 8099542e6a6STrond Myklebust nfsd_file_cache_purge(net); 8109542e6a6STrond Myklebust nfsd_free_fcache_disposal_net(net); 8119542e6a6STrond Myklebust } 8129542e6a6STrond Myklebust 81365294c1fSJeff Layton void 81465294c1fSJeff Layton nfsd_file_cache_shutdown(void) 81565294c1fSJeff Layton { 81665294c1fSJeff Layton set_bit(NFSD_FILE_SHUTDOWN, &nfsd_file_lru_flags); 81765294c1fSJeff Layton 81865294c1fSJeff Layton lease_unregister_notifier(&nfsd_file_lease_notifier); 81965294c1fSJeff Layton unregister_shrinker(&nfsd_file_shrinker); 82065294c1fSJeff Layton /* 82165294c1fSJeff Layton * make sure all callers of nfsd_file_lru_cb are done before 82265294c1fSJeff Layton * calling nfsd_file_cache_purge 82365294c1fSJeff Layton */ 82465294c1fSJeff Layton cancel_delayed_work_sync(&nfsd_filecache_laundrette); 8255e113224STrond Myklebust nfsd_file_cache_purge(NULL); 82665294c1fSJeff Layton list_lru_destroy(&nfsd_file_lru); 82765294c1fSJeff Layton rcu_barrier(); 82865294c1fSJeff Layton fsnotify_put_group(nfsd_file_fsnotify_group); 82965294c1fSJeff Layton nfsd_file_fsnotify_group = NULL; 83065294c1fSJeff Layton kmem_cache_destroy(nfsd_file_slab); 83165294c1fSJeff Layton nfsd_file_slab = NULL; 83265294c1fSJeff Layton fsnotify_wait_marks_destroyed(); 83365294c1fSJeff Layton kmem_cache_destroy(nfsd_file_mark_slab); 83465294c1fSJeff Layton nfsd_file_mark_slab = NULL; 8354d2eeafeSAmir Goldstein kvfree(nfsd_file_hashtbl); 83665294c1fSJeff Layton nfsd_file_hashtbl = NULL; 8379542e6a6STrond Myklebust destroy_workqueue(nfsd_filecache_wq); 8389542e6a6STrond Myklebust nfsd_filecache_wq = NULL; 83965294c1fSJeff Layton } 84065294c1fSJeff Layton 84165294c1fSJeff Layton static bool 84265294c1fSJeff Layton nfsd_match_cred(const struct cred *c1, const struct cred *c2) 84365294c1fSJeff Layton { 84465294c1fSJeff Layton int i; 84565294c1fSJeff Layton 84665294c1fSJeff Layton if (!uid_eq(c1->fsuid, c2->fsuid)) 84765294c1fSJeff Layton return false; 84865294c1fSJeff Layton if (!gid_eq(c1->fsgid, c2->fsgid)) 84965294c1fSJeff Layton return false; 85065294c1fSJeff Layton if (c1->group_info == NULL || c2->group_info == NULL) 85165294c1fSJeff Layton return c1->group_info == c2->group_info; 85265294c1fSJeff Layton if (c1->group_info->ngroups != c2->group_info->ngroups) 85365294c1fSJeff Layton return false; 85465294c1fSJeff Layton for (i = 0; i < c1->group_info->ngroups; i++) { 85565294c1fSJeff Layton if (!gid_eq(c1->group_info->gid[i], c2->group_info->gid[i])) 85665294c1fSJeff Layton return false; 85765294c1fSJeff Layton } 85865294c1fSJeff Layton return true; 85965294c1fSJeff Layton } 86065294c1fSJeff Layton 86165294c1fSJeff Layton static struct nfsd_file * 86265294c1fSJeff Layton nfsd_file_find_locked(struct inode *inode, unsigned int may_flags, 8635e113224STrond Myklebust unsigned int hashval, struct net *net) 86465294c1fSJeff Layton { 86565294c1fSJeff Layton struct nfsd_file *nf; 86665294c1fSJeff Layton unsigned char need = may_flags & NFSD_FILE_MAY_MASK; 86765294c1fSJeff Layton 86865294c1fSJeff Layton hlist_for_each_entry_rcu(nf, &nfsd_file_hashtbl[hashval].nfb_head, 869057a2274SMadhuparna Bhowmik nf_node, lockdep_is_held(&nfsd_file_hashtbl[hashval].nfb_lock)) { 870ae3c57b5SJ. Bruce Fields if (nf->nf_may != need) 87165294c1fSJeff Layton continue; 87265294c1fSJeff Layton if (nf->nf_inode != inode) 87365294c1fSJeff Layton continue; 8745e113224STrond Myklebust if (nf->nf_net != net) 8755e113224STrond Myklebust continue; 87665294c1fSJeff Layton if (!nfsd_match_cred(nf->nf_cred, current_cred())) 87765294c1fSJeff Layton continue; 878d30881f5STrond Myklebust if (!test_bit(NFSD_FILE_HASHED, &nf->nf_flags)) 879d30881f5STrond Myklebust continue; 88065294c1fSJeff Layton if (nfsd_file_get(nf) != NULL) 88165294c1fSJeff Layton return nf; 88265294c1fSJeff Layton } 88365294c1fSJeff Layton return NULL; 88465294c1fSJeff Layton } 88565294c1fSJeff Layton 88665294c1fSJeff Layton /** 88765294c1fSJeff Layton * nfsd_file_is_cached - are there any cached open files for this fh? 88865294c1fSJeff Layton * @inode: inode of the file to check 88965294c1fSJeff Layton * 89065294c1fSJeff Layton * Scan the hashtable for open files that match this fh. Returns true if there 89165294c1fSJeff Layton * are any, and false if not. 89265294c1fSJeff Layton */ 89365294c1fSJeff Layton bool 89465294c1fSJeff Layton nfsd_file_is_cached(struct inode *inode) 89565294c1fSJeff Layton { 89665294c1fSJeff Layton bool ret = false; 89765294c1fSJeff Layton struct nfsd_file *nf; 89865294c1fSJeff Layton unsigned int hashval; 89965294c1fSJeff Layton 90065294c1fSJeff Layton hashval = (unsigned int)hash_long(inode->i_ino, NFSD_FILE_HASH_BITS); 90165294c1fSJeff Layton 90265294c1fSJeff Layton rcu_read_lock(); 90365294c1fSJeff Layton hlist_for_each_entry_rcu(nf, &nfsd_file_hashtbl[hashval].nfb_head, 90465294c1fSJeff Layton nf_node) { 90565294c1fSJeff Layton if (inode == nf->nf_inode) { 90665294c1fSJeff Layton ret = true; 90765294c1fSJeff Layton break; 90865294c1fSJeff Layton } 90965294c1fSJeff Layton } 91065294c1fSJeff Layton rcu_read_unlock(); 91165294c1fSJeff Layton trace_nfsd_file_is_cached(inode, hashval, (int)ret); 91265294c1fSJeff Layton return ret; 91365294c1fSJeff Layton } 91465294c1fSJeff Layton 915fb70bf12SChuck Lever static __be32 916fb70bf12SChuck Lever nfsd_do_file_acquire(struct svc_rqst *rqstp, struct svc_fh *fhp, 917fb70bf12SChuck Lever unsigned int may_flags, struct nfsd_file **pnf, bool open) 91865294c1fSJeff Layton { 91965294c1fSJeff Layton __be32 status; 9205e113224STrond Myklebust struct net *net = SVC_NET(rqstp); 92165294c1fSJeff Layton struct nfsd_file *nf, *new; 92265294c1fSJeff Layton struct inode *inode; 92365294c1fSJeff Layton unsigned int hashval; 92428c7d86bSTrond Myklebust bool retry = true; 92565294c1fSJeff Layton 92665294c1fSJeff Layton /* FIXME: skip this if fh_dentry is already set? */ 92765294c1fSJeff Layton status = fh_verify(rqstp, fhp, S_IFREG, 92865294c1fSJeff Layton may_flags|NFSD_MAY_OWNER_OVERRIDE); 92965294c1fSJeff Layton if (status != nfs_ok) 93065294c1fSJeff Layton return status; 93165294c1fSJeff Layton 93265294c1fSJeff Layton inode = d_inode(fhp->fh_dentry); 93365294c1fSJeff Layton hashval = (unsigned int)hash_long(inode->i_ino, NFSD_FILE_HASH_BITS); 93465294c1fSJeff Layton retry: 93565294c1fSJeff Layton rcu_read_lock(); 9365e113224STrond Myklebust nf = nfsd_file_find_locked(inode, may_flags, hashval, net); 93765294c1fSJeff Layton rcu_read_unlock(); 93865294c1fSJeff Layton if (nf) 93965294c1fSJeff Layton goto wait_for_construction; 94065294c1fSJeff Layton 9415e113224STrond Myklebust new = nfsd_file_alloc(inode, may_flags, hashval, net); 94265294c1fSJeff Layton if (!new) { 94365294c1fSJeff Layton trace_nfsd_file_acquire(rqstp, hashval, inode, may_flags, 94465294c1fSJeff Layton NULL, nfserr_jukebox); 94565294c1fSJeff Layton return nfserr_jukebox; 94665294c1fSJeff Layton } 94765294c1fSJeff Layton 94865294c1fSJeff Layton spin_lock(&nfsd_file_hashtbl[hashval].nfb_lock); 9495e113224STrond Myklebust nf = nfsd_file_find_locked(inode, may_flags, hashval, net); 95065294c1fSJeff Layton if (nf == NULL) 95165294c1fSJeff Layton goto open_file; 95265294c1fSJeff Layton spin_unlock(&nfsd_file_hashtbl[hashval].nfb_lock); 95365294c1fSJeff Layton nfsd_file_slab_free(&new->nf_rcu); 95465294c1fSJeff Layton 95565294c1fSJeff Layton wait_for_construction: 95665294c1fSJeff Layton wait_on_bit(&nf->nf_flags, NFSD_FILE_PENDING, TASK_UNINTERRUPTIBLE); 95765294c1fSJeff Layton 95865294c1fSJeff Layton /* Did construction of this file fail? */ 95965294c1fSJeff Layton if (!test_bit(NFSD_FILE_HASHED, &nf->nf_flags)) { 96028c7d86bSTrond Myklebust if (!retry) { 96128c7d86bSTrond Myklebust status = nfserr_jukebox; 96228c7d86bSTrond Myklebust goto out; 96328c7d86bSTrond Myklebust } 96428c7d86bSTrond Myklebust retry = false; 96565294c1fSJeff Layton nfsd_file_put_noref(nf); 96665294c1fSJeff Layton goto retry; 96765294c1fSJeff Layton } 96865294c1fSJeff Layton 96965294c1fSJeff Layton this_cpu_inc(nfsd_file_cache_hits); 97065294c1fSJeff Layton 97123ba98deSJeff Layton status = nfserrno(nfsd_open_break_lease(file_inode(nf->nf_file), may_flags)); 97265294c1fSJeff Layton out: 97365294c1fSJeff Layton if (status == nfs_ok) { 97429d4bdbbSChuck Lever if (open) 97529d4bdbbSChuck Lever this_cpu_inc(nfsd_file_acquisitions); 97665294c1fSJeff Layton *pnf = nf; 97765294c1fSJeff Layton } else { 97865294c1fSJeff Layton nfsd_file_put(nf); 97965294c1fSJeff Layton nf = NULL; 98065294c1fSJeff Layton } 98165294c1fSJeff Layton 98265294c1fSJeff Layton trace_nfsd_file_acquire(rqstp, hashval, inode, may_flags, nf, status); 98365294c1fSJeff Layton return status; 98465294c1fSJeff Layton open_file: 98565294c1fSJeff Layton nf = new; 98665294c1fSJeff Layton /* Take reference for the hashtable */ 987689827cdSTrond Myklebust refcount_inc(&nf->nf_ref); 98865294c1fSJeff Layton __set_bit(NFSD_FILE_HASHED, &nf->nf_flags); 98965294c1fSJeff Layton __set_bit(NFSD_FILE_PENDING, &nf->nf_flags); 99065294c1fSJeff Layton list_lru_add(&nfsd_file_lru, &nf->nf_lru); 99165294c1fSJeff Layton hlist_add_head_rcu(&nf->nf_node, &nfsd_file_hashtbl[hashval].nfb_head); 99265294c1fSJeff Layton ++nfsd_file_hashtbl[hashval].nfb_count; 99365294c1fSJeff Layton nfsd_file_hashtbl[hashval].nfb_maxcount = max(nfsd_file_hashtbl[hashval].nfb_maxcount, 99465294c1fSJeff Layton nfsd_file_hashtbl[hashval].nfb_count); 99565294c1fSJeff Layton spin_unlock(&nfsd_file_hashtbl[hashval].nfb_lock); 9969542e6a6STrond Myklebust if (atomic_long_inc_return(&nfsd_filecache_count) >= NFSD_FILE_LRU_THRESHOLD) 9979542e6a6STrond Myklebust nfsd_file_gc(); 99865294c1fSJeff Layton 99965294c1fSJeff Layton nf->nf_mark = nfsd_file_mark_find_or_create(nf); 1000fb70bf12SChuck Lever if (nf->nf_mark) { 10010122e882SChuck Lever if (open) { 1002f4d84c52SChuck Lever status = nfsd_open_verified(rqstp, fhp, may_flags, 1003f4d84c52SChuck Lever &nf->nf_file); 10040122e882SChuck Lever trace_nfsd_file_open(nf, status); 10050122e882SChuck Lever } else 1006fb70bf12SChuck Lever status = nfs_ok; 1007fb70bf12SChuck Lever } else 100865294c1fSJeff Layton status = nfserr_jukebox; 100965294c1fSJeff Layton /* 101065294c1fSJeff Layton * If construction failed, or we raced with a call to unlink() 101165294c1fSJeff Layton * then unhash. 101265294c1fSJeff Layton */ 101365294c1fSJeff Layton if (status != nfs_ok || inode->i_nlink == 0) { 101465294c1fSJeff Layton bool do_free; 101565294c1fSJeff Layton spin_lock(&nfsd_file_hashtbl[hashval].nfb_lock); 101665294c1fSJeff Layton do_free = nfsd_file_unhash(nf); 101765294c1fSJeff Layton spin_unlock(&nfsd_file_hashtbl[hashval].nfb_lock); 101865294c1fSJeff Layton if (do_free) 101965294c1fSJeff Layton nfsd_file_put_noref(nf); 102065294c1fSJeff Layton } 102165294c1fSJeff Layton clear_bit_unlock(NFSD_FILE_PENDING, &nf->nf_flags); 102265294c1fSJeff Layton smp_mb__after_atomic(); 102365294c1fSJeff Layton wake_up_bit(&nf->nf_flags, NFSD_FILE_PENDING); 102465294c1fSJeff Layton goto out; 102565294c1fSJeff Layton } 102665294c1fSJeff Layton 1027fb70bf12SChuck Lever /** 1028fb70bf12SChuck Lever * nfsd_file_acquire - Get a struct nfsd_file with an open file 1029fb70bf12SChuck Lever * @rqstp: the RPC transaction being executed 1030fb70bf12SChuck Lever * @fhp: the NFS filehandle of the file to be opened 1031fb70bf12SChuck Lever * @may_flags: NFSD_MAY_ settings for the file 1032fb70bf12SChuck Lever * @pnf: OUT: new or found "struct nfsd_file" object 1033fb70bf12SChuck Lever * 1034fb70bf12SChuck Lever * Returns nfs_ok and sets @pnf on success; otherwise an nfsstat in 1035fb70bf12SChuck Lever * network byte order is returned. 1036fb70bf12SChuck Lever */ 1037fb70bf12SChuck Lever __be32 1038fb70bf12SChuck Lever nfsd_file_acquire(struct svc_rqst *rqstp, struct svc_fh *fhp, 1039fb70bf12SChuck Lever unsigned int may_flags, struct nfsd_file **pnf) 1040fb70bf12SChuck Lever { 1041fb70bf12SChuck Lever return nfsd_do_file_acquire(rqstp, fhp, may_flags, pnf, true); 1042fb70bf12SChuck Lever } 1043fb70bf12SChuck Lever 1044fb70bf12SChuck Lever /** 1045fb70bf12SChuck Lever * nfsd_file_create - Get a struct nfsd_file, do not open 1046fb70bf12SChuck Lever * @rqstp: the RPC transaction being executed 1047fb70bf12SChuck Lever * @fhp: the NFS filehandle of the file just created 1048fb70bf12SChuck Lever * @may_flags: NFSD_MAY_ settings for the file 1049fb70bf12SChuck Lever * @pnf: OUT: new or found "struct nfsd_file" object 1050fb70bf12SChuck Lever * 1051fb70bf12SChuck Lever * Returns nfs_ok and sets @pnf on success; otherwise an nfsstat in 1052fb70bf12SChuck Lever * network byte order is returned. 1053fb70bf12SChuck Lever */ 1054fb70bf12SChuck Lever __be32 1055fb70bf12SChuck Lever nfsd_file_create(struct svc_rqst *rqstp, struct svc_fh *fhp, 1056fb70bf12SChuck Lever unsigned int may_flags, struct nfsd_file **pnf) 1057fb70bf12SChuck Lever { 1058fb70bf12SChuck Lever return nfsd_do_file_acquire(rqstp, fhp, may_flags, pnf, false); 1059fb70bf12SChuck Lever } 1060fb70bf12SChuck Lever 106165294c1fSJeff Layton /* 106265294c1fSJeff Layton * Note that fields may be added, removed or reordered in the future. Programs 106365294c1fSJeff Layton * scraping this file for info should test the labels to ensure they're 106465294c1fSJeff Layton * getting the correct field. 106565294c1fSJeff Layton */ 106665294c1fSJeff Layton static int nfsd_file_cache_stats_show(struct seq_file *m, void *v) 106765294c1fSJeff Layton { 1068d6329327SChuck Lever unsigned long hits = 0, acquisitions = 0, releases = 0; 106965294c1fSJeff Layton unsigned int i, count = 0, longest = 0; 1070904940e9SChuck Lever unsigned long lru = 0, total_age = 0; 107165294c1fSJeff Layton 107265294c1fSJeff Layton /* 107365294c1fSJeff Layton * No need for spinlocks here since we're not terribly interested in 107465294c1fSJeff Layton * accuracy. We do take the nfsd_mutex simply to ensure that we 107565294c1fSJeff Layton * don't end up racing with server shutdown 107665294c1fSJeff Layton */ 107765294c1fSJeff Layton mutex_lock(&nfsd_mutex); 107865294c1fSJeff Layton if (nfsd_file_hashtbl) { 107965294c1fSJeff Layton for (i = 0; i < NFSD_FILE_HASH_SIZE; i++) { 108065294c1fSJeff Layton count += nfsd_file_hashtbl[i].nfb_count; 108165294c1fSJeff Layton longest = max(longest, nfsd_file_hashtbl[i].nfb_count); 108265294c1fSJeff Layton } 10830fd244c1SChuck Lever lru = list_lru_count(&nfsd_file_lru); 108465294c1fSJeff Layton } 108565294c1fSJeff Layton mutex_unlock(&nfsd_mutex); 108665294c1fSJeff Layton 108729d4bdbbSChuck Lever for_each_possible_cpu(i) { 108865294c1fSJeff Layton hits += per_cpu(nfsd_file_cache_hits, i); 108929d4bdbbSChuck Lever acquisitions += per_cpu(nfsd_file_acquisitions, i); 1090d6329327SChuck Lever releases += per_cpu(nfsd_file_releases, i); 1091904940e9SChuck Lever total_age += per_cpu(nfsd_file_total_age, i); 109229d4bdbbSChuck Lever } 109365294c1fSJeff Layton 109465294c1fSJeff Layton seq_printf(m, "total entries: %u\n", count); 109565294c1fSJeff Layton seq_printf(m, "longest chain: %u\n", longest); 10960fd244c1SChuck Lever seq_printf(m, "lru entries: %lu\n", lru); 109765294c1fSJeff Layton seq_printf(m, "cache hits: %lu\n", hits); 109829d4bdbbSChuck Lever seq_printf(m, "acquisitions: %lu\n", acquisitions); 1099d6329327SChuck Lever seq_printf(m, "releases: %lu\n", releases); 1100904940e9SChuck Lever if (releases) 1101904940e9SChuck Lever seq_printf(m, "mean age (ms): %ld\n", total_age / releases); 1102904940e9SChuck Lever else 1103904940e9SChuck Lever seq_printf(m, "mean age (ms): -\n"); 110465294c1fSJeff Layton return 0; 110565294c1fSJeff Layton } 110665294c1fSJeff Layton 110765294c1fSJeff Layton int nfsd_file_cache_stats_open(struct inode *inode, struct file *file) 110865294c1fSJeff Layton { 110965294c1fSJeff Layton return single_open(file, nfsd_file_cache_stats_show, NULL); 111065294c1fSJeff Layton } 1111