xref: /openbmc/linux/fs/nfs/read.c (revision 91d5b470)
11da177e4SLinus Torvalds /*
21da177e4SLinus Torvalds  * linux/fs/nfs/read.c
31da177e4SLinus Torvalds  *
41da177e4SLinus Torvalds  * Block I/O for NFS
51da177e4SLinus Torvalds  *
61da177e4SLinus Torvalds  * Partial copy of Linus' read cache modifications to fs/nfs/file.c
71da177e4SLinus Torvalds  * modified for async RPC by okir@monad.swb.de
81da177e4SLinus Torvalds  *
91da177e4SLinus Torvalds  * We do an ugly hack here in order to return proper error codes to the
101da177e4SLinus Torvalds  * user program when a read request failed: since generic_file_read
111da177e4SLinus Torvalds  * only checks the return value of inode->i_op->readpage() which is always 0
121da177e4SLinus Torvalds  * for async RPC, we set the error bit of the page to 1 when an error occurs,
131da177e4SLinus Torvalds  * and make nfs_readpage transmit requests synchronously when encountering this.
141da177e4SLinus Torvalds  * This is only a small problem, though, since we now retry all operations
151da177e4SLinus Torvalds  * within the RPC code when root squashing is suspected.
161da177e4SLinus Torvalds  */
171da177e4SLinus Torvalds 
181da177e4SLinus Torvalds #include <linux/config.h>
191da177e4SLinus Torvalds #include <linux/time.h>
201da177e4SLinus Torvalds #include <linux/kernel.h>
211da177e4SLinus Torvalds #include <linux/errno.h>
221da177e4SLinus Torvalds #include <linux/fcntl.h>
231da177e4SLinus Torvalds #include <linux/stat.h>
241da177e4SLinus Torvalds #include <linux/mm.h>
251da177e4SLinus Torvalds #include <linux/slab.h>
261da177e4SLinus Torvalds #include <linux/pagemap.h>
271da177e4SLinus Torvalds #include <linux/sunrpc/clnt.h>
281da177e4SLinus Torvalds #include <linux/nfs_fs.h>
291da177e4SLinus Torvalds #include <linux/nfs_page.h>
301da177e4SLinus Torvalds #include <linux/smp_lock.h>
311da177e4SLinus Torvalds 
321da177e4SLinus Torvalds #include <asm/system.h>
331da177e4SLinus Torvalds 
3491d5b470SChuck Lever #include "iostat.h"
3591d5b470SChuck Lever 
361da177e4SLinus Torvalds #define NFSDBG_FACILITY		NFSDBG_PAGECACHE
371da177e4SLinus Torvalds 
381da177e4SLinus Torvalds static int nfs_pagein_one(struct list_head *, struct inode *);
391da177e4SLinus Torvalds static void nfs_readpage_result_partial(struct nfs_read_data *, int);
401da177e4SLinus Torvalds static void nfs_readpage_result_full(struct nfs_read_data *, int);
411da177e4SLinus Torvalds 
421da177e4SLinus Torvalds static kmem_cache_t *nfs_rdata_cachep;
431da177e4SLinus Torvalds mempool_t *nfs_rdata_mempool;
441da177e4SLinus Torvalds 
451da177e4SLinus Torvalds #define MIN_POOL_READ	(32)
461da177e4SLinus Torvalds 
/*
 * Release callback taking an opaque pointer: the read descriptor behind
 * @data is handed straight to nfs_readdata_free().
 */
void nfs_readdata_release(void *data)
{
	struct nfs_read_data *rdata = data;

	nfs_readdata_free(rdata);
}
511da177e4SLinus Torvalds 
521da177e4SLinus Torvalds static
531da177e4SLinus Torvalds unsigned int nfs_page_length(struct inode *inode, struct page *page)
541da177e4SLinus Torvalds {
551da177e4SLinus Torvalds 	loff_t i_size = i_size_read(inode);
561da177e4SLinus Torvalds 	unsigned long idx;
571da177e4SLinus Torvalds 
581da177e4SLinus Torvalds 	if (i_size <= 0)
591da177e4SLinus Torvalds 		return 0;
601da177e4SLinus Torvalds 	idx = (i_size - 1) >> PAGE_CACHE_SHIFT;
611da177e4SLinus Torvalds 	if (page->index > idx)
621da177e4SLinus Torvalds 		return 0;
631da177e4SLinus Torvalds 	if (page->index != idx)
641da177e4SLinus Torvalds 		return PAGE_CACHE_SIZE;
651da177e4SLinus Torvalds 	return 1 + ((i_size - 1) & (PAGE_CACHE_SIZE - 1));
661da177e4SLinus Torvalds }
671da177e4SLinus Torvalds 
681da177e4SLinus Torvalds static
691da177e4SLinus Torvalds int nfs_return_empty_page(struct page *page)
701da177e4SLinus Torvalds {
711da177e4SLinus Torvalds 	memclear_highpage_flush(page, 0, PAGE_CACHE_SIZE);
721da177e4SLinus Torvalds 	SetPageUptodate(page);
731da177e4SLinus Torvalds 	unlock_page(page);
741da177e4SLinus Torvalds 	return 0;
751da177e4SLinus Torvalds }
761da177e4SLinus Torvalds 
771da177e4SLinus Torvalds /*
781da177e4SLinus Torvalds  * Read a page synchronously.
791da177e4SLinus Torvalds  */
801da177e4SLinus Torvalds static int nfs_readpage_sync(struct nfs_open_context *ctx, struct inode *inode,
811da177e4SLinus Torvalds 		struct page *page)
821da177e4SLinus Torvalds {
831da177e4SLinus Torvalds 	unsigned int	rsize = NFS_SERVER(inode)->rsize;
841da177e4SLinus Torvalds 	unsigned int	count = PAGE_CACHE_SIZE;
851da177e4SLinus Torvalds 	int		result;
861da177e4SLinus Torvalds 	struct nfs_read_data *rdata;
871da177e4SLinus Torvalds 
8840859d7eSChuck Lever 	rdata = nfs_readdata_alloc(1);
891da177e4SLinus Torvalds 	if (!rdata)
901da177e4SLinus Torvalds 		return -ENOMEM;
911da177e4SLinus Torvalds 
921da177e4SLinus Torvalds 	memset(rdata, 0, sizeof(*rdata));
931da177e4SLinus Torvalds 	rdata->flags = (IS_SWAPFILE(inode)? NFS_RPC_SWAPFLAGS : 0);
941da177e4SLinus Torvalds 	rdata->cred = ctx->cred;
951da177e4SLinus Torvalds 	rdata->inode = inode;
961da177e4SLinus Torvalds 	INIT_LIST_HEAD(&rdata->pages);
971da177e4SLinus Torvalds 	rdata->args.fh = NFS_FH(inode);
981da177e4SLinus Torvalds 	rdata->args.context = ctx;
991da177e4SLinus Torvalds 	rdata->args.pages = &page;
1001da177e4SLinus Torvalds 	rdata->args.pgbase = 0UL;
1011da177e4SLinus Torvalds 	rdata->args.count = rsize;
1021da177e4SLinus Torvalds 	rdata->res.fattr = &rdata->fattr;
1031da177e4SLinus Torvalds 
1041da177e4SLinus Torvalds 	dprintk("NFS: nfs_readpage_sync(%p)\n", page);
1051da177e4SLinus Torvalds 
1061da177e4SLinus Torvalds 	/*
1071da177e4SLinus Torvalds 	 * This works now because the socket layer never tries to DMA
1081da177e4SLinus Torvalds 	 * into this buffer directly.
1091da177e4SLinus Torvalds 	 */
1101da177e4SLinus Torvalds 	do {
1111da177e4SLinus Torvalds 		if (count < rsize)
1121da177e4SLinus Torvalds 			rdata->args.count = count;
1131da177e4SLinus Torvalds 		rdata->res.count = rdata->args.count;
1141da177e4SLinus Torvalds 		rdata->args.offset = page_offset(page) + rdata->args.pgbase;
1151da177e4SLinus Torvalds 
1161da177e4SLinus Torvalds 		dprintk("NFS: nfs_proc_read(%s, (%s/%Ld), %Lu, %u)\n",
1171da177e4SLinus Torvalds 			NFS_SERVER(inode)->hostname,
1181da177e4SLinus Torvalds 			inode->i_sb->s_id,
1191da177e4SLinus Torvalds 			(long long)NFS_FILEID(inode),
1201da177e4SLinus Torvalds 			(unsigned long long)rdata->args.pgbase,
1211da177e4SLinus Torvalds 			rdata->args.count);
1221da177e4SLinus Torvalds 
1231da177e4SLinus Torvalds 		lock_kernel();
1241da177e4SLinus Torvalds 		result = NFS_PROTO(inode)->read(rdata);
1251da177e4SLinus Torvalds 		unlock_kernel();
1261da177e4SLinus Torvalds 
1271da177e4SLinus Torvalds 		/*
1281da177e4SLinus Torvalds 		 * Even if we had a partial success we can't mark the page
1291da177e4SLinus Torvalds 		 * cache valid.
1301da177e4SLinus Torvalds 		 */
1311da177e4SLinus Torvalds 		if (result < 0) {
1321da177e4SLinus Torvalds 			if (result == -EISDIR)
1331da177e4SLinus Torvalds 				result = -EINVAL;
1341da177e4SLinus Torvalds 			goto io_error;
1351da177e4SLinus Torvalds 		}
1361da177e4SLinus Torvalds 		count -= result;
1371da177e4SLinus Torvalds 		rdata->args.pgbase += result;
13891d5b470SChuck Lever 		nfs_add_stats(inode, NFSIOS_SERVERREADBYTES, result);
13991d5b470SChuck Lever 
1401da177e4SLinus Torvalds 		/* Note: result == 0 should only happen if we're caching
1411da177e4SLinus Torvalds 		 * a write that extends the file and punches a hole.
1421da177e4SLinus Torvalds 		 */
1431da177e4SLinus Torvalds 		if (rdata->res.eof != 0 || result == 0)
1441da177e4SLinus Torvalds 			break;
1451da177e4SLinus Torvalds 	} while (count);
146dc59250cSChuck Lever 	spin_lock(&inode->i_lock);
14755296809SChuck Lever 	NFS_I(inode)->cache_validity |= NFS_INO_INVALID_ATIME;
148dc59250cSChuck Lever 	spin_unlock(&inode->i_lock);
1491da177e4SLinus Torvalds 
1501da177e4SLinus Torvalds 	if (count)
1511da177e4SLinus Torvalds 		memclear_highpage_flush(page, rdata->args.pgbase, count);
1521da177e4SLinus Torvalds 	SetPageUptodate(page);
1531da177e4SLinus Torvalds 	if (PageError(page))
1541da177e4SLinus Torvalds 		ClearPageError(page);
1551da177e4SLinus Torvalds 	result = 0;
1561da177e4SLinus Torvalds 
1571da177e4SLinus Torvalds io_error:
1581da177e4SLinus Torvalds 	unlock_page(page);
1591da177e4SLinus Torvalds 	nfs_readdata_free(rdata);
1601da177e4SLinus Torvalds 	return result;
1611da177e4SLinus Torvalds }
1621da177e4SLinus Torvalds 
1631da177e4SLinus Torvalds static int nfs_readpage_async(struct nfs_open_context *ctx, struct inode *inode,
1641da177e4SLinus Torvalds 		struct page *page)
1651da177e4SLinus Torvalds {
1661da177e4SLinus Torvalds 	LIST_HEAD(one_request);
1671da177e4SLinus Torvalds 	struct nfs_page	*new;
1681da177e4SLinus Torvalds 	unsigned int len;
1691da177e4SLinus Torvalds 
1701da177e4SLinus Torvalds 	len = nfs_page_length(inode, page);
1711da177e4SLinus Torvalds 	if (len == 0)
1721da177e4SLinus Torvalds 		return nfs_return_empty_page(page);
1731da177e4SLinus Torvalds 	new = nfs_create_request(ctx, inode, page, 0, len);
1741da177e4SLinus Torvalds 	if (IS_ERR(new)) {
1751da177e4SLinus Torvalds 		unlock_page(page);
1761da177e4SLinus Torvalds 		return PTR_ERR(new);
1771da177e4SLinus Torvalds 	}
1781da177e4SLinus Torvalds 	if (len < PAGE_CACHE_SIZE)
1791da177e4SLinus Torvalds 		memclear_highpage_flush(page, len, PAGE_CACHE_SIZE - len);
1801da177e4SLinus Torvalds 
1811da177e4SLinus Torvalds 	nfs_list_add_request(new, &one_request);
1821da177e4SLinus Torvalds 	nfs_pagein_one(&one_request, inode);
1831da177e4SLinus Torvalds 	return 0;
1841da177e4SLinus Torvalds }
1851da177e4SLinus Torvalds 
1861da177e4SLinus Torvalds static void nfs_readpage_release(struct nfs_page *req)
1871da177e4SLinus Torvalds {
1881da177e4SLinus Torvalds 	unlock_page(req->wb_page);
1891da177e4SLinus Torvalds 
1901da177e4SLinus Torvalds 	dprintk("NFS: read done (%s/%Ld %d@%Ld)\n",
1911da177e4SLinus Torvalds 			req->wb_context->dentry->d_inode->i_sb->s_id,
1921da177e4SLinus Torvalds 			(long long)NFS_FILEID(req->wb_context->dentry->d_inode),
1931da177e4SLinus Torvalds 			req->wb_bytes,
1941da177e4SLinus Torvalds 			(long long)req_offset(req));
19510d2c46fSNick Wilson 	nfs_clear_request(req);
19610d2c46fSNick Wilson 	nfs_release_request(req);
1971da177e4SLinus Torvalds }
1981da177e4SLinus Torvalds 
1991da177e4SLinus Torvalds /*
2001da177e4SLinus Torvalds  * Set up the NFS read request struct
2011da177e4SLinus Torvalds  */
2021da177e4SLinus Torvalds static void nfs_read_rpcsetup(struct nfs_page *req, struct nfs_read_data *data,
2031da177e4SLinus Torvalds 		unsigned int count, unsigned int offset)
2041da177e4SLinus Torvalds {
2051da177e4SLinus Torvalds 	struct inode		*inode;
2061da177e4SLinus Torvalds 
2071da177e4SLinus Torvalds 	data->req	  = req;
2081da177e4SLinus Torvalds 	data->inode	  = inode = req->wb_context->dentry->d_inode;
2091da177e4SLinus Torvalds 	data->cred	  = req->wb_context->cred;
2101da177e4SLinus Torvalds 
2111da177e4SLinus Torvalds 	data->args.fh     = NFS_FH(inode);
2121da177e4SLinus Torvalds 	data->args.offset = req_offset(req) + offset;
2131da177e4SLinus Torvalds 	data->args.pgbase = req->wb_pgbase + offset;
2141da177e4SLinus Torvalds 	data->args.pages  = data->pagevec;
2151da177e4SLinus Torvalds 	data->args.count  = count;
2161da177e4SLinus Torvalds 	data->args.context = req->wb_context;
2171da177e4SLinus Torvalds 
2181da177e4SLinus Torvalds 	data->res.fattr   = &data->fattr;
2191da177e4SLinus Torvalds 	data->res.count   = count;
2201da177e4SLinus Torvalds 	data->res.eof     = 0;
2210e574af1STrond Myklebust 	nfs_fattr_init(&data->fattr);
2221da177e4SLinus Torvalds 
2231da177e4SLinus Torvalds 	NFS_PROTO(inode)->read_setup(data);
2241da177e4SLinus Torvalds 
2251da177e4SLinus Torvalds 	data->task.tk_cookie = (unsigned long)inode;
2261da177e4SLinus Torvalds 
2271da177e4SLinus Torvalds 	dprintk("NFS: %4d initiated read call (req %s/%Ld, %u bytes @ offset %Lu)\n",
2281da177e4SLinus Torvalds 			data->task.tk_pid,
2291da177e4SLinus Torvalds 			inode->i_sb->s_id,
2301da177e4SLinus Torvalds 			(long long)NFS_FILEID(inode),
2311da177e4SLinus Torvalds 			count,
2321da177e4SLinus Torvalds 			(unsigned long long)data->args.offset);
2331da177e4SLinus Torvalds }
2341da177e4SLinus Torvalds 
2351da177e4SLinus Torvalds static void
2361da177e4SLinus Torvalds nfs_async_read_error(struct list_head *head)
2371da177e4SLinus Torvalds {
2381da177e4SLinus Torvalds 	struct nfs_page	*req;
2391da177e4SLinus Torvalds 
2401da177e4SLinus Torvalds 	while (!list_empty(head)) {
2411da177e4SLinus Torvalds 		req = nfs_list_entry(head->next);
2421da177e4SLinus Torvalds 		nfs_list_remove_request(req);
2431da177e4SLinus Torvalds 		SetPageError(req->wb_page);
2441da177e4SLinus Torvalds 		nfs_readpage_release(req);
2451da177e4SLinus Torvalds 	}
2461da177e4SLinus Torvalds }
2471da177e4SLinus Torvalds 
2481da177e4SLinus Torvalds /*
2491da177e4SLinus Torvalds  * Start an async read operation
2501da177e4SLinus Torvalds  */
2511da177e4SLinus Torvalds static void nfs_execute_read(struct nfs_read_data *data)
2521da177e4SLinus Torvalds {
2531da177e4SLinus Torvalds 	struct rpc_clnt *clnt = NFS_CLIENT(data->inode);
2541da177e4SLinus Torvalds 	sigset_t oldset;
2551da177e4SLinus Torvalds 
2561da177e4SLinus Torvalds 	rpc_clnt_sigmask(clnt, &oldset);
2571da177e4SLinus Torvalds 	lock_kernel();
2581da177e4SLinus Torvalds 	rpc_execute(&data->task);
2591da177e4SLinus Torvalds 	unlock_kernel();
2601da177e4SLinus Torvalds 	rpc_clnt_sigunmask(clnt, &oldset);
2611da177e4SLinus Torvalds }
2621da177e4SLinus Torvalds 
2631da177e4SLinus Torvalds /*
2641da177e4SLinus Torvalds  * Generate multiple requests to fill a single page.
2651da177e4SLinus Torvalds  *
2661da177e4SLinus Torvalds  * We optimize to reduce the number of read operations on the wire.  If we
2671da177e4SLinus Torvalds  * detect that we're reading a page, or an area of a page, that is past the
2681da177e4SLinus Torvalds  * end of file, we do not generate NFS read operations but just clear the
2691da177e4SLinus Torvalds  * parts of the page that would have come back zero from the server anyway.
2701da177e4SLinus Torvalds  *
2711da177e4SLinus Torvalds  * We rely on the cached value of i_size to make this determination; another
2721da177e4SLinus Torvalds  * client can fill pages on the server past our cached end-of-file, but we
2731da177e4SLinus Torvalds  * won't see the new data until our attribute cache is updated.  This is more
2741da177e4SLinus Torvalds  * or less conventional NFS client behavior.
2751da177e4SLinus Torvalds  */
2761da177e4SLinus Torvalds static int nfs_pagein_multi(struct list_head *head, struct inode *inode)
2771da177e4SLinus Torvalds {
2781da177e4SLinus Torvalds 	struct nfs_page *req = nfs_list_entry(head->next);
2791da177e4SLinus Torvalds 	struct page *page = req->wb_page;
2801da177e4SLinus Torvalds 	struct nfs_read_data *data;
2811da177e4SLinus Torvalds 	unsigned int rsize = NFS_SERVER(inode)->rsize;
2821da177e4SLinus Torvalds 	unsigned int nbytes, offset;
2831da177e4SLinus Torvalds 	int requests = 0;
2841da177e4SLinus Torvalds 	LIST_HEAD(list);
2851da177e4SLinus Torvalds 
2861da177e4SLinus Torvalds 	nfs_list_remove_request(req);
2871da177e4SLinus Torvalds 
2881da177e4SLinus Torvalds 	nbytes = req->wb_bytes;
2891da177e4SLinus Torvalds 	for(;;) {
29040859d7eSChuck Lever 		data = nfs_readdata_alloc(1);
2911da177e4SLinus Torvalds 		if (!data)
2921da177e4SLinus Torvalds 			goto out_bad;
2931da177e4SLinus Torvalds 		INIT_LIST_HEAD(&data->pages);
2941da177e4SLinus Torvalds 		list_add(&data->pages, &list);
2951da177e4SLinus Torvalds 		requests++;
2961da177e4SLinus Torvalds 		if (nbytes <= rsize)
2971da177e4SLinus Torvalds 			break;
2981da177e4SLinus Torvalds 		nbytes -= rsize;
2991da177e4SLinus Torvalds 	}
3001da177e4SLinus Torvalds 	atomic_set(&req->wb_complete, requests);
3011da177e4SLinus Torvalds 
3021da177e4SLinus Torvalds 	ClearPageError(page);
3031da177e4SLinus Torvalds 	offset = 0;
3041da177e4SLinus Torvalds 	nbytes = req->wb_bytes;
3051da177e4SLinus Torvalds 	do {
3061da177e4SLinus Torvalds 		data = list_entry(list.next, struct nfs_read_data, pages);
3071da177e4SLinus Torvalds 		list_del_init(&data->pages);
3081da177e4SLinus Torvalds 
3091da177e4SLinus Torvalds 		data->pagevec[0] = page;
3101da177e4SLinus Torvalds 		data->complete = nfs_readpage_result_partial;
3111da177e4SLinus Torvalds 
3121da177e4SLinus Torvalds 		if (nbytes > rsize) {
3131da177e4SLinus Torvalds 			nfs_read_rpcsetup(req, data, rsize, offset);
3141da177e4SLinus Torvalds 			offset += rsize;
3151da177e4SLinus Torvalds 			nbytes -= rsize;
3161da177e4SLinus Torvalds 		} else {
3171da177e4SLinus Torvalds 			nfs_read_rpcsetup(req, data, nbytes, offset);
3181da177e4SLinus Torvalds 			nbytes = 0;
3191da177e4SLinus Torvalds 		}
3201da177e4SLinus Torvalds 		nfs_execute_read(data);
3211da177e4SLinus Torvalds 	} while (nbytes != 0);
3221da177e4SLinus Torvalds 
3231da177e4SLinus Torvalds 	return 0;
3241da177e4SLinus Torvalds 
3251da177e4SLinus Torvalds out_bad:
3261da177e4SLinus Torvalds 	while (!list_empty(&list)) {
3271da177e4SLinus Torvalds 		data = list_entry(list.next, struct nfs_read_data, pages);
3281da177e4SLinus Torvalds 		list_del(&data->pages);
3291da177e4SLinus Torvalds 		nfs_readdata_free(data);
3301da177e4SLinus Torvalds 	}
3311da177e4SLinus Torvalds 	SetPageError(page);
3321da177e4SLinus Torvalds 	nfs_readpage_release(req);
3331da177e4SLinus Torvalds 	return -ENOMEM;
3341da177e4SLinus Torvalds }
3351da177e4SLinus Torvalds 
3361da177e4SLinus Torvalds static int nfs_pagein_one(struct list_head *head, struct inode *inode)
3371da177e4SLinus Torvalds {
3381da177e4SLinus Torvalds 	struct nfs_page		*req;
3391da177e4SLinus Torvalds 	struct page		**pages;
3401da177e4SLinus Torvalds 	struct nfs_read_data	*data;
3411da177e4SLinus Torvalds 	unsigned int		count;
3421da177e4SLinus Torvalds 
3431da177e4SLinus Torvalds 	if (NFS_SERVER(inode)->rsize < PAGE_CACHE_SIZE)
3441da177e4SLinus Torvalds 		return nfs_pagein_multi(head, inode);
3451da177e4SLinus Torvalds 
34640859d7eSChuck Lever 	data = nfs_readdata_alloc(NFS_SERVER(inode)->rpages);
3471da177e4SLinus Torvalds 	if (!data)
3481da177e4SLinus Torvalds 		goto out_bad;
3491da177e4SLinus Torvalds 
3501da177e4SLinus Torvalds 	INIT_LIST_HEAD(&data->pages);
3511da177e4SLinus Torvalds 	pages = data->pagevec;
3521da177e4SLinus Torvalds 	count = 0;
3531da177e4SLinus Torvalds 	while (!list_empty(head)) {
3541da177e4SLinus Torvalds 		req = nfs_list_entry(head->next);
3551da177e4SLinus Torvalds 		nfs_list_remove_request(req);
3561da177e4SLinus Torvalds 		nfs_list_add_request(req, &data->pages);
3571da177e4SLinus Torvalds 		ClearPageError(req->wb_page);
3581da177e4SLinus Torvalds 		*pages++ = req->wb_page;
3591da177e4SLinus Torvalds 		count += req->wb_bytes;
3601da177e4SLinus Torvalds 	}
3611da177e4SLinus Torvalds 	req = nfs_list_entry(data->pages.next);
3621da177e4SLinus Torvalds 
3631da177e4SLinus Torvalds 	data->complete = nfs_readpage_result_full;
3641da177e4SLinus Torvalds 	nfs_read_rpcsetup(req, data, count, 0);
3651da177e4SLinus Torvalds 
3661da177e4SLinus Torvalds 	nfs_execute_read(data);
3671da177e4SLinus Torvalds 	return 0;
3681da177e4SLinus Torvalds out_bad:
3691da177e4SLinus Torvalds 	nfs_async_read_error(head);
3701da177e4SLinus Torvalds 	return -ENOMEM;
3711da177e4SLinus Torvalds }
3721da177e4SLinus Torvalds 
3731da177e4SLinus Torvalds static int
3741da177e4SLinus Torvalds nfs_pagein_list(struct list_head *head, int rpages)
3751da177e4SLinus Torvalds {
3761da177e4SLinus Torvalds 	LIST_HEAD(one_request);
3771da177e4SLinus Torvalds 	struct nfs_page		*req;
3781da177e4SLinus Torvalds 	int			error = 0;
3791da177e4SLinus Torvalds 	unsigned int		pages = 0;
3801da177e4SLinus Torvalds 
3811da177e4SLinus Torvalds 	while (!list_empty(head)) {
3821da177e4SLinus Torvalds 		pages += nfs_coalesce_requests(head, &one_request, rpages);
3831da177e4SLinus Torvalds 		req = nfs_list_entry(one_request.next);
3841da177e4SLinus Torvalds 		error = nfs_pagein_one(&one_request, req->wb_context->dentry->d_inode);
3851da177e4SLinus Torvalds 		if (error < 0)
3861da177e4SLinus Torvalds 			break;
3871da177e4SLinus Torvalds 	}
3881da177e4SLinus Torvalds 	if (error >= 0)
3891da177e4SLinus Torvalds 		return pages;
3901da177e4SLinus Torvalds 
3911da177e4SLinus Torvalds 	nfs_async_read_error(head);
3921da177e4SLinus Torvalds 	return error;
3931da177e4SLinus Torvalds }
3941da177e4SLinus Torvalds 
3951da177e4SLinus Torvalds /*
3961da177e4SLinus Torvalds  * Handle a read reply that fills part of a page.
3971da177e4SLinus Torvalds  */
3981da177e4SLinus Torvalds static void nfs_readpage_result_partial(struct nfs_read_data *data, int status)
3991da177e4SLinus Torvalds {
4001da177e4SLinus Torvalds 	struct nfs_page *req = data->req;
4011da177e4SLinus Torvalds 	struct page *page = req->wb_page;
4021da177e4SLinus Torvalds 
4031da177e4SLinus Torvalds 	if (status >= 0) {
4041da177e4SLinus Torvalds 		unsigned int request = data->args.count;
4051da177e4SLinus Torvalds 		unsigned int result = data->res.count;
4061da177e4SLinus Torvalds 
4071da177e4SLinus Torvalds 		if (result < request) {
4081da177e4SLinus Torvalds 			memclear_highpage_flush(page,
4091da177e4SLinus Torvalds 						data->args.pgbase + result,
4101da177e4SLinus Torvalds 						request - result);
4111da177e4SLinus Torvalds 		}
4121da177e4SLinus Torvalds 	} else
4131da177e4SLinus Torvalds 		SetPageError(page);
4141da177e4SLinus Torvalds 
4151da177e4SLinus Torvalds 	if (atomic_dec_and_test(&req->wb_complete)) {
4161da177e4SLinus Torvalds 		if (!PageError(page))
4171da177e4SLinus Torvalds 			SetPageUptodate(page);
4181da177e4SLinus Torvalds 		nfs_readpage_release(req);
4191da177e4SLinus Torvalds 	}
4201da177e4SLinus Torvalds }
4211da177e4SLinus Torvalds 
4221da177e4SLinus Torvalds /*
4231da177e4SLinus Torvalds  * This is the callback from RPC telling us whether a reply was
4241da177e4SLinus Torvalds  * received or some error occurred (timeout or socket shutdown).
4251da177e4SLinus Torvalds  */
4261da177e4SLinus Torvalds static void nfs_readpage_result_full(struct nfs_read_data *data, int status)
4271da177e4SLinus Torvalds {
4281da177e4SLinus Torvalds 	unsigned int count = data->res.count;
4291da177e4SLinus Torvalds 
4301da177e4SLinus Torvalds 	while (!list_empty(&data->pages)) {
4311da177e4SLinus Torvalds 		struct nfs_page *req = nfs_list_entry(data->pages.next);
4321da177e4SLinus Torvalds 		struct page *page = req->wb_page;
4331da177e4SLinus Torvalds 		nfs_list_remove_request(req);
4341da177e4SLinus Torvalds 
4351da177e4SLinus Torvalds 		if (status >= 0) {
4361da177e4SLinus Torvalds 			if (count < PAGE_CACHE_SIZE) {
4371da177e4SLinus Torvalds 				if (count < req->wb_bytes)
4381da177e4SLinus Torvalds 					memclear_highpage_flush(page,
4391da177e4SLinus Torvalds 							req->wb_pgbase + count,
4401da177e4SLinus Torvalds 							req->wb_bytes - count);
4411da177e4SLinus Torvalds 				count = 0;
4421da177e4SLinus Torvalds 			} else
4431da177e4SLinus Torvalds 				count -= PAGE_CACHE_SIZE;
4441da177e4SLinus Torvalds 			SetPageUptodate(page);
4451da177e4SLinus Torvalds 		} else
4461da177e4SLinus Torvalds 			SetPageError(page);
4471da177e4SLinus Torvalds 		nfs_readpage_release(req);
4481da177e4SLinus Torvalds 	}
4491da177e4SLinus Torvalds }
4501da177e4SLinus Torvalds 
4511da177e4SLinus Torvalds /*
4521da177e4SLinus Torvalds  * This is the callback from RPC telling us whether a reply was
4531da177e4SLinus Torvalds  * received or some error occurred (timeout or socket shutdown).
4541da177e4SLinus Torvalds  */
455963d8fe5STrond Myklebust void nfs_readpage_result(struct rpc_task *task, void *calldata)
4561da177e4SLinus Torvalds {
457963d8fe5STrond Myklebust 	struct nfs_read_data *data = calldata;
4581da177e4SLinus Torvalds 	struct nfs_readargs *argp = &data->args;
4591da177e4SLinus Torvalds 	struct nfs_readres *resp = &data->res;
4601da177e4SLinus Torvalds 	int status = task->tk_status;
4611da177e4SLinus Torvalds 
4621da177e4SLinus Torvalds 	dprintk("NFS: %4d nfs_readpage_result, (status %d)\n",
4631da177e4SLinus Torvalds 		task->tk_pid, status);
4641da177e4SLinus Torvalds 
46591d5b470SChuck Lever 	nfs_add_stats(data->inode, NFSIOS_SERVERREADBYTES, resp->count);
46691d5b470SChuck Lever 
4671da177e4SLinus Torvalds 	/* Is this a short read? */
4681da177e4SLinus Torvalds 	if (task->tk_status >= 0 && resp->count < argp->count && !resp->eof) {
46991d5b470SChuck Lever 		nfs_inc_stats(data->inode, NFSIOS_SHORTREAD);
4701da177e4SLinus Torvalds 		/* Has the server at least made some progress? */
4711da177e4SLinus Torvalds 		if (resp->count != 0) {
4721da177e4SLinus Torvalds 			/* Yes, so retry the read at the end of the data */
4731da177e4SLinus Torvalds 			argp->offset += resp->count;
4741da177e4SLinus Torvalds 			argp->pgbase += resp->count;
4751da177e4SLinus Torvalds 			argp->count -= resp->count;
4761da177e4SLinus Torvalds 			rpc_restart_call(task);
4771da177e4SLinus Torvalds 			return;
4781da177e4SLinus Torvalds 		}
4791da177e4SLinus Torvalds 		task->tk_status = -EIO;
4801da177e4SLinus Torvalds 	}
481dc59250cSChuck Lever 	spin_lock(&data->inode->i_lock);
48255296809SChuck Lever 	NFS_I(data->inode)->cache_validity |= NFS_INO_INVALID_ATIME;
483dc59250cSChuck Lever 	spin_unlock(&data->inode->i_lock);
4841da177e4SLinus Torvalds 	data->complete(data, status);
4851da177e4SLinus Torvalds }
4861da177e4SLinus Torvalds 
4871da177e4SLinus Torvalds /*
4881da177e4SLinus Torvalds  * Read a page over NFS.
4891da177e4SLinus Torvalds  * We read the page synchronously in the following case:
4901da177e4SLinus Torvalds  *  -	The error flag is set for this page. This happens only when a
4911da177e4SLinus Torvalds  *	previous async read operation failed.
4921da177e4SLinus Torvalds  */
4931da177e4SLinus Torvalds int nfs_readpage(struct file *file, struct page *page)
4941da177e4SLinus Torvalds {
4951da177e4SLinus Torvalds 	struct nfs_open_context *ctx;
4961da177e4SLinus Torvalds 	struct inode *inode = page->mapping->host;
4971da177e4SLinus Torvalds 	int		error;
4981da177e4SLinus Torvalds 
4991da177e4SLinus Torvalds 	dprintk("NFS: nfs_readpage (%p %ld@%lu)\n",
5001da177e4SLinus Torvalds 		page, PAGE_CACHE_SIZE, page->index);
50191d5b470SChuck Lever 	nfs_inc_stats(inode, NFSIOS_VFSREADPAGE);
50291d5b470SChuck Lever 	nfs_add_stats(inode, NFSIOS_READPAGES, 1);
50391d5b470SChuck Lever 
5041da177e4SLinus Torvalds 	/*
5051da177e4SLinus Torvalds 	 * Try to flush any pending writes to the file..
5061da177e4SLinus Torvalds 	 *
5071da177e4SLinus Torvalds 	 * NOTE! Because we own the page lock, there cannot
5081da177e4SLinus Torvalds 	 * be any new pending writes generated at this point
5091da177e4SLinus Torvalds 	 * for this page (other pages can be written to).
5101da177e4SLinus Torvalds 	 */
5111da177e4SLinus Torvalds 	error = nfs_wb_page(inode, page);
5121da177e4SLinus Torvalds 	if (error)
5131da177e4SLinus Torvalds 		goto out_error;
5141da177e4SLinus Torvalds 
5151da177e4SLinus Torvalds 	if (file == NULL) {
516d530838bSTrond Myklebust 		ctx = nfs_find_open_context(inode, NULL, FMODE_READ);
5171da177e4SLinus Torvalds 		if (ctx == NULL)
5181da177e4SLinus Torvalds 			return -EBADF;
5191da177e4SLinus Torvalds 	} else
5201da177e4SLinus Torvalds 		ctx = get_nfs_open_context((struct nfs_open_context *)
5211da177e4SLinus Torvalds 				file->private_data);
5221da177e4SLinus Torvalds 	if (!IS_SYNC(inode)) {
5231da177e4SLinus Torvalds 		error = nfs_readpage_async(ctx, inode, page);
5241da177e4SLinus Torvalds 		goto out;
5251da177e4SLinus Torvalds 	}
5261da177e4SLinus Torvalds 
5271da177e4SLinus Torvalds 	error = nfs_readpage_sync(ctx, inode, page);
5281da177e4SLinus Torvalds 	if (error < 0 && IS_SWAPFILE(inode))
5291da177e4SLinus Torvalds 		printk("Aiee.. nfs swap-in of page failed!\n");
5301da177e4SLinus Torvalds out:
5311da177e4SLinus Torvalds 	put_nfs_open_context(ctx);
5321da177e4SLinus Torvalds 	return error;
5331da177e4SLinus Torvalds 
5341da177e4SLinus Torvalds out_error:
5351da177e4SLinus Torvalds 	unlock_page(page);
5361da177e4SLinus Torvalds 	return error;
5371da177e4SLinus Torvalds }
5381da177e4SLinus Torvalds 
/*
 * Context passed through read_cache_pages() to readpage_async_filler().
 */
struct nfs_readdesc {
	struct list_head *head;		/* list the new read requests are added to */
	struct nfs_open_context *ctx;	/* open context used to create the requests */
};
5431da177e4SLinus Torvalds 
5441da177e4SLinus Torvalds static int
5451da177e4SLinus Torvalds readpage_async_filler(void *data, struct page *page)
5461da177e4SLinus Torvalds {
5471da177e4SLinus Torvalds 	struct nfs_readdesc *desc = (struct nfs_readdesc *)data;
5481da177e4SLinus Torvalds 	struct inode *inode = page->mapping->host;
5491da177e4SLinus Torvalds 	struct nfs_page *new;
5501da177e4SLinus Torvalds 	unsigned int len;
5511da177e4SLinus Torvalds 
5521da177e4SLinus Torvalds 	nfs_wb_page(inode, page);
5531da177e4SLinus Torvalds 	len = nfs_page_length(inode, page);
5541da177e4SLinus Torvalds 	if (len == 0)
5551da177e4SLinus Torvalds 		return nfs_return_empty_page(page);
5561da177e4SLinus Torvalds 	new = nfs_create_request(desc->ctx, inode, page, 0, len);
5571da177e4SLinus Torvalds 	if (IS_ERR(new)) {
5581da177e4SLinus Torvalds 			SetPageError(page);
5591da177e4SLinus Torvalds 			unlock_page(page);
5601da177e4SLinus Torvalds 			return PTR_ERR(new);
5611da177e4SLinus Torvalds 	}
5621da177e4SLinus Torvalds 	if (len < PAGE_CACHE_SIZE)
5631da177e4SLinus Torvalds 		memclear_highpage_flush(page, len, PAGE_CACHE_SIZE - len);
5641da177e4SLinus Torvalds 	nfs_list_add_request(new, desc->head);
5651da177e4SLinus Torvalds 	return 0;
5661da177e4SLinus Torvalds }
5671da177e4SLinus Torvalds 
5681da177e4SLinus Torvalds int nfs_readpages(struct file *filp, struct address_space *mapping,
5691da177e4SLinus Torvalds 		struct list_head *pages, unsigned nr_pages)
5701da177e4SLinus Torvalds {
5711da177e4SLinus Torvalds 	LIST_HEAD(head);
5721da177e4SLinus Torvalds 	struct nfs_readdesc desc = {
5731da177e4SLinus Torvalds 		.head		= &head,
5741da177e4SLinus Torvalds 	};
5751da177e4SLinus Torvalds 	struct inode *inode = mapping->host;
5761da177e4SLinus Torvalds 	struct nfs_server *server = NFS_SERVER(inode);
5771da177e4SLinus Torvalds 	int ret;
5781da177e4SLinus Torvalds 
5791da177e4SLinus Torvalds 	dprintk("NFS: nfs_readpages (%s/%Ld %d)\n",
5801da177e4SLinus Torvalds 			inode->i_sb->s_id,
5811da177e4SLinus Torvalds 			(long long)NFS_FILEID(inode),
5821da177e4SLinus Torvalds 			nr_pages);
58391d5b470SChuck Lever 	nfs_inc_stats(inode, NFSIOS_VFSREADPAGES);
5841da177e4SLinus Torvalds 
5851da177e4SLinus Torvalds 	if (filp == NULL) {
586d530838bSTrond Myklebust 		desc.ctx = nfs_find_open_context(inode, NULL, FMODE_READ);
5871da177e4SLinus Torvalds 		if (desc.ctx == NULL)
5881da177e4SLinus Torvalds 			return -EBADF;
5891da177e4SLinus Torvalds 	} else
5901da177e4SLinus Torvalds 		desc.ctx = get_nfs_open_context((struct nfs_open_context *)
5911da177e4SLinus Torvalds 				filp->private_data);
5921da177e4SLinus Torvalds 	ret = read_cache_pages(mapping, pages, readpage_async_filler, &desc);
5931da177e4SLinus Torvalds 	if (!list_empty(&head)) {
5941da177e4SLinus Torvalds 		int err = nfs_pagein_list(&head, server->rpages);
5951da177e4SLinus Torvalds 		if (!ret)
59691d5b470SChuck Lever 			nfs_add_stats(inode, NFSIOS_READPAGES, err);
5971da177e4SLinus Torvalds 			ret = err;
5981da177e4SLinus Torvalds 	}
5991da177e4SLinus Torvalds 	put_nfs_open_context(desc.ctx);
6001da177e4SLinus Torvalds 	return ret;
6011da177e4SLinus Torvalds }
6021da177e4SLinus Torvalds 
6031da177e4SLinus Torvalds int nfs_init_readpagecache(void)
6041da177e4SLinus Torvalds {
6051da177e4SLinus Torvalds 	nfs_rdata_cachep = kmem_cache_create("nfs_read_data",
6061da177e4SLinus Torvalds 					     sizeof(struct nfs_read_data),
6071da177e4SLinus Torvalds 					     0, SLAB_HWCACHE_ALIGN,
6081da177e4SLinus Torvalds 					     NULL, NULL);
6091da177e4SLinus Torvalds 	if (nfs_rdata_cachep == NULL)
6101da177e4SLinus Torvalds 		return -ENOMEM;
6111da177e4SLinus Torvalds 
6121da177e4SLinus Torvalds 	nfs_rdata_mempool = mempool_create(MIN_POOL_READ,
6131da177e4SLinus Torvalds 					   mempool_alloc_slab,
6141da177e4SLinus Torvalds 					   mempool_free_slab,
6151da177e4SLinus Torvalds 					   nfs_rdata_cachep);
6161da177e4SLinus Torvalds 	if (nfs_rdata_mempool == NULL)
6171da177e4SLinus Torvalds 		return -ENOMEM;
6181da177e4SLinus Torvalds 
6191da177e4SLinus Torvalds 	return 0;
6201da177e4SLinus Torvalds }
6211da177e4SLinus Torvalds 
6221da177e4SLinus Torvalds void nfs_destroy_readpagecache(void)
6231da177e4SLinus Torvalds {
6241da177e4SLinus Torvalds 	mempool_destroy(nfs_rdata_mempool);
6251da177e4SLinus Torvalds 	if (kmem_cache_destroy(nfs_rdata_cachep))
6261da177e4SLinus Torvalds 		printk(KERN_INFO "nfs_read_data: not all structures were freed\n");
6271da177e4SLinus Torvalds }
628