xref: /openbmc/linux/fs/nfs/read.c (revision df3accb849607a86278a37c35e6b313635ccc48b)
/*
 * linux/fs/nfs/read.c
 *
 * Block I/O for NFS
 *
 * Partial copy of Linus' read cache modifications to fs/nfs/file.c
 * modified for async RPC by okir@monad.swb.de
 */
91da177e4SLinus Torvalds 
101da177e4SLinus Torvalds #include <linux/time.h>
111da177e4SLinus Torvalds #include <linux/kernel.h>
121da177e4SLinus Torvalds #include <linux/errno.h>
131da177e4SLinus Torvalds #include <linux/fcntl.h>
141da177e4SLinus Torvalds #include <linux/stat.h>
151da177e4SLinus Torvalds #include <linux/mm.h>
161da177e4SLinus Torvalds #include <linux/slab.h>
171da177e4SLinus Torvalds #include <linux/pagemap.h>
181da177e4SLinus Torvalds #include <linux/sunrpc/clnt.h>
191da177e4SLinus Torvalds #include <linux/nfs_fs.h>
201da177e4SLinus Torvalds #include <linux/nfs_page.h>
2164419a9bSAndy Adamson #include <linux/module.h>
221da177e4SLinus Torvalds 
23f11c88afSAndy Adamson #include "nfs4_fs.h"
2449a70f27STrond Myklebust #include "internal.h"
2591d5b470SChuck Lever #include "iostat.h"
269a9fc1c0SDavid Howells #include "fscache.h"
27fab5fc25SChristoph Hellwig #include "pnfs.h"
288224b273SChuck Lever #include "nfstrace.h"
2991d5b470SChuck Lever 
301da177e4SLinus Torvalds #define NFSDBG_FACILITY		NFSDBG_PAGECACHE
311da177e4SLinus Torvalds 
32061ae2edSFred Isaman static const struct nfs_pgio_completion_ops nfs_async_read_completion_ops;
334a0de55cSAnna Schumaker static const struct nfs_rw_ops nfs_rw_read_ops;
341da177e4SLinus Torvalds 
35e18b890bSChristoph Lameter static struct kmem_cache *nfs_rdata_cachep;
361da177e4SLinus Torvalds 
371e7f3a48SWeston Andros Adamson static struct nfs_pgio_header *nfs_readhdr_alloc(void)
383feb2d49STrond Myklebust {
39fbe77c30SBenjamin Coddington 	struct nfs_pgio_header *p = kmem_cache_zalloc(nfs_rdata_cachep, GFP_KERNEL);
40fbe77c30SBenjamin Coddington 
41fbe77c30SBenjamin Coddington 	if (p)
42fbe77c30SBenjamin Coddington 		p->rw_mode = FMODE_READ;
43fbe77c30SBenjamin Coddington 	return p;
444db6e0b7SFred Isaman }
454db6e0b7SFred Isaman 
461e7f3a48SWeston Andros Adamson static void nfs_readhdr_free(struct nfs_pgio_header *rhdr)
473feb2d49STrond Myklebust {
48cd841605SFred Isaman 	kmem_cache_free(nfs_rdata_cachep, rhdr);
493feb2d49STrond Myklebust }
503feb2d49STrond Myklebust 
511da177e4SLinus Torvalds static
521da177e4SLinus Torvalds int nfs_return_empty_page(struct page *page)
531da177e4SLinus Torvalds {
5409cbfeafSKirill A. Shutemov 	zero_user(page, 0, PAGE_SIZE);
551da177e4SLinus Torvalds 	SetPageUptodate(page);
561da177e4SLinus Torvalds 	unlock_page(page);
571da177e4SLinus Torvalds 	return 0;
581da177e4SLinus Torvalds }
591da177e4SLinus Torvalds 
601abb5088SBryan Schumaker void nfs_pageio_init_read(struct nfs_pageio_descriptor *pgio,
61fab5fc25SChristoph Hellwig 			      struct inode *inode, bool force_mds,
62061ae2edSFred Isaman 			      const struct nfs_pgio_completion_ops *compl_ops)
631751c363STrond Myklebust {
64fab5fc25SChristoph Hellwig 	struct nfs_server *server = NFS_SERVER(inode);
6541d8d5b7SAnna Schumaker 	const struct nfs_pageio_ops *pg_ops = &nfs_pgio_rw_ops;
66fab5fc25SChristoph Hellwig 
67fab5fc25SChristoph Hellwig #ifdef CONFIG_NFS_V4_1
68fab5fc25SChristoph Hellwig 	if (server->pnfs_curr_ld && !force_mds)
69fab5fc25SChristoph Hellwig 		pg_ops = server->pnfs_curr_ld->pg_read_ops;
70fab5fc25SChristoph Hellwig #endif
714a0de55cSAnna Schumaker 	nfs_pageio_init(pgio, inode, pg_ops, compl_ops, &nfs_rw_read_ops,
723bde7afdSTrond Myklebust 			server->rsize, 0);
731751c363STrond Myklebust }
74ddda8e0aSBryan Schumaker EXPORT_SYMBOL_GPL(nfs_pageio_init_read);
751751c363STrond Myklebust 
76493292ddSTrond Myklebust void nfs_pageio_reset_read_mds(struct nfs_pageio_descriptor *pgio)
77493292ddSTrond Myklebust {
78a7d42ddbSWeston Andros Adamson 	struct nfs_pgio_mirror *mirror;
79a7d42ddbSWeston Andros Adamson 
806f29b9bbSKinglong Mee 	if (pgio->pg_ops && pgio->pg_ops->pg_cleanup)
816f29b9bbSKinglong Mee 		pgio->pg_ops->pg_cleanup(pgio);
826f29b9bbSKinglong Mee 
8341d8d5b7SAnna Schumaker 	pgio->pg_ops = &nfs_pgio_rw_ops;
84a7d42ddbSWeston Andros Adamson 
85a7d42ddbSWeston Andros Adamson 	/* read path should never have more than one mirror */
86a7d42ddbSWeston Andros Adamson 	WARN_ON_ONCE(pgio->pg_mirror_count != 1);
87a7d42ddbSWeston Andros Adamson 
88a7d42ddbSWeston Andros Adamson 	mirror = &pgio->pg_mirrors[0];
89a7d42ddbSWeston Andros Adamson 	mirror->pg_bsize = NFS_SERVER(pgio->pg_inode)->rsize;
90493292ddSTrond Myklebust }
911f945357STrond Myklebust EXPORT_SYMBOL_GPL(nfs_pageio_reset_read_mds);
92493292ddSTrond Myklebust 
930bcbf039SPeng Tao static void nfs_readpage_release(struct nfs_page *req)
940bcbf039SPeng Tao {
950bcbf039SPeng Tao 	struct inode *inode = d_inode(req->wb_context->dentry);
960bcbf039SPeng Tao 
970bcbf039SPeng Tao 	dprintk("NFS: read done (%s/%llu %d@%lld)\n", inode->i_sb->s_id,
980bcbf039SPeng Tao 		(unsigned long long)NFS_FILEID(inode), req->wb_bytes,
990bcbf039SPeng Tao 		(long long)req_offset(req));
1000bcbf039SPeng Tao 
1010bcbf039SPeng Tao 	if (nfs_page_group_sync_on_bit(req, PG_UNLOCKPAGE)) {
1020bcbf039SPeng Tao 		if (PageUptodate(req->wb_page))
1030bcbf039SPeng Tao 			nfs_readpage_to_fscache(inode, req->wb_page, 0);
1040bcbf039SPeng Tao 
1050bcbf039SPeng Tao 		unlock_page(req->wb_page);
1060bcbf039SPeng Tao 	}
1070bcbf039SPeng Tao 	nfs_release_request(req);
1080bcbf039SPeng Tao }
1090bcbf039SPeng Tao 
110f42b293dSDavid Howells int nfs_readpage_async(struct nfs_open_context *ctx, struct inode *inode,
1111da177e4SLinus Torvalds 		       struct page *page)
1121da177e4SLinus Torvalds {
1131da177e4SLinus Torvalds 	struct nfs_page	*new;
1141da177e4SLinus Torvalds 	unsigned int len;
115c76069bdSFred Isaman 	struct nfs_pageio_descriptor pgio;
116a7d42ddbSWeston Andros Adamson 	struct nfs_pgio_mirror *pgm;
1171da177e4SLinus Torvalds 
11849a70f27STrond Myklebust 	len = nfs_page_length(page);
1191da177e4SLinus Torvalds 	if (len == 0)
1201da177e4SLinus Torvalds 		return nfs_return_empty_page(page);
1212bfc6e56SWeston Andros Adamson 	new = nfs_create_request(ctx, page, NULL, 0, len);
1221da177e4SLinus Torvalds 	if (IS_ERR(new)) {
1231da177e4SLinus Torvalds 		unlock_page(page);
1241da177e4SLinus Torvalds 		return PTR_ERR(new);
1251da177e4SLinus Torvalds 	}
12609cbfeafSKirill A. Shutemov 	if (len < PAGE_SIZE)
12709cbfeafSKirill A. Shutemov 		zero_user_segment(page, len, PAGE_SIZE);
1281da177e4SLinus Torvalds 
129fab5fc25SChristoph Hellwig 	nfs_pageio_init_read(&pgio, inode, false,
130fab5fc25SChristoph Hellwig 			     &nfs_async_read_completion_ops);
1310bcbf039SPeng Tao 	if (!nfs_pageio_add_request(&pgio, new)) {
1320bcbf039SPeng Tao 		nfs_list_remove_request(new);
1330bcbf039SPeng Tao 		nfs_readpage_release(new);
1340bcbf039SPeng Tao 	}
1351751c363STrond Myklebust 	nfs_pageio_complete(&pgio);
136a7d42ddbSWeston Andros Adamson 
137a7d42ddbSWeston Andros Adamson 	/* It doesn't make sense to do mirrored reads! */
138a7d42ddbSWeston Andros Adamson 	WARN_ON_ONCE(pgio.pg_mirror_count != 1);
139a7d42ddbSWeston Andros Adamson 
140a7d42ddbSWeston Andros Adamson 	pgm = &pgio.pg_mirrors[0];
141a7d42ddbSWeston Andros Adamson 	NFS_I(inode)->read_io += pgm->pg_bytes_written;
142a7d42ddbSWeston Andros Adamson 
143d600ad1fSPeng Tao 	return pgio.pg_error < 0 ? pgio.pg_error : 0;
1441da177e4SLinus Torvalds }
1451da177e4SLinus Torvalds 
14667d0338eSWeston Andros Adamson static void nfs_page_group_set_uptodate(struct nfs_page *req)
14767d0338eSWeston Andros Adamson {
14867d0338eSWeston Andros Adamson 	if (nfs_page_group_sync_on_bit(req, PG_UPTODATE))
14967d0338eSWeston Andros Adamson 		SetPageUptodate(req->wb_page);
15067d0338eSWeston Andros Adamson }
15167d0338eSWeston Andros Adamson 
152061ae2edSFred Isaman static void nfs_read_completion(struct nfs_pgio_header *hdr)
1534db6e0b7SFred Isaman {
1544db6e0b7SFred Isaman 	unsigned long bytes = 0;
1554db6e0b7SFred Isaman 
1564db6e0b7SFred Isaman 	if (test_bit(NFS_IOHDR_REDO, &hdr->flags))
1574db6e0b7SFred Isaman 		goto out;
1584db6e0b7SFred Isaman 	while (!list_empty(&hdr->pages)) {
1594db6e0b7SFred Isaman 		struct nfs_page *req = nfs_list_entry(hdr->pages.next);
1604db6e0b7SFred Isaman 		struct page *page = req->wb_page;
16168072992SWeston Andros Adamson 		unsigned long start = req->wb_pgbase;
16268072992SWeston Andros Adamson 		unsigned long end = req->wb_pgbase + req->wb_bytes;
1634db6e0b7SFred Isaman 
1644db6e0b7SFred Isaman 		if (test_bit(NFS_IOHDR_EOF, &hdr->flags)) {
16568072992SWeston Andros Adamson 			/* note: regions of the page not covered by a
16668072992SWeston Andros Adamson 			 * request are zeroed in nfs_readpage_async /
16768072992SWeston Andros Adamson 			 * readpage_async_filler */
16868072992SWeston Andros Adamson 			if (bytes > hdr->good_bytes) {
16968072992SWeston Andros Adamson 				/* nothing in this request was good, so zero
17068072992SWeston Andros Adamson 				 * the full extent of the request */
17168072992SWeston Andros Adamson 				zero_user_segment(page, start, end);
17268072992SWeston Andros Adamson 
17368072992SWeston Andros Adamson 			} else if (hdr->good_bytes - bytes < req->wb_bytes) {
17468072992SWeston Andros Adamson 				/* part of this request has good bytes, but
17568072992SWeston Andros Adamson 				 * not all. zero the bad bytes */
17668072992SWeston Andros Adamson 				start += hdr->good_bytes - bytes;
17768072992SWeston Andros Adamson 				WARN_ON(start < req->wb_pgbase);
17868072992SWeston Andros Adamson 				zero_user_segment(page, start, end);
17968072992SWeston Andros Adamson 			}
1804db6e0b7SFred Isaman 		}
1814bd8b010STrond Myklebust 		bytes += req->wb_bytes;
1824bd8b010STrond Myklebust 		if (test_bit(NFS_IOHDR_ERROR, &hdr->flags)) {
1834bd8b010STrond Myklebust 			if (bytes <= hdr->good_bytes)
18467d0338eSWeston Andros Adamson 				nfs_page_group_set_uptodate(req);
1854bd8b010STrond Myklebust 		} else
18667d0338eSWeston Andros Adamson 			nfs_page_group_set_uptodate(req);
1874db6e0b7SFred Isaman 		nfs_list_remove_request(req);
1884db6e0b7SFred Isaman 		nfs_readpage_release(req);
1894db6e0b7SFred Isaman 	}
1904db6e0b7SFred Isaman out:
1914db6e0b7SFred Isaman 	hdr->release(hdr);
1924db6e0b7SFred Isaman }
1934db6e0b7SFred Isaman 
194d45f60c6SWeston Andros Adamson static void nfs_initiate_read(struct nfs_pgio_header *hdr,
195d45f60c6SWeston Andros Adamson 			      struct rpc_message *msg,
196abde71f4STom Haynes 			      const struct nfs_rpc_ops *rpc_ops,
1971ed26f33SAnna Schumaker 			      struct rpc_task_setup *task_setup_data, int how)
19864419a9bSAndy Adamson {
199d45f60c6SWeston Andros Adamson 	struct inode *inode = hdr->inode;
20064419a9bSAndy Adamson 	int swap_flags = IS_SWAPFILE(inode) ? NFS_RPC_SWAPFLAGS : 0;
20164419a9bSAndy Adamson 
2021ed26f33SAnna Schumaker 	task_setup_data->flags |= swap_flags;
203abde71f4STom Haynes 	rpc_ops->read_setup(hdr, msg);
2048224b273SChuck Lever 	trace_nfs_initiate_read(inode, hdr->io_start, hdr->good_bytes);
20564419a9bSAndy Adamson }
20664419a9bSAndy Adamson 
207061ae2edSFred Isaman static void
208*df3accb8STrond Myklebust nfs_async_read_error(struct list_head *head, int error)
2091da177e4SLinus Torvalds {
2101da177e4SLinus Torvalds 	struct nfs_page	*req;
2111da177e4SLinus Torvalds 
2121da177e4SLinus Torvalds 	while (!list_empty(head)) {
2131da177e4SLinus Torvalds 		req = nfs_list_entry(head->next);
2141da177e4SLinus Torvalds 		nfs_list_remove_request(req);
2151da177e4SLinus Torvalds 		nfs_readpage_release(req);
2161da177e4SLinus Torvalds 	}
2171da177e4SLinus Torvalds }
2181da177e4SLinus Torvalds 
219061ae2edSFred Isaman static const struct nfs_pgio_completion_ops nfs_async_read_completion_ops = {
220061ae2edSFred Isaman 	.error_cleanup = nfs_async_read_error,
221061ae2edSFred Isaman 	.completion = nfs_read_completion,
222061ae2edSFred Isaman };
223061ae2edSFred Isaman 
2241da177e4SLinus Torvalds /*
2250b671301STrond Myklebust  * This is the callback from RPC telling us whether a reply was
2260b671301STrond Myklebust  * received or some error occurred (timeout or socket shutdown).
2270b671301STrond Myklebust  */
228d45f60c6SWeston Andros Adamson static int nfs_readpage_done(struct rpc_task *task,
229d45f60c6SWeston Andros Adamson 			     struct nfs_pgio_header *hdr,
2300eecb214SAnna Schumaker 			     struct inode *inode)
2310b671301STrond Myklebust {
232d45f60c6SWeston Andros Adamson 	int status = NFS_PROTO(inode)->read_done(task, hdr);
2330b671301STrond Myklebust 	if (status != 0)
2340b671301STrond Myklebust 		return status;
2350b671301STrond Myklebust 
236d45f60c6SWeston Andros Adamson 	nfs_add_stats(inode, NFSIOS_SERVERREADBYTES, hdr->res.count);
2378224b273SChuck Lever 	trace_nfs_readpage_done(inode, task->tk_status,
2388224b273SChuck Lever 				hdr->args.offset, hdr->res.eof);
2390b671301STrond Myklebust 
2400b671301STrond Myklebust 	if (task->tk_status == -ESTALE) {
241cd841605SFred Isaman 		set_bit(NFS_INO_STALE, &NFS_I(inode)->flags);
242cd841605SFred Isaman 		nfs_mark_for_revalidate(inode);
2430b671301STrond Myklebust 	}
2440b671301STrond Myklebust 	return 0;
2450b671301STrond Myklebust }
2460b671301STrond Myklebust 
247d45f60c6SWeston Andros Adamson static void nfs_readpage_retry(struct rpc_task *task,
248d45f60c6SWeston Andros Adamson 			       struct nfs_pgio_header *hdr)
2490b671301STrond Myklebust {
250d45f60c6SWeston Andros Adamson 	struct nfs_pgio_args *argp = &hdr->args;
251d45f60c6SWeston Andros Adamson 	struct nfs_pgio_res  *resp = &hdr->res;
2520b671301STrond Myklebust 
2530b671301STrond Myklebust 	/* This is a short read! */
254d45f60c6SWeston Andros Adamson 	nfs_inc_stats(hdr->inode, NFSIOS_SHORTREAD);
2550b671301STrond Myklebust 	/* Has the server at least made some progress? */
2564db6e0b7SFred Isaman 	if (resp->count == 0) {
257d45f60c6SWeston Andros Adamson 		nfs_set_pgio_error(hdr, -EIO, argp->offset);
258d61e612aSTrond Myklebust 		return;
2594db6e0b7SFred Isaman 	}
260f8417b48SKinglong Mee 
261f8417b48SKinglong Mee 	/* For non rpc-based layout drivers, retry-through-MDS */
262f8417b48SKinglong Mee 	if (!task->tk_ops) {
263f8417b48SKinglong Mee 		hdr->pnfs_error = -EAGAIN;
264f8417b48SKinglong Mee 		return;
265f8417b48SKinglong Mee 	}
266f8417b48SKinglong Mee 
267d45f60c6SWeston Andros Adamson 	/* Yes, so retry the read at the end of the hdr */
268d45f60c6SWeston Andros Adamson 	hdr->mds_offset += resp->count;
2690b671301STrond Myklebust 	argp->offset += resp->count;
2700b671301STrond Myklebust 	argp->pgbase += resp->count;
2710b671301STrond Myklebust 	argp->count -= resp->count;
272d00c5d43STrond Myklebust 	rpc_restart_call_prepare(task);
2730b671301STrond Myklebust }
2740b671301STrond Myklebust 
275d45f60c6SWeston Andros Adamson static void nfs_readpage_result(struct rpc_task *task,
276d45f60c6SWeston Andros Adamson 				struct nfs_pgio_header *hdr)
2771da177e4SLinus Torvalds {
278d45f60c6SWeston Andros Adamson 	if (hdr->res.eof) {
2791c6c4b74STrond Myklebust 		loff_t pos = hdr->args.offset + hdr->res.count;
2801c6c4b74STrond Myklebust 		unsigned int new = pos - hdr->io_start;
281fdd1e74cSTrond Myklebust 
2821c6c4b74STrond Myklebust 		if (hdr->good_bytes > new) {
2831c6c4b74STrond Myklebust 			hdr->good_bytes = new;
2844db6e0b7SFred Isaman 			set_bit(NFS_IOHDR_EOF, &hdr->flags);
2854db6e0b7SFred Isaman 			clear_bit(NFS_IOHDR_ERROR, &hdr->flags);
2864db6e0b7SFred Isaman 		}
287f8417b48SKinglong Mee 	} else if (hdr->res.count < hdr->args.count)
288d45f60c6SWeston Andros Adamson 		nfs_readpage_retry(task, hdr);
2890b671301STrond Myklebust }
290fdd1e74cSTrond Myklebust 
2911da177e4SLinus Torvalds /*
2921da177e4SLinus Torvalds  * Read a page over NFS.
2931da177e4SLinus Torvalds  * We read the page synchronously in the following case:
2941da177e4SLinus Torvalds  *  -	The error flag is set for this page. This happens only when a
2951da177e4SLinus Torvalds  *	previous async read operation failed.
2961da177e4SLinus Torvalds  */
2971da177e4SLinus Torvalds int nfs_readpage(struct file *file, struct page *page)
2981da177e4SLinus Torvalds {
2991da177e4SLinus Torvalds 	struct nfs_open_context *ctx;
300d56b4ddfSMel Gorman 	struct inode *inode = page_file_mapping(page)->host;
3011da177e4SLinus Torvalds 	int		error;
3021da177e4SLinus Torvalds 
3031da177e4SLinus Torvalds 	dprintk("NFS: nfs_readpage (%p %ld@%lu)\n",
3048cd79788SHuang Ying 		page, PAGE_SIZE, page_index(page));
30591d5b470SChuck Lever 	nfs_inc_stats(inode, NFSIOS_VFSREADPAGE);
3063708f842SNicolas Iooss 	nfs_add_stats(inode, NFSIOS_READPAGES, 1);
30791d5b470SChuck Lever 
3081da177e4SLinus Torvalds 	/*
3091da177e4SLinus Torvalds 	 * Try to flush any pending writes to the file..
3101da177e4SLinus Torvalds 	 *
3111da177e4SLinus Torvalds 	 * NOTE! Because we own the page lock, there cannot
3121da177e4SLinus Torvalds 	 * be any new pending writes generated at this point
3131da177e4SLinus Torvalds 	 * for this page (other pages can be written to).
3141da177e4SLinus Torvalds 	 */
3151da177e4SLinus Torvalds 	error = nfs_wb_page(inode, page);
3161da177e4SLinus Torvalds 	if (error)
317de05a0ccSTrond Myklebust 		goto out_unlock;
318de05a0ccSTrond Myklebust 	if (PageUptodate(page))
319de05a0ccSTrond Myklebust 		goto out_unlock;
3201da177e4SLinus Torvalds 
3215f004cf2STrond Myklebust 	error = -ESTALE;
3225f004cf2STrond Myklebust 	if (NFS_STALE(inode))
323de05a0ccSTrond Myklebust 		goto out_unlock;
3245f004cf2STrond Myklebust 
3251da177e4SLinus Torvalds 	if (file == NULL) {
326cf1308ffSTrond Myklebust 		error = -EBADF;
327d530838bSTrond Myklebust 		ctx = nfs_find_open_context(inode, NULL, FMODE_READ);
3281da177e4SLinus Torvalds 		if (ctx == NULL)
329de05a0ccSTrond Myklebust 			goto out_unlock;
3301da177e4SLinus Torvalds 	} else
331cd3758e3STrond Myklebust 		ctx = get_nfs_open_context(nfs_file_open_context(file));
3321da177e4SLinus Torvalds 
3339a9fc1c0SDavid Howells 	if (!IS_SYNC(inode)) {
3349a9fc1c0SDavid Howells 		error = nfs_readpage_from_fscache(ctx, inode, page);
3359a9fc1c0SDavid Howells 		if (error == 0)
3369a9fc1c0SDavid Howells 			goto out;
3379a9fc1c0SDavid Howells 	}
3389a9fc1c0SDavid Howells 
3398e0969f0STrond Myklebust 	error = nfs_readpage_async(ctx, inode, page);
3408e0969f0STrond Myklebust 
3419a9fc1c0SDavid Howells out:
3421da177e4SLinus Torvalds 	put_nfs_open_context(ctx);
3431da177e4SLinus Torvalds 	return error;
344de05a0ccSTrond Myklebust out_unlock:
3451da177e4SLinus Torvalds 	unlock_page(page);
3461da177e4SLinus Torvalds 	return error;
3471da177e4SLinus Torvalds }
3481da177e4SLinus Torvalds 
/* State passed to readpage_async_filler() through its opaque data pointer. */
struct nfs_readdesc {
	struct nfs_pageio_descriptor *pgio;	/* descriptor requests are added to */
	struct nfs_open_context *ctx;		/* open context used for new requests */
};
3531da177e4SLinus Torvalds 
3541da177e4SLinus Torvalds static int
3551da177e4SLinus Torvalds readpage_async_filler(void *data, struct page *page)
3561da177e4SLinus Torvalds {
3571da177e4SLinus Torvalds 	struct nfs_readdesc *desc = (struct nfs_readdesc *)data;
3581da177e4SLinus Torvalds 	struct nfs_page *new;
3591da177e4SLinus Torvalds 	unsigned int len;
360de05a0ccSTrond Myklebust 	int error;
3611da177e4SLinus Torvalds 
36249a70f27STrond Myklebust 	len = nfs_page_length(page);
3631da177e4SLinus Torvalds 	if (len == 0)
3641da177e4SLinus Torvalds 		return nfs_return_empty_page(page);
365de05a0ccSTrond Myklebust 
3662bfc6e56SWeston Andros Adamson 	new = nfs_create_request(desc->ctx, page, NULL, 0, len);
367de05a0ccSTrond Myklebust 	if (IS_ERR(new))
368de05a0ccSTrond Myklebust 		goto out_error;
369de05a0ccSTrond Myklebust 
37009cbfeafSKirill A. Shutemov 	if (len < PAGE_SIZE)
37109cbfeafSKirill A. Shutemov 		zero_user_segment(page, len, PAGE_SIZE);
372f8512ad0SFred Isaman 	if (!nfs_pageio_add_request(desc->pgio, new)) {
3730bcbf039SPeng Tao 		nfs_list_remove_request(new);
3740bcbf039SPeng Tao 		nfs_readpage_release(new);
375f8512ad0SFred Isaman 		error = desc->pgio->pg_error;
376cbebaf89STrond Myklebust 		goto out;
377f8512ad0SFred Isaman 	}
3781da177e4SLinus Torvalds 	return 0;
379de05a0ccSTrond Myklebust out_error:
380de05a0ccSTrond Myklebust 	error = PTR_ERR(new);
381de05a0ccSTrond Myklebust 	unlock_page(page);
382cbebaf89STrond Myklebust out:
383de05a0ccSTrond Myklebust 	return error;
3841da177e4SLinus Torvalds }
3851da177e4SLinus Torvalds 
3861da177e4SLinus Torvalds int nfs_readpages(struct file *filp, struct address_space *mapping,
3871da177e4SLinus Torvalds 		struct list_head *pages, unsigned nr_pages)
3881da177e4SLinus Torvalds {
3898b09bee3STrond Myklebust 	struct nfs_pageio_descriptor pgio;
390a7d42ddbSWeston Andros Adamson 	struct nfs_pgio_mirror *pgm;
3911da177e4SLinus Torvalds 	struct nfs_readdesc desc = {
3928b09bee3STrond Myklebust 		.pgio = &pgio,
3931da177e4SLinus Torvalds 	};
3941da177e4SLinus Torvalds 	struct inode *inode = mapping->host;
3958b09bee3STrond Myklebust 	unsigned long npages;
3965f004cf2STrond Myklebust 	int ret = -ESTALE;
3971da177e4SLinus Torvalds 
3981e8968c5SNiels de Vos 	dprintk("NFS: nfs_readpages (%s/%Lu %d)\n",
3991da177e4SLinus Torvalds 			inode->i_sb->s_id,
4001e8968c5SNiels de Vos 			(unsigned long long)NFS_FILEID(inode),
4011da177e4SLinus Torvalds 			nr_pages);
40291d5b470SChuck Lever 	nfs_inc_stats(inode, NFSIOS_VFSREADPAGES);
4031da177e4SLinus Torvalds 
4045f004cf2STrond Myklebust 	if (NFS_STALE(inode))
4055f004cf2STrond Myklebust 		goto out;
4065f004cf2STrond Myklebust 
4071da177e4SLinus Torvalds 	if (filp == NULL) {
408d530838bSTrond Myklebust 		desc.ctx = nfs_find_open_context(inode, NULL, FMODE_READ);
4091da177e4SLinus Torvalds 		if (desc.ctx == NULL)
4101da177e4SLinus Torvalds 			return -EBADF;
4111da177e4SLinus Torvalds 	} else
412cd3758e3STrond Myklebust 		desc.ctx = get_nfs_open_context(nfs_file_open_context(filp));
4139a9fc1c0SDavid Howells 
4149a9fc1c0SDavid Howells 	/* attempt to read as many of the pages as possible from the cache
4159a9fc1c0SDavid Howells 	 * - this returns -ENOBUFS immediately if the cookie is negative
4169a9fc1c0SDavid Howells 	 */
4179a9fc1c0SDavid Howells 	ret = nfs_readpages_from_fscache(desc.ctx, inode, mapping,
4189a9fc1c0SDavid Howells 					 pages, &nr_pages);
4199a9fc1c0SDavid Howells 	if (ret == 0)
4209a9fc1c0SDavid Howells 		goto read_complete; /* all pages were read */
4219a9fc1c0SDavid Howells 
422fab5fc25SChristoph Hellwig 	nfs_pageio_init_read(&pgio, inode, false,
423fab5fc25SChristoph Hellwig 			     &nfs_async_read_completion_ops);
4248b09bee3STrond Myklebust 
4251da177e4SLinus Torvalds 	ret = read_cache_pages(mapping, pages, readpage_async_filler, &desc);
4268b09bee3STrond Myklebust 	nfs_pageio_complete(&pgio);
427a7d42ddbSWeston Andros Adamson 
428a7d42ddbSWeston Andros Adamson 	/* It doesn't make sense to do mirrored reads! */
429a7d42ddbSWeston Andros Adamson 	WARN_ON_ONCE(pgio.pg_mirror_count != 1);
430a7d42ddbSWeston Andros Adamson 
431a7d42ddbSWeston Andros Adamson 	pgm = &pgio.pg_mirrors[0];
432a7d42ddbSWeston Andros Adamson 	NFS_I(inode)->read_io += pgm->pg_bytes_written;
43309cbfeafSKirill A. Shutemov 	npages = (pgm->pg_bytes_written + PAGE_SIZE - 1) >>
43409cbfeafSKirill A. Shutemov 		 PAGE_SHIFT;
4358b09bee3STrond Myklebust 	nfs_add_stats(inode, NFSIOS_READPAGES, npages);
4369a9fc1c0SDavid Howells read_complete:
4371da177e4SLinus Torvalds 	put_nfs_open_context(desc.ctx);
4385f004cf2STrond Myklebust out:
4391da177e4SLinus Torvalds 	return ret;
4401da177e4SLinus Torvalds }
4411da177e4SLinus Torvalds 
442f7b422b1SDavid Howells int __init nfs_init_readpagecache(void)
4431da177e4SLinus Torvalds {
4441da177e4SLinus Torvalds 	nfs_rdata_cachep = kmem_cache_create("nfs_read_data",
4451e7f3a48SWeston Andros Adamson 					     sizeof(struct nfs_pgio_header),
4461da177e4SLinus Torvalds 					     0, SLAB_HWCACHE_ALIGN,
44720c2df83SPaul Mundt 					     NULL);
4481da177e4SLinus Torvalds 	if (nfs_rdata_cachep == NULL)
4491da177e4SLinus Torvalds 		return -ENOMEM;
4501da177e4SLinus Torvalds 
4511da177e4SLinus Torvalds 	return 0;
4521da177e4SLinus Torvalds }
4531da177e4SLinus Torvalds 
454266bee88SDavid Brownell void nfs_destroy_readpagecache(void)
4551da177e4SLinus Torvalds {
4561a1d92c1SAlexey Dobriyan 	kmem_cache_destroy(nfs_rdata_cachep);
4571da177e4SLinus Torvalds }
4584a0de55cSAnna Schumaker 
4594a0de55cSAnna Schumaker static const struct nfs_rw_ops nfs_rw_read_ops = {
4604a0de55cSAnna Schumaker 	.rw_alloc_header	= nfs_readhdr_alloc,
4614a0de55cSAnna Schumaker 	.rw_free_header		= nfs_readhdr_free,
4620eecb214SAnna Schumaker 	.rw_done		= nfs_readpage_done,
4630eecb214SAnna Schumaker 	.rw_result		= nfs_readpage_result,
4641ed26f33SAnna Schumaker 	.rw_initiate		= nfs_initiate_read,
4654a0de55cSAnna Schumaker };
466