xref: /openbmc/linux/fs/nfs/read.c (revision 9c88ea00fef03031ce6554531e89be82f6a42835)
1457c8996SThomas Gleixner // SPDX-License-Identifier: GPL-2.0-only
21da177e4SLinus Torvalds /*
31da177e4SLinus Torvalds  * linux/fs/nfs/read.c
41da177e4SLinus Torvalds  *
51da177e4SLinus Torvalds  * Block I/O for NFS
61da177e4SLinus Torvalds  *
71da177e4SLinus Torvalds  * Partial copy of Linus' read cache modifications to fs/nfs/file.c
81da177e4SLinus Torvalds  * modified for async RPC by okir@monad.swb.de
91da177e4SLinus Torvalds  */
101da177e4SLinus Torvalds 
111da177e4SLinus Torvalds #include <linux/time.h>
121da177e4SLinus Torvalds #include <linux/kernel.h>
131da177e4SLinus Torvalds #include <linux/errno.h>
141da177e4SLinus Torvalds #include <linux/fcntl.h>
151da177e4SLinus Torvalds #include <linux/stat.h>
161da177e4SLinus Torvalds #include <linux/mm.h>
171da177e4SLinus Torvalds #include <linux/slab.h>
18*9c88ea00SDave Wysochanski #include <linux/task_io_accounting_ops.h>
191da177e4SLinus Torvalds #include <linux/pagemap.h>
201da177e4SLinus Torvalds #include <linux/sunrpc/clnt.h>
211da177e4SLinus Torvalds #include <linux/nfs_fs.h>
221da177e4SLinus Torvalds #include <linux/nfs_page.h>
2364419a9bSAndy Adamson #include <linux/module.h>
241da177e4SLinus Torvalds 
25f11c88afSAndy Adamson #include "nfs4_fs.h"
2649a70f27STrond Myklebust #include "internal.h"
2791d5b470SChuck Lever #include "iostat.h"
289a9fc1c0SDavid Howells #include "fscache.h"
29fab5fc25SChristoph Hellwig #include "pnfs.h"
308224b273SChuck Lever #include "nfstrace.h"
3191d5b470SChuck Lever 
321da177e4SLinus Torvalds #define NFSDBG_FACILITY		NFSDBG_PAGECACHE
331da177e4SLinus Torvalds 
34061ae2edSFred Isaman static const struct nfs_pgio_completion_ops nfs_async_read_completion_ops;
354a0de55cSAnna Schumaker static const struct nfs_rw_ops nfs_rw_read_ops;
361da177e4SLinus Torvalds 
37e18b890bSChristoph Lameter static struct kmem_cache *nfs_rdata_cachep;
381da177e4SLinus Torvalds 
391e7f3a48SWeston Andros Adamson static struct nfs_pgio_header *nfs_readhdr_alloc(void)
403feb2d49STrond Myklebust {
41fbe77c30SBenjamin Coddington 	struct nfs_pgio_header *p = kmem_cache_zalloc(nfs_rdata_cachep, GFP_KERNEL);
42fbe77c30SBenjamin Coddington 
43fbe77c30SBenjamin Coddington 	if (p)
44fbe77c30SBenjamin Coddington 		p->rw_mode = FMODE_READ;
45fbe77c30SBenjamin Coddington 	return p;
464db6e0b7SFred Isaman }
474db6e0b7SFred Isaman 
481e7f3a48SWeston Andros Adamson static void nfs_readhdr_free(struct nfs_pgio_header *rhdr)
493feb2d49STrond Myklebust {
50cd841605SFred Isaman 	kmem_cache_free(nfs_rdata_cachep, rhdr);
513feb2d49STrond Myklebust }
523feb2d49STrond Myklebust 
53ab75bff1STrond Myklebust static int nfs_return_empty_folio(struct folio *folio)
541da177e4SLinus Torvalds {
55ab75bff1STrond Myklebust 	folio_zero_segment(folio, 0, folio_size(folio));
56ab75bff1STrond Myklebust 	folio_mark_uptodate(folio);
57ab75bff1STrond Myklebust 	folio_unlock(folio);
581da177e4SLinus Torvalds 	return 0;
591da177e4SLinus Torvalds }
601da177e4SLinus Torvalds 
611abb5088SBryan Schumaker void nfs_pageio_init_read(struct nfs_pageio_descriptor *pgio,
62fab5fc25SChristoph Hellwig 			      struct inode *inode, bool force_mds,
63061ae2edSFred Isaman 			      const struct nfs_pgio_completion_ops *compl_ops)
641751c363STrond Myklebust {
65fab5fc25SChristoph Hellwig 	struct nfs_server *server = NFS_SERVER(inode);
6641d8d5b7SAnna Schumaker 	const struct nfs_pageio_ops *pg_ops = &nfs_pgio_rw_ops;
67fab5fc25SChristoph Hellwig 
68fab5fc25SChristoph Hellwig #ifdef CONFIG_NFS_V4_1
69fab5fc25SChristoph Hellwig 	if (server->pnfs_curr_ld && !force_mds)
70fab5fc25SChristoph Hellwig 		pg_ops = server->pnfs_curr_ld->pg_read_ops;
71fab5fc25SChristoph Hellwig #endif
724a0de55cSAnna Schumaker 	nfs_pageio_init(pgio, inode, pg_ops, compl_ops, &nfs_rw_read_ops,
733bde7afdSTrond Myklebust 			server->rsize, 0);
741751c363STrond Myklebust }
75ddda8e0aSBryan Schumaker EXPORT_SYMBOL_GPL(nfs_pageio_init_read);
761751c363STrond Myklebust 
77b42ad64fSDave Wysochanski static void nfs_pageio_complete_read(struct nfs_pageio_descriptor *pgio)
781e83b173SDave Wysochanski {
791e83b173SDave Wysochanski 	struct nfs_pgio_mirror *pgm;
801e83b173SDave Wysochanski 	unsigned long npages;
811e83b173SDave Wysochanski 
821e83b173SDave Wysochanski 	nfs_pageio_complete(pgio);
831e83b173SDave Wysochanski 
841e83b173SDave Wysochanski 	/* It doesn't make sense to do mirrored reads! */
851e83b173SDave Wysochanski 	WARN_ON_ONCE(pgio->pg_mirror_count != 1);
861e83b173SDave Wysochanski 
871e83b173SDave Wysochanski 	pgm = &pgio->pg_mirrors[0];
88b42ad64fSDave Wysochanski 	NFS_I(pgio->pg_inode)->read_io += pgm->pg_bytes_written;
891e83b173SDave Wysochanski 	npages = (pgm->pg_bytes_written + PAGE_SIZE - 1) >> PAGE_SHIFT;
90b42ad64fSDave Wysochanski 	nfs_add_stats(pgio->pg_inode, NFSIOS_READPAGES, npages);
911e83b173SDave Wysochanski }
921e83b173SDave Wysochanski 
931e83b173SDave Wysochanski 
94493292ddSTrond Myklebust void nfs_pageio_reset_read_mds(struct nfs_pageio_descriptor *pgio)
95493292ddSTrond Myklebust {
96a7d42ddbSWeston Andros Adamson 	struct nfs_pgio_mirror *mirror;
97a7d42ddbSWeston Andros Adamson 
986f29b9bbSKinglong Mee 	if (pgio->pg_ops && pgio->pg_ops->pg_cleanup)
996f29b9bbSKinglong Mee 		pgio->pg_ops->pg_cleanup(pgio);
1006f29b9bbSKinglong Mee 
10141d8d5b7SAnna Schumaker 	pgio->pg_ops = &nfs_pgio_rw_ops;
102a7d42ddbSWeston Andros Adamson 
103a7d42ddbSWeston Andros Adamson 	/* read path should never have more than one mirror */
104a7d42ddbSWeston Andros Adamson 	WARN_ON_ONCE(pgio->pg_mirror_count != 1);
105a7d42ddbSWeston Andros Adamson 
106a7d42ddbSWeston Andros Adamson 	mirror = &pgio->pg_mirrors[0];
107a7d42ddbSWeston Andros Adamson 	mirror->pg_bsize = NFS_SERVER(pgio->pg_inode)->rsize;
108493292ddSTrond Myklebust }
1091f945357STrond Myklebust EXPORT_SYMBOL_GPL(nfs_pageio_reset_read_mds);
110493292ddSTrond Myklebust 
1118f54c7a4STrond Myklebust static void nfs_readpage_release(struct nfs_page *req, int error)
1120bcbf039SPeng Tao {
1139fcd5960STrond Myklebust 	struct inode *inode = d_inode(nfs_req_openctx(req)->dentry);
114ab75bff1STrond Myklebust 	struct folio *folio = nfs_page_to_folio(req);
1150bcbf039SPeng Tao 
1160bcbf039SPeng Tao 	dprintk("NFS: read done (%s/%llu %d@%lld)\n", inode->i_sb->s_id,
1170bcbf039SPeng Tao 		(unsigned long long)NFS_FILEID(inode), req->wb_bytes,
1180bcbf039SPeng Tao 		(long long)req_offset(req));
1190bcbf039SPeng Tao 
1208f54c7a4STrond Myklebust 	if (nfs_error_is_fatal_on_server(error) && error != -ETIMEDOUT)
121ab75bff1STrond Myklebust 		folio_set_error(folio);
1220bcbf039SPeng Tao 	if (nfs_page_group_sync_on_bit(req, PG_UNLOCKPAGE)) {
123ab75bff1STrond Myklebust 		if (folio_test_uptodate(folio))
124ab75bff1STrond Myklebust 			nfs_fscache_write_page(inode, &folio->page);
125ab75bff1STrond Myklebust 		folio_unlock(folio);
1260bcbf039SPeng Tao 	}
1270bcbf039SPeng Tao 	nfs_release_request(req);
1280bcbf039SPeng Tao }
1290bcbf039SPeng Tao 
1301af7e7f8SDave Wysochanski struct nfs_readdesc {
1311af7e7f8SDave Wysochanski 	struct nfs_pageio_descriptor pgio;
1321af7e7f8SDave Wysochanski 	struct nfs_open_context *ctx;
1331af7e7f8SDave Wysochanski };
1341af7e7f8SDave Wysochanski 
13567d0338eSWeston Andros Adamson static void nfs_page_group_set_uptodate(struct nfs_page *req)
13667d0338eSWeston Andros Adamson {
13767d0338eSWeston Andros Adamson 	if (nfs_page_group_sync_on_bit(req, PG_UPTODATE))
138ab75bff1STrond Myklebust 		folio_mark_uptodate(nfs_page_to_folio(req));
13967d0338eSWeston Andros Adamson }
14067d0338eSWeston Andros Adamson 
141061ae2edSFred Isaman static void nfs_read_completion(struct nfs_pgio_header *hdr)
1424db6e0b7SFred Isaman {
1434db6e0b7SFred Isaman 	unsigned long bytes = 0;
1448f54c7a4STrond Myklebust 	int error;
1454db6e0b7SFred Isaman 
1464db6e0b7SFred Isaman 	if (test_bit(NFS_IOHDR_REDO, &hdr->flags))
1474db6e0b7SFred Isaman 		goto out;
1484db6e0b7SFred Isaman 	while (!list_empty(&hdr->pages)) {
1494db6e0b7SFred Isaman 		struct nfs_page *req = nfs_list_entry(hdr->pages.next);
150ab75bff1STrond Myklebust 		struct folio *folio = nfs_page_to_folio(req);
15168072992SWeston Andros Adamson 		unsigned long start = req->wb_pgbase;
15268072992SWeston Andros Adamson 		unsigned long end = req->wb_pgbase + req->wb_bytes;
1534db6e0b7SFred Isaman 
1544db6e0b7SFred Isaman 		if (test_bit(NFS_IOHDR_EOF, &hdr->flags)) {
15568072992SWeston Andros Adamson 			/* note: regions of the page not covered by a
1561e83b173SDave Wysochanski 			 * request are zeroed in readpage_async_filler */
15768072992SWeston Andros Adamson 			if (bytes > hdr->good_bytes) {
15868072992SWeston Andros Adamson 				/* nothing in this request was good, so zero
15968072992SWeston Andros Adamson 				 * the full extent of the request */
160ab75bff1STrond Myklebust 				folio_zero_segment(folio, start, end);
16168072992SWeston Andros Adamson 
16268072992SWeston Andros Adamson 			} else if (hdr->good_bytes - bytes < req->wb_bytes) {
16368072992SWeston Andros Adamson 				/* part of this request has good bytes, but
16468072992SWeston Andros Adamson 				 * not all. zero the bad bytes */
16568072992SWeston Andros Adamson 				start += hdr->good_bytes - bytes;
16668072992SWeston Andros Adamson 				WARN_ON(start < req->wb_pgbase);
167ab75bff1STrond Myklebust 				folio_zero_segment(folio, start, end);
16868072992SWeston Andros Adamson 			}
1694db6e0b7SFred Isaman 		}
1708f54c7a4STrond Myklebust 		error = 0;
1714bd8b010STrond Myklebust 		bytes += req->wb_bytes;
1724bd8b010STrond Myklebust 		if (test_bit(NFS_IOHDR_ERROR, &hdr->flags)) {
1734bd8b010STrond Myklebust 			if (bytes <= hdr->good_bytes)
17467d0338eSWeston Andros Adamson 				nfs_page_group_set_uptodate(req);
1758f54c7a4STrond Myklebust 			else {
1768f54c7a4STrond Myklebust 				error = hdr->error;
1778f54c7a4STrond Myklebust 				xchg(&nfs_req_openctx(req)->error, error);
1788f54c7a4STrond Myklebust 			}
1794bd8b010STrond Myklebust 		} else
18067d0338eSWeston Andros Adamson 			nfs_page_group_set_uptodate(req);
1814db6e0b7SFred Isaman 		nfs_list_remove_request(req);
1828f54c7a4STrond Myklebust 		nfs_readpage_release(req, error);
1834db6e0b7SFred Isaman 	}
1844db6e0b7SFred Isaman out:
1854db6e0b7SFred Isaman 	hdr->release(hdr);
1864db6e0b7SFred Isaman }
1874db6e0b7SFred Isaman 
188d45f60c6SWeston Andros Adamson static void nfs_initiate_read(struct nfs_pgio_header *hdr,
189d45f60c6SWeston Andros Adamson 			      struct rpc_message *msg,
190abde71f4STom Haynes 			      const struct nfs_rpc_ops *rpc_ops,
1911ed26f33SAnna Schumaker 			      struct rpc_task_setup *task_setup_data, int how)
19264419a9bSAndy Adamson {
193abde71f4STom Haynes 	rpc_ops->read_setup(hdr, msg);
1942343172dSTrond Myklebust 	trace_nfs_initiate_read(hdr);
19564419a9bSAndy Adamson }
19664419a9bSAndy Adamson 
197061ae2edSFred Isaman static void
198df3accb8STrond Myklebust nfs_async_read_error(struct list_head *head, int error)
1991da177e4SLinus Torvalds {
2001da177e4SLinus Torvalds 	struct nfs_page	*req;
2011da177e4SLinus Torvalds 
2021da177e4SLinus Torvalds 	while (!list_empty(head)) {
2031da177e4SLinus Torvalds 		req = nfs_list_entry(head->next);
2041da177e4SLinus Torvalds 		nfs_list_remove_request(req);
2058f54c7a4STrond Myklebust 		nfs_readpage_release(req, error);
2061da177e4SLinus Torvalds 	}
2071da177e4SLinus Torvalds }
2081da177e4SLinus Torvalds 
209061ae2edSFred Isaman static const struct nfs_pgio_completion_ops nfs_async_read_completion_ops = {
210061ae2edSFred Isaman 	.error_cleanup = nfs_async_read_error,
211061ae2edSFred Isaman 	.completion = nfs_read_completion,
212061ae2edSFred Isaman };
213061ae2edSFred Isaman 
2141da177e4SLinus Torvalds /*
2150b671301STrond Myklebust  * This is the callback from RPC telling us whether a reply was
2160b671301STrond Myklebust  * received or some error occurred (timeout or socket shutdown).
2170b671301STrond Myklebust  */
218d45f60c6SWeston Andros Adamson static int nfs_readpage_done(struct rpc_task *task,
219d45f60c6SWeston Andros Adamson 			     struct nfs_pgio_header *hdr,
2200eecb214SAnna Schumaker 			     struct inode *inode)
2210b671301STrond Myklebust {
222d45f60c6SWeston Andros Adamson 	int status = NFS_PROTO(inode)->read_done(task, hdr);
2230b671301STrond Myklebust 	if (status != 0)
2240b671301STrond Myklebust 		return status;
2250b671301STrond Myklebust 
226d45f60c6SWeston Andros Adamson 	nfs_add_stats(inode, NFSIOS_SERVERREADBYTES, hdr->res.count);
2272343172dSTrond Myklebust 	trace_nfs_readpage_done(task, hdr);
2280b671301STrond Myklebust 
2290b671301STrond Myklebust 	if (task->tk_status == -ESTALE) {
23093ce4af7STrond Myklebust 		nfs_set_inode_stale(inode);
231cd841605SFred Isaman 		nfs_mark_for_revalidate(inode);
2320b671301STrond Myklebust 	}
2330b671301STrond Myklebust 	return 0;
2340b671301STrond Myklebust }
2350b671301STrond Myklebust 
236d45f60c6SWeston Andros Adamson static void nfs_readpage_retry(struct rpc_task *task,
237d45f60c6SWeston Andros Adamson 			       struct nfs_pgio_header *hdr)
2380b671301STrond Myklebust {
239d45f60c6SWeston Andros Adamson 	struct nfs_pgio_args *argp = &hdr->args;
240d45f60c6SWeston Andros Adamson 	struct nfs_pgio_res  *resp = &hdr->res;
2410b671301STrond Myklebust 
2420b671301STrond Myklebust 	/* This is a short read! */
243d45f60c6SWeston Andros Adamson 	nfs_inc_stats(hdr->inode, NFSIOS_SHORTREAD);
244fd2b6121SChuck Lever 	trace_nfs_readpage_short(task, hdr);
245fd2b6121SChuck Lever 
2460b671301STrond Myklebust 	/* Has the server at least made some progress? */
2474db6e0b7SFred Isaman 	if (resp->count == 0) {
248d45f60c6SWeston Andros Adamson 		nfs_set_pgio_error(hdr, -EIO, argp->offset);
249d61e612aSTrond Myklebust 		return;
2504db6e0b7SFred Isaman 	}
251f8417b48SKinglong Mee 
252f8417b48SKinglong Mee 	/* For non rpc-based layout drivers, retry-through-MDS */
253f8417b48SKinglong Mee 	if (!task->tk_ops) {
254f8417b48SKinglong Mee 		hdr->pnfs_error = -EAGAIN;
255f8417b48SKinglong Mee 		return;
256f8417b48SKinglong Mee 	}
257f8417b48SKinglong Mee 
258d45f60c6SWeston Andros Adamson 	/* Yes, so retry the read at the end of the hdr */
259d45f60c6SWeston Andros Adamson 	hdr->mds_offset += resp->count;
2600b671301STrond Myklebust 	argp->offset += resp->count;
2610b671301STrond Myklebust 	argp->pgbase += resp->count;
2620b671301STrond Myklebust 	argp->count -= resp->count;
2638c9cb714STrond Myklebust 	resp->count = 0;
2648c9cb714STrond Myklebust 	resp->eof = 0;
265d00c5d43STrond Myklebust 	rpc_restart_call_prepare(task);
2660b671301STrond Myklebust }
2670b671301STrond Myklebust 
268d45f60c6SWeston Andros Adamson static void nfs_readpage_result(struct rpc_task *task,
269d45f60c6SWeston Andros Adamson 				struct nfs_pgio_header *hdr)
2701da177e4SLinus Torvalds {
271d45f60c6SWeston Andros Adamson 	if (hdr->res.eof) {
2721c6c4b74STrond Myklebust 		loff_t pos = hdr->args.offset + hdr->res.count;
2731c6c4b74STrond Myklebust 		unsigned int new = pos - hdr->io_start;
274fdd1e74cSTrond Myklebust 
2751c6c4b74STrond Myklebust 		if (hdr->good_bytes > new) {
2761c6c4b74STrond Myklebust 			hdr->good_bytes = new;
2774db6e0b7SFred Isaman 			set_bit(NFS_IOHDR_EOF, &hdr->flags);
2784db6e0b7SFred Isaman 			clear_bit(NFS_IOHDR_ERROR, &hdr->flags);
2794db6e0b7SFred Isaman 		}
280f8417b48SKinglong Mee 	} else if (hdr->res.count < hdr->args.count)
281d45f60c6SWeston Andros Adamson 		nfs_readpage_retry(task, hdr);
2820b671301STrond Myklebust }
283fdd1e74cSTrond Myklebust 
284ab75bff1STrond Myklebust static int readpage_async_filler(struct nfs_readdesc *desc, struct folio *folio)
2851e83b173SDave Wysochanski {
286ab75bff1STrond Myklebust 	struct inode *inode = folio_file_mapping(folio)->host;
287ab75bff1STrond Myklebust 	struct nfs_server *server = NFS_SERVER(inode);
288ab75bff1STrond Myklebust 	size_t fsize = folio_size(folio);
289ab75bff1STrond Myklebust 	unsigned int rsize = server->rsize;
2901e83b173SDave Wysochanski 	struct nfs_page *new;
2918cfb9015STrond Myklebust 	unsigned int len, aligned_len;
2921e83b173SDave Wysochanski 	int error;
2931e83b173SDave Wysochanski 
294ab75bff1STrond Myklebust 	len = nfs_folio_length(folio);
2951e83b173SDave Wysochanski 	if (len == 0)
296ab75bff1STrond Myklebust 		return nfs_return_empty_folio(folio);
2971e83b173SDave Wysochanski 
298ab75bff1STrond Myklebust 	aligned_len = min_t(unsigned int, ALIGN(len, rsize), fsize);
2998cfb9015STrond Myklebust 
300ab75bff1STrond Myklebust 	if (!IS_SYNC(inode)) {
301ab75bff1STrond Myklebust 		error = nfs_fscache_read_page(inode, &folio->page);
30216f2f4e6SDavid Howells 		if (error == 0)
30316f2f4e6SDavid Howells 			goto out_unlock;
30416f2f4e6SDavid Howells 	}
30516f2f4e6SDavid Howells 
306ab75bff1STrond Myklebust 	new = nfs_page_create_from_folio(desc->ctx, folio, 0, aligned_len);
3071e83b173SDave Wysochanski 	if (IS_ERR(new))
3081e83b173SDave Wysochanski 		goto out_error;
3091e83b173SDave Wysochanski 
310ab75bff1STrond Myklebust 	if (len < fsize)
311ab75bff1STrond Myklebust 		folio_zero_segment(folio, len, fsize);
3121e83b173SDave Wysochanski 	if (!nfs_pageio_add_request(&desc->pgio, new)) {
3131e83b173SDave Wysochanski 		nfs_list_remove_request(new);
3141e83b173SDave Wysochanski 		error = desc->pgio.pg_error;
3151e83b173SDave Wysochanski 		nfs_readpage_release(new, error);
3161e83b173SDave Wysochanski 		goto out;
3171e83b173SDave Wysochanski 	}
3181e83b173SDave Wysochanski 	return 0;
3191e83b173SDave Wysochanski out_error:
3201e83b173SDave Wysochanski 	error = PTR_ERR(new);
32116f2f4e6SDavid Howells out_unlock:
322ab75bff1STrond Myklebust 	folio_unlock(folio);
3231e83b173SDave Wysochanski out:
3241e83b173SDave Wysochanski 	return error;
3251e83b173SDave Wysochanski }
3261e83b173SDave Wysochanski 
3271da177e4SLinus Torvalds /*
3281da177e4SLinus Torvalds  * Read a page over NFS.
3291da177e4SLinus Torvalds  * We read the page synchronously in the following case:
3301da177e4SLinus Torvalds  *  -	The error flag is set for this page. This happens only when a
3311da177e4SLinus Torvalds  *	previous async read operation failed.
3321da177e4SLinus Torvalds  */
33365d023afSMatthew Wilcox (Oracle) int nfs_read_folio(struct file *file, struct folio *folio)
3341da177e4SLinus Torvalds {
3351af7e7f8SDave Wysochanski 	struct nfs_readdesc desc;
336ab75bff1STrond Myklebust 	struct inode *inode = file_inode(file);
33749dee700SDave Wysochanski 	int ret;
3381da177e4SLinus Torvalds 
339ab75bff1STrond Myklebust 	trace_nfs_aop_readpage(inode, folio);
34091d5b470SChuck Lever 	nfs_inc_stats(inode, NFSIOS_VFSREADPAGE);
341*9c88ea00SDave Wysochanski 	task_io_account_read(folio_size(folio));
34291d5b470SChuck Lever 
3431da177e4SLinus Torvalds 	/*
3441da177e4SLinus Torvalds 	 * Try to flush any pending writes to the file..
3451da177e4SLinus Torvalds 	 *
346ab75bff1STrond Myklebust 	 * NOTE! Because we own the folio lock, there cannot
3471da177e4SLinus Torvalds 	 * be any new pending writes generated at this point
348ab75bff1STrond Myklebust 	 * for this folio (other folios can be written to).
3491da177e4SLinus Torvalds 	 */
350ab75bff1STrond Myklebust 	ret = nfs_wb_folio(inode, folio);
35149dee700SDave Wysochanski 	if (ret)
352de05a0ccSTrond Myklebust 		goto out_unlock;
353ab75bff1STrond Myklebust 	if (folio_test_uptodate(folio))
354de05a0ccSTrond Myklebust 		goto out_unlock;
3551da177e4SLinus Torvalds 
35649dee700SDave Wysochanski 	ret = -ESTALE;
3575f004cf2STrond Myklebust 	if (NFS_STALE(inode))
358de05a0ccSTrond Myklebust 		goto out_unlock;
3595f004cf2STrond Myklebust 
3601af7e7f8SDave Wysochanski 	desc.ctx = get_nfs_open_context(nfs_file_open_context(file));
3611da177e4SLinus Torvalds 
362ba512c1bSDave Wysochanski 	xchg(&desc.ctx->error, 0);
3631e83b173SDave Wysochanski 	nfs_pageio_init_read(&desc.pgio, inode, false,
3641e83b173SDave Wysochanski 			     &nfs_async_read_completion_ops);
3651e83b173SDave Wysochanski 
366ab75bff1STrond Myklebust 	ret = readpage_async_filler(&desc, folio);
367e0340f16SDave Wysochanski 	if (ret)
368e0340f16SDave Wysochanski 		goto out;
3691e83b173SDave Wysochanski 
370b42ad64fSDave Wysochanski 	nfs_pageio_complete_read(&desc.pgio);
3711e83b173SDave Wysochanski 	ret = desc.pgio.pg_error < 0 ? desc.pgio.pg_error : 0;
37249dee700SDave Wysochanski 	if (!ret) {
373ab75bff1STrond Myklebust 		ret = folio_wait_locked_killable(folio);
374ab75bff1STrond Myklebust 		if (!folio_test_uptodate(folio) && !ret)
3751af7e7f8SDave Wysochanski 			ret = xchg(&desc.ctx->error, 0);
3768f54c7a4STrond Myklebust 	}
3779a9fc1c0SDavid Howells out:
3781af7e7f8SDave Wysochanski 	put_nfs_open_context(desc.ctx);
379ab75bff1STrond Myklebust 	trace_nfs_aop_readpage_done(inode, folio, ret);
38049dee700SDave Wysochanski 	return ret;
381de05a0ccSTrond Myklebust out_unlock:
382ab75bff1STrond Myklebust 	folio_unlock(folio);
383ab75bff1STrond Myklebust 	trace_nfs_aop_readpage_done(inode, folio, ret);
38449dee700SDave Wysochanski 	return ret;
3851da177e4SLinus Torvalds }
3861da177e4SLinus Torvalds 
3878786fde8SMatthew Wilcox (Oracle) void nfs_readahead(struct readahead_control *ractl)
3881da177e4SLinus Torvalds {
3898786fde8SMatthew Wilcox (Oracle) 	unsigned int nr_pages = readahead_count(ractl);
3908786fde8SMatthew Wilcox (Oracle) 	struct file *file = ractl->file;
39149dee700SDave Wysochanski 	struct nfs_readdesc desc;
3928786fde8SMatthew Wilcox (Oracle) 	struct inode *inode = ractl->mapping->host;
393ab75bff1STrond Myklebust 	struct folio *folio;
39449dee700SDave Wysochanski 	int ret;
3951da177e4SLinus Torvalds 
3968786fde8SMatthew Wilcox (Oracle) 	trace_nfs_aop_readahead(inode, readahead_pos(ractl), nr_pages);
39791d5b470SChuck Lever 	nfs_inc_stats(inode, NFSIOS_VFSREADPAGES);
398*9c88ea00SDave Wysochanski 	task_io_account_read(readahead_length(ractl));
3991da177e4SLinus Torvalds 
40049dee700SDave Wysochanski 	ret = -ESTALE;
4015f004cf2STrond Myklebust 	if (NFS_STALE(inode))
4025f004cf2STrond Myklebust 		goto out;
4035f004cf2STrond Myklebust 
40449dee700SDave Wysochanski 	if (file == NULL) {
40549dee700SDave Wysochanski 		ret = -EBADF;
406d530838bSTrond Myklebust 		desc.ctx = nfs_find_open_context(inode, NULL, FMODE_READ);
4071da177e4SLinus Torvalds 		if (desc.ctx == NULL)
40849dee700SDave Wysochanski 			goto out;
4091da177e4SLinus Torvalds 	} else
41049dee700SDave Wysochanski 		desc.ctx = get_nfs_open_context(nfs_file_open_context(file));
4119a9fc1c0SDavid Howells 
4121af7e7f8SDave Wysochanski 	nfs_pageio_init_read(&desc.pgio, inode, false,
413fab5fc25SChristoph Hellwig 			     &nfs_async_read_completion_ops);
4148b09bee3STrond Myklebust 
415ab75bff1STrond Myklebust 	while ((folio = readahead_folio(ractl)) != NULL) {
416ab75bff1STrond Myklebust 		ret = readpage_async_filler(&desc, folio);
4178786fde8SMatthew Wilcox (Oracle) 		if (ret)
4188786fde8SMatthew Wilcox (Oracle) 			break;
4198786fde8SMatthew Wilcox (Oracle) 	}
420a7d42ddbSWeston Andros Adamson 
421b42ad64fSDave Wysochanski 	nfs_pageio_complete_read(&desc.pgio);
422a7d42ddbSWeston Andros Adamson 
4231da177e4SLinus Torvalds 	put_nfs_open_context(desc.ctx);
4245f004cf2STrond Myklebust out:
425d9f87743SChuck Lever 	trace_nfs_aop_readahead_done(inode, nr_pages, ret);
4261da177e4SLinus Torvalds }
4271da177e4SLinus Torvalds 
428f7b422b1SDavid Howells int __init nfs_init_readpagecache(void)
4291da177e4SLinus Torvalds {
4301da177e4SLinus Torvalds 	nfs_rdata_cachep = kmem_cache_create("nfs_read_data",
4311e7f3a48SWeston Andros Adamson 					     sizeof(struct nfs_pgio_header),
4321da177e4SLinus Torvalds 					     0, SLAB_HWCACHE_ALIGN,
43320c2df83SPaul Mundt 					     NULL);
4341da177e4SLinus Torvalds 	if (nfs_rdata_cachep == NULL)
4351da177e4SLinus Torvalds 		return -ENOMEM;
4361da177e4SLinus Torvalds 
4371da177e4SLinus Torvalds 	return 0;
4381da177e4SLinus Torvalds }
4391da177e4SLinus Torvalds 
440266bee88SDavid Brownell void nfs_destroy_readpagecache(void)
4411da177e4SLinus Torvalds {
4421a1d92c1SAlexey Dobriyan 	kmem_cache_destroy(nfs_rdata_cachep);
4431da177e4SLinus Torvalds }
4444a0de55cSAnna Schumaker 
4454a0de55cSAnna Schumaker static const struct nfs_rw_ops nfs_rw_read_ops = {
4464a0de55cSAnna Schumaker 	.rw_alloc_header	= nfs_readhdr_alloc,
4474a0de55cSAnna Schumaker 	.rw_free_header		= nfs_readhdr_free,
4480eecb214SAnna Schumaker 	.rw_done		= nfs_readpage_done,
4490eecb214SAnna Schumaker 	.rw_result		= nfs_readpage_result,
4501ed26f33SAnna Schumaker 	.rw_initiate		= nfs_initiate_read,
4514a0de55cSAnna Schumaker };
452