xref: /openbmc/linux/fs/nfs/read.c (revision 01c3a40084a42b7a242776d1e9f8e10d4e96c6ef)
// SPDX-License-Identifier: GPL-2.0-only
/*
 * linux/fs/nfs/read.c
 *
 * Block I/O for NFS
 *
 * Partial copy of Linus' read cache modifications to fs/nfs/file.c
 * modified for async RPC by okir@monad.swb.de
 */
101da177e4SLinus Torvalds 
111da177e4SLinus Torvalds #include <linux/time.h>
121da177e4SLinus Torvalds #include <linux/kernel.h>
131da177e4SLinus Torvalds #include <linux/errno.h>
141da177e4SLinus Torvalds #include <linux/fcntl.h>
151da177e4SLinus Torvalds #include <linux/stat.h>
161da177e4SLinus Torvalds #include <linux/mm.h>
171da177e4SLinus Torvalds #include <linux/slab.h>
189c88ea00SDave Wysochanski #include <linux/task_io_accounting_ops.h>
191da177e4SLinus Torvalds #include <linux/pagemap.h>
201da177e4SLinus Torvalds #include <linux/sunrpc/clnt.h>
211da177e4SLinus Torvalds #include <linux/nfs_fs.h>
221da177e4SLinus Torvalds #include <linux/nfs_page.h>
2364419a9bSAndy Adamson #include <linux/module.h>
241da177e4SLinus Torvalds 
25f11c88afSAndy Adamson #include "nfs4_fs.h"
2649a70f27STrond Myklebust #include "internal.h"
2791d5b470SChuck Lever #include "iostat.h"
289a9fc1c0SDavid Howells #include "fscache.h"
29fab5fc25SChristoph Hellwig #include "pnfs.h"
308224b273SChuck Lever #include "nfstrace.h"
3191d5b470SChuck Lever 
321da177e4SLinus Torvalds #define NFSDBG_FACILITY		NFSDBG_PAGECACHE
331da177e4SLinus Torvalds 
34061ae2edSFred Isaman static const struct nfs_pgio_completion_ops nfs_async_read_completion_ops;
354a0de55cSAnna Schumaker static const struct nfs_rw_ops nfs_rw_read_ops;
361da177e4SLinus Torvalds 
37e18b890bSChristoph Lameter static struct kmem_cache *nfs_rdata_cachep;
381da177e4SLinus Torvalds 
391e7f3a48SWeston Andros Adamson static struct nfs_pgio_header *nfs_readhdr_alloc(void)
403feb2d49STrond Myklebust {
41fbe77c30SBenjamin Coddington 	struct nfs_pgio_header *p = kmem_cache_zalloc(nfs_rdata_cachep, GFP_KERNEL);
42fbe77c30SBenjamin Coddington 
43fbe77c30SBenjamin Coddington 	if (p)
44fbe77c30SBenjamin Coddington 		p->rw_mode = FMODE_READ;
45fbe77c30SBenjamin Coddington 	return p;
464db6e0b7SFred Isaman }
474db6e0b7SFred Isaman 
481e7f3a48SWeston Andros Adamson static void nfs_readhdr_free(struct nfs_pgio_header *rhdr)
493feb2d49STrond Myklebust {
50cd841605SFred Isaman 	kmem_cache_free(nfs_rdata_cachep, rhdr);
513feb2d49STrond Myklebust }
523feb2d49STrond Myklebust 
53ab75bff1STrond Myklebust static int nfs_return_empty_folio(struct folio *folio)
541da177e4SLinus Torvalds {
55ab75bff1STrond Myklebust 	folio_zero_segment(folio, 0, folio_size(folio));
56ab75bff1STrond Myklebust 	folio_mark_uptodate(folio);
57ab75bff1STrond Myklebust 	folio_unlock(folio);
581da177e4SLinus Torvalds 	return 0;
591da177e4SLinus Torvalds }
601da177e4SLinus Torvalds 
611abb5088SBryan Schumaker void nfs_pageio_init_read(struct nfs_pageio_descriptor *pgio,
62fab5fc25SChristoph Hellwig 			      struct inode *inode, bool force_mds,
63061ae2edSFred Isaman 			      const struct nfs_pgio_completion_ops *compl_ops)
641751c363STrond Myklebust {
65fab5fc25SChristoph Hellwig 	struct nfs_server *server = NFS_SERVER(inode);
6641d8d5b7SAnna Schumaker 	const struct nfs_pageio_ops *pg_ops = &nfs_pgio_rw_ops;
67fab5fc25SChristoph Hellwig 
68fab5fc25SChristoph Hellwig #ifdef CONFIG_NFS_V4_1
69fab5fc25SChristoph Hellwig 	if (server->pnfs_curr_ld && !force_mds)
70fab5fc25SChristoph Hellwig 		pg_ops = server->pnfs_curr_ld->pg_read_ops;
71fab5fc25SChristoph Hellwig #endif
724a0de55cSAnna Schumaker 	nfs_pageio_init(pgio, inode, pg_ops, compl_ops, &nfs_rw_read_ops,
733bde7afdSTrond Myklebust 			server->rsize, 0);
741751c363STrond Myklebust }
75ddda8e0aSBryan Schumaker EXPORT_SYMBOL_GPL(nfs_pageio_init_read);
761751c363STrond Myklebust 
77b42ad64fSDave Wysochanski static void nfs_pageio_complete_read(struct nfs_pageio_descriptor *pgio)
781e83b173SDave Wysochanski {
791e83b173SDave Wysochanski 	struct nfs_pgio_mirror *pgm;
801e83b173SDave Wysochanski 	unsigned long npages;
811e83b173SDave Wysochanski 
821e83b173SDave Wysochanski 	nfs_pageio_complete(pgio);
831e83b173SDave Wysochanski 
841e83b173SDave Wysochanski 	/* It doesn't make sense to do mirrored reads! */
851e83b173SDave Wysochanski 	WARN_ON_ONCE(pgio->pg_mirror_count != 1);
861e83b173SDave Wysochanski 
871e83b173SDave Wysochanski 	pgm = &pgio->pg_mirrors[0];
88b42ad64fSDave Wysochanski 	NFS_I(pgio->pg_inode)->read_io += pgm->pg_bytes_written;
891e83b173SDave Wysochanski 	npages = (pgm->pg_bytes_written + PAGE_SIZE - 1) >> PAGE_SHIFT;
90b42ad64fSDave Wysochanski 	nfs_add_stats(pgio->pg_inode, NFSIOS_READPAGES, npages);
911e83b173SDave Wysochanski }
921e83b173SDave Wysochanski 
931e83b173SDave Wysochanski 
94493292ddSTrond Myklebust void nfs_pageio_reset_read_mds(struct nfs_pageio_descriptor *pgio)
95493292ddSTrond Myklebust {
96a7d42ddbSWeston Andros Adamson 	struct nfs_pgio_mirror *mirror;
97a7d42ddbSWeston Andros Adamson 
986f29b9bbSKinglong Mee 	if (pgio->pg_ops && pgio->pg_ops->pg_cleanup)
996f29b9bbSKinglong Mee 		pgio->pg_ops->pg_cleanup(pgio);
1006f29b9bbSKinglong Mee 
10141d8d5b7SAnna Schumaker 	pgio->pg_ops = &nfs_pgio_rw_ops;
102a7d42ddbSWeston Andros Adamson 
103a7d42ddbSWeston Andros Adamson 	/* read path should never have more than one mirror */
104a7d42ddbSWeston Andros Adamson 	WARN_ON_ONCE(pgio->pg_mirror_count != 1);
105a7d42ddbSWeston Andros Adamson 
106a7d42ddbSWeston Andros Adamson 	mirror = &pgio->pg_mirrors[0];
107a7d42ddbSWeston Andros Adamson 	mirror->pg_bsize = NFS_SERVER(pgio->pg_inode)->rsize;
108493292ddSTrond Myklebust }
1091f945357STrond Myklebust EXPORT_SYMBOL_GPL(nfs_pageio_reset_read_mds);
110493292ddSTrond Myklebust 
1118f54c7a4STrond Myklebust static void nfs_readpage_release(struct nfs_page *req, int error)
1120bcbf039SPeng Tao {
1139fcd5960STrond Myklebust 	struct inode *inode = d_inode(nfs_req_openctx(req)->dentry);
114ab75bff1STrond Myklebust 	struct folio *folio = nfs_page_to_folio(req);
1150bcbf039SPeng Tao 
1160bcbf039SPeng Tao 	dprintk("NFS: read done (%s/%llu %d@%lld)\n", inode->i_sb->s_id,
1170bcbf039SPeng Tao 		(unsigned long long)NFS_FILEID(inode), req->wb_bytes,
1180bcbf039SPeng Tao 		(long long)req_offset(req));
1190bcbf039SPeng Tao 
1208f54c7a4STrond Myklebust 	if (nfs_error_is_fatal_on_server(error) && error != -ETIMEDOUT)
121ab75bff1STrond Myklebust 		folio_set_error(folio);
1220bcbf039SPeng Tao 	if (nfs_page_group_sync_on_bit(req, PG_UNLOCKPAGE)) {
123ab75bff1STrond Myklebust 		if (folio_test_uptodate(folio))
124ab75bff1STrond Myklebust 			nfs_fscache_write_page(inode, &folio->page);
125ab75bff1STrond Myklebust 		folio_unlock(folio);
1260bcbf039SPeng Tao 	}
1270bcbf039SPeng Tao 	nfs_release_request(req);
1280bcbf039SPeng Tao }
1290bcbf039SPeng Tao 
13067d0338eSWeston Andros Adamson static void nfs_page_group_set_uptodate(struct nfs_page *req)
13167d0338eSWeston Andros Adamson {
13267d0338eSWeston Andros Adamson 	if (nfs_page_group_sync_on_bit(req, PG_UPTODATE))
133ab75bff1STrond Myklebust 		folio_mark_uptodate(nfs_page_to_folio(req));
13467d0338eSWeston Andros Adamson }
13567d0338eSWeston Andros Adamson 
136061ae2edSFred Isaman static void nfs_read_completion(struct nfs_pgio_header *hdr)
1374db6e0b7SFred Isaman {
1384db6e0b7SFred Isaman 	unsigned long bytes = 0;
1398f54c7a4STrond Myklebust 	int error;
1404db6e0b7SFred Isaman 
1414db6e0b7SFred Isaman 	if (test_bit(NFS_IOHDR_REDO, &hdr->flags))
1424db6e0b7SFred Isaman 		goto out;
1434db6e0b7SFred Isaman 	while (!list_empty(&hdr->pages)) {
1444db6e0b7SFred Isaman 		struct nfs_page *req = nfs_list_entry(hdr->pages.next);
145ab75bff1STrond Myklebust 		struct folio *folio = nfs_page_to_folio(req);
14668072992SWeston Andros Adamson 		unsigned long start = req->wb_pgbase;
14768072992SWeston Andros Adamson 		unsigned long end = req->wb_pgbase + req->wb_bytes;
1484db6e0b7SFred Isaman 
1494db6e0b7SFred Isaman 		if (test_bit(NFS_IOHDR_EOF, &hdr->flags)) {
15068072992SWeston Andros Adamson 			/* note: regions of the page not covered by a
151*01c3a400SDave Wysochanski 			 * request are zeroed in nfs_read_add_folio
152*01c3a400SDave Wysochanski 			 */
15368072992SWeston Andros Adamson 			if (bytes > hdr->good_bytes) {
15468072992SWeston Andros Adamson 				/* nothing in this request was good, so zero
15568072992SWeston Andros Adamson 				 * the full extent of the request */
156ab75bff1STrond Myklebust 				folio_zero_segment(folio, start, end);
15768072992SWeston Andros Adamson 
15868072992SWeston Andros Adamson 			} else if (hdr->good_bytes - bytes < req->wb_bytes) {
15968072992SWeston Andros Adamson 				/* part of this request has good bytes, but
16068072992SWeston Andros Adamson 				 * not all. zero the bad bytes */
16168072992SWeston Andros Adamson 				start += hdr->good_bytes - bytes;
16268072992SWeston Andros Adamson 				WARN_ON(start < req->wb_pgbase);
163ab75bff1STrond Myklebust 				folio_zero_segment(folio, start, end);
16468072992SWeston Andros Adamson 			}
1654db6e0b7SFred Isaman 		}
1668f54c7a4STrond Myklebust 		error = 0;
1674bd8b010STrond Myklebust 		bytes += req->wb_bytes;
1684bd8b010STrond Myklebust 		if (test_bit(NFS_IOHDR_ERROR, &hdr->flags)) {
1694bd8b010STrond Myklebust 			if (bytes <= hdr->good_bytes)
17067d0338eSWeston Andros Adamson 				nfs_page_group_set_uptodate(req);
1718f54c7a4STrond Myklebust 			else {
1728f54c7a4STrond Myklebust 				error = hdr->error;
1738f54c7a4STrond Myklebust 				xchg(&nfs_req_openctx(req)->error, error);
1748f54c7a4STrond Myklebust 			}
1754bd8b010STrond Myklebust 		} else
17667d0338eSWeston Andros Adamson 			nfs_page_group_set_uptodate(req);
1774db6e0b7SFred Isaman 		nfs_list_remove_request(req);
1788f54c7a4STrond Myklebust 		nfs_readpage_release(req, error);
1794db6e0b7SFred Isaman 	}
1804db6e0b7SFred Isaman out:
1814db6e0b7SFred Isaman 	hdr->release(hdr);
1824db6e0b7SFred Isaman }
1834db6e0b7SFred Isaman 
184d45f60c6SWeston Andros Adamson static void nfs_initiate_read(struct nfs_pgio_header *hdr,
185d45f60c6SWeston Andros Adamson 			      struct rpc_message *msg,
186abde71f4STom Haynes 			      const struct nfs_rpc_ops *rpc_ops,
1871ed26f33SAnna Schumaker 			      struct rpc_task_setup *task_setup_data, int how)
18864419a9bSAndy Adamson {
189abde71f4STom Haynes 	rpc_ops->read_setup(hdr, msg);
1902343172dSTrond Myklebust 	trace_nfs_initiate_read(hdr);
19164419a9bSAndy Adamson }
19264419a9bSAndy Adamson 
193061ae2edSFred Isaman static void
194df3accb8STrond Myklebust nfs_async_read_error(struct list_head *head, int error)
1951da177e4SLinus Torvalds {
1961da177e4SLinus Torvalds 	struct nfs_page	*req;
1971da177e4SLinus Torvalds 
1981da177e4SLinus Torvalds 	while (!list_empty(head)) {
1991da177e4SLinus Torvalds 		req = nfs_list_entry(head->next);
2001da177e4SLinus Torvalds 		nfs_list_remove_request(req);
2018f54c7a4STrond Myklebust 		nfs_readpage_release(req, error);
2021da177e4SLinus Torvalds 	}
2031da177e4SLinus Torvalds }
2041da177e4SLinus Torvalds 
205061ae2edSFred Isaman static const struct nfs_pgio_completion_ops nfs_async_read_completion_ops = {
206061ae2edSFred Isaman 	.error_cleanup = nfs_async_read_error,
207061ae2edSFred Isaman 	.completion = nfs_read_completion,
208061ae2edSFred Isaman };
209061ae2edSFred Isaman 
2101da177e4SLinus Torvalds /*
2110b671301STrond Myklebust  * This is the callback from RPC telling us whether a reply was
2120b671301STrond Myklebust  * received or some error occurred (timeout or socket shutdown).
2130b671301STrond Myklebust  */
214d45f60c6SWeston Andros Adamson static int nfs_readpage_done(struct rpc_task *task,
215d45f60c6SWeston Andros Adamson 			     struct nfs_pgio_header *hdr,
2160eecb214SAnna Schumaker 			     struct inode *inode)
2170b671301STrond Myklebust {
218d45f60c6SWeston Andros Adamson 	int status = NFS_PROTO(inode)->read_done(task, hdr);
2190b671301STrond Myklebust 	if (status != 0)
2200b671301STrond Myklebust 		return status;
2210b671301STrond Myklebust 
222d45f60c6SWeston Andros Adamson 	nfs_add_stats(inode, NFSIOS_SERVERREADBYTES, hdr->res.count);
2232343172dSTrond Myklebust 	trace_nfs_readpage_done(task, hdr);
2240b671301STrond Myklebust 
2250b671301STrond Myklebust 	if (task->tk_status == -ESTALE) {
22693ce4af7STrond Myklebust 		nfs_set_inode_stale(inode);
227cd841605SFred Isaman 		nfs_mark_for_revalidate(inode);
2280b671301STrond Myklebust 	}
2290b671301STrond Myklebust 	return 0;
2300b671301STrond Myklebust }
2310b671301STrond Myklebust 
232d45f60c6SWeston Andros Adamson static void nfs_readpage_retry(struct rpc_task *task,
233d45f60c6SWeston Andros Adamson 			       struct nfs_pgio_header *hdr)
2340b671301STrond Myklebust {
235d45f60c6SWeston Andros Adamson 	struct nfs_pgio_args *argp = &hdr->args;
236d45f60c6SWeston Andros Adamson 	struct nfs_pgio_res  *resp = &hdr->res;
2370b671301STrond Myklebust 
2380b671301STrond Myklebust 	/* This is a short read! */
239d45f60c6SWeston Andros Adamson 	nfs_inc_stats(hdr->inode, NFSIOS_SHORTREAD);
240fd2b6121SChuck Lever 	trace_nfs_readpage_short(task, hdr);
241fd2b6121SChuck Lever 
2420b671301STrond Myklebust 	/* Has the server at least made some progress? */
2434db6e0b7SFred Isaman 	if (resp->count == 0) {
244d45f60c6SWeston Andros Adamson 		nfs_set_pgio_error(hdr, -EIO, argp->offset);
245d61e612aSTrond Myklebust 		return;
2464db6e0b7SFred Isaman 	}
247f8417b48SKinglong Mee 
248f8417b48SKinglong Mee 	/* For non rpc-based layout drivers, retry-through-MDS */
249f8417b48SKinglong Mee 	if (!task->tk_ops) {
250f8417b48SKinglong Mee 		hdr->pnfs_error = -EAGAIN;
251f8417b48SKinglong Mee 		return;
252f8417b48SKinglong Mee 	}
253f8417b48SKinglong Mee 
254d45f60c6SWeston Andros Adamson 	/* Yes, so retry the read at the end of the hdr */
255d45f60c6SWeston Andros Adamson 	hdr->mds_offset += resp->count;
2560b671301STrond Myklebust 	argp->offset += resp->count;
2570b671301STrond Myklebust 	argp->pgbase += resp->count;
2580b671301STrond Myklebust 	argp->count -= resp->count;
2598c9cb714STrond Myklebust 	resp->count = 0;
2608c9cb714STrond Myklebust 	resp->eof = 0;
261d00c5d43STrond Myklebust 	rpc_restart_call_prepare(task);
2620b671301STrond Myklebust }
2630b671301STrond Myklebust 
264d45f60c6SWeston Andros Adamson static void nfs_readpage_result(struct rpc_task *task,
265d45f60c6SWeston Andros Adamson 				struct nfs_pgio_header *hdr)
2661da177e4SLinus Torvalds {
267d45f60c6SWeston Andros Adamson 	if (hdr->res.eof) {
2681c6c4b74STrond Myklebust 		loff_t pos = hdr->args.offset + hdr->res.count;
2691c6c4b74STrond Myklebust 		unsigned int new = pos - hdr->io_start;
270fdd1e74cSTrond Myklebust 
2711c6c4b74STrond Myklebust 		if (hdr->good_bytes > new) {
2721c6c4b74STrond Myklebust 			hdr->good_bytes = new;
2734db6e0b7SFred Isaman 			set_bit(NFS_IOHDR_EOF, &hdr->flags);
2744db6e0b7SFred Isaman 			clear_bit(NFS_IOHDR_ERROR, &hdr->flags);
2754db6e0b7SFred Isaman 		}
276f8417b48SKinglong Mee 	} else if (hdr->res.count < hdr->args.count)
277d45f60c6SWeston Andros Adamson 		nfs_readpage_retry(task, hdr);
2780b671301STrond Myklebust }
279fdd1e74cSTrond Myklebust 
280*01c3a400SDave Wysochanski static int nfs_read_add_folio(struct nfs_pageio_descriptor *pgio,
281*01c3a400SDave Wysochanski 			      struct nfs_open_context *ctx,
282*01c3a400SDave Wysochanski 			      struct folio *folio)
2831e83b173SDave Wysochanski {
284ab75bff1STrond Myklebust 	struct inode *inode = folio_file_mapping(folio)->host;
285ab75bff1STrond Myklebust 	struct nfs_server *server = NFS_SERVER(inode);
286ab75bff1STrond Myklebust 	size_t fsize = folio_size(folio);
287ab75bff1STrond Myklebust 	unsigned int rsize = server->rsize;
2881e83b173SDave Wysochanski 	struct nfs_page *new;
2898cfb9015STrond Myklebust 	unsigned int len, aligned_len;
2901e83b173SDave Wysochanski 	int error;
2911e83b173SDave Wysochanski 
292ab75bff1STrond Myklebust 	len = nfs_folio_length(folio);
2931e83b173SDave Wysochanski 	if (len == 0)
294ab75bff1STrond Myklebust 		return nfs_return_empty_folio(folio);
2951e83b173SDave Wysochanski 
296ab75bff1STrond Myklebust 	aligned_len = min_t(unsigned int, ALIGN(len, rsize), fsize);
2978cfb9015STrond Myklebust 
298ab75bff1STrond Myklebust 	if (!IS_SYNC(inode)) {
299ab75bff1STrond Myklebust 		error = nfs_fscache_read_page(inode, &folio->page);
30016f2f4e6SDavid Howells 		if (error == 0)
30116f2f4e6SDavid Howells 			goto out_unlock;
30216f2f4e6SDavid Howells 	}
30316f2f4e6SDavid Howells 
304*01c3a400SDave Wysochanski 	new = nfs_page_create_from_folio(ctx, folio, 0, aligned_len);
3051e83b173SDave Wysochanski 	if (IS_ERR(new))
3061e83b173SDave Wysochanski 		goto out_error;
3071e83b173SDave Wysochanski 
308ab75bff1STrond Myklebust 	if (len < fsize)
309ab75bff1STrond Myklebust 		folio_zero_segment(folio, len, fsize);
310*01c3a400SDave Wysochanski 	if (!nfs_pageio_add_request(pgio, new)) {
3111e83b173SDave Wysochanski 		nfs_list_remove_request(new);
312*01c3a400SDave Wysochanski 		error = pgio->pg_error;
3131e83b173SDave Wysochanski 		nfs_readpage_release(new, error);
3141e83b173SDave Wysochanski 		goto out;
3151e83b173SDave Wysochanski 	}
3161e83b173SDave Wysochanski 	return 0;
3171e83b173SDave Wysochanski out_error:
3181e83b173SDave Wysochanski 	error = PTR_ERR(new);
31916f2f4e6SDavid Howells out_unlock:
320ab75bff1STrond Myklebust 	folio_unlock(folio);
3211e83b173SDave Wysochanski out:
3221e83b173SDave Wysochanski 	return error;
3231e83b173SDave Wysochanski }
3241e83b173SDave Wysochanski 
3251da177e4SLinus Torvalds /*
3261da177e4SLinus Torvalds  * Read a page over NFS.
3271da177e4SLinus Torvalds  * We read the page synchronously in the following case:
3281da177e4SLinus Torvalds  *  -	The error flag is set for this page. This happens only when a
3291da177e4SLinus Torvalds  *	previous async read operation failed.
3301da177e4SLinus Torvalds  */
33165d023afSMatthew Wilcox (Oracle) int nfs_read_folio(struct file *file, struct folio *folio)
3321da177e4SLinus Torvalds {
333ab75bff1STrond Myklebust 	struct inode *inode = file_inode(file);
334*01c3a400SDave Wysochanski 	struct nfs_pageio_descriptor pgio;
335*01c3a400SDave Wysochanski 	struct nfs_open_context *ctx;
33649dee700SDave Wysochanski 	int ret;
3371da177e4SLinus Torvalds 
338ab75bff1STrond Myklebust 	trace_nfs_aop_readpage(inode, folio);
33991d5b470SChuck Lever 	nfs_inc_stats(inode, NFSIOS_VFSREADPAGE);
3409c88ea00SDave Wysochanski 	task_io_account_read(folio_size(folio));
34191d5b470SChuck Lever 
3421da177e4SLinus Torvalds 	/*
3431da177e4SLinus Torvalds 	 * Try to flush any pending writes to the file..
3441da177e4SLinus Torvalds 	 *
345ab75bff1STrond Myklebust 	 * NOTE! Because we own the folio lock, there cannot
3461da177e4SLinus Torvalds 	 * be any new pending writes generated at this point
347ab75bff1STrond Myklebust 	 * for this folio (other folios can be written to).
3481da177e4SLinus Torvalds 	 */
349ab75bff1STrond Myklebust 	ret = nfs_wb_folio(inode, folio);
35049dee700SDave Wysochanski 	if (ret)
351de05a0ccSTrond Myklebust 		goto out_unlock;
352ab75bff1STrond Myklebust 	if (folio_test_uptodate(folio))
353de05a0ccSTrond Myklebust 		goto out_unlock;
3541da177e4SLinus Torvalds 
35549dee700SDave Wysochanski 	ret = -ESTALE;
3565f004cf2STrond Myklebust 	if (NFS_STALE(inode))
357de05a0ccSTrond Myklebust 		goto out_unlock;
3585f004cf2STrond Myklebust 
359*01c3a400SDave Wysochanski 	ctx = get_nfs_open_context(nfs_file_open_context(file));
3601da177e4SLinus Torvalds 
361*01c3a400SDave Wysochanski 	xchg(&ctx->error, 0);
362*01c3a400SDave Wysochanski 	nfs_pageio_init_read(&pgio, inode, false,
3631e83b173SDave Wysochanski 			     &nfs_async_read_completion_ops);
3641e83b173SDave Wysochanski 
365*01c3a400SDave Wysochanski 	ret = nfs_read_add_folio(&pgio, ctx, folio);
366e0340f16SDave Wysochanski 	if (ret)
367e0340f16SDave Wysochanski 		goto out;
3681e83b173SDave Wysochanski 
369*01c3a400SDave Wysochanski 	nfs_pageio_complete_read(&pgio);
370*01c3a400SDave Wysochanski 	ret = pgio.pg_error < 0 ? pgio.pg_error : 0;
37149dee700SDave Wysochanski 	if (!ret) {
372ab75bff1STrond Myklebust 		ret = folio_wait_locked_killable(folio);
373ab75bff1STrond Myklebust 		if (!folio_test_uptodate(folio) && !ret)
374*01c3a400SDave Wysochanski 			ret = xchg(&ctx->error, 0);
3758f54c7a4STrond Myklebust 	}
3769a9fc1c0SDavid Howells out:
377*01c3a400SDave Wysochanski 	put_nfs_open_context(ctx);
378ab75bff1STrond Myklebust 	trace_nfs_aop_readpage_done(inode, folio, ret);
37949dee700SDave Wysochanski 	return ret;
380de05a0ccSTrond Myklebust out_unlock:
381ab75bff1STrond Myklebust 	folio_unlock(folio);
382ab75bff1STrond Myklebust 	trace_nfs_aop_readpage_done(inode, folio, ret);
38349dee700SDave Wysochanski 	return ret;
3841da177e4SLinus Torvalds }
3851da177e4SLinus Torvalds 
3868786fde8SMatthew Wilcox (Oracle) void nfs_readahead(struct readahead_control *ractl)
3871da177e4SLinus Torvalds {
388*01c3a400SDave Wysochanski 	struct nfs_pageio_descriptor pgio;
389*01c3a400SDave Wysochanski 	struct nfs_open_context *ctx;
3908786fde8SMatthew Wilcox (Oracle) 	unsigned int nr_pages = readahead_count(ractl);
3918786fde8SMatthew Wilcox (Oracle) 	struct file *file = ractl->file;
3928786fde8SMatthew Wilcox (Oracle) 	struct inode *inode = ractl->mapping->host;
393ab75bff1STrond Myklebust 	struct folio *folio;
39449dee700SDave Wysochanski 	int ret;
3951da177e4SLinus Torvalds 
3968786fde8SMatthew Wilcox (Oracle) 	trace_nfs_aop_readahead(inode, readahead_pos(ractl), nr_pages);
39791d5b470SChuck Lever 	nfs_inc_stats(inode, NFSIOS_VFSREADPAGES);
3989c88ea00SDave Wysochanski 	task_io_account_read(readahead_length(ractl));
3991da177e4SLinus Torvalds 
40049dee700SDave Wysochanski 	ret = -ESTALE;
4015f004cf2STrond Myklebust 	if (NFS_STALE(inode))
4025f004cf2STrond Myklebust 		goto out;
4035f004cf2STrond Myklebust 
40449dee700SDave Wysochanski 	if (file == NULL) {
40549dee700SDave Wysochanski 		ret = -EBADF;
406*01c3a400SDave Wysochanski 		ctx = nfs_find_open_context(inode, NULL, FMODE_READ);
407*01c3a400SDave Wysochanski 		if (ctx == NULL)
40849dee700SDave Wysochanski 			goto out;
4091da177e4SLinus Torvalds 	} else
410*01c3a400SDave Wysochanski 		ctx = get_nfs_open_context(nfs_file_open_context(file));
4119a9fc1c0SDavid Howells 
412*01c3a400SDave Wysochanski 	nfs_pageio_init_read(&pgio, inode, false,
413fab5fc25SChristoph Hellwig 			     &nfs_async_read_completion_ops);
4148b09bee3STrond Myklebust 
415ab75bff1STrond Myklebust 	while ((folio = readahead_folio(ractl)) != NULL) {
416*01c3a400SDave Wysochanski 		ret = nfs_read_add_folio(&pgio, ctx, folio);
4178786fde8SMatthew Wilcox (Oracle) 		if (ret)
4188786fde8SMatthew Wilcox (Oracle) 			break;
4198786fde8SMatthew Wilcox (Oracle) 	}
420a7d42ddbSWeston Andros Adamson 
421*01c3a400SDave Wysochanski 	nfs_pageio_complete_read(&pgio);
422a7d42ddbSWeston Andros Adamson 
423*01c3a400SDave Wysochanski 	put_nfs_open_context(ctx);
4245f004cf2STrond Myklebust out:
425d9f87743SChuck Lever 	trace_nfs_aop_readahead_done(inode, nr_pages, ret);
4261da177e4SLinus Torvalds }
4271da177e4SLinus Torvalds 
428f7b422b1SDavid Howells int __init nfs_init_readpagecache(void)
4291da177e4SLinus Torvalds {
4301da177e4SLinus Torvalds 	nfs_rdata_cachep = kmem_cache_create("nfs_read_data",
4311e7f3a48SWeston Andros Adamson 					     sizeof(struct nfs_pgio_header),
4321da177e4SLinus Torvalds 					     0, SLAB_HWCACHE_ALIGN,
43320c2df83SPaul Mundt 					     NULL);
4341da177e4SLinus Torvalds 	if (nfs_rdata_cachep == NULL)
4351da177e4SLinus Torvalds 		return -ENOMEM;
4361da177e4SLinus Torvalds 
4371da177e4SLinus Torvalds 	return 0;
4381da177e4SLinus Torvalds }
4391da177e4SLinus Torvalds 
440266bee88SDavid Brownell void nfs_destroy_readpagecache(void)
4411da177e4SLinus Torvalds {
4421a1d92c1SAlexey Dobriyan 	kmem_cache_destroy(nfs_rdata_cachep);
4431da177e4SLinus Torvalds }
4444a0de55cSAnna Schumaker 
4454a0de55cSAnna Schumaker static const struct nfs_rw_ops nfs_rw_read_ops = {
4464a0de55cSAnna Schumaker 	.rw_alloc_header	= nfs_readhdr_alloc,
4474a0de55cSAnna Schumaker 	.rw_free_header		= nfs_readhdr_free,
4480eecb214SAnna Schumaker 	.rw_done		= nfs_readpage_done,
4490eecb214SAnna Schumaker 	.rw_result		= nfs_readpage_result,
4501ed26f33SAnna Schumaker 	.rw_initiate		= nfs_initiate_read,
4514a0de55cSAnna Schumaker };
452