xref: /openbmc/linux/fs/smb/client/file.c (revision cd743cfead99fbfa176c9b317706da22fb846542)
138c8a9a5SSteve French // SPDX-License-Identifier: LGPL-2.1
238c8a9a5SSteve French /*
338c8a9a5SSteve French  *
438c8a9a5SSteve French  *   vfs operations that deal with files
538c8a9a5SSteve French  *
638c8a9a5SSteve French  *   Copyright (C) International Business Machines  Corp., 2002,2010
738c8a9a5SSteve French  *   Author(s): Steve French (sfrench@us.ibm.com)
838c8a9a5SSteve French  *              Jeremy Allison (jra@samba.org)
938c8a9a5SSteve French  *
1038c8a9a5SSteve French  */
1138c8a9a5SSteve French #include <linux/fs.h>
1238c8a9a5SSteve French #include <linux/filelock.h>
1338c8a9a5SSteve French #include <linux/backing-dev.h>
1438c8a9a5SSteve French #include <linux/stat.h>
1538c8a9a5SSteve French #include <linux/fcntl.h>
1638c8a9a5SSteve French #include <linux/pagemap.h>
1738c8a9a5SSteve French #include <linux/pagevec.h>
1838c8a9a5SSteve French #include <linux/writeback.h>
1938c8a9a5SSteve French #include <linux/task_io_accounting_ops.h>
2038c8a9a5SSteve French #include <linux/delay.h>
2138c8a9a5SSteve French #include <linux/mount.h>
2238c8a9a5SSteve French #include <linux/slab.h>
2338c8a9a5SSteve French #include <linux/swap.h>
2438c8a9a5SSteve French #include <linux/mm.h>
2538c8a9a5SSteve French #include <asm/div64.h>
2638c8a9a5SSteve French #include "cifsfs.h"
2738c8a9a5SSteve French #include "cifspdu.h"
2838c8a9a5SSteve French #include "cifsglob.h"
2938c8a9a5SSteve French #include "cifsproto.h"
3038c8a9a5SSteve French #include "smb2proto.h"
3138c8a9a5SSteve French #include "cifs_unicode.h"
3238c8a9a5SSteve French #include "cifs_debug.h"
3338c8a9a5SSteve French #include "cifs_fs_sb.h"
3438c8a9a5SSteve French #include "fscache.h"
3538c8a9a5SSteve French #include "smbdirect.h"
3638c8a9a5SSteve French #include "fs_context.h"
3738c8a9a5SSteve French #include "cifs_ioctl.h"
3838c8a9a5SSteve French #include "cached_dir.h"
3938c8a9a5SSteve French 
4038c8a9a5SSteve French /*
4138c8a9a5SSteve French  * Remove the dirty flags from a span of pages.
4238c8a9a5SSteve French  */
4338c8a9a5SSteve French static void cifs_undirty_folios(struct inode *inode, loff_t start, unsigned int len)
4438c8a9a5SSteve French {
4538c8a9a5SSteve French 	struct address_space *mapping = inode->i_mapping;
4638c8a9a5SSteve French 	struct folio *folio;
4738c8a9a5SSteve French 	pgoff_t end;
4838c8a9a5SSteve French 
4938c8a9a5SSteve French 	XA_STATE(xas, &mapping->i_pages, start / PAGE_SIZE);
5038c8a9a5SSteve French 
5138c8a9a5SSteve French 	rcu_read_lock();
5238c8a9a5SSteve French 
5338c8a9a5SSteve French 	end = (start + len - 1) / PAGE_SIZE;
5438c8a9a5SSteve French 	xas_for_each_marked(&xas, folio, end, PAGECACHE_TAG_DIRTY) {
5538c8a9a5SSteve French 		if (xas_retry(&xas, folio))
5638c8a9a5SSteve French 			continue;
5738c8a9a5SSteve French 		xas_pause(&xas);
5838c8a9a5SSteve French 		rcu_read_unlock();
5938c8a9a5SSteve French 		folio_lock(folio);
6038c8a9a5SSteve French 		folio_clear_dirty_for_io(folio);
6138c8a9a5SSteve French 		folio_unlock(folio);
6238c8a9a5SSteve French 		rcu_read_lock();
6338c8a9a5SSteve French 	}
6438c8a9a5SSteve French 
6538c8a9a5SSteve French 	rcu_read_unlock();
6638c8a9a5SSteve French }
6738c8a9a5SSteve French 
6838c8a9a5SSteve French /*
6938c8a9a5SSteve French  * Completion of write to server.
7038c8a9a5SSteve French  */
7138c8a9a5SSteve French void cifs_pages_written_back(struct inode *inode, loff_t start, unsigned int len)
7238c8a9a5SSteve French {
7338c8a9a5SSteve French 	struct address_space *mapping = inode->i_mapping;
7438c8a9a5SSteve French 	struct folio *folio;
7538c8a9a5SSteve French 	pgoff_t end;
7638c8a9a5SSteve French 
7738c8a9a5SSteve French 	XA_STATE(xas, &mapping->i_pages, start / PAGE_SIZE);
7838c8a9a5SSteve French 
7938c8a9a5SSteve French 	if (!len)
8038c8a9a5SSteve French 		return;
8138c8a9a5SSteve French 
8238c8a9a5SSteve French 	rcu_read_lock();
8338c8a9a5SSteve French 
8438c8a9a5SSteve French 	end = (start + len - 1) / PAGE_SIZE;
8538c8a9a5SSteve French 	xas_for_each(&xas, folio, end) {
8638c8a9a5SSteve French 		if (xas_retry(&xas, folio))
8738c8a9a5SSteve French 			continue;
8838c8a9a5SSteve French 		if (!folio_test_writeback(folio)) {
8938c8a9a5SSteve French 			WARN_ONCE(1, "bad %x @%llx page %lx %lx\n",
9038c8a9a5SSteve French 				  len, start, folio_index(folio), end);
9138c8a9a5SSteve French 			continue;
9238c8a9a5SSteve French 		}
9338c8a9a5SSteve French 
9438c8a9a5SSteve French 		folio_detach_private(folio);
9538c8a9a5SSteve French 		folio_end_writeback(folio);
9638c8a9a5SSteve French 	}
9738c8a9a5SSteve French 
9838c8a9a5SSteve French 	rcu_read_unlock();
9938c8a9a5SSteve French }
10038c8a9a5SSteve French 
10138c8a9a5SSteve French /*
10238c8a9a5SSteve French  * Failure of write to server.
10338c8a9a5SSteve French  */
10438c8a9a5SSteve French void cifs_pages_write_failed(struct inode *inode, loff_t start, unsigned int len)
10538c8a9a5SSteve French {
10638c8a9a5SSteve French 	struct address_space *mapping = inode->i_mapping;
10738c8a9a5SSteve French 	struct folio *folio;
10838c8a9a5SSteve French 	pgoff_t end;
10938c8a9a5SSteve French 
11038c8a9a5SSteve French 	XA_STATE(xas, &mapping->i_pages, start / PAGE_SIZE);
11138c8a9a5SSteve French 
11238c8a9a5SSteve French 	if (!len)
11338c8a9a5SSteve French 		return;
11438c8a9a5SSteve French 
11538c8a9a5SSteve French 	rcu_read_lock();
11638c8a9a5SSteve French 
11738c8a9a5SSteve French 	end = (start + len - 1) / PAGE_SIZE;
11838c8a9a5SSteve French 	xas_for_each(&xas, folio, end) {
11938c8a9a5SSteve French 		if (xas_retry(&xas, folio))
12038c8a9a5SSteve French 			continue;
12138c8a9a5SSteve French 		if (!folio_test_writeback(folio)) {
12238c8a9a5SSteve French 			WARN_ONCE(1, "bad %x @%llx page %lx %lx\n",
12338c8a9a5SSteve French 				  len, start, folio_index(folio), end);
12438c8a9a5SSteve French 			continue;
12538c8a9a5SSteve French 		}
12638c8a9a5SSteve French 
12738c8a9a5SSteve French 		folio_set_error(folio);
12838c8a9a5SSteve French 		folio_end_writeback(folio);
12938c8a9a5SSteve French 	}
13038c8a9a5SSteve French 
13138c8a9a5SSteve French 	rcu_read_unlock();
13238c8a9a5SSteve French }
13338c8a9a5SSteve French 
13438c8a9a5SSteve French /*
13538c8a9a5SSteve French  * Redirty pages after a temporary failure.
13638c8a9a5SSteve French  */
13738c8a9a5SSteve French void cifs_pages_write_redirty(struct inode *inode, loff_t start, unsigned int len)
13838c8a9a5SSteve French {
13938c8a9a5SSteve French 	struct address_space *mapping = inode->i_mapping;
14038c8a9a5SSteve French 	struct folio *folio;
14138c8a9a5SSteve French 	pgoff_t end;
14238c8a9a5SSteve French 
14338c8a9a5SSteve French 	XA_STATE(xas, &mapping->i_pages, start / PAGE_SIZE);
14438c8a9a5SSteve French 
14538c8a9a5SSteve French 	if (!len)
14638c8a9a5SSteve French 		return;
14738c8a9a5SSteve French 
14838c8a9a5SSteve French 	rcu_read_lock();
14938c8a9a5SSteve French 
15038c8a9a5SSteve French 	end = (start + len - 1) / PAGE_SIZE;
15138c8a9a5SSteve French 	xas_for_each(&xas, folio, end) {
15238c8a9a5SSteve French 		if (!folio_test_writeback(folio)) {
15338c8a9a5SSteve French 			WARN_ONCE(1, "bad %x @%llx page %lx %lx\n",
15438c8a9a5SSteve French 				  len, start, folio_index(folio), end);
15538c8a9a5SSteve French 			continue;
15638c8a9a5SSteve French 		}
15738c8a9a5SSteve French 
15838c8a9a5SSteve French 		filemap_dirty_folio(folio->mapping, folio);
15938c8a9a5SSteve French 		folio_end_writeback(folio);
16038c8a9a5SSteve French 	}
16138c8a9a5SSteve French 
16238c8a9a5SSteve French 	rcu_read_unlock();
16338c8a9a5SSteve French }
16438c8a9a5SSteve French 
16538c8a9a5SSteve French /*
16638c8a9a5SSteve French  * Mark as invalid, all open files on tree connections since they
16738c8a9a5SSteve French  * were closed when session to server was lost.
16838c8a9a5SSteve French  */
16938c8a9a5SSteve French void
17038c8a9a5SSteve French cifs_mark_open_files_invalid(struct cifs_tcon *tcon)
17138c8a9a5SSteve French {
17238c8a9a5SSteve French 	struct cifsFileInfo *open_file = NULL;
17338c8a9a5SSteve French 	struct list_head *tmp;
17438c8a9a5SSteve French 	struct list_head *tmp1;
17538c8a9a5SSteve French 
17638c8a9a5SSteve French 	/* only send once per connect */
17738c8a9a5SSteve French 	spin_lock(&tcon->tc_lock);
178*cd743cfeSShyam Prasad N 	if (tcon->need_reconnect)
179*cd743cfeSShyam Prasad N 		tcon->status = TID_NEED_RECON;
180*cd743cfeSShyam Prasad N 
18138c8a9a5SSteve French 	if (tcon->status != TID_NEED_RECON) {
18238c8a9a5SSteve French 		spin_unlock(&tcon->tc_lock);
18338c8a9a5SSteve French 		return;
18438c8a9a5SSteve French 	}
18538c8a9a5SSteve French 	tcon->status = TID_IN_FILES_INVALIDATE;
18638c8a9a5SSteve French 	spin_unlock(&tcon->tc_lock);
18738c8a9a5SSteve French 
18838c8a9a5SSteve French 	/* list all files open on tree connection and mark them invalid */
18938c8a9a5SSteve French 	spin_lock(&tcon->open_file_lock);
19038c8a9a5SSteve French 	list_for_each_safe(tmp, tmp1, &tcon->openFileList) {
19138c8a9a5SSteve French 		open_file = list_entry(tmp, struct cifsFileInfo, tlist);
19238c8a9a5SSteve French 		open_file->invalidHandle = true;
19338c8a9a5SSteve French 		open_file->oplock_break_cancelled = true;
19438c8a9a5SSteve French 	}
19538c8a9a5SSteve French 	spin_unlock(&tcon->open_file_lock);
19638c8a9a5SSteve French 
19738c8a9a5SSteve French 	invalidate_all_cached_dirs(tcon);
19838c8a9a5SSteve French 	spin_lock(&tcon->tc_lock);
19938c8a9a5SSteve French 	if (tcon->status == TID_IN_FILES_INVALIDATE)
20038c8a9a5SSteve French 		tcon->status = TID_NEED_TCON;
20138c8a9a5SSteve French 	spin_unlock(&tcon->tc_lock);
20238c8a9a5SSteve French 
20338c8a9a5SSteve French 	/*
20438c8a9a5SSteve French 	 * BB Add call to invalidate_inodes(sb) for all superblocks mounted
20538c8a9a5SSteve French 	 * to this tcon.
20638c8a9a5SSteve French 	 */
20738c8a9a5SSteve French }
20838c8a9a5SSteve French 
20938c8a9a5SSteve French static inline int cifs_convert_flags(unsigned int flags)
21038c8a9a5SSteve French {
21138c8a9a5SSteve French 	if ((flags & O_ACCMODE) == O_RDONLY)
21238c8a9a5SSteve French 		return GENERIC_READ;
21338c8a9a5SSteve French 	else if ((flags & O_ACCMODE) == O_WRONLY)
21438c8a9a5SSteve French 		return GENERIC_WRITE;
21538c8a9a5SSteve French 	else if ((flags & O_ACCMODE) == O_RDWR) {
21638c8a9a5SSteve French 		/* GENERIC_ALL is too much permission to request
21738c8a9a5SSteve French 		   can cause unnecessary access denied on create */
21838c8a9a5SSteve French 		/* return GENERIC_ALL; */
21938c8a9a5SSteve French 		return (GENERIC_READ | GENERIC_WRITE);
22038c8a9a5SSteve French 	}
22138c8a9a5SSteve French 
22238c8a9a5SSteve French 	return (READ_CONTROL | FILE_WRITE_ATTRIBUTES | FILE_READ_ATTRIBUTES |
22338c8a9a5SSteve French 		FILE_WRITE_EA | FILE_APPEND_DATA | FILE_WRITE_DATA |
22438c8a9a5SSteve French 		FILE_READ_DATA);
22538c8a9a5SSteve French }
22638c8a9a5SSteve French 
22738c8a9a5SSteve French #ifdef CONFIG_CIFS_ALLOW_INSECURE_LEGACY
22838c8a9a5SSteve French static u32 cifs_posix_convert_flags(unsigned int flags)
22938c8a9a5SSteve French {
23038c8a9a5SSteve French 	u32 posix_flags = 0;
23138c8a9a5SSteve French 
23238c8a9a5SSteve French 	if ((flags & O_ACCMODE) == O_RDONLY)
23338c8a9a5SSteve French 		posix_flags = SMB_O_RDONLY;
23438c8a9a5SSteve French 	else if ((flags & O_ACCMODE) == O_WRONLY)
23538c8a9a5SSteve French 		posix_flags = SMB_O_WRONLY;
23638c8a9a5SSteve French 	else if ((flags & O_ACCMODE) == O_RDWR)
23738c8a9a5SSteve French 		posix_flags = SMB_O_RDWR;
23838c8a9a5SSteve French 
23938c8a9a5SSteve French 	if (flags & O_CREAT) {
24038c8a9a5SSteve French 		posix_flags |= SMB_O_CREAT;
24138c8a9a5SSteve French 		if (flags & O_EXCL)
24238c8a9a5SSteve French 			posix_flags |= SMB_O_EXCL;
24338c8a9a5SSteve French 	} else if (flags & O_EXCL)
24438c8a9a5SSteve French 		cifs_dbg(FYI, "Application %s pid %d has incorrectly set O_EXCL flag but not O_CREAT on file open. Ignoring O_EXCL\n",
24538c8a9a5SSteve French 			 current->comm, current->tgid);
24638c8a9a5SSteve French 
24738c8a9a5SSteve French 	if (flags & O_TRUNC)
24838c8a9a5SSteve French 		posix_flags |= SMB_O_TRUNC;
24938c8a9a5SSteve French 	/* be safe and imply O_SYNC for O_DSYNC */
25038c8a9a5SSteve French 	if (flags & O_DSYNC)
25138c8a9a5SSteve French 		posix_flags |= SMB_O_SYNC;
25238c8a9a5SSteve French 	if (flags & O_DIRECTORY)
25338c8a9a5SSteve French 		posix_flags |= SMB_O_DIRECTORY;
25438c8a9a5SSteve French 	if (flags & O_NOFOLLOW)
25538c8a9a5SSteve French 		posix_flags |= SMB_O_NOFOLLOW;
25638c8a9a5SSteve French 	if (flags & O_DIRECT)
25738c8a9a5SSteve French 		posix_flags |= SMB_O_DIRECT;
25838c8a9a5SSteve French 
25938c8a9a5SSteve French 	return posix_flags;
26038c8a9a5SSteve French }
26138c8a9a5SSteve French #endif /* CONFIG_CIFS_ALLOW_INSECURE_LEGACY */
26238c8a9a5SSteve French 
26338c8a9a5SSteve French static inline int cifs_get_disposition(unsigned int flags)
26438c8a9a5SSteve French {
26538c8a9a5SSteve French 	if ((flags & (O_CREAT | O_EXCL)) == (O_CREAT | O_EXCL))
26638c8a9a5SSteve French 		return FILE_CREATE;
26738c8a9a5SSteve French 	else if ((flags & (O_CREAT | O_TRUNC)) == (O_CREAT | O_TRUNC))
26838c8a9a5SSteve French 		return FILE_OVERWRITE_IF;
26938c8a9a5SSteve French 	else if ((flags & O_CREAT) == O_CREAT)
27038c8a9a5SSteve French 		return FILE_OPEN_IF;
27138c8a9a5SSteve French 	else if ((flags & O_TRUNC) == O_TRUNC)
27238c8a9a5SSteve French 		return FILE_OVERWRITE;
27338c8a9a5SSteve French 	else
27438c8a9a5SSteve French 		return FILE_OPEN;
27538c8a9a5SSteve French }
27638c8a9a5SSteve French 
27738c8a9a5SSteve French #ifdef CONFIG_CIFS_ALLOW_INSECURE_LEGACY
27838c8a9a5SSteve French int cifs_posix_open(const char *full_path, struct inode **pinode,
27938c8a9a5SSteve French 			struct super_block *sb, int mode, unsigned int f_flags,
28038c8a9a5SSteve French 			__u32 *poplock, __u16 *pnetfid, unsigned int xid)
28138c8a9a5SSteve French {
28238c8a9a5SSteve French 	int rc;
28338c8a9a5SSteve French 	FILE_UNIX_BASIC_INFO *presp_data;
28438c8a9a5SSteve French 	__u32 posix_flags = 0;
28538c8a9a5SSteve French 	struct cifs_sb_info *cifs_sb = CIFS_SB(sb);
28638c8a9a5SSteve French 	struct cifs_fattr fattr;
28738c8a9a5SSteve French 	struct tcon_link *tlink;
28838c8a9a5SSteve French 	struct cifs_tcon *tcon;
28938c8a9a5SSteve French 
29038c8a9a5SSteve French 	cifs_dbg(FYI, "posix open %s\n", full_path);
29138c8a9a5SSteve French 
29238c8a9a5SSteve French 	presp_data = kzalloc(sizeof(FILE_UNIX_BASIC_INFO), GFP_KERNEL);
29338c8a9a5SSteve French 	if (presp_data == NULL)
29438c8a9a5SSteve French 		return -ENOMEM;
29538c8a9a5SSteve French 
29638c8a9a5SSteve French 	tlink = cifs_sb_tlink(cifs_sb);
29738c8a9a5SSteve French 	if (IS_ERR(tlink)) {
29838c8a9a5SSteve French 		rc = PTR_ERR(tlink);
29938c8a9a5SSteve French 		goto posix_open_ret;
30038c8a9a5SSteve French 	}
30138c8a9a5SSteve French 
30238c8a9a5SSteve French 	tcon = tlink_tcon(tlink);
30338c8a9a5SSteve French 	mode &= ~current_umask();
30438c8a9a5SSteve French 
30538c8a9a5SSteve French 	posix_flags = cifs_posix_convert_flags(f_flags);
30638c8a9a5SSteve French 	rc = CIFSPOSIXCreate(xid, tcon, posix_flags, mode, pnetfid, presp_data,
30738c8a9a5SSteve French 			     poplock, full_path, cifs_sb->local_nls,
30838c8a9a5SSteve French 			     cifs_remap(cifs_sb));
30938c8a9a5SSteve French 	cifs_put_tlink(tlink);
31038c8a9a5SSteve French 
31138c8a9a5SSteve French 	if (rc)
31238c8a9a5SSteve French 		goto posix_open_ret;
31338c8a9a5SSteve French 
31438c8a9a5SSteve French 	if (presp_data->Type == cpu_to_le32(-1))
31538c8a9a5SSteve French 		goto posix_open_ret; /* open ok, caller does qpathinfo */
31638c8a9a5SSteve French 
31738c8a9a5SSteve French 	if (!pinode)
31838c8a9a5SSteve French 		goto posix_open_ret; /* caller does not need info */
31938c8a9a5SSteve French 
32038c8a9a5SSteve French 	cifs_unix_basic_to_fattr(&fattr, presp_data, cifs_sb);
32138c8a9a5SSteve French 
32238c8a9a5SSteve French 	/* get new inode and set it up */
32338c8a9a5SSteve French 	if (*pinode == NULL) {
32438c8a9a5SSteve French 		cifs_fill_uniqueid(sb, &fattr);
32538c8a9a5SSteve French 		*pinode = cifs_iget(sb, &fattr);
32638c8a9a5SSteve French 		if (!*pinode) {
32738c8a9a5SSteve French 			rc = -ENOMEM;
32838c8a9a5SSteve French 			goto posix_open_ret;
32938c8a9a5SSteve French 		}
33038c8a9a5SSteve French 	} else {
33138c8a9a5SSteve French 		cifs_revalidate_mapping(*pinode);
33238c8a9a5SSteve French 		rc = cifs_fattr_to_inode(*pinode, &fattr);
33338c8a9a5SSteve French 	}
33438c8a9a5SSteve French 
33538c8a9a5SSteve French posix_open_ret:
33638c8a9a5SSteve French 	kfree(presp_data);
33738c8a9a5SSteve French 	return rc;
33838c8a9a5SSteve French }
33938c8a9a5SSteve French #endif /* CONFIG_CIFS_ALLOW_INSECURE_LEGACY */
34038c8a9a5SSteve French 
34138c8a9a5SSteve French static int cifs_nt_open(const char *full_path, struct inode *inode, struct cifs_sb_info *cifs_sb,
34238c8a9a5SSteve French 			struct cifs_tcon *tcon, unsigned int f_flags, __u32 *oplock,
34338c8a9a5SSteve French 			struct cifs_fid *fid, unsigned int xid, struct cifs_open_info_data *buf)
34438c8a9a5SSteve French {
34538c8a9a5SSteve French 	int rc;
34638c8a9a5SSteve French 	int desired_access;
34738c8a9a5SSteve French 	int disposition;
34838c8a9a5SSteve French 	int create_options = CREATE_NOT_DIR;
34938c8a9a5SSteve French 	struct TCP_Server_Info *server = tcon->ses->server;
35038c8a9a5SSteve French 	struct cifs_open_parms oparms;
35138c8a9a5SSteve French 
35238c8a9a5SSteve French 	if (!server->ops->open)
35338c8a9a5SSteve French 		return -ENOSYS;
35438c8a9a5SSteve French 
35538c8a9a5SSteve French 	desired_access = cifs_convert_flags(f_flags);
35638c8a9a5SSteve French 
35738c8a9a5SSteve French /*********************************************************************
35838c8a9a5SSteve French  *  open flag mapping table:
35938c8a9a5SSteve French  *
36038c8a9a5SSteve French  *	POSIX Flag            CIFS Disposition
36138c8a9a5SSteve French  *	----------            ----------------
36238c8a9a5SSteve French  *	O_CREAT               FILE_OPEN_IF
36338c8a9a5SSteve French  *	O_CREAT | O_EXCL      FILE_CREATE
36438c8a9a5SSteve French  *	O_CREAT | O_TRUNC     FILE_OVERWRITE_IF
36538c8a9a5SSteve French  *	O_TRUNC               FILE_OVERWRITE
36638c8a9a5SSteve French  *	none of the above     FILE_OPEN
36738c8a9a5SSteve French  *
36838c8a9a5SSteve French  *	Note that there is not a direct match between disposition
36938c8a9a5SSteve French  *	FILE_SUPERSEDE (ie create whether or not file exists although
37038c8a9a5SSteve French  *	O_CREAT | O_TRUNC is similar but truncates the existing
37138c8a9a5SSteve French  *	file rather than creating a new file as FILE_SUPERSEDE does
37238c8a9a5SSteve French  *	(which uses the attributes / metadata passed in on open call)
37338c8a9a5SSteve French  *?
37438c8a9a5SSteve French  *?  O_SYNC is a reasonable match to CIFS writethrough flag
37538c8a9a5SSteve French  *?  and the read write flags match reasonably.  O_LARGEFILE
37638c8a9a5SSteve French  *?  is irrelevant because largefile support is always used
37738c8a9a5SSteve French  *?  by this client. Flags O_APPEND, O_DIRECT, O_DIRECTORY,
37838c8a9a5SSteve French  *	 O_FASYNC, O_NOFOLLOW, O_NONBLOCK need further investigation
37938c8a9a5SSteve French  *********************************************************************/
38038c8a9a5SSteve French 
38138c8a9a5SSteve French 	disposition = cifs_get_disposition(f_flags);
38238c8a9a5SSteve French 
38338c8a9a5SSteve French 	/* BB pass O_SYNC flag through on file attributes .. BB */
38438c8a9a5SSteve French 
38538c8a9a5SSteve French 	/* O_SYNC also has bit for O_DSYNC so following check picks up either */
38638c8a9a5SSteve French 	if (f_flags & O_SYNC)
38738c8a9a5SSteve French 		create_options |= CREATE_WRITE_THROUGH;
38838c8a9a5SSteve French 
38938c8a9a5SSteve French 	if (f_flags & O_DIRECT)
39038c8a9a5SSteve French 		create_options |= CREATE_NO_BUFFER;
39138c8a9a5SSteve French 
39238c8a9a5SSteve French 	oparms = (struct cifs_open_parms) {
39338c8a9a5SSteve French 		.tcon = tcon,
39438c8a9a5SSteve French 		.cifs_sb = cifs_sb,
39538c8a9a5SSteve French 		.desired_access = desired_access,
39638c8a9a5SSteve French 		.create_options = cifs_create_options(cifs_sb, create_options),
39738c8a9a5SSteve French 		.disposition = disposition,
39838c8a9a5SSteve French 		.path = full_path,
39938c8a9a5SSteve French 		.fid = fid,
40038c8a9a5SSteve French 	};
40138c8a9a5SSteve French 
40238c8a9a5SSteve French 	rc = server->ops->open(xid, &oparms, oplock, buf);
40338c8a9a5SSteve French 	if (rc)
40438c8a9a5SSteve French 		return rc;
40538c8a9a5SSteve French 
40638c8a9a5SSteve French 	/* TODO: Add support for calling posix query info but with passing in fid */
40738c8a9a5SSteve French 	if (tcon->unix_ext)
40838c8a9a5SSteve French 		rc = cifs_get_inode_info_unix(&inode, full_path, inode->i_sb,
40938c8a9a5SSteve French 					      xid);
41038c8a9a5SSteve French 	else
41138c8a9a5SSteve French 		rc = cifs_get_inode_info(&inode, full_path, buf, inode->i_sb,
41238c8a9a5SSteve French 					 xid, fid);
41338c8a9a5SSteve French 
41438c8a9a5SSteve French 	if (rc) {
41538c8a9a5SSteve French 		server->ops->close(xid, tcon, fid);
41638c8a9a5SSteve French 		if (rc == -ESTALE)
41738c8a9a5SSteve French 			rc = -EOPENSTALE;
41838c8a9a5SSteve French 	}
41938c8a9a5SSteve French 
42038c8a9a5SSteve French 	return rc;
42138c8a9a5SSteve French }
42238c8a9a5SSteve French 
42338c8a9a5SSteve French static bool
42438c8a9a5SSteve French cifs_has_mand_locks(struct cifsInodeInfo *cinode)
42538c8a9a5SSteve French {
42638c8a9a5SSteve French 	struct cifs_fid_locks *cur;
42738c8a9a5SSteve French 	bool has_locks = false;
42838c8a9a5SSteve French 
42938c8a9a5SSteve French 	down_read(&cinode->lock_sem);
43038c8a9a5SSteve French 	list_for_each_entry(cur, &cinode->llist, llist) {
43138c8a9a5SSteve French 		if (!list_empty(&cur->locks)) {
43238c8a9a5SSteve French 			has_locks = true;
43338c8a9a5SSteve French 			break;
43438c8a9a5SSteve French 		}
43538c8a9a5SSteve French 	}
43638c8a9a5SSteve French 	up_read(&cinode->lock_sem);
43738c8a9a5SSteve French 	return has_locks;
43838c8a9a5SSteve French }
43938c8a9a5SSteve French 
/*
 * Take @sem for writing by polling: keep retrying down_write_trylock(),
 * sleeping 10 ms between attempts, until it succeeds.
 */
void cifs_down_write(struct rw_semaphore *sem)
{
	for (;;) {
		if (down_write_trylock(sem))
			return;
		msleep(10);
	}
}
44638c8a9a5SSteve French 
44738c8a9a5SSteve French static void cifsFileInfo_put_work(struct work_struct *work);
44838c8a9a5SSteve French 
44938c8a9a5SSteve French struct cifsFileInfo *cifs_new_fileinfo(struct cifs_fid *fid, struct file *file,
45038c8a9a5SSteve French 				       struct tcon_link *tlink, __u32 oplock,
45138c8a9a5SSteve French 				       const char *symlink_target)
45238c8a9a5SSteve French {
45338c8a9a5SSteve French 	struct dentry *dentry = file_dentry(file);
45438c8a9a5SSteve French 	struct inode *inode = d_inode(dentry);
45538c8a9a5SSteve French 	struct cifsInodeInfo *cinode = CIFS_I(inode);
45638c8a9a5SSteve French 	struct cifsFileInfo *cfile;
45738c8a9a5SSteve French 	struct cifs_fid_locks *fdlocks;
45838c8a9a5SSteve French 	struct cifs_tcon *tcon = tlink_tcon(tlink);
45938c8a9a5SSteve French 	struct TCP_Server_Info *server = tcon->ses->server;
46038c8a9a5SSteve French 
46138c8a9a5SSteve French 	cfile = kzalloc(sizeof(struct cifsFileInfo), GFP_KERNEL);
46238c8a9a5SSteve French 	if (cfile == NULL)
46338c8a9a5SSteve French 		return cfile;
46438c8a9a5SSteve French 
46538c8a9a5SSteve French 	fdlocks = kzalloc(sizeof(struct cifs_fid_locks), GFP_KERNEL);
46638c8a9a5SSteve French 	if (!fdlocks) {
46738c8a9a5SSteve French 		kfree(cfile);
46838c8a9a5SSteve French 		return NULL;
46938c8a9a5SSteve French 	}
47038c8a9a5SSteve French 
47138c8a9a5SSteve French 	if (symlink_target) {
47238c8a9a5SSteve French 		cfile->symlink_target = kstrdup(symlink_target, GFP_KERNEL);
47338c8a9a5SSteve French 		if (!cfile->symlink_target) {
47438c8a9a5SSteve French 			kfree(fdlocks);
47538c8a9a5SSteve French 			kfree(cfile);
47638c8a9a5SSteve French 			return NULL;
47738c8a9a5SSteve French 		}
47838c8a9a5SSteve French 	}
47938c8a9a5SSteve French 
48038c8a9a5SSteve French 	INIT_LIST_HEAD(&fdlocks->locks);
48138c8a9a5SSteve French 	fdlocks->cfile = cfile;
48238c8a9a5SSteve French 	cfile->llist = fdlocks;
48338c8a9a5SSteve French 
48438c8a9a5SSteve French 	cfile->count = 1;
48538c8a9a5SSteve French 	cfile->pid = current->tgid;
48638c8a9a5SSteve French 	cfile->uid = current_fsuid();
48738c8a9a5SSteve French 	cfile->dentry = dget(dentry);
48838c8a9a5SSteve French 	cfile->f_flags = file->f_flags;
48938c8a9a5SSteve French 	cfile->invalidHandle = false;
49038c8a9a5SSteve French 	cfile->deferred_close_scheduled = false;
49138c8a9a5SSteve French 	cfile->tlink = cifs_get_tlink(tlink);
49238c8a9a5SSteve French 	INIT_WORK(&cfile->oplock_break, cifs_oplock_break);
49338c8a9a5SSteve French 	INIT_WORK(&cfile->put, cifsFileInfo_put_work);
49438c8a9a5SSteve French 	INIT_DELAYED_WORK(&cfile->deferred, smb2_deferred_work_close);
49538c8a9a5SSteve French 	mutex_init(&cfile->fh_mutex);
49638c8a9a5SSteve French 	spin_lock_init(&cfile->file_info_lock);
49738c8a9a5SSteve French 
49838c8a9a5SSteve French 	cifs_sb_active(inode->i_sb);
49938c8a9a5SSteve French 
50038c8a9a5SSteve French 	/*
50138c8a9a5SSteve French 	 * If the server returned a read oplock and we have mandatory brlocks,
50238c8a9a5SSteve French 	 * set oplock level to None.
50338c8a9a5SSteve French 	 */
50438c8a9a5SSteve French 	if (server->ops->is_read_op(oplock) && cifs_has_mand_locks(cinode)) {
50538c8a9a5SSteve French 		cifs_dbg(FYI, "Reset oplock val from read to None due to mand locks\n");
50638c8a9a5SSteve French 		oplock = 0;
50738c8a9a5SSteve French 	}
50838c8a9a5SSteve French 
50938c8a9a5SSteve French 	cifs_down_write(&cinode->lock_sem);
51038c8a9a5SSteve French 	list_add(&fdlocks->llist, &cinode->llist);
51138c8a9a5SSteve French 	up_write(&cinode->lock_sem);
51238c8a9a5SSteve French 
51338c8a9a5SSteve French 	spin_lock(&tcon->open_file_lock);
51438c8a9a5SSteve French 	if (fid->pending_open->oplock != CIFS_OPLOCK_NO_CHANGE && oplock)
51538c8a9a5SSteve French 		oplock = fid->pending_open->oplock;
51638c8a9a5SSteve French 	list_del(&fid->pending_open->olist);
51738c8a9a5SSteve French 
51838c8a9a5SSteve French 	fid->purge_cache = false;
51938c8a9a5SSteve French 	server->ops->set_fid(cfile, fid, oplock);
52038c8a9a5SSteve French 
52138c8a9a5SSteve French 	list_add(&cfile->tlist, &tcon->openFileList);
52238c8a9a5SSteve French 	atomic_inc(&tcon->num_local_opens);
52338c8a9a5SSteve French 
52438c8a9a5SSteve French 	/* if readable file instance put first in list*/
52538c8a9a5SSteve French 	spin_lock(&cinode->open_file_lock);
52638c8a9a5SSteve French 	if (file->f_mode & FMODE_READ)
52738c8a9a5SSteve French 		list_add(&cfile->flist, &cinode->openFileList);
52838c8a9a5SSteve French 	else
52938c8a9a5SSteve French 		list_add_tail(&cfile->flist, &cinode->openFileList);
53038c8a9a5SSteve French 	spin_unlock(&cinode->open_file_lock);
53138c8a9a5SSteve French 	spin_unlock(&tcon->open_file_lock);
53238c8a9a5SSteve French 
53338c8a9a5SSteve French 	if (fid->purge_cache)
53438c8a9a5SSteve French 		cifs_zap_mapping(inode);
53538c8a9a5SSteve French 
53638c8a9a5SSteve French 	file->private_data = cfile;
53738c8a9a5SSteve French 	return cfile;
53838c8a9a5SSteve French }
53938c8a9a5SSteve French 
54038c8a9a5SSteve French struct cifsFileInfo *
54138c8a9a5SSteve French cifsFileInfo_get(struct cifsFileInfo *cifs_file)
54238c8a9a5SSteve French {
54338c8a9a5SSteve French 	spin_lock(&cifs_file->file_info_lock);
54438c8a9a5SSteve French 	cifsFileInfo_get_locked(cifs_file);
54538c8a9a5SSteve French 	spin_unlock(&cifs_file->file_info_lock);
54638c8a9a5SSteve French 	return cifs_file;
54738c8a9a5SSteve French }
54838c8a9a5SSteve French 
54938c8a9a5SSteve French static void cifsFileInfo_put_final(struct cifsFileInfo *cifs_file)
55038c8a9a5SSteve French {
55138c8a9a5SSteve French 	struct inode *inode = d_inode(cifs_file->dentry);
55238c8a9a5SSteve French 	struct cifsInodeInfo *cifsi = CIFS_I(inode);
55338c8a9a5SSteve French 	struct cifsLockInfo *li, *tmp;
55438c8a9a5SSteve French 	struct super_block *sb = inode->i_sb;
55538c8a9a5SSteve French 
55638c8a9a5SSteve French 	/*
55738c8a9a5SSteve French 	 * Delete any outstanding lock records. We'll lose them when the file
55838c8a9a5SSteve French 	 * is closed anyway.
55938c8a9a5SSteve French 	 */
56038c8a9a5SSteve French 	cifs_down_write(&cifsi->lock_sem);
56138c8a9a5SSteve French 	list_for_each_entry_safe(li, tmp, &cifs_file->llist->locks, llist) {
56238c8a9a5SSteve French 		list_del(&li->llist);
56338c8a9a5SSteve French 		cifs_del_lock_waiters(li);
56438c8a9a5SSteve French 		kfree(li);
56538c8a9a5SSteve French 	}
56638c8a9a5SSteve French 	list_del(&cifs_file->llist->llist);
56738c8a9a5SSteve French 	kfree(cifs_file->llist);
56838c8a9a5SSteve French 	up_write(&cifsi->lock_sem);
56938c8a9a5SSteve French 
57038c8a9a5SSteve French 	cifs_put_tlink(cifs_file->tlink);
57138c8a9a5SSteve French 	dput(cifs_file->dentry);
57238c8a9a5SSteve French 	cifs_sb_deactive(sb);
57338c8a9a5SSteve French 	kfree(cifs_file->symlink_target);
57438c8a9a5SSteve French 	kfree(cifs_file);
57538c8a9a5SSteve French }
57638c8a9a5SSteve French 
57738c8a9a5SSteve French static void cifsFileInfo_put_work(struct work_struct *work)
57838c8a9a5SSteve French {
57938c8a9a5SSteve French 	struct cifsFileInfo *cifs_file = container_of(work,
58038c8a9a5SSteve French 			struct cifsFileInfo, put);
58138c8a9a5SSteve French 
58238c8a9a5SSteve French 	cifsFileInfo_put_final(cifs_file);
58338c8a9a5SSteve French }
58438c8a9a5SSteve French 
/**
 * cifsFileInfo_put - release a reference of file priv data
 * @cifs_file:	cifs/smb3 specific info (eg refcounts) for an open file
 *
 * Convenience wrapper around _cifsFileInfo_put() that passes true for both
 * its wait_oplock_handler and offload arguments, i.e. it always potentially
 * waits for the oplock handler. See _cifsFileInfo_put() for the locking
 * rules and for what happens when the last reference is dropped.
 */
void cifsFileInfo_put(struct cifsFileInfo *cifs_file)
{
	_cifsFileInfo_put(cifs_file, true, true);
}
59638c8a9a5SSteve French 
59738c8a9a5SSteve French /**
59838c8a9a5SSteve French  * _cifsFileInfo_put - release a reference of file priv data
59938c8a9a5SSteve French  *
60038c8a9a5SSteve French  * This may involve closing the filehandle @cifs_file out on the
60138c8a9a5SSteve French  * server. Must be called without holding tcon->open_file_lock,
60238c8a9a5SSteve French  * cinode->open_file_lock and cifs_file->file_info_lock.
60338c8a9a5SSteve French  *
 * If @wait_oplock_handler is true and we are releasing the last
60538c8a9a5SSteve French  * reference, wait for any running oplock break handler of the file
60638c8a9a5SSteve French  * and cancel any pending one.
60738c8a9a5SSteve French  *
60838c8a9a5SSteve French  * @cifs_file:	cifs/smb3 specific info (eg refcounts) for an open file
60938c8a9a5SSteve French  * @wait_oplock_handler: must be false if called from oplock_break_handler
61038c8a9a5SSteve French  * @offload:	not offloaded on close and oplock breaks
61138c8a9a5SSteve French  *
61238c8a9a5SSteve French  */
61338c8a9a5SSteve French void _cifsFileInfo_put(struct cifsFileInfo *cifs_file,
61438c8a9a5SSteve French 		       bool wait_oplock_handler, bool offload)
61538c8a9a5SSteve French {
61638c8a9a5SSteve French 	struct inode *inode = d_inode(cifs_file->dentry);
61738c8a9a5SSteve French 	struct cifs_tcon *tcon = tlink_tcon(cifs_file->tlink);
61838c8a9a5SSteve French 	struct TCP_Server_Info *server = tcon->ses->server;
61938c8a9a5SSteve French 	struct cifsInodeInfo *cifsi = CIFS_I(inode);
62038c8a9a5SSteve French 	struct super_block *sb = inode->i_sb;
62138c8a9a5SSteve French 	struct cifs_sb_info *cifs_sb = CIFS_SB(sb);
62238c8a9a5SSteve French 	struct cifs_fid fid = {};
62338c8a9a5SSteve French 	struct cifs_pending_open open;
62438c8a9a5SSteve French 	bool oplock_break_cancelled;
62538c8a9a5SSteve French 
62638c8a9a5SSteve French 	spin_lock(&tcon->open_file_lock);
62738c8a9a5SSteve French 	spin_lock(&cifsi->open_file_lock);
62838c8a9a5SSteve French 	spin_lock(&cifs_file->file_info_lock);
62938c8a9a5SSteve French 	if (--cifs_file->count > 0) {
63038c8a9a5SSteve French 		spin_unlock(&cifs_file->file_info_lock);
63138c8a9a5SSteve French 		spin_unlock(&cifsi->open_file_lock);
63238c8a9a5SSteve French 		spin_unlock(&tcon->open_file_lock);
63338c8a9a5SSteve French 		return;
63438c8a9a5SSteve French 	}
63538c8a9a5SSteve French 	spin_unlock(&cifs_file->file_info_lock);
63638c8a9a5SSteve French 
63738c8a9a5SSteve French 	if (server->ops->get_lease_key)
63838c8a9a5SSteve French 		server->ops->get_lease_key(inode, &fid);
63938c8a9a5SSteve French 
64038c8a9a5SSteve French 	/* store open in pending opens to make sure we don't miss lease break */
64138c8a9a5SSteve French 	cifs_add_pending_open_locked(&fid, cifs_file->tlink, &open);
64238c8a9a5SSteve French 
64338c8a9a5SSteve French 	/* remove it from the lists */
64438c8a9a5SSteve French 	list_del(&cifs_file->flist);
64538c8a9a5SSteve French 	list_del(&cifs_file->tlist);
64638c8a9a5SSteve French 	atomic_dec(&tcon->num_local_opens);
64738c8a9a5SSteve French 
64838c8a9a5SSteve French 	if (list_empty(&cifsi->openFileList)) {
64938c8a9a5SSteve French 		cifs_dbg(FYI, "closing last open instance for inode %p\n",
65038c8a9a5SSteve French 			 d_inode(cifs_file->dentry));
65138c8a9a5SSteve French 		/*
65238c8a9a5SSteve French 		 * In strict cache mode we need invalidate mapping on the last
65338c8a9a5SSteve French 		 * close  because it may cause a error when we open this file
65438c8a9a5SSteve French 		 * again and get at least level II oplock.
65538c8a9a5SSteve French 		 */
65638c8a9a5SSteve French 		if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_STRICT_IO)
65738c8a9a5SSteve French 			set_bit(CIFS_INO_INVALID_MAPPING, &cifsi->flags);
65838c8a9a5SSteve French 		cifs_set_oplock_level(cifsi, 0);
65938c8a9a5SSteve French 	}
66038c8a9a5SSteve French 
66138c8a9a5SSteve French 	spin_unlock(&cifsi->open_file_lock);
66238c8a9a5SSteve French 	spin_unlock(&tcon->open_file_lock);
66338c8a9a5SSteve French 
66438c8a9a5SSteve French 	oplock_break_cancelled = wait_oplock_handler ?
66538c8a9a5SSteve French 		cancel_work_sync(&cifs_file->oplock_break) : false;
66638c8a9a5SSteve French 
66738c8a9a5SSteve French 	if (!tcon->need_reconnect && !cifs_file->invalidHandle) {
66838c8a9a5SSteve French 		struct TCP_Server_Info *server = tcon->ses->server;
66938c8a9a5SSteve French 		unsigned int xid;
67038c8a9a5SSteve French 
67138c8a9a5SSteve French 		xid = get_xid();
67238c8a9a5SSteve French 		if (server->ops->close_getattr)
67338c8a9a5SSteve French 			server->ops->close_getattr(xid, tcon, cifs_file);
67438c8a9a5SSteve French 		else if (server->ops->close)
67538c8a9a5SSteve French 			server->ops->close(xid, tcon, &cifs_file->fid);
67638c8a9a5SSteve French 		_free_xid(xid);
67738c8a9a5SSteve French 	}
67838c8a9a5SSteve French 
67938c8a9a5SSteve French 	if (oplock_break_cancelled)
68038c8a9a5SSteve French 		cifs_done_oplock_break(cifsi);
68138c8a9a5SSteve French 
68238c8a9a5SSteve French 	cifs_del_pending_open(&open);
68338c8a9a5SSteve French 
68438c8a9a5SSteve French 	if (offload)
68538c8a9a5SSteve French 		queue_work(fileinfo_put_wq, &cifs_file->put);
68638c8a9a5SSteve French 	else
68738c8a9a5SSteve French 		cifsFileInfo_put_final(cifs_file);
68838c8a9a5SSteve French }
68938c8a9a5SSteve French 
69038c8a9a5SSteve French int cifs_open(struct inode *inode, struct file *file)
69138c8a9a5SSteve French 
69238c8a9a5SSteve French {
69338c8a9a5SSteve French 	int rc = -EACCES;
69438c8a9a5SSteve French 	unsigned int xid;
69538c8a9a5SSteve French 	__u32 oplock;
69638c8a9a5SSteve French 	struct cifs_sb_info *cifs_sb;
69738c8a9a5SSteve French 	struct TCP_Server_Info *server;
69838c8a9a5SSteve French 	struct cifs_tcon *tcon;
69938c8a9a5SSteve French 	struct tcon_link *tlink;
70038c8a9a5SSteve French 	struct cifsFileInfo *cfile = NULL;
70138c8a9a5SSteve French 	void *page;
70238c8a9a5SSteve French 	const char *full_path;
70338c8a9a5SSteve French 	bool posix_open_ok = false;
70438c8a9a5SSteve French 	struct cifs_fid fid = {};
70538c8a9a5SSteve French 	struct cifs_pending_open open;
70638c8a9a5SSteve French 	struct cifs_open_info_data data = {};
70738c8a9a5SSteve French 
70838c8a9a5SSteve French 	xid = get_xid();
70938c8a9a5SSteve French 
71038c8a9a5SSteve French 	cifs_sb = CIFS_SB(inode->i_sb);
71138c8a9a5SSteve French 	if (unlikely(cifs_forced_shutdown(cifs_sb))) {
71238c8a9a5SSteve French 		free_xid(xid);
71338c8a9a5SSteve French 		return -EIO;
71438c8a9a5SSteve French 	}
71538c8a9a5SSteve French 
71638c8a9a5SSteve French 	tlink = cifs_sb_tlink(cifs_sb);
71738c8a9a5SSteve French 	if (IS_ERR(tlink)) {
71838c8a9a5SSteve French 		free_xid(xid);
71938c8a9a5SSteve French 		return PTR_ERR(tlink);
72038c8a9a5SSteve French 	}
72138c8a9a5SSteve French 	tcon = tlink_tcon(tlink);
72238c8a9a5SSteve French 	server = tcon->ses->server;
72338c8a9a5SSteve French 
72438c8a9a5SSteve French 	page = alloc_dentry_path();
72538c8a9a5SSteve French 	full_path = build_path_from_dentry(file_dentry(file), page);
72638c8a9a5SSteve French 	if (IS_ERR(full_path)) {
72738c8a9a5SSteve French 		rc = PTR_ERR(full_path);
72838c8a9a5SSteve French 		goto out;
72938c8a9a5SSteve French 	}
73038c8a9a5SSteve French 
73138c8a9a5SSteve French 	cifs_dbg(FYI, "inode = 0x%p file flags are 0x%x for %s\n",
73238c8a9a5SSteve French 		 inode, file->f_flags, full_path);
73338c8a9a5SSteve French 
73438c8a9a5SSteve French 	if (file->f_flags & O_DIRECT &&
73538c8a9a5SSteve French 	    cifs_sb->mnt_cifs_flags & CIFS_MOUNT_STRICT_IO) {
73638c8a9a5SSteve French 		if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NO_BRL)
73738c8a9a5SSteve French 			file->f_op = &cifs_file_direct_nobrl_ops;
73838c8a9a5SSteve French 		else
73938c8a9a5SSteve French 			file->f_op = &cifs_file_direct_ops;
74038c8a9a5SSteve French 	}
74138c8a9a5SSteve French 
74238c8a9a5SSteve French 	/* Get the cached handle as SMB2 close is deferred */
74338c8a9a5SSteve French 	rc = cifs_get_readable_path(tcon, full_path, &cfile);
74438c8a9a5SSteve French 	if (rc == 0) {
74538c8a9a5SSteve French 		if (file->f_flags == cfile->f_flags) {
74638c8a9a5SSteve French 			file->private_data = cfile;
74738c8a9a5SSteve French 			spin_lock(&CIFS_I(inode)->deferred_lock);
74838c8a9a5SSteve French 			cifs_del_deferred_close(cfile);
74938c8a9a5SSteve French 			spin_unlock(&CIFS_I(inode)->deferred_lock);
75038c8a9a5SSteve French 			goto use_cache;
75138c8a9a5SSteve French 		} else {
75238c8a9a5SSteve French 			_cifsFileInfo_put(cfile, true, false);
75338c8a9a5SSteve French 		}
75438c8a9a5SSteve French 	}
75538c8a9a5SSteve French 
75638c8a9a5SSteve French 	if (server->oplocks)
75738c8a9a5SSteve French 		oplock = REQ_OPLOCK;
75838c8a9a5SSteve French 	else
75938c8a9a5SSteve French 		oplock = 0;
76038c8a9a5SSteve French 
76138c8a9a5SSteve French #ifdef CONFIG_CIFS_ALLOW_INSECURE_LEGACY
76238c8a9a5SSteve French 	if (!tcon->broken_posix_open && tcon->unix_ext &&
76338c8a9a5SSteve French 	    cap_unix(tcon->ses) && (CIFS_UNIX_POSIX_PATH_OPS_CAP &
76438c8a9a5SSteve French 				le64_to_cpu(tcon->fsUnixInfo.Capability))) {
76538c8a9a5SSteve French 		/* can not refresh inode info since size could be stale */
76638c8a9a5SSteve French 		rc = cifs_posix_open(full_path, &inode, inode->i_sb,
76738c8a9a5SSteve French 				cifs_sb->ctx->file_mode /* ignored */,
76838c8a9a5SSteve French 				file->f_flags, &oplock, &fid.netfid, xid);
76938c8a9a5SSteve French 		if (rc == 0) {
77038c8a9a5SSteve French 			cifs_dbg(FYI, "posix open succeeded\n");
77138c8a9a5SSteve French 			posix_open_ok = true;
77238c8a9a5SSteve French 		} else if ((rc == -EINVAL) || (rc == -EOPNOTSUPP)) {
77338c8a9a5SSteve French 			if (tcon->ses->serverNOS)
77438c8a9a5SSteve French 				cifs_dbg(VFS, "server %s of type %s returned unexpected error on SMB posix open, disabling posix open support. Check if server update available.\n",
77538c8a9a5SSteve French 					 tcon->ses->ip_addr,
77638c8a9a5SSteve French 					 tcon->ses->serverNOS);
77738c8a9a5SSteve French 			tcon->broken_posix_open = true;
77838c8a9a5SSteve French 		} else if ((rc != -EIO) && (rc != -EREMOTE) &&
77938c8a9a5SSteve French 			 (rc != -EOPNOTSUPP)) /* path not found or net err */
78038c8a9a5SSteve French 			goto out;
78138c8a9a5SSteve French 		/*
78238c8a9a5SSteve French 		 * Else fallthrough to retry open the old way on network i/o
78338c8a9a5SSteve French 		 * or DFS errors.
78438c8a9a5SSteve French 		 */
78538c8a9a5SSteve French 	}
78638c8a9a5SSteve French #endif /* CONFIG_CIFS_ALLOW_INSECURE_LEGACY */
78738c8a9a5SSteve French 
78838c8a9a5SSteve French 	if (server->ops->get_lease_key)
78938c8a9a5SSteve French 		server->ops->get_lease_key(inode, &fid);
79038c8a9a5SSteve French 
79138c8a9a5SSteve French 	cifs_add_pending_open(&fid, tlink, &open);
79238c8a9a5SSteve French 
79338c8a9a5SSteve French 	if (!posix_open_ok) {
79438c8a9a5SSteve French 		if (server->ops->get_lease_key)
79538c8a9a5SSteve French 			server->ops->get_lease_key(inode, &fid);
79638c8a9a5SSteve French 
79738c8a9a5SSteve French 		rc = cifs_nt_open(full_path, inode, cifs_sb, tcon, file->f_flags, &oplock, &fid,
79838c8a9a5SSteve French 				  xid, &data);
79938c8a9a5SSteve French 		if (rc) {
80038c8a9a5SSteve French 			cifs_del_pending_open(&open);
80138c8a9a5SSteve French 			goto out;
80238c8a9a5SSteve French 		}
80338c8a9a5SSteve French 	}
80438c8a9a5SSteve French 
80538c8a9a5SSteve French 	cfile = cifs_new_fileinfo(&fid, file, tlink, oplock, data.symlink_target);
80638c8a9a5SSteve French 	if (cfile == NULL) {
80738c8a9a5SSteve French 		if (server->ops->close)
80838c8a9a5SSteve French 			server->ops->close(xid, tcon, &fid);
80938c8a9a5SSteve French 		cifs_del_pending_open(&open);
81038c8a9a5SSteve French 		rc = -ENOMEM;
81138c8a9a5SSteve French 		goto out;
81238c8a9a5SSteve French 	}
81338c8a9a5SSteve French 
81438c8a9a5SSteve French #ifdef CONFIG_CIFS_ALLOW_INSECURE_LEGACY
81538c8a9a5SSteve French 	if ((oplock & CIFS_CREATE_ACTION) && !posix_open_ok && tcon->unix_ext) {
81638c8a9a5SSteve French 		/*
81738c8a9a5SSteve French 		 * Time to set mode which we can not set earlier due to
81838c8a9a5SSteve French 		 * problems creating new read-only files.
81938c8a9a5SSteve French 		 */
82038c8a9a5SSteve French 		struct cifs_unix_set_info_args args = {
82138c8a9a5SSteve French 			.mode	= inode->i_mode,
82238c8a9a5SSteve French 			.uid	= INVALID_UID, /* no change */
82338c8a9a5SSteve French 			.gid	= INVALID_GID, /* no change */
82438c8a9a5SSteve French 			.ctime	= NO_CHANGE_64,
82538c8a9a5SSteve French 			.atime	= NO_CHANGE_64,
82638c8a9a5SSteve French 			.mtime	= NO_CHANGE_64,
82738c8a9a5SSteve French 			.device	= 0,
82838c8a9a5SSteve French 		};
82938c8a9a5SSteve French 		CIFSSMBUnixSetFileInfo(xid, tcon, &args, fid.netfid,
83038c8a9a5SSteve French 				       cfile->pid);
83138c8a9a5SSteve French 	}
83238c8a9a5SSteve French #endif /* CONFIG_CIFS_ALLOW_INSECURE_LEGACY */
83338c8a9a5SSteve French 
83438c8a9a5SSteve French use_cache:
83538c8a9a5SSteve French 	fscache_use_cookie(cifs_inode_cookie(file_inode(file)),
83638c8a9a5SSteve French 			   file->f_mode & FMODE_WRITE);
83738c8a9a5SSteve French 	if (file->f_flags & O_DIRECT &&
83838c8a9a5SSteve French 	    (!((file->f_flags & O_ACCMODE) != O_RDONLY) ||
83938c8a9a5SSteve French 	     file->f_flags & O_APPEND))
84038c8a9a5SSteve French 		cifs_invalidate_cache(file_inode(file),
84138c8a9a5SSteve French 				      FSCACHE_INVAL_DIO_WRITE);
84238c8a9a5SSteve French 
84338c8a9a5SSteve French out:
84438c8a9a5SSteve French 	free_dentry_path(page);
84538c8a9a5SSteve French 	free_xid(xid);
84638c8a9a5SSteve French 	cifs_put_tlink(tlink);
84738c8a9a5SSteve French 	cifs_free_open_info(&data);
84838c8a9a5SSteve French 	return rc;
84938c8a9a5SSteve French }
85038c8a9a5SSteve French 
85138c8a9a5SSteve French #ifdef CONFIG_CIFS_ALLOW_INSECURE_LEGACY
85238c8a9a5SSteve French static int cifs_push_posix_locks(struct cifsFileInfo *cfile);
85338c8a9a5SSteve French #endif /* CONFIG_CIFS_ALLOW_INSECURE_LEGACY */
85438c8a9a5SSteve French 
85538c8a9a5SSteve French /*
85638c8a9a5SSteve French  * Try to reacquire byte range locks that were released when session
85738c8a9a5SSteve French  * to server was lost.
85838c8a9a5SSteve French  */
85938c8a9a5SSteve French static int
86038c8a9a5SSteve French cifs_relock_file(struct cifsFileInfo *cfile)
86138c8a9a5SSteve French {
86238c8a9a5SSteve French 	struct cifsInodeInfo *cinode = CIFS_I(d_inode(cfile->dentry));
86338c8a9a5SSteve French 	struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
86438c8a9a5SSteve French 	int rc = 0;
86538c8a9a5SSteve French #ifdef CONFIG_CIFS_ALLOW_INSECURE_LEGACY
86638c8a9a5SSteve French 	struct cifs_sb_info *cifs_sb = CIFS_SB(cfile->dentry->d_sb);
86738c8a9a5SSteve French #endif /* CONFIG_CIFS_ALLOW_INSECURE_LEGACY */
86838c8a9a5SSteve French 
86938c8a9a5SSteve French 	down_read_nested(&cinode->lock_sem, SINGLE_DEPTH_NESTING);
87038c8a9a5SSteve French 	if (cinode->can_cache_brlcks) {
87138c8a9a5SSteve French 		/* can cache locks - no need to relock */
87238c8a9a5SSteve French 		up_read(&cinode->lock_sem);
87338c8a9a5SSteve French 		return rc;
87438c8a9a5SSteve French 	}
87538c8a9a5SSteve French 
87638c8a9a5SSteve French #ifdef CONFIG_CIFS_ALLOW_INSECURE_LEGACY
87738c8a9a5SSteve French 	if (cap_unix(tcon->ses) &&
87838c8a9a5SSteve French 	    (CIFS_UNIX_FCNTL_CAP & le64_to_cpu(tcon->fsUnixInfo.Capability)) &&
87938c8a9a5SSteve French 	    ((cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOPOSIXBRL) == 0))
88038c8a9a5SSteve French 		rc = cifs_push_posix_locks(cfile);
88138c8a9a5SSteve French 	else
88238c8a9a5SSteve French #endif /* CONFIG_CIFS_ALLOW_INSECURE_LEGACY */
88338c8a9a5SSteve French 		rc = tcon->ses->server->ops->push_mand_locks(cfile);
88438c8a9a5SSteve French 
88538c8a9a5SSteve French 	up_read(&cinode->lock_sem);
88638c8a9a5SSteve French 	return rc;
88738c8a9a5SSteve French }
88838c8a9a5SSteve French 
88938c8a9a5SSteve French static int
89038c8a9a5SSteve French cifs_reopen_file(struct cifsFileInfo *cfile, bool can_flush)
89138c8a9a5SSteve French {
89238c8a9a5SSteve French 	int rc = -EACCES;
89338c8a9a5SSteve French 	unsigned int xid;
89438c8a9a5SSteve French 	__u32 oplock;
89538c8a9a5SSteve French 	struct cifs_sb_info *cifs_sb;
89638c8a9a5SSteve French 	struct cifs_tcon *tcon;
89738c8a9a5SSteve French 	struct TCP_Server_Info *server;
89838c8a9a5SSteve French 	struct cifsInodeInfo *cinode;
89938c8a9a5SSteve French 	struct inode *inode;
90038c8a9a5SSteve French 	void *page;
90138c8a9a5SSteve French 	const char *full_path;
90238c8a9a5SSteve French 	int desired_access;
90338c8a9a5SSteve French 	int disposition = FILE_OPEN;
90438c8a9a5SSteve French 	int create_options = CREATE_NOT_DIR;
90538c8a9a5SSteve French 	struct cifs_open_parms oparms;
90638c8a9a5SSteve French 
90738c8a9a5SSteve French 	xid = get_xid();
90838c8a9a5SSteve French 	mutex_lock(&cfile->fh_mutex);
90938c8a9a5SSteve French 	if (!cfile->invalidHandle) {
91038c8a9a5SSteve French 		mutex_unlock(&cfile->fh_mutex);
91138c8a9a5SSteve French 		free_xid(xid);
91238c8a9a5SSteve French 		return 0;
91338c8a9a5SSteve French 	}
91438c8a9a5SSteve French 
91538c8a9a5SSteve French 	inode = d_inode(cfile->dentry);
91638c8a9a5SSteve French 	cifs_sb = CIFS_SB(inode->i_sb);
91738c8a9a5SSteve French 	tcon = tlink_tcon(cfile->tlink);
91838c8a9a5SSteve French 	server = tcon->ses->server;
91938c8a9a5SSteve French 
92038c8a9a5SSteve French 	/*
92138c8a9a5SSteve French 	 * Can not grab rename sem here because various ops, including those
92238c8a9a5SSteve French 	 * that already have the rename sem can end up causing writepage to get
92338c8a9a5SSteve French 	 * called and if the server was down that means we end up here, and we
92438c8a9a5SSteve French 	 * can never tell if the caller already has the rename_sem.
92538c8a9a5SSteve French 	 */
92638c8a9a5SSteve French 	page = alloc_dentry_path();
92738c8a9a5SSteve French 	full_path = build_path_from_dentry(cfile->dentry, page);
92838c8a9a5SSteve French 	if (IS_ERR(full_path)) {
92938c8a9a5SSteve French 		mutex_unlock(&cfile->fh_mutex);
93038c8a9a5SSteve French 		free_dentry_path(page);
93138c8a9a5SSteve French 		free_xid(xid);
93238c8a9a5SSteve French 		return PTR_ERR(full_path);
93338c8a9a5SSteve French 	}
93438c8a9a5SSteve French 
93538c8a9a5SSteve French 	cifs_dbg(FYI, "inode = 0x%p file flags 0x%x for %s\n",
93638c8a9a5SSteve French 		 inode, cfile->f_flags, full_path);
93738c8a9a5SSteve French 
93838c8a9a5SSteve French 	if (tcon->ses->server->oplocks)
93938c8a9a5SSteve French 		oplock = REQ_OPLOCK;
94038c8a9a5SSteve French 	else
94138c8a9a5SSteve French 		oplock = 0;
94238c8a9a5SSteve French 
94338c8a9a5SSteve French #ifdef CONFIG_CIFS_ALLOW_INSECURE_LEGACY
94438c8a9a5SSteve French 	if (tcon->unix_ext && cap_unix(tcon->ses) &&
94538c8a9a5SSteve French 	    (CIFS_UNIX_POSIX_PATH_OPS_CAP &
94638c8a9a5SSteve French 				le64_to_cpu(tcon->fsUnixInfo.Capability))) {
94738c8a9a5SSteve French 		/*
94838c8a9a5SSteve French 		 * O_CREAT, O_EXCL and O_TRUNC already had their effect on the
94938c8a9a5SSteve French 		 * original open. Must mask them off for a reopen.
95038c8a9a5SSteve French 		 */
95138c8a9a5SSteve French 		unsigned int oflags = cfile->f_flags &
95238c8a9a5SSteve French 						~(O_CREAT | O_EXCL | O_TRUNC);
95338c8a9a5SSteve French 
95438c8a9a5SSteve French 		rc = cifs_posix_open(full_path, NULL, inode->i_sb,
95538c8a9a5SSteve French 				     cifs_sb->ctx->file_mode /* ignored */,
95638c8a9a5SSteve French 				     oflags, &oplock, &cfile->fid.netfid, xid);
95738c8a9a5SSteve French 		if (rc == 0) {
95838c8a9a5SSteve French 			cifs_dbg(FYI, "posix reopen succeeded\n");
95938c8a9a5SSteve French 			oparms.reconnect = true;
96038c8a9a5SSteve French 			goto reopen_success;
96138c8a9a5SSteve French 		}
96238c8a9a5SSteve French 		/*
96338c8a9a5SSteve French 		 * fallthrough to retry open the old way on errors, especially
96438c8a9a5SSteve French 		 * in the reconnect path it is important to retry hard
96538c8a9a5SSteve French 		 */
96638c8a9a5SSteve French 	}
96738c8a9a5SSteve French #endif /* CONFIG_CIFS_ALLOW_INSECURE_LEGACY */
96838c8a9a5SSteve French 
96938c8a9a5SSteve French 	desired_access = cifs_convert_flags(cfile->f_flags);
97038c8a9a5SSteve French 
97138c8a9a5SSteve French 	/* O_SYNC also has bit for O_DSYNC so following check picks up either */
97238c8a9a5SSteve French 	if (cfile->f_flags & O_SYNC)
97338c8a9a5SSteve French 		create_options |= CREATE_WRITE_THROUGH;
97438c8a9a5SSteve French 
97538c8a9a5SSteve French 	if (cfile->f_flags & O_DIRECT)
97638c8a9a5SSteve French 		create_options |= CREATE_NO_BUFFER;
97738c8a9a5SSteve French 
97838c8a9a5SSteve French 	if (server->ops->get_lease_key)
97938c8a9a5SSteve French 		server->ops->get_lease_key(inode, &cfile->fid);
98038c8a9a5SSteve French 
98138c8a9a5SSteve French 	oparms = (struct cifs_open_parms) {
98238c8a9a5SSteve French 		.tcon = tcon,
98338c8a9a5SSteve French 		.cifs_sb = cifs_sb,
98438c8a9a5SSteve French 		.desired_access = desired_access,
98538c8a9a5SSteve French 		.create_options = cifs_create_options(cifs_sb, create_options),
98638c8a9a5SSteve French 		.disposition = disposition,
98738c8a9a5SSteve French 		.path = full_path,
98838c8a9a5SSteve French 		.fid = &cfile->fid,
98938c8a9a5SSteve French 		.reconnect = true,
99038c8a9a5SSteve French 	};
99138c8a9a5SSteve French 
99238c8a9a5SSteve French 	/*
99338c8a9a5SSteve French 	 * Can not refresh inode by passing in file_info buf to be returned by
99438c8a9a5SSteve French 	 * ops->open and then calling get_inode_info with returned buf since
99538c8a9a5SSteve French 	 * file might have write behind data that needs to be flushed and server
99638c8a9a5SSteve French 	 * version of file size can be stale. If we knew for sure that inode was
99738c8a9a5SSteve French 	 * not dirty locally we could do this.
99838c8a9a5SSteve French 	 */
99938c8a9a5SSteve French 	rc = server->ops->open(xid, &oparms, &oplock, NULL);
100038c8a9a5SSteve French 	if (rc == -ENOENT && oparms.reconnect == false) {
100138c8a9a5SSteve French 		/* durable handle timeout is expired - open the file again */
100238c8a9a5SSteve French 		rc = server->ops->open(xid, &oparms, &oplock, NULL);
100338c8a9a5SSteve French 		/* indicate that we need to relock the file */
100438c8a9a5SSteve French 		oparms.reconnect = true;
100538c8a9a5SSteve French 	}
100638c8a9a5SSteve French 
100738c8a9a5SSteve French 	if (rc) {
100838c8a9a5SSteve French 		mutex_unlock(&cfile->fh_mutex);
100938c8a9a5SSteve French 		cifs_dbg(FYI, "cifs_reopen returned 0x%x\n", rc);
101038c8a9a5SSteve French 		cifs_dbg(FYI, "oplock: %d\n", oplock);
101138c8a9a5SSteve French 		goto reopen_error_exit;
101238c8a9a5SSteve French 	}
101338c8a9a5SSteve French 
101438c8a9a5SSteve French #ifdef CONFIG_CIFS_ALLOW_INSECURE_LEGACY
101538c8a9a5SSteve French reopen_success:
101638c8a9a5SSteve French #endif /* CONFIG_CIFS_ALLOW_INSECURE_LEGACY */
101738c8a9a5SSteve French 	cfile->invalidHandle = false;
101838c8a9a5SSteve French 	mutex_unlock(&cfile->fh_mutex);
101938c8a9a5SSteve French 	cinode = CIFS_I(inode);
102038c8a9a5SSteve French 
102138c8a9a5SSteve French 	if (can_flush) {
102238c8a9a5SSteve French 		rc = filemap_write_and_wait(inode->i_mapping);
102338c8a9a5SSteve French 		if (!is_interrupt_error(rc))
102438c8a9a5SSteve French 			mapping_set_error(inode->i_mapping, rc);
102538c8a9a5SSteve French 
102638c8a9a5SSteve French 		if (tcon->posix_extensions)
102738c8a9a5SSteve French 			rc = smb311_posix_get_inode_info(&inode, full_path, inode->i_sb, xid);
102838c8a9a5SSteve French 		else if (tcon->unix_ext)
102938c8a9a5SSteve French 			rc = cifs_get_inode_info_unix(&inode, full_path,
103038c8a9a5SSteve French 						      inode->i_sb, xid);
103138c8a9a5SSteve French 		else
103238c8a9a5SSteve French 			rc = cifs_get_inode_info(&inode, full_path, NULL,
103338c8a9a5SSteve French 						 inode->i_sb, xid, NULL);
103438c8a9a5SSteve French 	}
103538c8a9a5SSteve French 	/*
103638c8a9a5SSteve French 	 * Else we are writing out data to server already and could deadlock if
103738c8a9a5SSteve French 	 * we tried to flush data, and since we do not know if we have data that
103838c8a9a5SSteve French 	 * would invalidate the current end of file on the server we can not go
103938c8a9a5SSteve French 	 * to the server to get the new inode info.
104038c8a9a5SSteve French 	 */
104138c8a9a5SSteve French 
104238c8a9a5SSteve French 	/*
104338c8a9a5SSteve French 	 * If the server returned a read oplock and we have mandatory brlocks,
104438c8a9a5SSteve French 	 * set oplock level to None.
104538c8a9a5SSteve French 	 */
104638c8a9a5SSteve French 	if (server->ops->is_read_op(oplock) && cifs_has_mand_locks(cinode)) {
104738c8a9a5SSteve French 		cifs_dbg(FYI, "Reset oplock val from read to None due to mand locks\n");
104838c8a9a5SSteve French 		oplock = 0;
104938c8a9a5SSteve French 	}
105038c8a9a5SSteve French 
105138c8a9a5SSteve French 	server->ops->set_fid(cfile, &cfile->fid, oplock);
105238c8a9a5SSteve French 	if (oparms.reconnect)
105338c8a9a5SSteve French 		cifs_relock_file(cfile);
105438c8a9a5SSteve French 
105538c8a9a5SSteve French reopen_error_exit:
105638c8a9a5SSteve French 	free_dentry_path(page);
105738c8a9a5SSteve French 	free_xid(xid);
105838c8a9a5SSteve French 	return rc;
105938c8a9a5SSteve French }
106038c8a9a5SSteve French 
106138c8a9a5SSteve French void smb2_deferred_work_close(struct work_struct *work)
106238c8a9a5SSteve French {
106338c8a9a5SSteve French 	struct cifsFileInfo *cfile = container_of(work,
106438c8a9a5SSteve French 			struct cifsFileInfo, deferred.work);
106538c8a9a5SSteve French 
106638c8a9a5SSteve French 	spin_lock(&CIFS_I(d_inode(cfile->dentry))->deferred_lock);
106738c8a9a5SSteve French 	cifs_del_deferred_close(cfile);
106838c8a9a5SSteve French 	cfile->deferred_close_scheduled = false;
106938c8a9a5SSteve French 	spin_unlock(&CIFS_I(d_inode(cfile->dentry))->deferred_lock);
107038c8a9a5SSteve French 	_cifsFileInfo_put(cfile, true, false);
107138c8a9a5SSteve French }
107238c8a9a5SSteve French 
107338c8a9a5SSteve French int cifs_close(struct inode *inode, struct file *file)
107438c8a9a5SSteve French {
107538c8a9a5SSteve French 	struct cifsFileInfo *cfile;
107638c8a9a5SSteve French 	struct cifsInodeInfo *cinode = CIFS_I(inode);
107738c8a9a5SSteve French 	struct cifs_sb_info *cifs_sb = CIFS_SB(inode->i_sb);
107838c8a9a5SSteve French 	struct cifs_deferred_close *dclose;
107938c8a9a5SSteve French 
108038c8a9a5SSteve French 	cifs_fscache_unuse_inode_cookie(inode, file->f_mode & FMODE_WRITE);
108138c8a9a5SSteve French 
108238c8a9a5SSteve French 	if (file->private_data != NULL) {
108338c8a9a5SSteve French 		cfile = file->private_data;
108438c8a9a5SSteve French 		file->private_data = NULL;
108538c8a9a5SSteve French 		dclose = kmalloc(sizeof(struct cifs_deferred_close), GFP_KERNEL);
1086df9d70c1SBharath SM 		if ((cifs_sb->ctx->closetimeo && cinode->oplock == CIFS_CACHE_RHW_FLG)
1087df9d70c1SBharath SM 		    && cinode->lease_granted &&
108838c8a9a5SSteve French 		    !test_bit(CIFS_INO_CLOSE_ON_LOCK, &cinode->flags) &&
108938c8a9a5SSteve French 		    dclose) {
109038c8a9a5SSteve French 			if (test_and_clear_bit(CIFS_INO_MODIFIED_ATTR, &cinode->flags)) {
109123171df5SJeff Layton 				inode_set_mtime_to_ts(inode,
109223171df5SJeff Layton 						      inode_set_ctime_current(inode));
109338c8a9a5SSteve French 			}
109438c8a9a5SSteve French 			spin_lock(&cinode->deferred_lock);
109538c8a9a5SSteve French 			cifs_add_deferred_close(cfile, dclose);
109638c8a9a5SSteve French 			if (cfile->deferred_close_scheduled &&
109738c8a9a5SSteve French 			    delayed_work_pending(&cfile->deferred)) {
109838c8a9a5SSteve French 				/*
109938c8a9a5SSteve French 				 * If there is no pending work, mod_delayed_work queues new work.
110038c8a9a5SSteve French 				 * So, Increase the ref count to avoid use-after-free.
110138c8a9a5SSteve French 				 */
110238c8a9a5SSteve French 				if (!mod_delayed_work(deferredclose_wq,
110338c8a9a5SSteve French 						&cfile->deferred, cifs_sb->ctx->closetimeo))
110438c8a9a5SSteve French 					cifsFileInfo_get(cfile);
110538c8a9a5SSteve French 			} else {
110638c8a9a5SSteve French 				/* Deferred close for files */
110738c8a9a5SSteve French 				queue_delayed_work(deferredclose_wq,
110838c8a9a5SSteve French 						&cfile->deferred, cifs_sb->ctx->closetimeo);
110938c8a9a5SSteve French 				cfile->deferred_close_scheduled = true;
111038c8a9a5SSteve French 				spin_unlock(&cinode->deferred_lock);
111138c8a9a5SSteve French 				return 0;
111238c8a9a5SSteve French 			}
111338c8a9a5SSteve French 			spin_unlock(&cinode->deferred_lock);
111438c8a9a5SSteve French 			_cifsFileInfo_put(cfile, true, false);
111538c8a9a5SSteve French 		} else {
111638c8a9a5SSteve French 			_cifsFileInfo_put(cfile, true, false);
111738c8a9a5SSteve French 			kfree(dclose);
111838c8a9a5SSteve French 		}
111938c8a9a5SSteve French 	}
112038c8a9a5SSteve French 
112138c8a9a5SSteve French 	/* return code from the ->release op is always ignored */
112238c8a9a5SSteve French 	return 0;
112338c8a9a5SSteve French }
112438c8a9a5SSteve French 
112538c8a9a5SSteve French void
112638c8a9a5SSteve French cifs_reopen_persistent_handles(struct cifs_tcon *tcon)
112738c8a9a5SSteve French {
112838c8a9a5SSteve French 	struct cifsFileInfo *open_file, *tmp;
112938c8a9a5SSteve French 	struct list_head tmp_list;
113038c8a9a5SSteve French 
113138c8a9a5SSteve French 	if (!tcon->use_persistent || !tcon->need_reopen_files)
113238c8a9a5SSteve French 		return;
113338c8a9a5SSteve French 
113438c8a9a5SSteve French 	tcon->need_reopen_files = false;
113538c8a9a5SSteve French 
113638c8a9a5SSteve French 	cifs_dbg(FYI, "Reopen persistent handles\n");
113738c8a9a5SSteve French 	INIT_LIST_HEAD(&tmp_list);
113838c8a9a5SSteve French 
113938c8a9a5SSteve French 	/* list all files open on tree connection, reopen resilient handles  */
114038c8a9a5SSteve French 	spin_lock(&tcon->open_file_lock);
114138c8a9a5SSteve French 	list_for_each_entry(open_file, &tcon->openFileList, tlist) {
114238c8a9a5SSteve French 		if (!open_file->invalidHandle)
114338c8a9a5SSteve French 			continue;
114438c8a9a5SSteve French 		cifsFileInfo_get(open_file);
114538c8a9a5SSteve French 		list_add_tail(&open_file->rlist, &tmp_list);
114638c8a9a5SSteve French 	}
114738c8a9a5SSteve French 	spin_unlock(&tcon->open_file_lock);
114838c8a9a5SSteve French 
114938c8a9a5SSteve French 	list_for_each_entry_safe(open_file, tmp, &tmp_list, rlist) {
115038c8a9a5SSteve French 		if (cifs_reopen_file(open_file, false /* do not flush */))
115138c8a9a5SSteve French 			tcon->need_reopen_files = true;
115238c8a9a5SSteve French 		list_del_init(&open_file->rlist);
115338c8a9a5SSteve French 		cifsFileInfo_put(open_file);
115438c8a9a5SSteve French 	}
115538c8a9a5SSteve French }
115638c8a9a5SSteve French 
115738c8a9a5SSteve French int cifs_closedir(struct inode *inode, struct file *file)
115838c8a9a5SSteve French {
115938c8a9a5SSteve French 	int rc = 0;
116038c8a9a5SSteve French 	unsigned int xid;
116138c8a9a5SSteve French 	struct cifsFileInfo *cfile = file->private_data;
116238c8a9a5SSteve French 	struct cifs_tcon *tcon;
116338c8a9a5SSteve French 	struct TCP_Server_Info *server;
116438c8a9a5SSteve French 	char *buf;
116538c8a9a5SSteve French 
116638c8a9a5SSteve French 	cifs_dbg(FYI, "Closedir inode = 0x%p\n", inode);
116738c8a9a5SSteve French 
116838c8a9a5SSteve French 	if (cfile == NULL)
116938c8a9a5SSteve French 		return rc;
117038c8a9a5SSteve French 
117138c8a9a5SSteve French 	xid = get_xid();
117238c8a9a5SSteve French 	tcon = tlink_tcon(cfile->tlink);
117338c8a9a5SSteve French 	server = tcon->ses->server;
117438c8a9a5SSteve French 
117538c8a9a5SSteve French 	cifs_dbg(FYI, "Freeing private data in close dir\n");
117638c8a9a5SSteve French 	spin_lock(&cfile->file_info_lock);
117738c8a9a5SSteve French 	if (server->ops->dir_needs_close(cfile)) {
117838c8a9a5SSteve French 		cfile->invalidHandle = true;
117938c8a9a5SSteve French 		spin_unlock(&cfile->file_info_lock);
118038c8a9a5SSteve French 		if (server->ops->close_dir)
118138c8a9a5SSteve French 			rc = server->ops->close_dir(xid, tcon, &cfile->fid);
118238c8a9a5SSteve French 		else
118338c8a9a5SSteve French 			rc = -ENOSYS;
118438c8a9a5SSteve French 		cifs_dbg(FYI, "Closing uncompleted readdir with rc %d\n", rc);
118538c8a9a5SSteve French 		/* not much we can do if it fails anyway, ignore rc */
118638c8a9a5SSteve French 		rc = 0;
118738c8a9a5SSteve French 	} else
118838c8a9a5SSteve French 		spin_unlock(&cfile->file_info_lock);
118938c8a9a5SSteve French 
119038c8a9a5SSteve French 	buf = cfile->srch_inf.ntwrk_buf_start;
119138c8a9a5SSteve French 	if (buf) {
119238c8a9a5SSteve French 		cifs_dbg(FYI, "closedir free smb buf in srch struct\n");
119338c8a9a5SSteve French 		cfile->srch_inf.ntwrk_buf_start = NULL;
119438c8a9a5SSteve French 		if (cfile->srch_inf.smallBuf)
119538c8a9a5SSteve French 			cifs_small_buf_release(buf);
119638c8a9a5SSteve French 		else
119738c8a9a5SSteve French 			cifs_buf_release(buf);
119838c8a9a5SSteve French 	}
119938c8a9a5SSteve French 
120038c8a9a5SSteve French 	cifs_put_tlink(cfile->tlink);
120138c8a9a5SSteve French 	kfree(file->private_data);
120238c8a9a5SSteve French 	file->private_data = NULL;
120338c8a9a5SSteve French 	/* BB can we lock the filestruct while this is going on? */
120438c8a9a5SSteve French 	free_xid(xid);
120538c8a9a5SSteve French 	return rc;
120638c8a9a5SSteve French }
120738c8a9a5SSteve French 
120838c8a9a5SSteve French static struct cifsLockInfo *
120938c8a9a5SSteve French cifs_lock_init(__u64 offset, __u64 length, __u8 type, __u16 flags)
121038c8a9a5SSteve French {
121138c8a9a5SSteve French 	struct cifsLockInfo *lock =
121238c8a9a5SSteve French 		kmalloc(sizeof(struct cifsLockInfo), GFP_KERNEL);
121338c8a9a5SSteve French 	if (!lock)
121438c8a9a5SSteve French 		return lock;
121538c8a9a5SSteve French 	lock->offset = offset;
121638c8a9a5SSteve French 	lock->length = length;
121738c8a9a5SSteve French 	lock->type = type;
121838c8a9a5SSteve French 	lock->pid = current->tgid;
121938c8a9a5SSteve French 	lock->flags = flags;
122038c8a9a5SSteve French 	INIT_LIST_HEAD(&lock->blist);
122138c8a9a5SSteve French 	init_waitqueue_head(&lock->block_q);
122238c8a9a5SSteve French 	return lock;
122338c8a9a5SSteve French }
122438c8a9a5SSteve French 
122538c8a9a5SSteve French void
122638c8a9a5SSteve French cifs_del_lock_waiters(struct cifsLockInfo *lock)
122738c8a9a5SSteve French {
122838c8a9a5SSteve French 	struct cifsLockInfo *li, *tmp;
122938c8a9a5SSteve French 	list_for_each_entry_safe(li, tmp, &lock->blist, blist) {
123038c8a9a5SSteve French 		list_del_init(&li->blist);
123138c8a9a5SSteve French 		wake_up(&li->block_q);
123238c8a9a5SSteve French 	}
123338c8a9a5SSteve French }
123438c8a9a5SSteve French 
123538c8a9a5SSteve French #define CIFS_LOCK_OP	0
123638c8a9a5SSteve French #define CIFS_READ_OP	1
123738c8a9a5SSteve French #define CIFS_WRITE_OP	2
123838c8a9a5SSteve French 
123938c8a9a5SSteve French /* @rw_check : 0 - no op, 1 - read, 2 - write */
124038c8a9a5SSteve French static bool
124138c8a9a5SSteve French cifs_find_fid_lock_conflict(struct cifs_fid_locks *fdlocks, __u64 offset,
124238c8a9a5SSteve French 			    __u64 length, __u8 type, __u16 flags,
124338c8a9a5SSteve French 			    struct cifsFileInfo *cfile,
124438c8a9a5SSteve French 			    struct cifsLockInfo **conf_lock, int rw_check)
124538c8a9a5SSteve French {
124638c8a9a5SSteve French 	struct cifsLockInfo *li;
124738c8a9a5SSteve French 	struct cifsFileInfo *cur_cfile = fdlocks->cfile;
124838c8a9a5SSteve French 	struct TCP_Server_Info *server = tlink_tcon(cfile->tlink)->ses->server;
124938c8a9a5SSteve French 
125038c8a9a5SSteve French 	list_for_each_entry(li, &fdlocks->locks, llist) {
125138c8a9a5SSteve French 		if (offset + length <= li->offset ||
125238c8a9a5SSteve French 		    offset >= li->offset + li->length)
125338c8a9a5SSteve French 			continue;
125438c8a9a5SSteve French 		if (rw_check != CIFS_LOCK_OP && current->tgid == li->pid &&
125538c8a9a5SSteve French 		    server->ops->compare_fids(cfile, cur_cfile)) {
125638c8a9a5SSteve French 			/* shared lock prevents write op through the same fid */
125738c8a9a5SSteve French 			if (!(li->type & server->vals->shared_lock_type) ||
125838c8a9a5SSteve French 			    rw_check != CIFS_WRITE_OP)
125938c8a9a5SSteve French 				continue;
126038c8a9a5SSteve French 		}
126138c8a9a5SSteve French 		if ((type & server->vals->shared_lock_type) &&
126238c8a9a5SSteve French 		    ((server->ops->compare_fids(cfile, cur_cfile) &&
126338c8a9a5SSteve French 		     current->tgid == li->pid) || type == li->type))
126438c8a9a5SSteve French 			continue;
126538c8a9a5SSteve French 		if (rw_check == CIFS_LOCK_OP &&
126638c8a9a5SSteve French 		    (flags & FL_OFDLCK) && (li->flags & FL_OFDLCK) &&
126738c8a9a5SSteve French 		    server->ops->compare_fids(cfile, cur_cfile))
126838c8a9a5SSteve French 			continue;
126938c8a9a5SSteve French 		if (conf_lock)
127038c8a9a5SSteve French 			*conf_lock = li;
127138c8a9a5SSteve French 		return true;
127238c8a9a5SSteve French 	}
127338c8a9a5SSteve French 	return false;
127438c8a9a5SSteve French }
127538c8a9a5SSteve French 
127638c8a9a5SSteve French bool
127738c8a9a5SSteve French cifs_find_lock_conflict(struct cifsFileInfo *cfile, __u64 offset, __u64 length,
127838c8a9a5SSteve French 			__u8 type, __u16 flags,
127938c8a9a5SSteve French 			struct cifsLockInfo **conf_lock, int rw_check)
128038c8a9a5SSteve French {
128138c8a9a5SSteve French 	bool rc = false;
128238c8a9a5SSteve French 	struct cifs_fid_locks *cur;
128338c8a9a5SSteve French 	struct cifsInodeInfo *cinode = CIFS_I(d_inode(cfile->dentry));
128438c8a9a5SSteve French 
128538c8a9a5SSteve French 	list_for_each_entry(cur, &cinode->llist, llist) {
128638c8a9a5SSteve French 		rc = cifs_find_fid_lock_conflict(cur, offset, length, type,
128738c8a9a5SSteve French 						 flags, cfile, conf_lock,
128838c8a9a5SSteve French 						 rw_check);
128938c8a9a5SSteve French 		if (rc)
129038c8a9a5SSteve French 			break;
129138c8a9a5SSteve French 	}
129238c8a9a5SSteve French 
129338c8a9a5SSteve French 	return rc;
129438c8a9a5SSteve French }
129538c8a9a5SSteve French 
129638c8a9a5SSteve French /*
129738c8a9a5SSteve French  * Check if there is another lock that prevents us to set the lock (mandatory
129838c8a9a5SSteve French  * style). If such a lock exists, update the flock structure with its
129938c8a9a5SSteve French  * properties. Otherwise, set the flock type to F_UNLCK if we can cache brlocks
130038c8a9a5SSteve French  * or leave it the same if we can't. Returns 0 if we don't need to request to
130138c8a9a5SSteve French  * the server or 1 otherwise.
130238c8a9a5SSteve French  */
130338c8a9a5SSteve French static int
130438c8a9a5SSteve French cifs_lock_test(struct cifsFileInfo *cfile, __u64 offset, __u64 length,
130538c8a9a5SSteve French 	       __u8 type, struct file_lock *flock)
130638c8a9a5SSteve French {
130738c8a9a5SSteve French 	int rc = 0;
130838c8a9a5SSteve French 	struct cifsLockInfo *conf_lock;
130938c8a9a5SSteve French 	struct cifsInodeInfo *cinode = CIFS_I(d_inode(cfile->dentry));
131038c8a9a5SSteve French 	struct TCP_Server_Info *server = tlink_tcon(cfile->tlink)->ses->server;
131138c8a9a5SSteve French 	bool exist;
131238c8a9a5SSteve French 
131338c8a9a5SSteve French 	down_read(&cinode->lock_sem);
131438c8a9a5SSteve French 
131538c8a9a5SSteve French 	exist = cifs_find_lock_conflict(cfile, offset, length, type,
131638c8a9a5SSteve French 					flock->fl_flags, &conf_lock,
131738c8a9a5SSteve French 					CIFS_LOCK_OP);
131838c8a9a5SSteve French 	if (exist) {
131938c8a9a5SSteve French 		flock->fl_start = conf_lock->offset;
132038c8a9a5SSteve French 		flock->fl_end = conf_lock->offset + conf_lock->length - 1;
132138c8a9a5SSteve French 		flock->fl_pid = conf_lock->pid;
132238c8a9a5SSteve French 		if (conf_lock->type & server->vals->shared_lock_type)
132338c8a9a5SSteve French 			flock->fl_type = F_RDLCK;
132438c8a9a5SSteve French 		else
132538c8a9a5SSteve French 			flock->fl_type = F_WRLCK;
132638c8a9a5SSteve French 	} else if (!cinode->can_cache_brlcks)
132738c8a9a5SSteve French 		rc = 1;
132838c8a9a5SSteve French 	else
132938c8a9a5SSteve French 		flock->fl_type = F_UNLCK;
133038c8a9a5SSteve French 
133138c8a9a5SSteve French 	up_read(&cinode->lock_sem);
133238c8a9a5SSteve French 	return rc;
133338c8a9a5SSteve French }
133438c8a9a5SSteve French 
133538c8a9a5SSteve French static void
133638c8a9a5SSteve French cifs_lock_add(struct cifsFileInfo *cfile, struct cifsLockInfo *lock)
133738c8a9a5SSteve French {
133838c8a9a5SSteve French 	struct cifsInodeInfo *cinode = CIFS_I(d_inode(cfile->dentry));
133938c8a9a5SSteve French 	cifs_down_write(&cinode->lock_sem);
134038c8a9a5SSteve French 	list_add_tail(&lock->llist, &cfile->llist->locks);
134138c8a9a5SSteve French 	up_write(&cinode->lock_sem);
134238c8a9a5SSteve French }
134338c8a9a5SSteve French 
134438c8a9a5SSteve French /*
134538c8a9a5SSteve French  * Set the byte-range lock (mandatory style). Returns:
134638c8a9a5SSteve French  * 1) 0, if we set the lock and don't need to request to the server;
134738c8a9a5SSteve French  * 2) 1, if no locks prevent us but we need to request to the server;
134838c8a9a5SSteve French  * 3) -EACCES, if there is a lock that prevents us and wait is false.
134938c8a9a5SSteve French  */
135038c8a9a5SSteve French static int
135138c8a9a5SSteve French cifs_lock_add_if(struct cifsFileInfo *cfile, struct cifsLockInfo *lock,
135238c8a9a5SSteve French 		 bool wait)
135338c8a9a5SSteve French {
135438c8a9a5SSteve French 	struct cifsLockInfo *conf_lock;
135538c8a9a5SSteve French 	struct cifsInodeInfo *cinode = CIFS_I(d_inode(cfile->dentry));
135638c8a9a5SSteve French 	bool exist;
135738c8a9a5SSteve French 	int rc = 0;
135838c8a9a5SSteve French 
135938c8a9a5SSteve French try_again:
136038c8a9a5SSteve French 	exist = false;
136138c8a9a5SSteve French 	cifs_down_write(&cinode->lock_sem);
136238c8a9a5SSteve French 
136338c8a9a5SSteve French 	exist = cifs_find_lock_conflict(cfile, lock->offset, lock->length,
136438c8a9a5SSteve French 					lock->type, lock->flags, &conf_lock,
136538c8a9a5SSteve French 					CIFS_LOCK_OP);
136638c8a9a5SSteve French 	if (!exist && cinode->can_cache_brlcks) {
136738c8a9a5SSteve French 		list_add_tail(&lock->llist, &cfile->llist->locks);
136838c8a9a5SSteve French 		up_write(&cinode->lock_sem);
136938c8a9a5SSteve French 		return rc;
137038c8a9a5SSteve French 	}
137138c8a9a5SSteve French 
137238c8a9a5SSteve French 	if (!exist)
137338c8a9a5SSteve French 		rc = 1;
137438c8a9a5SSteve French 	else if (!wait)
137538c8a9a5SSteve French 		rc = -EACCES;
137638c8a9a5SSteve French 	else {
137738c8a9a5SSteve French 		list_add_tail(&lock->blist, &conf_lock->blist);
137838c8a9a5SSteve French 		up_write(&cinode->lock_sem);
137938c8a9a5SSteve French 		rc = wait_event_interruptible(lock->block_q,
138038c8a9a5SSteve French 					(lock->blist.prev == &lock->blist) &&
138138c8a9a5SSteve French 					(lock->blist.next == &lock->blist));
138238c8a9a5SSteve French 		if (!rc)
138338c8a9a5SSteve French 			goto try_again;
138438c8a9a5SSteve French 		cifs_down_write(&cinode->lock_sem);
138538c8a9a5SSteve French 		list_del_init(&lock->blist);
138638c8a9a5SSteve French 	}
138738c8a9a5SSteve French 
138838c8a9a5SSteve French 	up_write(&cinode->lock_sem);
138938c8a9a5SSteve French 	return rc;
139038c8a9a5SSteve French }
139138c8a9a5SSteve French 
139238c8a9a5SSteve French #ifdef CONFIG_CIFS_ALLOW_INSECURE_LEGACY
139338c8a9a5SSteve French /*
139438c8a9a5SSteve French  * Check if there is another lock that prevents us to set the lock (posix
139538c8a9a5SSteve French  * style). If such a lock exists, update the flock structure with its
139638c8a9a5SSteve French  * properties. Otherwise, set the flock type to F_UNLCK if we can cache brlocks
139738c8a9a5SSteve French  * or leave it the same if we can't. Returns 0 if we don't need to request to
139838c8a9a5SSteve French  * the server or 1 otherwise.
139938c8a9a5SSteve French  */
140038c8a9a5SSteve French static int
140138c8a9a5SSteve French cifs_posix_lock_test(struct file *file, struct file_lock *flock)
140238c8a9a5SSteve French {
140338c8a9a5SSteve French 	int rc = 0;
140438c8a9a5SSteve French 	struct cifsInodeInfo *cinode = CIFS_I(file_inode(file));
140538c8a9a5SSteve French 	unsigned char saved_type = flock->fl_type;
140638c8a9a5SSteve French 
140738c8a9a5SSteve French 	if ((flock->fl_flags & FL_POSIX) == 0)
140838c8a9a5SSteve French 		return 1;
140938c8a9a5SSteve French 
141038c8a9a5SSteve French 	down_read(&cinode->lock_sem);
141138c8a9a5SSteve French 	posix_test_lock(file, flock);
141238c8a9a5SSteve French 
141338c8a9a5SSteve French 	if (flock->fl_type == F_UNLCK && !cinode->can_cache_brlcks) {
141438c8a9a5SSteve French 		flock->fl_type = saved_type;
141538c8a9a5SSteve French 		rc = 1;
141638c8a9a5SSteve French 	}
141738c8a9a5SSteve French 
141838c8a9a5SSteve French 	up_read(&cinode->lock_sem);
141938c8a9a5SSteve French 	return rc;
142038c8a9a5SSteve French }
142138c8a9a5SSteve French 
142238c8a9a5SSteve French /*
142338c8a9a5SSteve French  * Set the byte-range lock (posix style). Returns:
142438c8a9a5SSteve French  * 1) <0, if the error occurs while setting the lock;
142538c8a9a5SSteve French  * 2) 0, if we set the lock and don't need to request to the server;
142638c8a9a5SSteve French  * 3) FILE_LOCK_DEFERRED, if we will wait for some other file_lock;
142738c8a9a5SSteve French  * 4) FILE_LOCK_DEFERRED + 1, if we need to request to the server.
142838c8a9a5SSteve French  */
142938c8a9a5SSteve French static int
143038c8a9a5SSteve French cifs_posix_lock_set(struct file *file, struct file_lock *flock)
143138c8a9a5SSteve French {
143238c8a9a5SSteve French 	struct cifsInodeInfo *cinode = CIFS_I(file_inode(file));
143338c8a9a5SSteve French 	int rc = FILE_LOCK_DEFERRED + 1;
143438c8a9a5SSteve French 
143538c8a9a5SSteve French 	if ((flock->fl_flags & FL_POSIX) == 0)
143638c8a9a5SSteve French 		return rc;
143738c8a9a5SSteve French 
143838c8a9a5SSteve French 	cifs_down_write(&cinode->lock_sem);
143938c8a9a5SSteve French 	if (!cinode->can_cache_brlcks) {
144038c8a9a5SSteve French 		up_write(&cinode->lock_sem);
144138c8a9a5SSteve French 		return rc;
144238c8a9a5SSteve French 	}
144338c8a9a5SSteve French 
144438c8a9a5SSteve French 	rc = posix_lock_file(file, flock, NULL);
144538c8a9a5SSteve French 	up_write(&cinode->lock_sem);
144638c8a9a5SSteve French 	return rc;
144738c8a9a5SSteve French }
144838c8a9a5SSteve French 
144938c8a9a5SSteve French int
145038c8a9a5SSteve French cifs_push_mandatory_locks(struct cifsFileInfo *cfile)
145138c8a9a5SSteve French {
145238c8a9a5SSteve French 	unsigned int xid;
145338c8a9a5SSteve French 	int rc = 0, stored_rc;
145438c8a9a5SSteve French 	struct cifsLockInfo *li, *tmp;
145538c8a9a5SSteve French 	struct cifs_tcon *tcon;
145638c8a9a5SSteve French 	unsigned int num, max_num, max_buf;
145738c8a9a5SSteve French 	LOCKING_ANDX_RANGE *buf, *cur;
145838c8a9a5SSteve French 	static const int types[] = {
145938c8a9a5SSteve French 		LOCKING_ANDX_LARGE_FILES,
146038c8a9a5SSteve French 		LOCKING_ANDX_SHARED_LOCK | LOCKING_ANDX_LARGE_FILES
146138c8a9a5SSteve French 	};
146238c8a9a5SSteve French 	int i;
146338c8a9a5SSteve French 
146438c8a9a5SSteve French 	xid = get_xid();
146538c8a9a5SSteve French 	tcon = tlink_tcon(cfile->tlink);
146638c8a9a5SSteve French 
146738c8a9a5SSteve French 	/*
146838c8a9a5SSteve French 	 * Accessing maxBuf is racy with cifs_reconnect - need to store value
146938c8a9a5SSteve French 	 * and check it before using.
147038c8a9a5SSteve French 	 */
147138c8a9a5SSteve French 	max_buf = tcon->ses->server->maxBuf;
147238c8a9a5SSteve French 	if (max_buf < (sizeof(struct smb_hdr) + sizeof(LOCKING_ANDX_RANGE))) {
147338c8a9a5SSteve French 		free_xid(xid);
147438c8a9a5SSteve French 		return -EINVAL;
147538c8a9a5SSteve French 	}
147638c8a9a5SSteve French 
147738c8a9a5SSteve French 	BUILD_BUG_ON(sizeof(struct smb_hdr) + sizeof(LOCKING_ANDX_RANGE) >
147838c8a9a5SSteve French 		     PAGE_SIZE);
147938c8a9a5SSteve French 	max_buf = min_t(unsigned int, max_buf - sizeof(struct smb_hdr),
148038c8a9a5SSteve French 			PAGE_SIZE);
148138c8a9a5SSteve French 	max_num = (max_buf - sizeof(struct smb_hdr)) /
148238c8a9a5SSteve French 						sizeof(LOCKING_ANDX_RANGE);
148338c8a9a5SSteve French 	buf = kcalloc(max_num, sizeof(LOCKING_ANDX_RANGE), GFP_KERNEL);
148438c8a9a5SSteve French 	if (!buf) {
148538c8a9a5SSteve French 		free_xid(xid);
148638c8a9a5SSteve French 		return -ENOMEM;
148738c8a9a5SSteve French 	}
148838c8a9a5SSteve French 
148938c8a9a5SSteve French 	for (i = 0; i < 2; i++) {
149038c8a9a5SSteve French 		cur = buf;
149138c8a9a5SSteve French 		num = 0;
149238c8a9a5SSteve French 		list_for_each_entry_safe(li, tmp, &cfile->llist->locks, llist) {
149338c8a9a5SSteve French 			if (li->type != types[i])
149438c8a9a5SSteve French 				continue;
149538c8a9a5SSteve French 			cur->Pid = cpu_to_le16(li->pid);
149638c8a9a5SSteve French 			cur->LengthLow = cpu_to_le32((u32)li->length);
149738c8a9a5SSteve French 			cur->LengthHigh = cpu_to_le32((u32)(li->length>>32));
149838c8a9a5SSteve French 			cur->OffsetLow = cpu_to_le32((u32)li->offset);
149938c8a9a5SSteve French 			cur->OffsetHigh = cpu_to_le32((u32)(li->offset>>32));
150038c8a9a5SSteve French 			if (++num == max_num) {
150138c8a9a5SSteve French 				stored_rc = cifs_lockv(xid, tcon,
150238c8a9a5SSteve French 						       cfile->fid.netfid,
150338c8a9a5SSteve French 						       (__u8)li->type, 0, num,
150438c8a9a5SSteve French 						       buf);
150538c8a9a5SSteve French 				if (stored_rc)
150638c8a9a5SSteve French 					rc = stored_rc;
150738c8a9a5SSteve French 				cur = buf;
150838c8a9a5SSteve French 				num = 0;
150938c8a9a5SSteve French 			} else
151038c8a9a5SSteve French 				cur++;
151138c8a9a5SSteve French 		}
151238c8a9a5SSteve French 
151338c8a9a5SSteve French 		if (num) {
151438c8a9a5SSteve French 			stored_rc = cifs_lockv(xid, tcon, cfile->fid.netfid,
151538c8a9a5SSteve French 					       (__u8)types[i], 0, num, buf);
151638c8a9a5SSteve French 			if (stored_rc)
151738c8a9a5SSteve French 				rc = stored_rc;
151838c8a9a5SSteve French 		}
151938c8a9a5SSteve French 	}
152038c8a9a5SSteve French 
152138c8a9a5SSteve French 	kfree(buf);
152238c8a9a5SSteve French 	free_xid(xid);
152338c8a9a5SSteve French 	return rc;
152438c8a9a5SSteve French }
152538c8a9a5SSteve French 
152638c8a9a5SSteve French static __u32
152738c8a9a5SSteve French hash_lockowner(fl_owner_t owner)
152838c8a9a5SSteve French {
152938c8a9a5SSteve French 	return cifs_lock_secret ^ hash32_ptr((const void *)owner);
153038c8a9a5SSteve French }
153138c8a9a5SSteve French #endif /* CONFIG_CIFS_ALLOW_INSECURE_LEGACY */
153238c8a9a5SSteve French 
153338c8a9a5SSteve French struct lock_to_push {
153438c8a9a5SSteve French 	struct list_head llist;
153538c8a9a5SSteve French 	__u64 offset;
153638c8a9a5SSteve French 	__u64 length;
153738c8a9a5SSteve French 	__u32 pid;
153838c8a9a5SSteve French 	__u16 netfid;
153938c8a9a5SSteve French 	__u8 type;
154038c8a9a5SSteve French };
154138c8a9a5SSteve French 
154238c8a9a5SSteve French #ifdef CONFIG_CIFS_ALLOW_INSECURE_LEGACY
154338c8a9a5SSteve French static int
154438c8a9a5SSteve French cifs_push_posix_locks(struct cifsFileInfo *cfile)
154538c8a9a5SSteve French {
154638c8a9a5SSteve French 	struct inode *inode = d_inode(cfile->dentry);
154738c8a9a5SSteve French 	struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
154838c8a9a5SSteve French 	struct file_lock *flock;
154938c8a9a5SSteve French 	struct file_lock_context *flctx = locks_inode_context(inode);
155038c8a9a5SSteve French 	unsigned int count = 0, i;
155138c8a9a5SSteve French 	int rc = 0, xid, type;
155238c8a9a5SSteve French 	struct list_head locks_to_send, *el;
155338c8a9a5SSteve French 	struct lock_to_push *lck, *tmp;
155438c8a9a5SSteve French 	__u64 length;
155538c8a9a5SSteve French 
155638c8a9a5SSteve French 	xid = get_xid();
155738c8a9a5SSteve French 
155838c8a9a5SSteve French 	if (!flctx)
155938c8a9a5SSteve French 		goto out;
156038c8a9a5SSteve French 
156138c8a9a5SSteve French 	spin_lock(&flctx->flc_lock);
156238c8a9a5SSteve French 	list_for_each(el, &flctx->flc_posix) {
156338c8a9a5SSteve French 		count++;
156438c8a9a5SSteve French 	}
156538c8a9a5SSteve French 	spin_unlock(&flctx->flc_lock);
156638c8a9a5SSteve French 
156738c8a9a5SSteve French 	INIT_LIST_HEAD(&locks_to_send);
156838c8a9a5SSteve French 
156938c8a9a5SSteve French 	/*
157038c8a9a5SSteve French 	 * Allocating count locks is enough because no FL_POSIX locks can be
157138c8a9a5SSteve French 	 * added to the list while we are holding cinode->lock_sem that
157238c8a9a5SSteve French 	 * protects locking operations of this inode.
157338c8a9a5SSteve French 	 */
157438c8a9a5SSteve French 	for (i = 0; i < count; i++) {
157538c8a9a5SSteve French 		lck = kmalloc(sizeof(struct lock_to_push), GFP_KERNEL);
157638c8a9a5SSteve French 		if (!lck) {
157738c8a9a5SSteve French 			rc = -ENOMEM;
157838c8a9a5SSteve French 			goto err_out;
157938c8a9a5SSteve French 		}
158038c8a9a5SSteve French 		list_add_tail(&lck->llist, &locks_to_send);
158138c8a9a5SSteve French 	}
158238c8a9a5SSteve French 
158338c8a9a5SSteve French 	el = locks_to_send.next;
158438c8a9a5SSteve French 	spin_lock(&flctx->flc_lock);
158538c8a9a5SSteve French 	list_for_each_entry(flock, &flctx->flc_posix, fl_list) {
158638c8a9a5SSteve French 		if (el == &locks_to_send) {
158738c8a9a5SSteve French 			/*
158838c8a9a5SSteve French 			 * The list ended. We don't have enough allocated
158938c8a9a5SSteve French 			 * structures - something is really wrong.
159038c8a9a5SSteve French 			 */
159138c8a9a5SSteve French 			cifs_dbg(VFS, "Can't push all brlocks!\n");
159238c8a9a5SSteve French 			break;
159338c8a9a5SSteve French 		}
159438c8a9a5SSteve French 		length = cifs_flock_len(flock);
159538c8a9a5SSteve French 		if (flock->fl_type == F_RDLCK || flock->fl_type == F_SHLCK)
159638c8a9a5SSteve French 			type = CIFS_RDLCK;
159738c8a9a5SSteve French 		else
159838c8a9a5SSteve French 			type = CIFS_WRLCK;
159938c8a9a5SSteve French 		lck = list_entry(el, struct lock_to_push, llist);
160038c8a9a5SSteve French 		lck->pid = hash_lockowner(flock->fl_owner);
160138c8a9a5SSteve French 		lck->netfid = cfile->fid.netfid;
160238c8a9a5SSteve French 		lck->length = length;
160338c8a9a5SSteve French 		lck->type = type;
160438c8a9a5SSteve French 		lck->offset = flock->fl_start;
160538c8a9a5SSteve French 	}
160638c8a9a5SSteve French 	spin_unlock(&flctx->flc_lock);
160738c8a9a5SSteve French 
160838c8a9a5SSteve French 	list_for_each_entry_safe(lck, tmp, &locks_to_send, llist) {
160938c8a9a5SSteve French 		int stored_rc;
161038c8a9a5SSteve French 
161138c8a9a5SSteve French 		stored_rc = CIFSSMBPosixLock(xid, tcon, lck->netfid, lck->pid,
161238c8a9a5SSteve French 					     lck->offset, lck->length, NULL,
161338c8a9a5SSteve French 					     lck->type, 0);
161438c8a9a5SSteve French 		if (stored_rc)
161538c8a9a5SSteve French 			rc = stored_rc;
161638c8a9a5SSteve French 		list_del(&lck->llist);
161738c8a9a5SSteve French 		kfree(lck);
161838c8a9a5SSteve French 	}
161938c8a9a5SSteve French 
162038c8a9a5SSteve French out:
162138c8a9a5SSteve French 	free_xid(xid);
162238c8a9a5SSteve French 	return rc;
162338c8a9a5SSteve French err_out:
162438c8a9a5SSteve French 	list_for_each_entry_safe(lck, tmp, &locks_to_send, llist) {
162538c8a9a5SSteve French 		list_del(&lck->llist);
162638c8a9a5SSteve French 		kfree(lck);
162738c8a9a5SSteve French 	}
162838c8a9a5SSteve French 	goto out;
162938c8a9a5SSteve French }
163038c8a9a5SSteve French #endif /* CONFIG_CIFS_ALLOW_INSECURE_LEGACY */
163138c8a9a5SSteve French 
163238c8a9a5SSteve French static int
163338c8a9a5SSteve French cifs_push_locks(struct cifsFileInfo *cfile)
163438c8a9a5SSteve French {
163538c8a9a5SSteve French 	struct cifsInodeInfo *cinode = CIFS_I(d_inode(cfile->dentry));
163638c8a9a5SSteve French 	struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
163738c8a9a5SSteve French 	int rc = 0;
163838c8a9a5SSteve French #ifdef CONFIG_CIFS_ALLOW_INSECURE_LEGACY
163938c8a9a5SSteve French 	struct cifs_sb_info *cifs_sb = CIFS_SB(cfile->dentry->d_sb);
164038c8a9a5SSteve French #endif /* CONFIG_CIFS_ALLOW_INSECURE_LEGACY */
164138c8a9a5SSteve French 
164238c8a9a5SSteve French 	/* we are going to update can_cache_brlcks here - need a write access */
164338c8a9a5SSteve French 	cifs_down_write(&cinode->lock_sem);
164438c8a9a5SSteve French 	if (!cinode->can_cache_brlcks) {
164538c8a9a5SSteve French 		up_write(&cinode->lock_sem);
164638c8a9a5SSteve French 		return rc;
164738c8a9a5SSteve French 	}
164838c8a9a5SSteve French 
164938c8a9a5SSteve French #ifdef CONFIG_CIFS_ALLOW_INSECURE_LEGACY
165038c8a9a5SSteve French 	if (cap_unix(tcon->ses) &&
165138c8a9a5SSteve French 	    (CIFS_UNIX_FCNTL_CAP & le64_to_cpu(tcon->fsUnixInfo.Capability)) &&
165238c8a9a5SSteve French 	    ((cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOPOSIXBRL) == 0))
165338c8a9a5SSteve French 		rc = cifs_push_posix_locks(cfile);
165438c8a9a5SSteve French 	else
165538c8a9a5SSteve French #endif /* CONFIG_CIFS_ALLOW_INSECURE_LEGACY */
165638c8a9a5SSteve French 		rc = tcon->ses->server->ops->push_mand_locks(cfile);
165738c8a9a5SSteve French 
165838c8a9a5SSteve French 	cinode->can_cache_brlcks = false;
165938c8a9a5SSteve French 	up_write(&cinode->lock_sem);
166038c8a9a5SSteve French 	return rc;
166138c8a9a5SSteve French }
166238c8a9a5SSteve French 
166338c8a9a5SSteve French static void
166438c8a9a5SSteve French cifs_read_flock(struct file_lock *flock, __u32 *type, int *lock, int *unlock,
166538c8a9a5SSteve French 		bool *wait_flag, struct TCP_Server_Info *server)
166638c8a9a5SSteve French {
166738c8a9a5SSteve French 	if (flock->fl_flags & FL_POSIX)
166838c8a9a5SSteve French 		cifs_dbg(FYI, "Posix\n");
166938c8a9a5SSteve French 	if (flock->fl_flags & FL_FLOCK)
167038c8a9a5SSteve French 		cifs_dbg(FYI, "Flock\n");
167138c8a9a5SSteve French 	if (flock->fl_flags & FL_SLEEP) {
167238c8a9a5SSteve French 		cifs_dbg(FYI, "Blocking lock\n");
167338c8a9a5SSteve French 		*wait_flag = true;
167438c8a9a5SSteve French 	}
167538c8a9a5SSteve French 	if (flock->fl_flags & FL_ACCESS)
167638c8a9a5SSteve French 		cifs_dbg(FYI, "Process suspended by mandatory locking - not implemented yet\n");
167738c8a9a5SSteve French 	if (flock->fl_flags & FL_LEASE)
167838c8a9a5SSteve French 		cifs_dbg(FYI, "Lease on file - not implemented yet\n");
167938c8a9a5SSteve French 	if (flock->fl_flags &
168038c8a9a5SSteve French 	    (~(FL_POSIX | FL_FLOCK | FL_SLEEP |
168138c8a9a5SSteve French 	       FL_ACCESS | FL_LEASE | FL_CLOSE | FL_OFDLCK)))
168238c8a9a5SSteve French 		cifs_dbg(FYI, "Unknown lock flags 0x%x\n", flock->fl_flags);
168338c8a9a5SSteve French 
168438c8a9a5SSteve French 	*type = server->vals->large_lock_type;
168538c8a9a5SSteve French 	if (flock->fl_type == F_WRLCK) {
168638c8a9a5SSteve French 		cifs_dbg(FYI, "F_WRLCK\n");
168738c8a9a5SSteve French 		*type |= server->vals->exclusive_lock_type;
168838c8a9a5SSteve French 		*lock = 1;
168938c8a9a5SSteve French 	} else if (flock->fl_type == F_UNLCK) {
169038c8a9a5SSteve French 		cifs_dbg(FYI, "F_UNLCK\n");
169138c8a9a5SSteve French 		*type |= server->vals->unlock_lock_type;
169238c8a9a5SSteve French 		*unlock = 1;
169338c8a9a5SSteve French 		/* Check if unlock includes more than one lock range */
169438c8a9a5SSteve French 	} else if (flock->fl_type == F_RDLCK) {
169538c8a9a5SSteve French 		cifs_dbg(FYI, "F_RDLCK\n");
169638c8a9a5SSteve French 		*type |= server->vals->shared_lock_type;
169738c8a9a5SSteve French 		*lock = 1;
169838c8a9a5SSteve French 	} else if (flock->fl_type == F_EXLCK) {
169938c8a9a5SSteve French 		cifs_dbg(FYI, "F_EXLCK\n");
170038c8a9a5SSteve French 		*type |= server->vals->exclusive_lock_type;
170138c8a9a5SSteve French 		*lock = 1;
170238c8a9a5SSteve French 	} else if (flock->fl_type == F_SHLCK) {
170338c8a9a5SSteve French 		cifs_dbg(FYI, "F_SHLCK\n");
170438c8a9a5SSteve French 		*type |= server->vals->shared_lock_type;
170538c8a9a5SSteve French 		*lock = 1;
170638c8a9a5SSteve French 	} else
170738c8a9a5SSteve French 		cifs_dbg(FYI, "Unknown type of lock\n");
170838c8a9a5SSteve French }
170938c8a9a5SSteve French 
171038c8a9a5SSteve French static int
171138c8a9a5SSteve French cifs_getlk(struct file *file, struct file_lock *flock, __u32 type,
171238c8a9a5SSteve French 	   bool wait_flag, bool posix_lck, unsigned int xid)
171338c8a9a5SSteve French {
171438c8a9a5SSteve French 	int rc = 0;
171538c8a9a5SSteve French 	__u64 length = cifs_flock_len(flock);
171638c8a9a5SSteve French 	struct cifsFileInfo *cfile = (struct cifsFileInfo *)file->private_data;
171738c8a9a5SSteve French 	struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
171838c8a9a5SSteve French 	struct TCP_Server_Info *server = tcon->ses->server;
171938c8a9a5SSteve French #ifdef CONFIG_CIFS_ALLOW_INSECURE_LEGACY
172038c8a9a5SSteve French 	__u16 netfid = cfile->fid.netfid;
172138c8a9a5SSteve French 
172238c8a9a5SSteve French 	if (posix_lck) {
172338c8a9a5SSteve French 		int posix_lock_type;
172438c8a9a5SSteve French 
172538c8a9a5SSteve French 		rc = cifs_posix_lock_test(file, flock);
172638c8a9a5SSteve French 		if (!rc)
172738c8a9a5SSteve French 			return rc;
172838c8a9a5SSteve French 
172938c8a9a5SSteve French 		if (type & server->vals->shared_lock_type)
173038c8a9a5SSteve French 			posix_lock_type = CIFS_RDLCK;
173138c8a9a5SSteve French 		else
173238c8a9a5SSteve French 			posix_lock_type = CIFS_WRLCK;
173338c8a9a5SSteve French 		rc = CIFSSMBPosixLock(xid, tcon, netfid,
173438c8a9a5SSteve French 				      hash_lockowner(flock->fl_owner),
173538c8a9a5SSteve French 				      flock->fl_start, length, flock,
173638c8a9a5SSteve French 				      posix_lock_type, wait_flag);
173738c8a9a5SSteve French 		return rc;
173838c8a9a5SSteve French 	}
173938c8a9a5SSteve French #endif /* CONFIG_CIFS_ALLOW_INSECURE_LEGACY */
174038c8a9a5SSteve French 
174138c8a9a5SSteve French 	rc = cifs_lock_test(cfile, flock->fl_start, length, type, flock);
174238c8a9a5SSteve French 	if (!rc)
174338c8a9a5SSteve French 		return rc;
174438c8a9a5SSteve French 
174538c8a9a5SSteve French 	/* BB we could chain these into one lock request BB */
174638c8a9a5SSteve French 	rc = server->ops->mand_lock(xid, cfile, flock->fl_start, length, type,
174738c8a9a5SSteve French 				    1, 0, false);
174838c8a9a5SSteve French 	if (rc == 0) {
174938c8a9a5SSteve French 		rc = server->ops->mand_lock(xid, cfile, flock->fl_start, length,
175038c8a9a5SSteve French 					    type, 0, 1, false);
175138c8a9a5SSteve French 		flock->fl_type = F_UNLCK;
175238c8a9a5SSteve French 		if (rc != 0)
175338c8a9a5SSteve French 			cifs_dbg(VFS, "Error unlocking previously locked range %d during test of lock\n",
175438c8a9a5SSteve French 				 rc);
175538c8a9a5SSteve French 		return 0;
175638c8a9a5SSteve French 	}
175738c8a9a5SSteve French 
175838c8a9a5SSteve French 	if (type & server->vals->shared_lock_type) {
175938c8a9a5SSteve French 		flock->fl_type = F_WRLCK;
176038c8a9a5SSteve French 		return 0;
176138c8a9a5SSteve French 	}
176238c8a9a5SSteve French 
176338c8a9a5SSteve French 	type &= ~server->vals->exclusive_lock_type;
176438c8a9a5SSteve French 
176538c8a9a5SSteve French 	rc = server->ops->mand_lock(xid, cfile, flock->fl_start, length,
176638c8a9a5SSteve French 				    type | server->vals->shared_lock_type,
176738c8a9a5SSteve French 				    1, 0, false);
176838c8a9a5SSteve French 	if (rc == 0) {
176938c8a9a5SSteve French 		rc = server->ops->mand_lock(xid, cfile, flock->fl_start, length,
177038c8a9a5SSteve French 			type | server->vals->shared_lock_type, 0, 1, false);
177138c8a9a5SSteve French 		flock->fl_type = F_RDLCK;
177238c8a9a5SSteve French 		if (rc != 0)
177338c8a9a5SSteve French 			cifs_dbg(VFS, "Error unlocking previously locked range %d during test of lock\n",
177438c8a9a5SSteve French 				 rc);
177538c8a9a5SSteve French 	} else
177638c8a9a5SSteve French 		flock->fl_type = F_WRLCK;
177738c8a9a5SSteve French 
177838c8a9a5SSteve French 	return 0;
177938c8a9a5SSteve French }
178038c8a9a5SSteve French 
178138c8a9a5SSteve French void
178238c8a9a5SSteve French cifs_move_llist(struct list_head *source, struct list_head *dest)
178338c8a9a5SSteve French {
178438c8a9a5SSteve French 	struct list_head *li, *tmp;
178538c8a9a5SSteve French 	list_for_each_safe(li, tmp, source)
178638c8a9a5SSteve French 		list_move(li, dest);
178738c8a9a5SSteve French }
178838c8a9a5SSteve French 
178938c8a9a5SSteve French void
179038c8a9a5SSteve French cifs_free_llist(struct list_head *llist)
179138c8a9a5SSteve French {
179238c8a9a5SSteve French 	struct cifsLockInfo *li, *tmp;
179338c8a9a5SSteve French 	list_for_each_entry_safe(li, tmp, llist, llist) {
179438c8a9a5SSteve French 		cifs_del_lock_waiters(li);
179538c8a9a5SSteve French 		list_del(&li->llist);
179638c8a9a5SSteve French 		kfree(li);
179738c8a9a5SSteve French 	}
179838c8a9a5SSteve French }
179938c8a9a5SSteve French 
180038c8a9a5SSteve French #ifdef CONFIG_CIFS_ALLOW_INSECURE_LEGACY
180138c8a9a5SSteve French int
180238c8a9a5SSteve French cifs_unlock_range(struct cifsFileInfo *cfile, struct file_lock *flock,
180338c8a9a5SSteve French 		  unsigned int xid)
180438c8a9a5SSteve French {
180538c8a9a5SSteve French 	int rc = 0, stored_rc;
180638c8a9a5SSteve French 	static const int types[] = {
180738c8a9a5SSteve French 		LOCKING_ANDX_LARGE_FILES,
180838c8a9a5SSteve French 		LOCKING_ANDX_SHARED_LOCK | LOCKING_ANDX_LARGE_FILES
180938c8a9a5SSteve French 	};
181038c8a9a5SSteve French 	unsigned int i;
181138c8a9a5SSteve French 	unsigned int max_num, num, max_buf;
181238c8a9a5SSteve French 	LOCKING_ANDX_RANGE *buf, *cur;
181338c8a9a5SSteve French 	struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
181438c8a9a5SSteve French 	struct cifsInodeInfo *cinode = CIFS_I(d_inode(cfile->dentry));
181538c8a9a5SSteve French 	struct cifsLockInfo *li, *tmp;
181638c8a9a5SSteve French 	__u64 length = cifs_flock_len(flock);
181738c8a9a5SSteve French 	struct list_head tmp_llist;
181838c8a9a5SSteve French 
181938c8a9a5SSteve French 	INIT_LIST_HEAD(&tmp_llist);
182038c8a9a5SSteve French 
182138c8a9a5SSteve French 	/*
182238c8a9a5SSteve French 	 * Accessing maxBuf is racy with cifs_reconnect - need to store value
182338c8a9a5SSteve French 	 * and check it before using.
182438c8a9a5SSteve French 	 */
182538c8a9a5SSteve French 	max_buf = tcon->ses->server->maxBuf;
182638c8a9a5SSteve French 	if (max_buf < (sizeof(struct smb_hdr) + sizeof(LOCKING_ANDX_RANGE)))
182738c8a9a5SSteve French 		return -EINVAL;
182838c8a9a5SSteve French 
182938c8a9a5SSteve French 	BUILD_BUG_ON(sizeof(struct smb_hdr) + sizeof(LOCKING_ANDX_RANGE) >
183038c8a9a5SSteve French 		     PAGE_SIZE);
183138c8a9a5SSteve French 	max_buf = min_t(unsigned int, max_buf - sizeof(struct smb_hdr),
183238c8a9a5SSteve French 			PAGE_SIZE);
183338c8a9a5SSteve French 	max_num = (max_buf - sizeof(struct smb_hdr)) /
183438c8a9a5SSteve French 						sizeof(LOCKING_ANDX_RANGE);
183538c8a9a5SSteve French 	buf = kcalloc(max_num, sizeof(LOCKING_ANDX_RANGE), GFP_KERNEL);
183638c8a9a5SSteve French 	if (!buf)
183738c8a9a5SSteve French 		return -ENOMEM;
183838c8a9a5SSteve French 
183938c8a9a5SSteve French 	cifs_down_write(&cinode->lock_sem);
184038c8a9a5SSteve French 	for (i = 0; i < 2; i++) {
184138c8a9a5SSteve French 		cur = buf;
184238c8a9a5SSteve French 		num = 0;
184338c8a9a5SSteve French 		list_for_each_entry_safe(li, tmp, &cfile->llist->locks, llist) {
184438c8a9a5SSteve French 			if (flock->fl_start > li->offset ||
184538c8a9a5SSteve French 			    (flock->fl_start + length) <
184638c8a9a5SSteve French 			    (li->offset + li->length))
184738c8a9a5SSteve French 				continue;
184838c8a9a5SSteve French 			if (current->tgid != li->pid)
184938c8a9a5SSteve French 				continue;
185038c8a9a5SSteve French 			if (types[i] != li->type)
185138c8a9a5SSteve French 				continue;
185238c8a9a5SSteve French 			if (cinode->can_cache_brlcks) {
185338c8a9a5SSteve French 				/*
185438c8a9a5SSteve French 				 * We can cache brlock requests - simply remove
185538c8a9a5SSteve French 				 * a lock from the file's list.
185638c8a9a5SSteve French 				 */
185738c8a9a5SSteve French 				list_del(&li->llist);
185838c8a9a5SSteve French 				cifs_del_lock_waiters(li);
185938c8a9a5SSteve French 				kfree(li);
186038c8a9a5SSteve French 				continue;
186138c8a9a5SSteve French 			}
186238c8a9a5SSteve French 			cur->Pid = cpu_to_le16(li->pid);
186338c8a9a5SSteve French 			cur->LengthLow = cpu_to_le32((u32)li->length);
186438c8a9a5SSteve French 			cur->LengthHigh = cpu_to_le32((u32)(li->length>>32));
186538c8a9a5SSteve French 			cur->OffsetLow = cpu_to_le32((u32)li->offset);
186638c8a9a5SSteve French 			cur->OffsetHigh = cpu_to_le32((u32)(li->offset>>32));
186738c8a9a5SSteve French 			/*
186838c8a9a5SSteve French 			 * We need to save a lock here to let us add it again to
186938c8a9a5SSteve French 			 * the file's list if the unlock range request fails on
187038c8a9a5SSteve French 			 * the server.
187138c8a9a5SSteve French 			 */
187238c8a9a5SSteve French 			list_move(&li->llist, &tmp_llist);
187338c8a9a5SSteve French 			if (++num == max_num) {
187438c8a9a5SSteve French 				stored_rc = cifs_lockv(xid, tcon,
187538c8a9a5SSteve French 						       cfile->fid.netfid,
187638c8a9a5SSteve French 						       li->type, num, 0, buf);
187738c8a9a5SSteve French 				if (stored_rc) {
187838c8a9a5SSteve French 					/*
187938c8a9a5SSteve French 					 * We failed on the unlock range
188038c8a9a5SSteve French 					 * request - add all locks from the tmp
188138c8a9a5SSteve French 					 * list to the head of the file's list.
188238c8a9a5SSteve French 					 */
188338c8a9a5SSteve French 					cifs_move_llist(&tmp_llist,
188438c8a9a5SSteve French 							&cfile->llist->locks);
188538c8a9a5SSteve French 					rc = stored_rc;
188638c8a9a5SSteve French 				} else
188738c8a9a5SSteve French 					/*
188838c8a9a5SSteve French 					 * The unlock range request succeed -
188938c8a9a5SSteve French 					 * free the tmp list.
189038c8a9a5SSteve French 					 */
189138c8a9a5SSteve French 					cifs_free_llist(&tmp_llist);
189238c8a9a5SSteve French 				cur = buf;
189338c8a9a5SSteve French 				num = 0;
189438c8a9a5SSteve French 			} else
189538c8a9a5SSteve French 				cur++;
189638c8a9a5SSteve French 		}
189738c8a9a5SSteve French 		if (num) {
189838c8a9a5SSteve French 			stored_rc = cifs_lockv(xid, tcon, cfile->fid.netfid,
189938c8a9a5SSteve French 					       types[i], num, 0, buf);
190038c8a9a5SSteve French 			if (stored_rc) {
190138c8a9a5SSteve French 				cifs_move_llist(&tmp_llist,
190238c8a9a5SSteve French 						&cfile->llist->locks);
190338c8a9a5SSteve French 				rc = stored_rc;
190438c8a9a5SSteve French 			} else
190538c8a9a5SSteve French 				cifs_free_llist(&tmp_llist);
190638c8a9a5SSteve French 		}
190738c8a9a5SSteve French 	}
190838c8a9a5SSteve French 
190938c8a9a5SSteve French 	up_write(&cinode->lock_sem);
191038c8a9a5SSteve French 	kfree(buf);
191138c8a9a5SSteve French 	return rc;
191238c8a9a5SSteve French }
191338c8a9a5SSteve French #endif /* CONFIG_CIFS_ALLOW_INSECURE_LEGACY */
191438c8a9a5SSteve French 
191538c8a9a5SSteve French static int
191638c8a9a5SSteve French cifs_setlk(struct file *file, struct file_lock *flock, __u32 type,
191738c8a9a5SSteve French 	   bool wait_flag, bool posix_lck, int lock, int unlock,
191838c8a9a5SSteve French 	   unsigned int xid)
191938c8a9a5SSteve French {
192038c8a9a5SSteve French 	int rc = 0;
192138c8a9a5SSteve French 	__u64 length = cifs_flock_len(flock);
192238c8a9a5SSteve French 	struct cifsFileInfo *cfile = (struct cifsFileInfo *)file->private_data;
192338c8a9a5SSteve French 	struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
192438c8a9a5SSteve French 	struct TCP_Server_Info *server = tcon->ses->server;
192538c8a9a5SSteve French 	struct inode *inode = d_inode(cfile->dentry);
192638c8a9a5SSteve French 
192738c8a9a5SSteve French #ifdef CONFIG_CIFS_ALLOW_INSECURE_LEGACY
192838c8a9a5SSteve French 	if (posix_lck) {
192938c8a9a5SSteve French 		int posix_lock_type;
193038c8a9a5SSteve French 
193138c8a9a5SSteve French 		rc = cifs_posix_lock_set(file, flock);
193238c8a9a5SSteve French 		if (rc <= FILE_LOCK_DEFERRED)
193338c8a9a5SSteve French 			return rc;
193438c8a9a5SSteve French 
193538c8a9a5SSteve French 		if (type & server->vals->shared_lock_type)
193638c8a9a5SSteve French 			posix_lock_type = CIFS_RDLCK;
193738c8a9a5SSteve French 		else
193838c8a9a5SSteve French 			posix_lock_type = CIFS_WRLCK;
193938c8a9a5SSteve French 
194038c8a9a5SSteve French 		if (unlock == 1)
194138c8a9a5SSteve French 			posix_lock_type = CIFS_UNLCK;
194238c8a9a5SSteve French 
194338c8a9a5SSteve French 		rc = CIFSSMBPosixLock(xid, tcon, cfile->fid.netfid,
194438c8a9a5SSteve French 				      hash_lockowner(flock->fl_owner),
194538c8a9a5SSteve French 				      flock->fl_start, length,
194638c8a9a5SSteve French 				      NULL, posix_lock_type, wait_flag);
194738c8a9a5SSteve French 		goto out;
194838c8a9a5SSteve French 	}
194938c8a9a5SSteve French #endif /* CONFIG_CIFS_ALLOW_INSECURE_LEGACY */
195038c8a9a5SSteve French 	if (lock) {
195138c8a9a5SSteve French 		struct cifsLockInfo *lock;
195238c8a9a5SSteve French 
195338c8a9a5SSteve French 		lock = cifs_lock_init(flock->fl_start, length, type,
195438c8a9a5SSteve French 				      flock->fl_flags);
195538c8a9a5SSteve French 		if (!lock)
195638c8a9a5SSteve French 			return -ENOMEM;
195738c8a9a5SSteve French 
195838c8a9a5SSteve French 		rc = cifs_lock_add_if(cfile, lock, wait_flag);
195938c8a9a5SSteve French 		if (rc < 0) {
196038c8a9a5SSteve French 			kfree(lock);
196138c8a9a5SSteve French 			return rc;
196238c8a9a5SSteve French 		}
196338c8a9a5SSteve French 		if (!rc)
196438c8a9a5SSteve French 			goto out;
196538c8a9a5SSteve French 
196638c8a9a5SSteve French 		/*
196738c8a9a5SSteve French 		 * Windows 7 server can delay breaking lease from read to None
196838c8a9a5SSteve French 		 * if we set a byte-range lock on a file - break it explicitly
196938c8a9a5SSteve French 		 * before sending the lock to the server to be sure the next
197038c8a9a5SSteve French 		 * read won't conflict with non-overlapted locks due to
197138c8a9a5SSteve French 		 * pagereading.
197238c8a9a5SSteve French 		 */
197338c8a9a5SSteve French 		if (!CIFS_CACHE_WRITE(CIFS_I(inode)) &&
197438c8a9a5SSteve French 					CIFS_CACHE_READ(CIFS_I(inode))) {
197538c8a9a5SSteve French 			cifs_zap_mapping(inode);
197638c8a9a5SSteve French 			cifs_dbg(FYI, "Set no oplock for inode=%p due to mand locks\n",
197738c8a9a5SSteve French 				 inode);
197838c8a9a5SSteve French 			CIFS_I(inode)->oplock = 0;
197938c8a9a5SSteve French 		}
198038c8a9a5SSteve French 
198138c8a9a5SSteve French 		rc = server->ops->mand_lock(xid, cfile, flock->fl_start, length,
198238c8a9a5SSteve French 					    type, 1, 0, wait_flag);
198338c8a9a5SSteve French 		if (rc) {
198438c8a9a5SSteve French 			kfree(lock);
198538c8a9a5SSteve French 			return rc;
198638c8a9a5SSteve French 		}
198738c8a9a5SSteve French 
198838c8a9a5SSteve French 		cifs_lock_add(cfile, lock);
198938c8a9a5SSteve French 	} else if (unlock)
199038c8a9a5SSteve French 		rc = server->ops->mand_unlock_range(cfile, flock, xid);
199138c8a9a5SSteve French 
199238c8a9a5SSteve French out:
199338c8a9a5SSteve French 	if ((flock->fl_flags & FL_POSIX) || (flock->fl_flags & FL_FLOCK)) {
199438c8a9a5SSteve French 		/*
199538c8a9a5SSteve French 		 * If this is a request to remove all locks because we
199638c8a9a5SSteve French 		 * are closing the file, it doesn't matter if the
199738c8a9a5SSteve French 		 * unlocking failed as both cifs.ko and the SMB server
199838c8a9a5SSteve French 		 * remove the lock on file close
199938c8a9a5SSteve French 		 */
200038c8a9a5SSteve French 		if (rc) {
200138c8a9a5SSteve French 			cifs_dbg(VFS, "%s failed rc=%d\n", __func__, rc);
200238c8a9a5SSteve French 			if (!(flock->fl_flags & FL_CLOSE))
200338c8a9a5SSteve French 				return rc;
200438c8a9a5SSteve French 		}
200538c8a9a5SSteve French 		rc = locks_lock_file_wait(file, flock);
200638c8a9a5SSteve French 	}
200738c8a9a5SSteve French 	return rc;
200838c8a9a5SSteve French }
200938c8a9a5SSteve French 
201038c8a9a5SSteve French int cifs_flock(struct file *file, int cmd, struct file_lock *fl)
201138c8a9a5SSteve French {
201238c8a9a5SSteve French 	int rc, xid;
201338c8a9a5SSteve French 	int lock = 0, unlock = 0;
201438c8a9a5SSteve French 	bool wait_flag = false;
201538c8a9a5SSteve French 	bool posix_lck = false;
201638c8a9a5SSteve French 	struct cifs_sb_info *cifs_sb;
201738c8a9a5SSteve French 	struct cifs_tcon *tcon;
201838c8a9a5SSteve French 	struct cifsFileInfo *cfile;
201938c8a9a5SSteve French 	__u32 type;
202038c8a9a5SSteve French 
202138c8a9a5SSteve French 	xid = get_xid();
202238c8a9a5SSteve French 
202338c8a9a5SSteve French 	if (!(fl->fl_flags & FL_FLOCK)) {
202438c8a9a5SSteve French 		rc = -ENOLCK;
202538c8a9a5SSteve French 		free_xid(xid);
202638c8a9a5SSteve French 		return rc;
202738c8a9a5SSteve French 	}
202838c8a9a5SSteve French 
202938c8a9a5SSteve French 	cfile = (struct cifsFileInfo *)file->private_data;
203038c8a9a5SSteve French 	tcon = tlink_tcon(cfile->tlink);
203138c8a9a5SSteve French 
203238c8a9a5SSteve French 	cifs_read_flock(fl, &type, &lock, &unlock, &wait_flag,
203338c8a9a5SSteve French 			tcon->ses->server);
203438c8a9a5SSteve French 	cifs_sb = CIFS_FILE_SB(file);
203538c8a9a5SSteve French 
203638c8a9a5SSteve French 	if (cap_unix(tcon->ses) &&
203738c8a9a5SSteve French 	    (CIFS_UNIX_FCNTL_CAP & le64_to_cpu(tcon->fsUnixInfo.Capability)) &&
203838c8a9a5SSteve French 	    ((cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOPOSIXBRL) == 0))
203938c8a9a5SSteve French 		posix_lck = true;
204038c8a9a5SSteve French 
204138c8a9a5SSteve French 	if (!lock && !unlock) {
204238c8a9a5SSteve French 		/*
204338c8a9a5SSteve French 		 * if no lock or unlock then nothing to do since we do not
204438c8a9a5SSteve French 		 * know what it is
204538c8a9a5SSteve French 		 */
204638c8a9a5SSteve French 		rc = -EOPNOTSUPP;
204738c8a9a5SSteve French 		free_xid(xid);
204838c8a9a5SSteve French 		return rc;
204938c8a9a5SSteve French 	}
205038c8a9a5SSteve French 
205138c8a9a5SSteve French 	rc = cifs_setlk(file, fl, type, wait_flag, posix_lck, lock, unlock,
205238c8a9a5SSteve French 			xid);
205338c8a9a5SSteve French 	free_xid(xid);
205438c8a9a5SSteve French 	return rc;
205538c8a9a5SSteve French 
205638c8a9a5SSteve French 
205738c8a9a5SSteve French }
205838c8a9a5SSteve French 
205938c8a9a5SSteve French int cifs_lock(struct file *file, int cmd, struct file_lock *flock)
206038c8a9a5SSteve French {
206138c8a9a5SSteve French 	int rc, xid;
206238c8a9a5SSteve French 	int lock = 0, unlock = 0;
206338c8a9a5SSteve French 	bool wait_flag = false;
206438c8a9a5SSteve French 	bool posix_lck = false;
206538c8a9a5SSteve French 	struct cifs_sb_info *cifs_sb;
206638c8a9a5SSteve French 	struct cifs_tcon *tcon;
206738c8a9a5SSteve French 	struct cifsFileInfo *cfile;
206838c8a9a5SSteve French 	__u32 type;
206938c8a9a5SSteve French 
207038c8a9a5SSteve French 	rc = -EACCES;
207138c8a9a5SSteve French 	xid = get_xid();
207238c8a9a5SSteve French 
207338c8a9a5SSteve French 	cifs_dbg(FYI, "%s: %pD2 cmd=0x%x type=0x%x flags=0x%x r=%lld:%lld\n", __func__, file, cmd,
207438c8a9a5SSteve French 		 flock->fl_flags, flock->fl_type, (long long)flock->fl_start,
207538c8a9a5SSteve French 		 (long long)flock->fl_end);
207638c8a9a5SSteve French 
207738c8a9a5SSteve French 	cfile = (struct cifsFileInfo *)file->private_data;
207838c8a9a5SSteve French 	tcon = tlink_tcon(cfile->tlink);
207938c8a9a5SSteve French 
208038c8a9a5SSteve French 	cifs_read_flock(flock, &type, &lock, &unlock, &wait_flag,
208138c8a9a5SSteve French 			tcon->ses->server);
208238c8a9a5SSteve French 	cifs_sb = CIFS_FILE_SB(file);
208338c8a9a5SSteve French 	set_bit(CIFS_INO_CLOSE_ON_LOCK, &CIFS_I(d_inode(cfile->dentry))->flags);
208438c8a9a5SSteve French 
208538c8a9a5SSteve French 	if (cap_unix(tcon->ses) &&
208638c8a9a5SSteve French 	    (CIFS_UNIX_FCNTL_CAP & le64_to_cpu(tcon->fsUnixInfo.Capability)) &&
208738c8a9a5SSteve French 	    ((cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOPOSIXBRL) == 0))
208838c8a9a5SSteve French 		posix_lck = true;
208938c8a9a5SSteve French 	/*
209038c8a9a5SSteve French 	 * BB add code here to normalize offset and length to account for
209138c8a9a5SSteve French 	 * negative length which we can not accept over the wire.
209238c8a9a5SSteve French 	 */
209338c8a9a5SSteve French 	if (IS_GETLK(cmd)) {
209438c8a9a5SSteve French 		rc = cifs_getlk(file, flock, type, wait_flag, posix_lck, xid);
209538c8a9a5SSteve French 		free_xid(xid);
209638c8a9a5SSteve French 		return rc;
209738c8a9a5SSteve French 	}
209838c8a9a5SSteve French 
209938c8a9a5SSteve French 	if (!lock && !unlock) {
210038c8a9a5SSteve French 		/*
210138c8a9a5SSteve French 		 * if no lock or unlock then nothing to do since we do not
210238c8a9a5SSteve French 		 * know what it is
210338c8a9a5SSteve French 		 */
210438c8a9a5SSteve French 		free_xid(xid);
210538c8a9a5SSteve French 		return -EOPNOTSUPP;
210638c8a9a5SSteve French 	}
210738c8a9a5SSteve French 
210838c8a9a5SSteve French 	rc = cifs_setlk(file, flock, type, wait_flag, posix_lck, lock, unlock,
210938c8a9a5SSteve French 			xid);
211038c8a9a5SSteve French 	free_xid(xid);
211138c8a9a5SSteve French 	return rc;
211238c8a9a5SSteve French }
211338c8a9a5SSteve French 
211438c8a9a5SSteve French /*
211538c8a9a5SSteve French  * update the file size (if needed) after a write. Should be called with
211638c8a9a5SSteve French  * the inode->i_lock held
211738c8a9a5SSteve French  */
211838c8a9a5SSteve French void
211938c8a9a5SSteve French cifs_update_eof(struct cifsInodeInfo *cifsi, loff_t offset,
212038c8a9a5SSteve French 		      unsigned int bytes_written)
212138c8a9a5SSteve French {
212238c8a9a5SSteve French 	loff_t end_of_write = offset + bytes_written;
212338c8a9a5SSteve French 
212438c8a9a5SSteve French 	if (end_of_write > cifsi->server_eof)
212538c8a9a5SSteve French 		cifsi->server_eof = end_of_write;
212638c8a9a5SSteve French }
212738c8a9a5SSteve French 
212838c8a9a5SSteve French static ssize_t
212938c8a9a5SSteve French cifs_write(struct cifsFileInfo *open_file, __u32 pid, const char *write_data,
213038c8a9a5SSteve French 	   size_t write_size, loff_t *offset)
213138c8a9a5SSteve French {
213238c8a9a5SSteve French 	int rc = 0;
213338c8a9a5SSteve French 	unsigned int bytes_written = 0;
213438c8a9a5SSteve French 	unsigned int total_written;
213538c8a9a5SSteve French 	struct cifs_tcon *tcon;
213638c8a9a5SSteve French 	struct TCP_Server_Info *server;
213738c8a9a5SSteve French 	unsigned int xid;
213838c8a9a5SSteve French 	struct dentry *dentry = open_file->dentry;
213938c8a9a5SSteve French 	struct cifsInodeInfo *cifsi = CIFS_I(d_inode(dentry));
214038c8a9a5SSteve French 	struct cifs_io_parms io_parms = {0};
214138c8a9a5SSteve French 
214238c8a9a5SSteve French 	cifs_dbg(FYI, "write %zd bytes to offset %lld of %pd\n",
214338c8a9a5SSteve French 		 write_size, *offset, dentry);
214438c8a9a5SSteve French 
214538c8a9a5SSteve French 	tcon = tlink_tcon(open_file->tlink);
214638c8a9a5SSteve French 	server = tcon->ses->server;
214738c8a9a5SSteve French 
214838c8a9a5SSteve French 	if (!server->ops->sync_write)
214938c8a9a5SSteve French 		return -ENOSYS;
215038c8a9a5SSteve French 
215138c8a9a5SSteve French 	xid = get_xid();
215238c8a9a5SSteve French 
215338c8a9a5SSteve French 	for (total_written = 0; write_size > total_written;
215438c8a9a5SSteve French 	     total_written += bytes_written) {
215538c8a9a5SSteve French 		rc = -EAGAIN;
215638c8a9a5SSteve French 		while (rc == -EAGAIN) {
215738c8a9a5SSteve French 			struct kvec iov[2];
215838c8a9a5SSteve French 			unsigned int len;
215938c8a9a5SSteve French 
216038c8a9a5SSteve French 			if (open_file->invalidHandle) {
216138c8a9a5SSteve French 				/* we could deadlock if we called
216238c8a9a5SSteve French 				   filemap_fdatawait from here so tell
216338c8a9a5SSteve French 				   reopen_file not to flush data to
216438c8a9a5SSteve French 				   server now */
216538c8a9a5SSteve French 				rc = cifs_reopen_file(open_file, false);
216638c8a9a5SSteve French 				if (rc != 0)
216738c8a9a5SSteve French 					break;
216838c8a9a5SSteve French 			}
216938c8a9a5SSteve French 
217038c8a9a5SSteve French 			len = min(server->ops->wp_retry_size(d_inode(dentry)),
217138c8a9a5SSteve French 				  (unsigned int)write_size - total_written);
217238c8a9a5SSteve French 			/* iov[0] is reserved for smb header */
217338c8a9a5SSteve French 			iov[1].iov_base = (char *)write_data + total_written;
217438c8a9a5SSteve French 			iov[1].iov_len = len;
217538c8a9a5SSteve French 			io_parms.pid = pid;
217638c8a9a5SSteve French 			io_parms.tcon = tcon;
217738c8a9a5SSteve French 			io_parms.offset = *offset;
217838c8a9a5SSteve French 			io_parms.length = len;
217938c8a9a5SSteve French 			rc = server->ops->sync_write(xid, &open_file->fid,
218038c8a9a5SSteve French 					&io_parms, &bytes_written, iov, 1);
218138c8a9a5SSteve French 		}
218238c8a9a5SSteve French 		if (rc || (bytes_written == 0)) {
218338c8a9a5SSteve French 			if (total_written)
218438c8a9a5SSteve French 				break;
218538c8a9a5SSteve French 			else {
218638c8a9a5SSteve French 				free_xid(xid);
218738c8a9a5SSteve French 				return rc;
218838c8a9a5SSteve French 			}
218938c8a9a5SSteve French 		} else {
219038c8a9a5SSteve French 			spin_lock(&d_inode(dentry)->i_lock);
219138c8a9a5SSteve French 			cifs_update_eof(cifsi, *offset, bytes_written);
219238c8a9a5SSteve French 			spin_unlock(&d_inode(dentry)->i_lock);
219338c8a9a5SSteve French 			*offset += bytes_written;
219438c8a9a5SSteve French 		}
219538c8a9a5SSteve French 	}
219638c8a9a5SSteve French 
219738c8a9a5SSteve French 	cifs_stats_bytes_written(tcon, total_written);
219838c8a9a5SSteve French 
219938c8a9a5SSteve French 	if (total_written > 0) {
220038c8a9a5SSteve French 		spin_lock(&d_inode(dentry)->i_lock);
220138c8a9a5SSteve French 		if (*offset > d_inode(dentry)->i_size) {
220238c8a9a5SSteve French 			i_size_write(d_inode(dentry), *offset);
220338c8a9a5SSteve French 			d_inode(dentry)->i_blocks = (512 - 1 + *offset) >> 9;
220438c8a9a5SSteve French 		}
220538c8a9a5SSteve French 		spin_unlock(&d_inode(dentry)->i_lock);
220638c8a9a5SSteve French 	}
220738c8a9a5SSteve French 	mark_inode_dirty_sync(d_inode(dentry));
220838c8a9a5SSteve French 	free_xid(xid);
220938c8a9a5SSteve French 	return total_written;
221038c8a9a5SSteve French }
221138c8a9a5SSteve French 
221238c8a9a5SSteve French struct cifsFileInfo *find_readable_file(struct cifsInodeInfo *cifs_inode,
221338c8a9a5SSteve French 					bool fsuid_only)
221438c8a9a5SSteve French {
221538c8a9a5SSteve French 	struct cifsFileInfo *open_file = NULL;
221638c8a9a5SSteve French 	struct cifs_sb_info *cifs_sb = CIFS_SB(cifs_inode->netfs.inode.i_sb);
221738c8a9a5SSteve French 
221838c8a9a5SSteve French 	/* only filter by fsuid on multiuser mounts */
221938c8a9a5SSteve French 	if (!(cifs_sb->mnt_cifs_flags & CIFS_MOUNT_MULTIUSER))
222038c8a9a5SSteve French 		fsuid_only = false;
222138c8a9a5SSteve French 
222238c8a9a5SSteve French 	spin_lock(&cifs_inode->open_file_lock);
222338c8a9a5SSteve French 	/* we could simply get the first_list_entry since write-only entries
222438c8a9a5SSteve French 	   are always at the end of the list but since the first entry might
222538c8a9a5SSteve French 	   have a close pending, we go through the whole list */
222638c8a9a5SSteve French 	list_for_each_entry(open_file, &cifs_inode->openFileList, flist) {
222738c8a9a5SSteve French 		if (fsuid_only && !uid_eq(open_file->uid, current_fsuid()))
222838c8a9a5SSteve French 			continue;
222938c8a9a5SSteve French 		if (OPEN_FMODE(open_file->f_flags) & FMODE_READ) {
223038c8a9a5SSteve French 			if ((!open_file->invalidHandle)) {
223138c8a9a5SSteve French 				/* found a good file */
223238c8a9a5SSteve French 				/* lock it so it will not be closed on us */
223338c8a9a5SSteve French 				cifsFileInfo_get(open_file);
223438c8a9a5SSteve French 				spin_unlock(&cifs_inode->open_file_lock);
223538c8a9a5SSteve French 				return open_file;
223638c8a9a5SSteve French 			} /* else might as well continue, and look for
223738c8a9a5SSteve French 			     another, or simply have the caller reopen it
223838c8a9a5SSteve French 			     again rather than trying to fix this handle */
223938c8a9a5SSteve French 		} else /* write only file */
224038c8a9a5SSteve French 			break; /* write only files are last so must be done */
224138c8a9a5SSteve French 	}
224238c8a9a5SSteve French 	spin_unlock(&cifs_inode->open_file_lock);
224338c8a9a5SSteve French 	return NULL;
224438c8a9a5SSteve French }
224538c8a9a5SSteve French 
224638c8a9a5SSteve French /* Return -EBADF if no handle is found and general rc otherwise */
224738c8a9a5SSteve French int
224838c8a9a5SSteve French cifs_get_writable_file(struct cifsInodeInfo *cifs_inode, int flags,
224938c8a9a5SSteve French 		       struct cifsFileInfo **ret_file)
225038c8a9a5SSteve French {
225138c8a9a5SSteve French 	struct cifsFileInfo *open_file, *inv_file = NULL;
225238c8a9a5SSteve French 	struct cifs_sb_info *cifs_sb;
225338c8a9a5SSteve French 	bool any_available = false;
225438c8a9a5SSteve French 	int rc = -EBADF;
225538c8a9a5SSteve French 	unsigned int refind = 0;
225638c8a9a5SSteve French 	bool fsuid_only = flags & FIND_WR_FSUID_ONLY;
225738c8a9a5SSteve French 	bool with_delete = flags & FIND_WR_WITH_DELETE;
225838c8a9a5SSteve French 	*ret_file = NULL;
225938c8a9a5SSteve French 
226038c8a9a5SSteve French 	/*
226138c8a9a5SSteve French 	 * Having a null inode here (because mapping->host was set to zero by
226238c8a9a5SSteve French 	 * the VFS or MM) should not happen but we had reports of on oops (due
226338c8a9a5SSteve French 	 * to it being zero) during stress testcases so we need to check for it
226438c8a9a5SSteve French 	 */
226538c8a9a5SSteve French 
226638c8a9a5SSteve French 	if (cifs_inode == NULL) {
226738c8a9a5SSteve French 		cifs_dbg(VFS, "Null inode passed to cifs_writeable_file\n");
226838c8a9a5SSteve French 		dump_stack();
226938c8a9a5SSteve French 		return rc;
227038c8a9a5SSteve French 	}
227138c8a9a5SSteve French 
227238c8a9a5SSteve French 	cifs_sb = CIFS_SB(cifs_inode->netfs.inode.i_sb);
227338c8a9a5SSteve French 
227438c8a9a5SSteve French 	/* only filter by fsuid on multiuser mounts */
227538c8a9a5SSteve French 	if (!(cifs_sb->mnt_cifs_flags & CIFS_MOUNT_MULTIUSER))
227638c8a9a5SSteve French 		fsuid_only = false;
227738c8a9a5SSteve French 
227838c8a9a5SSteve French 	spin_lock(&cifs_inode->open_file_lock);
227938c8a9a5SSteve French refind_writable:
228038c8a9a5SSteve French 	if (refind > MAX_REOPEN_ATT) {
228138c8a9a5SSteve French 		spin_unlock(&cifs_inode->open_file_lock);
228238c8a9a5SSteve French 		return rc;
228338c8a9a5SSteve French 	}
228438c8a9a5SSteve French 	list_for_each_entry(open_file, &cifs_inode->openFileList, flist) {
228538c8a9a5SSteve French 		if (!any_available && open_file->pid != current->tgid)
228638c8a9a5SSteve French 			continue;
228738c8a9a5SSteve French 		if (fsuid_only && !uid_eq(open_file->uid, current_fsuid()))
228838c8a9a5SSteve French 			continue;
228938c8a9a5SSteve French 		if (with_delete && !(open_file->fid.access & DELETE))
229038c8a9a5SSteve French 			continue;
229138c8a9a5SSteve French 		if (OPEN_FMODE(open_file->f_flags) & FMODE_WRITE) {
229238c8a9a5SSteve French 			if (!open_file->invalidHandle) {
229338c8a9a5SSteve French 				/* found a good writable file */
229438c8a9a5SSteve French 				cifsFileInfo_get(open_file);
229538c8a9a5SSteve French 				spin_unlock(&cifs_inode->open_file_lock);
229638c8a9a5SSteve French 				*ret_file = open_file;
229738c8a9a5SSteve French 				return 0;
229838c8a9a5SSteve French 			} else {
229938c8a9a5SSteve French 				if (!inv_file)
230038c8a9a5SSteve French 					inv_file = open_file;
230138c8a9a5SSteve French 			}
230238c8a9a5SSteve French 		}
230338c8a9a5SSteve French 	}
230438c8a9a5SSteve French 	/* couldn't find useable FH with same pid, try any available */
230538c8a9a5SSteve French 	if (!any_available) {
230638c8a9a5SSteve French 		any_available = true;
230738c8a9a5SSteve French 		goto refind_writable;
230838c8a9a5SSteve French 	}
230938c8a9a5SSteve French 
231038c8a9a5SSteve French 	if (inv_file) {
231138c8a9a5SSteve French 		any_available = false;
231238c8a9a5SSteve French 		cifsFileInfo_get(inv_file);
231338c8a9a5SSteve French 	}
231438c8a9a5SSteve French 
231538c8a9a5SSteve French 	spin_unlock(&cifs_inode->open_file_lock);
231638c8a9a5SSteve French 
231738c8a9a5SSteve French 	if (inv_file) {
231838c8a9a5SSteve French 		rc = cifs_reopen_file(inv_file, false);
231938c8a9a5SSteve French 		if (!rc) {
232038c8a9a5SSteve French 			*ret_file = inv_file;
232138c8a9a5SSteve French 			return 0;
232238c8a9a5SSteve French 		}
232338c8a9a5SSteve French 
232438c8a9a5SSteve French 		spin_lock(&cifs_inode->open_file_lock);
232538c8a9a5SSteve French 		list_move_tail(&inv_file->flist, &cifs_inode->openFileList);
232638c8a9a5SSteve French 		spin_unlock(&cifs_inode->open_file_lock);
232738c8a9a5SSteve French 		cifsFileInfo_put(inv_file);
232838c8a9a5SSteve French 		++refind;
232938c8a9a5SSteve French 		inv_file = NULL;
233038c8a9a5SSteve French 		spin_lock(&cifs_inode->open_file_lock);
233138c8a9a5SSteve French 		goto refind_writable;
233238c8a9a5SSteve French 	}
233338c8a9a5SSteve French 
233438c8a9a5SSteve French 	return rc;
233538c8a9a5SSteve French }
233638c8a9a5SSteve French 
233738c8a9a5SSteve French struct cifsFileInfo *
233838c8a9a5SSteve French find_writable_file(struct cifsInodeInfo *cifs_inode, int flags)
233938c8a9a5SSteve French {
234038c8a9a5SSteve French 	struct cifsFileInfo *cfile;
234138c8a9a5SSteve French 	int rc;
234238c8a9a5SSteve French 
234338c8a9a5SSteve French 	rc = cifs_get_writable_file(cifs_inode, flags, &cfile);
234438c8a9a5SSteve French 	if (rc)
234538c8a9a5SSteve French 		cifs_dbg(FYI, "Couldn't find writable handle rc=%d\n", rc);
234638c8a9a5SSteve French 
234738c8a9a5SSteve French 	return cfile;
234838c8a9a5SSteve French }
234938c8a9a5SSteve French 
235038c8a9a5SSteve French int
235138c8a9a5SSteve French cifs_get_writable_path(struct cifs_tcon *tcon, const char *name,
235238c8a9a5SSteve French 		       int flags,
235338c8a9a5SSteve French 		       struct cifsFileInfo **ret_file)
235438c8a9a5SSteve French {
235538c8a9a5SSteve French 	struct cifsFileInfo *cfile;
235638c8a9a5SSteve French 	void *page = alloc_dentry_path();
235738c8a9a5SSteve French 
235838c8a9a5SSteve French 	*ret_file = NULL;
235938c8a9a5SSteve French 
236038c8a9a5SSteve French 	spin_lock(&tcon->open_file_lock);
236138c8a9a5SSteve French 	list_for_each_entry(cfile, &tcon->openFileList, tlist) {
236238c8a9a5SSteve French 		struct cifsInodeInfo *cinode;
236338c8a9a5SSteve French 		const char *full_path = build_path_from_dentry(cfile->dentry, page);
236438c8a9a5SSteve French 		if (IS_ERR(full_path)) {
236538c8a9a5SSteve French 			spin_unlock(&tcon->open_file_lock);
236638c8a9a5SSteve French 			free_dentry_path(page);
236738c8a9a5SSteve French 			return PTR_ERR(full_path);
236838c8a9a5SSteve French 		}
236938c8a9a5SSteve French 		if (strcmp(full_path, name))
237038c8a9a5SSteve French 			continue;
237138c8a9a5SSteve French 
237238c8a9a5SSteve French 		cinode = CIFS_I(d_inode(cfile->dentry));
237338c8a9a5SSteve French 		spin_unlock(&tcon->open_file_lock);
237438c8a9a5SSteve French 		free_dentry_path(page);
237538c8a9a5SSteve French 		return cifs_get_writable_file(cinode, flags, ret_file);
237638c8a9a5SSteve French 	}
237738c8a9a5SSteve French 
237838c8a9a5SSteve French 	spin_unlock(&tcon->open_file_lock);
237938c8a9a5SSteve French 	free_dentry_path(page);
238038c8a9a5SSteve French 	return -ENOENT;
238138c8a9a5SSteve French }
238238c8a9a5SSteve French 
238338c8a9a5SSteve French int
238438c8a9a5SSteve French cifs_get_readable_path(struct cifs_tcon *tcon, const char *name,
238538c8a9a5SSteve French 		       struct cifsFileInfo **ret_file)
238638c8a9a5SSteve French {
238738c8a9a5SSteve French 	struct cifsFileInfo *cfile;
238838c8a9a5SSteve French 	void *page = alloc_dentry_path();
238938c8a9a5SSteve French 
239038c8a9a5SSteve French 	*ret_file = NULL;
239138c8a9a5SSteve French 
239238c8a9a5SSteve French 	spin_lock(&tcon->open_file_lock);
239338c8a9a5SSteve French 	list_for_each_entry(cfile, &tcon->openFileList, tlist) {
239438c8a9a5SSteve French 		struct cifsInodeInfo *cinode;
239538c8a9a5SSteve French 		const char *full_path = build_path_from_dentry(cfile->dentry, page);
239638c8a9a5SSteve French 		if (IS_ERR(full_path)) {
239738c8a9a5SSteve French 			spin_unlock(&tcon->open_file_lock);
239838c8a9a5SSteve French 			free_dentry_path(page);
239938c8a9a5SSteve French 			return PTR_ERR(full_path);
240038c8a9a5SSteve French 		}
240138c8a9a5SSteve French 		if (strcmp(full_path, name))
240238c8a9a5SSteve French 			continue;
240338c8a9a5SSteve French 
240438c8a9a5SSteve French 		cinode = CIFS_I(d_inode(cfile->dentry));
240538c8a9a5SSteve French 		spin_unlock(&tcon->open_file_lock);
240638c8a9a5SSteve French 		free_dentry_path(page);
240738c8a9a5SSteve French 		*ret_file = find_readable_file(cinode, 0);
240838c8a9a5SSteve French 		return *ret_file ? 0 : -ENOENT;
240938c8a9a5SSteve French 	}
241038c8a9a5SSteve French 
241138c8a9a5SSteve French 	spin_unlock(&tcon->open_file_lock);
241238c8a9a5SSteve French 	free_dentry_path(page);
241338c8a9a5SSteve French 	return -ENOENT;
241438c8a9a5SSteve French }
241538c8a9a5SSteve French 
241638c8a9a5SSteve French void
241738c8a9a5SSteve French cifs_writedata_release(struct kref *refcount)
241838c8a9a5SSteve French {
241938c8a9a5SSteve French 	struct cifs_writedata *wdata = container_of(refcount,
242038c8a9a5SSteve French 					struct cifs_writedata, refcount);
242138c8a9a5SSteve French #ifdef CONFIG_CIFS_SMB_DIRECT
242238c8a9a5SSteve French 	if (wdata->mr) {
242338c8a9a5SSteve French 		smbd_deregister_mr(wdata->mr);
242438c8a9a5SSteve French 		wdata->mr = NULL;
242538c8a9a5SSteve French 	}
242638c8a9a5SSteve French #endif
242738c8a9a5SSteve French 
242838c8a9a5SSteve French 	if (wdata->cfile)
242938c8a9a5SSteve French 		cifsFileInfo_put(wdata->cfile);
243038c8a9a5SSteve French 
243138c8a9a5SSteve French 	kfree(wdata);
243238c8a9a5SSteve French }
243338c8a9a5SSteve French 
243438c8a9a5SSteve French /*
243538c8a9a5SSteve French  * Write failed with a retryable error. Resend the write request. It's also
243638c8a9a5SSteve French  * possible that the page was redirtied so re-clean the page.
243738c8a9a5SSteve French  */
243838c8a9a5SSteve French static void
243938c8a9a5SSteve French cifs_writev_requeue(struct cifs_writedata *wdata)
244038c8a9a5SSteve French {
244138c8a9a5SSteve French 	int rc = 0;
244238c8a9a5SSteve French 	struct inode *inode = d_inode(wdata->cfile->dentry);
244338c8a9a5SSteve French 	struct TCP_Server_Info *server;
244438c8a9a5SSteve French 	unsigned int rest_len = wdata->bytes;
244538c8a9a5SSteve French 	loff_t fpos = wdata->offset;
244638c8a9a5SSteve French 
244738c8a9a5SSteve French 	server = tlink_tcon(wdata->cfile->tlink)->ses->server;
244838c8a9a5SSteve French 	do {
244938c8a9a5SSteve French 		struct cifs_writedata *wdata2;
245038c8a9a5SSteve French 		unsigned int wsize, cur_len;
245138c8a9a5SSteve French 
245238c8a9a5SSteve French 		wsize = server->ops->wp_retry_size(inode);
245338c8a9a5SSteve French 		if (wsize < rest_len) {
245438c8a9a5SSteve French 			if (wsize < PAGE_SIZE) {
245538c8a9a5SSteve French 				rc = -EOPNOTSUPP;
245638c8a9a5SSteve French 				break;
245738c8a9a5SSteve French 			}
245838c8a9a5SSteve French 			cur_len = min(round_down(wsize, PAGE_SIZE), rest_len);
245938c8a9a5SSteve French 		} else {
246038c8a9a5SSteve French 			cur_len = rest_len;
246138c8a9a5SSteve French 		}
246238c8a9a5SSteve French 
246338c8a9a5SSteve French 		wdata2 = cifs_writedata_alloc(cifs_writev_complete);
246438c8a9a5SSteve French 		if (!wdata2) {
246538c8a9a5SSteve French 			rc = -ENOMEM;
246638c8a9a5SSteve French 			break;
246738c8a9a5SSteve French 		}
246838c8a9a5SSteve French 
246938c8a9a5SSteve French 		wdata2->sync_mode = wdata->sync_mode;
247038c8a9a5SSteve French 		wdata2->offset	= fpos;
247138c8a9a5SSteve French 		wdata2->bytes	= cur_len;
247238c8a9a5SSteve French 		wdata2->iter	= wdata->iter;
247338c8a9a5SSteve French 
247438c8a9a5SSteve French 		iov_iter_advance(&wdata2->iter, fpos - wdata->offset);
247538c8a9a5SSteve French 		iov_iter_truncate(&wdata2->iter, wdata2->bytes);
247638c8a9a5SSteve French 
247738c8a9a5SSteve French 		if (iov_iter_is_xarray(&wdata2->iter))
247838c8a9a5SSteve French 			/* Check for pages having been redirtied and clean
247938c8a9a5SSteve French 			 * them.  We can do this by walking the xarray.  If
248038c8a9a5SSteve French 			 * it's not an xarray, then it's a DIO and we shouldn't
248138c8a9a5SSteve French 			 * be mucking around with the page bits.
248238c8a9a5SSteve French 			 */
248338c8a9a5SSteve French 			cifs_undirty_folios(inode, fpos, cur_len);
248438c8a9a5SSteve French 
248538c8a9a5SSteve French 		rc = cifs_get_writable_file(CIFS_I(inode), FIND_WR_ANY,
248638c8a9a5SSteve French 					    &wdata2->cfile);
248738c8a9a5SSteve French 		if (!wdata2->cfile) {
248838c8a9a5SSteve French 			cifs_dbg(VFS, "No writable handle to retry writepages rc=%d\n",
248938c8a9a5SSteve French 				 rc);
249038c8a9a5SSteve French 			if (!is_retryable_error(rc))
249138c8a9a5SSteve French 				rc = -EBADF;
249238c8a9a5SSteve French 		} else {
249338c8a9a5SSteve French 			wdata2->pid = wdata2->cfile->pid;
249438c8a9a5SSteve French 			rc = server->ops->async_writev(wdata2,
249538c8a9a5SSteve French 						       cifs_writedata_release);
249638c8a9a5SSteve French 		}
249738c8a9a5SSteve French 
249838c8a9a5SSteve French 		kref_put(&wdata2->refcount, cifs_writedata_release);
249938c8a9a5SSteve French 		if (rc) {
250038c8a9a5SSteve French 			if (is_retryable_error(rc))
250138c8a9a5SSteve French 				continue;
250238c8a9a5SSteve French 			fpos += cur_len;
250338c8a9a5SSteve French 			rest_len -= cur_len;
250438c8a9a5SSteve French 			break;
250538c8a9a5SSteve French 		}
250638c8a9a5SSteve French 
250738c8a9a5SSteve French 		fpos += cur_len;
250838c8a9a5SSteve French 		rest_len -= cur_len;
250938c8a9a5SSteve French 	} while (rest_len > 0);
251038c8a9a5SSteve French 
251138c8a9a5SSteve French 	/* Clean up remaining pages from the original wdata */
251238c8a9a5SSteve French 	if (iov_iter_is_xarray(&wdata->iter))
251338c8a9a5SSteve French 		cifs_pages_write_failed(inode, fpos, rest_len);
251438c8a9a5SSteve French 
251538c8a9a5SSteve French 	if (rc != 0 && !is_retryable_error(rc))
251638c8a9a5SSteve French 		mapping_set_error(inode->i_mapping, rc);
251738c8a9a5SSteve French 	kref_put(&wdata->refcount, cifs_writedata_release);
251838c8a9a5SSteve French }
251938c8a9a5SSteve French 
252038c8a9a5SSteve French void
252138c8a9a5SSteve French cifs_writev_complete(struct work_struct *work)
252238c8a9a5SSteve French {
252338c8a9a5SSteve French 	struct cifs_writedata *wdata = container_of(work,
252438c8a9a5SSteve French 						struct cifs_writedata, work);
252538c8a9a5SSteve French 	struct inode *inode = d_inode(wdata->cfile->dentry);
252638c8a9a5SSteve French 
252738c8a9a5SSteve French 	if (wdata->result == 0) {
252838c8a9a5SSteve French 		spin_lock(&inode->i_lock);
252938c8a9a5SSteve French 		cifs_update_eof(CIFS_I(inode), wdata->offset, wdata->bytes);
253038c8a9a5SSteve French 		spin_unlock(&inode->i_lock);
253138c8a9a5SSteve French 		cifs_stats_bytes_written(tlink_tcon(wdata->cfile->tlink),
253238c8a9a5SSteve French 					 wdata->bytes);
253338c8a9a5SSteve French 	} else if (wdata->sync_mode == WB_SYNC_ALL && wdata->result == -EAGAIN)
253438c8a9a5SSteve French 		return cifs_writev_requeue(wdata);
253538c8a9a5SSteve French 
253638c8a9a5SSteve French 	if (wdata->result == -EAGAIN)
253738c8a9a5SSteve French 		cifs_pages_write_redirty(inode, wdata->offset, wdata->bytes);
253838c8a9a5SSteve French 	else if (wdata->result < 0)
253938c8a9a5SSteve French 		cifs_pages_write_failed(inode, wdata->offset, wdata->bytes);
254038c8a9a5SSteve French 	else
254138c8a9a5SSteve French 		cifs_pages_written_back(inode, wdata->offset, wdata->bytes);
254238c8a9a5SSteve French 
254338c8a9a5SSteve French 	if (wdata->result != -EAGAIN)
254438c8a9a5SSteve French 		mapping_set_error(inode->i_mapping, wdata->result);
254538c8a9a5SSteve French 	kref_put(&wdata->refcount, cifs_writedata_release);
254638c8a9a5SSteve French }
254738c8a9a5SSteve French 
254838c8a9a5SSteve French struct cifs_writedata *cifs_writedata_alloc(work_func_t complete)
254938c8a9a5SSteve French {
255038c8a9a5SSteve French 	struct cifs_writedata *wdata;
255138c8a9a5SSteve French 
255238c8a9a5SSteve French 	wdata = kzalloc(sizeof(*wdata), GFP_NOFS);
255338c8a9a5SSteve French 	if (wdata != NULL) {
255438c8a9a5SSteve French 		kref_init(&wdata->refcount);
255538c8a9a5SSteve French 		INIT_LIST_HEAD(&wdata->list);
255638c8a9a5SSteve French 		init_completion(&wdata->done);
255738c8a9a5SSteve French 		INIT_WORK(&wdata->work, complete);
255838c8a9a5SSteve French 	}
255938c8a9a5SSteve French 	return wdata;
256038c8a9a5SSteve French }
256138c8a9a5SSteve French 
256238c8a9a5SSteve French static int cifs_partialpagewrite(struct page *page, unsigned from, unsigned to)
256338c8a9a5SSteve French {
256438c8a9a5SSteve French 	struct address_space *mapping = page->mapping;
256538c8a9a5SSteve French 	loff_t offset = (loff_t)page->index << PAGE_SHIFT;
256638c8a9a5SSteve French 	char *write_data;
256738c8a9a5SSteve French 	int rc = -EFAULT;
256838c8a9a5SSteve French 	int bytes_written = 0;
256938c8a9a5SSteve French 	struct inode *inode;
257038c8a9a5SSteve French 	struct cifsFileInfo *open_file;
257138c8a9a5SSteve French 
257238c8a9a5SSteve French 	if (!mapping || !mapping->host)
257338c8a9a5SSteve French 		return -EFAULT;
257438c8a9a5SSteve French 
257538c8a9a5SSteve French 	inode = page->mapping->host;
257638c8a9a5SSteve French 
257738c8a9a5SSteve French 	offset += (loff_t)from;
257838c8a9a5SSteve French 	write_data = kmap(page);
257938c8a9a5SSteve French 	write_data += from;
258038c8a9a5SSteve French 
258138c8a9a5SSteve French 	if ((to > PAGE_SIZE) || (from > to)) {
258238c8a9a5SSteve French 		kunmap(page);
258338c8a9a5SSteve French 		return -EIO;
258438c8a9a5SSteve French 	}
258538c8a9a5SSteve French 
258638c8a9a5SSteve French 	/* racing with truncate? */
258738c8a9a5SSteve French 	if (offset > mapping->host->i_size) {
258838c8a9a5SSteve French 		kunmap(page);
258938c8a9a5SSteve French 		return 0; /* don't care */
259038c8a9a5SSteve French 	}
259138c8a9a5SSteve French 
259238c8a9a5SSteve French 	/* check to make sure that we are not extending the file */
259338c8a9a5SSteve French 	if (mapping->host->i_size - offset < (loff_t)to)
259438c8a9a5SSteve French 		to = (unsigned)(mapping->host->i_size - offset);
259538c8a9a5SSteve French 
259638c8a9a5SSteve French 	rc = cifs_get_writable_file(CIFS_I(mapping->host), FIND_WR_ANY,
259738c8a9a5SSteve French 				    &open_file);
259838c8a9a5SSteve French 	if (!rc) {
259938c8a9a5SSteve French 		bytes_written = cifs_write(open_file, open_file->pid,
260038c8a9a5SSteve French 					   write_data, to - from, &offset);
260138c8a9a5SSteve French 		cifsFileInfo_put(open_file);
260238c8a9a5SSteve French 		/* Does mm or vfs already set times? */
260323171df5SJeff Layton 		simple_inode_init_ts(inode);
260438c8a9a5SSteve French 		if ((bytes_written > 0) && (offset))
260538c8a9a5SSteve French 			rc = 0;
260638c8a9a5SSteve French 		else if (bytes_written < 0)
260738c8a9a5SSteve French 			rc = bytes_written;
260838c8a9a5SSteve French 		else
260938c8a9a5SSteve French 			rc = -EFAULT;
261038c8a9a5SSteve French 	} else {
261138c8a9a5SSteve French 		cifs_dbg(FYI, "No writable handle for write page rc=%d\n", rc);
261238c8a9a5SSteve French 		if (!is_retryable_error(rc))
261338c8a9a5SSteve French 			rc = -EIO;
261438c8a9a5SSteve French 	}
261538c8a9a5SSteve French 
261638c8a9a5SSteve French 	kunmap(page);
261738c8a9a5SSteve French 	return rc;
261838c8a9a5SSteve French }
261938c8a9a5SSteve French 
262038c8a9a5SSteve French /*
262138c8a9a5SSteve French  * Extend the region to be written back to include subsequent contiguously
262238c8a9a5SSteve French  * dirty pages if possible, but don't sleep while doing so.
262338c8a9a5SSteve French  */
262438c8a9a5SSteve French static void cifs_extend_writeback(struct address_space *mapping,
262538c8a9a5SSteve French 				  long *_count,
262638c8a9a5SSteve French 				  loff_t start,
262738c8a9a5SSteve French 				  int max_pages,
262838c8a9a5SSteve French 				  size_t max_len,
262938c8a9a5SSteve French 				  unsigned int *_len)
263038c8a9a5SSteve French {
263138c8a9a5SSteve French 	struct folio_batch batch;
263238c8a9a5SSteve French 	struct folio *folio;
263338c8a9a5SSteve French 	unsigned int psize, nr_pages;
263438c8a9a5SSteve French 	size_t len = *_len;
263538c8a9a5SSteve French 	pgoff_t index = (start + len) / PAGE_SIZE;
263638c8a9a5SSteve French 	bool stop = true;
263738c8a9a5SSteve French 	unsigned int i;
263838c8a9a5SSteve French 	XA_STATE(xas, &mapping->i_pages, index);
263938c8a9a5SSteve French 
264038c8a9a5SSteve French 	folio_batch_init(&batch);
264138c8a9a5SSteve French 
264238c8a9a5SSteve French 	do {
264338c8a9a5SSteve French 		/* Firstly, we gather up a batch of contiguous dirty pages
264438c8a9a5SSteve French 		 * under the RCU read lock - but we can't clear the dirty flags
264538c8a9a5SSteve French 		 * there if any of those pages are mapped.
264638c8a9a5SSteve French 		 */
264738c8a9a5SSteve French 		rcu_read_lock();
264838c8a9a5SSteve French 
264938c8a9a5SSteve French 		xas_for_each(&xas, folio, ULONG_MAX) {
265038c8a9a5SSteve French 			stop = true;
265138c8a9a5SSteve French 			if (xas_retry(&xas, folio))
265238c8a9a5SSteve French 				continue;
265338c8a9a5SSteve French 			if (xa_is_value(folio))
265438c8a9a5SSteve French 				break;
265538c8a9a5SSteve French 			if (folio_index(folio) != index)
265638c8a9a5SSteve French 				break;
265738c8a9a5SSteve French 			if (!folio_try_get_rcu(folio)) {
265838c8a9a5SSteve French 				xas_reset(&xas);
265938c8a9a5SSteve French 				continue;
266038c8a9a5SSteve French 			}
266138c8a9a5SSteve French 			nr_pages = folio_nr_pages(folio);
266238c8a9a5SSteve French 			if (nr_pages > max_pages)
266338c8a9a5SSteve French 				break;
266438c8a9a5SSteve French 
266538c8a9a5SSteve French 			/* Has the page moved or been split? */
266638c8a9a5SSteve French 			if (unlikely(folio != xas_reload(&xas))) {
266738c8a9a5SSteve French 				folio_put(folio);
266838c8a9a5SSteve French 				break;
266938c8a9a5SSteve French 			}
267038c8a9a5SSteve French 
267138c8a9a5SSteve French 			if (!folio_trylock(folio)) {
267238c8a9a5SSteve French 				folio_put(folio);
267338c8a9a5SSteve French 				break;
267438c8a9a5SSteve French 			}
267538c8a9a5SSteve French 			if (!folio_test_dirty(folio) || folio_test_writeback(folio)) {
267638c8a9a5SSteve French 				folio_unlock(folio);
267738c8a9a5SSteve French 				folio_put(folio);
267838c8a9a5SSteve French 				break;
267938c8a9a5SSteve French 			}
268038c8a9a5SSteve French 
268138c8a9a5SSteve French 			max_pages -= nr_pages;
268238c8a9a5SSteve French 			psize = folio_size(folio);
268338c8a9a5SSteve French 			len += psize;
268438c8a9a5SSteve French 			stop = false;
268538c8a9a5SSteve French 			if (max_pages <= 0 || len >= max_len || *_count <= 0)
268638c8a9a5SSteve French 				stop = true;
268738c8a9a5SSteve French 
268838c8a9a5SSteve French 			index += nr_pages;
268938c8a9a5SSteve French 			if (!folio_batch_add(&batch, folio))
269038c8a9a5SSteve French 				break;
269138c8a9a5SSteve French 			if (stop)
269238c8a9a5SSteve French 				break;
269338c8a9a5SSteve French 		}
269438c8a9a5SSteve French 
269538c8a9a5SSteve French 		if (!stop)
269638c8a9a5SSteve French 			xas_pause(&xas);
269738c8a9a5SSteve French 		rcu_read_unlock();
269838c8a9a5SSteve French 
269938c8a9a5SSteve French 		/* Now, if we obtained any pages, we can shift them to being
270038c8a9a5SSteve French 		 * writable and mark them for caching.
270138c8a9a5SSteve French 		 */
270238c8a9a5SSteve French 		if (!folio_batch_count(&batch))
270338c8a9a5SSteve French 			break;
270438c8a9a5SSteve French 
270538c8a9a5SSteve French 		for (i = 0; i < folio_batch_count(&batch); i++) {
270638c8a9a5SSteve French 			folio = batch.folios[i];
270738c8a9a5SSteve French 			/* The folio should be locked, dirty and not undergoing
270838c8a9a5SSteve French 			 * writeback from the loop above.
270938c8a9a5SSteve French 			 */
271038c8a9a5SSteve French 			if (!folio_clear_dirty_for_io(folio))
271138c8a9a5SSteve French 				WARN_ON(1);
271238c8a9a5SSteve French 			if (folio_start_writeback(folio))
271338c8a9a5SSteve French 				WARN_ON(1);
271438c8a9a5SSteve French 
271538c8a9a5SSteve French 			*_count -= folio_nr_pages(folio);
271638c8a9a5SSteve French 			folio_unlock(folio);
271738c8a9a5SSteve French 		}
271838c8a9a5SSteve French 
271938c8a9a5SSteve French 		folio_batch_release(&batch);
272038c8a9a5SSteve French 		cond_resched();
272138c8a9a5SSteve French 	} while (!stop);
272238c8a9a5SSteve French 
272338c8a9a5SSteve French 	*_len = len;
272438c8a9a5SSteve French }
272538c8a9a5SSteve French 
272638c8a9a5SSteve French /*
272738c8a9a5SSteve French  * Write back the locked page and any subsequent non-locked dirty pages.
272838c8a9a5SSteve French  */
272938c8a9a5SSteve French static ssize_t cifs_write_back_from_locked_folio(struct address_space *mapping,
273038c8a9a5SSteve French 						 struct writeback_control *wbc,
273138c8a9a5SSteve French 						 struct folio *folio,
273238c8a9a5SSteve French 						 loff_t start, loff_t end)
273338c8a9a5SSteve French {
273438c8a9a5SSteve French 	struct inode *inode = mapping->host;
273538c8a9a5SSteve French 	struct TCP_Server_Info *server;
273638c8a9a5SSteve French 	struct cifs_writedata *wdata;
273738c8a9a5SSteve French 	struct cifs_sb_info *cifs_sb = CIFS_SB(inode->i_sb);
273838c8a9a5SSteve French 	struct cifs_credits credits_on_stack;
273938c8a9a5SSteve French 	struct cifs_credits *credits = &credits_on_stack;
274038c8a9a5SSteve French 	struct cifsFileInfo *cfile = NULL;
274138c8a9a5SSteve French 	unsigned int xid, wsize, len;
274238c8a9a5SSteve French 	loff_t i_size = i_size_read(inode);
274338c8a9a5SSteve French 	size_t max_len;
274438c8a9a5SSteve French 	long count = wbc->nr_to_write;
274538c8a9a5SSteve French 	int rc;
274638c8a9a5SSteve French 
274738c8a9a5SSteve French 	/* The folio should be locked, dirty and not undergoing writeback. */
274838c8a9a5SSteve French 	if (folio_start_writeback(folio))
274938c8a9a5SSteve French 		WARN_ON(1);
275038c8a9a5SSteve French 
275138c8a9a5SSteve French 	count -= folio_nr_pages(folio);
275238c8a9a5SSteve French 	len = folio_size(folio);
275338c8a9a5SSteve French 
275438c8a9a5SSteve French 	xid = get_xid();
275538c8a9a5SSteve French 	server = cifs_pick_channel(cifs_sb_master_tcon(cifs_sb)->ses);
275638c8a9a5SSteve French 
275738c8a9a5SSteve French 	rc = cifs_get_writable_file(CIFS_I(inode), FIND_WR_ANY, &cfile);
275838c8a9a5SSteve French 	if (rc) {
275938c8a9a5SSteve French 		cifs_dbg(VFS, "No writable handle in writepages rc=%d\n", rc);
276038c8a9a5SSteve French 		goto err_xid;
276138c8a9a5SSteve French 	}
276238c8a9a5SSteve French 
276338c8a9a5SSteve French 	rc = server->ops->wait_mtu_credits(server, cifs_sb->ctx->wsize,
276438c8a9a5SSteve French 					   &wsize, credits);
276538c8a9a5SSteve French 	if (rc != 0)
276638c8a9a5SSteve French 		goto err_close;
276738c8a9a5SSteve French 
276838c8a9a5SSteve French 	wdata = cifs_writedata_alloc(cifs_writev_complete);
276938c8a9a5SSteve French 	if (!wdata) {
277038c8a9a5SSteve French 		rc = -ENOMEM;
277138c8a9a5SSteve French 		goto err_uncredit;
277238c8a9a5SSteve French 	}
277338c8a9a5SSteve French 
277438c8a9a5SSteve French 	wdata->sync_mode = wbc->sync_mode;
277538c8a9a5SSteve French 	wdata->offset = folio_pos(folio);
277638c8a9a5SSteve French 	wdata->pid = cfile->pid;
277738c8a9a5SSteve French 	wdata->credits = credits_on_stack;
277838c8a9a5SSteve French 	wdata->cfile = cfile;
277938c8a9a5SSteve French 	wdata->server = server;
278038c8a9a5SSteve French 	cfile = NULL;
278138c8a9a5SSteve French 
278238c8a9a5SSteve French 	/* Find all consecutive lockable dirty pages, stopping when we find a
278338c8a9a5SSteve French 	 * page that is not immediately lockable, is not dirty or is missing,
278438c8a9a5SSteve French 	 * or we reach the end of the range.
278538c8a9a5SSteve French 	 */
278638c8a9a5SSteve French 	if (start < i_size) {
278738c8a9a5SSteve French 		/* Trim the write to the EOF; the extra data is ignored.  Also
278838c8a9a5SSteve French 		 * put an upper limit on the size of a single storedata op.
278938c8a9a5SSteve French 		 */
279038c8a9a5SSteve French 		max_len = wsize;
279138c8a9a5SSteve French 		max_len = min_t(unsigned long long, max_len, end - start + 1);
279238c8a9a5SSteve French 		max_len = min_t(unsigned long long, max_len, i_size - start);
279338c8a9a5SSteve French 
279438c8a9a5SSteve French 		if (len < max_len) {
279538c8a9a5SSteve French 			int max_pages = INT_MAX;
279638c8a9a5SSteve French 
279738c8a9a5SSteve French #ifdef CONFIG_CIFS_SMB_DIRECT
279838c8a9a5SSteve French 			if (server->smbd_conn)
279938c8a9a5SSteve French 				max_pages = server->smbd_conn->max_frmr_depth;
280038c8a9a5SSteve French #endif
280138c8a9a5SSteve French 			max_pages -= folio_nr_pages(folio);
280238c8a9a5SSteve French 
280338c8a9a5SSteve French 			if (max_pages > 0)
280438c8a9a5SSteve French 				cifs_extend_writeback(mapping, &count, start,
280538c8a9a5SSteve French 						      max_pages, max_len, &len);
280638c8a9a5SSteve French 		}
280738c8a9a5SSteve French 		len = min_t(loff_t, len, max_len);
280838c8a9a5SSteve French 	}
280938c8a9a5SSteve French 
281038c8a9a5SSteve French 	wdata->bytes = len;
281138c8a9a5SSteve French 
281238c8a9a5SSteve French 	/* We now have a contiguous set of dirty pages, each with writeback
281338c8a9a5SSteve French 	 * set; the first page is still locked at this point, but all the rest
281438c8a9a5SSteve French 	 * have been unlocked.
281538c8a9a5SSteve French 	 */
281638c8a9a5SSteve French 	folio_unlock(folio);
281738c8a9a5SSteve French 
281838c8a9a5SSteve French 	if (start < i_size) {
281938c8a9a5SSteve French 		iov_iter_xarray(&wdata->iter, ITER_SOURCE, &mapping->i_pages,
282038c8a9a5SSteve French 				start, len);
282138c8a9a5SSteve French 
282238c8a9a5SSteve French 		rc = adjust_credits(wdata->server, &wdata->credits, wdata->bytes);
282338c8a9a5SSteve French 		if (rc)
282438c8a9a5SSteve French 			goto err_wdata;
282538c8a9a5SSteve French 
282638c8a9a5SSteve French 		if (wdata->cfile->invalidHandle)
282738c8a9a5SSteve French 			rc = -EAGAIN;
282838c8a9a5SSteve French 		else
282938c8a9a5SSteve French 			rc = wdata->server->ops->async_writev(wdata,
283038c8a9a5SSteve French 							      cifs_writedata_release);
283138c8a9a5SSteve French 		if (rc >= 0) {
283238c8a9a5SSteve French 			kref_put(&wdata->refcount, cifs_writedata_release);
283338c8a9a5SSteve French 			goto err_close;
283438c8a9a5SSteve French 		}
283538c8a9a5SSteve French 	} else {
283638c8a9a5SSteve French 		/* The dirty region was entirely beyond the EOF. */
283738c8a9a5SSteve French 		cifs_pages_written_back(inode, start, len);
283838c8a9a5SSteve French 		rc = 0;
283938c8a9a5SSteve French 	}
284038c8a9a5SSteve French 
284138c8a9a5SSteve French err_wdata:
284238c8a9a5SSteve French 	kref_put(&wdata->refcount, cifs_writedata_release);
284338c8a9a5SSteve French err_uncredit:
284438c8a9a5SSteve French 	add_credits_and_wake_if(server, credits, 0);
284538c8a9a5SSteve French err_close:
284638c8a9a5SSteve French 	if (cfile)
284738c8a9a5SSteve French 		cifsFileInfo_put(cfile);
284838c8a9a5SSteve French err_xid:
284938c8a9a5SSteve French 	free_xid(xid);
285038c8a9a5SSteve French 	if (rc == 0) {
285138c8a9a5SSteve French 		wbc->nr_to_write = count;
285238c8a9a5SSteve French 		rc = len;
285338c8a9a5SSteve French 	} else if (is_retryable_error(rc)) {
285438c8a9a5SSteve French 		cifs_pages_write_redirty(inode, start, len);
285538c8a9a5SSteve French 	} else {
285638c8a9a5SSteve French 		cifs_pages_write_failed(inode, start, len);
285738c8a9a5SSteve French 		mapping_set_error(mapping, rc);
285838c8a9a5SSteve French 	}
285938c8a9a5SSteve French 	/* Indication to update ctime and mtime as close is deferred */
286038c8a9a5SSteve French 	set_bit(CIFS_INO_MODIFIED_ATTR, &CIFS_I(inode)->flags);
286138c8a9a5SSteve French 	return rc;
286238c8a9a5SSteve French }
286338c8a9a5SSteve French 
286438c8a9a5SSteve French /*
286538c8a9a5SSteve French  * write a region of pages back to the server
286638c8a9a5SSteve French  */
286738c8a9a5SSteve French static int cifs_writepages_region(struct address_space *mapping,
286838c8a9a5SSteve French 				  struct writeback_control *wbc,
286938c8a9a5SSteve French 				  loff_t start, loff_t end, loff_t *_next)
287038c8a9a5SSteve French {
287138c8a9a5SSteve French 	struct folio_batch fbatch;
287238c8a9a5SSteve French 	int skips = 0;
287338c8a9a5SSteve French 
287438c8a9a5SSteve French 	folio_batch_init(&fbatch);
287538c8a9a5SSteve French 	do {
287638c8a9a5SSteve French 		int nr;
287738c8a9a5SSteve French 		pgoff_t index = start / PAGE_SIZE;
287838c8a9a5SSteve French 
287938c8a9a5SSteve French 		nr = filemap_get_folios_tag(mapping, &index, end / PAGE_SIZE,
288038c8a9a5SSteve French 					    PAGECACHE_TAG_DIRTY, &fbatch);
288138c8a9a5SSteve French 		if (!nr)
288238c8a9a5SSteve French 			break;
288338c8a9a5SSteve French 
288438c8a9a5SSteve French 		for (int i = 0; i < nr; i++) {
288538c8a9a5SSteve French 			ssize_t ret;
288638c8a9a5SSteve French 			struct folio *folio = fbatch.folios[i];
288738c8a9a5SSteve French 
288838c8a9a5SSteve French redo_folio:
288938c8a9a5SSteve French 			start = folio_pos(folio); /* May regress with THPs */
289038c8a9a5SSteve French 
289138c8a9a5SSteve French 			/* At this point we hold neither the i_pages lock nor the
289238c8a9a5SSteve French 			 * page lock: the page may be truncated or invalidated
289338c8a9a5SSteve French 			 * (changing page->mapping to NULL), or even swizzled
289438c8a9a5SSteve French 			 * back from swapper_space to tmpfs file mapping
289538c8a9a5SSteve French 			 */
289638c8a9a5SSteve French 			if (wbc->sync_mode != WB_SYNC_NONE) {
289738c8a9a5SSteve French 				ret = folio_lock_killable(folio);
289838c8a9a5SSteve French 				if (ret < 0)
289938c8a9a5SSteve French 					goto write_error;
290038c8a9a5SSteve French 			} else {
290138c8a9a5SSteve French 				if (!folio_trylock(folio))
290238c8a9a5SSteve French 					goto skip_write;
290338c8a9a5SSteve French 			}
290438c8a9a5SSteve French 
290538c8a9a5SSteve French 			if (folio_mapping(folio) != mapping ||
290638c8a9a5SSteve French 			    !folio_test_dirty(folio)) {
290738c8a9a5SSteve French 				start += folio_size(folio);
290838c8a9a5SSteve French 				folio_unlock(folio);
290938c8a9a5SSteve French 				continue;
291038c8a9a5SSteve French 			}
291138c8a9a5SSteve French 
291238c8a9a5SSteve French 			if (folio_test_writeback(folio) ||
291338c8a9a5SSteve French 			    folio_test_fscache(folio)) {
291438c8a9a5SSteve French 				folio_unlock(folio);
291538c8a9a5SSteve French 				if (wbc->sync_mode == WB_SYNC_NONE)
291638c8a9a5SSteve French 					goto skip_write;
291738c8a9a5SSteve French 
291838c8a9a5SSteve French 				folio_wait_writeback(folio);
291938c8a9a5SSteve French #ifdef CONFIG_CIFS_FSCACHE
292038c8a9a5SSteve French 				folio_wait_fscache(folio);
292138c8a9a5SSteve French #endif
292238c8a9a5SSteve French 				goto redo_folio;
292338c8a9a5SSteve French 			}
292438c8a9a5SSteve French 
292538c8a9a5SSteve French 			if (!folio_clear_dirty_for_io(folio))
292638c8a9a5SSteve French 				/* We hold the page lock - it should've been dirty. */
292738c8a9a5SSteve French 				WARN_ON(1);
292838c8a9a5SSteve French 
292938c8a9a5SSteve French 			ret = cifs_write_back_from_locked_folio(mapping, wbc, folio, start, end);
293038c8a9a5SSteve French 			if (ret < 0)
293138c8a9a5SSteve French 				goto write_error;
293238c8a9a5SSteve French 
293338c8a9a5SSteve French 			start += ret;
293438c8a9a5SSteve French 			continue;
293538c8a9a5SSteve French 
293638c8a9a5SSteve French write_error:
293738c8a9a5SSteve French 			folio_batch_release(&fbatch);
293838c8a9a5SSteve French 			*_next = start;
293938c8a9a5SSteve French 			return ret;
294038c8a9a5SSteve French 
294138c8a9a5SSteve French skip_write:
294238c8a9a5SSteve French 			/*
294338c8a9a5SSteve French 			 * Too many skipped writes, or need to reschedule?
294438c8a9a5SSteve French 			 * Treat it as a write error without an error code.
294538c8a9a5SSteve French 			 */
294638c8a9a5SSteve French 			if (skips >= 5 || need_resched()) {
294738c8a9a5SSteve French 				ret = 0;
294838c8a9a5SSteve French 				goto write_error;
294938c8a9a5SSteve French 			}
295038c8a9a5SSteve French 
295138c8a9a5SSteve French 			/* Otherwise, just skip that folio and go on to the next */
295238c8a9a5SSteve French 			skips++;
295338c8a9a5SSteve French 			start += folio_size(folio);
295438c8a9a5SSteve French 			continue;
295538c8a9a5SSteve French 		}
295638c8a9a5SSteve French 
295738c8a9a5SSteve French 		folio_batch_release(&fbatch);
295838c8a9a5SSteve French 		cond_resched();
295938c8a9a5SSteve French 	} while (wbc->nr_to_write > 0);
296038c8a9a5SSteve French 
296138c8a9a5SSteve French 	*_next = start;
296238c8a9a5SSteve French 	return 0;
296338c8a9a5SSteve French }
296438c8a9a5SSteve French 
296538c8a9a5SSteve French /*
296638c8a9a5SSteve French  * Write some of the pending data back to the server
296738c8a9a5SSteve French  */
296838c8a9a5SSteve French static int cifs_writepages(struct address_space *mapping,
296938c8a9a5SSteve French 			   struct writeback_control *wbc)
297038c8a9a5SSteve French {
297138c8a9a5SSteve French 	loff_t start, next;
297238c8a9a5SSteve French 	int ret;
297338c8a9a5SSteve French 
297438c8a9a5SSteve French 	/* We have to be careful as we can end up racing with setattr()
297538c8a9a5SSteve French 	 * truncating the pagecache since the caller doesn't take a lock here
297638c8a9a5SSteve French 	 * to prevent it.
297738c8a9a5SSteve French 	 */
297838c8a9a5SSteve French 
297938c8a9a5SSteve French 	if (wbc->range_cyclic) {
298038c8a9a5SSteve French 		start = mapping->writeback_index * PAGE_SIZE;
298138c8a9a5SSteve French 		ret = cifs_writepages_region(mapping, wbc, start, LLONG_MAX, &next);
298238c8a9a5SSteve French 		if (ret == 0) {
298338c8a9a5SSteve French 			mapping->writeback_index = next / PAGE_SIZE;
298438c8a9a5SSteve French 			if (start > 0 && wbc->nr_to_write > 0) {
298538c8a9a5SSteve French 				ret = cifs_writepages_region(mapping, wbc, 0,
298638c8a9a5SSteve French 							     start, &next);
298738c8a9a5SSteve French 				if (ret == 0)
298838c8a9a5SSteve French 					mapping->writeback_index =
298938c8a9a5SSteve French 						next / PAGE_SIZE;
299038c8a9a5SSteve French 			}
299138c8a9a5SSteve French 		}
299238c8a9a5SSteve French 	} else if (wbc->range_start == 0 && wbc->range_end == LLONG_MAX) {
299338c8a9a5SSteve French 		ret = cifs_writepages_region(mapping, wbc, 0, LLONG_MAX, &next);
299438c8a9a5SSteve French 		if (wbc->nr_to_write > 0 && ret == 0)
299538c8a9a5SSteve French 			mapping->writeback_index = next / PAGE_SIZE;
299638c8a9a5SSteve French 	} else {
299738c8a9a5SSteve French 		ret = cifs_writepages_region(mapping, wbc,
299838c8a9a5SSteve French 					     wbc->range_start, wbc->range_end, &next);
299938c8a9a5SSteve French 	}
300038c8a9a5SSteve French 
300138c8a9a5SSteve French 	return ret;
300238c8a9a5SSteve French }
300338c8a9a5SSteve French 
300438c8a9a5SSteve French static int
300538c8a9a5SSteve French cifs_writepage_locked(struct page *page, struct writeback_control *wbc)
300638c8a9a5SSteve French {
300738c8a9a5SSteve French 	int rc;
300838c8a9a5SSteve French 	unsigned int xid;
300938c8a9a5SSteve French 
301038c8a9a5SSteve French 	xid = get_xid();
301138c8a9a5SSteve French /* BB add check for wbc flags */
301238c8a9a5SSteve French 	get_page(page);
301338c8a9a5SSteve French 	if (!PageUptodate(page))
301438c8a9a5SSteve French 		cifs_dbg(FYI, "ppw - page not up to date\n");
301538c8a9a5SSteve French 
301638c8a9a5SSteve French 	/*
301738c8a9a5SSteve French 	 * Set the "writeback" flag, and clear "dirty" in the radix tree.
301838c8a9a5SSteve French 	 *
301938c8a9a5SSteve French 	 * A writepage() implementation always needs to do either this,
302038c8a9a5SSteve French 	 * or re-dirty the page with "redirty_page_for_writepage()" in
302138c8a9a5SSteve French 	 * the case of a failure.
302238c8a9a5SSteve French 	 *
302338c8a9a5SSteve French 	 * Just unlocking the page will cause the radix tree tag-bits
302438c8a9a5SSteve French 	 * to fail to update with the state of the page correctly.
302538c8a9a5SSteve French 	 */
302638c8a9a5SSteve French 	set_page_writeback(page);
302738c8a9a5SSteve French retry_write:
302838c8a9a5SSteve French 	rc = cifs_partialpagewrite(page, 0, PAGE_SIZE);
302938c8a9a5SSteve French 	if (is_retryable_error(rc)) {
303038c8a9a5SSteve French 		if (wbc->sync_mode == WB_SYNC_ALL && rc == -EAGAIN)
303138c8a9a5SSteve French 			goto retry_write;
303238c8a9a5SSteve French 		redirty_page_for_writepage(wbc, page);
303338c8a9a5SSteve French 	} else if (rc != 0) {
303438c8a9a5SSteve French 		SetPageError(page);
303538c8a9a5SSteve French 		mapping_set_error(page->mapping, rc);
303638c8a9a5SSteve French 	} else {
303738c8a9a5SSteve French 		SetPageUptodate(page);
303838c8a9a5SSteve French 	}
303938c8a9a5SSteve French 	end_page_writeback(page);
304038c8a9a5SSteve French 	put_page(page);
304138c8a9a5SSteve French 	free_xid(xid);
304238c8a9a5SSteve French 	return rc;
304338c8a9a5SSteve French }
304438c8a9a5SSteve French 
304538c8a9a5SSteve French static int cifs_write_end(struct file *file, struct address_space *mapping,
304638c8a9a5SSteve French 			loff_t pos, unsigned len, unsigned copied,
304738c8a9a5SSteve French 			struct page *page, void *fsdata)
304838c8a9a5SSteve French {
304938c8a9a5SSteve French 	int rc;
305038c8a9a5SSteve French 	struct inode *inode = mapping->host;
305138c8a9a5SSteve French 	struct cifsFileInfo *cfile = file->private_data;
305238c8a9a5SSteve French 	struct cifs_sb_info *cifs_sb = CIFS_SB(cfile->dentry->d_sb);
305338c8a9a5SSteve French 	struct folio *folio = page_folio(page);
305438c8a9a5SSteve French 	__u32 pid;
305538c8a9a5SSteve French 
305638c8a9a5SSteve French 	if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_RWPIDFORWARD)
305738c8a9a5SSteve French 		pid = cfile->pid;
305838c8a9a5SSteve French 	else
305938c8a9a5SSteve French 		pid = current->tgid;
306038c8a9a5SSteve French 
306138c8a9a5SSteve French 	cifs_dbg(FYI, "write_end for page %p from pos %lld with %d bytes\n",
306238c8a9a5SSteve French 		 page, pos, copied);
306338c8a9a5SSteve French 
306438c8a9a5SSteve French 	if (folio_test_checked(folio)) {
306538c8a9a5SSteve French 		if (copied == len)
306638c8a9a5SSteve French 			folio_mark_uptodate(folio);
306738c8a9a5SSteve French 		folio_clear_checked(folio);
306838c8a9a5SSteve French 	} else if (!folio_test_uptodate(folio) && copied == PAGE_SIZE)
306938c8a9a5SSteve French 		folio_mark_uptodate(folio);
307038c8a9a5SSteve French 
307138c8a9a5SSteve French 	if (!folio_test_uptodate(folio)) {
307238c8a9a5SSteve French 		char *page_data;
307338c8a9a5SSteve French 		unsigned offset = pos & (PAGE_SIZE - 1);
307438c8a9a5SSteve French 		unsigned int xid;
307538c8a9a5SSteve French 
307638c8a9a5SSteve French 		xid = get_xid();
307738c8a9a5SSteve French 		/* this is probably better than directly calling
307838c8a9a5SSteve French 		   partialpage_write since in this function the file handle is
307938c8a9a5SSteve French 		   known which we might as well	leverage */
308038c8a9a5SSteve French 		/* BB check if anything else missing out of ppw
308138c8a9a5SSteve French 		   such as updating last write time */
308238c8a9a5SSteve French 		page_data = kmap(page);
308338c8a9a5SSteve French 		rc = cifs_write(cfile, pid, page_data + offset, copied, &pos);
308438c8a9a5SSteve French 		/* if (rc < 0) should we set writebehind rc? */
308538c8a9a5SSteve French 		kunmap(page);
308638c8a9a5SSteve French 
308738c8a9a5SSteve French 		free_xid(xid);
308838c8a9a5SSteve French 	} else {
308938c8a9a5SSteve French 		rc = copied;
309038c8a9a5SSteve French 		pos += copied;
309138c8a9a5SSteve French 		set_page_dirty(page);
309238c8a9a5SSteve French 	}
309338c8a9a5SSteve French 
309438c8a9a5SSteve French 	if (rc > 0) {
309538c8a9a5SSteve French 		spin_lock(&inode->i_lock);
309638c8a9a5SSteve French 		if (pos > inode->i_size) {
309738c8a9a5SSteve French 			i_size_write(inode, pos);
309838c8a9a5SSteve French 			inode->i_blocks = (512 - 1 + pos) >> 9;
309938c8a9a5SSteve French 		}
310038c8a9a5SSteve French 		spin_unlock(&inode->i_lock);
310138c8a9a5SSteve French 	}
310238c8a9a5SSteve French 
310338c8a9a5SSteve French 	unlock_page(page);
310438c8a9a5SSteve French 	put_page(page);
310538c8a9a5SSteve French 	/* Indication to update ctime and mtime as close is deferred */
310638c8a9a5SSteve French 	set_bit(CIFS_INO_MODIFIED_ATTR, &CIFS_I(inode)->flags);
310738c8a9a5SSteve French 
310838c8a9a5SSteve French 	return rc;
310938c8a9a5SSteve French }
311038c8a9a5SSteve French 
311138c8a9a5SSteve French int cifs_strict_fsync(struct file *file, loff_t start, loff_t end,
311238c8a9a5SSteve French 		      int datasync)
311338c8a9a5SSteve French {
311438c8a9a5SSteve French 	unsigned int xid;
311538c8a9a5SSteve French 	int rc = 0;
311638c8a9a5SSteve French 	struct cifs_tcon *tcon;
311738c8a9a5SSteve French 	struct TCP_Server_Info *server;
311838c8a9a5SSteve French 	struct cifsFileInfo *smbfile = file->private_data;
311938c8a9a5SSteve French 	struct inode *inode = file_inode(file);
312038c8a9a5SSteve French 	struct cifs_sb_info *cifs_sb = CIFS_SB(inode->i_sb);
312138c8a9a5SSteve French 
312238c8a9a5SSteve French 	rc = file_write_and_wait_range(file, start, end);
312338c8a9a5SSteve French 	if (rc) {
312438c8a9a5SSteve French 		trace_cifs_fsync_err(inode->i_ino, rc);
312538c8a9a5SSteve French 		return rc;
312638c8a9a5SSteve French 	}
312738c8a9a5SSteve French 
312838c8a9a5SSteve French 	xid = get_xid();
312938c8a9a5SSteve French 
313038c8a9a5SSteve French 	cifs_dbg(FYI, "Sync file - name: %pD datasync: 0x%x\n",
313138c8a9a5SSteve French 		 file, datasync);
313238c8a9a5SSteve French 
313338c8a9a5SSteve French 	if (!CIFS_CACHE_READ(CIFS_I(inode))) {
313438c8a9a5SSteve French 		rc = cifs_zap_mapping(inode);
313538c8a9a5SSteve French 		if (rc) {
313638c8a9a5SSteve French 			cifs_dbg(FYI, "rc: %d during invalidate phase\n", rc);
313738c8a9a5SSteve French 			rc = 0; /* don't care about it in fsync */
313838c8a9a5SSteve French 		}
313938c8a9a5SSteve French 	}
314038c8a9a5SSteve French 
314138c8a9a5SSteve French 	tcon = tlink_tcon(smbfile->tlink);
314238c8a9a5SSteve French 	if (!(cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOSSYNC)) {
314338c8a9a5SSteve French 		server = tcon->ses->server;
314438c8a9a5SSteve French 		if (server->ops->flush == NULL) {
314538c8a9a5SSteve French 			rc = -ENOSYS;
314638c8a9a5SSteve French 			goto strict_fsync_exit;
314738c8a9a5SSteve French 		}
314838c8a9a5SSteve French 
314938c8a9a5SSteve French 		if ((OPEN_FMODE(smbfile->f_flags) & FMODE_WRITE) == 0) {
315038c8a9a5SSteve French 			smbfile = find_writable_file(CIFS_I(inode), FIND_WR_ANY);
315138c8a9a5SSteve French 			if (smbfile) {
315238c8a9a5SSteve French 				rc = server->ops->flush(xid, tcon, &smbfile->fid);
315338c8a9a5SSteve French 				cifsFileInfo_put(smbfile);
315438c8a9a5SSteve French 			} else
315538c8a9a5SSteve French 				cifs_dbg(FYI, "ignore fsync for file not open for write\n");
315638c8a9a5SSteve French 		} else
315738c8a9a5SSteve French 			rc = server->ops->flush(xid, tcon, &smbfile->fid);
315838c8a9a5SSteve French 	}
315938c8a9a5SSteve French 
316038c8a9a5SSteve French strict_fsync_exit:
316138c8a9a5SSteve French 	free_xid(xid);
316238c8a9a5SSteve French 	return rc;
316338c8a9a5SSteve French }
316438c8a9a5SSteve French 
316538c8a9a5SSteve French int cifs_fsync(struct file *file, loff_t start, loff_t end, int datasync)
316638c8a9a5SSteve French {
316738c8a9a5SSteve French 	unsigned int xid;
316838c8a9a5SSteve French 	int rc = 0;
316938c8a9a5SSteve French 	struct cifs_tcon *tcon;
317038c8a9a5SSteve French 	struct TCP_Server_Info *server;
317138c8a9a5SSteve French 	struct cifsFileInfo *smbfile = file->private_data;
317238c8a9a5SSteve French 	struct inode *inode = file_inode(file);
317338c8a9a5SSteve French 	struct cifs_sb_info *cifs_sb = CIFS_FILE_SB(file);
317438c8a9a5SSteve French 
317538c8a9a5SSteve French 	rc = file_write_and_wait_range(file, start, end);
317638c8a9a5SSteve French 	if (rc) {
317738c8a9a5SSteve French 		trace_cifs_fsync_err(file_inode(file)->i_ino, rc);
317838c8a9a5SSteve French 		return rc;
317938c8a9a5SSteve French 	}
318038c8a9a5SSteve French 
318138c8a9a5SSteve French 	xid = get_xid();
318238c8a9a5SSteve French 
318338c8a9a5SSteve French 	cifs_dbg(FYI, "Sync file - name: %pD datasync: 0x%x\n",
318438c8a9a5SSteve French 		 file, datasync);
318538c8a9a5SSteve French 
318638c8a9a5SSteve French 	tcon = tlink_tcon(smbfile->tlink);
318738c8a9a5SSteve French 	if (!(cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOSSYNC)) {
318838c8a9a5SSteve French 		server = tcon->ses->server;
318938c8a9a5SSteve French 		if (server->ops->flush == NULL) {
319038c8a9a5SSteve French 			rc = -ENOSYS;
319138c8a9a5SSteve French 			goto fsync_exit;
319238c8a9a5SSteve French 		}
319338c8a9a5SSteve French 
319438c8a9a5SSteve French 		if ((OPEN_FMODE(smbfile->f_flags) & FMODE_WRITE) == 0) {
319538c8a9a5SSteve French 			smbfile = find_writable_file(CIFS_I(inode), FIND_WR_ANY);
319638c8a9a5SSteve French 			if (smbfile) {
319738c8a9a5SSteve French 				rc = server->ops->flush(xid, tcon, &smbfile->fid);
319838c8a9a5SSteve French 				cifsFileInfo_put(smbfile);
319938c8a9a5SSteve French 			} else
320038c8a9a5SSteve French 				cifs_dbg(FYI, "ignore fsync for file not open for write\n");
320138c8a9a5SSteve French 		} else
320238c8a9a5SSteve French 			rc = server->ops->flush(xid, tcon, &smbfile->fid);
320338c8a9a5SSteve French 	}
320438c8a9a5SSteve French 
320538c8a9a5SSteve French fsync_exit:
320638c8a9a5SSteve French 	free_xid(xid);
320738c8a9a5SSteve French 	return rc;
320838c8a9a5SSteve French }
320938c8a9a5SSteve French 
321038c8a9a5SSteve French /*
321138c8a9a5SSteve French  * As file closes, flush all cached write data for this inode checking
321238c8a9a5SSteve French  * for write behind errors.
321338c8a9a5SSteve French  */
321438c8a9a5SSteve French int cifs_flush(struct file *file, fl_owner_t id)
321538c8a9a5SSteve French {
321638c8a9a5SSteve French 	struct inode *inode = file_inode(file);
321738c8a9a5SSteve French 	int rc = 0;
321838c8a9a5SSteve French 
321938c8a9a5SSteve French 	if (file->f_mode & FMODE_WRITE)
322038c8a9a5SSteve French 		rc = filemap_write_and_wait(inode->i_mapping);
322138c8a9a5SSteve French 
322238c8a9a5SSteve French 	cifs_dbg(FYI, "Flush inode %p file %p rc %d\n", inode, file, rc);
322338c8a9a5SSteve French 	if (rc) {
322438c8a9a5SSteve French 		/* get more nuanced writeback errors */
322538c8a9a5SSteve French 		rc = filemap_check_wb_err(file->f_mapping, 0);
322638c8a9a5SSteve French 		trace_cifs_flush_err(inode->i_ino, rc);
322738c8a9a5SSteve French 	}
322838c8a9a5SSteve French 	return rc;
322938c8a9a5SSteve French }
323038c8a9a5SSteve French 
323138c8a9a5SSteve French static void
323238c8a9a5SSteve French cifs_uncached_writedata_release(struct kref *refcount)
323338c8a9a5SSteve French {
323438c8a9a5SSteve French 	struct cifs_writedata *wdata = container_of(refcount,
323538c8a9a5SSteve French 					struct cifs_writedata, refcount);
323638c8a9a5SSteve French 
323738c8a9a5SSteve French 	kref_put(&wdata->ctx->refcount, cifs_aio_ctx_release);
323838c8a9a5SSteve French 	cifs_writedata_release(refcount);
323938c8a9a5SSteve French }
324038c8a9a5SSteve French 
324138c8a9a5SSteve French static void collect_uncached_write_data(struct cifs_aio_ctx *ctx);
324238c8a9a5SSteve French 
324338c8a9a5SSteve French static void
324438c8a9a5SSteve French cifs_uncached_writev_complete(struct work_struct *work)
324538c8a9a5SSteve French {
324638c8a9a5SSteve French 	struct cifs_writedata *wdata = container_of(work,
324738c8a9a5SSteve French 					struct cifs_writedata, work);
324838c8a9a5SSteve French 	struct inode *inode = d_inode(wdata->cfile->dentry);
324938c8a9a5SSteve French 	struct cifsInodeInfo *cifsi = CIFS_I(inode);
325038c8a9a5SSteve French 
325138c8a9a5SSteve French 	spin_lock(&inode->i_lock);
325238c8a9a5SSteve French 	cifs_update_eof(cifsi, wdata->offset, wdata->bytes);
325338c8a9a5SSteve French 	if (cifsi->server_eof > inode->i_size)
325438c8a9a5SSteve French 		i_size_write(inode, cifsi->server_eof);
325538c8a9a5SSteve French 	spin_unlock(&inode->i_lock);
325638c8a9a5SSteve French 
325738c8a9a5SSteve French 	complete(&wdata->done);
325838c8a9a5SSteve French 	collect_uncached_write_data(wdata->ctx);
325938c8a9a5SSteve French 	/* the below call can possibly free the last ref to aio ctx */
326038c8a9a5SSteve French 	kref_put(&wdata->refcount, cifs_uncached_writedata_release);
326138c8a9a5SSteve French }
326238c8a9a5SSteve French 
326338c8a9a5SSteve French static int
326438c8a9a5SSteve French cifs_resend_wdata(struct cifs_writedata *wdata, struct list_head *wdata_list,
326538c8a9a5SSteve French 	struct cifs_aio_ctx *ctx)
326638c8a9a5SSteve French {
326738c8a9a5SSteve French 	unsigned int wsize;
326838c8a9a5SSteve French 	struct cifs_credits credits;
326938c8a9a5SSteve French 	int rc;
327038c8a9a5SSteve French 	struct TCP_Server_Info *server = wdata->server;
327138c8a9a5SSteve French 
327238c8a9a5SSteve French 	do {
327338c8a9a5SSteve French 		if (wdata->cfile->invalidHandle) {
327438c8a9a5SSteve French 			rc = cifs_reopen_file(wdata->cfile, false);
327538c8a9a5SSteve French 			if (rc == -EAGAIN)
327638c8a9a5SSteve French 				continue;
327738c8a9a5SSteve French 			else if (rc)
327838c8a9a5SSteve French 				break;
327938c8a9a5SSteve French 		}
328038c8a9a5SSteve French 
328138c8a9a5SSteve French 
328238c8a9a5SSteve French 		/*
328338c8a9a5SSteve French 		 * Wait for credits to resend this wdata.
328438c8a9a5SSteve French 		 * Note: we are attempting to resend the whole wdata not in
328538c8a9a5SSteve French 		 * segments
328638c8a9a5SSteve French 		 */
328738c8a9a5SSteve French 		do {
328838c8a9a5SSteve French 			rc = server->ops->wait_mtu_credits(server, wdata->bytes,
328938c8a9a5SSteve French 						&wsize, &credits);
329038c8a9a5SSteve French 			if (rc)
329138c8a9a5SSteve French 				goto fail;
329238c8a9a5SSteve French 
329338c8a9a5SSteve French 			if (wsize < wdata->bytes) {
329438c8a9a5SSteve French 				add_credits_and_wake_if(server, &credits, 0);
329538c8a9a5SSteve French 				msleep(1000);
329638c8a9a5SSteve French 			}
329738c8a9a5SSteve French 		} while (wsize < wdata->bytes);
329838c8a9a5SSteve French 		wdata->credits = credits;
329938c8a9a5SSteve French 
330038c8a9a5SSteve French 		rc = adjust_credits(server, &wdata->credits, wdata->bytes);
330138c8a9a5SSteve French 
330238c8a9a5SSteve French 		if (!rc) {
330338c8a9a5SSteve French 			if (wdata->cfile->invalidHandle)
330438c8a9a5SSteve French 				rc = -EAGAIN;
330538c8a9a5SSteve French 			else {
330638c8a9a5SSteve French #ifdef CONFIG_CIFS_SMB_DIRECT
330738c8a9a5SSteve French 				if (wdata->mr) {
330838c8a9a5SSteve French 					wdata->mr->need_invalidate = true;
330938c8a9a5SSteve French 					smbd_deregister_mr(wdata->mr);
331038c8a9a5SSteve French 					wdata->mr = NULL;
331138c8a9a5SSteve French 				}
331238c8a9a5SSteve French #endif
331338c8a9a5SSteve French 				rc = server->ops->async_writev(wdata,
331438c8a9a5SSteve French 					cifs_uncached_writedata_release);
331538c8a9a5SSteve French 			}
331638c8a9a5SSteve French 		}
331738c8a9a5SSteve French 
331838c8a9a5SSteve French 		/* If the write was successfully sent, we are done */
331938c8a9a5SSteve French 		if (!rc) {
332038c8a9a5SSteve French 			list_add_tail(&wdata->list, wdata_list);
332138c8a9a5SSteve French 			return 0;
332238c8a9a5SSteve French 		}
332338c8a9a5SSteve French 
332438c8a9a5SSteve French 		/* Roll back credits and retry if needed */
332538c8a9a5SSteve French 		add_credits_and_wake_if(server, &wdata->credits, 0);
332638c8a9a5SSteve French 	} while (rc == -EAGAIN);
332738c8a9a5SSteve French 
332838c8a9a5SSteve French fail:
332938c8a9a5SSteve French 	kref_put(&wdata->refcount, cifs_uncached_writedata_release);
333038c8a9a5SSteve French 	return rc;
333138c8a9a5SSteve French }
333238c8a9a5SSteve French 
333338c8a9a5SSteve French /*
333438c8a9a5SSteve French  * Select span of a bvec iterator we're going to use.  Limit it by both maximum
333538c8a9a5SSteve French  * size and maximum number of segments.
333638c8a9a5SSteve French  */
333738c8a9a5SSteve French static size_t cifs_limit_bvec_subset(const struct iov_iter *iter, size_t max_size,
333838c8a9a5SSteve French 				     size_t max_segs, unsigned int *_nsegs)
333938c8a9a5SSteve French {
334038c8a9a5SSteve French 	const struct bio_vec *bvecs = iter->bvec;
334138c8a9a5SSteve French 	unsigned int nbv = iter->nr_segs, ix = 0, nsegs = 0;
334238c8a9a5SSteve French 	size_t len, span = 0, n = iter->count;
334338c8a9a5SSteve French 	size_t skip = iter->iov_offset;
334438c8a9a5SSteve French 
334538c8a9a5SSteve French 	if (WARN_ON(!iov_iter_is_bvec(iter)) || n == 0)
334638c8a9a5SSteve French 		return 0;
334738c8a9a5SSteve French 
334838c8a9a5SSteve French 	while (n && ix < nbv && skip) {
334938c8a9a5SSteve French 		len = bvecs[ix].bv_len;
335038c8a9a5SSteve French 		if (skip < len)
335138c8a9a5SSteve French 			break;
335238c8a9a5SSteve French 		skip -= len;
335338c8a9a5SSteve French 		n -= len;
335438c8a9a5SSteve French 		ix++;
335538c8a9a5SSteve French 	}
335638c8a9a5SSteve French 
335738c8a9a5SSteve French 	while (n && ix < nbv) {
335838c8a9a5SSteve French 		len = min3(n, bvecs[ix].bv_len - skip, max_size);
335938c8a9a5SSteve French 		span += len;
336038c8a9a5SSteve French 		max_size -= len;
336138c8a9a5SSteve French 		nsegs++;
336238c8a9a5SSteve French 		ix++;
336338c8a9a5SSteve French 		if (max_size == 0 || nsegs >= max_segs)
336438c8a9a5SSteve French 			break;
336538c8a9a5SSteve French 		skip = 0;
336638c8a9a5SSteve French 		n -= len;
336738c8a9a5SSteve French 	}
336838c8a9a5SSteve French 
336938c8a9a5SSteve French 	*_nsegs = nsegs;
337038c8a9a5SSteve French 	return span;
337138c8a9a5SSteve French }
337238c8a9a5SSteve French 
337338c8a9a5SSteve French static int
337438c8a9a5SSteve French cifs_write_from_iter(loff_t fpos, size_t len, struct iov_iter *from,
337538c8a9a5SSteve French 		     struct cifsFileInfo *open_file,
337638c8a9a5SSteve French 		     struct cifs_sb_info *cifs_sb, struct list_head *wdata_list,
337738c8a9a5SSteve French 		     struct cifs_aio_ctx *ctx)
337838c8a9a5SSteve French {
337938c8a9a5SSteve French 	int rc = 0;
338038c8a9a5SSteve French 	size_t cur_len, max_len;
338138c8a9a5SSteve French 	struct cifs_writedata *wdata;
338238c8a9a5SSteve French 	pid_t pid;
338338c8a9a5SSteve French 	struct TCP_Server_Info *server;
338438c8a9a5SSteve French 	unsigned int xid, max_segs = INT_MAX;
338538c8a9a5SSteve French 
338638c8a9a5SSteve French 	if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_RWPIDFORWARD)
338738c8a9a5SSteve French 		pid = open_file->pid;
338838c8a9a5SSteve French 	else
338938c8a9a5SSteve French 		pid = current->tgid;
339038c8a9a5SSteve French 
339138c8a9a5SSteve French 	server = cifs_pick_channel(tlink_tcon(open_file->tlink)->ses);
339238c8a9a5SSteve French 	xid = get_xid();
339338c8a9a5SSteve French 
339438c8a9a5SSteve French #ifdef CONFIG_CIFS_SMB_DIRECT
339538c8a9a5SSteve French 	if (server->smbd_conn)
339638c8a9a5SSteve French 		max_segs = server->smbd_conn->max_frmr_depth;
339738c8a9a5SSteve French #endif
339838c8a9a5SSteve French 
339938c8a9a5SSteve French 	do {
340038c8a9a5SSteve French 		struct cifs_credits credits_on_stack;
340138c8a9a5SSteve French 		struct cifs_credits *credits = &credits_on_stack;
340238c8a9a5SSteve French 		unsigned int wsize, nsegs = 0;
340338c8a9a5SSteve French 
340438c8a9a5SSteve French 		if (signal_pending(current)) {
340538c8a9a5SSteve French 			rc = -EINTR;
340638c8a9a5SSteve French 			break;
340738c8a9a5SSteve French 		}
340838c8a9a5SSteve French 
340938c8a9a5SSteve French 		if (open_file->invalidHandle) {
341038c8a9a5SSteve French 			rc = cifs_reopen_file(open_file, false);
341138c8a9a5SSteve French 			if (rc == -EAGAIN)
341238c8a9a5SSteve French 				continue;
341338c8a9a5SSteve French 			else if (rc)
341438c8a9a5SSteve French 				break;
341538c8a9a5SSteve French 		}
341638c8a9a5SSteve French 
341738c8a9a5SSteve French 		rc = server->ops->wait_mtu_credits(server, cifs_sb->ctx->wsize,
341838c8a9a5SSteve French 						   &wsize, credits);
341938c8a9a5SSteve French 		if (rc)
342038c8a9a5SSteve French 			break;
342138c8a9a5SSteve French 
342238c8a9a5SSteve French 		max_len = min_t(const size_t, len, wsize);
342338c8a9a5SSteve French 		if (!max_len) {
342438c8a9a5SSteve French 			rc = -EAGAIN;
342538c8a9a5SSteve French 			add_credits_and_wake_if(server, credits, 0);
342638c8a9a5SSteve French 			break;
342738c8a9a5SSteve French 		}
342838c8a9a5SSteve French 
342938c8a9a5SSteve French 		cur_len = cifs_limit_bvec_subset(from, max_len, max_segs, &nsegs);
343038c8a9a5SSteve French 		cifs_dbg(FYI, "write_from_iter len=%zx/%zx nsegs=%u/%lu/%u\n",
343138c8a9a5SSteve French 			 cur_len, max_len, nsegs, from->nr_segs, max_segs);
343238c8a9a5SSteve French 		if (cur_len == 0) {
343338c8a9a5SSteve French 			rc = -EIO;
343438c8a9a5SSteve French 			add_credits_and_wake_if(server, credits, 0);
343538c8a9a5SSteve French 			break;
343638c8a9a5SSteve French 		}
343738c8a9a5SSteve French 
343838c8a9a5SSteve French 		wdata = cifs_writedata_alloc(cifs_uncached_writev_complete);
343938c8a9a5SSteve French 		if (!wdata) {
344038c8a9a5SSteve French 			rc = -ENOMEM;
344138c8a9a5SSteve French 			add_credits_and_wake_if(server, credits, 0);
344238c8a9a5SSteve French 			break;
344338c8a9a5SSteve French 		}
344438c8a9a5SSteve French 
344538c8a9a5SSteve French 		wdata->sync_mode = WB_SYNC_ALL;
344638c8a9a5SSteve French 		wdata->offset	= (__u64)fpos;
344738c8a9a5SSteve French 		wdata->cfile	= cifsFileInfo_get(open_file);
344838c8a9a5SSteve French 		wdata->server	= server;
344938c8a9a5SSteve French 		wdata->pid	= pid;
345038c8a9a5SSteve French 		wdata->bytes	= cur_len;
345138c8a9a5SSteve French 		wdata->credits	= credits_on_stack;
345238c8a9a5SSteve French 		wdata->iter	= *from;
345338c8a9a5SSteve French 		wdata->ctx	= ctx;
345438c8a9a5SSteve French 		kref_get(&ctx->refcount);
345538c8a9a5SSteve French 
345638c8a9a5SSteve French 		iov_iter_truncate(&wdata->iter, cur_len);
345738c8a9a5SSteve French 
345838c8a9a5SSteve French 		rc = adjust_credits(server, &wdata->credits, wdata->bytes);
345938c8a9a5SSteve French 
346038c8a9a5SSteve French 		if (!rc) {
346138c8a9a5SSteve French 			if (wdata->cfile->invalidHandle)
346238c8a9a5SSteve French 				rc = -EAGAIN;
346338c8a9a5SSteve French 			else
346438c8a9a5SSteve French 				rc = server->ops->async_writev(wdata,
346538c8a9a5SSteve French 					cifs_uncached_writedata_release);
346638c8a9a5SSteve French 		}
346738c8a9a5SSteve French 
346838c8a9a5SSteve French 		if (rc) {
346938c8a9a5SSteve French 			add_credits_and_wake_if(server, &wdata->credits, 0);
347038c8a9a5SSteve French 			kref_put(&wdata->refcount,
347138c8a9a5SSteve French 				 cifs_uncached_writedata_release);
347238c8a9a5SSteve French 			if (rc == -EAGAIN)
347338c8a9a5SSteve French 				continue;
347438c8a9a5SSteve French 			break;
347538c8a9a5SSteve French 		}
347638c8a9a5SSteve French 
347738c8a9a5SSteve French 		list_add_tail(&wdata->list, wdata_list);
347838c8a9a5SSteve French 		iov_iter_advance(from, cur_len);
347938c8a9a5SSteve French 		fpos += cur_len;
348038c8a9a5SSteve French 		len -= cur_len;
348138c8a9a5SSteve French 	} while (len > 0);
348238c8a9a5SSteve French 
348338c8a9a5SSteve French 	free_xid(xid);
348438c8a9a5SSteve French 	return rc;
348538c8a9a5SSteve French }
348638c8a9a5SSteve French 
348738c8a9a5SSteve French static void collect_uncached_write_data(struct cifs_aio_ctx *ctx)
348838c8a9a5SSteve French {
348938c8a9a5SSteve French 	struct cifs_writedata *wdata, *tmp;
349038c8a9a5SSteve French 	struct cifs_tcon *tcon;
349138c8a9a5SSteve French 	struct cifs_sb_info *cifs_sb;
349238c8a9a5SSteve French 	struct dentry *dentry = ctx->cfile->dentry;
349338c8a9a5SSteve French 	ssize_t rc;
349438c8a9a5SSteve French 
349538c8a9a5SSteve French 	tcon = tlink_tcon(ctx->cfile->tlink);
349638c8a9a5SSteve French 	cifs_sb = CIFS_SB(dentry->d_sb);
349738c8a9a5SSteve French 
349838c8a9a5SSteve French 	mutex_lock(&ctx->aio_mutex);
349938c8a9a5SSteve French 
350038c8a9a5SSteve French 	if (list_empty(&ctx->list)) {
350138c8a9a5SSteve French 		mutex_unlock(&ctx->aio_mutex);
350238c8a9a5SSteve French 		return;
350338c8a9a5SSteve French 	}
350438c8a9a5SSteve French 
350538c8a9a5SSteve French 	rc = ctx->rc;
350638c8a9a5SSteve French 	/*
350738c8a9a5SSteve French 	 * Wait for and collect replies for any successful sends in order of
350838c8a9a5SSteve French 	 * increasing offset. Once an error is hit, then return without waiting
350938c8a9a5SSteve French 	 * for any more replies.
351038c8a9a5SSteve French 	 */
351138c8a9a5SSteve French restart_loop:
351238c8a9a5SSteve French 	list_for_each_entry_safe(wdata, tmp, &ctx->list, list) {
351338c8a9a5SSteve French 		if (!rc) {
351438c8a9a5SSteve French 			if (!try_wait_for_completion(&wdata->done)) {
351538c8a9a5SSteve French 				mutex_unlock(&ctx->aio_mutex);
351638c8a9a5SSteve French 				return;
351738c8a9a5SSteve French 			}
351838c8a9a5SSteve French 
351938c8a9a5SSteve French 			if (wdata->result)
352038c8a9a5SSteve French 				rc = wdata->result;
352138c8a9a5SSteve French 			else
352238c8a9a5SSteve French 				ctx->total_len += wdata->bytes;
352338c8a9a5SSteve French 
352438c8a9a5SSteve French 			/* resend call if it's a retryable error */
352538c8a9a5SSteve French 			if (rc == -EAGAIN) {
352638c8a9a5SSteve French 				struct list_head tmp_list;
352738c8a9a5SSteve French 				struct iov_iter tmp_from = ctx->iter;
352838c8a9a5SSteve French 
352938c8a9a5SSteve French 				INIT_LIST_HEAD(&tmp_list);
353038c8a9a5SSteve French 				list_del_init(&wdata->list);
353138c8a9a5SSteve French 
353238c8a9a5SSteve French 				if (ctx->direct_io)
353338c8a9a5SSteve French 					rc = cifs_resend_wdata(
353438c8a9a5SSteve French 						wdata, &tmp_list, ctx);
353538c8a9a5SSteve French 				else {
353638c8a9a5SSteve French 					iov_iter_advance(&tmp_from,
353738c8a9a5SSteve French 						 wdata->offset - ctx->pos);
353838c8a9a5SSteve French 
353938c8a9a5SSteve French 					rc = cifs_write_from_iter(wdata->offset,
354038c8a9a5SSteve French 						wdata->bytes, &tmp_from,
354138c8a9a5SSteve French 						ctx->cfile, cifs_sb, &tmp_list,
354238c8a9a5SSteve French 						ctx);
354338c8a9a5SSteve French 
354438c8a9a5SSteve French 					kref_put(&wdata->refcount,
354538c8a9a5SSteve French 						cifs_uncached_writedata_release);
354638c8a9a5SSteve French 				}
354738c8a9a5SSteve French 
354838c8a9a5SSteve French 				list_splice(&tmp_list, &ctx->list);
354938c8a9a5SSteve French 				goto restart_loop;
355038c8a9a5SSteve French 			}
355138c8a9a5SSteve French 		}
355238c8a9a5SSteve French 		list_del_init(&wdata->list);
355338c8a9a5SSteve French 		kref_put(&wdata->refcount, cifs_uncached_writedata_release);
355438c8a9a5SSteve French 	}
355538c8a9a5SSteve French 
355638c8a9a5SSteve French 	cifs_stats_bytes_written(tcon, ctx->total_len);
355738c8a9a5SSteve French 	set_bit(CIFS_INO_INVALID_MAPPING, &CIFS_I(dentry->d_inode)->flags);
355838c8a9a5SSteve French 
355938c8a9a5SSteve French 	ctx->rc = (rc == 0) ? ctx->total_len : rc;
356038c8a9a5SSteve French 
356138c8a9a5SSteve French 	mutex_unlock(&ctx->aio_mutex);
356238c8a9a5SSteve French 
356338c8a9a5SSteve French 	if (ctx->iocb && ctx->iocb->ki_complete)
356438c8a9a5SSteve French 		ctx->iocb->ki_complete(ctx->iocb, ctx->rc);
356538c8a9a5SSteve French 	else
356638c8a9a5SSteve French 		complete(&ctx->done);
356738c8a9a5SSteve French }
356838c8a9a5SSteve French 
356938c8a9a5SSteve French static ssize_t __cifs_writev(
357038c8a9a5SSteve French 	struct kiocb *iocb, struct iov_iter *from, bool direct)
357138c8a9a5SSteve French {
357238c8a9a5SSteve French 	struct file *file = iocb->ki_filp;
357338c8a9a5SSteve French 	ssize_t total_written = 0;
357438c8a9a5SSteve French 	struct cifsFileInfo *cfile;
357538c8a9a5SSteve French 	struct cifs_tcon *tcon;
357638c8a9a5SSteve French 	struct cifs_sb_info *cifs_sb;
357738c8a9a5SSteve French 	struct cifs_aio_ctx *ctx;
357838c8a9a5SSteve French 	int rc;
357938c8a9a5SSteve French 
358038c8a9a5SSteve French 	rc = generic_write_checks(iocb, from);
358138c8a9a5SSteve French 	if (rc <= 0)
358238c8a9a5SSteve French 		return rc;
358338c8a9a5SSteve French 
358438c8a9a5SSteve French 	cifs_sb = CIFS_FILE_SB(file);
358538c8a9a5SSteve French 	cfile = file->private_data;
358638c8a9a5SSteve French 	tcon = tlink_tcon(cfile->tlink);
358738c8a9a5SSteve French 
358838c8a9a5SSteve French 	if (!tcon->ses->server->ops->async_writev)
358938c8a9a5SSteve French 		return -ENOSYS;
359038c8a9a5SSteve French 
359138c8a9a5SSteve French 	ctx = cifs_aio_ctx_alloc();
359238c8a9a5SSteve French 	if (!ctx)
359338c8a9a5SSteve French 		return -ENOMEM;
359438c8a9a5SSteve French 
359538c8a9a5SSteve French 	ctx->cfile = cifsFileInfo_get(cfile);
359638c8a9a5SSteve French 
359738c8a9a5SSteve French 	if (!is_sync_kiocb(iocb))
359838c8a9a5SSteve French 		ctx->iocb = iocb;
359938c8a9a5SSteve French 
360038c8a9a5SSteve French 	ctx->pos = iocb->ki_pos;
360138c8a9a5SSteve French 	ctx->direct_io = direct;
360238c8a9a5SSteve French 	ctx->nr_pinned_pages = 0;
360338c8a9a5SSteve French 
360438c8a9a5SSteve French 	if (user_backed_iter(from)) {
360538c8a9a5SSteve French 		/*
360638c8a9a5SSteve French 		 * Extract IOVEC/UBUF-type iterators to a BVEC-type iterator as
360738c8a9a5SSteve French 		 * they contain references to the calling process's virtual
360838c8a9a5SSteve French 		 * memory layout which won't be available in an async worker
360938c8a9a5SSteve French 		 * thread.  This also takes a pin on every folio involved.
361038c8a9a5SSteve French 		 */
361138c8a9a5SSteve French 		rc = netfs_extract_user_iter(from, iov_iter_count(from),
361238c8a9a5SSteve French 					     &ctx->iter, 0);
361338c8a9a5SSteve French 		if (rc < 0) {
361438c8a9a5SSteve French 			kref_put(&ctx->refcount, cifs_aio_ctx_release);
361538c8a9a5SSteve French 			return rc;
361638c8a9a5SSteve French 		}
361738c8a9a5SSteve French 
361838c8a9a5SSteve French 		ctx->nr_pinned_pages = rc;
361938c8a9a5SSteve French 		ctx->bv = (void *)ctx->iter.bvec;
362038c8a9a5SSteve French 		ctx->bv_need_unpin = iov_iter_extract_will_pin(from);
362138c8a9a5SSteve French 	} else if ((iov_iter_is_bvec(from) || iov_iter_is_kvec(from)) &&
362238c8a9a5SSteve French 		   !is_sync_kiocb(iocb)) {
362338c8a9a5SSteve French 		/*
362438c8a9a5SSteve French 		 * If the op is asynchronous, we need to copy the list attached
362538c8a9a5SSteve French 		 * to a BVEC/KVEC-type iterator, but we assume that the storage
362638c8a9a5SSteve French 		 * will be pinned by the caller; in any case, we may or may not
362738c8a9a5SSteve French 		 * be able to pin the pages, so we don't try.
362838c8a9a5SSteve French 		 */
362938c8a9a5SSteve French 		ctx->bv = (void *)dup_iter(&ctx->iter, from, GFP_KERNEL);
363038c8a9a5SSteve French 		if (!ctx->bv) {
363138c8a9a5SSteve French 			kref_put(&ctx->refcount, cifs_aio_ctx_release);
363238c8a9a5SSteve French 			return -ENOMEM;
363338c8a9a5SSteve French 		}
363438c8a9a5SSteve French 	} else {
363538c8a9a5SSteve French 		/*
363638c8a9a5SSteve French 		 * Otherwise, we just pass the iterator down as-is and rely on
363738c8a9a5SSteve French 		 * the caller to make sure the pages referred to by the
363838c8a9a5SSteve French 		 * iterator don't evaporate.
363938c8a9a5SSteve French 		 */
364038c8a9a5SSteve French 		ctx->iter = *from;
364138c8a9a5SSteve French 	}
364238c8a9a5SSteve French 
364338c8a9a5SSteve French 	ctx->len = iov_iter_count(&ctx->iter);
364438c8a9a5SSteve French 
364538c8a9a5SSteve French 	/* grab a lock here due to read response handlers can access ctx */
364638c8a9a5SSteve French 	mutex_lock(&ctx->aio_mutex);
364738c8a9a5SSteve French 
364838c8a9a5SSteve French 	rc = cifs_write_from_iter(iocb->ki_pos, ctx->len, &ctx->iter,
364938c8a9a5SSteve French 				  cfile, cifs_sb, &ctx->list, ctx);
365038c8a9a5SSteve French 
365138c8a9a5SSteve French 	/*
365238c8a9a5SSteve French 	 * If at least one write was successfully sent, then discard any rc
365338c8a9a5SSteve French 	 * value from the later writes. If the other write succeeds, then
365438c8a9a5SSteve French 	 * we'll end up returning whatever was written. If it fails, then
365538c8a9a5SSteve French 	 * we'll get a new rc value from that.
365638c8a9a5SSteve French 	 */
365738c8a9a5SSteve French 	if (!list_empty(&ctx->list))
365838c8a9a5SSteve French 		rc = 0;
365938c8a9a5SSteve French 
366038c8a9a5SSteve French 	mutex_unlock(&ctx->aio_mutex);
366138c8a9a5SSteve French 
366238c8a9a5SSteve French 	if (rc) {
366338c8a9a5SSteve French 		kref_put(&ctx->refcount, cifs_aio_ctx_release);
366438c8a9a5SSteve French 		return rc;
366538c8a9a5SSteve French 	}
366638c8a9a5SSteve French 
366738c8a9a5SSteve French 	if (!is_sync_kiocb(iocb)) {
366838c8a9a5SSteve French 		kref_put(&ctx->refcount, cifs_aio_ctx_release);
366938c8a9a5SSteve French 		return -EIOCBQUEUED;
367038c8a9a5SSteve French 	}
367138c8a9a5SSteve French 
367238c8a9a5SSteve French 	rc = wait_for_completion_killable(&ctx->done);
367338c8a9a5SSteve French 	if (rc) {
367438c8a9a5SSteve French 		mutex_lock(&ctx->aio_mutex);
367538c8a9a5SSteve French 		ctx->rc = rc = -EINTR;
367638c8a9a5SSteve French 		total_written = ctx->total_len;
367738c8a9a5SSteve French 		mutex_unlock(&ctx->aio_mutex);
367838c8a9a5SSteve French 	} else {
367938c8a9a5SSteve French 		rc = ctx->rc;
368038c8a9a5SSteve French 		total_written = ctx->total_len;
368138c8a9a5SSteve French 	}
368238c8a9a5SSteve French 
368338c8a9a5SSteve French 	kref_put(&ctx->refcount, cifs_aio_ctx_release);
368438c8a9a5SSteve French 
368538c8a9a5SSteve French 	if (unlikely(!total_written))
368638c8a9a5SSteve French 		return rc;
368738c8a9a5SSteve French 
368838c8a9a5SSteve French 	iocb->ki_pos += total_written;
368938c8a9a5SSteve French 	return total_written;
369038c8a9a5SSteve French }
369138c8a9a5SSteve French 
369238c8a9a5SSteve French ssize_t cifs_direct_writev(struct kiocb *iocb, struct iov_iter *from)
369338c8a9a5SSteve French {
369438c8a9a5SSteve French 	struct file *file = iocb->ki_filp;
369538c8a9a5SSteve French 
369638c8a9a5SSteve French 	cifs_revalidate_mapping(file->f_inode);
369738c8a9a5SSteve French 	return __cifs_writev(iocb, from, true);
369838c8a9a5SSteve French }
369938c8a9a5SSteve French 
/*
 * Non-direct write entry point: a thin wrapper that calls __cifs_writev()
 * with the direct flag cleared and returns its result unchanged.
 */
ssize_t cifs_user_writev(struct kiocb *iocb, struct iov_iter *from)
{
	const bool direct = false;

	return __cifs_writev(iocb, from, direct);
}
370438c8a9a5SSteve French 
370538c8a9a5SSteve French static ssize_t
370638c8a9a5SSteve French cifs_writev(struct kiocb *iocb, struct iov_iter *from)
370738c8a9a5SSteve French {
370838c8a9a5SSteve French 	struct file *file = iocb->ki_filp;
370938c8a9a5SSteve French 	struct cifsFileInfo *cfile = (struct cifsFileInfo *)file->private_data;
371038c8a9a5SSteve French 	struct inode *inode = file->f_mapping->host;
371138c8a9a5SSteve French 	struct cifsInodeInfo *cinode = CIFS_I(inode);
371238c8a9a5SSteve French 	struct TCP_Server_Info *server = tlink_tcon(cfile->tlink)->ses->server;
371338c8a9a5SSteve French 	ssize_t rc;
371438c8a9a5SSteve French 
371538c8a9a5SSteve French 	inode_lock(inode);
371638c8a9a5SSteve French 	/*
371738c8a9a5SSteve French 	 * We need to hold the sem to be sure nobody modifies lock list
371838c8a9a5SSteve French 	 * with a brlock that prevents writing.
371938c8a9a5SSteve French 	 */
372038c8a9a5SSteve French 	down_read(&cinode->lock_sem);
372138c8a9a5SSteve French 
372238c8a9a5SSteve French 	rc = generic_write_checks(iocb, from);
372338c8a9a5SSteve French 	if (rc <= 0)
372438c8a9a5SSteve French 		goto out;
372538c8a9a5SSteve French 
372638c8a9a5SSteve French 	if (!cifs_find_lock_conflict(cfile, iocb->ki_pos, iov_iter_count(from),
372738c8a9a5SSteve French 				     server->vals->exclusive_lock_type, 0,
372838c8a9a5SSteve French 				     NULL, CIFS_WRITE_OP))
372938c8a9a5SSteve French 		rc = __generic_file_write_iter(iocb, from);
373038c8a9a5SSteve French 	else
373138c8a9a5SSteve French 		rc = -EACCES;
373238c8a9a5SSteve French out:
373338c8a9a5SSteve French 	up_read(&cinode->lock_sem);
373438c8a9a5SSteve French 	inode_unlock(inode);
373538c8a9a5SSteve French 
373638c8a9a5SSteve French 	if (rc > 0)
373738c8a9a5SSteve French 		rc = generic_write_sync(iocb, rc);
373838c8a9a5SSteve French 	return rc;
373938c8a9a5SSteve French }
374038c8a9a5SSteve French 
374138c8a9a5SSteve French ssize_t
374238c8a9a5SSteve French cifs_strict_writev(struct kiocb *iocb, struct iov_iter *from)
374338c8a9a5SSteve French {
374438c8a9a5SSteve French 	struct inode *inode = file_inode(iocb->ki_filp);
374538c8a9a5SSteve French 	struct cifsInodeInfo *cinode = CIFS_I(inode);
374638c8a9a5SSteve French 	struct cifs_sb_info *cifs_sb = CIFS_SB(inode->i_sb);
374738c8a9a5SSteve French 	struct cifsFileInfo *cfile = (struct cifsFileInfo *)
374838c8a9a5SSteve French 						iocb->ki_filp->private_data;
374938c8a9a5SSteve French 	struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
375038c8a9a5SSteve French 	ssize_t written;
375138c8a9a5SSteve French 
375238c8a9a5SSteve French 	written = cifs_get_writer(cinode);
375338c8a9a5SSteve French 	if (written)
375438c8a9a5SSteve French 		return written;
375538c8a9a5SSteve French 
375638c8a9a5SSteve French 	if (CIFS_CACHE_WRITE(cinode)) {
375738c8a9a5SSteve French 		if (cap_unix(tcon->ses) &&
375838c8a9a5SSteve French 		(CIFS_UNIX_FCNTL_CAP & le64_to_cpu(tcon->fsUnixInfo.Capability))
375938c8a9a5SSteve French 		  && ((cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOPOSIXBRL) == 0)) {
376038c8a9a5SSteve French 			written = generic_file_write_iter(iocb, from);
376138c8a9a5SSteve French 			goto out;
376238c8a9a5SSteve French 		}
376338c8a9a5SSteve French 		written = cifs_writev(iocb, from);
376438c8a9a5SSteve French 		goto out;
376538c8a9a5SSteve French 	}
376638c8a9a5SSteve French 	/*
376738c8a9a5SSteve French 	 * For non-oplocked files in strict cache mode we need to write the data
376838c8a9a5SSteve French 	 * to the server exactly from the pos to pos+len-1 rather than flush all
376938c8a9a5SSteve French 	 * affected pages because it may cause a error with mandatory locks on
377038c8a9a5SSteve French 	 * these pages but not on the region from pos to ppos+len-1.
377138c8a9a5SSteve French 	 */
377238c8a9a5SSteve French 	written = cifs_user_writev(iocb, from);
377338c8a9a5SSteve French 	if (CIFS_CACHE_READ(cinode)) {
377438c8a9a5SSteve French 		/*
377538c8a9a5SSteve French 		 * We have read level caching and we have just sent a write
377638c8a9a5SSteve French 		 * request to the server thus making data in the cache stale.
377738c8a9a5SSteve French 		 * Zap the cache and set oplock/lease level to NONE to avoid
377838c8a9a5SSteve French 		 * reading stale data from the cache. All subsequent read
377938c8a9a5SSteve French 		 * operations will read new data from the server.
378038c8a9a5SSteve French 		 */
378138c8a9a5SSteve French 		cifs_zap_mapping(inode);
378238c8a9a5SSteve French 		cifs_dbg(FYI, "Set Oplock/Lease to NONE for inode=%p after write\n",
378338c8a9a5SSteve French 			 inode);
378438c8a9a5SSteve French 		cinode->oplock = 0;
378538c8a9a5SSteve French 	}
378638c8a9a5SSteve French out:
378738c8a9a5SSteve French 	cifs_put_writer(cinode);
378838c8a9a5SSteve French 	return written;
378938c8a9a5SSteve French }
379038c8a9a5SSteve French 
379138c8a9a5SSteve French static struct cifs_readdata *cifs_readdata_alloc(work_func_t complete)
379238c8a9a5SSteve French {
379338c8a9a5SSteve French 	struct cifs_readdata *rdata;
379438c8a9a5SSteve French 
379538c8a9a5SSteve French 	rdata = kzalloc(sizeof(*rdata), GFP_KERNEL);
379638c8a9a5SSteve French 	if (rdata) {
379738c8a9a5SSteve French 		kref_init(&rdata->refcount);
379838c8a9a5SSteve French 		INIT_LIST_HEAD(&rdata->list);
379938c8a9a5SSteve French 		init_completion(&rdata->done);
380038c8a9a5SSteve French 		INIT_WORK(&rdata->work, complete);
380138c8a9a5SSteve French 	}
380238c8a9a5SSteve French 
380338c8a9a5SSteve French 	return rdata;
380438c8a9a5SSteve French }
380538c8a9a5SSteve French 
380638c8a9a5SSteve French void
380738c8a9a5SSteve French cifs_readdata_release(struct kref *refcount)
380838c8a9a5SSteve French {
380938c8a9a5SSteve French 	struct cifs_readdata *rdata = container_of(refcount,
381038c8a9a5SSteve French 					struct cifs_readdata, refcount);
381138c8a9a5SSteve French 
381238c8a9a5SSteve French 	if (rdata->ctx)
381338c8a9a5SSteve French 		kref_put(&rdata->ctx->refcount, cifs_aio_ctx_release);
381438c8a9a5SSteve French #ifdef CONFIG_CIFS_SMB_DIRECT
381538c8a9a5SSteve French 	if (rdata->mr) {
381638c8a9a5SSteve French 		smbd_deregister_mr(rdata->mr);
381738c8a9a5SSteve French 		rdata->mr = NULL;
381838c8a9a5SSteve French 	}
381938c8a9a5SSteve French #endif
382038c8a9a5SSteve French 	if (rdata->cfile)
382138c8a9a5SSteve French 		cifsFileInfo_put(rdata->cfile);
382238c8a9a5SSteve French 
382338c8a9a5SSteve French 	kfree(rdata);
382438c8a9a5SSteve French }
382538c8a9a5SSteve French 
382638c8a9a5SSteve French static void collect_uncached_read_data(struct cifs_aio_ctx *ctx);
382738c8a9a5SSteve French 
382838c8a9a5SSteve French static void
382938c8a9a5SSteve French cifs_uncached_readv_complete(struct work_struct *work)
383038c8a9a5SSteve French {
383138c8a9a5SSteve French 	struct cifs_readdata *rdata = container_of(work,
383238c8a9a5SSteve French 						struct cifs_readdata, work);
383338c8a9a5SSteve French 
383438c8a9a5SSteve French 	complete(&rdata->done);
383538c8a9a5SSteve French 	collect_uncached_read_data(rdata->ctx);
383638c8a9a5SSteve French 	/* the below call can possibly free the last ref to aio ctx */
383738c8a9a5SSteve French 	kref_put(&rdata->refcount, cifs_readdata_release);
383838c8a9a5SSteve French }
383938c8a9a5SSteve French 
/*
 * cifs_resend_rdata - send an existing read request again, in one piece
 * @rdata:	request to resend; its server, cfile and bytes fields are reused
 * @rdata_list:	list @rdata is appended to after a successful send
 * @ctx:	aio context; not referenced in this function body
 *
 * Return: 0 once ->async_readv() accepted the request, in which case @rdata
 * has been added to the tail of @rdata_list.  Otherwise one reference on
 * @rdata is dropped and the failing rc is returned.
 *
 * -EAGAIN from cifs_reopen_file(), from the adjust_credits()/invalid-handle
 * step or from ->async_readv() restarts the outer loop.  A failure of
 * ->wait_mtu_credits() is never retried.
 */
384038c8a9a5SSteve French static int cifs_resend_rdata(struct cifs_readdata *rdata,
384138c8a9a5SSteve French 			struct list_head *rdata_list,
384238c8a9a5SSteve French 			struct cifs_aio_ctx *ctx)
384338c8a9a5SSteve French {
384438c8a9a5SSteve French 	unsigned int rsize;
384538c8a9a5SSteve French 	struct cifs_credits credits;
384638c8a9a5SSteve French 	int rc;
384738c8a9a5SSteve French 	struct TCP_Server_Info *server;
384838c8a9a5SSteve French 
384938c8a9a5SSteve French 	/* XXX: should we pick a new channel here? */
385038c8a9a5SSteve French 	server = rdata->server;
385138c8a9a5SSteve French 
385238c8a9a5SSteve French 	do {
		/* reopen the handle first if it has been marked invalid */
385338c8a9a5SSteve French 		if (rdata->cfile->invalidHandle) {
385438c8a9a5SSteve French 			rc = cifs_reopen_file(rdata->cfile, true);
			/*
			 * continue jumps to the loop condition below, which
			 * holds for -EAGAIN, so the reopen is tried again
			 */
385538c8a9a5SSteve French 			if (rc == -EAGAIN)
385638c8a9a5SSteve French 				continue;
385738c8a9a5SSteve French 			else if (rc)
385838c8a9a5SSteve French 				break;
385938c8a9a5SSteve French 		}
386038c8a9a5SSteve French 
386138c8a9a5SSteve French 		/*
386238c8a9a5SSteve French 		 * Wait for credits to resend this rdata.
386338c8a9a5SSteve French 		 * Note: we are attempting to resend the whole rdata not in
386438c8a9a5SSteve French 		 * segments
386538c8a9a5SSteve French 		 */
386638c8a9a5SSteve French 		do {
386738c8a9a5SSteve French 			rc = server->ops->wait_mtu_credits(server, rdata->bytes,
386838c8a9a5SSteve French 						&rsize, &credits);
386938c8a9a5SSteve French 
			/* this exit bypasses the credit rollback at the loop end */
387038c8a9a5SSteve French 			if (rc)
387138c8a9a5SSteve French 				goto fail;
387238c8a9a5SSteve French 
			/*
			 * Size reported in rsize is too small for the whole
			 * request: hand the credits back, sleep for one
			 * second and ask again.
			 */
387338c8a9a5SSteve French 			if (rsize < rdata->bytes) {
387438c8a9a5SSteve French 				add_credits_and_wake_if(server, &credits, 0);
387538c8a9a5SSteve French 				msleep(1000);
387638c8a9a5SSteve French 			}
387738c8a9a5SSteve French 		} while (rsize < rdata->bytes);
387838c8a9a5SSteve French 		rdata->credits = credits;
387938c8a9a5SSteve French 
388038c8a9a5SSteve French 		rc = adjust_credits(server, &rdata->credits, rdata->bytes);
388138c8a9a5SSteve French 		if (!rc) {
			/* handle became invalid meanwhile: go round again */
388238c8a9a5SSteve French 			if (rdata->cfile->invalidHandle)
388338c8a9a5SSteve French 				rc = -EAGAIN;
388438c8a9a5SSteve French 			else {
388538c8a9a5SSteve French #ifdef CONFIG_CIFS_SMB_DIRECT
				/* drop the memory registration left from the previous send */
388638c8a9a5SSteve French 				if (rdata->mr) {
388738c8a9a5SSteve French 					rdata->mr->need_invalidate = true;
388838c8a9a5SSteve French 					smbd_deregister_mr(rdata->mr);
388938c8a9a5SSteve French 					rdata->mr = NULL;
389038c8a9a5SSteve French 				}
389138c8a9a5SSteve French #endif
389238c8a9a5SSteve French 				rc = server->ops->async_readv(rdata);
389338c8a9a5SSteve French 			}
389438c8a9a5SSteve French 		}
389538c8a9a5SSteve French 
389638c8a9a5SSteve French 		/* If the read was successfully sent, we are done */
389738c8a9a5SSteve French 		if (!rc) {
389838c8a9a5SSteve French 			/* Add to aio pending list */
389938c8a9a5SSteve French 			list_add_tail(&rdata->list, rdata_list);
390038c8a9a5SSteve French 			return 0;
390138c8a9a5SSteve French 		}
390238c8a9a5SSteve French 
390338c8a9a5SSteve French 		/* Roll back credits and retry if needed */
390438c8a9a5SSteve French 		add_credits_and_wake_if(server, &rdata->credits, 0);
390538c8a9a5SSteve French 	} while (rc == -EAGAIN);
390638c8a9a5SSteve French 
390738c8a9a5SSteve French fail:
	/* the request was not queued; give up the caller's reference on it */
390838c8a9a5SSteve French 	kref_put(&rdata->refcount, cifs_readdata_release);
390938c8a9a5SSteve French 	return rc;
391038c8a9a5SSteve French }
391138c8a9a5SSteve French 
/*
 * cifs_send_async_read - split a byte range into read requests and send them
 * @fpos:	file offset of the first byte to read
 * @len:	number of bytes to read
 * @open_file:	open file the reads are issued against
 * @cifs_sb:	superblock info; supplies the mount flags and ctx->rsize
 * @rdata_list:	list each successfully sent request is appended to
 * @ctx:	aio context; its iterator describes the destination and is
 *		advanced past every chunk that was sent
 *
 * Each loop pass obtains credits, sizes a chunk, allocates a request for it
 * and submits it through ->async_readv().  Every request takes a reference
 * on @open_file and on @ctx.
 *
 * Return: 0 when the whole range was submitted, otherwise the rc of the step
 * that stopped the loop.  Requests already placed on @rdata_list stay there.
 */
391238c8a9a5SSteve French static int
391338c8a9a5SSteve French cifs_send_async_read(loff_t fpos, size_t len, struct cifsFileInfo *open_file,
391438c8a9a5SSteve French 		     struct cifs_sb_info *cifs_sb, struct list_head *rdata_list,
391538c8a9a5SSteve French 		     struct cifs_aio_ctx *ctx)
391638c8a9a5SSteve French {
391738c8a9a5SSteve French 	struct cifs_readdata *rdata;
391838c8a9a5SSteve French 	unsigned int rsize, nsegs, max_segs = INT_MAX;
391938c8a9a5SSteve French 	struct cifs_credits credits_on_stack;
392038c8a9a5SSteve French 	struct cifs_credits *credits = &credits_on_stack;
392138c8a9a5SSteve French 	size_t cur_len, max_len;
392238c8a9a5SSteve French 	int rc;
392338c8a9a5SSteve French 	pid_t pid;
392438c8a9a5SSteve French 	struct TCP_Server_Info *server;
392538c8a9a5SSteve French 
392638c8a9a5SSteve French 	server = cifs_pick_channel(tlink_tcon(open_file->tlink)->ses);
392738c8a9a5SSteve French 
392838c8a9a5SSteve French #ifdef CONFIG_CIFS_SMB_DIRECT
	/* on an smbdirect connection the segment count per request is capped */
392938c8a9a5SSteve French 	if (server->smbd_conn)
393038c8a9a5SSteve French 		max_segs = server->smbd_conn->max_frmr_depth;
393138c8a9a5SSteve French #endif
393238c8a9a5SSteve French 
	/* pid placed in each request: the opener's or the current task's tgid */
393338c8a9a5SSteve French 	if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_RWPIDFORWARD)
393438c8a9a5SSteve French 		pid = open_file->pid;
393538c8a9a5SSteve French 	else
393638c8a9a5SSteve French 		pid = current->tgid;
393738c8a9a5SSteve French 
393838c8a9a5SSteve French 	do {
393938c8a9a5SSteve French 		if (open_file->invalidHandle) {
394038c8a9a5SSteve French 			rc = cifs_reopen_file(open_file, true);
			/*
			 * continue re-tests len > 0; len is unchanged here,
			 * so the same range is attempted again
			 */
394138c8a9a5SSteve French 			if (rc == -EAGAIN)
394238c8a9a5SSteve French 				continue;
394338c8a9a5SSteve French 			else if (rc)
394438c8a9a5SSteve French 				break;
394538c8a9a5SSteve French 		}
394638c8a9a5SSteve French 
		/* an rsize of 0 means it has not been negotiated yet */
394738c8a9a5SSteve French 		if (cifs_sb->ctx->rsize == 0)
394838c8a9a5SSteve French 			cifs_sb->ctx->rsize =
394938c8a9a5SSteve French 				server->ops->negotiate_rsize(tlink_tcon(open_file->tlink),
395038c8a9a5SSteve French 							     cifs_sb->ctx);
395138c8a9a5SSteve French 
395238c8a9a5SSteve French 		rc = server->ops->wait_mtu_credits(server, cifs_sb->ctx->rsize,
395338c8a9a5SSteve French 						   &rsize, credits);
395438c8a9a5SSteve French 		if (rc)
395538c8a9a5SSteve French 			break;
395638c8a9a5SSteve French 
395738c8a9a5SSteve French 		max_len = min_t(size_t, len, rsize);
395838c8a9a5SSteve French 
		/* chunk size is bounded by both max_len and max_segs */
395938c8a9a5SSteve French 		cur_len = cifs_limit_bvec_subset(&ctx->iter, max_len,
396038c8a9a5SSteve French 						 max_segs, &nsegs);
396138c8a9a5SSteve French 		cifs_dbg(FYI, "read-to-iter len=%zx/%zx nsegs=%u/%lu/%u\n",
396238c8a9a5SSteve French 			 cur_len, max_len, nsegs, ctx->iter.nr_segs, max_segs);
		/* no progress possible: return the credits and fail with -EIO */
396338c8a9a5SSteve French 		if (cur_len == 0) {
396438c8a9a5SSteve French 			rc = -EIO;
396538c8a9a5SSteve French 			add_credits_and_wake_if(server, credits, 0);
396638c8a9a5SSteve French 			break;
396738c8a9a5SSteve French 		}
396838c8a9a5SSteve French 
396938c8a9a5SSteve French 		rdata = cifs_readdata_alloc(cifs_uncached_readv_complete);
397038c8a9a5SSteve French 		if (!rdata) {
397138c8a9a5SSteve French 			add_credits_and_wake_if(server, credits, 0);
397238c8a9a5SSteve French 			rc = -ENOMEM;
397338c8a9a5SSteve French 			break;
397438c8a9a5SSteve French 		}
397538c8a9a5SSteve French 
397638c8a9a5SSteve French 		rdata->server	= server;
397738c8a9a5SSteve French 		rdata->cfile	= cifsFileInfo_get(open_file);
397838c8a9a5SSteve French 		rdata->offset	= fpos;
397938c8a9a5SSteve French 		rdata->bytes	= cur_len;
398038c8a9a5SSteve French 		rdata->pid	= pid;
398138c8a9a5SSteve French 		rdata->credits	= credits_on_stack;
398238c8a9a5SSteve French 		rdata->ctx	= ctx;
		/* reference for rdata->ctx; dropped in cifs_readdata_release() */
398338c8a9a5SSteve French 		kref_get(&ctx->refcount);
398438c8a9a5SSteve French 
		/* the request gets its own iterator copy, cut down to this chunk */
398538c8a9a5SSteve French 		rdata->iter	= ctx->iter;
398638c8a9a5SSteve French 		iov_iter_truncate(&rdata->iter, cur_len);
398738c8a9a5SSteve French 
398838c8a9a5SSteve French 		rc = adjust_credits(server, &rdata->credits, rdata->bytes);
398938c8a9a5SSteve French 
399038c8a9a5SSteve French 		if (!rc) {
399138c8a9a5SSteve French 			if (rdata->cfile->invalidHandle)
399238c8a9a5SSteve French 				rc = -EAGAIN;
399338c8a9a5SSteve French 			else
399438c8a9a5SSteve French 				rc = server->ops->async_readv(rdata);
399538c8a9a5SSteve French 		}
399638c8a9a5SSteve French 
		/*
		 * Send failed: give the credits back and release the request.
		 * fpos, len and ctx->iter are untouched, so an -EAGAIN retry
		 * rebuilds a request for the same range.
		 */
399738c8a9a5SSteve French 		if (rc) {
399838c8a9a5SSteve French 			add_credits_and_wake_if(server, &rdata->credits, 0);
399938c8a9a5SSteve French 			kref_put(&rdata->refcount, cifs_readdata_release);
400038c8a9a5SSteve French 			if (rc == -EAGAIN)
400138c8a9a5SSteve French 				continue;
400238c8a9a5SSteve French 			break;
400338c8a9a5SSteve French 		}
400438c8a9a5SSteve French 
		/* sent: queue the request and move on to the next chunk */
400538c8a9a5SSteve French 		list_add_tail(&rdata->list, rdata_list);
400638c8a9a5SSteve French 		iov_iter_advance(&ctx->iter, cur_len);
400738c8a9a5SSteve French 		fpos += cur_len;
400838c8a9a5SSteve French 		len -= cur_len;
400938c8a9a5SSteve French 	} while (len > 0);
401038c8a9a5SSteve French 
401138c8a9a5SSteve French 	return rc;
401238c8a9a5SSteve French }
401338c8a9a5SSteve French 
/*
 * collect_uncached_read_data - gather results of the reads queued on @ctx
 * @ctx:	aio context whose ->list holds the outstanding read requests
 *
 * Runs with ctx->aio_mutex held.  Returns without doing anything when the
 * list is empty, and returns early (leaving the remaining requests queued)
 * as soon as it meets a request that has not completed yet while no error
 * has been recorded.
 *
 * Otherwise every request is taken off the list and released.  While rc is
 * still 0, a request's got_bytes is added to ctx->total_len; a request that
 * finished with -EAGAIN is sent again and the walk restarts.  Once rc is
 * non-zero the remaining requests are dropped without being counted.
 *
 * When the list has been drained, ctx->rc is set to the byte total or to
 * the error and the waiter is notified through ->ki_complete() if the
 * context has an iocb with that callback, else through ctx->done.
 */
401438c8a9a5SSteve French static void
401538c8a9a5SSteve French collect_uncached_read_data(struct cifs_aio_ctx *ctx)
401638c8a9a5SSteve French {
401738c8a9a5SSteve French 	struct cifs_readdata *rdata, *tmp;
401838c8a9a5SSteve French 	struct cifs_sb_info *cifs_sb;
401938c8a9a5SSteve French 	int rc;
402038c8a9a5SSteve French 
402138c8a9a5SSteve French 	cifs_sb = CIFS_SB(ctx->cfile->dentry->d_sb);
402238c8a9a5SSteve French 
402338c8a9a5SSteve French 	mutex_lock(&ctx->aio_mutex);
402438c8a9a5SSteve French 
402538c8a9a5SSteve French 	if (list_empty(&ctx->list)) {
402638c8a9a5SSteve French 		mutex_unlock(&ctx->aio_mutex);
402738c8a9a5SSteve French 		return;
402838c8a9a5SSteve French 	}
402938c8a9a5SSteve French 
	/* start from any error already stored in the context */
403038c8a9a5SSteve French 	rc = ctx->rc;
403138c8a9a5SSteve French 	/* the loop below should proceed in the order of increasing offsets */
403238c8a9a5SSteve French again:
403338c8a9a5SSteve French 	list_for_each_entry_safe(rdata, tmp, &ctx->list, list) {
403438c8a9a5SSteve French 		if (!rc) {
			/* not finished yet: leave it and the rest for a later call */
403538c8a9a5SSteve French 			if (!try_wait_for_completion(&rdata->done)) {
403638c8a9a5SSteve French 				mutex_unlock(&ctx->aio_mutex);
403738c8a9a5SSteve French 				return;
403838c8a9a5SSteve French 			}
403938c8a9a5SSteve French 
404038c8a9a5SSteve French 			if (rdata->result == -EAGAIN) {
404138c8a9a5SSteve French 				/* resend call if it's a retryable error */
404238c8a9a5SSteve French 				struct list_head tmp_list;
404338c8a9a5SSteve French 				unsigned int got_bytes = rdata->got_bytes;
404438c8a9a5SSteve French 
404538c8a9a5SSteve French 				list_del_init(&rdata->list);
404638c8a9a5SSteve French 				INIT_LIST_HEAD(&tmp_list);
404738c8a9a5SSteve French 
404838c8a9a5SSteve French 				if (ctx->direct_io) {
404938c8a9a5SSteve French 					/*
405038c8a9a5SSteve French 					 * Re-use rdata as this is a
405138c8a9a5SSteve French 					 * direct I/O
405238c8a9a5SSteve French 					 */
405338c8a9a5SSteve French 					rc = cifs_resend_rdata(
405438c8a9a5SSteve French 						rdata,
405538c8a9a5SSteve French 						&tmp_list, ctx);
405638c8a9a5SSteve French 				} else {
					/*
					 * Issue new requests for the part
					 * that was not received, then drop
					 * the old request.
					 */
405738c8a9a5SSteve French 					rc = cifs_send_async_read(
405838c8a9a5SSteve French 						rdata->offset + got_bytes,
405938c8a9a5SSteve French 						rdata->bytes - got_bytes,
406038c8a9a5SSteve French 						rdata->cfile, cifs_sb,
406138c8a9a5SSteve French 						&tmp_list, ctx);
406238c8a9a5SSteve French 
406338c8a9a5SSteve French 					kref_put(&rdata->refcount,
406438c8a9a5SSteve French 						cifs_readdata_release);
406538c8a9a5SSteve French 				}
406638c8a9a5SSteve French 
				/* merge whatever was re-queued back into ctx->list */
406738c8a9a5SSteve French 				list_splice(&tmp_list, &ctx->list);
406838c8a9a5SSteve French 
				/* the list changed under the iterator: restart the walk */
406938c8a9a5SSteve French 				goto again;
407038c8a9a5SSteve French 			} else if (rdata->result)
407138c8a9a5SSteve French 				rc = rdata->result;
407238c8a9a5SSteve French 
407338c8a9a5SSteve French 			/* if there was a short read -- discard anything left */
407438c8a9a5SSteve French 			if (rdata->got_bytes && rdata->got_bytes < rdata->bytes)
407538c8a9a5SSteve French 				rc = -ENODATA;
407638c8a9a5SSteve French 
407738c8a9a5SSteve French 			ctx->total_len += rdata->got_bytes;
407838c8a9a5SSteve French 		}
		/* reached for counted and for discarded requests alike */
407938c8a9a5SSteve French 		list_del_init(&rdata->list);
408038c8a9a5SSteve French 		kref_put(&rdata->refcount, cifs_readdata_release);
408138c8a9a5SSteve French 	}
408238c8a9a5SSteve French 
408338c8a9a5SSteve French 	/* mask nodata case */
408438c8a9a5SSteve French 	if (rc == -ENODATA)
408538c8a9a5SSteve French 		rc = 0;
408638c8a9a5SSteve French 
	/* success is reported as the number of bytes collected */
408738c8a9a5SSteve French 	ctx->rc = (rc == 0) ? (ssize_t)ctx->total_len : rc;
408838c8a9a5SSteve French 
408938c8a9a5SSteve French 	mutex_unlock(&ctx->aio_mutex);
409038c8a9a5SSteve French 
409138c8a9a5SSteve French 	if (ctx->iocb && ctx->iocb->ki_complete)
409238c8a9a5SSteve French 		ctx->iocb->ki_complete(ctx->iocb, ctx->rc);
409338c8a9a5SSteve French 	else
409438c8a9a5SSteve French 		complete(&ctx->done);
409538c8a9a5SSteve French }
409638c8a9a5SSteve French 
/*
 * __cifs_readv - common body of the direct and non-direct read entry points
 * @iocb:	kiocb describing the file, the position and sync vs. async
 * @to:		destination iterator
 * @direct:	true when called for direct I/O
 *
 * Builds an aio context for the request, prepares an iterator that can be
 * used from the completion side, and submits the reads with
 * cifs_send_async_read().
 *
 * Return:
 *   0 when @to is empty;
 *   -ENOSYS when the server ops have no ->async_readv;
 *   -ENOMEM or the iterator-extraction error when setup fails;
 *   -EAGAIN when, for direct I/O, writing back the range fails;
 *   the submit error when no request at all could be sent;
 *   -EIOCBQUEUED for an asynchronous @iocb once requests are in flight;
 *   for a synchronous @iocb, the number of bytes read if that is non-zero
 *   (ki_pos is advanced by it), otherwise ctx->rc, or -EINTR when the wait
 *   was interrupted.
 *
 * Every exit after the allocation drops this function's ctx reference.
 */
409738c8a9a5SSteve French static ssize_t __cifs_readv(
409838c8a9a5SSteve French 	struct kiocb *iocb, struct iov_iter *to, bool direct)
409938c8a9a5SSteve French {
410038c8a9a5SSteve French 	size_t len;
410138c8a9a5SSteve French 	struct file *file = iocb->ki_filp;
410238c8a9a5SSteve French 	struct cifs_sb_info *cifs_sb;
410338c8a9a5SSteve French 	struct cifsFileInfo *cfile;
410438c8a9a5SSteve French 	struct cifs_tcon *tcon;
410538c8a9a5SSteve French 	ssize_t rc, total_read = 0;
410638c8a9a5SSteve French 	loff_t offset = iocb->ki_pos;
410738c8a9a5SSteve French 	struct cifs_aio_ctx *ctx;
410838c8a9a5SSteve French 
410938c8a9a5SSteve French 	len = iov_iter_count(to);
411038c8a9a5SSteve French 	if (!len)
411138c8a9a5SSteve French 		return 0;
411238c8a9a5SSteve French 
411338c8a9a5SSteve French 	cifs_sb = CIFS_FILE_SB(file);
411438c8a9a5SSteve French 	cfile = file->private_data;
411538c8a9a5SSteve French 	tcon = tlink_tcon(cfile->tlink);
411638c8a9a5SSteve French 
411738c8a9a5SSteve French 	if (!tcon->ses->server->ops->async_readv)
411838c8a9a5SSteve French 		return -ENOSYS;
411938c8a9a5SSteve French 
	/* only logged; the read is still attempted */
412038c8a9a5SSteve French 	if ((file->f_flags & O_ACCMODE) == O_WRONLY)
412138c8a9a5SSteve French 		cifs_dbg(FYI, "attempting read on write only file instance\n");
412238c8a9a5SSteve French 
412338c8a9a5SSteve French 	ctx = cifs_aio_ctx_alloc();
412438c8a9a5SSteve French 	if (!ctx)
412538c8a9a5SSteve French 		return -ENOMEM;
412638c8a9a5SSteve French 
412738c8a9a5SSteve French 	ctx->pos	= offset;
412838c8a9a5SSteve French 	ctx->direct_io	= direct;
412938c8a9a5SSteve French 	ctx->len	= len;
413038c8a9a5SSteve French 	ctx->cfile	= cifsFileInfo_get(cfile);
413138c8a9a5SSteve French 	ctx->nr_pinned_pages = 0;
413238c8a9a5SSteve French 
	/* ctx->iocb is set only for async requests; completion checks it */
413338c8a9a5SSteve French 	if (!is_sync_kiocb(iocb))
413438c8a9a5SSteve French 		ctx->iocb = iocb;
413538c8a9a5SSteve French 
413638c8a9a5SSteve French 	if (user_backed_iter(to)) {
413738c8a9a5SSteve French 		/*
413838c8a9a5SSteve French 		 * Extract IOVEC/UBUF-type iterators to a BVEC-type iterator as
413938c8a9a5SSteve French 		 * they contain references to the calling process's virtual
414038c8a9a5SSteve French 		 * memory layout which won't be available in an async worker
414138c8a9a5SSteve French 		 * thread.  This also takes a pin on every folio involved.
414238c8a9a5SSteve French 		 */
414338c8a9a5SSteve French 		rc = netfs_extract_user_iter(to, iov_iter_count(to),
414438c8a9a5SSteve French 					     &ctx->iter, 0);
414538c8a9a5SSteve French 		if (rc < 0) {
414638c8a9a5SSteve French 			kref_put(&ctx->refcount, cifs_aio_ctx_release);
414738c8a9a5SSteve French 			return rc;
414838c8a9a5SSteve French 		}
414938c8a9a5SSteve French 
		/* a non-negative rc is stored as the pinned-page count */
415038c8a9a5SSteve French 		ctx->nr_pinned_pages = rc;
415138c8a9a5SSteve French 		ctx->bv = (void *)ctx->iter.bvec;
415238c8a9a5SSteve French 		ctx->bv_need_unpin = iov_iter_extract_will_pin(to);
415338c8a9a5SSteve French 		ctx->should_dirty = true;
415438c8a9a5SSteve French 	} else if ((iov_iter_is_bvec(to) || iov_iter_is_kvec(to)) &&
415538c8a9a5SSteve French 		   !is_sync_kiocb(iocb)) {
415638c8a9a5SSteve French 		/*
415738c8a9a5SSteve French 		 * If the op is asynchronous, we need to copy the list attached
415838c8a9a5SSteve French 		 * to a BVEC/KVEC-type iterator, but we assume that the storage
415938c8a9a5SSteve French 		 * will be retained by the caller; in any case, we may or may
416038c8a9a5SSteve French 		 * not be able to pin the pages, so we don't try.
416138c8a9a5SSteve French 		 */
416238c8a9a5SSteve French 		ctx->bv = (void *)dup_iter(&ctx->iter, to, GFP_KERNEL);
416338c8a9a5SSteve French 		if (!ctx->bv) {
416438c8a9a5SSteve French 			kref_put(&ctx->refcount, cifs_aio_ctx_release);
416538c8a9a5SSteve French 			return -ENOMEM;
416638c8a9a5SSteve French 		}
416738c8a9a5SSteve French 	} else {
416838c8a9a5SSteve French 		/*
416938c8a9a5SSteve French 		 * Otherwise, we just pass the iterator down as-is and rely on
417038c8a9a5SSteve French 		 * the caller to make sure the pages referred to by the
417138c8a9a5SSteve French 		 * iterator don't evaporate.
417238c8a9a5SSteve French 		 */
417338c8a9a5SSteve French 		ctx->iter = *to;
417438c8a9a5SSteve French 	}
417538c8a9a5SSteve French 
417638c8a9a5SSteve French 	if (direct) {
		/*
		 * Write back the affected range before reading it directly.
		 * NOTE(review): any failure here is reported as -EAGAIN and
		 * the original rc is dropped -- confirm this is intended.
		 */
417738c8a9a5SSteve French 		rc = filemap_write_and_wait_range(file->f_inode->i_mapping,
417838c8a9a5SSteve French 						  offset, offset + len - 1);
417938c8a9a5SSteve French 		if (rc) {
418038c8a9a5SSteve French 			kref_put(&ctx->refcount, cifs_aio_ctx_release);
418138c8a9a5SSteve French 			return -EAGAIN;
418238c8a9a5SSteve French 		}
418338c8a9a5SSteve French 	}
418438c8a9a5SSteve French 
418538c8a9a5SSteve French 	/* grab a lock here due to read response handlers can access ctx */
418638c8a9a5SSteve French 	mutex_lock(&ctx->aio_mutex);
418738c8a9a5SSteve French 
418838c8a9a5SSteve French 	rc = cifs_send_async_read(offset, len, cfile, cifs_sb, &ctx->list, ctx);
418938c8a9a5SSteve French 
419038c8a9a5SSteve French 	/* if at least one read request send succeeded, then reset rc */
419138c8a9a5SSteve French 	if (!list_empty(&ctx->list))
419238c8a9a5SSteve French 		rc = 0;
419338c8a9a5SSteve French 
419438c8a9a5SSteve French 	mutex_unlock(&ctx->aio_mutex);
419538c8a9a5SSteve French 
	/* nothing was queued at all: fail with the submit error */
419638c8a9a5SSteve French 	if (rc) {
419738c8a9a5SSteve French 		kref_put(&ctx->refcount, cifs_aio_ctx_release);
419838c8a9a5SSteve French 		return rc;
419938c8a9a5SSteve French 	}
420038c8a9a5SSteve French 
	/* async caller: the result is delivered later via ->ki_complete() */
420138c8a9a5SSteve French 	if (!is_sync_kiocb(iocb)) {
420238c8a9a5SSteve French 		kref_put(&ctx->refcount, cifs_aio_ctx_release);
420338c8a9a5SSteve French 		return -EIOCBQUEUED;
420438c8a9a5SSteve French 	}
420538c8a9a5SSteve French 
420638c8a9a5SSteve French 	rc = wait_for_completion_killable(&ctx->done);
420738c8a9a5SSteve French 	if (rc) {
		/*
		 * Wait was interrupted: store -EINTR in the context under the
		 * mutex and report what has been collected so far.
		 */
420838c8a9a5SSteve French 		mutex_lock(&ctx->aio_mutex);
420938c8a9a5SSteve French 		ctx->rc = rc = -EINTR;
421038c8a9a5SSteve French 		total_read = ctx->total_len;
421138c8a9a5SSteve French 		mutex_unlock(&ctx->aio_mutex);
421238c8a9a5SSteve French 	} else {
421338c8a9a5SSteve French 		rc = ctx->rc;
421438c8a9a5SSteve French 		total_read = ctx->total_len;
421538c8a9a5SSteve French 	}
421638c8a9a5SSteve French 
421738c8a9a5SSteve French 	kref_put(&ctx->refcount, cifs_aio_ctx_release);
421838c8a9a5SSteve French 
	/* a non-zero byte count takes precedence over rc */
421938c8a9a5SSteve French 	if (total_read) {
422038c8a9a5SSteve French 		iocb->ki_pos += total_read;
422138c8a9a5SSteve French 		return total_read;
422238c8a9a5SSteve French 	}
422338c8a9a5SSteve French 	return rc;
422438c8a9a5SSteve French }
422538c8a9a5SSteve French 
/*
 * Direct-I/O read entry point: a thin wrapper that calls __cifs_readv()
 * with the direct flag set and returns its result unchanged.
 */
ssize_t cifs_direct_readv(struct kiocb *iocb, struct iov_iter *to)
{
	const bool direct = true;

	return __cifs_readv(iocb, to, direct);
}
423038c8a9a5SSteve French 
/*
 * Non-direct read entry point: a thin wrapper that calls __cifs_readv()
 * with the direct flag cleared and returns its result unchanged.
 */
ssize_t cifs_user_readv(struct kiocb *iocb, struct iov_iter *to)
{
	const bool direct = false;

	return __cifs_readv(iocb, to, direct);
}
423538c8a9a5SSteve French 
423638c8a9a5SSteve French ssize_t
423738c8a9a5SSteve French cifs_strict_readv(struct kiocb *iocb, struct iov_iter *to)
423838c8a9a5SSteve French {
423938c8a9a5SSteve French 	struct inode *inode = file_inode(iocb->ki_filp);
424038c8a9a5SSteve French 	struct cifsInodeInfo *cinode = CIFS_I(inode);
424138c8a9a5SSteve French 	struct cifs_sb_info *cifs_sb = CIFS_SB(inode->i_sb);
424238c8a9a5SSteve French 	struct cifsFileInfo *cfile = (struct cifsFileInfo *)
424338c8a9a5SSteve French 						iocb->ki_filp->private_data;
424438c8a9a5SSteve French 	struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
424538c8a9a5SSteve French 	int rc = -EACCES;
424638c8a9a5SSteve French 
424738c8a9a5SSteve French 	/*
424838c8a9a5SSteve French 	 * In strict cache mode we need to read from the server all the time
424938c8a9a5SSteve French 	 * if we don't have level II oplock because the server can delay mtime
425038c8a9a5SSteve French 	 * change - so we can't make a decision about inode invalidating.
425138c8a9a5SSteve French 	 * And we can also fail with pagereading if there are mandatory locks
425238c8a9a5SSteve French 	 * on pages affected by this read but not on the region from pos to
425338c8a9a5SSteve French 	 * pos+len-1.
425438c8a9a5SSteve French 	 */
425538c8a9a5SSteve French 	if (!CIFS_CACHE_READ(cinode))
425638c8a9a5SSteve French 		return cifs_user_readv(iocb, to);
425738c8a9a5SSteve French 
425838c8a9a5SSteve French 	if (cap_unix(tcon->ses) &&
425938c8a9a5SSteve French 	    (CIFS_UNIX_FCNTL_CAP & le64_to_cpu(tcon->fsUnixInfo.Capability)) &&
426038c8a9a5SSteve French 	    ((cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOPOSIXBRL) == 0))
426138c8a9a5SSteve French 		return generic_file_read_iter(iocb, to);
426238c8a9a5SSteve French 
426338c8a9a5SSteve French 	/*
426438c8a9a5SSteve French 	 * We need to hold the sem to be sure nobody modifies lock list
426538c8a9a5SSteve French 	 * with a brlock that prevents reading.
426638c8a9a5SSteve French 	 */
426738c8a9a5SSteve French 	down_read(&cinode->lock_sem);
426838c8a9a5SSteve French 	if (!cifs_find_lock_conflict(cfile, iocb->ki_pos, iov_iter_count(to),
426938c8a9a5SSteve French 				     tcon->ses->server->vals->shared_lock_type,
427038c8a9a5SSteve French 				     0, NULL, CIFS_READ_OP))
427138c8a9a5SSteve French 		rc = generic_file_read_iter(iocb, to);
427238c8a9a5SSteve French 	up_read(&cinode->lock_sem);
427338c8a9a5SSteve French 	return rc;
427438c8a9a5SSteve French }
427538c8a9a5SSteve French 
427638c8a9a5SSteve French static ssize_t
427738c8a9a5SSteve French cifs_read(struct file *file, char *read_data, size_t read_size, loff_t *offset)
427838c8a9a5SSteve French {
427938c8a9a5SSteve French 	int rc = -EACCES;
428038c8a9a5SSteve French 	unsigned int bytes_read = 0;
428138c8a9a5SSteve French 	unsigned int total_read;
428238c8a9a5SSteve French 	unsigned int current_read_size;
428338c8a9a5SSteve French 	unsigned int rsize;
428438c8a9a5SSteve French 	struct cifs_sb_info *cifs_sb;
428538c8a9a5SSteve French 	struct cifs_tcon *tcon;
428638c8a9a5SSteve French 	struct TCP_Server_Info *server;
428738c8a9a5SSteve French 	unsigned int xid;
428838c8a9a5SSteve French 	char *cur_offset;
428938c8a9a5SSteve French 	struct cifsFileInfo *open_file;
429038c8a9a5SSteve French 	struct cifs_io_parms io_parms = {0};
429138c8a9a5SSteve French 	int buf_type = CIFS_NO_BUFFER;
429238c8a9a5SSteve French 	__u32 pid;
429338c8a9a5SSteve French 
429438c8a9a5SSteve French 	xid = get_xid();
429538c8a9a5SSteve French 	cifs_sb = CIFS_FILE_SB(file);
429638c8a9a5SSteve French 
429738c8a9a5SSteve French 	/* FIXME: set up handlers for larger reads and/or convert to async */
429838c8a9a5SSteve French 	rsize = min_t(unsigned int, cifs_sb->ctx->rsize, CIFSMaxBufSize);
429938c8a9a5SSteve French 
430038c8a9a5SSteve French 	if (file->private_data == NULL) {
430138c8a9a5SSteve French 		rc = -EBADF;
430238c8a9a5SSteve French 		free_xid(xid);
430338c8a9a5SSteve French 		return rc;
430438c8a9a5SSteve French 	}
430538c8a9a5SSteve French 	open_file = file->private_data;
430638c8a9a5SSteve French 	tcon = tlink_tcon(open_file->tlink);
430738c8a9a5SSteve French 	server = cifs_pick_channel(tcon->ses);
430838c8a9a5SSteve French 
430938c8a9a5SSteve French 	if (!server->ops->sync_read) {
431038c8a9a5SSteve French 		free_xid(xid);
431138c8a9a5SSteve French 		return -ENOSYS;
431238c8a9a5SSteve French 	}
431338c8a9a5SSteve French 
431438c8a9a5SSteve French 	if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_RWPIDFORWARD)
431538c8a9a5SSteve French 		pid = open_file->pid;
431638c8a9a5SSteve French 	else
431738c8a9a5SSteve French 		pid = current->tgid;
431838c8a9a5SSteve French 
431938c8a9a5SSteve French 	if ((file->f_flags & O_ACCMODE) == O_WRONLY)
432038c8a9a5SSteve French 		cifs_dbg(FYI, "attempting read on write only file instance\n");
432138c8a9a5SSteve French 
432238c8a9a5SSteve French 	for (total_read = 0, cur_offset = read_data; read_size > total_read;
432338c8a9a5SSteve French 	     total_read += bytes_read, cur_offset += bytes_read) {
432438c8a9a5SSteve French 		do {
432538c8a9a5SSteve French 			current_read_size = min_t(uint, read_size - total_read,
432638c8a9a5SSteve French 						  rsize);
432738c8a9a5SSteve French 			/*
432838c8a9a5SSteve French 			 * For windows me and 9x we do not want to request more
432938c8a9a5SSteve French 			 * than it negotiated since it will refuse the read
433038c8a9a5SSteve French 			 * then.
433138c8a9a5SSteve French 			 */
433238c8a9a5SSteve French 			if (!(tcon->ses->capabilities &
433338c8a9a5SSteve French 				tcon->ses->server->vals->cap_large_files)) {
433438c8a9a5SSteve French 				current_read_size = min_t(uint,
433538c8a9a5SSteve French 					current_read_size, CIFSMaxBufSize);
433638c8a9a5SSteve French 			}
433738c8a9a5SSteve French 			if (open_file->invalidHandle) {
433838c8a9a5SSteve French 				rc = cifs_reopen_file(open_file, true);
433938c8a9a5SSteve French 				if (rc != 0)
434038c8a9a5SSteve French 					break;
434138c8a9a5SSteve French 			}
434238c8a9a5SSteve French 			io_parms.pid = pid;
434338c8a9a5SSteve French 			io_parms.tcon = tcon;
434438c8a9a5SSteve French 			io_parms.offset = *offset;
434538c8a9a5SSteve French 			io_parms.length = current_read_size;
434638c8a9a5SSteve French 			io_parms.server = server;
434738c8a9a5SSteve French 			rc = server->ops->sync_read(xid, &open_file->fid, &io_parms,
434838c8a9a5SSteve French 						    &bytes_read, &cur_offset,
434938c8a9a5SSteve French 						    &buf_type);
435038c8a9a5SSteve French 		} while (rc == -EAGAIN);
435138c8a9a5SSteve French 
435238c8a9a5SSteve French 		if (rc || (bytes_read == 0)) {
435338c8a9a5SSteve French 			if (total_read) {
435438c8a9a5SSteve French 				break;
435538c8a9a5SSteve French 			} else {
435638c8a9a5SSteve French 				free_xid(xid);
435738c8a9a5SSteve French 				return rc;
435838c8a9a5SSteve French 			}
435938c8a9a5SSteve French 		} else {
436038c8a9a5SSteve French 			cifs_stats_bytes_read(tcon, total_read);
436138c8a9a5SSteve French 			*offset += bytes_read;
436238c8a9a5SSteve French 		}
436338c8a9a5SSteve French 	}
436438c8a9a5SSteve French 	free_xid(xid);
436538c8a9a5SSteve French 	return total_read;
436638c8a9a5SSteve French }
436738c8a9a5SSteve French 
436838c8a9a5SSteve French /*
436938c8a9a5SSteve French  * If the page is mmap'ed into a process' page tables, then we need to make
437038c8a9a5SSteve French  * sure that it doesn't change while being written back.
437138c8a9a5SSteve French  */
437238c8a9a5SSteve French static vm_fault_t cifs_page_mkwrite(struct vm_fault *vmf)
437338c8a9a5SSteve French {
437438c8a9a5SSteve French 	struct folio *folio = page_folio(vmf->page);
437538c8a9a5SSteve French 
437638c8a9a5SSteve French 	/* Wait for the folio to be written to the cache before we allow it to
437738c8a9a5SSteve French 	 * be modified.  We then assume the entire folio will need writing back.
437838c8a9a5SSteve French 	 */
437938c8a9a5SSteve French #ifdef CONFIG_CIFS_FSCACHE
438038c8a9a5SSteve French 	if (folio_test_fscache(folio) &&
438138c8a9a5SSteve French 	    folio_wait_fscache_killable(folio) < 0)
438238c8a9a5SSteve French 		return VM_FAULT_RETRY;
438338c8a9a5SSteve French #endif
438438c8a9a5SSteve French 
438538c8a9a5SSteve French 	folio_wait_writeback(folio);
438638c8a9a5SSteve French 
438738c8a9a5SSteve French 	if (folio_lock_killable(folio) < 0)
438838c8a9a5SSteve French 		return VM_FAULT_RETRY;
438938c8a9a5SSteve French 	return VM_FAULT_LOCKED;
439038c8a9a5SSteve French }
439138c8a9a5SSteve French 
439238c8a9a5SSteve French static const struct vm_operations_struct cifs_file_vm_ops = {
439338c8a9a5SSteve French 	.fault = filemap_fault,
439438c8a9a5SSteve French 	.map_pages = filemap_map_pages,
439538c8a9a5SSteve French 	.page_mkwrite = cifs_page_mkwrite,
439638c8a9a5SSteve French };
439738c8a9a5SSteve French 
439838c8a9a5SSteve French int cifs_file_strict_mmap(struct file *file, struct vm_area_struct *vma)
439938c8a9a5SSteve French {
440038c8a9a5SSteve French 	int xid, rc = 0;
440138c8a9a5SSteve French 	struct inode *inode = file_inode(file);
440238c8a9a5SSteve French 
440338c8a9a5SSteve French 	xid = get_xid();
440438c8a9a5SSteve French 
440538c8a9a5SSteve French 	if (!CIFS_CACHE_READ(CIFS_I(inode)))
440638c8a9a5SSteve French 		rc = cifs_zap_mapping(inode);
440738c8a9a5SSteve French 	if (!rc)
440838c8a9a5SSteve French 		rc = generic_file_mmap(file, vma);
440938c8a9a5SSteve French 	if (!rc)
441038c8a9a5SSteve French 		vma->vm_ops = &cifs_file_vm_ops;
441138c8a9a5SSteve French 
441238c8a9a5SSteve French 	free_xid(xid);
441338c8a9a5SSteve French 	return rc;
441438c8a9a5SSteve French }
441538c8a9a5SSteve French 
441638c8a9a5SSteve French int cifs_file_mmap(struct file *file, struct vm_area_struct *vma)
441738c8a9a5SSteve French {
441838c8a9a5SSteve French 	int rc, xid;
441938c8a9a5SSteve French 
442038c8a9a5SSteve French 	xid = get_xid();
442138c8a9a5SSteve French 
442238c8a9a5SSteve French 	rc = cifs_revalidate_file(file);
442338c8a9a5SSteve French 	if (rc)
442438c8a9a5SSteve French 		cifs_dbg(FYI, "Validation prior to mmap failed, error=%d\n",
442538c8a9a5SSteve French 			 rc);
442638c8a9a5SSteve French 	if (!rc)
442738c8a9a5SSteve French 		rc = generic_file_mmap(file, vma);
442838c8a9a5SSteve French 	if (!rc)
442938c8a9a5SSteve French 		vma->vm_ops = &cifs_file_vm_ops;
443038c8a9a5SSteve French 
443138c8a9a5SSteve French 	free_xid(xid);
443238c8a9a5SSteve French 	return rc;
443338c8a9a5SSteve French }
443438c8a9a5SSteve French 
443538c8a9a5SSteve French /*
443638c8a9a5SSteve French  * Unlock a bunch of folios in the pagecache.
443738c8a9a5SSteve French  */
443838c8a9a5SSteve French static void cifs_unlock_folios(struct address_space *mapping, pgoff_t first, pgoff_t last)
443938c8a9a5SSteve French {
444038c8a9a5SSteve French 	struct folio *folio;
444138c8a9a5SSteve French 	XA_STATE(xas, &mapping->i_pages, first);
444238c8a9a5SSteve French 
444338c8a9a5SSteve French 	rcu_read_lock();
444438c8a9a5SSteve French 	xas_for_each(&xas, folio, last) {
444538c8a9a5SSteve French 		folio_unlock(folio);
444638c8a9a5SSteve French 	}
444738c8a9a5SSteve French 	rcu_read_unlock();
444838c8a9a5SSteve French }
444938c8a9a5SSteve French 
445038c8a9a5SSteve French static void cifs_readahead_complete(struct work_struct *work)
445138c8a9a5SSteve French {
445238c8a9a5SSteve French 	struct cifs_readdata *rdata = container_of(work,
445338c8a9a5SSteve French 						   struct cifs_readdata, work);
445438c8a9a5SSteve French 	struct folio *folio;
445538c8a9a5SSteve French 	pgoff_t last;
445638c8a9a5SSteve French 	bool good = rdata->result == 0 || (rdata->result == -EAGAIN && rdata->got_bytes);
445738c8a9a5SSteve French 
445838c8a9a5SSteve French 	XA_STATE(xas, &rdata->mapping->i_pages, rdata->offset / PAGE_SIZE);
445938c8a9a5SSteve French 
446038c8a9a5SSteve French 	if (good)
446138c8a9a5SSteve French 		cifs_readahead_to_fscache(rdata->mapping->host,
446238c8a9a5SSteve French 					  rdata->offset, rdata->bytes);
446338c8a9a5SSteve French 
446438c8a9a5SSteve French 	if (iov_iter_count(&rdata->iter) > 0)
446538c8a9a5SSteve French 		iov_iter_zero(iov_iter_count(&rdata->iter), &rdata->iter);
446638c8a9a5SSteve French 
446738c8a9a5SSteve French 	last = (rdata->offset + rdata->bytes - 1) / PAGE_SIZE;
446838c8a9a5SSteve French 
446938c8a9a5SSteve French 	rcu_read_lock();
447038c8a9a5SSteve French 	xas_for_each(&xas, folio, last) {
447138c8a9a5SSteve French 		if (good) {
447238c8a9a5SSteve French 			flush_dcache_folio(folio);
447338c8a9a5SSteve French 			folio_mark_uptodate(folio);
447438c8a9a5SSteve French 		}
447538c8a9a5SSteve French 		folio_unlock(folio);
447638c8a9a5SSteve French 	}
447738c8a9a5SSteve French 	rcu_read_unlock();
447838c8a9a5SSteve French 
447938c8a9a5SSteve French 	kref_put(&rdata->refcount, cifs_readdata_release);
448038c8a9a5SSteve French }
448138c8a9a5SSteve French 
448238c8a9a5SSteve French static void cifs_readahead(struct readahead_control *ractl)
448338c8a9a5SSteve French {
448438c8a9a5SSteve French 	struct cifsFileInfo *open_file = ractl->file->private_data;
448538c8a9a5SSteve French 	struct cifs_sb_info *cifs_sb = CIFS_FILE_SB(ractl->file);
448638c8a9a5SSteve French 	struct TCP_Server_Info *server;
448738c8a9a5SSteve French 	unsigned int xid, nr_pages, cache_nr_pages = 0;
448838c8a9a5SSteve French 	unsigned int ra_pages;
448938c8a9a5SSteve French 	pgoff_t next_cached = ULONG_MAX, ra_index;
449038c8a9a5SSteve French 	bool caching = fscache_cookie_enabled(cifs_inode_cookie(ractl->mapping->host)) &&
449138c8a9a5SSteve French 		cifs_inode_cookie(ractl->mapping->host)->cache_priv;
449238c8a9a5SSteve French 	bool check_cache = caching;
449338c8a9a5SSteve French 	pid_t pid;
449438c8a9a5SSteve French 	int rc = 0;
449538c8a9a5SSteve French 
449638c8a9a5SSteve French 	/* Note that readahead_count() lags behind our dequeuing of pages from
449738c8a9a5SSteve French 	 * the ractl, wo we have to keep track for ourselves.
449838c8a9a5SSteve French 	 */
449938c8a9a5SSteve French 	ra_pages = readahead_count(ractl);
450038c8a9a5SSteve French 	ra_index = readahead_index(ractl);
450138c8a9a5SSteve French 
450238c8a9a5SSteve French 	xid = get_xid();
450338c8a9a5SSteve French 
450438c8a9a5SSteve French 	if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_RWPIDFORWARD)
450538c8a9a5SSteve French 		pid = open_file->pid;
450638c8a9a5SSteve French 	else
450738c8a9a5SSteve French 		pid = current->tgid;
450838c8a9a5SSteve French 
450938c8a9a5SSteve French 	server = cifs_pick_channel(tlink_tcon(open_file->tlink)->ses);
451038c8a9a5SSteve French 
451138c8a9a5SSteve French 	cifs_dbg(FYI, "%s: file=%p mapping=%p num_pages=%u\n",
451238c8a9a5SSteve French 		 __func__, ractl->file, ractl->mapping, ra_pages);
451338c8a9a5SSteve French 
451438c8a9a5SSteve French 	/*
451538c8a9a5SSteve French 	 * Chop the readahead request up into rsize-sized read requests.
451638c8a9a5SSteve French 	 */
451738c8a9a5SSteve French 	while ((nr_pages = ra_pages)) {
451838c8a9a5SSteve French 		unsigned int i, rsize;
451938c8a9a5SSteve French 		struct cifs_readdata *rdata;
452038c8a9a5SSteve French 		struct cifs_credits credits_on_stack;
452138c8a9a5SSteve French 		struct cifs_credits *credits = &credits_on_stack;
452238c8a9a5SSteve French 		struct folio *folio;
452338c8a9a5SSteve French 		pgoff_t fsize;
452438c8a9a5SSteve French 
452538c8a9a5SSteve French 		/*
452638c8a9a5SSteve French 		 * Find out if we have anything cached in the range of
452738c8a9a5SSteve French 		 * interest, and if so, where the next chunk of cached data is.
452838c8a9a5SSteve French 		 */
452938c8a9a5SSteve French 		if (caching) {
453038c8a9a5SSteve French 			if (check_cache) {
453138c8a9a5SSteve French 				rc = cifs_fscache_query_occupancy(
453238c8a9a5SSteve French 					ractl->mapping->host, ra_index, nr_pages,
453338c8a9a5SSteve French 					&next_cached, &cache_nr_pages);
453438c8a9a5SSteve French 				if (rc < 0)
453538c8a9a5SSteve French 					caching = false;
453638c8a9a5SSteve French 				check_cache = false;
453738c8a9a5SSteve French 			}
453838c8a9a5SSteve French 
453938c8a9a5SSteve French 			if (ra_index == next_cached) {
454038c8a9a5SSteve French 				/*
454138c8a9a5SSteve French 				 * TODO: Send a whole batch of pages to be read
454238c8a9a5SSteve French 				 * by the cache.
454338c8a9a5SSteve French 				 */
454438c8a9a5SSteve French 				folio = readahead_folio(ractl);
454538c8a9a5SSteve French 				fsize = folio_nr_pages(folio);
454638c8a9a5SSteve French 				ra_pages -= fsize;
454738c8a9a5SSteve French 				ra_index += fsize;
454838c8a9a5SSteve French 				if (cifs_readpage_from_fscache(ractl->mapping->host,
454938c8a9a5SSteve French 							       &folio->page) < 0) {
455038c8a9a5SSteve French 					/*
455138c8a9a5SSteve French 					 * TODO: Deal with cache read failure
455238c8a9a5SSteve French 					 * here, but for the moment, delegate
455338c8a9a5SSteve French 					 * that to readpage.
455438c8a9a5SSteve French 					 */
455538c8a9a5SSteve French 					caching = false;
455638c8a9a5SSteve French 				}
455738c8a9a5SSteve French 				folio_unlock(folio);
455838c8a9a5SSteve French 				next_cached += fsize;
455938c8a9a5SSteve French 				cache_nr_pages -= fsize;
456038c8a9a5SSteve French 				if (cache_nr_pages == 0)
456138c8a9a5SSteve French 					check_cache = true;
456238c8a9a5SSteve French 				continue;
456338c8a9a5SSteve French 			}
456438c8a9a5SSteve French 		}
456538c8a9a5SSteve French 
456638c8a9a5SSteve French 		if (open_file->invalidHandle) {
456738c8a9a5SSteve French 			rc = cifs_reopen_file(open_file, true);
456838c8a9a5SSteve French 			if (rc) {
456938c8a9a5SSteve French 				if (rc == -EAGAIN)
457038c8a9a5SSteve French 					continue;
457138c8a9a5SSteve French 				break;
457238c8a9a5SSteve French 			}
457338c8a9a5SSteve French 		}
457438c8a9a5SSteve French 
457538c8a9a5SSteve French 		if (cifs_sb->ctx->rsize == 0)
457638c8a9a5SSteve French 			cifs_sb->ctx->rsize =
457738c8a9a5SSteve French 				server->ops->negotiate_rsize(tlink_tcon(open_file->tlink),
457838c8a9a5SSteve French 							     cifs_sb->ctx);
457938c8a9a5SSteve French 
458038c8a9a5SSteve French 		rc = server->ops->wait_mtu_credits(server, cifs_sb->ctx->rsize,
458138c8a9a5SSteve French 						   &rsize, credits);
458238c8a9a5SSteve French 		if (rc)
458338c8a9a5SSteve French 			break;
458438c8a9a5SSteve French 		nr_pages = min_t(size_t, rsize / PAGE_SIZE, ra_pages);
458538c8a9a5SSteve French 		if (next_cached != ULONG_MAX)
458638c8a9a5SSteve French 			nr_pages = min_t(size_t, nr_pages, next_cached - ra_index);
458738c8a9a5SSteve French 
458838c8a9a5SSteve French 		/*
458938c8a9a5SSteve French 		 * Give up immediately if rsize is too small to read an entire
459038c8a9a5SSteve French 		 * page. The VFS will fall back to readpage. We should never
459138c8a9a5SSteve French 		 * reach this point however since we set ra_pages to 0 when the
459238c8a9a5SSteve French 		 * rsize is smaller than a cache page.
459338c8a9a5SSteve French 		 */
459438c8a9a5SSteve French 		if (unlikely(!nr_pages)) {
459538c8a9a5SSteve French 			add_credits_and_wake_if(server, credits, 0);
459638c8a9a5SSteve French 			break;
459738c8a9a5SSteve French 		}
459838c8a9a5SSteve French 
459938c8a9a5SSteve French 		rdata = cifs_readdata_alloc(cifs_readahead_complete);
460038c8a9a5SSteve French 		if (!rdata) {
460138c8a9a5SSteve French 			/* best to give up if we're out of mem */
460238c8a9a5SSteve French 			add_credits_and_wake_if(server, credits, 0);
460338c8a9a5SSteve French 			break;
460438c8a9a5SSteve French 		}
460538c8a9a5SSteve French 
460638c8a9a5SSteve French 		rdata->offset	= ra_index * PAGE_SIZE;
460738c8a9a5SSteve French 		rdata->bytes	= nr_pages * PAGE_SIZE;
460838c8a9a5SSteve French 		rdata->cfile	= cifsFileInfo_get(open_file);
460938c8a9a5SSteve French 		rdata->server	= server;
461038c8a9a5SSteve French 		rdata->mapping	= ractl->mapping;
461138c8a9a5SSteve French 		rdata->pid	= pid;
461238c8a9a5SSteve French 		rdata->credits	= credits_on_stack;
461338c8a9a5SSteve French 
461438c8a9a5SSteve French 		for (i = 0; i < nr_pages; i++) {
461538c8a9a5SSteve French 			if (!readahead_folio(ractl))
461638c8a9a5SSteve French 				WARN_ON(1);
461738c8a9a5SSteve French 		}
461838c8a9a5SSteve French 		ra_pages -= nr_pages;
461938c8a9a5SSteve French 		ra_index += nr_pages;
462038c8a9a5SSteve French 
462138c8a9a5SSteve French 		iov_iter_xarray(&rdata->iter, ITER_DEST, &rdata->mapping->i_pages,
462238c8a9a5SSteve French 				rdata->offset, rdata->bytes);
462338c8a9a5SSteve French 
462438c8a9a5SSteve French 		rc = adjust_credits(server, &rdata->credits, rdata->bytes);
462538c8a9a5SSteve French 		if (!rc) {
462638c8a9a5SSteve French 			if (rdata->cfile->invalidHandle)
462738c8a9a5SSteve French 				rc = -EAGAIN;
462838c8a9a5SSteve French 			else
462938c8a9a5SSteve French 				rc = server->ops->async_readv(rdata);
463038c8a9a5SSteve French 		}
463138c8a9a5SSteve French 
463238c8a9a5SSteve French 		if (rc) {
463338c8a9a5SSteve French 			add_credits_and_wake_if(server, &rdata->credits, 0);
463438c8a9a5SSteve French 			cifs_unlock_folios(rdata->mapping,
463538c8a9a5SSteve French 					   rdata->offset / PAGE_SIZE,
463638c8a9a5SSteve French 					   (rdata->offset + rdata->bytes - 1) / PAGE_SIZE);
463738c8a9a5SSteve French 			/* Fallback to the readpage in error/reconnect cases */
463838c8a9a5SSteve French 			kref_put(&rdata->refcount, cifs_readdata_release);
463938c8a9a5SSteve French 			break;
464038c8a9a5SSteve French 		}
464138c8a9a5SSteve French 
464238c8a9a5SSteve French 		kref_put(&rdata->refcount, cifs_readdata_release);
464338c8a9a5SSteve French 	}
464438c8a9a5SSteve French 
464538c8a9a5SSteve French 	free_xid(xid);
464638c8a9a5SSteve French }
464738c8a9a5SSteve French 
464838c8a9a5SSteve French /*
464938c8a9a5SSteve French  * cifs_readpage_worker must be called with the page pinned
465038c8a9a5SSteve French  */
465138c8a9a5SSteve French static int cifs_readpage_worker(struct file *file, struct page *page,
465238c8a9a5SSteve French 	loff_t *poffset)
465338c8a9a5SSteve French {
465423171df5SJeff Layton 	struct inode *inode = file_inode(file);
465523171df5SJeff Layton 	struct timespec64 atime, mtime;
465638c8a9a5SSteve French 	char *read_data;
465738c8a9a5SSteve French 	int rc;
465838c8a9a5SSteve French 
465938c8a9a5SSteve French 	/* Is the page cached? */
466023171df5SJeff Layton 	rc = cifs_readpage_from_fscache(inode, page);
466138c8a9a5SSteve French 	if (rc == 0)
466238c8a9a5SSteve French 		goto read_complete;
466338c8a9a5SSteve French 
466438c8a9a5SSteve French 	read_data = kmap(page);
466538c8a9a5SSteve French 	/* for reads over a certain size could initiate async read ahead */
466638c8a9a5SSteve French 
466738c8a9a5SSteve French 	rc = cifs_read(file, read_data, PAGE_SIZE, poffset);
466838c8a9a5SSteve French 
466938c8a9a5SSteve French 	if (rc < 0)
467038c8a9a5SSteve French 		goto io_error;
467138c8a9a5SSteve French 	else
467238c8a9a5SSteve French 		cifs_dbg(FYI, "Bytes read %d\n", rc);
467338c8a9a5SSteve French 
467438c8a9a5SSteve French 	/* we do not want atime to be less than mtime, it broke some apps */
467523171df5SJeff Layton 	atime = inode_set_atime_to_ts(inode, current_time(inode));
467623171df5SJeff Layton 	mtime = inode_get_mtime(inode);
46779a498744SZizhi Wo 	if (timespec64_compare(&atime, &mtime) < 0)
467823171df5SJeff Layton 		inode_set_atime_to_ts(inode, inode_get_mtime(inode));
467938c8a9a5SSteve French 
468038c8a9a5SSteve French 	if (PAGE_SIZE > rc)
468138c8a9a5SSteve French 		memset(read_data + rc, 0, PAGE_SIZE - rc);
468238c8a9a5SSteve French 
468338c8a9a5SSteve French 	flush_dcache_page(page);
468438c8a9a5SSteve French 	SetPageUptodate(page);
468538c8a9a5SSteve French 	rc = 0;
468638c8a9a5SSteve French 
468738c8a9a5SSteve French io_error:
468838c8a9a5SSteve French 	kunmap(page);
468938c8a9a5SSteve French 
469038c8a9a5SSteve French read_complete:
469169513dd6SRussell Harmon via samba-technical 	unlock_page(page);
469238c8a9a5SSteve French 	return rc;
469338c8a9a5SSteve French }
469438c8a9a5SSteve French 
469538c8a9a5SSteve French static int cifs_read_folio(struct file *file, struct folio *folio)
469638c8a9a5SSteve French {
469738c8a9a5SSteve French 	struct page *page = &folio->page;
469838c8a9a5SSteve French 	loff_t offset = page_file_offset(page);
469938c8a9a5SSteve French 	int rc = -EACCES;
470038c8a9a5SSteve French 	unsigned int xid;
470138c8a9a5SSteve French 
470238c8a9a5SSteve French 	xid = get_xid();
470338c8a9a5SSteve French 
470438c8a9a5SSteve French 	if (file->private_data == NULL) {
470538c8a9a5SSteve French 		rc = -EBADF;
470638c8a9a5SSteve French 		free_xid(xid);
470738c8a9a5SSteve French 		return rc;
470838c8a9a5SSteve French 	}
470938c8a9a5SSteve French 
471038c8a9a5SSteve French 	cifs_dbg(FYI, "read_folio %p at offset %d 0x%x\n",
471138c8a9a5SSteve French 		 page, (int)offset, (int)offset);
471238c8a9a5SSteve French 
471338c8a9a5SSteve French 	rc = cifs_readpage_worker(file, page, &offset);
471438c8a9a5SSteve French 
471538c8a9a5SSteve French 	free_xid(xid);
471638c8a9a5SSteve French 	return rc;
471738c8a9a5SSteve French }
471838c8a9a5SSteve French 
471938c8a9a5SSteve French static int is_inode_writable(struct cifsInodeInfo *cifs_inode)
472038c8a9a5SSteve French {
472138c8a9a5SSteve French 	struct cifsFileInfo *open_file;
472238c8a9a5SSteve French 
472338c8a9a5SSteve French 	spin_lock(&cifs_inode->open_file_lock);
472438c8a9a5SSteve French 	list_for_each_entry(open_file, &cifs_inode->openFileList, flist) {
472538c8a9a5SSteve French 		if (OPEN_FMODE(open_file->f_flags) & FMODE_WRITE) {
472638c8a9a5SSteve French 			spin_unlock(&cifs_inode->open_file_lock);
472738c8a9a5SSteve French 			return 1;
472838c8a9a5SSteve French 		}
472938c8a9a5SSteve French 	}
473038c8a9a5SSteve French 	spin_unlock(&cifs_inode->open_file_lock);
473138c8a9a5SSteve French 	return 0;
473238c8a9a5SSteve French }
473338c8a9a5SSteve French 
473438c8a9a5SSteve French /* We do not want to update the file size from server for inodes
473538c8a9a5SSteve French    open for write - to avoid races with writepage extending
473638c8a9a5SSteve French    the file - in the future we could consider allowing
473738c8a9a5SSteve French    refreshing the inode only on increases in the file size
473838c8a9a5SSteve French    but this is tricky to do without racing with writebehind
473938c8a9a5SSteve French    page caching in the current Linux kernel design */
474038c8a9a5SSteve French bool is_size_safe_to_change(struct cifsInodeInfo *cifsInode, __u64 end_of_file)
474138c8a9a5SSteve French {
474238c8a9a5SSteve French 	if (!cifsInode)
474338c8a9a5SSteve French 		return true;
474438c8a9a5SSteve French 
474538c8a9a5SSteve French 	if (is_inode_writable(cifsInode)) {
474638c8a9a5SSteve French 		/* This inode is open for write at least once */
474738c8a9a5SSteve French 		struct cifs_sb_info *cifs_sb;
474838c8a9a5SSteve French 
474938c8a9a5SSteve French 		cifs_sb = CIFS_SB(cifsInode->netfs.inode.i_sb);
475038c8a9a5SSteve French 		if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_DIRECT_IO) {
475138c8a9a5SSteve French 			/* since no page cache to corrupt on directio
475238c8a9a5SSteve French 			we can change size safely */
475338c8a9a5SSteve French 			return true;
475438c8a9a5SSteve French 		}
475538c8a9a5SSteve French 
475638c8a9a5SSteve French 		if (i_size_read(&cifsInode->netfs.inode) < end_of_file)
475738c8a9a5SSteve French 			return true;
475838c8a9a5SSteve French 
475938c8a9a5SSteve French 		return false;
476038c8a9a5SSteve French 	} else
476138c8a9a5SSteve French 		return true;
476238c8a9a5SSteve French }
476338c8a9a5SSteve French 
476438c8a9a5SSteve French static int cifs_write_begin(struct file *file, struct address_space *mapping,
476538c8a9a5SSteve French 			loff_t pos, unsigned len,
476638c8a9a5SSteve French 			struct page **pagep, void **fsdata)
476738c8a9a5SSteve French {
476838c8a9a5SSteve French 	int oncethru = 0;
476938c8a9a5SSteve French 	pgoff_t index = pos >> PAGE_SHIFT;
477038c8a9a5SSteve French 	loff_t offset = pos & (PAGE_SIZE - 1);
477138c8a9a5SSteve French 	loff_t page_start = pos & PAGE_MASK;
477238c8a9a5SSteve French 	loff_t i_size;
477338c8a9a5SSteve French 	struct page *page;
477438c8a9a5SSteve French 	int rc = 0;
477538c8a9a5SSteve French 
477638c8a9a5SSteve French 	cifs_dbg(FYI, "write_begin from %lld len %d\n", (long long)pos, len);
477738c8a9a5SSteve French 
477838c8a9a5SSteve French start:
477938c8a9a5SSteve French 	page = grab_cache_page_write_begin(mapping, index);
478038c8a9a5SSteve French 	if (!page) {
478138c8a9a5SSteve French 		rc = -ENOMEM;
478238c8a9a5SSteve French 		goto out;
478338c8a9a5SSteve French 	}
478438c8a9a5SSteve French 
478538c8a9a5SSteve French 	if (PageUptodate(page))
478638c8a9a5SSteve French 		goto out;
478738c8a9a5SSteve French 
478838c8a9a5SSteve French 	/*
478938c8a9a5SSteve French 	 * If we write a full page it will be up to date, no need to read from
479038c8a9a5SSteve French 	 * the server. If the write is short, we'll end up doing a sync write
479138c8a9a5SSteve French 	 * instead.
479238c8a9a5SSteve French 	 */
479338c8a9a5SSteve French 	if (len == PAGE_SIZE)
479438c8a9a5SSteve French 		goto out;
479538c8a9a5SSteve French 
479638c8a9a5SSteve French 	/*
479738c8a9a5SSteve French 	 * optimize away the read when we have an oplock, and we're not
479838c8a9a5SSteve French 	 * expecting to use any of the data we'd be reading in. That
479938c8a9a5SSteve French 	 * is, when the page lies beyond the EOF, or straddles the EOF
480038c8a9a5SSteve French 	 * and the write will cover all of the existing data.
480138c8a9a5SSteve French 	 */
480238c8a9a5SSteve French 	if (CIFS_CACHE_READ(CIFS_I(mapping->host))) {
480338c8a9a5SSteve French 		i_size = i_size_read(mapping->host);
480438c8a9a5SSteve French 		if (page_start >= i_size ||
480538c8a9a5SSteve French 		    (offset == 0 && (pos + len) >= i_size)) {
480638c8a9a5SSteve French 			zero_user_segments(page, 0, offset,
480738c8a9a5SSteve French 					   offset + len,
480838c8a9a5SSteve French 					   PAGE_SIZE);
480938c8a9a5SSteve French 			/*
481038c8a9a5SSteve French 			 * PageChecked means that the parts of the page
481138c8a9a5SSteve French 			 * to which we're not writing are considered up
481238c8a9a5SSteve French 			 * to date. Once the data is copied to the
481338c8a9a5SSteve French 			 * page, it can be set uptodate.
481438c8a9a5SSteve French 			 */
481538c8a9a5SSteve French 			SetPageChecked(page);
481638c8a9a5SSteve French 			goto out;
481738c8a9a5SSteve French 		}
481838c8a9a5SSteve French 	}
481938c8a9a5SSteve French 
482038c8a9a5SSteve French 	if ((file->f_flags & O_ACCMODE) != O_WRONLY && !oncethru) {
482138c8a9a5SSteve French 		/*
482238c8a9a5SSteve French 		 * might as well read a page, it is fast enough. If we get
482338c8a9a5SSteve French 		 * an error, we don't need to return it. cifs_write_end will
482438c8a9a5SSteve French 		 * do a sync write instead since PG_uptodate isn't set.
482538c8a9a5SSteve French 		 */
482638c8a9a5SSteve French 		cifs_readpage_worker(file, page, &page_start);
482738c8a9a5SSteve French 		put_page(page);
482838c8a9a5SSteve French 		oncethru = 1;
482938c8a9a5SSteve French 		goto start;
483038c8a9a5SSteve French 	} else {
483138c8a9a5SSteve French 		/* we could try using another file handle if there is one -
483238c8a9a5SSteve French 		   but how would we lock it to prevent close of that handle
483338c8a9a5SSteve French 		   racing with this read? In any case
483438c8a9a5SSteve French 		   this will be written out by write_end so is fine */
483538c8a9a5SSteve French 	}
483638c8a9a5SSteve French out:
483738c8a9a5SSteve French 	*pagep = page;
483838c8a9a5SSteve French 	return rc;
483938c8a9a5SSteve French }
484038c8a9a5SSteve French 
484138c8a9a5SSteve French static bool cifs_release_folio(struct folio *folio, gfp_t gfp)
484238c8a9a5SSteve French {
484338c8a9a5SSteve French 	if (folio_test_private(folio))
484438c8a9a5SSteve French 		return 0;
484538c8a9a5SSteve French 	if (folio_test_fscache(folio)) {
484638c8a9a5SSteve French 		if (current_is_kswapd() || !(gfp & __GFP_FS))
484738c8a9a5SSteve French 			return false;
484838c8a9a5SSteve French 		folio_wait_fscache(folio);
484938c8a9a5SSteve French 	}
485038c8a9a5SSteve French 	fscache_note_page_release(cifs_inode_cookie(folio->mapping->host));
485138c8a9a5SSteve French 	return true;
485238c8a9a5SSteve French }
485338c8a9a5SSteve French 
485438c8a9a5SSteve French static void cifs_invalidate_folio(struct folio *folio, size_t offset,
485538c8a9a5SSteve French 				 size_t length)
485638c8a9a5SSteve French {
485738c8a9a5SSteve French 	folio_wait_fscache(folio);
485838c8a9a5SSteve French }
485938c8a9a5SSteve French 
486038c8a9a5SSteve French static int cifs_launder_folio(struct folio *folio)
486138c8a9a5SSteve French {
486238c8a9a5SSteve French 	int rc = 0;
486338c8a9a5SSteve French 	loff_t range_start = folio_pos(folio);
486438c8a9a5SSteve French 	loff_t range_end = range_start + folio_size(folio);
486538c8a9a5SSteve French 	struct writeback_control wbc = {
486638c8a9a5SSteve French 		.sync_mode = WB_SYNC_ALL,
486738c8a9a5SSteve French 		.nr_to_write = 0,
486838c8a9a5SSteve French 		.range_start = range_start,
486938c8a9a5SSteve French 		.range_end = range_end,
487038c8a9a5SSteve French 	};
487138c8a9a5SSteve French 
487238c8a9a5SSteve French 	cifs_dbg(FYI, "Launder page: %lu\n", folio->index);
487338c8a9a5SSteve French 
487438c8a9a5SSteve French 	if (folio_clear_dirty_for_io(folio))
487538c8a9a5SSteve French 		rc = cifs_writepage_locked(&folio->page, &wbc);
487638c8a9a5SSteve French 
487738c8a9a5SSteve French 	folio_wait_fscache(folio);
487838c8a9a5SSteve French 	return rc;
487938c8a9a5SSteve French }
488038c8a9a5SSteve French 
488138c8a9a5SSteve French void cifs_oplock_break(struct work_struct *work)
488238c8a9a5SSteve French {
488338c8a9a5SSteve French 	struct cifsFileInfo *cfile = container_of(work, struct cifsFileInfo,
488438c8a9a5SSteve French 						  oplock_break);
488538c8a9a5SSteve French 	struct inode *inode = d_inode(cfile->dentry);
4886e8f5f849SSteve French 	struct cifs_sb_info *cifs_sb = CIFS_SB(inode->i_sb);
488738c8a9a5SSteve French 	struct cifsInodeInfo *cinode = CIFS_I(inode);
4888e8f5f849SSteve French 	struct cifs_tcon *tcon;
4889e8f5f849SSteve French 	struct TCP_Server_Info *server;
4890e8f5f849SSteve French 	struct tcon_link *tlink;
489138c8a9a5SSteve French 	int rc = 0;
489238c8a9a5SSteve French 	bool purge_cache = false, oplock_break_cancelled;
489338c8a9a5SSteve French 	__u64 persistent_fid, volatile_fid;
489438c8a9a5SSteve French 	__u16 net_fid;
489538c8a9a5SSteve French 
489638c8a9a5SSteve French 	wait_on_bit(&cinode->flags, CIFS_INODE_PENDING_WRITERS,
489738c8a9a5SSteve French 			TASK_UNINTERRUPTIBLE);
489838c8a9a5SSteve French 
4899e8f5f849SSteve French 	tlink = cifs_sb_tlink(cifs_sb);
4900e8f5f849SSteve French 	if (IS_ERR(tlink))
4901e8f5f849SSteve French 		goto out;
4902e8f5f849SSteve French 	tcon = tlink_tcon(tlink);
4903e8f5f849SSteve French 	server = tcon->ses->server;
4904e8f5f849SSteve French 
490538c8a9a5SSteve French 	server->ops->downgrade_oplock(server, cinode, cfile->oplock_level,
490638c8a9a5SSteve French 				      cfile->oplock_epoch, &purge_cache);
490738c8a9a5SSteve French 
490838c8a9a5SSteve French 	if (!CIFS_CACHE_WRITE(cinode) && CIFS_CACHE_READ(cinode) &&
490938c8a9a5SSteve French 						cifs_has_mand_locks(cinode)) {
491038c8a9a5SSteve French 		cifs_dbg(FYI, "Reset oplock to None for inode=%p due to mand locks\n",
491138c8a9a5SSteve French 			 inode);
491238c8a9a5SSteve French 		cinode->oplock = 0;
491338c8a9a5SSteve French 	}
491438c8a9a5SSteve French 
491538c8a9a5SSteve French 	if (inode && S_ISREG(inode->i_mode)) {
491638c8a9a5SSteve French 		if (CIFS_CACHE_READ(cinode))
491738c8a9a5SSteve French 			break_lease(inode, O_RDONLY);
491838c8a9a5SSteve French 		else
491938c8a9a5SSteve French 			break_lease(inode, O_WRONLY);
492038c8a9a5SSteve French 		rc = filemap_fdatawrite(inode->i_mapping);
492138c8a9a5SSteve French 		if (!CIFS_CACHE_READ(cinode) || purge_cache) {
492238c8a9a5SSteve French 			rc = filemap_fdatawait(inode->i_mapping);
492338c8a9a5SSteve French 			mapping_set_error(inode->i_mapping, rc);
492438c8a9a5SSteve French 			cifs_zap_mapping(inode);
492538c8a9a5SSteve French 		}
492638c8a9a5SSteve French 		cifs_dbg(FYI, "Oplock flush inode %p rc %d\n", inode, rc);
492738c8a9a5SSteve French 		if (CIFS_CACHE_WRITE(cinode))
492838c8a9a5SSteve French 			goto oplock_break_ack;
492938c8a9a5SSteve French 	}
493038c8a9a5SSteve French 
493138c8a9a5SSteve French 	rc = cifs_push_locks(cfile);
493238c8a9a5SSteve French 	if (rc)
493338c8a9a5SSteve French 		cifs_dbg(VFS, "Push locks rc = %d\n", rc);
493438c8a9a5SSteve French 
493538c8a9a5SSteve French oplock_break_ack:
493638c8a9a5SSteve French 	/*
493738c8a9a5SSteve French 	 * When oplock break is received and there are no active
493838c8a9a5SSteve French 	 * file handles but cached, then schedule deferred close immediately.
493938c8a9a5SSteve French 	 * So, new open will not use cached handle.
494038c8a9a5SSteve French 	 */
494138c8a9a5SSteve French 
494238c8a9a5SSteve French 	if (!CIFS_CACHE_HANDLE(cinode) && !list_empty(&cinode->deferred_closes))
494338c8a9a5SSteve French 		cifs_close_deferred_file(cinode);
494438c8a9a5SSteve French 
494538c8a9a5SSteve French 	persistent_fid = cfile->fid.persistent_fid;
494638c8a9a5SSteve French 	volatile_fid = cfile->fid.volatile_fid;
494738c8a9a5SSteve French 	net_fid = cfile->fid.netfid;
494838c8a9a5SSteve French 	oplock_break_cancelled = cfile->oplock_break_cancelled;
494938c8a9a5SSteve French 
495038c8a9a5SSteve French 	_cifsFileInfo_put(cfile, false /* do not wait for ourself */, false);
495138c8a9a5SSteve French 	/*
4952da787d5bSBharath SM 	 * MS-SMB2 3.2.5.19.1 and 3.2.5.19.2 (and MS-CIFS 3.2.5.42) do not require
4953da787d5bSBharath SM 	 * an acknowledgment to be sent when the file has already been closed.
495438c8a9a5SSteve French 	 */
4955da787d5bSBharath SM 	spin_lock(&cinode->open_file_lock);
4956e8f5f849SSteve French 	/* check list empty since can race with kill_sb calling tree disconnect */
4957e8f5f849SSteve French 	if (!oplock_break_cancelled && !list_empty(&cinode->openFileList)) {
4958da787d5bSBharath SM 		spin_unlock(&cinode->open_file_lock);
4959e8f5f849SSteve French 		rc = server->ops->oplock_response(tcon, persistent_fid,
496038c8a9a5SSteve French 						  volatile_fid, net_fid, cinode);
496138c8a9a5SSteve French 		cifs_dbg(FYI, "Oplock release rc = %d\n", rc);
4962c774e677SSteve French 	} else
4963da787d5bSBharath SM 		spin_unlock(&cinode->open_file_lock);
496438c8a9a5SSteve French 
4965e8f5f849SSteve French 	cifs_put_tlink(tlink);
4966e8f5f849SSteve French out:
496738c8a9a5SSteve French 	cifs_done_oplock_break(cinode);
496838c8a9a5SSteve French }
496938c8a9a5SSteve French 
/*
 * Stub ->direct_IO handler.
 *
 * Having cifs_direct_io() present in the address space ops vector is what
 * allows open() with the O_DIRECT flag to succeed; without it such opens
 * would have failed.
 *
 * In the non-cached mode (mount with cache=none) direct read and write
 * requests are shunted off elsewhere, so this method should never be
 * called.  Direct IO is not yet supported in the cached mode, so every
 * call is rejected.
 *
 * Always returns -EINVAL; neither @iocb nor @iter is examined.
 */
static ssize_t
cifs_direct_io(struct kiocb *iocb, struct iov_iter *iter)
{
	/*
	 * FIXME
	 * Eventually need to support direct IO for non forcedirectio mounts
	 */
	const ssize_t unsupported = -EINVAL;

	return unsupported;
}
498838c8a9a5SSteve French 
498938c8a9a5SSteve French static int cifs_swap_activate(struct swap_info_struct *sis,
499038c8a9a5SSteve French 			      struct file *swap_file, sector_t *span)
499138c8a9a5SSteve French {
499238c8a9a5SSteve French 	struct cifsFileInfo *cfile = swap_file->private_data;
499338c8a9a5SSteve French 	struct inode *inode = swap_file->f_mapping->host;
499438c8a9a5SSteve French 	unsigned long blocks;
499538c8a9a5SSteve French 	long long isize;
499638c8a9a5SSteve French 
499738c8a9a5SSteve French 	cifs_dbg(FYI, "swap activate\n");
499838c8a9a5SSteve French 
499938c8a9a5SSteve French 	if (!swap_file->f_mapping->a_ops->swap_rw)
500038c8a9a5SSteve French 		/* Cannot support swap */
500138c8a9a5SSteve French 		return -EINVAL;
500238c8a9a5SSteve French 
500338c8a9a5SSteve French 	spin_lock(&inode->i_lock);
500438c8a9a5SSteve French 	blocks = inode->i_blocks;
500538c8a9a5SSteve French 	isize = inode->i_size;
500638c8a9a5SSteve French 	spin_unlock(&inode->i_lock);
500738c8a9a5SSteve French 	if (blocks*512 < isize) {
500838c8a9a5SSteve French 		pr_warn("swap activate: swapfile has holes\n");
500938c8a9a5SSteve French 		return -EINVAL;
501038c8a9a5SSteve French 	}
501138c8a9a5SSteve French 	*span = sis->pages;
501238c8a9a5SSteve French 
501338c8a9a5SSteve French 	pr_warn_once("Swap support over SMB3 is experimental\n");
501438c8a9a5SSteve French 
501538c8a9a5SSteve French 	/*
501638c8a9a5SSteve French 	 * TODO: consider adding ACL (or documenting how) to prevent other
501738c8a9a5SSteve French 	 * users (on this or other systems) from reading it
501838c8a9a5SSteve French 	 */
501938c8a9a5SSteve French 
502038c8a9a5SSteve French 
502138c8a9a5SSteve French 	/* TODO: add sk_set_memalloc(inet) or similar */
502238c8a9a5SSteve French 
502338c8a9a5SSteve French 	if (cfile)
502438c8a9a5SSteve French 		cfile->swapfile = true;
502538c8a9a5SSteve French 	/*
502638c8a9a5SSteve French 	 * TODO: Since file already open, we can't open with DENY_ALL here
502738c8a9a5SSteve French 	 * but we could add call to grab a byte range lock to prevent others
502838c8a9a5SSteve French 	 * from reading or writing the file
502938c8a9a5SSteve French 	 */
503038c8a9a5SSteve French 
503138c8a9a5SSteve French 	sis->flags |= SWP_FS_OPS;
503238c8a9a5SSteve French 	return add_swap_extent(sis, 0, sis->max, 0);
503338c8a9a5SSteve French }
503438c8a9a5SSteve French 
503538c8a9a5SSteve French static void cifs_swap_deactivate(struct file *file)
503638c8a9a5SSteve French {
503738c8a9a5SSteve French 	struct cifsFileInfo *cfile = file->private_data;
503838c8a9a5SSteve French 
503938c8a9a5SSteve French 	cifs_dbg(FYI, "swap deactivate\n");
504038c8a9a5SSteve French 
504138c8a9a5SSteve French 	/* TODO: undo sk_set_memalloc(inet) will eventually be needed */
504238c8a9a5SSteve French 
504338c8a9a5SSteve French 	if (cfile)
504438c8a9a5SSteve French 		cfile->swapfile = false;
504538c8a9a5SSteve French 
504638c8a9a5SSteve French 	/* do we need to unpin (or unlock) the file */
504738c8a9a5SSteve French }
504838c8a9a5SSteve French 
/*
 * ->dirty_folio handler: record that a folio has been dirtied and so needs
 * writeback.
 *
 * When fscache support is built in, the cache object that will be written
 * back to must be pinned as well, so the call goes through
 * fscache_dirty_folio() with the cookie of the inode owning the mapping.
 * Without fscache the name is simply an alias for filemap_dirty_folio.
 */
#ifdef CONFIG_CIFS_FSCACHE
static bool cifs_dirty_folio(struct address_space *mapping, struct folio *folio)
{
	struct inode *host = mapping->host;

	return fscache_dirty_folio(mapping, folio, cifs_inode_cookie(host));
}
#else
#define cifs_dirty_folio filemap_dirty_folio
#endif
506238c8a9a5SSteve French 
506338c8a9a5SSteve French const struct address_space_operations cifs_addr_ops = {
506438c8a9a5SSteve French 	.read_folio = cifs_read_folio,
506538c8a9a5SSteve French 	.readahead = cifs_readahead,
506638c8a9a5SSteve French 	.writepages = cifs_writepages,
506738c8a9a5SSteve French 	.write_begin = cifs_write_begin,
506838c8a9a5SSteve French 	.write_end = cifs_write_end,
506938c8a9a5SSteve French 	.dirty_folio = cifs_dirty_folio,
507038c8a9a5SSteve French 	.release_folio = cifs_release_folio,
507138c8a9a5SSteve French 	.direct_IO = cifs_direct_io,
507238c8a9a5SSteve French 	.invalidate_folio = cifs_invalidate_folio,
507338c8a9a5SSteve French 	.launder_folio = cifs_launder_folio,
507438c8a9a5SSteve French 	.migrate_folio = filemap_migrate_folio,
507538c8a9a5SSteve French 	/*
507638c8a9a5SSteve French 	 * TODO: investigate and if useful we could add an is_dirty_writeback
507738c8a9a5SSteve French 	 * helper if needed
507838c8a9a5SSteve French 	 */
507938c8a9a5SSteve French 	.swap_activate = cifs_swap_activate,
508038c8a9a5SSteve French 	.swap_deactivate = cifs_swap_deactivate,
508138c8a9a5SSteve French };
508238c8a9a5SSteve French 
508338c8a9a5SSteve French /*
508438c8a9a5SSteve French  * cifs_readahead requires the server to support a buffer large enough to
508538c8a9a5SSteve French  * contain the header plus one complete page of data.  Otherwise, we need
508638c8a9a5SSteve French  * to leave cifs_readahead out of the address space operations.
508738c8a9a5SSteve French  */
508838c8a9a5SSteve French const struct address_space_operations cifs_addr_ops_smallbuf = {
508938c8a9a5SSteve French 	.read_folio = cifs_read_folio,
509038c8a9a5SSteve French 	.writepages = cifs_writepages,
509138c8a9a5SSteve French 	.write_begin = cifs_write_begin,
509238c8a9a5SSteve French 	.write_end = cifs_write_end,
509338c8a9a5SSteve French 	.dirty_folio = cifs_dirty_folio,
509438c8a9a5SSteve French 	.release_folio = cifs_release_folio,
509538c8a9a5SSteve French 	.invalidate_folio = cifs_invalidate_folio,
509638c8a9a5SSteve French 	.launder_folio = cifs_launder_folio,
509738c8a9a5SSteve French 	.migrate_folio = filemap_migrate_folio,
509838c8a9a5SSteve French };
5099