xref: /openbmc/linux/lib/iov_iter.c (revision 8780356e)
1d879cb83SAl Viro #include <linux/export.h>
22f8b5444SChristoph Hellwig #include <linux/bvec.h>
3d879cb83SAl Viro #include <linux/uio.h>
4d879cb83SAl Viro #include <linux/pagemap.h>
5d879cb83SAl Viro #include <linux/slab.h>
6d879cb83SAl Viro #include <linux/vmalloc.h>
7241699cdSAl Viro #include <linux/splice.h>
8d879cb83SAl Viro #include <net/checksum.h>
9d879cb83SAl Viro 
/*
 * When defined, sanity() is compiled as a real consistency checker for
 * pipe-backed iterators; when undefined, sanity(i) is a macro that simply
 * evaluates to true.
 */
10241699cdSAl Viro #define PIPE_PARANOIA /* for now */
11241699cdSAl Viro 
/*
 * iterate_iovec - evaluate STEP over successive chunks of a user iovec array.
 *
 * Walks the array at i->iov, starting @skip bytes into its first segment and
 * covering at most @n bytes.  For every non-empty chunk, __v is filled in
 * (iov_base/iov_len) and STEP is evaluated; the value of STEP is taken as the
 * number of bytes of that chunk that were NOT processed.  The walk ends when
 * @n bytes have been covered or as soon as STEP yields a non-zero remainder.
 *
 * On exit @n holds the number of bytes actually processed, __p points at the
 * last segment visited and @skip is the offset reached inside that segment.
 * @n, @skip, __v and __p are all assigned to, so they must be lvalues.
 *
 * The macro declares its own locals named "left" and "wanted"; STEP must not
 * rely on outer variables with those names.  No check against the number of
 * segments is made here.
 */
12d879cb83SAl Viro #define iterate_iovec(i, n, __v, __p, skip, STEP) {	\
13d879cb83SAl Viro 	size_t left;					\
14d879cb83SAl Viro 	size_t wanted = n;				\
15d879cb83SAl Viro 	__p = i->iov;					\
16d879cb83SAl Viro 	__v.iov_len = min(n, __p->iov_len - skip);	\
17d879cb83SAl Viro 	if (likely(__v.iov_len)) {			\
18d879cb83SAl Viro 		__v.iov_base = __p->iov_base + skip;	\
19d879cb83SAl Viro 		left = (STEP);				\
20d879cb83SAl Viro 		__v.iov_len -= left;			\
21d879cb83SAl Viro 		skip += __v.iov_len;			\
22d879cb83SAl Viro 		n -= __v.iov_len;			\
23d879cb83SAl Viro 	} else {					\
24d879cb83SAl Viro 		left = 0;				\
25d879cb83SAl Viro 	}						\
26d879cb83SAl Viro 	while (unlikely(!left && n)) {			\
27d879cb83SAl Viro 		__p++;					\
28d879cb83SAl Viro 		__v.iov_len = min(n, __p->iov_len);	\
29d879cb83SAl Viro 		if (unlikely(!__v.iov_len))		\
30d879cb83SAl Viro 			continue;			\
31d879cb83SAl Viro 		__v.iov_base = __p->iov_base;		\
32d879cb83SAl Viro 		left = (STEP);				\
33d879cb83SAl Viro 		__v.iov_len -= left;			\
34d879cb83SAl Viro 		skip = __v.iov_len;			\
35d879cb83SAl Viro 		n -= __v.iov_len;			\
36d879cb83SAl Viro 	}						\
37d879cb83SAl Viro 	n = wanted - n;					\
38d879cb83SAl Viro }
39d879cb83SAl Viro 
/*
 * iterate_kvec - evaluate STEP over successive chunks of a kvec array.
 *
 * Same walk as iterate_iovec() but over i->kvec.  The value of STEP is
 * discarded (it is cast to void), so every chunk counts as fully processed
 * and the walk always covers all @n bytes.
 *
 * On exit @n is restored to the value it had on entry, __p points at the
 * last segment visited and @skip is the offset reached inside that segment.
 * The macro declares a local named "wanted".
 */
40d879cb83SAl Viro #define iterate_kvec(i, n, __v, __p, skip, STEP) {	\
41d879cb83SAl Viro 	size_t wanted = n;				\
42d879cb83SAl Viro 	__p = i->kvec;					\
43d879cb83SAl Viro 	__v.iov_len = min(n, __p->iov_len - skip);	\
44d879cb83SAl Viro 	if (likely(__v.iov_len)) {			\
45d879cb83SAl Viro 		__v.iov_base = __p->iov_base + skip;	\
46d879cb83SAl Viro 		(void)(STEP);				\
47d879cb83SAl Viro 		skip += __v.iov_len;			\
48d879cb83SAl Viro 		n -= __v.iov_len;			\
49d879cb83SAl Viro 	}						\
50d879cb83SAl Viro 	while (unlikely(n)) {				\
51d879cb83SAl Viro 		__p++;					\
52d879cb83SAl Viro 		__v.iov_len = min(n, __p->iov_len);	\
53d879cb83SAl Viro 		if (unlikely(!__v.iov_len))		\
54d879cb83SAl Viro 			continue;			\
55d879cb83SAl Viro 		__v.iov_base = __p->iov_base;		\
56d879cb83SAl Viro 		(void)(STEP);				\
57d879cb83SAl Viro 		skip = __v.iov_len;			\
58d879cb83SAl Viro 		n -= __v.iov_len;			\
59d879cb83SAl Viro 	}						\
60d879cb83SAl Viro 	n = wanted;					\
61d879cb83SAl Viro }
62d879cb83SAl Viro 
/*
 * iterate_bvec - evaluate STEP over the bio_vec segments of an iterator.
 *
 * Builds a starting struct bvec_iter (bi_size = @n, bi_bvec_done = @skip,
 * bi_idx = 0) and lets for_each_bvec() walk i->bvec with __bi as the cursor
 * and __v as the current segment.  Zero-length segments are skipped; the
 * value of STEP is discarded.
 *
 * @n and @skip are only read here.  __bi is left holding the final cursor
 * state, which iterate_and_advance() reads back after the walk.
 */
631bdc76aeSMing Lei #define iterate_bvec(i, n, __v, __bi, skip, STEP) {	\
641bdc76aeSMing Lei 	struct bvec_iter __start;			\
651bdc76aeSMing Lei 	__start.bi_size = n;				\
661bdc76aeSMing Lei 	__start.bi_bvec_done = skip;			\
671bdc76aeSMing Lei 	__start.bi_idx = 0;				\
681bdc76aeSMing Lei 	for_each_bvec(__v, i->bvec, __bi, __start) {	\
691bdc76aeSMing Lei 		if (!__v.bv_len)			\
70d879cb83SAl Viro 			continue;			\
71d879cb83SAl Viro 		(void)(STEP);				\
72d879cb83SAl Viro 	}						\
73d879cb83SAl Viro }
74d879cb83SAl Viro 
/*
 * iterate_all_kinds - walk @n bytes of iterator @i without advancing it.
 *
 * Does nothing when @n is zero.  Otherwise starts at i->iov_offset and picks
 * the walker from i->type: ITER_BVEC runs B via iterate_bvec(), ITER_KVEC
 * runs K via iterate_kvec(), anything else runs I via iterate_iovec().
 * A variable named @v of the matching type (struct bio_vec, struct kvec or
 * struct iovec) is declared for the step expression to use.
 *
 * No field of @i is written.  @n is whatever the selected walker leaves in
 * it (for the iovec flavour, the number of bytes actually processed).
 */
75d879cb83SAl Viro #define iterate_all_kinds(i, n, v, I, B, K) {			\
7633844e66SAl Viro 	if (likely(n)) {					\
77d879cb83SAl Viro 		size_t skip = i->iov_offset;			\
78d879cb83SAl Viro 		if (unlikely(i->type & ITER_BVEC)) {		\
79d879cb83SAl Viro 			struct bio_vec v;			\
801bdc76aeSMing Lei 			struct bvec_iter __bi;			\
811bdc76aeSMing Lei 			iterate_bvec(i, n, v, __bi, skip, (B))	\
82d879cb83SAl Viro 		} else if (unlikely(i->type & ITER_KVEC)) {	\
83d879cb83SAl Viro 			const struct kvec *kvec;		\
84d879cb83SAl Viro 			struct kvec v;				\
85d879cb83SAl Viro 			iterate_kvec(i, n, v, kvec, skip, (K))	\
86d879cb83SAl Viro 		} else {					\
87d879cb83SAl Viro 			const struct iovec *iov;		\
88d879cb83SAl Viro 			struct iovec v;				\
89d879cb83SAl Viro 			iterate_iovec(i, n, v, iov, skip, (I))	\
90d879cb83SAl Viro 		}						\
9133844e66SAl Viro 	}							\
92d879cb83SAl Viro }
93d879cb83SAl Viro 
/*
 * iterate_and_advance - walk up to @n bytes of iterator @i and consume them.
 *
 * @n is first clamped to i->count.  If the iterator still holds data
 * (i->count is non-zero) the walker matching i->type is run exactly as in
 * iterate_all_kinds() (I for iovec, B for bvec, K for kvec) and the iterator
 * is then moved forward:
 *   - the segment pointer and i->nr_segs are updated to the segment where
 *     the walk stopped (for iovec/kvec, stepping past that segment when the
 *     walk ended exactly at its end);
 *   - i->iov_offset becomes the offset inside that segment;
 *   - i->count is reduced by @n.
 *
 * On exit @n is the number of bytes consumed.  The guard tests i->count,
 * not @n, so a zero @n on a non-empty iterator still goes through the walk
 * and the bookkeeping (consuming nothing).
 */
94d879cb83SAl Viro #define iterate_and_advance(i, n, v, I, B, K) {			\
95dd254f5aSAl Viro 	if (unlikely(i->count < n))				\
96dd254f5aSAl Viro 		n = i->count;					\
9719f18459SAl Viro 	if (i->count) {						\
98d879cb83SAl Viro 		size_t skip = i->iov_offset;			\
99d879cb83SAl Viro 		if (unlikely(i->type & ITER_BVEC)) {		\
1001bdc76aeSMing Lei 			const struct bio_vec *bvec = i->bvec;	\
101d879cb83SAl Viro 			struct bio_vec v;			\
1021bdc76aeSMing Lei 			struct bvec_iter __bi;			\
1031bdc76aeSMing Lei 			iterate_bvec(i, n, v, __bi, skip, (B))	\
1041bdc76aeSMing Lei 			i->bvec = __bvec_iter_bvec(i->bvec, __bi);	\
1051bdc76aeSMing Lei 			i->nr_segs -= i->bvec - bvec;		\
1061bdc76aeSMing Lei 			skip = __bi.bi_bvec_done;		\
107d879cb83SAl Viro 		} else if (unlikely(i->type & ITER_KVEC)) {	\
108d879cb83SAl Viro 			const struct kvec *kvec;		\
109d879cb83SAl Viro 			struct kvec v;				\
110d879cb83SAl Viro 			iterate_kvec(i, n, v, kvec, skip, (K))	\
111d879cb83SAl Viro 			if (skip == kvec->iov_len) {		\
112d879cb83SAl Viro 				kvec++;				\
113d879cb83SAl Viro 				skip = 0;			\
114d879cb83SAl Viro 			}					\
115d879cb83SAl Viro 			i->nr_segs -= kvec - i->kvec;		\
116d879cb83SAl Viro 			i->kvec = kvec;				\
117d879cb83SAl Viro 		} else {					\
118d879cb83SAl Viro 			const struct iovec *iov;		\
119d879cb83SAl Viro 			struct iovec v;				\
120d879cb83SAl Viro 			iterate_iovec(i, n, v, iov, skip, (I))	\
121d879cb83SAl Viro 			if (skip == iov->iov_len) {		\
122d879cb83SAl Viro 				iov++;				\
123d879cb83SAl Viro 				skip = 0;			\
124d879cb83SAl Viro 			}					\
125d879cb83SAl Viro 			i->nr_segs -= iov - i->iov;		\
126d879cb83SAl Viro 			i->iov = iov;				\
127d879cb83SAl Viro 		}						\
128d879cb83SAl Viro 		i->count -= n;					\
129d879cb83SAl Viro 		i->iov_offset = skip;				\
130dd254f5aSAl Viro 	}							\
131d879cb83SAl Viro }
132d879cb83SAl Viro 
13309fc68dcSAl Viro static int copyout(void __user *to, const void *from, size_t n)
13409fc68dcSAl Viro {
13509fc68dcSAl Viro 	if (access_ok(VERIFY_WRITE, to, n)) {
13609fc68dcSAl Viro 		kasan_check_read(from, n);
13709fc68dcSAl Viro 		n = raw_copy_to_user(to, from, n);
13809fc68dcSAl Viro 	}
13909fc68dcSAl Viro 	return n;
14009fc68dcSAl Viro }
14109fc68dcSAl Viro 
14209fc68dcSAl Viro static int copyin(void *to, const void __user *from, size_t n)
14309fc68dcSAl Viro {
14409fc68dcSAl Viro 	if (access_ok(VERIFY_READ, from, n)) {
14509fc68dcSAl Viro 		kasan_check_write(to, n);
14609fc68dcSAl Viro 		n = raw_copy_from_user(to, from, n);
14709fc68dcSAl Viro 	}
14809fc68dcSAl Viro 	return n;
14909fc68dcSAl Viro }
15009fc68dcSAl Viro 
151d879cb83SAl Viro static size_t copy_page_to_iter_iovec(struct page *page, size_t offset, size_t bytes,
152d879cb83SAl Viro 			 struct iov_iter *i)
153d879cb83SAl Viro {
154d879cb83SAl Viro 	size_t skip, copy, left, wanted;
155d879cb83SAl Viro 	const struct iovec *iov;
156d879cb83SAl Viro 	char __user *buf;
157d879cb83SAl Viro 	void *kaddr, *from;
158d879cb83SAl Viro 
159d879cb83SAl Viro 	if (unlikely(bytes > i->count))
160d879cb83SAl Viro 		bytes = i->count;
161d879cb83SAl Viro 
162d879cb83SAl Viro 	if (unlikely(!bytes))
163d879cb83SAl Viro 		return 0;
164d879cb83SAl Viro 
16509fc68dcSAl Viro 	might_fault();
166d879cb83SAl Viro 	wanted = bytes;
167d879cb83SAl Viro 	iov = i->iov;
168d879cb83SAl Viro 	skip = i->iov_offset;
169d879cb83SAl Viro 	buf = iov->iov_base + skip;
170d879cb83SAl Viro 	copy = min(bytes, iov->iov_len - skip);
171d879cb83SAl Viro 
1723fa6c507SMikulas Patocka 	if (IS_ENABLED(CONFIG_HIGHMEM) && !fault_in_pages_writeable(buf, copy)) {
173d879cb83SAl Viro 		kaddr = kmap_atomic(page);
174d879cb83SAl Viro 		from = kaddr + offset;
175d879cb83SAl Viro 
176d879cb83SAl Viro 		/* first chunk, usually the only one */
17709fc68dcSAl Viro 		left = copyout(buf, from, copy);
178d879cb83SAl Viro 		copy -= left;
179d879cb83SAl Viro 		skip += copy;
180d879cb83SAl Viro 		from += copy;
181d879cb83SAl Viro 		bytes -= copy;
182d879cb83SAl Viro 
183d879cb83SAl Viro 		while (unlikely(!left && bytes)) {
184d879cb83SAl Viro 			iov++;
185d879cb83SAl Viro 			buf = iov->iov_base;
186d879cb83SAl Viro 			copy = min(bytes, iov->iov_len);
18709fc68dcSAl Viro 			left = copyout(buf, from, copy);
188d879cb83SAl Viro 			copy -= left;
189d879cb83SAl Viro 			skip = copy;
190d879cb83SAl Viro 			from += copy;
191d879cb83SAl Viro 			bytes -= copy;
192d879cb83SAl Viro 		}
193d879cb83SAl Viro 		if (likely(!bytes)) {
194d879cb83SAl Viro 			kunmap_atomic(kaddr);
195d879cb83SAl Viro 			goto done;
196d879cb83SAl Viro 		}
197d879cb83SAl Viro 		offset = from - kaddr;
198d879cb83SAl Viro 		buf += copy;
199d879cb83SAl Viro 		kunmap_atomic(kaddr);
200d879cb83SAl Viro 		copy = min(bytes, iov->iov_len - skip);
201d879cb83SAl Viro 	}
202d879cb83SAl Viro 	/* Too bad - revert to non-atomic kmap */
2033fa6c507SMikulas Patocka 
204d879cb83SAl Viro 	kaddr = kmap(page);
205d879cb83SAl Viro 	from = kaddr + offset;
20609fc68dcSAl Viro 	left = copyout(buf, from, copy);
207d879cb83SAl Viro 	copy -= left;
208d879cb83SAl Viro 	skip += copy;
209d879cb83SAl Viro 	from += copy;
210d879cb83SAl Viro 	bytes -= copy;
211d879cb83SAl Viro 	while (unlikely(!left && bytes)) {
212d879cb83SAl Viro 		iov++;
213d879cb83SAl Viro 		buf = iov->iov_base;
214d879cb83SAl Viro 		copy = min(bytes, iov->iov_len);
21509fc68dcSAl Viro 		left = copyout(buf, from, copy);
216d879cb83SAl Viro 		copy -= left;
217d879cb83SAl Viro 		skip = copy;
218d879cb83SAl Viro 		from += copy;
219d879cb83SAl Viro 		bytes -= copy;
220d879cb83SAl Viro 	}
221d879cb83SAl Viro 	kunmap(page);
2223fa6c507SMikulas Patocka 
223d879cb83SAl Viro done:
224d879cb83SAl Viro 	if (skip == iov->iov_len) {
225d879cb83SAl Viro 		iov++;
226d879cb83SAl Viro 		skip = 0;
227d879cb83SAl Viro 	}
228d879cb83SAl Viro 	i->count -= wanted - bytes;
229d879cb83SAl Viro 	i->nr_segs -= iov - i->iov;
230d879cb83SAl Viro 	i->iov = iov;
231d879cb83SAl Viro 	i->iov_offset = skip;
232d879cb83SAl Viro 	return wanted - bytes;
233d879cb83SAl Viro }
234d879cb83SAl Viro 
235d879cb83SAl Viro static size_t copy_page_from_iter_iovec(struct page *page, size_t offset, size_t bytes,
236d879cb83SAl Viro 			 struct iov_iter *i)
237d879cb83SAl Viro {
238d879cb83SAl Viro 	size_t skip, copy, left, wanted;
239d879cb83SAl Viro 	const struct iovec *iov;
240d879cb83SAl Viro 	char __user *buf;
241d879cb83SAl Viro 	void *kaddr, *to;
242d879cb83SAl Viro 
243d879cb83SAl Viro 	if (unlikely(bytes > i->count))
244d879cb83SAl Viro 		bytes = i->count;
245d879cb83SAl Viro 
246d879cb83SAl Viro 	if (unlikely(!bytes))
247d879cb83SAl Viro 		return 0;
248d879cb83SAl Viro 
24909fc68dcSAl Viro 	might_fault();
250d879cb83SAl Viro 	wanted = bytes;
251d879cb83SAl Viro 	iov = i->iov;
252d879cb83SAl Viro 	skip = i->iov_offset;
253d879cb83SAl Viro 	buf = iov->iov_base + skip;
254d879cb83SAl Viro 	copy = min(bytes, iov->iov_len - skip);
255d879cb83SAl Viro 
2563fa6c507SMikulas Patocka 	if (IS_ENABLED(CONFIG_HIGHMEM) && !fault_in_pages_readable(buf, copy)) {
257d879cb83SAl Viro 		kaddr = kmap_atomic(page);
258d879cb83SAl Viro 		to = kaddr + offset;
259d879cb83SAl Viro 
260d879cb83SAl Viro 		/* first chunk, usually the only one */
26109fc68dcSAl Viro 		left = copyin(to, buf, copy);
262d879cb83SAl Viro 		copy -= left;
263d879cb83SAl Viro 		skip += copy;
264d879cb83SAl Viro 		to += copy;
265d879cb83SAl Viro 		bytes -= copy;
266d879cb83SAl Viro 
267d879cb83SAl Viro 		while (unlikely(!left && bytes)) {
268d879cb83SAl Viro 			iov++;
269d879cb83SAl Viro 			buf = iov->iov_base;
270d879cb83SAl Viro 			copy = min(bytes, iov->iov_len);
27109fc68dcSAl Viro 			left = copyin(to, buf, copy);
272d879cb83SAl Viro 			copy -= left;
273d879cb83SAl Viro 			skip = copy;
274d879cb83SAl Viro 			to += copy;
275d879cb83SAl Viro 			bytes -= copy;
276d879cb83SAl Viro 		}
277d879cb83SAl Viro 		if (likely(!bytes)) {
278d879cb83SAl Viro 			kunmap_atomic(kaddr);
279d879cb83SAl Viro 			goto done;
280d879cb83SAl Viro 		}
281d879cb83SAl Viro 		offset = to - kaddr;
282d879cb83SAl Viro 		buf += copy;
283d879cb83SAl Viro 		kunmap_atomic(kaddr);
284d879cb83SAl Viro 		copy = min(bytes, iov->iov_len - skip);
285d879cb83SAl Viro 	}
286d879cb83SAl Viro 	/* Too bad - revert to non-atomic kmap */
2873fa6c507SMikulas Patocka 
288d879cb83SAl Viro 	kaddr = kmap(page);
289d879cb83SAl Viro 	to = kaddr + offset;
29009fc68dcSAl Viro 	left = copyin(to, buf, copy);
291d879cb83SAl Viro 	copy -= left;
292d879cb83SAl Viro 	skip += copy;
293d879cb83SAl Viro 	to += copy;
294d879cb83SAl Viro 	bytes -= copy;
295d879cb83SAl Viro 	while (unlikely(!left && bytes)) {
296d879cb83SAl Viro 		iov++;
297d879cb83SAl Viro 		buf = iov->iov_base;
298d879cb83SAl Viro 		copy = min(bytes, iov->iov_len);
29909fc68dcSAl Viro 		left = copyin(to, buf, copy);
300d879cb83SAl Viro 		copy -= left;
301d879cb83SAl Viro 		skip = copy;
302d879cb83SAl Viro 		to += copy;
303d879cb83SAl Viro 		bytes -= copy;
304d879cb83SAl Viro 	}
305d879cb83SAl Viro 	kunmap(page);
3063fa6c507SMikulas Patocka 
307d879cb83SAl Viro done:
308d879cb83SAl Viro 	if (skip == iov->iov_len) {
309d879cb83SAl Viro 		iov++;
310d879cb83SAl Viro 		skip = 0;
311d879cb83SAl Viro 	}
312d879cb83SAl Viro 	i->count -= wanted - bytes;
313d879cb83SAl Viro 	i->nr_segs -= iov - i->iov;
314d879cb83SAl Viro 	i->iov = iov;
315d879cb83SAl Viro 	i->iov_offset = skip;
316d879cb83SAl Viro 	return wanted - bytes;
317d879cb83SAl Viro }
318d879cb83SAl Viro 
#ifdef PIPE_PARANOIA
/*
 * Check that a pipe-backed iterator is consistent with its pipe.
 *
 * With a non-zero i->iov_offset the pipe must be non-empty, i->idx must be
 * the last occupied buffer, and i->iov_offset must equal that buffer's
 * offset + len.  With a zero i->iov_offset, i->idx must be the slot right
 * after the last occupied buffer.
 *
 * Returns true when consistent.  Otherwise dumps the iterator position and
 * every pipe buffer at KERN_ERR, triggers WARN_ON(1) and returns false.
 */
static bool sanity(const struct iov_iter *i)
{
	struct pipe_inode_info *pipe = i->pipe;
	int idx = i->idx;
	int next = pipe->curbuf + pipe->nrbufs;

	if (i->iov_offset) {
		struct pipe_buffer *p;

		if (unlikely(!pipe->nrbufs))
			goto Bad;	// pipe must be non-empty
		if (unlikely(idx != ((next - 1) & (pipe->buffers - 1))))
			goto Bad;	// must be at the last buffer...

		p = &pipe->bufs[idx];
		if (unlikely(p->offset + p->len != i->iov_offset))
			goto Bad;	// ... at the end of segment
	} else {
		if (idx != (next & (pipe->buffers - 1)))
			goto Bad;	// must be right after the last buffer
	}
	return true;
Bad:
	/* iov_offset is a size_t, so print it with the unsigned %zu */
	printk(KERN_ERR "idx = %d, offset = %zu\n", i->idx, i->iov_offset);
	printk(KERN_ERR "curbuf = %d, nrbufs = %d, buffers = %d\n",
			pipe->curbuf, pipe->nrbufs, pipe->buffers);
	for (idx = 0; idx < pipe->buffers; idx++)
		printk(KERN_ERR "[%p %p %d %d]\n",
			pipe->bufs[idx].ops,
			pipe->bufs[idx].page,
			pipe->bufs[idx].offset,
			pipe->bufs[idx].len);
	WARN_ON(1);
	return false;
}
#else
/* Checks compiled out: every iterator is reported as consistent. */
#define sanity(i) true
#endif
356241699cdSAl Viro 
357241699cdSAl Viro static inline int next_idx(int idx, struct pipe_inode_info *pipe)
358241699cdSAl Viro {
359241699cdSAl Viro 	return (idx + 1) & (pipe->buffers - 1);
360241699cdSAl Viro }
361241699cdSAl Viro 
362241699cdSAl Viro static size_t copy_page_to_iter_pipe(struct page *page, size_t offset, size_t bytes,
363241699cdSAl Viro 			 struct iov_iter *i)
364241699cdSAl Viro {
365241699cdSAl Viro 	struct pipe_inode_info *pipe = i->pipe;
366241699cdSAl Viro 	struct pipe_buffer *buf;
367241699cdSAl Viro 	size_t off;
368241699cdSAl Viro 	int idx;
369241699cdSAl Viro 
370241699cdSAl Viro 	if (unlikely(bytes > i->count))
371241699cdSAl Viro 		bytes = i->count;
372241699cdSAl Viro 
373241699cdSAl Viro 	if (unlikely(!bytes))
374241699cdSAl Viro 		return 0;
375241699cdSAl Viro 
376241699cdSAl Viro 	if (!sanity(i))
377241699cdSAl Viro 		return 0;
378241699cdSAl Viro 
379241699cdSAl Viro 	off = i->iov_offset;
380241699cdSAl Viro 	idx = i->idx;
381241699cdSAl Viro 	buf = &pipe->bufs[idx];
382241699cdSAl Viro 	if (off) {
383241699cdSAl Viro 		if (offset == off && buf->page == page) {
384241699cdSAl Viro 			/* merge with the last one */
385241699cdSAl Viro 			buf->len += bytes;
386241699cdSAl Viro 			i->iov_offset += bytes;
387241699cdSAl Viro 			goto out;
388241699cdSAl Viro 		}
389241699cdSAl Viro 		idx = next_idx(idx, pipe);
390241699cdSAl Viro 		buf = &pipe->bufs[idx];
391241699cdSAl Viro 	}
392241699cdSAl Viro 	if (idx == pipe->curbuf && pipe->nrbufs)
393241699cdSAl Viro 		return 0;
394241699cdSAl Viro 	pipe->nrbufs++;
395241699cdSAl Viro 	buf->ops = &page_cache_pipe_buf_ops;
396241699cdSAl Viro 	get_page(buf->page = page);
397241699cdSAl Viro 	buf->offset = offset;
398241699cdSAl Viro 	buf->len = bytes;
399241699cdSAl Viro 	i->iov_offset = offset + bytes;
400241699cdSAl Viro 	i->idx = idx;
401241699cdSAl Viro out:
402241699cdSAl Viro 	i->count -= bytes;
403241699cdSAl Viro 	return bytes;
404241699cdSAl Viro }
405241699cdSAl Viro 
406d879cb83SAl Viro /*
407171a0203SAnton Altaparmakov  * Fault in one or more iovecs of the given iov_iter, to a maximum length of
408171a0203SAnton Altaparmakov  * bytes.  For each iovec, fault in each page that constitutes the iovec.
409171a0203SAnton Altaparmakov  *
410171a0203SAnton Altaparmakov  * Return 0 on success, or non-zero if the memory could not be accessed (i.e.
411171a0203SAnton Altaparmakov  * because it is an invalid address).
412171a0203SAnton Altaparmakov  */
413d4690f1eSAl Viro int iov_iter_fault_in_readable(struct iov_iter *i, size_t bytes)
414171a0203SAnton Altaparmakov {
415171a0203SAnton Altaparmakov 	size_t skip = i->iov_offset;
416171a0203SAnton Altaparmakov 	const struct iovec *iov;
417171a0203SAnton Altaparmakov 	int err;
418171a0203SAnton Altaparmakov 	struct iovec v;
419171a0203SAnton Altaparmakov 
420171a0203SAnton Altaparmakov 	if (!(i->type & (ITER_BVEC|ITER_KVEC))) {
421171a0203SAnton Altaparmakov 		iterate_iovec(i, bytes, v, iov, skip, ({
4224bce9f6eSAl Viro 			err = fault_in_pages_readable(v.iov_base, v.iov_len);
423171a0203SAnton Altaparmakov 			if (unlikely(err))
424171a0203SAnton Altaparmakov 			return err;
425171a0203SAnton Altaparmakov 		0;}))
426171a0203SAnton Altaparmakov 	}
427171a0203SAnton Altaparmakov 	return 0;
428171a0203SAnton Altaparmakov }
429d4690f1eSAl Viro EXPORT_SYMBOL(iov_iter_fault_in_readable);
430171a0203SAnton Altaparmakov 
431d879cb83SAl Viro void iov_iter_init(struct iov_iter *i, int direction,
432d879cb83SAl Viro 			const struct iovec *iov, unsigned long nr_segs,
433d879cb83SAl Viro 			size_t count)
434d879cb83SAl Viro {
435d879cb83SAl Viro 	/* It will get better.  Eventually... */
436db68ce10SAl Viro 	if (uaccess_kernel()) {
437d879cb83SAl Viro 		direction |= ITER_KVEC;
438d879cb83SAl Viro 		i->type = direction;
439d879cb83SAl Viro 		i->kvec = (struct kvec *)iov;
440d879cb83SAl Viro 	} else {
441d879cb83SAl Viro 		i->type = direction;
442d879cb83SAl Viro 		i->iov = iov;
443d879cb83SAl Viro 	}
444d879cb83SAl Viro 	i->nr_segs = nr_segs;
445d879cb83SAl Viro 	i->iov_offset = 0;
446d879cb83SAl Viro 	i->count = count;
447d879cb83SAl Viro }
448d879cb83SAl Viro EXPORT_SYMBOL(iov_iter_init);
449d879cb83SAl Viro 
450d879cb83SAl Viro static void memcpy_from_page(char *to, struct page *page, size_t offset, size_t len)
451d879cb83SAl Viro {
452d879cb83SAl Viro 	char *from = kmap_atomic(page);
453d879cb83SAl Viro 	memcpy(to, from + offset, len);
454d879cb83SAl Viro 	kunmap_atomic(from);
455d879cb83SAl Viro }
456d879cb83SAl Viro 
45736f7a8a4SAl Viro static void memcpy_to_page(struct page *page, size_t offset, const char *from, size_t len)
458d879cb83SAl Viro {
459d879cb83SAl Viro 	char *to = kmap_atomic(page);
460d879cb83SAl Viro 	memcpy(to + offset, from, len);
461d879cb83SAl Viro 	kunmap_atomic(to);
462d879cb83SAl Viro }
463d879cb83SAl Viro 
464d879cb83SAl Viro static void memzero_page(struct page *page, size_t offset, size_t len)
465d879cb83SAl Viro {
466d879cb83SAl Viro 	char *addr = kmap_atomic(page);
467d879cb83SAl Viro 	memset(addr + offset, 0, len);
468d879cb83SAl Viro 	kunmap_atomic(addr);
469d879cb83SAl Viro }
470d879cb83SAl Viro 
471241699cdSAl Viro static inline bool allocated(struct pipe_buffer *buf)
472241699cdSAl Viro {
473241699cdSAl Viro 	return buf->ops == &default_pipe_buf_ops;
474241699cdSAl Viro }
475241699cdSAl Viro 
476241699cdSAl Viro static inline void data_start(const struct iov_iter *i, int *idxp, size_t *offp)
477241699cdSAl Viro {
478241699cdSAl Viro 	size_t off = i->iov_offset;
479241699cdSAl Viro 	int idx = i->idx;
480241699cdSAl Viro 	if (off && (!allocated(&i->pipe->bufs[idx]) || off == PAGE_SIZE)) {
481241699cdSAl Viro 		idx = next_idx(idx, i->pipe);
482241699cdSAl Viro 		off = 0;
483241699cdSAl Viro 	}
484241699cdSAl Viro 	*idxp = idx;
485241699cdSAl Viro 	*offp = off;
486241699cdSAl Viro }
487241699cdSAl Viro 
488241699cdSAl Viro static size_t push_pipe(struct iov_iter *i, size_t size,
489241699cdSAl Viro 			int *idxp, size_t *offp)
490241699cdSAl Viro {
491241699cdSAl Viro 	struct pipe_inode_info *pipe = i->pipe;
492241699cdSAl Viro 	size_t off;
493241699cdSAl Viro 	int idx;
494241699cdSAl Viro 	ssize_t left;
495241699cdSAl Viro 
496241699cdSAl Viro 	if (unlikely(size > i->count))
497241699cdSAl Viro 		size = i->count;
498241699cdSAl Viro 	if (unlikely(!size))
499241699cdSAl Viro 		return 0;
500241699cdSAl Viro 
501241699cdSAl Viro 	left = size;
502241699cdSAl Viro 	data_start(i, &idx, &off);
503241699cdSAl Viro 	*idxp = idx;
504241699cdSAl Viro 	*offp = off;
505241699cdSAl Viro 	if (off) {
506241699cdSAl Viro 		left -= PAGE_SIZE - off;
507241699cdSAl Viro 		if (left <= 0) {
508241699cdSAl Viro 			pipe->bufs[idx].len += size;
509241699cdSAl Viro 			return size;
510241699cdSAl Viro 		}
511241699cdSAl Viro 		pipe->bufs[idx].len = PAGE_SIZE;
512241699cdSAl Viro 		idx = next_idx(idx, pipe);
513241699cdSAl Viro 	}
514241699cdSAl Viro 	while (idx != pipe->curbuf || !pipe->nrbufs) {
515241699cdSAl Viro 		struct page *page = alloc_page(GFP_USER);
516241699cdSAl Viro 		if (!page)
517241699cdSAl Viro 			break;
518241699cdSAl Viro 		pipe->nrbufs++;
519241699cdSAl Viro 		pipe->bufs[idx].ops = &default_pipe_buf_ops;
520241699cdSAl Viro 		pipe->bufs[idx].page = page;
521241699cdSAl Viro 		pipe->bufs[idx].offset = 0;
522241699cdSAl Viro 		if (left <= PAGE_SIZE) {
523241699cdSAl Viro 			pipe->bufs[idx].len = left;
524241699cdSAl Viro 			return size;
525241699cdSAl Viro 		}
526241699cdSAl Viro 		pipe->bufs[idx].len = PAGE_SIZE;
527241699cdSAl Viro 		left -= PAGE_SIZE;
528241699cdSAl Viro 		idx = next_idx(idx, pipe);
529241699cdSAl Viro 	}
530241699cdSAl Viro 	return size - left;
531241699cdSAl Viro }
532241699cdSAl Viro 
533241699cdSAl Viro static size_t copy_pipe_to_iter(const void *addr, size_t bytes,
534241699cdSAl Viro 				struct iov_iter *i)
535241699cdSAl Viro {
536241699cdSAl Viro 	struct pipe_inode_info *pipe = i->pipe;
537241699cdSAl Viro 	size_t n, off;
538241699cdSAl Viro 	int idx;
539241699cdSAl Viro 
540241699cdSAl Viro 	if (!sanity(i))
541241699cdSAl Viro 		return 0;
542241699cdSAl Viro 
543241699cdSAl Viro 	bytes = n = push_pipe(i, bytes, &idx, &off);
544241699cdSAl Viro 	if (unlikely(!n))
545241699cdSAl Viro 		return 0;
546241699cdSAl Viro 	for ( ; n; idx = next_idx(idx, pipe), off = 0) {
547241699cdSAl Viro 		size_t chunk = min_t(size_t, n, PAGE_SIZE - off);
548241699cdSAl Viro 		memcpy_to_page(pipe->bufs[idx].page, off, addr, chunk);
549241699cdSAl Viro 		i->idx = idx;
550241699cdSAl Viro 		i->iov_offset = off + chunk;
551241699cdSAl Viro 		n -= chunk;
552241699cdSAl Viro 		addr += chunk;
553241699cdSAl Viro 	}
554241699cdSAl Viro 	i->count -= bytes;
555241699cdSAl Viro 	return bytes;
556241699cdSAl Viro }
557241699cdSAl Viro 
558aa28de27SAl Viro size_t _copy_to_iter(const void *addr, size_t bytes, struct iov_iter *i)
559d879cb83SAl Viro {
56036f7a8a4SAl Viro 	const char *from = addr;
561241699cdSAl Viro 	if (unlikely(i->type & ITER_PIPE))
562241699cdSAl Viro 		return copy_pipe_to_iter(addr, bytes, i);
56309fc68dcSAl Viro 	if (iter_is_iovec(i))
56409fc68dcSAl Viro 		might_fault();
565d879cb83SAl Viro 	iterate_and_advance(i, bytes, v,
56609fc68dcSAl Viro 		copyout(v.iov_base, (from += v.iov_len) - v.iov_len, v.iov_len),
567d879cb83SAl Viro 		memcpy_to_page(v.bv_page, v.bv_offset,
568d879cb83SAl Viro 			       (from += v.bv_len) - v.bv_len, v.bv_len),
569d879cb83SAl Viro 		memcpy(v.iov_base, (from += v.iov_len) - v.iov_len, v.iov_len)
570d879cb83SAl Viro 	)
571d879cb83SAl Viro 
572d879cb83SAl Viro 	return bytes;
573d879cb83SAl Viro }
574aa28de27SAl Viro EXPORT_SYMBOL(_copy_to_iter);
575d879cb83SAl Viro 
5768780356eSDan Williams #ifdef CONFIG_ARCH_HAS_UACCESS_MCSAFE
5778780356eSDan Williams static int copyout_mcsafe(void __user *to, const void *from, size_t n)
5788780356eSDan Williams {
5798780356eSDan Williams 	if (access_ok(VERIFY_WRITE, to, n)) {
5808780356eSDan Williams 		kasan_check_read(from, n);
5818780356eSDan Williams 		n = copy_to_user_mcsafe((__force void *) to, from, n);
5828780356eSDan Williams 	}
5838780356eSDan Williams 	return n;
5848780356eSDan Williams }
5858780356eSDan Williams 
5868780356eSDan Williams static unsigned long memcpy_mcsafe_to_page(struct page *page, size_t offset,
5878780356eSDan Williams 		const char *from, size_t len)
5888780356eSDan Williams {
5898780356eSDan Williams 	unsigned long ret;
5908780356eSDan Williams 	char *to;
5918780356eSDan Williams 
5928780356eSDan Williams 	to = kmap_atomic(page);
5938780356eSDan Williams 	ret = memcpy_mcsafe(to + offset, from, len);
5948780356eSDan Williams 	kunmap_atomic(to);
5958780356eSDan Williams 
5968780356eSDan Williams 	return ret;
5978780356eSDan Williams }
5988780356eSDan Williams 
5998780356eSDan Williams size_t _copy_to_iter_mcsafe(const void *addr, size_t bytes, struct iov_iter *i)
6008780356eSDan Williams {
6018780356eSDan Williams 	const char *from = addr;
6028780356eSDan Williams 	unsigned long rem, curr_addr, s_addr = (unsigned long) addr;
6038780356eSDan Williams 
6048780356eSDan Williams 	if (unlikely(i->type & ITER_PIPE)) {
6058780356eSDan Williams 		WARN_ON(1);
6068780356eSDan Williams 		return 0;
6078780356eSDan Williams 	}
6088780356eSDan Williams 	if (iter_is_iovec(i))
6098780356eSDan Williams 		might_fault();
6108780356eSDan Williams 	iterate_and_advance(i, bytes, v,
6118780356eSDan Williams 		copyout_mcsafe(v.iov_base, (from += v.iov_len) - v.iov_len, v.iov_len),
6128780356eSDan Williams 		({
6138780356eSDan Williams 		rem = memcpy_mcsafe_to_page(v.bv_page, v.bv_offset,
6148780356eSDan Williams                                (from += v.bv_len) - v.bv_len, v.bv_len);
6158780356eSDan Williams 		if (rem) {
6168780356eSDan Williams 			curr_addr = (unsigned long) from;
6178780356eSDan Williams 			bytes = curr_addr - s_addr - rem;
6188780356eSDan Williams 			return bytes;
6198780356eSDan Williams 		}
6208780356eSDan Williams 		}),
6218780356eSDan Williams 		({
6228780356eSDan Williams 		rem = memcpy_mcsafe(v.iov_base, (from += v.iov_len) - v.iov_len,
6238780356eSDan Williams 				v.iov_len);
6248780356eSDan Williams 		if (rem) {
6258780356eSDan Williams 			curr_addr = (unsigned long) from;
6268780356eSDan Williams 			bytes = curr_addr - s_addr - rem;
6278780356eSDan Williams 			return bytes;
6288780356eSDan Williams 		}
6298780356eSDan Williams 		})
6308780356eSDan Williams 	)
6318780356eSDan Williams 
6328780356eSDan Williams 	return bytes;
6338780356eSDan Williams }
6348780356eSDan Williams EXPORT_SYMBOL_GPL(_copy_to_iter_mcsafe);
6358780356eSDan Williams #endif /* CONFIG_ARCH_HAS_UACCESS_MCSAFE */
6368780356eSDan Williams 
637aa28de27SAl Viro size_t _copy_from_iter(void *addr, size_t bytes, struct iov_iter *i)
638d879cb83SAl Viro {
639d879cb83SAl Viro 	char *to = addr;
640241699cdSAl Viro 	if (unlikely(i->type & ITER_PIPE)) {
641241699cdSAl Viro 		WARN_ON(1);
642241699cdSAl Viro 		return 0;
643241699cdSAl Viro 	}
64409fc68dcSAl Viro 	if (iter_is_iovec(i))
64509fc68dcSAl Viro 		might_fault();
646d879cb83SAl Viro 	iterate_and_advance(i, bytes, v,
64709fc68dcSAl Viro 		copyin((to += v.iov_len) - v.iov_len, v.iov_base, v.iov_len),
648d879cb83SAl Viro 		memcpy_from_page((to += v.bv_len) - v.bv_len, v.bv_page,
649d879cb83SAl Viro 				 v.bv_offset, v.bv_len),
650d879cb83SAl Viro 		memcpy((to += v.iov_len) - v.iov_len, v.iov_base, v.iov_len)
651d879cb83SAl Viro 	)
652d879cb83SAl Viro 
653d879cb83SAl Viro 	return bytes;
654d879cb83SAl Viro }
655aa28de27SAl Viro EXPORT_SYMBOL(_copy_from_iter);
656d879cb83SAl Viro 
657aa28de27SAl Viro bool _copy_from_iter_full(void *addr, size_t bytes, struct iov_iter *i)
658cbbd26b8SAl Viro {
659cbbd26b8SAl Viro 	char *to = addr;
660cbbd26b8SAl Viro 	if (unlikely(i->type & ITER_PIPE)) {
661cbbd26b8SAl Viro 		WARN_ON(1);
662cbbd26b8SAl Viro 		return false;
663cbbd26b8SAl Viro 	}
66433844e66SAl Viro 	if (unlikely(i->count < bytes))
665cbbd26b8SAl Viro 		return false;
666cbbd26b8SAl Viro 
66709fc68dcSAl Viro 	if (iter_is_iovec(i))
66809fc68dcSAl Viro 		might_fault();
669cbbd26b8SAl Viro 	iterate_all_kinds(i, bytes, v, ({
67009fc68dcSAl Viro 		if (copyin((to += v.iov_len) - v.iov_len,
671cbbd26b8SAl Viro 				      v.iov_base, v.iov_len))
672cbbd26b8SAl Viro 			return false;
673cbbd26b8SAl Viro 		0;}),
674cbbd26b8SAl Viro 		memcpy_from_page((to += v.bv_len) - v.bv_len, v.bv_page,
675cbbd26b8SAl Viro 				 v.bv_offset, v.bv_len),
676cbbd26b8SAl Viro 		memcpy((to += v.iov_len) - v.iov_len, v.iov_base, v.iov_len)
677cbbd26b8SAl Viro 	)
678cbbd26b8SAl Viro 
679cbbd26b8SAl Viro 	iov_iter_advance(i, bytes);
680cbbd26b8SAl Viro 	return true;
681cbbd26b8SAl Viro }
682aa28de27SAl Viro EXPORT_SYMBOL(_copy_from_iter_full);
683cbbd26b8SAl Viro 
684aa28de27SAl Viro size_t _copy_from_iter_nocache(void *addr, size_t bytes, struct iov_iter *i)
685d879cb83SAl Viro {
686d879cb83SAl Viro 	char *to = addr;
687241699cdSAl Viro 	if (unlikely(i->type & ITER_PIPE)) {
688241699cdSAl Viro 		WARN_ON(1);
689241699cdSAl Viro 		return 0;
690241699cdSAl Viro 	}
691d879cb83SAl Viro 	iterate_and_advance(i, bytes, v,
6923f763453SAl Viro 		__copy_from_user_inatomic_nocache((to += v.iov_len) - v.iov_len,
693d879cb83SAl Viro 					 v.iov_base, v.iov_len),
694d879cb83SAl Viro 		memcpy_from_page((to += v.bv_len) - v.bv_len, v.bv_page,
695d879cb83SAl Viro 				 v.bv_offset, v.bv_len),
696d879cb83SAl Viro 		memcpy((to += v.iov_len) - v.iov_len, v.iov_base, v.iov_len)
697d879cb83SAl Viro 	)
698d879cb83SAl Viro 
699d879cb83SAl Viro 	return bytes;
700d879cb83SAl Viro }
701aa28de27SAl Viro EXPORT_SYMBOL(_copy_from_iter_nocache);
702d879cb83SAl Viro 
#ifdef CONFIG_ARCH_HAS_UACCESS_FLUSHCACHE
/*
 * Same job as _copy_from_iter(), but built on the *_flushcache primitives:
 * __copy_from_user_flushcache() for user iovecs, memcpy_page_flushcache()
 * for bvecs and memcpy_flushcache() for kvecs.
 *
 * Pipe iterators are not supported: they trigger WARN_ON(1) and 0 is
 * returned.  Returns the number of bytes consumed from the iterator.
 */
size_t _copy_from_iter_flushcache(void *addr, size_t bytes, struct iov_iter *i)
{
	char *dst = addr;

	if (unlikely(i->type & ITER_PIPE)) {
		WARN_ON(1);
		return 0;
	}

	iterate_and_advance(i, bytes, v,
		__copy_from_user_flushcache((dst += v.iov_len) - v.iov_len,
					 v.iov_base, v.iov_len),
		memcpy_page_flushcache((dst += v.bv_len) - v.bv_len, v.bv_page,
				 v.bv_offset, v.bv_len),
		memcpy_flushcache((dst += v.iov_len) - v.iov_len, v.iov_base,
			v.iov_len)
	)

	return bytes;
}
EXPORT_SYMBOL_GPL(_copy_from_iter_flushcache);
#endif
7240aed55afSDan Williams 
725aa28de27SAl Viro bool _copy_from_iter_full_nocache(void *addr, size_t bytes, struct iov_iter *i)
726cbbd26b8SAl Viro {
727cbbd26b8SAl Viro 	char *to = addr;
728cbbd26b8SAl Viro 	if (unlikely(i->type & ITER_PIPE)) {
729cbbd26b8SAl Viro 		WARN_ON(1);
730cbbd26b8SAl Viro 		return false;
731cbbd26b8SAl Viro 	}
73233844e66SAl Viro 	if (unlikely(i->count < bytes))
733cbbd26b8SAl Viro 		return false;
734cbbd26b8SAl Viro 	iterate_all_kinds(i, bytes, v, ({
7353f763453SAl Viro 		if (__copy_from_user_inatomic_nocache((to += v.iov_len) - v.iov_len,
736cbbd26b8SAl Viro 					     v.iov_base, v.iov_len))
737cbbd26b8SAl Viro 			return false;
738cbbd26b8SAl Viro 		0;}),
739cbbd26b8SAl Viro 		memcpy_from_page((to += v.bv_len) - v.bv_len, v.bv_page,
740cbbd26b8SAl Viro 				 v.bv_offset, v.bv_len),
741cbbd26b8SAl Viro 		memcpy((to += v.iov_len) - v.iov_len, v.iov_base, v.iov_len)
742cbbd26b8SAl Viro 	)
743cbbd26b8SAl Viro 
744cbbd26b8SAl Viro 	iov_iter_advance(i, bytes);
745cbbd26b8SAl Viro 	return true;
746cbbd26b8SAl Viro }
747aa28de27SAl Viro EXPORT_SYMBOL(_copy_from_iter_full_nocache);
748cbbd26b8SAl Viro 
74972e809edSAl Viro static inline bool page_copy_sane(struct page *page, size_t offset, size_t n)
75072e809edSAl Viro {
751a90bcb86SPetar Penkov 	struct page *head = compound_head(page);
752a90bcb86SPetar Penkov 	size_t v = n + offset + page_address(page) - page_address(head);
753a90bcb86SPetar Penkov 
754a90bcb86SPetar Penkov 	if (likely(n <= v && v <= (PAGE_SIZE << compound_order(head))))
75572e809edSAl Viro 		return true;
75672e809edSAl Viro 	WARN_ON(1);
75772e809edSAl Viro 	return false;
75872e809edSAl Viro }
759d879cb83SAl Viro 
760d879cb83SAl Viro size_t copy_page_to_iter(struct page *page, size_t offset, size_t bytes,
761d879cb83SAl Viro 			 struct iov_iter *i)
762d879cb83SAl Viro {
76372e809edSAl Viro 	if (unlikely(!page_copy_sane(page, offset, bytes)))
76472e809edSAl Viro 		return 0;
765d879cb83SAl Viro 	if (i->type & (ITER_BVEC|ITER_KVEC)) {
766d879cb83SAl Viro 		void *kaddr = kmap_atomic(page);
767d879cb83SAl Viro 		size_t wanted = copy_to_iter(kaddr + offset, bytes, i);
768d879cb83SAl Viro 		kunmap_atomic(kaddr);
769d879cb83SAl Viro 		return wanted;
770241699cdSAl Viro 	} else if (likely(!(i->type & ITER_PIPE)))
771d879cb83SAl Viro 		return copy_page_to_iter_iovec(page, offset, bytes, i);
772241699cdSAl Viro 	else
773241699cdSAl Viro 		return copy_page_to_iter_pipe(page, offset, bytes, i);
774d879cb83SAl Viro }
775d879cb83SAl Viro EXPORT_SYMBOL(copy_page_to_iter);
776d879cb83SAl Viro 
777d879cb83SAl Viro size_t copy_page_from_iter(struct page *page, size_t offset, size_t bytes,
778d879cb83SAl Viro 			 struct iov_iter *i)
779d879cb83SAl Viro {
78072e809edSAl Viro 	if (unlikely(!page_copy_sane(page, offset, bytes)))
78172e809edSAl Viro 		return 0;
782241699cdSAl Viro 	if (unlikely(i->type & ITER_PIPE)) {
783241699cdSAl Viro 		WARN_ON(1);
784241699cdSAl Viro 		return 0;
785241699cdSAl Viro 	}
786d879cb83SAl Viro 	if (i->type & (ITER_BVEC|ITER_KVEC)) {
787d879cb83SAl Viro 		void *kaddr = kmap_atomic(page);
788aa28de27SAl Viro 		size_t wanted = _copy_from_iter(kaddr + offset, bytes, i);
789d879cb83SAl Viro 		kunmap_atomic(kaddr);
790d879cb83SAl Viro 		return wanted;
791d879cb83SAl Viro 	} else
792d879cb83SAl Viro 		return copy_page_from_iter_iovec(page, offset, bytes, i);
793d879cb83SAl Viro }
794d879cb83SAl Viro EXPORT_SYMBOL(copy_page_from_iter);
795d879cb83SAl Viro 
796241699cdSAl Viro static size_t pipe_zero(size_t bytes, struct iov_iter *i)
797241699cdSAl Viro {
798241699cdSAl Viro 	struct pipe_inode_info *pipe = i->pipe;
799241699cdSAl Viro 	size_t n, off;
800241699cdSAl Viro 	int idx;
801241699cdSAl Viro 
802241699cdSAl Viro 	if (!sanity(i))
803241699cdSAl Viro 		return 0;
804241699cdSAl Viro 
805241699cdSAl Viro 	bytes = n = push_pipe(i, bytes, &idx, &off);
806241699cdSAl Viro 	if (unlikely(!n))
807241699cdSAl Viro 		return 0;
808241699cdSAl Viro 
809241699cdSAl Viro 	for ( ; n; idx = next_idx(idx, pipe), off = 0) {
810241699cdSAl Viro 		size_t chunk = min_t(size_t, n, PAGE_SIZE - off);
811241699cdSAl Viro 		memzero_page(pipe->bufs[idx].page, off, chunk);
812241699cdSAl Viro 		i->idx = idx;
813241699cdSAl Viro 		i->iov_offset = off + chunk;
814241699cdSAl Viro 		n -= chunk;
815241699cdSAl Viro 	}
816241699cdSAl Viro 	i->count -= bytes;
817241699cdSAl Viro 	return bytes;
818241699cdSAl Viro }
819241699cdSAl Viro 
820d879cb83SAl Viro size_t iov_iter_zero(size_t bytes, struct iov_iter *i)
821d879cb83SAl Viro {
822241699cdSAl Viro 	if (unlikely(i->type & ITER_PIPE))
823241699cdSAl Viro 		return pipe_zero(bytes, i);
824d879cb83SAl Viro 	iterate_and_advance(i, bytes, v,
82509fc68dcSAl Viro 		clear_user(v.iov_base, v.iov_len),
826d879cb83SAl Viro 		memzero_page(v.bv_page, v.bv_offset, v.bv_len),
827d879cb83SAl Viro 		memset(v.iov_base, 0, v.iov_len)
828d879cb83SAl Viro 	)
829d879cb83SAl Viro 
830d879cb83SAl Viro 	return bytes;
831d879cb83SAl Viro }
832d879cb83SAl Viro EXPORT_SYMBOL(iov_iter_zero);
833d879cb83SAl Viro 
834d879cb83SAl Viro size_t iov_iter_copy_from_user_atomic(struct page *page,
835d879cb83SAl Viro 		struct iov_iter *i, unsigned long offset, size_t bytes)
836d879cb83SAl Viro {
837d879cb83SAl Viro 	char *kaddr = kmap_atomic(page), *p = kaddr + offset;
83872e809edSAl Viro 	if (unlikely(!page_copy_sane(page, offset, bytes))) {
83972e809edSAl Viro 		kunmap_atomic(kaddr);
84072e809edSAl Viro 		return 0;
84172e809edSAl Viro 	}
842241699cdSAl Viro 	if (unlikely(i->type & ITER_PIPE)) {
843241699cdSAl Viro 		kunmap_atomic(kaddr);
844241699cdSAl Viro 		WARN_ON(1);
845241699cdSAl Viro 		return 0;
846241699cdSAl Viro 	}
847d879cb83SAl Viro 	iterate_all_kinds(i, bytes, v,
84809fc68dcSAl Viro 		copyin((p += v.iov_len) - v.iov_len, v.iov_base, v.iov_len),
849d879cb83SAl Viro 		memcpy_from_page((p += v.bv_len) - v.bv_len, v.bv_page,
850d879cb83SAl Viro 				 v.bv_offset, v.bv_len),
851d879cb83SAl Viro 		memcpy((p += v.iov_len) - v.iov_len, v.iov_base, v.iov_len)
852d879cb83SAl Viro 	)
853d879cb83SAl Viro 	kunmap_atomic(kaddr);
854d879cb83SAl Viro 	return bytes;
855d879cb83SAl Viro }
856d879cb83SAl Viro EXPORT_SYMBOL(iov_iter_copy_from_user_atomic);
857d879cb83SAl Viro 
858b9dc6f65SAl Viro static inline void pipe_truncate(struct iov_iter *i)
859241699cdSAl Viro {
860241699cdSAl Viro 	struct pipe_inode_info *pipe = i->pipe;
861241699cdSAl Viro 	if (pipe->nrbufs) {
862b9dc6f65SAl Viro 		size_t off = i->iov_offset;
863b9dc6f65SAl Viro 		int idx = i->idx;
864b9dc6f65SAl Viro 		int nrbufs = (idx - pipe->curbuf) & (pipe->buffers - 1);
865b9dc6f65SAl Viro 		if (off) {
866b9dc6f65SAl Viro 			pipe->bufs[idx].len = off - pipe->bufs[idx].offset;
867b9dc6f65SAl Viro 			idx = next_idx(idx, pipe);
868b9dc6f65SAl Viro 			nrbufs++;
869b9dc6f65SAl Viro 		}
870b9dc6f65SAl Viro 		while (pipe->nrbufs > nrbufs) {
871a779638cSMiklos Szeredi 			pipe_buf_release(pipe, &pipe->bufs[idx]);
872241699cdSAl Viro 			idx = next_idx(idx, pipe);
873241699cdSAl Viro 			pipe->nrbufs--;
874241699cdSAl Viro 		}
875241699cdSAl Viro 	}
876b9dc6f65SAl Viro }
877b9dc6f65SAl Viro 
878b9dc6f65SAl Viro static void pipe_advance(struct iov_iter *i, size_t size)
879b9dc6f65SAl Viro {
880b9dc6f65SAl Viro 	struct pipe_inode_info *pipe = i->pipe;
881b9dc6f65SAl Viro 	if (unlikely(i->count < size))
882b9dc6f65SAl Viro 		size = i->count;
883b9dc6f65SAl Viro 	if (size) {
884b9dc6f65SAl Viro 		struct pipe_buffer *buf;
885b9dc6f65SAl Viro 		size_t off = i->iov_offset, left = size;
886b9dc6f65SAl Viro 		int idx = i->idx;
887b9dc6f65SAl Viro 		if (off) /* make it relative to the beginning of buffer */
888b9dc6f65SAl Viro 			left += off - pipe->bufs[idx].offset;
889b9dc6f65SAl Viro 		while (1) {
890b9dc6f65SAl Viro 			buf = &pipe->bufs[idx];
891b9dc6f65SAl Viro 			if (left <= buf->len)
892b9dc6f65SAl Viro 				break;
893b9dc6f65SAl Viro 			left -= buf->len;
894b9dc6f65SAl Viro 			idx = next_idx(idx, pipe);
895b9dc6f65SAl Viro 		}
896b9dc6f65SAl Viro 		i->idx = idx;
897b9dc6f65SAl Viro 		i->iov_offset = buf->offset + left;
898b9dc6f65SAl Viro 	}
899b9dc6f65SAl Viro 	i->count -= size;
900b9dc6f65SAl Viro 	/* ... and discard everything past that point */
901b9dc6f65SAl Viro 	pipe_truncate(i);
902241699cdSAl Viro }
903241699cdSAl Viro 
904d879cb83SAl Viro void iov_iter_advance(struct iov_iter *i, size_t size)
905d879cb83SAl Viro {
906241699cdSAl Viro 	if (unlikely(i->type & ITER_PIPE)) {
907241699cdSAl Viro 		pipe_advance(i, size);
908241699cdSAl Viro 		return;
909241699cdSAl Viro 	}
910d879cb83SAl Viro 	iterate_and_advance(i, size, v, 0, 0, 0)
911d879cb83SAl Viro }
912d879cb83SAl Viro EXPORT_SYMBOL(iov_iter_advance);
913d879cb83SAl Viro 
91427c0e374SAl Viro void iov_iter_revert(struct iov_iter *i, size_t unroll)
91527c0e374SAl Viro {
91627c0e374SAl Viro 	if (!unroll)
91727c0e374SAl Viro 		return;
9185b47d59aSAl Viro 	if (WARN_ON(unroll > MAX_RW_COUNT))
9195b47d59aSAl Viro 		return;
92027c0e374SAl Viro 	i->count += unroll;
92127c0e374SAl Viro 	if (unlikely(i->type & ITER_PIPE)) {
92227c0e374SAl Viro 		struct pipe_inode_info *pipe = i->pipe;
92327c0e374SAl Viro 		int idx = i->idx;
92427c0e374SAl Viro 		size_t off = i->iov_offset;
92527c0e374SAl Viro 		while (1) {
92627c0e374SAl Viro 			size_t n = off - pipe->bufs[idx].offset;
92727c0e374SAl Viro 			if (unroll < n) {
9284fa55cefSAl Viro 				off -= unroll;
92927c0e374SAl Viro 				break;
93027c0e374SAl Viro 			}
93127c0e374SAl Viro 			unroll -= n;
93227c0e374SAl Viro 			if (!unroll && idx == i->start_idx) {
93327c0e374SAl Viro 				off = 0;
93427c0e374SAl Viro 				break;
93527c0e374SAl Viro 			}
93627c0e374SAl Viro 			if (!idx--)
93727c0e374SAl Viro 				idx = pipe->buffers - 1;
93827c0e374SAl Viro 			off = pipe->bufs[idx].offset + pipe->bufs[idx].len;
93927c0e374SAl Viro 		}
94027c0e374SAl Viro 		i->iov_offset = off;
94127c0e374SAl Viro 		i->idx = idx;
94227c0e374SAl Viro 		pipe_truncate(i);
94327c0e374SAl Viro 		return;
94427c0e374SAl Viro 	}
94527c0e374SAl Viro 	if (unroll <= i->iov_offset) {
94627c0e374SAl Viro 		i->iov_offset -= unroll;
94727c0e374SAl Viro 		return;
94827c0e374SAl Viro 	}
94927c0e374SAl Viro 	unroll -= i->iov_offset;
95027c0e374SAl Viro 	if (i->type & ITER_BVEC) {
95127c0e374SAl Viro 		const struct bio_vec *bvec = i->bvec;
95227c0e374SAl Viro 		while (1) {
95327c0e374SAl Viro 			size_t n = (--bvec)->bv_len;
95427c0e374SAl Viro 			i->nr_segs++;
95527c0e374SAl Viro 			if (unroll <= n) {
95627c0e374SAl Viro 				i->bvec = bvec;
95727c0e374SAl Viro 				i->iov_offset = n - unroll;
95827c0e374SAl Viro 				return;
95927c0e374SAl Viro 			}
96027c0e374SAl Viro 			unroll -= n;
96127c0e374SAl Viro 		}
96227c0e374SAl Viro 	} else { /* same logics for iovec and kvec */
96327c0e374SAl Viro 		const struct iovec *iov = i->iov;
96427c0e374SAl Viro 		while (1) {
96527c0e374SAl Viro 			size_t n = (--iov)->iov_len;
96627c0e374SAl Viro 			i->nr_segs++;
96727c0e374SAl Viro 			if (unroll <= n) {
96827c0e374SAl Viro 				i->iov = iov;
96927c0e374SAl Viro 				i->iov_offset = n - unroll;
97027c0e374SAl Viro 				return;
97127c0e374SAl Viro 			}
97227c0e374SAl Viro 			unroll -= n;
97327c0e374SAl Viro 		}
97427c0e374SAl Viro 	}
97527c0e374SAl Viro }
97627c0e374SAl Viro EXPORT_SYMBOL(iov_iter_revert);
97727c0e374SAl Viro 
978d879cb83SAl Viro /*
979d879cb83SAl Viro  * Return the count of just the current iov_iter segment.
980d879cb83SAl Viro  */
981d879cb83SAl Viro size_t iov_iter_single_seg_count(const struct iov_iter *i)
982d879cb83SAl Viro {
983241699cdSAl Viro 	if (unlikely(i->type & ITER_PIPE))
984241699cdSAl Viro 		return i->count;	// it is a silly place, anyway
985d879cb83SAl Viro 	if (i->nr_segs == 1)
986d879cb83SAl Viro 		return i->count;
987d879cb83SAl Viro 	else if (i->type & ITER_BVEC)
988d879cb83SAl Viro 		return min(i->count, i->bvec->bv_len - i->iov_offset);
989d879cb83SAl Viro 	else
990d879cb83SAl Viro 		return min(i->count, i->iov->iov_len - i->iov_offset);
991d879cb83SAl Viro }
992d879cb83SAl Viro EXPORT_SYMBOL(iov_iter_single_seg_count);
993d879cb83SAl Viro 
994d879cb83SAl Viro void iov_iter_kvec(struct iov_iter *i, int direction,
995d879cb83SAl Viro 			const struct kvec *kvec, unsigned long nr_segs,
996d879cb83SAl Viro 			size_t count)
997d879cb83SAl Viro {
998d879cb83SAl Viro 	BUG_ON(!(direction & ITER_KVEC));
999d879cb83SAl Viro 	i->type = direction;
1000d879cb83SAl Viro 	i->kvec = kvec;
1001d879cb83SAl Viro 	i->nr_segs = nr_segs;
1002d879cb83SAl Viro 	i->iov_offset = 0;
1003d879cb83SAl Viro 	i->count = count;
1004d879cb83SAl Viro }
1005d879cb83SAl Viro EXPORT_SYMBOL(iov_iter_kvec);
1006d879cb83SAl Viro 
1007d879cb83SAl Viro void iov_iter_bvec(struct iov_iter *i, int direction,
1008d879cb83SAl Viro 			const struct bio_vec *bvec, unsigned long nr_segs,
1009d879cb83SAl Viro 			size_t count)
1010d879cb83SAl Viro {
1011d879cb83SAl Viro 	BUG_ON(!(direction & ITER_BVEC));
1012d879cb83SAl Viro 	i->type = direction;
1013d879cb83SAl Viro 	i->bvec = bvec;
1014d879cb83SAl Viro 	i->nr_segs = nr_segs;
1015d879cb83SAl Viro 	i->iov_offset = 0;
1016d879cb83SAl Viro 	i->count = count;
1017d879cb83SAl Viro }
1018d879cb83SAl Viro EXPORT_SYMBOL(iov_iter_bvec);
1019d879cb83SAl Viro 
1020241699cdSAl Viro void iov_iter_pipe(struct iov_iter *i, int direction,
1021241699cdSAl Viro 			struct pipe_inode_info *pipe,
1022241699cdSAl Viro 			size_t count)
1023241699cdSAl Viro {
1024241699cdSAl Viro 	BUG_ON(direction != ITER_PIPE);
1025b9dc6f65SAl Viro 	WARN_ON(pipe->nrbufs == pipe->buffers);
1026241699cdSAl Viro 	i->type = direction;
1027241699cdSAl Viro 	i->pipe = pipe;
1028241699cdSAl Viro 	i->idx = (pipe->curbuf + pipe->nrbufs) & (pipe->buffers - 1);
1029241699cdSAl Viro 	i->iov_offset = 0;
1030241699cdSAl Viro 	i->count = count;
103127c0e374SAl Viro 	i->start_idx = i->idx;
1032241699cdSAl Viro }
1033241699cdSAl Viro EXPORT_SYMBOL(iov_iter_pipe);
1034241699cdSAl Viro 
1035d879cb83SAl Viro unsigned long iov_iter_alignment(const struct iov_iter *i)
1036d879cb83SAl Viro {
1037d879cb83SAl Viro 	unsigned long res = 0;
1038d879cb83SAl Viro 	size_t size = i->count;
1039d879cb83SAl Viro 
1040241699cdSAl Viro 	if (unlikely(i->type & ITER_PIPE)) {
104133844e66SAl Viro 		if (size && i->iov_offset && allocated(&i->pipe->bufs[i->idx]))
1042241699cdSAl Viro 			return size | i->iov_offset;
1043241699cdSAl Viro 		return size;
1044241699cdSAl Viro 	}
1045d879cb83SAl Viro 	iterate_all_kinds(i, size, v,
1046d879cb83SAl Viro 		(res |= (unsigned long)v.iov_base | v.iov_len, 0),
1047d879cb83SAl Viro 		res |= v.bv_offset | v.bv_len,
1048d879cb83SAl Viro 		res |= (unsigned long)v.iov_base | v.iov_len
1049d879cb83SAl Viro 	)
1050d879cb83SAl Viro 	return res;
1051d879cb83SAl Viro }
1052d879cb83SAl Viro EXPORT_SYMBOL(iov_iter_alignment);
1053d879cb83SAl Viro 
1054357f435dSAl Viro unsigned long iov_iter_gap_alignment(const struct iov_iter *i)
1055357f435dSAl Viro {
1056357f435dSAl Viro 	unsigned long res = 0;
1057357f435dSAl Viro 	size_t size = i->count;
1058357f435dSAl Viro 
1059241699cdSAl Viro 	if (unlikely(i->type & ITER_PIPE)) {
1060241699cdSAl Viro 		WARN_ON(1);
1061241699cdSAl Viro 		return ~0U;
1062241699cdSAl Viro 	}
1063241699cdSAl Viro 
1064357f435dSAl Viro 	iterate_all_kinds(i, size, v,
1065357f435dSAl Viro 		(res |= (!res ? 0 : (unsigned long)v.iov_base) |
1066357f435dSAl Viro 			(size != v.iov_len ? size : 0), 0),
1067357f435dSAl Viro 		(res |= (!res ? 0 : (unsigned long)v.bv_offset) |
1068357f435dSAl Viro 			(size != v.bv_len ? size : 0)),
1069357f435dSAl Viro 		(res |= (!res ? 0 : (unsigned long)v.iov_base) |
1070357f435dSAl Viro 			(size != v.iov_len ? size : 0))
1071357f435dSAl Viro 		);
1072357f435dSAl Viro 	return res;
1073357f435dSAl Viro }
1074357f435dSAl Viro EXPORT_SYMBOL(iov_iter_gap_alignment);
1075357f435dSAl Viro 
1076241699cdSAl Viro static inline size_t __pipe_get_pages(struct iov_iter *i,
1077241699cdSAl Viro 				size_t maxsize,
1078241699cdSAl Viro 				struct page **pages,
1079241699cdSAl Viro 				int idx,
1080241699cdSAl Viro 				size_t *start)
1081241699cdSAl Viro {
1082241699cdSAl Viro 	struct pipe_inode_info *pipe = i->pipe;
10831689c73aSAl Viro 	ssize_t n = push_pipe(i, maxsize, &idx, start);
1084241699cdSAl Viro 	if (!n)
1085241699cdSAl Viro 		return -EFAULT;
1086241699cdSAl Viro 
1087241699cdSAl Viro 	maxsize = n;
1088241699cdSAl Viro 	n += *start;
10891689c73aSAl Viro 	while (n > 0) {
1090241699cdSAl Viro 		get_page(*pages++ = pipe->bufs[idx].page);
1091241699cdSAl Viro 		idx = next_idx(idx, pipe);
1092241699cdSAl Viro 		n -= PAGE_SIZE;
1093241699cdSAl Viro 	}
1094241699cdSAl Viro 
1095241699cdSAl Viro 	return maxsize;
1096241699cdSAl Viro }
1097241699cdSAl Viro 
1098241699cdSAl Viro static ssize_t pipe_get_pages(struct iov_iter *i,
1099241699cdSAl Viro 		   struct page **pages, size_t maxsize, unsigned maxpages,
1100241699cdSAl Viro 		   size_t *start)
1101241699cdSAl Viro {
1102241699cdSAl Viro 	unsigned npages;
1103241699cdSAl Viro 	size_t capacity;
1104241699cdSAl Viro 	int idx;
1105241699cdSAl Viro 
110633844e66SAl Viro 	if (!maxsize)
110733844e66SAl Viro 		return 0;
110833844e66SAl Viro 
1109241699cdSAl Viro 	if (!sanity(i))
1110241699cdSAl Viro 		return -EFAULT;
1111241699cdSAl Viro 
1112241699cdSAl Viro 	data_start(i, &idx, start);
1113241699cdSAl Viro 	/* some of this one + all after this one */
1114241699cdSAl Viro 	npages = ((i->pipe->curbuf - idx - 1) & (i->pipe->buffers - 1)) + 1;
1115241699cdSAl Viro 	capacity = min(npages,maxpages) * PAGE_SIZE - *start;
1116241699cdSAl Viro 
1117241699cdSAl Viro 	return __pipe_get_pages(i, min(maxsize, capacity), pages, idx, start);
1118241699cdSAl Viro }
1119241699cdSAl Viro 
1120d879cb83SAl Viro ssize_t iov_iter_get_pages(struct iov_iter *i,
1121d879cb83SAl Viro 		   struct page **pages, size_t maxsize, unsigned maxpages,
1122d879cb83SAl Viro 		   size_t *start)
1123d879cb83SAl Viro {
1124d879cb83SAl Viro 	if (maxsize > i->count)
1125d879cb83SAl Viro 		maxsize = i->count;
1126d879cb83SAl Viro 
1127241699cdSAl Viro 	if (unlikely(i->type & ITER_PIPE))
1128241699cdSAl Viro 		return pipe_get_pages(i, pages, maxsize, maxpages, start);
1129d879cb83SAl Viro 	iterate_all_kinds(i, maxsize, v, ({
1130d879cb83SAl Viro 		unsigned long addr = (unsigned long)v.iov_base;
1131d879cb83SAl Viro 		size_t len = v.iov_len + (*start = addr & (PAGE_SIZE - 1));
1132d879cb83SAl Viro 		int n;
1133d879cb83SAl Viro 		int res;
1134d879cb83SAl Viro 
1135d879cb83SAl Viro 		if (len > maxpages * PAGE_SIZE)
1136d879cb83SAl Viro 			len = maxpages * PAGE_SIZE;
1137d879cb83SAl Viro 		addr &= ~(PAGE_SIZE - 1);
1138d879cb83SAl Viro 		n = DIV_ROUND_UP(len, PAGE_SIZE);
1139d879cb83SAl Viro 		res = get_user_pages_fast(addr, n, (i->type & WRITE) != WRITE, pages);
1140d879cb83SAl Viro 		if (unlikely(res < 0))
1141d879cb83SAl Viro 			return res;
1142d879cb83SAl Viro 		return (res == n ? len : res * PAGE_SIZE) - *start;
1143d879cb83SAl Viro 	0;}),({
1144d879cb83SAl Viro 		/* can't be more than PAGE_SIZE */
1145d879cb83SAl Viro 		*start = v.bv_offset;
1146d879cb83SAl Viro 		get_page(*pages = v.bv_page);
1147d879cb83SAl Viro 		return v.bv_len;
1148d879cb83SAl Viro 	}),({
1149d879cb83SAl Viro 		return -EFAULT;
1150d879cb83SAl Viro 	})
1151d879cb83SAl Viro 	)
1152d879cb83SAl Viro 	return 0;
1153d879cb83SAl Viro }
1154d879cb83SAl Viro EXPORT_SYMBOL(iov_iter_get_pages);
1155d879cb83SAl Viro 
1156d879cb83SAl Viro static struct page **get_pages_array(size_t n)
1157d879cb83SAl Viro {
1158752ade68SMichal Hocko 	return kvmalloc_array(n, sizeof(struct page *), GFP_KERNEL);
1159d879cb83SAl Viro }
1160d879cb83SAl Viro 
1161241699cdSAl Viro static ssize_t pipe_get_pages_alloc(struct iov_iter *i,
1162241699cdSAl Viro 		   struct page ***pages, size_t maxsize,
1163241699cdSAl Viro 		   size_t *start)
1164241699cdSAl Viro {
1165241699cdSAl Viro 	struct page **p;
1166241699cdSAl Viro 	size_t n;
1167241699cdSAl Viro 	int idx;
1168241699cdSAl Viro 	int npages;
1169241699cdSAl Viro 
117033844e66SAl Viro 	if (!maxsize)
117133844e66SAl Viro 		return 0;
117233844e66SAl Viro 
1173241699cdSAl Viro 	if (!sanity(i))
1174241699cdSAl Viro 		return -EFAULT;
1175241699cdSAl Viro 
1176241699cdSAl Viro 	data_start(i, &idx, start);
1177241699cdSAl Viro 	/* some of this one + all after this one */
1178241699cdSAl Viro 	npages = ((i->pipe->curbuf - idx - 1) & (i->pipe->buffers - 1)) + 1;
1179241699cdSAl Viro 	n = npages * PAGE_SIZE - *start;
1180241699cdSAl Viro 	if (maxsize > n)
1181241699cdSAl Viro 		maxsize = n;
1182241699cdSAl Viro 	else
1183241699cdSAl Viro 		npages = DIV_ROUND_UP(maxsize + *start, PAGE_SIZE);
1184241699cdSAl Viro 	p = get_pages_array(npages);
1185241699cdSAl Viro 	if (!p)
1186241699cdSAl Viro 		return -ENOMEM;
1187241699cdSAl Viro 	n = __pipe_get_pages(i, maxsize, p, idx, start);
1188241699cdSAl Viro 	if (n > 0)
1189241699cdSAl Viro 		*pages = p;
1190241699cdSAl Viro 	else
1191241699cdSAl Viro 		kvfree(p);
1192241699cdSAl Viro 	return n;
1193241699cdSAl Viro }
1194241699cdSAl Viro 
1195d879cb83SAl Viro ssize_t iov_iter_get_pages_alloc(struct iov_iter *i,
1196d879cb83SAl Viro 		   struct page ***pages, size_t maxsize,
1197d879cb83SAl Viro 		   size_t *start)
1198d879cb83SAl Viro {
1199d879cb83SAl Viro 	struct page **p;
1200d879cb83SAl Viro 
1201d879cb83SAl Viro 	if (maxsize > i->count)
1202d879cb83SAl Viro 		maxsize = i->count;
1203d879cb83SAl Viro 
1204241699cdSAl Viro 	if (unlikely(i->type & ITER_PIPE))
1205241699cdSAl Viro 		return pipe_get_pages_alloc(i, pages, maxsize, start);
1206d879cb83SAl Viro 	iterate_all_kinds(i, maxsize, v, ({
1207d879cb83SAl Viro 		unsigned long addr = (unsigned long)v.iov_base;
1208d879cb83SAl Viro 		size_t len = v.iov_len + (*start = addr & (PAGE_SIZE - 1));
1209d879cb83SAl Viro 		int n;
1210d879cb83SAl Viro 		int res;
1211d879cb83SAl Viro 
1212d879cb83SAl Viro 		addr &= ~(PAGE_SIZE - 1);
1213d879cb83SAl Viro 		n = DIV_ROUND_UP(len, PAGE_SIZE);
1214d879cb83SAl Viro 		p = get_pages_array(n);
1215d879cb83SAl Viro 		if (!p)
1216d879cb83SAl Viro 			return -ENOMEM;
1217d879cb83SAl Viro 		res = get_user_pages_fast(addr, n, (i->type & WRITE) != WRITE, p);
1218d879cb83SAl Viro 		if (unlikely(res < 0)) {
1219d879cb83SAl Viro 			kvfree(p);
1220d879cb83SAl Viro 			return res;
1221d879cb83SAl Viro 		}
1222d879cb83SAl Viro 		*pages = p;
1223d879cb83SAl Viro 		return (res == n ? len : res * PAGE_SIZE) - *start;
1224d879cb83SAl Viro 	0;}),({
1225d879cb83SAl Viro 		/* can't be more than PAGE_SIZE */
1226d879cb83SAl Viro 		*start = v.bv_offset;
1227d879cb83SAl Viro 		*pages = p = get_pages_array(1);
1228d879cb83SAl Viro 		if (!p)
1229d879cb83SAl Viro 			return -ENOMEM;
1230d879cb83SAl Viro 		get_page(*p = v.bv_page);
1231d879cb83SAl Viro 		return v.bv_len;
1232d879cb83SAl Viro 	}),({
1233d879cb83SAl Viro 		return -EFAULT;
1234d879cb83SAl Viro 	})
1235d879cb83SAl Viro 	)
1236d879cb83SAl Viro 	return 0;
1237d879cb83SAl Viro }
1238d879cb83SAl Viro EXPORT_SYMBOL(iov_iter_get_pages_alloc);
1239d879cb83SAl Viro 
1240d879cb83SAl Viro size_t csum_and_copy_from_iter(void *addr, size_t bytes, __wsum *csum,
1241d879cb83SAl Viro 			       struct iov_iter *i)
1242d879cb83SAl Viro {
1243d879cb83SAl Viro 	char *to = addr;
1244d879cb83SAl Viro 	__wsum sum, next;
1245d879cb83SAl Viro 	size_t off = 0;
1246d879cb83SAl Viro 	sum = *csum;
1247241699cdSAl Viro 	if (unlikely(i->type & ITER_PIPE)) {
1248241699cdSAl Viro 		WARN_ON(1);
1249241699cdSAl Viro 		return 0;
1250241699cdSAl Viro 	}
1251d879cb83SAl Viro 	iterate_and_advance(i, bytes, v, ({
1252d879cb83SAl Viro 		int err = 0;
1253d879cb83SAl Viro 		next = csum_and_copy_from_user(v.iov_base,
1254d879cb83SAl Viro 					       (to += v.iov_len) - v.iov_len,
1255d879cb83SAl Viro 					       v.iov_len, 0, &err);
1256d879cb83SAl Viro 		if (!err) {
1257d879cb83SAl Viro 			sum = csum_block_add(sum, next, off);
1258d879cb83SAl Viro 			off += v.iov_len;
1259d879cb83SAl Viro 		}
1260d879cb83SAl Viro 		err ? v.iov_len : 0;
1261d879cb83SAl Viro 	}), ({
1262d879cb83SAl Viro 		char *p = kmap_atomic(v.bv_page);
1263d879cb83SAl Viro 		next = csum_partial_copy_nocheck(p + v.bv_offset,
1264d879cb83SAl Viro 						 (to += v.bv_len) - v.bv_len,
1265d879cb83SAl Viro 						 v.bv_len, 0);
1266d879cb83SAl Viro 		kunmap_atomic(p);
1267d879cb83SAl Viro 		sum = csum_block_add(sum, next, off);
1268d879cb83SAl Viro 		off += v.bv_len;
1269d879cb83SAl Viro 	}),({
1270d879cb83SAl Viro 		next = csum_partial_copy_nocheck(v.iov_base,
1271d879cb83SAl Viro 						 (to += v.iov_len) - v.iov_len,
1272d879cb83SAl Viro 						 v.iov_len, 0);
1273d879cb83SAl Viro 		sum = csum_block_add(sum, next, off);
1274d879cb83SAl Viro 		off += v.iov_len;
1275d879cb83SAl Viro 	})
1276d879cb83SAl Viro 	)
1277d879cb83SAl Viro 	*csum = sum;
1278d879cb83SAl Viro 	return bytes;
1279d879cb83SAl Viro }
1280d879cb83SAl Viro EXPORT_SYMBOL(csum_and_copy_from_iter);
1281d879cb83SAl Viro 
1282cbbd26b8SAl Viro bool csum_and_copy_from_iter_full(void *addr, size_t bytes, __wsum *csum,
1283cbbd26b8SAl Viro 			       struct iov_iter *i)
1284cbbd26b8SAl Viro {
1285cbbd26b8SAl Viro 	char *to = addr;
1286cbbd26b8SAl Viro 	__wsum sum, next;
1287cbbd26b8SAl Viro 	size_t off = 0;
1288cbbd26b8SAl Viro 	sum = *csum;
1289cbbd26b8SAl Viro 	if (unlikely(i->type & ITER_PIPE)) {
1290cbbd26b8SAl Viro 		WARN_ON(1);
1291cbbd26b8SAl Viro 		return false;
1292cbbd26b8SAl Viro 	}
1293cbbd26b8SAl Viro 	if (unlikely(i->count < bytes))
1294cbbd26b8SAl Viro 		return false;
1295cbbd26b8SAl Viro 	iterate_all_kinds(i, bytes, v, ({
1296cbbd26b8SAl Viro 		int err = 0;
1297cbbd26b8SAl Viro 		next = csum_and_copy_from_user(v.iov_base,
1298cbbd26b8SAl Viro 					       (to += v.iov_len) - v.iov_len,
1299cbbd26b8SAl Viro 					       v.iov_len, 0, &err);
1300cbbd26b8SAl Viro 		if (err)
1301cbbd26b8SAl Viro 			return false;
1302cbbd26b8SAl Viro 		sum = csum_block_add(sum, next, off);
1303cbbd26b8SAl Viro 		off += v.iov_len;
1304cbbd26b8SAl Viro 		0;
1305cbbd26b8SAl Viro 	}), ({
1306cbbd26b8SAl Viro 		char *p = kmap_atomic(v.bv_page);
1307cbbd26b8SAl Viro 		next = csum_partial_copy_nocheck(p + v.bv_offset,
1308cbbd26b8SAl Viro 						 (to += v.bv_len) - v.bv_len,
1309cbbd26b8SAl Viro 						 v.bv_len, 0);
1310cbbd26b8SAl Viro 		kunmap_atomic(p);
1311cbbd26b8SAl Viro 		sum = csum_block_add(sum, next, off);
1312cbbd26b8SAl Viro 		off += v.bv_len;
1313cbbd26b8SAl Viro 	}),({
1314cbbd26b8SAl Viro 		next = csum_partial_copy_nocheck(v.iov_base,
1315cbbd26b8SAl Viro 						 (to += v.iov_len) - v.iov_len,
1316cbbd26b8SAl Viro 						 v.iov_len, 0);
1317cbbd26b8SAl Viro 		sum = csum_block_add(sum, next, off);
1318cbbd26b8SAl Viro 		off += v.iov_len;
1319cbbd26b8SAl Viro 	})
1320cbbd26b8SAl Viro 	)
1321cbbd26b8SAl Viro 	*csum = sum;
1322cbbd26b8SAl Viro 	iov_iter_advance(i, bytes);
1323cbbd26b8SAl Viro 	return true;
1324cbbd26b8SAl Viro }
1325cbbd26b8SAl Viro EXPORT_SYMBOL(csum_and_copy_from_iter_full);
1326cbbd26b8SAl Viro 
132736f7a8a4SAl Viro size_t csum_and_copy_to_iter(const void *addr, size_t bytes, __wsum *csum,
1328d879cb83SAl Viro 			     struct iov_iter *i)
1329d879cb83SAl Viro {
133036f7a8a4SAl Viro 	const char *from = addr;
1331d879cb83SAl Viro 	__wsum sum, next;
1332d879cb83SAl Viro 	size_t off = 0;
1333d879cb83SAl Viro 	sum = *csum;
1334241699cdSAl Viro 	if (unlikely(i->type & ITER_PIPE)) {
1335241699cdSAl Viro 		WARN_ON(1);	/* for now */
1336241699cdSAl Viro 		return 0;
1337241699cdSAl Viro 	}
1338d879cb83SAl Viro 	iterate_and_advance(i, bytes, v, ({
1339d879cb83SAl Viro 		int err = 0;
1340d879cb83SAl Viro 		next = csum_and_copy_to_user((from += v.iov_len) - v.iov_len,
1341d879cb83SAl Viro 					     v.iov_base,
1342d879cb83SAl Viro 					     v.iov_len, 0, &err);
1343d879cb83SAl Viro 		if (!err) {
1344d879cb83SAl Viro 			sum = csum_block_add(sum, next, off);
1345d879cb83SAl Viro 			off += v.iov_len;
1346d879cb83SAl Viro 		}
1347d879cb83SAl Viro 		err ? v.iov_len : 0;
1348d879cb83SAl Viro 	}), ({
1349d879cb83SAl Viro 		char *p = kmap_atomic(v.bv_page);
1350d879cb83SAl Viro 		next = csum_partial_copy_nocheck((from += v.bv_len) - v.bv_len,
1351d879cb83SAl Viro 						 p + v.bv_offset,
1352d879cb83SAl Viro 						 v.bv_len, 0);
1353d879cb83SAl Viro 		kunmap_atomic(p);
1354d879cb83SAl Viro 		sum = csum_block_add(sum, next, off);
1355d879cb83SAl Viro 		off += v.bv_len;
1356d879cb83SAl Viro 	}),({
1357d879cb83SAl Viro 		next = csum_partial_copy_nocheck((from += v.iov_len) - v.iov_len,
1358d879cb83SAl Viro 						 v.iov_base,
1359d879cb83SAl Viro 						 v.iov_len, 0);
1360d879cb83SAl Viro 		sum = csum_block_add(sum, next, off);
1361d879cb83SAl Viro 		off += v.iov_len;
1362d879cb83SAl Viro 	})
1363d879cb83SAl Viro 	)
1364d879cb83SAl Viro 	*csum = sum;
1365d879cb83SAl Viro 	return bytes;
1366d879cb83SAl Viro }
1367d879cb83SAl Viro EXPORT_SYMBOL(csum_and_copy_to_iter);
1368d879cb83SAl Viro 
1369d879cb83SAl Viro int iov_iter_npages(const struct iov_iter *i, int maxpages)
1370d879cb83SAl Viro {
1371d879cb83SAl Viro 	size_t size = i->count;
1372d879cb83SAl Viro 	int npages = 0;
1373d879cb83SAl Viro 
1374d879cb83SAl Viro 	if (!size)
1375d879cb83SAl Viro 		return 0;
1376d879cb83SAl Viro 
1377241699cdSAl Viro 	if (unlikely(i->type & ITER_PIPE)) {
1378241699cdSAl Viro 		struct pipe_inode_info *pipe = i->pipe;
1379241699cdSAl Viro 		size_t off;
1380241699cdSAl Viro 		int idx;
1381241699cdSAl Viro 
1382241699cdSAl Viro 		if (!sanity(i))
1383241699cdSAl Viro 			return 0;
1384241699cdSAl Viro 
1385241699cdSAl Viro 		data_start(i, &idx, &off);
1386241699cdSAl Viro 		/* some of this one + all after this one */
1387241699cdSAl Viro 		npages = ((pipe->curbuf - idx - 1) & (pipe->buffers - 1)) + 1;
1388241699cdSAl Viro 		if (npages >= maxpages)
1389241699cdSAl Viro 			return maxpages;
1390241699cdSAl Viro 	} else iterate_all_kinds(i, size, v, ({
1391d879cb83SAl Viro 		unsigned long p = (unsigned long)v.iov_base;
1392d879cb83SAl Viro 		npages += DIV_ROUND_UP(p + v.iov_len, PAGE_SIZE)
1393d879cb83SAl Viro 			- p / PAGE_SIZE;
1394d879cb83SAl Viro 		if (npages >= maxpages)
1395d879cb83SAl Viro 			return maxpages;
1396d879cb83SAl Viro 	0;}),({
1397d879cb83SAl Viro 		npages++;
1398d879cb83SAl Viro 		if (npages >= maxpages)
1399d879cb83SAl Viro 			return maxpages;
1400d879cb83SAl Viro 	}),({
1401d879cb83SAl Viro 		unsigned long p = (unsigned long)v.iov_base;
1402d879cb83SAl Viro 		npages += DIV_ROUND_UP(p + v.iov_len, PAGE_SIZE)
1403d879cb83SAl Viro 			- p / PAGE_SIZE;
1404d879cb83SAl Viro 		if (npages >= maxpages)
1405d879cb83SAl Viro 			return maxpages;
1406d879cb83SAl Viro 	})
1407d879cb83SAl Viro 	)
1408d879cb83SAl Viro 	return npages;
1409d879cb83SAl Viro }
1410d879cb83SAl Viro EXPORT_SYMBOL(iov_iter_npages);
1411d879cb83SAl Viro 
1412d879cb83SAl Viro const void *dup_iter(struct iov_iter *new, struct iov_iter *old, gfp_t flags)
1413d879cb83SAl Viro {
1414d879cb83SAl Viro 	*new = *old;
1415241699cdSAl Viro 	if (unlikely(new->type & ITER_PIPE)) {
1416241699cdSAl Viro 		WARN_ON(1);
1417241699cdSAl Viro 		return NULL;
1418241699cdSAl Viro 	}
1419d879cb83SAl Viro 	if (new->type & ITER_BVEC)
1420d879cb83SAl Viro 		return new->bvec = kmemdup(new->bvec,
1421d879cb83SAl Viro 				    new->nr_segs * sizeof(struct bio_vec),
1422d879cb83SAl Viro 				    flags);
1423d879cb83SAl Viro 	else
1424d879cb83SAl Viro 		/* iovec and kvec have identical layout */
1425d879cb83SAl Viro 		return new->iov = kmemdup(new->iov,
1426d879cb83SAl Viro 				   new->nr_segs * sizeof(struct iovec),
1427d879cb83SAl Viro 				   flags);
1428d879cb83SAl Viro }
1429d879cb83SAl Viro EXPORT_SYMBOL(dup_iter);
1430bc917be8SAl Viro 
1431ffecee4fSVegard Nossum /**
1432ffecee4fSVegard Nossum  * import_iovec() - Copy an array of &struct iovec from userspace
1433ffecee4fSVegard Nossum  *     into the kernel, check that it is valid, and initialize a new
1434ffecee4fSVegard Nossum  *     &struct iov_iter iterator to access it.
1435ffecee4fSVegard Nossum  *
1436ffecee4fSVegard Nossum  * @type: One of %READ or %WRITE.
1437ffecee4fSVegard Nossum  * @uvector: Pointer to the userspace array.
1438ffecee4fSVegard Nossum  * @nr_segs: Number of elements in userspace array.
1439ffecee4fSVegard Nossum  * @fast_segs: Number of elements in @iov.
1440ffecee4fSVegard Nossum  * @iov: (input and output parameter) Pointer to pointer to (usually small
1441ffecee4fSVegard Nossum  *     on-stack) kernel array.
1442ffecee4fSVegard Nossum  * @i: Pointer to iterator that will be initialized on success.
1443ffecee4fSVegard Nossum  *
1444ffecee4fSVegard Nossum  * If the array pointed to by *@iov is large enough to hold all @nr_segs,
1445ffecee4fSVegard Nossum  * then this function places %NULL in *@iov on return. Otherwise, a new
1446ffecee4fSVegard Nossum  * array will be allocated and the result placed in *@iov. This means that
1447ffecee4fSVegard Nossum  * the caller may call kfree() on *@iov regardless of whether the small
1448ffecee4fSVegard Nossum  * on-stack array was used or not (and regardless of whether this function
1449ffecee4fSVegard Nossum  * returns an error or not).
1450ffecee4fSVegard Nossum  *
1451ffecee4fSVegard Nossum  * Return: 0 on success or negative error code on error.
1452ffecee4fSVegard Nossum  */
1453bc917be8SAl Viro int import_iovec(int type, const struct iovec __user * uvector,
1454bc917be8SAl Viro 		 unsigned nr_segs, unsigned fast_segs,
1455bc917be8SAl Viro 		 struct iovec **iov, struct iov_iter *i)
1456bc917be8SAl Viro {
1457bc917be8SAl Viro 	ssize_t n;
1458bc917be8SAl Viro 	struct iovec *p;
1459bc917be8SAl Viro 	n = rw_copy_check_uvector(type, uvector, nr_segs, fast_segs,
1460bc917be8SAl Viro 				  *iov, &p);
1461bc917be8SAl Viro 	if (n < 0) {
1462bc917be8SAl Viro 		if (p != *iov)
1463bc917be8SAl Viro 			kfree(p);
1464bc917be8SAl Viro 		*iov = NULL;
1465bc917be8SAl Viro 		return n;
1466bc917be8SAl Viro 	}
1467bc917be8SAl Viro 	iov_iter_init(i, type, p, nr_segs, n);
1468bc917be8SAl Viro 	*iov = p == *iov ? NULL : p;
1469bc917be8SAl Viro 	return 0;
1470bc917be8SAl Viro }
1471bc917be8SAl Viro EXPORT_SYMBOL(import_iovec);
1472bc917be8SAl Viro 
#ifdef CONFIG_COMPAT
#include <linux/compat.h>

/*
 * compat_import_iovec - import_iovec() for an array of struct compat_iovec.
 *
 * Same flow as import_iovec(), except that the userspace array is read
 * through compat_rw_copy_check_uvector(). On success the iterator @i is
 * initialized and 0 is returned; on failure the negative value from the
 * helper is returned. In both cases *@iov ends up either NULL or pointing
 * at an array that is not the one the caller passed in.
 */
int compat_import_iovec(int type, const struct compat_iovec __user * uvector,
		 unsigned nr_segs, unsigned fast_segs,
		 struct iovec **iov, struct iov_iter *i)
{
	struct iovec *vec;
	ssize_t total;

	total = compat_rw_copy_check_uvector(type, uvector, nr_segs,
					     fast_segs, *iov, &vec);
	if (total >= 0) {
		iov_iter_init(i, type, vec, nr_segs, total);
		/* Hand back only an array the caller did not supply. */
		*iov = (vec == *iov) ? NULL : vec;
		return 0;
	}

	/* Failure: drop any array that is not the caller's own. */
	if (vec != *iov)
		kfree(vec);
	*iov = NULL;
	return total;
}
#endif
1495bc917be8SAl Viro 
1496bc917be8SAl Viro int import_single_range(int rw, void __user *buf, size_t len,
1497bc917be8SAl Viro 		 struct iovec *iov, struct iov_iter *i)
1498bc917be8SAl Viro {
1499bc917be8SAl Viro 	if (len > MAX_RW_COUNT)
1500bc917be8SAl Viro 		len = MAX_RW_COUNT;
1501bc917be8SAl Viro 	if (unlikely(!access_ok(!rw, buf, len)))
1502bc917be8SAl Viro 		return -EFAULT;
1503bc917be8SAl Viro 
1504bc917be8SAl Viro 	iov->iov_base = buf;
1505bc917be8SAl Viro 	iov->iov_len = len;
1506bc917be8SAl Viro 	iov_iter_init(i, rw, iov, 1, len);
1507bc917be8SAl Viro 	return 0;
1508bc917be8SAl Viro }
1509e1267585SAl Viro EXPORT_SYMBOL(import_single_range);
151009cf698aSAl Viro 
151109cf698aSAl Viro int iov_iter_for_each_range(struct iov_iter *i, size_t bytes,
151209cf698aSAl Viro 			    int (*f)(struct kvec *vec, void *context),
151309cf698aSAl Viro 			    void *context)
151409cf698aSAl Viro {
151509cf698aSAl Viro 	struct kvec w;
151609cf698aSAl Viro 	int err = -EINVAL;
151709cf698aSAl Viro 	if (!bytes)
151809cf698aSAl Viro 		return 0;
151909cf698aSAl Viro 
152009cf698aSAl Viro 	iterate_all_kinds(i, bytes, v, -EINVAL, ({
152109cf698aSAl Viro 		w.iov_base = kmap(v.bv_page) + v.bv_offset;
152209cf698aSAl Viro 		w.iov_len = v.bv_len;
152309cf698aSAl Viro 		err = f(&w, context);
152409cf698aSAl Viro 		kunmap(v.bv_page);
152509cf698aSAl Viro 		err;}), ({
152609cf698aSAl Viro 		w = v;
152709cf698aSAl Viro 		err = f(&w, context);})
152809cf698aSAl Viro 	)
152909cf698aSAl Viro 	return err;
153009cf698aSAl Viro }
153109cf698aSAl Viro EXPORT_SYMBOL(iov_iter_for_each_range);
1532