xref: /openbmc/linux/net/socket.c (revision c0371da6)
11da177e4SLinus Torvalds /*
21da177e4SLinus Torvalds  * NET		An implementation of the SOCKET network access protocol.
31da177e4SLinus Torvalds  *
41da177e4SLinus Torvalds  * Version:	@(#)socket.c	1.1.93	18/02/95
51da177e4SLinus Torvalds  *
61da177e4SLinus Torvalds  * Authors:	Orest Zborowski, <obz@Kodak.COM>
702c30a84SJesper Juhl  *		Ross Biro
81da177e4SLinus Torvalds  *		Fred N. van Kempen, <waltje@uWalt.NL.Mugnet.ORG>
91da177e4SLinus Torvalds  *
101da177e4SLinus Torvalds  * Fixes:
111da177e4SLinus Torvalds  *		Anonymous	:	NOTSOCK/BADF cleanup. Error fix in
121da177e4SLinus Torvalds  *					shutdown()
131da177e4SLinus Torvalds  *		Alan Cox	:	verify_area() fixes
141da177e4SLinus Torvalds  *		Alan Cox	:	Removed DDI
151da177e4SLinus Torvalds  *		Jonathan Kamens	:	SOCK_DGRAM reconnect bug
161da177e4SLinus Torvalds  *		Alan Cox	:	Moved a load of checks to the very
171da177e4SLinus Torvalds  *					top level.
181da177e4SLinus Torvalds  *		Alan Cox	:	Move address structures to/from user
191da177e4SLinus Torvalds  *					mode above the protocol layers.
201da177e4SLinus Torvalds  *		Rob Janssen	:	Allow 0 length sends.
211da177e4SLinus Torvalds  *		Alan Cox	:	Asynchronous I/O support (cribbed from the
221da177e4SLinus Torvalds  *					tty drivers).
231da177e4SLinus Torvalds  *		Niibe Yutaka	:	Asynchronous I/O for writes (4.4BSD style)
241da177e4SLinus Torvalds  *		Jeff Uphoff	:	Made max number of sockets command-line
251da177e4SLinus Torvalds  *					configurable.
261da177e4SLinus Torvalds  *		Matti Aarnio	:	Made the number of sockets dynamic,
271da177e4SLinus Torvalds  *					to be allocated when needed, and mr.
281da177e4SLinus Torvalds  *					Uphoff's max is used as max to be
291da177e4SLinus Torvalds  *					allowed to allocate.
301da177e4SLinus Torvalds  *		Linus		:	Argh. removed all the socket allocation
311da177e4SLinus Torvalds  *					altogether: it's in the inode now.
321da177e4SLinus Torvalds  *		Alan Cox	:	Made sock_alloc()/sock_release() public
331da177e4SLinus Torvalds  *					for NetROM and future kernel nfsd type
341da177e4SLinus Torvalds  *					stuff.
351da177e4SLinus Torvalds  *		Alan Cox	:	sendmsg/recvmsg basics.
361da177e4SLinus Torvalds  *		Tom Dyas	:	Export net symbols.
371da177e4SLinus Torvalds  *		Marcin Dalecki	:	Fixed problems with CONFIG_NET="n".
381da177e4SLinus Torvalds  *		Alan Cox	:	Added thread locking to sys_* calls
391da177e4SLinus Torvalds  *					for sockets. May have errors at the
401da177e4SLinus Torvalds  *					moment.
411da177e4SLinus Torvalds  *		Kevin Buhr	:	Fixed the dumb errors in the above.
421da177e4SLinus Torvalds  *		Andi Kleen	:	Some small cleanups, optimizations,
431da177e4SLinus Torvalds  *					and fixed a copy_from_user() bug.
441da177e4SLinus Torvalds  *		Tigran Aivazian	:	sys_send(args) calls sys_sendto(args, NULL, 0)
451da177e4SLinus Torvalds  *		Tigran Aivazian	:	Made listen(2) backlog sanity checks
461da177e4SLinus Torvalds  *					protocol-independent
471da177e4SLinus Torvalds  *
481da177e4SLinus Torvalds  *
491da177e4SLinus Torvalds  *		This program is free software; you can redistribute it and/or
501da177e4SLinus Torvalds  *		modify it under the terms of the GNU General Public License
511da177e4SLinus Torvalds  *		as published by the Free Software Foundation; either version
521da177e4SLinus Torvalds  *		2 of the License, or (at your option) any later version.
531da177e4SLinus Torvalds  *
541da177e4SLinus Torvalds  *
551da177e4SLinus Torvalds  *	This module is effectively the top level interface to the BSD socket
561da177e4SLinus Torvalds  *	paradigm.
571da177e4SLinus Torvalds  *
581da177e4SLinus Torvalds  *	Based upon Swansea University Computer Society NET3.039
591da177e4SLinus Torvalds  */
601da177e4SLinus Torvalds 
611da177e4SLinus Torvalds #include <linux/mm.h>
621da177e4SLinus Torvalds #include <linux/socket.h>
631da177e4SLinus Torvalds #include <linux/file.h>
641da177e4SLinus Torvalds #include <linux/net.h>
651da177e4SLinus Torvalds #include <linux/interrupt.h>
66aaca0bdcSUlrich Drepper #include <linux/thread_info.h>
6755737fdaSStephen Hemminger #include <linux/rcupdate.h>
681da177e4SLinus Torvalds #include <linux/netdevice.h>
691da177e4SLinus Torvalds #include <linux/proc_fs.h>
701da177e4SLinus Torvalds #include <linux/seq_file.h>
714a3e2f71SArjan van de Ven #include <linux/mutex.h>
721da177e4SLinus Torvalds #include <linux/if_bridge.h>
7320380731SArnaldo Carvalho de Melo #include <linux/if_frad.h>
7420380731SArnaldo Carvalho de Melo #include <linux/if_vlan.h>
75408eccceSDaniel Borkmann #include <linux/ptp_classify.h>
761da177e4SLinus Torvalds #include <linux/init.h>
771da177e4SLinus Torvalds #include <linux/poll.h>
781da177e4SLinus Torvalds #include <linux/cache.h>
791da177e4SLinus Torvalds #include <linux/module.h>
801da177e4SLinus Torvalds #include <linux/highmem.h>
811da177e4SLinus Torvalds #include <linux/mount.h>
821da177e4SLinus Torvalds #include <linux/security.h>
831da177e4SLinus Torvalds #include <linux/syscalls.h>
841da177e4SLinus Torvalds #include <linux/compat.h>
851da177e4SLinus Torvalds #include <linux/kmod.h>
863ec3b2fbSDavid Woodhouse #include <linux/audit.h>
87d86b5e0eSAdrian Bunk #include <linux/wireless.h>
881b8d7ae4SEric W. Biederman #include <linux/nsproxy.h>
891fd7317dSNick Black #include <linux/magic.h>
905a0e3ad6STejun Heo #include <linux/slab.h>
91600e1779SMasatake YAMATO #include <linux/xattr.h>
921da177e4SLinus Torvalds 
931da177e4SLinus Torvalds #include <asm/uaccess.h>
941da177e4SLinus Torvalds #include <asm/unistd.h>
951da177e4SLinus Torvalds 
961da177e4SLinus Torvalds #include <net/compat.h>
9787de87d5SDavid S. Miller #include <net/wext.h>
98f8451725SHerbert Xu #include <net/cls_cgroup.h>
991da177e4SLinus Torvalds 
1001da177e4SLinus Torvalds #include <net/sock.h>
1011da177e4SLinus Torvalds #include <linux/netfilter.h>
1021da177e4SLinus Torvalds 
1036b96018bSArnd Bergmann #include <linux/if_tun.h>
1046b96018bSArnd Bergmann #include <linux/ipv6_route.h>
1056b96018bSArnd Bergmann #include <linux/route.h>
1066b96018bSArnd Bergmann #include <linux/sockios.h>
1076b96018bSArnd Bergmann #include <linux/atalk.h>
108076bb0c8SEliezer Tamir #include <net/busy_poll.h>
109f24b9be5SWillem de Bruijn #include <linux/errqueue.h>
11006021292SEliezer Tamir 
111e0d1095aSCong Wang #ifdef CONFIG_NET_RX_BUSY_POLL
11264b0dc51SEliezer Tamir unsigned int sysctl_net_busy_read __read_mostly;
11364b0dc51SEliezer Tamir unsigned int sysctl_net_busy_poll __read_mostly;
11406021292SEliezer Tamir #endif
1156b96018bSArnd Bergmann 
/*
 * Forward declarations for the handlers that are wired into
 * socket_file_ops.
 */

/* .open handler */
static int sock_no_open(struct inode *irrelevant, struct file *dontcare);
/* .aio_read / .aio_write handlers */
static ssize_t sock_aio_read(struct kiocb *iocb, const struct iovec *iov,
			 unsigned long nr_segs, loff_t pos);
static ssize_t sock_aio_write(struct kiocb *iocb, const struct iovec *iov,
			  unsigned long nr_segs, loff_t pos);
/* .mmap handler */
static int sock_mmap(struct file *file, struct vm_area_struct *vma);

/* .release handler */
static int sock_close(struct inode *inode, struct file *file);
/* .poll handler */
static unsigned int sock_poll(struct file *file,
			      struct poll_table_struct *wait);
/* .unlocked_ioctl handler */
static long sock_ioctl(struct file *file, unsigned int cmd, unsigned long arg);
#ifdef CONFIG_COMPAT
/* .compat_ioctl handler, only present on CONFIG_COMPAT builds */
static long compat_sock_ioctl(struct file *file,
			      unsigned int cmd, unsigned long arg);
#endif
/* .fasync handler */
static int sock_fasync(int fd, struct file *filp, int on);
/* .sendpage handler */
static ssize_t sock_sendpage(struct file *file, struct page *page,
			     int offset, size_t size, loff_t *ppos, int more);
/* .splice_read handler */
static ssize_t sock_splice_read(struct file *file, loff_t *ppos,
				struct pipe_inode_info *pipe, size_t len,
				unsigned int flags);
1371da177e4SLinus Torvalds 
1381da177e4SLinus Torvalds /*
1391da177e4SLinus Torvalds  *	Socket files have a set of 'special' operations as well as the generic file ones. These don't appear
1401da177e4SLinus Torvalds  *	in the operation structures but are done directly via the socketcall() multiplexor.
1411da177e4SLinus Torvalds  */
1421da177e4SLinus Torvalds 
143da7071d7SArjan van de Ven static const struct file_operations socket_file_ops = {
1441da177e4SLinus Torvalds 	.owner =	THIS_MODULE,
1451da177e4SLinus Torvalds 	.llseek =	no_llseek,
1461da177e4SLinus Torvalds 	.aio_read =	sock_aio_read,
1471da177e4SLinus Torvalds 	.aio_write =	sock_aio_write,
1481da177e4SLinus Torvalds 	.poll =		sock_poll,
1491da177e4SLinus Torvalds 	.unlocked_ioctl = sock_ioctl,
15089bbfc95SShaun Pereira #ifdef CONFIG_COMPAT
15189bbfc95SShaun Pereira 	.compat_ioctl = compat_sock_ioctl,
15289bbfc95SShaun Pereira #endif
1531da177e4SLinus Torvalds 	.mmap =		sock_mmap,
1541da177e4SLinus Torvalds 	.open =		sock_no_open,	/* special open code to disallow open via /proc */
1551da177e4SLinus Torvalds 	.release =	sock_close,
1561da177e4SLinus Torvalds 	.fasync =	sock_fasync,
1575274f052SJens Axboe 	.sendpage =	sock_sendpage,
1585274f052SJens Axboe 	.splice_write = generic_splice_sendpage,
1599c55e01cSJens Axboe 	.splice_read =	sock_splice_read,
1601da177e4SLinus Torvalds };
1611da177e4SLinus Torvalds 
/*
 *	The protocol list. Each protocol is registered in here.
 *
 *	net_families[] holds one __rcu-annotated pointer per protocol
 *	family number (NPROTO slots).
 *	NOTE(review): net_family_lock presumably serialises updates to
 *	net_families[]; the writers are not defined here - confirm.
 */

static DEFINE_SPINLOCK(net_family_lock);
static const struct net_proto_family __rcu *net_families[NPROTO] __read_mostly;

/*
 *	Statistics counters of the socket lists
 *
 *	sockets_in_use is a per-CPU counter: sock_alloc() adds one to it
 *	and sock_release() subtracts one from it.
 */

static DEFINE_PER_CPU(int, sockets_in_use);
1741da177e4SLinus Torvalds 
1751da177e4SLinus Torvalds /*
17689bddce5SStephen Hemminger  * Support routines.
17789bddce5SStephen Hemminger  * Move socket addresses back and forth across the kernel/user
1781da177e4SLinus Torvalds  * divide and look after the messy bits.
1791da177e4SLinus Torvalds  */
1801da177e4SLinus Torvalds 
1811da177e4SLinus Torvalds /**
1821da177e4SLinus Torvalds  *	move_addr_to_kernel	-	copy a socket address into kernel space
1831da177e4SLinus Torvalds  *	@uaddr: Address in user space
1841da177e4SLinus Torvalds  *	@kaddr: Address in kernel space
1851da177e4SLinus Torvalds  *	@ulen: Length in user space
1861da177e4SLinus Torvalds  *
1871da177e4SLinus Torvalds  *	The address is copied into kernel space. If the provided address is
1881da177e4SLinus Torvalds  *	too long an error code of -EINVAL is returned. If the copy gives
1891da177e4SLinus Torvalds  *	invalid addresses -EFAULT is returned. On a success 0 is returned.
1901da177e4SLinus Torvalds  */
1911da177e4SLinus Torvalds 
19243db362dSMaciej Żenczykowski int move_addr_to_kernel(void __user *uaddr, int ulen, struct sockaddr_storage *kaddr)
1931da177e4SLinus Torvalds {
194230b1839SYOSHIFUJI Hideaki 	if (ulen < 0 || ulen > sizeof(struct sockaddr_storage))
1951da177e4SLinus Torvalds 		return -EINVAL;
1961da177e4SLinus Torvalds 	if (ulen == 0)
1971da177e4SLinus Torvalds 		return 0;
1981da177e4SLinus Torvalds 	if (copy_from_user(kaddr, uaddr, ulen))
1991da177e4SLinus Torvalds 		return -EFAULT;
2003ec3b2fbSDavid Woodhouse 	return audit_sockaddr(ulen, kaddr);
2011da177e4SLinus Torvalds }
2021da177e4SLinus Torvalds 
2031da177e4SLinus Torvalds /**
2041da177e4SLinus Torvalds  *	move_addr_to_user	-	copy an address to user space
2051da177e4SLinus Torvalds  *	@kaddr: kernel space address
2061da177e4SLinus Torvalds  *	@klen: length of address in kernel
2071da177e4SLinus Torvalds  *	@uaddr: user space address
2081da177e4SLinus Torvalds  *	@ulen: pointer to user length field
2091da177e4SLinus Torvalds  *
2101da177e4SLinus Torvalds  *	The value pointed to by ulen on entry is the buffer length available.
2111da177e4SLinus Torvalds  *	This is overwritten with the buffer space used. -EINVAL is returned
2121da177e4SLinus Torvalds  *	if an overlong buffer is specified or a negative buffer size. -EFAULT
2131da177e4SLinus Torvalds  *	is returned if either the buffer or the length field are not
2141da177e4SLinus Torvalds  *	accessible.
2151da177e4SLinus Torvalds  *	After copying the data up to the limit the user specifies, the true
2161da177e4SLinus Torvalds  *	length of the data is written over the length limit the user
2171da177e4SLinus Torvalds  *	specified. Zero is returned for a success.
2181da177e4SLinus Torvalds  */
2191da177e4SLinus Torvalds 
22043db362dSMaciej Żenczykowski static int move_addr_to_user(struct sockaddr_storage *kaddr, int klen,
22111165f14Sstephen hemminger 			     void __user *uaddr, int __user *ulen)
2221da177e4SLinus Torvalds {
2231da177e4SLinus Torvalds 	int err;
2241da177e4SLinus Torvalds 	int len;
2251da177e4SLinus Torvalds 
22668c6beb3SHannes Frederic Sowa 	BUG_ON(klen > sizeof(struct sockaddr_storage));
22789bddce5SStephen Hemminger 	err = get_user(len, ulen);
22889bddce5SStephen Hemminger 	if (err)
2291da177e4SLinus Torvalds 		return err;
2301da177e4SLinus Torvalds 	if (len > klen)
2311da177e4SLinus Torvalds 		len = klen;
23268c6beb3SHannes Frederic Sowa 	if (len < 0)
2331da177e4SLinus Torvalds 		return -EINVAL;
23489bddce5SStephen Hemminger 	if (len) {
235d6fe3945SSteve Grubb 		if (audit_sockaddr(klen, kaddr))
236d6fe3945SSteve Grubb 			return -ENOMEM;
2371da177e4SLinus Torvalds 		if (copy_to_user(uaddr, kaddr, len))
2381da177e4SLinus Torvalds 			return -EFAULT;
2391da177e4SLinus Torvalds 	}
2401da177e4SLinus Torvalds 	/*
2411da177e4SLinus Torvalds 	 *      "fromlen shall refer to the value before truncation.."
2421da177e4SLinus Torvalds 	 *                      1003.1g
2431da177e4SLinus Torvalds 	 */
2441da177e4SLinus Torvalds 	return __put_user(klen, ulen);
2451da177e4SLinus Torvalds }
2461da177e4SLinus Torvalds 
247e18b890bSChristoph Lameter static struct kmem_cache *sock_inode_cachep __read_mostly;
2481da177e4SLinus Torvalds 
2491da177e4SLinus Torvalds static struct inode *sock_alloc_inode(struct super_block *sb)
2501da177e4SLinus Torvalds {
2511da177e4SLinus Torvalds 	struct socket_alloc *ei;
252eaefd110SEric Dumazet 	struct socket_wq *wq;
25389bddce5SStephen Hemminger 
254e94b1766SChristoph Lameter 	ei = kmem_cache_alloc(sock_inode_cachep, GFP_KERNEL);
2551da177e4SLinus Torvalds 	if (!ei)
2561da177e4SLinus Torvalds 		return NULL;
257eaefd110SEric Dumazet 	wq = kmalloc(sizeof(*wq), GFP_KERNEL);
258eaefd110SEric Dumazet 	if (!wq) {
25943815482SEric Dumazet 		kmem_cache_free(sock_inode_cachep, ei);
26043815482SEric Dumazet 		return NULL;
26143815482SEric Dumazet 	}
262eaefd110SEric Dumazet 	init_waitqueue_head(&wq->wait);
263eaefd110SEric Dumazet 	wq->fasync_list = NULL;
264eaefd110SEric Dumazet 	RCU_INIT_POINTER(ei->socket.wq, wq);
2651da177e4SLinus Torvalds 
2661da177e4SLinus Torvalds 	ei->socket.state = SS_UNCONNECTED;
2671da177e4SLinus Torvalds 	ei->socket.flags = 0;
2681da177e4SLinus Torvalds 	ei->socket.ops = NULL;
2691da177e4SLinus Torvalds 	ei->socket.sk = NULL;
2701da177e4SLinus Torvalds 	ei->socket.file = NULL;
2711da177e4SLinus Torvalds 
2721da177e4SLinus Torvalds 	return &ei->vfs_inode;
2731da177e4SLinus Torvalds }
2741da177e4SLinus Torvalds 
2751da177e4SLinus Torvalds static void sock_destroy_inode(struct inode *inode)
2761da177e4SLinus Torvalds {
27743815482SEric Dumazet 	struct socket_alloc *ei;
278eaefd110SEric Dumazet 	struct socket_wq *wq;
27943815482SEric Dumazet 
28043815482SEric Dumazet 	ei = container_of(inode, struct socket_alloc, vfs_inode);
281eaefd110SEric Dumazet 	wq = rcu_dereference_protected(ei->socket.wq, 1);
28261845220SLai Jiangshan 	kfree_rcu(wq, rcu);
28343815482SEric Dumazet 	kmem_cache_free(sock_inode_cachep, ei);
2841da177e4SLinus Torvalds }
2851da177e4SLinus Torvalds 
28651cc5068SAlexey Dobriyan static void init_once(void *foo)
2871da177e4SLinus Torvalds {
2881da177e4SLinus Torvalds 	struct socket_alloc *ei = (struct socket_alloc *)foo;
2891da177e4SLinus Torvalds 
2901da177e4SLinus Torvalds 	inode_init_once(&ei->vfs_inode);
2911da177e4SLinus Torvalds }
2921da177e4SLinus Torvalds 
2931da177e4SLinus Torvalds static int init_inodecache(void)
2941da177e4SLinus Torvalds {
2951da177e4SLinus Torvalds 	sock_inode_cachep = kmem_cache_create("sock_inode_cache",
2961da177e4SLinus Torvalds 					      sizeof(struct socket_alloc),
29789bddce5SStephen Hemminger 					      0,
29889bddce5SStephen Hemminger 					      (SLAB_HWCACHE_ALIGN |
29989bddce5SStephen Hemminger 					       SLAB_RECLAIM_ACCOUNT |
300fffb60f9SPaul Jackson 					       SLAB_MEM_SPREAD),
30120c2df83SPaul Mundt 					      init_once);
3021da177e4SLinus Torvalds 	if (sock_inode_cachep == NULL)
3031da177e4SLinus Torvalds 		return -ENOMEM;
3041da177e4SLinus Torvalds 	return 0;
3051da177e4SLinus Torvalds }
3061da177e4SLinus Torvalds 
307b87221deSAlexey Dobriyan static const struct super_operations sockfs_ops = {
3081da177e4SLinus Torvalds 	.alloc_inode	= sock_alloc_inode,
3091da177e4SLinus Torvalds 	.destroy_inode	= sock_destroy_inode,
3101da177e4SLinus Torvalds 	.statfs		= simple_statfs,
3111da177e4SLinus Torvalds };
3121da177e4SLinus Torvalds 
313c23fbb6bSEric Dumazet /*
314c23fbb6bSEric Dumazet  * sockfs_dname() is called from d_path().
315c23fbb6bSEric Dumazet  */
316c23fbb6bSEric Dumazet static char *sockfs_dname(struct dentry *dentry, char *buffer, int buflen)
317c23fbb6bSEric Dumazet {
318c23fbb6bSEric Dumazet 	return dynamic_dname(dentry, buffer, buflen, "socket:[%lu]",
319c23fbb6bSEric Dumazet 				dentry->d_inode->i_ino);
320c23fbb6bSEric Dumazet }
321c23fbb6bSEric Dumazet 
3223ba13d17SAl Viro static const struct dentry_operations sockfs_dentry_operations = {
323c23fbb6bSEric Dumazet 	.d_dname  = sockfs_dname,
3241da177e4SLinus Torvalds };
3251da177e4SLinus Torvalds 
326c74a1cbbSAl Viro static struct dentry *sockfs_mount(struct file_system_type *fs_type,
327c74a1cbbSAl Viro 			 int flags, const char *dev_name, void *data)
328c74a1cbbSAl Viro {
329c74a1cbbSAl Viro 	return mount_pseudo(fs_type, "socket:", &sockfs_ops,
330c74a1cbbSAl Viro 		&sockfs_dentry_operations, SOCKFS_MAGIC);
331c74a1cbbSAl Viro }
332c74a1cbbSAl Viro 
333c74a1cbbSAl Viro static struct vfsmount *sock_mnt __read_mostly;
334c74a1cbbSAl Viro 
335c74a1cbbSAl Viro static struct file_system_type sock_fs_type = {
336c74a1cbbSAl Viro 	.name =		"sockfs",
337c74a1cbbSAl Viro 	.mount =	sockfs_mount,
338c74a1cbbSAl Viro 	.kill_sb =	kill_anon_super,
339c74a1cbbSAl Viro };
340c74a1cbbSAl Viro 
3411da177e4SLinus Torvalds /*
3421da177e4SLinus Torvalds  *	Obtains the first available file descriptor and sets it up for use.
3431da177e4SLinus Torvalds  *
34439d8c1b6SDavid S. Miller  *	These functions create file structures and maps them to fd space
34539d8c1b6SDavid S. Miller  *	of the current process. On success it returns file descriptor
3461da177e4SLinus Torvalds  *	and file struct implicitly stored in sock->file.
3471da177e4SLinus Torvalds  *	Note that another thread may close file descriptor before we return
3481da177e4SLinus Torvalds  *	from this function. We use the fact that now we do not refer
3491da177e4SLinus Torvalds  *	to socket after mapping. If one day we will need it, this
3501da177e4SLinus Torvalds  *	function will increment ref. count on file by 1.
3511da177e4SLinus Torvalds  *
3521da177e4SLinus Torvalds  *	In any case returned fd MAY BE not valid!
3531da177e4SLinus Torvalds  *	This race condition is unavoidable
3541da177e4SLinus Torvalds  *	with shared fd spaces, we cannot solve it inside kernel,
3551da177e4SLinus Torvalds  *	but we take care of internal coherence yet.
3561da177e4SLinus Torvalds  */
3571da177e4SLinus Torvalds 
358aab174f0SLinus Torvalds struct file *sock_alloc_file(struct socket *sock, int flags, const char *dname)
3591da177e4SLinus Torvalds {
3607cbe66b6SAl Viro 	struct qstr name = { .name = "" };
3612c48b9c4SAl Viro 	struct path path;
3627cbe66b6SAl Viro 	struct file *file;
3631da177e4SLinus Torvalds 
364600e1779SMasatake YAMATO 	if (dname) {
365600e1779SMasatake YAMATO 		name.name = dname;
366600e1779SMasatake YAMATO 		name.len = strlen(name.name);
367600e1779SMasatake YAMATO 	} else if (sock->sk) {
368600e1779SMasatake YAMATO 		name.name = sock->sk->sk_prot_creator->name;
369600e1779SMasatake YAMATO 		name.len = strlen(name.name);
370600e1779SMasatake YAMATO 	}
3714b936885SNick Piggin 	path.dentry = d_alloc_pseudo(sock_mnt->mnt_sb, &name);
37228407630SAl Viro 	if (unlikely(!path.dentry))
37328407630SAl Viro 		return ERR_PTR(-ENOMEM);
3742c48b9c4SAl Viro 	path.mnt = mntget(sock_mnt);
37539d8c1b6SDavid S. Miller 
3762c48b9c4SAl Viro 	d_instantiate(path.dentry, SOCK_INODE(sock));
377cc3808f8SAl Viro 	SOCK_INODE(sock)->i_fop = &socket_file_ops;
378cc3808f8SAl Viro 
3792c48b9c4SAl Viro 	file = alloc_file(&path, FMODE_READ | FMODE_WRITE,
380cc3808f8SAl Viro 		  &socket_file_ops);
38139b65252SAnatol Pomozov 	if (unlikely(IS_ERR(file))) {
382cc3808f8SAl Viro 		/* drop dentry, keep inode */
3837de9c6eeSAl Viro 		ihold(path.dentry->d_inode);
3842c48b9c4SAl Viro 		path_put(&path);
38539b65252SAnatol Pomozov 		return file;
386cc3808f8SAl Viro 	}
3871da177e4SLinus Torvalds 
3881da177e4SLinus Torvalds 	sock->file = file;
38977d27200SUlrich Drepper 	file->f_flags = O_RDWR | (flags & O_NONBLOCK);
39007dc3f07SBenjamin LaHaise 	file->private_data = sock;
39128407630SAl Viro 	return file;
3921da177e4SLinus Torvalds }
39356b31d1cSAl Viro EXPORT_SYMBOL(sock_alloc_file);
3941da177e4SLinus Torvalds 
39556b31d1cSAl Viro static int sock_map_fd(struct socket *sock, int flags)
39639d8c1b6SDavid S. Miller {
39739d8c1b6SDavid S. Miller 	struct file *newfile;
39828407630SAl Viro 	int fd = get_unused_fd_flags(flags);
39928407630SAl Viro 	if (unlikely(fd < 0))
4001da177e4SLinus Torvalds 		return fd;
4011da177e4SLinus Torvalds 
402aab174f0SLinus Torvalds 	newfile = sock_alloc_file(sock, flags, NULL);
40328407630SAl Viro 	if (likely(!IS_ERR(newfile))) {
4041da177e4SLinus Torvalds 		fd_install(fd, newfile);
4051da177e4SLinus Torvalds 		return fd;
4061da177e4SLinus Torvalds 	}
40728407630SAl Viro 
40828407630SAl Viro 	put_unused_fd(fd);
40928407630SAl Viro 	return PTR_ERR(newfile);
4101da177e4SLinus Torvalds }
4111da177e4SLinus Torvalds 
412406a3c63SJohn Fastabend struct socket *sock_from_file(struct file *file, int *err)
4136cb153caSBenjamin LaHaise {
4146cb153caSBenjamin LaHaise 	if (file->f_op == &socket_file_ops)
4156cb153caSBenjamin LaHaise 		return file->private_data;	/* set in sock_map_fd */
4166cb153caSBenjamin LaHaise 
4176cb153caSBenjamin LaHaise 	*err = -ENOTSOCK;
4186cb153caSBenjamin LaHaise 	return NULL;
4196cb153caSBenjamin LaHaise }
420406a3c63SJohn Fastabend EXPORT_SYMBOL(sock_from_file);
4216cb153caSBenjamin LaHaise 
/**
 *	sockfd_lookup - Go from a file number to its socket slot
 *	@fd: file handle
 *	@err: pointer to an error code return
 *
 *	A reference is taken on the file behind @fd and the socket it is
 *	bound to is returned. If an error occurs the err pointer is
 *	overwritten with a negative errno code and NULL is returned: -EBADF
 *	for an invalid handle, -ENOTSOCK for a handle which is not a socket.
 *	The file reference is dropped again in the error case.
 *
 *	On a success the socket object pointer is returned and the file
 *	reference is kept.
 */

struct socket *sockfd_lookup(int fd, int *err)
{
	struct socket *sock;
	struct file *file = fget(fd);

	if (!file) {
		*err = -EBADF;
		return NULL;
	}

	sock = sock_from_file(file, err);
	if (sock)
		return sock;

	/* Not a socket: give the reference back. */
	fput(file);
	return NULL;
}
EXPORT_SYMBOL(sockfd_lookup);
4521da177e4SLinus Torvalds 
4536cb153caSBenjamin LaHaise static struct socket *sockfd_lookup_light(int fd, int *err, int *fput_needed)
4546cb153caSBenjamin LaHaise {
45500e188efSAl Viro 	struct fd f = fdget(fd);
4566cb153caSBenjamin LaHaise 	struct socket *sock;
4576cb153caSBenjamin LaHaise 
4583672558cSHua Zhong 	*err = -EBADF;
45900e188efSAl Viro 	if (f.file) {
46000e188efSAl Viro 		sock = sock_from_file(f.file, err);
46100e188efSAl Viro 		if (likely(sock)) {
46200e188efSAl Viro 			*fput_needed = f.flags;
4631da177e4SLinus Torvalds 			return sock;
46400e188efSAl Viro 		}
46500e188efSAl Viro 		fdput(f);
4666cb153caSBenjamin LaHaise 	}
4676cb153caSBenjamin LaHaise 	return NULL;
4681da177e4SLinus Torvalds }
4691da177e4SLinus Torvalds 
470600e1779SMasatake YAMATO #define XATTR_SOCKPROTONAME_SUFFIX "sockprotoname"
471600e1779SMasatake YAMATO #define XATTR_NAME_SOCKPROTONAME (XATTR_SYSTEM_PREFIX XATTR_SOCKPROTONAME_SUFFIX)
472600e1779SMasatake YAMATO #define XATTR_NAME_SOCKPROTONAME_LEN (sizeof(XATTR_NAME_SOCKPROTONAME)-1)
473600e1779SMasatake YAMATO static ssize_t sockfs_getxattr(struct dentry *dentry,
474600e1779SMasatake YAMATO 			       const char *name, void *value, size_t size)
475600e1779SMasatake YAMATO {
476600e1779SMasatake YAMATO 	const char *proto_name;
477600e1779SMasatake YAMATO 	size_t proto_size;
478600e1779SMasatake YAMATO 	int error;
479600e1779SMasatake YAMATO 
480600e1779SMasatake YAMATO 	error = -ENODATA;
481600e1779SMasatake YAMATO 	if (!strncmp(name, XATTR_NAME_SOCKPROTONAME, XATTR_NAME_SOCKPROTONAME_LEN)) {
482600e1779SMasatake YAMATO 		proto_name = dentry->d_name.name;
483600e1779SMasatake YAMATO 		proto_size = strlen(proto_name);
484600e1779SMasatake YAMATO 
485600e1779SMasatake YAMATO 		if (value) {
486600e1779SMasatake YAMATO 			error = -ERANGE;
487600e1779SMasatake YAMATO 			if (proto_size + 1 > size)
488600e1779SMasatake YAMATO 				goto out;
489600e1779SMasatake YAMATO 
490600e1779SMasatake YAMATO 			strncpy(value, proto_name, proto_size + 1);
491600e1779SMasatake YAMATO 		}
492600e1779SMasatake YAMATO 		error = proto_size + 1;
493600e1779SMasatake YAMATO 	}
494600e1779SMasatake YAMATO 
495600e1779SMasatake YAMATO out:
496600e1779SMasatake YAMATO 	return error;
497600e1779SMasatake YAMATO }
498600e1779SMasatake YAMATO 
499600e1779SMasatake YAMATO static ssize_t sockfs_listxattr(struct dentry *dentry, char *buffer,
500600e1779SMasatake YAMATO 				size_t size)
501600e1779SMasatake YAMATO {
502600e1779SMasatake YAMATO 	ssize_t len;
503600e1779SMasatake YAMATO 	ssize_t used = 0;
504600e1779SMasatake YAMATO 
505600e1779SMasatake YAMATO 	len = security_inode_listsecurity(dentry->d_inode, buffer, size);
506600e1779SMasatake YAMATO 	if (len < 0)
507600e1779SMasatake YAMATO 		return len;
508600e1779SMasatake YAMATO 	used += len;
509600e1779SMasatake YAMATO 	if (buffer) {
510600e1779SMasatake YAMATO 		if (size < used)
511600e1779SMasatake YAMATO 			return -ERANGE;
512600e1779SMasatake YAMATO 		buffer += len;
513600e1779SMasatake YAMATO 	}
514600e1779SMasatake YAMATO 
515600e1779SMasatake YAMATO 	len = (XATTR_NAME_SOCKPROTONAME_LEN + 1);
516600e1779SMasatake YAMATO 	used += len;
517600e1779SMasatake YAMATO 	if (buffer) {
518600e1779SMasatake YAMATO 		if (size < used)
519600e1779SMasatake YAMATO 			return -ERANGE;
520600e1779SMasatake YAMATO 		memcpy(buffer, XATTR_NAME_SOCKPROTONAME, len);
521600e1779SMasatake YAMATO 		buffer += len;
522600e1779SMasatake YAMATO 	}
523600e1779SMasatake YAMATO 
524600e1779SMasatake YAMATO 	return used;
525600e1779SMasatake YAMATO }
526600e1779SMasatake YAMATO 
527600e1779SMasatake YAMATO static const struct inode_operations sockfs_inode_ops = {
528600e1779SMasatake YAMATO 	.getxattr = sockfs_getxattr,
529600e1779SMasatake YAMATO 	.listxattr = sockfs_listxattr,
530600e1779SMasatake YAMATO };
531600e1779SMasatake YAMATO 
5321da177e4SLinus Torvalds /**
5331da177e4SLinus Torvalds  *	sock_alloc	-	allocate a socket
5341da177e4SLinus Torvalds  *
5351da177e4SLinus Torvalds  *	Allocate a new inode and socket object. The two are bound together
5361da177e4SLinus Torvalds  *	and initialised. The socket is then returned. If we are out of inodes
5371da177e4SLinus Torvalds  *	NULL is returned.
5381da177e4SLinus Torvalds  */
5391da177e4SLinus Torvalds 
5401da177e4SLinus Torvalds static struct socket *sock_alloc(void)
5411da177e4SLinus Torvalds {
5421da177e4SLinus Torvalds 	struct inode *inode;
5431da177e4SLinus Torvalds 	struct socket *sock;
5441da177e4SLinus Torvalds 
545a209dfc7SEric Dumazet 	inode = new_inode_pseudo(sock_mnt->mnt_sb);
5461da177e4SLinus Torvalds 	if (!inode)
5471da177e4SLinus Torvalds 		return NULL;
5481da177e4SLinus Torvalds 
5491da177e4SLinus Torvalds 	sock = SOCKET_I(inode);
5501da177e4SLinus Torvalds 
55129a020d3SEric Dumazet 	kmemcheck_annotate_bitfield(sock, type);
55285fe4025SChristoph Hellwig 	inode->i_ino = get_next_ino();
5531da177e4SLinus Torvalds 	inode->i_mode = S_IFSOCK | S_IRWXUGO;
5548192b0c4SDavid Howells 	inode->i_uid = current_fsuid();
5558192b0c4SDavid Howells 	inode->i_gid = current_fsgid();
556600e1779SMasatake YAMATO 	inode->i_op = &sockfs_inode_ops;
5571da177e4SLinus Torvalds 
55819e8d69cSAlex Shi 	this_cpu_add(sockets_in_use, 1);
5591da177e4SLinus Torvalds 	return sock;
5601da177e4SLinus Torvalds }
5611da177e4SLinus Torvalds 
/*
 *	Open handler for socket inodes. In theory nobody can open such an
 *	inode, but /proc provides a back door. Keep that door shut by
 *	refusing every attempt, otherwise you'll let the creepy crawlies in.
 *
 *	Always returns -ENXIO; neither argument is looked at.
 */

static int sock_no_open(struct inode *irrelevant, struct file *dontcare)
{
	const int refused = -ENXIO;

	return refused;
}
5721da177e4SLinus Torvalds 
5734b6f5d20SArjan van de Ven const struct file_operations bad_sock_fops = {
5741da177e4SLinus Torvalds 	.owner = THIS_MODULE,
5751da177e4SLinus Torvalds 	.open = sock_no_open,
5766038f373SArnd Bergmann 	.llseek = noop_llseek,
5771da177e4SLinus Torvalds };
5781da177e4SLinus Torvalds 
5791da177e4SLinus Torvalds /**
5801da177e4SLinus Torvalds  *	sock_release	-	close a socket
5811da177e4SLinus Torvalds  *	@sock: socket to close
5821da177e4SLinus Torvalds  *
5831da177e4SLinus Torvalds  *	The socket is released from the protocol stack if it has a release
5841da177e4SLinus Torvalds  *	callback, and the inode is then released if the socket is bound to
5851da177e4SLinus Torvalds  *	an inode not a file.
5861da177e4SLinus Torvalds  */
5871da177e4SLinus Torvalds 
5881da177e4SLinus Torvalds void sock_release(struct socket *sock)
5891da177e4SLinus Torvalds {
5901da177e4SLinus Torvalds 	if (sock->ops) {
5911da177e4SLinus Torvalds 		struct module *owner = sock->ops->owner;
5921da177e4SLinus Torvalds 
5931da177e4SLinus Torvalds 		sock->ops->release(sock);
5941da177e4SLinus Torvalds 		sock->ops = NULL;
5951da177e4SLinus Torvalds 		module_put(owner);
5961da177e4SLinus Torvalds 	}
5971da177e4SLinus Torvalds 
598eaefd110SEric Dumazet 	if (rcu_dereference_protected(sock->wq, 1)->fasync_list)
5993410f22eSYang Yingliang 		pr_err("%s: fasync list not empty!\n", __func__);
6001da177e4SLinus Torvalds 
601b09e786bSMikulas Patocka 	if (test_bit(SOCK_EXTERNALLY_ALLOCATED, &sock->flags))
602b09e786bSMikulas Patocka 		return;
603b09e786bSMikulas Patocka 
60419e8d69cSAlex Shi 	this_cpu_sub(sockets_in_use, 1);
6051da177e4SLinus Torvalds 	if (!sock->file) {
6061da177e4SLinus Torvalds 		iput(SOCK_INODE(sock));
6071da177e4SLinus Torvalds 		return;
6081da177e4SLinus Torvalds 	}
6091da177e4SLinus Torvalds 	sock->file = NULL;
6101da177e4SLinus Torvalds }
611c6d409cfSEric Dumazet EXPORT_SYMBOL(sock_release);
6121da177e4SLinus Torvalds 
61367cc0d40SWillem de Bruijn void __sock_tx_timestamp(const struct sock *sk, __u8 *tx_flags)
61420d49473SPatrick Ohly {
615140c55d4SEric Dumazet 	u8 flags = *tx_flags;
616140c55d4SEric Dumazet 
617b9f40e21SWillem de Bruijn 	if (sk->sk_tsflags & SOF_TIMESTAMPING_TX_HARDWARE)
618140c55d4SEric Dumazet 		flags |= SKBTX_HW_TSTAMP;
619140c55d4SEric Dumazet 
620b9f40e21SWillem de Bruijn 	if (sk->sk_tsflags & SOF_TIMESTAMPING_TX_SOFTWARE)
621140c55d4SEric Dumazet 		flags |= SKBTX_SW_TSTAMP;
622140c55d4SEric Dumazet 
623e7fd2885SWillem de Bruijn 	if (sk->sk_tsflags & SOF_TIMESTAMPING_TX_SCHED)
624140c55d4SEric Dumazet 		flags |= SKBTX_SCHED_TSTAMP;
625140c55d4SEric Dumazet 
626e1c8a607SWillem de Bruijn 	if (sk->sk_tsflags & SOF_TIMESTAMPING_TX_ACK)
627140c55d4SEric Dumazet 		flags |= SKBTX_ACK_TSTAMP;
628e7fd2885SWillem de Bruijn 
629140c55d4SEric Dumazet 	*tx_flags = flags;
63020d49473SPatrick Ohly }
63167cc0d40SWillem de Bruijn EXPORT_SYMBOL(__sock_tx_timestamp);
63220d49473SPatrick Ohly 
633228e548eSAnton Blanchard static inline int __sock_sendmsg_nosec(struct kiocb *iocb, struct socket *sock,
6341da177e4SLinus Torvalds 				       struct msghdr *msg, size_t size)
6351da177e4SLinus Torvalds {
6361da177e4SLinus Torvalds 	struct sock_iocb *si = kiocb_to_siocb(iocb);
6371da177e4SLinus Torvalds 
6381da177e4SLinus Torvalds 	si->sock = sock;
6391da177e4SLinus Torvalds 	si->scm = NULL;
6401da177e4SLinus Torvalds 	si->msg = msg;
6411da177e4SLinus Torvalds 	si->size = size;
6421da177e4SLinus Torvalds 
6431da177e4SLinus Torvalds 	return sock->ops->sendmsg(iocb, sock, msg, size);
6441da177e4SLinus Torvalds }
6451da177e4SLinus Torvalds 
646228e548eSAnton Blanchard static inline int __sock_sendmsg(struct kiocb *iocb, struct socket *sock,
647228e548eSAnton Blanchard 				 struct msghdr *msg, size_t size)
648228e548eSAnton Blanchard {
649228e548eSAnton Blanchard 	int err = security_socket_sendmsg(sock, msg, size);
650228e548eSAnton Blanchard 
651228e548eSAnton Blanchard 	return err ?: __sock_sendmsg_nosec(iocb, sock, msg, size);
652228e548eSAnton Blanchard }
653228e548eSAnton Blanchard 
6540cf00c6fSGu Zheng static int do_sock_sendmsg(struct socket *sock, struct msghdr *msg,
6550cf00c6fSGu Zheng 			   size_t size, bool nosec)
6561da177e4SLinus Torvalds {
6571da177e4SLinus Torvalds 	struct kiocb iocb;
6581da177e4SLinus Torvalds 	struct sock_iocb siocb;
6591da177e4SLinus Torvalds 	int ret;
6601da177e4SLinus Torvalds 
6611da177e4SLinus Torvalds 	init_sync_kiocb(&iocb, NULL);
6621da177e4SLinus Torvalds 	iocb.private = &siocb;
6630cf00c6fSGu Zheng 	ret = nosec ? __sock_sendmsg_nosec(&iocb, sock, msg, size) :
6640cf00c6fSGu Zheng 		      __sock_sendmsg(&iocb, sock, msg, size);
6651da177e4SLinus Torvalds 	if (-EIOCBQUEUED == ret)
6661da177e4SLinus Torvalds 		ret = wait_on_sync_kiocb(&iocb);
6671da177e4SLinus Torvalds 	return ret;
6681da177e4SLinus Torvalds }
6690cf00c6fSGu Zheng 
6700cf00c6fSGu Zheng int sock_sendmsg(struct socket *sock, struct msghdr *msg, size_t size)
6710cf00c6fSGu Zheng {
6720cf00c6fSGu Zheng 	return do_sock_sendmsg(sock, msg, size, false);
6730cf00c6fSGu Zheng }
674c6d409cfSEric Dumazet EXPORT_SYMBOL(sock_sendmsg);
6751da177e4SLinus Torvalds 
676894dc24cSEric Dumazet static int sock_sendmsg_nosec(struct socket *sock, struct msghdr *msg, size_t size)
677228e548eSAnton Blanchard {
6780cf00c6fSGu Zheng 	return do_sock_sendmsg(sock, msg, size, true);
679228e548eSAnton Blanchard }
680228e548eSAnton Blanchard 
6811da177e4SLinus Torvalds int kernel_sendmsg(struct socket *sock, struct msghdr *msg,
6821da177e4SLinus Torvalds 		   struct kvec *vec, size_t num, size_t size)
6831da177e4SLinus Torvalds {
6841da177e4SLinus Torvalds 	mm_segment_t oldfs = get_fs();
6851da177e4SLinus Torvalds 	int result;
6861da177e4SLinus Torvalds 
6871da177e4SLinus Torvalds 	set_fs(KERNEL_DS);
6881da177e4SLinus Torvalds 	/*
6891da177e4SLinus Torvalds 	 * the following is safe, since for compiler definitions of kvec and
6901da177e4SLinus Torvalds 	 * iovec are identical, yielding the same in-core layout and alignment
6911da177e4SLinus Torvalds 	 */
692c0371da6SAl Viro 	iov_iter_init(&msg->msg_iter, WRITE, (struct iovec *)vec, num, size);
6931da177e4SLinus Torvalds 	result = sock_sendmsg(sock, msg, size);
6941da177e4SLinus Torvalds 	set_fs(oldfs);
6951da177e4SLinus Torvalds 	return result;
6961da177e4SLinus Torvalds }
697c6d409cfSEric Dumazet EXPORT_SYMBOL(kernel_sendmsg);
6981da177e4SLinus Torvalds 
69992f37fd2SEric Dumazet /*
70092f37fd2SEric Dumazet  * called from sock_recv_timestamp() if sock_flag(sk, SOCK_RCVTSTAMP)
70192f37fd2SEric Dumazet  */
70292f37fd2SEric Dumazet void __sock_recv_timestamp(struct msghdr *msg, struct sock *sk,
70392f37fd2SEric Dumazet 	struct sk_buff *skb)
70492f37fd2SEric Dumazet {
70520d49473SPatrick Ohly 	int need_software_tstamp = sock_flag(sk, SOCK_RCVTSTAMP);
706f24b9be5SWillem de Bruijn 	struct scm_timestamping tss;
70720d49473SPatrick Ohly 	int empty = 1;
70820d49473SPatrick Ohly 	struct skb_shared_hwtstamps *shhwtstamps =
70920d49473SPatrick Ohly 		skb_hwtstamps(skb);
71092f37fd2SEric Dumazet 
71120d49473SPatrick Ohly 	/* Race occurred between timestamp enabling and packet
71220d49473SPatrick Ohly 	   receiving.  Fill in the current time for now. */
71320d49473SPatrick Ohly 	if (need_software_tstamp && skb->tstamp.tv64 == 0)
71420d49473SPatrick Ohly 		__net_timestamp(skb);
71520d49473SPatrick Ohly 
71620d49473SPatrick Ohly 	if (need_software_tstamp) {
71792f37fd2SEric Dumazet 		if (!sock_flag(sk, SOCK_RCVTSTAMPNS)) {
71892f37fd2SEric Dumazet 			struct timeval tv;
71920d49473SPatrick Ohly 			skb_get_timestamp(skb, &tv);
72020d49473SPatrick Ohly 			put_cmsg(msg, SOL_SOCKET, SCM_TIMESTAMP,
72120d49473SPatrick Ohly 				 sizeof(tv), &tv);
72292f37fd2SEric Dumazet 		} else {
723f24b9be5SWillem de Bruijn 			struct timespec ts;
724f24b9be5SWillem de Bruijn 			skb_get_timestampns(skb, &ts);
72520d49473SPatrick Ohly 			put_cmsg(msg, SOL_SOCKET, SCM_TIMESTAMPNS,
726f24b9be5SWillem de Bruijn 				 sizeof(ts), &ts);
72792f37fd2SEric Dumazet 		}
72892f37fd2SEric Dumazet 	}
72992f37fd2SEric Dumazet 
730f24b9be5SWillem de Bruijn 	memset(&tss, 0, sizeof(tss));
731c199105dSWillem de Bruijn 	if ((sk->sk_tsflags & SOF_TIMESTAMPING_SOFTWARE) &&
732f24b9be5SWillem de Bruijn 	    ktime_to_timespec_cond(skb->tstamp, tss.ts + 0))
73320d49473SPatrick Ohly 		empty = 0;
7344d276eb6SWillem de Bruijn 	if (shhwtstamps &&
735b9f40e21SWillem de Bruijn 	    (sk->sk_tsflags & SOF_TIMESTAMPING_RAW_HARDWARE) &&
736f24b9be5SWillem de Bruijn 	    ktime_to_timespec_cond(shhwtstamps->hwtstamp, tss.ts + 2))
73720d49473SPatrick Ohly 		empty = 0;
73820d49473SPatrick Ohly 	if (!empty)
73920d49473SPatrick Ohly 		put_cmsg(msg, SOL_SOCKET,
740f24b9be5SWillem de Bruijn 			 SCM_TIMESTAMPING, sizeof(tss), &tss);
74120d49473SPatrick Ohly }
7427c81fd8bSArnaldo Carvalho de Melo EXPORT_SYMBOL_GPL(__sock_recv_timestamp);
7437c81fd8bSArnaldo Carvalho de Melo 
7446e3e939fSJohannes Berg void __sock_recv_wifi_status(struct msghdr *msg, struct sock *sk,
7456e3e939fSJohannes Berg 	struct sk_buff *skb)
7466e3e939fSJohannes Berg {
7476e3e939fSJohannes Berg 	int ack;
7486e3e939fSJohannes Berg 
7496e3e939fSJohannes Berg 	if (!sock_flag(sk, SOCK_WIFI_STATUS))
7506e3e939fSJohannes Berg 		return;
7516e3e939fSJohannes Berg 	if (!skb->wifi_acked_valid)
7526e3e939fSJohannes Berg 		return;
7536e3e939fSJohannes Berg 
7546e3e939fSJohannes Berg 	ack = skb->wifi_acked;
7556e3e939fSJohannes Berg 
7566e3e939fSJohannes Berg 	put_cmsg(msg, SOL_SOCKET, SCM_WIFI_STATUS, sizeof(ack), &ack);
7576e3e939fSJohannes Berg }
7586e3e939fSJohannes Berg EXPORT_SYMBOL_GPL(__sock_recv_wifi_status);
7596e3e939fSJohannes Berg 
76011165f14Sstephen hemminger static inline void sock_recv_drops(struct msghdr *msg, struct sock *sk,
76111165f14Sstephen hemminger 				   struct sk_buff *skb)
7623b885787SNeil Horman {
7633b885787SNeil Horman 	if (sock_flag(sk, SOCK_RXQ_OVFL) && skb && skb->dropcount)
7643b885787SNeil Horman 		put_cmsg(msg, SOL_SOCKET, SO_RXQ_OVFL,
7653b885787SNeil Horman 			sizeof(__u32), &skb->dropcount);
7663b885787SNeil Horman }
7673b885787SNeil Horman 
/*
 * Add both kinds of receive metadata for @skb to @msg: first the timestamp
 * control messages, then the drop-count control message.
 */
void __sock_recv_ts_and_drops(struct msghdr *msg, struct sock *sk,
	struct sk_buff *skb)
{
	/* Order matters for the layout of the control buffer: keep it. */
	sock_recv_timestamp(msg, sk, skb);
	sock_recv_drops(msg, sk, skb);
}
EXPORT_SYMBOL_GPL(__sock_recv_ts_and_drops);
7753b885787SNeil Horman 
776a2e27255SArnaldo Carvalho de Melo static inline int __sock_recvmsg_nosec(struct kiocb *iocb, struct socket *sock,
7771da177e4SLinus Torvalds 				       struct msghdr *msg, size_t size, int flags)
7781da177e4SLinus Torvalds {
7791da177e4SLinus Torvalds 	struct sock_iocb *si = kiocb_to_siocb(iocb);
7801da177e4SLinus Torvalds 
7811da177e4SLinus Torvalds 	si->sock = sock;
7821da177e4SLinus Torvalds 	si->scm = NULL;
7831da177e4SLinus Torvalds 	si->msg = msg;
7841da177e4SLinus Torvalds 	si->size = size;
7851da177e4SLinus Torvalds 	si->flags = flags;
7861da177e4SLinus Torvalds 
7871da177e4SLinus Torvalds 	return sock->ops->recvmsg(iocb, sock, msg, size, flags);
7881da177e4SLinus Torvalds }
7891da177e4SLinus Torvalds 
790a2e27255SArnaldo Carvalho de Melo static inline int __sock_recvmsg(struct kiocb *iocb, struct socket *sock,
791a2e27255SArnaldo Carvalho de Melo 				 struct msghdr *msg, size_t size, int flags)
792a2e27255SArnaldo Carvalho de Melo {
793a2e27255SArnaldo Carvalho de Melo 	int err = security_socket_recvmsg(sock, msg, size, flags);
794a2e27255SArnaldo Carvalho de Melo 
795a2e27255SArnaldo Carvalho de Melo 	return err ?: __sock_recvmsg_nosec(iocb, sock, msg, size, flags);
796a2e27255SArnaldo Carvalho de Melo }
797a2e27255SArnaldo Carvalho de Melo 
7981da177e4SLinus Torvalds int sock_recvmsg(struct socket *sock, struct msghdr *msg,
7991da177e4SLinus Torvalds 		 size_t size, int flags)
8001da177e4SLinus Torvalds {
8011da177e4SLinus Torvalds 	struct kiocb iocb;
8021da177e4SLinus Torvalds 	struct sock_iocb siocb;
8031da177e4SLinus Torvalds 	int ret;
8041da177e4SLinus Torvalds 
8051da177e4SLinus Torvalds 	init_sync_kiocb(&iocb, NULL);
8061da177e4SLinus Torvalds 	iocb.private = &siocb;
8071da177e4SLinus Torvalds 	ret = __sock_recvmsg(&iocb, sock, msg, size, flags);
8081da177e4SLinus Torvalds 	if (-EIOCBQUEUED == ret)
8091da177e4SLinus Torvalds 		ret = wait_on_sync_kiocb(&iocb);
8101da177e4SLinus Torvalds 	return ret;
8111da177e4SLinus Torvalds }
812c6d409cfSEric Dumazet EXPORT_SYMBOL(sock_recvmsg);
8131da177e4SLinus Torvalds 
814a2e27255SArnaldo Carvalho de Melo static int sock_recvmsg_nosec(struct socket *sock, struct msghdr *msg,
815a2e27255SArnaldo Carvalho de Melo 			      size_t size, int flags)
816a2e27255SArnaldo Carvalho de Melo {
817a2e27255SArnaldo Carvalho de Melo 	struct kiocb iocb;
818a2e27255SArnaldo Carvalho de Melo 	struct sock_iocb siocb;
819a2e27255SArnaldo Carvalho de Melo 	int ret;
820a2e27255SArnaldo Carvalho de Melo 
821a2e27255SArnaldo Carvalho de Melo 	init_sync_kiocb(&iocb, NULL);
822a2e27255SArnaldo Carvalho de Melo 	iocb.private = &siocb;
823a2e27255SArnaldo Carvalho de Melo 	ret = __sock_recvmsg_nosec(&iocb, sock, msg, size, flags);
824a2e27255SArnaldo Carvalho de Melo 	if (-EIOCBQUEUED == ret)
825a2e27255SArnaldo Carvalho de Melo 		ret = wait_on_sync_kiocb(&iocb);
826a2e27255SArnaldo Carvalho de Melo 	return ret;
827a2e27255SArnaldo Carvalho de Melo }
828a2e27255SArnaldo Carvalho de Melo 
829c1249c0aSMartin Lucina /**
830c1249c0aSMartin Lucina  * kernel_recvmsg - Receive a message from a socket (kernel space)
831c1249c0aSMartin Lucina  * @sock:       The socket to receive the message from
832c1249c0aSMartin Lucina  * @msg:        Received message
833c1249c0aSMartin Lucina  * @vec:        Input s/g array for message data
834c1249c0aSMartin Lucina  * @num:        Size of input s/g array
835c1249c0aSMartin Lucina  * @size:       Number of bytes to read
836c1249c0aSMartin Lucina  * @flags:      Message flags (MSG_DONTWAIT, etc...)
837c1249c0aSMartin Lucina  *
838c1249c0aSMartin Lucina  * On return the msg structure contains the scatter/gather array passed in the
839c1249c0aSMartin Lucina  * vec argument. The array is modified so that it consists of the unfilled
840c1249c0aSMartin Lucina  * portion of the original array.
841c1249c0aSMartin Lucina  *
842c1249c0aSMartin Lucina  * The returned value is the total number of bytes received, or an error.
843c1249c0aSMartin Lucina  */
8441da177e4SLinus Torvalds int kernel_recvmsg(struct socket *sock, struct msghdr *msg,
84589bddce5SStephen Hemminger 		   struct kvec *vec, size_t num, size_t size, int flags)
8461da177e4SLinus Torvalds {
8471da177e4SLinus Torvalds 	mm_segment_t oldfs = get_fs();
8481da177e4SLinus Torvalds 	int result;
8491da177e4SLinus Torvalds 
8501da177e4SLinus Torvalds 	set_fs(KERNEL_DS);
8511da177e4SLinus Torvalds 	/*
8521da177e4SLinus Torvalds 	 * the following is safe, since for compiler definitions of kvec and
8531da177e4SLinus Torvalds 	 * iovec are identical, yielding the same in-core layout and alignment
8541da177e4SLinus Torvalds 	 */
855c0371da6SAl Viro 	iov_iter_init(&msg->msg_iter, READ, (struct iovec *)vec, num, size);
8561da177e4SLinus Torvalds 	result = sock_recvmsg(sock, msg, size, flags);
8571da177e4SLinus Torvalds 	set_fs(oldfs);
8581da177e4SLinus Torvalds 	return result;
8591da177e4SLinus Torvalds }
860c6d409cfSEric Dumazet EXPORT_SYMBOL(kernel_recvmsg);
8611da177e4SLinus Torvalds 
86220380731SArnaldo Carvalho de Melo static ssize_t sock_sendpage(struct file *file, struct page *page,
8631da177e4SLinus Torvalds 			     int offset, size_t size, loff_t *ppos, int more)
8641da177e4SLinus Torvalds {
8651da177e4SLinus Torvalds 	struct socket *sock;
8661da177e4SLinus Torvalds 	int flags;
8671da177e4SLinus Torvalds 
868b69aee04SEric Dumazet 	sock = file->private_data;
8691da177e4SLinus Torvalds 
87035f9c09fSEric Dumazet 	flags = (file->f_flags & O_NONBLOCK) ? MSG_DONTWAIT : 0;
87135f9c09fSEric Dumazet 	/* more is a combination of MSG_MORE and MSG_SENDPAGE_NOTLAST */
87235f9c09fSEric Dumazet 	flags |= more;
8731da177e4SLinus Torvalds 
874e6949583SLinus Torvalds 	return kernel_sendpage(sock, page, offset, size, flags);
8751da177e4SLinus Torvalds }
8761da177e4SLinus Torvalds 
8779c55e01cSJens Axboe static ssize_t sock_splice_read(struct file *file, loff_t *ppos,
8789c55e01cSJens Axboe 				struct pipe_inode_info *pipe, size_t len,
8799c55e01cSJens Axboe 				unsigned int flags)
8809c55e01cSJens Axboe {
8819c55e01cSJens Axboe 	struct socket *sock = file->private_data;
8829c55e01cSJens Axboe 
883997b37daSRémi Denis-Courmont 	if (unlikely(!sock->ops->splice_read))
884997b37daSRémi Denis-Courmont 		return -EINVAL;
885997b37daSRémi Denis-Courmont 
8869c55e01cSJens Axboe 	return sock->ops->splice_read(sock, ppos, pipe, len, flags);
8879c55e01cSJens Axboe }
8889c55e01cSJens Axboe 
889ce1d4d3eSChristoph Hellwig static struct sock_iocb *alloc_sock_iocb(struct kiocb *iocb,
89089bddce5SStephen Hemminger 					 struct sock_iocb *siocb)
891ce1d4d3eSChristoph Hellwig {
892d29c445bSKent Overstreet 	if (!is_sync_kiocb(iocb))
893d29c445bSKent Overstreet 		BUG();
894ce1d4d3eSChristoph Hellwig 
895ce1d4d3eSChristoph Hellwig 	siocb->kiocb = iocb;
896ce1d4d3eSChristoph Hellwig 	iocb->private = siocb;
897ce1d4d3eSChristoph Hellwig 	return siocb;
898ce1d4d3eSChristoph Hellwig }
899ce1d4d3eSChristoph Hellwig 
900ce1d4d3eSChristoph Hellwig static ssize_t do_sock_read(struct msghdr *msg, struct kiocb *iocb,
901027445c3SBadari Pulavarty 		struct file *file, const struct iovec *iov,
90289bddce5SStephen Hemminger 		unsigned long nr_segs)
903ce1d4d3eSChristoph Hellwig {
904ce1d4d3eSChristoph Hellwig 	struct socket *sock = file->private_data;
905ce1d4d3eSChristoph Hellwig 	size_t size = 0;
906ce1d4d3eSChristoph Hellwig 	int i;
907ce1d4d3eSChristoph Hellwig 
908ce1d4d3eSChristoph Hellwig 	for (i = 0; i < nr_segs; i++)
909ce1d4d3eSChristoph Hellwig 		size += iov[i].iov_len;
910ce1d4d3eSChristoph Hellwig 
911ce1d4d3eSChristoph Hellwig 	msg->msg_name = NULL;
912ce1d4d3eSChristoph Hellwig 	msg->msg_namelen = 0;
913ce1d4d3eSChristoph Hellwig 	msg->msg_control = NULL;
914ce1d4d3eSChristoph Hellwig 	msg->msg_controllen = 0;
915c0371da6SAl Viro 	iov_iter_init(&msg->msg_iter, READ, iov, nr_segs, size);
916ce1d4d3eSChristoph Hellwig 	msg->msg_flags = (file->f_flags & O_NONBLOCK) ? MSG_DONTWAIT : 0;
917ce1d4d3eSChristoph Hellwig 
918ce1d4d3eSChristoph Hellwig 	return __sock_recvmsg(iocb, sock, msg, size, msg->msg_flags);
919ce1d4d3eSChristoph Hellwig }
920ce1d4d3eSChristoph Hellwig 
921027445c3SBadari Pulavarty static ssize_t sock_aio_read(struct kiocb *iocb, const struct iovec *iov,
922027445c3SBadari Pulavarty 				unsigned long nr_segs, loff_t pos)
923ce1d4d3eSChristoph Hellwig {
924ce1d4d3eSChristoph Hellwig 	struct sock_iocb siocb, *x;
925ce1d4d3eSChristoph Hellwig 
926ce1d4d3eSChristoph Hellwig 	if (pos != 0)
927ce1d4d3eSChristoph Hellwig 		return -ESPIPE;
928027445c3SBadari Pulavarty 
92973a7075eSKent Overstreet 	if (iocb->ki_nbytes == 0)	/* Match SYS5 behaviour */
930ce1d4d3eSChristoph Hellwig 		return 0;
931ce1d4d3eSChristoph Hellwig 
932027445c3SBadari Pulavarty 
933027445c3SBadari Pulavarty 	x = alloc_sock_iocb(iocb, &siocb);
934ce1d4d3eSChristoph Hellwig 	if (!x)
935ce1d4d3eSChristoph Hellwig 		return -ENOMEM;
936027445c3SBadari Pulavarty 	return do_sock_read(&x->async_msg, iocb, iocb->ki_filp, iov, nr_segs);
937ce1d4d3eSChristoph Hellwig }
938ce1d4d3eSChristoph Hellwig 
939ce1d4d3eSChristoph Hellwig static ssize_t do_sock_write(struct msghdr *msg, struct kiocb *iocb,
940027445c3SBadari Pulavarty 			struct file *file, const struct iovec *iov,
94189bddce5SStephen Hemminger 			unsigned long nr_segs)
942ce1d4d3eSChristoph Hellwig {
943ce1d4d3eSChristoph Hellwig 	struct socket *sock = file->private_data;
944ce1d4d3eSChristoph Hellwig 	size_t size = 0;
945ce1d4d3eSChristoph Hellwig 	int i;
946ce1d4d3eSChristoph Hellwig 
947ce1d4d3eSChristoph Hellwig 	for (i = 0; i < nr_segs; i++)
948ce1d4d3eSChristoph Hellwig 		size += iov[i].iov_len;
949ce1d4d3eSChristoph Hellwig 
950ce1d4d3eSChristoph Hellwig 	msg->msg_name = NULL;
951ce1d4d3eSChristoph Hellwig 	msg->msg_namelen = 0;
952ce1d4d3eSChristoph Hellwig 	msg->msg_control = NULL;
953ce1d4d3eSChristoph Hellwig 	msg->msg_controllen = 0;
954c0371da6SAl Viro 	iov_iter_init(&msg->msg_iter, WRITE, iov, nr_segs, size);
955ce1d4d3eSChristoph Hellwig 	msg->msg_flags = (file->f_flags & O_NONBLOCK) ? MSG_DONTWAIT : 0;
956ce1d4d3eSChristoph Hellwig 	if (sock->type == SOCK_SEQPACKET)
957ce1d4d3eSChristoph Hellwig 		msg->msg_flags |= MSG_EOR;
958ce1d4d3eSChristoph Hellwig 
959ce1d4d3eSChristoph Hellwig 	return __sock_sendmsg(iocb, sock, msg, size);
960ce1d4d3eSChristoph Hellwig }
961ce1d4d3eSChristoph Hellwig 
962027445c3SBadari Pulavarty static ssize_t sock_aio_write(struct kiocb *iocb, const struct iovec *iov,
963027445c3SBadari Pulavarty 			  unsigned long nr_segs, loff_t pos)
9641da177e4SLinus Torvalds {
965ce1d4d3eSChristoph Hellwig 	struct sock_iocb siocb, *x;
9661da177e4SLinus Torvalds 
967ce1d4d3eSChristoph Hellwig 	if (pos != 0)
968ce1d4d3eSChristoph Hellwig 		return -ESPIPE;
969027445c3SBadari Pulavarty 
970027445c3SBadari Pulavarty 	x = alloc_sock_iocb(iocb, &siocb);
971ce1d4d3eSChristoph Hellwig 	if (!x)
972ce1d4d3eSChristoph Hellwig 		return -ENOMEM;
973ce1d4d3eSChristoph Hellwig 
974027445c3SBadari Pulavarty 	return do_sock_write(&x->async_msg, iocb, iocb->ki_filp, iov, nr_segs);
9751da177e4SLinus Torvalds }
9761da177e4SLinus Torvalds 
9771da177e4SLinus Torvalds /*
9781da177e4SLinus Torvalds  * Atomic setting of ioctl hooks to avoid race
9791da177e4SLinus Torvalds  * with module unload.
9801da177e4SLinus Torvalds  */
9811da177e4SLinus Torvalds 
9824a3e2f71SArjan van de Ven static DEFINE_MUTEX(br_ioctl_mutex);
983c6d409cfSEric Dumazet static int (*br_ioctl_hook) (struct net *, unsigned int cmd, void __user *arg);
9841da177e4SLinus Torvalds 
985881d966bSEric W. Biederman void brioctl_set(int (*hook) (struct net *, unsigned int, void __user *))
9861da177e4SLinus Torvalds {
9874a3e2f71SArjan van de Ven 	mutex_lock(&br_ioctl_mutex);
9881da177e4SLinus Torvalds 	br_ioctl_hook = hook;
9894a3e2f71SArjan van de Ven 	mutex_unlock(&br_ioctl_mutex);
9901da177e4SLinus Torvalds }
9911da177e4SLinus Torvalds EXPORT_SYMBOL(brioctl_set);
9921da177e4SLinus Torvalds 
9934a3e2f71SArjan van de Ven static DEFINE_MUTEX(vlan_ioctl_mutex);
994881d966bSEric W. Biederman static int (*vlan_ioctl_hook) (struct net *, void __user *arg);
9951da177e4SLinus Torvalds 
996881d966bSEric W. Biederman void vlan_ioctl_set(int (*hook) (struct net *, void __user *))
9971da177e4SLinus Torvalds {
9984a3e2f71SArjan van de Ven 	mutex_lock(&vlan_ioctl_mutex);
9991da177e4SLinus Torvalds 	vlan_ioctl_hook = hook;
10004a3e2f71SArjan van de Ven 	mutex_unlock(&vlan_ioctl_mutex);
10011da177e4SLinus Torvalds }
10021da177e4SLinus Torvalds EXPORT_SYMBOL(vlan_ioctl_set);
10031da177e4SLinus Torvalds 
10044a3e2f71SArjan van de Ven static DEFINE_MUTEX(dlci_ioctl_mutex);
10051da177e4SLinus Torvalds static int (*dlci_ioctl_hook) (unsigned int, void __user *);
10061da177e4SLinus Torvalds 
10071da177e4SLinus Torvalds void dlci_ioctl_set(int (*hook) (unsigned int, void __user *))
10081da177e4SLinus Torvalds {
10094a3e2f71SArjan van de Ven 	mutex_lock(&dlci_ioctl_mutex);
10101da177e4SLinus Torvalds 	dlci_ioctl_hook = hook;
10114a3e2f71SArjan van de Ven 	mutex_unlock(&dlci_ioctl_mutex);
10121da177e4SLinus Torvalds }
10131da177e4SLinus Torvalds EXPORT_SYMBOL(dlci_ioctl_set);
10141da177e4SLinus Torvalds 
10156b96018bSArnd Bergmann static long sock_do_ioctl(struct net *net, struct socket *sock,
10166b96018bSArnd Bergmann 				 unsigned int cmd, unsigned long arg)
10176b96018bSArnd Bergmann {
10186b96018bSArnd Bergmann 	int err;
10196b96018bSArnd Bergmann 	void __user *argp = (void __user *)arg;
10206b96018bSArnd Bergmann 
10216b96018bSArnd Bergmann 	err = sock->ops->ioctl(sock, cmd, arg);
10226b96018bSArnd Bergmann 
10236b96018bSArnd Bergmann 	/*
10246b96018bSArnd Bergmann 	 * If this ioctl is unknown try to hand it down
10256b96018bSArnd Bergmann 	 * to the NIC driver.
10266b96018bSArnd Bergmann 	 */
10276b96018bSArnd Bergmann 	if (err == -ENOIOCTLCMD)
10286b96018bSArnd Bergmann 		err = dev_ioctl(net, cmd, argp);
10296b96018bSArnd Bergmann 
10306b96018bSArnd Bergmann 	return err;
10316b96018bSArnd Bergmann }
10326b96018bSArnd Bergmann 
10331da177e4SLinus Torvalds /*
10341da177e4SLinus Torvalds  *	With an ioctl, arg may well be a user mode pointer, but we don't know
10351da177e4SLinus Torvalds  *	what to do with it - that's up to the protocol still.
10361da177e4SLinus Torvalds  */
10371da177e4SLinus Torvalds 
10381da177e4SLinus Torvalds static long sock_ioctl(struct file *file, unsigned cmd, unsigned long arg)
10391da177e4SLinus Torvalds {
10401da177e4SLinus Torvalds 	struct socket *sock;
1041881d966bSEric W. Biederman 	struct sock *sk;
10421da177e4SLinus Torvalds 	void __user *argp = (void __user *)arg;
10431da177e4SLinus Torvalds 	int pid, err;
1044881d966bSEric W. Biederman 	struct net *net;
10451da177e4SLinus Torvalds 
1046b69aee04SEric Dumazet 	sock = file->private_data;
1047881d966bSEric W. Biederman 	sk = sock->sk;
10483b1e0a65SYOSHIFUJI Hideaki 	net = sock_net(sk);
10491da177e4SLinus Torvalds 	if (cmd >= SIOCDEVPRIVATE && cmd <= (SIOCDEVPRIVATE + 15)) {
1050881d966bSEric W. Biederman 		err = dev_ioctl(net, cmd, argp);
10511da177e4SLinus Torvalds 	} else
10523d23e349SJohannes Berg #ifdef CONFIG_WEXT_CORE
10531da177e4SLinus Torvalds 	if (cmd >= SIOCIWFIRST && cmd <= SIOCIWLAST) {
1054881d966bSEric W. Biederman 		err = dev_ioctl(net, cmd, argp);
10551da177e4SLinus Torvalds 	} else
10563d23e349SJohannes Berg #endif
10571da177e4SLinus Torvalds 		switch (cmd) {
10581da177e4SLinus Torvalds 		case FIOSETOWN:
10591da177e4SLinus Torvalds 		case SIOCSPGRP:
10601da177e4SLinus Torvalds 			err = -EFAULT;
10611da177e4SLinus Torvalds 			if (get_user(pid, (int __user *)argp))
10621da177e4SLinus Torvalds 				break;
1063e0b93eddSJeff Layton 			f_setown(sock->file, pid, 1);
1064e0b93eddSJeff Layton 			err = 0;
10651da177e4SLinus Torvalds 			break;
10661da177e4SLinus Torvalds 		case FIOGETOWN:
10671da177e4SLinus Torvalds 		case SIOCGPGRP:
1068609d7fa9SEric W. Biederman 			err = put_user(f_getown(sock->file),
106989bddce5SStephen Hemminger 				       (int __user *)argp);
10701da177e4SLinus Torvalds 			break;
10711da177e4SLinus Torvalds 		case SIOCGIFBR:
10721da177e4SLinus Torvalds 		case SIOCSIFBR:
10731da177e4SLinus Torvalds 		case SIOCBRADDBR:
10741da177e4SLinus Torvalds 		case SIOCBRDELBR:
10751da177e4SLinus Torvalds 			err = -ENOPKG;
10761da177e4SLinus Torvalds 			if (!br_ioctl_hook)
10771da177e4SLinus Torvalds 				request_module("bridge");
10781da177e4SLinus Torvalds 
10794a3e2f71SArjan van de Ven 			mutex_lock(&br_ioctl_mutex);
10801da177e4SLinus Torvalds 			if (br_ioctl_hook)
1081881d966bSEric W. Biederman 				err = br_ioctl_hook(net, cmd, argp);
10824a3e2f71SArjan van de Ven 			mutex_unlock(&br_ioctl_mutex);
10831da177e4SLinus Torvalds 			break;
10841da177e4SLinus Torvalds 		case SIOCGIFVLAN:
10851da177e4SLinus Torvalds 		case SIOCSIFVLAN:
10861da177e4SLinus Torvalds 			err = -ENOPKG;
10871da177e4SLinus Torvalds 			if (!vlan_ioctl_hook)
10881da177e4SLinus Torvalds 				request_module("8021q");
10891da177e4SLinus Torvalds 
10904a3e2f71SArjan van de Ven 			mutex_lock(&vlan_ioctl_mutex);
10911da177e4SLinus Torvalds 			if (vlan_ioctl_hook)
1092881d966bSEric W. Biederman 				err = vlan_ioctl_hook(net, argp);
10934a3e2f71SArjan van de Ven 			mutex_unlock(&vlan_ioctl_mutex);
10941da177e4SLinus Torvalds 			break;
10951da177e4SLinus Torvalds 		case SIOCADDDLCI:
10961da177e4SLinus Torvalds 		case SIOCDELDLCI:
10971da177e4SLinus Torvalds 			err = -ENOPKG;
10981da177e4SLinus Torvalds 			if (!dlci_ioctl_hook)
10991da177e4SLinus Torvalds 				request_module("dlci");
11001da177e4SLinus Torvalds 
11014a3e2f71SArjan van de Ven 			mutex_lock(&dlci_ioctl_mutex);
11027512cbf6SPavel Emelyanov 			if (dlci_ioctl_hook)
11031da177e4SLinus Torvalds 				err = dlci_ioctl_hook(cmd, argp);
11044a3e2f71SArjan van de Ven 			mutex_unlock(&dlci_ioctl_mutex);
11051da177e4SLinus Torvalds 			break;
11061da177e4SLinus Torvalds 		default:
11076b96018bSArnd Bergmann 			err = sock_do_ioctl(net, sock, cmd, arg);
11081da177e4SLinus Torvalds 			break;
11091da177e4SLinus Torvalds 		}
11101da177e4SLinus Torvalds 	return err;
11111da177e4SLinus Torvalds }
11121da177e4SLinus Torvalds 
11131da177e4SLinus Torvalds int sock_create_lite(int family, int type, int protocol, struct socket **res)
11141da177e4SLinus Torvalds {
11151da177e4SLinus Torvalds 	int err;
11161da177e4SLinus Torvalds 	struct socket *sock = NULL;
11171da177e4SLinus Torvalds 
11181da177e4SLinus Torvalds 	err = security_socket_create(family, type, protocol, 1);
11191da177e4SLinus Torvalds 	if (err)
11201da177e4SLinus Torvalds 		goto out;
11211da177e4SLinus Torvalds 
11221da177e4SLinus Torvalds 	sock = sock_alloc();
11231da177e4SLinus Torvalds 	if (!sock) {
11241da177e4SLinus Torvalds 		err = -ENOMEM;
11251da177e4SLinus Torvalds 		goto out;
11261da177e4SLinus Torvalds 	}
11271da177e4SLinus Torvalds 
11281da177e4SLinus Torvalds 	sock->type = type;
11297420ed23SVenkat Yekkirala 	err = security_socket_post_create(sock, family, type, protocol, 1);
11307420ed23SVenkat Yekkirala 	if (err)
11317420ed23SVenkat Yekkirala 		goto out_release;
11327420ed23SVenkat Yekkirala 
11331da177e4SLinus Torvalds out:
11341da177e4SLinus Torvalds 	*res = sock;
11351da177e4SLinus Torvalds 	return err;
11367420ed23SVenkat Yekkirala out_release:
11377420ed23SVenkat Yekkirala 	sock_release(sock);
11387420ed23SVenkat Yekkirala 	sock = NULL;
11397420ed23SVenkat Yekkirala 	goto out;
11401da177e4SLinus Torvalds }
1141c6d409cfSEric Dumazet EXPORT_SYMBOL(sock_create_lite);
11421da177e4SLinus Torvalds 
11431da177e4SLinus Torvalds /* No kernel lock held - perfect */
11441da177e4SLinus Torvalds static unsigned int sock_poll(struct file *file, poll_table *wait)
11451da177e4SLinus Torvalds {
1146cbf55001SEliezer Tamir 	unsigned int busy_flag = 0;
11471da177e4SLinus Torvalds 	struct socket *sock;
11481da177e4SLinus Torvalds 
11491da177e4SLinus Torvalds 	/*
11501da177e4SLinus Torvalds 	 *      We can't return errors to poll, so it's either yes or no.
11511da177e4SLinus Torvalds 	 */
1152b69aee04SEric Dumazet 	sock = file->private_data;
11532d48d67fSEliezer Tamir 
1154cbf55001SEliezer Tamir 	if (sk_can_busy_loop(sock->sk)) {
11552d48d67fSEliezer Tamir 		/* this socket can poll_ll so tell the system call */
1156cbf55001SEliezer Tamir 		busy_flag = POLL_BUSY_LOOP;
11572d48d67fSEliezer Tamir 
11582d48d67fSEliezer Tamir 		/* once, only if requested by syscall */
1159cbf55001SEliezer Tamir 		if (wait && (wait->_key & POLL_BUSY_LOOP))
1160cbf55001SEliezer Tamir 			sk_busy_loop(sock->sk, 1);
11612d48d67fSEliezer Tamir 	}
11622d48d67fSEliezer Tamir 
1163cbf55001SEliezer Tamir 	return busy_flag | sock->ops->poll(file, sock, wait);
11641da177e4SLinus Torvalds }
11651da177e4SLinus Torvalds 
11661da177e4SLinus Torvalds static int sock_mmap(struct file *file, struct vm_area_struct *vma)
11671da177e4SLinus Torvalds {
1168b69aee04SEric Dumazet 	struct socket *sock = file->private_data;
11691da177e4SLinus Torvalds 
11701da177e4SLinus Torvalds 	return sock->ops->mmap(file, sock, vma);
11711da177e4SLinus Torvalds }
11721da177e4SLinus Torvalds 
/*
 * release handler for socket files: releases the socket embedded in
 * @inode.  @filp is not used and the result is always 0.
 */
static int sock_close(struct inode *inode, struct file *filp)
{
	struct socket *sock = SOCKET_I(inode);

	sock_release(sock);
	return 0;
}
11781da177e4SLinus Torvalds 
11791da177e4SLinus Torvalds /*
11801da177e4SLinus Torvalds  *	Update the socket async list
11811da177e4SLinus Torvalds  *
11821da177e4SLinus Torvalds  *	Fasync_list locking strategy.
11831da177e4SLinus Torvalds  *
11841da177e4SLinus Torvalds  *	1. fasync_list is modified only under process context socket lock
11851da177e4SLinus Torvalds  *	   i.e. under semaphore.
11861da177e4SLinus Torvalds  *	2. fasync_list is used under read_lock(&sk->sk_callback_lock)
1187989a2979SEric Dumazet  *	   or under socket lock
11881da177e4SLinus Torvalds  */
11891da177e4SLinus Torvalds 
11901da177e4SLinus Torvalds static int sock_fasync(int fd, struct file *filp, int on)
11911da177e4SLinus Torvalds {
1192989a2979SEric Dumazet 	struct socket *sock = filp->private_data;
1193989a2979SEric Dumazet 	struct sock *sk = sock->sk;
1194eaefd110SEric Dumazet 	struct socket_wq *wq;
11951da177e4SLinus Torvalds 
1196989a2979SEric Dumazet 	if (sk == NULL)
11971da177e4SLinus Torvalds 		return -EINVAL;
11981da177e4SLinus Torvalds 
11991da177e4SLinus Torvalds 	lock_sock(sk);
1200eaefd110SEric Dumazet 	wq = rcu_dereference_protected(sock->wq, sock_owned_by_user(sk));
1201eaefd110SEric Dumazet 	fasync_helper(fd, filp, on, &wq->fasync_list);
12021da177e4SLinus Torvalds 
1203eaefd110SEric Dumazet 	if (!wq->fasync_list)
1204bcdce719SEric Dumazet 		sock_reset_flag(sk, SOCK_FASYNC);
1205989a2979SEric Dumazet 	else
1206989a2979SEric Dumazet 		sock_set_flag(sk, SOCK_FASYNC);
12071da177e4SLinus Torvalds 
1208989a2979SEric Dumazet 	release_sock(sk);
12091da177e4SLinus Torvalds 	return 0;
12101da177e4SLinus Torvalds }
12111da177e4SLinus Torvalds 
121243815482SEric Dumazet /* This function may be called only under socket lock or callback_lock or rcu_lock */
12131da177e4SLinus Torvalds 
12141da177e4SLinus Torvalds int sock_wake_async(struct socket *sock, int how, int band)
12151da177e4SLinus Torvalds {
121643815482SEric Dumazet 	struct socket_wq *wq;
121743815482SEric Dumazet 
121843815482SEric Dumazet 	if (!sock)
12191da177e4SLinus Torvalds 		return -1;
122043815482SEric Dumazet 	rcu_read_lock();
122143815482SEric Dumazet 	wq = rcu_dereference(sock->wq);
122243815482SEric Dumazet 	if (!wq || !wq->fasync_list) {
122343815482SEric Dumazet 		rcu_read_unlock();
122443815482SEric Dumazet 		return -1;
122543815482SEric Dumazet 	}
122689bddce5SStephen Hemminger 	switch (how) {
12278d8ad9d7SPavel Emelyanov 	case SOCK_WAKE_WAITD:
12281da177e4SLinus Torvalds 		if (test_bit(SOCK_ASYNC_WAITDATA, &sock->flags))
12291da177e4SLinus Torvalds 			break;
12301da177e4SLinus Torvalds 		goto call_kill;
12318d8ad9d7SPavel Emelyanov 	case SOCK_WAKE_SPACE:
12321da177e4SLinus Torvalds 		if (!test_and_clear_bit(SOCK_ASYNC_NOSPACE, &sock->flags))
12331da177e4SLinus Torvalds 			break;
12341da177e4SLinus Torvalds 		/* fall through */
12358d8ad9d7SPavel Emelyanov 	case SOCK_WAKE_IO:
12361da177e4SLinus Torvalds call_kill:
123743815482SEric Dumazet 		kill_fasync(&wq->fasync_list, SIGIO, band);
12381da177e4SLinus Torvalds 		break;
12398d8ad9d7SPavel Emelyanov 	case SOCK_WAKE_URG:
124043815482SEric Dumazet 		kill_fasync(&wq->fasync_list, SIGURG, band);
12411da177e4SLinus Torvalds 	}
124243815482SEric Dumazet 	rcu_read_unlock();
12431da177e4SLinus Torvalds 	return 0;
12441da177e4SLinus Torvalds }
1245c6d409cfSEric Dumazet EXPORT_SYMBOL(sock_wake_async);
12461da177e4SLinus Torvalds 
1247721db93aSPavel Emelyanov int __sock_create(struct net *net, int family, int type, int protocol,
124889bddce5SStephen Hemminger 			 struct socket **res, int kern)
12491da177e4SLinus Torvalds {
12501da177e4SLinus Torvalds 	int err;
12511da177e4SLinus Torvalds 	struct socket *sock;
125255737fdaSStephen Hemminger 	const struct net_proto_family *pf;
12531da177e4SLinus Torvalds 
12541da177e4SLinus Torvalds 	/*
12551da177e4SLinus Torvalds 	 *      Check protocol is in range
12561da177e4SLinus Torvalds 	 */
12571da177e4SLinus Torvalds 	if (family < 0 || family >= NPROTO)
12581da177e4SLinus Torvalds 		return -EAFNOSUPPORT;
12591da177e4SLinus Torvalds 	if (type < 0 || type >= SOCK_MAX)
12601da177e4SLinus Torvalds 		return -EINVAL;
12611da177e4SLinus Torvalds 
12621da177e4SLinus Torvalds 	/* Compatibility.
12631da177e4SLinus Torvalds 
12641da177e4SLinus Torvalds 	   This uglymoron is moved from INET layer to here to avoid
12651da177e4SLinus Torvalds 	   deadlock in module load.
12661da177e4SLinus Torvalds 	 */
12671da177e4SLinus Torvalds 	if (family == PF_INET && type == SOCK_PACKET) {
12681da177e4SLinus Torvalds 		static int warned;
12691da177e4SLinus Torvalds 		if (!warned) {
12701da177e4SLinus Torvalds 			warned = 1;
12713410f22eSYang Yingliang 			pr_info("%s uses obsolete (PF_INET,SOCK_PACKET)\n",
127289bddce5SStephen Hemminger 				current->comm);
12731da177e4SLinus Torvalds 		}
12741da177e4SLinus Torvalds 		family = PF_PACKET;
12751da177e4SLinus Torvalds 	}
12761da177e4SLinus Torvalds 
12771da177e4SLinus Torvalds 	err = security_socket_create(family, type, protocol, kern);
12781da177e4SLinus Torvalds 	if (err)
12791da177e4SLinus Torvalds 		return err;
12801da177e4SLinus Torvalds 
128155737fdaSStephen Hemminger 	/*
128255737fdaSStephen Hemminger 	 *	Allocate the socket and allow the family to set things up. if
128355737fdaSStephen Hemminger 	 *	the protocol is 0, the family is instructed to select an appropriate
128455737fdaSStephen Hemminger 	 *	default.
128555737fdaSStephen Hemminger 	 */
128655737fdaSStephen Hemminger 	sock = sock_alloc();
128755737fdaSStephen Hemminger 	if (!sock) {
1288e87cc472SJoe Perches 		net_warn_ratelimited("socket: no more sockets\n");
128955737fdaSStephen Hemminger 		return -ENFILE;	/* Not exactly a match, but its the
129055737fdaSStephen Hemminger 				   closest posix thing */
129155737fdaSStephen Hemminger 	}
129255737fdaSStephen Hemminger 
129355737fdaSStephen Hemminger 	sock->type = type;
129455737fdaSStephen Hemminger 
129595a5afcaSJohannes Berg #ifdef CONFIG_MODULES
12961da177e4SLinus Torvalds 	/* Attempt to load a protocol module if the find failed.
12971da177e4SLinus Torvalds 	 *
12981da177e4SLinus Torvalds 	 * 12/09/1996 Marcin: But! this makes REALLY only sense, if the user
12991da177e4SLinus Torvalds 	 * requested real, full-featured networking support upon configuration.
13001da177e4SLinus Torvalds 	 * Otherwise module support will break!
13011da177e4SLinus Torvalds 	 */
1302190683a9SEric Dumazet 	if (rcu_access_pointer(net_families[family]) == NULL)
13031da177e4SLinus Torvalds 		request_module("net-pf-%d", family);
13041da177e4SLinus Torvalds #endif
13051da177e4SLinus Torvalds 
130655737fdaSStephen Hemminger 	rcu_read_lock();
130755737fdaSStephen Hemminger 	pf = rcu_dereference(net_families[family]);
13081da177e4SLinus Torvalds 	err = -EAFNOSUPPORT;
130955737fdaSStephen Hemminger 	if (!pf)
131055737fdaSStephen Hemminger 		goto out_release;
13111da177e4SLinus Torvalds 
13121da177e4SLinus Torvalds 	/*
13131da177e4SLinus Torvalds 	 * We will call the ->create function, that possibly is in a loadable
13141da177e4SLinus Torvalds 	 * module, so we have to bump that loadable module refcnt first.
13151da177e4SLinus Torvalds 	 */
131655737fdaSStephen Hemminger 	if (!try_module_get(pf->owner))
13171da177e4SLinus Torvalds 		goto out_release;
13181da177e4SLinus Torvalds 
131955737fdaSStephen Hemminger 	/* Now protected by module ref count */
132055737fdaSStephen Hemminger 	rcu_read_unlock();
132155737fdaSStephen Hemminger 
13223f378b68SEric Paris 	err = pf->create(net, sock, protocol, kern);
132355737fdaSStephen Hemminger 	if (err < 0)
13241da177e4SLinus Torvalds 		goto out_module_put;
1325a79af59eSFrank Filz 
13261da177e4SLinus Torvalds 	/*
13271da177e4SLinus Torvalds 	 * Now to bump the refcnt of the [loadable] module that owns this
13281da177e4SLinus Torvalds 	 * socket at sock_release time we decrement its refcnt.
13291da177e4SLinus Torvalds 	 */
133055737fdaSStephen Hemminger 	if (!try_module_get(sock->ops->owner))
133155737fdaSStephen Hemminger 		goto out_module_busy;
133255737fdaSStephen Hemminger 
13331da177e4SLinus Torvalds 	/*
13341da177e4SLinus Torvalds 	 * Now that we're done with the ->create function, the [loadable]
13351da177e4SLinus Torvalds 	 * module can have its refcnt decremented
13361da177e4SLinus Torvalds 	 */
133755737fdaSStephen Hemminger 	module_put(pf->owner);
13387420ed23SVenkat Yekkirala 	err = security_socket_post_create(sock, family, type, protocol, kern);
13397420ed23SVenkat Yekkirala 	if (err)
13403b185525SHerbert Xu 		goto out_sock_release;
134155737fdaSStephen Hemminger 	*res = sock;
13421da177e4SLinus Torvalds 
134355737fdaSStephen Hemminger 	return 0;
134455737fdaSStephen Hemminger 
134555737fdaSStephen Hemminger out_module_busy:
134655737fdaSStephen Hemminger 	err = -EAFNOSUPPORT;
13471da177e4SLinus Torvalds out_module_put:
134855737fdaSStephen Hemminger 	sock->ops = NULL;
134955737fdaSStephen Hemminger 	module_put(pf->owner);
135055737fdaSStephen Hemminger out_sock_release:
13511da177e4SLinus Torvalds 	sock_release(sock);
135255737fdaSStephen Hemminger 	return err;
135355737fdaSStephen Hemminger 
135455737fdaSStephen Hemminger out_release:
135555737fdaSStephen Hemminger 	rcu_read_unlock();
135655737fdaSStephen Hemminger 	goto out_sock_release;
13571da177e4SLinus Torvalds }
1358721db93aSPavel Emelyanov EXPORT_SYMBOL(__sock_create);
13591da177e4SLinus Torvalds 
13601da177e4SLinus Torvalds int sock_create(int family, int type, int protocol, struct socket **res)
13611da177e4SLinus Torvalds {
13621b8d7ae4SEric W. Biederman 	return __sock_create(current->nsproxy->net_ns, family, type, protocol, res, 0);
13631da177e4SLinus Torvalds }
1364c6d409cfSEric Dumazet EXPORT_SYMBOL(sock_create);
13651da177e4SLinus Torvalds 
13661da177e4SLinus Torvalds int sock_create_kern(int family, int type, int protocol, struct socket **res)
13671da177e4SLinus Torvalds {
13681b8d7ae4SEric W. Biederman 	return __sock_create(&init_net, family, type, protocol, res, 1);
13691da177e4SLinus Torvalds }
1370c6d409cfSEric Dumazet EXPORT_SYMBOL(sock_create_kern);
13711da177e4SLinus Torvalds 
13723e0fa65fSHeiko Carstens SYSCALL_DEFINE3(socket, int, family, int, type, int, protocol)
13731da177e4SLinus Torvalds {
13741da177e4SLinus Torvalds 	int retval;
13751da177e4SLinus Torvalds 	struct socket *sock;
1376a677a039SUlrich Drepper 	int flags;
1377a677a039SUlrich Drepper 
1378e38b36f3SUlrich Drepper 	/* Check the SOCK_* constants for consistency.  */
1379e38b36f3SUlrich Drepper 	BUILD_BUG_ON(SOCK_CLOEXEC != O_CLOEXEC);
1380e38b36f3SUlrich Drepper 	BUILD_BUG_ON((SOCK_MAX | SOCK_TYPE_MASK) != SOCK_TYPE_MASK);
1381e38b36f3SUlrich Drepper 	BUILD_BUG_ON(SOCK_CLOEXEC & SOCK_TYPE_MASK);
1382e38b36f3SUlrich Drepper 	BUILD_BUG_ON(SOCK_NONBLOCK & SOCK_TYPE_MASK);
1383e38b36f3SUlrich Drepper 
1384a677a039SUlrich Drepper 	flags = type & ~SOCK_TYPE_MASK;
138577d27200SUlrich Drepper 	if (flags & ~(SOCK_CLOEXEC | SOCK_NONBLOCK))
1386a677a039SUlrich Drepper 		return -EINVAL;
1387a677a039SUlrich Drepper 	type &= SOCK_TYPE_MASK;
13881da177e4SLinus Torvalds 
1389aaca0bdcSUlrich Drepper 	if (SOCK_NONBLOCK != O_NONBLOCK && (flags & SOCK_NONBLOCK))
1390aaca0bdcSUlrich Drepper 		flags = (flags & ~SOCK_NONBLOCK) | O_NONBLOCK;
1391aaca0bdcSUlrich Drepper 
13921da177e4SLinus Torvalds 	retval = sock_create(family, type, protocol, &sock);
13931da177e4SLinus Torvalds 	if (retval < 0)
13941da177e4SLinus Torvalds 		goto out;
13951da177e4SLinus Torvalds 
139677d27200SUlrich Drepper 	retval = sock_map_fd(sock, flags & (O_CLOEXEC | O_NONBLOCK));
13971da177e4SLinus Torvalds 	if (retval < 0)
13981da177e4SLinus Torvalds 		goto out_release;
13991da177e4SLinus Torvalds 
14001da177e4SLinus Torvalds out:
14011da177e4SLinus Torvalds 	/* It may be already another descriptor 8) Not kernel problem. */
14021da177e4SLinus Torvalds 	return retval;
14031da177e4SLinus Torvalds 
14041da177e4SLinus Torvalds out_release:
14051da177e4SLinus Torvalds 	sock_release(sock);
14061da177e4SLinus Torvalds 	return retval;
14071da177e4SLinus Torvalds }
14081da177e4SLinus Torvalds 
14091da177e4SLinus Torvalds /*
14101da177e4SLinus Torvalds  *	Create a pair of connected sockets.
14111da177e4SLinus Torvalds  */
14121da177e4SLinus Torvalds 
14133e0fa65fSHeiko Carstens SYSCALL_DEFINE4(socketpair, int, family, int, type, int, protocol,
14143e0fa65fSHeiko Carstens 		int __user *, usockvec)
14151da177e4SLinus Torvalds {
14161da177e4SLinus Torvalds 	struct socket *sock1, *sock2;
14171da177e4SLinus Torvalds 	int fd1, fd2, err;
1418db349509SAl Viro 	struct file *newfile1, *newfile2;
1419a677a039SUlrich Drepper 	int flags;
1420a677a039SUlrich Drepper 
1421a677a039SUlrich Drepper 	flags = type & ~SOCK_TYPE_MASK;
142277d27200SUlrich Drepper 	if (flags & ~(SOCK_CLOEXEC | SOCK_NONBLOCK))
1423a677a039SUlrich Drepper 		return -EINVAL;
1424a677a039SUlrich Drepper 	type &= SOCK_TYPE_MASK;
14251da177e4SLinus Torvalds 
1426aaca0bdcSUlrich Drepper 	if (SOCK_NONBLOCK != O_NONBLOCK && (flags & SOCK_NONBLOCK))
1427aaca0bdcSUlrich Drepper 		flags = (flags & ~SOCK_NONBLOCK) | O_NONBLOCK;
1428aaca0bdcSUlrich Drepper 
14291da177e4SLinus Torvalds 	/*
14301da177e4SLinus Torvalds 	 * Obtain the first socket and check if the underlying protocol
14311da177e4SLinus Torvalds 	 * supports the socketpair call.
14321da177e4SLinus Torvalds 	 */
14331da177e4SLinus Torvalds 
14341da177e4SLinus Torvalds 	err = sock_create(family, type, protocol, &sock1);
14351da177e4SLinus Torvalds 	if (err < 0)
14361da177e4SLinus Torvalds 		goto out;
14371da177e4SLinus Torvalds 
14381da177e4SLinus Torvalds 	err = sock_create(family, type, protocol, &sock2);
14391da177e4SLinus Torvalds 	if (err < 0)
14401da177e4SLinus Torvalds 		goto out_release_1;
14411da177e4SLinus Torvalds 
14421da177e4SLinus Torvalds 	err = sock1->ops->socketpair(sock1, sock2);
14431da177e4SLinus Torvalds 	if (err < 0)
14441da177e4SLinus Torvalds 		goto out_release_both;
14451da177e4SLinus Torvalds 
144628407630SAl Viro 	fd1 = get_unused_fd_flags(flags);
1447bf3c23d1SDavid S. Miller 	if (unlikely(fd1 < 0)) {
1448bf3c23d1SDavid S. Miller 		err = fd1;
14491da177e4SLinus Torvalds 		goto out_release_both;
1450bf3c23d1SDavid S. Miller 	}
1451d73aa286SYann Droneaud 
145228407630SAl Viro 	fd2 = get_unused_fd_flags(flags);
1453198de4d7SAl Viro 	if (unlikely(fd2 < 0)) {
1454198de4d7SAl Viro 		err = fd2;
1455d73aa286SYann Droneaud 		goto out_put_unused_1;
145628407630SAl Viro 	}
145728407630SAl Viro 
1458aab174f0SLinus Torvalds 	newfile1 = sock_alloc_file(sock1, flags, NULL);
145928407630SAl Viro 	if (unlikely(IS_ERR(newfile1))) {
146028407630SAl Viro 		err = PTR_ERR(newfile1);
1461d73aa286SYann Droneaud 		goto out_put_unused_both;
146228407630SAl Viro 	}
146328407630SAl Viro 
1464aab174f0SLinus Torvalds 	newfile2 = sock_alloc_file(sock2, flags, NULL);
146528407630SAl Viro 	if (IS_ERR(newfile2)) {
146628407630SAl Viro 		err = PTR_ERR(newfile2);
1467d73aa286SYann Droneaud 		goto out_fput_1;
1468db349509SAl Viro 	}
1469db349509SAl Viro 
1470d73aa286SYann Droneaud 	err = put_user(fd1, &usockvec[0]);
1471d73aa286SYann Droneaud 	if (err)
1472d73aa286SYann Droneaud 		goto out_fput_both;
1473d73aa286SYann Droneaud 
1474d73aa286SYann Droneaud 	err = put_user(fd2, &usockvec[1]);
1475d73aa286SYann Droneaud 	if (err)
1476d73aa286SYann Droneaud 		goto out_fput_both;
1477d73aa286SYann Droneaud 
1478157cf649SAl Viro 	audit_fd_pair(fd1, fd2);
1479d73aa286SYann Droneaud 
1480db349509SAl Viro 	fd_install(fd1, newfile1);
1481db349509SAl Viro 	fd_install(fd2, newfile2);
14821da177e4SLinus Torvalds 	/* fd1 and fd2 may be already another descriptors.
14831da177e4SLinus Torvalds 	 * Not kernel problem.
14841da177e4SLinus Torvalds 	 */
14851da177e4SLinus Torvalds 
14861da177e4SLinus Torvalds 	return 0;
14871da177e4SLinus Torvalds 
1488d73aa286SYann Droneaud out_fput_both:
1489d73aa286SYann Droneaud 	fput(newfile2);
1490d73aa286SYann Droneaud 	fput(newfile1);
1491d73aa286SYann Droneaud 	put_unused_fd(fd2);
1492d73aa286SYann Droneaud 	put_unused_fd(fd1);
1493d73aa286SYann Droneaud 	goto out;
14941da177e4SLinus Torvalds 
1495d73aa286SYann Droneaud out_fput_1:
1496d73aa286SYann Droneaud 	fput(newfile1);
1497d73aa286SYann Droneaud 	put_unused_fd(fd2);
1498d73aa286SYann Droneaud 	put_unused_fd(fd1);
1499d73aa286SYann Droneaud 	sock_release(sock2);
1500d73aa286SYann Droneaud 	goto out;
1501d73aa286SYann Droneaud 
1502d73aa286SYann Droneaud out_put_unused_both:
1503d73aa286SYann Droneaud 	put_unused_fd(fd2);
1504d73aa286SYann Droneaud out_put_unused_1:
1505d73aa286SYann Droneaud 	put_unused_fd(fd1);
15061da177e4SLinus Torvalds out_release_both:
15071da177e4SLinus Torvalds 	sock_release(sock2);
15081da177e4SLinus Torvalds out_release_1:
15091da177e4SLinus Torvalds 	sock_release(sock1);
15101da177e4SLinus Torvalds out:
15111da177e4SLinus Torvalds 	return err;
15121da177e4SLinus Torvalds }
15131da177e4SLinus Torvalds 
15141da177e4SLinus Torvalds /*
15151da177e4SLinus Torvalds  *	Bind a name to a socket. Nothing much to do here since it's
15161da177e4SLinus Torvalds  *	the protocol's responsibility to handle the local address.
15171da177e4SLinus Torvalds  *
15181da177e4SLinus Torvalds  *	We move the socket address to kernel space before we call
15191da177e4SLinus Torvalds  *	the protocol layer (having also checked the address is ok).
15201da177e4SLinus Torvalds  */
15211da177e4SLinus Torvalds 
152220f37034SHeiko Carstens SYSCALL_DEFINE3(bind, int, fd, struct sockaddr __user *, umyaddr, int, addrlen)
15231da177e4SLinus Torvalds {
15241da177e4SLinus Torvalds 	struct socket *sock;
1525230b1839SYOSHIFUJI Hideaki 	struct sockaddr_storage address;
15266cb153caSBenjamin LaHaise 	int err, fput_needed;
15271da177e4SLinus Torvalds 
152889bddce5SStephen Hemminger 	sock = sockfd_lookup_light(fd, &err, &fput_needed);
152989bddce5SStephen Hemminger 	if (sock) {
153043db362dSMaciej Żenczykowski 		err = move_addr_to_kernel(umyaddr, addrlen, &address);
153189bddce5SStephen Hemminger 		if (err >= 0) {
153289bddce5SStephen Hemminger 			err = security_socket_bind(sock,
1533230b1839SYOSHIFUJI Hideaki 						   (struct sockaddr *)&address,
153489bddce5SStephen Hemminger 						   addrlen);
15356cb153caSBenjamin LaHaise 			if (!err)
15366cb153caSBenjamin LaHaise 				err = sock->ops->bind(sock,
153789bddce5SStephen Hemminger 						      (struct sockaddr *)
1538230b1839SYOSHIFUJI Hideaki 						      &address, addrlen);
15391da177e4SLinus Torvalds 		}
15406cb153caSBenjamin LaHaise 		fput_light(sock->file, fput_needed);
15411da177e4SLinus Torvalds 	}
15421da177e4SLinus Torvalds 	return err;
15431da177e4SLinus Torvalds }
15441da177e4SLinus Torvalds 
15451da177e4SLinus Torvalds /*
15461da177e4SLinus Torvalds  *	Perform a listen. Basically, we allow the protocol to do anything
15471da177e4SLinus Torvalds  *	necessary for a listen, and if that works, we mark the socket as
15481da177e4SLinus Torvalds  *	ready for listening.
15491da177e4SLinus Torvalds  */
15501da177e4SLinus Torvalds 
15513e0fa65fSHeiko Carstens SYSCALL_DEFINE2(listen, int, fd, int, backlog)
15521da177e4SLinus Torvalds {
15531da177e4SLinus Torvalds 	struct socket *sock;
15546cb153caSBenjamin LaHaise 	int err, fput_needed;
1555b8e1f9b5SPavel Emelyanov 	int somaxconn;
15561da177e4SLinus Torvalds 
155789bddce5SStephen Hemminger 	sock = sockfd_lookup_light(fd, &err, &fput_needed);
155889bddce5SStephen Hemminger 	if (sock) {
15598efa6e93SPavel Emelyanov 		somaxconn = sock_net(sock->sk)->core.sysctl_somaxconn;
156095c96174SEric Dumazet 		if ((unsigned int)backlog > somaxconn)
1561b8e1f9b5SPavel Emelyanov 			backlog = somaxconn;
15621da177e4SLinus Torvalds 
15631da177e4SLinus Torvalds 		err = security_socket_listen(sock, backlog);
15646cb153caSBenjamin LaHaise 		if (!err)
15651da177e4SLinus Torvalds 			err = sock->ops->listen(sock, backlog);
15666cb153caSBenjamin LaHaise 
15676cb153caSBenjamin LaHaise 		fput_light(sock->file, fput_needed);
15681da177e4SLinus Torvalds 	}
15691da177e4SLinus Torvalds 	return err;
15701da177e4SLinus Torvalds }
15711da177e4SLinus Torvalds 
15721da177e4SLinus Torvalds /*
15731da177e4SLinus Torvalds  *	For accept, we attempt to create a new socket, set up the link
15741da177e4SLinus Torvalds  *	with the client, wake up the client, then return the new
15751da177e4SLinus Torvalds  *	connected fd. We collect the address of the connector in kernel
15761da177e4SLinus Torvalds  *	space and move it to user at the very end. This is unclean because
15771da177e4SLinus Torvalds  *	we open the socket then return an error.
15781da177e4SLinus Torvalds  *
15791da177e4SLinus Torvalds  *	1003.1g adds the ability to recvmsg() to query connection pending
15801da177e4SLinus Torvalds  *	status to recvmsg. We need to add that support in a way thats
15811da177e4SLinus Torvalds  *	clean when we restucture accept also.
15821da177e4SLinus Torvalds  */
15831da177e4SLinus Torvalds 
158420f37034SHeiko Carstens SYSCALL_DEFINE4(accept4, int, fd, struct sockaddr __user *, upeer_sockaddr,
158520f37034SHeiko Carstens 		int __user *, upeer_addrlen, int, flags)
15861da177e4SLinus Torvalds {
15871da177e4SLinus Torvalds 	struct socket *sock, *newsock;
158839d8c1b6SDavid S. Miller 	struct file *newfile;
15896cb153caSBenjamin LaHaise 	int err, len, newfd, fput_needed;
1590230b1839SYOSHIFUJI Hideaki 	struct sockaddr_storage address;
15911da177e4SLinus Torvalds 
159277d27200SUlrich Drepper 	if (flags & ~(SOCK_CLOEXEC | SOCK_NONBLOCK))
1593aaca0bdcSUlrich Drepper 		return -EINVAL;
1594aaca0bdcSUlrich Drepper 
1595aaca0bdcSUlrich Drepper 	if (SOCK_NONBLOCK != O_NONBLOCK && (flags & SOCK_NONBLOCK))
1596aaca0bdcSUlrich Drepper 		flags = (flags & ~SOCK_NONBLOCK) | O_NONBLOCK;
1597aaca0bdcSUlrich Drepper 
15986cb153caSBenjamin LaHaise 	sock = sockfd_lookup_light(fd, &err, &fput_needed);
15991da177e4SLinus Torvalds 	if (!sock)
16001da177e4SLinus Torvalds 		goto out;
16011da177e4SLinus Torvalds 
16021da177e4SLinus Torvalds 	err = -ENFILE;
1603c6d409cfSEric Dumazet 	newsock = sock_alloc();
1604c6d409cfSEric Dumazet 	if (!newsock)
16051da177e4SLinus Torvalds 		goto out_put;
16061da177e4SLinus Torvalds 
16071da177e4SLinus Torvalds 	newsock->type = sock->type;
16081da177e4SLinus Torvalds 	newsock->ops = sock->ops;
16091da177e4SLinus Torvalds 
16101da177e4SLinus Torvalds 	/*
16111da177e4SLinus Torvalds 	 * We don't need try_module_get here, as the listening socket (sock)
16121da177e4SLinus Torvalds 	 * has the protocol module (sock->ops->owner) held.
16131da177e4SLinus Torvalds 	 */
16141da177e4SLinus Torvalds 	__module_get(newsock->ops->owner);
16151da177e4SLinus Torvalds 
161628407630SAl Viro 	newfd = get_unused_fd_flags(flags);
161739d8c1b6SDavid S. Miller 	if (unlikely(newfd < 0)) {
161839d8c1b6SDavid S. Miller 		err = newfd;
16199a1875e6SDavid S. Miller 		sock_release(newsock);
16209a1875e6SDavid S. Miller 		goto out_put;
162139d8c1b6SDavid S. Miller 	}
1622aab174f0SLinus Torvalds 	newfile = sock_alloc_file(newsock, flags, sock->sk->sk_prot_creator->name);
162328407630SAl Viro 	if (unlikely(IS_ERR(newfile))) {
162428407630SAl Viro 		err = PTR_ERR(newfile);
162528407630SAl Viro 		put_unused_fd(newfd);
162628407630SAl Viro 		sock_release(newsock);
162728407630SAl Viro 		goto out_put;
162828407630SAl Viro 	}
162939d8c1b6SDavid S. Miller 
1630a79af59eSFrank Filz 	err = security_socket_accept(sock, newsock);
1631a79af59eSFrank Filz 	if (err)
163239d8c1b6SDavid S. Miller 		goto out_fd;
1633a79af59eSFrank Filz 
16341da177e4SLinus Torvalds 	err = sock->ops->accept(sock, newsock, sock->file->f_flags);
16351da177e4SLinus Torvalds 	if (err < 0)
163639d8c1b6SDavid S. Miller 		goto out_fd;
16371da177e4SLinus Torvalds 
16381da177e4SLinus Torvalds 	if (upeer_sockaddr) {
1639230b1839SYOSHIFUJI Hideaki 		if (newsock->ops->getname(newsock, (struct sockaddr *)&address,
164089bddce5SStephen Hemminger 					  &len, 2) < 0) {
16411da177e4SLinus Torvalds 			err = -ECONNABORTED;
164239d8c1b6SDavid S. Miller 			goto out_fd;
16431da177e4SLinus Torvalds 		}
164443db362dSMaciej Żenczykowski 		err = move_addr_to_user(&address,
1645230b1839SYOSHIFUJI Hideaki 					len, upeer_sockaddr, upeer_addrlen);
16461da177e4SLinus Torvalds 		if (err < 0)
164739d8c1b6SDavid S. Miller 			goto out_fd;
16481da177e4SLinus Torvalds 	}
16491da177e4SLinus Torvalds 
16501da177e4SLinus Torvalds 	/* File flags are not inherited via accept() unlike another OSes. */
16511da177e4SLinus Torvalds 
165239d8c1b6SDavid S. Miller 	fd_install(newfd, newfile);
165339d8c1b6SDavid S. Miller 	err = newfd;
16541da177e4SLinus Torvalds 
16551da177e4SLinus Torvalds out_put:
16566cb153caSBenjamin LaHaise 	fput_light(sock->file, fput_needed);
16571da177e4SLinus Torvalds out:
16581da177e4SLinus Torvalds 	return err;
165939d8c1b6SDavid S. Miller out_fd:
16609606a216SDavid S. Miller 	fput(newfile);
166139d8c1b6SDavid S. Miller 	put_unused_fd(newfd);
16621da177e4SLinus Torvalds 	goto out_put;
16631da177e4SLinus Torvalds }
16641da177e4SLinus Torvalds 
166520f37034SHeiko Carstens SYSCALL_DEFINE3(accept, int, fd, struct sockaddr __user *, upeer_sockaddr,
166620f37034SHeiko Carstens 		int __user *, upeer_addrlen)
1667aaca0bdcSUlrich Drepper {
1668de11defeSUlrich Drepper 	return sys_accept4(fd, upeer_sockaddr, upeer_addrlen, 0);
1669aaca0bdcSUlrich Drepper }
1670aaca0bdcSUlrich Drepper 
16711da177e4SLinus Torvalds /*
16721da177e4SLinus Torvalds  *	Attempt to connect to a socket with the server address.  The address
16731da177e4SLinus Torvalds  *	is in user space so we verify it is OK and move it to kernel space.
16741da177e4SLinus Torvalds  *
16751da177e4SLinus Torvalds  *	For 1003.1g we need to add clean support for a bind to AF_UNSPEC to
16761da177e4SLinus Torvalds  *	break bindings
16771da177e4SLinus Torvalds  *
16781da177e4SLinus Torvalds  *	NOTE: 1003.1g draft 6.3 is broken with respect to AX.25/NetROM and
16791da177e4SLinus Torvalds  *	other SEQPACKET protocols that take time to connect() as it doesn't
16801da177e4SLinus Torvalds  *	include the -EINPROGRESS status for such sockets.
16811da177e4SLinus Torvalds  */
16821da177e4SLinus Torvalds 
168320f37034SHeiko Carstens SYSCALL_DEFINE3(connect, int, fd, struct sockaddr __user *, uservaddr,
168420f37034SHeiko Carstens 		int, addrlen)
16851da177e4SLinus Torvalds {
16861da177e4SLinus Torvalds 	struct socket *sock;
1687230b1839SYOSHIFUJI Hideaki 	struct sockaddr_storage address;
16886cb153caSBenjamin LaHaise 	int err, fput_needed;
16891da177e4SLinus Torvalds 
16906cb153caSBenjamin LaHaise 	sock = sockfd_lookup_light(fd, &err, &fput_needed);
16911da177e4SLinus Torvalds 	if (!sock)
16921da177e4SLinus Torvalds 		goto out;
169343db362dSMaciej Żenczykowski 	err = move_addr_to_kernel(uservaddr, addrlen, &address);
16941da177e4SLinus Torvalds 	if (err < 0)
16951da177e4SLinus Torvalds 		goto out_put;
16961da177e4SLinus Torvalds 
169789bddce5SStephen Hemminger 	err =
1698230b1839SYOSHIFUJI Hideaki 	    security_socket_connect(sock, (struct sockaddr *)&address, addrlen);
16991da177e4SLinus Torvalds 	if (err)
17001da177e4SLinus Torvalds 		goto out_put;
17011da177e4SLinus Torvalds 
1702230b1839SYOSHIFUJI Hideaki 	err = sock->ops->connect(sock, (struct sockaddr *)&address, addrlen,
17031da177e4SLinus Torvalds 				 sock->file->f_flags);
17041da177e4SLinus Torvalds out_put:
17056cb153caSBenjamin LaHaise 	fput_light(sock->file, fput_needed);
17061da177e4SLinus Torvalds out:
17071da177e4SLinus Torvalds 	return err;
17081da177e4SLinus Torvalds }
17091da177e4SLinus Torvalds 
17101da177e4SLinus Torvalds /*
17111da177e4SLinus Torvalds  *	Get the local address ('name') of a socket object. Move the obtained
17121da177e4SLinus Torvalds  *	name to user space.
17131da177e4SLinus Torvalds  */
17141da177e4SLinus Torvalds 
171520f37034SHeiko Carstens SYSCALL_DEFINE3(getsockname, int, fd, struct sockaddr __user *, usockaddr,
171620f37034SHeiko Carstens 		int __user *, usockaddr_len)
17171da177e4SLinus Torvalds {
17181da177e4SLinus Torvalds 	struct socket *sock;
1719230b1839SYOSHIFUJI Hideaki 	struct sockaddr_storage address;
17206cb153caSBenjamin LaHaise 	int len, err, fput_needed;
17211da177e4SLinus Torvalds 
17226cb153caSBenjamin LaHaise 	sock = sockfd_lookup_light(fd, &err, &fput_needed);
17231da177e4SLinus Torvalds 	if (!sock)
17241da177e4SLinus Torvalds 		goto out;
17251da177e4SLinus Torvalds 
17261da177e4SLinus Torvalds 	err = security_socket_getsockname(sock);
17271da177e4SLinus Torvalds 	if (err)
17281da177e4SLinus Torvalds 		goto out_put;
17291da177e4SLinus Torvalds 
1730230b1839SYOSHIFUJI Hideaki 	err = sock->ops->getname(sock, (struct sockaddr *)&address, &len, 0);
17311da177e4SLinus Torvalds 	if (err)
17321da177e4SLinus Torvalds 		goto out_put;
173343db362dSMaciej Żenczykowski 	err = move_addr_to_user(&address, len, usockaddr, usockaddr_len);
17341da177e4SLinus Torvalds 
17351da177e4SLinus Torvalds out_put:
17366cb153caSBenjamin LaHaise 	fput_light(sock->file, fput_needed);
17371da177e4SLinus Torvalds out:
17381da177e4SLinus Torvalds 	return err;
17391da177e4SLinus Torvalds }
17401da177e4SLinus Torvalds 
17411da177e4SLinus Torvalds /*
17421da177e4SLinus Torvalds  *	Get the remote address ('name') of a socket object. Move the obtained
17431da177e4SLinus Torvalds  *	name to user space.
17441da177e4SLinus Torvalds  */
17451da177e4SLinus Torvalds 
174620f37034SHeiko Carstens SYSCALL_DEFINE3(getpeername, int, fd, struct sockaddr __user *, usockaddr,
174720f37034SHeiko Carstens 		int __user *, usockaddr_len)
17481da177e4SLinus Torvalds {
17491da177e4SLinus Torvalds 	struct socket *sock;
1750230b1839SYOSHIFUJI Hideaki 	struct sockaddr_storage address;
17516cb153caSBenjamin LaHaise 	int len, err, fput_needed;
17521da177e4SLinus Torvalds 
175389bddce5SStephen Hemminger 	sock = sockfd_lookup_light(fd, &err, &fput_needed);
175489bddce5SStephen Hemminger 	if (sock != NULL) {
17551da177e4SLinus Torvalds 		err = security_socket_getpeername(sock);
17561da177e4SLinus Torvalds 		if (err) {
17576cb153caSBenjamin LaHaise 			fput_light(sock->file, fput_needed);
17581da177e4SLinus Torvalds 			return err;
17591da177e4SLinus Torvalds 		}
17601da177e4SLinus Torvalds 
176189bddce5SStephen Hemminger 		err =
1762230b1839SYOSHIFUJI Hideaki 		    sock->ops->getname(sock, (struct sockaddr *)&address, &len,
176389bddce5SStephen Hemminger 				       1);
17641da177e4SLinus Torvalds 		if (!err)
176543db362dSMaciej Żenczykowski 			err = move_addr_to_user(&address, len, usockaddr,
176689bddce5SStephen Hemminger 						usockaddr_len);
17676cb153caSBenjamin LaHaise 		fput_light(sock->file, fput_needed);
17681da177e4SLinus Torvalds 	}
17691da177e4SLinus Torvalds 	return err;
17701da177e4SLinus Torvalds }
17711da177e4SLinus Torvalds 
17721da177e4SLinus Torvalds /*
17731da177e4SLinus Torvalds  *	Send a datagram to a given address. We move the address into kernel
17741da177e4SLinus Torvalds  *	space and check the user space data area is readable before invoking
17751da177e4SLinus Torvalds  *	the protocol.
17761da177e4SLinus Torvalds  */
17771da177e4SLinus Torvalds 
17783e0fa65fSHeiko Carstens SYSCALL_DEFINE6(sendto, int, fd, void __user *, buff, size_t, len,
177995c96174SEric Dumazet 		unsigned int, flags, struct sockaddr __user *, addr,
17803e0fa65fSHeiko Carstens 		int, addr_len)
17811da177e4SLinus Torvalds {
17821da177e4SLinus Torvalds 	struct socket *sock;
1783230b1839SYOSHIFUJI Hideaki 	struct sockaddr_storage address;
17841da177e4SLinus Torvalds 	int err;
17851da177e4SLinus Torvalds 	struct msghdr msg;
17861da177e4SLinus Torvalds 	struct iovec iov;
17876cb153caSBenjamin LaHaise 	int fput_needed;
17881da177e4SLinus Torvalds 
1789253eacc0SLinus Torvalds 	if (len > INT_MAX)
1790253eacc0SLinus Torvalds 		len = INT_MAX;
1791de0fa95cSPavel Emelyanov 	sock = sockfd_lookup_light(fd, &err, &fput_needed);
1792de0fa95cSPavel Emelyanov 	if (!sock)
17934387ff75SDavid S. Miller 		goto out;
17946cb153caSBenjamin LaHaise 
17951da177e4SLinus Torvalds 	iov.iov_base = buff;
17961da177e4SLinus Torvalds 	iov.iov_len = len;
17971da177e4SLinus Torvalds 	msg.msg_name = NULL;
1798c0371da6SAl Viro 	iov_iter_init(&msg.msg_iter, WRITE, &iov, 1, len);
17991da177e4SLinus Torvalds 	msg.msg_control = NULL;
18001da177e4SLinus Torvalds 	msg.msg_controllen = 0;
18011da177e4SLinus Torvalds 	msg.msg_namelen = 0;
18026cb153caSBenjamin LaHaise 	if (addr) {
180343db362dSMaciej Żenczykowski 		err = move_addr_to_kernel(addr, addr_len, &address);
18041da177e4SLinus Torvalds 		if (err < 0)
18051da177e4SLinus Torvalds 			goto out_put;
1806230b1839SYOSHIFUJI Hideaki 		msg.msg_name = (struct sockaddr *)&address;
18071da177e4SLinus Torvalds 		msg.msg_namelen = addr_len;
18081da177e4SLinus Torvalds 	}
18091da177e4SLinus Torvalds 	if (sock->file->f_flags & O_NONBLOCK)
18101da177e4SLinus Torvalds 		flags |= MSG_DONTWAIT;
18111da177e4SLinus Torvalds 	msg.msg_flags = flags;
18121da177e4SLinus Torvalds 	err = sock_sendmsg(sock, &msg, len);
18131da177e4SLinus Torvalds 
18141da177e4SLinus Torvalds out_put:
1815de0fa95cSPavel Emelyanov 	fput_light(sock->file, fput_needed);
18164387ff75SDavid S. Miller out:
18171da177e4SLinus Torvalds 	return err;
18181da177e4SLinus Torvalds }
18191da177e4SLinus Torvalds 
18201da177e4SLinus Torvalds /*
18211da177e4SLinus Torvalds  *	Send a datagram down a socket.
18221da177e4SLinus Torvalds  */
18231da177e4SLinus Torvalds 
18243e0fa65fSHeiko Carstens SYSCALL_DEFINE4(send, int, fd, void __user *, buff, size_t, len,
182595c96174SEric Dumazet 		unsigned int, flags)
18261da177e4SLinus Torvalds {
18271da177e4SLinus Torvalds 	return sys_sendto(fd, buff, len, flags, NULL, 0);
18281da177e4SLinus Torvalds }
18291da177e4SLinus Torvalds 
18301da177e4SLinus Torvalds /*
18311da177e4SLinus Torvalds  *	Receive a frame from the socket and optionally record the address of the
18321da177e4SLinus Torvalds  *	sender. We verify the buffers are writable and if needed move the
18331da177e4SLinus Torvalds  *	sender address from kernel to user space.
18341da177e4SLinus Torvalds  */
18351da177e4SLinus Torvalds 
18363e0fa65fSHeiko Carstens SYSCALL_DEFINE6(recvfrom, int, fd, void __user *, ubuf, size_t, size,
183795c96174SEric Dumazet 		unsigned int, flags, struct sockaddr __user *, addr,
18383e0fa65fSHeiko Carstens 		int __user *, addr_len)
18391da177e4SLinus Torvalds {
18401da177e4SLinus Torvalds 	struct socket *sock;
18411da177e4SLinus Torvalds 	struct iovec iov;
18421da177e4SLinus Torvalds 	struct msghdr msg;
1843230b1839SYOSHIFUJI Hideaki 	struct sockaddr_storage address;
18441da177e4SLinus Torvalds 	int err, err2;
18456cb153caSBenjamin LaHaise 	int fput_needed;
18461da177e4SLinus Torvalds 
1847253eacc0SLinus Torvalds 	if (size > INT_MAX)
1848253eacc0SLinus Torvalds 		size = INT_MAX;
1849de0fa95cSPavel Emelyanov 	sock = sockfd_lookup_light(fd, &err, &fput_needed);
18501da177e4SLinus Torvalds 	if (!sock)
1851de0fa95cSPavel Emelyanov 		goto out;
18521da177e4SLinus Torvalds 
18531da177e4SLinus Torvalds 	msg.msg_control = NULL;
18541da177e4SLinus Torvalds 	msg.msg_controllen = 0;
18551da177e4SLinus Torvalds 	iov.iov_len = size;
18561da177e4SLinus Torvalds 	iov.iov_base = ubuf;
1857c0371da6SAl Viro 	iov_iter_init(&msg.msg_iter, READ, &iov, 1, size);
1858f3d33426SHannes Frederic Sowa 	/* Save some cycles and don't copy the address if not needed */
1859f3d33426SHannes Frederic Sowa 	msg.msg_name = addr ? (struct sockaddr *)&address : NULL;
1860f3d33426SHannes Frederic Sowa 	/* We assume all kernel code knows the size of sockaddr_storage */
1861f3d33426SHannes Frederic Sowa 	msg.msg_namelen = 0;
18621da177e4SLinus Torvalds 	if (sock->file->f_flags & O_NONBLOCK)
18631da177e4SLinus Torvalds 		flags |= MSG_DONTWAIT;
18641da177e4SLinus Torvalds 	err = sock_recvmsg(sock, &msg, size, flags);
18651da177e4SLinus Torvalds 
186689bddce5SStephen Hemminger 	if (err >= 0 && addr != NULL) {
186743db362dSMaciej Żenczykowski 		err2 = move_addr_to_user(&address,
1868230b1839SYOSHIFUJI Hideaki 					 msg.msg_namelen, addr, addr_len);
18691da177e4SLinus Torvalds 		if (err2 < 0)
18701da177e4SLinus Torvalds 			err = err2;
18711da177e4SLinus Torvalds 	}
1872de0fa95cSPavel Emelyanov 
1873de0fa95cSPavel Emelyanov 	fput_light(sock->file, fput_needed);
18744387ff75SDavid S. Miller out:
18751da177e4SLinus Torvalds 	return err;
18761da177e4SLinus Torvalds }
18771da177e4SLinus Torvalds 
18781da177e4SLinus Torvalds /*
18791da177e4SLinus Torvalds  *	Receive a datagram from a socket.
18801da177e4SLinus Torvalds  */
18811da177e4SLinus Torvalds 
1882b7c0ddf5SJan Glauber SYSCALL_DEFINE4(recv, int, fd, void __user *, ubuf, size_t, size,
1883b7c0ddf5SJan Glauber 		unsigned int, flags)
18841da177e4SLinus Torvalds {
18851da177e4SLinus Torvalds 	return sys_recvfrom(fd, ubuf, size, flags, NULL, NULL);
18861da177e4SLinus Torvalds }
18871da177e4SLinus Torvalds 
18881da177e4SLinus Torvalds /*
18891da177e4SLinus Torvalds  *	Set a socket option. Because we don't know the option lengths we have
18901da177e4SLinus Torvalds  *	to pass the user mode parameter for the protocols to sort out.
18911da177e4SLinus Torvalds  */
18921da177e4SLinus Torvalds 
189320f37034SHeiko Carstens SYSCALL_DEFINE5(setsockopt, int, fd, int, level, int, optname,
189420f37034SHeiko Carstens 		char __user *, optval, int, optlen)
18951da177e4SLinus Torvalds {
18966cb153caSBenjamin LaHaise 	int err, fput_needed;
18971da177e4SLinus Torvalds 	struct socket *sock;
18981da177e4SLinus Torvalds 
18991da177e4SLinus Torvalds 	if (optlen < 0)
19001da177e4SLinus Torvalds 		return -EINVAL;
19011da177e4SLinus Torvalds 
190289bddce5SStephen Hemminger 	sock = sockfd_lookup_light(fd, &err, &fput_needed);
190389bddce5SStephen Hemminger 	if (sock != NULL) {
19041da177e4SLinus Torvalds 		err = security_socket_setsockopt(sock, level, optname);
19056cb153caSBenjamin LaHaise 		if (err)
19066cb153caSBenjamin LaHaise 			goto out_put;
19071da177e4SLinus Torvalds 
19081da177e4SLinus Torvalds 		if (level == SOL_SOCKET)
190989bddce5SStephen Hemminger 			err =
191089bddce5SStephen Hemminger 			    sock_setsockopt(sock, level, optname, optval,
191189bddce5SStephen Hemminger 					    optlen);
19121da177e4SLinus Torvalds 		else
191389bddce5SStephen Hemminger 			err =
191489bddce5SStephen Hemminger 			    sock->ops->setsockopt(sock, level, optname, optval,
191589bddce5SStephen Hemminger 						  optlen);
19166cb153caSBenjamin LaHaise out_put:
19176cb153caSBenjamin LaHaise 		fput_light(sock->file, fput_needed);
19181da177e4SLinus Torvalds 	}
19191da177e4SLinus Torvalds 	return err;
19201da177e4SLinus Torvalds }
19211da177e4SLinus Torvalds 
19221da177e4SLinus Torvalds /*
19231da177e4SLinus Torvalds  *	Get a socket option. Because we don't know the option lengths we have
19241da177e4SLinus Torvalds  *	to pass a user mode parameter for the protocols to sort out.
19251da177e4SLinus Torvalds  */
19261da177e4SLinus Torvalds 
192720f37034SHeiko Carstens SYSCALL_DEFINE5(getsockopt, int, fd, int, level, int, optname,
192820f37034SHeiko Carstens 		char __user *, optval, int __user *, optlen)
19291da177e4SLinus Torvalds {
19306cb153caSBenjamin LaHaise 	int err, fput_needed;
19311da177e4SLinus Torvalds 	struct socket *sock;
19321da177e4SLinus Torvalds 
193389bddce5SStephen Hemminger 	sock = sockfd_lookup_light(fd, &err, &fput_needed);
193489bddce5SStephen Hemminger 	if (sock != NULL) {
19356cb153caSBenjamin LaHaise 		err = security_socket_getsockopt(sock, level, optname);
19366cb153caSBenjamin LaHaise 		if (err)
19376cb153caSBenjamin LaHaise 			goto out_put;
19381da177e4SLinus Torvalds 
19391da177e4SLinus Torvalds 		if (level == SOL_SOCKET)
194089bddce5SStephen Hemminger 			err =
194189bddce5SStephen Hemminger 			    sock_getsockopt(sock, level, optname, optval,
194289bddce5SStephen Hemminger 					    optlen);
19431da177e4SLinus Torvalds 		else
194489bddce5SStephen Hemminger 			err =
194589bddce5SStephen Hemminger 			    sock->ops->getsockopt(sock, level, optname, optval,
194689bddce5SStephen Hemminger 						  optlen);
19476cb153caSBenjamin LaHaise out_put:
19486cb153caSBenjamin LaHaise 		fput_light(sock->file, fput_needed);
19491da177e4SLinus Torvalds 	}
19501da177e4SLinus Torvalds 	return err;
19511da177e4SLinus Torvalds }
19521da177e4SLinus Torvalds 
19531da177e4SLinus Torvalds /*
19541da177e4SLinus Torvalds  *	Shutdown a socket.
19551da177e4SLinus Torvalds  */
19561da177e4SLinus Torvalds 
1957754fe8d2SHeiko Carstens SYSCALL_DEFINE2(shutdown, int, fd, int, how)
19581da177e4SLinus Torvalds {
19596cb153caSBenjamin LaHaise 	int err, fput_needed;
19601da177e4SLinus Torvalds 	struct socket *sock;
19611da177e4SLinus Torvalds 
196289bddce5SStephen Hemminger 	sock = sockfd_lookup_light(fd, &err, &fput_needed);
196389bddce5SStephen Hemminger 	if (sock != NULL) {
19641da177e4SLinus Torvalds 		err = security_socket_shutdown(sock, how);
19656cb153caSBenjamin LaHaise 		if (!err)
19661da177e4SLinus Torvalds 			err = sock->ops->shutdown(sock, how);
19676cb153caSBenjamin LaHaise 		fput_light(sock->file, fput_needed);
19681da177e4SLinus Torvalds 	}
19691da177e4SLinus Torvalds 	return err;
19701da177e4SLinus Torvalds }
19711da177e4SLinus Torvalds 
/* Helper macros yielding the address of a msghdr field in either the native
 * or the compat user structure. The fields addressed this way are 32/64 bit
 * fields which are the same type (int / unsigned) on our platforms.
 *
 * The expansion reads a variable named 'flags' and, for an argument 'msg',
 * a variable named 'msg_compat'; both must be in scope at the use site.
 */
#define COMPAT_MSG(msg, member)	((flags & MSG_CMSG_COMPAT) ? &msg##_compat->member : &msg->member)
#define COMPAT_NAMELEN(msg)	COMPAT_MSG(msg, msg_namelen)
#define COMPAT_FLAGS(msg)	COMPAT_MSG(msg, msg_flags)
19781da177e4SLinus Torvalds 
1979c71d8ebeSTetsuo Handa struct used_address {
1980c71d8ebeSTetsuo Handa 	struct sockaddr_storage name;
1981c71d8ebeSTetsuo Handa 	unsigned int name_len;
1982c71d8ebeSTetsuo Handa };
1983c71d8ebeSTetsuo Handa 
198408adb7daSAl Viro static ssize_t copy_msghdr_from_user(struct msghdr *kmsg,
198508adb7daSAl Viro 				     struct user_msghdr __user *umsg,
198608adb7daSAl Viro 				     struct sockaddr __user **save_addr,
198708adb7daSAl Viro 				     struct iovec **iov)
19881661bf36SDan Carpenter {
198908adb7daSAl Viro 	struct sockaddr __user *uaddr;
199008adb7daSAl Viro 	struct iovec __user *uiov;
1991c0371da6SAl Viro 	size_t nr_segs;
199208adb7daSAl Viro 	ssize_t err;
199308adb7daSAl Viro 
199408adb7daSAl Viro 	if (!access_ok(VERIFY_READ, umsg, sizeof(*umsg)) ||
199508adb7daSAl Viro 	    __get_user(uaddr, &umsg->msg_name) ||
199608adb7daSAl Viro 	    __get_user(kmsg->msg_namelen, &umsg->msg_namelen) ||
199708adb7daSAl Viro 	    __get_user(uiov, &umsg->msg_iov) ||
1998c0371da6SAl Viro 	    __get_user(nr_segs, &umsg->msg_iovlen) ||
199908adb7daSAl Viro 	    __get_user(kmsg->msg_control, &umsg->msg_control) ||
200008adb7daSAl Viro 	    __get_user(kmsg->msg_controllen, &umsg->msg_controllen) ||
200108adb7daSAl Viro 	    __get_user(kmsg->msg_flags, &umsg->msg_flags))
20021661bf36SDan Carpenter 		return -EFAULT;
2003dbb490b9SMatthew Leach 
200408adb7daSAl Viro 	if (!uaddr)
20056a2a2b3aSAni Sinha 		kmsg->msg_namelen = 0;
20066a2a2b3aSAni Sinha 
2007dbb490b9SMatthew Leach 	if (kmsg->msg_namelen < 0)
2008dbb490b9SMatthew Leach 		return -EINVAL;
2009dbb490b9SMatthew Leach 
20101661bf36SDan Carpenter 	if (kmsg->msg_namelen > sizeof(struct sockaddr_storage))
2011db31c55aSDan Carpenter 		kmsg->msg_namelen = sizeof(struct sockaddr_storage);
201208adb7daSAl Viro 
201308adb7daSAl Viro 	if (save_addr)
201408adb7daSAl Viro 		*save_addr = uaddr;
201508adb7daSAl Viro 
201608adb7daSAl Viro 	if (uaddr && kmsg->msg_namelen) {
201708adb7daSAl Viro 		if (!save_addr) {
201808adb7daSAl Viro 			err = move_addr_to_kernel(uaddr, kmsg->msg_namelen,
201908adb7daSAl Viro 						  kmsg->msg_name);
202008adb7daSAl Viro 			if (err < 0)
202108adb7daSAl Viro 				return err;
202208adb7daSAl Viro 		}
202308adb7daSAl Viro 	} else {
202408adb7daSAl Viro 		kmsg->msg_name = NULL;
202508adb7daSAl Viro 		kmsg->msg_namelen = 0;
202608adb7daSAl Viro 	}
202708adb7daSAl Viro 
2028c0371da6SAl Viro 	if (nr_segs > UIO_MAXIOV)
202908adb7daSAl Viro 		return -EMSGSIZE;
203008adb7daSAl Viro 
203108adb7daSAl Viro 	err = rw_copy_check_uvector(save_addr ? READ : WRITE,
2032c0371da6SAl Viro 				    uiov, nr_segs,
203308adb7daSAl Viro 				    UIO_FASTIOV, *iov, iov);
203408adb7daSAl Viro 	if (err >= 0)
2035c0371da6SAl Viro 		iov_iter_init(&kmsg->msg_iter, save_addr ? READ : WRITE,
2036c0371da6SAl Viro 			      *iov, nr_segs, err);
203708adb7daSAl Viro 	return err;
20381661bf36SDan Carpenter }
20391661bf36SDan Carpenter 
2040666547ffSAl Viro static int ___sys_sendmsg(struct socket *sock, struct user_msghdr __user *msg,
204195c96174SEric Dumazet 			 struct msghdr *msg_sys, unsigned int flags,
2042c71d8ebeSTetsuo Handa 			 struct used_address *used_address)
20431da177e4SLinus Torvalds {
204489bddce5SStephen Hemminger 	struct compat_msghdr __user *msg_compat =
204589bddce5SStephen Hemminger 	    (struct compat_msghdr __user *)msg;
2046230b1839SYOSHIFUJI Hideaki 	struct sockaddr_storage address;
20471da177e4SLinus Torvalds 	struct iovec iovstack[UIO_FASTIOV], *iov = iovstack;
2048b9d717a7SAlex Williamson 	unsigned char ctl[sizeof(struct cmsghdr) + 20]
2049b9d717a7SAlex Williamson 	    __attribute__ ((aligned(sizeof(__kernel_size_t))));
2050b9d717a7SAlex Williamson 	/* 20 is size of ipv6_pktinfo */
20511da177e4SLinus Torvalds 	unsigned char *ctl_buf = ctl;
205208adb7daSAl Viro 	int ctl_len, total_len;
205308adb7daSAl Viro 	ssize_t err;
20541da177e4SLinus Torvalds 
205508adb7daSAl Viro 	msg_sys->msg_name = &address;
20561da177e4SLinus Torvalds 
205708449320SAl Viro 	if (MSG_CMSG_COMPAT & flags)
205808adb7daSAl Viro 		err = get_compat_msghdr(msg_sys, msg_compat, NULL, &iov);
205908449320SAl Viro 	else
206008adb7daSAl Viro 		err = copy_msghdr_from_user(msg_sys, msg, NULL, &iov);
20611da177e4SLinus Torvalds 	if (err < 0)
20621da177e4SLinus Torvalds 		goto out_freeiov;
20631da177e4SLinus Torvalds 	total_len = err;
20641da177e4SLinus Torvalds 
20651da177e4SLinus Torvalds 	err = -ENOBUFS;
20661da177e4SLinus Torvalds 
2067228e548eSAnton Blanchard 	if (msg_sys->msg_controllen > INT_MAX)
20681da177e4SLinus Torvalds 		goto out_freeiov;
2069228e548eSAnton Blanchard 	ctl_len = msg_sys->msg_controllen;
20701da177e4SLinus Torvalds 	if ((MSG_CMSG_COMPAT & flags) && ctl_len) {
207189bddce5SStephen Hemminger 		err =
2072228e548eSAnton Blanchard 		    cmsghdr_from_user_compat_to_kern(msg_sys, sock->sk, ctl,
207389bddce5SStephen Hemminger 						     sizeof(ctl));
20741da177e4SLinus Torvalds 		if (err)
20751da177e4SLinus Torvalds 			goto out_freeiov;
2076228e548eSAnton Blanchard 		ctl_buf = msg_sys->msg_control;
2077228e548eSAnton Blanchard 		ctl_len = msg_sys->msg_controllen;
20781da177e4SLinus Torvalds 	} else if (ctl_len) {
207989bddce5SStephen Hemminger 		if (ctl_len > sizeof(ctl)) {
20801da177e4SLinus Torvalds 			ctl_buf = sock_kmalloc(sock->sk, ctl_len, GFP_KERNEL);
20811da177e4SLinus Torvalds 			if (ctl_buf == NULL)
20821da177e4SLinus Torvalds 				goto out_freeiov;
20831da177e4SLinus Torvalds 		}
20841da177e4SLinus Torvalds 		err = -EFAULT;
20851da177e4SLinus Torvalds 		/*
2086228e548eSAnton Blanchard 		 * Careful! Before this, msg_sys->msg_control contains a user pointer.
20871da177e4SLinus Torvalds 		 * Afterwards, it will be a kernel pointer. Thus the compiler-assisted
20881da177e4SLinus Torvalds 		 * checking falls down on this.
20891da177e4SLinus Torvalds 		 */
2090fb8621bbSNamhyung Kim 		if (copy_from_user(ctl_buf,
2091228e548eSAnton Blanchard 				   (void __user __force *)msg_sys->msg_control,
209289bddce5SStephen Hemminger 				   ctl_len))
20931da177e4SLinus Torvalds 			goto out_freectl;
2094228e548eSAnton Blanchard 		msg_sys->msg_control = ctl_buf;
20951da177e4SLinus Torvalds 	}
2096228e548eSAnton Blanchard 	msg_sys->msg_flags = flags;
20971da177e4SLinus Torvalds 
20981da177e4SLinus Torvalds 	if (sock->file->f_flags & O_NONBLOCK)
2099228e548eSAnton Blanchard 		msg_sys->msg_flags |= MSG_DONTWAIT;
2100c71d8ebeSTetsuo Handa 	/*
2101c71d8ebeSTetsuo Handa 	 * If this is sendmmsg() and current destination address is same as
2102c71d8ebeSTetsuo Handa 	 * previously succeeded address, omit asking LSM's decision.
2103c71d8ebeSTetsuo Handa 	 * used_address->name_len is initialized to UINT_MAX so that the first
2104c71d8ebeSTetsuo Handa 	 * destination address never matches.
2105c71d8ebeSTetsuo Handa 	 */
2106bc909d9dSMathieu Desnoyers 	if (used_address && msg_sys->msg_name &&
2107bc909d9dSMathieu Desnoyers 	    used_address->name_len == msg_sys->msg_namelen &&
2108bc909d9dSMathieu Desnoyers 	    !memcmp(&used_address->name, msg_sys->msg_name,
2109c71d8ebeSTetsuo Handa 		    used_address->name_len)) {
2110c71d8ebeSTetsuo Handa 		err = sock_sendmsg_nosec(sock, msg_sys, total_len);
2111c71d8ebeSTetsuo Handa 		goto out_freectl;
2112c71d8ebeSTetsuo Handa 	}
2113c71d8ebeSTetsuo Handa 	err = sock_sendmsg(sock, msg_sys, total_len);
2114c71d8ebeSTetsuo Handa 	/*
2115c71d8ebeSTetsuo Handa 	 * If this is sendmmsg() and sending to current destination address was
2116c71d8ebeSTetsuo Handa 	 * successful, remember it.
2117c71d8ebeSTetsuo Handa 	 */
2118c71d8ebeSTetsuo Handa 	if (used_address && err >= 0) {
2119c71d8ebeSTetsuo Handa 		used_address->name_len = msg_sys->msg_namelen;
2120bc909d9dSMathieu Desnoyers 		if (msg_sys->msg_name)
2121bc909d9dSMathieu Desnoyers 			memcpy(&used_address->name, msg_sys->msg_name,
2122c71d8ebeSTetsuo Handa 			       used_address->name_len);
2123c71d8ebeSTetsuo Handa 	}
21241da177e4SLinus Torvalds 
21251da177e4SLinus Torvalds out_freectl:
21261da177e4SLinus Torvalds 	if (ctl_buf != ctl)
21271da177e4SLinus Torvalds 		sock_kfree_s(sock->sk, ctl_buf, ctl_len);
21281da177e4SLinus Torvalds out_freeiov:
21291da177e4SLinus Torvalds 	if (iov != iovstack)
2130a74e9106SEric Dumazet 		kfree(iov);
2131228e548eSAnton Blanchard 	return err;
2132228e548eSAnton Blanchard }
2133228e548eSAnton Blanchard 
2134228e548eSAnton Blanchard /*
2135228e548eSAnton Blanchard  *	BSD sendmsg interface
2136228e548eSAnton Blanchard  */
2137228e548eSAnton Blanchard 
2138666547ffSAl Viro long __sys_sendmsg(int fd, struct user_msghdr __user *msg, unsigned flags)
2139228e548eSAnton Blanchard {
2140228e548eSAnton Blanchard 	int fput_needed, err;
2141228e548eSAnton Blanchard 	struct msghdr msg_sys;
21421be374a0SAndy Lutomirski 	struct socket *sock;
2143228e548eSAnton Blanchard 
21441be374a0SAndy Lutomirski 	sock = sockfd_lookup_light(fd, &err, &fput_needed);
2145228e548eSAnton Blanchard 	if (!sock)
2146228e548eSAnton Blanchard 		goto out;
2147228e548eSAnton Blanchard 
2148a7526eb5SAndy Lutomirski 	err = ___sys_sendmsg(sock, msg, &msg_sys, flags, NULL);
2149228e548eSAnton Blanchard 
21506cb153caSBenjamin LaHaise 	fput_light(sock->file, fput_needed);
21511da177e4SLinus Torvalds out:
21521da177e4SLinus Torvalds 	return err;
21531da177e4SLinus Torvalds }
21541da177e4SLinus Torvalds 
2155666547ffSAl Viro SYSCALL_DEFINE3(sendmsg, int, fd, struct user_msghdr __user *, msg, unsigned int, flags)
2156a7526eb5SAndy Lutomirski {
2157a7526eb5SAndy Lutomirski 	if (flags & MSG_CMSG_COMPAT)
2158a7526eb5SAndy Lutomirski 		return -EINVAL;
2159a7526eb5SAndy Lutomirski 	return __sys_sendmsg(fd, msg, flags);
2160a7526eb5SAndy Lutomirski }
2161a7526eb5SAndy Lutomirski 
2162228e548eSAnton Blanchard /*
2163228e548eSAnton Blanchard  *	Linux sendmmsg interface
2164228e548eSAnton Blanchard  */
2165228e548eSAnton Blanchard 
2166228e548eSAnton Blanchard int __sys_sendmmsg(int fd, struct mmsghdr __user *mmsg, unsigned int vlen,
2167228e548eSAnton Blanchard 		   unsigned int flags)
2168228e548eSAnton Blanchard {
2169228e548eSAnton Blanchard 	int fput_needed, err, datagrams;
2170228e548eSAnton Blanchard 	struct socket *sock;
2171228e548eSAnton Blanchard 	struct mmsghdr __user *entry;
2172228e548eSAnton Blanchard 	struct compat_mmsghdr __user *compat_entry;
2173228e548eSAnton Blanchard 	struct msghdr msg_sys;
2174c71d8ebeSTetsuo Handa 	struct used_address used_address;
2175228e548eSAnton Blanchard 
217698382f41SAnton Blanchard 	if (vlen > UIO_MAXIOV)
217798382f41SAnton Blanchard 		vlen = UIO_MAXIOV;
2178228e548eSAnton Blanchard 
2179228e548eSAnton Blanchard 	datagrams = 0;
2180228e548eSAnton Blanchard 
2181228e548eSAnton Blanchard 	sock = sockfd_lookup_light(fd, &err, &fput_needed);
2182228e548eSAnton Blanchard 	if (!sock)
2183228e548eSAnton Blanchard 		return err;
2184228e548eSAnton Blanchard 
2185c71d8ebeSTetsuo Handa 	used_address.name_len = UINT_MAX;
2186228e548eSAnton Blanchard 	entry = mmsg;
2187228e548eSAnton Blanchard 	compat_entry = (struct compat_mmsghdr __user *)mmsg;
2188728ffb86SAnton Blanchard 	err = 0;
2189228e548eSAnton Blanchard 
2190228e548eSAnton Blanchard 	while (datagrams < vlen) {
2191228e548eSAnton Blanchard 		if (MSG_CMSG_COMPAT & flags) {
2192666547ffSAl Viro 			err = ___sys_sendmsg(sock, (struct user_msghdr __user *)compat_entry,
2193c71d8ebeSTetsuo Handa 					     &msg_sys, flags, &used_address);
2194228e548eSAnton Blanchard 			if (err < 0)
2195228e548eSAnton Blanchard 				break;
2196228e548eSAnton Blanchard 			err = __put_user(err, &compat_entry->msg_len);
2197228e548eSAnton Blanchard 			++compat_entry;
2198228e548eSAnton Blanchard 		} else {
2199a7526eb5SAndy Lutomirski 			err = ___sys_sendmsg(sock,
2200666547ffSAl Viro 					     (struct user_msghdr __user *)entry,
2201c71d8ebeSTetsuo Handa 					     &msg_sys, flags, &used_address);
2202228e548eSAnton Blanchard 			if (err < 0)
2203228e548eSAnton Blanchard 				break;
2204228e548eSAnton Blanchard 			err = put_user(err, &entry->msg_len);
2205228e548eSAnton Blanchard 			++entry;
2206228e548eSAnton Blanchard 		}
2207228e548eSAnton Blanchard 
2208228e548eSAnton Blanchard 		if (err)
2209228e548eSAnton Blanchard 			break;
2210228e548eSAnton Blanchard 		++datagrams;
2211228e548eSAnton Blanchard 	}
2212228e548eSAnton Blanchard 
2213228e548eSAnton Blanchard 	fput_light(sock->file, fput_needed);
2214228e548eSAnton Blanchard 
2215728ffb86SAnton Blanchard 	/* We only return an error if no datagrams were able to be sent */
2216728ffb86SAnton Blanchard 	if (datagrams != 0)
2217228e548eSAnton Blanchard 		return datagrams;
2218228e548eSAnton Blanchard 
2219228e548eSAnton Blanchard 	return err;
2220228e548eSAnton Blanchard }
2221228e548eSAnton Blanchard 
2222228e548eSAnton Blanchard SYSCALL_DEFINE4(sendmmsg, int, fd, struct mmsghdr __user *, mmsg,
2223228e548eSAnton Blanchard 		unsigned int, vlen, unsigned int, flags)
2224228e548eSAnton Blanchard {
22251be374a0SAndy Lutomirski 	if (flags & MSG_CMSG_COMPAT)
22261be374a0SAndy Lutomirski 		return -EINVAL;
2227228e548eSAnton Blanchard 	return __sys_sendmmsg(fd, mmsg, vlen, flags);
2228228e548eSAnton Blanchard }
2229228e548eSAnton Blanchard 
2230666547ffSAl Viro static int ___sys_recvmsg(struct socket *sock, struct user_msghdr __user *msg,
223195c96174SEric Dumazet 			 struct msghdr *msg_sys, unsigned int flags, int nosec)
22321da177e4SLinus Torvalds {
223389bddce5SStephen Hemminger 	struct compat_msghdr __user *msg_compat =
223489bddce5SStephen Hemminger 	    (struct compat_msghdr __user *)msg;
22351da177e4SLinus Torvalds 	struct iovec iovstack[UIO_FASTIOV];
22361da177e4SLinus Torvalds 	struct iovec *iov = iovstack;
22371da177e4SLinus Torvalds 	unsigned long cmsg_ptr;
223808adb7daSAl Viro 	int total_len, len;
223908adb7daSAl Viro 	ssize_t err;
22401da177e4SLinus Torvalds 
22411da177e4SLinus Torvalds 	/* kernel mode address */
2242230b1839SYOSHIFUJI Hideaki 	struct sockaddr_storage addr;
22431da177e4SLinus Torvalds 
22441da177e4SLinus Torvalds 	/* user mode address pointers */
22451da177e4SLinus Torvalds 	struct sockaddr __user *uaddr;
224608adb7daSAl Viro 	int __user *uaddr_len = COMPAT_NAMELEN(msg);
22471da177e4SLinus Torvalds 
224808adb7daSAl Viro 	msg_sys->msg_name = &addr;
22491da177e4SLinus Torvalds 
2250f3d33426SHannes Frederic Sowa 	if (MSG_CMSG_COMPAT & flags)
225108adb7daSAl Viro 		err = get_compat_msghdr(msg_sys, msg_compat, &uaddr, &iov);
2252f3d33426SHannes Frederic Sowa 	else
225308adb7daSAl Viro 		err = copy_msghdr_from_user(msg_sys, msg, &uaddr, &iov);
22541da177e4SLinus Torvalds 	if (err < 0)
22551da177e4SLinus Torvalds 		goto out_freeiov;
22561da177e4SLinus Torvalds 	total_len = err;
22571da177e4SLinus Torvalds 
2258a2e27255SArnaldo Carvalho de Melo 	cmsg_ptr = (unsigned long)msg_sys->msg_control;
2259a2e27255SArnaldo Carvalho de Melo 	msg_sys->msg_flags = flags & (MSG_CMSG_CLOEXEC|MSG_CMSG_COMPAT);
22601da177e4SLinus Torvalds 
2261f3d33426SHannes Frederic Sowa 	/* We assume all kernel code knows the size of sockaddr_storage */
2262f3d33426SHannes Frederic Sowa 	msg_sys->msg_namelen = 0;
2263f3d33426SHannes Frederic Sowa 
22641da177e4SLinus Torvalds 	if (sock->file->f_flags & O_NONBLOCK)
22651da177e4SLinus Torvalds 		flags |= MSG_DONTWAIT;
2266a2e27255SArnaldo Carvalho de Melo 	err = (nosec ? sock_recvmsg_nosec : sock_recvmsg)(sock, msg_sys,
2267a2e27255SArnaldo Carvalho de Melo 							  total_len, flags);
22681da177e4SLinus Torvalds 	if (err < 0)
22691da177e4SLinus Torvalds 		goto out_freeiov;
22701da177e4SLinus Torvalds 	len = err;
22711da177e4SLinus Torvalds 
22721da177e4SLinus Torvalds 	if (uaddr != NULL) {
227343db362dSMaciej Żenczykowski 		err = move_addr_to_user(&addr,
2274a2e27255SArnaldo Carvalho de Melo 					msg_sys->msg_namelen, uaddr,
227589bddce5SStephen Hemminger 					uaddr_len);
22761da177e4SLinus Torvalds 		if (err < 0)
22771da177e4SLinus Torvalds 			goto out_freeiov;
22781da177e4SLinus Torvalds 	}
2279a2e27255SArnaldo Carvalho de Melo 	err = __put_user((msg_sys->msg_flags & ~MSG_CMSG_COMPAT),
228037f7f421SDavid S. Miller 			 COMPAT_FLAGS(msg));
22811da177e4SLinus Torvalds 	if (err)
22821da177e4SLinus Torvalds 		goto out_freeiov;
22831da177e4SLinus Torvalds 	if (MSG_CMSG_COMPAT & flags)
2284a2e27255SArnaldo Carvalho de Melo 		err = __put_user((unsigned long)msg_sys->msg_control - cmsg_ptr,
22851da177e4SLinus Torvalds 				 &msg_compat->msg_controllen);
22861da177e4SLinus Torvalds 	else
2287a2e27255SArnaldo Carvalho de Melo 		err = __put_user((unsigned long)msg_sys->msg_control - cmsg_ptr,
22881da177e4SLinus Torvalds 				 &msg->msg_controllen);
22891da177e4SLinus Torvalds 	if (err)
22901da177e4SLinus Torvalds 		goto out_freeiov;
22911da177e4SLinus Torvalds 	err = len;
22921da177e4SLinus Torvalds 
22931da177e4SLinus Torvalds out_freeiov:
22941da177e4SLinus Torvalds 	if (iov != iovstack)
2295a74e9106SEric Dumazet 		kfree(iov);
2296a2e27255SArnaldo Carvalho de Melo 	return err;
2297a2e27255SArnaldo Carvalho de Melo }
2298a2e27255SArnaldo Carvalho de Melo 
2299a2e27255SArnaldo Carvalho de Melo /*
2300a2e27255SArnaldo Carvalho de Melo  *	BSD recvmsg interface
2301a2e27255SArnaldo Carvalho de Melo  */
2302a2e27255SArnaldo Carvalho de Melo 
2303666547ffSAl Viro long __sys_recvmsg(int fd, struct user_msghdr __user *msg, unsigned flags)
2304a2e27255SArnaldo Carvalho de Melo {
2305a2e27255SArnaldo Carvalho de Melo 	int fput_needed, err;
2306a2e27255SArnaldo Carvalho de Melo 	struct msghdr msg_sys;
23071be374a0SAndy Lutomirski 	struct socket *sock;
2308a2e27255SArnaldo Carvalho de Melo 
23091be374a0SAndy Lutomirski 	sock = sockfd_lookup_light(fd, &err, &fput_needed);
2310a2e27255SArnaldo Carvalho de Melo 	if (!sock)
2311a2e27255SArnaldo Carvalho de Melo 		goto out;
2312a2e27255SArnaldo Carvalho de Melo 
2313a7526eb5SAndy Lutomirski 	err = ___sys_recvmsg(sock, msg, &msg_sys, flags, 0);
2314a2e27255SArnaldo Carvalho de Melo 
23156cb153caSBenjamin LaHaise 	fput_light(sock->file, fput_needed);
23161da177e4SLinus Torvalds out:
23171da177e4SLinus Torvalds 	return err;
23181da177e4SLinus Torvalds }
23191da177e4SLinus Torvalds 
2320666547ffSAl Viro SYSCALL_DEFINE3(recvmsg, int, fd, struct user_msghdr __user *, msg,
2321a7526eb5SAndy Lutomirski 		unsigned int, flags)
2322a7526eb5SAndy Lutomirski {
2323a7526eb5SAndy Lutomirski 	if (flags & MSG_CMSG_COMPAT)
2324a7526eb5SAndy Lutomirski 		return -EINVAL;
2325a7526eb5SAndy Lutomirski 	return __sys_recvmsg(fd, msg, flags);
2326a7526eb5SAndy Lutomirski }
2327a7526eb5SAndy Lutomirski 
2328a2e27255SArnaldo Carvalho de Melo /*
2329a2e27255SArnaldo Carvalho de Melo  *     Linux recvmmsg interface
2330a2e27255SArnaldo Carvalho de Melo  */
23311da177e4SLinus Torvalds 
2332a2e27255SArnaldo Carvalho de Melo int __sys_recvmmsg(int fd, struct mmsghdr __user *mmsg, unsigned int vlen,
2333a2e27255SArnaldo Carvalho de Melo 		   unsigned int flags, struct timespec *timeout)
2334a2e27255SArnaldo Carvalho de Melo {
2335a2e27255SArnaldo Carvalho de Melo 	int fput_needed, err, datagrams;
2336a2e27255SArnaldo Carvalho de Melo 	struct socket *sock;
2337a2e27255SArnaldo Carvalho de Melo 	struct mmsghdr __user *entry;
2338d7256d0eSJean-Mickael Guerin 	struct compat_mmsghdr __user *compat_entry;
2339a2e27255SArnaldo Carvalho de Melo 	struct msghdr msg_sys;
2340a2e27255SArnaldo Carvalho de Melo 	struct timespec end_time;
2341a2e27255SArnaldo Carvalho de Melo 
2342a2e27255SArnaldo Carvalho de Melo 	if (timeout &&
2343a2e27255SArnaldo Carvalho de Melo 	    poll_select_set_timeout(&end_time, timeout->tv_sec,
2344a2e27255SArnaldo Carvalho de Melo 				    timeout->tv_nsec))
2345a2e27255SArnaldo Carvalho de Melo 		return -EINVAL;
2346a2e27255SArnaldo Carvalho de Melo 
2347a2e27255SArnaldo Carvalho de Melo 	datagrams = 0;
2348a2e27255SArnaldo Carvalho de Melo 
2349a2e27255SArnaldo Carvalho de Melo 	sock = sockfd_lookup_light(fd, &err, &fput_needed);
2350a2e27255SArnaldo Carvalho de Melo 	if (!sock)
2351a2e27255SArnaldo Carvalho de Melo 		return err;
2352a2e27255SArnaldo Carvalho de Melo 
2353a2e27255SArnaldo Carvalho de Melo 	err = sock_error(sock->sk);
2354a2e27255SArnaldo Carvalho de Melo 	if (err)
2355a2e27255SArnaldo Carvalho de Melo 		goto out_put;
2356a2e27255SArnaldo Carvalho de Melo 
2357a2e27255SArnaldo Carvalho de Melo 	entry = mmsg;
2358d7256d0eSJean-Mickael Guerin 	compat_entry = (struct compat_mmsghdr __user *)mmsg;
2359a2e27255SArnaldo Carvalho de Melo 
2360a2e27255SArnaldo Carvalho de Melo 	while (datagrams < vlen) {
2361a2e27255SArnaldo Carvalho de Melo 		/*
2362a2e27255SArnaldo Carvalho de Melo 		 * No need to ask LSM for more than the first datagram.
2363a2e27255SArnaldo Carvalho de Melo 		 */
2364d7256d0eSJean-Mickael Guerin 		if (MSG_CMSG_COMPAT & flags) {
2365666547ffSAl Viro 			err = ___sys_recvmsg(sock, (struct user_msghdr __user *)compat_entry,
2366b9eb8b87SAnton Blanchard 					     &msg_sys, flags & ~MSG_WAITFORONE,
2367b9eb8b87SAnton Blanchard 					     datagrams);
2368d7256d0eSJean-Mickael Guerin 			if (err < 0)
2369d7256d0eSJean-Mickael Guerin 				break;
2370d7256d0eSJean-Mickael Guerin 			err = __put_user(err, &compat_entry->msg_len);
2371d7256d0eSJean-Mickael Guerin 			++compat_entry;
2372d7256d0eSJean-Mickael Guerin 		} else {
2373a7526eb5SAndy Lutomirski 			err = ___sys_recvmsg(sock,
2374666547ffSAl Viro 					     (struct user_msghdr __user *)entry,
2375b9eb8b87SAnton Blanchard 					     &msg_sys, flags & ~MSG_WAITFORONE,
2376b9eb8b87SAnton Blanchard 					     datagrams);
2377a2e27255SArnaldo Carvalho de Melo 			if (err < 0)
2378a2e27255SArnaldo Carvalho de Melo 				break;
2379a2e27255SArnaldo Carvalho de Melo 			err = put_user(err, &entry->msg_len);
2380d7256d0eSJean-Mickael Guerin 			++entry;
2381d7256d0eSJean-Mickael Guerin 		}
2382d7256d0eSJean-Mickael Guerin 
2383a2e27255SArnaldo Carvalho de Melo 		if (err)
2384a2e27255SArnaldo Carvalho de Melo 			break;
2385a2e27255SArnaldo Carvalho de Melo 		++datagrams;
2386a2e27255SArnaldo Carvalho de Melo 
238771c5c159SBrandon L Black 		/* MSG_WAITFORONE turns on MSG_DONTWAIT after one packet */
238871c5c159SBrandon L Black 		if (flags & MSG_WAITFORONE)
238971c5c159SBrandon L Black 			flags |= MSG_DONTWAIT;
239071c5c159SBrandon L Black 
2391a2e27255SArnaldo Carvalho de Melo 		if (timeout) {
2392a2e27255SArnaldo Carvalho de Melo 			ktime_get_ts(timeout);
2393a2e27255SArnaldo Carvalho de Melo 			*timeout = timespec_sub(end_time, *timeout);
2394a2e27255SArnaldo Carvalho de Melo 			if (timeout->tv_sec < 0) {
2395a2e27255SArnaldo Carvalho de Melo 				timeout->tv_sec = timeout->tv_nsec = 0;
2396a2e27255SArnaldo Carvalho de Melo 				break;
2397a2e27255SArnaldo Carvalho de Melo 			}
2398a2e27255SArnaldo Carvalho de Melo 
2399a2e27255SArnaldo Carvalho de Melo 			/* Timeout, return less than vlen datagrams */
2400a2e27255SArnaldo Carvalho de Melo 			if (timeout->tv_nsec == 0 && timeout->tv_sec == 0)
2401a2e27255SArnaldo Carvalho de Melo 				break;
2402a2e27255SArnaldo Carvalho de Melo 		}
2403a2e27255SArnaldo Carvalho de Melo 
2404a2e27255SArnaldo Carvalho de Melo 		/* Out of band data, return right away */
2405a2e27255SArnaldo Carvalho de Melo 		if (msg_sys.msg_flags & MSG_OOB)
2406a2e27255SArnaldo Carvalho de Melo 			break;
2407a2e27255SArnaldo Carvalho de Melo 	}
2408a2e27255SArnaldo Carvalho de Melo 
2409a2e27255SArnaldo Carvalho de Melo out_put:
2410a2e27255SArnaldo Carvalho de Melo 	fput_light(sock->file, fput_needed);
2411a2e27255SArnaldo Carvalho de Melo 
2412a2e27255SArnaldo Carvalho de Melo 	if (err == 0)
2413a2e27255SArnaldo Carvalho de Melo 		return datagrams;
2414a2e27255SArnaldo Carvalho de Melo 
2415a2e27255SArnaldo Carvalho de Melo 	if (datagrams != 0) {
2416a2e27255SArnaldo Carvalho de Melo 		/*
2417a2e27255SArnaldo Carvalho de Melo 		 * We may return less entries than requested (vlen) if the
2418a2e27255SArnaldo Carvalho de Melo 		 * sock is non block and there aren't enough datagrams...
2419a2e27255SArnaldo Carvalho de Melo 		 */
2420a2e27255SArnaldo Carvalho de Melo 		if (err != -EAGAIN) {
2421a2e27255SArnaldo Carvalho de Melo 			/*
2422a2e27255SArnaldo Carvalho de Melo 			 * ... or  if recvmsg returns an error after we
2423a2e27255SArnaldo Carvalho de Melo 			 * received some datagrams, where we record the
2424a2e27255SArnaldo Carvalho de Melo 			 * error to return on the next call or if the
2425a2e27255SArnaldo Carvalho de Melo 			 * app asks about it using getsockopt(SO_ERROR).
2426a2e27255SArnaldo Carvalho de Melo 			 */
2427a2e27255SArnaldo Carvalho de Melo 			sock->sk->sk_err = -err;
2428a2e27255SArnaldo Carvalho de Melo 		}
2429a2e27255SArnaldo Carvalho de Melo 
2430a2e27255SArnaldo Carvalho de Melo 		return datagrams;
2431a2e27255SArnaldo Carvalho de Melo 	}
2432a2e27255SArnaldo Carvalho de Melo 
2433a2e27255SArnaldo Carvalho de Melo 	return err;
2434a2e27255SArnaldo Carvalho de Melo }
2435a2e27255SArnaldo Carvalho de Melo 
2436a2e27255SArnaldo Carvalho de Melo SYSCALL_DEFINE5(recvmmsg, int, fd, struct mmsghdr __user *, mmsg,
2437a2e27255SArnaldo Carvalho de Melo 		unsigned int, vlen, unsigned int, flags,
2438a2e27255SArnaldo Carvalho de Melo 		struct timespec __user *, timeout)
2439a2e27255SArnaldo Carvalho de Melo {
2440a2e27255SArnaldo Carvalho de Melo 	int datagrams;
2441a2e27255SArnaldo Carvalho de Melo 	struct timespec timeout_sys;
2442a2e27255SArnaldo Carvalho de Melo 
24431be374a0SAndy Lutomirski 	if (flags & MSG_CMSG_COMPAT)
24441be374a0SAndy Lutomirski 		return -EINVAL;
24451be374a0SAndy Lutomirski 
2446a2e27255SArnaldo Carvalho de Melo 	if (!timeout)
2447a2e27255SArnaldo Carvalho de Melo 		return __sys_recvmmsg(fd, mmsg, vlen, flags, NULL);
2448a2e27255SArnaldo Carvalho de Melo 
2449a2e27255SArnaldo Carvalho de Melo 	if (copy_from_user(&timeout_sys, timeout, sizeof(timeout_sys)))
2450a2e27255SArnaldo Carvalho de Melo 		return -EFAULT;
2451a2e27255SArnaldo Carvalho de Melo 
2452a2e27255SArnaldo Carvalho de Melo 	datagrams = __sys_recvmmsg(fd, mmsg, vlen, flags, &timeout_sys);
2453a2e27255SArnaldo Carvalho de Melo 
2454a2e27255SArnaldo Carvalho de Melo 	if (datagrams > 0 &&
2455a2e27255SArnaldo Carvalho de Melo 	    copy_to_user(timeout, &timeout_sys, sizeof(timeout_sys)))
2456a2e27255SArnaldo Carvalho de Melo 		datagrams = -EFAULT;
2457a2e27255SArnaldo Carvalho de Melo 
2458a2e27255SArnaldo Carvalho de Melo 	return datagrams;
2459a2e27255SArnaldo Carvalho de Melo }
2460a2e27255SArnaldo Carvalho de Melo 
2461a2e27255SArnaldo Carvalho de Melo #ifdef __ARCH_WANT_SYS_SOCKETCALL
/*
 * Argument list sizes for sys_socketcall, in bytes, indexed by the
 * socketcall number.  AL(n) is the size of n unsigned long arguments.
 */
#define AL(x) ((x) * sizeof(unsigned long))
static const unsigned char nargs[21] = {
	AL(0),	/*  0 */
	AL(3),	/*  1 */
	AL(3),	/*  2 */
	AL(3),	/*  3 */
	AL(2),	/*  4 */
	AL(3),	/*  5 */
	AL(3),	/*  6 */
	AL(3),	/*  7 */
	AL(4),	/*  8 */
	AL(4),	/*  9 */
	AL(4),	/* 10 */
	AL(6),	/* 11 */
	AL(6),	/* 12 */
	AL(2),	/* 13 */
	AL(5),	/* 14 */
	AL(5),	/* 15 */
	AL(3),	/* 16 */
	AL(3),	/* 17 */
	AL(4),	/* 18 */
	AL(5),	/* 19 */
	AL(4),	/* 20 */
};

#undef AL
24721da177e4SLinus Torvalds 
24731da177e4SLinus Torvalds /*
24741da177e4SLinus Torvalds  *	System call vectors.
24751da177e4SLinus Torvalds  *
24761da177e4SLinus Torvalds  *	Argument checking cleaned up. Saved 20% in size.
24771da177e4SLinus Torvalds  *  This function doesn't need to set the kernel lock because
24781da177e4SLinus Torvalds  *  it is set by the callees.
24791da177e4SLinus Torvalds  */
24801da177e4SLinus Torvalds 
24813e0fa65fSHeiko Carstens SYSCALL_DEFINE2(socketcall, int, call, unsigned long __user *, args)
24821da177e4SLinus Torvalds {
24832950fa9dSChen Gang 	unsigned long a[AUDITSC_ARGS];
24841da177e4SLinus Torvalds 	unsigned long a0, a1;
24851da177e4SLinus Torvalds 	int err;
248647379052SArjan van de Ven 	unsigned int len;
24871da177e4SLinus Torvalds 
2488228e548eSAnton Blanchard 	if (call < 1 || call > SYS_SENDMMSG)
24891da177e4SLinus Torvalds 		return -EINVAL;
24901da177e4SLinus Torvalds 
249147379052SArjan van de Ven 	len = nargs[call];
249247379052SArjan van de Ven 	if (len > sizeof(a))
249347379052SArjan van de Ven 		return -EINVAL;
249447379052SArjan van de Ven 
24951da177e4SLinus Torvalds 	/* copy_from_user should be SMP safe. */
249647379052SArjan van de Ven 	if (copy_from_user(a, args, len))
24971da177e4SLinus Torvalds 		return -EFAULT;
24981da177e4SLinus Torvalds 
24992950fa9dSChen Gang 	err = audit_socketcall(nargs[call] / sizeof(unsigned long), a);
25002950fa9dSChen Gang 	if (err)
25012950fa9dSChen Gang 		return err;
25023ec3b2fbSDavid Woodhouse 
25031da177e4SLinus Torvalds 	a0 = a[0];
25041da177e4SLinus Torvalds 	a1 = a[1];
25051da177e4SLinus Torvalds 
250689bddce5SStephen Hemminger 	switch (call) {
25071da177e4SLinus Torvalds 	case SYS_SOCKET:
25081da177e4SLinus Torvalds 		err = sys_socket(a0, a1, a[2]);
25091da177e4SLinus Torvalds 		break;
25101da177e4SLinus Torvalds 	case SYS_BIND:
25111da177e4SLinus Torvalds 		err = sys_bind(a0, (struct sockaddr __user *)a1, a[2]);
25121da177e4SLinus Torvalds 		break;
25131da177e4SLinus Torvalds 	case SYS_CONNECT:
25141da177e4SLinus Torvalds 		err = sys_connect(a0, (struct sockaddr __user *)a1, a[2]);
25151da177e4SLinus Torvalds 		break;
25161da177e4SLinus Torvalds 	case SYS_LISTEN:
25171da177e4SLinus Torvalds 		err = sys_listen(a0, a1);
25181da177e4SLinus Torvalds 		break;
25191da177e4SLinus Torvalds 	case SYS_ACCEPT:
2520de11defeSUlrich Drepper 		err = sys_accept4(a0, (struct sockaddr __user *)a1,
2521aaca0bdcSUlrich Drepper 				  (int __user *)a[2], 0);
25221da177e4SLinus Torvalds 		break;
25231da177e4SLinus Torvalds 	case SYS_GETSOCKNAME:
252489bddce5SStephen Hemminger 		err =
252589bddce5SStephen Hemminger 		    sys_getsockname(a0, (struct sockaddr __user *)a1,
252689bddce5SStephen Hemminger 				    (int __user *)a[2]);
25271da177e4SLinus Torvalds 		break;
25281da177e4SLinus Torvalds 	case SYS_GETPEERNAME:
252989bddce5SStephen Hemminger 		err =
253089bddce5SStephen Hemminger 		    sys_getpeername(a0, (struct sockaddr __user *)a1,
253189bddce5SStephen Hemminger 				    (int __user *)a[2]);
25321da177e4SLinus Torvalds 		break;
25331da177e4SLinus Torvalds 	case SYS_SOCKETPAIR:
25341da177e4SLinus Torvalds 		err = sys_socketpair(a0, a1, a[2], (int __user *)a[3]);
25351da177e4SLinus Torvalds 		break;
25361da177e4SLinus Torvalds 	case SYS_SEND:
25371da177e4SLinus Torvalds 		err = sys_send(a0, (void __user *)a1, a[2], a[3]);
25381da177e4SLinus Torvalds 		break;
25391da177e4SLinus Torvalds 	case SYS_SENDTO:
25401da177e4SLinus Torvalds 		err = sys_sendto(a0, (void __user *)a1, a[2], a[3],
25411da177e4SLinus Torvalds 				 (struct sockaddr __user *)a[4], a[5]);
25421da177e4SLinus Torvalds 		break;
25431da177e4SLinus Torvalds 	case SYS_RECV:
25441da177e4SLinus Torvalds 		err = sys_recv(a0, (void __user *)a1, a[2], a[3]);
25451da177e4SLinus Torvalds 		break;
25461da177e4SLinus Torvalds 	case SYS_RECVFROM:
25471da177e4SLinus Torvalds 		err = sys_recvfrom(a0, (void __user *)a1, a[2], a[3],
254889bddce5SStephen Hemminger 				   (struct sockaddr __user *)a[4],
254989bddce5SStephen Hemminger 				   (int __user *)a[5]);
25501da177e4SLinus Torvalds 		break;
25511da177e4SLinus Torvalds 	case SYS_SHUTDOWN:
25521da177e4SLinus Torvalds 		err = sys_shutdown(a0, a1);
25531da177e4SLinus Torvalds 		break;
25541da177e4SLinus Torvalds 	case SYS_SETSOCKOPT:
25551da177e4SLinus Torvalds 		err = sys_setsockopt(a0, a1, a[2], (char __user *)a[3], a[4]);
25561da177e4SLinus Torvalds 		break;
25571da177e4SLinus Torvalds 	case SYS_GETSOCKOPT:
255889bddce5SStephen Hemminger 		err =
255989bddce5SStephen Hemminger 		    sys_getsockopt(a0, a1, a[2], (char __user *)a[3],
256089bddce5SStephen Hemminger 				   (int __user *)a[4]);
25611da177e4SLinus Torvalds 		break;
25621da177e4SLinus Torvalds 	case SYS_SENDMSG:
2563666547ffSAl Viro 		err = sys_sendmsg(a0, (struct user_msghdr __user *)a1, a[2]);
25641da177e4SLinus Torvalds 		break;
2565228e548eSAnton Blanchard 	case SYS_SENDMMSG:
2566228e548eSAnton Blanchard 		err = sys_sendmmsg(a0, (struct mmsghdr __user *)a1, a[2], a[3]);
2567228e548eSAnton Blanchard 		break;
25681da177e4SLinus Torvalds 	case SYS_RECVMSG:
2569666547ffSAl Viro 		err = sys_recvmsg(a0, (struct user_msghdr __user *)a1, a[2]);
25701da177e4SLinus Torvalds 		break;
2571a2e27255SArnaldo Carvalho de Melo 	case SYS_RECVMMSG:
2572a2e27255SArnaldo Carvalho de Melo 		err = sys_recvmmsg(a0, (struct mmsghdr __user *)a1, a[2], a[3],
2573a2e27255SArnaldo Carvalho de Melo 				   (struct timespec __user *)a[4]);
2574a2e27255SArnaldo Carvalho de Melo 		break;
2575de11defeSUlrich Drepper 	case SYS_ACCEPT4:
2576de11defeSUlrich Drepper 		err = sys_accept4(a0, (struct sockaddr __user *)a1,
2577de11defeSUlrich Drepper 				  (int __user *)a[2], a[3]);
2578aaca0bdcSUlrich Drepper 		break;
25791da177e4SLinus Torvalds 	default:
25801da177e4SLinus Torvalds 		err = -EINVAL;
25811da177e4SLinus Torvalds 		break;
25821da177e4SLinus Torvalds 	}
25831da177e4SLinus Torvalds 	return err;
25841da177e4SLinus Torvalds }
25851da177e4SLinus Torvalds 
25861da177e4SLinus Torvalds #endif				/* __ARCH_WANT_SYS_SOCKETCALL */
25871da177e4SLinus Torvalds 
258855737fdaSStephen Hemminger /**
258955737fdaSStephen Hemminger  *	sock_register - add a socket protocol handler
259055737fdaSStephen Hemminger  *	@ops: description of protocol
259155737fdaSStephen Hemminger  *
25921da177e4SLinus Torvalds  *	This function is called by a protocol handler that wants to
25931da177e4SLinus Torvalds  *	advertise its address family, and have it linked into the
2594e793c0f7SMasanari Iida  *	socket interface. The value ops->family corresponds to the
259555737fdaSStephen Hemminger  *	socket system call protocol family.
25961da177e4SLinus Torvalds  */
2597f0fd27d4SStephen Hemminger int sock_register(const struct net_proto_family *ops)
25981da177e4SLinus Torvalds {
25991da177e4SLinus Torvalds 	int err;
26001da177e4SLinus Torvalds 
26011da177e4SLinus Torvalds 	if (ops->family >= NPROTO) {
26023410f22eSYang Yingliang 		pr_crit("protocol %d >= NPROTO(%d)\n", ops->family, NPROTO);
26031da177e4SLinus Torvalds 		return -ENOBUFS;
26041da177e4SLinus Torvalds 	}
260555737fdaSStephen Hemminger 
260655737fdaSStephen Hemminger 	spin_lock(&net_family_lock);
2607190683a9SEric Dumazet 	if (rcu_dereference_protected(net_families[ops->family],
2608190683a9SEric Dumazet 				      lockdep_is_held(&net_family_lock)))
26091da177e4SLinus Torvalds 		err = -EEXIST;
261055737fdaSStephen Hemminger 	else {
2611cf778b00SEric Dumazet 		rcu_assign_pointer(net_families[ops->family], ops);
26121da177e4SLinus Torvalds 		err = 0;
26131da177e4SLinus Torvalds 	}
261455737fdaSStephen Hemminger 	spin_unlock(&net_family_lock);
261555737fdaSStephen Hemminger 
26163410f22eSYang Yingliang 	pr_info("NET: Registered protocol family %d\n", ops->family);
26171da177e4SLinus Torvalds 	return err;
26181da177e4SLinus Torvalds }
2619c6d409cfSEric Dumazet EXPORT_SYMBOL(sock_register);
26201da177e4SLinus Torvalds 
262155737fdaSStephen Hemminger /**
262255737fdaSStephen Hemminger  *	sock_unregister - remove a protocol handler
262355737fdaSStephen Hemminger  *	@family: protocol family to remove
262455737fdaSStephen Hemminger  *
26251da177e4SLinus Torvalds  *	This function is called by a protocol handler that wants to
26261da177e4SLinus Torvalds  *	remove its address family, and have it unlinked from the
262755737fdaSStephen Hemminger  *	new socket creation.
262855737fdaSStephen Hemminger  *
262955737fdaSStephen Hemminger  *	If protocol handler is a module, then it can use module reference
263055737fdaSStephen Hemminger  *	counts to protect against new references. If protocol handler is not
263155737fdaSStephen Hemminger  *	a module then it needs to provide its own protection in
263255737fdaSStephen Hemminger  *	the ops->create routine.
26331da177e4SLinus Torvalds  */
2634f0fd27d4SStephen Hemminger void sock_unregister(int family)
26351da177e4SLinus Torvalds {
2636f0fd27d4SStephen Hemminger 	BUG_ON(family < 0 || family >= NPROTO);
26371da177e4SLinus Torvalds 
263855737fdaSStephen Hemminger 	spin_lock(&net_family_lock);
2639a9b3cd7fSStephen Hemminger 	RCU_INIT_POINTER(net_families[family], NULL);
264055737fdaSStephen Hemminger 	spin_unlock(&net_family_lock);
264155737fdaSStephen Hemminger 
264255737fdaSStephen Hemminger 	synchronize_rcu();
264355737fdaSStephen Hemminger 
26443410f22eSYang Yingliang 	pr_info("NET: Unregistered protocol family %d\n", family);
26451da177e4SLinus Torvalds }
2646c6d409cfSEric Dumazet EXPORT_SYMBOL(sock_unregister);
26471da177e4SLinus Torvalds 
264877d76ea3SAndi Kleen static int __init sock_init(void)
26491da177e4SLinus Torvalds {
2650b3e19d92SNick Piggin 	int err;
26512ca794e5SEric W. Biederman 	/*
26522ca794e5SEric W. Biederman 	 *      Initialize the network sysctl infrastructure.
26532ca794e5SEric W. Biederman 	 */
26542ca794e5SEric W. Biederman 	err = net_sysctl_init();
26552ca794e5SEric W. Biederman 	if (err)
26562ca794e5SEric W. Biederman 		goto out;
2657b3e19d92SNick Piggin 
26581da177e4SLinus Torvalds 	/*
26591da177e4SLinus Torvalds 	 *      Initialize skbuff SLAB cache
26601da177e4SLinus Torvalds 	 */
26611da177e4SLinus Torvalds 	skb_init();
26621da177e4SLinus Torvalds 
26631da177e4SLinus Torvalds 	/*
26641da177e4SLinus Torvalds 	 *      Initialize the protocols module.
26651da177e4SLinus Torvalds 	 */
26661da177e4SLinus Torvalds 
26671da177e4SLinus Torvalds 	init_inodecache();
2668b3e19d92SNick Piggin 
2669b3e19d92SNick Piggin 	err = register_filesystem(&sock_fs_type);
2670b3e19d92SNick Piggin 	if (err)
2671b3e19d92SNick Piggin 		goto out_fs;
26721da177e4SLinus Torvalds 	sock_mnt = kern_mount(&sock_fs_type);
2673b3e19d92SNick Piggin 	if (IS_ERR(sock_mnt)) {
2674b3e19d92SNick Piggin 		err = PTR_ERR(sock_mnt);
2675b3e19d92SNick Piggin 		goto out_mount;
2676b3e19d92SNick Piggin 	}
267777d76ea3SAndi Kleen 
267877d76ea3SAndi Kleen 	/* The real protocol initialization is performed in later initcalls.
26791da177e4SLinus Torvalds 	 */
26801da177e4SLinus Torvalds 
26811da177e4SLinus Torvalds #ifdef CONFIG_NETFILTER
26826d11cfdbSPablo Neira Ayuso 	err = netfilter_init();
26836d11cfdbSPablo Neira Ayuso 	if (err)
26846d11cfdbSPablo Neira Ayuso 		goto out;
26851da177e4SLinus Torvalds #endif
2686cbeb321aSDavid S. Miller 
2687408eccceSDaniel Borkmann 	ptp_classifier_init();
2688c1f19b51SRichard Cochran 
2689b3e19d92SNick Piggin out:
2690b3e19d92SNick Piggin 	return err;
2691b3e19d92SNick Piggin 
2692b3e19d92SNick Piggin out_mount:
2693b3e19d92SNick Piggin 	unregister_filesystem(&sock_fs_type);
2694b3e19d92SNick Piggin out_fs:
2695b3e19d92SNick Piggin 	goto out;
26961da177e4SLinus Torvalds }
26971da177e4SLinus Torvalds 
269877d76ea3SAndi Kleen core_initcall(sock_init);	/* early initcall */
269977d76ea3SAndi Kleen 
27001da177e4SLinus Torvalds #ifdef CONFIG_PROC_FS
27011da177e4SLinus Torvalds void socket_seq_show(struct seq_file *seq)
27021da177e4SLinus Torvalds {
27031da177e4SLinus Torvalds 	int cpu;
27041da177e4SLinus Torvalds 	int counter = 0;
27051da177e4SLinus Torvalds 
27066f912042SKAMEZAWA Hiroyuki 	for_each_possible_cpu(cpu)
27071da177e4SLinus Torvalds 	    counter += per_cpu(sockets_in_use, cpu);
27081da177e4SLinus Torvalds 
27091da177e4SLinus Torvalds 	/* It can be negative, by the way. 8) */
27101da177e4SLinus Torvalds 	if (counter < 0)
27111da177e4SLinus Torvalds 		counter = 0;
27121da177e4SLinus Torvalds 
27131da177e4SLinus Torvalds 	seq_printf(seq, "sockets: used %d\n", counter);
27141da177e4SLinus Torvalds }
27151da177e4SLinus Torvalds #endif				/* CONFIG_PROC_FS */
27161da177e4SLinus Torvalds 
271789bbfc95SShaun Pereira #ifdef CONFIG_COMPAT
27186b96018bSArnd Bergmann static int do_siocgstamp(struct net *net, struct socket *sock,
2719644595f8SH. Peter Anvin 			 unsigned int cmd, void __user *up)
27207a229387SArnd Bergmann {
27217a229387SArnd Bergmann 	mm_segment_t old_fs = get_fs();
27227a229387SArnd Bergmann 	struct timeval ktv;
27237a229387SArnd Bergmann 	int err;
27247a229387SArnd Bergmann 
27257a229387SArnd Bergmann 	set_fs(KERNEL_DS);
27266b96018bSArnd Bergmann 	err = sock_do_ioctl(net, sock, cmd, (unsigned long)&ktv);
27277a229387SArnd Bergmann 	set_fs(old_fs);
2728644595f8SH. Peter Anvin 	if (!err)
2729ed6fe9d6SMikulas Patocka 		err = compat_put_timeval(&ktv, up);
2730644595f8SH. Peter Anvin 
27317a229387SArnd Bergmann 	return err;
27327a229387SArnd Bergmann }
27337a229387SArnd Bergmann 
27346b96018bSArnd Bergmann static int do_siocgstampns(struct net *net, struct socket *sock,
2735644595f8SH. Peter Anvin 			   unsigned int cmd, void __user *up)
27367a229387SArnd Bergmann {
27377a229387SArnd Bergmann 	mm_segment_t old_fs = get_fs();
27387a229387SArnd Bergmann 	struct timespec kts;
27397a229387SArnd Bergmann 	int err;
27407a229387SArnd Bergmann 
27417a229387SArnd Bergmann 	set_fs(KERNEL_DS);
27426b96018bSArnd Bergmann 	err = sock_do_ioctl(net, sock, cmd, (unsigned long)&kts);
27437a229387SArnd Bergmann 	set_fs(old_fs);
2744644595f8SH. Peter Anvin 	if (!err)
2745ed6fe9d6SMikulas Patocka 		err = compat_put_timespec(&kts, up);
2746644595f8SH. Peter Anvin 
27477a229387SArnd Bergmann 	return err;
27487a229387SArnd Bergmann }
27497a229387SArnd Bergmann 
27506b96018bSArnd Bergmann static int dev_ifname32(struct net *net, struct compat_ifreq __user *uifr32)
27517a229387SArnd Bergmann {
27527a229387SArnd Bergmann 	struct ifreq __user *uifr;
27537a229387SArnd Bergmann 	int err;
27547a229387SArnd Bergmann 
27557a229387SArnd Bergmann 	uifr = compat_alloc_user_space(sizeof(struct ifreq));
27566b96018bSArnd Bergmann 	if (copy_in_user(uifr, uifr32, sizeof(struct compat_ifreq)))
27577a229387SArnd Bergmann 		return -EFAULT;
27587a229387SArnd Bergmann 
27596b96018bSArnd Bergmann 	err = dev_ioctl(net, SIOCGIFNAME, uifr);
27607a229387SArnd Bergmann 	if (err)
27617a229387SArnd Bergmann 		return err;
27627a229387SArnd Bergmann 
27636b96018bSArnd Bergmann 	if (copy_in_user(uifr32, uifr, sizeof(struct compat_ifreq)))
27647a229387SArnd Bergmann 		return -EFAULT;
27657a229387SArnd Bergmann 
27667a229387SArnd Bergmann 	return 0;
27677a229387SArnd Bergmann }
27687a229387SArnd Bergmann 
27696b96018bSArnd Bergmann static int dev_ifconf(struct net *net, struct compat_ifconf __user *uifc32)
27707a229387SArnd Bergmann {
27716b96018bSArnd Bergmann 	struct compat_ifconf ifc32;
27727a229387SArnd Bergmann 	struct ifconf ifc;
27737a229387SArnd Bergmann 	struct ifconf __user *uifc;
27746b96018bSArnd Bergmann 	struct compat_ifreq __user *ifr32;
27757a229387SArnd Bergmann 	struct ifreq __user *ifr;
27767a229387SArnd Bergmann 	unsigned int i, j;
27777a229387SArnd Bergmann 	int err;
27787a229387SArnd Bergmann 
27796b96018bSArnd Bergmann 	if (copy_from_user(&ifc32, uifc32, sizeof(struct compat_ifconf)))
27807a229387SArnd Bergmann 		return -EFAULT;
27817a229387SArnd Bergmann 
278243da5f2eSMathias Krause 	memset(&ifc, 0, sizeof(ifc));
27837a229387SArnd Bergmann 	if (ifc32.ifcbuf == 0) {
27847a229387SArnd Bergmann 		ifc32.ifc_len = 0;
27857a229387SArnd Bergmann 		ifc.ifc_len = 0;
27867a229387SArnd Bergmann 		ifc.ifc_req = NULL;
27877a229387SArnd Bergmann 		uifc = compat_alloc_user_space(sizeof(struct ifconf));
27887a229387SArnd Bergmann 	} else {
27896b96018bSArnd Bergmann 		size_t len = ((ifc32.ifc_len / sizeof(struct compat_ifreq)) + 1) *
27907a229387SArnd Bergmann 			sizeof(struct ifreq);
27917a229387SArnd Bergmann 		uifc = compat_alloc_user_space(sizeof(struct ifconf) + len);
27927a229387SArnd Bergmann 		ifc.ifc_len = len;
27937a229387SArnd Bergmann 		ifr = ifc.ifc_req = (void __user *)(uifc + 1);
27947a229387SArnd Bergmann 		ifr32 = compat_ptr(ifc32.ifcbuf);
27956b96018bSArnd Bergmann 		for (i = 0; i < ifc32.ifc_len; i += sizeof(struct compat_ifreq)) {
27966b96018bSArnd Bergmann 			if (copy_in_user(ifr, ifr32, sizeof(struct compat_ifreq)))
27977a229387SArnd Bergmann 				return -EFAULT;
27987a229387SArnd Bergmann 			ifr++;
27997a229387SArnd Bergmann 			ifr32++;
28007a229387SArnd Bergmann 		}
28017a229387SArnd Bergmann 	}
28027a229387SArnd Bergmann 	if (copy_to_user(uifc, &ifc, sizeof(struct ifconf)))
28037a229387SArnd Bergmann 		return -EFAULT;
28047a229387SArnd Bergmann 
28056b96018bSArnd Bergmann 	err = dev_ioctl(net, SIOCGIFCONF, uifc);
28067a229387SArnd Bergmann 	if (err)
28077a229387SArnd Bergmann 		return err;
28087a229387SArnd Bergmann 
28097a229387SArnd Bergmann 	if (copy_from_user(&ifc, uifc, sizeof(struct ifconf)))
28107a229387SArnd Bergmann 		return -EFAULT;
28117a229387SArnd Bergmann 
28127a229387SArnd Bergmann 	ifr = ifc.ifc_req;
28137a229387SArnd Bergmann 	ifr32 = compat_ptr(ifc32.ifcbuf);
28147a229387SArnd Bergmann 	for (i = 0, j = 0;
28156b96018bSArnd Bergmann 	     i + sizeof(struct compat_ifreq) <= ifc32.ifc_len && j < ifc.ifc_len;
28166b96018bSArnd Bergmann 	     i += sizeof(struct compat_ifreq), j += sizeof(struct ifreq)) {
28176b96018bSArnd Bergmann 		if (copy_in_user(ifr32, ifr, sizeof(struct compat_ifreq)))
28187a229387SArnd Bergmann 			return -EFAULT;
28197a229387SArnd Bergmann 		ifr32++;
28207a229387SArnd Bergmann 		ifr++;
28217a229387SArnd Bergmann 	}
28227a229387SArnd Bergmann 
28237a229387SArnd Bergmann 	if (ifc32.ifcbuf == 0) {
28247a229387SArnd Bergmann 		/* Translate from 64-bit structure multiple to
28257a229387SArnd Bergmann 		 * a 32-bit one.
28267a229387SArnd Bergmann 		 */
28277a229387SArnd Bergmann 		i = ifc.ifc_len;
28286b96018bSArnd Bergmann 		i = ((i / sizeof(struct ifreq)) * sizeof(struct compat_ifreq));
28297a229387SArnd Bergmann 		ifc32.ifc_len = i;
28307a229387SArnd Bergmann 	} else {
28317a229387SArnd Bergmann 		ifc32.ifc_len = i;
28327a229387SArnd Bergmann 	}
28336b96018bSArnd Bergmann 	if (copy_to_user(uifc32, &ifc32, sizeof(struct compat_ifconf)))
28347a229387SArnd Bergmann 		return -EFAULT;
28357a229387SArnd Bergmann 
28367a229387SArnd Bergmann 	return 0;
28377a229387SArnd Bergmann }
28387a229387SArnd Bergmann 
28396b96018bSArnd Bergmann static int ethtool_ioctl(struct net *net, struct compat_ifreq __user *ifr32)
28407a229387SArnd Bergmann {
28413a7da39dSBen Hutchings 	struct compat_ethtool_rxnfc __user *compat_rxnfc;
28423a7da39dSBen Hutchings 	bool convert_in = false, convert_out = false;
28433a7da39dSBen Hutchings 	size_t buf_size = ALIGN(sizeof(struct ifreq), 8);
28443a7da39dSBen Hutchings 	struct ethtool_rxnfc __user *rxnfc;
28457a229387SArnd Bergmann 	struct ifreq __user *ifr;
28463a7da39dSBen Hutchings 	u32 rule_cnt = 0, actual_rule_cnt;
28473a7da39dSBen Hutchings 	u32 ethcmd;
28487a229387SArnd Bergmann 	u32 data;
28493a7da39dSBen Hutchings 	int ret;
28507a229387SArnd Bergmann 
28517a229387SArnd Bergmann 	if (get_user(data, &ifr32->ifr_ifru.ifru_data))
28527a229387SArnd Bergmann 		return -EFAULT;
28537a229387SArnd Bergmann 
28543a7da39dSBen Hutchings 	compat_rxnfc = compat_ptr(data);
28553a7da39dSBen Hutchings 
28563a7da39dSBen Hutchings 	if (get_user(ethcmd, &compat_rxnfc->cmd))
28577a229387SArnd Bergmann 		return -EFAULT;
28587a229387SArnd Bergmann 
28593a7da39dSBen Hutchings 	/* Most ethtool structures are defined without padding.
28603a7da39dSBen Hutchings 	 * Unfortunately struct ethtool_rxnfc is an exception.
28613a7da39dSBen Hutchings 	 */
28623a7da39dSBen Hutchings 	switch (ethcmd) {
28633a7da39dSBen Hutchings 	default:
28643a7da39dSBen Hutchings 		break;
28653a7da39dSBen Hutchings 	case ETHTOOL_GRXCLSRLALL:
28663a7da39dSBen Hutchings 		/* Buffer size is variable */
28673a7da39dSBen Hutchings 		if (get_user(rule_cnt, &compat_rxnfc->rule_cnt))
28683a7da39dSBen Hutchings 			return -EFAULT;
28693a7da39dSBen Hutchings 		if (rule_cnt > KMALLOC_MAX_SIZE / sizeof(u32))
28703a7da39dSBen Hutchings 			return -ENOMEM;
28713a7da39dSBen Hutchings 		buf_size += rule_cnt * sizeof(u32);
28723a7da39dSBen Hutchings 		/* fall through */
28733a7da39dSBen Hutchings 	case ETHTOOL_GRXRINGS:
28743a7da39dSBen Hutchings 	case ETHTOOL_GRXCLSRLCNT:
28753a7da39dSBen Hutchings 	case ETHTOOL_GRXCLSRULE:
287655664f32SBen Hutchings 	case ETHTOOL_SRXCLSRLINS:
28773a7da39dSBen Hutchings 		convert_out = true;
28783a7da39dSBen Hutchings 		/* fall through */
28793a7da39dSBen Hutchings 	case ETHTOOL_SRXCLSRLDEL:
28803a7da39dSBen Hutchings 		buf_size += sizeof(struct ethtool_rxnfc);
28813a7da39dSBen Hutchings 		convert_in = true;
28823a7da39dSBen Hutchings 		break;
28833a7da39dSBen Hutchings 	}
28843a7da39dSBen Hutchings 
28853a7da39dSBen Hutchings 	ifr = compat_alloc_user_space(buf_size);
2886954b1244SStephen Hemminger 	rxnfc = (void __user *)ifr + ALIGN(sizeof(struct ifreq), 8);
28873a7da39dSBen Hutchings 
28883a7da39dSBen Hutchings 	if (copy_in_user(&ifr->ifr_name, &ifr32->ifr_name, IFNAMSIZ))
28893a7da39dSBen Hutchings 		return -EFAULT;
28903a7da39dSBen Hutchings 
28913a7da39dSBen Hutchings 	if (put_user(convert_in ? rxnfc : compat_ptr(data),
28923a7da39dSBen Hutchings 		     &ifr->ifr_ifru.ifru_data))
28933a7da39dSBen Hutchings 		return -EFAULT;
28943a7da39dSBen Hutchings 
28953a7da39dSBen Hutchings 	if (convert_in) {
2896127fe533SAlexander Duyck 		/* We expect there to be holes between fs.m_ext and
28973a7da39dSBen Hutchings 		 * fs.ring_cookie and at the end of fs, but nowhere else.
28983a7da39dSBen Hutchings 		 */
2899127fe533SAlexander Duyck 		BUILD_BUG_ON(offsetof(struct compat_ethtool_rxnfc, fs.m_ext) +
2900127fe533SAlexander Duyck 			     sizeof(compat_rxnfc->fs.m_ext) !=
2901127fe533SAlexander Duyck 			     offsetof(struct ethtool_rxnfc, fs.m_ext) +
2902127fe533SAlexander Duyck 			     sizeof(rxnfc->fs.m_ext));
29033a7da39dSBen Hutchings 		BUILD_BUG_ON(
29043a7da39dSBen Hutchings 			offsetof(struct compat_ethtool_rxnfc, fs.location) -
29053a7da39dSBen Hutchings 			offsetof(struct compat_ethtool_rxnfc, fs.ring_cookie) !=
29063a7da39dSBen Hutchings 			offsetof(struct ethtool_rxnfc, fs.location) -
29073a7da39dSBen Hutchings 			offsetof(struct ethtool_rxnfc, fs.ring_cookie));
29083a7da39dSBen Hutchings 
29093a7da39dSBen Hutchings 		if (copy_in_user(rxnfc, compat_rxnfc,
2910954b1244SStephen Hemminger 				 (void __user *)(&rxnfc->fs.m_ext + 1) -
2911954b1244SStephen Hemminger 				 (void __user *)rxnfc) ||
29123a7da39dSBen Hutchings 		    copy_in_user(&rxnfc->fs.ring_cookie,
29133a7da39dSBen Hutchings 				 &compat_rxnfc->fs.ring_cookie,
2914954b1244SStephen Hemminger 				 (void __user *)(&rxnfc->fs.location + 1) -
2915954b1244SStephen Hemminger 				 (void __user *)&rxnfc->fs.ring_cookie) ||
29163a7da39dSBen Hutchings 		    copy_in_user(&rxnfc->rule_cnt, &compat_rxnfc->rule_cnt,
29173a7da39dSBen Hutchings 				 sizeof(rxnfc->rule_cnt)))
29183a7da39dSBen Hutchings 			return -EFAULT;
29193a7da39dSBen Hutchings 	}
29203a7da39dSBen Hutchings 
29213a7da39dSBen Hutchings 	ret = dev_ioctl(net, SIOCETHTOOL, ifr);
29223a7da39dSBen Hutchings 	if (ret)
29233a7da39dSBen Hutchings 		return ret;
29243a7da39dSBen Hutchings 
29253a7da39dSBen Hutchings 	if (convert_out) {
29263a7da39dSBen Hutchings 		if (copy_in_user(compat_rxnfc, rxnfc,
2927954b1244SStephen Hemminger 				 (const void __user *)(&rxnfc->fs.m_ext + 1) -
2928954b1244SStephen Hemminger 				 (const void __user *)rxnfc) ||
29293a7da39dSBen Hutchings 		    copy_in_user(&compat_rxnfc->fs.ring_cookie,
29303a7da39dSBen Hutchings 				 &rxnfc->fs.ring_cookie,
2931954b1244SStephen Hemminger 				 (const void __user *)(&rxnfc->fs.location + 1) -
2932954b1244SStephen Hemminger 				 (const void __user *)&rxnfc->fs.ring_cookie) ||
29333a7da39dSBen Hutchings 		    copy_in_user(&compat_rxnfc->rule_cnt, &rxnfc->rule_cnt,
29343a7da39dSBen Hutchings 				 sizeof(rxnfc->rule_cnt)))
29353a7da39dSBen Hutchings 			return -EFAULT;
29363a7da39dSBen Hutchings 
29373a7da39dSBen Hutchings 		if (ethcmd == ETHTOOL_GRXCLSRLALL) {
29383a7da39dSBen Hutchings 			/* As an optimisation, we only copy the actual
29393a7da39dSBen Hutchings 			 * number of rules that the underlying
29403a7da39dSBen Hutchings 			 * function returned.  Since Mallory might
29413a7da39dSBen Hutchings 			 * change the rule count in user memory, we
29423a7da39dSBen Hutchings 			 * check that it is less than the rule count
29433a7da39dSBen Hutchings 			 * originally given (as the user buffer size),
29443a7da39dSBen Hutchings 			 * which has been range-checked.
29453a7da39dSBen Hutchings 			 */
29463a7da39dSBen Hutchings 			if (get_user(actual_rule_cnt, &rxnfc->rule_cnt))
29473a7da39dSBen Hutchings 				return -EFAULT;
29483a7da39dSBen Hutchings 			if (actual_rule_cnt < rule_cnt)
29493a7da39dSBen Hutchings 				rule_cnt = actual_rule_cnt;
29503a7da39dSBen Hutchings 			if (copy_in_user(&compat_rxnfc->rule_locs[0],
29513a7da39dSBen Hutchings 					 &rxnfc->rule_locs[0],
29523a7da39dSBen Hutchings 					 rule_cnt * sizeof(u32)))
29533a7da39dSBen Hutchings 				return -EFAULT;
29543a7da39dSBen Hutchings 		}
29553a7da39dSBen Hutchings 	}
29563a7da39dSBen Hutchings 
29573a7da39dSBen Hutchings 	return 0;
29587a229387SArnd Bergmann }
29597a229387SArnd Bergmann 
29607a50a240SArnd Bergmann static int compat_siocwandev(struct net *net, struct compat_ifreq __user *uifr32)
29617a50a240SArnd Bergmann {
29627a50a240SArnd Bergmann 	void __user *uptr;
29637a50a240SArnd Bergmann 	compat_uptr_t uptr32;
29647a50a240SArnd Bergmann 	struct ifreq __user *uifr;
29657a50a240SArnd Bergmann 
29667a50a240SArnd Bergmann 	uifr = compat_alloc_user_space(sizeof(*uifr));
29677a50a240SArnd Bergmann 	if (copy_in_user(uifr, uifr32, sizeof(struct compat_ifreq)))
29687a50a240SArnd Bergmann 		return -EFAULT;
29697a50a240SArnd Bergmann 
29707a50a240SArnd Bergmann 	if (get_user(uptr32, &uifr32->ifr_settings.ifs_ifsu))
29717a50a240SArnd Bergmann 		return -EFAULT;
29727a50a240SArnd Bergmann 
29737a50a240SArnd Bergmann 	uptr = compat_ptr(uptr32);
29747a50a240SArnd Bergmann 
29757a50a240SArnd Bergmann 	if (put_user(uptr, &uifr->ifr_settings.ifs_ifsu.raw_hdlc))
29767a50a240SArnd Bergmann 		return -EFAULT;
29777a50a240SArnd Bergmann 
29787a50a240SArnd Bergmann 	return dev_ioctl(net, SIOCWANDEV, uifr);
29797a50a240SArnd Bergmann }
29807a50a240SArnd Bergmann 
29816b96018bSArnd Bergmann static int bond_ioctl(struct net *net, unsigned int cmd,
29826b96018bSArnd Bergmann 			 struct compat_ifreq __user *ifr32)
29837a229387SArnd Bergmann {
29847a229387SArnd Bergmann 	struct ifreq kifr;
29857a229387SArnd Bergmann 	mm_segment_t old_fs;
29867a229387SArnd Bergmann 	int err;
29877a229387SArnd Bergmann 
29887a229387SArnd Bergmann 	switch (cmd) {
29897a229387SArnd Bergmann 	case SIOCBONDENSLAVE:
29907a229387SArnd Bergmann 	case SIOCBONDRELEASE:
29917a229387SArnd Bergmann 	case SIOCBONDSETHWADDR:
29927a229387SArnd Bergmann 	case SIOCBONDCHANGEACTIVE:
29936b96018bSArnd Bergmann 		if (copy_from_user(&kifr, ifr32, sizeof(struct compat_ifreq)))
29947a229387SArnd Bergmann 			return -EFAULT;
29957a229387SArnd Bergmann 
29967a229387SArnd Bergmann 		old_fs = get_fs();
29977a229387SArnd Bergmann 		set_fs(KERNEL_DS);
2998c3f52ae6Sstephen hemminger 		err = dev_ioctl(net, cmd,
2999c3f52ae6Sstephen hemminger 				(struct ifreq __user __force *) &kifr);
30007a229387SArnd Bergmann 		set_fs(old_fs);
30017a229387SArnd Bergmann 
30027a229387SArnd Bergmann 		return err;
30037a229387SArnd Bergmann 	default:
300407d106d0SLinus Torvalds 		return -ENOIOCTLCMD;
3005ccbd6a5aSJoe Perches 	}
30067a229387SArnd Bergmann }
30077a229387SArnd Bergmann 
3008590d4693SBen Hutchings /* Handle ioctls that use ifreq::ifr_data and just need struct ifreq converted */
3009590d4693SBen Hutchings static int compat_ifr_data_ioctl(struct net *net, unsigned int cmd,
30106b96018bSArnd Bergmann 				 struct compat_ifreq __user *u_ifreq32)
30117a229387SArnd Bergmann {
30127a229387SArnd Bergmann 	struct ifreq __user *u_ifreq64;
30137a229387SArnd Bergmann 	char tmp_buf[IFNAMSIZ];
30147a229387SArnd Bergmann 	void __user *data64;
30157a229387SArnd Bergmann 	u32 data32;
30167a229387SArnd Bergmann 
30177a229387SArnd Bergmann 	if (copy_from_user(&tmp_buf[0], &(u_ifreq32->ifr_ifrn.ifrn_name[0]),
30187a229387SArnd Bergmann 			   IFNAMSIZ))
30197a229387SArnd Bergmann 		return -EFAULT;
3020417c3522SBen Hutchings 	if (get_user(data32, &u_ifreq32->ifr_ifru.ifru_data))
30217a229387SArnd Bergmann 		return -EFAULT;
30227a229387SArnd Bergmann 	data64 = compat_ptr(data32);
30237a229387SArnd Bergmann 
30247a229387SArnd Bergmann 	u_ifreq64 = compat_alloc_user_space(sizeof(*u_ifreq64));
30257a229387SArnd Bergmann 
30267a229387SArnd Bergmann 	if (copy_to_user(&u_ifreq64->ifr_ifrn.ifrn_name[0], &tmp_buf[0],
30277a229387SArnd Bergmann 			 IFNAMSIZ))
30287a229387SArnd Bergmann 		return -EFAULT;
3029417c3522SBen Hutchings 	if (put_user(data64, &u_ifreq64->ifr_ifru.ifru_data))
30307a229387SArnd Bergmann 		return -EFAULT;
30317a229387SArnd Bergmann 
30326b96018bSArnd Bergmann 	return dev_ioctl(net, cmd, u_ifreq64);
30337a229387SArnd Bergmann }
30347a229387SArnd Bergmann 
30356b96018bSArnd Bergmann static int dev_ifsioc(struct net *net, struct socket *sock,
30366b96018bSArnd Bergmann 			 unsigned int cmd, struct compat_ifreq __user *uifr32)
30377a229387SArnd Bergmann {
3038a2116ed2SArnd Bergmann 	struct ifreq __user *uifr;
30397a229387SArnd Bergmann 	int err;
30407a229387SArnd Bergmann 
3041a2116ed2SArnd Bergmann 	uifr = compat_alloc_user_space(sizeof(*uifr));
3042a2116ed2SArnd Bergmann 	if (copy_in_user(uifr, uifr32, sizeof(*uifr32)))
30437a229387SArnd Bergmann 		return -EFAULT;
3044a2116ed2SArnd Bergmann 
3045a2116ed2SArnd Bergmann 	err = sock_do_ioctl(net, sock, cmd, (unsigned long)uifr);
3046a2116ed2SArnd Bergmann 
30477a229387SArnd Bergmann 	if (!err) {
30487a229387SArnd Bergmann 		switch (cmd) {
30497a229387SArnd Bergmann 		case SIOCGIFFLAGS:
30507a229387SArnd Bergmann 		case SIOCGIFMETRIC:
30517a229387SArnd Bergmann 		case SIOCGIFMTU:
30527a229387SArnd Bergmann 		case SIOCGIFMEM:
30537a229387SArnd Bergmann 		case SIOCGIFHWADDR:
30547a229387SArnd Bergmann 		case SIOCGIFINDEX:
30557a229387SArnd Bergmann 		case SIOCGIFADDR:
30567a229387SArnd Bergmann 		case SIOCGIFBRDADDR:
30577a229387SArnd Bergmann 		case SIOCGIFDSTADDR:
30587a229387SArnd Bergmann 		case SIOCGIFNETMASK:
3059fab2532bSArnd Bergmann 		case SIOCGIFPFLAGS:
30607a229387SArnd Bergmann 		case SIOCGIFTXQLEN:
3061fab2532bSArnd Bergmann 		case SIOCGMIIPHY:
3062fab2532bSArnd Bergmann 		case SIOCGMIIREG:
3063a2116ed2SArnd Bergmann 			if (copy_in_user(uifr32, uifr, sizeof(*uifr32)))
3064a2116ed2SArnd Bergmann 				err = -EFAULT;
30657a229387SArnd Bergmann 			break;
3066a2116ed2SArnd Bergmann 		}
3067a2116ed2SArnd Bergmann 	}
3068a2116ed2SArnd Bergmann 	return err;
3069a2116ed2SArnd Bergmann }
3070a2116ed2SArnd Bergmann 
3071a2116ed2SArnd Bergmann static int compat_sioc_ifmap(struct net *net, unsigned int cmd,
3072a2116ed2SArnd Bergmann 			struct compat_ifreq __user *uifr32)
3073a2116ed2SArnd Bergmann {
3074a2116ed2SArnd Bergmann 	struct ifreq ifr;
3075a2116ed2SArnd Bergmann 	struct compat_ifmap __user *uifmap32;
3076a2116ed2SArnd Bergmann 	mm_segment_t old_fs;
3077a2116ed2SArnd Bergmann 	int err;
3078a2116ed2SArnd Bergmann 
3079a2116ed2SArnd Bergmann 	uifmap32 = &uifr32->ifr_ifru.ifru_map;
3080a2116ed2SArnd Bergmann 	err = copy_from_user(&ifr, uifr32, sizeof(ifr.ifr_name));
30813ddc5b46SMathieu Desnoyers 	err |= get_user(ifr.ifr_map.mem_start, &uifmap32->mem_start);
30823ddc5b46SMathieu Desnoyers 	err |= get_user(ifr.ifr_map.mem_end, &uifmap32->mem_end);
30833ddc5b46SMathieu Desnoyers 	err |= get_user(ifr.ifr_map.base_addr, &uifmap32->base_addr);
30843ddc5b46SMathieu Desnoyers 	err |= get_user(ifr.ifr_map.irq, &uifmap32->irq);
30853ddc5b46SMathieu Desnoyers 	err |= get_user(ifr.ifr_map.dma, &uifmap32->dma);
30863ddc5b46SMathieu Desnoyers 	err |= get_user(ifr.ifr_map.port, &uifmap32->port);
3087a2116ed2SArnd Bergmann 	if (err)
3088a2116ed2SArnd Bergmann 		return -EFAULT;
3089a2116ed2SArnd Bergmann 
3090a2116ed2SArnd Bergmann 	old_fs = get_fs();
3091a2116ed2SArnd Bergmann 	set_fs(KERNEL_DS);
3092c3f52ae6Sstephen hemminger 	err = dev_ioctl(net, cmd, (void  __user __force *)&ifr);
3093a2116ed2SArnd Bergmann 	set_fs(old_fs);
3094a2116ed2SArnd Bergmann 
3095a2116ed2SArnd Bergmann 	if (cmd == SIOCGIFMAP && !err) {
30967a229387SArnd Bergmann 		err = copy_to_user(uifr32, &ifr, sizeof(ifr.ifr_name));
30973ddc5b46SMathieu Desnoyers 		err |= put_user(ifr.ifr_map.mem_start, &uifmap32->mem_start);
30983ddc5b46SMathieu Desnoyers 		err |= put_user(ifr.ifr_map.mem_end, &uifmap32->mem_end);
30993ddc5b46SMathieu Desnoyers 		err |= put_user(ifr.ifr_map.base_addr, &uifmap32->base_addr);
31003ddc5b46SMathieu Desnoyers 		err |= put_user(ifr.ifr_map.irq, &uifmap32->irq);
31013ddc5b46SMathieu Desnoyers 		err |= put_user(ifr.ifr_map.dma, &uifmap32->dma);
31023ddc5b46SMathieu Desnoyers 		err |= put_user(ifr.ifr_map.port, &uifmap32->port);
31037a229387SArnd Bergmann 		if (err)
31047a229387SArnd Bergmann 			err = -EFAULT;
31057a229387SArnd Bergmann 	}
31067a229387SArnd Bergmann 	return err;
31077a229387SArnd Bergmann }
31087a229387SArnd Bergmann 
31097a229387SArnd Bergmann struct rtentry32 {
31107a229387SArnd Bergmann 	u32		rt_pad1;
31117a229387SArnd Bergmann 	struct sockaddr rt_dst;         /* target address               */
31127a229387SArnd Bergmann 	struct sockaddr rt_gateway;     /* gateway addr (RTF_GATEWAY)   */
31137a229387SArnd Bergmann 	struct sockaddr rt_genmask;     /* target network mask (IP)     */
31147a229387SArnd Bergmann 	unsigned short	rt_flags;
31157a229387SArnd Bergmann 	short		rt_pad2;
31167a229387SArnd Bergmann 	u32		rt_pad3;
31177a229387SArnd Bergmann 	unsigned char	rt_tos;
31187a229387SArnd Bergmann 	unsigned char	rt_class;
31197a229387SArnd Bergmann 	short		rt_pad4;
31207a229387SArnd Bergmann 	short		rt_metric;      /* +1 for binary compatibility! */
31217a229387SArnd Bergmann 	/* char * */ u32 rt_dev;        /* forcing the device at add    */
31227a229387SArnd Bergmann 	u32		rt_mtu;         /* per route MTU/Window         */
31237a229387SArnd Bergmann 	u32		rt_window;      /* Window clamping              */
31247a229387SArnd Bergmann 	unsigned short  rt_irtt;        /* Initial RTT                  */
31257a229387SArnd Bergmann };
31267a229387SArnd Bergmann 
31277a229387SArnd Bergmann struct in6_rtmsg32 {
31287a229387SArnd Bergmann 	struct in6_addr		rtmsg_dst;
31297a229387SArnd Bergmann 	struct in6_addr		rtmsg_src;
31307a229387SArnd Bergmann 	struct in6_addr		rtmsg_gateway;
31317a229387SArnd Bergmann 	u32			rtmsg_type;
31327a229387SArnd Bergmann 	u16			rtmsg_dst_len;
31337a229387SArnd Bergmann 	u16			rtmsg_src_len;
31347a229387SArnd Bergmann 	u32			rtmsg_metric;
31357a229387SArnd Bergmann 	u32			rtmsg_info;
31367a229387SArnd Bergmann 	u32			rtmsg_flags;
31377a229387SArnd Bergmann 	s32			rtmsg_ifindex;
31387a229387SArnd Bergmann };
31397a229387SArnd Bergmann 
31406b96018bSArnd Bergmann static int routing_ioctl(struct net *net, struct socket *sock,
31416b96018bSArnd Bergmann 			 unsigned int cmd, void __user *argp)
31427a229387SArnd Bergmann {
31437a229387SArnd Bergmann 	int ret;
31447a229387SArnd Bergmann 	void *r = NULL;
31457a229387SArnd Bergmann 	struct in6_rtmsg r6;
31467a229387SArnd Bergmann 	struct rtentry r4;
31477a229387SArnd Bergmann 	char devname[16];
31487a229387SArnd Bergmann 	u32 rtdev;
31497a229387SArnd Bergmann 	mm_segment_t old_fs = get_fs();
31507a229387SArnd Bergmann 
31516b96018bSArnd Bergmann 	if (sock && sock->sk && sock->sk->sk_family == AF_INET6) { /* ipv6 */
31526b96018bSArnd Bergmann 		struct in6_rtmsg32 __user *ur6 = argp;
31537a229387SArnd Bergmann 		ret = copy_from_user(&r6.rtmsg_dst, &(ur6->rtmsg_dst),
31547a229387SArnd Bergmann 			3 * sizeof(struct in6_addr));
31553ddc5b46SMathieu Desnoyers 		ret |= get_user(r6.rtmsg_type, &(ur6->rtmsg_type));
31563ddc5b46SMathieu Desnoyers 		ret |= get_user(r6.rtmsg_dst_len, &(ur6->rtmsg_dst_len));
31573ddc5b46SMathieu Desnoyers 		ret |= get_user(r6.rtmsg_src_len, &(ur6->rtmsg_src_len));
31583ddc5b46SMathieu Desnoyers 		ret |= get_user(r6.rtmsg_metric, &(ur6->rtmsg_metric));
31593ddc5b46SMathieu Desnoyers 		ret |= get_user(r6.rtmsg_info, &(ur6->rtmsg_info));
31603ddc5b46SMathieu Desnoyers 		ret |= get_user(r6.rtmsg_flags, &(ur6->rtmsg_flags));
31613ddc5b46SMathieu Desnoyers 		ret |= get_user(r6.rtmsg_ifindex, &(ur6->rtmsg_ifindex));
31627a229387SArnd Bergmann 
31637a229387SArnd Bergmann 		r = (void *) &r6;
31647a229387SArnd Bergmann 	} else { /* ipv4 */
31656b96018bSArnd Bergmann 		struct rtentry32 __user *ur4 = argp;
31667a229387SArnd Bergmann 		ret = copy_from_user(&r4.rt_dst, &(ur4->rt_dst),
31677a229387SArnd Bergmann 					3 * sizeof(struct sockaddr));
31683ddc5b46SMathieu Desnoyers 		ret |= get_user(r4.rt_flags, &(ur4->rt_flags));
31693ddc5b46SMathieu Desnoyers 		ret |= get_user(r4.rt_metric, &(ur4->rt_metric));
31703ddc5b46SMathieu Desnoyers 		ret |= get_user(r4.rt_mtu, &(ur4->rt_mtu));
31713ddc5b46SMathieu Desnoyers 		ret |= get_user(r4.rt_window, &(ur4->rt_window));
31723ddc5b46SMathieu Desnoyers 		ret |= get_user(r4.rt_irtt, &(ur4->rt_irtt));
31733ddc5b46SMathieu Desnoyers 		ret |= get_user(rtdev, &(ur4->rt_dev));
31747a229387SArnd Bergmann 		if (rtdev) {
31757a229387SArnd Bergmann 			ret |= copy_from_user(devname, compat_ptr(rtdev), 15);
3176c3f52ae6Sstephen hemminger 			r4.rt_dev = (char __user __force *)devname;
3177c3f52ae6Sstephen hemminger 			devname[15] = 0;
31787a229387SArnd Bergmann 		} else
31797a229387SArnd Bergmann 			r4.rt_dev = NULL;
31807a229387SArnd Bergmann 
31817a229387SArnd Bergmann 		r = (void *) &r4;
31827a229387SArnd Bergmann 	}
31837a229387SArnd Bergmann 
31847a229387SArnd Bergmann 	if (ret) {
31857a229387SArnd Bergmann 		ret = -EFAULT;
31867a229387SArnd Bergmann 		goto out;
31877a229387SArnd Bergmann 	}
31887a229387SArnd Bergmann 
31897a229387SArnd Bergmann 	set_fs(KERNEL_DS);
31906b96018bSArnd Bergmann 	ret = sock_do_ioctl(net, sock, cmd, (unsigned long) r);
31917a229387SArnd Bergmann 	set_fs(old_fs);
31927a229387SArnd Bergmann 
31937a229387SArnd Bergmann out:
31947a229387SArnd Bergmann 	return ret;
31957a229387SArnd Bergmann }
31967a229387SArnd Bergmann 
31977a229387SArnd Bergmann /* Since old style bridge ioctl's endup using SIOCDEVPRIVATE
31987a229387SArnd Bergmann  * for some operations; this forces use of the newer bridge-utils that
319925985edcSLucas De Marchi  * use compatible ioctls
32007a229387SArnd Bergmann  */
32016b96018bSArnd Bergmann static int old_bridge_ioctl(compat_ulong_t __user *argp)
32027a229387SArnd Bergmann {
32036b96018bSArnd Bergmann 	compat_ulong_t tmp;
32047a229387SArnd Bergmann 
32056b96018bSArnd Bergmann 	if (get_user(tmp, argp))
32067a229387SArnd Bergmann 		return -EFAULT;
32077a229387SArnd Bergmann 	if (tmp == BRCTL_GET_VERSION)
32087a229387SArnd Bergmann 		return BRCTL_VERSION + 1;
32097a229387SArnd Bergmann 	return -EINVAL;
32107a229387SArnd Bergmann }
32117a229387SArnd Bergmann 
32126b96018bSArnd Bergmann static int compat_sock_ioctl_trans(struct file *file, struct socket *sock,
32136b96018bSArnd Bergmann 			 unsigned int cmd, unsigned long arg)
32146b96018bSArnd Bergmann {
32156b96018bSArnd Bergmann 	void __user *argp = compat_ptr(arg);
32166b96018bSArnd Bergmann 	struct sock *sk = sock->sk;
32176b96018bSArnd Bergmann 	struct net *net = sock_net(sk);
32187a229387SArnd Bergmann 
32196b96018bSArnd Bergmann 	if (cmd >= SIOCDEVPRIVATE && cmd <= (SIOCDEVPRIVATE + 15))
3220590d4693SBen Hutchings 		return compat_ifr_data_ioctl(net, cmd, argp);
32217a229387SArnd Bergmann 
32226b96018bSArnd Bergmann 	switch (cmd) {
32236b96018bSArnd Bergmann 	case SIOCSIFBR:
32246b96018bSArnd Bergmann 	case SIOCGIFBR:
32256b96018bSArnd Bergmann 		return old_bridge_ioctl(argp);
32266b96018bSArnd Bergmann 	case SIOCGIFNAME:
32276b96018bSArnd Bergmann 		return dev_ifname32(net, argp);
32286b96018bSArnd Bergmann 	case SIOCGIFCONF:
32296b96018bSArnd Bergmann 		return dev_ifconf(net, argp);
32306b96018bSArnd Bergmann 	case SIOCETHTOOL:
32316b96018bSArnd Bergmann 		return ethtool_ioctl(net, argp);
32327a50a240SArnd Bergmann 	case SIOCWANDEV:
32337a50a240SArnd Bergmann 		return compat_siocwandev(net, argp);
3234a2116ed2SArnd Bergmann 	case SIOCGIFMAP:
3235a2116ed2SArnd Bergmann 	case SIOCSIFMAP:
3236a2116ed2SArnd Bergmann 		return compat_sioc_ifmap(net, cmd, argp);
32376b96018bSArnd Bergmann 	case SIOCBONDENSLAVE:
32386b96018bSArnd Bergmann 	case SIOCBONDRELEASE:
32396b96018bSArnd Bergmann 	case SIOCBONDSETHWADDR:
32406b96018bSArnd Bergmann 	case SIOCBONDCHANGEACTIVE:
32416b96018bSArnd Bergmann 		return bond_ioctl(net, cmd, argp);
32426b96018bSArnd Bergmann 	case SIOCADDRT:
32436b96018bSArnd Bergmann 	case SIOCDELRT:
32446b96018bSArnd Bergmann 		return routing_ioctl(net, sock, cmd, argp);
32456b96018bSArnd Bergmann 	case SIOCGSTAMP:
32466b96018bSArnd Bergmann 		return do_siocgstamp(net, sock, cmd, argp);
32476b96018bSArnd Bergmann 	case SIOCGSTAMPNS:
32486b96018bSArnd Bergmann 		return do_siocgstampns(net, sock, cmd, argp);
3249590d4693SBen Hutchings 	case SIOCBONDSLAVEINFOQUERY:
3250590d4693SBen Hutchings 	case SIOCBONDINFOQUERY:
3251a2116ed2SArnd Bergmann 	case SIOCSHWTSTAMP:
3252fd468c74SBen Hutchings 	case SIOCGHWTSTAMP:
3253590d4693SBen Hutchings 		return compat_ifr_data_ioctl(net, cmd, argp);
32547a229387SArnd Bergmann 
32556b96018bSArnd Bergmann 	case FIOSETOWN:
32566b96018bSArnd Bergmann 	case SIOCSPGRP:
32576b96018bSArnd Bergmann 	case FIOGETOWN:
32586b96018bSArnd Bergmann 	case SIOCGPGRP:
32596b96018bSArnd Bergmann 	case SIOCBRADDBR:
32606b96018bSArnd Bergmann 	case SIOCBRDELBR:
32616b96018bSArnd Bergmann 	case SIOCGIFVLAN:
32626b96018bSArnd Bergmann 	case SIOCSIFVLAN:
32636b96018bSArnd Bergmann 	case SIOCADDDLCI:
32646b96018bSArnd Bergmann 	case SIOCDELDLCI:
32656b96018bSArnd Bergmann 		return sock_ioctl(file, cmd, arg);
32666b96018bSArnd Bergmann 
32676b96018bSArnd Bergmann 	case SIOCGIFFLAGS:
32686b96018bSArnd Bergmann 	case SIOCSIFFLAGS:
32696b96018bSArnd Bergmann 	case SIOCGIFMETRIC:
32706b96018bSArnd Bergmann 	case SIOCSIFMETRIC:
32716b96018bSArnd Bergmann 	case SIOCGIFMTU:
32726b96018bSArnd Bergmann 	case SIOCSIFMTU:
32736b96018bSArnd Bergmann 	case SIOCGIFMEM:
32746b96018bSArnd Bergmann 	case SIOCSIFMEM:
32756b96018bSArnd Bergmann 	case SIOCGIFHWADDR:
32766b96018bSArnd Bergmann 	case SIOCSIFHWADDR:
32776b96018bSArnd Bergmann 	case SIOCADDMULTI:
32786b96018bSArnd Bergmann 	case SIOCDELMULTI:
32796b96018bSArnd Bergmann 	case SIOCGIFINDEX:
32806b96018bSArnd Bergmann 	case SIOCGIFADDR:
32816b96018bSArnd Bergmann 	case SIOCSIFADDR:
32826b96018bSArnd Bergmann 	case SIOCSIFHWBROADCAST:
32836b96018bSArnd Bergmann 	case SIOCDIFADDR:
32846b96018bSArnd Bergmann 	case SIOCGIFBRDADDR:
32856b96018bSArnd Bergmann 	case SIOCSIFBRDADDR:
32866b96018bSArnd Bergmann 	case SIOCGIFDSTADDR:
32876b96018bSArnd Bergmann 	case SIOCSIFDSTADDR:
32886b96018bSArnd Bergmann 	case SIOCGIFNETMASK:
32896b96018bSArnd Bergmann 	case SIOCSIFNETMASK:
32906b96018bSArnd Bergmann 	case SIOCSIFPFLAGS:
32916b96018bSArnd Bergmann 	case SIOCGIFPFLAGS:
32926b96018bSArnd Bergmann 	case SIOCGIFTXQLEN:
32936b96018bSArnd Bergmann 	case SIOCSIFTXQLEN:
32946b96018bSArnd Bergmann 	case SIOCBRADDIF:
32956b96018bSArnd Bergmann 	case SIOCBRDELIF:
32969177efd3SArnd Bergmann 	case SIOCSIFNAME:
32979177efd3SArnd Bergmann 	case SIOCGMIIPHY:
32989177efd3SArnd Bergmann 	case SIOCGMIIREG:
32999177efd3SArnd Bergmann 	case SIOCSMIIREG:
33006b96018bSArnd Bergmann 		return dev_ifsioc(net, sock, cmd, argp);
33019177efd3SArnd Bergmann 
33026b96018bSArnd Bergmann 	case SIOCSARP:
33036b96018bSArnd Bergmann 	case SIOCGARP:
33046b96018bSArnd Bergmann 	case SIOCDARP:
33056b96018bSArnd Bergmann 	case SIOCATMARK:
33069177efd3SArnd Bergmann 		return sock_do_ioctl(net, sock, cmd, arg);
33079177efd3SArnd Bergmann 	}
33089177efd3SArnd Bergmann 
33096b96018bSArnd Bergmann 	return -ENOIOCTLCMD;
33106b96018bSArnd Bergmann }
33117a229387SArnd Bergmann 
331295c96174SEric Dumazet static long compat_sock_ioctl(struct file *file, unsigned int cmd,
331389bbfc95SShaun Pereira 			      unsigned long arg)
331489bbfc95SShaun Pereira {
331589bbfc95SShaun Pereira 	struct socket *sock = file->private_data;
331689bbfc95SShaun Pereira 	int ret = -ENOIOCTLCMD;
331787de87d5SDavid S. Miller 	struct sock *sk;
331887de87d5SDavid S. Miller 	struct net *net;
331987de87d5SDavid S. Miller 
332087de87d5SDavid S. Miller 	sk = sock->sk;
332187de87d5SDavid S. Miller 	net = sock_net(sk);
332289bbfc95SShaun Pereira 
332389bbfc95SShaun Pereira 	if (sock->ops->compat_ioctl)
332489bbfc95SShaun Pereira 		ret = sock->ops->compat_ioctl(sock, cmd, arg);
332589bbfc95SShaun Pereira 
332687de87d5SDavid S. Miller 	if (ret == -ENOIOCTLCMD &&
332787de87d5SDavid S. Miller 	    (cmd >= SIOCIWFIRST && cmd <= SIOCIWLAST))
332887de87d5SDavid S. Miller 		ret = compat_wext_handle_ioctl(net, cmd, arg);
332987de87d5SDavid S. Miller 
33306b96018bSArnd Bergmann 	if (ret == -ENOIOCTLCMD)
33316b96018bSArnd Bergmann 		ret = compat_sock_ioctl_trans(file, sock, cmd, arg);
33326b96018bSArnd Bergmann 
333389bbfc95SShaun Pereira 	return ret;
333489bbfc95SShaun Pereira }
333589bbfc95SShaun Pereira #endif
333689bbfc95SShaun Pereira 
3337ac5a488eSSridhar Samudrala int kernel_bind(struct socket *sock, struct sockaddr *addr, int addrlen)
3338ac5a488eSSridhar Samudrala {
3339ac5a488eSSridhar Samudrala 	return sock->ops->bind(sock, addr, addrlen);
3340ac5a488eSSridhar Samudrala }
3341c6d409cfSEric Dumazet EXPORT_SYMBOL(kernel_bind);
3342ac5a488eSSridhar Samudrala 
3343ac5a488eSSridhar Samudrala int kernel_listen(struct socket *sock, int backlog)
3344ac5a488eSSridhar Samudrala {
3345ac5a488eSSridhar Samudrala 	return sock->ops->listen(sock, backlog);
3346ac5a488eSSridhar Samudrala }
3347c6d409cfSEric Dumazet EXPORT_SYMBOL(kernel_listen);
3348ac5a488eSSridhar Samudrala 
3349ac5a488eSSridhar Samudrala int kernel_accept(struct socket *sock, struct socket **newsock, int flags)
3350ac5a488eSSridhar Samudrala {
3351ac5a488eSSridhar Samudrala 	struct sock *sk = sock->sk;
3352ac5a488eSSridhar Samudrala 	int err;
3353ac5a488eSSridhar Samudrala 
3354ac5a488eSSridhar Samudrala 	err = sock_create_lite(sk->sk_family, sk->sk_type, sk->sk_protocol,
3355ac5a488eSSridhar Samudrala 			       newsock);
3356ac5a488eSSridhar Samudrala 	if (err < 0)
3357ac5a488eSSridhar Samudrala 		goto done;
3358ac5a488eSSridhar Samudrala 
3359ac5a488eSSridhar Samudrala 	err = sock->ops->accept(sock, *newsock, flags);
3360ac5a488eSSridhar Samudrala 	if (err < 0) {
3361ac5a488eSSridhar Samudrala 		sock_release(*newsock);
3362fa8705b0STony Battersby 		*newsock = NULL;
3363ac5a488eSSridhar Samudrala 		goto done;
3364ac5a488eSSridhar Samudrala 	}
3365ac5a488eSSridhar Samudrala 
3366ac5a488eSSridhar Samudrala 	(*newsock)->ops = sock->ops;
33671b08534eSWei Yongjun 	__module_get((*newsock)->ops->owner);
3368ac5a488eSSridhar Samudrala 
3369ac5a488eSSridhar Samudrala done:
3370ac5a488eSSridhar Samudrala 	return err;
3371ac5a488eSSridhar Samudrala }
3372c6d409cfSEric Dumazet EXPORT_SYMBOL(kernel_accept);
3373ac5a488eSSridhar Samudrala 
3374ac5a488eSSridhar Samudrala int kernel_connect(struct socket *sock, struct sockaddr *addr, int addrlen,
3375ac5a488eSSridhar Samudrala 		   int flags)
3376ac5a488eSSridhar Samudrala {
3377ac5a488eSSridhar Samudrala 	return sock->ops->connect(sock, addr, addrlen, flags);
3378ac5a488eSSridhar Samudrala }
3379c6d409cfSEric Dumazet EXPORT_SYMBOL(kernel_connect);
3380ac5a488eSSridhar Samudrala 
3381ac5a488eSSridhar Samudrala int kernel_getsockname(struct socket *sock, struct sockaddr *addr,
3382ac5a488eSSridhar Samudrala 			 int *addrlen)
3383ac5a488eSSridhar Samudrala {
3384ac5a488eSSridhar Samudrala 	return sock->ops->getname(sock, addr, addrlen, 0);
3385ac5a488eSSridhar Samudrala }
3386c6d409cfSEric Dumazet EXPORT_SYMBOL(kernel_getsockname);
3387ac5a488eSSridhar Samudrala 
3388ac5a488eSSridhar Samudrala int kernel_getpeername(struct socket *sock, struct sockaddr *addr,
3389ac5a488eSSridhar Samudrala 			 int *addrlen)
3390ac5a488eSSridhar Samudrala {
3391ac5a488eSSridhar Samudrala 	return sock->ops->getname(sock, addr, addrlen, 1);
3392ac5a488eSSridhar Samudrala }
3393c6d409cfSEric Dumazet EXPORT_SYMBOL(kernel_getpeername);
3394ac5a488eSSridhar Samudrala 
3395ac5a488eSSridhar Samudrala int kernel_getsockopt(struct socket *sock, int level, int optname,
3396ac5a488eSSridhar Samudrala 			char *optval, int *optlen)
3397ac5a488eSSridhar Samudrala {
3398ac5a488eSSridhar Samudrala 	mm_segment_t oldfs = get_fs();
3399fb8621bbSNamhyung Kim 	char __user *uoptval;
3400fb8621bbSNamhyung Kim 	int __user *uoptlen;
3401ac5a488eSSridhar Samudrala 	int err;
3402ac5a488eSSridhar Samudrala 
3403fb8621bbSNamhyung Kim 	uoptval = (char __user __force *) optval;
3404fb8621bbSNamhyung Kim 	uoptlen = (int __user __force *) optlen;
3405fb8621bbSNamhyung Kim 
3406ac5a488eSSridhar Samudrala 	set_fs(KERNEL_DS);
3407ac5a488eSSridhar Samudrala 	if (level == SOL_SOCKET)
3408fb8621bbSNamhyung Kim 		err = sock_getsockopt(sock, level, optname, uoptval, uoptlen);
3409ac5a488eSSridhar Samudrala 	else
3410fb8621bbSNamhyung Kim 		err = sock->ops->getsockopt(sock, level, optname, uoptval,
3411fb8621bbSNamhyung Kim 					    uoptlen);
3412ac5a488eSSridhar Samudrala 	set_fs(oldfs);
3413ac5a488eSSridhar Samudrala 	return err;
3414ac5a488eSSridhar Samudrala }
3415c6d409cfSEric Dumazet EXPORT_SYMBOL(kernel_getsockopt);
3416ac5a488eSSridhar Samudrala 
3417ac5a488eSSridhar Samudrala int kernel_setsockopt(struct socket *sock, int level, int optname,
3418b7058842SDavid S. Miller 			char *optval, unsigned int optlen)
3419ac5a488eSSridhar Samudrala {
3420ac5a488eSSridhar Samudrala 	mm_segment_t oldfs = get_fs();
3421fb8621bbSNamhyung Kim 	char __user *uoptval;
3422ac5a488eSSridhar Samudrala 	int err;
3423ac5a488eSSridhar Samudrala 
3424fb8621bbSNamhyung Kim 	uoptval = (char __user __force *) optval;
3425fb8621bbSNamhyung Kim 
3426ac5a488eSSridhar Samudrala 	set_fs(KERNEL_DS);
3427ac5a488eSSridhar Samudrala 	if (level == SOL_SOCKET)
3428fb8621bbSNamhyung Kim 		err = sock_setsockopt(sock, level, optname, uoptval, optlen);
3429ac5a488eSSridhar Samudrala 	else
3430fb8621bbSNamhyung Kim 		err = sock->ops->setsockopt(sock, level, optname, uoptval,
3431ac5a488eSSridhar Samudrala 					    optlen);
3432ac5a488eSSridhar Samudrala 	set_fs(oldfs);
3433ac5a488eSSridhar Samudrala 	return err;
3434ac5a488eSSridhar Samudrala }
3435c6d409cfSEric Dumazet EXPORT_SYMBOL(kernel_setsockopt);
3436ac5a488eSSridhar Samudrala 
3437ac5a488eSSridhar Samudrala int kernel_sendpage(struct socket *sock, struct page *page, int offset,
3438ac5a488eSSridhar Samudrala 		    size_t size, int flags)
3439ac5a488eSSridhar Samudrala {
3440ac5a488eSSridhar Samudrala 	if (sock->ops->sendpage)
3441ac5a488eSSridhar Samudrala 		return sock->ops->sendpage(sock, page, offset, size, flags);
3442ac5a488eSSridhar Samudrala 
3443ac5a488eSSridhar Samudrala 	return sock_no_sendpage(sock, page, offset, size, flags);
3444ac5a488eSSridhar Samudrala }
3445c6d409cfSEric Dumazet EXPORT_SYMBOL(kernel_sendpage);
3446ac5a488eSSridhar Samudrala 
3447ac5a488eSSridhar Samudrala int kernel_sock_ioctl(struct socket *sock, int cmd, unsigned long arg)
3448ac5a488eSSridhar Samudrala {
3449ac5a488eSSridhar Samudrala 	mm_segment_t oldfs = get_fs();
3450ac5a488eSSridhar Samudrala 	int err;
3451ac5a488eSSridhar Samudrala 
3452ac5a488eSSridhar Samudrala 	set_fs(KERNEL_DS);
3453ac5a488eSSridhar Samudrala 	err = sock->ops->ioctl(sock, cmd, arg);
3454ac5a488eSSridhar Samudrala 	set_fs(oldfs);
3455ac5a488eSSridhar Samudrala 
3456ac5a488eSSridhar Samudrala 	return err;
3457ac5a488eSSridhar Samudrala }
3458c6d409cfSEric Dumazet EXPORT_SYMBOL(kernel_sock_ioctl);
3459ac5a488eSSridhar Samudrala 
346091cf45f0STrond Myklebust int kernel_sock_shutdown(struct socket *sock, enum sock_shutdown_cmd how)
346191cf45f0STrond Myklebust {
346291cf45f0STrond Myklebust 	return sock->ops->shutdown(sock, how);
346391cf45f0STrond Myklebust }
346491cf45f0STrond Myklebust EXPORT_SYMBOL(kernel_sock_shutdown);
3465