xref: /openbmc/linux/drivers/net/loopback.c (revision de7d5084d82794a8e83afb994fcb07f82da3cd7b)
12874c5fdSThomas Gleixner // SPDX-License-Identifier: GPL-2.0-or-later
21da177e4SLinus Torvalds /*
31da177e4SLinus Torvalds  * INET		An implementation of the TCP/IP protocol suite for the LINUX
41da177e4SLinus Torvalds  *		operating system.  INET is implemented using the  BSD Socket
51da177e4SLinus Torvalds  *		interface as the means of communication with the user level.
61da177e4SLinus Torvalds  *
71da177e4SLinus Torvalds  *		Pseudo-driver for the loopback interface.
81da177e4SLinus Torvalds  *
91da177e4SLinus Torvalds  * Version:	@(#)loopback.c	1.0.4b	08/16/93
101da177e4SLinus Torvalds  *
1102c30a84SJesper Juhl  * Authors:	Ross Biro
121da177e4SLinus Torvalds  *		Fred N. van Kempen, <waltje@uWalt.NL.Mugnet.ORG>
131da177e4SLinus Torvalds  *		Donald Becker, <becker@scyld.com>
141da177e4SLinus Torvalds  *
151da177e4SLinus Torvalds  *		Alan Cox	:	Fixed oddments for NET3.014
161da177e4SLinus Torvalds  *		Alan Cox	:	Rejig for NET3.029 snap #3
171da177e4SLinus Torvalds  *		Alan Cox	:	Fixed NET3.029 bugs and sped up
181da177e4SLinus Torvalds  *		Larry McVoy	:	Tiny tweak to double performance
191da177e4SLinus Torvalds  *		Alan Cox	:	Backed out LMV's tweak - the linux mm
201da177e4SLinus Torvalds  *					can't take it...
211da177e4SLinus Torvalds  *              Michael Griffith:       Don't bother computing the checksums
221da177e4SLinus Torvalds  *                                      on packets received on the loopback
231da177e4SLinus Torvalds  *                                      interface.
241da177e4SLinus Torvalds  *		Alexey Kuznetsov:	Potential hang under some extreme
251da177e4SLinus Torvalds  *					cases removed.
261da177e4SLinus Torvalds  */
271da177e4SLinus Torvalds #include <linux/kernel.h>
281da177e4SLinus Torvalds #include <linux/jiffies.h>
291da177e4SLinus Torvalds #include <linux/module.h>
301da177e4SLinus Torvalds #include <linux/interrupt.h>
311da177e4SLinus Torvalds #include <linux/fs.h>
321da177e4SLinus Torvalds #include <linux/types.h>
331da177e4SLinus Torvalds #include <linux/string.h>
341da177e4SLinus Torvalds #include <linux/socket.h>
351da177e4SLinus Torvalds #include <linux/errno.h>
361da177e4SLinus Torvalds #include <linux/fcntl.h>
371da177e4SLinus Torvalds #include <linux/in.h>
381da177e4SLinus Torvalds 
397c0f6ba6SLinus Torvalds #include <linux/uaccess.h>
40b3407c8eSEzequiel Lara Gomez #include <linux/io.h>
411da177e4SLinus Torvalds 
421da177e4SLinus Torvalds #include <linux/inet.h>
431da177e4SLinus Torvalds #include <linux/netdevice.h>
441da177e4SLinus Torvalds #include <linux/etherdevice.h>
451da177e4SLinus Torvalds #include <linux/skbuff.h>
461da177e4SLinus Torvalds #include <linux/ethtool.h>
471da177e4SLinus Torvalds #include <net/sock.h>
481da177e4SLinus Torvalds #include <net/checksum.h>
491da177e4SLinus Torvalds #include <linux/if_ether.h>	/* For the statistics structure. */
501da177e4SLinus Torvalds #include <linux/if_arp.h>	/* For ARPHRD_ETHER */
511da177e4SLinus Torvalds #include <linux/ip.h>
521da177e4SLinus Torvalds #include <linux/tcp.h>
531da177e4SLinus Torvalds #include <linux/percpu.h>
546df014cfSEzequiel Lara Gomez #include <linux/net_tstamp.h>
552774c7abSEric W. Biederman #include <net/net_namespace.h>
565eaa0bd8SEric Dumazet #include <linux/u64_stats_sync.h>
571da177e4SLinus Torvalds 
/* blackhole_netdev - a device used for dsts that are marked expired.
 * This is a single global device (rather than one per network namespace):
 * it does not need to be per-ns and it is initialized at boot time.
 */
struct net_device *blackhole_netdev;
EXPORT_SYMBOL(blackhole_netdev);
644de83b88SMahesh Bandewar 
65b3407c8eSEzequiel Lara Gomez /* The higher levels take care of making this non-reentrant (it's
661da177e4SLinus Torvalds  * called with bh's disabled).
671da177e4SLinus Torvalds  */
6861357325SStephen Hemminger static netdev_tx_t loopback_xmit(struct sk_buff *skb,
6961357325SStephen Hemminger 				 struct net_device *dev)
701da177e4SLinus Torvalds {
7147d74275STejun Heo 	struct pcpu_lstats *lb_stats;
727eebb0b2SEric Dumazet 	int len;
731da177e4SLinus Torvalds 
746df014cfSEzequiel Lara Gomez 	skb_tx_timestamp(skb);
754c16128bSEric Dumazet 
764c16128bSEric Dumazet 	/* do not fool net_timestamp_check() with various clock bases */
774c16128bSEric Dumazet 	skb->tstamp = 0;
784c16128bSEric Dumazet 
791da177e4SLinus Torvalds 	skb_orphan(skb);
801da177e4SLinus Torvalds 
81794ed393SEric Dumazet 	/* Before queueing this packet to netif_rx(),
82794ed393SEric Dumazet 	 * make sure dst is refcounted.
83794ed393SEric Dumazet 	 */
84794ed393SEric Dumazet 	skb_dst_force(skb);
85794ed393SEric Dumazet 
861da177e4SLinus Torvalds 	skb->protocol = eth_type_trans(skb, dev);
871da177e4SLinus Torvalds 
889e0db4b1SEric W. Biederman 	/* it's OK to use per_cpu_ptr() because BHs are off */
89a7855c78SEric Dumazet 	lb_stats = this_cpu_ptr(dev->lstats);
901da177e4SLinus Torvalds 
917eebb0b2SEric Dumazet 	len = skb->len;
927eebb0b2SEric Dumazet 	if (likely(netif_rx(skb) == NET_RX_SUCCESS)) {
935eaa0bd8SEric Dumazet 		u64_stats_update_begin(&lb_stats->syncp);
947eebb0b2SEric Dumazet 		lb_stats->bytes += len;
957eebb0b2SEric Dumazet 		lb_stats->packets++;
965eaa0bd8SEric Dumazet 		u64_stats_update_end(&lb_stats->syncp);
97caf586e5SEric Dumazet 	}
981da177e4SLinus Torvalds 
996ed10654SPatrick McHardy 	return NETDEV_TX_OK;
1001da177e4SLinus Torvalds }
1011da177e4SLinus Torvalds 
102*de7d5084SEric Dumazet void dev_lstats_read(struct net_device *dev, u64 *packets, u64 *bytes)
1031da177e4SLinus Torvalds {
1041da177e4SLinus Torvalds 	int i;
1051da177e4SLinus Torvalds 
106*de7d5084SEric Dumazet 	*packets = 0;
107*de7d5084SEric Dumazet 	*bytes = 0;
108*de7d5084SEric Dumazet 
1090fed4846SKAMEZAWA Hiroyuki 	for_each_possible_cpu(i) {
1105175c378SEric Dumazet 		const struct pcpu_lstats *lb_stats;
1115eaa0bd8SEric Dumazet 		u64 tbytes, tpackets;
1125eaa0bd8SEric Dumazet 		unsigned int start;
1131da177e4SLinus Torvalds 
114a7855c78SEric Dumazet 		lb_stats = per_cpu_ptr(dev->lstats, i);
1155eaa0bd8SEric Dumazet 		do {
11657a7744eSEric W. Biederman 			start = u64_stats_fetch_begin_irq(&lb_stats->syncp);
1175eaa0bd8SEric Dumazet 			tpackets = lb_stats->packets;
118*de7d5084SEric Dumazet 			tbytes = lb_stats->bytes;
11957a7744eSEric W. Biederman 		} while (u64_stats_fetch_retry_irq(&lb_stats->syncp, start));
120*de7d5084SEric Dumazet 		*bytes   += tbytes;
121*de7d5084SEric Dumazet 		*packets += tpackets;
1221da177e4SLinus Torvalds 	}
123*de7d5084SEric Dumazet }
124*de7d5084SEric Dumazet EXPORT_SYMBOL(dev_lstats_read);
125*de7d5084SEric Dumazet 
126*de7d5084SEric Dumazet static void loopback_get_stats64(struct net_device *dev,
127*de7d5084SEric Dumazet 				 struct rtnl_link_stats64 *stats)
128*de7d5084SEric Dumazet {
129*de7d5084SEric Dumazet 	u64 packets, bytes;
130*de7d5084SEric Dumazet 
131*de7d5084SEric Dumazet 	dev_lstats_read(dev, &packets, &bytes);
132*de7d5084SEric Dumazet 
1335175c378SEric Dumazet 	stats->rx_packets = packets;
1345175c378SEric Dumazet 	stats->tx_packets = packets;
1355175c378SEric Dumazet 	stats->rx_bytes   = bytes;
1365175c378SEric Dumazet 	stats->tx_bytes   = bytes;
1371da177e4SLinus Torvalds }
1381da177e4SLinus Torvalds 
1397fa6b066SStephen Hemminger static u32 always_on(struct net_device *dev)
1401da177e4SLinus Torvalds {
1411da177e4SLinus Torvalds 	return 1;
1421da177e4SLinus Torvalds }
1431da177e4SLinus Torvalds 
1447282d491SJeff Garzik static const struct ethtool_ops loopback_ethtool_ops = {
1457fa6b066SStephen Hemminger 	.get_link		= always_on,
146af730342SJulian Wiedmann 	.get_ts_info		= ethtool_op_get_ts_info,
1471da177e4SLinus Torvalds };
1481da177e4SLinus Torvalds 
1495f6d88b9SEric W. Biederman static int loopback_dev_init(struct net_device *dev)
1505f6d88b9SEric W. Biederman {
1511c213bd2SWANG Cong 	dev->lstats = netdev_alloc_pcpu_stats(struct pcpu_lstats);
152a7855c78SEric Dumazet 	if (!dev->lstats)
1535f6d88b9SEric W. Biederman 		return -ENOMEM;
1545f6d88b9SEric W. Biederman 	return 0;
1555f6d88b9SEric W. Biederman }
1565f6d88b9SEric W. Biederman 
1575f6d88b9SEric W. Biederman static void loopback_dev_free(struct net_device *dev)
1585f6d88b9SEric W. Biederman {
159e05e9070SEric W. Biederman 	dev_net(dev)->loopback_dev = NULL;
160a7855c78SEric Dumazet 	free_percpu(dev->lstats);
1615f6d88b9SEric W. Biederman }
1625f6d88b9SEric W. Biederman 
163c02373bfSStephen Hemminger static const struct net_device_ops loopback_ops = {
164c02373bfSStephen Hemminger 	.ndo_init        = loopback_dev_init,
16500829823SStephen Hemminger 	.ndo_start_xmit  = loopback_xmit,
1666b10de38SEric Dumazet 	.ndo_get_stats64 = loopback_get_stats64,
16725f929fbSWANG Cong 	.ndo_set_mac_address = eth_mac_addr,
168c02373bfSStephen Hemminger };
169c02373bfSStephen Hemminger 
1704de83b88SMahesh Bandewar static void gen_lo_setup(struct net_device *dev,
1714de83b88SMahesh Bandewar 			 unsigned int mtu,
1724de83b88SMahesh Bandewar 			 const struct ethtool_ops *eth_ops,
1734de83b88SMahesh Bandewar 			 const struct header_ops *hdr_ops,
1744de83b88SMahesh Bandewar 			 const struct net_device_ops *dev_ops,
1754de83b88SMahesh Bandewar 			 void (*dev_destructor)(struct net_device *dev))
176854d8363SDaniel Lezcano {
1774de83b88SMahesh Bandewar 	dev->mtu		= mtu;
178854d8363SDaniel Lezcano 	dev->hard_header_len	= ETH_HLEN;	/* 14	*/
179217e6fa2SWillem de Bruijn 	dev->min_header_len	= ETH_HLEN;	/* 14	*/
180854d8363SDaniel Lezcano 	dev->addr_len		= ETH_ALEN;	/* 6	*/
181854d8363SDaniel Lezcano 	dev->type		= ARPHRD_LOOPBACK;	/* 0x0001*/
182854d8363SDaniel Lezcano 	dev->flags		= IFF_LOOPBACK;
183e65db2b7SPhil Sutter 	dev->priv_flags		|= IFF_LIVE_ADDR_CHANGE | IFF_NO_QUEUE;
18402875878SEric Dumazet 	netif_keep_dst(dev);
185f6c382fcSMarcelo Ricardo Leitner 	dev->hw_features	= NETIF_F_GSO_SOFTWARE;
186854d8363SDaniel Lezcano 	dev->features		= NETIF_F_SG | NETIF_F_FRAGLIST
187f6c382fcSMarcelo Ricardo Leitner 		| NETIF_F_GSO_SOFTWARE
18834324dc2SMichał Mirosław 		| NETIF_F_HW_CSUM
189cf0bdefdSMichał Mirosław 		| NETIF_F_RXCSUM
19053692b1dSTom Herbert 		| NETIF_F_SCTP_CRC
191854d8363SDaniel Lezcano 		| NETIF_F_HIGHDMA
192ce286d32SEric W. Biederman 		| NETIF_F_LLTX
1930553c891SKrishna Kumar 		| NETIF_F_NETNS_LOCAL
194eed2a12fSMahesh Bandewar 		| NETIF_F_VLAN_CHALLENGED
195eed2a12fSMahesh Bandewar 		| NETIF_F_LOOPBACK;
1964de83b88SMahesh Bandewar 	dev->ethtool_ops	= eth_ops;
1974de83b88SMahesh Bandewar 	dev->header_ops		= hdr_ops;
1984de83b88SMahesh Bandewar 	dev->netdev_ops		= dev_ops;
199cf124db5SDavid S. Miller 	dev->needs_free_netdev	= true;
2004de83b88SMahesh Bandewar 	dev->priv_destructor	= dev_destructor;
2014de83b88SMahesh Bandewar }
2024de83b88SMahesh Bandewar 
2034de83b88SMahesh Bandewar /* The loopback device is special. There is only one instance
2044de83b88SMahesh Bandewar  * per network namespace.
2054de83b88SMahesh Bandewar  */
2064de83b88SMahesh Bandewar static void loopback_setup(struct net_device *dev)
2074de83b88SMahesh Bandewar {
2084de83b88SMahesh Bandewar 	gen_lo_setup(dev, (64 * 1024), &loopback_ethtool_ops, &eth_header_ops,
2094de83b88SMahesh Bandewar 		     &loopback_ops, loopback_dev_free);
210854d8363SDaniel Lezcano }
211de3cb747SDaniel Lezcano 
21222783649SRalf Baechle /* Setup and register the loopback device. */
2134665079cSPavel Emelyanov static __net_init int loopback_net_init(struct net *net)
2141da177e4SLinus Torvalds {
215854d8363SDaniel Lezcano 	struct net_device *dev;
216854d8363SDaniel Lezcano 	int err;
217aeed9e82SHerbert Xu 
218854d8363SDaniel Lezcano 	err = -ENOMEM;
219c835a677STom Gundersen 	dev = alloc_netdev(0, "lo", NET_NAME_UNKNOWN, loopback_setup);
220854d8363SDaniel Lezcano 	if (!dev)
221854d8363SDaniel Lezcano 		goto out;
222854d8363SDaniel Lezcano 
223c346dca1SYOSHIFUJI Hideaki 	dev_net_set(dev, net);
224854d8363SDaniel Lezcano 	err = register_netdev(dev);
225854d8363SDaniel Lezcano 	if (err)
226854d8363SDaniel Lezcano 		goto out_free_netdev;
227854d8363SDaniel Lezcano 
2281fb9489bSPavel Emelyanov 	BUG_ON(dev->ifindex != LOOPBACK_IFINDEX);
2292774c7abSEric W. Biederman 	net->loopback_dev = dev;
2309d6dda32SPavel Emelyanov 	return 0;
231854d8363SDaniel Lezcano 
232854d8363SDaniel Lezcano out_free_netdev:
233854d8363SDaniel Lezcano 	free_netdev(dev);
2349d6dda32SPavel Emelyanov out:
23509ad9bc7SOctavian Purdila 	if (net_eq(net, &init_net))
2369d6dda32SPavel Emelyanov 		panic("loopback: Failed to register netdevice: %d\n", err);
2379d6dda32SPavel Emelyanov 	return err;
238854d8363SDaniel Lezcano }
23960903f2cSAdrian Bunk 
240505d4f73SEric W. Biederman /* Registered in net/core/dev.c */
241505d4f73SEric W. Biederman struct pernet_operations __net_initdata loopback_net_ops = {
2422774c7abSEric W. Biederman 	.init = loopback_net_init,
2432774c7abSEric W. Biederman };
2444de83b88SMahesh Bandewar 
2454de83b88SMahesh Bandewar /* blackhole netdevice */
2464de83b88SMahesh Bandewar static netdev_tx_t blackhole_netdev_xmit(struct sk_buff *skb,
2474de83b88SMahesh Bandewar 					 struct net_device *dev)
2484de83b88SMahesh Bandewar {
2494de83b88SMahesh Bandewar 	kfree_skb(skb);
2504de83b88SMahesh Bandewar 	net_warn_ratelimited("%s(): Dropping skb.\n", __func__);
2514de83b88SMahesh Bandewar 	return NETDEV_TX_OK;
2524de83b88SMahesh Bandewar }
2534de83b88SMahesh Bandewar 
2544de83b88SMahesh Bandewar static const struct net_device_ops blackhole_netdev_ops = {
2554de83b88SMahesh Bandewar 	.ndo_start_xmit = blackhole_netdev_xmit,
2564de83b88SMahesh Bandewar };
2574de83b88SMahesh Bandewar 
2584de83b88SMahesh Bandewar /* This is a dst-dummy device used specifically for invalidated
2594de83b88SMahesh Bandewar  * DSTs and unlike loopback, this is not per-ns.
2604de83b88SMahesh Bandewar  */
2614de83b88SMahesh Bandewar static void blackhole_netdev_setup(struct net_device *dev)
2624de83b88SMahesh Bandewar {
2634de83b88SMahesh Bandewar 	gen_lo_setup(dev, ETH_MIN_MTU, NULL, NULL, &blackhole_netdev_ops, NULL);
2644de83b88SMahesh Bandewar }
2654de83b88SMahesh Bandewar 
2664de83b88SMahesh Bandewar /* Setup and register the blackhole_netdev. */
2674de83b88SMahesh Bandewar static int __init blackhole_netdev_init(void)
2684de83b88SMahesh Bandewar {
2694de83b88SMahesh Bandewar 	blackhole_netdev = alloc_netdev(0, "blackhole_dev", NET_NAME_UNKNOWN,
2704de83b88SMahesh Bandewar 					blackhole_netdev_setup);
2714de83b88SMahesh Bandewar 	if (!blackhole_netdev)
2724de83b88SMahesh Bandewar 		return -ENOMEM;
2734de83b88SMahesh Bandewar 
274d62962b3SMahesh Bandewar 	rtnl_lock();
2754de83b88SMahesh Bandewar 	dev_init_scheduler(blackhole_netdev);
2764de83b88SMahesh Bandewar 	dev_activate(blackhole_netdev);
277d62962b3SMahesh Bandewar 	rtnl_unlock();
2784de83b88SMahesh Bandewar 
2794de83b88SMahesh Bandewar 	blackhole_netdev->flags |= IFF_UP | IFF_RUNNING;
2804de83b88SMahesh Bandewar 	dev_net_set(blackhole_netdev, &init_net);
2814de83b88SMahesh Bandewar 
2824de83b88SMahesh Bandewar 	return 0;
2834de83b88SMahesh Bandewar }
2844de83b88SMahesh Bandewar 
2854de83b88SMahesh Bandewar device_initcall(blackhole_netdev_init);
286