xref: /openbmc/linux/drivers/net/loopback.c (revision a7b862ab)
12874c5fdSThomas Gleixner // SPDX-License-Identifier: GPL-2.0-or-later
21da177e4SLinus Torvalds /*
31da177e4SLinus Torvalds  * INET		An implementation of the TCP/IP protocol suite for the LINUX
41da177e4SLinus Torvalds  *		operating system.  INET is implemented using the  BSD Socket
51da177e4SLinus Torvalds  *		interface as the means of communication with the user level.
61da177e4SLinus Torvalds  *
71da177e4SLinus Torvalds  *		Pseudo-driver for the loopback interface.
81da177e4SLinus Torvalds  *
91da177e4SLinus Torvalds  * Version:	@(#)loopback.c	1.0.4b	08/16/93
101da177e4SLinus Torvalds  *
1102c30a84SJesper Juhl  * Authors:	Ross Biro
121da177e4SLinus Torvalds  *		Fred N. van Kempen, <waltje@uWalt.NL.Mugnet.ORG>
131da177e4SLinus Torvalds  *		Donald Becker, <becker@scyld.com>
141da177e4SLinus Torvalds  *
151da177e4SLinus Torvalds  *		Alan Cox	:	Fixed oddments for NET3.014
161da177e4SLinus Torvalds  *		Alan Cox	:	Rejig for NET3.029 snap #3
171da177e4SLinus Torvalds  *		Alan Cox	:	Fixed NET3.029 bugs and sped up
181da177e4SLinus Torvalds  *		Larry McVoy	:	Tiny tweak to double performance
191da177e4SLinus Torvalds  *		Alan Cox	:	Backed out LMV's tweak - the linux mm
201da177e4SLinus Torvalds  *					can't take it...
211da177e4SLinus Torvalds  *              Michael Griffith:       Don't bother computing the checksums
221da177e4SLinus Torvalds  *                                      on packets received on the loopback
231da177e4SLinus Torvalds  *                                      interface.
241da177e4SLinus Torvalds  *		Alexey Kuznetsov:	Potential hang under some extreme
251da177e4SLinus Torvalds  *					cases removed.
261da177e4SLinus Torvalds  */
271da177e4SLinus Torvalds #include <linux/kernel.h>
281da177e4SLinus Torvalds #include <linux/jiffies.h>
291da177e4SLinus Torvalds #include <linux/module.h>
301da177e4SLinus Torvalds #include <linux/interrupt.h>
311da177e4SLinus Torvalds #include <linux/fs.h>
321da177e4SLinus Torvalds #include <linux/types.h>
331da177e4SLinus Torvalds #include <linux/string.h>
341da177e4SLinus Torvalds #include <linux/socket.h>
351da177e4SLinus Torvalds #include <linux/errno.h>
361da177e4SLinus Torvalds #include <linux/fcntl.h>
371da177e4SLinus Torvalds #include <linux/in.h>
381da177e4SLinus Torvalds 
397c0f6ba6SLinus Torvalds #include <linux/uaccess.h>
40b3407c8eSEzequiel Lara Gomez #include <linux/io.h>
411da177e4SLinus Torvalds 
421da177e4SLinus Torvalds #include <linux/inet.h>
431da177e4SLinus Torvalds #include <linux/netdevice.h>
441da177e4SLinus Torvalds #include <linux/etherdevice.h>
451da177e4SLinus Torvalds #include <linux/skbuff.h>
461da177e4SLinus Torvalds #include <linux/ethtool.h>
47b6459415SJakub Kicinski #include <net/sch_generic.h>
481da177e4SLinus Torvalds #include <net/sock.h>
491da177e4SLinus Torvalds #include <net/checksum.h>
501da177e4SLinus Torvalds #include <linux/if_ether.h>	/* For the statistics structure. */
511da177e4SLinus Torvalds #include <linux/if_arp.h>	/* For ARPHRD_ETHER */
521da177e4SLinus Torvalds #include <linux/ip.h>
531da177e4SLinus Torvalds #include <linux/tcp.h>
541da177e4SLinus Torvalds #include <linux/percpu.h>
556df014cfSEzequiel Lara Gomez #include <linux/net_tstamp.h>
562774c7abSEric W. Biederman #include <net/net_namespace.h>
575eaa0bd8SEric Dumazet #include <linux/u64_stats_sync.h>
581da177e4SLinus Torvalds 
/* blackhole_netdev - a device used for dsts that are marked expired.
 * This is a single global device rather than a per-net-ns one: it does
 * not need to be per-namespace, and it is initialized at boot time.
 */
struct net_device *blackhole_netdev;
EXPORT_SYMBOL(blackhole_netdev);
654de83b88SMahesh Bandewar 
66b3407c8eSEzequiel Lara Gomez /* The higher levels take care of making this non-reentrant (it's
671da177e4SLinus Torvalds  * called with bh's disabled).
681da177e4SLinus Torvalds  */
loopback_xmit(struct sk_buff * skb,struct net_device * dev)6961357325SStephen Hemminger static netdev_tx_t loopback_xmit(struct sk_buff *skb,
7061357325SStephen Hemminger 				 struct net_device *dev)
711da177e4SLinus Torvalds {
727eebb0b2SEric Dumazet 	int len;
731da177e4SLinus Torvalds 
746df014cfSEzequiel Lara Gomez 	skb_tx_timestamp(skb);
754c16128bSEric Dumazet 
764c16128bSEric Dumazet 	/* do not fool net_timestamp_check() with various clock bases */
77de799101SMartin KaFai Lau 	skb_clear_tstamp(skb);
784c16128bSEric Dumazet 
791da177e4SLinus Torvalds 	skb_orphan(skb);
801da177e4SLinus Torvalds 
81baebdf48SSebastian Andrzej Siewior 	/* Before queueing this packet to __netif_rx(),
82794ed393SEric Dumazet 	 * make sure dst is refcounted.
83794ed393SEric Dumazet 	 */
84794ed393SEric Dumazet 	skb_dst_force(skb);
85794ed393SEric Dumazet 
861da177e4SLinus Torvalds 	skb->protocol = eth_type_trans(skb, dev);
871da177e4SLinus Torvalds 
887eebb0b2SEric Dumazet 	len = skb->len;
89baebdf48SSebastian Andrzej Siewior 	if (likely(__netif_rx(skb) == NET_RX_SUCCESS))
90dd5382a0SEric Dumazet 		dev_lstats_add(dev, len);
911da177e4SLinus Torvalds 
926ed10654SPatrick McHardy 	return NETDEV_TX_OK;
931da177e4SLinus Torvalds }
941da177e4SLinus Torvalds 
/* Sum the per-CPU lstats counters of @dev over every possible CPU.
 *
 * @packets and @bytes are reset to zero first and then accumulate the
 * per-CPU values.
 */
void dev_lstats_read(struct net_device *dev, u64 *packets, u64 *bytes)
{
	int cpu;

	*packets = 0;
	*bytes = 0;

	for_each_possible_cpu(cpu) {
		const struct pcpu_lstats *cpu_stats = per_cpu_ptr(dev->lstats, cpu);
		u64 cpu_packets, cpu_bytes;
		unsigned int seq;

		/* Repeat the read for as long as the fetch asks for a retry */
		do {
			seq = u64_stats_fetch_begin(&cpu_stats->syncp);
			cpu_packets = u64_stats_read(&cpu_stats->packets);
			cpu_bytes = u64_stats_read(&cpu_stats->bytes);
		} while (u64_stats_fetch_retry(&cpu_stats->syncp, seq));

		*bytes += cpu_bytes;
		*packets += cpu_packets;
	}
}
EXPORT_SYMBOL(dev_lstats_read);
118de7d5084SEric Dumazet 
loopback_get_stats64(struct net_device * dev,struct rtnl_link_stats64 * stats)119de7d5084SEric Dumazet static void loopback_get_stats64(struct net_device *dev,
120de7d5084SEric Dumazet 				 struct rtnl_link_stats64 *stats)
121de7d5084SEric Dumazet {
122de7d5084SEric Dumazet 	u64 packets, bytes;
123de7d5084SEric Dumazet 
124de7d5084SEric Dumazet 	dev_lstats_read(dev, &packets, &bytes);
125de7d5084SEric Dumazet 
1265175c378SEric Dumazet 	stats->rx_packets = packets;
1275175c378SEric Dumazet 	stats->tx_packets = packets;
1285175c378SEric Dumazet 	stats->rx_bytes   = bytes;
1295175c378SEric Dumazet 	stats->tx_bytes   = bytes;
1301da177e4SLinus Torvalds }
1311da177e4SLinus Torvalds 
always_on(struct net_device * dev)1327fa6b066SStephen Hemminger static u32 always_on(struct net_device *dev)
1331da177e4SLinus Torvalds {
1341da177e4SLinus Torvalds 	return 1;
1351da177e4SLinus Torvalds }
1361da177e4SLinus Torvalds 
1377282d491SJeff Garzik static const struct ethtool_ops loopback_ethtool_ops = {
1387fa6b066SStephen Hemminger 	.get_link		= always_on,
139af730342SJulian Wiedmann 	.get_ts_info		= ethtool_op_get_ts_info,
1401da177e4SLinus Torvalds };
1411da177e4SLinus Torvalds 
loopback_dev_init(struct net_device * dev)1425f6d88b9SEric W. Biederman static int loopback_dev_init(struct net_device *dev)
1435f6d88b9SEric W. Biederman {
1441c213bd2SWANG Cong 	dev->lstats = netdev_alloc_pcpu_stats(struct pcpu_lstats);
145a7855c78SEric Dumazet 	if (!dev->lstats)
1465f6d88b9SEric W. Biederman 		return -ENOMEM;
147a7b862abSEric Dumazet 	netdev_lockdep_set_classes(dev);
1485f6d88b9SEric W. Biederman 	return 0;
1495f6d88b9SEric W. Biederman }
1505f6d88b9SEric W. Biederman 
loopback_dev_free(struct net_device * dev)1515f6d88b9SEric W. Biederman static void loopback_dev_free(struct net_device *dev)
1525f6d88b9SEric W. Biederman {
153e05e9070SEric W. Biederman 	dev_net(dev)->loopback_dev = NULL;
154a7855c78SEric Dumazet 	free_percpu(dev->lstats);
1555f6d88b9SEric W. Biederman }
1565f6d88b9SEric W. Biederman 
157c02373bfSStephen Hemminger static const struct net_device_ops loopback_ops = {
158c02373bfSStephen Hemminger 	.ndo_init        = loopback_dev_init,
15900829823SStephen Hemminger 	.ndo_start_xmit  = loopback_xmit,
1606b10de38SEric Dumazet 	.ndo_get_stats64 = loopback_get_stats64,
16125f929fbSWANG Cong 	.ndo_set_mac_address = eth_mac_addr,
162c02373bfSStephen Hemminger };
163c02373bfSStephen Hemminger 
gen_lo_setup(struct net_device * dev,unsigned int mtu,const struct ethtool_ops * eth_ops,const struct header_ops * hdr_ops,const struct net_device_ops * dev_ops,void (* dev_destructor)(struct net_device * dev))1644de83b88SMahesh Bandewar static void gen_lo_setup(struct net_device *dev,
1654de83b88SMahesh Bandewar 			 unsigned int mtu,
1664de83b88SMahesh Bandewar 			 const struct ethtool_ops *eth_ops,
1674de83b88SMahesh Bandewar 			 const struct header_ops *hdr_ops,
1684de83b88SMahesh Bandewar 			 const struct net_device_ops *dev_ops,
1694de83b88SMahesh Bandewar 			 void (*dev_destructor)(struct net_device *dev))
170854d8363SDaniel Lezcano {
1714de83b88SMahesh Bandewar 	dev->mtu		= mtu;
172854d8363SDaniel Lezcano 	dev->hard_header_len	= ETH_HLEN;	/* 14	*/
173217e6fa2SWillem de Bruijn 	dev->min_header_len	= ETH_HLEN;	/* 14	*/
174854d8363SDaniel Lezcano 	dev->addr_len		= ETH_ALEN;	/* 6	*/
175854d8363SDaniel Lezcano 	dev->type		= ARPHRD_LOOPBACK;	/* 0x0001*/
176854d8363SDaniel Lezcano 	dev->flags		= IFF_LOOPBACK;
177e65db2b7SPhil Sutter 	dev->priv_flags		|= IFF_LIVE_ADDR_CHANGE | IFF_NO_QUEUE;
17802875878SEric Dumazet 	netif_keep_dst(dev);
179f6c382fcSMarcelo Ricardo Leitner 	dev->hw_features	= NETIF_F_GSO_SOFTWARE;
180854d8363SDaniel Lezcano 	dev->features		= NETIF_F_SG | NETIF_F_FRAGLIST
181f6c382fcSMarcelo Ricardo Leitner 		| NETIF_F_GSO_SOFTWARE
18234324dc2SMichał Mirosław 		| NETIF_F_HW_CSUM
183cf0bdefdSMichał Mirosław 		| NETIF_F_RXCSUM
18453692b1dSTom Herbert 		| NETIF_F_SCTP_CRC
185854d8363SDaniel Lezcano 		| NETIF_F_HIGHDMA
186ce286d32SEric W. Biederman 		| NETIF_F_LLTX
1870553c891SKrishna Kumar 		| NETIF_F_NETNS_LOCAL
188eed2a12fSMahesh Bandewar 		| NETIF_F_VLAN_CHALLENGED
189eed2a12fSMahesh Bandewar 		| NETIF_F_LOOPBACK;
1904de83b88SMahesh Bandewar 	dev->ethtool_ops	= eth_ops;
1914de83b88SMahesh Bandewar 	dev->header_ops		= hdr_ops;
1924de83b88SMahesh Bandewar 	dev->netdev_ops		= dev_ops;
193cf124db5SDavid S. Miller 	dev->needs_free_netdev	= true;
1944de83b88SMahesh Bandewar 	dev->priv_destructor	= dev_destructor;
195d6f938ceSEric Dumazet 
196d6f938ceSEric Dumazet 	netif_set_tso_max_size(dev, GSO_MAX_SIZE);
1974de83b88SMahesh Bandewar }
1984de83b88SMahesh Bandewar 
1994de83b88SMahesh Bandewar /* The loopback device is special. There is only one instance
2004de83b88SMahesh Bandewar  * per network namespace.
2014de83b88SMahesh Bandewar  */
loopback_setup(struct net_device * dev)2024de83b88SMahesh Bandewar static void loopback_setup(struct net_device *dev)
2034de83b88SMahesh Bandewar {
2044de83b88SMahesh Bandewar 	gen_lo_setup(dev, (64 * 1024), &loopback_ethtool_ops, &eth_header_ops,
2054de83b88SMahesh Bandewar 		     &loopback_ops, loopback_dev_free);
206854d8363SDaniel Lezcano }
207de3cb747SDaniel Lezcano 
20822783649SRalf Baechle /* Setup and register the loopback device. */
loopback_net_init(struct net * net)2094665079cSPavel Emelyanov static __net_init int loopback_net_init(struct net *net)
2101da177e4SLinus Torvalds {
211854d8363SDaniel Lezcano 	struct net_device *dev;
212854d8363SDaniel Lezcano 	int err;
213aeed9e82SHerbert Xu 
214854d8363SDaniel Lezcano 	err = -ENOMEM;
21531d929deSRasmus Villemoes 	dev = alloc_netdev(0, "lo", NET_NAME_PREDICTABLE, loopback_setup);
216854d8363SDaniel Lezcano 	if (!dev)
217854d8363SDaniel Lezcano 		goto out;
218854d8363SDaniel Lezcano 
219c346dca1SYOSHIFUJI Hideaki 	dev_net_set(dev, net);
220854d8363SDaniel Lezcano 	err = register_netdev(dev);
221854d8363SDaniel Lezcano 	if (err)
222854d8363SDaniel Lezcano 		goto out_free_netdev;
223854d8363SDaniel Lezcano 
2241fb9489bSPavel Emelyanov 	BUG_ON(dev->ifindex != LOOPBACK_IFINDEX);
2252774c7abSEric W. Biederman 	net->loopback_dev = dev;
2269d6dda32SPavel Emelyanov 	return 0;
227854d8363SDaniel Lezcano 
228854d8363SDaniel Lezcano out_free_netdev:
229854d8363SDaniel Lezcano 	free_netdev(dev);
2309d6dda32SPavel Emelyanov out:
23109ad9bc7SOctavian Purdila 	if (net_eq(net, &init_net))
2329d6dda32SPavel Emelyanov 		panic("loopback: Failed to register netdevice: %d\n", err);
2339d6dda32SPavel Emelyanov 	return err;
234854d8363SDaniel Lezcano }
23560903f2cSAdrian Bunk 
236505d4f73SEric W. Biederman /* Registered in net/core/dev.c */
237505d4f73SEric W. Biederman struct pernet_operations __net_initdata loopback_net_ops = {
2382774c7abSEric W. Biederman 	.init = loopback_net_init,
2392774c7abSEric W. Biederman };
2404de83b88SMahesh Bandewar 
2414de83b88SMahesh Bandewar /* blackhole netdevice */
blackhole_netdev_xmit(struct sk_buff * skb,struct net_device * dev)2424de83b88SMahesh Bandewar static netdev_tx_t blackhole_netdev_xmit(struct sk_buff *skb,
2434de83b88SMahesh Bandewar 					 struct net_device *dev)
2444de83b88SMahesh Bandewar {
2454de83b88SMahesh Bandewar 	kfree_skb(skb);
2464de83b88SMahesh Bandewar 	net_warn_ratelimited("%s(): Dropping skb.\n", __func__);
2474de83b88SMahesh Bandewar 	return NETDEV_TX_OK;
2484de83b88SMahesh Bandewar }
2494de83b88SMahesh Bandewar 
2504de83b88SMahesh Bandewar static const struct net_device_ops blackhole_netdev_ops = {
2514de83b88SMahesh Bandewar 	.ndo_start_xmit = blackhole_netdev_xmit,
2524de83b88SMahesh Bandewar };
2534de83b88SMahesh Bandewar 
2544de83b88SMahesh Bandewar /* This is a dst-dummy device used specifically for invalidated
2554de83b88SMahesh Bandewar  * DSTs and unlike loopback, this is not per-ns.
2564de83b88SMahesh Bandewar  */
blackhole_netdev_setup(struct net_device * dev)2574de83b88SMahesh Bandewar static void blackhole_netdev_setup(struct net_device *dev)
2584de83b88SMahesh Bandewar {
2594de83b88SMahesh Bandewar 	gen_lo_setup(dev, ETH_MIN_MTU, NULL, NULL, &blackhole_netdev_ops, NULL);
2604de83b88SMahesh Bandewar }
2614de83b88SMahesh Bandewar 
2624de83b88SMahesh Bandewar /* Setup and register the blackhole_netdev. */
blackhole_netdev_init(void)2634de83b88SMahesh Bandewar static int __init blackhole_netdev_init(void)
2644de83b88SMahesh Bandewar {
2654de83b88SMahesh Bandewar 	blackhole_netdev = alloc_netdev(0, "blackhole_dev", NET_NAME_UNKNOWN,
2664de83b88SMahesh Bandewar 					blackhole_netdev_setup);
2674de83b88SMahesh Bandewar 	if (!blackhole_netdev)
2684de83b88SMahesh Bandewar 		return -ENOMEM;
2694de83b88SMahesh Bandewar 
270d62962b3SMahesh Bandewar 	rtnl_lock();
2714de83b88SMahesh Bandewar 	dev_init_scheduler(blackhole_netdev);
2724de83b88SMahesh Bandewar 	dev_activate(blackhole_netdev);
273d62962b3SMahesh Bandewar 	rtnl_unlock();
2744de83b88SMahesh Bandewar 
2754de83b88SMahesh Bandewar 	blackhole_netdev->flags |= IFF_UP | IFF_RUNNING;
2764de83b88SMahesh Bandewar 	dev_net_set(blackhole_netdev, &init_net);
2774de83b88SMahesh Bandewar 
2784de83b88SMahesh Bandewar 	return 0;
2794de83b88SMahesh Bandewar }
2804de83b88SMahesh Bandewar 
2814de83b88SMahesh Bandewar device_initcall(blackhole_netdev_init);
282