12874c5fdSThomas Gleixner // SPDX-License-Identifier: GPL-2.0-or-later 21da177e4SLinus Torvalds /* 31da177e4SLinus Torvalds * INET An implementation of the TCP/IP protocol suite for the LINUX 41da177e4SLinus Torvalds * operating system. INET is implemented using the BSD Socket 51da177e4SLinus Torvalds * interface as the means of communication with the user level. 61da177e4SLinus Torvalds * 71da177e4SLinus Torvalds * Pseudo-driver for the loopback interface. 81da177e4SLinus Torvalds * 91da177e4SLinus Torvalds * Version: @(#)loopback.c 1.0.4b 08/16/93 101da177e4SLinus Torvalds * 1102c30a84SJesper Juhl * Authors: Ross Biro 121da177e4SLinus Torvalds * Fred N. van Kempen, <waltje@uWalt.NL.Mugnet.ORG> 131da177e4SLinus Torvalds * Donald Becker, <becker@scyld.com> 141da177e4SLinus Torvalds * 151da177e4SLinus Torvalds * Alan Cox : Fixed oddments for NET3.014 161da177e4SLinus Torvalds * Alan Cox : Rejig for NET3.029 snap #3 171da177e4SLinus Torvalds * Alan Cox : Fixed NET3.029 bugs and sped up 181da177e4SLinus Torvalds * Larry McVoy : Tiny tweak to double performance 191da177e4SLinus Torvalds * Alan Cox : Backed out LMV's tweak - the linux mm 201da177e4SLinus Torvalds * can't take it... 211da177e4SLinus Torvalds * Michael Griffith: Don't bother computing the checksums 221da177e4SLinus Torvalds * on packets received on the loopback 231da177e4SLinus Torvalds * interface. 241da177e4SLinus Torvalds * Alexey Kuznetsov: Potential hang under some extreme 251da177e4SLinus Torvalds * cases removed. 261da177e4SLinus Torvalds */ 271da177e4SLinus Torvalds #include <linux/kernel.h> 281da177e4SLinus Torvalds #include <linux/jiffies.h> 291da177e4SLinus Torvalds #include <linux/module.h> 301da177e4SLinus Torvalds #include <linux/interrupt.h> 311da177e4SLinus Torvalds #include <linux/fs.h> 321da177e4SLinus Torvalds #include <linux/types.h> 331da177e4SLinus Torvalds #include <linux/string.h> 341da177e4SLinus Torvalds #include <linux/socket.h> 351da177e4SLinus Torvalds #include <linux/errno.h> 361da177e4SLinus Torvalds #include <linux/fcntl.h> 371da177e4SLinus Torvalds #include <linux/in.h> 381da177e4SLinus Torvalds 397c0f6ba6SLinus Torvalds #include <linux/uaccess.h> 40b3407c8eSEzequiel Lara Gomez #include <linux/io.h> 411da177e4SLinus Torvalds 421da177e4SLinus Torvalds #include <linux/inet.h> 431da177e4SLinus Torvalds #include <linux/netdevice.h> 441da177e4SLinus Torvalds #include <linux/etherdevice.h> 451da177e4SLinus Torvalds #include <linux/skbuff.h> 461da177e4SLinus Torvalds #include <linux/ethtool.h> 47b6459415SJakub Kicinski #include <net/sch_generic.h> 481da177e4SLinus Torvalds #include <net/sock.h> 491da177e4SLinus Torvalds #include <net/checksum.h> 501da177e4SLinus Torvalds #include <linux/if_ether.h> /* For the statistics structure. */ 511da177e4SLinus Torvalds #include <linux/if_arp.h> /* For ARPHRD_ETHER */ 521da177e4SLinus Torvalds #include <linux/ip.h> 531da177e4SLinus Torvalds #include <linux/tcp.h> 541da177e4SLinus Torvalds #include <linux/percpu.h> 556df014cfSEzequiel Lara Gomez #include <linux/net_tstamp.h> 562774c7abSEric W. Biederman #include <net/net_namespace.h> 575eaa0bd8SEric Dumazet #include <linux/u64_stats_sync.h> 581da177e4SLinus Torvalds 594de83b88SMahesh Bandewar /* blackhole_netdev - a device used for dsts that are marked expired! 604de83b88SMahesh Bandewar * This is global device (instead of per-net-ns) since it's not needed 614de83b88SMahesh Bandewar * to be per-ns and gets initialized at boot time. 624de83b88SMahesh Bandewar */ 634de83b88SMahesh Bandewar struct net_device *blackhole_netdev; 644de83b88SMahesh Bandewar EXPORT_SYMBOL(blackhole_netdev); 654de83b88SMahesh Bandewar 66b3407c8eSEzequiel Lara Gomez /* The higher levels take care of making this non-reentrant (it's 671da177e4SLinus Torvalds * called with bh's disabled). 681da177e4SLinus Torvalds */ 6961357325SStephen Hemminger static netdev_tx_t loopback_xmit(struct sk_buff *skb, 7061357325SStephen Hemminger struct net_device *dev) 711da177e4SLinus Torvalds { 727eebb0b2SEric Dumazet int len; 731da177e4SLinus Torvalds 746df014cfSEzequiel Lara Gomez skb_tx_timestamp(skb); 754c16128bSEric Dumazet 764c16128bSEric Dumazet /* do not fool net_timestamp_check() with various clock bases */ 77de799101SMartin KaFai Lau skb_clear_tstamp(skb); 784c16128bSEric Dumazet 791da177e4SLinus Torvalds skb_orphan(skb); 801da177e4SLinus Torvalds 81baebdf48SSebastian Andrzej Siewior /* Before queueing this packet to __netif_rx(), 82794ed393SEric Dumazet * make sure dst is refcounted. 83794ed393SEric Dumazet */ 84794ed393SEric Dumazet skb_dst_force(skb); 85794ed393SEric Dumazet 861da177e4SLinus Torvalds skb->protocol = eth_type_trans(skb, dev); 871da177e4SLinus Torvalds 887eebb0b2SEric Dumazet len = skb->len; 89baebdf48SSebastian Andrzej Siewior if (likely(__netif_rx(skb) == NET_RX_SUCCESS)) 90dd5382a0SEric Dumazet dev_lstats_add(dev, len); 911da177e4SLinus Torvalds 926ed10654SPatrick McHardy return NETDEV_TX_OK; 931da177e4SLinus Torvalds } 941da177e4SLinus Torvalds 95de7d5084SEric Dumazet void dev_lstats_read(struct net_device *dev, u64 *packets, u64 *bytes) 961da177e4SLinus Torvalds { 971da177e4SLinus Torvalds int i; 981da177e4SLinus Torvalds 99de7d5084SEric Dumazet *packets = 0; 100de7d5084SEric Dumazet *bytes = 0; 101de7d5084SEric Dumazet 1020fed4846SKAMEZAWA Hiroyuki for_each_possible_cpu(i) { 1035175c378SEric Dumazet const struct pcpu_lstats *lb_stats; 1045eaa0bd8SEric Dumazet u64 tbytes, tpackets; 1055eaa0bd8SEric Dumazet unsigned int start; 1061da177e4SLinus Torvalds 107a7855c78SEric Dumazet lb_stats = per_cpu_ptr(dev->lstats, i); 1085eaa0bd8SEric Dumazet do { 109068c38adSThomas Gleixner start = u64_stats_fetch_begin(&lb_stats->syncp); 110fd2f4737SEric Dumazet tpackets = u64_stats_read(&lb_stats->packets); 111fd2f4737SEric Dumazet tbytes = u64_stats_read(&lb_stats->bytes); 112068c38adSThomas Gleixner } while (u64_stats_fetch_retry(&lb_stats->syncp, start)); 113de7d5084SEric Dumazet *bytes += tbytes; 114de7d5084SEric Dumazet *packets += tpackets; 1151da177e4SLinus Torvalds } 116de7d5084SEric Dumazet } 117de7d5084SEric Dumazet EXPORT_SYMBOL(dev_lstats_read); 118de7d5084SEric Dumazet 119de7d5084SEric Dumazet static void loopback_get_stats64(struct net_device *dev, 120de7d5084SEric Dumazet struct rtnl_link_stats64 *stats) 121de7d5084SEric Dumazet { 122de7d5084SEric Dumazet u64 packets, bytes; 123de7d5084SEric Dumazet 124de7d5084SEric Dumazet dev_lstats_read(dev, &packets, &bytes); 125de7d5084SEric Dumazet 1265175c378SEric Dumazet stats->rx_packets = packets; 1275175c378SEric Dumazet stats->tx_packets = packets; 1285175c378SEric Dumazet stats->rx_bytes = bytes; 1295175c378SEric Dumazet stats->tx_bytes = bytes; 1301da177e4SLinus Torvalds } 1311da177e4SLinus Torvalds 1327fa6b066SStephen Hemminger static u32 always_on(struct net_device *dev) 1331da177e4SLinus Torvalds { 1341da177e4SLinus Torvalds return 1; 1351da177e4SLinus Torvalds } 1361da177e4SLinus Torvalds 1377282d491SJeff Garzik static const struct ethtool_ops loopback_ethtool_ops = { 1387fa6b066SStephen Hemminger .get_link = always_on, 139af730342SJulian Wiedmann .get_ts_info = ethtool_op_get_ts_info, 1401da177e4SLinus Torvalds }; 1411da177e4SLinus Torvalds 1425f6d88b9SEric W. Biederman static int loopback_dev_init(struct net_device *dev) 1435f6d88b9SEric W. Biederman { 1441c213bd2SWANG Cong dev->lstats = netdev_alloc_pcpu_stats(struct pcpu_lstats); 145a7855c78SEric Dumazet if (!dev->lstats) 1465f6d88b9SEric W. Biederman return -ENOMEM; 147*a7b862abSEric Dumazet netdev_lockdep_set_classes(dev); 1485f6d88b9SEric W. Biederman return 0; 1495f6d88b9SEric W. Biederman } 1505f6d88b9SEric W. Biederman 1515f6d88b9SEric W. Biederman static void loopback_dev_free(struct net_device *dev) 1525f6d88b9SEric W. Biederman { 153e05e9070SEric W. Biederman dev_net(dev)->loopback_dev = NULL; 154a7855c78SEric Dumazet free_percpu(dev->lstats); 1555f6d88b9SEric W. Biederman } 1565f6d88b9SEric W. Biederman 157c02373bfSStephen Hemminger static const struct net_device_ops loopback_ops = { 158c02373bfSStephen Hemminger .ndo_init = loopback_dev_init, 15900829823SStephen Hemminger .ndo_start_xmit = loopback_xmit, 1606b10de38SEric Dumazet .ndo_get_stats64 = loopback_get_stats64, 16125f929fbSWANG Cong .ndo_set_mac_address = eth_mac_addr, 162c02373bfSStephen Hemminger }; 163c02373bfSStephen Hemminger 1644de83b88SMahesh Bandewar static void gen_lo_setup(struct net_device *dev, 1654de83b88SMahesh Bandewar unsigned int mtu, 1664de83b88SMahesh Bandewar const struct ethtool_ops *eth_ops, 1674de83b88SMahesh Bandewar const struct header_ops *hdr_ops, 1684de83b88SMahesh Bandewar const struct net_device_ops *dev_ops, 1694de83b88SMahesh Bandewar void (*dev_destructor)(struct net_device *dev)) 170854d8363SDaniel Lezcano { 1714de83b88SMahesh Bandewar dev->mtu = mtu; 172854d8363SDaniel Lezcano dev->hard_header_len = ETH_HLEN; /* 14 */ 173217e6fa2SWillem de Bruijn dev->min_header_len = ETH_HLEN; /* 14 */ 174854d8363SDaniel Lezcano dev->addr_len = ETH_ALEN; /* 6 */ 175854d8363SDaniel Lezcano dev->type = ARPHRD_LOOPBACK; /* 0x0001*/ 176854d8363SDaniel Lezcano dev->flags = IFF_LOOPBACK; 177e65db2b7SPhil Sutter dev->priv_flags |= IFF_LIVE_ADDR_CHANGE | IFF_NO_QUEUE; 17802875878SEric Dumazet netif_keep_dst(dev); 179f6c382fcSMarcelo Ricardo Leitner dev->hw_features = NETIF_F_GSO_SOFTWARE; 180854d8363SDaniel Lezcano dev->features = NETIF_F_SG | NETIF_F_FRAGLIST 181f6c382fcSMarcelo Ricardo Leitner | NETIF_F_GSO_SOFTWARE 18234324dc2SMichał Mirosław | NETIF_F_HW_CSUM 183cf0bdefdSMichał Mirosław | NETIF_F_RXCSUM 18453692b1dSTom Herbert | NETIF_F_SCTP_CRC 185854d8363SDaniel Lezcano | NETIF_F_HIGHDMA 186ce286d32SEric W. Biederman | NETIF_F_LLTX 1870553c891SKrishna Kumar | NETIF_F_NETNS_LOCAL 188eed2a12fSMahesh Bandewar | NETIF_F_VLAN_CHALLENGED 189eed2a12fSMahesh Bandewar | NETIF_F_LOOPBACK; 1904de83b88SMahesh Bandewar dev->ethtool_ops = eth_ops; 1914de83b88SMahesh Bandewar dev->header_ops = hdr_ops; 1924de83b88SMahesh Bandewar dev->netdev_ops = dev_ops; 193cf124db5SDavid S. Miller dev->needs_free_netdev = true; 1944de83b88SMahesh Bandewar dev->priv_destructor = dev_destructor; 195d6f938ceSEric Dumazet 196d6f938ceSEric Dumazet netif_set_tso_max_size(dev, GSO_MAX_SIZE); 1974de83b88SMahesh Bandewar } 1984de83b88SMahesh Bandewar 1994de83b88SMahesh Bandewar /* The loopback device is special. There is only one instance 2004de83b88SMahesh Bandewar * per network namespace. 2014de83b88SMahesh Bandewar */ 2024de83b88SMahesh Bandewar static void loopback_setup(struct net_device *dev) 2034de83b88SMahesh Bandewar { 2044de83b88SMahesh Bandewar gen_lo_setup(dev, (64 * 1024), &loopback_ethtool_ops, ð_header_ops, 2054de83b88SMahesh Bandewar &loopback_ops, loopback_dev_free); 206854d8363SDaniel Lezcano } 207de3cb747SDaniel Lezcano 20822783649SRalf Baechle /* Setup and register the loopback device. */ 2094665079cSPavel Emelyanov static __net_init int loopback_net_init(struct net *net) 2101da177e4SLinus Torvalds { 211854d8363SDaniel Lezcano struct net_device *dev; 212854d8363SDaniel Lezcano int err; 213aeed9e82SHerbert Xu 214854d8363SDaniel Lezcano err = -ENOMEM; 21531d929deSRasmus Villemoes dev = alloc_netdev(0, "lo", NET_NAME_PREDICTABLE, loopback_setup); 216854d8363SDaniel Lezcano if (!dev) 217854d8363SDaniel Lezcano goto out; 218854d8363SDaniel Lezcano 219c346dca1SYOSHIFUJI Hideaki dev_net_set(dev, net); 220854d8363SDaniel Lezcano err = register_netdev(dev); 221854d8363SDaniel Lezcano if (err) 222854d8363SDaniel Lezcano goto out_free_netdev; 223854d8363SDaniel Lezcano 2241fb9489bSPavel Emelyanov BUG_ON(dev->ifindex != LOOPBACK_IFINDEX); 2252774c7abSEric W. Biederman net->loopback_dev = dev; 2269d6dda32SPavel Emelyanov return 0; 227854d8363SDaniel Lezcano 228854d8363SDaniel Lezcano out_free_netdev: 229854d8363SDaniel Lezcano free_netdev(dev); 2309d6dda32SPavel Emelyanov out: 23109ad9bc7SOctavian Purdila if (net_eq(net, &init_net)) 2329d6dda32SPavel Emelyanov panic("loopback: Failed to register netdevice: %d\n", err); 2339d6dda32SPavel Emelyanov return err; 234854d8363SDaniel Lezcano } 23560903f2cSAdrian Bunk 236505d4f73SEric W. Biederman /* Registered in net/core/dev.c */ 237505d4f73SEric W. Biederman struct pernet_operations __net_initdata loopback_net_ops = { 2382774c7abSEric W. Biederman .init = loopback_net_init, 2392774c7abSEric W. Biederman }; 2404de83b88SMahesh Bandewar 2414de83b88SMahesh Bandewar /* blackhole netdevice */ 2424de83b88SMahesh Bandewar static netdev_tx_t blackhole_netdev_xmit(struct sk_buff *skb, 2434de83b88SMahesh Bandewar struct net_device *dev) 2444de83b88SMahesh Bandewar { 2454de83b88SMahesh Bandewar kfree_skb(skb); 2464de83b88SMahesh Bandewar net_warn_ratelimited("%s(): Dropping skb.\n", __func__); 2474de83b88SMahesh Bandewar return NETDEV_TX_OK; 2484de83b88SMahesh Bandewar } 2494de83b88SMahesh Bandewar 2504de83b88SMahesh Bandewar static const struct net_device_ops blackhole_netdev_ops = { 2514de83b88SMahesh Bandewar .ndo_start_xmit = blackhole_netdev_xmit, 2524de83b88SMahesh Bandewar }; 2534de83b88SMahesh Bandewar 2544de83b88SMahesh Bandewar /* This is a dst-dummy device used specifically for invalidated 2554de83b88SMahesh Bandewar * DSTs and unlike loopback, this is not per-ns. 2564de83b88SMahesh Bandewar */ 2574de83b88SMahesh Bandewar static void blackhole_netdev_setup(struct net_device *dev) 2584de83b88SMahesh Bandewar { 2594de83b88SMahesh Bandewar gen_lo_setup(dev, ETH_MIN_MTU, NULL, NULL, &blackhole_netdev_ops, NULL); 2604de83b88SMahesh Bandewar } 2614de83b88SMahesh Bandewar 2624de83b88SMahesh Bandewar /* Setup and register the blackhole_netdev. */ 2634de83b88SMahesh Bandewar static int __init blackhole_netdev_init(void) 2644de83b88SMahesh Bandewar { 2654de83b88SMahesh Bandewar blackhole_netdev = alloc_netdev(0, "blackhole_dev", NET_NAME_UNKNOWN, 2664de83b88SMahesh Bandewar blackhole_netdev_setup); 2674de83b88SMahesh Bandewar if (!blackhole_netdev) 2684de83b88SMahesh Bandewar return -ENOMEM; 2694de83b88SMahesh Bandewar 270d62962b3SMahesh Bandewar rtnl_lock(); 2714de83b88SMahesh Bandewar dev_init_scheduler(blackhole_netdev); 2724de83b88SMahesh Bandewar dev_activate(blackhole_netdev); 273d62962b3SMahesh Bandewar rtnl_unlock(); 2744de83b88SMahesh Bandewar 2754de83b88SMahesh Bandewar blackhole_netdev->flags |= IFF_UP | IFF_RUNNING; 2764de83b88SMahesh Bandewar dev_net_set(blackhole_netdev, &init_net); 2774de83b88SMahesh Bandewar 2784de83b88SMahesh Bandewar return 0; 2794de83b88SMahesh Bandewar } 2804de83b88SMahesh Bandewar 2814de83b88SMahesh Bandewar device_initcall(blackhole_netdev_init); 282