10e6fbc5bSPravin B Shelar /* 20e6fbc5bSPravin B Shelar * Copyright (c) 2013 Nicira, Inc. 30e6fbc5bSPravin B Shelar * 40e6fbc5bSPravin B Shelar * This program is free software; you can redistribute it and/or 50e6fbc5bSPravin B Shelar * modify it under the terms of version 2 of the GNU General Public 60e6fbc5bSPravin B Shelar * License as published by the Free Software Foundation. 70e6fbc5bSPravin B Shelar * 80e6fbc5bSPravin B Shelar * This program is distributed in the hope that it will be useful, but 90e6fbc5bSPravin B Shelar * WITHOUT ANY WARRANTY; without even the implied warranty of 100e6fbc5bSPravin B Shelar * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 110e6fbc5bSPravin B Shelar * General Public License for more details. 120e6fbc5bSPravin B Shelar * 130e6fbc5bSPravin B Shelar * You should have received a copy of the GNU General Public License 140e6fbc5bSPravin B Shelar * along with this program; if not, write to the Free Software 150e6fbc5bSPravin B Shelar * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 160e6fbc5bSPravin B Shelar * 02110-1301, USA 170e6fbc5bSPravin B Shelar */ 180e6fbc5bSPravin B Shelar 190e6fbc5bSPravin B Shelar #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt 200e6fbc5bSPravin B Shelar 210e6fbc5bSPravin B Shelar #include <linux/types.h> 220e6fbc5bSPravin B Shelar #include <linux/kernel.h> 230e6fbc5bSPravin B Shelar #include <linux/skbuff.h> 240e6fbc5bSPravin B Shelar #include <linux/netdevice.h> 250e6fbc5bSPravin B Shelar #include <linux/in.h> 260e6fbc5bSPravin B Shelar #include <linux/if_arp.h> 270e6fbc5bSPravin B Shelar #include <linux/mroute.h> 280e6fbc5bSPravin B Shelar #include <linux/init.h> 290e6fbc5bSPravin B Shelar #include <linux/in6.h> 300e6fbc5bSPravin B Shelar #include <linux/inetdevice.h> 310e6fbc5bSPravin B Shelar #include <linux/netfilter_ipv4.h> 320e6fbc5bSPravin B Shelar #include <linux/etherdevice.h> 330e6fbc5bSPravin B Shelar #include <linux/if_ether.h> 340e6fbc5bSPravin B Shelar #include <linux/if_vlan.h> 350e6fbc5bSPravin B Shelar 360e6fbc5bSPravin B Shelar #include <net/ip.h> 370e6fbc5bSPravin B Shelar #include <net/icmp.h> 380e6fbc5bSPravin B Shelar #include <net/protocol.h> 390e6fbc5bSPravin B Shelar #include <net/ip_tunnels.h> 400e6fbc5bSPravin B Shelar #include <net/arp.h> 410e6fbc5bSPravin B Shelar #include <net/checksum.h> 420e6fbc5bSPravin B Shelar #include <net/dsfield.h> 430e6fbc5bSPravin B Shelar #include <net/inet_ecn.h> 440e6fbc5bSPravin B Shelar #include <net/xfrm.h> 450e6fbc5bSPravin B Shelar #include <net/net_namespace.h> 460e6fbc5bSPravin B Shelar #include <net/netns/generic.h> 470e6fbc5bSPravin B Shelar #include <net/rtnetlink.h> 480e6fbc5bSPravin B Shelar 49aad88724SEric Dumazet int iptunnel_xmit(struct sock *sk, struct rtable *rt, struct sk_buff *skb, 500e6fbc5bSPravin B Shelar __be32 src, __be32 dst, __u8 proto, 51963a88b3SNicolas Dichtel __u8 tos, __u8 ttl, __be16 df, bool xnet) 520e6fbc5bSPravin B Shelar { 530e6fbc5bSPravin B Shelar int pkt_len = skb->len; 540e6fbc5bSPravin B Shelar struct iphdr *iph; 550e6fbc5bSPravin B Shelar int err; 560e6fbc5bSPravin B Shelar 57963a88b3SNicolas Dichtel skb_scrub_packet(skb, xnet); 58963a88b3SNicolas Dichtel 597539fadcSTom Herbert skb_clear_hash(skb); 600e6fbc5bSPravin B Shelar skb_dst_set(skb, &rt->dst); 610e6fbc5bSPravin B Shelar memset(IPCB(skb), 0, sizeof(*IPCB(skb))); 620e6fbc5bSPravin B Shelar 630e6fbc5bSPravin B Shelar /* Push down and install the IP header. */ 6478a3694dSSteffen Klassert skb_push(skb, sizeof(struct iphdr)); 650e6fbc5bSPravin B Shelar skb_reset_network_header(skb); 660e6fbc5bSPravin B Shelar 670e6fbc5bSPravin B Shelar iph = ip_hdr(skb); 680e6fbc5bSPravin B Shelar 690e6fbc5bSPravin B Shelar iph->version = 4; 700e6fbc5bSPravin B Shelar iph->ihl = sizeof(struct iphdr) >> 2; 710e6fbc5bSPravin B Shelar iph->frag_off = df; 720e6fbc5bSPravin B Shelar iph->protocol = proto; 730e6fbc5bSPravin B Shelar iph->tos = tos; 740e6fbc5bSPravin B Shelar iph->daddr = dst; 750e6fbc5bSPravin B Shelar iph->saddr = src; 760e6fbc5bSPravin B Shelar iph->ttl = ttl; 7773f156a6SEric Dumazet __ip_select_ident(iph, skb_shinfo(skb)->gso_segs ?: 1); 780e6fbc5bSPravin B Shelar 79aad88724SEric Dumazet err = ip_local_out_sk(sk, skb); 800e6fbc5bSPravin B Shelar if (unlikely(net_xmit_eval(err))) 810e6fbc5bSPravin B Shelar pkt_len = 0; 820e6fbc5bSPravin B Shelar return pkt_len; 830e6fbc5bSPravin B Shelar } 840e6fbc5bSPravin B Shelar EXPORT_SYMBOL_GPL(iptunnel_xmit); 853d7b46cdSPravin B Shelar 863d7b46cdSPravin B Shelar int iptunnel_pull_header(struct sk_buff *skb, int hdr_len, __be16 inner_proto) 873d7b46cdSPravin B Shelar { 883d7b46cdSPravin B Shelar if (unlikely(!pskb_may_pull(skb, hdr_len))) 893d7b46cdSPravin B Shelar return -ENOMEM; 903d7b46cdSPravin B Shelar 913d7b46cdSPravin B Shelar skb_pull_rcsum(skb, hdr_len); 923d7b46cdSPravin B Shelar 933d7b46cdSPravin B Shelar if (inner_proto == htons(ETH_P_TEB)) { 943d7b46cdSPravin B Shelar struct ethhdr *eh = (struct ethhdr *)skb->data; 953d7b46cdSPravin B Shelar 963d7b46cdSPravin B Shelar if (unlikely(!pskb_may_pull(skb, ETH_HLEN))) 973d7b46cdSPravin B Shelar return -ENOMEM; 983d7b46cdSPravin B Shelar 993d7b46cdSPravin B Shelar if (likely(ntohs(eh->h_proto) >= ETH_P_802_3_MIN)) 1003d7b46cdSPravin B Shelar skb->protocol = eh->h_proto; 1013d7b46cdSPravin B Shelar else 1023d7b46cdSPravin B Shelar skb->protocol = htons(ETH_P_802_2); 1033d7b46cdSPravin B Shelar 1043d7b46cdSPravin B Shelar } else { 1053d7b46cdSPravin B Shelar skb->protocol = inner_proto; 1063d7b46cdSPravin B Shelar } 1073d7b46cdSPravin B Shelar 1083d7b46cdSPravin B Shelar nf_reset(skb); 1093d7b46cdSPravin B Shelar secpath_reset(skb); 1107539fadcSTom Herbert skb_clear_hash_if_not_l4(skb); 111fbd02dd4SPravin B Shelar skb_dst_drop(skb); 1123d7b46cdSPravin B Shelar skb->vlan_tci = 0; 1133d7b46cdSPravin B Shelar skb_set_queue_mapping(skb, 0); 1143d7b46cdSPravin B Shelar skb->pkt_type = PACKET_HOST; 1153d7b46cdSPravin B Shelar return 0; 1163d7b46cdSPravin B Shelar } 1173d7b46cdSPravin B Shelar EXPORT_SYMBOL_GPL(iptunnel_pull_header); 1182d26f0a3SEric Dumazet 1192d26f0a3SEric Dumazet struct sk_buff *iptunnel_handle_offloads(struct sk_buff *skb, 1202d26f0a3SEric Dumazet bool csum_help, 1212d26f0a3SEric Dumazet int gso_type_mask) 1222d26f0a3SEric Dumazet { 1232d26f0a3SEric Dumazet int err; 1242d26f0a3SEric Dumazet 1252d26f0a3SEric Dumazet if (likely(!skb->encapsulation)) { 1262d26f0a3SEric Dumazet skb_reset_inner_headers(skb); 1272d26f0a3SEric Dumazet skb->encapsulation = 1; 1282d26f0a3SEric Dumazet } 1292d26f0a3SEric Dumazet 1302d26f0a3SEric Dumazet if (skb_is_gso(skb)) { 1312d26f0a3SEric Dumazet err = skb_unclone(skb, GFP_ATOMIC); 1322d26f0a3SEric Dumazet if (unlikely(err)) 1332d26f0a3SEric Dumazet goto error; 1342d26f0a3SEric Dumazet skb_shinfo(skb)->gso_type |= gso_type_mask; 1352d26f0a3SEric Dumazet return skb; 1362d26f0a3SEric Dumazet } 1372d26f0a3SEric Dumazet 1387e2b10c1STom Herbert /* If packet is not gso and we are resolving any partial checksum, 1397e2b10c1STom Herbert * clear encapsulation flag. This allows setting CHECKSUM_PARTIAL 1407e2b10c1STom Herbert * on the outer header without confusing devices that implement 1417e2b10c1STom Herbert * NETIF_F_IP_CSUM with encapsulation. 1427e2b10c1STom Herbert */ 1437e2b10c1STom Herbert if (csum_help) 1447e2b10c1STom Herbert skb->encapsulation = 0; 1457e2b10c1STom Herbert 1462d26f0a3SEric Dumazet if (skb->ip_summed == CHECKSUM_PARTIAL && csum_help) { 1472d26f0a3SEric Dumazet err = skb_checksum_help(skb); 1482d26f0a3SEric Dumazet if (unlikely(err)) 1492d26f0a3SEric Dumazet goto error; 1502d26f0a3SEric Dumazet } else if (skb->ip_summed != CHECKSUM_PARTIAL) 1512d26f0a3SEric Dumazet skb->ip_summed = CHECKSUM_NONE; 1522d26f0a3SEric Dumazet 1532d26f0a3SEric Dumazet return skb; 1542d26f0a3SEric Dumazet error: 1552d26f0a3SEric Dumazet kfree_skb(skb); 1562d26f0a3SEric Dumazet return ERR_PTR(err); 1572d26f0a3SEric Dumazet } 1582d26f0a3SEric Dumazet EXPORT_SYMBOL_GPL(iptunnel_handle_offloads); 159ebe44f35SDavid S. Miller 160ebe44f35SDavid S. Miller /* Often modified stats are per cpu, other are shared (netdev->stats) */ 161ebe44f35SDavid S. Miller struct rtnl_link_stats64 *ip_tunnel_get_stats64(struct net_device *dev, 162ebe44f35SDavid S. Miller struct rtnl_link_stats64 *tot) 163ebe44f35SDavid S. Miller { 164ebe44f35SDavid S. Miller int i; 165ebe44f35SDavid S. Miller 166ebe44f35SDavid S. Miller for_each_possible_cpu(i) { 167ebe44f35SDavid S. Miller const struct pcpu_sw_netstats *tstats = 168ebe44f35SDavid S. Miller per_cpu_ptr(dev->tstats, i); 169ebe44f35SDavid S. Miller u64 rx_packets, rx_bytes, tx_packets, tx_bytes; 170ebe44f35SDavid S. Miller unsigned int start; 171ebe44f35SDavid S. Miller 172ebe44f35SDavid S. Miller do { 17357a7744eSEric W. Biederman start = u64_stats_fetch_begin_irq(&tstats->syncp); 174ebe44f35SDavid S. Miller rx_packets = tstats->rx_packets; 175ebe44f35SDavid S. Miller tx_packets = tstats->tx_packets; 176ebe44f35SDavid S. Miller rx_bytes = tstats->rx_bytes; 177ebe44f35SDavid S. Miller tx_bytes = tstats->tx_bytes; 17857a7744eSEric W. Biederman } while (u64_stats_fetch_retry_irq(&tstats->syncp, start)); 179ebe44f35SDavid S. Miller 180ebe44f35SDavid S. Miller tot->rx_packets += rx_packets; 181ebe44f35SDavid S. Miller tot->tx_packets += tx_packets; 182ebe44f35SDavid S. Miller tot->rx_bytes += rx_bytes; 183ebe44f35SDavid S. Miller tot->tx_bytes += tx_bytes; 184ebe44f35SDavid S. Miller } 185ebe44f35SDavid S. Miller 186ebe44f35SDavid S. Miller tot->multicast = dev->stats.multicast; 187ebe44f35SDavid S. Miller 188ebe44f35SDavid S. Miller tot->rx_crc_errors = dev->stats.rx_crc_errors; 189ebe44f35SDavid S. Miller tot->rx_fifo_errors = dev->stats.rx_fifo_errors; 190ebe44f35SDavid S. Miller tot->rx_length_errors = dev->stats.rx_length_errors; 191ebe44f35SDavid S. Miller tot->rx_frame_errors = dev->stats.rx_frame_errors; 192ebe44f35SDavid S. Miller tot->rx_errors = dev->stats.rx_errors; 193ebe44f35SDavid S. Miller 194ebe44f35SDavid S. Miller tot->tx_fifo_errors = dev->stats.tx_fifo_errors; 195ebe44f35SDavid S. Miller tot->tx_carrier_errors = dev->stats.tx_carrier_errors; 196ebe44f35SDavid S. Miller tot->tx_dropped = dev->stats.tx_dropped; 197ebe44f35SDavid S. Miller tot->tx_aborted_errors = dev->stats.tx_aborted_errors; 198ebe44f35SDavid S. Miller tot->tx_errors = dev->stats.tx_errors; 199ebe44f35SDavid S. Miller 200ebe44f35SDavid S. Miller tot->collisions = dev->stats.collisions; 201ebe44f35SDavid S. Miller 202ebe44f35SDavid S. Miller return tot; 203ebe44f35SDavid S. Miller } 204ebe44f35SDavid S. Miller EXPORT_SYMBOL_GPL(ip_tunnel_get_stats64); 205