147505b8bSThomas Gleixner // SPDX-License-Identifier: GPL-2.0-or-later 260c778b2SVlad Yasevich /* SCTP kernel implementation 31da177e4SLinus Torvalds * (C) Copyright IBM Corp. 2001, 2004 41da177e4SLinus Torvalds * Copyright (c) 1999-2000 Cisco, Inc. 51da177e4SLinus Torvalds * Copyright (c) 1999-2001 Motorola, Inc. 61da177e4SLinus Torvalds * Copyright (c) 2001 Intel Corp. 71da177e4SLinus Torvalds * Copyright (c) 2001 Nokia, Inc. 81da177e4SLinus Torvalds * Copyright (c) 2001 La Monte H.P. Yarroll 91da177e4SLinus Torvalds * 1060c778b2SVlad Yasevich * This file is part of the SCTP kernel implementation 111da177e4SLinus Torvalds * 121da177e4SLinus Torvalds * Initialization/cleanup for SCTP protocol support. 131da177e4SLinus Torvalds * 141da177e4SLinus Torvalds * Please send any bug reports or fixes you make to the 151da177e4SLinus Torvalds * email address(es): 1691705c61SDaniel Borkmann * lksctp developers <linux-sctp@vger.kernel.org> 171da177e4SLinus Torvalds * 181da177e4SLinus Torvalds * Written or modified by: 191da177e4SLinus Torvalds * La Monte H.P. Yarroll <piggy@acm.org> 201da177e4SLinus Torvalds * Karl Knutson <karl@athena.chicago.il.us> 211da177e4SLinus Torvalds * Jon Grimm <jgrimm@us.ibm.com> 221da177e4SLinus Torvalds * Sridhar Samudrala <sri@us.ibm.com> 231da177e4SLinus Torvalds * Daisy Chang <daisyc@us.ibm.com> 241da177e4SLinus Torvalds * Ardelle Fan <ardelle.fan@intel.com> 251da177e4SLinus Torvalds */ 261da177e4SLinus Torvalds 27145ce502SJoe Perches #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt 28145ce502SJoe Perches 291da177e4SLinus Torvalds #include <linux/module.h> 301da177e4SLinus Torvalds #include <linux/init.h> 311da177e4SLinus Torvalds #include <linux/netdevice.h> 321da177e4SLinus Torvalds #include <linux/inetdevice.h> 331da177e4SLinus Torvalds #include <linux/seq_file.h> 3457c8a661SMike Rapoport #include <linux/memblock.h> 35845525a6SVlad Yasevich #include <linux/highmem.h> 36845525a6SVlad Yasevich #include <linux/swap.h> 375a0e3ad6STejun Heo #include <linux/slab.h> 38457c4cbcSEric W. Biederman #include <net/net_namespace.h> 391da177e4SLinus Torvalds #include <net/protocol.h> 401da177e4SLinus Torvalds #include <net/ip.h> 411da177e4SLinus Torvalds #include <net/ipv6.h> 4214c85021SArnaldo Carvalho de Melo #include <net/route.h> 431da177e4SLinus Torvalds #include <net/sctp/sctp.h> 441da177e4SLinus Torvalds #include <net/addrconf.h> 451da177e4SLinus Torvalds #include <net/inet_common.h> 461da177e4SLinus Torvalds #include <net/inet_ecn.h> 47965ae444SXin Long #include <net/udp_tunnel.h> 481da177e4SLinus Torvalds 49d9749fb5SNeil Horman #define MAX_SCTP_PORT_HASH_ENTRIES (64 * 1024) 50d9749fb5SNeil Horman 511da177e4SLinus Torvalds /* Global data structures. */ 524cbf1caeSBrian Haley struct sctp_globals sctp_globals __read_mostly; 531da177e4SLinus Torvalds 541da177e4SLinus Torvalds struct idr sctp_assocs_id; 551da177e4SLinus Torvalds DEFINE_SPINLOCK(sctp_assocs_id_lock); 561da177e4SLinus Torvalds 571da177e4SLinus Torvalds static struct sctp_pf *sctp_pf_inet6_specific; 581da177e4SLinus Torvalds static struct sctp_pf *sctp_pf_inet_specific; 591da177e4SLinus Torvalds static struct sctp_af *sctp_af_v4_specific; 601da177e4SLinus Torvalds static struct sctp_af *sctp_af_v6_specific; 611da177e4SLinus Torvalds 62e18b890bSChristoph Lameter struct kmem_cache *sctp_chunk_cachep __read_mostly; 63e18b890bSChristoph Lameter struct kmem_cache *sctp_bucket_cachep __read_mostly; 641da177e4SLinus Torvalds 658d987e5cSEric Dumazet long sysctl_sctp_mem[3]; 66007e3936SVlad Yasevich int sysctl_sctp_rmem[3]; 67007e3936SVlad Yasevich int sysctl_sctp_wmem[3]; 684d93df0aSNeil Horman 691da177e4SLinus Torvalds /* Private helper to extract ipv4 address and stash them in 701da177e4SLinus Torvalds * the protocol structure. 711da177e4SLinus Torvalds */ 721da177e4SLinus Torvalds static void sctp_v4_copy_addrlist(struct list_head *addrlist, 731da177e4SLinus Torvalds struct net_device *dev) 741da177e4SLinus Torvalds { 751da177e4SLinus Torvalds struct in_device *in_dev; 761da177e4SLinus Torvalds struct in_ifaddr *ifa; 771da177e4SLinus Torvalds struct sctp_sockaddr_entry *addr; 781da177e4SLinus Torvalds 791da177e4SLinus Torvalds rcu_read_lock(); 80e5ed6399SHerbert Xu if ((in_dev = __in_dev_get_rcu(dev)) == NULL) { 811da177e4SLinus Torvalds rcu_read_unlock(); 821da177e4SLinus Torvalds return; 831da177e4SLinus Torvalds } 841da177e4SLinus Torvalds 85cd5a411dSFlorian Westphal in_dev_for_each_ifa_rcu(ifa, in_dev) { 861da177e4SLinus Torvalds /* Add the address to the local list. */ 87939cfa75SDaniel Borkmann addr = kzalloc(sizeof(*addr), GFP_ATOMIC); 881da177e4SLinus Torvalds if (addr) { 892a6fd78aSAl Viro addr->a.v4.sin_family = AF_INET; 902a6fd78aSAl Viro addr->a.v4.sin_addr.s_addr = ifa->ifa_local; 9129303547SVlad Yasevich addr->valid = 1; 9229303547SVlad Yasevich INIT_LIST_HEAD(&addr->list); 931da177e4SLinus Torvalds list_add_tail(&addr->list, addrlist); 941da177e4SLinus Torvalds } 951da177e4SLinus Torvalds } 961da177e4SLinus Torvalds 971da177e4SLinus Torvalds rcu_read_unlock(); 981da177e4SLinus Torvalds } 991da177e4SLinus Torvalds 1001da177e4SLinus Torvalds /* Extract our IP addresses from the system and stash them in the 1011da177e4SLinus Torvalds * protocol structure. 1021da177e4SLinus Torvalds */ 1034db67e80SEric W. Biederman static void sctp_get_local_addr_list(struct net *net) 1041da177e4SLinus Torvalds { 1051da177e4SLinus Torvalds struct net_device *dev; 1061da177e4SLinus Torvalds struct list_head *pos; 1071da177e4SLinus Torvalds struct sctp_af *af; 1081da177e4SLinus Torvalds 109c6d14c84SEric Dumazet rcu_read_lock(); 1104db67e80SEric W. Biederman for_each_netdev_rcu(net, dev) { 1112c0740e4SDave Jones list_for_each(pos, &sctp_address_families) { 1121da177e4SLinus Torvalds af = list_entry(pos, struct sctp_af, list); 1134db67e80SEric W. Biederman af->copy_addrlist(&net->sctp.local_addr_list, dev); 1141da177e4SLinus Torvalds } 1151da177e4SLinus Torvalds } 116c6d14c84SEric Dumazet rcu_read_unlock(); 1171da177e4SLinus Torvalds } 1181da177e4SLinus Torvalds 1191da177e4SLinus Torvalds /* Free the existing local addresses. */ 1204db67e80SEric W. Biederman static void sctp_free_local_addr_list(struct net *net) 1211da177e4SLinus Torvalds { 1221da177e4SLinus Torvalds struct sctp_sockaddr_entry *addr; 1231da177e4SLinus Torvalds struct list_head *pos, *temp; 1241da177e4SLinus Torvalds 1254db67e80SEric W. Biederman list_for_each_safe(pos, temp, &net->sctp.local_addr_list) { 1261da177e4SLinus Torvalds addr = list_entry(pos, struct sctp_sockaddr_entry, list); 1271da177e4SLinus Torvalds list_del(pos); 1281da177e4SLinus Torvalds kfree(addr); 1291da177e4SLinus Torvalds } 1301da177e4SLinus Torvalds } 1311da177e4SLinus Torvalds 1321da177e4SLinus Torvalds /* Copy the local addresses which are valid for 'scope' into 'bp'. */ 1334db67e80SEric W. Biederman int sctp_copy_local_addr_list(struct net *net, struct sctp_bind_addr *bp, 1341c662018SXin Long enum sctp_scope scope, gfp_t gfp, int copy_flags) 1351da177e4SLinus Torvalds { 1361da177e4SLinus Torvalds struct sctp_sockaddr_entry *addr; 1372e3ce5bcSXin Long union sctp_addr laddr; 1381da177e4SLinus Torvalds int error = 0; 1391da177e4SLinus Torvalds 14029303547SVlad Yasevich rcu_read_lock(); 1414db67e80SEric W. Biederman list_for_each_entry_rcu(addr, &net->sctp.local_addr_list, list) { 14229303547SVlad Yasevich if (!addr->valid) 14329303547SVlad Yasevich continue; 144165f2cf6SXin Long if (!sctp_in_scope(net, &addr->a, scope)) 145165f2cf6SXin Long continue; 146165f2cf6SXin Long 1471da177e4SLinus Torvalds /* Now that the address is in scope, check to see if 1481da177e4SLinus Torvalds * the address type is really supported by the local 1491da177e4SLinus Torvalds * sock as well as the remote peer. 1501da177e4SLinus Torvalds */ 151165f2cf6SXin Long if (addr->a.sa.sa_family == AF_INET && 152471e39dfSMarcelo Ricardo Leitner (!(copy_flags & SCTP_ADDR4_ALLOWED) || 153471e39dfSMarcelo Ricardo Leitner !(copy_flags & SCTP_ADDR4_PEERSUPP))) 154165f2cf6SXin Long continue; 155165f2cf6SXin Long if (addr->a.sa.sa_family == AF_INET6 && 156165f2cf6SXin Long (!(copy_flags & SCTP_ADDR6_ALLOWED) || 157165f2cf6SXin Long !(copy_flags & SCTP_ADDR6_PEERSUPP))) 158165f2cf6SXin Long continue; 159165f2cf6SXin Long 1602e3ce5bcSXin Long laddr = addr->a; 1612e3ce5bcSXin Long /* also works for setting ipv6 address port */ 1622e3ce5bcSXin Long laddr.v4.sin_port = htons(bp->port); 1632e3ce5bcSXin Long if (sctp_bind_addr_state(bp, &laddr) != -1) 164b8607805SXin Long continue; 165b8607805SXin Long 166165f2cf6SXin Long error = sctp_add_bind_addr(bp, &addr->a, sizeof(addr->a), 167f57d96b2SVlad Yasevich SCTP_ADDR_SRC, GFP_ATOMIC); 1681da177e4SLinus Torvalds if (error) 169165f2cf6SXin Long break; 1701da177e4SLinus Torvalds } 1711da177e4SLinus Torvalds 17229303547SVlad Yasevich rcu_read_unlock(); 1731da177e4SLinus Torvalds return error; 1741da177e4SLinus Torvalds } 1751da177e4SLinus Torvalds 176b7e10c25SRichard Haines /* Copy over any ip options */ 177b7e10c25SRichard Haines static void sctp_v4_copy_ip_options(struct sock *sk, struct sock *newsk) 178b7e10c25SRichard Haines { 179b7e10c25SRichard Haines struct inet_sock *newinet, *inet = inet_sk(sk); 180b7e10c25SRichard Haines struct ip_options_rcu *inet_opt, *newopt = NULL; 181b7e10c25SRichard Haines 182b7e10c25SRichard Haines newinet = inet_sk(newsk); 183b7e10c25SRichard Haines 184b7e10c25SRichard Haines rcu_read_lock(); 185b7e10c25SRichard Haines inet_opt = rcu_dereference(inet->inet_opt); 186b7e10c25SRichard Haines if (inet_opt) { 187b7e10c25SRichard Haines newopt = sock_kmalloc(newsk, sizeof(*inet_opt) + 188b7e10c25SRichard Haines inet_opt->opt.optlen, GFP_ATOMIC); 189b7e10c25SRichard Haines if (newopt) 190b7e10c25SRichard Haines memcpy(newopt, inet_opt, sizeof(*inet_opt) + 191b7e10c25SRichard Haines inet_opt->opt.optlen); 192b7e10c25SRichard Haines else 193b7e10c25SRichard Haines pr_err("%s: Failed to copy ip options\n", __func__); 194b7e10c25SRichard Haines } 195b7e10c25SRichard Haines RCU_INIT_POINTER(newinet->inet_opt, newopt); 196b7e10c25SRichard Haines rcu_read_unlock(); 197b7e10c25SRichard Haines } 198b7e10c25SRichard Haines 199b7e10c25SRichard Haines /* Account for the IP options */ 200b7e10c25SRichard Haines static int sctp_v4_ip_options_len(struct sock *sk) 201b7e10c25SRichard Haines { 202b7e10c25SRichard Haines struct inet_sock *inet = inet_sk(sk); 203b7e10c25SRichard Haines struct ip_options_rcu *inet_opt; 204b7e10c25SRichard Haines int len = 0; 205b7e10c25SRichard Haines 206b7e10c25SRichard Haines rcu_read_lock(); 207b7e10c25SRichard Haines inet_opt = rcu_dereference(inet->inet_opt); 208b7e10c25SRichard Haines if (inet_opt) 209b7e10c25SRichard Haines len = inet_opt->opt.optlen; 210b7e10c25SRichard Haines 211b7e10c25SRichard Haines rcu_read_unlock(); 212b7e10c25SRichard Haines return len; 213b7e10c25SRichard Haines } 214b7e10c25SRichard Haines 2151da177e4SLinus Torvalds /* Initialize a sctp_addr from in incoming skb. */ 2161da177e4SLinus Torvalds static void sctp_v4_from_skb(union sctp_addr *addr, struct sk_buff *skb, 2171da177e4SLinus Torvalds int is_saddr) 2181da177e4SLinus Torvalds { 2190630c56eSMarcelo Ricardo Leitner /* Always called on head skb, so this is safe */ 2200630c56eSMarcelo Ricardo Leitner struct sctphdr *sh = sctp_hdr(skb); 2210630c56eSMarcelo Ricardo Leitner struct sockaddr_in *sa = &addr->v4; 2221da177e4SLinus Torvalds 2231da177e4SLinus Torvalds addr->v4.sin_family = AF_INET; 2241da177e4SLinus Torvalds 2251da177e4SLinus Torvalds if (is_saddr) { 2260630c56eSMarcelo Ricardo Leitner sa->sin_port = sh->source; 2270630c56eSMarcelo Ricardo Leitner sa->sin_addr.s_addr = ip_hdr(skb)->saddr; 2281da177e4SLinus Torvalds } else { 2290630c56eSMarcelo Ricardo Leitner sa->sin_port = sh->dest; 2300630c56eSMarcelo Ricardo Leitner sa->sin_addr.s_addr = ip_hdr(skb)->daddr; 2311da177e4SLinus Torvalds } 232b6f3320bSXin Long memset(sa->sin_zero, 0, sizeof(sa->sin_zero)); 2331da177e4SLinus Torvalds } 2341da177e4SLinus Torvalds 2351da177e4SLinus Torvalds /* Initialize an sctp_addr from a socket. */ 2361da177e4SLinus Torvalds static void sctp_v4_from_sk(union sctp_addr *addr, struct sock *sk) 2371da177e4SLinus Torvalds { 2381da177e4SLinus Torvalds addr->v4.sin_family = AF_INET; 2397dcdbd95SAl Viro addr->v4.sin_port = 0; 240c720c7e8SEric Dumazet addr->v4.sin_addr.s_addr = inet_sk(sk)->inet_rcv_saddr; 241b6f3320bSXin Long memset(addr->v4.sin_zero, 0, sizeof(addr->v4.sin_zero)); 2421da177e4SLinus Torvalds } 2431da177e4SLinus Torvalds 2441da177e4SLinus Torvalds /* Initialize sk->sk_rcv_saddr from sctp_addr. */ 2451da177e4SLinus Torvalds static void sctp_v4_to_sk_saddr(union sctp_addr *addr, struct sock *sk) 2461da177e4SLinus Torvalds { 247c720c7e8SEric Dumazet inet_sk(sk)->inet_rcv_saddr = addr->v4.sin_addr.s_addr; 2481da177e4SLinus Torvalds } 2491da177e4SLinus Torvalds 2501da177e4SLinus Torvalds /* Initialize sk->sk_daddr from sctp_addr. */ 2511da177e4SLinus Torvalds static void sctp_v4_to_sk_daddr(union sctp_addr *addr, struct sock *sk) 2521da177e4SLinus Torvalds { 253c720c7e8SEric Dumazet inet_sk(sk)->inet_daddr = addr->v4.sin_addr.s_addr; 2541da177e4SLinus Torvalds } 2551da177e4SLinus Torvalds 2561da177e4SLinus Torvalds /* Initialize a sctp_addr from an address parameter. */ 257*0c5dc070SMarcelo Ricardo Leitner static bool sctp_v4_from_addr_param(union sctp_addr *addr, 2581da177e4SLinus Torvalds union sctp_addr_param *param, 259dd86d136SAl Viro __be16 port, int iif) 2601da177e4SLinus Torvalds { 261*0c5dc070SMarcelo Ricardo Leitner if (ntohs(param->v4.param_hdr.length) < sizeof(struct sctp_ipv4addr_param)) 262*0c5dc070SMarcelo Ricardo Leitner return false; 263*0c5dc070SMarcelo Ricardo Leitner 2641da177e4SLinus Torvalds addr->v4.sin_family = AF_INET; 2651da177e4SLinus Torvalds addr->v4.sin_port = port; 2661da177e4SLinus Torvalds addr->v4.sin_addr.s_addr = param->v4.addr.s_addr; 267b6f3320bSXin Long memset(addr->v4.sin_zero, 0, sizeof(addr->v4.sin_zero)); 268*0c5dc070SMarcelo Ricardo Leitner 269*0c5dc070SMarcelo Ricardo Leitner return true; 2701da177e4SLinus Torvalds } 2711da177e4SLinus Torvalds 2721da177e4SLinus Torvalds /* Initialize an address parameter from a sctp_addr and return the length 2731da177e4SLinus Torvalds * of the address parameter. 2741da177e4SLinus Torvalds */ 2751da177e4SLinus Torvalds static int sctp_v4_to_addr_param(const union sctp_addr *addr, 2761da177e4SLinus Torvalds union sctp_addr_param *param) 2771da177e4SLinus Torvalds { 278a38905e6SXin Long int length = sizeof(struct sctp_ipv4addr_param); 2791da177e4SLinus Torvalds 2801da177e4SLinus Torvalds param->v4.param_hdr.type = SCTP_PARAM_IPV4_ADDRESS; 281dbc16db1SAl Viro param->v4.param_hdr.length = htons(length); 2821da177e4SLinus Torvalds param->v4.addr.s_addr = addr->v4.sin_addr.s_addr; 2831da177e4SLinus Torvalds 2841da177e4SLinus Torvalds return length; 2851da177e4SLinus Torvalds } 2861da177e4SLinus Torvalds 2871da177e4SLinus Torvalds /* Initialize a sctp_addr from a dst_entry. */ 28818a353f4SDavid S. Miller static void sctp_v4_dst_saddr(union sctp_addr *saddr, struct flowi4 *fl4, 289854d43a4SAl Viro __be16 port) 2901da177e4SLinus Torvalds { 2911da177e4SLinus Torvalds saddr->v4.sin_family = AF_INET; 2921da177e4SLinus Torvalds saddr->v4.sin_port = port; 29318a353f4SDavid S. Miller saddr->v4.sin_addr.s_addr = fl4->saddr; 294b6f3320bSXin Long memset(saddr->v4.sin_zero, 0, sizeof(saddr->v4.sin_zero)); 2951da177e4SLinus Torvalds } 2961da177e4SLinus Torvalds 2971da177e4SLinus Torvalds /* Compare two addresses exactly. */ 2981da177e4SLinus Torvalds static int sctp_v4_cmp_addr(const union sctp_addr *addr1, 2991da177e4SLinus Torvalds const union sctp_addr *addr2) 3001da177e4SLinus Torvalds { 3011da177e4SLinus Torvalds if (addr1->sa.sa_family != addr2->sa.sa_family) 3021da177e4SLinus Torvalds return 0; 3031da177e4SLinus Torvalds if (addr1->v4.sin_port != addr2->v4.sin_port) 3041da177e4SLinus Torvalds return 0; 3051da177e4SLinus Torvalds if (addr1->v4.sin_addr.s_addr != addr2->v4.sin_addr.s_addr) 3061da177e4SLinus Torvalds return 0; 3071da177e4SLinus Torvalds 3081da177e4SLinus Torvalds return 1; 3091da177e4SLinus Torvalds } 3101da177e4SLinus Torvalds 3111da177e4SLinus Torvalds /* Initialize addr struct to INADDR_ANY. */ 3126fbfa9f9SAl Viro static void sctp_v4_inaddr_any(union sctp_addr *addr, __be16 port) 3131da177e4SLinus Torvalds { 3141da177e4SLinus Torvalds addr->v4.sin_family = AF_INET; 315e6f1cebfSAl Viro addr->v4.sin_addr.s_addr = htonl(INADDR_ANY); 3161da177e4SLinus Torvalds addr->v4.sin_port = port; 317b6f3320bSXin Long memset(addr->v4.sin_zero, 0, sizeof(addr->v4.sin_zero)); 3181da177e4SLinus Torvalds } 3191da177e4SLinus Torvalds 3201da177e4SLinus Torvalds /* Is this a wildcard address? */ 3211da177e4SLinus Torvalds static int sctp_v4_is_any(const union sctp_addr *addr) 3221da177e4SLinus Torvalds { 323e6f1cebfSAl Viro return htonl(INADDR_ANY) == addr->v4.sin_addr.s_addr; 3241da177e4SLinus Torvalds } 3251da177e4SLinus Torvalds 3261da177e4SLinus Torvalds /* This function checks if the address is a valid address to be used for 3271da177e4SLinus Torvalds * SCTP binding. 3281da177e4SLinus Torvalds * 3291da177e4SLinus Torvalds * Output: 3301da177e4SLinus Torvalds * Return 0 - If the address is a non-unicast or an illegal address. 3311da177e4SLinus Torvalds * Return 1 - If the address is a unicast. 3321da177e4SLinus Torvalds */ 3335636bef7SVlad Yasevich static int sctp_v4_addr_valid(union sctp_addr *addr, 3345636bef7SVlad Yasevich struct sctp_sock *sp, 3355636bef7SVlad Yasevich const struct sk_buff *skb) 3361da177e4SLinus Torvalds { 3377dab83deSVlad Yasevich /* IPv4 addresses not allowed */ 3387dab83deSVlad Yasevich if (sp && ipv6_only_sock(sctp_opt2sk(sp))) 3397dab83deSVlad Yasevich return 0; 3407dab83deSVlad Yasevich 3411da177e4SLinus Torvalds /* Is this a non-unicast address or a unusable SCTP address? */ 342b5cb2bbcSJoe Perches if (IS_IPV4_UNUSABLE_ADDRESS(addr->v4.sin_addr.s_addr)) 3431da177e4SLinus Torvalds return 0; 3441da177e4SLinus Torvalds 3455636bef7SVlad Yasevich /* Is this a broadcast address? */ 346511c3f92SEric Dumazet if (skb && skb_rtable(skb)->rt_flags & RTCF_BROADCAST) 3475636bef7SVlad Yasevich return 0; 3485636bef7SVlad Yasevich 3491da177e4SLinus Torvalds return 1; 3501da177e4SLinus Torvalds } 3511da177e4SLinus Torvalds 3521da177e4SLinus Torvalds /* Should this be available for binding? */ 3531da177e4SLinus Torvalds static int sctp_v4_available(union sctp_addr *addr, struct sctp_sock *sp) 3541da177e4SLinus Torvalds { 355bb2db45bSEric W. Biederman struct net *net = sock_net(&sp->inet.sk); 356bb2db45bSEric W. Biederman int ret = inet_addr_type(net, addr->v4.sin_addr.s_addr); 3571da177e4SLinus Torvalds 3581da177e4SLinus Torvalds 359e6f1cebfSAl Viro if (addr->v4.sin_addr.s_addr != htonl(INADDR_ANY) && 360cdac4e07SNeil Horman ret != RTN_LOCAL && 361cdac4e07SNeil Horman !sp->inet.freebind && 36249a60158SVincent Bernat !net->ipv4.sysctl_ip_nonlocal_bind) 3631da177e4SLinus Torvalds return 0; 364cdac4e07SNeil Horman 3657dab83deSVlad Yasevich if (ipv6_only_sock(sctp_opt2sk(sp))) 3667dab83deSVlad Yasevich return 0; 3677dab83deSVlad Yasevich 3681da177e4SLinus Torvalds return 1; 3691da177e4SLinus Torvalds } 3701da177e4SLinus Torvalds 3711da177e4SLinus Torvalds /* Checking the loopback, private and other address scopes as defined in 3721da177e4SLinus Torvalds * RFC 1918. The IPv4 scoping is based on the draft for SCTP IPv4 3731da177e4SLinus Torvalds * scoping <draft-stewart-tsvwg-sctp-ipv4-00.txt>. 3741da177e4SLinus Torvalds * 3751da177e4SLinus Torvalds * Level 0 - unusable SCTP addresses 3761da177e4SLinus Torvalds * Level 1 - loopback address 3771da177e4SLinus Torvalds * Level 2 - link-local addresses 3781da177e4SLinus Torvalds * Level 3 - private addresses. 3791da177e4SLinus Torvalds * Level 4 - global addresses 3801da177e4SLinus Torvalds * For INIT and INIT-ACK address list, let L be the level of 38193c3216aSRandy Dunlap * requested destination address, sender and receiver 3821da177e4SLinus Torvalds * SHOULD include all of its addresses with level greater 3831da177e4SLinus Torvalds * than or equal to L. 38472388433SBhaskar Dutta * 38572388433SBhaskar Dutta * IPv4 scoping can be controlled through sysctl option 38672388433SBhaskar Dutta * net.sctp.addr_scope_policy 3871da177e4SLinus Torvalds */ 3881c662018SXin Long static enum sctp_scope sctp_v4_scope(union sctp_addr *addr) 3891da177e4SLinus Torvalds { 3901c662018SXin Long enum sctp_scope retval; 3911da177e4SLinus Torvalds 3921da177e4SLinus Torvalds /* Check for unusable SCTP addresses. */ 393b5cb2bbcSJoe Perches if (IS_IPV4_UNUSABLE_ADDRESS(addr->v4.sin_addr.s_addr)) { 3941da177e4SLinus Torvalds retval = SCTP_SCOPE_UNUSABLE; 395b5cb2bbcSJoe Perches } else if (ipv4_is_loopback(addr->v4.sin_addr.s_addr)) { 3961da177e4SLinus Torvalds retval = SCTP_SCOPE_LOOPBACK; 397b5cb2bbcSJoe Perches } else if (ipv4_is_linklocal_169(addr->v4.sin_addr.s_addr)) { 3981da177e4SLinus Torvalds retval = SCTP_SCOPE_LINK; 399b5cb2bbcSJoe Perches } else if (ipv4_is_private_10(addr->v4.sin_addr.s_addr) || 400b5cb2bbcSJoe Perches ipv4_is_private_172(addr->v4.sin_addr.s_addr) || 401b5cb2bbcSJoe Perches ipv4_is_private_192(addr->v4.sin_addr.s_addr)) { 4021da177e4SLinus Torvalds retval = SCTP_SCOPE_PRIVATE; 4031da177e4SLinus Torvalds } else { 4041da177e4SLinus Torvalds retval = SCTP_SCOPE_GLOBAL; 4051da177e4SLinus Torvalds } 4061da177e4SLinus Torvalds 4071da177e4SLinus Torvalds return retval; 4081da177e4SLinus Torvalds } 4091da177e4SLinus Torvalds 4101da177e4SLinus Torvalds /* Returns a valid dst cache entry for the given source and destination ip 4111da177e4SLinus Torvalds * addresses. If an association is passed, trys to get a dst entry with a 4121da177e4SLinus Torvalds * source address that matches an address in the bind address list. 4131da177e4SLinus Torvalds */ 414da0420beSVlad Yasevich static void sctp_v4_get_dst(struct sctp_transport *t, union sctp_addr *saddr, 415da0420beSVlad Yasevich struct flowi *fl, struct sock *sk) 4161da177e4SLinus Torvalds { 417da0420beSVlad Yasevich struct sctp_association *asoc = t->asoc; 4181da177e4SLinus Torvalds struct rtable *rt; 419582eea23SMarcelo Ricardo Leitner struct flowi _fl; 420582eea23SMarcelo Ricardo Leitner struct flowi4 *fl4 = &_fl.u.ip4; 4211da177e4SLinus Torvalds struct sctp_bind_addr *bp; 4221da177e4SLinus Torvalds struct sctp_sockaddr_entry *laddr; 4231da177e4SLinus Torvalds struct dst_entry *dst = NULL; 424da0420beSVlad Yasevich union sctp_addr *daddr = &t->ipaddr; 4251da177e4SLinus Torvalds union sctp_addr dst_saddr; 4268a9c58d2SXin Long __u8 tos = inet_sk(sk)->tos; 4271da177e4SLinus Torvalds 4288a9c58d2SXin Long if (t->dscp & SCTP_DSCP_SET_MASK) 4298a9c58d2SXin Long tos = t->dscp & SCTP_DSCP_VAL_MASK; 430582eea23SMarcelo Ricardo Leitner memset(&_fl, 0x0, sizeof(_fl)); 4319914ae3cSVlad Yasevich fl4->daddr = daddr->v4.sin_addr.s_addr; 4329914ae3cSVlad Yasevich fl4->fl4_dport = daddr->v4.sin_port; 4339914ae3cSVlad Yasevich fl4->flowi4_proto = IPPROTO_SCTP; 4341da177e4SLinus Torvalds if (asoc) { 4358a9c58d2SXin Long fl4->flowi4_tos = RT_CONN_FLAGS_TOS(asoc->base.sk, tos); 4369914ae3cSVlad Yasevich fl4->flowi4_oif = asoc->base.sk->sk_bound_dev_if; 4379914ae3cSVlad Yasevich fl4->fl4_sport = htons(asoc->base.bind_addr.port); 4381da177e4SLinus Torvalds } 4396429d3dcSWei Yongjun if (saddr) { 4409914ae3cSVlad Yasevich fl4->saddr = saddr->v4.sin_addr.s_addr; 441ecf938feSXin Long if (!fl4->fl4_sport) 4429914ae3cSVlad Yasevich fl4->fl4_sport = saddr->v4.sin_port; 4436429d3dcSWei Yongjun } 4441da177e4SLinus Torvalds 445bb33381dSDaniel Borkmann pr_debug("%s: dst:%pI4, src:%pI4 - ", __func__, &fl4->daddr, 446bb33381dSDaniel Borkmann &fl4->saddr); 4471da177e4SLinus Torvalds 448bb2db45bSEric W. Biederman rt = ip_route_output_key(sock_net(sk), fl4); 449582eea23SMarcelo Ricardo Leitner if (!IS_ERR(rt)) { 450d8d1f30bSChangli Gao dst = &rt->dst; 451582eea23SMarcelo Ricardo Leitner t->dst = dst; 452582eea23SMarcelo Ricardo Leitner memcpy(fl, &_fl, sizeof(_fl)); 453582eea23SMarcelo Ricardo Leitner } 4541da177e4SLinus Torvalds 4551da177e4SLinus Torvalds /* If there is no association or if a source address is passed, no 4561da177e4SLinus Torvalds * more validation is required. 4571da177e4SLinus Torvalds */ 4581da177e4SLinus Torvalds if (!asoc || saddr) 4591da177e4SLinus Torvalds goto out; 4601da177e4SLinus Torvalds 4611da177e4SLinus Torvalds bp = &asoc->base.bind_addr; 4621da177e4SLinus Torvalds 4631da177e4SLinus Torvalds if (dst) { 4641da177e4SLinus Torvalds /* Walk through the bind address list and look for a bind 4651da177e4SLinus Torvalds * address that matches the source address of the returned dst. 4661da177e4SLinus Torvalds */ 46718a353f4SDavid S. Miller sctp_v4_dst_saddr(&dst_saddr, fl4, htons(bp->port)); 468559cf710SVlad Yasevich rcu_read_lock(); 469559cf710SVlad Yasevich list_for_each_entry_rcu(laddr, &bp->address_list, list) { 4708a07eb0aSMichio Honda if (!laddr->valid || (laddr->state == SCTP_ADDR_DEL) || 4718a07eb0aSMichio Honda (laddr->state != SCTP_ADDR_SRC && 4728a07eb0aSMichio Honda !asoc->src_out_of_asoc_ok)) 473dc022a98SSridhar Samudrala continue; 474854d43a4SAl Viro if (sctp_v4_cmp_addr(&dst_saddr, &laddr->a)) 4751da177e4SLinus Torvalds goto out_unlock; 4761da177e4SLinus Torvalds } 477559cf710SVlad Yasevich rcu_read_unlock(); 4781da177e4SLinus Torvalds 4791da177e4SLinus Torvalds /* None of the bound addresses match the source address of the 4801da177e4SLinus Torvalds * dst. So release it. 4811da177e4SLinus Torvalds */ 4821da177e4SLinus Torvalds dst_release(dst); 4831da177e4SLinus Torvalds dst = NULL; 4841da177e4SLinus Torvalds } 4851da177e4SLinus Torvalds 4861da177e4SLinus Torvalds /* Walk through the bind address list and try to get a dst that 4871da177e4SLinus Torvalds * matches a bind address as the source address. 4881da177e4SLinus Torvalds */ 489559cf710SVlad Yasevich rcu_read_lock(); 490559cf710SVlad Yasevich list_for_each_entry_rcu(laddr, &bp->address_list, list) { 4910ca50d12SMarcelo Ricardo Leitner struct net_device *odev; 4920ca50d12SMarcelo Ricardo Leitner 493559cf710SVlad Yasevich if (!laddr->valid) 494559cf710SVlad Yasevich continue; 49507868284SMarcelo Ricardo Leitner if (laddr->state != SCTP_ADDR_SRC || 49607868284SMarcelo Ricardo Leitner AF_INET != laddr->a.sa.sa_family) 49707868284SMarcelo Ricardo Leitner continue; 49807868284SMarcelo Ricardo Leitner 4999914ae3cSVlad Yasevich fl4->fl4_sport = laddr->a.v4.sin_port; 50085350871SXufeng Zhang flowi4_update_output(fl4, 50185350871SXufeng Zhang asoc->base.sk->sk_bound_dev_if, 5028a9c58d2SXin Long RT_CONN_FLAGS_TOS(asoc->base.sk, tos), 50385350871SXufeng Zhang daddr->v4.sin_addr.s_addr, 50485350871SXufeng Zhang laddr->a.v4.sin_addr.s_addr); 50585350871SXufeng Zhang 506bb2db45bSEric W. Biederman rt = ip_route_output_key(sock_net(sk), fl4); 50707868284SMarcelo Ricardo Leitner if (IS_ERR(rt)) 50807868284SMarcelo Ricardo Leitner continue; 50907868284SMarcelo Ricardo Leitner 5100ca50d12SMarcelo Ricardo Leitner /* Ensure the src address belongs to the output 5110ca50d12SMarcelo Ricardo Leitner * interface. 5120ca50d12SMarcelo Ricardo Leitner */ 5130ca50d12SMarcelo Ricardo Leitner odev = __ip_dev_find(sock_net(sk), laddr->a.v4.sin_addr.s_addr, 5140ca50d12SMarcelo Ricardo Leitner false); 515d82f0f1fSMarcelo Ricardo Leitner if (!odev || odev->ifindex != fl4->flowi4_oif) { 516582eea23SMarcelo Ricardo Leitner if (!dst) { 5174a31a6b1STommi Rantala dst = &rt->dst; 518582eea23SMarcelo Ricardo Leitner t->dst = dst; 519582eea23SMarcelo Ricardo Leitner memcpy(fl, &_fl, sizeof(_fl)); 520582eea23SMarcelo Ricardo Leitner } else { 521d82f0f1fSMarcelo Ricardo Leitner dst_release(&rt->dst); 522582eea23SMarcelo Ricardo Leitner } 5230ca50d12SMarcelo Ricardo Leitner continue; 524d82f0f1fSMarcelo Ricardo Leitner } 5250ca50d12SMarcelo Ricardo Leitner 526410f0383SMarcelo Ricardo Leitner dst_release(dst); 527d8d1f30bSChangli Gao dst = &rt->dst; 528582eea23SMarcelo Ricardo Leitner t->dst = dst; 529582eea23SMarcelo Ricardo Leitner memcpy(fl, &_fl, sizeof(_fl)); 53007868284SMarcelo Ricardo Leitner break; 5311da177e4SLinus Torvalds } 5321da177e4SLinus Torvalds 5331da177e4SLinus Torvalds out_unlock: 534559cf710SVlad Yasevich rcu_read_unlock(); 5351da177e4SLinus Torvalds out: 536582eea23SMarcelo Ricardo Leitner if (dst) { 537bb33381dSDaniel Borkmann pr_debug("rt_dst:%pI4, rt_src:%pI4\n", 538582eea23SMarcelo Ricardo Leitner &fl->u.ip4.daddr, &fl->u.ip4.saddr); 539582eea23SMarcelo Ricardo Leitner } else { 540582eea23SMarcelo Ricardo Leitner t->dst = NULL; 541bb33381dSDaniel Borkmann pr_debug("no route\n"); 5421da177e4SLinus Torvalds } 543582eea23SMarcelo Ricardo Leitner } 5441da177e4SLinus Torvalds 5451da177e4SLinus Torvalds /* For v4, the source address is cached in the route entry(dst). So no need 5461da177e4SLinus Torvalds * to cache it separately and hence this is an empty routine. 5471da177e4SLinus Torvalds */ 548e5117101SYOSHIFUJI Hideaki static void sctp_v4_get_saddr(struct sctp_sock *sk, 5499914ae3cSVlad Yasevich struct sctp_transport *t, 5509914ae3cSVlad Yasevich struct flowi *fl) 5511da177e4SLinus Torvalds { 5529914ae3cSVlad Yasevich union sctp_addr *saddr = &t->saddr; 5539914ae3cSVlad Yasevich struct rtable *rt = (struct rtable *)t->dst; 55423ec47a0SVladislav Yasevich 5551da177e4SLinus Torvalds if (rt) { 5561da177e4SLinus Torvalds saddr->v4.sin_family = AF_INET; 557902ebd3eSDavid S. Miller saddr->v4.sin_addr.s_addr = fl->u.ip4.saddr; 5581da177e4SLinus Torvalds } 5591da177e4SLinus Torvalds } 5601da177e4SLinus Torvalds 5611da177e4SLinus Torvalds /* What interface did this skb arrive on? */ 5621da177e4SLinus Torvalds static int sctp_v4_skb_iif(const struct sk_buff *skb) 5631da177e4SLinus Torvalds { 56492101b3bSDavid S. Miller return inet_iif(skb); 5651da177e4SLinus Torvalds } 5661da177e4SLinus Torvalds 5671da177e4SLinus Torvalds /* Was this packet marked by Explicit Congestion Notification? */ 5681da177e4SLinus Torvalds static int sctp_v4_is_ce(const struct sk_buff *skb) 5691da177e4SLinus Torvalds { 570eddc9ec5SArnaldo Carvalho de Melo return INET_ECN_is_ce(ip_hdr(skb)->tos); 5711da177e4SLinus Torvalds } 5721da177e4SLinus Torvalds 5731da177e4SLinus Torvalds /* Create and initialize a new sk for the socket returned by accept(). */ 5741da177e4SLinus Torvalds static struct sock *sctp_v4_create_accept_sk(struct sock *sk, 575cdfbabfbSDavid Howells struct sctp_association *asoc, 576cdfbabfbSDavid Howells bool kern) 5771da177e4SLinus Torvalds { 5783b1e0a65SYOSHIFUJI Hideaki struct sock *newsk = sk_alloc(sock_net(sk), PF_INET, GFP_KERNEL, 579cdfbabfbSDavid Howells sk->sk_prot, kern); 580914e1c8bSVlad Yasevich struct inet_sock *newinet; 5811da177e4SLinus Torvalds 5821da177e4SLinus Torvalds if (!newsk) 5831da177e4SLinus Torvalds goto out; 5841da177e4SLinus Torvalds 5851da177e4SLinus Torvalds sock_init_data(NULL, newsk); 5861da177e4SLinus Torvalds 587914e1c8bSVlad Yasevich sctp_copy_sock(newsk, sk, asoc); 5881da177e4SLinus Torvalds sock_reset_flag(newsk, SOCK_ZAPPED); 5891da177e4SLinus Torvalds 590b7e10c25SRichard Haines sctp_v4_copy_ip_options(sk, newsk); 591b7e10c25SRichard Haines 5921da177e4SLinus Torvalds newinet = inet_sk(newsk); 5931da177e4SLinus Torvalds 594c720c7e8SEric Dumazet newinet->inet_daddr = asoc->peer.primary_addr.v4.sin_addr.s_addr; 5951da177e4SLinus Torvalds 596e6848976SArnaldo Carvalho de Melo sk_refcnt_debug_inc(newsk); 5971da177e4SLinus Torvalds 5981da177e4SLinus Torvalds if (newsk->sk_prot->init(newsk)) { 5991da177e4SLinus Torvalds sk_common_release(newsk); 6001da177e4SLinus Torvalds newsk = NULL; 6011da177e4SLinus Torvalds } 6021da177e4SLinus Torvalds 6031da177e4SLinus Torvalds out: 6041da177e4SLinus Torvalds return newsk; 6051da177e4SLinus Torvalds } 6061da177e4SLinus Torvalds 607299ee123SJason Gunthorpe static int sctp_v4_addr_to_user(struct sctp_sock *sp, union sctp_addr *addr) 6081da177e4SLinus Torvalds { 609299ee123SJason Gunthorpe /* No address mapping for V4 sockets */ 61009279e61SXin Long memset(addr->v4.sin_zero, 0, sizeof(addr->v4.sin_zero)); 611299ee123SJason Gunthorpe return sizeof(struct sockaddr_in); 6121da177e4SLinus Torvalds } 6131da177e4SLinus Torvalds 6141da177e4SLinus Torvalds /* Dump the v4 addr to the seq file. */ 6151da177e4SLinus Torvalds static void sctp_v4_seq_dump_addr(struct seq_file *seq, union sctp_addr *addr) 6161da177e4SLinus Torvalds { 61721454aaaSHarvey Harrison seq_printf(seq, "%pI4 ", &addr->v4.sin_addr); 6181da177e4SLinus Torvalds } 6191da177e4SLinus Torvalds 620b9031d9dSVlad Yasevich static void sctp_v4_ecn_capable(struct sock *sk) 621b9031d9dSVlad Yasevich { 622b9031d9dSVlad Yasevich INET_ECN_xmit(sk); 623b9031d9dSVlad Yasevich } 624b9031d9dSVlad Yasevich 6259c3b5751SKees Cook static void sctp_addr_wq_timeout_handler(struct timer_list *t) 6269f7d653bSMichio Honda { 6279c3b5751SKees Cook struct net *net = from_timer(net, t, sctp.addr_wq_timer); 6289f7d653bSMichio Honda struct sctp_sockaddr_entry *addrw, *temp; 6299f7d653bSMichio Honda struct sctp_sock *sp; 6309f7d653bSMichio Honda 6314db67e80SEric W. Biederman spin_lock_bh(&net->sctp.addr_wq_lock); 6329f7d653bSMichio Honda 6334db67e80SEric W. Biederman list_for_each_entry_safe(addrw, temp, &net->sctp.addr_waitq, list) { 634bb33381dSDaniel Borkmann pr_debug("%s: the first ent in wq:%p is addr:%pISc for cmd:%d at " 635bb33381dSDaniel Borkmann "entry:%p\n", __func__, &net->sctp.addr_waitq, &addrw->a.sa, 636bb33381dSDaniel Borkmann addrw->state, addrw); 6379f7d653bSMichio Honda 638dfd56b8bSEric Dumazet #if IS_ENABLED(CONFIG_IPV6) 6399f7d653bSMichio Honda /* Now we send an ASCONF for each association */ 6409f7d653bSMichio Honda /* Note. we currently don't handle link local IPv6 addressees */ 6419f7d653bSMichio Honda if (addrw->a.sa.sa_family == AF_INET6) { 6429f7d653bSMichio Honda struct in6_addr *in6; 6439f7d653bSMichio Honda 6449f7d653bSMichio Honda if (ipv6_addr_type(&addrw->a.v6.sin6_addr) & 6459f7d653bSMichio Honda IPV6_ADDR_LINKLOCAL) 6469f7d653bSMichio Honda goto free_next; 6479f7d653bSMichio Honda 6489f7d653bSMichio Honda in6 = (struct in6_addr *)&addrw->a.v6.sin6_addr; 6494db67e80SEric W. Biederman if (ipv6_chk_addr(net, in6, NULL, 0) == 0 && 6509f7d653bSMichio Honda addrw->state == SCTP_ADDR_NEW) { 6519f7d653bSMichio Honda unsigned long timeo_val; 6529f7d653bSMichio Honda 653bb33381dSDaniel Borkmann pr_debug("%s: this is on DAD, trying %d sec " 654bb33381dSDaniel Borkmann "later\n", __func__, 6559f7d653bSMichio Honda SCTP_ADDRESS_TICK_DELAY); 656bb33381dSDaniel Borkmann 6579f7d653bSMichio Honda timeo_val = jiffies; 6589f7d653bSMichio Honda timeo_val += msecs_to_jiffies(SCTP_ADDRESS_TICK_DELAY); 6594db67e80SEric W. Biederman mod_timer(&net->sctp.addr_wq_timer, timeo_val); 6609f7d653bSMichio Honda break; 6619f7d653bSMichio Honda } 6629f7d653bSMichio Honda } 6635d0c90cfSDavid S. Miller #endif 6644db67e80SEric W. Biederman list_for_each_entry(sp, &net->sctp.auto_asconf_splist, auto_asconf_list) { 6659f7d653bSMichio Honda struct sock *sk; 6669f7d653bSMichio Honda 6679f7d653bSMichio Honda sk = sctp_opt2sk(sp); 6689f7d653bSMichio Honda /* ignore bound-specific endpoints */ 6699f7d653bSMichio Honda if (!sctp_is_ep_boundall(sk)) 6709f7d653bSMichio Honda continue; 6715bc1d1b4Swangweidong bh_lock_sock(sk); 6729f7d653bSMichio Honda if (sctp_asconf_mgmt(sp, addrw) < 0) 673bb33381dSDaniel Borkmann pr_debug("%s: sctp_asconf_mgmt failed\n", __func__); 6745bc1d1b4Swangweidong bh_unlock_sock(sk); 6759f7d653bSMichio Honda } 67639d84a58SDaniel Halperin #if IS_ENABLED(CONFIG_IPV6) 6779f7d653bSMichio Honda free_next: 67839d84a58SDaniel Halperin #endif 6799f7d653bSMichio Honda list_del(&addrw->list); 6809f7d653bSMichio Honda kfree(addrw); 6819f7d653bSMichio Honda } 6824db67e80SEric W. Biederman spin_unlock_bh(&net->sctp.addr_wq_lock); 6839f7d653bSMichio Honda } 6849f7d653bSMichio Honda 6854db67e80SEric W. Biederman static void sctp_free_addr_wq(struct net *net) 6869f7d653bSMichio Honda { 6879f7d653bSMichio Honda struct sctp_sockaddr_entry *addrw; 6889f7d653bSMichio Honda struct sctp_sockaddr_entry *temp; 6899f7d653bSMichio Honda 6904db67e80SEric W. Biederman spin_lock_bh(&net->sctp.addr_wq_lock); 6914db67e80SEric W. Biederman del_timer(&net->sctp.addr_wq_timer); 6924db67e80SEric W. Biederman list_for_each_entry_safe(addrw, temp, &net->sctp.addr_waitq, list) { 6939f7d653bSMichio Honda list_del(&addrw->list); 6949f7d653bSMichio Honda kfree(addrw); 6959f7d653bSMichio Honda } 6964db67e80SEric W. Biederman spin_unlock_bh(&net->sctp.addr_wq_lock); 6979f7d653bSMichio Honda } 6989f7d653bSMichio Honda 6999f7d653bSMichio Honda /* lookup the entry for the same address in the addr_waitq 7009f7d653bSMichio Honda * sctp_addr_wq MUST be locked 7019f7d653bSMichio Honda */ 7024db67e80SEric W. Biederman static struct sctp_sockaddr_entry *sctp_addr_wq_lookup(struct net *net, 7034db67e80SEric W. Biederman struct sctp_sockaddr_entry *addr) 7049f7d653bSMichio Honda { 7059f7d653bSMichio Honda struct sctp_sockaddr_entry *addrw; 7069f7d653bSMichio Honda 7074db67e80SEric W. Biederman list_for_each_entry(addrw, &net->sctp.addr_waitq, list) { 7089f7d653bSMichio Honda if (addrw->a.sa.sa_family != addr->a.sa.sa_family) 7099f7d653bSMichio Honda continue; 7109f7d653bSMichio Honda if (addrw->a.sa.sa_family == AF_INET) { 7119f7d653bSMichio Honda if (addrw->a.v4.sin_addr.s_addr == 7129f7d653bSMichio Honda addr->a.v4.sin_addr.s_addr) 7139f7d653bSMichio Honda return addrw; 7149f7d653bSMichio Honda } else if (addrw->a.sa.sa_family == AF_INET6) { 7159f7d653bSMichio Honda if (ipv6_addr_equal(&addrw->a.v6.sin6_addr, 7169f7d653bSMichio Honda &addr->a.v6.sin6_addr)) 7179f7d653bSMichio Honda return addrw; 7189f7d653bSMichio Honda } 7199f7d653bSMichio Honda } 7209f7d653bSMichio Honda return NULL; 7219f7d653bSMichio Honda } 7229f7d653bSMichio Honda 7234db67e80SEric W. Biederman void sctp_addr_wq_mgmt(struct net *net, struct sctp_sockaddr_entry *addr, int cmd) 7249f7d653bSMichio Honda { 7259f7d653bSMichio Honda struct sctp_sockaddr_entry *addrw; 7269f7d653bSMichio Honda unsigned long timeo_val; 7279f7d653bSMichio Honda 7289f7d653bSMichio Honda /* first, we check if an opposite message already exist in the queue. 7299f7d653bSMichio Honda * If we found such message, it is removed. 7309f7d653bSMichio Honda * This operation is a bit stupid, but the DHCP client attaches the 7319f7d653bSMichio Honda * new address after a couple of addition and deletion of that address 7329f7d653bSMichio Honda */ 7339f7d653bSMichio Honda 7344db67e80SEric W. Biederman spin_lock_bh(&net->sctp.addr_wq_lock); 7359f7d653bSMichio Honda /* Offsets existing events in addr_wq */ 7364db67e80SEric W. Biederman addrw = sctp_addr_wq_lookup(net, addr); 7379f7d653bSMichio Honda if (addrw) { 7389f7d653bSMichio Honda if (addrw->state != cmd) { 739bb33381dSDaniel Borkmann pr_debug("%s: offsets existing entry for %d, addr:%pISc " 740bb33381dSDaniel Borkmann "in wq:%p\n", __func__, addrw->state, &addrw->a.sa, 7414db67e80SEric W. Biederman &net->sctp.addr_waitq); 742bb33381dSDaniel Borkmann 7439f7d653bSMichio Honda list_del(&addrw->list); 7449f7d653bSMichio Honda kfree(addrw); 7459f7d653bSMichio Honda } 7464db67e80SEric W. Biederman spin_unlock_bh(&net->sctp.addr_wq_lock); 7479f7d653bSMichio Honda return; 7489f7d653bSMichio Honda } 7499f7d653bSMichio Honda 7509f7d653bSMichio Honda /* OK, we have to add the new address to the wait queue */ 7519f7d653bSMichio Honda addrw = kmemdup(addr, sizeof(struct sctp_sockaddr_entry), GFP_ATOMIC); 7529f7d653bSMichio Honda if (addrw == NULL) { 7534db67e80SEric W. Biederman spin_unlock_bh(&net->sctp.addr_wq_lock); 7549f7d653bSMichio Honda return; 7559f7d653bSMichio Honda } 7569f7d653bSMichio Honda addrw->state = cmd; 7574db67e80SEric W. Biederman list_add_tail(&addrw->list, &net->sctp.addr_waitq); 758bb33381dSDaniel Borkmann 759bb33381dSDaniel Borkmann pr_debug("%s: add new entry for cmd:%d, addr:%pISc in wq:%p\n", 760bb33381dSDaniel Borkmann __func__, addrw->state, &addrw->a.sa, &net->sctp.addr_waitq); 7619f7d653bSMichio Honda 7624db67e80SEric W. Biederman if (!timer_pending(&net->sctp.addr_wq_timer)) { 7639f7d653bSMichio Honda timeo_val = jiffies; 7649f7d653bSMichio Honda timeo_val += msecs_to_jiffies(SCTP_ADDRESS_TICK_DELAY); 7654db67e80SEric W. Biederman mod_timer(&net->sctp.addr_wq_timer, timeo_val); 7669f7d653bSMichio Honda } 7674db67e80SEric W. Biederman spin_unlock_bh(&net->sctp.addr_wq_lock); 7689f7d653bSMichio Honda } 7699f7d653bSMichio Honda 77029303547SVlad Yasevich /* Event handler for inet address addition/deletion events. 77129303547SVlad Yasevich * The sctp_local_addr_list needs to be protocted by a spin lock since 77229303547SVlad Yasevich * multiple notifiers (say IPv4 and IPv6) may be running at the same 77329303547SVlad Yasevich * time and thus corrupt the list. 77429303547SVlad Yasevich * The reader side is protected with RCU. 77529303547SVlad Yasevich */ 77624123186SAdrian Bunk static int sctp_inetaddr_event(struct notifier_block *this, unsigned long ev, 7771da177e4SLinus Torvalds void *ptr) 7781da177e4SLinus Torvalds { 77929c7cf96SSridhar Samudrala struct in_ifaddr *ifa = (struct in_ifaddr *)ptr; 78029303547SVlad Yasevich struct sctp_sockaddr_entry *addr = NULL; 78129303547SVlad Yasevich struct sctp_sockaddr_entry *temp; 7824db67e80SEric W. Biederman struct net *net = dev_net(ifa->ifa_dev->dev); 78322626216SChidambar 'ilLogict' Zinnoury int found = 0; 7841da177e4SLinus Torvalds 78529c7cf96SSridhar Samudrala switch (ev) { 78629c7cf96SSridhar Samudrala case NETDEV_UP: 787400b8b9aSXin Long addr = kzalloc(sizeof(*addr), GFP_ATOMIC); 78829c7cf96SSridhar Samudrala if (addr) { 78929c7cf96SSridhar Samudrala addr->a.v4.sin_family = AF_INET; 79029c7cf96SSridhar Samudrala addr->a.v4.sin_addr.s_addr = ifa->ifa_local; 79129303547SVlad Yasevich addr->valid = 1; 7924db67e80SEric W. Biederman spin_lock_bh(&net->sctp.local_addr_lock); 7934db67e80SEric W. Biederman list_add_tail_rcu(&addr->list, &net->sctp.local_addr_list); 7944db67e80SEric W. Biederman sctp_addr_wq_mgmt(net, addr, SCTP_ADDR_NEW); 7954db67e80SEric W. Biederman spin_unlock_bh(&net->sctp.local_addr_lock); 79629c7cf96SSridhar Samudrala } 79729c7cf96SSridhar Samudrala break; 79829c7cf96SSridhar Samudrala case NETDEV_DOWN: 7994db67e80SEric W. Biederman spin_lock_bh(&net->sctp.local_addr_lock); 80029303547SVlad Yasevich list_for_each_entry_safe(addr, temp, 8014db67e80SEric W. Biederman &net->sctp.local_addr_list, list) { 802a40a7d15SPavel Emelyanov if (addr->a.sa.sa_family == AF_INET && 803a40a7d15SPavel Emelyanov addr->a.v4.sin_addr.s_addr == 804a40a7d15SPavel Emelyanov ifa->ifa_local) { 8054db67e80SEric W. Biederman sctp_addr_wq_mgmt(net, addr, SCTP_ADDR_DEL); 80622626216SChidambar 'ilLogict' Zinnoury found = 1; 80729303547SVlad Yasevich addr->valid = 0; 80829303547SVlad Yasevich list_del_rcu(&addr->list); 80929c7cf96SSridhar Samudrala break; 81029c7cf96SSridhar Samudrala } 81129c7cf96SSridhar Samudrala } 8124db67e80SEric W. Biederman spin_unlock_bh(&net->sctp.local_addr_lock); 81322626216SChidambar 'ilLogict' Zinnoury if (found) 8141231f0baSLai Jiangshan kfree_rcu(addr, rcu); 81529c7cf96SSridhar Samudrala break; 81629c7cf96SSridhar Samudrala } 8171da177e4SLinus Torvalds 8181da177e4SLinus Torvalds return NOTIFY_DONE; 8191da177e4SLinus Torvalds } 8201da177e4SLinus Torvalds 8211da177e4SLinus Torvalds /* 8221da177e4SLinus Torvalds * Initialize the control inode/socket with a control endpoint data 8231da177e4SLinus Torvalds * structure. This endpoint is reserved exclusively for the OOTB processing. 8241da177e4SLinus Torvalds */ 8252ce95503SEric W. Biederman static int sctp_ctl_sock_init(struct net *net) 8261da177e4SLinus Torvalds { 8271da177e4SLinus Torvalds int err; 828fb13d9f9SBrian Haley sa_family_t family = PF_INET; 8291da177e4SLinus Torvalds 8301da177e4SLinus Torvalds if (sctp_get_pf_specific(PF_INET6)) 8311da177e4SLinus Torvalds family = PF_INET6; 8321da177e4SLinus Torvalds 8332ce95503SEric W. Biederman err = inet_ctl_sock_create(&net->sctp.ctl_sock, family, 8342ce95503SEric W. Biederman SOCK_SEQPACKET, IPPROTO_SCTP, net); 835fb13d9f9SBrian Haley 836fb13d9f9SBrian Haley /* If IPv6 socket could not be created, try the IPv4 socket */ 837fb13d9f9SBrian Haley if (err < 0 && family == PF_INET6) 8382ce95503SEric W. Biederman err = inet_ctl_sock_create(&net->sctp.ctl_sock, AF_INET, 839fb13d9f9SBrian Haley SOCK_SEQPACKET, IPPROTO_SCTP, 8402ce95503SEric W. Biederman net); 841fb13d9f9SBrian Haley 8421da177e4SLinus Torvalds if (err < 0) { 843145ce502SJoe Perches pr_err("Failed to create the SCTP control socket\n"); 8441da177e4SLinus Torvalds return err; 8451da177e4SLinus Torvalds } 8461da177e4SLinus Torvalds return 0; 8471da177e4SLinus Torvalds } 8481da177e4SLinus Torvalds 849965ae444SXin Long static int sctp_udp_rcv(struct sock *sk, struct sk_buff *skb) 850965ae444SXin Long { 851a1dd2cf2SXin Long SCTP_INPUT_CB(skb)->encap_port = udp_hdr(skb)->source; 852a1dd2cf2SXin Long 853965ae444SXin Long skb_set_transport_header(skb, sizeof(struct udphdr)); 854965ae444SXin Long sctp_rcv(skb); 855965ae444SXin Long return 0; 856965ae444SXin Long } 857965ae444SXin Long 85889ba4917SXin Long static int sctp_udp_err_lookup(struct sock *sk, struct sk_buff *skb) 85989ba4917SXin Long { 86089ba4917SXin Long struct sctp_association *asoc; 86189ba4917SXin Long struct sctp_transport *t; 86289ba4917SXin Long int family; 86389ba4917SXin Long 86489ba4917SXin Long skb->transport_header += sizeof(struct udphdr); 86589ba4917SXin Long family = (ip_hdr(skb)->version == 4) ? AF_INET : AF_INET6; 86689ba4917SXin Long sk = sctp_err_lookup(dev_net(skb->dev), family, skb, sctp_hdr(skb), 86789ba4917SXin Long &asoc, &t); 86889ba4917SXin Long if (!sk) 86989ba4917SXin Long return -ENOENT; 87089ba4917SXin Long 87189ba4917SXin Long sctp_err_finish(sk, t); 87289ba4917SXin Long return 0; 87389ba4917SXin Long } 87489ba4917SXin Long 875965ae444SXin Long int sctp_udp_sock_start(struct net *net) 876965ae444SXin Long { 877965ae444SXin Long struct udp_tunnel_sock_cfg tuncfg = {NULL}; 878965ae444SXin Long struct udp_port_cfg udp_conf = {0}; 879965ae444SXin Long struct socket *sock; 880965ae444SXin Long int err; 881965ae444SXin Long 882965ae444SXin Long udp_conf.family = AF_INET; 883965ae444SXin Long udp_conf.local_ip.s_addr = htonl(INADDR_ANY); 884965ae444SXin Long udp_conf.local_udp_port = htons(net->sctp.udp_port); 885965ae444SXin Long err = udp_sock_create(net, &udp_conf, &sock); 886965ae444SXin Long if (err) { 887965ae444SXin Long pr_err("Failed to create the SCTP UDP tunneling v4 sock\n"); 888965ae444SXin Long return err; 889965ae444SXin Long } 890965ae444SXin Long 891965ae444SXin Long tuncfg.encap_type = 1; 892965ae444SXin Long tuncfg.encap_rcv = sctp_udp_rcv; 89389ba4917SXin Long tuncfg.encap_err_lookup = sctp_udp_err_lookup; 894965ae444SXin Long setup_udp_tunnel_sock(net, sock, &tuncfg); 895965ae444SXin Long net->sctp.udp4_sock = sock->sk; 896965ae444SXin Long 8979d6ba260SXin Long #if IS_ENABLED(CONFIG_IPV6) 8989d6ba260SXin Long memset(&udp_conf, 0, sizeof(udp_conf)); 8999d6ba260SXin Long 9009d6ba260SXin Long udp_conf.family = AF_INET6; 9019d6ba260SXin Long udp_conf.local_ip6 = in6addr_any; 9029d6ba260SXin Long udp_conf.local_udp_port = htons(net->sctp.udp_port); 9039d6ba260SXin Long udp_conf.use_udp6_rx_checksums = true; 9049d6ba260SXin Long udp_conf.ipv6_v6only = true; 9059d6ba260SXin Long err = udp_sock_create(net, &udp_conf, &sock); 9069d6ba260SXin Long if (err) { 9079d6ba260SXin Long pr_err("Failed to create the SCTP UDP tunneling v6 sock\n"); 9089d6ba260SXin Long udp_tunnel_sock_release(net->sctp.udp4_sock->sk_socket); 9099d6ba260SXin Long net->sctp.udp4_sock = NULL; 9109d6ba260SXin Long return err; 9119d6ba260SXin Long } 9129d6ba260SXin Long 9139d6ba260SXin Long tuncfg.encap_type = 1; 9149d6ba260SXin Long tuncfg.encap_rcv = sctp_udp_rcv; 91589ba4917SXin Long tuncfg.encap_err_lookup = sctp_udp_err_lookup; 9169d6ba260SXin Long setup_udp_tunnel_sock(net, sock, &tuncfg); 9179d6ba260SXin Long net->sctp.udp6_sock = sock->sk; 9189d6ba260SXin Long #endif 9199d6ba260SXin Long 920965ae444SXin Long return 0; 921965ae444SXin Long } 922965ae444SXin Long 923965ae444SXin Long void sctp_udp_sock_stop(struct net *net) 924965ae444SXin Long { 925965ae444SXin Long if (net->sctp.udp4_sock) { 926965ae444SXin Long udp_tunnel_sock_release(net->sctp.udp4_sock->sk_socket); 927965ae444SXin Long net->sctp.udp4_sock = NULL; 928965ae444SXin Long } 9299d6ba260SXin Long if (net->sctp.udp6_sock) { 9309d6ba260SXin Long udp_tunnel_sock_release(net->sctp.udp6_sock->sk_socket); 9319d6ba260SXin Long net->sctp.udp6_sock = NULL; 9329d6ba260SXin Long } 933965ae444SXin Long } 934965ae444SXin Long 9351da177e4SLinus Torvalds /* Register address family specific functions. */ 9361da177e4SLinus Torvalds int sctp_register_af(struct sctp_af *af) 9371da177e4SLinus Torvalds { 9381da177e4SLinus Torvalds switch (af->sa_family) { 9391da177e4SLinus Torvalds case AF_INET: 9401da177e4SLinus Torvalds if (sctp_af_v4_specific) 9411da177e4SLinus Torvalds return 0; 9421da177e4SLinus Torvalds sctp_af_v4_specific = af; 9431da177e4SLinus Torvalds break; 9441da177e4SLinus Torvalds case AF_INET6: 9451da177e4SLinus Torvalds if (sctp_af_v6_specific) 9461da177e4SLinus Torvalds return 0; 9471da177e4SLinus Torvalds sctp_af_v6_specific = af; 9481da177e4SLinus Torvalds break; 9491da177e4SLinus Torvalds default: 9501da177e4SLinus Torvalds return 0; 9511da177e4SLinus Torvalds } 9521da177e4SLinus Torvalds 9531da177e4SLinus Torvalds INIT_LIST_HEAD(&af->list); 9541da177e4SLinus Torvalds list_add_tail(&af->list, &sctp_address_families); 9551da177e4SLinus Torvalds return 1; 9561da177e4SLinus Torvalds } 9571da177e4SLinus Torvalds 9581da177e4SLinus Torvalds /* Get the table of functions for manipulating a particular address 9591da177e4SLinus Torvalds * family. 9601da177e4SLinus Torvalds */ 9611da177e4SLinus Torvalds struct sctp_af *sctp_get_af_specific(sa_family_t family) 9621da177e4SLinus Torvalds { 9631da177e4SLinus Torvalds switch (family) { 9641da177e4SLinus Torvalds case AF_INET: 9651da177e4SLinus Torvalds return sctp_af_v4_specific; 9661da177e4SLinus Torvalds case AF_INET6: 9671da177e4SLinus Torvalds return sctp_af_v6_specific; 9681da177e4SLinus Torvalds default: 9691da177e4SLinus Torvalds return NULL; 9701da177e4SLinus Torvalds } 9711da177e4SLinus Torvalds } 9721da177e4SLinus Torvalds 9731da177e4SLinus Torvalds /* Common code to initialize a AF_INET msg_name. */ 9741da177e4SLinus Torvalds static void sctp_inet_msgname(char *msgname, int *addr_len) 9751da177e4SLinus Torvalds { 9761da177e4SLinus Torvalds struct sockaddr_in *sin; 9771da177e4SLinus Torvalds 9781da177e4SLinus Torvalds sin = (struct sockaddr_in *)msgname; 9791da177e4SLinus Torvalds *addr_len = sizeof(struct sockaddr_in); 9801da177e4SLinus Torvalds sin->sin_family = AF_INET; 9811da177e4SLinus Torvalds memset(sin->sin_zero, 0, sizeof(sin->sin_zero)); 9821da177e4SLinus Torvalds } 9831da177e4SLinus Torvalds 9841da177e4SLinus Torvalds /* Copy the primary address of the peer primary address as the msg_name. */ 9851da177e4SLinus Torvalds static void sctp_inet_event_msgname(struct sctp_ulpevent *event, char *msgname, 9861da177e4SLinus Torvalds int *addr_len) 9871da177e4SLinus Torvalds { 9881da177e4SLinus Torvalds struct sockaddr_in *sin, *sinfrom; 9891da177e4SLinus Torvalds 9901da177e4SLinus Torvalds if (msgname) { 9911da177e4SLinus Torvalds struct sctp_association *asoc; 9921da177e4SLinus Torvalds 9931da177e4SLinus Torvalds asoc = event->asoc; 9941da177e4SLinus Torvalds sctp_inet_msgname(msgname, addr_len); 9951da177e4SLinus Torvalds sin = (struct sockaddr_in *)msgname; 9961da177e4SLinus Torvalds sinfrom = &asoc->peer.primary_addr.v4; 9971da177e4SLinus Torvalds sin->sin_port = htons(asoc->peer.port); 9981da177e4SLinus Torvalds sin->sin_addr.s_addr = sinfrom->sin_addr.s_addr; 9991da177e4SLinus Torvalds } 10001da177e4SLinus Torvalds } 10011da177e4SLinus Torvalds 10021da177e4SLinus Torvalds /* Initialize and copy out a msgname from an inbound skb. */ 10031da177e4SLinus Torvalds static void sctp_inet_skb_msgname(struct sk_buff *skb, char *msgname, int *len) 10041da177e4SLinus Torvalds { 10051da177e4SLinus Torvalds if (msgname) { 10062c0fd387SArnaldo Carvalho de Melo struct sctphdr *sh = sctp_hdr(skb); 10072c0fd387SArnaldo Carvalho de Melo struct sockaddr_in *sin = (struct sockaddr_in *)msgname; 10082c0fd387SArnaldo Carvalho de Melo 10091da177e4SLinus Torvalds sctp_inet_msgname(msgname, len); 10101da177e4SLinus Torvalds sin->sin_port = sh->source; 1011eddc9ec5SArnaldo Carvalho de Melo sin->sin_addr.s_addr = ip_hdr(skb)->saddr; 10121da177e4SLinus Torvalds } 10131da177e4SLinus Torvalds } 10141da177e4SLinus Torvalds 10151da177e4SLinus Torvalds /* Do we support this AF? */ 10161da177e4SLinus Torvalds static int sctp_inet_af_supported(sa_family_t family, struct sctp_sock *sp) 10171da177e4SLinus Torvalds { 10181da177e4SLinus Torvalds /* PF_INET only supports AF_INET addresses. */ 1019a02cec21SEric Dumazet return AF_INET == family; 10201da177e4SLinus Torvalds } 10211da177e4SLinus Torvalds 10221da177e4SLinus Torvalds /* Address matching with wildcards allowed. */ 10231da177e4SLinus Torvalds static int sctp_inet_cmp_addr(const union sctp_addr *addr1, 10241da177e4SLinus Torvalds const union sctp_addr *addr2, 10251da177e4SLinus Torvalds struct sctp_sock *opt) 10261da177e4SLinus Torvalds { 10271da177e4SLinus Torvalds /* PF_INET only supports AF_INET addresses. */ 10281da177e4SLinus Torvalds if (addr1->sa.sa_family != addr2->sa.sa_family) 10291da177e4SLinus Torvalds return 0; 1030e6f1cebfSAl Viro if (htonl(INADDR_ANY) == addr1->v4.sin_addr.s_addr || 1031e6f1cebfSAl Viro htonl(INADDR_ANY) == addr2->v4.sin_addr.s_addr) 10321da177e4SLinus Torvalds return 1; 10331da177e4SLinus Torvalds if (addr1->v4.sin_addr.s_addr == addr2->v4.sin_addr.s_addr) 10341da177e4SLinus Torvalds return 1; 10351da177e4SLinus Torvalds 10361da177e4SLinus Torvalds return 0; 10371da177e4SLinus Torvalds } 10381da177e4SLinus Torvalds 10391da177e4SLinus Torvalds /* Verify that provided sockaddr looks bindable. Common verification has 10401da177e4SLinus Torvalds * already been taken care of. 10411da177e4SLinus Torvalds */ 10421da177e4SLinus Torvalds static int sctp_inet_bind_verify(struct sctp_sock *opt, union sctp_addr *addr) 10431da177e4SLinus Torvalds { 10441da177e4SLinus Torvalds return sctp_v4_available(addr, opt); 10451da177e4SLinus Torvalds } 10461da177e4SLinus Torvalds 10471da177e4SLinus Torvalds /* Verify that sockaddr looks sendable. Common verification has already 10481da177e4SLinus Torvalds * been taken care of. 10491da177e4SLinus Torvalds */ 10501da177e4SLinus Torvalds static int sctp_inet_send_verify(struct sctp_sock *opt, union sctp_addr *addr) 10511da177e4SLinus Torvalds { 10521da177e4SLinus Torvalds return 1; 10531da177e4SLinus Torvalds } 10541da177e4SLinus Torvalds 10551da177e4SLinus Torvalds /* Fill in Supported Address Type information for INIT and INIT-ACK 10561da177e4SLinus Torvalds * chunks. Returns number of addresses supported. 10571da177e4SLinus Torvalds */ 10581da177e4SLinus Torvalds static int sctp_inet_supported_addrs(const struct sctp_sock *opt, 10593dbe8656SAl Viro __be16 *types) 10601da177e4SLinus Torvalds { 10611da177e4SLinus Torvalds types[0] = SCTP_PARAM_IPV4_ADDRESS; 10621da177e4SLinus Torvalds return 1; 10631da177e4SLinus Torvalds } 10641da177e4SLinus Torvalds 10651da177e4SLinus Torvalds /* Wrapper routine that calls the ip transmit routine. */ 1066600af7fdSXin Long static inline int sctp_v4_xmit(struct sk_buff *skb, struct sctp_transport *t) 10671da177e4SLinus Torvalds { 1068600af7fdSXin Long struct dst_entry *dst = dst_clone(t->dst); 1069600af7fdSXin Long struct flowi4 *fl4 = &t->fl.u.ip4; 1070600af7fdSXin Long struct sock *sk = skb->sk; 1071600af7fdSXin Long struct inet_sock *inet = inet_sk(sk); 10728a9c58d2SXin Long __u8 dscp = inet->tos; 1073600af7fdSXin Long __be16 df = 0; 1074f880374cSHerbert Xu 1075bb33381dSDaniel Borkmann pr_debug("%s: skb:%p, len:%d, src:%pI4, dst:%pI4\n", __func__, skb, 1076600af7fdSXin Long skb->len, &fl4->saddr, &fl4->daddr); 10778a9c58d2SXin Long 1078600af7fdSXin Long if (t->dscp & SCTP_DSCP_SET_MASK) 1079600af7fdSXin Long dscp = t->dscp & SCTP_DSCP_VAL_MASK; 10801da177e4SLinus Torvalds 1081600af7fdSXin Long inet->pmtudisc = t->param_flags & SPP_PMTUD_ENABLE ? IP_PMTUDISC_DO 1082600af7fdSXin Long : IP_PMTUDISC_DONT; 1083600af7fdSXin Long SCTP_INC_STATS(sock_net(sk), SCTP_MIB_OUTSCTPPACKS); 1084f880374cSHerbert Xu 1085600af7fdSXin Long if (!t->encap_port || !sctp_sk(sk)->udp_port) { 1086600af7fdSXin Long skb_dst_set(skb, dst); 1087600af7fdSXin Long return __ip_queue_xmit(sk, skb, &t->fl, dscp); 1088600af7fdSXin Long } 1089bb33381dSDaniel Borkmann 1090600af7fdSXin Long if (skb_is_gso(skb)) 1091600af7fdSXin Long skb_shinfo(skb)->gso_type |= SKB_GSO_UDP_TUNNEL_CSUM; 1092600af7fdSXin Long 1093600af7fdSXin Long if (ip_dont_fragment(sk, dst) && !skb->ignore_df) 1094600af7fdSXin Long df = htons(IP_DF); 1095600af7fdSXin Long 1096600af7fdSXin Long skb->encapsulation = 1; 1097600af7fdSXin Long skb_reset_inner_mac_header(skb); 1098600af7fdSXin Long skb_reset_inner_transport_header(skb); 1099600af7fdSXin Long skb_set_inner_ipproto(skb, IPPROTO_SCTP); 1100600af7fdSXin Long udp_tunnel_xmit_skb((struct rtable *)dst, sk, skb, fl4->saddr, 1101600af7fdSXin Long fl4->daddr, dscp, ip4_dst_hoplimit(dst), df, 1102600af7fdSXin Long sctp_sk(sk)->udp_port, t->encap_port, false, false); 1103600af7fdSXin Long return 0; 11041da177e4SLinus Torvalds } 11051da177e4SLinus Torvalds 110615efbe76SNeil Horman static struct sctp_af sctp_af_inet; 11071da177e4SLinus Torvalds 11081da177e4SLinus Torvalds static struct sctp_pf sctp_pf_inet = { 11091da177e4SLinus Torvalds .event_msgname = sctp_inet_event_msgname, 11101da177e4SLinus Torvalds .skb_msgname = sctp_inet_skb_msgname, 11111da177e4SLinus Torvalds .af_supported = sctp_inet_af_supported, 11121da177e4SLinus Torvalds .cmp_addr = sctp_inet_cmp_addr, 11131da177e4SLinus Torvalds .bind_verify = sctp_inet_bind_verify, 11141da177e4SLinus Torvalds .send_verify = sctp_inet_send_verify, 11151da177e4SLinus Torvalds .supported_addrs = sctp_inet_supported_addrs, 11161da177e4SLinus Torvalds .create_accept_sk = sctp_v4_create_accept_sk, 1117299ee123SJason Gunthorpe .addr_to_user = sctp_v4_addr_to_user, 1118299ee123SJason Gunthorpe .to_sk_saddr = sctp_v4_to_sk_saddr, 1119299ee123SJason Gunthorpe .to_sk_daddr = sctp_v4_to_sk_daddr, 1120b7e10c25SRichard Haines .copy_ip_options = sctp_v4_copy_ip_options, 112115efbe76SNeil Horman .af = &sctp_af_inet 11221da177e4SLinus Torvalds }; 11231da177e4SLinus Torvalds 11241da177e4SLinus Torvalds /* Notifier for inetaddr addition/deletion events. */ 11251da177e4SLinus Torvalds static struct notifier_block sctp_inetaddr_notifier = { 11261da177e4SLinus Torvalds .notifier_call = sctp_inetaddr_event, 11271da177e4SLinus Torvalds }; 11281da177e4SLinus Torvalds 11291da177e4SLinus Torvalds /* Socket operations. */ 113090ddc4f0SEric Dumazet static const struct proto_ops inet_seqpacket_ops = { 11311da177e4SLinus Torvalds .family = PF_INET, 11321da177e4SLinus Torvalds .owner = THIS_MODULE, 11331da177e4SLinus Torvalds .release = inet_release, /* Needs to be wrapped... */ 11341da177e4SLinus Torvalds .bind = inet_bind, 1135644fbdeaSXin Long .connect = sctp_inet_connect, 11361da177e4SLinus Torvalds .socketpair = sock_no_socketpair, 11371da177e4SLinus Torvalds .accept = inet_accept, 11381da177e4SLinus Torvalds .getname = inet_getname, /* Semantics are different. */ 1139a11e1d43SLinus Torvalds .poll = sctp_poll, 11401da177e4SLinus Torvalds .ioctl = inet_ioctl, 1141c7cbdbf2SArnd Bergmann .gettstamp = sock_gettstamp, 11421da177e4SLinus Torvalds .listen = sctp_inet_listen, 11431da177e4SLinus Torvalds .shutdown = inet_shutdown, /* Looks harmless. */ 1144543d9cfeSArnaldo Carvalho de Melo .setsockopt = sock_common_setsockopt, /* IP_SOL IP_OPTION is a problem */ 11451da177e4SLinus Torvalds .getsockopt = sock_common_getsockopt, 11461da177e4SLinus Torvalds .sendmsg = inet_sendmsg, 1147fd2d180aSXin Long .recvmsg = inet_recvmsg, 11481da177e4SLinus Torvalds .mmap = sock_no_mmap, 11491da177e4SLinus Torvalds .sendpage = sock_no_sendpage, 11501da177e4SLinus Torvalds }; 11511da177e4SLinus Torvalds 11521da177e4SLinus Torvalds /* Registration with AF_INET family. */ 11531da177e4SLinus Torvalds static struct inet_protosw sctp_seqpacket_protosw = { 11541da177e4SLinus Torvalds .type = SOCK_SEQPACKET, 11551da177e4SLinus Torvalds .protocol = IPPROTO_SCTP, 11561da177e4SLinus Torvalds .prot = &sctp_prot, 11571da177e4SLinus Torvalds .ops = &inet_seqpacket_ops, 11581da177e4SLinus Torvalds .flags = SCTP_PROTOSW_FLAG 11591da177e4SLinus Torvalds }; 11601da177e4SLinus Torvalds static struct inet_protosw sctp_stream_protosw = { 11611da177e4SLinus Torvalds .type = SOCK_STREAM, 11621da177e4SLinus Torvalds .protocol = IPPROTO_SCTP, 11631da177e4SLinus Torvalds .prot = &sctp_prot, 11641da177e4SLinus Torvalds .ops = &inet_seqpacket_ops, 11651da177e4SLinus Torvalds .flags = SCTP_PROTOSW_FLAG 11661da177e4SLinus Torvalds }; 11671da177e4SLinus Torvalds 1168a1dd2cf2SXin Long static int sctp4_rcv(struct sk_buff *skb) 1169a1dd2cf2SXin Long { 11700356010dSXin Long SCTP_INPUT_CB(skb)->encap_port = 0; 1171a1dd2cf2SXin Long return sctp_rcv(skb); 1172a1dd2cf2SXin Long } 1173a1dd2cf2SXin Long 11741da177e4SLinus Torvalds /* Register with IP layer. */ 117532613090SAlexey Dobriyan static const struct net_protocol sctp_protocol = { 1176a1dd2cf2SXin Long .handler = sctp4_rcv, 11771da177e4SLinus Torvalds .err_handler = sctp_v4_err, 11781da177e4SLinus Torvalds .no_policy = 1, 1179bb2db45bSEric W. Biederman .netns_ok = 1, 11808ed1dc44SHannes Frederic Sowa .icmp_strict_tag_validation = 1, 11811da177e4SLinus Torvalds }; 11821da177e4SLinus Torvalds 11831da177e4SLinus Torvalds /* IPv4 address related functions. */ 118415efbe76SNeil Horman static struct sctp_af sctp_af_inet = { 1185543d9cfeSArnaldo Carvalho de Melo .sa_family = AF_INET, 11861da177e4SLinus Torvalds .sctp_xmit = sctp_v4_xmit, 11871da177e4SLinus Torvalds .setsockopt = ip_setsockopt, 11881da177e4SLinus Torvalds .getsockopt = ip_getsockopt, 11891da177e4SLinus Torvalds .get_dst = sctp_v4_get_dst, 11901da177e4SLinus Torvalds .get_saddr = sctp_v4_get_saddr, 11911da177e4SLinus Torvalds .copy_addrlist = sctp_v4_copy_addrlist, 11921da177e4SLinus Torvalds .from_skb = sctp_v4_from_skb, 11931da177e4SLinus Torvalds .from_sk = sctp_v4_from_sk, 11941da177e4SLinus Torvalds .from_addr_param = sctp_v4_from_addr_param, 11951da177e4SLinus Torvalds .to_addr_param = sctp_v4_to_addr_param, 11961da177e4SLinus Torvalds .cmp_addr = sctp_v4_cmp_addr, 11971da177e4SLinus Torvalds .addr_valid = sctp_v4_addr_valid, 11981da177e4SLinus Torvalds .inaddr_any = sctp_v4_inaddr_any, 11991da177e4SLinus Torvalds .is_any = sctp_v4_is_any, 12001da177e4SLinus Torvalds .available = sctp_v4_available, 12011da177e4SLinus Torvalds .scope = sctp_v4_scope, 12021da177e4SLinus Torvalds .skb_iif = sctp_v4_skb_iif, 12031da177e4SLinus Torvalds .is_ce = sctp_v4_is_ce, 12041da177e4SLinus Torvalds .seq_dump_addr = sctp_v4_seq_dump_addr, 1205b9031d9dSVlad Yasevich .ecn_capable = sctp_v4_ecn_capable, 12061da177e4SLinus Torvalds .net_header_len = sizeof(struct iphdr), 12071da177e4SLinus Torvalds .sockaddr_len = sizeof(struct sockaddr_in), 1208b7e10c25SRichard Haines .ip_options_len = sctp_v4_ip_options_len, 12091da177e4SLinus Torvalds }; 12101da177e4SLinus Torvalds 12118d72651dSwangweidong struct sctp_pf *sctp_get_pf_specific(sa_family_t family) 12128d72651dSwangweidong { 12131da177e4SLinus Torvalds switch (family) { 12141da177e4SLinus Torvalds case PF_INET: 12151da177e4SLinus Torvalds return sctp_pf_inet_specific; 12161da177e4SLinus Torvalds case PF_INET6: 12171da177e4SLinus Torvalds return sctp_pf_inet6_specific; 12181da177e4SLinus Torvalds default: 12191da177e4SLinus Torvalds return NULL; 12201da177e4SLinus Torvalds } 12211da177e4SLinus Torvalds } 12221da177e4SLinus Torvalds 12231da177e4SLinus Torvalds /* Register the PF specific function table. */ 12241da177e4SLinus Torvalds int sctp_register_pf(struct sctp_pf *pf, sa_family_t family) 12251da177e4SLinus Torvalds { 12261da177e4SLinus Torvalds switch (family) { 12271da177e4SLinus Torvalds case PF_INET: 12281da177e4SLinus Torvalds if (sctp_pf_inet_specific) 12291da177e4SLinus Torvalds return 0; 12301da177e4SLinus Torvalds sctp_pf_inet_specific = pf; 12311da177e4SLinus Torvalds break; 12321da177e4SLinus Torvalds case PF_INET6: 12331da177e4SLinus Torvalds if (sctp_pf_inet6_specific) 12341da177e4SLinus Torvalds return 0; 12351da177e4SLinus Torvalds sctp_pf_inet6_specific = pf; 12361da177e4SLinus Torvalds break; 12371da177e4SLinus Torvalds default: 12381da177e4SLinus Torvalds return 0; 12391da177e4SLinus Torvalds } 12401da177e4SLinus Torvalds return 1; 12411da177e4SLinus Torvalds } 12421da177e4SLinus Torvalds 1243b01a2407SEric W. Biederman static inline int init_sctp_mibs(struct net *net) 12441da177e4SLinus Torvalds { 1245698365faSWANG Cong net->sctp.sctp_statistics = alloc_percpu(struct sctp_mib); 1246698365faSWANG Cong if (!net->sctp.sctp_statistics) 1247698365faSWANG Cong return -ENOMEM; 1248698365faSWANG Cong return 0; 12491da177e4SLinus Torvalds } 12501da177e4SLinus Torvalds 1251b01a2407SEric W. Biederman static inline void cleanup_sctp_mibs(struct net *net) 12521da177e4SLinus Torvalds { 1253698365faSWANG Cong free_percpu(net->sctp.sctp_statistics); 12541da177e4SLinus Torvalds } 12551da177e4SLinus Torvalds 1256270637abSVlad Yasevich static void sctp_v4_pf_init(void) 1257270637abSVlad Yasevich { 1258270637abSVlad Yasevich /* Initialize the SCTP specific PF functions. */ 1259270637abSVlad Yasevich sctp_register_pf(&sctp_pf_inet, PF_INET); 1260270637abSVlad Yasevich sctp_register_af(&sctp_af_inet); 1261270637abSVlad Yasevich } 1262270637abSVlad Yasevich 1263270637abSVlad Yasevich static void sctp_v4_pf_exit(void) 1264270637abSVlad Yasevich { 1265270637abSVlad Yasevich list_del(&sctp_af_inet.list); 1266270637abSVlad Yasevich } 1267270637abSVlad Yasevich 1268270637abSVlad Yasevich static int sctp_v4_protosw_init(void) 1269270637abSVlad Yasevich { 1270270637abSVlad Yasevich int rc; 1271270637abSVlad Yasevich 1272270637abSVlad Yasevich rc = proto_register(&sctp_prot, 1); 1273270637abSVlad Yasevich if (rc) 1274270637abSVlad Yasevich return rc; 1275270637abSVlad Yasevich 1276270637abSVlad Yasevich /* Register SCTP(UDP and TCP style) with socket layer. */ 1277270637abSVlad Yasevich inet_register_protosw(&sctp_seqpacket_protosw); 1278270637abSVlad Yasevich inet_register_protosw(&sctp_stream_protosw); 1279270637abSVlad Yasevich 1280270637abSVlad Yasevich return 0; 1281270637abSVlad Yasevich } 1282270637abSVlad Yasevich 1283270637abSVlad Yasevich static void sctp_v4_protosw_exit(void) 1284270637abSVlad Yasevich { 1285270637abSVlad Yasevich inet_unregister_protosw(&sctp_stream_protosw); 1286270637abSVlad Yasevich inet_unregister_protosw(&sctp_seqpacket_protosw); 1287270637abSVlad Yasevich proto_unregister(&sctp_prot); 1288270637abSVlad Yasevich } 1289270637abSVlad Yasevich 1290270637abSVlad Yasevich static int sctp_v4_add_protocol(void) 1291270637abSVlad Yasevich { 1292270637abSVlad Yasevich /* Register notifier for inet address additions/deletions. */ 1293270637abSVlad Yasevich register_inetaddr_notifier(&sctp_inetaddr_notifier); 1294270637abSVlad Yasevich 1295270637abSVlad Yasevich /* Register SCTP with inet layer. */ 1296270637abSVlad Yasevich if (inet_add_protocol(&sctp_protocol, IPPROTO_SCTP) < 0) 1297270637abSVlad Yasevich return -EAGAIN; 1298270637abSVlad Yasevich 1299270637abSVlad Yasevich return 0; 1300270637abSVlad Yasevich } 1301270637abSVlad Yasevich 1302270637abSVlad Yasevich static void sctp_v4_del_protocol(void) 1303270637abSVlad Yasevich { 1304270637abSVlad Yasevich inet_del_protocol(&sctp_protocol, IPPROTO_SCTP); 1305270637abSVlad Yasevich unregister_inetaddr_notifier(&sctp_inetaddr_notifier); 1306270637abSVlad Yasevich } 1307270637abSVlad Yasevich 13088e2d61e0SMarcelo Ricardo Leitner static int __net_init sctp_defaults_init(struct net *net) 13094db67e80SEric W. Biederman { 13102ce95503SEric W. Biederman int status; 13112ce95503SEric W. Biederman 1312e1fc3b14SEric W. Biederman /* 1313e1fc3b14SEric W. Biederman * 14. Suggested SCTP Protocol Parameter Values 1314e1fc3b14SEric W. Biederman */ 1315e1fc3b14SEric W. Biederman /* The following protocol parameters are RECOMMENDED: */ 1316e1fc3b14SEric W. Biederman /* RTO.Initial - 3 seconds */ 1317e1fc3b14SEric W. Biederman net->sctp.rto_initial = SCTP_RTO_INITIAL; 1318e1fc3b14SEric W. Biederman /* RTO.Min - 1 second */ 1319e1fc3b14SEric W. Biederman net->sctp.rto_min = SCTP_RTO_MIN; 1320e1fc3b14SEric W. Biederman /* RTO.Max - 60 seconds */ 1321e1fc3b14SEric W. Biederman net->sctp.rto_max = SCTP_RTO_MAX; 1322e1fc3b14SEric W. Biederman /* RTO.Alpha - 1/8 */ 1323e1fc3b14SEric W. Biederman net->sctp.rto_alpha = SCTP_RTO_ALPHA; 1324e1fc3b14SEric W. Biederman /* RTO.Beta - 1/4 */ 1325e1fc3b14SEric W. Biederman net->sctp.rto_beta = SCTP_RTO_BETA; 1326e1fc3b14SEric W. Biederman 1327e1fc3b14SEric W. Biederman /* Valid.Cookie.Life - 60 seconds */ 1328e1fc3b14SEric W. Biederman net->sctp.valid_cookie_life = SCTP_DEFAULT_COOKIE_LIFE; 1329e1fc3b14SEric W. Biederman 1330e1fc3b14SEric W. Biederman /* Whether Cookie Preservative is enabled(1) or not(0) */ 1331e1fc3b14SEric W. Biederman net->sctp.cookie_preserve_enable = 1; 1332e1fc3b14SEric W. Biederman 13333c68198eSNeil Horman /* Default sctp sockets to use md5 as their hmac alg */ 13340d0863b0SNeil Horman #if defined (CONFIG_SCTP_DEFAULT_COOKIE_HMAC_MD5) 13353c68198eSNeil Horman net->sctp.sctp_hmac_alg = "md5"; 13360d0863b0SNeil Horman #elif defined (CONFIG_SCTP_DEFAULT_COOKIE_HMAC_SHA1) 13373c68198eSNeil Horman net->sctp.sctp_hmac_alg = "sha1"; 13383c68198eSNeil Horman #else 13393c68198eSNeil Horman net->sctp.sctp_hmac_alg = NULL; 13403c68198eSNeil Horman #endif 13413c68198eSNeil Horman 1342e1fc3b14SEric W. Biederman /* Max.Burst - 4 */ 1343e1fc3b14SEric W. Biederman net->sctp.max_burst = SCTP_DEFAULT_MAX_BURST; 1344e1fc3b14SEric W. Biederman 134534515e94SXin Long /* Disable of Primary Path Switchover by default */ 134634515e94SXin Long net->sctp.ps_retrans = SCTP_PS_RETRANS_MAX; 134734515e94SXin Long 1348566178f8SZhu Yanjun /* Enable pf state by default */ 1349566178f8SZhu Yanjun net->sctp.pf_enable = 1; 1350566178f8SZhu Yanjun 1351aef587beSXin Long /* Ignore pf exposure feature by default */ 1352aef587beSXin Long net->sctp.pf_expose = SCTP_PF_EXPOSE_UNSET; 1353aef587beSXin Long 1354e1fc3b14SEric W. Biederman /* Association.Max.Retrans - 10 attempts 1355e1fc3b14SEric W. Biederman * Path.Max.Retrans - 5 attempts (per destination address) 1356e1fc3b14SEric W. Biederman * Max.Init.Retransmits - 8 attempts 1357e1fc3b14SEric W. Biederman */ 1358e1fc3b14SEric W. Biederman net->sctp.max_retrans_association = 10; 1359e1fc3b14SEric W. Biederman net->sctp.max_retrans_path = 5; 1360e1fc3b14SEric W. Biederman net->sctp.max_retrans_init = 8; 1361e1fc3b14SEric W. Biederman 1362e1fc3b14SEric W. Biederman /* Sendbuffer growth - do per-socket accounting */ 1363e1fc3b14SEric W. Biederman net->sctp.sndbuf_policy = 0; 1364e1fc3b14SEric W. Biederman 1365e1fc3b14SEric W. Biederman /* Rcvbuffer growth - do per-socket accounting */ 1366e1fc3b14SEric W. Biederman net->sctp.rcvbuf_policy = 0; 1367e1fc3b14SEric W. Biederman 1368e1fc3b14SEric W. Biederman /* HB.interval - 30 seconds */ 1369e1fc3b14SEric W. Biederman net->sctp.hb_interval = SCTP_DEFAULT_TIMEOUT_HEARTBEAT; 1370e1fc3b14SEric W. Biederman 1371e1fc3b14SEric W. Biederman /* delayed SACK timeout */ 1372e1fc3b14SEric W. Biederman net->sctp.sack_timeout = SCTP_DEFAULT_TIMEOUT_SACK; 1373e1fc3b14SEric W. Biederman 1374e1fc3b14SEric W. Biederman /* Disable ADDIP by default. */ 1375e1fc3b14SEric W. Biederman net->sctp.addip_enable = 0; 1376e1fc3b14SEric W. Biederman net->sctp.addip_noauth = 0; 1377e1fc3b14SEric W. Biederman net->sctp.default_auto_asconf = 0; 1378e1fc3b14SEric W. Biederman 1379e1fc3b14SEric W. Biederman /* Enable PR-SCTP by default. */ 1380e1fc3b14SEric W. Biederman net->sctp.prsctp_enable = 1; 1381e1fc3b14SEric W. Biederman 1382c28445c3SXin Long /* Disable RECONF by default. */ 1383c28445c3SXin Long net->sctp.reconf_enable = 0; 1384c28445c3SXin Long 1385e1fc3b14SEric W. Biederman /* Disable AUTH by default. */ 1386e1fc3b14SEric W. Biederman net->sctp.auth_enable = 0; 1387e1fc3b14SEric W. Biederman 13881b0b8114SXin Long /* Enable ECN by default. */ 13891b0b8114SXin Long net->sctp.ecn_enable = 1; 13901b0b8114SXin Long 1391965ae444SXin Long /* Set UDP tunneling listening port to 0 by default */ 1392965ae444SXin Long net->sctp.udp_port = 0; 1393965ae444SXin Long 1394e8a3001cSXin Long /* Set remote encap port to 0 by default */ 1395e8a3001cSXin Long net->sctp.encap_port = 0; 1396e8a3001cSXin Long 1397e1fc3b14SEric W. Biederman /* Set SCOPE policy to enabled */ 1398e1fc3b14SEric W. Biederman net->sctp.scope_policy = SCTP_SCOPE_POLICY_ENABLE; 1399e1fc3b14SEric W. Biederman 1400e1fc3b14SEric W. Biederman /* Set the default rwnd update threshold */ 1401e1fc3b14SEric W. Biederman net->sctp.rwnd_upd_shift = SCTP_DEFAULT_RWND_SHIFT; 1402e1fc3b14SEric W. Biederman 1403e1fc3b14SEric W. Biederman /* Initialize maximum autoclose timeout. */ 1404e1fc3b14SEric W. Biederman net->sctp.max_autoclose = INT_MAX / HZ; 1405e1fc3b14SEric W. Biederman 1406ebb7e95dSEric W. Biederman status = sctp_sysctl_net_register(net); 1407ebb7e95dSEric W. Biederman if (status) 1408ebb7e95dSEric W. Biederman goto err_sysctl_register; 1409ebb7e95dSEric W. Biederman 1410b01a2407SEric W. Biederman /* Allocate and initialise sctp mibs. */ 1411b01a2407SEric W. Biederman status = init_sctp_mibs(net); 1412b01a2407SEric W. Biederman if (status) 1413b01a2407SEric W. Biederman goto err_init_mibs; 1414b01a2407SEric W. Biederman 1415d47d08c8SAl Viro #ifdef CONFIG_PROC_FS 141613d782f6SEric W. Biederman /* Initialize proc fs directory. */ 141713d782f6SEric W. Biederman status = sctp_proc_init(net); 141813d782f6SEric W. Biederman if (status) 141913d782f6SEric W. Biederman goto err_init_proc; 1420d47d08c8SAl Viro #endif 142113d782f6SEric W. Biederman 142213d782f6SEric W. Biederman sctp_dbg_objcnt_init(net); 142313d782f6SEric W. Biederman 14244db67e80SEric W. Biederman /* Initialize the local address list. */ 14254db67e80SEric W. Biederman INIT_LIST_HEAD(&net->sctp.local_addr_list); 14264db67e80SEric W. Biederman spin_lock_init(&net->sctp.local_addr_lock); 14274db67e80SEric W. Biederman sctp_get_local_addr_list(net); 14284db67e80SEric W. Biederman 14294db67e80SEric W. Biederman /* Initialize the address event list */ 14304db67e80SEric W. Biederman INIT_LIST_HEAD(&net->sctp.addr_waitq); 14314db67e80SEric W. Biederman INIT_LIST_HEAD(&net->sctp.auto_asconf_splist); 14324db67e80SEric W. Biederman spin_lock_init(&net->sctp.addr_wq_lock); 14334db67e80SEric W. Biederman net->sctp.addr_wq_timer.expires = 0; 14349c3b5751SKees Cook timer_setup(&net->sctp.addr_wq_timer, sctp_addr_wq_timeout_handler, 0); 14354db67e80SEric W. Biederman 14364db67e80SEric W. Biederman return 0; 14372ce95503SEric W. Biederman 14387ae665f1SArnd Bergmann #ifdef CONFIG_PROC_FS 143913d782f6SEric W. Biederman err_init_proc: 1440b01a2407SEric W. Biederman cleanup_sctp_mibs(net); 14417ae665f1SArnd Bergmann #endif 1442b01a2407SEric W. Biederman err_init_mibs: 1443ebb7e95dSEric W. Biederman sctp_sysctl_net_unregister(net); 1444ebb7e95dSEric W. Biederman err_sysctl_register: 14452ce95503SEric W. Biederman return status; 14464db67e80SEric W. Biederman } 14474db67e80SEric W. Biederman 14488e2d61e0SMarcelo Ricardo Leitner static void __net_exit sctp_defaults_exit(struct net *net) 14494db67e80SEric W. Biederman { 14504db67e80SEric W. Biederman /* Free the local address list */ 14514db67e80SEric W. Biederman sctp_free_addr_wq(net); 14524db67e80SEric W. Biederman sctp_free_local_addr_list(net); 14532ce95503SEric W. Biederman 1454d47d08c8SAl Viro #ifdef CONFIG_PROC_FS 1455d47d08c8SAl Viro remove_proc_subtree("sctp", net->proc_net); 1456d47d08c8SAl Viro net->sctp.proc_net_sctp = NULL; 1457d47d08c8SAl Viro #endif 1458b01a2407SEric W. Biederman cleanup_sctp_mibs(net); 1459ebb7e95dSEric W. Biederman sctp_sysctl_net_unregister(net); 14604db67e80SEric W. Biederman } 14614db67e80SEric W. Biederman 14628e2d61e0SMarcelo Ricardo Leitner static struct pernet_operations sctp_defaults_ops = { 14638e2d61e0SMarcelo Ricardo Leitner .init = sctp_defaults_init, 14648e2d61e0SMarcelo Ricardo Leitner .exit = sctp_defaults_exit, 14658e2d61e0SMarcelo Ricardo Leitner }; 14668e2d61e0SMarcelo Ricardo Leitner 14678e2d61e0SMarcelo Ricardo Leitner static int __net_init sctp_ctrlsock_init(struct net *net) 14688e2d61e0SMarcelo Ricardo Leitner { 14698e2d61e0SMarcelo Ricardo Leitner int status; 14708e2d61e0SMarcelo Ricardo Leitner 14718e2d61e0SMarcelo Ricardo Leitner /* Initialize the control inode/socket for handling OOTB packets. */ 14728e2d61e0SMarcelo Ricardo Leitner status = sctp_ctl_sock_init(net); 14738e2d61e0SMarcelo Ricardo Leitner if (status) 14748e2d61e0SMarcelo Ricardo Leitner pr_err("Failed to initialize the SCTP control sock\n"); 14758e2d61e0SMarcelo Ricardo Leitner 14768e2d61e0SMarcelo Ricardo Leitner return status; 14778e2d61e0SMarcelo Ricardo Leitner } 14788e2d61e0SMarcelo Ricardo Leitner 1479b456d724SChristophe JAILLET static void __net_exit sctp_ctrlsock_exit(struct net *net) 14808e2d61e0SMarcelo Ricardo Leitner { 14818e2d61e0SMarcelo Ricardo Leitner /* Free the control endpoint. */ 14828e2d61e0SMarcelo Ricardo Leitner inet_ctl_sock_destroy(net->sctp.ctl_sock); 14838e2d61e0SMarcelo Ricardo Leitner } 14848e2d61e0SMarcelo Ricardo Leitner 14858e2d61e0SMarcelo Ricardo Leitner static struct pernet_operations sctp_ctrlsock_ops = { 14868e2d61e0SMarcelo Ricardo Leitner .init = sctp_ctrlsock_init, 14878e2d61e0SMarcelo Ricardo Leitner .exit = sctp_ctrlsock_exit, 14884db67e80SEric W. Biederman }; 14894db67e80SEric W. Biederman 14901da177e4SLinus Torvalds /* Initialize the universe into something sensible. */ 1491dda91928SDaniel Borkmann static __init int sctp_init(void) 14921da177e4SLinus Torvalds { 1493ca79b0c2SArun KS unsigned long nr_pages = totalram_pages(); 1494623b57beSColin Ian King unsigned long limit; 1495623b57beSColin Ian King unsigned long goal; 1496d9749fb5SNeil Horman int max_entry_order; 1497623b57beSColin Ian King int num_entries; 1498623b57beSColin Ian King int max_share; 1499623b57beSColin Ian King int status; 1500623b57beSColin Ian King int order; 1501623b57beSColin Ian King int i; 15021da177e4SLinus Torvalds 1503b4772ef8SEyal Birger sock_skb_cb_check_size(sizeof(struct sctp_ulpevent)); 15041da177e4SLinus Torvalds 1505827bf122SSridhar Samudrala /* Allocate bind_bucket and chunk caches. */ 15061da177e4SLinus Torvalds status = -ENOBUFS; 15071da177e4SLinus Torvalds sctp_bucket_cachep = kmem_cache_create("sctp_bind_bucket", 15081da177e4SLinus Torvalds sizeof(struct sctp_bind_bucket), 15091da177e4SLinus Torvalds 0, SLAB_HWCACHE_ALIGN, 151020c2df83SPaul Mundt NULL); 15111da177e4SLinus Torvalds if (!sctp_bucket_cachep) 1512827bf122SSridhar Samudrala goto out; 15131da177e4SLinus Torvalds 15141da177e4SLinus Torvalds sctp_chunk_cachep = kmem_cache_create("sctp_chunk", 15151da177e4SLinus Torvalds sizeof(struct sctp_chunk), 15161da177e4SLinus Torvalds 0, SLAB_HWCACHE_ALIGN, 151720c2df83SPaul Mundt NULL); 15181da177e4SLinus Torvalds if (!sctp_chunk_cachep) 15191da177e4SLinus Torvalds goto err_chunk_cachep; 15201da177e4SLinus Torvalds 1521908c7f19STejun Heo status = percpu_counter_init(&sctp_sockets_allocated, 0, GFP_KERNEL); 1522632c928aSEric W. Biederman if (status) 1523632c928aSEric W. Biederman goto err_percpu_counter_init; 1524632c928aSEric W. Biederman 15251da177e4SLinus Torvalds /* Implementation specific variables. */ 15261da177e4SLinus Torvalds 15271da177e4SLinus Torvalds /* Initialize default stream count setup information. */ 15281da177e4SLinus Torvalds sctp_max_instreams = SCTP_DEFAULT_INSTREAMS; 15291da177e4SLinus Torvalds sctp_max_outstreams = SCTP_DEFAULT_OUTSTREAMS; 15301da177e4SLinus Torvalds 15311da177e4SLinus Torvalds /* Initialize handle used for association ids. */ 15321da177e4SLinus Torvalds idr_init(&sctp_assocs_id); 15331da177e4SLinus Torvalds 1534f03d78dbSEric Dumazet limit = nr_free_buffer_pages() / 8; 15354d93df0aSNeil Horman limit = max(limit, 128UL); 15364d93df0aSNeil Horman sysctl_sctp_mem[0] = limit / 4 * 3; 15374d93df0aSNeil Horman sysctl_sctp_mem[1] = limit; 15384d93df0aSNeil Horman sysctl_sctp_mem[2] = sysctl_sctp_mem[0] * 2; 15394d93df0aSNeil Horman 15404d93df0aSNeil Horman /* Set per-socket limits to no more than 1/128 the pressure threshold*/ 15414d93df0aSNeil Horman limit = (sysctl_sctp_mem[1]) << (PAGE_SHIFT - 7); 15424d93df0aSNeil Horman max_share = min(4UL*1024*1024, limit); 15434d93df0aSNeil Horman 1544845525a6SVlad Yasevich sysctl_sctp_rmem[0] = SK_MEM_QUANTUM; /* give each asoc 1 page min */ 154587fb4b7bSEric Dumazet sysctl_sctp_rmem[1] = 1500 * SKB_TRUESIZE(1); 15464d93df0aSNeil Horman sysctl_sctp_rmem[2] = max(sysctl_sctp_rmem[1], max_share); 15474d93df0aSNeil Horman 15483ab224beSHideo Aoki sysctl_sctp_wmem[0] = SK_MEM_QUANTUM; 15494d93df0aSNeil Horman sysctl_sctp_wmem[1] = 16*1024; 15504d93df0aSNeil Horman sysctl_sctp_wmem[2] = max(64*1024, max_share); 15514d93df0aSNeil Horman 15521da177e4SLinus Torvalds /* Size and allocate the association hash table. 15531da177e4SLinus Torvalds * The methodology is similar to that of the tcp hash tables. 1554d9749fb5SNeil Horman * Though not identical. Start by getting a goal size 15551da177e4SLinus Torvalds */ 15563d6357deSArun KS if (nr_pages >= (128 * 1024)) 15573d6357deSArun KS goal = nr_pages >> (22 - PAGE_SHIFT); 15581da177e4SLinus Torvalds else 15593d6357deSArun KS goal = nr_pages >> (24 - PAGE_SHIFT); 15601da177e4SLinus Torvalds 1561d9749fb5SNeil Horman /* Then compute the page order for said goal */ 1562d9749fb5SNeil Horman order = get_order(goal); 1563d9749fb5SNeil Horman 1564d9749fb5SNeil Horman /* Now compute the required page order for the maximum sized table we 1565d9749fb5SNeil Horman * want to create 1566d9749fb5SNeil Horman */ 1567d9749fb5SNeil Horman max_entry_order = get_order(MAX_SCTP_PORT_HASH_ENTRIES * 1568d9749fb5SNeil Horman sizeof(struct sctp_bind_hashbucket)); 1569d9749fb5SNeil Horman 1570d9749fb5SNeil Horman /* Limit the page order by that maximum hash table size */ 1571d9749fb5SNeil Horman order = min(order, max_entry_order); 15721da177e4SLinus Torvalds 15731da177e4SLinus Torvalds /* Allocate and initialize the endpoint hash table. */ 15741da177e4SLinus Torvalds sctp_ep_hashsize = 64; 15753b77d661SZhang Yanfei sctp_ep_hashtable = 15766da2ec56SKees Cook kmalloc_array(64, sizeof(struct sctp_hashbucket), GFP_KERNEL); 15771da177e4SLinus Torvalds if (!sctp_ep_hashtable) { 1578145ce502SJoe Perches pr_err("Failed endpoint_hash alloc\n"); 15791da177e4SLinus Torvalds status = -ENOMEM; 15801da177e4SLinus Torvalds goto err_ehash_alloc; 15811da177e4SLinus Torvalds } 15821da177e4SLinus Torvalds for (i = 0; i < sctp_ep_hashsize; i++) { 15831da177e4SLinus Torvalds rwlock_init(&sctp_ep_hashtable[i].lock); 1584d970dbf8SVlad Yasevich INIT_HLIST_HEAD(&sctp_ep_hashtable[i].chain); 15851da177e4SLinus Torvalds } 15861da177e4SLinus Torvalds 1587d9749fb5SNeil Horman /* Allocate and initialize the SCTP port hash table. 1588d9749fb5SNeil Horman * Note that order is initalized to start at the max sized 1589d9749fb5SNeil Horman * table we want to support. If we can't get that many pages 1590d9749fb5SNeil Horman * reduce the order and try again 1591d9749fb5SNeil Horman */ 15921da177e4SLinus Torvalds do { 15931da177e4SLinus Torvalds sctp_port_hashtable = (struct sctp_bind_hashbucket *) 15946857a02aSEric Dumazet __get_free_pages(GFP_KERNEL | __GFP_NOWARN, order); 15951da177e4SLinus Torvalds } while (!sctp_port_hashtable && --order > 0); 1596d9749fb5SNeil Horman 15971da177e4SLinus Torvalds if (!sctp_port_hashtable) { 1598145ce502SJoe Perches pr_err("Failed bind hash alloc\n"); 15991da177e4SLinus Torvalds status = -ENOMEM; 16001da177e4SLinus Torvalds goto err_bhash_alloc; 16011da177e4SLinus Torvalds } 1602d9749fb5SNeil Horman 1603d9749fb5SNeil Horman /* Now compute the number of entries that will fit in the 1604d9749fb5SNeil Horman * port hash space we allocated 1605d9749fb5SNeil Horman */ 1606d9749fb5SNeil Horman num_entries = (1UL << order) * PAGE_SIZE / 1607d9749fb5SNeil Horman sizeof(struct sctp_bind_hashbucket); 1608d9749fb5SNeil Horman 160993c3216aSRandy Dunlap /* And finish by rounding it down to the nearest power of two. 161093c3216aSRandy Dunlap * This wastes some memory of course, but it's needed because 1611d9749fb5SNeil Horman * the hash function operates based on the assumption that 161293c3216aSRandy Dunlap * the number of entries is a power of two. 1613d9749fb5SNeil Horman */ 1614d9749fb5SNeil Horman sctp_port_hashsize = rounddown_pow_of_two(num_entries); 1615d9749fb5SNeil Horman 16161da177e4SLinus Torvalds for (i = 0; i < sctp_port_hashsize; i++) { 16171da177e4SLinus Torvalds spin_lock_init(&sctp_port_hashtable[i].lock); 1618d970dbf8SVlad Yasevich INIT_HLIST_HEAD(&sctp_port_hashtable[i].chain); 16191da177e4SLinus Torvalds } 16201da177e4SLinus Torvalds 1621a5e27d18SWei Yongjun status = sctp_transport_hashtable_init(); 1622a5e27d18SWei Yongjun if (status) 16234f008781SXin Long goto err_thash_alloc; 16244f008781SXin Long 1625d9749fb5SNeil Horman pr_info("Hash tables configured (bind %d/%d)\n", sctp_port_hashsize, 1626d9749fb5SNeil Horman num_entries); 16271da177e4SLinus Torvalds 16281da177e4SLinus Torvalds sctp_sysctl_register(); 16291da177e4SLinus Torvalds 16301da177e4SLinus Torvalds INIT_LIST_HEAD(&sctp_address_families); 1631270637abSVlad Yasevich sctp_v4_pf_init(); 1632270637abSVlad Yasevich sctp_v6_pf_init(); 16331ba896f6SXin Long sctp_sched_ops_init(); 16341da177e4SLinus Torvalds 16358e2d61e0SMarcelo Ricardo Leitner status = register_pernet_subsys(&sctp_defaults_ops); 16368e2d61e0SMarcelo Ricardo Leitner if (status) 16378e2d61e0SMarcelo Ricardo Leitner goto err_register_defaults; 1638270637abSVlad Yasevich 16398e2d61e0SMarcelo Ricardo Leitner status = sctp_v4_protosw_init(); 1640827bf122SSridhar Samudrala if (status) 1641270637abSVlad Yasevich goto err_protosw_init; 1642827bf122SSridhar Samudrala 1643270637abSVlad Yasevich status = sctp_v6_protosw_init(); 16441da177e4SLinus Torvalds if (status) 1645270637abSVlad Yasevich goto err_v6_protosw_init; 16461da177e4SLinus Torvalds 16478e2d61e0SMarcelo Ricardo Leitner status = register_pernet_subsys(&sctp_ctrlsock_ops); 16484db67e80SEric W. Biederman if (status) 16498e2d61e0SMarcelo Ricardo Leitner goto err_register_ctrlsock; 16504db67e80SEric W. Biederman 1651270637abSVlad Yasevich status = sctp_v4_add_protocol(); 1652270637abSVlad Yasevich if (status) 1653827bf122SSridhar Samudrala goto err_add_protocol; 1654827bf122SSridhar Samudrala 1655827bf122SSridhar Samudrala /* Register SCTP with inet6 layer. */ 1656827bf122SSridhar Samudrala status = sctp_v6_add_protocol(); 1657827bf122SSridhar Samudrala if (status) 1658827bf122SSridhar Samudrala goto err_v6_add_protocol; 1659827bf122SSridhar Samudrala 166090017accSMarcelo Ricardo Leitner if (sctp_offload_init() < 0) 166190017accSMarcelo Ricardo Leitner pr_crit("%s: Cannot add SCTP protocol offload\n", __func__); 166290017accSMarcelo Ricardo Leitner 16631da177e4SLinus Torvalds out: 16641da177e4SLinus Torvalds return status; 1665827bf122SSridhar Samudrala err_v6_add_protocol: 1666270637abSVlad Yasevich sctp_v4_del_protocol(); 1667d1dd5247SVlad Yasevich err_add_protocol: 16688e2d61e0SMarcelo Ricardo Leitner unregister_pernet_subsys(&sctp_ctrlsock_ops); 16698e2d61e0SMarcelo Ricardo Leitner err_register_ctrlsock: 1670270637abSVlad Yasevich sctp_v6_protosw_exit(); 1671270637abSVlad Yasevich err_v6_protosw_init: 1672270637abSVlad Yasevich sctp_v4_protosw_exit(); 1673270637abSVlad Yasevich err_protosw_init: 16748e2d61e0SMarcelo Ricardo Leitner unregister_pernet_subsys(&sctp_defaults_ops); 16758e2d61e0SMarcelo Ricardo Leitner err_register_defaults: 1676270637abSVlad Yasevich sctp_v4_pf_exit(); 1677270637abSVlad Yasevich sctp_v6_pf_exit(); 16781da177e4SLinus Torvalds sctp_sysctl_unregister(); 16791da177e4SLinus Torvalds free_pages((unsigned long)sctp_port_hashtable, 16801da177e4SLinus Torvalds get_order(sctp_port_hashsize * 16811da177e4SLinus Torvalds sizeof(struct sctp_bind_hashbucket))); 16821da177e4SLinus Torvalds err_bhash_alloc: 16834f008781SXin Long sctp_transport_hashtable_destroy(); 16844f008781SXin Long err_thash_alloc: 16851da177e4SLinus Torvalds kfree(sctp_ep_hashtable); 16861da177e4SLinus Torvalds err_ehash_alloc: 1687632c928aSEric W. Biederman percpu_counter_destroy(&sctp_sockets_allocated); 1688632c928aSEric W. Biederman err_percpu_counter_init: 16891da177e4SLinus Torvalds kmem_cache_destroy(sctp_chunk_cachep); 16901da177e4SLinus Torvalds err_chunk_cachep: 16911da177e4SLinus Torvalds kmem_cache_destroy(sctp_bucket_cachep); 16921da177e4SLinus Torvalds goto out; 16931da177e4SLinus Torvalds } 16941da177e4SLinus Torvalds 16951da177e4SLinus Torvalds /* Exit handler for the SCTP protocol. */ 1696dda91928SDaniel Borkmann static __exit void sctp_exit(void) 16971da177e4SLinus Torvalds { 16981da177e4SLinus Torvalds /* BUG. This should probably do something useful like clean 16991da177e4SLinus Torvalds * up all the remaining associations and all that memory. 17001da177e4SLinus Torvalds */ 17011da177e4SLinus Torvalds 1702827bf122SSridhar Samudrala /* Unregister with inet6/inet layers. */ 1703827bf122SSridhar Samudrala sctp_v6_del_protocol(); 1704270637abSVlad Yasevich sctp_v4_del_protocol(); 17051da177e4SLinus Torvalds 17068e2d61e0SMarcelo Ricardo Leitner unregister_pernet_subsys(&sctp_ctrlsock_ops); 17074db67e80SEric W. Biederman 1708270637abSVlad Yasevich /* Free protosw registrations */ 1709270637abSVlad Yasevich sctp_v6_protosw_exit(); 1710270637abSVlad Yasevich sctp_v4_protosw_exit(); 1711270637abSVlad Yasevich 17128e2d61e0SMarcelo Ricardo Leitner unregister_pernet_subsys(&sctp_defaults_ops); 17138e2d61e0SMarcelo Ricardo Leitner 1714827bf122SSridhar Samudrala /* Unregister with socket layer. */ 1715270637abSVlad Yasevich sctp_v6_pf_exit(); 1716270637abSVlad Yasevich sctp_v4_pf_exit(); 1717827bf122SSridhar Samudrala 17181da177e4SLinus Torvalds sctp_sysctl_unregister(); 17191da177e4SLinus Torvalds 17201da177e4SLinus Torvalds free_pages((unsigned long)sctp_port_hashtable, 17211da177e4SLinus Torvalds get_order(sctp_port_hashsize * 17221da177e4SLinus Torvalds sizeof(struct sctp_bind_hashbucket))); 1723b5eff712SXin Long kfree(sctp_ep_hashtable); 17244f008781SXin Long sctp_transport_hashtable_destroy(); 17251da177e4SLinus Torvalds 1726632c928aSEric W. Biederman percpu_counter_destroy(&sctp_sockets_allocated); 17271da177e4SLinus Torvalds 1728eaa184a1SJesper Dangaard Brouer rcu_barrier(); /* Wait for completion of call_rcu()'s */ 1729eaa184a1SJesper Dangaard Brouer 1730827bf122SSridhar Samudrala kmem_cache_destroy(sctp_chunk_cachep); 1731827bf122SSridhar Samudrala kmem_cache_destroy(sctp_bucket_cachep); 17321da177e4SLinus Torvalds } 17331da177e4SLinus Torvalds 17341da177e4SLinus Torvalds module_init(sctp_init); 17351da177e4SLinus Torvalds module_exit(sctp_exit); 17361da177e4SLinus Torvalds 1737bb97d31fSArnaldo Carvalho de Melo /* 1738bb97d31fSArnaldo Carvalho de Melo * __stringify doesn't likes enums, so use IPPROTO_SCTP value (132) directly. 1739bb97d31fSArnaldo Carvalho de Melo */ 1740bb97d31fSArnaldo Carvalho de Melo MODULE_ALIAS("net-pf-" __stringify(PF_INET) "-proto-132"); 1741882a382cSSridhar Samudrala MODULE_ALIAS("net-pf-" __stringify(PF_INET6) "-proto-132"); 174291705c61SDaniel Borkmann MODULE_AUTHOR("Linux Kernel SCTP developers <linux-sctp@vger.kernel.org>"); 17431da177e4SLinus Torvalds MODULE_DESCRIPTION("Support for the SCTP protocol (RFC2960)"); 174471acc0ddSDavid S. Miller module_param_named(no_checksums, sctp_checksum_disable, bool, 0644); 174571acc0ddSDavid S. Miller MODULE_PARM_DESC(no_checksums, "Disable checksums computing and verification"); 17461da177e4SLinus Torvalds MODULE_LICENSE("GPL"); 1747