147505b8bSThomas Gleixner // SPDX-License-Identifier: GPL-2.0-or-later 260c778b2SVlad Yasevich /* SCTP kernel implementation 31da177e4SLinus Torvalds * (C) Copyright IBM Corp. 2001, 2004 41da177e4SLinus Torvalds * Copyright (c) 1999-2000 Cisco, Inc. 51da177e4SLinus Torvalds * Copyright (c) 1999-2001 Motorola, Inc. 61da177e4SLinus Torvalds * Copyright (c) 2001 Intel Corp. 71da177e4SLinus Torvalds * Copyright (c) 2001 Nokia, Inc. 81da177e4SLinus Torvalds * Copyright (c) 2001 La Monte H.P. Yarroll 91da177e4SLinus Torvalds * 1060c778b2SVlad Yasevich * This file is part of the SCTP kernel implementation 111da177e4SLinus Torvalds * 121da177e4SLinus Torvalds * Initialization/cleanup for SCTP protocol support. 131da177e4SLinus Torvalds * 141da177e4SLinus Torvalds * Please send any bug reports or fixes you make to the 151da177e4SLinus Torvalds * email address(es): 1691705c61SDaniel Borkmann * lksctp developers <linux-sctp@vger.kernel.org> 171da177e4SLinus Torvalds * 181da177e4SLinus Torvalds * Written or modified by: 191da177e4SLinus Torvalds * La Monte H.P. Yarroll <piggy@acm.org> 201da177e4SLinus Torvalds * Karl Knutson <karl@athena.chicago.il.us> 211da177e4SLinus Torvalds * Jon Grimm <jgrimm@us.ibm.com> 221da177e4SLinus Torvalds * Sridhar Samudrala <sri@us.ibm.com> 231da177e4SLinus Torvalds * Daisy Chang <daisyc@us.ibm.com> 241da177e4SLinus Torvalds * Ardelle Fan <ardelle.fan@intel.com> 251da177e4SLinus Torvalds */ 261da177e4SLinus Torvalds 27145ce502SJoe Perches #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt 28145ce502SJoe Perches 291da177e4SLinus Torvalds #include <linux/module.h> 301da177e4SLinus Torvalds #include <linux/init.h> 311da177e4SLinus Torvalds #include <linux/netdevice.h> 321da177e4SLinus Torvalds #include <linux/inetdevice.h> 331da177e4SLinus Torvalds #include <linux/seq_file.h> 3457c8a661SMike Rapoport #include <linux/memblock.h> 35845525a6SVlad Yasevich #include <linux/highmem.h> 36845525a6SVlad Yasevich #include <linux/swap.h> 375a0e3ad6STejun Heo #include <linux/slab.h> 38457c4cbcSEric W. Biederman #include <net/net_namespace.h> 391da177e4SLinus Torvalds #include <net/protocol.h> 401da177e4SLinus Torvalds #include <net/ip.h> 411da177e4SLinus Torvalds #include <net/ipv6.h> 4214c85021SArnaldo Carvalho de Melo #include <net/route.h> 431da177e4SLinus Torvalds #include <net/sctp/sctp.h> 441da177e4SLinus Torvalds #include <net/addrconf.h> 451da177e4SLinus Torvalds #include <net/inet_common.h> 461da177e4SLinus Torvalds #include <net/inet_ecn.h> 471da177e4SLinus Torvalds 48d9749fb5SNeil Horman #define MAX_SCTP_PORT_HASH_ENTRIES (64 * 1024) 49d9749fb5SNeil Horman 501da177e4SLinus Torvalds /* Global data structures. */ 514cbf1caeSBrian Haley struct sctp_globals sctp_globals __read_mostly; 521da177e4SLinus Torvalds 531da177e4SLinus Torvalds struct idr sctp_assocs_id; 541da177e4SLinus Torvalds DEFINE_SPINLOCK(sctp_assocs_id_lock); 551da177e4SLinus Torvalds 561da177e4SLinus Torvalds static struct sctp_pf *sctp_pf_inet6_specific; 571da177e4SLinus Torvalds static struct sctp_pf *sctp_pf_inet_specific; 581da177e4SLinus Torvalds static struct sctp_af *sctp_af_v4_specific; 591da177e4SLinus Torvalds static struct sctp_af *sctp_af_v6_specific; 601da177e4SLinus Torvalds 61e18b890bSChristoph Lameter struct kmem_cache *sctp_chunk_cachep __read_mostly; 62e18b890bSChristoph Lameter struct kmem_cache *sctp_bucket_cachep __read_mostly; 631da177e4SLinus Torvalds 648d987e5cSEric Dumazet long sysctl_sctp_mem[3]; 65007e3936SVlad Yasevich int sysctl_sctp_rmem[3]; 66007e3936SVlad Yasevich int sysctl_sctp_wmem[3]; 674d93df0aSNeil Horman 681da177e4SLinus Torvalds /* Private helper to extract ipv4 address and stash them in 691da177e4SLinus Torvalds * the protocol structure. 701da177e4SLinus Torvalds */ 711da177e4SLinus Torvalds static void sctp_v4_copy_addrlist(struct list_head *addrlist, 721da177e4SLinus Torvalds struct net_device *dev) 731da177e4SLinus Torvalds { 741da177e4SLinus Torvalds struct in_device *in_dev; 751da177e4SLinus Torvalds struct in_ifaddr *ifa; 761da177e4SLinus Torvalds struct sctp_sockaddr_entry *addr; 771da177e4SLinus Torvalds 781da177e4SLinus Torvalds rcu_read_lock(); 79e5ed6399SHerbert Xu if ((in_dev = __in_dev_get_rcu(dev)) == NULL) { 801da177e4SLinus Torvalds rcu_read_unlock(); 811da177e4SLinus Torvalds return; 821da177e4SLinus Torvalds } 831da177e4SLinus Torvalds 84cd5a411dSFlorian Westphal in_dev_for_each_ifa_rcu(ifa, in_dev) { 851da177e4SLinus Torvalds /* Add the address to the local list. */ 86939cfa75SDaniel Borkmann addr = kzalloc(sizeof(*addr), GFP_ATOMIC); 871da177e4SLinus Torvalds if (addr) { 882a6fd78aSAl Viro addr->a.v4.sin_family = AF_INET; 892a6fd78aSAl Viro addr->a.v4.sin_addr.s_addr = ifa->ifa_local; 9029303547SVlad Yasevich addr->valid = 1; 9129303547SVlad Yasevich INIT_LIST_HEAD(&addr->list); 921da177e4SLinus Torvalds list_add_tail(&addr->list, addrlist); 931da177e4SLinus Torvalds } 941da177e4SLinus Torvalds } 951da177e4SLinus Torvalds 961da177e4SLinus Torvalds rcu_read_unlock(); 971da177e4SLinus Torvalds } 981da177e4SLinus Torvalds 991da177e4SLinus Torvalds /* Extract our IP addresses from the system and stash them in the 1001da177e4SLinus Torvalds * protocol structure. 1011da177e4SLinus Torvalds */ 1024db67e80SEric W. Biederman static void sctp_get_local_addr_list(struct net *net) 1031da177e4SLinus Torvalds { 1041da177e4SLinus Torvalds struct net_device *dev; 1051da177e4SLinus Torvalds struct list_head *pos; 1061da177e4SLinus Torvalds struct sctp_af *af; 1071da177e4SLinus Torvalds 108c6d14c84SEric Dumazet rcu_read_lock(); 1094db67e80SEric W. Biederman for_each_netdev_rcu(net, dev) { 1102c0740e4SDave Jones list_for_each(pos, &sctp_address_families) { 1111da177e4SLinus Torvalds af = list_entry(pos, struct sctp_af, list); 1124db67e80SEric W. Biederman af->copy_addrlist(&net->sctp.local_addr_list, dev); 1131da177e4SLinus Torvalds } 1141da177e4SLinus Torvalds } 115c6d14c84SEric Dumazet rcu_read_unlock(); 1161da177e4SLinus Torvalds } 1171da177e4SLinus Torvalds 1181da177e4SLinus Torvalds /* Free the existing local addresses. */ 1194db67e80SEric W. Biederman static void sctp_free_local_addr_list(struct net *net) 1201da177e4SLinus Torvalds { 1211da177e4SLinus Torvalds struct sctp_sockaddr_entry *addr; 1221da177e4SLinus Torvalds struct list_head *pos, *temp; 1231da177e4SLinus Torvalds 1244db67e80SEric W. Biederman list_for_each_safe(pos, temp, &net->sctp.local_addr_list) { 1251da177e4SLinus Torvalds addr = list_entry(pos, struct sctp_sockaddr_entry, list); 1261da177e4SLinus Torvalds list_del(pos); 1271da177e4SLinus Torvalds kfree(addr); 1281da177e4SLinus Torvalds } 1291da177e4SLinus Torvalds } 1301da177e4SLinus Torvalds 1311da177e4SLinus Torvalds /* Copy the local addresses which are valid for 'scope' into 'bp'. */ 1324db67e80SEric W. Biederman int sctp_copy_local_addr_list(struct net *net, struct sctp_bind_addr *bp, 1331c662018SXin Long enum sctp_scope scope, gfp_t gfp, int copy_flags) 1341da177e4SLinus Torvalds { 1351da177e4SLinus Torvalds struct sctp_sockaddr_entry *addr; 1362e3ce5bcSXin Long union sctp_addr laddr; 1371da177e4SLinus Torvalds int error = 0; 1381da177e4SLinus Torvalds 13929303547SVlad Yasevich rcu_read_lock(); 1404db67e80SEric W. Biederman list_for_each_entry_rcu(addr, &net->sctp.local_addr_list, list) { 14129303547SVlad Yasevich if (!addr->valid) 14229303547SVlad Yasevich continue; 143165f2cf6SXin Long if (!sctp_in_scope(net, &addr->a, scope)) 144165f2cf6SXin Long continue; 145165f2cf6SXin Long 1461da177e4SLinus Torvalds /* Now that the address is in scope, check to see if 1471da177e4SLinus Torvalds * the address type is really supported by the local 1481da177e4SLinus Torvalds * sock as well as the remote peer. 1491da177e4SLinus Torvalds */ 150165f2cf6SXin Long if (addr->a.sa.sa_family == AF_INET && 151165f2cf6SXin Long !(copy_flags & SCTP_ADDR4_PEERSUPP)) 152165f2cf6SXin Long continue; 153165f2cf6SXin Long if (addr->a.sa.sa_family == AF_INET6 && 154165f2cf6SXin Long (!(copy_flags & SCTP_ADDR6_ALLOWED) || 155165f2cf6SXin Long !(copy_flags & SCTP_ADDR6_PEERSUPP))) 156165f2cf6SXin Long continue; 157165f2cf6SXin Long 1582e3ce5bcSXin Long laddr = addr->a; 1592e3ce5bcSXin Long /* also works for setting ipv6 address port */ 1602e3ce5bcSXin Long laddr.v4.sin_port = htons(bp->port); 1612e3ce5bcSXin Long if (sctp_bind_addr_state(bp, &laddr) != -1) 162b8607805SXin Long continue; 163b8607805SXin Long 164165f2cf6SXin Long error = sctp_add_bind_addr(bp, &addr->a, sizeof(addr->a), 165f57d96b2SVlad Yasevich SCTP_ADDR_SRC, GFP_ATOMIC); 1661da177e4SLinus Torvalds if (error) 167165f2cf6SXin Long break; 1681da177e4SLinus Torvalds } 1691da177e4SLinus Torvalds 17029303547SVlad Yasevich rcu_read_unlock(); 1711da177e4SLinus Torvalds return error; 1721da177e4SLinus Torvalds } 1731da177e4SLinus Torvalds 174b7e10c25SRichard Haines /* Copy over any ip options */ 175b7e10c25SRichard Haines static void sctp_v4_copy_ip_options(struct sock *sk, struct sock *newsk) 176b7e10c25SRichard Haines { 177b7e10c25SRichard Haines struct inet_sock *newinet, *inet = inet_sk(sk); 178b7e10c25SRichard Haines struct ip_options_rcu *inet_opt, *newopt = NULL; 179b7e10c25SRichard Haines 180b7e10c25SRichard Haines newinet = inet_sk(newsk); 181b7e10c25SRichard Haines 182b7e10c25SRichard Haines rcu_read_lock(); 183b7e10c25SRichard Haines inet_opt = rcu_dereference(inet->inet_opt); 184b7e10c25SRichard Haines if (inet_opt) { 185b7e10c25SRichard Haines newopt = sock_kmalloc(newsk, sizeof(*inet_opt) + 186b7e10c25SRichard Haines inet_opt->opt.optlen, GFP_ATOMIC); 187b7e10c25SRichard Haines if (newopt) 188b7e10c25SRichard Haines memcpy(newopt, inet_opt, sizeof(*inet_opt) + 189b7e10c25SRichard Haines inet_opt->opt.optlen); 190b7e10c25SRichard Haines else 191b7e10c25SRichard Haines pr_err("%s: Failed to copy ip options\n", __func__); 192b7e10c25SRichard Haines } 193b7e10c25SRichard Haines RCU_INIT_POINTER(newinet->inet_opt, newopt); 194b7e10c25SRichard Haines rcu_read_unlock(); 195b7e10c25SRichard Haines } 196b7e10c25SRichard Haines 197b7e10c25SRichard Haines /* Account for the IP options */ 198b7e10c25SRichard Haines static int sctp_v4_ip_options_len(struct sock *sk) 199b7e10c25SRichard Haines { 200b7e10c25SRichard Haines struct inet_sock *inet = inet_sk(sk); 201b7e10c25SRichard Haines struct ip_options_rcu *inet_opt; 202b7e10c25SRichard Haines int len = 0; 203b7e10c25SRichard Haines 204b7e10c25SRichard Haines rcu_read_lock(); 205b7e10c25SRichard Haines inet_opt = rcu_dereference(inet->inet_opt); 206b7e10c25SRichard Haines if (inet_opt) 207b7e10c25SRichard Haines len = inet_opt->opt.optlen; 208b7e10c25SRichard Haines 209b7e10c25SRichard Haines rcu_read_unlock(); 210b7e10c25SRichard Haines return len; 211b7e10c25SRichard Haines } 212b7e10c25SRichard Haines 2131da177e4SLinus Torvalds /* Initialize a sctp_addr from in incoming skb. */ 2141da177e4SLinus Torvalds static void sctp_v4_from_skb(union sctp_addr *addr, struct sk_buff *skb, 2151da177e4SLinus Torvalds int is_saddr) 2161da177e4SLinus Torvalds { 2170630c56eSMarcelo Ricardo Leitner /* Always called on head skb, so this is safe */ 2180630c56eSMarcelo Ricardo Leitner struct sctphdr *sh = sctp_hdr(skb); 2190630c56eSMarcelo Ricardo Leitner struct sockaddr_in *sa = &addr->v4; 2201da177e4SLinus Torvalds 2211da177e4SLinus Torvalds addr->v4.sin_family = AF_INET; 2221da177e4SLinus Torvalds 2231da177e4SLinus Torvalds if (is_saddr) { 2240630c56eSMarcelo Ricardo Leitner sa->sin_port = sh->source; 2250630c56eSMarcelo Ricardo Leitner sa->sin_addr.s_addr = ip_hdr(skb)->saddr; 2261da177e4SLinus Torvalds } else { 2270630c56eSMarcelo Ricardo Leitner sa->sin_port = sh->dest; 2280630c56eSMarcelo Ricardo Leitner sa->sin_addr.s_addr = ip_hdr(skb)->daddr; 2291da177e4SLinus Torvalds } 2301da177e4SLinus Torvalds } 2311da177e4SLinus Torvalds 2321da177e4SLinus Torvalds /* Initialize an sctp_addr from a socket. */ 2331da177e4SLinus Torvalds static void sctp_v4_from_sk(union sctp_addr *addr, struct sock *sk) 2341da177e4SLinus Torvalds { 2351da177e4SLinus Torvalds addr->v4.sin_family = AF_INET; 2367dcdbd95SAl Viro addr->v4.sin_port = 0; 237c720c7e8SEric Dumazet addr->v4.sin_addr.s_addr = inet_sk(sk)->inet_rcv_saddr; 2381da177e4SLinus Torvalds } 2391da177e4SLinus Torvalds 2401da177e4SLinus Torvalds /* Initialize sk->sk_rcv_saddr from sctp_addr. */ 2411da177e4SLinus Torvalds static void sctp_v4_to_sk_saddr(union sctp_addr *addr, struct sock *sk) 2421da177e4SLinus Torvalds { 243c720c7e8SEric Dumazet inet_sk(sk)->inet_rcv_saddr = addr->v4.sin_addr.s_addr; 2441da177e4SLinus Torvalds } 2451da177e4SLinus Torvalds 2461da177e4SLinus Torvalds /* Initialize sk->sk_daddr from sctp_addr. */ 2471da177e4SLinus Torvalds static void sctp_v4_to_sk_daddr(union sctp_addr *addr, struct sock *sk) 2481da177e4SLinus Torvalds { 249c720c7e8SEric Dumazet inet_sk(sk)->inet_daddr = addr->v4.sin_addr.s_addr; 2501da177e4SLinus Torvalds } 2511da177e4SLinus Torvalds 2521da177e4SLinus Torvalds /* Initialize a sctp_addr from an address parameter. */ 2531da177e4SLinus Torvalds static void sctp_v4_from_addr_param(union sctp_addr *addr, 2541da177e4SLinus Torvalds union sctp_addr_param *param, 255dd86d136SAl Viro __be16 port, int iif) 2561da177e4SLinus Torvalds { 2571da177e4SLinus Torvalds addr->v4.sin_family = AF_INET; 2581da177e4SLinus Torvalds addr->v4.sin_port = port; 2591da177e4SLinus Torvalds addr->v4.sin_addr.s_addr = param->v4.addr.s_addr; 2601da177e4SLinus Torvalds } 2611da177e4SLinus Torvalds 2621da177e4SLinus Torvalds /* Initialize an address parameter from a sctp_addr and return the length 2631da177e4SLinus Torvalds * of the address parameter. 2641da177e4SLinus Torvalds */ 2651da177e4SLinus Torvalds static int sctp_v4_to_addr_param(const union sctp_addr *addr, 2661da177e4SLinus Torvalds union sctp_addr_param *param) 2671da177e4SLinus Torvalds { 268a38905e6SXin Long int length = sizeof(struct sctp_ipv4addr_param); 2691da177e4SLinus Torvalds 2701da177e4SLinus Torvalds param->v4.param_hdr.type = SCTP_PARAM_IPV4_ADDRESS; 271dbc16db1SAl Viro param->v4.param_hdr.length = htons(length); 2721da177e4SLinus Torvalds param->v4.addr.s_addr = addr->v4.sin_addr.s_addr; 2731da177e4SLinus Torvalds 2741da177e4SLinus Torvalds return length; 2751da177e4SLinus Torvalds } 2761da177e4SLinus Torvalds 2771da177e4SLinus Torvalds /* Initialize a sctp_addr from a dst_entry. */ 27818a353f4SDavid S. Miller static void sctp_v4_dst_saddr(union sctp_addr *saddr, struct flowi4 *fl4, 279854d43a4SAl Viro __be16 port) 2801da177e4SLinus Torvalds { 2811da177e4SLinus Torvalds saddr->v4.sin_family = AF_INET; 2821da177e4SLinus Torvalds saddr->v4.sin_port = port; 28318a353f4SDavid S. Miller saddr->v4.sin_addr.s_addr = fl4->saddr; 2841da177e4SLinus Torvalds } 2851da177e4SLinus Torvalds 2861da177e4SLinus Torvalds /* Compare two addresses exactly. */ 2871da177e4SLinus Torvalds static int sctp_v4_cmp_addr(const union sctp_addr *addr1, 2881da177e4SLinus Torvalds const union sctp_addr *addr2) 2891da177e4SLinus Torvalds { 2901da177e4SLinus Torvalds if (addr1->sa.sa_family != addr2->sa.sa_family) 2911da177e4SLinus Torvalds return 0; 2921da177e4SLinus Torvalds if (addr1->v4.sin_port != addr2->v4.sin_port) 2931da177e4SLinus Torvalds return 0; 2941da177e4SLinus Torvalds if (addr1->v4.sin_addr.s_addr != addr2->v4.sin_addr.s_addr) 2951da177e4SLinus Torvalds return 0; 2961da177e4SLinus Torvalds 2971da177e4SLinus Torvalds return 1; 2981da177e4SLinus Torvalds } 2991da177e4SLinus Torvalds 3001da177e4SLinus Torvalds /* Initialize addr struct to INADDR_ANY. */ 3016fbfa9f9SAl Viro static void sctp_v4_inaddr_any(union sctp_addr *addr, __be16 port) 3021da177e4SLinus Torvalds { 3031da177e4SLinus Torvalds addr->v4.sin_family = AF_INET; 304e6f1cebfSAl Viro addr->v4.sin_addr.s_addr = htonl(INADDR_ANY); 3051da177e4SLinus Torvalds addr->v4.sin_port = port; 3061da177e4SLinus Torvalds } 3071da177e4SLinus Torvalds 3081da177e4SLinus Torvalds /* Is this a wildcard address? */ 3091da177e4SLinus Torvalds static int sctp_v4_is_any(const union sctp_addr *addr) 3101da177e4SLinus Torvalds { 311e6f1cebfSAl Viro return htonl(INADDR_ANY) == addr->v4.sin_addr.s_addr; 3121da177e4SLinus Torvalds } 3131da177e4SLinus Torvalds 3141da177e4SLinus Torvalds /* This function checks if the address is a valid address to be used for 3151da177e4SLinus Torvalds * SCTP binding. 3161da177e4SLinus Torvalds * 3171da177e4SLinus Torvalds * Output: 3181da177e4SLinus Torvalds * Return 0 - If the address is a non-unicast or an illegal address. 3191da177e4SLinus Torvalds * Return 1 - If the address is a unicast. 3201da177e4SLinus Torvalds */ 3215636bef7SVlad Yasevich static int sctp_v4_addr_valid(union sctp_addr *addr, 3225636bef7SVlad Yasevich struct sctp_sock *sp, 3235636bef7SVlad Yasevich const struct sk_buff *skb) 3241da177e4SLinus Torvalds { 3257dab83deSVlad Yasevich /* IPv4 addresses not allowed */ 3267dab83deSVlad Yasevich if (sp && ipv6_only_sock(sctp_opt2sk(sp))) 3277dab83deSVlad Yasevich return 0; 3287dab83deSVlad Yasevich 3291da177e4SLinus Torvalds /* Is this a non-unicast address or a unusable SCTP address? */ 330b5cb2bbcSJoe Perches if (IS_IPV4_UNUSABLE_ADDRESS(addr->v4.sin_addr.s_addr)) 3311da177e4SLinus Torvalds return 0; 3321da177e4SLinus Torvalds 3335636bef7SVlad Yasevich /* Is this a broadcast address? */ 334511c3f92SEric Dumazet if (skb && skb_rtable(skb)->rt_flags & RTCF_BROADCAST) 3355636bef7SVlad Yasevich return 0; 3365636bef7SVlad Yasevich 3371da177e4SLinus Torvalds return 1; 3381da177e4SLinus Torvalds } 3391da177e4SLinus Torvalds 3401da177e4SLinus Torvalds /* Should this be available for binding? */ 3411da177e4SLinus Torvalds static int sctp_v4_available(union sctp_addr *addr, struct sctp_sock *sp) 3421da177e4SLinus Torvalds { 343bb2db45bSEric W. Biederman struct net *net = sock_net(&sp->inet.sk); 344bb2db45bSEric W. Biederman int ret = inet_addr_type(net, addr->v4.sin_addr.s_addr); 3451da177e4SLinus Torvalds 3461da177e4SLinus Torvalds 347e6f1cebfSAl Viro if (addr->v4.sin_addr.s_addr != htonl(INADDR_ANY) && 348cdac4e07SNeil Horman ret != RTN_LOCAL && 349cdac4e07SNeil Horman !sp->inet.freebind && 35049a60158SVincent Bernat !net->ipv4.sysctl_ip_nonlocal_bind) 3511da177e4SLinus Torvalds return 0; 352cdac4e07SNeil Horman 3537dab83deSVlad Yasevich if (ipv6_only_sock(sctp_opt2sk(sp))) 3547dab83deSVlad Yasevich return 0; 3557dab83deSVlad Yasevich 3561da177e4SLinus Torvalds return 1; 3571da177e4SLinus Torvalds } 3581da177e4SLinus Torvalds 3591da177e4SLinus Torvalds /* Checking the loopback, private and other address scopes as defined in 3601da177e4SLinus Torvalds * RFC 1918. The IPv4 scoping is based on the draft for SCTP IPv4 3611da177e4SLinus Torvalds * scoping <draft-stewart-tsvwg-sctp-ipv4-00.txt>. 3621da177e4SLinus Torvalds * 3631da177e4SLinus Torvalds * Level 0 - unusable SCTP addresses 3641da177e4SLinus Torvalds * Level 1 - loopback address 3651da177e4SLinus Torvalds * Level 2 - link-local addresses 3661da177e4SLinus Torvalds * Level 3 - private addresses. 3671da177e4SLinus Torvalds * Level 4 - global addresses 3681da177e4SLinus Torvalds * For INIT and INIT-ACK address list, let L be the level of 3691da177e4SLinus Torvalds * of requested destination address, sender and receiver 3701da177e4SLinus Torvalds * SHOULD include all of its addresses with level greater 3711da177e4SLinus Torvalds * than or equal to L. 37272388433SBhaskar Dutta * 37372388433SBhaskar Dutta * IPv4 scoping can be controlled through sysctl option 37472388433SBhaskar Dutta * net.sctp.addr_scope_policy 3751da177e4SLinus Torvalds */ 3761c662018SXin Long static enum sctp_scope sctp_v4_scope(union sctp_addr *addr) 3771da177e4SLinus Torvalds { 3781c662018SXin Long enum sctp_scope retval; 3791da177e4SLinus Torvalds 3801da177e4SLinus Torvalds /* Check for unusable SCTP addresses. */ 381b5cb2bbcSJoe Perches if (IS_IPV4_UNUSABLE_ADDRESS(addr->v4.sin_addr.s_addr)) { 3821da177e4SLinus Torvalds retval = SCTP_SCOPE_UNUSABLE; 383b5cb2bbcSJoe Perches } else if (ipv4_is_loopback(addr->v4.sin_addr.s_addr)) { 3841da177e4SLinus Torvalds retval = SCTP_SCOPE_LOOPBACK; 385b5cb2bbcSJoe Perches } else if (ipv4_is_linklocal_169(addr->v4.sin_addr.s_addr)) { 3861da177e4SLinus Torvalds retval = SCTP_SCOPE_LINK; 387b5cb2bbcSJoe Perches } else if (ipv4_is_private_10(addr->v4.sin_addr.s_addr) || 388b5cb2bbcSJoe Perches ipv4_is_private_172(addr->v4.sin_addr.s_addr) || 389b5cb2bbcSJoe Perches ipv4_is_private_192(addr->v4.sin_addr.s_addr)) { 3901da177e4SLinus Torvalds retval = SCTP_SCOPE_PRIVATE; 3911da177e4SLinus Torvalds } else { 3921da177e4SLinus Torvalds retval = SCTP_SCOPE_GLOBAL; 3931da177e4SLinus Torvalds } 3941da177e4SLinus Torvalds 3951da177e4SLinus Torvalds return retval; 3961da177e4SLinus Torvalds } 3971da177e4SLinus Torvalds 3981da177e4SLinus Torvalds /* Returns a valid dst cache entry for the given source and destination ip 3991da177e4SLinus Torvalds * addresses. If an association is passed, trys to get a dst entry with a 4001da177e4SLinus Torvalds * source address that matches an address in the bind address list. 4011da177e4SLinus Torvalds */ 402da0420beSVlad Yasevich static void sctp_v4_get_dst(struct sctp_transport *t, union sctp_addr *saddr, 403da0420beSVlad Yasevich struct flowi *fl, struct sock *sk) 4041da177e4SLinus Torvalds { 405da0420beSVlad Yasevich struct sctp_association *asoc = t->asoc; 4061da177e4SLinus Torvalds struct rtable *rt; 4079914ae3cSVlad Yasevich struct flowi4 *fl4 = &fl->u.ip4; 4081da177e4SLinus Torvalds struct sctp_bind_addr *bp; 4091da177e4SLinus Torvalds struct sctp_sockaddr_entry *laddr; 4101da177e4SLinus Torvalds struct dst_entry *dst = NULL; 411da0420beSVlad Yasevich union sctp_addr *daddr = &t->ipaddr; 4121da177e4SLinus Torvalds union sctp_addr dst_saddr; 4138a9c58d2SXin Long __u8 tos = inet_sk(sk)->tos; 4141da177e4SLinus Torvalds 4158a9c58d2SXin Long if (t->dscp & SCTP_DSCP_SET_MASK) 4168a9c58d2SXin Long tos = t->dscp & SCTP_DSCP_VAL_MASK; 4179914ae3cSVlad Yasevich memset(fl4, 0x0, sizeof(struct flowi4)); 4189914ae3cSVlad Yasevich fl4->daddr = daddr->v4.sin_addr.s_addr; 4199914ae3cSVlad Yasevich fl4->fl4_dport = daddr->v4.sin_port; 4209914ae3cSVlad Yasevich fl4->flowi4_proto = IPPROTO_SCTP; 4211da177e4SLinus Torvalds if (asoc) { 4228a9c58d2SXin Long fl4->flowi4_tos = RT_CONN_FLAGS_TOS(asoc->base.sk, tos); 4239914ae3cSVlad Yasevich fl4->flowi4_oif = asoc->base.sk->sk_bound_dev_if; 4249914ae3cSVlad Yasevich fl4->fl4_sport = htons(asoc->base.bind_addr.port); 4251da177e4SLinus Torvalds } 4266429d3dcSWei Yongjun if (saddr) { 4279914ae3cSVlad Yasevich fl4->saddr = saddr->v4.sin_addr.s_addr; 428ecf938feSXin Long if (!fl4->fl4_sport) 4299914ae3cSVlad Yasevich fl4->fl4_sport = saddr->v4.sin_port; 4306429d3dcSWei Yongjun } 4311da177e4SLinus Torvalds 432bb33381dSDaniel Borkmann pr_debug("%s: dst:%pI4, src:%pI4 - ", __func__, &fl4->daddr, 433bb33381dSDaniel Borkmann &fl4->saddr); 4341da177e4SLinus Torvalds 435bb2db45bSEric W. Biederman rt = ip_route_output_key(sock_net(sk), fl4); 436b23dd4feSDavid S. Miller if (!IS_ERR(rt)) 437d8d1f30bSChangli Gao dst = &rt->dst; 4381da177e4SLinus Torvalds 4391da177e4SLinus Torvalds /* If there is no association or if a source address is passed, no 4401da177e4SLinus Torvalds * more validation is required. 4411da177e4SLinus Torvalds */ 4421da177e4SLinus Torvalds if (!asoc || saddr) 4431da177e4SLinus Torvalds goto out; 4441da177e4SLinus Torvalds 4451da177e4SLinus Torvalds bp = &asoc->base.bind_addr; 4461da177e4SLinus Torvalds 4471da177e4SLinus Torvalds if (dst) { 4481da177e4SLinus Torvalds /* Walk through the bind address list and look for a bind 4491da177e4SLinus Torvalds * address that matches the source address of the returned dst. 4501da177e4SLinus Torvalds */ 45118a353f4SDavid S. Miller sctp_v4_dst_saddr(&dst_saddr, fl4, htons(bp->port)); 452559cf710SVlad Yasevich rcu_read_lock(); 453559cf710SVlad Yasevich list_for_each_entry_rcu(laddr, &bp->address_list, list) { 4548a07eb0aSMichio Honda if (!laddr->valid || (laddr->state == SCTP_ADDR_DEL) || 4558a07eb0aSMichio Honda (laddr->state != SCTP_ADDR_SRC && 4568a07eb0aSMichio Honda !asoc->src_out_of_asoc_ok)) 457dc022a98SSridhar Samudrala continue; 458854d43a4SAl Viro if (sctp_v4_cmp_addr(&dst_saddr, &laddr->a)) 4591da177e4SLinus Torvalds goto out_unlock; 4601da177e4SLinus Torvalds } 461559cf710SVlad Yasevich rcu_read_unlock(); 4621da177e4SLinus Torvalds 4631da177e4SLinus Torvalds /* None of the bound addresses match the source address of the 4641da177e4SLinus Torvalds * dst. So release it. 4651da177e4SLinus Torvalds */ 4661da177e4SLinus Torvalds dst_release(dst); 4671da177e4SLinus Torvalds dst = NULL; 4681da177e4SLinus Torvalds } 4691da177e4SLinus Torvalds 4701da177e4SLinus Torvalds /* Walk through the bind address list and try to get a dst that 4711da177e4SLinus Torvalds * matches a bind address as the source address. 4721da177e4SLinus Torvalds */ 473559cf710SVlad Yasevich rcu_read_lock(); 474559cf710SVlad Yasevich list_for_each_entry_rcu(laddr, &bp->address_list, list) { 4750ca50d12SMarcelo Ricardo Leitner struct net_device *odev; 4760ca50d12SMarcelo Ricardo Leitner 477559cf710SVlad Yasevich if (!laddr->valid) 478559cf710SVlad Yasevich continue; 47907868284SMarcelo Ricardo Leitner if (laddr->state != SCTP_ADDR_SRC || 48007868284SMarcelo Ricardo Leitner AF_INET != laddr->a.sa.sa_family) 48107868284SMarcelo Ricardo Leitner continue; 48207868284SMarcelo Ricardo Leitner 4839914ae3cSVlad Yasevich fl4->fl4_sport = laddr->a.v4.sin_port; 48485350871SXufeng Zhang flowi4_update_output(fl4, 48585350871SXufeng Zhang asoc->base.sk->sk_bound_dev_if, 4868a9c58d2SXin Long RT_CONN_FLAGS_TOS(asoc->base.sk, tos), 48785350871SXufeng Zhang daddr->v4.sin_addr.s_addr, 48885350871SXufeng Zhang laddr->a.v4.sin_addr.s_addr); 48985350871SXufeng Zhang 490bb2db45bSEric W. Biederman rt = ip_route_output_key(sock_net(sk), fl4); 49107868284SMarcelo Ricardo Leitner if (IS_ERR(rt)) 49207868284SMarcelo Ricardo Leitner continue; 49307868284SMarcelo Ricardo Leitner 4940ca50d12SMarcelo Ricardo Leitner /* Ensure the src address belongs to the output 4950ca50d12SMarcelo Ricardo Leitner * interface. 4960ca50d12SMarcelo Ricardo Leitner */ 4970ca50d12SMarcelo Ricardo Leitner odev = __ip_dev_find(sock_net(sk), laddr->a.v4.sin_addr.s_addr, 4980ca50d12SMarcelo Ricardo Leitner false); 499d82f0f1fSMarcelo Ricardo Leitner if (!odev || odev->ifindex != fl4->flowi4_oif) { 5004a31a6b1STommi Rantala if (!dst) 5014a31a6b1STommi Rantala dst = &rt->dst; 5024a31a6b1STommi Rantala else 503d82f0f1fSMarcelo Ricardo Leitner dst_release(&rt->dst); 5040ca50d12SMarcelo Ricardo Leitner continue; 505d82f0f1fSMarcelo Ricardo Leitner } 5060ca50d12SMarcelo Ricardo Leitner 507410f0383SMarcelo Ricardo Leitner dst_release(dst); 508d8d1f30bSChangli Gao dst = &rt->dst; 50907868284SMarcelo Ricardo Leitner break; 5101da177e4SLinus Torvalds } 5111da177e4SLinus Torvalds 5121da177e4SLinus Torvalds out_unlock: 513559cf710SVlad Yasevich rcu_read_unlock(); 5141da177e4SLinus Torvalds out: 515da0420beSVlad Yasevich t->dst = dst; 5161da177e4SLinus Torvalds if (dst) 517bb33381dSDaniel Borkmann pr_debug("rt_dst:%pI4, rt_src:%pI4\n", 51818a353f4SDavid S. Miller &fl4->daddr, &fl4->saddr); 5191da177e4SLinus Torvalds else 520bb33381dSDaniel Borkmann pr_debug("no route\n"); 5211da177e4SLinus Torvalds } 5221da177e4SLinus Torvalds 5231da177e4SLinus Torvalds /* For v4, the source address is cached in the route entry(dst). So no need 5241da177e4SLinus Torvalds * to cache it separately and hence this is an empty routine. 5251da177e4SLinus Torvalds */ 526e5117101SYOSHIFUJI Hideaki static void sctp_v4_get_saddr(struct sctp_sock *sk, 5279914ae3cSVlad Yasevich struct sctp_transport *t, 5289914ae3cSVlad Yasevich struct flowi *fl) 5291da177e4SLinus Torvalds { 5309914ae3cSVlad Yasevich union sctp_addr *saddr = &t->saddr; 5319914ae3cSVlad Yasevich struct rtable *rt = (struct rtable *)t->dst; 53223ec47a0SVladislav Yasevich 5331da177e4SLinus Torvalds if (rt) { 5341da177e4SLinus Torvalds saddr->v4.sin_family = AF_INET; 535902ebd3eSDavid S. Miller saddr->v4.sin_addr.s_addr = fl->u.ip4.saddr; 5361da177e4SLinus Torvalds } 5371da177e4SLinus Torvalds } 5381da177e4SLinus Torvalds 5391da177e4SLinus Torvalds /* What interface did this skb arrive on? */ 5401da177e4SLinus Torvalds static int sctp_v4_skb_iif(const struct sk_buff *skb) 5411da177e4SLinus Torvalds { 54292101b3bSDavid S. Miller return inet_iif(skb); 5431da177e4SLinus Torvalds } 5441da177e4SLinus Torvalds 5451da177e4SLinus Torvalds /* Was this packet marked by Explicit Congestion Notification? */ 5461da177e4SLinus Torvalds static int sctp_v4_is_ce(const struct sk_buff *skb) 5471da177e4SLinus Torvalds { 548eddc9ec5SArnaldo Carvalho de Melo return INET_ECN_is_ce(ip_hdr(skb)->tos); 5491da177e4SLinus Torvalds } 5501da177e4SLinus Torvalds 5511da177e4SLinus Torvalds /* Create and initialize a new sk for the socket returned by accept(). */ 5521da177e4SLinus Torvalds static struct sock *sctp_v4_create_accept_sk(struct sock *sk, 553cdfbabfbSDavid Howells struct sctp_association *asoc, 554cdfbabfbSDavid Howells bool kern) 5551da177e4SLinus Torvalds { 5563b1e0a65SYOSHIFUJI Hideaki struct sock *newsk = sk_alloc(sock_net(sk), PF_INET, GFP_KERNEL, 557cdfbabfbSDavid Howells sk->sk_prot, kern); 558914e1c8bSVlad Yasevich struct inet_sock *newinet; 5591da177e4SLinus Torvalds 5601da177e4SLinus Torvalds if (!newsk) 5611da177e4SLinus Torvalds goto out; 5621da177e4SLinus Torvalds 5631da177e4SLinus Torvalds sock_init_data(NULL, newsk); 5641da177e4SLinus Torvalds 565914e1c8bSVlad Yasevich sctp_copy_sock(newsk, sk, asoc); 5661da177e4SLinus Torvalds sock_reset_flag(newsk, SOCK_ZAPPED); 5671da177e4SLinus Torvalds 568b7e10c25SRichard Haines sctp_v4_copy_ip_options(sk, newsk); 569b7e10c25SRichard Haines 5701da177e4SLinus Torvalds newinet = inet_sk(newsk); 5711da177e4SLinus Torvalds 572c720c7e8SEric Dumazet newinet->inet_daddr = asoc->peer.primary_addr.v4.sin_addr.s_addr; 5731da177e4SLinus Torvalds 574e6848976SArnaldo Carvalho de Melo sk_refcnt_debug_inc(newsk); 5751da177e4SLinus Torvalds 5761da177e4SLinus Torvalds if (newsk->sk_prot->init(newsk)) { 5771da177e4SLinus Torvalds sk_common_release(newsk); 5781da177e4SLinus Torvalds newsk = NULL; 5791da177e4SLinus Torvalds } 5801da177e4SLinus Torvalds 5811da177e4SLinus Torvalds out: 5821da177e4SLinus Torvalds return newsk; 5831da177e4SLinus Torvalds } 5841da177e4SLinus Torvalds 585299ee123SJason Gunthorpe static int sctp_v4_addr_to_user(struct sctp_sock *sp, union sctp_addr *addr) 5861da177e4SLinus Torvalds { 587299ee123SJason Gunthorpe /* No address mapping for V4 sockets */ 58809279e61SXin Long memset(addr->v4.sin_zero, 0, sizeof(addr->v4.sin_zero)); 589299ee123SJason Gunthorpe return sizeof(struct sockaddr_in); 5901da177e4SLinus Torvalds } 5911da177e4SLinus Torvalds 5921da177e4SLinus Torvalds /* Dump the v4 addr to the seq file. */ 5931da177e4SLinus Torvalds static void sctp_v4_seq_dump_addr(struct seq_file *seq, union sctp_addr *addr) 5941da177e4SLinus Torvalds { 59521454aaaSHarvey Harrison seq_printf(seq, "%pI4 ", &addr->v4.sin_addr); 5961da177e4SLinus Torvalds } 5971da177e4SLinus Torvalds 598b9031d9dSVlad Yasevich static void sctp_v4_ecn_capable(struct sock *sk) 599b9031d9dSVlad Yasevich { 600b9031d9dSVlad Yasevich INET_ECN_xmit(sk); 601b9031d9dSVlad Yasevich } 602b9031d9dSVlad Yasevich 6039c3b5751SKees Cook static void sctp_addr_wq_timeout_handler(struct timer_list *t) 6049f7d653bSMichio Honda { 6059c3b5751SKees Cook struct net *net = from_timer(net, t, sctp.addr_wq_timer); 6069f7d653bSMichio Honda struct sctp_sockaddr_entry *addrw, *temp; 6079f7d653bSMichio Honda struct sctp_sock *sp; 6089f7d653bSMichio Honda 6094db67e80SEric W. Biederman spin_lock_bh(&net->sctp.addr_wq_lock); 6109f7d653bSMichio Honda 6114db67e80SEric W. Biederman list_for_each_entry_safe(addrw, temp, &net->sctp.addr_waitq, list) { 612bb33381dSDaniel Borkmann pr_debug("%s: the first ent in wq:%p is addr:%pISc for cmd:%d at " 613bb33381dSDaniel Borkmann "entry:%p\n", __func__, &net->sctp.addr_waitq, &addrw->a.sa, 614bb33381dSDaniel Borkmann addrw->state, addrw); 6159f7d653bSMichio Honda 616dfd56b8bSEric Dumazet #if IS_ENABLED(CONFIG_IPV6) 6179f7d653bSMichio Honda /* Now we send an ASCONF for each association */ 6189f7d653bSMichio Honda /* Note. we currently don't handle link local IPv6 addressees */ 6199f7d653bSMichio Honda if (addrw->a.sa.sa_family == AF_INET6) { 6209f7d653bSMichio Honda struct in6_addr *in6; 6219f7d653bSMichio Honda 6229f7d653bSMichio Honda if (ipv6_addr_type(&addrw->a.v6.sin6_addr) & 6239f7d653bSMichio Honda IPV6_ADDR_LINKLOCAL) 6249f7d653bSMichio Honda goto free_next; 6259f7d653bSMichio Honda 6269f7d653bSMichio Honda in6 = (struct in6_addr *)&addrw->a.v6.sin6_addr; 6274db67e80SEric W. Biederman if (ipv6_chk_addr(net, in6, NULL, 0) == 0 && 6289f7d653bSMichio Honda addrw->state == SCTP_ADDR_NEW) { 6299f7d653bSMichio Honda unsigned long timeo_val; 6309f7d653bSMichio Honda 631bb33381dSDaniel Borkmann pr_debug("%s: this is on DAD, trying %d sec " 632bb33381dSDaniel Borkmann "later\n", __func__, 6339f7d653bSMichio Honda SCTP_ADDRESS_TICK_DELAY); 634bb33381dSDaniel Borkmann 6359f7d653bSMichio Honda timeo_val = jiffies; 6369f7d653bSMichio Honda timeo_val += msecs_to_jiffies(SCTP_ADDRESS_TICK_DELAY); 6374db67e80SEric W. Biederman mod_timer(&net->sctp.addr_wq_timer, timeo_val); 6389f7d653bSMichio Honda break; 6399f7d653bSMichio Honda } 6409f7d653bSMichio Honda } 6415d0c90cfSDavid S. Miller #endif 6424db67e80SEric W. Biederman list_for_each_entry(sp, &net->sctp.auto_asconf_splist, auto_asconf_list) { 6439f7d653bSMichio Honda struct sock *sk; 6449f7d653bSMichio Honda 6459f7d653bSMichio Honda sk = sctp_opt2sk(sp); 6469f7d653bSMichio Honda /* ignore bound-specific endpoints */ 6479f7d653bSMichio Honda if (!sctp_is_ep_boundall(sk)) 6489f7d653bSMichio Honda continue; 6495bc1d1b4Swangweidong bh_lock_sock(sk); 6509f7d653bSMichio Honda if (sctp_asconf_mgmt(sp, addrw) < 0) 651bb33381dSDaniel Borkmann pr_debug("%s: sctp_asconf_mgmt failed\n", __func__); 6525bc1d1b4Swangweidong bh_unlock_sock(sk); 6539f7d653bSMichio Honda } 65439d84a58SDaniel Halperin #if IS_ENABLED(CONFIG_IPV6) 6559f7d653bSMichio Honda free_next: 65639d84a58SDaniel Halperin #endif 6579f7d653bSMichio Honda list_del(&addrw->list); 6589f7d653bSMichio Honda kfree(addrw); 6599f7d653bSMichio Honda } 6604db67e80SEric W. Biederman spin_unlock_bh(&net->sctp.addr_wq_lock); 6619f7d653bSMichio Honda } 6629f7d653bSMichio Honda 6634db67e80SEric W. Biederman static void sctp_free_addr_wq(struct net *net) 6649f7d653bSMichio Honda { 6659f7d653bSMichio Honda struct sctp_sockaddr_entry *addrw; 6669f7d653bSMichio Honda struct sctp_sockaddr_entry *temp; 6679f7d653bSMichio Honda 6684db67e80SEric W. Biederman spin_lock_bh(&net->sctp.addr_wq_lock); 6694db67e80SEric W. Biederman del_timer(&net->sctp.addr_wq_timer); 6704db67e80SEric W. Biederman list_for_each_entry_safe(addrw, temp, &net->sctp.addr_waitq, list) { 6719f7d653bSMichio Honda list_del(&addrw->list); 6729f7d653bSMichio Honda kfree(addrw); 6739f7d653bSMichio Honda } 6744db67e80SEric W. Biederman spin_unlock_bh(&net->sctp.addr_wq_lock); 6759f7d653bSMichio Honda } 6769f7d653bSMichio Honda 6779f7d653bSMichio Honda /* lookup the entry for the same address in the addr_waitq 6789f7d653bSMichio Honda * sctp_addr_wq MUST be locked 6799f7d653bSMichio Honda */ 6804db67e80SEric W. Biederman static struct sctp_sockaddr_entry *sctp_addr_wq_lookup(struct net *net, 6814db67e80SEric W. Biederman struct sctp_sockaddr_entry *addr) 6829f7d653bSMichio Honda { 6839f7d653bSMichio Honda struct sctp_sockaddr_entry *addrw; 6849f7d653bSMichio Honda 6854db67e80SEric W. Biederman list_for_each_entry(addrw, &net->sctp.addr_waitq, list) { 6869f7d653bSMichio Honda if (addrw->a.sa.sa_family != addr->a.sa.sa_family) 6879f7d653bSMichio Honda continue; 6889f7d653bSMichio Honda if (addrw->a.sa.sa_family == AF_INET) { 6899f7d653bSMichio Honda if (addrw->a.v4.sin_addr.s_addr == 6909f7d653bSMichio Honda addr->a.v4.sin_addr.s_addr) 6919f7d653bSMichio Honda return addrw; 6929f7d653bSMichio Honda } else if (addrw->a.sa.sa_family == AF_INET6) { 6939f7d653bSMichio Honda if (ipv6_addr_equal(&addrw->a.v6.sin6_addr, 6949f7d653bSMichio Honda &addr->a.v6.sin6_addr)) 6959f7d653bSMichio Honda return addrw; 6969f7d653bSMichio Honda } 6979f7d653bSMichio Honda } 6989f7d653bSMichio Honda return NULL; 6999f7d653bSMichio Honda } 7009f7d653bSMichio Honda 7014db67e80SEric W. Biederman void sctp_addr_wq_mgmt(struct net *net, struct sctp_sockaddr_entry *addr, int cmd) 7029f7d653bSMichio Honda { 7039f7d653bSMichio Honda struct sctp_sockaddr_entry *addrw; 7049f7d653bSMichio Honda unsigned long timeo_val; 7059f7d653bSMichio Honda 7069f7d653bSMichio Honda /* first, we check if an opposite message already exist in the queue. 7079f7d653bSMichio Honda * If we found such message, it is removed. 7089f7d653bSMichio Honda * This operation is a bit stupid, but the DHCP client attaches the 7099f7d653bSMichio Honda * new address after a couple of addition and deletion of that address 7109f7d653bSMichio Honda */ 7119f7d653bSMichio Honda 7124db67e80SEric W. Biederman spin_lock_bh(&net->sctp.addr_wq_lock); 7139f7d653bSMichio Honda /* Offsets existing events in addr_wq */ 7144db67e80SEric W. Biederman addrw = sctp_addr_wq_lookup(net, addr); 7159f7d653bSMichio Honda if (addrw) { 7169f7d653bSMichio Honda if (addrw->state != cmd) { 717bb33381dSDaniel Borkmann pr_debug("%s: offsets existing entry for %d, addr:%pISc " 718bb33381dSDaniel Borkmann "in wq:%p\n", __func__, addrw->state, &addrw->a.sa, 7194db67e80SEric W. Biederman &net->sctp.addr_waitq); 720bb33381dSDaniel Borkmann 7219f7d653bSMichio Honda list_del(&addrw->list); 7229f7d653bSMichio Honda kfree(addrw); 7239f7d653bSMichio Honda } 7244db67e80SEric W. Biederman spin_unlock_bh(&net->sctp.addr_wq_lock); 7259f7d653bSMichio Honda return; 7269f7d653bSMichio Honda } 7279f7d653bSMichio Honda 7289f7d653bSMichio Honda /* OK, we have to add the new address to the wait queue */ 7299f7d653bSMichio Honda addrw = kmemdup(addr, sizeof(struct sctp_sockaddr_entry), GFP_ATOMIC); 7309f7d653bSMichio Honda if (addrw == NULL) { 7314db67e80SEric W. Biederman spin_unlock_bh(&net->sctp.addr_wq_lock); 7329f7d653bSMichio Honda return; 7339f7d653bSMichio Honda } 7349f7d653bSMichio Honda addrw->state = cmd; 7354db67e80SEric W. Biederman list_add_tail(&addrw->list, &net->sctp.addr_waitq); 736bb33381dSDaniel Borkmann 737bb33381dSDaniel Borkmann pr_debug("%s: add new entry for cmd:%d, addr:%pISc in wq:%p\n", 738bb33381dSDaniel Borkmann __func__, addrw->state, &addrw->a.sa, &net->sctp.addr_waitq); 7399f7d653bSMichio Honda 7404db67e80SEric W. Biederman if (!timer_pending(&net->sctp.addr_wq_timer)) { 7419f7d653bSMichio Honda timeo_val = jiffies; 7429f7d653bSMichio Honda timeo_val += msecs_to_jiffies(SCTP_ADDRESS_TICK_DELAY); 7434db67e80SEric W. Biederman mod_timer(&net->sctp.addr_wq_timer, timeo_val); 7449f7d653bSMichio Honda } 7454db67e80SEric W. Biederman spin_unlock_bh(&net->sctp.addr_wq_lock); 7469f7d653bSMichio Honda } 7479f7d653bSMichio Honda 74829303547SVlad Yasevich /* Event handler for inet address addition/deletion events. 74929303547SVlad Yasevich * The sctp_local_addr_list needs to be protocted by a spin lock since 75029303547SVlad Yasevich * multiple notifiers (say IPv4 and IPv6) may be running at the same 75129303547SVlad Yasevich * time and thus corrupt the list. 75229303547SVlad Yasevich * The reader side is protected with RCU. 75329303547SVlad Yasevich */ 75424123186SAdrian Bunk static int sctp_inetaddr_event(struct notifier_block *this, unsigned long ev, 7551da177e4SLinus Torvalds void *ptr) 7561da177e4SLinus Torvalds { 75729c7cf96SSridhar Samudrala struct in_ifaddr *ifa = (struct in_ifaddr *)ptr; 75829303547SVlad Yasevich struct sctp_sockaddr_entry *addr = NULL; 75929303547SVlad Yasevich struct sctp_sockaddr_entry *temp; 7604db67e80SEric W. Biederman struct net *net = dev_net(ifa->ifa_dev->dev); 76122626216SChidambar 'ilLogict' Zinnoury int found = 0; 7621da177e4SLinus Torvalds 76329c7cf96SSridhar Samudrala switch (ev) { 76429c7cf96SSridhar Samudrala case NETDEV_UP: 765400b8b9aSXin Long addr = kzalloc(sizeof(*addr), GFP_ATOMIC); 76629c7cf96SSridhar Samudrala if (addr) { 76729c7cf96SSridhar Samudrala addr->a.v4.sin_family = AF_INET; 76829c7cf96SSridhar Samudrala addr->a.v4.sin_addr.s_addr = ifa->ifa_local; 76929303547SVlad Yasevich addr->valid = 1; 7704db67e80SEric W. Biederman spin_lock_bh(&net->sctp.local_addr_lock); 7714db67e80SEric W. Biederman list_add_tail_rcu(&addr->list, &net->sctp.local_addr_list); 7724db67e80SEric W. Biederman sctp_addr_wq_mgmt(net, addr, SCTP_ADDR_NEW); 7734db67e80SEric W. Biederman spin_unlock_bh(&net->sctp.local_addr_lock); 77429c7cf96SSridhar Samudrala } 77529c7cf96SSridhar Samudrala break; 77629c7cf96SSridhar Samudrala case NETDEV_DOWN: 7774db67e80SEric W. Biederman spin_lock_bh(&net->sctp.local_addr_lock); 77829303547SVlad Yasevich list_for_each_entry_safe(addr, temp, 7794db67e80SEric W. Biederman &net->sctp.local_addr_list, list) { 780a40a7d15SPavel Emelyanov if (addr->a.sa.sa_family == AF_INET && 781a40a7d15SPavel Emelyanov addr->a.v4.sin_addr.s_addr == 782a40a7d15SPavel Emelyanov ifa->ifa_local) { 7834db67e80SEric W. Biederman sctp_addr_wq_mgmt(net, addr, SCTP_ADDR_DEL); 78422626216SChidambar 'ilLogict' Zinnoury found = 1; 78529303547SVlad Yasevich addr->valid = 0; 78629303547SVlad Yasevich list_del_rcu(&addr->list); 78729c7cf96SSridhar Samudrala break; 78829c7cf96SSridhar Samudrala } 78929c7cf96SSridhar Samudrala } 7904db67e80SEric W. Biederman spin_unlock_bh(&net->sctp.local_addr_lock); 79122626216SChidambar 'ilLogict' Zinnoury if (found) 7921231f0baSLai Jiangshan kfree_rcu(addr, rcu); 79329c7cf96SSridhar Samudrala break; 79429c7cf96SSridhar Samudrala } 7951da177e4SLinus Torvalds 7961da177e4SLinus Torvalds return NOTIFY_DONE; 7971da177e4SLinus Torvalds } 7981da177e4SLinus Torvalds 7991da177e4SLinus Torvalds /* 8001da177e4SLinus Torvalds * Initialize the control inode/socket with a control endpoint data 8011da177e4SLinus Torvalds * structure. This endpoint is reserved exclusively for the OOTB processing. 8021da177e4SLinus Torvalds */ 8032ce95503SEric W. Biederman static int sctp_ctl_sock_init(struct net *net) 8041da177e4SLinus Torvalds { 8051da177e4SLinus Torvalds int err; 806fb13d9f9SBrian Haley sa_family_t family = PF_INET; 8071da177e4SLinus Torvalds 8081da177e4SLinus Torvalds if (sctp_get_pf_specific(PF_INET6)) 8091da177e4SLinus Torvalds family = PF_INET6; 8101da177e4SLinus Torvalds 8112ce95503SEric W. Biederman err = inet_ctl_sock_create(&net->sctp.ctl_sock, family, 8122ce95503SEric W. Biederman SOCK_SEQPACKET, IPPROTO_SCTP, net); 813fb13d9f9SBrian Haley 814fb13d9f9SBrian Haley /* If IPv6 socket could not be created, try the IPv4 socket */ 815fb13d9f9SBrian Haley if (err < 0 && family == PF_INET6) 8162ce95503SEric W. Biederman err = inet_ctl_sock_create(&net->sctp.ctl_sock, AF_INET, 817fb13d9f9SBrian Haley SOCK_SEQPACKET, IPPROTO_SCTP, 8182ce95503SEric W. Biederman net); 819fb13d9f9SBrian Haley 8201da177e4SLinus Torvalds if (err < 0) { 821145ce502SJoe Perches pr_err("Failed to create the SCTP control socket\n"); 8221da177e4SLinus Torvalds return err; 8231da177e4SLinus Torvalds } 8241da177e4SLinus Torvalds return 0; 8251da177e4SLinus Torvalds } 8261da177e4SLinus Torvalds 8271da177e4SLinus Torvalds /* Register address family specific functions. */ 8281da177e4SLinus Torvalds int sctp_register_af(struct sctp_af *af) 8291da177e4SLinus Torvalds { 8301da177e4SLinus Torvalds switch (af->sa_family) { 8311da177e4SLinus Torvalds case AF_INET: 8321da177e4SLinus Torvalds if (sctp_af_v4_specific) 8331da177e4SLinus Torvalds return 0; 8341da177e4SLinus Torvalds sctp_af_v4_specific = af; 8351da177e4SLinus Torvalds break; 8361da177e4SLinus Torvalds case AF_INET6: 8371da177e4SLinus Torvalds if (sctp_af_v6_specific) 8381da177e4SLinus Torvalds return 0; 8391da177e4SLinus Torvalds sctp_af_v6_specific = af; 8401da177e4SLinus Torvalds break; 8411da177e4SLinus Torvalds default: 8421da177e4SLinus Torvalds return 0; 8431da177e4SLinus Torvalds } 8441da177e4SLinus Torvalds 8451da177e4SLinus Torvalds INIT_LIST_HEAD(&af->list); 8461da177e4SLinus Torvalds list_add_tail(&af->list, &sctp_address_families); 8471da177e4SLinus Torvalds return 1; 8481da177e4SLinus Torvalds } 8491da177e4SLinus Torvalds 8501da177e4SLinus Torvalds /* Get the table of functions for manipulating a particular address 8511da177e4SLinus Torvalds * family. 8521da177e4SLinus Torvalds */ 8531da177e4SLinus Torvalds struct sctp_af *sctp_get_af_specific(sa_family_t family) 8541da177e4SLinus Torvalds { 8551da177e4SLinus Torvalds switch (family) { 8561da177e4SLinus Torvalds case AF_INET: 8571da177e4SLinus Torvalds return sctp_af_v4_specific; 8581da177e4SLinus Torvalds case AF_INET6: 8591da177e4SLinus Torvalds return sctp_af_v6_specific; 8601da177e4SLinus Torvalds default: 8611da177e4SLinus Torvalds return NULL; 8621da177e4SLinus Torvalds } 8631da177e4SLinus Torvalds } 8641da177e4SLinus Torvalds 8651da177e4SLinus Torvalds /* Common code to initialize a AF_INET msg_name. */ 8661da177e4SLinus Torvalds static void sctp_inet_msgname(char *msgname, int *addr_len) 8671da177e4SLinus Torvalds { 8681da177e4SLinus Torvalds struct sockaddr_in *sin; 8691da177e4SLinus Torvalds 8701da177e4SLinus Torvalds sin = (struct sockaddr_in *)msgname; 8711da177e4SLinus Torvalds *addr_len = sizeof(struct sockaddr_in); 8721da177e4SLinus Torvalds sin->sin_family = AF_INET; 8731da177e4SLinus Torvalds memset(sin->sin_zero, 0, sizeof(sin->sin_zero)); 8741da177e4SLinus Torvalds } 8751da177e4SLinus Torvalds 8761da177e4SLinus Torvalds /* Copy the primary address of the peer primary address as the msg_name. */ 8771da177e4SLinus Torvalds static void sctp_inet_event_msgname(struct sctp_ulpevent *event, char *msgname, 8781da177e4SLinus Torvalds int *addr_len) 8791da177e4SLinus Torvalds { 8801da177e4SLinus Torvalds struct sockaddr_in *sin, *sinfrom; 8811da177e4SLinus Torvalds 8821da177e4SLinus Torvalds if (msgname) { 8831da177e4SLinus Torvalds struct sctp_association *asoc; 8841da177e4SLinus Torvalds 8851da177e4SLinus Torvalds asoc = event->asoc; 8861da177e4SLinus Torvalds sctp_inet_msgname(msgname, addr_len); 8871da177e4SLinus Torvalds sin = (struct sockaddr_in *)msgname; 8881da177e4SLinus Torvalds sinfrom = &asoc->peer.primary_addr.v4; 8891da177e4SLinus Torvalds sin->sin_port = htons(asoc->peer.port); 8901da177e4SLinus Torvalds sin->sin_addr.s_addr = sinfrom->sin_addr.s_addr; 8911da177e4SLinus Torvalds } 8921da177e4SLinus Torvalds } 8931da177e4SLinus Torvalds 8941da177e4SLinus Torvalds /* Initialize and copy out a msgname from an inbound skb. */ 8951da177e4SLinus Torvalds static void sctp_inet_skb_msgname(struct sk_buff *skb, char *msgname, int *len) 8961da177e4SLinus Torvalds { 8971da177e4SLinus Torvalds if (msgname) { 8982c0fd387SArnaldo Carvalho de Melo struct sctphdr *sh = sctp_hdr(skb); 8992c0fd387SArnaldo Carvalho de Melo struct sockaddr_in *sin = (struct sockaddr_in *)msgname; 9002c0fd387SArnaldo Carvalho de Melo 9011da177e4SLinus Torvalds sctp_inet_msgname(msgname, len); 9021da177e4SLinus Torvalds sin->sin_port = sh->source; 903eddc9ec5SArnaldo Carvalho de Melo sin->sin_addr.s_addr = ip_hdr(skb)->saddr; 9041da177e4SLinus Torvalds } 9051da177e4SLinus Torvalds } 9061da177e4SLinus Torvalds 9071da177e4SLinus Torvalds /* Do we support this AF? */ 9081da177e4SLinus Torvalds static int sctp_inet_af_supported(sa_family_t family, struct sctp_sock *sp) 9091da177e4SLinus Torvalds { 9101da177e4SLinus Torvalds /* PF_INET only supports AF_INET addresses. */ 911a02cec21SEric Dumazet return AF_INET == family; 9121da177e4SLinus Torvalds } 9131da177e4SLinus Torvalds 9141da177e4SLinus Torvalds /* Address matching with wildcards allowed. */ 9151da177e4SLinus Torvalds static int sctp_inet_cmp_addr(const union sctp_addr *addr1, 9161da177e4SLinus Torvalds const union sctp_addr *addr2, 9171da177e4SLinus Torvalds struct sctp_sock *opt) 9181da177e4SLinus Torvalds { 9191da177e4SLinus Torvalds /* PF_INET only supports AF_INET addresses. */ 9201da177e4SLinus Torvalds if (addr1->sa.sa_family != addr2->sa.sa_family) 9211da177e4SLinus Torvalds return 0; 922e6f1cebfSAl Viro if (htonl(INADDR_ANY) == addr1->v4.sin_addr.s_addr || 923e6f1cebfSAl Viro htonl(INADDR_ANY) == addr2->v4.sin_addr.s_addr) 9241da177e4SLinus Torvalds return 1; 9251da177e4SLinus Torvalds if (addr1->v4.sin_addr.s_addr == addr2->v4.sin_addr.s_addr) 9261da177e4SLinus Torvalds return 1; 9271da177e4SLinus Torvalds 9281da177e4SLinus Torvalds return 0; 9291da177e4SLinus Torvalds } 9301da177e4SLinus Torvalds 9311da177e4SLinus Torvalds /* Verify that provided sockaddr looks bindable. Common verification has 9321da177e4SLinus Torvalds * already been taken care of. 9331da177e4SLinus Torvalds */ 9341da177e4SLinus Torvalds static int sctp_inet_bind_verify(struct sctp_sock *opt, union sctp_addr *addr) 9351da177e4SLinus Torvalds { 9361da177e4SLinus Torvalds return sctp_v4_available(addr, opt); 9371da177e4SLinus Torvalds } 9381da177e4SLinus Torvalds 9391da177e4SLinus Torvalds /* Verify that sockaddr looks sendable. Common verification has already 9401da177e4SLinus Torvalds * been taken care of. 9411da177e4SLinus Torvalds */ 9421da177e4SLinus Torvalds static int sctp_inet_send_verify(struct sctp_sock *opt, union sctp_addr *addr) 9431da177e4SLinus Torvalds { 9441da177e4SLinus Torvalds return 1; 9451da177e4SLinus Torvalds } 9461da177e4SLinus Torvalds 9471da177e4SLinus Torvalds /* Fill in Supported Address Type information for INIT and INIT-ACK 9481da177e4SLinus Torvalds * chunks. Returns number of addresses supported. 9491da177e4SLinus Torvalds */ 9501da177e4SLinus Torvalds static int sctp_inet_supported_addrs(const struct sctp_sock *opt, 9513dbe8656SAl Viro __be16 *types) 9521da177e4SLinus Torvalds { 9531da177e4SLinus Torvalds types[0] = SCTP_PARAM_IPV4_ADDRESS; 9541da177e4SLinus Torvalds return 1; 9551da177e4SLinus Torvalds } 9561da177e4SLinus Torvalds 9571da177e4SLinus Torvalds /* Wrapper routine that calls the ip transmit routine. */ 9581da177e4SLinus Torvalds static inline int sctp_v4_xmit(struct sk_buff *skb, 959f880374cSHerbert Xu struct sctp_transport *transport) 9601da177e4SLinus Torvalds { 961f880374cSHerbert Xu struct inet_sock *inet = inet_sk(skb->sk); 9628a9c58d2SXin Long __u8 dscp = inet->tos; 963f880374cSHerbert Xu 964bb33381dSDaniel Borkmann pr_debug("%s: skb:%p, len:%d, src:%pI4, dst:%pI4\n", __func__, skb, 9658a9c58d2SXin Long skb->len, &transport->fl.u.ip4.saddr, 9668a9c58d2SXin Long &transport->fl.u.ip4.daddr); 9678a9c58d2SXin Long 9688a9c58d2SXin Long if (transport->dscp & SCTP_DSCP_SET_MASK) 9698a9c58d2SXin Long dscp = transport->dscp & SCTP_DSCP_VAL_MASK; 9701da177e4SLinus Torvalds 971f880374cSHerbert Xu inet->pmtudisc = transport->param_flags & SPP_PMTUD_ENABLE ? 972f880374cSHerbert Xu IP_PMTUDISC_DO : IP_PMTUDISC_DONT; 973f880374cSHerbert Xu 974b01a2407SEric W. Biederman SCTP_INC_STATS(sock_net(&inet->sk), SCTP_MIB_OUTSCTPPACKS); 975bb33381dSDaniel Borkmann 9768a9c58d2SXin Long return __ip_queue_xmit(&inet->sk, skb, &transport->fl, dscp); 9771da177e4SLinus Torvalds } 9781da177e4SLinus Torvalds 97915efbe76SNeil Horman static struct sctp_af sctp_af_inet; 9801da177e4SLinus Torvalds 9811da177e4SLinus Torvalds static struct sctp_pf sctp_pf_inet = { 9821da177e4SLinus Torvalds .event_msgname = sctp_inet_event_msgname, 9831da177e4SLinus Torvalds .skb_msgname = sctp_inet_skb_msgname, 9841da177e4SLinus Torvalds .af_supported = sctp_inet_af_supported, 9851da177e4SLinus Torvalds .cmp_addr = sctp_inet_cmp_addr, 9861da177e4SLinus Torvalds .bind_verify = sctp_inet_bind_verify, 9871da177e4SLinus Torvalds .send_verify = sctp_inet_send_verify, 9881da177e4SLinus Torvalds .supported_addrs = sctp_inet_supported_addrs, 9891da177e4SLinus Torvalds .create_accept_sk = sctp_v4_create_accept_sk, 990299ee123SJason Gunthorpe .addr_to_user = sctp_v4_addr_to_user, 991299ee123SJason Gunthorpe .to_sk_saddr = sctp_v4_to_sk_saddr, 992299ee123SJason Gunthorpe .to_sk_daddr = sctp_v4_to_sk_daddr, 993b7e10c25SRichard Haines .copy_ip_options = sctp_v4_copy_ip_options, 99415efbe76SNeil Horman .af = &sctp_af_inet 9951da177e4SLinus Torvalds }; 9961da177e4SLinus Torvalds 9971da177e4SLinus Torvalds /* Notifier for inetaddr addition/deletion events. */ 9981da177e4SLinus Torvalds static struct notifier_block sctp_inetaddr_notifier = { 9991da177e4SLinus Torvalds .notifier_call = sctp_inetaddr_event, 10001da177e4SLinus Torvalds }; 10011da177e4SLinus Torvalds 10021da177e4SLinus Torvalds /* Socket operations. */ 100390ddc4f0SEric Dumazet static const struct proto_ops inet_seqpacket_ops = { 10041da177e4SLinus Torvalds .family = PF_INET, 10051da177e4SLinus Torvalds .owner = THIS_MODULE, 10061da177e4SLinus Torvalds .release = inet_release, /* Needs to be wrapped... */ 10071da177e4SLinus Torvalds .bind = inet_bind, 1008644fbdeaSXin Long .connect = sctp_inet_connect, 10091da177e4SLinus Torvalds .socketpair = sock_no_socketpair, 10101da177e4SLinus Torvalds .accept = inet_accept, 10111da177e4SLinus Torvalds .getname = inet_getname, /* Semantics are different. */ 1012a11e1d43SLinus Torvalds .poll = sctp_poll, 10131da177e4SLinus Torvalds .ioctl = inet_ioctl, 1014c7cbdbf2SArnd Bergmann .gettstamp = sock_gettstamp, 10151da177e4SLinus Torvalds .listen = sctp_inet_listen, 10161da177e4SLinus Torvalds .shutdown = inet_shutdown, /* Looks harmless. */ 1017543d9cfeSArnaldo Carvalho de Melo .setsockopt = sock_common_setsockopt, /* IP_SOL IP_OPTION is a problem */ 10181da177e4SLinus Torvalds .getsockopt = sock_common_getsockopt, 10191da177e4SLinus Torvalds .sendmsg = inet_sendmsg, 1020fd2d180aSXin Long .recvmsg = inet_recvmsg, 10211da177e4SLinus Torvalds .mmap = sock_no_mmap, 10221da177e4SLinus Torvalds .sendpage = sock_no_sendpage, 1023543d9cfeSArnaldo Carvalho de Melo #ifdef CONFIG_COMPAT 1024543d9cfeSArnaldo Carvalho de Melo .compat_setsockopt = compat_sock_common_setsockopt, 1025543d9cfeSArnaldo Carvalho de Melo .compat_getsockopt = compat_sock_common_getsockopt, 1026543d9cfeSArnaldo Carvalho de Melo #endif 10271da177e4SLinus Torvalds }; 10281da177e4SLinus Torvalds 10291da177e4SLinus Torvalds /* Registration with AF_INET family. */ 10301da177e4SLinus Torvalds static struct inet_protosw sctp_seqpacket_protosw = { 10311da177e4SLinus Torvalds .type = SOCK_SEQPACKET, 10321da177e4SLinus Torvalds .protocol = IPPROTO_SCTP, 10331da177e4SLinus Torvalds .prot = &sctp_prot, 10341da177e4SLinus Torvalds .ops = &inet_seqpacket_ops, 10351da177e4SLinus Torvalds .flags = SCTP_PROTOSW_FLAG 10361da177e4SLinus Torvalds }; 10371da177e4SLinus Torvalds static struct inet_protosw sctp_stream_protosw = { 10381da177e4SLinus Torvalds .type = SOCK_STREAM, 10391da177e4SLinus Torvalds .protocol = IPPROTO_SCTP, 10401da177e4SLinus Torvalds .prot = &sctp_prot, 10411da177e4SLinus Torvalds .ops = &inet_seqpacket_ops, 10421da177e4SLinus Torvalds .flags = SCTP_PROTOSW_FLAG 10431da177e4SLinus Torvalds }; 10441da177e4SLinus Torvalds 10451da177e4SLinus Torvalds /* Register with IP layer. */ 104632613090SAlexey Dobriyan static const struct net_protocol sctp_protocol = { 10471da177e4SLinus Torvalds .handler = sctp_rcv, 10481da177e4SLinus Torvalds .err_handler = sctp_v4_err, 10491da177e4SLinus Torvalds .no_policy = 1, 1050bb2db45bSEric W. Biederman .netns_ok = 1, 10518ed1dc44SHannes Frederic Sowa .icmp_strict_tag_validation = 1, 10521da177e4SLinus Torvalds }; 10531da177e4SLinus Torvalds 10541da177e4SLinus Torvalds /* IPv4 address related functions. */ 105515efbe76SNeil Horman static struct sctp_af sctp_af_inet = { 1056543d9cfeSArnaldo Carvalho de Melo .sa_family = AF_INET, 10571da177e4SLinus Torvalds .sctp_xmit = sctp_v4_xmit, 10581da177e4SLinus Torvalds .setsockopt = ip_setsockopt, 10591da177e4SLinus Torvalds .getsockopt = ip_getsockopt, 10601da177e4SLinus Torvalds .get_dst = sctp_v4_get_dst, 10611da177e4SLinus Torvalds .get_saddr = sctp_v4_get_saddr, 10621da177e4SLinus Torvalds .copy_addrlist = sctp_v4_copy_addrlist, 10631da177e4SLinus Torvalds .from_skb = sctp_v4_from_skb, 10641da177e4SLinus Torvalds .from_sk = sctp_v4_from_sk, 10651da177e4SLinus Torvalds .from_addr_param = sctp_v4_from_addr_param, 10661da177e4SLinus Torvalds .to_addr_param = sctp_v4_to_addr_param, 10671da177e4SLinus Torvalds .cmp_addr = sctp_v4_cmp_addr, 10681da177e4SLinus Torvalds .addr_valid = sctp_v4_addr_valid, 10691da177e4SLinus Torvalds .inaddr_any = sctp_v4_inaddr_any, 10701da177e4SLinus Torvalds .is_any = sctp_v4_is_any, 10711da177e4SLinus Torvalds .available = sctp_v4_available, 10721da177e4SLinus Torvalds .scope = sctp_v4_scope, 10731da177e4SLinus Torvalds .skb_iif = sctp_v4_skb_iif, 10741da177e4SLinus Torvalds .is_ce = sctp_v4_is_ce, 10751da177e4SLinus Torvalds .seq_dump_addr = sctp_v4_seq_dump_addr, 1076b9031d9dSVlad Yasevich .ecn_capable = sctp_v4_ecn_capable, 10771da177e4SLinus Torvalds .net_header_len = sizeof(struct iphdr), 10781da177e4SLinus Torvalds .sockaddr_len = sizeof(struct sockaddr_in), 1079b7e10c25SRichard Haines .ip_options_len = sctp_v4_ip_options_len, 1080543d9cfeSArnaldo Carvalho de Melo #ifdef CONFIG_COMPAT 1081543d9cfeSArnaldo Carvalho de Melo .compat_setsockopt = compat_ip_setsockopt, 1082543d9cfeSArnaldo Carvalho de Melo .compat_getsockopt = compat_ip_getsockopt, 1083543d9cfeSArnaldo Carvalho de Melo #endif 10841da177e4SLinus Torvalds }; 10851da177e4SLinus Torvalds 10868d72651dSwangweidong struct sctp_pf *sctp_get_pf_specific(sa_family_t family) 10878d72651dSwangweidong { 10881da177e4SLinus Torvalds switch (family) { 10891da177e4SLinus Torvalds case PF_INET: 10901da177e4SLinus Torvalds return sctp_pf_inet_specific; 10911da177e4SLinus Torvalds case PF_INET6: 10921da177e4SLinus Torvalds return sctp_pf_inet6_specific; 10931da177e4SLinus Torvalds default: 10941da177e4SLinus Torvalds return NULL; 10951da177e4SLinus Torvalds } 10961da177e4SLinus Torvalds } 10971da177e4SLinus Torvalds 10981da177e4SLinus Torvalds /* Register the PF specific function table. */ 10991da177e4SLinus Torvalds int sctp_register_pf(struct sctp_pf *pf, sa_family_t family) 11001da177e4SLinus Torvalds { 11011da177e4SLinus Torvalds switch (family) { 11021da177e4SLinus Torvalds case PF_INET: 11031da177e4SLinus Torvalds if (sctp_pf_inet_specific) 11041da177e4SLinus Torvalds return 0; 11051da177e4SLinus Torvalds sctp_pf_inet_specific = pf; 11061da177e4SLinus Torvalds break; 11071da177e4SLinus Torvalds case PF_INET6: 11081da177e4SLinus Torvalds if (sctp_pf_inet6_specific) 11091da177e4SLinus Torvalds return 0; 11101da177e4SLinus Torvalds sctp_pf_inet6_specific = pf; 11111da177e4SLinus Torvalds break; 11121da177e4SLinus Torvalds default: 11131da177e4SLinus Torvalds return 0; 11141da177e4SLinus Torvalds } 11151da177e4SLinus Torvalds return 1; 11161da177e4SLinus Torvalds } 11171da177e4SLinus Torvalds 1118b01a2407SEric W. Biederman static inline int init_sctp_mibs(struct net *net) 11191da177e4SLinus Torvalds { 1120698365faSWANG Cong net->sctp.sctp_statistics = alloc_percpu(struct sctp_mib); 1121698365faSWANG Cong if (!net->sctp.sctp_statistics) 1122698365faSWANG Cong return -ENOMEM; 1123698365faSWANG Cong return 0; 11241da177e4SLinus Torvalds } 11251da177e4SLinus Torvalds 1126b01a2407SEric W. Biederman static inline void cleanup_sctp_mibs(struct net *net) 11271da177e4SLinus Torvalds { 1128698365faSWANG Cong free_percpu(net->sctp.sctp_statistics); 11291da177e4SLinus Torvalds } 11301da177e4SLinus Torvalds 1131270637abSVlad Yasevich static void sctp_v4_pf_init(void) 1132270637abSVlad Yasevich { 1133270637abSVlad Yasevich /* Initialize the SCTP specific PF functions. */ 1134270637abSVlad Yasevich sctp_register_pf(&sctp_pf_inet, PF_INET); 1135270637abSVlad Yasevich sctp_register_af(&sctp_af_inet); 1136270637abSVlad Yasevich } 1137270637abSVlad Yasevich 1138270637abSVlad Yasevich static void sctp_v4_pf_exit(void) 1139270637abSVlad Yasevich { 1140270637abSVlad Yasevich list_del(&sctp_af_inet.list); 1141270637abSVlad Yasevich } 1142270637abSVlad Yasevich 1143270637abSVlad Yasevich static int sctp_v4_protosw_init(void) 1144270637abSVlad Yasevich { 1145270637abSVlad Yasevich int rc; 1146270637abSVlad Yasevich 1147270637abSVlad Yasevich rc = proto_register(&sctp_prot, 1); 1148270637abSVlad Yasevich if (rc) 1149270637abSVlad Yasevich return rc; 1150270637abSVlad Yasevich 1151270637abSVlad Yasevich /* Register SCTP(UDP and TCP style) with socket layer. */ 1152270637abSVlad Yasevich inet_register_protosw(&sctp_seqpacket_protosw); 1153270637abSVlad Yasevich inet_register_protosw(&sctp_stream_protosw); 1154270637abSVlad Yasevich 1155270637abSVlad Yasevich return 0; 1156270637abSVlad Yasevich } 1157270637abSVlad Yasevich 1158270637abSVlad Yasevich static void sctp_v4_protosw_exit(void) 1159270637abSVlad Yasevich { 1160270637abSVlad Yasevich inet_unregister_protosw(&sctp_stream_protosw); 1161270637abSVlad Yasevich inet_unregister_protosw(&sctp_seqpacket_protosw); 1162270637abSVlad Yasevich proto_unregister(&sctp_prot); 1163270637abSVlad Yasevich } 1164270637abSVlad Yasevich 1165270637abSVlad Yasevich static int sctp_v4_add_protocol(void) 1166270637abSVlad Yasevich { 1167270637abSVlad Yasevich /* Register notifier for inet address additions/deletions. */ 1168270637abSVlad Yasevich register_inetaddr_notifier(&sctp_inetaddr_notifier); 1169270637abSVlad Yasevich 1170270637abSVlad Yasevich /* Register SCTP with inet layer. */ 1171270637abSVlad Yasevich if (inet_add_protocol(&sctp_protocol, IPPROTO_SCTP) < 0) 1172270637abSVlad Yasevich return -EAGAIN; 1173270637abSVlad Yasevich 1174270637abSVlad Yasevich return 0; 1175270637abSVlad Yasevich } 1176270637abSVlad Yasevich 1177270637abSVlad Yasevich static void sctp_v4_del_protocol(void) 1178270637abSVlad Yasevich { 1179270637abSVlad Yasevich inet_del_protocol(&sctp_protocol, IPPROTO_SCTP); 1180270637abSVlad Yasevich unregister_inetaddr_notifier(&sctp_inetaddr_notifier); 1181270637abSVlad Yasevich } 1182270637abSVlad Yasevich 11838e2d61e0SMarcelo Ricardo Leitner static int __net_init sctp_defaults_init(struct net *net) 11844db67e80SEric W. Biederman { 11852ce95503SEric W. Biederman int status; 11862ce95503SEric W. Biederman 1187e1fc3b14SEric W. Biederman /* 1188e1fc3b14SEric W. Biederman * 14. Suggested SCTP Protocol Parameter Values 1189e1fc3b14SEric W. Biederman */ 1190e1fc3b14SEric W. Biederman /* The following protocol parameters are RECOMMENDED: */ 1191e1fc3b14SEric W. Biederman /* RTO.Initial - 3 seconds */ 1192e1fc3b14SEric W. Biederman net->sctp.rto_initial = SCTP_RTO_INITIAL; 1193e1fc3b14SEric W. Biederman /* RTO.Min - 1 second */ 1194e1fc3b14SEric W. Biederman net->sctp.rto_min = SCTP_RTO_MIN; 1195e1fc3b14SEric W. Biederman /* RTO.Max - 60 seconds */ 1196e1fc3b14SEric W. Biederman net->sctp.rto_max = SCTP_RTO_MAX; 1197e1fc3b14SEric W. Biederman /* RTO.Alpha - 1/8 */ 1198e1fc3b14SEric W. Biederman net->sctp.rto_alpha = SCTP_RTO_ALPHA; 1199e1fc3b14SEric W. Biederman /* RTO.Beta - 1/4 */ 1200e1fc3b14SEric W. Biederman net->sctp.rto_beta = SCTP_RTO_BETA; 1201e1fc3b14SEric W. Biederman 1202e1fc3b14SEric W. Biederman /* Valid.Cookie.Life - 60 seconds */ 1203e1fc3b14SEric W. Biederman net->sctp.valid_cookie_life = SCTP_DEFAULT_COOKIE_LIFE; 1204e1fc3b14SEric W. Biederman 1205e1fc3b14SEric W. Biederman /* Whether Cookie Preservative is enabled(1) or not(0) */ 1206e1fc3b14SEric W. Biederman net->sctp.cookie_preserve_enable = 1; 1207e1fc3b14SEric W. Biederman 12083c68198eSNeil Horman /* Default sctp sockets to use md5 as their hmac alg */ 12090d0863b0SNeil Horman #if defined (CONFIG_SCTP_DEFAULT_COOKIE_HMAC_MD5) 12103c68198eSNeil Horman net->sctp.sctp_hmac_alg = "md5"; 12110d0863b0SNeil Horman #elif defined (CONFIG_SCTP_DEFAULT_COOKIE_HMAC_SHA1) 12123c68198eSNeil Horman net->sctp.sctp_hmac_alg = "sha1"; 12133c68198eSNeil Horman #else 12143c68198eSNeil Horman net->sctp.sctp_hmac_alg = NULL; 12153c68198eSNeil Horman #endif 12163c68198eSNeil Horman 1217e1fc3b14SEric W. Biederman /* Max.Burst - 4 */ 1218e1fc3b14SEric W. Biederman net->sctp.max_burst = SCTP_DEFAULT_MAX_BURST; 1219e1fc3b14SEric W. Biederman 1220*34515e94SXin Long /* Disable of Primary Path Switchover by default */ 1221*34515e94SXin Long net->sctp.ps_retrans = SCTP_PS_RETRANS_MAX; 1222*34515e94SXin Long 1223566178f8SZhu Yanjun /* Enable pf state by default */ 1224566178f8SZhu Yanjun net->sctp.pf_enable = 1; 1225566178f8SZhu Yanjun 1226aef587beSXin Long /* Ignore pf exposure feature by default */ 1227aef587beSXin Long net->sctp.pf_expose = SCTP_PF_EXPOSE_UNSET; 1228aef587beSXin Long 1229e1fc3b14SEric W. Biederman /* Association.Max.Retrans - 10 attempts 1230e1fc3b14SEric W. Biederman * Path.Max.Retrans - 5 attempts (per destination address) 1231e1fc3b14SEric W. Biederman * Max.Init.Retransmits - 8 attempts 1232e1fc3b14SEric W. Biederman */ 1233e1fc3b14SEric W. Biederman net->sctp.max_retrans_association = 10; 1234e1fc3b14SEric W. Biederman net->sctp.max_retrans_path = 5; 1235e1fc3b14SEric W. Biederman net->sctp.max_retrans_init = 8; 1236e1fc3b14SEric W. Biederman 1237e1fc3b14SEric W. Biederman /* Sendbuffer growth - do per-socket accounting */ 1238e1fc3b14SEric W. Biederman net->sctp.sndbuf_policy = 0; 1239e1fc3b14SEric W. Biederman 1240e1fc3b14SEric W. Biederman /* Rcvbuffer growth - do per-socket accounting */ 1241e1fc3b14SEric W. Biederman net->sctp.rcvbuf_policy = 0; 1242e1fc3b14SEric W. Biederman 1243e1fc3b14SEric W. Biederman /* HB.interval - 30 seconds */ 1244e1fc3b14SEric W. Biederman net->sctp.hb_interval = SCTP_DEFAULT_TIMEOUT_HEARTBEAT; 1245e1fc3b14SEric W. Biederman 1246e1fc3b14SEric W. Biederman /* delayed SACK timeout */ 1247e1fc3b14SEric W. Biederman net->sctp.sack_timeout = SCTP_DEFAULT_TIMEOUT_SACK; 1248e1fc3b14SEric W. Biederman 1249e1fc3b14SEric W. Biederman /* Disable ADDIP by default. */ 1250e1fc3b14SEric W. Biederman net->sctp.addip_enable = 0; 1251e1fc3b14SEric W. Biederman net->sctp.addip_noauth = 0; 1252e1fc3b14SEric W. Biederman net->sctp.default_auto_asconf = 0; 1253e1fc3b14SEric W. Biederman 1254e1fc3b14SEric W. Biederman /* Enable PR-SCTP by default. */ 1255e1fc3b14SEric W. Biederman net->sctp.prsctp_enable = 1; 1256e1fc3b14SEric W. Biederman 1257c28445c3SXin Long /* Disable RECONF by default. */ 1258c28445c3SXin Long net->sctp.reconf_enable = 0; 1259c28445c3SXin Long 1260e1fc3b14SEric W. Biederman /* Disable AUTH by default. */ 1261e1fc3b14SEric W. Biederman net->sctp.auth_enable = 0; 1262e1fc3b14SEric W. Biederman 12631b0b8114SXin Long /* Enable ECN by default. */ 12641b0b8114SXin Long net->sctp.ecn_enable = 1; 12651b0b8114SXin Long 1266e1fc3b14SEric W. Biederman /* Set SCOPE policy to enabled */ 1267e1fc3b14SEric W. Biederman net->sctp.scope_policy = SCTP_SCOPE_POLICY_ENABLE; 1268e1fc3b14SEric W. Biederman 1269e1fc3b14SEric W. Biederman /* Set the default rwnd update threshold */ 1270e1fc3b14SEric W. Biederman net->sctp.rwnd_upd_shift = SCTP_DEFAULT_RWND_SHIFT; 1271e1fc3b14SEric W. Biederman 1272e1fc3b14SEric W. Biederman /* Initialize maximum autoclose timeout. */ 1273e1fc3b14SEric W. Biederman net->sctp.max_autoclose = INT_MAX / HZ; 1274e1fc3b14SEric W. Biederman 1275ebb7e95dSEric W. Biederman status = sctp_sysctl_net_register(net); 1276ebb7e95dSEric W. Biederman if (status) 1277ebb7e95dSEric W. Biederman goto err_sysctl_register; 1278ebb7e95dSEric W. Biederman 1279b01a2407SEric W. Biederman /* Allocate and initialise sctp mibs. */ 1280b01a2407SEric W. Biederman status = init_sctp_mibs(net); 1281b01a2407SEric W. Biederman if (status) 1282b01a2407SEric W. Biederman goto err_init_mibs; 1283b01a2407SEric W. Biederman 1284d47d08c8SAl Viro #ifdef CONFIG_PROC_FS 128513d782f6SEric W. Biederman /* Initialize proc fs directory. */ 128613d782f6SEric W. Biederman status = sctp_proc_init(net); 128713d782f6SEric W. Biederman if (status) 128813d782f6SEric W. Biederman goto err_init_proc; 1289d47d08c8SAl Viro #endif 129013d782f6SEric W. Biederman 129113d782f6SEric W. Biederman sctp_dbg_objcnt_init(net); 129213d782f6SEric W. Biederman 12934db67e80SEric W. Biederman /* Initialize the local address list. */ 12944db67e80SEric W. Biederman INIT_LIST_HEAD(&net->sctp.local_addr_list); 12954db67e80SEric W. Biederman spin_lock_init(&net->sctp.local_addr_lock); 12964db67e80SEric W. Biederman sctp_get_local_addr_list(net); 12974db67e80SEric W. Biederman 12984db67e80SEric W. Biederman /* Initialize the address event list */ 12994db67e80SEric W. Biederman INIT_LIST_HEAD(&net->sctp.addr_waitq); 13004db67e80SEric W. Biederman INIT_LIST_HEAD(&net->sctp.auto_asconf_splist); 13014db67e80SEric W. Biederman spin_lock_init(&net->sctp.addr_wq_lock); 13024db67e80SEric W. Biederman net->sctp.addr_wq_timer.expires = 0; 13039c3b5751SKees Cook timer_setup(&net->sctp.addr_wq_timer, sctp_addr_wq_timeout_handler, 0); 13044db67e80SEric W. Biederman 13054db67e80SEric W. Biederman return 0; 13062ce95503SEric W. Biederman 13077ae665f1SArnd Bergmann #ifdef CONFIG_PROC_FS 130813d782f6SEric W. Biederman err_init_proc: 1309b01a2407SEric W. Biederman cleanup_sctp_mibs(net); 13107ae665f1SArnd Bergmann #endif 1311b01a2407SEric W. Biederman err_init_mibs: 1312ebb7e95dSEric W. Biederman sctp_sysctl_net_unregister(net); 1313ebb7e95dSEric W. Biederman err_sysctl_register: 13142ce95503SEric W. Biederman return status; 13154db67e80SEric W. Biederman } 13164db67e80SEric W. Biederman 13178e2d61e0SMarcelo Ricardo Leitner static void __net_exit sctp_defaults_exit(struct net *net) 13184db67e80SEric W. Biederman { 13194db67e80SEric W. Biederman /* Free the local address list */ 13204db67e80SEric W. Biederman sctp_free_addr_wq(net); 13214db67e80SEric W. Biederman sctp_free_local_addr_list(net); 13222ce95503SEric W. Biederman 1323d47d08c8SAl Viro #ifdef CONFIG_PROC_FS 1324d47d08c8SAl Viro remove_proc_subtree("sctp", net->proc_net); 1325d47d08c8SAl Viro net->sctp.proc_net_sctp = NULL; 1326d47d08c8SAl Viro #endif 1327b01a2407SEric W. Biederman cleanup_sctp_mibs(net); 1328ebb7e95dSEric W. Biederman sctp_sysctl_net_unregister(net); 13294db67e80SEric W. Biederman } 13304db67e80SEric W. Biederman 13318e2d61e0SMarcelo Ricardo Leitner static struct pernet_operations sctp_defaults_ops = { 13328e2d61e0SMarcelo Ricardo Leitner .init = sctp_defaults_init, 13338e2d61e0SMarcelo Ricardo Leitner .exit = sctp_defaults_exit, 13348e2d61e0SMarcelo Ricardo Leitner }; 13358e2d61e0SMarcelo Ricardo Leitner 13368e2d61e0SMarcelo Ricardo Leitner static int __net_init sctp_ctrlsock_init(struct net *net) 13378e2d61e0SMarcelo Ricardo Leitner { 13388e2d61e0SMarcelo Ricardo Leitner int status; 13398e2d61e0SMarcelo Ricardo Leitner 13408e2d61e0SMarcelo Ricardo Leitner /* Initialize the control inode/socket for handling OOTB packets. */ 13418e2d61e0SMarcelo Ricardo Leitner status = sctp_ctl_sock_init(net); 13428e2d61e0SMarcelo Ricardo Leitner if (status) 13438e2d61e0SMarcelo Ricardo Leitner pr_err("Failed to initialize the SCTP control sock\n"); 13448e2d61e0SMarcelo Ricardo Leitner 13458e2d61e0SMarcelo Ricardo Leitner return status; 13468e2d61e0SMarcelo Ricardo Leitner } 13478e2d61e0SMarcelo Ricardo Leitner 1348b456d724SChristophe JAILLET static void __net_exit sctp_ctrlsock_exit(struct net *net) 13498e2d61e0SMarcelo Ricardo Leitner { 13508e2d61e0SMarcelo Ricardo Leitner /* Free the control endpoint. */ 13518e2d61e0SMarcelo Ricardo Leitner inet_ctl_sock_destroy(net->sctp.ctl_sock); 13528e2d61e0SMarcelo Ricardo Leitner } 13538e2d61e0SMarcelo Ricardo Leitner 13548e2d61e0SMarcelo Ricardo Leitner static struct pernet_operations sctp_ctrlsock_ops = { 13558e2d61e0SMarcelo Ricardo Leitner .init = sctp_ctrlsock_init, 13568e2d61e0SMarcelo Ricardo Leitner .exit = sctp_ctrlsock_exit, 13574db67e80SEric W. Biederman }; 13584db67e80SEric W. Biederman 13591da177e4SLinus Torvalds /* Initialize the universe into something sensible. */ 1360dda91928SDaniel Borkmann static __init int sctp_init(void) 13611da177e4SLinus Torvalds { 13621da177e4SLinus Torvalds int i; 13631da177e4SLinus Torvalds int status = -EINVAL; 13641da177e4SLinus Torvalds unsigned long goal; 13654d93df0aSNeil Horman unsigned long limit; 1366ca79b0c2SArun KS unsigned long nr_pages = totalram_pages(); 13674d93df0aSNeil Horman int max_share; 13681da177e4SLinus Torvalds int order; 1369d9749fb5SNeil Horman int num_entries; 1370d9749fb5SNeil Horman int max_entry_order; 13711da177e4SLinus Torvalds 1372b4772ef8SEyal Birger sock_skb_cb_check_size(sizeof(struct sctp_ulpevent)); 13731da177e4SLinus Torvalds 1374827bf122SSridhar Samudrala /* Allocate bind_bucket and chunk caches. */ 13751da177e4SLinus Torvalds status = -ENOBUFS; 13761da177e4SLinus Torvalds sctp_bucket_cachep = kmem_cache_create("sctp_bind_bucket", 13771da177e4SLinus Torvalds sizeof(struct sctp_bind_bucket), 13781da177e4SLinus Torvalds 0, SLAB_HWCACHE_ALIGN, 137920c2df83SPaul Mundt NULL); 13801da177e4SLinus Torvalds if (!sctp_bucket_cachep) 1381827bf122SSridhar Samudrala goto out; 13821da177e4SLinus Torvalds 13831da177e4SLinus Torvalds sctp_chunk_cachep = kmem_cache_create("sctp_chunk", 13841da177e4SLinus Torvalds sizeof(struct sctp_chunk), 13851da177e4SLinus Torvalds 0, SLAB_HWCACHE_ALIGN, 138620c2df83SPaul Mundt NULL); 13871da177e4SLinus Torvalds if (!sctp_chunk_cachep) 13881da177e4SLinus Torvalds goto err_chunk_cachep; 13891da177e4SLinus Torvalds 1390908c7f19STejun Heo status = percpu_counter_init(&sctp_sockets_allocated, 0, GFP_KERNEL); 1391632c928aSEric W. Biederman if (status) 1392632c928aSEric W. Biederman goto err_percpu_counter_init; 1393632c928aSEric W. Biederman 13941da177e4SLinus Torvalds /* Implementation specific variables. */ 13951da177e4SLinus Torvalds 13961da177e4SLinus Torvalds /* Initialize default stream count setup information. */ 13971da177e4SLinus Torvalds sctp_max_instreams = SCTP_DEFAULT_INSTREAMS; 13981da177e4SLinus Torvalds sctp_max_outstreams = SCTP_DEFAULT_OUTSTREAMS; 13991da177e4SLinus Torvalds 14001da177e4SLinus Torvalds /* Initialize handle used for association ids. */ 14011da177e4SLinus Torvalds idr_init(&sctp_assocs_id); 14021da177e4SLinus Torvalds 1403f03d78dbSEric Dumazet limit = nr_free_buffer_pages() / 8; 14044d93df0aSNeil Horman limit = max(limit, 128UL); 14054d93df0aSNeil Horman sysctl_sctp_mem[0] = limit / 4 * 3; 14064d93df0aSNeil Horman sysctl_sctp_mem[1] = limit; 14074d93df0aSNeil Horman sysctl_sctp_mem[2] = sysctl_sctp_mem[0] * 2; 14084d93df0aSNeil Horman 14094d93df0aSNeil Horman /* Set per-socket limits to no more than 1/128 the pressure threshold*/ 14104d93df0aSNeil Horman limit = (sysctl_sctp_mem[1]) << (PAGE_SHIFT - 7); 14114d93df0aSNeil Horman max_share = min(4UL*1024*1024, limit); 14124d93df0aSNeil Horman 1413845525a6SVlad Yasevich sysctl_sctp_rmem[0] = SK_MEM_QUANTUM; /* give each asoc 1 page min */ 141487fb4b7bSEric Dumazet sysctl_sctp_rmem[1] = 1500 * SKB_TRUESIZE(1); 14154d93df0aSNeil Horman sysctl_sctp_rmem[2] = max(sysctl_sctp_rmem[1], max_share); 14164d93df0aSNeil Horman 14173ab224beSHideo Aoki sysctl_sctp_wmem[0] = SK_MEM_QUANTUM; 14184d93df0aSNeil Horman sysctl_sctp_wmem[1] = 16*1024; 14194d93df0aSNeil Horman sysctl_sctp_wmem[2] = max(64*1024, max_share); 14204d93df0aSNeil Horman 14211da177e4SLinus Torvalds /* Size and allocate the association hash table. 14221da177e4SLinus Torvalds * The methodology is similar to that of the tcp hash tables. 1423d9749fb5SNeil Horman * Though not identical. Start by getting a goal size 14241da177e4SLinus Torvalds */ 14253d6357deSArun KS if (nr_pages >= (128 * 1024)) 14263d6357deSArun KS goal = nr_pages >> (22 - PAGE_SHIFT); 14271da177e4SLinus Torvalds else 14283d6357deSArun KS goal = nr_pages >> (24 - PAGE_SHIFT); 14291da177e4SLinus Torvalds 1430d9749fb5SNeil Horman /* Then compute the page order for said goal */ 1431d9749fb5SNeil Horman order = get_order(goal); 1432d9749fb5SNeil Horman 1433d9749fb5SNeil Horman /* Now compute the required page order for the maximum sized table we 1434d9749fb5SNeil Horman * want to create 1435d9749fb5SNeil Horman */ 1436d9749fb5SNeil Horman max_entry_order = get_order(MAX_SCTP_PORT_HASH_ENTRIES * 1437d9749fb5SNeil Horman sizeof(struct sctp_bind_hashbucket)); 1438d9749fb5SNeil Horman 1439d9749fb5SNeil Horman /* Limit the page order by that maximum hash table size */ 1440d9749fb5SNeil Horman order = min(order, max_entry_order); 14411da177e4SLinus Torvalds 14421da177e4SLinus Torvalds /* Allocate and initialize the endpoint hash table. */ 14431da177e4SLinus Torvalds sctp_ep_hashsize = 64; 14443b77d661SZhang Yanfei sctp_ep_hashtable = 14456da2ec56SKees Cook kmalloc_array(64, sizeof(struct sctp_hashbucket), GFP_KERNEL); 14461da177e4SLinus Torvalds if (!sctp_ep_hashtable) { 1447145ce502SJoe Perches pr_err("Failed endpoint_hash alloc\n"); 14481da177e4SLinus Torvalds status = -ENOMEM; 14491da177e4SLinus Torvalds goto err_ehash_alloc; 14501da177e4SLinus Torvalds } 14511da177e4SLinus Torvalds for (i = 0; i < sctp_ep_hashsize; i++) { 14521da177e4SLinus Torvalds rwlock_init(&sctp_ep_hashtable[i].lock); 1453d970dbf8SVlad Yasevich INIT_HLIST_HEAD(&sctp_ep_hashtable[i].chain); 14541da177e4SLinus Torvalds } 14551da177e4SLinus Torvalds 1456d9749fb5SNeil Horman /* Allocate and initialize the SCTP port hash table. 1457d9749fb5SNeil Horman * Note that order is initalized to start at the max sized 1458d9749fb5SNeil Horman * table we want to support. If we can't get that many pages 1459d9749fb5SNeil Horman * reduce the order and try again 1460d9749fb5SNeil Horman */ 14611da177e4SLinus Torvalds do { 14621da177e4SLinus Torvalds sctp_port_hashtable = (struct sctp_bind_hashbucket *) 14636857a02aSEric Dumazet __get_free_pages(GFP_KERNEL | __GFP_NOWARN, order); 14641da177e4SLinus Torvalds } while (!sctp_port_hashtable && --order > 0); 1465d9749fb5SNeil Horman 14661da177e4SLinus Torvalds if (!sctp_port_hashtable) { 1467145ce502SJoe Perches pr_err("Failed bind hash alloc\n"); 14681da177e4SLinus Torvalds status = -ENOMEM; 14691da177e4SLinus Torvalds goto err_bhash_alloc; 14701da177e4SLinus Torvalds } 1471d9749fb5SNeil Horman 1472d9749fb5SNeil Horman /* Now compute the number of entries that will fit in the 1473d9749fb5SNeil Horman * port hash space we allocated 1474d9749fb5SNeil Horman */ 1475d9749fb5SNeil Horman num_entries = (1UL << order) * PAGE_SIZE / 1476d9749fb5SNeil Horman sizeof(struct sctp_bind_hashbucket); 1477d9749fb5SNeil Horman 1478d9749fb5SNeil Horman /* And finish by rounding it down to the nearest power of two 1479d9749fb5SNeil Horman * this wastes some memory of course, but its needed because 1480d9749fb5SNeil Horman * the hash function operates based on the assumption that 1481d9749fb5SNeil Horman * that the number of entries is a power of two 1482d9749fb5SNeil Horman */ 1483d9749fb5SNeil Horman sctp_port_hashsize = rounddown_pow_of_two(num_entries); 1484d9749fb5SNeil Horman 14851da177e4SLinus Torvalds for (i = 0; i < sctp_port_hashsize; i++) { 14861da177e4SLinus Torvalds spin_lock_init(&sctp_port_hashtable[i].lock); 1487d970dbf8SVlad Yasevich INIT_HLIST_HEAD(&sctp_port_hashtable[i].chain); 14881da177e4SLinus Torvalds } 14891da177e4SLinus Torvalds 1490a5e27d18SWei Yongjun status = sctp_transport_hashtable_init(); 1491a5e27d18SWei Yongjun if (status) 14924f008781SXin Long goto err_thash_alloc; 14934f008781SXin Long 1494d9749fb5SNeil Horman pr_info("Hash tables configured (bind %d/%d)\n", sctp_port_hashsize, 1495d9749fb5SNeil Horman num_entries); 14961da177e4SLinus Torvalds 14971da177e4SLinus Torvalds sctp_sysctl_register(); 14981da177e4SLinus Torvalds 14991da177e4SLinus Torvalds INIT_LIST_HEAD(&sctp_address_families); 1500270637abSVlad Yasevich sctp_v4_pf_init(); 1501270637abSVlad Yasevich sctp_v6_pf_init(); 15021ba896f6SXin Long sctp_sched_ops_init(); 15031da177e4SLinus Torvalds 15048e2d61e0SMarcelo Ricardo Leitner status = register_pernet_subsys(&sctp_defaults_ops); 15058e2d61e0SMarcelo Ricardo Leitner if (status) 15068e2d61e0SMarcelo Ricardo Leitner goto err_register_defaults; 1507270637abSVlad Yasevich 15088e2d61e0SMarcelo Ricardo Leitner status = sctp_v4_protosw_init(); 1509827bf122SSridhar Samudrala if (status) 1510270637abSVlad Yasevich goto err_protosw_init; 1511827bf122SSridhar Samudrala 1512270637abSVlad Yasevich status = sctp_v6_protosw_init(); 15131da177e4SLinus Torvalds if (status) 1514270637abSVlad Yasevich goto err_v6_protosw_init; 15151da177e4SLinus Torvalds 15168e2d61e0SMarcelo Ricardo Leitner status = register_pernet_subsys(&sctp_ctrlsock_ops); 15174db67e80SEric W. Biederman if (status) 15188e2d61e0SMarcelo Ricardo Leitner goto err_register_ctrlsock; 15194db67e80SEric W. Biederman 1520270637abSVlad Yasevich status = sctp_v4_add_protocol(); 1521270637abSVlad Yasevich if (status) 1522827bf122SSridhar Samudrala goto err_add_protocol; 1523827bf122SSridhar Samudrala 1524827bf122SSridhar Samudrala /* Register SCTP with inet6 layer. */ 1525827bf122SSridhar Samudrala status = sctp_v6_add_protocol(); 1526827bf122SSridhar Samudrala if (status) 1527827bf122SSridhar Samudrala goto err_v6_add_protocol; 1528827bf122SSridhar Samudrala 152990017accSMarcelo Ricardo Leitner if (sctp_offload_init() < 0) 153090017accSMarcelo Ricardo Leitner pr_crit("%s: Cannot add SCTP protocol offload\n", __func__); 153190017accSMarcelo Ricardo Leitner 15321da177e4SLinus Torvalds out: 15331da177e4SLinus Torvalds return status; 1534827bf122SSridhar Samudrala err_v6_add_protocol: 1535270637abSVlad Yasevich sctp_v4_del_protocol(); 1536d1dd5247SVlad Yasevich err_add_protocol: 15378e2d61e0SMarcelo Ricardo Leitner unregister_pernet_subsys(&sctp_ctrlsock_ops); 15388e2d61e0SMarcelo Ricardo Leitner err_register_ctrlsock: 1539270637abSVlad Yasevich sctp_v6_protosw_exit(); 1540270637abSVlad Yasevich err_v6_protosw_init: 1541270637abSVlad Yasevich sctp_v4_protosw_exit(); 1542270637abSVlad Yasevich err_protosw_init: 15438e2d61e0SMarcelo Ricardo Leitner unregister_pernet_subsys(&sctp_defaults_ops); 15448e2d61e0SMarcelo Ricardo Leitner err_register_defaults: 1545270637abSVlad Yasevich sctp_v4_pf_exit(); 1546270637abSVlad Yasevich sctp_v6_pf_exit(); 15471da177e4SLinus Torvalds sctp_sysctl_unregister(); 15481da177e4SLinus Torvalds free_pages((unsigned long)sctp_port_hashtable, 15491da177e4SLinus Torvalds get_order(sctp_port_hashsize * 15501da177e4SLinus Torvalds sizeof(struct sctp_bind_hashbucket))); 15511da177e4SLinus Torvalds err_bhash_alloc: 15524f008781SXin Long sctp_transport_hashtable_destroy(); 15534f008781SXin Long err_thash_alloc: 15541da177e4SLinus Torvalds kfree(sctp_ep_hashtable); 15551da177e4SLinus Torvalds err_ehash_alloc: 1556632c928aSEric W. Biederman percpu_counter_destroy(&sctp_sockets_allocated); 1557632c928aSEric W. Biederman err_percpu_counter_init: 15581da177e4SLinus Torvalds kmem_cache_destroy(sctp_chunk_cachep); 15591da177e4SLinus Torvalds err_chunk_cachep: 15601da177e4SLinus Torvalds kmem_cache_destroy(sctp_bucket_cachep); 15611da177e4SLinus Torvalds goto out; 15621da177e4SLinus Torvalds } 15631da177e4SLinus Torvalds 15641da177e4SLinus Torvalds /* Exit handler for the SCTP protocol. */ 1565dda91928SDaniel Borkmann static __exit void sctp_exit(void) 15661da177e4SLinus Torvalds { 15671da177e4SLinus Torvalds /* BUG. This should probably do something useful like clean 15681da177e4SLinus Torvalds * up all the remaining associations and all that memory. 15691da177e4SLinus Torvalds */ 15701da177e4SLinus Torvalds 1571827bf122SSridhar Samudrala /* Unregister with inet6/inet layers. */ 1572827bf122SSridhar Samudrala sctp_v6_del_protocol(); 1573270637abSVlad Yasevich sctp_v4_del_protocol(); 15741da177e4SLinus Torvalds 15758e2d61e0SMarcelo Ricardo Leitner unregister_pernet_subsys(&sctp_ctrlsock_ops); 15764db67e80SEric W. Biederman 1577270637abSVlad Yasevich /* Free protosw registrations */ 1578270637abSVlad Yasevich sctp_v6_protosw_exit(); 1579270637abSVlad Yasevich sctp_v4_protosw_exit(); 1580270637abSVlad Yasevich 15818e2d61e0SMarcelo Ricardo Leitner unregister_pernet_subsys(&sctp_defaults_ops); 15828e2d61e0SMarcelo Ricardo Leitner 1583827bf122SSridhar Samudrala /* Unregister with socket layer. */ 1584270637abSVlad Yasevich sctp_v6_pf_exit(); 1585270637abSVlad Yasevich sctp_v4_pf_exit(); 1586827bf122SSridhar Samudrala 15871da177e4SLinus Torvalds sctp_sysctl_unregister(); 15881da177e4SLinus Torvalds 15891da177e4SLinus Torvalds free_pages((unsigned long)sctp_port_hashtable, 15901da177e4SLinus Torvalds get_order(sctp_port_hashsize * 15911da177e4SLinus Torvalds sizeof(struct sctp_bind_hashbucket))); 1592b5eff712SXin Long kfree(sctp_ep_hashtable); 15934f008781SXin Long sctp_transport_hashtable_destroy(); 15941da177e4SLinus Torvalds 1595632c928aSEric W. Biederman percpu_counter_destroy(&sctp_sockets_allocated); 15961da177e4SLinus Torvalds 1597eaa184a1SJesper Dangaard Brouer rcu_barrier(); /* Wait for completion of call_rcu()'s */ 1598eaa184a1SJesper Dangaard Brouer 1599827bf122SSridhar Samudrala kmem_cache_destroy(sctp_chunk_cachep); 1600827bf122SSridhar Samudrala kmem_cache_destroy(sctp_bucket_cachep); 16011da177e4SLinus Torvalds } 16021da177e4SLinus Torvalds 16031da177e4SLinus Torvalds module_init(sctp_init); 16041da177e4SLinus Torvalds module_exit(sctp_exit); 16051da177e4SLinus Torvalds 1606bb97d31fSArnaldo Carvalho de Melo /* 1607bb97d31fSArnaldo Carvalho de Melo * __stringify doesn't likes enums, so use IPPROTO_SCTP value (132) directly. 1608bb97d31fSArnaldo Carvalho de Melo */ 1609bb97d31fSArnaldo Carvalho de Melo MODULE_ALIAS("net-pf-" __stringify(PF_INET) "-proto-132"); 1610882a382cSSridhar Samudrala MODULE_ALIAS("net-pf-" __stringify(PF_INET6) "-proto-132"); 161191705c61SDaniel Borkmann MODULE_AUTHOR("Linux Kernel SCTP developers <linux-sctp@vger.kernel.org>"); 16121da177e4SLinus Torvalds MODULE_DESCRIPTION("Support for the SCTP protocol (RFC2960)"); 161371acc0ddSDavid S. Miller module_param_named(no_checksums, sctp_checksum_disable, bool, 0644); 161471acc0ddSDavid S. Miller MODULE_PARM_DESC(no_checksums, "Disable checksums computing and verification"); 16151da177e4SLinus Torvalds MODULE_LICENSE("GPL"); 1616