147505b8bSThomas Gleixner // SPDX-License-Identifier: GPL-2.0-or-later 260c778b2SVlad Yasevich /* SCTP kernel implementation 31da177e4SLinus Torvalds * (C) Copyright IBM Corp. 2001, 2004 41da177e4SLinus Torvalds * Copyright (c) 1999-2000 Cisco, Inc. 51da177e4SLinus Torvalds * Copyright (c) 1999-2001 Motorola, Inc. 61da177e4SLinus Torvalds * Copyright (c) 2001 Intel Corp. 71da177e4SLinus Torvalds * Copyright (c) 2001 Nokia, Inc. 81da177e4SLinus Torvalds * Copyright (c) 2001 La Monte H.P. Yarroll 91da177e4SLinus Torvalds * 1060c778b2SVlad Yasevich * This file is part of the SCTP kernel implementation 111da177e4SLinus Torvalds * 121da177e4SLinus Torvalds * Initialization/cleanup for SCTP protocol support. 131da177e4SLinus Torvalds * 141da177e4SLinus Torvalds * Please send any bug reports or fixes you make to the 151da177e4SLinus Torvalds * email address(es): 1691705c61SDaniel Borkmann * lksctp developers <linux-sctp@vger.kernel.org> 171da177e4SLinus Torvalds * 181da177e4SLinus Torvalds * Written or modified by: 191da177e4SLinus Torvalds * La Monte H.P. Yarroll <piggy@acm.org> 201da177e4SLinus Torvalds * Karl Knutson <karl@athena.chicago.il.us> 211da177e4SLinus Torvalds * Jon Grimm <jgrimm@us.ibm.com> 221da177e4SLinus Torvalds * Sridhar Samudrala <sri@us.ibm.com> 231da177e4SLinus Torvalds * Daisy Chang <daisyc@us.ibm.com> 241da177e4SLinus Torvalds * Ardelle Fan <ardelle.fan@intel.com> 251da177e4SLinus Torvalds */ 261da177e4SLinus Torvalds 27145ce502SJoe Perches #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt 28145ce502SJoe Perches 291da177e4SLinus Torvalds #include <linux/module.h> 301da177e4SLinus Torvalds #include <linux/init.h> 311da177e4SLinus Torvalds #include <linux/netdevice.h> 321da177e4SLinus Torvalds #include <linux/inetdevice.h> 331da177e4SLinus Torvalds #include <linux/seq_file.h> 3457c8a661SMike Rapoport #include <linux/memblock.h> 35845525a6SVlad Yasevich #include <linux/highmem.h> 36845525a6SVlad Yasevich #include <linux/swap.h> 375a0e3ad6STejun Heo #include <linux/slab.h> 38457c4cbcSEric W. Biederman #include <net/net_namespace.h> 391da177e4SLinus Torvalds #include <net/protocol.h> 401da177e4SLinus Torvalds #include <net/ip.h> 411da177e4SLinus Torvalds #include <net/ipv6.h> 4214c85021SArnaldo Carvalho de Melo #include <net/route.h> 431da177e4SLinus Torvalds #include <net/sctp/sctp.h> 441da177e4SLinus Torvalds #include <net/addrconf.h> 451da177e4SLinus Torvalds #include <net/inet_common.h> 461da177e4SLinus Torvalds #include <net/inet_ecn.h> 471da177e4SLinus Torvalds 48d9749fb5SNeil Horman #define MAX_SCTP_PORT_HASH_ENTRIES (64 * 1024) 49d9749fb5SNeil Horman 501da177e4SLinus Torvalds /* Global data structures. */ 514cbf1caeSBrian Haley struct sctp_globals sctp_globals __read_mostly; 521da177e4SLinus Torvalds 531da177e4SLinus Torvalds struct idr sctp_assocs_id; 541da177e4SLinus Torvalds DEFINE_SPINLOCK(sctp_assocs_id_lock); 551da177e4SLinus Torvalds 561da177e4SLinus Torvalds static struct sctp_pf *sctp_pf_inet6_specific; 571da177e4SLinus Torvalds static struct sctp_pf *sctp_pf_inet_specific; 581da177e4SLinus Torvalds static struct sctp_af *sctp_af_v4_specific; 591da177e4SLinus Torvalds static struct sctp_af *sctp_af_v6_specific; 601da177e4SLinus Torvalds 61e18b890bSChristoph Lameter struct kmem_cache *sctp_chunk_cachep __read_mostly; 62e18b890bSChristoph Lameter struct kmem_cache *sctp_bucket_cachep __read_mostly; 631da177e4SLinus Torvalds 648d987e5cSEric Dumazet long sysctl_sctp_mem[3]; 65007e3936SVlad Yasevich int sysctl_sctp_rmem[3]; 66007e3936SVlad Yasevich int sysctl_sctp_wmem[3]; 674d93df0aSNeil Horman 681da177e4SLinus Torvalds /* Private helper to extract ipv4 address and stash them in 691da177e4SLinus Torvalds * the protocol structure. 701da177e4SLinus Torvalds */ 711da177e4SLinus Torvalds static void sctp_v4_copy_addrlist(struct list_head *addrlist, 721da177e4SLinus Torvalds struct net_device *dev) 731da177e4SLinus Torvalds { 741da177e4SLinus Torvalds struct in_device *in_dev; 751da177e4SLinus Torvalds struct in_ifaddr *ifa; 761da177e4SLinus Torvalds struct sctp_sockaddr_entry *addr; 771da177e4SLinus Torvalds 781da177e4SLinus Torvalds rcu_read_lock(); 79e5ed6399SHerbert Xu if ((in_dev = __in_dev_get_rcu(dev)) == NULL) { 801da177e4SLinus Torvalds rcu_read_unlock(); 811da177e4SLinus Torvalds return; 821da177e4SLinus Torvalds } 831da177e4SLinus Torvalds 84cd5a411dSFlorian Westphal in_dev_for_each_ifa_rcu(ifa, in_dev) { 851da177e4SLinus Torvalds /* Add the address to the local list. */ 86939cfa75SDaniel Borkmann addr = kzalloc(sizeof(*addr), GFP_ATOMIC); 871da177e4SLinus Torvalds if (addr) { 882a6fd78aSAl Viro addr->a.v4.sin_family = AF_INET; 892a6fd78aSAl Viro addr->a.v4.sin_addr.s_addr = ifa->ifa_local; 9029303547SVlad Yasevich addr->valid = 1; 9129303547SVlad Yasevich INIT_LIST_HEAD(&addr->list); 921da177e4SLinus Torvalds list_add_tail(&addr->list, addrlist); 931da177e4SLinus Torvalds } 941da177e4SLinus Torvalds } 951da177e4SLinus Torvalds 961da177e4SLinus Torvalds rcu_read_unlock(); 971da177e4SLinus Torvalds } 981da177e4SLinus Torvalds 991da177e4SLinus Torvalds /* Extract our IP addresses from the system and stash them in the 1001da177e4SLinus Torvalds * protocol structure. 1011da177e4SLinus Torvalds */ 1024db67e80SEric W. Biederman static void sctp_get_local_addr_list(struct net *net) 1031da177e4SLinus Torvalds { 1041da177e4SLinus Torvalds struct net_device *dev; 1051da177e4SLinus Torvalds struct list_head *pos; 1061da177e4SLinus Torvalds struct sctp_af *af; 1071da177e4SLinus Torvalds 108c6d14c84SEric Dumazet rcu_read_lock(); 1094db67e80SEric W. Biederman for_each_netdev_rcu(net, dev) { 1102c0740e4SDave Jones list_for_each(pos, &sctp_address_families) { 1111da177e4SLinus Torvalds af = list_entry(pos, struct sctp_af, list); 1124db67e80SEric W. Biederman af->copy_addrlist(&net->sctp.local_addr_list, dev); 1131da177e4SLinus Torvalds } 1141da177e4SLinus Torvalds } 115c6d14c84SEric Dumazet rcu_read_unlock(); 1161da177e4SLinus Torvalds } 1171da177e4SLinus Torvalds 1181da177e4SLinus Torvalds /* Free the existing local addresses. */ 1194db67e80SEric W. Biederman static void sctp_free_local_addr_list(struct net *net) 1201da177e4SLinus Torvalds { 1211da177e4SLinus Torvalds struct sctp_sockaddr_entry *addr; 1221da177e4SLinus Torvalds struct list_head *pos, *temp; 1231da177e4SLinus Torvalds 1244db67e80SEric W. Biederman list_for_each_safe(pos, temp, &net->sctp.local_addr_list) { 1251da177e4SLinus Torvalds addr = list_entry(pos, struct sctp_sockaddr_entry, list); 1261da177e4SLinus Torvalds list_del(pos); 1271da177e4SLinus Torvalds kfree(addr); 1281da177e4SLinus Torvalds } 1291da177e4SLinus Torvalds } 1301da177e4SLinus Torvalds 1311da177e4SLinus Torvalds /* Copy the local addresses which are valid for 'scope' into 'bp'. */ 1324db67e80SEric W. Biederman int sctp_copy_local_addr_list(struct net *net, struct sctp_bind_addr *bp, 1331c662018SXin Long enum sctp_scope scope, gfp_t gfp, int copy_flags) 1341da177e4SLinus Torvalds { 1351da177e4SLinus Torvalds struct sctp_sockaddr_entry *addr; 1362e3ce5bcSXin Long union sctp_addr laddr; 1371da177e4SLinus Torvalds int error = 0; 1381da177e4SLinus Torvalds 13929303547SVlad Yasevich rcu_read_lock(); 1404db67e80SEric W. Biederman list_for_each_entry_rcu(addr, &net->sctp.local_addr_list, list) { 14129303547SVlad Yasevich if (!addr->valid) 14229303547SVlad Yasevich continue; 143165f2cf6SXin Long if (!sctp_in_scope(net, &addr->a, scope)) 144165f2cf6SXin Long continue; 145165f2cf6SXin Long 1461da177e4SLinus Torvalds /* Now that the address is in scope, check to see if 1471da177e4SLinus Torvalds * the address type is really supported by the local 1481da177e4SLinus Torvalds * sock as well as the remote peer. 1491da177e4SLinus Torvalds */ 150165f2cf6SXin Long if (addr->a.sa.sa_family == AF_INET && 151165f2cf6SXin Long !(copy_flags & SCTP_ADDR4_PEERSUPP)) 152165f2cf6SXin Long continue; 153165f2cf6SXin Long if (addr->a.sa.sa_family == AF_INET6 && 154165f2cf6SXin Long (!(copy_flags & SCTP_ADDR6_ALLOWED) || 155165f2cf6SXin Long !(copy_flags & SCTP_ADDR6_PEERSUPP))) 156165f2cf6SXin Long continue; 157165f2cf6SXin Long 1582e3ce5bcSXin Long laddr = addr->a; 1592e3ce5bcSXin Long /* also works for setting ipv6 address port */ 1602e3ce5bcSXin Long laddr.v4.sin_port = htons(bp->port); 1612e3ce5bcSXin Long if (sctp_bind_addr_state(bp, &laddr) != -1) 162b8607805SXin Long continue; 163b8607805SXin Long 164165f2cf6SXin Long error = sctp_add_bind_addr(bp, &addr->a, sizeof(addr->a), 165f57d96b2SVlad Yasevich SCTP_ADDR_SRC, GFP_ATOMIC); 1661da177e4SLinus Torvalds if (error) 167165f2cf6SXin Long break; 1681da177e4SLinus Torvalds } 1691da177e4SLinus Torvalds 17029303547SVlad Yasevich rcu_read_unlock(); 1711da177e4SLinus Torvalds return error; 1721da177e4SLinus Torvalds } 1731da177e4SLinus Torvalds 174b7e10c25SRichard Haines /* Copy over any ip options */ 175b7e10c25SRichard Haines static void sctp_v4_copy_ip_options(struct sock *sk, struct sock *newsk) 176b7e10c25SRichard Haines { 177b7e10c25SRichard Haines struct inet_sock *newinet, *inet = inet_sk(sk); 178b7e10c25SRichard Haines struct ip_options_rcu *inet_opt, *newopt = NULL; 179b7e10c25SRichard Haines 180b7e10c25SRichard Haines newinet = inet_sk(newsk); 181b7e10c25SRichard Haines 182b7e10c25SRichard Haines rcu_read_lock(); 183b7e10c25SRichard Haines inet_opt = rcu_dereference(inet->inet_opt); 184b7e10c25SRichard Haines if (inet_opt) { 185b7e10c25SRichard Haines newopt = sock_kmalloc(newsk, sizeof(*inet_opt) + 186b7e10c25SRichard Haines inet_opt->opt.optlen, GFP_ATOMIC); 187b7e10c25SRichard Haines if (newopt) 188b7e10c25SRichard Haines memcpy(newopt, inet_opt, sizeof(*inet_opt) + 189b7e10c25SRichard Haines inet_opt->opt.optlen); 190b7e10c25SRichard Haines else 191b7e10c25SRichard Haines pr_err("%s: Failed to copy ip options\n", __func__); 192b7e10c25SRichard Haines } 193b7e10c25SRichard Haines RCU_INIT_POINTER(newinet->inet_opt, newopt); 194b7e10c25SRichard Haines rcu_read_unlock(); 195b7e10c25SRichard Haines } 196b7e10c25SRichard Haines 197b7e10c25SRichard Haines /* Account for the IP options */ 198b7e10c25SRichard Haines static int sctp_v4_ip_options_len(struct sock *sk) 199b7e10c25SRichard Haines { 200b7e10c25SRichard Haines struct inet_sock *inet = inet_sk(sk); 201b7e10c25SRichard Haines struct ip_options_rcu *inet_opt; 202b7e10c25SRichard Haines int len = 0; 203b7e10c25SRichard Haines 204b7e10c25SRichard Haines rcu_read_lock(); 205b7e10c25SRichard Haines inet_opt = rcu_dereference(inet->inet_opt); 206b7e10c25SRichard Haines if (inet_opt) 207b7e10c25SRichard Haines len = inet_opt->opt.optlen; 208b7e10c25SRichard Haines 209b7e10c25SRichard Haines rcu_read_unlock(); 210b7e10c25SRichard Haines return len; 211b7e10c25SRichard Haines } 212b7e10c25SRichard Haines 2131da177e4SLinus Torvalds /* Initialize a sctp_addr from in incoming skb. */ 2141da177e4SLinus Torvalds static void sctp_v4_from_skb(union sctp_addr *addr, struct sk_buff *skb, 2151da177e4SLinus Torvalds int is_saddr) 2161da177e4SLinus Torvalds { 2170630c56eSMarcelo Ricardo Leitner /* Always called on head skb, so this is safe */ 2180630c56eSMarcelo Ricardo Leitner struct sctphdr *sh = sctp_hdr(skb); 2190630c56eSMarcelo Ricardo Leitner struct sockaddr_in *sa = &addr->v4; 2201da177e4SLinus Torvalds 2211da177e4SLinus Torvalds addr->v4.sin_family = AF_INET; 2221da177e4SLinus Torvalds 2231da177e4SLinus Torvalds if (is_saddr) { 2240630c56eSMarcelo Ricardo Leitner sa->sin_port = sh->source; 2250630c56eSMarcelo Ricardo Leitner sa->sin_addr.s_addr = ip_hdr(skb)->saddr; 2261da177e4SLinus Torvalds } else { 2270630c56eSMarcelo Ricardo Leitner sa->sin_port = sh->dest; 2280630c56eSMarcelo Ricardo Leitner sa->sin_addr.s_addr = ip_hdr(skb)->daddr; 2291da177e4SLinus Torvalds } 230*b6f3320bSXin Long memset(sa->sin_zero, 0, sizeof(sa->sin_zero)); 2311da177e4SLinus Torvalds } 2321da177e4SLinus Torvalds 2331da177e4SLinus Torvalds /* Initialize an sctp_addr from a socket. */ 2341da177e4SLinus Torvalds static void sctp_v4_from_sk(union sctp_addr *addr, struct sock *sk) 2351da177e4SLinus Torvalds { 2361da177e4SLinus Torvalds addr->v4.sin_family = AF_INET; 2377dcdbd95SAl Viro addr->v4.sin_port = 0; 238c720c7e8SEric Dumazet addr->v4.sin_addr.s_addr = inet_sk(sk)->inet_rcv_saddr; 239*b6f3320bSXin Long memset(addr->v4.sin_zero, 0, sizeof(addr->v4.sin_zero)); 2401da177e4SLinus Torvalds } 2411da177e4SLinus Torvalds 2421da177e4SLinus Torvalds /* Initialize sk->sk_rcv_saddr from sctp_addr. */ 2431da177e4SLinus Torvalds static void sctp_v4_to_sk_saddr(union sctp_addr *addr, struct sock *sk) 2441da177e4SLinus Torvalds { 245c720c7e8SEric Dumazet inet_sk(sk)->inet_rcv_saddr = addr->v4.sin_addr.s_addr; 2461da177e4SLinus Torvalds } 2471da177e4SLinus Torvalds 2481da177e4SLinus Torvalds /* Initialize sk->sk_daddr from sctp_addr. */ 2491da177e4SLinus Torvalds static void sctp_v4_to_sk_daddr(union sctp_addr *addr, struct sock *sk) 2501da177e4SLinus Torvalds { 251c720c7e8SEric Dumazet inet_sk(sk)->inet_daddr = addr->v4.sin_addr.s_addr; 2521da177e4SLinus Torvalds } 2531da177e4SLinus Torvalds 2541da177e4SLinus Torvalds /* Initialize a sctp_addr from an address parameter. */ 2551da177e4SLinus Torvalds static void sctp_v4_from_addr_param(union sctp_addr *addr, 2561da177e4SLinus Torvalds union sctp_addr_param *param, 257dd86d136SAl Viro __be16 port, int iif) 2581da177e4SLinus Torvalds { 2591da177e4SLinus Torvalds addr->v4.sin_family = AF_INET; 2601da177e4SLinus Torvalds addr->v4.sin_port = port; 2611da177e4SLinus Torvalds addr->v4.sin_addr.s_addr = param->v4.addr.s_addr; 262*b6f3320bSXin Long memset(addr->v4.sin_zero, 0, sizeof(addr->v4.sin_zero)); 2631da177e4SLinus Torvalds } 2641da177e4SLinus Torvalds 2651da177e4SLinus Torvalds /* Initialize an address parameter from a sctp_addr and return the length 2661da177e4SLinus Torvalds * of the address parameter. 2671da177e4SLinus Torvalds */ 2681da177e4SLinus Torvalds static int sctp_v4_to_addr_param(const union sctp_addr *addr, 2691da177e4SLinus Torvalds union sctp_addr_param *param) 2701da177e4SLinus Torvalds { 271a38905e6SXin Long int length = sizeof(struct sctp_ipv4addr_param); 2721da177e4SLinus Torvalds 2731da177e4SLinus Torvalds param->v4.param_hdr.type = SCTP_PARAM_IPV4_ADDRESS; 274dbc16db1SAl Viro param->v4.param_hdr.length = htons(length); 2751da177e4SLinus Torvalds param->v4.addr.s_addr = addr->v4.sin_addr.s_addr; 2761da177e4SLinus Torvalds 2771da177e4SLinus Torvalds return length; 2781da177e4SLinus Torvalds } 2791da177e4SLinus Torvalds 2801da177e4SLinus Torvalds /* Initialize a sctp_addr from a dst_entry. */ 28118a353f4SDavid S. Miller static void sctp_v4_dst_saddr(union sctp_addr *saddr, struct flowi4 *fl4, 282854d43a4SAl Viro __be16 port) 2831da177e4SLinus Torvalds { 2841da177e4SLinus Torvalds saddr->v4.sin_family = AF_INET; 2851da177e4SLinus Torvalds saddr->v4.sin_port = port; 28618a353f4SDavid S. Miller saddr->v4.sin_addr.s_addr = fl4->saddr; 287*b6f3320bSXin Long memset(saddr->v4.sin_zero, 0, sizeof(saddr->v4.sin_zero)); 2881da177e4SLinus Torvalds } 2891da177e4SLinus Torvalds 2901da177e4SLinus Torvalds /* Compare two addresses exactly. */ 2911da177e4SLinus Torvalds static int sctp_v4_cmp_addr(const union sctp_addr *addr1, 2921da177e4SLinus Torvalds const union sctp_addr *addr2) 2931da177e4SLinus Torvalds { 2941da177e4SLinus Torvalds if (addr1->sa.sa_family != addr2->sa.sa_family) 2951da177e4SLinus Torvalds return 0; 2961da177e4SLinus Torvalds if (addr1->v4.sin_port != addr2->v4.sin_port) 2971da177e4SLinus Torvalds return 0; 2981da177e4SLinus Torvalds if (addr1->v4.sin_addr.s_addr != addr2->v4.sin_addr.s_addr) 2991da177e4SLinus Torvalds return 0; 3001da177e4SLinus Torvalds 3011da177e4SLinus Torvalds return 1; 3021da177e4SLinus Torvalds } 3031da177e4SLinus Torvalds 3041da177e4SLinus Torvalds /* Initialize addr struct to INADDR_ANY. */ 3056fbfa9f9SAl Viro static void sctp_v4_inaddr_any(union sctp_addr *addr, __be16 port) 3061da177e4SLinus Torvalds { 3071da177e4SLinus Torvalds addr->v4.sin_family = AF_INET; 308e6f1cebfSAl Viro addr->v4.sin_addr.s_addr = htonl(INADDR_ANY); 3091da177e4SLinus Torvalds addr->v4.sin_port = port; 310*b6f3320bSXin Long memset(addr->v4.sin_zero, 0, sizeof(addr->v4.sin_zero)); 3111da177e4SLinus Torvalds } 3121da177e4SLinus Torvalds 3131da177e4SLinus Torvalds /* Is this a wildcard address? */ 3141da177e4SLinus Torvalds static int sctp_v4_is_any(const union sctp_addr *addr) 3151da177e4SLinus Torvalds { 316e6f1cebfSAl Viro return htonl(INADDR_ANY) == addr->v4.sin_addr.s_addr; 3171da177e4SLinus Torvalds } 3181da177e4SLinus Torvalds 3191da177e4SLinus Torvalds /* This function checks if the address is a valid address to be used for 3201da177e4SLinus Torvalds * SCTP binding. 3211da177e4SLinus Torvalds * 3221da177e4SLinus Torvalds * Output: 3231da177e4SLinus Torvalds * Return 0 - If the address is a non-unicast or an illegal address. 3241da177e4SLinus Torvalds * Return 1 - If the address is a unicast. 3251da177e4SLinus Torvalds */ 3265636bef7SVlad Yasevich static int sctp_v4_addr_valid(union sctp_addr *addr, 3275636bef7SVlad Yasevich struct sctp_sock *sp, 3285636bef7SVlad Yasevich const struct sk_buff *skb) 3291da177e4SLinus Torvalds { 3307dab83deSVlad Yasevich /* IPv4 addresses not allowed */ 3317dab83deSVlad Yasevich if (sp && ipv6_only_sock(sctp_opt2sk(sp))) 3327dab83deSVlad Yasevich return 0; 3337dab83deSVlad Yasevich 3341da177e4SLinus Torvalds /* Is this a non-unicast address or a unusable SCTP address? */ 335b5cb2bbcSJoe Perches if (IS_IPV4_UNUSABLE_ADDRESS(addr->v4.sin_addr.s_addr)) 3361da177e4SLinus Torvalds return 0; 3371da177e4SLinus Torvalds 3385636bef7SVlad Yasevich /* Is this a broadcast address? */ 339511c3f92SEric Dumazet if (skb && skb_rtable(skb)->rt_flags & RTCF_BROADCAST) 3405636bef7SVlad Yasevich return 0; 3415636bef7SVlad Yasevich 3421da177e4SLinus Torvalds return 1; 3431da177e4SLinus Torvalds } 3441da177e4SLinus Torvalds 3451da177e4SLinus Torvalds /* Should this be available for binding? */ 3461da177e4SLinus Torvalds static int sctp_v4_available(union sctp_addr *addr, struct sctp_sock *sp) 3471da177e4SLinus Torvalds { 348bb2db45bSEric W. Biederman struct net *net = sock_net(&sp->inet.sk); 349bb2db45bSEric W. Biederman int ret = inet_addr_type(net, addr->v4.sin_addr.s_addr); 3501da177e4SLinus Torvalds 3511da177e4SLinus Torvalds 352e6f1cebfSAl Viro if (addr->v4.sin_addr.s_addr != htonl(INADDR_ANY) && 353cdac4e07SNeil Horman ret != RTN_LOCAL && 354cdac4e07SNeil Horman !sp->inet.freebind && 35549a60158SVincent Bernat !net->ipv4.sysctl_ip_nonlocal_bind) 3561da177e4SLinus Torvalds return 0; 357cdac4e07SNeil Horman 3587dab83deSVlad Yasevich if (ipv6_only_sock(sctp_opt2sk(sp))) 3597dab83deSVlad Yasevich return 0; 3607dab83deSVlad Yasevich 3611da177e4SLinus Torvalds return 1; 3621da177e4SLinus Torvalds } 3631da177e4SLinus Torvalds 3641da177e4SLinus Torvalds /* Checking the loopback, private and other address scopes as defined in 3651da177e4SLinus Torvalds * RFC 1918. The IPv4 scoping is based on the draft for SCTP IPv4 3661da177e4SLinus Torvalds * scoping <draft-stewart-tsvwg-sctp-ipv4-00.txt>. 3671da177e4SLinus Torvalds * 3681da177e4SLinus Torvalds * Level 0 - unusable SCTP addresses 3691da177e4SLinus Torvalds * Level 1 - loopback address 3701da177e4SLinus Torvalds * Level 2 - link-local addresses 3711da177e4SLinus Torvalds * Level 3 - private addresses. 3721da177e4SLinus Torvalds * Level 4 - global addresses 3731da177e4SLinus Torvalds * For INIT and INIT-ACK address list, let L be the level of 3741da177e4SLinus Torvalds * of requested destination address, sender and receiver 3751da177e4SLinus Torvalds * SHOULD include all of its addresses with level greater 3761da177e4SLinus Torvalds * than or equal to L. 37772388433SBhaskar Dutta * 37872388433SBhaskar Dutta * IPv4 scoping can be controlled through sysctl option 37972388433SBhaskar Dutta * net.sctp.addr_scope_policy 3801da177e4SLinus Torvalds */ 3811c662018SXin Long static enum sctp_scope sctp_v4_scope(union sctp_addr *addr) 3821da177e4SLinus Torvalds { 3831c662018SXin Long enum sctp_scope retval; 3841da177e4SLinus Torvalds 3851da177e4SLinus Torvalds /* Check for unusable SCTP addresses. */ 386b5cb2bbcSJoe Perches if (IS_IPV4_UNUSABLE_ADDRESS(addr->v4.sin_addr.s_addr)) { 3871da177e4SLinus Torvalds retval = SCTP_SCOPE_UNUSABLE; 388b5cb2bbcSJoe Perches } else if (ipv4_is_loopback(addr->v4.sin_addr.s_addr)) { 3891da177e4SLinus Torvalds retval = SCTP_SCOPE_LOOPBACK; 390b5cb2bbcSJoe Perches } else if (ipv4_is_linklocal_169(addr->v4.sin_addr.s_addr)) { 3911da177e4SLinus Torvalds retval = SCTP_SCOPE_LINK; 392b5cb2bbcSJoe Perches } else if (ipv4_is_private_10(addr->v4.sin_addr.s_addr) || 393b5cb2bbcSJoe Perches ipv4_is_private_172(addr->v4.sin_addr.s_addr) || 394b5cb2bbcSJoe Perches ipv4_is_private_192(addr->v4.sin_addr.s_addr)) { 3951da177e4SLinus Torvalds retval = SCTP_SCOPE_PRIVATE; 3961da177e4SLinus Torvalds } else { 3971da177e4SLinus Torvalds retval = SCTP_SCOPE_GLOBAL; 3981da177e4SLinus Torvalds } 3991da177e4SLinus Torvalds 4001da177e4SLinus Torvalds return retval; 4011da177e4SLinus Torvalds } 4021da177e4SLinus Torvalds 4031da177e4SLinus Torvalds /* Returns a valid dst cache entry for the given source and destination ip 4041da177e4SLinus Torvalds * addresses. If an association is passed, trys to get a dst entry with a 4051da177e4SLinus Torvalds * source address that matches an address in the bind address list. 4061da177e4SLinus Torvalds */ 407da0420beSVlad Yasevich static void sctp_v4_get_dst(struct sctp_transport *t, union sctp_addr *saddr, 408da0420beSVlad Yasevich struct flowi *fl, struct sock *sk) 4091da177e4SLinus Torvalds { 410da0420beSVlad Yasevich struct sctp_association *asoc = t->asoc; 4111da177e4SLinus Torvalds struct rtable *rt; 4129914ae3cSVlad Yasevich struct flowi4 *fl4 = &fl->u.ip4; 4131da177e4SLinus Torvalds struct sctp_bind_addr *bp; 4141da177e4SLinus Torvalds struct sctp_sockaddr_entry *laddr; 4151da177e4SLinus Torvalds struct dst_entry *dst = NULL; 416da0420beSVlad Yasevich union sctp_addr *daddr = &t->ipaddr; 4171da177e4SLinus Torvalds union sctp_addr dst_saddr; 4188a9c58d2SXin Long __u8 tos = inet_sk(sk)->tos; 4191da177e4SLinus Torvalds 4208a9c58d2SXin Long if (t->dscp & SCTP_DSCP_SET_MASK) 4218a9c58d2SXin Long tos = t->dscp & SCTP_DSCP_VAL_MASK; 4229914ae3cSVlad Yasevich memset(fl4, 0x0, sizeof(struct flowi4)); 4239914ae3cSVlad Yasevich fl4->daddr = daddr->v4.sin_addr.s_addr; 4249914ae3cSVlad Yasevich fl4->fl4_dport = daddr->v4.sin_port; 4259914ae3cSVlad Yasevich fl4->flowi4_proto = IPPROTO_SCTP; 4261da177e4SLinus Torvalds if (asoc) { 4278a9c58d2SXin Long fl4->flowi4_tos = RT_CONN_FLAGS_TOS(asoc->base.sk, tos); 4289914ae3cSVlad Yasevich fl4->flowi4_oif = asoc->base.sk->sk_bound_dev_if; 4299914ae3cSVlad Yasevich fl4->fl4_sport = htons(asoc->base.bind_addr.port); 4301da177e4SLinus Torvalds } 4316429d3dcSWei Yongjun if (saddr) { 4329914ae3cSVlad Yasevich fl4->saddr = saddr->v4.sin_addr.s_addr; 433ecf938feSXin Long if (!fl4->fl4_sport) 4349914ae3cSVlad Yasevich fl4->fl4_sport = saddr->v4.sin_port; 4356429d3dcSWei Yongjun } 4361da177e4SLinus Torvalds 437bb33381dSDaniel Borkmann pr_debug("%s: dst:%pI4, src:%pI4 - ", __func__, &fl4->daddr, 438bb33381dSDaniel Borkmann &fl4->saddr); 4391da177e4SLinus Torvalds 440bb2db45bSEric W. Biederman rt = ip_route_output_key(sock_net(sk), fl4); 441b23dd4feSDavid S. Miller if (!IS_ERR(rt)) 442d8d1f30bSChangli Gao dst = &rt->dst; 4431da177e4SLinus Torvalds 4441da177e4SLinus Torvalds /* If there is no association or if a source address is passed, no 4451da177e4SLinus Torvalds * more validation is required. 4461da177e4SLinus Torvalds */ 4471da177e4SLinus Torvalds if (!asoc || saddr) 4481da177e4SLinus Torvalds goto out; 4491da177e4SLinus Torvalds 4501da177e4SLinus Torvalds bp = &asoc->base.bind_addr; 4511da177e4SLinus Torvalds 4521da177e4SLinus Torvalds if (dst) { 4531da177e4SLinus Torvalds /* Walk through the bind address list and look for a bind 4541da177e4SLinus Torvalds * address that matches the source address of the returned dst. 4551da177e4SLinus Torvalds */ 45618a353f4SDavid S. Miller sctp_v4_dst_saddr(&dst_saddr, fl4, htons(bp->port)); 457559cf710SVlad Yasevich rcu_read_lock(); 458559cf710SVlad Yasevich list_for_each_entry_rcu(laddr, &bp->address_list, list) { 4598a07eb0aSMichio Honda if (!laddr->valid || (laddr->state == SCTP_ADDR_DEL) || 4608a07eb0aSMichio Honda (laddr->state != SCTP_ADDR_SRC && 4618a07eb0aSMichio Honda !asoc->src_out_of_asoc_ok)) 462dc022a98SSridhar Samudrala continue; 463854d43a4SAl Viro if (sctp_v4_cmp_addr(&dst_saddr, &laddr->a)) 4641da177e4SLinus Torvalds goto out_unlock; 4651da177e4SLinus Torvalds } 466559cf710SVlad Yasevich rcu_read_unlock(); 4671da177e4SLinus Torvalds 4681da177e4SLinus Torvalds /* None of the bound addresses match the source address of the 4691da177e4SLinus Torvalds * dst. So release it. 4701da177e4SLinus Torvalds */ 4711da177e4SLinus Torvalds dst_release(dst); 4721da177e4SLinus Torvalds dst = NULL; 4731da177e4SLinus Torvalds } 4741da177e4SLinus Torvalds 4751da177e4SLinus Torvalds /* Walk through the bind address list and try to get a dst that 4761da177e4SLinus Torvalds * matches a bind address as the source address. 4771da177e4SLinus Torvalds */ 478559cf710SVlad Yasevich rcu_read_lock(); 479559cf710SVlad Yasevich list_for_each_entry_rcu(laddr, &bp->address_list, list) { 4800ca50d12SMarcelo Ricardo Leitner struct net_device *odev; 4810ca50d12SMarcelo Ricardo Leitner 482559cf710SVlad Yasevich if (!laddr->valid) 483559cf710SVlad Yasevich continue; 48407868284SMarcelo Ricardo Leitner if (laddr->state != SCTP_ADDR_SRC || 48507868284SMarcelo Ricardo Leitner AF_INET != laddr->a.sa.sa_family) 48607868284SMarcelo Ricardo Leitner continue; 48707868284SMarcelo Ricardo Leitner 4889914ae3cSVlad Yasevich fl4->fl4_sport = laddr->a.v4.sin_port; 48985350871SXufeng Zhang flowi4_update_output(fl4, 49085350871SXufeng Zhang asoc->base.sk->sk_bound_dev_if, 4918a9c58d2SXin Long RT_CONN_FLAGS_TOS(asoc->base.sk, tos), 49285350871SXufeng Zhang daddr->v4.sin_addr.s_addr, 49385350871SXufeng Zhang laddr->a.v4.sin_addr.s_addr); 49485350871SXufeng Zhang 495bb2db45bSEric W. Biederman rt = ip_route_output_key(sock_net(sk), fl4); 49607868284SMarcelo Ricardo Leitner if (IS_ERR(rt)) 49707868284SMarcelo Ricardo Leitner continue; 49807868284SMarcelo Ricardo Leitner 4990ca50d12SMarcelo Ricardo Leitner /* Ensure the src address belongs to the output 5000ca50d12SMarcelo Ricardo Leitner * interface. 5010ca50d12SMarcelo Ricardo Leitner */ 5020ca50d12SMarcelo Ricardo Leitner odev = __ip_dev_find(sock_net(sk), laddr->a.v4.sin_addr.s_addr, 5030ca50d12SMarcelo Ricardo Leitner false); 504d82f0f1fSMarcelo Ricardo Leitner if (!odev || odev->ifindex != fl4->flowi4_oif) { 5054a31a6b1STommi Rantala if (!dst) 5064a31a6b1STommi Rantala dst = &rt->dst; 5074a31a6b1STommi Rantala else 508d82f0f1fSMarcelo Ricardo Leitner dst_release(&rt->dst); 5090ca50d12SMarcelo Ricardo Leitner continue; 510d82f0f1fSMarcelo Ricardo Leitner } 5110ca50d12SMarcelo Ricardo Leitner 512410f0383SMarcelo Ricardo Leitner dst_release(dst); 513d8d1f30bSChangli Gao dst = &rt->dst; 51407868284SMarcelo Ricardo Leitner break; 5151da177e4SLinus Torvalds } 5161da177e4SLinus Torvalds 5171da177e4SLinus Torvalds out_unlock: 518559cf710SVlad Yasevich rcu_read_unlock(); 5191da177e4SLinus Torvalds out: 520da0420beSVlad Yasevich t->dst = dst; 5211da177e4SLinus Torvalds if (dst) 522bb33381dSDaniel Borkmann pr_debug("rt_dst:%pI4, rt_src:%pI4\n", 52318a353f4SDavid S. Miller &fl4->daddr, &fl4->saddr); 5241da177e4SLinus Torvalds else 525bb33381dSDaniel Borkmann pr_debug("no route\n"); 5261da177e4SLinus Torvalds } 5271da177e4SLinus Torvalds 5281da177e4SLinus Torvalds /* For v4, the source address is cached in the route entry(dst). So no need 5291da177e4SLinus Torvalds * to cache it separately and hence this is an empty routine. 5301da177e4SLinus Torvalds */ 531e5117101SYOSHIFUJI Hideaki static void sctp_v4_get_saddr(struct sctp_sock *sk, 5329914ae3cSVlad Yasevich struct sctp_transport *t, 5339914ae3cSVlad Yasevich struct flowi *fl) 5341da177e4SLinus Torvalds { 5359914ae3cSVlad Yasevich union sctp_addr *saddr = &t->saddr; 5369914ae3cSVlad Yasevich struct rtable *rt = (struct rtable *)t->dst; 53723ec47a0SVladislav Yasevich 5381da177e4SLinus Torvalds if (rt) { 5391da177e4SLinus Torvalds saddr->v4.sin_family = AF_INET; 540902ebd3eSDavid S. Miller saddr->v4.sin_addr.s_addr = fl->u.ip4.saddr; 5411da177e4SLinus Torvalds } 5421da177e4SLinus Torvalds } 5431da177e4SLinus Torvalds 5441da177e4SLinus Torvalds /* What interface did this skb arrive on? */ 5451da177e4SLinus Torvalds static int sctp_v4_skb_iif(const struct sk_buff *skb) 5461da177e4SLinus Torvalds { 54792101b3bSDavid S. Miller return inet_iif(skb); 5481da177e4SLinus Torvalds } 5491da177e4SLinus Torvalds 5501da177e4SLinus Torvalds /* Was this packet marked by Explicit Congestion Notification? */ 5511da177e4SLinus Torvalds static int sctp_v4_is_ce(const struct sk_buff *skb) 5521da177e4SLinus Torvalds { 553eddc9ec5SArnaldo Carvalho de Melo return INET_ECN_is_ce(ip_hdr(skb)->tos); 5541da177e4SLinus Torvalds } 5551da177e4SLinus Torvalds 5561da177e4SLinus Torvalds /* Create and initialize a new sk for the socket returned by accept(). */ 5571da177e4SLinus Torvalds static struct sock *sctp_v4_create_accept_sk(struct sock *sk, 558cdfbabfbSDavid Howells struct sctp_association *asoc, 559cdfbabfbSDavid Howells bool kern) 5601da177e4SLinus Torvalds { 5613b1e0a65SYOSHIFUJI Hideaki struct sock *newsk = sk_alloc(sock_net(sk), PF_INET, GFP_KERNEL, 562cdfbabfbSDavid Howells sk->sk_prot, kern); 563914e1c8bSVlad Yasevich struct inet_sock *newinet; 5641da177e4SLinus Torvalds 5651da177e4SLinus Torvalds if (!newsk) 5661da177e4SLinus Torvalds goto out; 5671da177e4SLinus Torvalds 5681da177e4SLinus Torvalds sock_init_data(NULL, newsk); 5691da177e4SLinus Torvalds 570914e1c8bSVlad Yasevich sctp_copy_sock(newsk, sk, asoc); 5711da177e4SLinus Torvalds sock_reset_flag(newsk, SOCK_ZAPPED); 5721da177e4SLinus Torvalds 573b7e10c25SRichard Haines sctp_v4_copy_ip_options(sk, newsk); 574b7e10c25SRichard Haines 5751da177e4SLinus Torvalds newinet = inet_sk(newsk); 5761da177e4SLinus Torvalds 577c720c7e8SEric Dumazet newinet->inet_daddr = asoc->peer.primary_addr.v4.sin_addr.s_addr; 5781da177e4SLinus Torvalds 579e6848976SArnaldo Carvalho de Melo sk_refcnt_debug_inc(newsk); 5801da177e4SLinus Torvalds 5811da177e4SLinus Torvalds if (newsk->sk_prot->init(newsk)) { 5821da177e4SLinus Torvalds sk_common_release(newsk); 5831da177e4SLinus Torvalds newsk = NULL; 5841da177e4SLinus Torvalds } 5851da177e4SLinus Torvalds 5861da177e4SLinus Torvalds out: 5871da177e4SLinus Torvalds return newsk; 5881da177e4SLinus Torvalds } 5891da177e4SLinus Torvalds 590299ee123SJason Gunthorpe static int sctp_v4_addr_to_user(struct sctp_sock *sp, union sctp_addr *addr) 5911da177e4SLinus Torvalds { 592299ee123SJason Gunthorpe /* No address mapping for V4 sockets */ 59309279e61SXin Long memset(addr->v4.sin_zero, 0, sizeof(addr->v4.sin_zero)); 594299ee123SJason Gunthorpe return sizeof(struct sockaddr_in); 5951da177e4SLinus Torvalds } 5961da177e4SLinus Torvalds 5971da177e4SLinus Torvalds /* Dump the v4 addr to the seq file. */ 5981da177e4SLinus Torvalds static void sctp_v4_seq_dump_addr(struct seq_file *seq, union sctp_addr *addr) 5991da177e4SLinus Torvalds { 60021454aaaSHarvey Harrison seq_printf(seq, "%pI4 ", &addr->v4.sin_addr); 6011da177e4SLinus Torvalds } 6021da177e4SLinus Torvalds 603b9031d9dSVlad Yasevich static void sctp_v4_ecn_capable(struct sock *sk) 604b9031d9dSVlad Yasevich { 605b9031d9dSVlad Yasevich INET_ECN_xmit(sk); 606b9031d9dSVlad Yasevich } 607b9031d9dSVlad Yasevich 6089c3b5751SKees Cook static void sctp_addr_wq_timeout_handler(struct timer_list *t) 6099f7d653bSMichio Honda { 6109c3b5751SKees Cook struct net *net = from_timer(net, t, sctp.addr_wq_timer); 6119f7d653bSMichio Honda struct sctp_sockaddr_entry *addrw, *temp; 6129f7d653bSMichio Honda struct sctp_sock *sp; 6139f7d653bSMichio Honda 6144db67e80SEric W. Biederman spin_lock_bh(&net->sctp.addr_wq_lock); 6159f7d653bSMichio Honda 6164db67e80SEric W. Biederman list_for_each_entry_safe(addrw, temp, &net->sctp.addr_waitq, list) { 617bb33381dSDaniel Borkmann pr_debug("%s: the first ent in wq:%p is addr:%pISc for cmd:%d at " 618bb33381dSDaniel Borkmann "entry:%p\n", __func__, &net->sctp.addr_waitq, &addrw->a.sa, 619bb33381dSDaniel Borkmann addrw->state, addrw); 6209f7d653bSMichio Honda 621dfd56b8bSEric Dumazet #if IS_ENABLED(CONFIG_IPV6) 6229f7d653bSMichio Honda /* Now we send an ASCONF for each association */ 6239f7d653bSMichio Honda /* Note. we currently don't handle link local IPv6 addressees */ 6249f7d653bSMichio Honda if (addrw->a.sa.sa_family == AF_INET6) { 6259f7d653bSMichio Honda struct in6_addr *in6; 6269f7d653bSMichio Honda 6279f7d653bSMichio Honda if (ipv6_addr_type(&addrw->a.v6.sin6_addr) & 6289f7d653bSMichio Honda IPV6_ADDR_LINKLOCAL) 6299f7d653bSMichio Honda goto free_next; 6309f7d653bSMichio Honda 6319f7d653bSMichio Honda in6 = (struct in6_addr *)&addrw->a.v6.sin6_addr; 6324db67e80SEric W. Biederman if (ipv6_chk_addr(net, in6, NULL, 0) == 0 && 6339f7d653bSMichio Honda addrw->state == SCTP_ADDR_NEW) { 6349f7d653bSMichio Honda unsigned long timeo_val; 6359f7d653bSMichio Honda 636bb33381dSDaniel Borkmann pr_debug("%s: this is on DAD, trying %d sec " 637bb33381dSDaniel Borkmann "later\n", __func__, 6389f7d653bSMichio Honda SCTP_ADDRESS_TICK_DELAY); 639bb33381dSDaniel Borkmann 6409f7d653bSMichio Honda timeo_val = jiffies; 6419f7d653bSMichio Honda timeo_val += msecs_to_jiffies(SCTP_ADDRESS_TICK_DELAY); 6424db67e80SEric W. Biederman mod_timer(&net->sctp.addr_wq_timer, timeo_val); 6439f7d653bSMichio Honda break; 6449f7d653bSMichio Honda } 6459f7d653bSMichio Honda } 6465d0c90cfSDavid S. Miller #endif 6474db67e80SEric W. Biederman list_for_each_entry(sp, &net->sctp.auto_asconf_splist, auto_asconf_list) { 6489f7d653bSMichio Honda struct sock *sk; 6499f7d653bSMichio Honda 6509f7d653bSMichio Honda sk = sctp_opt2sk(sp); 6519f7d653bSMichio Honda /* ignore bound-specific endpoints */ 6529f7d653bSMichio Honda if (!sctp_is_ep_boundall(sk)) 6539f7d653bSMichio Honda continue; 6545bc1d1b4Swangweidong bh_lock_sock(sk); 6559f7d653bSMichio Honda if (sctp_asconf_mgmt(sp, addrw) < 0) 656bb33381dSDaniel Borkmann pr_debug("%s: sctp_asconf_mgmt failed\n", __func__); 6575bc1d1b4Swangweidong bh_unlock_sock(sk); 6589f7d653bSMichio Honda } 65939d84a58SDaniel Halperin #if IS_ENABLED(CONFIG_IPV6) 6609f7d653bSMichio Honda free_next: 66139d84a58SDaniel Halperin #endif 6629f7d653bSMichio Honda list_del(&addrw->list); 6639f7d653bSMichio Honda kfree(addrw); 6649f7d653bSMichio Honda } 6654db67e80SEric W. Biederman spin_unlock_bh(&net->sctp.addr_wq_lock); 6669f7d653bSMichio Honda } 6679f7d653bSMichio Honda 6684db67e80SEric W. Biederman static void sctp_free_addr_wq(struct net *net) 6699f7d653bSMichio Honda { 6709f7d653bSMichio Honda struct sctp_sockaddr_entry *addrw; 6719f7d653bSMichio Honda struct sctp_sockaddr_entry *temp; 6729f7d653bSMichio Honda 6734db67e80SEric W. Biederman spin_lock_bh(&net->sctp.addr_wq_lock); 6744db67e80SEric W. Biederman del_timer(&net->sctp.addr_wq_timer); 6754db67e80SEric W. Biederman list_for_each_entry_safe(addrw, temp, &net->sctp.addr_waitq, list) { 6769f7d653bSMichio Honda list_del(&addrw->list); 6779f7d653bSMichio Honda kfree(addrw); 6789f7d653bSMichio Honda } 6794db67e80SEric W. Biederman spin_unlock_bh(&net->sctp.addr_wq_lock); 6809f7d653bSMichio Honda } 6819f7d653bSMichio Honda 6829f7d653bSMichio Honda /* lookup the entry for the same address in the addr_waitq 6839f7d653bSMichio Honda * sctp_addr_wq MUST be locked 6849f7d653bSMichio Honda */ 6854db67e80SEric W. Biederman static struct sctp_sockaddr_entry *sctp_addr_wq_lookup(struct net *net, 6864db67e80SEric W. Biederman struct sctp_sockaddr_entry *addr) 6879f7d653bSMichio Honda { 6889f7d653bSMichio Honda struct sctp_sockaddr_entry *addrw; 6899f7d653bSMichio Honda 6904db67e80SEric W. Biederman list_for_each_entry(addrw, &net->sctp.addr_waitq, list) { 6919f7d653bSMichio Honda if (addrw->a.sa.sa_family != addr->a.sa.sa_family) 6929f7d653bSMichio Honda continue; 6939f7d653bSMichio Honda if (addrw->a.sa.sa_family == AF_INET) { 6949f7d653bSMichio Honda if (addrw->a.v4.sin_addr.s_addr == 6959f7d653bSMichio Honda addr->a.v4.sin_addr.s_addr) 6969f7d653bSMichio Honda return addrw; 6979f7d653bSMichio Honda } else if (addrw->a.sa.sa_family == AF_INET6) { 6989f7d653bSMichio Honda if (ipv6_addr_equal(&addrw->a.v6.sin6_addr, 6999f7d653bSMichio Honda &addr->a.v6.sin6_addr)) 7009f7d653bSMichio Honda return addrw; 7019f7d653bSMichio Honda } 7029f7d653bSMichio Honda } 7039f7d653bSMichio Honda return NULL; 7049f7d653bSMichio Honda } 7059f7d653bSMichio Honda 7064db67e80SEric W. Biederman void sctp_addr_wq_mgmt(struct net *net, struct sctp_sockaddr_entry *addr, int cmd) 7079f7d653bSMichio Honda { 7089f7d653bSMichio Honda struct sctp_sockaddr_entry *addrw; 7099f7d653bSMichio Honda unsigned long timeo_val; 7109f7d653bSMichio Honda 7119f7d653bSMichio Honda /* first, we check if an opposite message already exist in the queue. 7129f7d653bSMichio Honda * If we found such message, it is removed. 7139f7d653bSMichio Honda * This operation is a bit stupid, but the DHCP client attaches the 7149f7d653bSMichio Honda * new address after a couple of addition and deletion of that address 7159f7d653bSMichio Honda */ 7169f7d653bSMichio Honda 7174db67e80SEric W. Biederman spin_lock_bh(&net->sctp.addr_wq_lock); 7189f7d653bSMichio Honda /* Offsets existing events in addr_wq */ 7194db67e80SEric W. Biederman addrw = sctp_addr_wq_lookup(net, addr); 7209f7d653bSMichio Honda if (addrw) { 7219f7d653bSMichio Honda if (addrw->state != cmd) { 722bb33381dSDaniel Borkmann pr_debug("%s: offsets existing entry for %d, addr:%pISc " 723bb33381dSDaniel Borkmann "in wq:%p\n", __func__, addrw->state, &addrw->a.sa, 7244db67e80SEric W. Biederman &net->sctp.addr_waitq); 725bb33381dSDaniel Borkmann 7269f7d653bSMichio Honda list_del(&addrw->list); 7279f7d653bSMichio Honda kfree(addrw); 7289f7d653bSMichio Honda } 7294db67e80SEric W. Biederman spin_unlock_bh(&net->sctp.addr_wq_lock); 7309f7d653bSMichio Honda return; 7319f7d653bSMichio Honda } 7329f7d653bSMichio Honda 7339f7d653bSMichio Honda /* OK, we have to add the new address to the wait queue */ 7349f7d653bSMichio Honda addrw = kmemdup(addr, sizeof(struct sctp_sockaddr_entry), GFP_ATOMIC); 7359f7d653bSMichio Honda if (addrw == NULL) { 7364db67e80SEric W. Biederman spin_unlock_bh(&net->sctp.addr_wq_lock); 7379f7d653bSMichio Honda return; 7389f7d653bSMichio Honda } 7399f7d653bSMichio Honda addrw->state = cmd; 7404db67e80SEric W. Biederman list_add_tail(&addrw->list, &net->sctp.addr_waitq); 741bb33381dSDaniel Borkmann 742bb33381dSDaniel Borkmann pr_debug("%s: add new entry for cmd:%d, addr:%pISc in wq:%p\n", 743bb33381dSDaniel Borkmann __func__, addrw->state, &addrw->a.sa, &net->sctp.addr_waitq); 7449f7d653bSMichio Honda 7454db67e80SEric W. Biederman if (!timer_pending(&net->sctp.addr_wq_timer)) { 7469f7d653bSMichio Honda timeo_val = jiffies; 7479f7d653bSMichio Honda timeo_val += msecs_to_jiffies(SCTP_ADDRESS_TICK_DELAY); 7484db67e80SEric W. Biederman mod_timer(&net->sctp.addr_wq_timer, timeo_val); 7499f7d653bSMichio Honda } 7504db67e80SEric W. Biederman spin_unlock_bh(&net->sctp.addr_wq_lock); 7519f7d653bSMichio Honda } 7529f7d653bSMichio Honda 75329303547SVlad Yasevich /* Event handler for inet address addition/deletion events. 75429303547SVlad Yasevich * The sctp_local_addr_list needs to be protocted by a spin lock since 75529303547SVlad Yasevich * multiple notifiers (say IPv4 and IPv6) may be running at the same 75629303547SVlad Yasevich * time and thus corrupt the list. 75729303547SVlad Yasevich * The reader side is protected with RCU. 75829303547SVlad Yasevich */ 75924123186SAdrian Bunk static int sctp_inetaddr_event(struct notifier_block *this, unsigned long ev, 7601da177e4SLinus Torvalds void *ptr) 7611da177e4SLinus Torvalds { 76229c7cf96SSridhar Samudrala struct in_ifaddr *ifa = (struct in_ifaddr *)ptr; 76329303547SVlad Yasevich struct sctp_sockaddr_entry *addr = NULL; 76429303547SVlad Yasevich struct sctp_sockaddr_entry *temp; 7654db67e80SEric W. Biederman struct net *net = dev_net(ifa->ifa_dev->dev); 76622626216SChidambar 'ilLogict' Zinnoury int found = 0; 7671da177e4SLinus Torvalds 76829c7cf96SSridhar Samudrala switch (ev) { 76929c7cf96SSridhar Samudrala case NETDEV_UP: 770400b8b9aSXin Long addr = kzalloc(sizeof(*addr), GFP_ATOMIC); 77129c7cf96SSridhar Samudrala if (addr) { 77229c7cf96SSridhar Samudrala addr->a.v4.sin_family = AF_INET; 77329c7cf96SSridhar Samudrala addr->a.v4.sin_addr.s_addr = ifa->ifa_local; 77429303547SVlad Yasevich addr->valid = 1; 7754db67e80SEric W. Biederman spin_lock_bh(&net->sctp.local_addr_lock); 7764db67e80SEric W. Biederman list_add_tail_rcu(&addr->list, &net->sctp.local_addr_list); 7774db67e80SEric W. Biederman sctp_addr_wq_mgmt(net, addr, SCTP_ADDR_NEW); 7784db67e80SEric W. Biederman spin_unlock_bh(&net->sctp.local_addr_lock); 77929c7cf96SSridhar Samudrala } 78029c7cf96SSridhar Samudrala break; 78129c7cf96SSridhar Samudrala case NETDEV_DOWN: 7824db67e80SEric W. Biederman spin_lock_bh(&net->sctp.local_addr_lock); 78329303547SVlad Yasevich list_for_each_entry_safe(addr, temp, 7844db67e80SEric W. Biederman &net->sctp.local_addr_list, list) { 785a40a7d15SPavel Emelyanov if (addr->a.sa.sa_family == AF_INET && 786a40a7d15SPavel Emelyanov addr->a.v4.sin_addr.s_addr == 787a40a7d15SPavel Emelyanov ifa->ifa_local) { 7884db67e80SEric W. Biederman sctp_addr_wq_mgmt(net, addr, SCTP_ADDR_DEL); 78922626216SChidambar 'ilLogict' Zinnoury found = 1; 79029303547SVlad Yasevich addr->valid = 0; 79129303547SVlad Yasevich list_del_rcu(&addr->list); 79229c7cf96SSridhar Samudrala break; 79329c7cf96SSridhar Samudrala } 79429c7cf96SSridhar Samudrala } 7954db67e80SEric W. Biederman spin_unlock_bh(&net->sctp.local_addr_lock); 79622626216SChidambar 'ilLogict' Zinnoury if (found) 7971231f0baSLai Jiangshan kfree_rcu(addr, rcu); 79829c7cf96SSridhar Samudrala break; 79929c7cf96SSridhar Samudrala } 8001da177e4SLinus Torvalds 8011da177e4SLinus Torvalds return NOTIFY_DONE; 8021da177e4SLinus Torvalds } 8031da177e4SLinus Torvalds 8041da177e4SLinus Torvalds /* 8051da177e4SLinus Torvalds * Initialize the control inode/socket with a control endpoint data 8061da177e4SLinus Torvalds * structure. This endpoint is reserved exclusively for the OOTB processing. 8071da177e4SLinus Torvalds */ 8082ce95503SEric W. Biederman static int sctp_ctl_sock_init(struct net *net) 8091da177e4SLinus Torvalds { 8101da177e4SLinus Torvalds int err; 811fb13d9f9SBrian Haley sa_family_t family = PF_INET; 8121da177e4SLinus Torvalds 8131da177e4SLinus Torvalds if (sctp_get_pf_specific(PF_INET6)) 8141da177e4SLinus Torvalds family = PF_INET6; 8151da177e4SLinus Torvalds 8162ce95503SEric W. Biederman err = inet_ctl_sock_create(&net->sctp.ctl_sock, family, 8172ce95503SEric W. Biederman SOCK_SEQPACKET, IPPROTO_SCTP, net); 818fb13d9f9SBrian Haley 819fb13d9f9SBrian Haley /* If IPv6 socket could not be created, try the IPv4 socket */ 820fb13d9f9SBrian Haley if (err < 0 && family == PF_INET6) 8212ce95503SEric W. Biederman err = inet_ctl_sock_create(&net->sctp.ctl_sock, AF_INET, 822fb13d9f9SBrian Haley SOCK_SEQPACKET, IPPROTO_SCTP, 8232ce95503SEric W. Biederman net); 824fb13d9f9SBrian Haley 8251da177e4SLinus Torvalds if (err < 0) { 826145ce502SJoe Perches pr_err("Failed to create the SCTP control socket\n"); 8271da177e4SLinus Torvalds return err; 8281da177e4SLinus Torvalds } 8291da177e4SLinus Torvalds return 0; 8301da177e4SLinus Torvalds } 8311da177e4SLinus Torvalds 8321da177e4SLinus Torvalds /* Register address family specific functions. */ 8331da177e4SLinus Torvalds int sctp_register_af(struct sctp_af *af) 8341da177e4SLinus Torvalds { 8351da177e4SLinus Torvalds switch (af->sa_family) { 8361da177e4SLinus Torvalds case AF_INET: 8371da177e4SLinus Torvalds if (sctp_af_v4_specific) 8381da177e4SLinus Torvalds return 0; 8391da177e4SLinus Torvalds sctp_af_v4_specific = af; 8401da177e4SLinus Torvalds break; 8411da177e4SLinus Torvalds case AF_INET6: 8421da177e4SLinus Torvalds if (sctp_af_v6_specific) 8431da177e4SLinus Torvalds return 0; 8441da177e4SLinus Torvalds sctp_af_v6_specific = af; 8451da177e4SLinus Torvalds break; 8461da177e4SLinus Torvalds default: 8471da177e4SLinus Torvalds return 0; 8481da177e4SLinus Torvalds } 8491da177e4SLinus Torvalds 8501da177e4SLinus Torvalds INIT_LIST_HEAD(&af->list); 8511da177e4SLinus Torvalds list_add_tail(&af->list, &sctp_address_families); 8521da177e4SLinus Torvalds return 1; 8531da177e4SLinus Torvalds } 8541da177e4SLinus Torvalds 8551da177e4SLinus Torvalds /* Get the table of functions for manipulating a particular address 8561da177e4SLinus Torvalds * family. 8571da177e4SLinus Torvalds */ 8581da177e4SLinus Torvalds struct sctp_af *sctp_get_af_specific(sa_family_t family) 8591da177e4SLinus Torvalds { 8601da177e4SLinus Torvalds switch (family) { 8611da177e4SLinus Torvalds case AF_INET: 8621da177e4SLinus Torvalds return sctp_af_v4_specific; 8631da177e4SLinus Torvalds case AF_INET6: 8641da177e4SLinus Torvalds return sctp_af_v6_specific; 8651da177e4SLinus Torvalds default: 8661da177e4SLinus Torvalds return NULL; 8671da177e4SLinus Torvalds } 8681da177e4SLinus Torvalds } 8691da177e4SLinus Torvalds 8701da177e4SLinus Torvalds /* Common code to initialize a AF_INET msg_name. */ 8711da177e4SLinus Torvalds static void sctp_inet_msgname(char *msgname, int *addr_len) 8721da177e4SLinus Torvalds { 8731da177e4SLinus Torvalds struct sockaddr_in *sin; 8741da177e4SLinus Torvalds 8751da177e4SLinus Torvalds sin = (struct sockaddr_in *)msgname; 8761da177e4SLinus Torvalds *addr_len = sizeof(struct sockaddr_in); 8771da177e4SLinus Torvalds sin->sin_family = AF_INET; 8781da177e4SLinus Torvalds memset(sin->sin_zero, 0, sizeof(sin->sin_zero)); 8791da177e4SLinus Torvalds } 8801da177e4SLinus Torvalds 8811da177e4SLinus Torvalds /* Copy the primary address of the peer primary address as the msg_name. */ 8821da177e4SLinus Torvalds static void sctp_inet_event_msgname(struct sctp_ulpevent *event, char *msgname, 8831da177e4SLinus Torvalds int *addr_len) 8841da177e4SLinus Torvalds { 8851da177e4SLinus Torvalds struct sockaddr_in *sin, *sinfrom; 8861da177e4SLinus Torvalds 8871da177e4SLinus Torvalds if (msgname) { 8881da177e4SLinus Torvalds struct sctp_association *asoc; 8891da177e4SLinus Torvalds 8901da177e4SLinus Torvalds asoc = event->asoc; 8911da177e4SLinus Torvalds sctp_inet_msgname(msgname, addr_len); 8921da177e4SLinus Torvalds sin = (struct sockaddr_in *)msgname; 8931da177e4SLinus Torvalds sinfrom = &asoc->peer.primary_addr.v4; 8941da177e4SLinus Torvalds sin->sin_port = htons(asoc->peer.port); 8951da177e4SLinus Torvalds sin->sin_addr.s_addr = sinfrom->sin_addr.s_addr; 8961da177e4SLinus Torvalds } 8971da177e4SLinus Torvalds } 8981da177e4SLinus Torvalds 8991da177e4SLinus Torvalds /* Initialize and copy out a msgname from an inbound skb. */ 9001da177e4SLinus Torvalds static void sctp_inet_skb_msgname(struct sk_buff *skb, char *msgname, int *len) 9011da177e4SLinus Torvalds { 9021da177e4SLinus Torvalds if (msgname) { 9032c0fd387SArnaldo Carvalho de Melo struct sctphdr *sh = sctp_hdr(skb); 9042c0fd387SArnaldo Carvalho de Melo struct sockaddr_in *sin = (struct sockaddr_in *)msgname; 9052c0fd387SArnaldo Carvalho de Melo 9061da177e4SLinus Torvalds sctp_inet_msgname(msgname, len); 9071da177e4SLinus Torvalds sin->sin_port = sh->source; 908eddc9ec5SArnaldo Carvalho de Melo sin->sin_addr.s_addr = ip_hdr(skb)->saddr; 9091da177e4SLinus Torvalds } 9101da177e4SLinus Torvalds } 9111da177e4SLinus Torvalds 9121da177e4SLinus Torvalds /* Do we support this AF? */ 9131da177e4SLinus Torvalds static int sctp_inet_af_supported(sa_family_t family, struct sctp_sock *sp) 9141da177e4SLinus Torvalds { 9151da177e4SLinus Torvalds /* PF_INET only supports AF_INET addresses. */ 916a02cec21SEric Dumazet return AF_INET == family; 9171da177e4SLinus Torvalds } 9181da177e4SLinus Torvalds 9191da177e4SLinus Torvalds /* Address matching with wildcards allowed. */ 9201da177e4SLinus Torvalds static int sctp_inet_cmp_addr(const union sctp_addr *addr1, 9211da177e4SLinus Torvalds const union sctp_addr *addr2, 9221da177e4SLinus Torvalds struct sctp_sock *opt) 9231da177e4SLinus Torvalds { 9241da177e4SLinus Torvalds /* PF_INET only supports AF_INET addresses. */ 9251da177e4SLinus Torvalds if (addr1->sa.sa_family != addr2->sa.sa_family) 9261da177e4SLinus Torvalds return 0; 927e6f1cebfSAl Viro if (htonl(INADDR_ANY) == addr1->v4.sin_addr.s_addr || 928e6f1cebfSAl Viro htonl(INADDR_ANY) == addr2->v4.sin_addr.s_addr) 9291da177e4SLinus Torvalds return 1; 9301da177e4SLinus Torvalds if (addr1->v4.sin_addr.s_addr == addr2->v4.sin_addr.s_addr) 9311da177e4SLinus Torvalds return 1; 9321da177e4SLinus Torvalds 9331da177e4SLinus Torvalds return 0; 9341da177e4SLinus Torvalds } 9351da177e4SLinus Torvalds 9361da177e4SLinus Torvalds /* Verify that provided sockaddr looks bindable. Common verification has 9371da177e4SLinus Torvalds * already been taken care of. 9381da177e4SLinus Torvalds */ 9391da177e4SLinus Torvalds static int sctp_inet_bind_verify(struct sctp_sock *opt, union sctp_addr *addr) 9401da177e4SLinus Torvalds { 9411da177e4SLinus Torvalds return sctp_v4_available(addr, opt); 9421da177e4SLinus Torvalds } 9431da177e4SLinus Torvalds 9441da177e4SLinus Torvalds /* Verify that sockaddr looks sendable. Common verification has already 9451da177e4SLinus Torvalds * been taken care of. 9461da177e4SLinus Torvalds */ 9471da177e4SLinus Torvalds static int sctp_inet_send_verify(struct sctp_sock *opt, union sctp_addr *addr) 9481da177e4SLinus Torvalds { 9491da177e4SLinus Torvalds return 1; 9501da177e4SLinus Torvalds } 9511da177e4SLinus Torvalds 9521da177e4SLinus Torvalds /* Fill in Supported Address Type information for INIT and INIT-ACK 9531da177e4SLinus Torvalds * chunks. Returns number of addresses supported. 9541da177e4SLinus Torvalds */ 9551da177e4SLinus Torvalds static int sctp_inet_supported_addrs(const struct sctp_sock *opt, 9563dbe8656SAl Viro __be16 *types) 9571da177e4SLinus Torvalds { 9581da177e4SLinus Torvalds types[0] = SCTP_PARAM_IPV4_ADDRESS; 9591da177e4SLinus Torvalds return 1; 9601da177e4SLinus Torvalds } 9611da177e4SLinus Torvalds 9621da177e4SLinus Torvalds /* Wrapper routine that calls the ip transmit routine. */ 9631da177e4SLinus Torvalds static inline int sctp_v4_xmit(struct sk_buff *skb, 964f880374cSHerbert Xu struct sctp_transport *transport) 9651da177e4SLinus Torvalds { 966f880374cSHerbert Xu struct inet_sock *inet = inet_sk(skb->sk); 9678a9c58d2SXin Long __u8 dscp = inet->tos; 968f880374cSHerbert Xu 969bb33381dSDaniel Borkmann pr_debug("%s: skb:%p, len:%d, src:%pI4, dst:%pI4\n", __func__, skb, 9708a9c58d2SXin Long skb->len, &transport->fl.u.ip4.saddr, 9718a9c58d2SXin Long &transport->fl.u.ip4.daddr); 9728a9c58d2SXin Long 9738a9c58d2SXin Long if (transport->dscp & SCTP_DSCP_SET_MASK) 9748a9c58d2SXin Long dscp = transport->dscp & SCTP_DSCP_VAL_MASK; 9751da177e4SLinus Torvalds 976f880374cSHerbert Xu inet->pmtudisc = transport->param_flags & SPP_PMTUD_ENABLE ? 977f880374cSHerbert Xu IP_PMTUDISC_DO : IP_PMTUDISC_DONT; 978f880374cSHerbert Xu 979b01a2407SEric W. Biederman SCTP_INC_STATS(sock_net(&inet->sk), SCTP_MIB_OUTSCTPPACKS); 980bb33381dSDaniel Borkmann 9818a9c58d2SXin Long return __ip_queue_xmit(&inet->sk, skb, &transport->fl, dscp); 9821da177e4SLinus Torvalds } 9831da177e4SLinus Torvalds 98415efbe76SNeil Horman static struct sctp_af sctp_af_inet; 9851da177e4SLinus Torvalds 9861da177e4SLinus Torvalds static struct sctp_pf sctp_pf_inet = { 9871da177e4SLinus Torvalds .event_msgname = sctp_inet_event_msgname, 9881da177e4SLinus Torvalds .skb_msgname = sctp_inet_skb_msgname, 9891da177e4SLinus Torvalds .af_supported = sctp_inet_af_supported, 9901da177e4SLinus Torvalds .cmp_addr = sctp_inet_cmp_addr, 9911da177e4SLinus Torvalds .bind_verify = sctp_inet_bind_verify, 9921da177e4SLinus Torvalds .send_verify = sctp_inet_send_verify, 9931da177e4SLinus Torvalds .supported_addrs = sctp_inet_supported_addrs, 9941da177e4SLinus Torvalds .create_accept_sk = sctp_v4_create_accept_sk, 995299ee123SJason Gunthorpe .addr_to_user = sctp_v4_addr_to_user, 996299ee123SJason Gunthorpe .to_sk_saddr = sctp_v4_to_sk_saddr, 997299ee123SJason Gunthorpe .to_sk_daddr = sctp_v4_to_sk_daddr, 998b7e10c25SRichard Haines .copy_ip_options = sctp_v4_copy_ip_options, 99915efbe76SNeil Horman .af = &sctp_af_inet 10001da177e4SLinus Torvalds }; 10011da177e4SLinus Torvalds 10021da177e4SLinus Torvalds /* Notifier for inetaddr addition/deletion events. */ 10031da177e4SLinus Torvalds static struct notifier_block sctp_inetaddr_notifier = { 10041da177e4SLinus Torvalds .notifier_call = sctp_inetaddr_event, 10051da177e4SLinus Torvalds }; 10061da177e4SLinus Torvalds 10071da177e4SLinus Torvalds /* Socket operations. */ 100890ddc4f0SEric Dumazet static const struct proto_ops inet_seqpacket_ops = { 10091da177e4SLinus Torvalds .family = PF_INET, 10101da177e4SLinus Torvalds .owner = THIS_MODULE, 10111da177e4SLinus Torvalds .release = inet_release, /* Needs to be wrapped... */ 10121da177e4SLinus Torvalds .bind = inet_bind, 1013644fbdeaSXin Long .connect = sctp_inet_connect, 10141da177e4SLinus Torvalds .socketpair = sock_no_socketpair, 10151da177e4SLinus Torvalds .accept = inet_accept, 10161da177e4SLinus Torvalds .getname = inet_getname, /* Semantics are different. */ 1017a11e1d43SLinus Torvalds .poll = sctp_poll, 10181da177e4SLinus Torvalds .ioctl = inet_ioctl, 1019c7cbdbf2SArnd Bergmann .gettstamp = sock_gettstamp, 10201da177e4SLinus Torvalds .listen = sctp_inet_listen, 10211da177e4SLinus Torvalds .shutdown = inet_shutdown, /* Looks harmless. */ 1022543d9cfeSArnaldo Carvalho de Melo .setsockopt = sock_common_setsockopt, /* IP_SOL IP_OPTION is a problem */ 10231da177e4SLinus Torvalds .getsockopt = sock_common_getsockopt, 10241da177e4SLinus Torvalds .sendmsg = inet_sendmsg, 1025fd2d180aSXin Long .recvmsg = inet_recvmsg, 10261da177e4SLinus Torvalds .mmap = sock_no_mmap, 10271da177e4SLinus Torvalds .sendpage = sock_no_sendpage, 1028543d9cfeSArnaldo Carvalho de Melo #ifdef CONFIG_COMPAT 1029543d9cfeSArnaldo Carvalho de Melo .compat_setsockopt = compat_sock_common_setsockopt, 1030543d9cfeSArnaldo Carvalho de Melo .compat_getsockopt = compat_sock_common_getsockopt, 1031543d9cfeSArnaldo Carvalho de Melo #endif 10321da177e4SLinus Torvalds }; 10331da177e4SLinus Torvalds 10341da177e4SLinus Torvalds /* Registration with AF_INET family. */ 10351da177e4SLinus Torvalds static struct inet_protosw sctp_seqpacket_protosw = { 10361da177e4SLinus Torvalds .type = SOCK_SEQPACKET, 10371da177e4SLinus Torvalds .protocol = IPPROTO_SCTP, 10381da177e4SLinus Torvalds .prot = &sctp_prot, 10391da177e4SLinus Torvalds .ops = &inet_seqpacket_ops, 10401da177e4SLinus Torvalds .flags = SCTP_PROTOSW_FLAG 10411da177e4SLinus Torvalds }; 10421da177e4SLinus Torvalds static struct inet_protosw sctp_stream_protosw = { 10431da177e4SLinus Torvalds .type = SOCK_STREAM, 10441da177e4SLinus Torvalds .protocol = IPPROTO_SCTP, 10451da177e4SLinus Torvalds .prot = &sctp_prot, 10461da177e4SLinus Torvalds .ops = &inet_seqpacket_ops, 10471da177e4SLinus Torvalds .flags = SCTP_PROTOSW_FLAG 10481da177e4SLinus Torvalds }; 10491da177e4SLinus Torvalds 10501da177e4SLinus Torvalds /* Register with IP layer. */ 105132613090SAlexey Dobriyan static const struct net_protocol sctp_protocol = { 10521da177e4SLinus Torvalds .handler = sctp_rcv, 10531da177e4SLinus Torvalds .err_handler = sctp_v4_err, 10541da177e4SLinus Torvalds .no_policy = 1, 1055bb2db45bSEric W. Biederman .netns_ok = 1, 10568ed1dc44SHannes Frederic Sowa .icmp_strict_tag_validation = 1, 10571da177e4SLinus Torvalds }; 10581da177e4SLinus Torvalds 10591da177e4SLinus Torvalds /* IPv4 address related functions. */ 106015efbe76SNeil Horman static struct sctp_af sctp_af_inet = { 1061543d9cfeSArnaldo Carvalho de Melo .sa_family = AF_INET, 10621da177e4SLinus Torvalds .sctp_xmit = sctp_v4_xmit, 10631da177e4SLinus Torvalds .setsockopt = ip_setsockopt, 10641da177e4SLinus Torvalds .getsockopt = ip_getsockopt, 10651da177e4SLinus Torvalds .get_dst = sctp_v4_get_dst, 10661da177e4SLinus Torvalds .get_saddr = sctp_v4_get_saddr, 10671da177e4SLinus Torvalds .copy_addrlist = sctp_v4_copy_addrlist, 10681da177e4SLinus Torvalds .from_skb = sctp_v4_from_skb, 10691da177e4SLinus Torvalds .from_sk = sctp_v4_from_sk, 10701da177e4SLinus Torvalds .from_addr_param = sctp_v4_from_addr_param, 10711da177e4SLinus Torvalds .to_addr_param = sctp_v4_to_addr_param, 10721da177e4SLinus Torvalds .cmp_addr = sctp_v4_cmp_addr, 10731da177e4SLinus Torvalds .addr_valid = sctp_v4_addr_valid, 10741da177e4SLinus Torvalds .inaddr_any = sctp_v4_inaddr_any, 10751da177e4SLinus Torvalds .is_any = sctp_v4_is_any, 10761da177e4SLinus Torvalds .available = sctp_v4_available, 10771da177e4SLinus Torvalds .scope = sctp_v4_scope, 10781da177e4SLinus Torvalds .skb_iif = sctp_v4_skb_iif, 10791da177e4SLinus Torvalds .is_ce = sctp_v4_is_ce, 10801da177e4SLinus Torvalds .seq_dump_addr = sctp_v4_seq_dump_addr, 1081b9031d9dSVlad Yasevich .ecn_capable = sctp_v4_ecn_capable, 10821da177e4SLinus Torvalds .net_header_len = sizeof(struct iphdr), 10831da177e4SLinus Torvalds .sockaddr_len = sizeof(struct sockaddr_in), 1084b7e10c25SRichard Haines .ip_options_len = sctp_v4_ip_options_len, 1085543d9cfeSArnaldo Carvalho de Melo #ifdef CONFIG_COMPAT 1086543d9cfeSArnaldo Carvalho de Melo .compat_setsockopt = compat_ip_setsockopt, 1087543d9cfeSArnaldo Carvalho de Melo .compat_getsockopt = compat_ip_getsockopt, 1088543d9cfeSArnaldo Carvalho de Melo #endif 10891da177e4SLinus Torvalds }; 10901da177e4SLinus Torvalds 10918d72651dSwangweidong struct sctp_pf *sctp_get_pf_specific(sa_family_t family) 10928d72651dSwangweidong { 10931da177e4SLinus Torvalds switch (family) { 10941da177e4SLinus Torvalds case PF_INET: 10951da177e4SLinus Torvalds return sctp_pf_inet_specific; 10961da177e4SLinus Torvalds case PF_INET6: 10971da177e4SLinus Torvalds return sctp_pf_inet6_specific; 10981da177e4SLinus Torvalds default: 10991da177e4SLinus Torvalds return NULL; 11001da177e4SLinus Torvalds } 11011da177e4SLinus Torvalds } 11021da177e4SLinus Torvalds 11031da177e4SLinus Torvalds /* Register the PF specific function table. */ 11041da177e4SLinus Torvalds int sctp_register_pf(struct sctp_pf *pf, sa_family_t family) 11051da177e4SLinus Torvalds { 11061da177e4SLinus Torvalds switch (family) { 11071da177e4SLinus Torvalds case PF_INET: 11081da177e4SLinus Torvalds if (sctp_pf_inet_specific) 11091da177e4SLinus Torvalds return 0; 11101da177e4SLinus Torvalds sctp_pf_inet_specific = pf; 11111da177e4SLinus Torvalds break; 11121da177e4SLinus Torvalds case PF_INET6: 11131da177e4SLinus Torvalds if (sctp_pf_inet6_specific) 11141da177e4SLinus Torvalds return 0; 11151da177e4SLinus Torvalds sctp_pf_inet6_specific = pf; 11161da177e4SLinus Torvalds break; 11171da177e4SLinus Torvalds default: 11181da177e4SLinus Torvalds return 0; 11191da177e4SLinus Torvalds } 11201da177e4SLinus Torvalds return 1; 11211da177e4SLinus Torvalds } 11221da177e4SLinus Torvalds 1123b01a2407SEric W. Biederman static inline int init_sctp_mibs(struct net *net) 11241da177e4SLinus Torvalds { 1125698365faSWANG Cong net->sctp.sctp_statistics = alloc_percpu(struct sctp_mib); 1126698365faSWANG Cong if (!net->sctp.sctp_statistics) 1127698365faSWANG Cong return -ENOMEM; 1128698365faSWANG Cong return 0; 11291da177e4SLinus Torvalds } 11301da177e4SLinus Torvalds 1131b01a2407SEric W. Biederman static inline void cleanup_sctp_mibs(struct net *net) 11321da177e4SLinus Torvalds { 1133698365faSWANG Cong free_percpu(net->sctp.sctp_statistics); 11341da177e4SLinus Torvalds } 11351da177e4SLinus Torvalds 1136270637abSVlad Yasevich static void sctp_v4_pf_init(void) 1137270637abSVlad Yasevich { 1138270637abSVlad Yasevich /* Initialize the SCTP specific PF functions. */ 1139270637abSVlad Yasevich sctp_register_pf(&sctp_pf_inet, PF_INET); 1140270637abSVlad Yasevich sctp_register_af(&sctp_af_inet); 1141270637abSVlad Yasevich } 1142270637abSVlad Yasevich 1143270637abSVlad Yasevich static void sctp_v4_pf_exit(void) 1144270637abSVlad Yasevich { 1145270637abSVlad Yasevich list_del(&sctp_af_inet.list); 1146270637abSVlad Yasevich } 1147270637abSVlad Yasevich 1148270637abSVlad Yasevich static int sctp_v4_protosw_init(void) 1149270637abSVlad Yasevich { 1150270637abSVlad Yasevich int rc; 1151270637abSVlad Yasevich 1152270637abSVlad Yasevich rc = proto_register(&sctp_prot, 1); 1153270637abSVlad Yasevich if (rc) 1154270637abSVlad Yasevich return rc; 1155270637abSVlad Yasevich 1156270637abSVlad Yasevich /* Register SCTP(UDP and TCP style) with socket layer. */ 1157270637abSVlad Yasevich inet_register_protosw(&sctp_seqpacket_protosw); 1158270637abSVlad Yasevich inet_register_protosw(&sctp_stream_protosw); 1159270637abSVlad Yasevich 1160270637abSVlad Yasevich return 0; 1161270637abSVlad Yasevich } 1162270637abSVlad Yasevich 1163270637abSVlad Yasevich static void sctp_v4_protosw_exit(void) 1164270637abSVlad Yasevich { 1165270637abSVlad Yasevich inet_unregister_protosw(&sctp_stream_protosw); 1166270637abSVlad Yasevich inet_unregister_protosw(&sctp_seqpacket_protosw); 1167270637abSVlad Yasevich proto_unregister(&sctp_prot); 1168270637abSVlad Yasevich } 1169270637abSVlad Yasevich 1170270637abSVlad Yasevich static int sctp_v4_add_protocol(void) 1171270637abSVlad Yasevich { 1172270637abSVlad Yasevich /* Register notifier for inet address additions/deletions. */ 1173270637abSVlad Yasevich register_inetaddr_notifier(&sctp_inetaddr_notifier); 1174270637abSVlad Yasevich 1175270637abSVlad Yasevich /* Register SCTP with inet layer. */ 1176270637abSVlad Yasevich if (inet_add_protocol(&sctp_protocol, IPPROTO_SCTP) < 0) 1177270637abSVlad Yasevich return -EAGAIN; 1178270637abSVlad Yasevich 1179270637abSVlad Yasevich return 0; 1180270637abSVlad Yasevich } 1181270637abSVlad Yasevich 1182270637abSVlad Yasevich static void sctp_v4_del_protocol(void) 1183270637abSVlad Yasevich { 1184270637abSVlad Yasevich inet_del_protocol(&sctp_protocol, IPPROTO_SCTP); 1185270637abSVlad Yasevich unregister_inetaddr_notifier(&sctp_inetaddr_notifier); 1186270637abSVlad Yasevich } 1187270637abSVlad Yasevich 11888e2d61e0SMarcelo Ricardo Leitner static int __net_init sctp_defaults_init(struct net *net) 11894db67e80SEric W. Biederman { 11902ce95503SEric W. Biederman int status; 11912ce95503SEric W. Biederman 1192e1fc3b14SEric W. Biederman /* 1193e1fc3b14SEric W. Biederman * 14. Suggested SCTP Protocol Parameter Values 1194e1fc3b14SEric W. Biederman */ 1195e1fc3b14SEric W. Biederman /* The following protocol parameters are RECOMMENDED: */ 1196e1fc3b14SEric W. Biederman /* RTO.Initial - 3 seconds */ 1197e1fc3b14SEric W. Biederman net->sctp.rto_initial = SCTP_RTO_INITIAL; 1198e1fc3b14SEric W. Biederman /* RTO.Min - 1 second */ 1199e1fc3b14SEric W. Biederman net->sctp.rto_min = SCTP_RTO_MIN; 1200e1fc3b14SEric W. Biederman /* RTO.Max - 60 seconds */ 1201e1fc3b14SEric W. Biederman net->sctp.rto_max = SCTP_RTO_MAX; 1202e1fc3b14SEric W. Biederman /* RTO.Alpha - 1/8 */ 1203e1fc3b14SEric W. Biederman net->sctp.rto_alpha = SCTP_RTO_ALPHA; 1204e1fc3b14SEric W. Biederman /* RTO.Beta - 1/4 */ 1205e1fc3b14SEric W. Biederman net->sctp.rto_beta = SCTP_RTO_BETA; 1206e1fc3b14SEric W. Biederman 1207e1fc3b14SEric W. Biederman /* Valid.Cookie.Life - 60 seconds */ 1208e1fc3b14SEric W. Biederman net->sctp.valid_cookie_life = SCTP_DEFAULT_COOKIE_LIFE; 1209e1fc3b14SEric W. Biederman 1210e1fc3b14SEric W. Biederman /* Whether Cookie Preservative is enabled(1) or not(0) */ 1211e1fc3b14SEric W. Biederman net->sctp.cookie_preserve_enable = 1; 1212e1fc3b14SEric W. Biederman 12133c68198eSNeil Horman /* Default sctp sockets to use md5 as their hmac alg */ 12140d0863b0SNeil Horman #if defined (CONFIG_SCTP_DEFAULT_COOKIE_HMAC_MD5) 12153c68198eSNeil Horman net->sctp.sctp_hmac_alg = "md5"; 12160d0863b0SNeil Horman #elif defined (CONFIG_SCTP_DEFAULT_COOKIE_HMAC_SHA1) 12173c68198eSNeil Horman net->sctp.sctp_hmac_alg = "sha1"; 12183c68198eSNeil Horman #else 12193c68198eSNeil Horman net->sctp.sctp_hmac_alg = NULL; 12203c68198eSNeil Horman #endif 12213c68198eSNeil Horman 1222e1fc3b14SEric W. Biederman /* Max.Burst - 4 */ 1223e1fc3b14SEric W. Biederman net->sctp.max_burst = SCTP_DEFAULT_MAX_BURST; 1224e1fc3b14SEric W. Biederman 122534515e94SXin Long /* Disable of Primary Path Switchover by default */ 122634515e94SXin Long net->sctp.ps_retrans = SCTP_PS_RETRANS_MAX; 122734515e94SXin Long 1228566178f8SZhu Yanjun /* Enable pf state by default */ 1229566178f8SZhu Yanjun net->sctp.pf_enable = 1; 1230566178f8SZhu Yanjun 1231aef587beSXin Long /* Ignore pf exposure feature by default */ 1232aef587beSXin Long net->sctp.pf_expose = SCTP_PF_EXPOSE_UNSET; 1233aef587beSXin Long 1234e1fc3b14SEric W. Biederman /* Association.Max.Retrans - 10 attempts 1235e1fc3b14SEric W. Biederman * Path.Max.Retrans - 5 attempts (per destination address) 1236e1fc3b14SEric W. Biederman * Max.Init.Retransmits - 8 attempts 1237e1fc3b14SEric W. Biederman */ 1238e1fc3b14SEric W. Biederman net->sctp.max_retrans_association = 10; 1239e1fc3b14SEric W. Biederman net->sctp.max_retrans_path = 5; 1240e1fc3b14SEric W. Biederman net->sctp.max_retrans_init = 8; 1241e1fc3b14SEric W. Biederman 1242e1fc3b14SEric W. Biederman /* Sendbuffer growth - do per-socket accounting */ 1243e1fc3b14SEric W. Biederman net->sctp.sndbuf_policy = 0; 1244e1fc3b14SEric W. Biederman 1245e1fc3b14SEric W. Biederman /* Rcvbuffer growth - do per-socket accounting */ 1246e1fc3b14SEric W. Biederman net->sctp.rcvbuf_policy = 0; 1247e1fc3b14SEric W. Biederman 1248e1fc3b14SEric W. Biederman /* HB.interval - 30 seconds */ 1249e1fc3b14SEric W. Biederman net->sctp.hb_interval = SCTP_DEFAULT_TIMEOUT_HEARTBEAT; 1250e1fc3b14SEric W. Biederman 1251e1fc3b14SEric W. Biederman /* delayed SACK timeout */ 1252e1fc3b14SEric W. Biederman net->sctp.sack_timeout = SCTP_DEFAULT_TIMEOUT_SACK; 1253e1fc3b14SEric W. Biederman 1254e1fc3b14SEric W. Biederman /* Disable ADDIP by default. */ 1255e1fc3b14SEric W. Biederman net->sctp.addip_enable = 0; 1256e1fc3b14SEric W. Biederman net->sctp.addip_noauth = 0; 1257e1fc3b14SEric W. Biederman net->sctp.default_auto_asconf = 0; 1258e1fc3b14SEric W. Biederman 1259e1fc3b14SEric W. Biederman /* Enable PR-SCTP by default. */ 1260e1fc3b14SEric W. Biederman net->sctp.prsctp_enable = 1; 1261e1fc3b14SEric W. Biederman 1262c28445c3SXin Long /* Disable RECONF by default. */ 1263c28445c3SXin Long net->sctp.reconf_enable = 0; 1264c28445c3SXin Long 1265e1fc3b14SEric W. Biederman /* Disable AUTH by default. */ 1266e1fc3b14SEric W. Biederman net->sctp.auth_enable = 0; 1267e1fc3b14SEric W. Biederman 12681b0b8114SXin Long /* Enable ECN by default. */ 12691b0b8114SXin Long net->sctp.ecn_enable = 1; 12701b0b8114SXin Long 1271e1fc3b14SEric W. Biederman /* Set SCOPE policy to enabled */ 1272e1fc3b14SEric W. Biederman net->sctp.scope_policy = SCTP_SCOPE_POLICY_ENABLE; 1273e1fc3b14SEric W. Biederman 1274e1fc3b14SEric W. Biederman /* Set the default rwnd update threshold */ 1275e1fc3b14SEric W. Biederman net->sctp.rwnd_upd_shift = SCTP_DEFAULT_RWND_SHIFT; 1276e1fc3b14SEric W. Biederman 1277e1fc3b14SEric W. Biederman /* Initialize maximum autoclose timeout. */ 1278e1fc3b14SEric W. Biederman net->sctp.max_autoclose = INT_MAX / HZ; 1279e1fc3b14SEric W. Biederman 1280ebb7e95dSEric W. Biederman status = sctp_sysctl_net_register(net); 1281ebb7e95dSEric W. Biederman if (status) 1282ebb7e95dSEric W. Biederman goto err_sysctl_register; 1283ebb7e95dSEric W. Biederman 1284b01a2407SEric W. Biederman /* Allocate and initialise sctp mibs. */ 1285b01a2407SEric W. Biederman status = init_sctp_mibs(net); 1286b01a2407SEric W. Biederman if (status) 1287b01a2407SEric W. Biederman goto err_init_mibs; 1288b01a2407SEric W. Biederman 1289d47d08c8SAl Viro #ifdef CONFIG_PROC_FS 129013d782f6SEric W. Biederman /* Initialize proc fs directory. */ 129113d782f6SEric W. Biederman status = sctp_proc_init(net); 129213d782f6SEric W. Biederman if (status) 129313d782f6SEric W. Biederman goto err_init_proc; 1294d47d08c8SAl Viro #endif 129513d782f6SEric W. Biederman 129613d782f6SEric W. Biederman sctp_dbg_objcnt_init(net); 129713d782f6SEric W. Biederman 12984db67e80SEric W. Biederman /* Initialize the local address list. */ 12994db67e80SEric W. Biederman INIT_LIST_HEAD(&net->sctp.local_addr_list); 13004db67e80SEric W. Biederman spin_lock_init(&net->sctp.local_addr_lock); 13014db67e80SEric W. Biederman sctp_get_local_addr_list(net); 13024db67e80SEric W. Biederman 13034db67e80SEric W. Biederman /* Initialize the address event list */ 13044db67e80SEric W. Biederman INIT_LIST_HEAD(&net->sctp.addr_waitq); 13054db67e80SEric W. Biederman INIT_LIST_HEAD(&net->sctp.auto_asconf_splist); 13064db67e80SEric W. Biederman spin_lock_init(&net->sctp.addr_wq_lock); 13074db67e80SEric W. Biederman net->sctp.addr_wq_timer.expires = 0; 13089c3b5751SKees Cook timer_setup(&net->sctp.addr_wq_timer, sctp_addr_wq_timeout_handler, 0); 13094db67e80SEric W. Biederman 13104db67e80SEric W. Biederman return 0; 13112ce95503SEric W. Biederman 13127ae665f1SArnd Bergmann #ifdef CONFIG_PROC_FS 131313d782f6SEric W. Biederman err_init_proc: 1314b01a2407SEric W. Biederman cleanup_sctp_mibs(net); 13157ae665f1SArnd Bergmann #endif 1316b01a2407SEric W. Biederman err_init_mibs: 1317ebb7e95dSEric W. Biederman sctp_sysctl_net_unregister(net); 1318ebb7e95dSEric W. Biederman err_sysctl_register: 13192ce95503SEric W. Biederman return status; 13204db67e80SEric W. Biederman } 13214db67e80SEric W. Biederman 13228e2d61e0SMarcelo Ricardo Leitner static void __net_exit sctp_defaults_exit(struct net *net) 13234db67e80SEric W. Biederman { 13244db67e80SEric W. Biederman /* Free the local address list */ 13254db67e80SEric W. Biederman sctp_free_addr_wq(net); 13264db67e80SEric W. Biederman sctp_free_local_addr_list(net); 13272ce95503SEric W. Biederman 1328d47d08c8SAl Viro #ifdef CONFIG_PROC_FS 1329d47d08c8SAl Viro remove_proc_subtree("sctp", net->proc_net); 1330d47d08c8SAl Viro net->sctp.proc_net_sctp = NULL; 1331d47d08c8SAl Viro #endif 1332b01a2407SEric W. Biederman cleanup_sctp_mibs(net); 1333ebb7e95dSEric W. Biederman sctp_sysctl_net_unregister(net); 13344db67e80SEric W. Biederman } 13354db67e80SEric W. Biederman 13368e2d61e0SMarcelo Ricardo Leitner static struct pernet_operations sctp_defaults_ops = { 13378e2d61e0SMarcelo Ricardo Leitner .init = sctp_defaults_init, 13388e2d61e0SMarcelo Ricardo Leitner .exit = sctp_defaults_exit, 13398e2d61e0SMarcelo Ricardo Leitner }; 13408e2d61e0SMarcelo Ricardo Leitner 13418e2d61e0SMarcelo Ricardo Leitner static int __net_init sctp_ctrlsock_init(struct net *net) 13428e2d61e0SMarcelo Ricardo Leitner { 13438e2d61e0SMarcelo Ricardo Leitner int status; 13448e2d61e0SMarcelo Ricardo Leitner 13458e2d61e0SMarcelo Ricardo Leitner /* Initialize the control inode/socket for handling OOTB packets. */ 13468e2d61e0SMarcelo Ricardo Leitner status = sctp_ctl_sock_init(net); 13478e2d61e0SMarcelo Ricardo Leitner if (status) 13488e2d61e0SMarcelo Ricardo Leitner pr_err("Failed to initialize the SCTP control sock\n"); 13498e2d61e0SMarcelo Ricardo Leitner 13508e2d61e0SMarcelo Ricardo Leitner return status; 13518e2d61e0SMarcelo Ricardo Leitner } 13528e2d61e0SMarcelo Ricardo Leitner 1353b456d724SChristophe JAILLET static void __net_exit sctp_ctrlsock_exit(struct net *net) 13548e2d61e0SMarcelo Ricardo Leitner { 13558e2d61e0SMarcelo Ricardo Leitner /* Free the control endpoint. */ 13568e2d61e0SMarcelo Ricardo Leitner inet_ctl_sock_destroy(net->sctp.ctl_sock); 13578e2d61e0SMarcelo Ricardo Leitner } 13588e2d61e0SMarcelo Ricardo Leitner 13598e2d61e0SMarcelo Ricardo Leitner static struct pernet_operations sctp_ctrlsock_ops = { 13608e2d61e0SMarcelo Ricardo Leitner .init = sctp_ctrlsock_init, 13618e2d61e0SMarcelo Ricardo Leitner .exit = sctp_ctrlsock_exit, 13624db67e80SEric W. Biederman }; 13634db67e80SEric W. Biederman 13641da177e4SLinus Torvalds /* Initialize the universe into something sensible. */ 1365dda91928SDaniel Borkmann static __init int sctp_init(void) 13661da177e4SLinus Torvalds { 13671da177e4SLinus Torvalds int i; 13681da177e4SLinus Torvalds int status = -EINVAL; 13691da177e4SLinus Torvalds unsigned long goal; 13704d93df0aSNeil Horman unsigned long limit; 1371ca79b0c2SArun KS unsigned long nr_pages = totalram_pages(); 13724d93df0aSNeil Horman int max_share; 13731da177e4SLinus Torvalds int order; 1374d9749fb5SNeil Horman int num_entries; 1375d9749fb5SNeil Horman int max_entry_order; 13761da177e4SLinus Torvalds 1377b4772ef8SEyal Birger sock_skb_cb_check_size(sizeof(struct sctp_ulpevent)); 13781da177e4SLinus Torvalds 1379827bf122SSridhar Samudrala /* Allocate bind_bucket and chunk caches. */ 13801da177e4SLinus Torvalds status = -ENOBUFS; 13811da177e4SLinus Torvalds sctp_bucket_cachep = kmem_cache_create("sctp_bind_bucket", 13821da177e4SLinus Torvalds sizeof(struct sctp_bind_bucket), 13831da177e4SLinus Torvalds 0, SLAB_HWCACHE_ALIGN, 138420c2df83SPaul Mundt NULL); 13851da177e4SLinus Torvalds if (!sctp_bucket_cachep) 1386827bf122SSridhar Samudrala goto out; 13871da177e4SLinus Torvalds 13881da177e4SLinus Torvalds sctp_chunk_cachep = kmem_cache_create("sctp_chunk", 13891da177e4SLinus Torvalds sizeof(struct sctp_chunk), 13901da177e4SLinus Torvalds 0, SLAB_HWCACHE_ALIGN, 139120c2df83SPaul Mundt NULL); 13921da177e4SLinus Torvalds if (!sctp_chunk_cachep) 13931da177e4SLinus Torvalds goto err_chunk_cachep; 13941da177e4SLinus Torvalds 1395908c7f19STejun Heo status = percpu_counter_init(&sctp_sockets_allocated, 0, GFP_KERNEL); 1396632c928aSEric W. Biederman if (status) 1397632c928aSEric W. Biederman goto err_percpu_counter_init; 1398632c928aSEric W. Biederman 13991da177e4SLinus Torvalds /* Implementation specific variables. */ 14001da177e4SLinus Torvalds 14011da177e4SLinus Torvalds /* Initialize default stream count setup information. */ 14021da177e4SLinus Torvalds sctp_max_instreams = SCTP_DEFAULT_INSTREAMS; 14031da177e4SLinus Torvalds sctp_max_outstreams = SCTP_DEFAULT_OUTSTREAMS; 14041da177e4SLinus Torvalds 14051da177e4SLinus Torvalds /* Initialize handle used for association ids. */ 14061da177e4SLinus Torvalds idr_init(&sctp_assocs_id); 14071da177e4SLinus Torvalds 1408f03d78dbSEric Dumazet limit = nr_free_buffer_pages() / 8; 14094d93df0aSNeil Horman limit = max(limit, 128UL); 14104d93df0aSNeil Horman sysctl_sctp_mem[0] = limit / 4 * 3; 14114d93df0aSNeil Horman sysctl_sctp_mem[1] = limit; 14124d93df0aSNeil Horman sysctl_sctp_mem[2] = sysctl_sctp_mem[0] * 2; 14134d93df0aSNeil Horman 14144d93df0aSNeil Horman /* Set per-socket limits to no more than 1/128 the pressure threshold*/ 14154d93df0aSNeil Horman limit = (sysctl_sctp_mem[1]) << (PAGE_SHIFT - 7); 14164d93df0aSNeil Horman max_share = min(4UL*1024*1024, limit); 14174d93df0aSNeil Horman 1418845525a6SVlad Yasevich sysctl_sctp_rmem[0] = SK_MEM_QUANTUM; /* give each asoc 1 page min */ 141987fb4b7bSEric Dumazet sysctl_sctp_rmem[1] = 1500 * SKB_TRUESIZE(1); 14204d93df0aSNeil Horman sysctl_sctp_rmem[2] = max(sysctl_sctp_rmem[1], max_share); 14214d93df0aSNeil Horman 14223ab224beSHideo Aoki sysctl_sctp_wmem[0] = SK_MEM_QUANTUM; 14234d93df0aSNeil Horman sysctl_sctp_wmem[1] = 16*1024; 14244d93df0aSNeil Horman sysctl_sctp_wmem[2] = max(64*1024, max_share); 14254d93df0aSNeil Horman 14261da177e4SLinus Torvalds /* Size and allocate the association hash table. 14271da177e4SLinus Torvalds * The methodology is similar to that of the tcp hash tables. 1428d9749fb5SNeil Horman * Though not identical. Start by getting a goal size 14291da177e4SLinus Torvalds */ 14303d6357deSArun KS if (nr_pages >= (128 * 1024)) 14313d6357deSArun KS goal = nr_pages >> (22 - PAGE_SHIFT); 14321da177e4SLinus Torvalds else 14333d6357deSArun KS goal = nr_pages >> (24 - PAGE_SHIFT); 14341da177e4SLinus Torvalds 1435d9749fb5SNeil Horman /* Then compute the page order for said goal */ 1436d9749fb5SNeil Horman order = get_order(goal); 1437d9749fb5SNeil Horman 1438d9749fb5SNeil Horman /* Now compute the required page order for the maximum sized table we 1439d9749fb5SNeil Horman * want to create 1440d9749fb5SNeil Horman */ 1441d9749fb5SNeil Horman max_entry_order = get_order(MAX_SCTP_PORT_HASH_ENTRIES * 1442d9749fb5SNeil Horman sizeof(struct sctp_bind_hashbucket)); 1443d9749fb5SNeil Horman 1444d9749fb5SNeil Horman /* Limit the page order by that maximum hash table size */ 1445d9749fb5SNeil Horman order = min(order, max_entry_order); 14461da177e4SLinus Torvalds 14471da177e4SLinus Torvalds /* Allocate and initialize the endpoint hash table. */ 14481da177e4SLinus Torvalds sctp_ep_hashsize = 64; 14493b77d661SZhang Yanfei sctp_ep_hashtable = 14506da2ec56SKees Cook kmalloc_array(64, sizeof(struct sctp_hashbucket), GFP_KERNEL); 14511da177e4SLinus Torvalds if (!sctp_ep_hashtable) { 1452145ce502SJoe Perches pr_err("Failed endpoint_hash alloc\n"); 14531da177e4SLinus Torvalds status = -ENOMEM; 14541da177e4SLinus Torvalds goto err_ehash_alloc; 14551da177e4SLinus Torvalds } 14561da177e4SLinus Torvalds for (i = 0; i < sctp_ep_hashsize; i++) { 14571da177e4SLinus Torvalds rwlock_init(&sctp_ep_hashtable[i].lock); 1458d970dbf8SVlad Yasevich INIT_HLIST_HEAD(&sctp_ep_hashtable[i].chain); 14591da177e4SLinus Torvalds } 14601da177e4SLinus Torvalds 1461d9749fb5SNeil Horman /* Allocate and initialize the SCTP port hash table. 1462d9749fb5SNeil Horman * Note that order is initalized to start at the max sized 1463d9749fb5SNeil Horman * table we want to support. If we can't get that many pages 1464d9749fb5SNeil Horman * reduce the order and try again 1465d9749fb5SNeil Horman */ 14661da177e4SLinus Torvalds do { 14671da177e4SLinus Torvalds sctp_port_hashtable = (struct sctp_bind_hashbucket *) 14686857a02aSEric Dumazet __get_free_pages(GFP_KERNEL | __GFP_NOWARN, order); 14691da177e4SLinus Torvalds } while (!sctp_port_hashtable && --order > 0); 1470d9749fb5SNeil Horman 14711da177e4SLinus Torvalds if (!sctp_port_hashtable) { 1472145ce502SJoe Perches pr_err("Failed bind hash alloc\n"); 14731da177e4SLinus Torvalds status = -ENOMEM; 14741da177e4SLinus Torvalds goto err_bhash_alloc; 14751da177e4SLinus Torvalds } 1476d9749fb5SNeil Horman 1477d9749fb5SNeil Horman /* Now compute the number of entries that will fit in the 1478d9749fb5SNeil Horman * port hash space we allocated 1479d9749fb5SNeil Horman */ 1480d9749fb5SNeil Horman num_entries = (1UL << order) * PAGE_SIZE / 1481d9749fb5SNeil Horman sizeof(struct sctp_bind_hashbucket); 1482d9749fb5SNeil Horman 1483d9749fb5SNeil Horman /* And finish by rounding it down to the nearest power of two 1484d9749fb5SNeil Horman * this wastes some memory of course, but its needed because 1485d9749fb5SNeil Horman * the hash function operates based on the assumption that 1486d9749fb5SNeil Horman * that the number of entries is a power of two 1487d9749fb5SNeil Horman */ 1488d9749fb5SNeil Horman sctp_port_hashsize = rounddown_pow_of_two(num_entries); 1489d9749fb5SNeil Horman 14901da177e4SLinus Torvalds for (i = 0; i < sctp_port_hashsize; i++) { 14911da177e4SLinus Torvalds spin_lock_init(&sctp_port_hashtable[i].lock); 1492d970dbf8SVlad Yasevich INIT_HLIST_HEAD(&sctp_port_hashtable[i].chain); 14931da177e4SLinus Torvalds } 14941da177e4SLinus Torvalds 1495a5e27d18SWei Yongjun status = sctp_transport_hashtable_init(); 1496a5e27d18SWei Yongjun if (status) 14974f008781SXin Long goto err_thash_alloc; 14984f008781SXin Long 1499d9749fb5SNeil Horman pr_info("Hash tables configured (bind %d/%d)\n", sctp_port_hashsize, 1500d9749fb5SNeil Horman num_entries); 15011da177e4SLinus Torvalds 15021da177e4SLinus Torvalds sctp_sysctl_register(); 15031da177e4SLinus Torvalds 15041da177e4SLinus Torvalds INIT_LIST_HEAD(&sctp_address_families); 1505270637abSVlad Yasevich sctp_v4_pf_init(); 1506270637abSVlad Yasevich sctp_v6_pf_init(); 15071ba896f6SXin Long sctp_sched_ops_init(); 15081da177e4SLinus Torvalds 15098e2d61e0SMarcelo Ricardo Leitner status = register_pernet_subsys(&sctp_defaults_ops); 15108e2d61e0SMarcelo Ricardo Leitner if (status) 15118e2d61e0SMarcelo Ricardo Leitner goto err_register_defaults; 1512270637abSVlad Yasevich 15138e2d61e0SMarcelo Ricardo Leitner status = sctp_v4_protosw_init(); 1514827bf122SSridhar Samudrala if (status) 1515270637abSVlad Yasevich goto err_protosw_init; 1516827bf122SSridhar Samudrala 1517270637abSVlad Yasevich status = sctp_v6_protosw_init(); 15181da177e4SLinus Torvalds if (status) 1519270637abSVlad Yasevich goto err_v6_protosw_init; 15201da177e4SLinus Torvalds 15218e2d61e0SMarcelo Ricardo Leitner status = register_pernet_subsys(&sctp_ctrlsock_ops); 15224db67e80SEric W. Biederman if (status) 15238e2d61e0SMarcelo Ricardo Leitner goto err_register_ctrlsock; 15244db67e80SEric W. Biederman 1525270637abSVlad Yasevich status = sctp_v4_add_protocol(); 1526270637abSVlad Yasevich if (status) 1527827bf122SSridhar Samudrala goto err_add_protocol; 1528827bf122SSridhar Samudrala 1529827bf122SSridhar Samudrala /* Register SCTP with inet6 layer. */ 1530827bf122SSridhar Samudrala status = sctp_v6_add_protocol(); 1531827bf122SSridhar Samudrala if (status) 1532827bf122SSridhar Samudrala goto err_v6_add_protocol; 1533827bf122SSridhar Samudrala 153490017accSMarcelo Ricardo Leitner if (sctp_offload_init() < 0) 153590017accSMarcelo Ricardo Leitner pr_crit("%s: Cannot add SCTP protocol offload\n", __func__); 153690017accSMarcelo Ricardo Leitner 15371da177e4SLinus Torvalds out: 15381da177e4SLinus Torvalds return status; 1539827bf122SSridhar Samudrala err_v6_add_protocol: 1540270637abSVlad Yasevich sctp_v4_del_protocol(); 1541d1dd5247SVlad Yasevich err_add_protocol: 15428e2d61e0SMarcelo Ricardo Leitner unregister_pernet_subsys(&sctp_ctrlsock_ops); 15438e2d61e0SMarcelo Ricardo Leitner err_register_ctrlsock: 1544270637abSVlad Yasevich sctp_v6_protosw_exit(); 1545270637abSVlad Yasevich err_v6_protosw_init: 1546270637abSVlad Yasevich sctp_v4_protosw_exit(); 1547270637abSVlad Yasevich err_protosw_init: 15488e2d61e0SMarcelo Ricardo Leitner unregister_pernet_subsys(&sctp_defaults_ops); 15498e2d61e0SMarcelo Ricardo Leitner err_register_defaults: 1550270637abSVlad Yasevich sctp_v4_pf_exit(); 1551270637abSVlad Yasevich sctp_v6_pf_exit(); 15521da177e4SLinus Torvalds sctp_sysctl_unregister(); 15531da177e4SLinus Torvalds free_pages((unsigned long)sctp_port_hashtable, 15541da177e4SLinus Torvalds get_order(sctp_port_hashsize * 15551da177e4SLinus Torvalds sizeof(struct sctp_bind_hashbucket))); 15561da177e4SLinus Torvalds err_bhash_alloc: 15574f008781SXin Long sctp_transport_hashtable_destroy(); 15584f008781SXin Long err_thash_alloc: 15591da177e4SLinus Torvalds kfree(sctp_ep_hashtable); 15601da177e4SLinus Torvalds err_ehash_alloc: 1561632c928aSEric W. Biederman percpu_counter_destroy(&sctp_sockets_allocated); 1562632c928aSEric W. Biederman err_percpu_counter_init: 15631da177e4SLinus Torvalds kmem_cache_destroy(sctp_chunk_cachep); 15641da177e4SLinus Torvalds err_chunk_cachep: 15651da177e4SLinus Torvalds kmem_cache_destroy(sctp_bucket_cachep); 15661da177e4SLinus Torvalds goto out; 15671da177e4SLinus Torvalds } 15681da177e4SLinus Torvalds 15691da177e4SLinus Torvalds /* Exit handler for the SCTP protocol. */ 1570dda91928SDaniel Borkmann static __exit void sctp_exit(void) 15711da177e4SLinus Torvalds { 15721da177e4SLinus Torvalds /* BUG. This should probably do something useful like clean 15731da177e4SLinus Torvalds * up all the remaining associations and all that memory. 15741da177e4SLinus Torvalds */ 15751da177e4SLinus Torvalds 1576827bf122SSridhar Samudrala /* Unregister with inet6/inet layers. */ 1577827bf122SSridhar Samudrala sctp_v6_del_protocol(); 1578270637abSVlad Yasevich sctp_v4_del_protocol(); 15791da177e4SLinus Torvalds 15808e2d61e0SMarcelo Ricardo Leitner unregister_pernet_subsys(&sctp_ctrlsock_ops); 15814db67e80SEric W. Biederman 1582270637abSVlad Yasevich /* Free protosw registrations */ 1583270637abSVlad Yasevich sctp_v6_protosw_exit(); 1584270637abSVlad Yasevich sctp_v4_protosw_exit(); 1585270637abSVlad Yasevich 15868e2d61e0SMarcelo Ricardo Leitner unregister_pernet_subsys(&sctp_defaults_ops); 15878e2d61e0SMarcelo Ricardo Leitner 1588827bf122SSridhar Samudrala /* Unregister with socket layer. */ 1589270637abSVlad Yasevich sctp_v6_pf_exit(); 1590270637abSVlad Yasevich sctp_v4_pf_exit(); 1591827bf122SSridhar Samudrala 15921da177e4SLinus Torvalds sctp_sysctl_unregister(); 15931da177e4SLinus Torvalds 15941da177e4SLinus Torvalds free_pages((unsigned long)sctp_port_hashtable, 15951da177e4SLinus Torvalds get_order(sctp_port_hashsize * 15961da177e4SLinus Torvalds sizeof(struct sctp_bind_hashbucket))); 1597b5eff712SXin Long kfree(sctp_ep_hashtable); 15984f008781SXin Long sctp_transport_hashtable_destroy(); 15991da177e4SLinus Torvalds 1600632c928aSEric W. Biederman percpu_counter_destroy(&sctp_sockets_allocated); 16011da177e4SLinus Torvalds 1602eaa184a1SJesper Dangaard Brouer rcu_barrier(); /* Wait for completion of call_rcu()'s */ 1603eaa184a1SJesper Dangaard Brouer 1604827bf122SSridhar Samudrala kmem_cache_destroy(sctp_chunk_cachep); 1605827bf122SSridhar Samudrala kmem_cache_destroy(sctp_bucket_cachep); 16061da177e4SLinus Torvalds } 16071da177e4SLinus Torvalds 16081da177e4SLinus Torvalds module_init(sctp_init); 16091da177e4SLinus Torvalds module_exit(sctp_exit); 16101da177e4SLinus Torvalds 1611bb97d31fSArnaldo Carvalho de Melo /* 1612bb97d31fSArnaldo Carvalho de Melo * __stringify doesn't likes enums, so use IPPROTO_SCTP value (132) directly. 1613bb97d31fSArnaldo Carvalho de Melo */ 1614bb97d31fSArnaldo Carvalho de Melo MODULE_ALIAS("net-pf-" __stringify(PF_INET) "-proto-132"); 1615882a382cSSridhar Samudrala MODULE_ALIAS("net-pf-" __stringify(PF_INET6) "-proto-132"); 161691705c61SDaniel Borkmann MODULE_AUTHOR("Linux Kernel SCTP developers <linux-sctp@vger.kernel.org>"); 16171da177e4SLinus Torvalds MODULE_DESCRIPTION("Support for the SCTP protocol (RFC2960)"); 161871acc0ddSDavid S. Miller module_param_named(no_checksums, sctp_checksum_disable, bool, 0644); 161971acc0ddSDavid S. Miller MODULE_PARM_DESC(no_checksums, "Disable checksums computing and verification"); 16201da177e4SLinus Torvalds MODULE_LICENSE("GPL"); 1621