1 /* 2 * IPv6 Address [auto]configuration 3 * Linux INET6 implementation 4 * 5 * Authors: 6 * Pedro Roque <roque@di.fc.ul.pt> 7 * Alexey Kuznetsov <kuznet@ms2.inr.ac.ru> 8 * 9 * This program is free software; you can redistribute it and/or 10 * modify it under the terms of the GNU General Public License 11 * as published by the Free Software Foundation; either version 12 * 2 of the License, or (at your option) any later version. 13 */ 14 15 /* 16 * Changes: 17 * 18 * Janos Farkas : delete timer on ifdown 19 * <chexum@bankinf.banki.hu> 20 * Andi Kleen : kill double kfree on module 21 * unload. 22 * Maciej W. Rozycki : FDDI support 23 * sekiya@USAGI : Don't send too many RS 24 * packets. 25 * yoshfuji@USAGI : Fixed interval between DAD 26 * packets. 27 * YOSHIFUJI Hideaki @USAGI : improved accuracy of 28 * address validation timer. 29 * YOSHIFUJI Hideaki @USAGI : Privacy Extensions (RFC3041) 30 * support. 31 * Yuji SEKIYA @USAGI : Don't assign a same IPv6 32 * address on a same interface. 33 * YOSHIFUJI Hideaki @USAGI : ARCnet support 34 * YOSHIFUJI Hideaki @USAGI : convert /proc/net/if_inet6 to 35 * seq_file. 36 * YOSHIFUJI Hideaki @USAGI : improved source address 37 * selection; consider scope, 38 * status etc. 39 */ 40 41 #include <linux/errno.h> 42 #include <linux/types.h> 43 #include <linux/kernel.h> 44 #include <linux/socket.h> 45 #include <linux/sockios.h> 46 #include <linux/net.h> 47 #include <linux/in6.h> 48 #include <linux/netdevice.h> 49 #include <linux/if_addr.h> 50 #include <linux/if_arp.h> 51 #include <linux/if_arcnet.h> 52 #include <linux/if_infiniband.h> 53 #include <linux/route.h> 54 #include <linux/inetdevice.h> 55 #include <linux/init.h> 56 #include <linux/slab.h> 57 #ifdef CONFIG_SYSCTL 58 #include <linux/sysctl.h> 59 #endif 60 #include <linux/capability.h> 61 #include <linux/delay.h> 62 #include <linux/notifier.h> 63 #include <linux/string.h> 64 65 #include <net/net_namespace.h> 66 #include <net/sock.h> 67 #include <net/snmp.h> 68 69 #include <net/ipv6.h> 70 #include <net/protocol.h> 71 #include <net/ndisc.h> 72 #include <net/ip6_route.h> 73 #include <net/addrconf.h> 74 #include <net/tcp.h> 75 #include <net/ip.h> 76 #include <net/netlink.h> 77 #include <net/pkt_sched.h> 78 #include <linux/if_tunnel.h> 79 #include <linux/rtnetlink.h> 80 81 #ifdef CONFIG_IPV6_PRIVACY 82 #include <linux/random.h> 83 #endif 84 85 #include <linux/uaccess.h> 86 #include <asm/unaligned.h> 87 88 #include <linux/proc_fs.h> 89 #include <linux/seq_file.h> 90 91 /* Set to 3 to get tracing... */ 92 #define ACONF_DEBUG 2 93 94 #if ACONF_DEBUG >= 3 95 #define ADBG(x) printk x 96 #else 97 #define ADBG(x) 98 #endif 99 100 #define INFINITY_LIFE_TIME 0xFFFFFFFF 101 #define TIME_DELTA(a, b) ((unsigned long)((long)(a) - (long)(b))) 102 103 #define ADDRCONF_TIMER_FUZZ_MINUS (HZ > 50 ? HZ/50 : 1) 104 #define ADDRCONF_TIMER_FUZZ (HZ / 4) 105 #define ADDRCONF_TIMER_FUZZ_MAX (HZ) 106 107 #ifdef CONFIG_SYSCTL 108 static void addrconf_sysctl_register(struct inet6_dev *idev); 109 static void addrconf_sysctl_unregister(struct inet6_dev *idev); 110 #else 111 static inline void addrconf_sysctl_register(struct inet6_dev *idev) 112 { 113 } 114 115 static inline void addrconf_sysctl_unregister(struct inet6_dev *idev) 116 { 117 } 118 #endif 119 120 #ifdef CONFIG_IPV6_PRIVACY 121 static int __ipv6_regen_rndid(struct inet6_dev *idev); 122 static int __ipv6_try_regen_rndid(struct inet6_dev *idev, struct in6_addr *tmpaddr); 123 static void ipv6_regen_rndid(unsigned long data); 124 125 static int desync_factor = MAX_DESYNC_FACTOR * HZ; 126 #endif 127 128 static int ipv6_generate_eui64(u8 *eui, struct net_device *dev); 129 static int ipv6_count_addresses(struct inet6_dev *idev); 130 131 /* 132 * Configured unicast address hash table 133 */ 134 static struct hlist_head inet6_addr_lst[IN6_ADDR_HSIZE]; 135 static DEFINE_SPINLOCK(addrconf_hash_lock); 136 137 static void addrconf_verify(unsigned long); 138 139 static DEFINE_TIMER(addr_chk_timer, addrconf_verify, 0, 0); 140 static DEFINE_SPINLOCK(addrconf_verify_lock); 141 142 static void addrconf_join_anycast(struct inet6_ifaddr *ifp); 143 static void addrconf_leave_anycast(struct inet6_ifaddr *ifp); 144 145 static void addrconf_type_change(struct net_device *dev, 146 unsigned long event); 147 static int addrconf_ifdown(struct net_device *dev, int how); 148 149 static void addrconf_dad_start(struct inet6_ifaddr *ifp, u32 flags); 150 static void addrconf_dad_timer(unsigned long data); 151 static void addrconf_dad_completed(struct inet6_ifaddr *ifp); 152 static void addrconf_dad_run(struct inet6_dev *idev); 153 static void addrconf_rs_timer(unsigned long data); 154 static void __ipv6_ifa_notify(int event, struct inet6_ifaddr *ifa); 155 static void ipv6_ifa_notify(int event, struct inet6_ifaddr *ifa); 156 157 static void inet6_prefix_notify(int event, struct inet6_dev *idev, 158 struct prefix_info *pinfo); 159 static bool ipv6_chk_same_addr(struct net *net, const struct in6_addr *addr, 160 struct net_device *dev); 161 162 static ATOMIC_NOTIFIER_HEAD(inet6addr_chain); 163 164 static struct ipv6_devconf ipv6_devconf __read_mostly = { 165 .forwarding = 0, 166 .hop_limit = IPV6_DEFAULT_HOPLIMIT, 167 .mtu6 = IPV6_MIN_MTU, 168 .accept_ra = 1, 169 .accept_redirects = 1, 170 .autoconf = 1, 171 .force_mld_version = 0, 172 .dad_transmits = 1, 173 .rtr_solicits = MAX_RTR_SOLICITATIONS, 174 .rtr_solicit_interval = RTR_SOLICITATION_INTERVAL, 175 .rtr_solicit_delay = MAX_RTR_SOLICITATION_DELAY, 176 #ifdef CONFIG_IPV6_PRIVACY 177 .use_tempaddr = 0, 178 .temp_valid_lft = TEMP_VALID_LIFETIME, 179 .temp_prefered_lft = TEMP_PREFERRED_LIFETIME, 180 .regen_max_retry = REGEN_MAX_RETRY, 181 .max_desync_factor = MAX_DESYNC_FACTOR, 182 #endif 183 .max_addresses = IPV6_MAX_ADDRESSES, 184 .accept_ra_defrtr = 1, 185 .accept_ra_pinfo = 1, 186 #ifdef CONFIG_IPV6_ROUTER_PREF 187 .accept_ra_rtr_pref = 1, 188 .rtr_probe_interval = 60 * HZ, 189 #ifdef CONFIG_IPV6_ROUTE_INFO 190 .accept_ra_rt_info_max_plen = 0, 191 #endif 192 #endif 193 .proxy_ndp = 0, 194 .accept_source_route = 0, /* we do not accept RH0 by default. */ 195 .disable_ipv6 = 0, 196 .accept_dad = 1, 197 }; 198 199 static struct ipv6_devconf ipv6_devconf_dflt __read_mostly = { 200 .forwarding = 0, 201 .hop_limit = IPV6_DEFAULT_HOPLIMIT, 202 .mtu6 = IPV6_MIN_MTU, 203 .accept_ra = 1, 204 .accept_redirects = 1, 205 .autoconf = 1, 206 .dad_transmits = 1, 207 .rtr_solicits = MAX_RTR_SOLICITATIONS, 208 .rtr_solicit_interval = RTR_SOLICITATION_INTERVAL, 209 .rtr_solicit_delay = MAX_RTR_SOLICITATION_DELAY, 210 #ifdef CONFIG_IPV6_PRIVACY 211 .use_tempaddr = 0, 212 .temp_valid_lft = TEMP_VALID_LIFETIME, 213 .temp_prefered_lft = TEMP_PREFERRED_LIFETIME, 214 .regen_max_retry = REGEN_MAX_RETRY, 215 .max_desync_factor = MAX_DESYNC_FACTOR, 216 #endif 217 .max_addresses = IPV6_MAX_ADDRESSES, 218 .accept_ra_defrtr = 1, 219 .accept_ra_pinfo = 1, 220 #ifdef CONFIG_IPV6_ROUTER_PREF 221 .accept_ra_rtr_pref = 1, 222 .rtr_probe_interval = 60 * HZ, 223 #ifdef CONFIG_IPV6_ROUTE_INFO 224 .accept_ra_rt_info_max_plen = 0, 225 #endif 226 #endif 227 .proxy_ndp = 0, 228 .accept_source_route = 0, /* we do not accept RH0 by default. */ 229 .disable_ipv6 = 0, 230 .accept_dad = 1, 231 }; 232 233 /* IPv6 Wildcard Address and Loopback Address defined by RFC2553 */ 234 const struct in6_addr in6addr_any = IN6ADDR_ANY_INIT; 235 const struct in6_addr in6addr_loopback = IN6ADDR_LOOPBACK_INIT; 236 const struct in6_addr in6addr_linklocal_allnodes = IN6ADDR_LINKLOCAL_ALLNODES_INIT; 237 const struct in6_addr in6addr_linklocal_allrouters = IN6ADDR_LINKLOCAL_ALLROUTERS_INIT; 238 239 /* Check if a valid qdisc is available */ 240 static inline bool addrconf_qdisc_ok(const struct net_device *dev) 241 { 242 return !qdisc_tx_is_noop(dev); 243 } 244 245 /* Check if a route is valid prefix route */ 246 static inline int addrconf_is_prefix_route(const struct rt6_info *rt) 247 { 248 return ((rt->rt6i_flags & (RTF_GATEWAY | RTF_DEFAULT)) == 0); 249 } 250 251 static void addrconf_del_timer(struct inet6_ifaddr *ifp) 252 { 253 if (del_timer(&ifp->timer)) 254 __in6_ifa_put(ifp); 255 } 256 257 enum addrconf_timer_t { 258 AC_NONE, 259 AC_DAD, 260 AC_RS, 261 }; 262 263 static void addrconf_mod_timer(struct inet6_ifaddr *ifp, 264 enum addrconf_timer_t what, 265 unsigned long when) 266 { 267 if (!del_timer(&ifp->timer)) 268 in6_ifa_hold(ifp); 269 270 switch (what) { 271 case AC_DAD: 272 ifp->timer.function = addrconf_dad_timer; 273 break; 274 case AC_RS: 275 ifp->timer.function = addrconf_rs_timer; 276 break; 277 default: 278 break; 279 } 280 ifp->timer.expires = jiffies + when; 281 add_timer(&ifp->timer); 282 } 283 284 static int snmp6_alloc_dev(struct inet6_dev *idev) 285 { 286 if (snmp_mib_init((void __percpu **)idev->stats.ipv6, 287 sizeof(struct ipstats_mib)) < 0) 288 goto err_ip; 289 if (snmp_mib_init((void __percpu **)idev->stats.icmpv6, 290 sizeof(struct icmpv6_mib)) < 0) 291 goto err_icmp; 292 if (snmp_mib_init((void __percpu **)idev->stats.icmpv6msg, 293 sizeof(struct icmpv6msg_mib)) < 0) 294 goto err_icmpmsg; 295 296 return 0; 297 298 err_icmpmsg: 299 snmp_mib_free((void __percpu **)idev->stats.icmpv6); 300 err_icmp: 301 snmp_mib_free((void __percpu **)idev->stats.ipv6); 302 err_ip: 303 return -ENOMEM; 304 } 305 306 static void snmp6_free_dev(struct inet6_dev *idev) 307 { 308 snmp_mib_free((void __percpu **)idev->stats.icmpv6msg); 309 snmp_mib_free((void __percpu **)idev->stats.icmpv6); 310 snmp_mib_free((void __percpu **)idev->stats.ipv6); 311 } 312 313 /* Nobody refers to this device, we may destroy it. */ 314 315 static void in6_dev_finish_destroy_rcu(struct rcu_head *head) 316 { 317 struct inet6_dev *idev = container_of(head, struct inet6_dev, rcu); 318 kfree(idev); 319 } 320 321 void in6_dev_finish_destroy(struct inet6_dev *idev) 322 { 323 struct net_device *dev = idev->dev; 324 325 WARN_ON(!list_empty(&idev->addr_list)); 326 WARN_ON(idev->mc_list != NULL); 327 328 #ifdef NET_REFCNT_DEBUG 329 printk(KERN_DEBUG "in6_dev_finish_destroy: %s\n", dev ? dev->name : "NIL"); 330 #endif 331 dev_put(dev); 332 if (!idev->dead) { 333 pr_warning("Freeing alive inet6 device %p\n", idev); 334 return; 335 } 336 snmp6_free_dev(idev); 337 call_rcu(&idev->rcu, in6_dev_finish_destroy_rcu); 338 } 339 340 EXPORT_SYMBOL(in6_dev_finish_destroy); 341 342 static struct inet6_dev * ipv6_add_dev(struct net_device *dev) 343 { 344 struct inet6_dev *ndev; 345 346 ASSERT_RTNL(); 347 348 if (dev->mtu < IPV6_MIN_MTU) 349 return NULL; 350 351 ndev = kzalloc(sizeof(struct inet6_dev), GFP_KERNEL); 352 353 if (ndev == NULL) 354 return NULL; 355 356 rwlock_init(&ndev->lock); 357 ndev->dev = dev; 358 INIT_LIST_HEAD(&ndev->addr_list); 359 360 memcpy(&ndev->cnf, dev_net(dev)->ipv6.devconf_dflt, sizeof(ndev->cnf)); 361 ndev->cnf.mtu6 = dev->mtu; 362 ndev->cnf.sysctl = NULL; 363 ndev->nd_parms = neigh_parms_alloc(dev, &nd_tbl); 364 if (ndev->nd_parms == NULL) { 365 kfree(ndev); 366 return NULL; 367 } 368 if (ndev->cnf.forwarding) 369 dev_disable_lro(dev); 370 /* We refer to the device */ 371 dev_hold(dev); 372 373 if (snmp6_alloc_dev(ndev) < 0) { 374 ADBG((KERN_WARNING 375 "%s(): cannot allocate memory for statistics; dev=%s.\n", 376 __func__, dev->name)); 377 neigh_parms_release(&nd_tbl, ndev->nd_parms); 378 ndev->dead = 1; 379 in6_dev_finish_destroy(ndev); 380 return NULL; 381 } 382 383 if (snmp6_register_dev(ndev) < 0) { 384 ADBG((KERN_WARNING 385 "%s(): cannot create /proc/net/dev_snmp6/%s\n", 386 __func__, dev->name)); 387 neigh_parms_release(&nd_tbl, ndev->nd_parms); 388 ndev->dead = 1; 389 in6_dev_finish_destroy(ndev); 390 return NULL; 391 } 392 393 /* One reference from device. We must do this before 394 * we invoke __ipv6_regen_rndid(). 395 */ 396 in6_dev_hold(ndev); 397 398 if (dev->flags & (IFF_NOARP | IFF_LOOPBACK)) 399 ndev->cnf.accept_dad = -1; 400 401 #if defined(CONFIG_IPV6_SIT) || defined(CONFIG_IPV6_SIT_MODULE) 402 if (dev->type == ARPHRD_SIT && (dev->priv_flags & IFF_ISATAP)) { 403 printk(KERN_INFO 404 "%s: Disabled Multicast RS\n", 405 dev->name); 406 ndev->cnf.rtr_solicits = 0; 407 } 408 #endif 409 410 #ifdef CONFIG_IPV6_PRIVACY 411 INIT_LIST_HEAD(&ndev->tempaddr_list); 412 setup_timer(&ndev->regen_timer, ipv6_regen_rndid, (unsigned long)ndev); 413 if ((dev->flags&IFF_LOOPBACK) || 414 dev->type == ARPHRD_TUNNEL || 415 dev->type == ARPHRD_TUNNEL6 || 416 dev->type == ARPHRD_SIT || 417 dev->type == ARPHRD_NONE) { 418 printk(KERN_INFO 419 "%s: Disabled Privacy Extensions\n", 420 dev->name); 421 ndev->cnf.use_tempaddr = -1; 422 } else { 423 in6_dev_hold(ndev); 424 ipv6_regen_rndid((unsigned long) ndev); 425 } 426 #endif 427 428 if (netif_running(dev) && addrconf_qdisc_ok(dev)) 429 ndev->if_flags |= IF_READY; 430 431 ipv6_mc_init_dev(ndev); 432 ndev->tstamp = jiffies; 433 addrconf_sysctl_register(ndev); 434 /* protected by rtnl_lock */ 435 rcu_assign_pointer(dev->ip6_ptr, ndev); 436 437 /* Join all-node multicast group */ 438 ipv6_dev_mc_inc(dev, &in6addr_linklocal_allnodes); 439 440 return ndev; 441 } 442 443 static struct inet6_dev * ipv6_find_idev(struct net_device *dev) 444 { 445 struct inet6_dev *idev; 446 447 ASSERT_RTNL(); 448 449 idev = __in6_dev_get(dev); 450 if (!idev) { 451 idev = ipv6_add_dev(dev); 452 if (!idev) 453 return NULL; 454 } 455 456 if (dev->flags&IFF_UP) 457 ipv6_mc_up(idev); 458 return idev; 459 } 460 461 #ifdef CONFIG_SYSCTL 462 static void dev_forward_change(struct inet6_dev *idev) 463 { 464 struct net_device *dev; 465 struct inet6_ifaddr *ifa; 466 467 if (!idev) 468 return; 469 dev = idev->dev; 470 if (idev->cnf.forwarding) 471 dev_disable_lro(dev); 472 if (dev && (dev->flags & IFF_MULTICAST)) { 473 if (idev->cnf.forwarding) 474 ipv6_dev_mc_inc(dev, &in6addr_linklocal_allrouters); 475 else 476 ipv6_dev_mc_dec(dev, &in6addr_linklocal_allrouters); 477 } 478 479 list_for_each_entry(ifa, &idev->addr_list, if_list) { 480 if (ifa->flags&IFA_F_TENTATIVE) 481 continue; 482 if (idev->cnf.forwarding) 483 addrconf_join_anycast(ifa); 484 else 485 addrconf_leave_anycast(ifa); 486 } 487 } 488 489 490 static void addrconf_forward_change(struct net *net, __s32 newf) 491 { 492 struct net_device *dev; 493 struct inet6_dev *idev; 494 495 rcu_read_lock(); 496 for_each_netdev_rcu(net, dev) { 497 idev = __in6_dev_get(dev); 498 if (idev) { 499 int changed = (!idev->cnf.forwarding) ^ (!newf); 500 idev->cnf.forwarding = newf; 501 if (changed) 502 dev_forward_change(idev); 503 } 504 } 505 rcu_read_unlock(); 506 } 507 508 static int addrconf_fixup_forwarding(struct ctl_table *table, int *p, int old) 509 { 510 struct net *net; 511 512 net = (struct net *)table->extra2; 513 if (p == &net->ipv6.devconf_dflt->forwarding) 514 return 0; 515 516 if (!rtnl_trylock()) { 517 /* Restore the original values before restarting */ 518 *p = old; 519 return restart_syscall(); 520 } 521 522 if (p == &net->ipv6.devconf_all->forwarding) { 523 __s32 newf = net->ipv6.devconf_all->forwarding; 524 net->ipv6.devconf_dflt->forwarding = newf; 525 addrconf_forward_change(net, newf); 526 } else if ((!*p) ^ (!old)) 527 dev_forward_change((struct inet6_dev *)table->extra1); 528 rtnl_unlock(); 529 530 if (*p) 531 rt6_purge_dflt_routers(net); 532 return 1; 533 } 534 #endif 535 536 static void inet6_ifa_finish_destroy_rcu(struct rcu_head *head) 537 { 538 struct inet6_ifaddr *ifp = container_of(head, struct inet6_ifaddr, rcu); 539 kfree(ifp); 540 } 541 542 /* Nobody refers to this ifaddr, destroy it */ 543 void inet6_ifa_finish_destroy(struct inet6_ifaddr *ifp) 544 { 545 WARN_ON(!hlist_unhashed(&ifp->addr_lst)); 546 547 #ifdef NET_REFCNT_DEBUG 548 printk(KERN_DEBUG "inet6_ifa_finish_destroy\n"); 549 #endif 550 551 in6_dev_put(ifp->idev); 552 553 if (del_timer(&ifp->timer)) 554 pr_notice("Timer is still running, when freeing ifa=%p\n", ifp); 555 556 if (ifp->state != INET6_IFADDR_STATE_DEAD) { 557 pr_warning("Freeing alive inet6 address %p\n", ifp); 558 return; 559 } 560 dst_release(&ifp->rt->u.dst); 561 562 call_rcu(&ifp->rcu, inet6_ifa_finish_destroy_rcu); 563 } 564 565 static void 566 ipv6_link_dev_addr(struct inet6_dev *idev, struct inet6_ifaddr *ifp) 567 { 568 struct list_head *p; 569 int ifp_scope = ipv6_addr_src_scope(&ifp->addr); 570 571 /* 572 * Each device address list is sorted in order of scope - 573 * global before linklocal. 574 */ 575 list_for_each(p, &idev->addr_list) { 576 struct inet6_ifaddr *ifa 577 = list_entry(p, struct inet6_ifaddr, if_list); 578 if (ifp_scope >= ipv6_addr_src_scope(&ifa->addr)) 579 break; 580 } 581 582 list_add_tail(&ifp->if_list, p); 583 } 584 585 static u32 ipv6_addr_hash(const struct in6_addr *addr) 586 { 587 /* 588 * We perform the hash function over the last 64 bits of the address 589 * This will include the IEEE address token on links that support it. 590 */ 591 return jhash_2words((__force u32)addr->s6_addr32[2], 592 (__force u32)addr->s6_addr32[3], 0) 593 & (IN6_ADDR_HSIZE - 1); 594 } 595 596 /* On success it returns ifp with increased reference count */ 597 598 static struct inet6_ifaddr * 599 ipv6_add_addr(struct inet6_dev *idev, const struct in6_addr *addr, int pfxlen, 600 int scope, u32 flags) 601 { 602 struct inet6_ifaddr *ifa = NULL; 603 struct rt6_info *rt; 604 unsigned int hash; 605 int err = 0; 606 int addr_type = ipv6_addr_type(addr); 607 608 if (addr_type == IPV6_ADDR_ANY || 609 addr_type & IPV6_ADDR_MULTICAST || 610 (!(idev->dev->flags & IFF_LOOPBACK) && 611 addr_type & IPV6_ADDR_LOOPBACK)) 612 return ERR_PTR(-EADDRNOTAVAIL); 613 614 rcu_read_lock_bh(); 615 if (idev->dead) { 616 err = -ENODEV; /*XXX*/ 617 goto out2; 618 } 619 620 if (idev->cnf.disable_ipv6) { 621 err = -EACCES; 622 goto out2; 623 } 624 625 spin_lock(&addrconf_hash_lock); 626 627 /* Ignore adding duplicate addresses on an interface */ 628 if (ipv6_chk_same_addr(dev_net(idev->dev), addr, idev->dev)) { 629 ADBG(("ipv6_add_addr: already assigned\n")); 630 err = -EEXIST; 631 goto out; 632 } 633 634 ifa = kzalloc(sizeof(struct inet6_ifaddr), GFP_ATOMIC); 635 636 if (ifa == NULL) { 637 ADBG(("ipv6_add_addr: malloc failed\n")); 638 err = -ENOBUFS; 639 goto out; 640 } 641 642 rt = addrconf_dst_alloc(idev, addr, 0); 643 if (IS_ERR(rt)) { 644 err = PTR_ERR(rt); 645 goto out; 646 } 647 648 ipv6_addr_copy(&ifa->addr, addr); 649 650 spin_lock_init(&ifa->lock); 651 spin_lock_init(&ifa->state_lock); 652 init_timer(&ifa->timer); 653 INIT_HLIST_NODE(&ifa->addr_lst); 654 ifa->timer.data = (unsigned long) ifa; 655 ifa->scope = scope; 656 ifa->prefix_len = pfxlen; 657 ifa->flags = flags | IFA_F_TENTATIVE; 658 ifa->cstamp = ifa->tstamp = jiffies; 659 660 ifa->rt = rt; 661 662 /* 663 * part one of RFC 4429, section 3.3 664 * We should not configure an address as 665 * optimistic if we do not yet know the link 666 * layer address of our nexhop router 667 */ 668 669 if (rt->rt6i_nexthop == NULL) 670 ifa->flags &= ~IFA_F_OPTIMISTIC; 671 672 ifa->idev = idev; 673 in6_dev_hold(idev); 674 /* For caller */ 675 in6_ifa_hold(ifa); 676 677 /* Add to big hash table */ 678 hash = ipv6_addr_hash(addr); 679 680 hlist_add_head_rcu(&ifa->addr_lst, &inet6_addr_lst[hash]); 681 spin_unlock(&addrconf_hash_lock); 682 683 write_lock(&idev->lock); 684 /* Add to inet6_dev unicast addr list. */ 685 ipv6_link_dev_addr(idev, ifa); 686 687 #ifdef CONFIG_IPV6_PRIVACY 688 if (ifa->flags&IFA_F_TEMPORARY) { 689 list_add(&ifa->tmp_list, &idev->tempaddr_list); 690 in6_ifa_hold(ifa); 691 } 692 #endif 693 694 in6_ifa_hold(ifa); 695 write_unlock(&idev->lock); 696 out2: 697 rcu_read_unlock_bh(); 698 699 if (likely(err == 0)) 700 atomic_notifier_call_chain(&inet6addr_chain, NETDEV_UP, ifa); 701 else { 702 kfree(ifa); 703 ifa = ERR_PTR(err); 704 } 705 706 return ifa; 707 out: 708 spin_unlock(&addrconf_hash_lock); 709 goto out2; 710 } 711 712 /* This function wants to get referenced ifp and releases it before return */ 713 714 static void ipv6_del_addr(struct inet6_ifaddr *ifp) 715 { 716 struct inet6_ifaddr *ifa, *ifn; 717 struct inet6_dev *idev = ifp->idev; 718 int state; 719 int hash; 720 int deleted = 0, onlink = 0; 721 unsigned long expires = jiffies; 722 723 hash = ipv6_addr_hash(&ifp->addr); 724 725 spin_lock_bh(&ifp->state_lock); 726 state = ifp->state; 727 ifp->state = INET6_IFADDR_STATE_DEAD; 728 spin_unlock_bh(&ifp->state_lock); 729 730 if (state == INET6_IFADDR_STATE_DEAD) 731 goto out; 732 733 spin_lock_bh(&addrconf_hash_lock); 734 hlist_del_init_rcu(&ifp->addr_lst); 735 spin_unlock_bh(&addrconf_hash_lock); 736 737 write_lock_bh(&idev->lock); 738 #ifdef CONFIG_IPV6_PRIVACY 739 if (ifp->flags&IFA_F_TEMPORARY) { 740 list_del(&ifp->tmp_list); 741 if (ifp->ifpub) { 742 in6_ifa_put(ifp->ifpub); 743 ifp->ifpub = NULL; 744 } 745 __in6_ifa_put(ifp); 746 } 747 #endif 748 749 list_for_each_entry_safe(ifa, ifn, &idev->addr_list, if_list) { 750 if (ifa == ifp) { 751 list_del_init(&ifp->if_list); 752 __in6_ifa_put(ifp); 753 754 if (!(ifp->flags & IFA_F_PERMANENT) || onlink > 0) 755 break; 756 deleted = 1; 757 continue; 758 } else if (ifp->flags & IFA_F_PERMANENT) { 759 if (ipv6_prefix_equal(&ifa->addr, &ifp->addr, 760 ifp->prefix_len)) { 761 if (ifa->flags & IFA_F_PERMANENT) { 762 onlink = 1; 763 if (deleted) 764 break; 765 } else { 766 unsigned long lifetime; 767 768 if (!onlink) 769 onlink = -1; 770 771 spin_lock(&ifa->lock); 772 773 lifetime = addrconf_timeout_fixup(ifa->valid_lft, HZ); 774 /* 775 * Note: Because this address is 776 * not permanent, lifetime < 777 * LONG_MAX / HZ here. 778 */ 779 if (time_before(expires, 780 ifa->tstamp + lifetime * HZ)) 781 expires = ifa->tstamp + lifetime * HZ; 782 spin_unlock(&ifa->lock); 783 } 784 } 785 } 786 } 787 write_unlock_bh(&idev->lock); 788 789 addrconf_del_timer(ifp); 790 791 ipv6_ifa_notify(RTM_DELADDR, ifp); 792 793 atomic_notifier_call_chain(&inet6addr_chain, NETDEV_DOWN, ifp); 794 795 /* 796 * Purge or update corresponding prefix 797 * 798 * 1) we don't purge prefix here if address was not permanent. 799 * prefix is managed by its own lifetime. 800 * 2) if there're no addresses, delete prefix. 801 * 3) if there're still other permanent address(es), 802 * corresponding prefix is still permanent. 803 * 4) otherwise, update prefix lifetime to the 804 * longest valid lifetime among the corresponding 805 * addresses on the device. 806 * Note: subsequent RA will update lifetime. 807 * 808 * --yoshfuji 809 */ 810 if ((ifp->flags & IFA_F_PERMANENT) && onlink < 1) { 811 struct in6_addr prefix; 812 struct rt6_info *rt; 813 struct net *net = dev_net(ifp->idev->dev); 814 ipv6_addr_prefix(&prefix, &ifp->addr, ifp->prefix_len); 815 rt = rt6_lookup(net, &prefix, NULL, ifp->idev->dev->ifindex, 1); 816 817 if (rt && addrconf_is_prefix_route(rt)) { 818 if (onlink == 0) { 819 ip6_del_rt(rt); 820 rt = NULL; 821 } else if (!(rt->rt6i_flags & RTF_EXPIRES)) { 822 rt->rt6i_expires = expires; 823 rt->rt6i_flags |= RTF_EXPIRES; 824 } 825 } 826 dst_release(&rt->u.dst); 827 } 828 829 out: 830 in6_ifa_put(ifp); 831 } 832 833 #ifdef CONFIG_IPV6_PRIVACY 834 static int ipv6_create_tempaddr(struct inet6_ifaddr *ifp, struct inet6_ifaddr *ift) 835 { 836 struct inet6_dev *idev = ifp->idev; 837 struct in6_addr addr, *tmpaddr; 838 unsigned long tmp_prefered_lft, tmp_valid_lft, tmp_cstamp, tmp_tstamp; 839 unsigned long regen_advance; 840 int tmp_plen; 841 int ret = 0; 842 int max_addresses; 843 u32 addr_flags; 844 845 write_lock(&idev->lock); 846 if (ift) { 847 spin_lock_bh(&ift->lock); 848 memcpy(&addr.s6_addr[8], &ift->addr.s6_addr[8], 8); 849 spin_unlock_bh(&ift->lock); 850 tmpaddr = &addr; 851 } else { 852 tmpaddr = NULL; 853 } 854 retry: 855 in6_dev_hold(idev); 856 if (idev->cnf.use_tempaddr <= 0) { 857 write_unlock(&idev->lock); 858 printk(KERN_INFO 859 "ipv6_create_tempaddr(): use_tempaddr is disabled.\n"); 860 in6_dev_put(idev); 861 ret = -1; 862 goto out; 863 } 864 spin_lock_bh(&ifp->lock); 865 if (ifp->regen_count++ >= idev->cnf.regen_max_retry) { 866 idev->cnf.use_tempaddr = -1; /*XXX*/ 867 spin_unlock_bh(&ifp->lock); 868 write_unlock(&idev->lock); 869 printk(KERN_WARNING 870 "ipv6_create_tempaddr(): regeneration time exceeded. disabled temporary address support.\n"); 871 in6_dev_put(idev); 872 ret = -1; 873 goto out; 874 } 875 in6_ifa_hold(ifp); 876 memcpy(addr.s6_addr, ifp->addr.s6_addr, 8); 877 if (__ipv6_try_regen_rndid(idev, tmpaddr) < 0) { 878 spin_unlock_bh(&ifp->lock); 879 write_unlock(&idev->lock); 880 printk(KERN_WARNING 881 "ipv6_create_tempaddr(): regeneration of randomized interface id failed.\n"); 882 in6_ifa_put(ifp); 883 in6_dev_put(idev); 884 ret = -1; 885 goto out; 886 } 887 memcpy(&addr.s6_addr[8], idev->rndid, 8); 888 tmp_valid_lft = min_t(__u32, 889 ifp->valid_lft, 890 idev->cnf.temp_valid_lft); 891 tmp_prefered_lft = min_t(__u32, 892 ifp->prefered_lft, 893 idev->cnf.temp_prefered_lft - desync_factor / HZ); 894 tmp_plen = ifp->prefix_len; 895 max_addresses = idev->cnf.max_addresses; 896 tmp_cstamp = ifp->cstamp; 897 tmp_tstamp = ifp->tstamp; 898 spin_unlock_bh(&ifp->lock); 899 900 regen_advance = idev->cnf.regen_max_retry * 901 idev->cnf.dad_transmits * 902 idev->nd_parms->retrans_time / HZ; 903 write_unlock(&idev->lock); 904 905 /* A temporary address is created only if this calculated Preferred 906 * Lifetime is greater than REGEN_ADVANCE time units. In particular, 907 * an implementation must not create a temporary address with a zero 908 * Preferred Lifetime. 909 */ 910 if (tmp_prefered_lft <= regen_advance) { 911 in6_ifa_put(ifp); 912 in6_dev_put(idev); 913 ret = -1; 914 goto out; 915 } 916 917 addr_flags = IFA_F_TEMPORARY; 918 /* set in addrconf_prefix_rcv() */ 919 if (ifp->flags & IFA_F_OPTIMISTIC) 920 addr_flags |= IFA_F_OPTIMISTIC; 921 922 ift = !max_addresses || 923 ipv6_count_addresses(idev) < max_addresses ? 924 ipv6_add_addr(idev, &addr, tmp_plen, 925 ipv6_addr_type(&addr)&IPV6_ADDR_SCOPE_MASK, 926 addr_flags) : NULL; 927 if (!ift || IS_ERR(ift)) { 928 in6_ifa_put(ifp); 929 in6_dev_put(idev); 930 printk(KERN_INFO 931 "ipv6_create_tempaddr(): retry temporary address regeneration.\n"); 932 tmpaddr = &addr; 933 write_lock(&idev->lock); 934 goto retry; 935 } 936 937 spin_lock_bh(&ift->lock); 938 ift->ifpub = ifp; 939 ift->valid_lft = tmp_valid_lft; 940 ift->prefered_lft = tmp_prefered_lft; 941 ift->cstamp = tmp_cstamp; 942 ift->tstamp = tmp_tstamp; 943 spin_unlock_bh(&ift->lock); 944 945 addrconf_dad_start(ift, 0); 946 in6_ifa_put(ift); 947 in6_dev_put(idev); 948 out: 949 return ret; 950 } 951 #endif 952 953 /* 954 * Choose an appropriate source address (RFC3484) 955 */ 956 enum { 957 IPV6_SADDR_RULE_INIT = 0, 958 IPV6_SADDR_RULE_LOCAL, 959 IPV6_SADDR_RULE_SCOPE, 960 IPV6_SADDR_RULE_PREFERRED, 961 #ifdef CONFIG_IPV6_MIP6 962 IPV6_SADDR_RULE_HOA, 963 #endif 964 IPV6_SADDR_RULE_OIF, 965 IPV6_SADDR_RULE_LABEL, 966 #ifdef CONFIG_IPV6_PRIVACY 967 IPV6_SADDR_RULE_PRIVACY, 968 #endif 969 IPV6_SADDR_RULE_ORCHID, 970 IPV6_SADDR_RULE_PREFIX, 971 IPV6_SADDR_RULE_MAX 972 }; 973 974 struct ipv6_saddr_score { 975 int rule; 976 int addr_type; 977 struct inet6_ifaddr *ifa; 978 DECLARE_BITMAP(scorebits, IPV6_SADDR_RULE_MAX); 979 int scopedist; 980 int matchlen; 981 }; 982 983 struct ipv6_saddr_dst { 984 const struct in6_addr *addr; 985 int ifindex; 986 int scope; 987 int label; 988 unsigned int prefs; 989 }; 990 991 static inline int ipv6_saddr_preferred(int type) 992 { 993 if (type & (IPV6_ADDR_MAPPED|IPV6_ADDR_COMPATv4|IPV6_ADDR_LOOPBACK)) 994 return 1; 995 return 0; 996 } 997 998 static int ipv6_get_saddr_eval(struct net *net, 999 struct ipv6_saddr_score *score, 1000 struct ipv6_saddr_dst *dst, 1001 int i) 1002 { 1003 int ret; 1004 1005 if (i <= score->rule) { 1006 switch (i) { 1007 case IPV6_SADDR_RULE_SCOPE: 1008 ret = score->scopedist; 1009 break; 1010 case IPV6_SADDR_RULE_PREFIX: 1011 ret = score->matchlen; 1012 break; 1013 default: 1014 ret = !!test_bit(i, score->scorebits); 1015 } 1016 goto out; 1017 } 1018 1019 switch (i) { 1020 case IPV6_SADDR_RULE_INIT: 1021 /* Rule 0: remember if hiscore is not ready yet */ 1022 ret = !!score->ifa; 1023 break; 1024 case IPV6_SADDR_RULE_LOCAL: 1025 /* Rule 1: Prefer same address */ 1026 ret = ipv6_addr_equal(&score->ifa->addr, dst->addr); 1027 break; 1028 case IPV6_SADDR_RULE_SCOPE: 1029 /* Rule 2: Prefer appropriate scope 1030 * 1031 * ret 1032 * ^ 1033 * -1 | d 15 1034 * ---+--+-+---> scope 1035 * | 1036 * | d is scope of the destination. 1037 * B-d | \ 1038 * | \ <- smaller scope is better if 1039 * B-15 | \ if scope is enough for destinaion. 1040 * | ret = B - scope (-1 <= scope >= d <= 15). 1041 * d-C-1 | / 1042 * |/ <- greater is better 1043 * -C / if scope is not enough for destination. 1044 * /| ret = scope - C (-1 <= d < scope <= 15). 1045 * 1046 * d - C - 1 < B -15 (for all -1 <= d <= 15). 1047 * C > d + 14 - B >= 15 + 14 - B = 29 - B. 1048 * Assume B = 0 and we get C > 29. 1049 */ 1050 ret = __ipv6_addr_src_scope(score->addr_type); 1051 if (ret >= dst->scope) 1052 ret = -ret; 1053 else 1054 ret -= 128; /* 30 is enough */ 1055 score->scopedist = ret; 1056 break; 1057 case IPV6_SADDR_RULE_PREFERRED: 1058 /* Rule 3: Avoid deprecated and optimistic addresses */ 1059 ret = ipv6_saddr_preferred(score->addr_type) || 1060 !(score->ifa->flags & (IFA_F_DEPRECATED|IFA_F_OPTIMISTIC)); 1061 break; 1062 #ifdef CONFIG_IPV6_MIP6 1063 case IPV6_SADDR_RULE_HOA: 1064 { 1065 /* Rule 4: Prefer home address */ 1066 int prefhome = !(dst->prefs & IPV6_PREFER_SRC_COA); 1067 ret = !(score->ifa->flags & IFA_F_HOMEADDRESS) ^ prefhome; 1068 break; 1069 } 1070 #endif 1071 case IPV6_SADDR_RULE_OIF: 1072 /* Rule 5: Prefer outgoing interface */ 1073 ret = (!dst->ifindex || 1074 dst->ifindex == score->ifa->idev->dev->ifindex); 1075 break; 1076 case IPV6_SADDR_RULE_LABEL: 1077 /* Rule 6: Prefer matching label */ 1078 ret = ipv6_addr_label(net, 1079 &score->ifa->addr, score->addr_type, 1080 score->ifa->idev->dev->ifindex) == dst->label; 1081 break; 1082 #ifdef CONFIG_IPV6_PRIVACY 1083 case IPV6_SADDR_RULE_PRIVACY: 1084 { 1085 /* Rule 7: Prefer public address 1086 * Note: prefer temprary address if use_tempaddr >= 2 1087 */ 1088 int preftmp = dst->prefs & (IPV6_PREFER_SRC_PUBLIC|IPV6_PREFER_SRC_TMP) ? 1089 !!(dst->prefs & IPV6_PREFER_SRC_TMP) : 1090 score->ifa->idev->cnf.use_tempaddr >= 2; 1091 ret = (!(score->ifa->flags & IFA_F_TEMPORARY)) ^ preftmp; 1092 break; 1093 } 1094 #endif 1095 case IPV6_SADDR_RULE_ORCHID: 1096 /* Rule 8-: Prefer ORCHID vs ORCHID or 1097 * non-ORCHID vs non-ORCHID 1098 */ 1099 ret = !(ipv6_addr_orchid(&score->ifa->addr) ^ 1100 ipv6_addr_orchid(dst->addr)); 1101 break; 1102 case IPV6_SADDR_RULE_PREFIX: 1103 /* Rule 8: Use longest matching prefix */ 1104 score->matchlen = ret = ipv6_addr_diff(&score->ifa->addr, 1105 dst->addr); 1106 break; 1107 default: 1108 ret = 0; 1109 } 1110 1111 if (ret) 1112 __set_bit(i, score->scorebits); 1113 score->rule = i; 1114 out: 1115 return ret; 1116 } 1117 1118 int ipv6_dev_get_saddr(struct net *net, struct net_device *dst_dev, 1119 const struct in6_addr *daddr, unsigned int prefs, 1120 struct in6_addr *saddr) 1121 { 1122 struct ipv6_saddr_score scores[2], 1123 *score = &scores[0], *hiscore = &scores[1]; 1124 struct ipv6_saddr_dst dst; 1125 struct net_device *dev; 1126 int dst_type; 1127 1128 dst_type = __ipv6_addr_type(daddr); 1129 dst.addr = daddr; 1130 dst.ifindex = dst_dev ? dst_dev->ifindex : 0; 1131 dst.scope = __ipv6_addr_src_scope(dst_type); 1132 dst.label = ipv6_addr_label(net, daddr, dst_type, dst.ifindex); 1133 dst.prefs = prefs; 1134 1135 hiscore->rule = -1; 1136 hiscore->ifa = NULL; 1137 1138 rcu_read_lock(); 1139 1140 for_each_netdev_rcu(net, dev) { 1141 struct inet6_dev *idev; 1142 1143 /* Candidate Source Address (section 4) 1144 * - multicast and link-local destination address, 1145 * the set of candidate source address MUST only 1146 * include addresses assigned to interfaces 1147 * belonging to the same link as the outgoing 1148 * interface. 1149 * (- For site-local destination addresses, the 1150 * set of candidate source addresses MUST only 1151 * include addresses assigned to interfaces 1152 * belonging to the same site as the outgoing 1153 * interface.) 1154 */ 1155 if (((dst_type & IPV6_ADDR_MULTICAST) || 1156 dst.scope <= IPV6_ADDR_SCOPE_LINKLOCAL) && 1157 dst.ifindex && dev->ifindex != dst.ifindex) 1158 continue; 1159 1160 idev = __in6_dev_get(dev); 1161 if (!idev) 1162 continue; 1163 1164 read_lock_bh(&idev->lock); 1165 list_for_each_entry(score->ifa, &idev->addr_list, if_list) { 1166 int i; 1167 1168 /* 1169 * - Tentative Address (RFC2462 section 5.4) 1170 * - A tentative address is not considered 1171 * "assigned to an interface" in the traditional 1172 * sense, unless it is also flagged as optimistic. 1173 * - Candidate Source Address (section 4) 1174 * - In any case, anycast addresses, multicast 1175 * addresses, and the unspecified address MUST 1176 * NOT be included in a candidate set. 1177 */ 1178 if ((score->ifa->flags & IFA_F_TENTATIVE) && 1179 (!(score->ifa->flags & IFA_F_OPTIMISTIC))) 1180 continue; 1181 1182 score->addr_type = __ipv6_addr_type(&score->ifa->addr); 1183 1184 if (unlikely(score->addr_type == IPV6_ADDR_ANY || 1185 score->addr_type & IPV6_ADDR_MULTICAST)) { 1186 LIMIT_NETDEBUG(KERN_DEBUG 1187 "ADDRCONF: unspecified / multicast address " 1188 "assigned as unicast address on %s", 1189 dev->name); 1190 continue; 1191 } 1192 1193 score->rule = -1; 1194 bitmap_zero(score->scorebits, IPV6_SADDR_RULE_MAX); 1195 1196 for (i = 0; i < IPV6_SADDR_RULE_MAX; i++) { 1197 int minihiscore, miniscore; 1198 1199 minihiscore = ipv6_get_saddr_eval(net, hiscore, &dst, i); 1200 miniscore = ipv6_get_saddr_eval(net, score, &dst, i); 1201 1202 if (minihiscore > miniscore) { 1203 if (i == IPV6_SADDR_RULE_SCOPE && 1204 score->scopedist > 0) { 1205 /* 1206 * special case: 1207 * each remaining entry 1208 * has too small (not enough) 1209 * scope, because ifa entries 1210 * are sorted by their scope 1211 * values. 1212 */ 1213 goto try_nextdev; 1214 } 1215 break; 1216 } else if (minihiscore < miniscore) { 1217 if (hiscore->ifa) 1218 in6_ifa_put(hiscore->ifa); 1219 1220 in6_ifa_hold(score->ifa); 1221 1222 swap(hiscore, score); 1223 1224 /* restore our iterator */ 1225 score->ifa = hiscore->ifa; 1226 1227 break; 1228 } 1229 } 1230 } 1231 try_nextdev: 1232 read_unlock_bh(&idev->lock); 1233 } 1234 rcu_read_unlock(); 1235 1236 if (!hiscore->ifa) 1237 return -EADDRNOTAVAIL; 1238 1239 ipv6_addr_copy(saddr, &hiscore->ifa->addr); 1240 in6_ifa_put(hiscore->ifa); 1241 return 0; 1242 } 1243 EXPORT_SYMBOL(ipv6_dev_get_saddr); 1244 1245 int ipv6_get_lladdr(struct net_device *dev, struct in6_addr *addr, 1246 unsigned char banned_flags) 1247 { 1248 struct inet6_dev *idev; 1249 int err = -EADDRNOTAVAIL; 1250 1251 rcu_read_lock(); 1252 idev = __in6_dev_get(dev); 1253 if (idev) { 1254 struct inet6_ifaddr *ifp; 1255 1256 read_lock_bh(&idev->lock); 1257 list_for_each_entry(ifp, &idev->addr_list, if_list) { 1258 if (ifp->scope == IFA_LINK && 1259 !(ifp->flags & banned_flags)) { 1260 ipv6_addr_copy(addr, &ifp->addr); 1261 err = 0; 1262 break; 1263 } 1264 } 1265 read_unlock_bh(&idev->lock); 1266 } 1267 rcu_read_unlock(); 1268 return err; 1269 } 1270 1271 static int ipv6_count_addresses(struct inet6_dev *idev) 1272 { 1273 int cnt = 0; 1274 struct inet6_ifaddr *ifp; 1275 1276 read_lock_bh(&idev->lock); 1277 list_for_each_entry(ifp, &idev->addr_list, if_list) 1278 cnt++; 1279 read_unlock_bh(&idev->lock); 1280 return cnt; 1281 } 1282 1283 int ipv6_chk_addr(struct net *net, struct in6_addr *addr, 1284 struct net_device *dev, int strict) 1285 { 1286 struct inet6_ifaddr *ifp; 1287 struct hlist_node *node; 1288 unsigned int hash = ipv6_addr_hash(addr); 1289 1290 rcu_read_lock_bh(); 1291 hlist_for_each_entry_rcu(ifp, node, &inet6_addr_lst[hash], addr_lst) { 1292 if (!net_eq(dev_net(ifp->idev->dev), net)) 1293 continue; 1294 if (ipv6_addr_equal(&ifp->addr, addr) && 1295 !(ifp->flags&IFA_F_TENTATIVE) && 1296 (dev == NULL || ifp->idev->dev == dev || 1297 !(ifp->scope&(IFA_LINK|IFA_HOST) || strict))) { 1298 rcu_read_unlock_bh(); 1299 return 1; 1300 } 1301 } 1302 1303 rcu_read_unlock_bh(); 1304 return 0; 1305 } 1306 EXPORT_SYMBOL(ipv6_chk_addr); 1307 1308 static bool ipv6_chk_same_addr(struct net *net, const struct in6_addr *addr, 1309 struct net_device *dev) 1310 { 1311 unsigned int hash = ipv6_addr_hash(addr); 1312 struct inet6_ifaddr *ifp; 1313 struct hlist_node *node; 1314 1315 hlist_for_each_entry(ifp, node, &inet6_addr_lst[hash], addr_lst) { 1316 if (!net_eq(dev_net(ifp->idev->dev), net)) 1317 continue; 1318 if (ipv6_addr_equal(&ifp->addr, addr)) { 1319 if (dev == NULL || ifp->idev->dev == dev) 1320 return true; 1321 } 1322 } 1323 return false; 1324 } 1325 1326 int ipv6_chk_prefix(struct in6_addr *addr, struct net_device *dev) 1327 { 1328 struct inet6_dev *idev; 1329 struct inet6_ifaddr *ifa; 1330 int onlink; 1331 1332 onlink = 0; 1333 rcu_read_lock(); 1334 idev = __in6_dev_get(dev); 1335 if (idev) { 1336 read_lock_bh(&idev->lock); 1337 list_for_each_entry(ifa, &idev->addr_list, if_list) { 1338 onlink = ipv6_prefix_equal(addr, &ifa->addr, 1339 ifa->prefix_len); 1340 if (onlink) 1341 break; 1342 } 1343 read_unlock_bh(&idev->lock); 1344 } 1345 rcu_read_unlock(); 1346 return onlink; 1347 } 1348 1349 EXPORT_SYMBOL(ipv6_chk_prefix); 1350 1351 struct inet6_ifaddr *ipv6_get_ifaddr(struct net *net, const struct in6_addr *addr, 1352 struct net_device *dev, int strict) 1353 { 1354 struct inet6_ifaddr *ifp, *result = NULL; 1355 unsigned int hash = ipv6_addr_hash(addr); 1356 struct hlist_node *node; 1357 1358 rcu_read_lock_bh(); 1359 hlist_for_each_entry_rcu_bh(ifp, node, &inet6_addr_lst[hash], addr_lst) { 1360 if (!net_eq(dev_net(ifp->idev->dev), net)) 1361 continue; 1362 if (ipv6_addr_equal(&ifp->addr, addr)) { 1363 if (dev == NULL || ifp->idev->dev == dev || 1364 !(ifp->scope&(IFA_LINK|IFA_HOST) || strict)) { 1365 result = ifp; 1366 in6_ifa_hold(ifp); 1367 break; 1368 } 1369 } 1370 } 1371 rcu_read_unlock_bh(); 1372 1373 return result; 1374 } 1375 1376 /* Gets referenced address, destroys ifaddr */ 1377 1378 static void addrconf_dad_stop(struct inet6_ifaddr *ifp, int dad_failed) 1379 { 1380 if (ifp->flags&IFA_F_PERMANENT) { 1381 spin_lock_bh(&ifp->lock); 1382 addrconf_del_timer(ifp); 1383 ifp->flags |= IFA_F_TENTATIVE; 1384 if (dad_failed) 1385 ifp->flags |= IFA_F_DADFAILED; 1386 spin_unlock_bh(&ifp->lock); 1387 if (dad_failed) 1388 ipv6_ifa_notify(0, ifp); 1389 in6_ifa_put(ifp); 1390 #ifdef CONFIG_IPV6_PRIVACY 1391 } else if (ifp->flags&IFA_F_TEMPORARY) { 1392 struct inet6_ifaddr *ifpub; 1393 spin_lock_bh(&ifp->lock); 1394 ifpub = ifp->ifpub; 1395 if (ifpub) { 1396 in6_ifa_hold(ifpub); 1397 spin_unlock_bh(&ifp->lock); 1398 ipv6_create_tempaddr(ifpub, ifp); 1399 in6_ifa_put(ifpub); 1400 } else { 1401 spin_unlock_bh(&ifp->lock); 1402 } 1403 ipv6_del_addr(ifp); 1404 #endif 1405 } else 1406 ipv6_del_addr(ifp); 1407 } 1408 1409 static int addrconf_dad_end(struct inet6_ifaddr *ifp) 1410 { 1411 int err = -ENOENT; 1412 1413 spin_lock(&ifp->state_lock); 1414 if (ifp->state == INET6_IFADDR_STATE_DAD) { 1415 ifp->state = INET6_IFADDR_STATE_POSTDAD; 1416 err = 0; 1417 } 1418 spin_unlock(&ifp->state_lock); 1419 1420 return err; 1421 } 1422 1423 void addrconf_dad_failure(struct inet6_ifaddr *ifp) 1424 { 1425 struct inet6_dev *idev = ifp->idev; 1426 1427 if (addrconf_dad_end(ifp)) 1428 return; 1429 1430 if (net_ratelimit()) 1431 printk(KERN_INFO "%s: IPv6 duplicate address %pI6c detected!\n", 1432 ifp->idev->dev->name, &ifp->addr); 1433 1434 if (idev->cnf.accept_dad > 1 && !idev->cnf.disable_ipv6) { 1435 struct in6_addr addr; 1436 1437 addr.s6_addr32[0] = htonl(0xfe800000); 1438 addr.s6_addr32[1] = 0; 1439 1440 if (!ipv6_generate_eui64(addr.s6_addr + 8, idev->dev) && 1441 ipv6_addr_equal(&ifp->addr, &addr)) { 1442 /* DAD failed for link-local based on MAC address */ 1443 idev->cnf.disable_ipv6 = 1; 1444 1445 printk(KERN_INFO "%s: IPv6 being disabled!\n", 1446 ifp->idev->dev->name); 1447 } 1448 } 1449 1450 addrconf_dad_stop(ifp, 1); 1451 } 1452 1453 /* Join to solicited addr multicast group. */ 1454 1455 void addrconf_join_solict(struct net_device *dev, struct in6_addr *addr) 1456 { 1457 struct in6_addr maddr; 1458 1459 if (dev->flags&(IFF_LOOPBACK|IFF_NOARP)) 1460 return; 1461 1462 addrconf_addr_solict_mult(addr, &maddr); 1463 ipv6_dev_mc_inc(dev, &maddr); 1464 } 1465 1466 void addrconf_leave_solict(struct inet6_dev *idev, struct in6_addr *addr) 1467 { 1468 struct in6_addr maddr; 1469 1470 if (idev->dev->flags&(IFF_LOOPBACK|IFF_NOARP)) 1471 return; 1472 1473 addrconf_addr_solict_mult(addr, &maddr); 1474 __ipv6_dev_mc_dec(idev, &maddr); 1475 } 1476 1477 static void addrconf_join_anycast(struct inet6_ifaddr *ifp) 1478 { 1479 struct in6_addr addr; 1480 ipv6_addr_prefix(&addr, &ifp->addr, ifp->prefix_len); 1481 if (ipv6_addr_any(&addr)) 1482 return; 1483 ipv6_dev_ac_inc(ifp->idev->dev, &addr); 1484 } 1485 1486 static void addrconf_leave_anycast(struct inet6_ifaddr *ifp) 1487 { 1488 struct in6_addr addr; 1489 ipv6_addr_prefix(&addr, &ifp->addr, ifp->prefix_len); 1490 if (ipv6_addr_any(&addr)) 1491 return; 1492 __ipv6_dev_ac_dec(ifp->idev, &addr); 1493 } 1494 1495 static int addrconf_ifid_eui48(u8 *eui, struct net_device *dev) 1496 { 1497 if (dev->addr_len != ETH_ALEN) 1498 return -1; 1499 memcpy(eui, dev->dev_addr, 3); 1500 memcpy(eui + 5, dev->dev_addr + 3, 3); 1501 1502 /* 1503 * The zSeries OSA network cards can be shared among various 1504 * OS instances, but the OSA cards have only one MAC address. 1505 * This leads to duplicate address conflicts in conjunction 1506 * with IPv6 if more than one instance uses the same card. 1507 * 1508 * The driver for these cards can deliver a unique 16-bit 1509 * identifier for each instance sharing the same card. It is 1510 * placed instead of 0xFFFE in the interface identifier. The 1511 * "u" bit of the interface identifier is not inverted in this 1512 * case. Hence the resulting interface identifier has local 1513 * scope according to RFC2373. 1514 */ 1515 if (dev->dev_id) { 1516 eui[3] = (dev->dev_id >> 8) & 0xFF; 1517 eui[4] = dev->dev_id & 0xFF; 1518 } else { 1519 eui[3] = 0xFF; 1520 eui[4] = 0xFE; 1521 eui[0] ^= 2; 1522 } 1523 return 0; 1524 } 1525 1526 static int addrconf_ifid_arcnet(u8 *eui, struct net_device *dev) 1527 { 1528 /* XXX: inherit EUI-64 from other interface -- yoshfuji */ 1529 if (dev->addr_len != ARCNET_ALEN) 1530 return -1; 1531 memset(eui, 0, 7); 1532 eui[7] = *(u8*)dev->dev_addr; 1533 return 0; 1534 } 1535 1536 static int addrconf_ifid_infiniband(u8 *eui, struct net_device *dev) 1537 { 1538 if (dev->addr_len != INFINIBAND_ALEN) 1539 return -1; 1540 memcpy(eui, dev->dev_addr + 12, 8); 1541 eui[0] |= 2; 1542 return 0; 1543 } 1544 1545 int __ipv6_isatap_ifid(u8 *eui, __be32 addr) 1546 { 1547 if (addr == 0) 1548 return -1; 1549 eui[0] = (ipv4_is_zeronet(addr) || ipv4_is_private_10(addr) || 1550 ipv4_is_loopback(addr) || ipv4_is_linklocal_169(addr) || 1551 ipv4_is_private_172(addr) || ipv4_is_test_192(addr) || 1552 ipv4_is_anycast_6to4(addr) || ipv4_is_private_192(addr) || 1553 ipv4_is_test_198(addr) || ipv4_is_multicast(addr) || 1554 ipv4_is_lbcast(addr)) ? 0x00 : 0x02; 1555 eui[1] = 0; 1556 eui[2] = 0x5E; 1557 eui[3] = 0xFE; 1558 memcpy(eui + 4, &addr, 4); 1559 return 0; 1560 } 1561 EXPORT_SYMBOL(__ipv6_isatap_ifid); 1562 1563 static int addrconf_ifid_sit(u8 *eui, struct net_device *dev) 1564 { 1565 if (dev->priv_flags & IFF_ISATAP) 1566 return __ipv6_isatap_ifid(eui, *(__be32 *)dev->dev_addr); 1567 return -1; 1568 } 1569 1570 static int ipv6_generate_eui64(u8 *eui, struct net_device *dev) 1571 { 1572 switch (dev->type) { 1573 case ARPHRD_ETHER: 1574 case ARPHRD_FDDI: 1575 case ARPHRD_IEEE802_TR: 1576 return addrconf_ifid_eui48(eui, dev); 1577 case ARPHRD_ARCNET: 1578 return addrconf_ifid_arcnet(eui, dev); 1579 case ARPHRD_INFINIBAND: 1580 return addrconf_ifid_infiniband(eui, dev); 1581 case ARPHRD_SIT: 1582 return addrconf_ifid_sit(eui, dev); 1583 } 1584 return -1; 1585 } 1586 1587 static int ipv6_inherit_eui64(u8 *eui, struct inet6_dev *idev) 1588 { 1589 int err = -1; 1590 struct inet6_ifaddr *ifp; 1591 1592 read_lock_bh(&idev->lock); 1593 list_for_each_entry(ifp, &idev->addr_list, if_list) { 1594 if (ifp->scope == IFA_LINK && !(ifp->flags&IFA_F_TENTATIVE)) { 1595 memcpy(eui, ifp->addr.s6_addr+8, 8); 1596 err = 0; 1597 break; 1598 } 1599 } 1600 read_unlock_bh(&idev->lock); 1601 return err; 1602 } 1603 1604 #ifdef CONFIG_IPV6_PRIVACY 1605 /* (re)generation of randomized interface identifier (RFC 3041 3.2, 3.5) */ 1606 static int __ipv6_regen_rndid(struct inet6_dev *idev) 1607 { 1608 regen: 1609 get_random_bytes(idev->rndid, sizeof(idev->rndid)); 1610 idev->rndid[0] &= ~0x02; 1611 1612 /* 1613 * <draft-ietf-ipngwg-temp-addresses-v2-00.txt>: 1614 * check if generated address is not inappropriate 1615 * 1616 * - Reserved subnet anycast (RFC 2526) 1617 * 11111101 11....11 1xxxxxxx 1618 * - ISATAP (RFC4214) 6.1 1619 * 00-00-5E-FE-xx-xx-xx-xx 1620 * - value 0 1621 * - XXX: already assigned to an address on the device 1622 */ 1623 if (idev->rndid[0] == 0xfd && 1624 (idev->rndid[1]&idev->rndid[2]&idev->rndid[3]&idev->rndid[4]&idev->rndid[5]&idev->rndid[6]) == 0xff && 1625 (idev->rndid[7]&0x80)) 1626 goto regen; 1627 if ((idev->rndid[0]|idev->rndid[1]) == 0) { 1628 if (idev->rndid[2] == 0x5e && idev->rndid[3] == 0xfe) 1629 goto regen; 1630 if ((idev->rndid[2]|idev->rndid[3]|idev->rndid[4]|idev->rndid[5]|idev->rndid[6]|idev->rndid[7]) == 0x00) 1631 goto regen; 1632 } 1633 1634 return 0; 1635 } 1636 1637 static void ipv6_regen_rndid(unsigned long data) 1638 { 1639 struct inet6_dev *idev = (struct inet6_dev *) data; 1640 unsigned long expires; 1641 1642 rcu_read_lock_bh(); 1643 write_lock_bh(&idev->lock); 1644 1645 if (idev->dead) 1646 goto out; 1647 1648 if (__ipv6_regen_rndid(idev) < 0) 1649 goto out; 1650 1651 expires = jiffies + 1652 idev->cnf.temp_prefered_lft * HZ - 1653 idev->cnf.regen_max_retry * idev->cnf.dad_transmits * idev->nd_parms->retrans_time - desync_factor; 1654 if (time_before(expires, jiffies)) { 1655 printk(KERN_WARNING 1656 "ipv6_regen_rndid(): too short regeneration interval; timer disabled for %s.\n", 1657 idev->dev->name); 1658 goto out; 1659 } 1660 1661 if (!mod_timer(&idev->regen_timer, expires)) 1662 in6_dev_hold(idev); 1663 1664 out: 1665 write_unlock_bh(&idev->lock); 1666 rcu_read_unlock_bh(); 1667 in6_dev_put(idev); 1668 } 1669 1670 static int __ipv6_try_regen_rndid(struct inet6_dev *idev, struct in6_addr *tmpaddr) { 1671 int ret = 0; 1672 1673 if (tmpaddr && memcmp(idev->rndid, &tmpaddr->s6_addr[8], 8) == 0) 1674 ret = __ipv6_regen_rndid(idev); 1675 return ret; 1676 } 1677 #endif 1678 1679 /* 1680 * Add prefix route. 1681 */ 1682 1683 static void 1684 addrconf_prefix_route(struct in6_addr *pfx, int plen, struct net_device *dev, 1685 unsigned long expires, u32 flags) 1686 { 1687 struct fib6_config cfg = { 1688 .fc_table = RT6_TABLE_PREFIX, 1689 .fc_metric = IP6_RT_PRIO_ADDRCONF, 1690 .fc_ifindex = dev->ifindex, 1691 .fc_expires = expires, 1692 .fc_dst_len = plen, 1693 .fc_flags = RTF_UP | flags, 1694 .fc_nlinfo.nl_net = dev_net(dev), 1695 .fc_protocol = RTPROT_KERNEL, 1696 }; 1697 1698 ipv6_addr_copy(&cfg.fc_dst, pfx); 1699 1700 /* Prevent useless cloning on PtP SIT. 1701 This thing is done here expecting that the whole 1702 class of non-broadcast devices need not cloning. 1703 */ 1704 #if defined(CONFIG_IPV6_SIT) || defined(CONFIG_IPV6_SIT_MODULE) 1705 if (dev->type == ARPHRD_SIT && (dev->flags & IFF_POINTOPOINT)) 1706 cfg.fc_flags |= RTF_NONEXTHOP; 1707 #endif 1708 1709 ip6_route_add(&cfg); 1710 } 1711 1712 /* Create "default" multicast route to the interface */ 1713 1714 static void addrconf_add_mroute(struct net_device *dev) 1715 { 1716 struct fib6_config cfg = { 1717 .fc_table = RT6_TABLE_LOCAL, 1718 .fc_metric = IP6_RT_PRIO_ADDRCONF, 1719 .fc_ifindex = dev->ifindex, 1720 .fc_dst_len = 8, 1721 .fc_flags = RTF_UP, 1722 .fc_nlinfo.nl_net = dev_net(dev), 1723 }; 1724 1725 ipv6_addr_set(&cfg.fc_dst, htonl(0xFF000000), 0, 0, 0); 1726 1727 ip6_route_add(&cfg); 1728 } 1729 1730 #if defined(CONFIG_IPV6_SIT) || defined(CONFIG_IPV6_SIT_MODULE) 1731 static void sit_route_add(struct net_device *dev) 1732 { 1733 struct fib6_config cfg = { 1734 .fc_table = RT6_TABLE_MAIN, 1735 .fc_metric = IP6_RT_PRIO_ADDRCONF, 1736 .fc_ifindex = dev->ifindex, 1737 .fc_dst_len = 96, 1738 .fc_flags = RTF_UP | RTF_NONEXTHOP, 1739 .fc_nlinfo.nl_net = dev_net(dev), 1740 }; 1741 1742 /* prefix length - 96 bits "::d.d.d.d" */ 1743 ip6_route_add(&cfg); 1744 } 1745 #endif 1746 1747 static void addrconf_add_lroute(struct net_device *dev) 1748 { 1749 struct in6_addr addr; 1750 1751 ipv6_addr_set(&addr, htonl(0xFE800000), 0, 0, 0); 1752 addrconf_prefix_route(&addr, 64, dev, 0, 0); 1753 } 1754 1755 static struct inet6_dev *addrconf_add_dev(struct net_device *dev) 1756 { 1757 struct inet6_dev *idev; 1758 1759 ASSERT_RTNL(); 1760 1761 idev = ipv6_find_idev(dev); 1762 if (!idev) 1763 return NULL; 1764 1765 /* Add default multicast route */ 1766 addrconf_add_mroute(dev); 1767 1768 /* Add link local route */ 1769 addrconf_add_lroute(dev); 1770 return idev; 1771 } 1772 1773 void addrconf_prefix_rcv(struct net_device *dev, u8 *opt, int len) 1774 { 1775 struct prefix_info *pinfo; 1776 __u32 valid_lft; 1777 __u32 prefered_lft; 1778 int addr_type; 1779 struct inet6_dev *in6_dev; 1780 struct net *net = dev_net(dev); 1781 1782 pinfo = (struct prefix_info *) opt; 1783 1784 if (len < sizeof(struct prefix_info)) { 1785 ADBG(("addrconf: prefix option too short\n")); 1786 return; 1787 } 1788 1789 /* 1790 * Validation checks ([ADDRCONF], page 19) 1791 */ 1792 1793 addr_type = ipv6_addr_type(&pinfo->prefix); 1794 1795 if (addr_type & (IPV6_ADDR_MULTICAST|IPV6_ADDR_LINKLOCAL)) 1796 return; 1797 1798 valid_lft = ntohl(pinfo->valid); 1799 prefered_lft = ntohl(pinfo->prefered); 1800 1801 if (prefered_lft > valid_lft) { 1802 if (net_ratelimit()) 1803 printk(KERN_WARNING "addrconf: prefix option has invalid lifetime\n"); 1804 return; 1805 } 1806 1807 in6_dev = in6_dev_get(dev); 1808 1809 if (in6_dev == NULL) { 1810 if (net_ratelimit()) 1811 printk(KERN_DEBUG "addrconf: device %s not configured\n", dev->name); 1812 return; 1813 } 1814 1815 /* 1816 * Two things going on here: 1817 * 1) Add routes for on-link prefixes 1818 * 2) Configure prefixes with the auto flag set 1819 */ 1820 1821 if (pinfo->onlink) { 1822 struct rt6_info *rt; 1823 unsigned long rt_expires; 1824 1825 /* Avoid arithmetic overflow. Really, we could 1826 * save rt_expires in seconds, likely valid_lft, 1827 * but it would require division in fib gc, that it 1828 * not good. 1829 */ 1830 if (HZ > USER_HZ) 1831 rt_expires = addrconf_timeout_fixup(valid_lft, HZ); 1832 else 1833 rt_expires = addrconf_timeout_fixup(valid_lft, USER_HZ); 1834 1835 if (addrconf_finite_timeout(rt_expires)) 1836 rt_expires *= HZ; 1837 1838 rt = rt6_lookup(net, &pinfo->prefix, NULL, 1839 dev->ifindex, 1); 1840 1841 if (rt && addrconf_is_prefix_route(rt)) { 1842 /* Autoconf prefix route */ 1843 if (valid_lft == 0) { 1844 ip6_del_rt(rt); 1845 rt = NULL; 1846 } else if (addrconf_finite_timeout(rt_expires)) { 1847 /* not infinity */ 1848 rt->rt6i_expires = jiffies + rt_expires; 1849 rt->rt6i_flags |= RTF_EXPIRES; 1850 } else { 1851 rt->rt6i_flags &= ~RTF_EXPIRES; 1852 rt->rt6i_expires = 0; 1853 } 1854 } else if (valid_lft) { 1855 clock_t expires = 0; 1856 int flags = RTF_ADDRCONF | RTF_PREFIX_RT; 1857 if (addrconf_finite_timeout(rt_expires)) { 1858 /* not infinity */ 1859 flags |= RTF_EXPIRES; 1860 expires = jiffies_to_clock_t(rt_expires); 1861 } 1862 addrconf_prefix_route(&pinfo->prefix, pinfo->prefix_len, 1863 dev, expires, flags); 1864 } 1865 if (rt) 1866 dst_release(&rt->u.dst); 1867 } 1868 1869 /* Try to figure out our local address for this prefix */ 1870 1871 if (pinfo->autoconf && in6_dev->cnf.autoconf) { 1872 struct inet6_ifaddr * ifp; 1873 struct in6_addr addr; 1874 int create = 0, update_lft = 0; 1875 1876 if (pinfo->prefix_len == 64) { 1877 memcpy(&addr, &pinfo->prefix, 8); 1878 if (ipv6_generate_eui64(addr.s6_addr + 8, dev) && 1879 ipv6_inherit_eui64(addr.s6_addr + 8, in6_dev)) { 1880 in6_dev_put(in6_dev); 1881 return; 1882 } 1883 goto ok; 1884 } 1885 if (net_ratelimit()) 1886 printk(KERN_DEBUG "IPv6 addrconf: prefix with wrong length %d\n", 1887 pinfo->prefix_len); 1888 in6_dev_put(in6_dev); 1889 return; 1890 1891 ok: 1892 1893 ifp = ipv6_get_ifaddr(net, &addr, dev, 1); 1894 1895 if (ifp == NULL && valid_lft) { 1896 int max_addresses = in6_dev->cnf.max_addresses; 1897 u32 addr_flags = 0; 1898 1899 #ifdef CONFIG_IPV6_OPTIMISTIC_DAD 1900 if (in6_dev->cnf.optimistic_dad && 1901 !net->ipv6.devconf_all->forwarding) 1902 addr_flags = IFA_F_OPTIMISTIC; 1903 #endif 1904 1905 /* Do not allow to create too much of autoconfigured 1906 * addresses; this would be too easy way to crash kernel. 1907 */ 1908 if (!max_addresses || 1909 ipv6_count_addresses(in6_dev) < max_addresses) 1910 ifp = ipv6_add_addr(in6_dev, &addr, pinfo->prefix_len, 1911 addr_type&IPV6_ADDR_SCOPE_MASK, 1912 addr_flags); 1913 1914 if (!ifp || IS_ERR(ifp)) { 1915 in6_dev_put(in6_dev); 1916 return; 1917 } 1918 1919 update_lft = create = 1; 1920 ifp->cstamp = jiffies; 1921 addrconf_dad_start(ifp, RTF_ADDRCONF|RTF_PREFIX_RT); 1922 } 1923 1924 if (ifp) { 1925 int flags; 1926 unsigned long now; 1927 #ifdef CONFIG_IPV6_PRIVACY 1928 struct inet6_ifaddr *ift; 1929 #endif 1930 u32 stored_lft; 1931 1932 /* update lifetime (RFC2462 5.5.3 e) */ 1933 spin_lock(&ifp->lock); 1934 now = jiffies; 1935 if (ifp->valid_lft > (now - ifp->tstamp) / HZ) 1936 stored_lft = ifp->valid_lft - (now - ifp->tstamp) / HZ; 1937 else 1938 stored_lft = 0; 1939 if (!update_lft && stored_lft) { 1940 if (valid_lft > MIN_VALID_LIFETIME || 1941 valid_lft > stored_lft) 1942 update_lft = 1; 1943 else if (stored_lft <= MIN_VALID_LIFETIME) { 1944 /* valid_lft <= stored_lft is always true */ 1945 /* 1946 * RFC 4862 Section 5.5.3e: 1947 * "Note that the preferred lifetime of 1948 * the corresponding address is always 1949 * reset to the Preferred Lifetime in 1950 * the received Prefix Information 1951 * option, regardless of whether the 1952 * valid lifetime is also reset or 1953 * ignored." 1954 * 1955 * So if the preferred lifetime in 1956 * this advertisement is different 1957 * than what we have stored, but the 1958 * valid lifetime is invalid, just 1959 * reset prefered_lft. 1960 * 1961 * We must set the valid lifetime 1962 * to the stored lifetime since we'll 1963 * be updating the timestamp below, 1964 * else we'll set it back to the 1965 * minumum. 1966 */ 1967 if (prefered_lft != ifp->prefered_lft) { 1968 valid_lft = stored_lft; 1969 update_lft = 1; 1970 } 1971 } else { 1972 valid_lft = MIN_VALID_LIFETIME; 1973 if (valid_lft < prefered_lft) 1974 prefered_lft = valid_lft; 1975 update_lft = 1; 1976 } 1977 } 1978 1979 if (update_lft) { 1980 ifp->valid_lft = valid_lft; 1981 ifp->prefered_lft = prefered_lft; 1982 ifp->tstamp = now; 1983 flags = ifp->flags; 1984 ifp->flags &= ~IFA_F_DEPRECATED; 1985 spin_unlock(&ifp->lock); 1986 1987 if (!(flags&IFA_F_TENTATIVE)) 1988 ipv6_ifa_notify(0, ifp); 1989 } else 1990 spin_unlock(&ifp->lock); 1991 1992 #ifdef CONFIG_IPV6_PRIVACY 1993 read_lock_bh(&in6_dev->lock); 1994 /* update all temporary addresses in the list */ 1995 list_for_each_entry(ift, &in6_dev->tempaddr_list, tmp_list) { 1996 /* 1997 * When adjusting the lifetimes of an existing 1998 * temporary address, only lower the lifetimes. 1999 * Implementations must not increase the 2000 * lifetimes of an existing temporary address 2001 * when processing a Prefix Information Option. 2002 */ 2003 if (ifp != ift->ifpub) 2004 continue; 2005 2006 spin_lock(&ift->lock); 2007 flags = ift->flags; 2008 if (ift->valid_lft > valid_lft && 2009 ift->valid_lft - valid_lft > (jiffies - ift->tstamp) / HZ) 2010 ift->valid_lft = valid_lft + (jiffies - ift->tstamp) / HZ; 2011 if (ift->prefered_lft > prefered_lft && 2012 ift->prefered_lft - prefered_lft > (jiffies - ift->tstamp) / HZ) 2013 ift->prefered_lft = prefered_lft + (jiffies - ift->tstamp) / HZ; 2014 spin_unlock(&ift->lock); 2015 if (!(flags&IFA_F_TENTATIVE)) 2016 ipv6_ifa_notify(0, ift); 2017 } 2018 2019 if (create && in6_dev->cnf.use_tempaddr > 0) { 2020 /* 2021 * When a new public address is created as described in [ADDRCONF], 2022 * also create a new temporary address. 2023 */ 2024 read_unlock_bh(&in6_dev->lock); 2025 ipv6_create_tempaddr(ifp, NULL); 2026 } else { 2027 read_unlock_bh(&in6_dev->lock); 2028 } 2029 #endif 2030 in6_ifa_put(ifp); 2031 addrconf_verify(0); 2032 } 2033 } 2034 inet6_prefix_notify(RTM_NEWPREFIX, in6_dev, pinfo); 2035 in6_dev_put(in6_dev); 2036 } 2037 2038 /* 2039 * Set destination address. 2040 * Special case for SIT interfaces where we create a new "virtual" 2041 * device. 2042 */ 2043 int addrconf_set_dstaddr(struct net *net, void __user *arg) 2044 { 2045 struct in6_ifreq ireq; 2046 struct net_device *dev; 2047 int err = -EINVAL; 2048 2049 rtnl_lock(); 2050 2051 err = -EFAULT; 2052 if (copy_from_user(&ireq, arg, sizeof(struct in6_ifreq))) 2053 goto err_exit; 2054 2055 dev = __dev_get_by_index(net, ireq.ifr6_ifindex); 2056 2057 err = -ENODEV; 2058 if (dev == NULL) 2059 goto err_exit; 2060 2061 #if defined(CONFIG_IPV6_SIT) || defined(CONFIG_IPV6_SIT_MODULE) 2062 if (dev->type == ARPHRD_SIT) { 2063 const struct net_device_ops *ops = dev->netdev_ops; 2064 struct ifreq ifr; 2065 struct ip_tunnel_parm p; 2066 2067 err = -EADDRNOTAVAIL; 2068 if (!(ipv6_addr_type(&ireq.ifr6_addr) & IPV6_ADDR_COMPATv4)) 2069 goto err_exit; 2070 2071 memset(&p, 0, sizeof(p)); 2072 p.iph.daddr = ireq.ifr6_addr.s6_addr32[3]; 2073 p.iph.saddr = 0; 2074 p.iph.version = 4; 2075 p.iph.ihl = 5; 2076 p.iph.protocol = IPPROTO_IPV6; 2077 p.iph.ttl = 64; 2078 ifr.ifr_ifru.ifru_data = (__force void __user *)&p; 2079 2080 if (ops->ndo_do_ioctl) { 2081 mm_segment_t oldfs = get_fs(); 2082 2083 set_fs(KERNEL_DS); 2084 err = ops->ndo_do_ioctl(dev, &ifr, SIOCADDTUNNEL); 2085 set_fs(oldfs); 2086 } else 2087 err = -EOPNOTSUPP; 2088 2089 if (err == 0) { 2090 err = -ENOBUFS; 2091 dev = __dev_get_by_name(net, p.name); 2092 if (!dev) 2093 goto err_exit; 2094 err = dev_open(dev); 2095 } 2096 } 2097 #endif 2098 2099 err_exit: 2100 rtnl_unlock(); 2101 return err; 2102 } 2103 2104 /* 2105 * Manual configuration of address on an interface 2106 */ 2107 static int inet6_addr_add(struct net *net, int ifindex, struct in6_addr *pfx, 2108 unsigned int plen, __u8 ifa_flags, __u32 prefered_lft, 2109 __u32 valid_lft) 2110 { 2111 struct inet6_ifaddr *ifp; 2112 struct inet6_dev *idev; 2113 struct net_device *dev; 2114 int scope; 2115 u32 flags; 2116 clock_t expires; 2117 unsigned long timeout; 2118 2119 ASSERT_RTNL(); 2120 2121 if (plen > 128) 2122 return -EINVAL; 2123 2124 /* check the lifetime */ 2125 if (!valid_lft || prefered_lft > valid_lft) 2126 return -EINVAL; 2127 2128 dev = __dev_get_by_index(net, ifindex); 2129 if (!dev) 2130 return -ENODEV; 2131 2132 if ((idev = addrconf_add_dev(dev)) == NULL) 2133 return -ENOBUFS; 2134 2135 scope = ipv6_addr_scope(pfx); 2136 2137 timeout = addrconf_timeout_fixup(valid_lft, HZ); 2138 if (addrconf_finite_timeout(timeout)) { 2139 expires = jiffies_to_clock_t(timeout * HZ); 2140 valid_lft = timeout; 2141 flags = RTF_EXPIRES; 2142 } else { 2143 expires = 0; 2144 flags = 0; 2145 ifa_flags |= IFA_F_PERMANENT; 2146 } 2147 2148 timeout = addrconf_timeout_fixup(prefered_lft, HZ); 2149 if (addrconf_finite_timeout(timeout)) { 2150 if (timeout == 0) 2151 ifa_flags |= IFA_F_DEPRECATED; 2152 prefered_lft = timeout; 2153 } 2154 2155 ifp = ipv6_add_addr(idev, pfx, plen, scope, ifa_flags); 2156 2157 if (!IS_ERR(ifp)) { 2158 spin_lock_bh(&ifp->lock); 2159 ifp->valid_lft = valid_lft; 2160 ifp->prefered_lft = prefered_lft; 2161 ifp->tstamp = jiffies; 2162 spin_unlock_bh(&ifp->lock); 2163 2164 addrconf_prefix_route(&ifp->addr, ifp->prefix_len, dev, 2165 expires, flags); 2166 /* 2167 * Note that section 3.1 of RFC 4429 indicates 2168 * that the Optimistic flag should not be set for 2169 * manually configured addresses 2170 */ 2171 addrconf_dad_start(ifp, 0); 2172 in6_ifa_put(ifp); 2173 addrconf_verify(0); 2174 return 0; 2175 } 2176 2177 return PTR_ERR(ifp); 2178 } 2179 2180 static int inet6_addr_del(struct net *net, int ifindex, struct in6_addr *pfx, 2181 unsigned int plen) 2182 { 2183 struct inet6_ifaddr *ifp; 2184 struct inet6_dev *idev; 2185 struct net_device *dev; 2186 2187 if (plen > 128) 2188 return -EINVAL; 2189 2190 dev = __dev_get_by_index(net, ifindex); 2191 if (!dev) 2192 return -ENODEV; 2193 2194 if ((idev = __in6_dev_get(dev)) == NULL) 2195 return -ENXIO; 2196 2197 read_lock_bh(&idev->lock); 2198 list_for_each_entry(ifp, &idev->addr_list, if_list) { 2199 if (ifp->prefix_len == plen && 2200 ipv6_addr_equal(pfx, &ifp->addr)) { 2201 in6_ifa_hold(ifp); 2202 read_unlock_bh(&idev->lock); 2203 2204 ipv6_del_addr(ifp); 2205 2206 /* If the last address is deleted administratively, 2207 disable IPv6 on this interface. 2208 */ 2209 if (list_empty(&idev->addr_list)) 2210 addrconf_ifdown(idev->dev, 1); 2211 return 0; 2212 } 2213 } 2214 read_unlock_bh(&idev->lock); 2215 return -EADDRNOTAVAIL; 2216 } 2217 2218 2219 int addrconf_add_ifaddr(struct net *net, void __user *arg) 2220 { 2221 struct in6_ifreq ireq; 2222 int err; 2223 2224 if (!capable(CAP_NET_ADMIN)) 2225 return -EPERM; 2226 2227 if (copy_from_user(&ireq, arg, sizeof(struct in6_ifreq))) 2228 return -EFAULT; 2229 2230 rtnl_lock(); 2231 err = inet6_addr_add(net, ireq.ifr6_ifindex, &ireq.ifr6_addr, 2232 ireq.ifr6_prefixlen, IFA_F_PERMANENT, 2233 INFINITY_LIFE_TIME, INFINITY_LIFE_TIME); 2234 rtnl_unlock(); 2235 return err; 2236 } 2237 2238 int addrconf_del_ifaddr(struct net *net, void __user *arg) 2239 { 2240 struct in6_ifreq ireq; 2241 int err; 2242 2243 if (!capable(CAP_NET_ADMIN)) 2244 return -EPERM; 2245 2246 if (copy_from_user(&ireq, arg, sizeof(struct in6_ifreq))) 2247 return -EFAULT; 2248 2249 rtnl_lock(); 2250 err = inet6_addr_del(net, ireq.ifr6_ifindex, &ireq.ifr6_addr, 2251 ireq.ifr6_prefixlen); 2252 rtnl_unlock(); 2253 return err; 2254 } 2255 2256 static void add_addr(struct inet6_dev *idev, const struct in6_addr *addr, 2257 int plen, int scope) 2258 { 2259 struct inet6_ifaddr *ifp; 2260 2261 ifp = ipv6_add_addr(idev, addr, plen, scope, IFA_F_PERMANENT); 2262 if (!IS_ERR(ifp)) { 2263 spin_lock_bh(&ifp->lock); 2264 ifp->flags &= ~IFA_F_TENTATIVE; 2265 spin_unlock_bh(&ifp->lock); 2266 ipv6_ifa_notify(RTM_NEWADDR, ifp); 2267 in6_ifa_put(ifp); 2268 } 2269 } 2270 2271 #if defined(CONFIG_IPV6_SIT) || defined(CONFIG_IPV6_SIT_MODULE) 2272 static void sit_add_v4_addrs(struct inet6_dev *idev) 2273 { 2274 struct in6_addr addr; 2275 struct net_device *dev; 2276 struct net *net = dev_net(idev->dev); 2277 int scope; 2278 2279 ASSERT_RTNL(); 2280 2281 memset(&addr, 0, sizeof(struct in6_addr)); 2282 memcpy(&addr.s6_addr32[3], idev->dev->dev_addr, 4); 2283 2284 if (idev->dev->flags&IFF_POINTOPOINT) { 2285 addr.s6_addr32[0] = htonl(0xfe800000); 2286 scope = IFA_LINK; 2287 } else { 2288 scope = IPV6_ADDR_COMPATv4; 2289 } 2290 2291 if (addr.s6_addr32[3]) { 2292 add_addr(idev, &addr, 128, scope); 2293 return; 2294 } 2295 2296 for_each_netdev(net, dev) { 2297 struct in_device * in_dev = __in_dev_get_rtnl(dev); 2298 if (in_dev && (dev->flags & IFF_UP)) { 2299 struct in_ifaddr * ifa; 2300 2301 int flag = scope; 2302 2303 for (ifa = in_dev->ifa_list; ifa; ifa = ifa->ifa_next) { 2304 int plen; 2305 2306 addr.s6_addr32[3] = ifa->ifa_local; 2307 2308 if (ifa->ifa_scope == RT_SCOPE_LINK) 2309 continue; 2310 if (ifa->ifa_scope >= RT_SCOPE_HOST) { 2311 if (idev->dev->flags&IFF_POINTOPOINT) 2312 continue; 2313 flag |= IFA_HOST; 2314 } 2315 if (idev->dev->flags&IFF_POINTOPOINT) 2316 plen = 64; 2317 else 2318 plen = 96; 2319 2320 add_addr(idev, &addr, plen, flag); 2321 } 2322 } 2323 } 2324 } 2325 #endif 2326 2327 static void init_loopback(struct net_device *dev) 2328 { 2329 struct inet6_dev *idev; 2330 2331 /* ::1 */ 2332 2333 ASSERT_RTNL(); 2334 2335 if ((idev = ipv6_find_idev(dev)) == NULL) { 2336 printk(KERN_DEBUG "init loopback: add_dev failed\n"); 2337 return; 2338 } 2339 2340 add_addr(idev, &in6addr_loopback, 128, IFA_HOST); 2341 } 2342 2343 static void addrconf_add_linklocal(struct inet6_dev *idev, struct in6_addr *addr) 2344 { 2345 struct inet6_ifaddr * ifp; 2346 u32 addr_flags = IFA_F_PERMANENT; 2347 2348 #ifdef CONFIG_IPV6_OPTIMISTIC_DAD 2349 if (idev->cnf.optimistic_dad && 2350 !dev_net(idev->dev)->ipv6.devconf_all->forwarding) 2351 addr_flags |= IFA_F_OPTIMISTIC; 2352 #endif 2353 2354 2355 ifp = ipv6_add_addr(idev, addr, 64, IFA_LINK, addr_flags); 2356 if (!IS_ERR(ifp)) { 2357 addrconf_prefix_route(&ifp->addr, ifp->prefix_len, idev->dev, 0, 0); 2358 addrconf_dad_start(ifp, 0); 2359 in6_ifa_put(ifp); 2360 } 2361 } 2362 2363 static void addrconf_dev_config(struct net_device *dev) 2364 { 2365 struct in6_addr addr; 2366 struct inet6_dev * idev; 2367 2368 ASSERT_RTNL(); 2369 2370 if ((dev->type != ARPHRD_ETHER) && 2371 (dev->type != ARPHRD_FDDI) && 2372 (dev->type != ARPHRD_IEEE802_TR) && 2373 (dev->type != ARPHRD_ARCNET) && 2374 (dev->type != ARPHRD_INFINIBAND)) { 2375 /* Alas, we support only Ethernet autoconfiguration. */ 2376 return; 2377 } 2378 2379 idev = addrconf_add_dev(dev); 2380 if (idev == NULL) 2381 return; 2382 2383 memset(&addr, 0, sizeof(struct in6_addr)); 2384 addr.s6_addr32[0] = htonl(0xFE800000); 2385 2386 if (ipv6_generate_eui64(addr.s6_addr + 8, dev) == 0) 2387 addrconf_add_linklocal(idev, &addr); 2388 } 2389 2390 #if defined(CONFIG_IPV6_SIT) || defined(CONFIG_IPV6_SIT_MODULE) 2391 static void addrconf_sit_config(struct net_device *dev) 2392 { 2393 struct inet6_dev *idev; 2394 2395 ASSERT_RTNL(); 2396 2397 /* 2398 * Configure the tunnel with one of our IPv4 2399 * addresses... we should configure all of 2400 * our v4 addrs in the tunnel 2401 */ 2402 2403 if ((idev = ipv6_find_idev(dev)) == NULL) { 2404 printk(KERN_DEBUG "init sit: add_dev failed\n"); 2405 return; 2406 } 2407 2408 if (dev->priv_flags & IFF_ISATAP) { 2409 struct in6_addr addr; 2410 2411 ipv6_addr_set(&addr, htonl(0xFE800000), 0, 0, 0); 2412 addrconf_prefix_route(&addr, 64, dev, 0, 0); 2413 if (!ipv6_generate_eui64(addr.s6_addr + 8, dev)) 2414 addrconf_add_linklocal(idev, &addr); 2415 return; 2416 } 2417 2418 sit_add_v4_addrs(idev); 2419 2420 if (dev->flags&IFF_POINTOPOINT) { 2421 addrconf_add_mroute(dev); 2422 addrconf_add_lroute(dev); 2423 } else 2424 sit_route_add(dev); 2425 } 2426 #endif 2427 2428 static inline int 2429 ipv6_inherit_linklocal(struct inet6_dev *idev, struct net_device *link_dev) 2430 { 2431 struct in6_addr lladdr; 2432 2433 if (!ipv6_get_lladdr(link_dev, &lladdr, IFA_F_TENTATIVE)) { 2434 addrconf_add_linklocal(idev, &lladdr); 2435 return 0; 2436 } 2437 return -1; 2438 } 2439 2440 static void ip6_tnl_add_linklocal(struct inet6_dev *idev) 2441 { 2442 struct net_device *link_dev; 2443 struct net *net = dev_net(idev->dev); 2444 2445 /* first try to inherit the link-local address from the link device */ 2446 if (idev->dev->iflink && 2447 (link_dev = __dev_get_by_index(net, idev->dev->iflink))) { 2448 if (!ipv6_inherit_linklocal(idev, link_dev)) 2449 return; 2450 } 2451 /* then try to inherit it from any device */ 2452 for_each_netdev(net, link_dev) { 2453 if (!ipv6_inherit_linklocal(idev, link_dev)) 2454 return; 2455 } 2456 printk(KERN_DEBUG "init ip6-ip6: add_linklocal failed\n"); 2457 } 2458 2459 /* 2460 * Autoconfigure tunnel with a link-local address so routing protocols, 2461 * DHCPv6, MLD etc. can be run over the virtual link 2462 */ 2463 2464 static void addrconf_ip6_tnl_config(struct net_device *dev) 2465 { 2466 struct inet6_dev *idev; 2467 2468 ASSERT_RTNL(); 2469 2470 idev = addrconf_add_dev(dev); 2471 if (!idev) { 2472 printk(KERN_DEBUG "init ip6-ip6: add_dev failed\n"); 2473 return; 2474 } 2475 ip6_tnl_add_linklocal(idev); 2476 } 2477 2478 static int addrconf_notify(struct notifier_block *this, unsigned long event, 2479 void * data) 2480 { 2481 struct net_device *dev = (struct net_device *) data; 2482 struct inet6_dev *idev = __in6_dev_get(dev); 2483 int run_pending = 0; 2484 int err; 2485 2486 switch (event) { 2487 case NETDEV_REGISTER: 2488 if (!idev && dev->mtu >= IPV6_MIN_MTU) { 2489 idev = ipv6_add_dev(dev); 2490 if (!idev) 2491 return notifier_from_errno(-ENOMEM); 2492 } 2493 break; 2494 2495 case NETDEV_UP: 2496 case NETDEV_CHANGE: 2497 if (dev->flags & IFF_SLAVE) 2498 break; 2499 2500 if (event == NETDEV_UP) { 2501 if (!addrconf_qdisc_ok(dev)) { 2502 /* device is not ready yet. */ 2503 printk(KERN_INFO 2504 "ADDRCONF(NETDEV_UP): %s: " 2505 "link is not ready\n", 2506 dev->name); 2507 break; 2508 } 2509 2510 if (!idev && dev->mtu >= IPV6_MIN_MTU) 2511 idev = ipv6_add_dev(dev); 2512 2513 if (idev) { 2514 idev->if_flags |= IF_READY; 2515 run_pending = 1; 2516 } 2517 } else { 2518 if (!addrconf_qdisc_ok(dev)) { 2519 /* device is still not ready. */ 2520 break; 2521 } 2522 2523 if (idev) { 2524 if (idev->if_flags & IF_READY) 2525 /* device is already configured. */ 2526 break; 2527 idev->if_flags |= IF_READY; 2528 } 2529 2530 printk(KERN_INFO 2531 "ADDRCONF(NETDEV_CHANGE): %s: " 2532 "link becomes ready\n", 2533 dev->name); 2534 2535 run_pending = 1; 2536 } 2537 2538 switch (dev->type) { 2539 #if defined(CONFIG_IPV6_SIT) || defined(CONFIG_IPV6_SIT_MODULE) 2540 case ARPHRD_SIT: 2541 addrconf_sit_config(dev); 2542 break; 2543 #endif 2544 case ARPHRD_TUNNEL6: 2545 addrconf_ip6_tnl_config(dev); 2546 break; 2547 case ARPHRD_LOOPBACK: 2548 init_loopback(dev); 2549 break; 2550 2551 default: 2552 addrconf_dev_config(dev); 2553 break; 2554 } 2555 2556 if (idev) { 2557 if (run_pending) 2558 addrconf_dad_run(idev); 2559 2560 /* 2561 * If the MTU changed during the interface down, 2562 * when the interface up, the changed MTU must be 2563 * reflected in the idev as well as routers. 2564 */ 2565 if (idev->cnf.mtu6 != dev->mtu && 2566 dev->mtu >= IPV6_MIN_MTU) { 2567 rt6_mtu_change(dev, dev->mtu); 2568 idev->cnf.mtu6 = dev->mtu; 2569 } 2570 idev->tstamp = jiffies; 2571 inet6_ifinfo_notify(RTM_NEWLINK, idev); 2572 2573 /* 2574 * If the changed mtu during down is lower than 2575 * IPV6_MIN_MTU stop IPv6 on this interface. 2576 */ 2577 if (dev->mtu < IPV6_MIN_MTU) 2578 addrconf_ifdown(dev, 1); 2579 } 2580 break; 2581 2582 case NETDEV_CHANGEMTU: 2583 if (idev && dev->mtu >= IPV6_MIN_MTU) { 2584 rt6_mtu_change(dev, dev->mtu); 2585 idev->cnf.mtu6 = dev->mtu; 2586 break; 2587 } 2588 2589 if (!idev && dev->mtu >= IPV6_MIN_MTU) { 2590 idev = ipv6_add_dev(dev); 2591 if (idev) 2592 break; 2593 } 2594 2595 /* 2596 * MTU falled under IPV6_MIN_MTU. 2597 * Stop IPv6 on this interface. 2598 */ 2599 2600 case NETDEV_DOWN: 2601 case NETDEV_UNREGISTER: 2602 /* 2603 * Remove all addresses from this interface. 2604 */ 2605 addrconf_ifdown(dev, event != NETDEV_DOWN); 2606 break; 2607 2608 case NETDEV_CHANGENAME: 2609 if (idev) { 2610 snmp6_unregister_dev(idev); 2611 addrconf_sysctl_unregister(idev); 2612 addrconf_sysctl_register(idev); 2613 err = snmp6_register_dev(idev); 2614 if (err) 2615 return notifier_from_errno(err); 2616 } 2617 break; 2618 2619 case NETDEV_PRE_TYPE_CHANGE: 2620 case NETDEV_POST_TYPE_CHANGE: 2621 addrconf_type_change(dev, event); 2622 break; 2623 } 2624 2625 return NOTIFY_OK; 2626 } 2627 2628 /* 2629 * addrconf module should be notified of a device going up 2630 */ 2631 static struct notifier_block ipv6_dev_notf = { 2632 .notifier_call = addrconf_notify, 2633 }; 2634 2635 static void addrconf_type_change(struct net_device *dev, unsigned long event) 2636 { 2637 struct inet6_dev *idev; 2638 ASSERT_RTNL(); 2639 2640 idev = __in6_dev_get(dev); 2641 2642 if (event == NETDEV_POST_TYPE_CHANGE) 2643 ipv6_mc_remap(idev); 2644 else if (event == NETDEV_PRE_TYPE_CHANGE) 2645 ipv6_mc_unmap(idev); 2646 } 2647 2648 static int addrconf_ifdown(struct net_device *dev, int how) 2649 { 2650 struct net *net = dev_net(dev); 2651 struct inet6_dev *idev; 2652 struct inet6_ifaddr *ifa; 2653 LIST_HEAD(keep_list); 2654 int state; 2655 2656 ASSERT_RTNL(); 2657 2658 rt6_ifdown(net, dev); 2659 neigh_ifdown(&nd_tbl, dev); 2660 2661 idev = __in6_dev_get(dev); 2662 if (idev == NULL) 2663 return -ENODEV; 2664 2665 /* 2666 * Step 1: remove reference to ipv6 device from parent device. 2667 * Do not dev_put! 2668 */ 2669 if (how) { 2670 idev->dead = 1; 2671 2672 /* protected by rtnl_lock */ 2673 rcu_assign_pointer(dev->ip6_ptr, NULL); 2674 2675 /* Step 1.5: remove snmp6 entry */ 2676 snmp6_unregister_dev(idev); 2677 2678 } 2679 2680 write_lock_bh(&idev->lock); 2681 2682 /* Step 2: clear flags for stateless addrconf */ 2683 if (!how) 2684 idev->if_flags &= ~(IF_RS_SENT|IF_RA_RCVD|IF_READY); 2685 2686 #ifdef CONFIG_IPV6_PRIVACY 2687 if (how && del_timer(&idev->regen_timer)) 2688 in6_dev_put(idev); 2689 2690 /* Step 3: clear tempaddr list */ 2691 while (!list_empty(&idev->tempaddr_list)) { 2692 ifa = list_first_entry(&idev->tempaddr_list, 2693 struct inet6_ifaddr, tmp_list); 2694 list_del(&ifa->tmp_list); 2695 write_unlock_bh(&idev->lock); 2696 spin_lock_bh(&ifa->lock); 2697 2698 if (ifa->ifpub) { 2699 in6_ifa_put(ifa->ifpub); 2700 ifa->ifpub = NULL; 2701 } 2702 spin_unlock_bh(&ifa->lock); 2703 in6_ifa_put(ifa); 2704 write_lock_bh(&idev->lock); 2705 } 2706 #endif 2707 2708 while (!list_empty(&idev->addr_list)) { 2709 ifa = list_first_entry(&idev->addr_list, 2710 struct inet6_ifaddr, if_list); 2711 addrconf_del_timer(ifa); 2712 2713 /* If just doing link down, and address is permanent 2714 and not link-local, then retain it. */ 2715 if (!how && 2716 (ifa->flags&IFA_F_PERMANENT) && 2717 !(ipv6_addr_type(&ifa->addr) & IPV6_ADDR_LINKLOCAL)) { 2718 list_move_tail(&ifa->if_list, &keep_list); 2719 2720 /* If not doing DAD on this address, just keep it. */ 2721 if ((dev->flags&(IFF_NOARP|IFF_LOOPBACK)) || 2722 idev->cnf.accept_dad <= 0 || 2723 (ifa->flags & IFA_F_NODAD)) 2724 continue; 2725 2726 /* If it was tentative already, no need to notify */ 2727 if (ifa->flags & IFA_F_TENTATIVE) 2728 continue; 2729 2730 /* Flag it for later restoration when link comes up */ 2731 ifa->flags |= IFA_F_TENTATIVE; 2732 ifa->state = INET6_IFADDR_STATE_DAD; 2733 2734 write_unlock_bh(&idev->lock); 2735 2736 in6_ifa_hold(ifa); 2737 } else { 2738 list_del(&ifa->if_list); 2739 2740 /* clear hash table */ 2741 spin_lock_bh(&addrconf_hash_lock); 2742 hlist_del_init_rcu(&ifa->addr_lst); 2743 spin_unlock_bh(&addrconf_hash_lock); 2744 2745 write_unlock_bh(&idev->lock); 2746 spin_lock_bh(&ifa->state_lock); 2747 state = ifa->state; 2748 ifa->state = INET6_IFADDR_STATE_DEAD; 2749 spin_unlock_bh(&ifa->state_lock); 2750 2751 if (state == INET6_IFADDR_STATE_DEAD) 2752 goto put_ifa; 2753 } 2754 2755 __ipv6_ifa_notify(RTM_DELADDR, ifa); 2756 if (ifa->state == INET6_IFADDR_STATE_DEAD) 2757 atomic_notifier_call_chain(&inet6addr_chain, 2758 NETDEV_DOWN, ifa); 2759 2760 put_ifa: 2761 in6_ifa_put(ifa); 2762 2763 write_lock_bh(&idev->lock); 2764 } 2765 2766 list_splice(&keep_list, &idev->addr_list); 2767 2768 write_unlock_bh(&idev->lock); 2769 2770 /* Step 5: Discard multicast list */ 2771 if (how) 2772 ipv6_mc_destroy_dev(idev); 2773 else 2774 ipv6_mc_down(idev); 2775 2776 idev->tstamp = jiffies; 2777 2778 /* Last: Shot the device (if unregistered) */ 2779 if (how) { 2780 addrconf_sysctl_unregister(idev); 2781 neigh_parms_release(&nd_tbl, idev->nd_parms); 2782 neigh_ifdown(&nd_tbl, dev); 2783 in6_dev_put(idev); 2784 } 2785 return 0; 2786 } 2787 2788 static void addrconf_rs_timer(unsigned long data) 2789 { 2790 struct inet6_ifaddr *ifp = (struct inet6_ifaddr *) data; 2791 struct inet6_dev *idev = ifp->idev; 2792 2793 read_lock(&idev->lock); 2794 if (idev->dead || !(idev->if_flags & IF_READY)) 2795 goto out; 2796 2797 if (idev->cnf.forwarding) 2798 goto out; 2799 2800 /* Announcement received after solicitation was sent */ 2801 if (idev->if_flags & IF_RA_RCVD) 2802 goto out; 2803 2804 spin_lock(&ifp->lock); 2805 if (ifp->probes++ < idev->cnf.rtr_solicits) { 2806 /* The wait after the last probe can be shorter */ 2807 addrconf_mod_timer(ifp, AC_RS, 2808 (ifp->probes == idev->cnf.rtr_solicits) ? 2809 idev->cnf.rtr_solicit_delay : 2810 idev->cnf.rtr_solicit_interval); 2811 spin_unlock(&ifp->lock); 2812 2813 ndisc_send_rs(idev->dev, &ifp->addr, &in6addr_linklocal_allrouters); 2814 } else { 2815 spin_unlock(&ifp->lock); 2816 /* 2817 * Note: we do not support deprecated "all on-link" 2818 * assumption any longer. 2819 */ 2820 printk(KERN_DEBUG "%s: no IPv6 routers present\n", 2821 idev->dev->name); 2822 } 2823 2824 out: 2825 read_unlock(&idev->lock); 2826 in6_ifa_put(ifp); 2827 } 2828 2829 /* 2830 * Duplicate Address Detection 2831 */ 2832 static void addrconf_dad_kick(struct inet6_ifaddr *ifp) 2833 { 2834 unsigned long rand_num; 2835 struct inet6_dev *idev = ifp->idev; 2836 2837 if (ifp->flags & IFA_F_OPTIMISTIC) 2838 rand_num = 0; 2839 else 2840 rand_num = net_random() % (idev->cnf.rtr_solicit_delay ? : 1); 2841 2842 ifp->probes = idev->cnf.dad_transmits; 2843 addrconf_mod_timer(ifp, AC_DAD, rand_num); 2844 } 2845 2846 static void addrconf_dad_start(struct inet6_ifaddr *ifp, u32 flags) 2847 { 2848 struct inet6_dev *idev = ifp->idev; 2849 struct net_device *dev = idev->dev; 2850 2851 addrconf_join_solict(dev, &ifp->addr); 2852 2853 net_srandom(ifp->addr.s6_addr32[3]); 2854 2855 read_lock_bh(&idev->lock); 2856 spin_lock(&ifp->lock); 2857 if (ifp->state == INET6_IFADDR_STATE_DEAD) 2858 goto out; 2859 2860 if (dev->flags&(IFF_NOARP|IFF_LOOPBACK) || 2861 idev->cnf.accept_dad < 1 || 2862 !(ifp->flags&IFA_F_TENTATIVE) || 2863 ifp->flags & IFA_F_NODAD) { 2864 ifp->flags &= ~(IFA_F_TENTATIVE|IFA_F_OPTIMISTIC|IFA_F_DADFAILED); 2865 spin_unlock(&ifp->lock); 2866 read_unlock_bh(&idev->lock); 2867 2868 addrconf_dad_completed(ifp); 2869 return; 2870 } 2871 2872 if (!(idev->if_flags & IF_READY)) { 2873 spin_unlock(&ifp->lock); 2874 read_unlock_bh(&idev->lock); 2875 /* 2876 * If the device is not ready: 2877 * - keep it tentative if it is a permanent address. 2878 * - otherwise, kill it. 2879 */ 2880 in6_ifa_hold(ifp); 2881 addrconf_dad_stop(ifp, 0); 2882 return; 2883 } 2884 2885 /* 2886 * Optimistic nodes can start receiving 2887 * Frames right away 2888 */ 2889 if (ifp->flags & IFA_F_OPTIMISTIC) 2890 ip6_ins_rt(ifp->rt); 2891 2892 addrconf_dad_kick(ifp); 2893 out: 2894 spin_unlock(&ifp->lock); 2895 read_unlock_bh(&idev->lock); 2896 } 2897 2898 static void addrconf_dad_timer(unsigned long data) 2899 { 2900 struct inet6_ifaddr *ifp = (struct inet6_ifaddr *) data; 2901 struct inet6_dev *idev = ifp->idev; 2902 struct in6_addr mcaddr; 2903 2904 if (!ifp->probes && addrconf_dad_end(ifp)) 2905 goto out; 2906 2907 read_lock(&idev->lock); 2908 if (idev->dead || !(idev->if_flags & IF_READY)) { 2909 read_unlock(&idev->lock); 2910 goto out; 2911 } 2912 2913 spin_lock(&ifp->lock); 2914 if (ifp->state == INET6_IFADDR_STATE_DEAD) { 2915 spin_unlock(&ifp->lock); 2916 read_unlock(&idev->lock); 2917 goto out; 2918 } 2919 2920 if (ifp->probes == 0) { 2921 /* 2922 * DAD was successful 2923 */ 2924 2925 ifp->flags &= ~(IFA_F_TENTATIVE|IFA_F_OPTIMISTIC|IFA_F_DADFAILED); 2926 spin_unlock(&ifp->lock); 2927 read_unlock(&idev->lock); 2928 2929 addrconf_dad_completed(ifp); 2930 2931 goto out; 2932 } 2933 2934 ifp->probes--; 2935 addrconf_mod_timer(ifp, AC_DAD, ifp->idev->nd_parms->retrans_time); 2936 spin_unlock(&ifp->lock); 2937 read_unlock(&idev->lock); 2938 2939 /* send a neighbour solicitation for our addr */ 2940 addrconf_addr_solict_mult(&ifp->addr, &mcaddr); 2941 ndisc_send_ns(ifp->idev->dev, NULL, &ifp->addr, &mcaddr, &in6addr_any); 2942 out: 2943 in6_ifa_put(ifp); 2944 } 2945 2946 static void addrconf_dad_completed(struct inet6_ifaddr *ifp) 2947 { 2948 struct net_device *dev = ifp->idev->dev; 2949 2950 /* 2951 * Configure the address for reception. Now it is valid. 2952 */ 2953 2954 ipv6_ifa_notify(RTM_NEWADDR, ifp); 2955 2956 /* If added prefix is link local and forwarding is off, 2957 start sending router solicitations. 2958 */ 2959 2960 if (ifp->idev->cnf.forwarding == 0 && 2961 ifp->idev->cnf.rtr_solicits > 0 && 2962 (dev->flags&IFF_LOOPBACK) == 0 && 2963 (ipv6_addr_type(&ifp->addr) & IPV6_ADDR_LINKLOCAL)) { 2964 /* 2965 * If a host as already performed a random delay 2966 * [...] as part of DAD [...] there is no need 2967 * to delay again before sending the first RS 2968 */ 2969 ndisc_send_rs(ifp->idev->dev, &ifp->addr, &in6addr_linklocal_allrouters); 2970 2971 spin_lock_bh(&ifp->lock); 2972 ifp->probes = 1; 2973 ifp->idev->if_flags |= IF_RS_SENT; 2974 addrconf_mod_timer(ifp, AC_RS, ifp->idev->cnf.rtr_solicit_interval); 2975 spin_unlock_bh(&ifp->lock); 2976 } 2977 } 2978 2979 static void addrconf_dad_run(struct inet6_dev *idev) 2980 { 2981 struct inet6_ifaddr *ifp; 2982 2983 read_lock_bh(&idev->lock); 2984 list_for_each_entry(ifp, &idev->addr_list, if_list) { 2985 spin_lock(&ifp->lock); 2986 if (ifp->flags & IFA_F_TENTATIVE && 2987 ifp->state == INET6_IFADDR_STATE_DAD) 2988 addrconf_dad_kick(ifp); 2989 spin_unlock(&ifp->lock); 2990 } 2991 read_unlock_bh(&idev->lock); 2992 } 2993 2994 #ifdef CONFIG_PROC_FS 2995 struct if6_iter_state { 2996 struct seq_net_private p; 2997 int bucket; 2998 }; 2999 3000 static struct inet6_ifaddr *if6_get_first(struct seq_file *seq) 3001 { 3002 struct inet6_ifaddr *ifa = NULL; 3003 struct if6_iter_state *state = seq->private; 3004 struct net *net = seq_file_net(seq); 3005 3006 for (state->bucket = 0; state->bucket < IN6_ADDR_HSIZE; ++state->bucket) { 3007 struct hlist_node *n; 3008 hlist_for_each_entry_rcu_bh(ifa, n, &inet6_addr_lst[state->bucket], 3009 addr_lst) 3010 if (net_eq(dev_net(ifa->idev->dev), net)) 3011 return ifa; 3012 } 3013 return NULL; 3014 } 3015 3016 static struct inet6_ifaddr *if6_get_next(struct seq_file *seq, 3017 struct inet6_ifaddr *ifa) 3018 { 3019 struct if6_iter_state *state = seq->private; 3020 struct net *net = seq_file_net(seq); 3021 struct hlist_node *n = &ifa->addr_lst; 3022 3023 hlist_for_each_entry_continue_rcu_bh(ifa, n, addr_lst) 3024 if (net_eq(dev_net(ifa->idev->dev), net)) 3025 return ifa; 3026 3027 while (++state->bucket < IN6_ADDR_HSIZE) { 3028 hlist_for_each_entry_rcu_bh(ifa, n, 3029 &inet6_addr_lst[state->bucket], addr_lst) { 3030 if (net_eq(dev_net(ifa->idev->dev), net)) 3031 return ifa; 3032 } 3033 } 3034 3035 return NULL; 3036 } 3037 3038 static struct inet6_ifaddr *if6_get_idx(struct seq_file *seq, loff_t pos) 3039 { 3040 struct inet6_ifaddr *ifa = if6_get_first(seq); 3041 3042 if (ifa) 3043 while (pos && (ifa = if6_get_next(seq, ifa)) != NULL) 3044 --pos; 3045 return pos ? NULL : ifa; 3046 } 3047 3048 static void *if6_seq_start(struct seq_file *seq, loff_t *pos) 3049 __acquires(rcu_bh) 3050 { 3051 rcu_read_lock_bh(); 3052 return if6_get_idx(seq, *pos); 3053 } 3054 3055 static void *if6_seq_next(struct seq_file *seq, void *v, loff_t *pos) 3056 { 3057 struct inet6_ifaddr *ifa; 3058 3059 ifa = if6_get_next(seq, v); 3060 ++*pos; 3061 return ifa; 3062 } 3063 3064 static void if6_seq_stop(struct seq_file *seq, void *v) 3065 __releases(rcu_bh) 3066 { 3067 rcu_read_unlock_bh(); 3068 } 3069 3070 static int if6_seq_show(struct seq_file *seq, void *v) 3071 { 3072 struct inet6_ifaddr *ifp = (struct inet6_ifaddr *)v; 3073 seq_printf(seq, "%pi6 %02x %02x %02x %02x %8s\n", 3074 &ifp->addr, 3075 ifp->idev->dev->ifindex, 3076 ifp->prefix_len, 3077 ifp->scope, 3078 ifp->flags, 3079 ifp->idev->dev->name); 3080 return 0; 3081 } 3082 3083 static const struct seq_operations if6_seq_ops = { 3084 .start = if6_seq_start, 3085 .next = if6_seq_next, 3086 .show = if6_seq_show, 3087 .stop = if6_seq_stop, 3088 }; 3089 3090 static int if6_seq_open(struct inode *inode, struct file *file) 3091 { 3092 return seq_open_net(inode, file, &if6_seq_ops, 3093 sizeof(struct if6_iter_state)); 3094 } 3095 3096 static const struct file_operations if6_fops = { 3097 .owner = THIS_MODULE, 3098 .open = if6_seq_open, 3099 .read = seq_read, 3100 .llseek = seq_lseek, 3101 .release = seq_release_net, 3102 }; 3103 3104 static int __net_init if6_proc_net_init(struct net *net) 3105 { 3106 if (!proc_net_fops_create(net, "if_inet6", S_IRUGO, &if6_fops)) 3107 return -ENOMEM; 3108 return 0; 3109 } 3110 3111 static void __net_exit if6_proc_net_exit(struct net *net) 3112 { 3113 proc_net_remove(net, "if_inet6"); 3114 } 3115 3116 static struct pernet_operations if6_proc_net_ops = { 3117 .init = if6_proc_net_init, 3118 .exit = if6_proc_net_exit, 3119 }; 3120 3121 int __init if6_proc_init(void) 3122 { 3123 return register_pernet_subsys(&if6_proc_net_ops); 3124 } 3125 3126 void if6_proc_exit(void) 3127 { 3128 unregister_pernet_subsys(&if6_proc_net_ops); 3129 } 3130 #endif /* CONFIG_PROC_FS */ 3131 3132 #if defined(CONFIG_IPV6_MIP6) || defined(CONFIG_IPV6_MIP6_MODULE) 3133 /* Check if address is a home address configured on any interface. */ 3134 int ipv6_chk_home_addr(struct net *net, struct in6_addr *addr) 3135 { 3136 int ret = 0; 3137 struct inet6_ifaddr *ifp = NULL; 3138 struct hlist_node *n; 3139 unsigned int hash = ipv6_addr_hash(addr); 3140 3141 rcu_read_lock_bh(); 3142 hlist_for_each_entry_rcu_bh(ifp, n, &inet6_addr_lst[hash], addr_lst) { 3143 if (!net_eq(dev_net(ifp->idev->dev), net)) 3144 continue; 3145 if (ipv6_addr_equal(&ifp->addr, addr) && 3146 (ifp->flags & IFA_F_HOMEADDRESS)) { 3147 ret = 1; 3148 break; 3149 } 3150 } 3151 rcu_read_unlock_bh(); 3152 return ret; 3153 } 3154 #endif 3155 3156 /* 3157 * Periodic address status verification 3158 */ 3159 3160 static void addrconf_verify(unsigned long foo) 3161 { 3162 unsigned long now, next, next_sec, next_sched; 3163 struct inet6_ifaddr *ifp; 3164 struct hlist_node *node; 3165 int i; 3166 3167 rcu_read_lock_bh(); 3168 spin_lock(&addrconf_verify_lock); 3169 now = jiffies; 3170 next = round_jiffies_up(now + ADDR_CHECK_FREQUENCY); 3171 3172 del_timer(&addr_chk_timer); 3173 3174 for (i = 0; i < IN6_ADDR_HSIZE; i++) { 3175 restart: 3176 hlist_for_each_entry_rcu_bh(ifp, node, 3177 &inet6_addr_lst[i], addr_lst) { 3178 unsigned long age; 3179 3180 if (ifp->flags & IFA_F_PERMANENT) 3181 continue; 3182 3183 spin_lock(&ifp->lock); 3184 /* We try to batch several events at once. */ 3185 age = (now - ifp->tstamp + ADDRCONF_TIMER_FUZZ_MINUS) / HZ; 3186 3187 if (ifp->valid_lft != INFINITY_LIFE_TIME && 3188 age >= ifp->valid_lft) { 3189 spin_unlock(&ifp->lock); 3190 in6_ifa_hold(ifp); 3191 ipv6_del_addr(ifp); 3192 goto restart; 3193 } else if (ifp->prefered_lft == INFINITY_LIFE_TIME) { 3194 spin_unlock(&ifp->lock); 3195 continue; 3196 } else if (age >= ifp->prefered_lft) { 3197 /* jiffies - ifp->tstamp > age >= ifp->prefered_lft */ 3198 int deprecate = 0; 3199 3200 if (!(ifp->flags&IFA_F_DEPRECATED)) { 3201 deprecate = 1; 3202 ifp->flags |= IFA_F_DEPRECATED; 3203 } 3204 3205 if (time_before(ifp->tstamp + ifp->valid_lft * HZ, next)) 3206 next = ifp->tstamp + ifp->valid_lft * HZ; 3207 3208 spin_unlock(&ifp->lock); 3209 3210 if (deprecate) { 3211 in6_ifa_hold(ifp); 3212 3213 ipv6_ifa_notify(0, ifp); 3214 in6_ifa_put(ifp); 3215 goto restart; 3216 } 3217 #ifdef CONFIG_IPV6_PRIVACY 3218 } else if ((ifp->flags&IFA_F_TEMPORARY) && 3219 !(ifp->flags&IFA_F_TENTATIVE)) { 3220 unsigned long regen_advance = ifp->idev->cnf.regen_max_retry * 3221 ifp->idev->cnf.dad_transmits * 3222 ifp->idev->nd_parms->retrans_time / HZ; 3223 3224 if (age >= ifp->prefered_lft - regen_advance) { 3225 struct inet6_ifaddr *ifpub = ifp->ifpub; 3226 if (time_before(ifp->tstamp + ifp->prefered_lft * HZ, next)) 3227 next = ifp->tstamp + ifp->prefered_lft * HZ; 3228 if (!ifp->regen_count && ifpub) { 3229 ifp->regen_count++; 3230 in6_ifa_hold(ifp); 3231 in6_ifa_hold(ifpub); 3232 spin_unlock(&ifp->lock); 3233 3234 spin_lock(&ifpub->lock); 3235 ifpub->regen_count = 0; 3236 spin_unlock(&ifpub->lock); 3237 ipv6_create_tempaddr(ifpub, ifp); 3238 in6_ifa_put(ifpub); 3239 in6_ifa_put(ifp); 3240 goto restart; 3241 } 3242 } else if (time_before(ifp->tstamp + ifp->prefered_lft * HZ - regen_advance * HZ, next)) 3243 next = ifp->tstamp + ifp->prefered_lft * HZ - regen_advance * HZ; 3244 spin_unlock(&ifp->lock); 3245 #endif 3246 } else { 3247 /* ifp->prefered_lft <= ifp->valid_lft */ 3248 if (time_before(ifp->tstamp + ifp->prefered_lft * HZ, next)) 3249 next = ifp->tstamp + ifp->prefered_lft * HZ; 3250 spin_unlock(&ifp->lock); 3251 } 3252 } 3253 } 3254 3255 next_sec = round_jiffies_up(next); 3256 next_sched = next; 3257 3258 /* If rounded timeout is accurate enough, accept it. */ 3259 if (time_before(next_sec, next + ADDRCONF_TIMER_FUZZ)) 3260 next_sched = next_sec; 3261 3262 /* And minimum interval is ADDRCONF_TIMER_FUZZ_MAX. */ 3263 if (time_before(next_sched, jiffies + ADDRCONF_TIMER_FUZZ_MAX)) 3264 next_sched = jiffies + ADDRCONF_TIMER_FUZZ_MAX; 3265 3266 ADBG((KERN_DEBUG "now = %lu, schedule = %lu, rounded schedule = %lu => %lu\n", 3267 now, next, next_sec, next_sched)); 3268 3269 addr_chk_timer.expires = next_sched; 3270 add_timer(&addr_chk_timer); 3271 spin_unlock(&addrconf_verify_lock); 3272 rcu_read_unlock_bh(); 3273 } 3274 3275 static struct in6_addr *extract_addr(struct nlattr *addr, struct nlattr *local) 3276 { 3277 struct in6_addr *pfx = NULL; 3278 3279 if (addr) 3280 pfx = nla_data(addr); 3281 3282 if (local) { 3283 if (pfx && nla_memcmp(local, pfx, sizeof(*pfx))) 3284 pfx = NULL; 3285 else 3286 pfx = nla_data(local); 3287 } 3288 3289 return pfx; 3290 } 3291 3292 static const struct nla_policy ifa_ipv6_policy[IFA_MAX+1] = { 3293 [IFA_ADDRESS] = { .len = sizeof(struct in6_addr) }, 3294 [IFA_LOCAL] = { .len = sizeof(struct in6_addr) }, 3295 [IFA_CACHEINFO] = { .len = sizeof(struct ifa_cacheinfo) }, 3296 }; 3297 3298 static int 3299 inet6_rtm_deladdr(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg) 3300 { 3301 struct net *net = sock_net(skb->sk); 3302 struct ifaddrmsg *ifm; 3303 struct nlattr *tb[IFA_MAX+1]; 3304 struct in6_addr *pfx; 3305 int err; 3306 3307 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFA_MAX, ifa_ipv6_policy); 3308 if (err < 0) 3309 return err; 3310 3311 ifm = nlmsg_data(nlh); 3312 pfx = extract_addr(tb[IFA_ADDRESS], tb[IFA_LOCAL]); 3313 if (pfx == NULL) 3314 return -EINVAL; 3315 3316 return inet6_addr_del(net, ifm->ifa_index, pfx, ifm->ifa_prefixlen); 3317 } 3318 3319 static int inet6_addr_modify(struct inet6_ifaddr *ifp, u8 ifa_flags, 3320 u32 prefered_lft, u32 valid_lft) 3321 { 3322 u32 flags; 3323 clock_t expires; 3324 unsigned long timeout; 3325 3326 if (!valid_lft || (prefered_lft > valid_lft)) 3327 return -EINVAL; 3328 3329 timeout = addrconf_timeout_fixup(valid_lft, HZ); 3330 if (addrconf_finite_timeout(timeout)) { 3331 expires = jiffies_to_clock_t(timeout * HZ); 3332 valid_lft = timeout; 3333 flags = RTF_EXPIRES; 3334 } else { 3335 expires = 0; 3336 flags = 0; 3337 ifa_flags |= IFA_F_PERMANENT; 3338 } 3339 3340 timeout = addrconf_timeout_fixup(prefered_lft, HZ); 3341 if (addrconf_finite_timeout(timeout)) { 3342 if (timeout == 0) 3343 ifa_flags |= IFA_F_DEPRECATED; 3344 prefered_lft = timeout; 3345 } 3346 3347 spin_lock_bh(&ifp->lock); 3348 ifp->flags = (ifp->flags & ~(IFA_F_DEPRECATED | IFA_F_PERMANENT | IFA_F_NODAD | IFA_F_HOMEADDRESS)) | ifa_flags; 3349 ifp->tstamp = jiffies; 3350 ifp->valid_lft = valid_lft; 3351 ifp->prefered_lft = prefered_lft; 3352 3353 spin_unlock_bh(&ifp->lock); 3354 if (!(ifp->flags&IFA_F_TENTATIVE)) 3355 ipv6_ifa_notify(0, ifp); 3356 3357 addrconf_prefix_route(&ifp->addr, ifp->prefix_len, ifp->idev->dev, 3358 expires, flags); 3359 addrconf_verify(0); 3360 3361 return 0; 3362 } 3363 3364 static int 3365 inet6_rtm_newaddr(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg) 3366 { 3367 struct net *net = sock_net(skb->sk); 3368 struct ifaddrmsg *ifm; 3369 struct nlattr *tb[IFA_MAX+1]; 3370 struct in6_addr *pfx; 3371 struct inet6_ifaddr *ifa; 3372 struct net_device *dev; 3373 u32 valid_lft = INFINITY_LIFE_TIME, preferred_lft = INFINITY_LIFE_TIME; 3374 u8 ifa_flags; 3375 int err; 3376 3377 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFA_MAX, ifa_ipv6_policy); 3378 if (err < 0) 3379 return err; 3380 3381 ifm = nlmsg_data(nlh); 3382 pfx = extract_addr(tb[IFA_ADDRESS], tb[IFA_LOCAL]); 3383 if (pfx == NULL) 3384 return -EINVAL; 3385 3386 if (tb[IFA_CACHEINFO]) { 3387 struct ifa_cacheinfo *ci; 3388 3389 ci = nla_data(tb[IFA_CACHEINFO]); 3390 valid_lft = ci->ifa_valid; 3391 preferred_lft = ci->ifa_prefered; 3392 } else { 3393 preferred_lft = INFINITY_LIFE_TIME; 3394 valid_lft = INFINITY_LIFE_TIME; 3395 } 3396 3397 dev = __dev_get_by_index(net, ifm->ifa_index); 3398 if (dev == NULL) 3399 return -ENODEV; 3400 3401 /* We ignore other flags so far. */ 3402 ifa_flags = ifm->ifa_flags & (IFA_F_NODAD | IFA_F_HOMEADDRESS); 3403 3404 ifa = ipv6_get_ifaddr(net, pfx, dev, 1); 3405 if (ifa == NULL) { 3406 /* 3407 * It would be best to check for !NLM_F_CREATE here but 3408 * userspace alreay relies on not having to provide this. 3409 */ 3410 return inet6_addr_add(net, ifm->ifa_index, pfx, 3411 ifm->ifa_prefixlen, ifa_flags, 3412 preferred_lft, valid_lft); 3413 } 3414 3415 if (nlh->nlmsg_flags & NLM_F_EXCL || 3416 !(nlh->nlmsg_flags & NLM_F_REPLACE)) 3417 err = -EEXIST; 3418 else 3419 err = inet6_addr_modify(ifa, ifa_flags, preferred_lft, valid_lft); 3420 3421 in6_ifa_put(ifa); 3422 3423 return err; 3424 } 3425 3426 static void put_ifaddrmsg(struct nlmsghdr *nlh, u8 prefixlen, u8 flags, 3427 u8 scope, int ifindex) 3428 { 3429 struct ifaddrmsg *ifm; 3430 3431 ifm = nlmsg_data(nlh); 3432 ifm->ifa_family = AF_INET6; 3433 ifm->ifa_prefixlen = prefixlen; 3434 ifm->ifa_flags = flags; 3435 ifm->ifa_scope = scope; 3436 ifm->ifa_index = ifindex; 3437 } 3438 3439 static int put_cacheinfo(struct sk_buff *skb, unsigned long cstamp, 3440 unsigned long tstamp, u32 preferred, u32 valid) 3441 { 3442 struct ifa_cacheinfo ci; 3443 3444 ci.cstamp = (u32)(TIME_DELTA(cstamp, INITIAL_JIFFIES) / HZ * 100 3445 + TIME_DELTA(cstamp, INITIAL_JIFFIES) % HZ * 100 / HZ); 3446 ci.tstamp = (u32)(TIME_DELTA(tstamp, INITIAL_JIFFIES) / HZ * 100 3447 + TIME_DELTA(tstamp, INITIAL_JIFFIES) % HZ * 100 / HZ); 3448 ci.ifa_prefered = preferred; 3449 ci.ifa_valid = valid; 3450 3451 return nla_put(skb, IFA_CACHEINFO, sizeof(ci), &ci); 3452 } 3453 3454 static inline int rt_scope(int ifa_scope) 3455 { 3456 if (ifa_scope & IFA_HOST) 3457 return RT_SCOPE_HOST; 3458 else if (ifa_scope & IFA_LINK) 3459 return RT_SCOPE_LINK; 3460 else if (ifa_scope & IFA_SITE) 3461 return RT_SCOPE_SITE; 3462 else 3463 return RT_SCOPE_UNIVERSE; 3464 } 3465 3466 static inline int inet6_ifaddr_msgsize(void) 3467 { 3468 return NLMSG_ALIGN(sizeof(struct ifaddrmsg)) 3469 + nla_total_size(16) /* IFA_ADDRESS */ 3470 + nla_total_size(sizeof(struct ifa_cacheinfo)); 3471 } 3472 3473 static int inet6_fill_ifaddr(struct sk_buff *skb, struct inet6_ifaddr *ifa, 3474 u32 pid, u32 seq, int event, unsigned int flags) 3475 { 3476 struct nlmsghdr *nlh; 3477 u32 preferred, valid; 3478 3479 nlh = nlmsg_put(skb, pid, seq, event, sizeof(struct ifaddrmsg), flags); 3480 if (nlh == NULL) 3481 return -EMSGSIZE; 3482 3483 put_ifaddrmsg(nlh, ifa->prefix_len, ifa->flags, rt_scope(ifa->scope), 3484 ifa->idev->dev->ifindex); 3485 3486 if (!(ifa->flags&IFA_F_PERMANENT)) { 3487 preferred = ifa->prefered_lft; 3488 valid = ifa->valid_lft; 3489 if (preferred != INFINITY_LIFE_TIME) { 3490 long tval = (jiffies - ifa->tstamp)/HZ; 3491 if (preferred > tval) 3492 preferred -= tval; 3493 else 3494 preferred = 0; 3495 if (valid != INFINITY_LIFE_TIME) 3496 valid -= tval; 3497 } 3498 } else { 3499 preferred = INFINITY_LIFE_TIME; 3500 valid = INFINITY_LIFE_TIME; 3501 } 3502 3503 if (nla_put(skb, IFA_ADDRESS, 16, &ifa->addr) < 0 || 3504 put_cacheinfo(skb, ifa->cstamp, ifa->tstamp, preferred, valid) < 0) { 3505 nlmsg_cancel(skb, nlh); 3506 return -EMSGSIZE; 3507 } 3508 3509 return nlmsg_end(skb, nlh); 3510 } 3511 3512 static int inet6_fill_ifmcaddr(struct sk_buff *skb, struct ifmcaddr6 *ifmca, 3513 u32 pid, u32 seq, int event, u16 flags) 3514 { 3515 struct nlmsghdr *nlh; 3516 u8 scope = RT_SCOPE_UNIVERSE; 3517 int ifindex = ifmca->idev->dev->ifindex; 3518 3519 if (ipv6_addr_scope(&ifmca->mca_addr) & IFA_SITE) 3520 scope = RT_SCOPE_SITE; 3521 3522 nlh = nlmsg_put(skb, pid, seq, event, sizeof(struct ifaddrmsg), flags); 3523 if (nlh == NULL) 3524 return -EMSGSIZE; 3525 3526 put_ifaddrmsg(nlh, 128, IFA_F_PERMANENT, scope, ifindex); 3527 if (nla_put(skb, IFA_MULTICAST, 16, &ifmca->mca_addr) < 0 || 3528 put_cacheinfo(skb, ifmca->mca_cstamp, ifmca->mca_tstamp, 3529 INFINITY_LIFE_TIME, INFINITY_LIFE_TIME) < 0) { 3530 nlmsg_cancel(skb, nlh); 3531 return -EMSGSIZE; 3532 } 3533 3534 return nlmsg_end(skb, nlh); 3535 } 3536 3537 static int inet6_fill_ifacaddr(struct sk_buff *skb, struct ifacaddr6 *ifaca, 3538 u32 pid, u32 seq, int event, unsigned int flags) 3539 { 3540 struct nlmsghdr *nlh; 3541 u8 scope = RT_SCOPE_UNIVERSE; 3542 int ifindex = ifaca->aca_idev->dev->ifindex; 3543 3544 if (ipv6_addr_scope(&ifaca->aca_addr) & IFA_SITE) 3545 scope = RT_SCOPE_SITE; 3546 3547 nlh = nlmsg_put(skb, pid, seq, event, sizeof(struct ifaddrmsg), flags); 3548 if (nlh == NULL) 3549 return -EMSGSIZE; 3550 3551 put_ifaddrmsg(nlh, 128, IFA_F_PERMANENT, scope, ifindex); 3552 if (nla_put(skb, IFA_ANYCAST, 16, &ifaca->aca_addr) < 0 || 3553 put_cacheinfo(skb, ifaca->aca_cstamp, ifaca->aca_tstamp, 3554 INFINITY_LIFE_TIME, INFINITY_LIFE_TIME) < 0) { 3555 nlmsg_cancel(skb, nlh); 3556 return -EMSGSIZE; 3557 } 3558 3559 return nlmsg_end(skb, nlh); 3560 } 3561 3562 enum addr_type_t { 3563 UNICAST_ADDR, 3564 MULTICAST_ADDR, 3565 ANYCAST_ADDR, 3566 }; 3567 3568 /* called with rcu_read_lock() */ 3569 static int in6_dump_addrs(struct inet6_dev *idev, struct sk_buff *skb, 3570 struct netlink_callback *cb, enum addr_type_t type, 3571 int s_ip_idx, int *p_ip_idx) 3572 { 3573 struct ifmcaddr6 *ifmca; 3574 struct ifacaddr6 *ifaca; 3575 int err = 1; 3576 int ip_idx = *p_ip_idx; 3577 3578 read_lock_bh(&idev->lock); 3579 switch (type) { 3580 case UNICAST_ADDR: { 3581 struct inet6_ifaddr *ifa; 3582 3583 /* unicast address incl. temp addr */ 3584 list_for_each_entry(ifa, &idev->addr_list, if_list) { 3585 if (++ip_idx < s_ip_idx) 3586 continue; 3587 err = inet6_fill_ifaddr(skb, ifa, 3588 NETLINK_CB(cb->skb).pid, 3589 cb->nlh->nlmsg_seq, 3590 RTM_NEWADDR, 3591 NLM_F_MULTI); 3592 if (err <= 0) 3593 break; 3594 } 3595 break; 3596 } 3597 case MULTICAST_ADDR: 3598 /* multicast address */ 3599 for (ifmca = idev->mc_list; ifmca; 3600 ifmca = ifmca->next, ip_idx++) { 3601 if (ip_idx < s_ip_idx) 3602 continue; 3603 err = inet6_fill_ifmcaddr(skb, ifmca, 3604 NETLINK_CB(cb->skb).pid, 3605 cb->nlh->nlmsg_seq, 3606 RTM_GETMULTICAST, 3607 NLM_F_MULTI); 3608 if (err <= 0) 3609 break; 3610 } 3611 break; 3612 case ANYCAST_ADDR: 3613 /* anycast address */ 3614 for (ifaca = idev->ac_list; ifaca; 3615 ifaca = ifaca->aca_next, ip_idx++) { 3616 if (ip_idx < s_ip_idx) 3617 continue; 3618 err = inet6_fill_ifacaddr(skb, ifaca, 3619 NETLINK_CB(cb->skb).pid, 3620 cb->nlh->nlmsg_seq, 3621 RTM_GETANYCAST, 3622 NLM_F_MULTI); 3623 if (err <= 0) 3624 break; 3625 } 3626 break; 3627 default: 3628 break; 3629 } 3630 read_unlock_bh(&idev->lock); 3631 *p_ip_idx = ip_idx; 3632 return err; 3633 } 3634 3635 static int inet6_dump_addr(struct sk_buff *skb, struct netlink_callback *cb, 3636 enum addr_type_t type) 3637 { 3638 struct net *net = sock_net(skb->sk); 3639 int h, s_h; 3640 int idx, ip_idx; 3641 int s_idx, s_ip_idx; 3642 struct net_device *dev; 3643 struct inet6_dev *idev; 3644 struct hlist_head *head; 3645 struct hlist_node *node; 3646 3647 s_h = cb->args[0]; 3648 s_idx = idx = cb->args[1]; 3649 s_ip_idx = ip_idx = cb->args[2]; 3650 3651 rcu_read_lock(); 3652 for (h = s_h; h < NETDEV_HASHENTRIES; h++, s_idx = 0) { 3653 idx = 0; 3654 head = &net->dev_index_head[h]; 3655 hlist_for_each_entry_rcu(dev, node, head, index_hlist) { 3656 if (idx < s_idx) 3657 goto cont; 3658 if (h > s_h || idx > s_idx) 3659 s_ip_idx = 0; 3660 ip_idx = 0; 3661 idev = __in6_dev_get(dev); 3662 if (!idev) 3663 goto cont; 3664 3665 if (in6_dump_addrs(idev, skb, cb, type, 3666 s_ip_idx, &ip_idx) <= 0) 3667 goto done; 3668 cont: 3669 idx++; 3670 } 3671 } 3672 done: 3673 rcu_read_unlock(); 3674 cb->args[0] = h; 3675 cb->args[1] = idx; 3676 cb->args[2] = ip_idx; 3677 3678 return skb->len; 3679 } 3680 3681 static int inet6_dump_ifaddr(struct sk_buff *skb, struct netlink_callback *cb) 3682 { 3683 enum addr_type_t type = UNICAST_ADDR; 3684 3685 return inet6_dump_addr(skb, cb, type); 3686 } 3687 3688 static int inet6_dump_ifmcaddr(struct sk_buff *skb, struct netlink_callback *cb) 3689 { 3690 enum addr_type_t type = MULTICAST_ADDR; 3691 3692 return inet6_dump_addr(skb, cb, type); 3693 } 3694 3695 3696 static int inet6_dump_ifacaddr(struct sk_buff *skb, struct netlink_callback *cb) 3697 { 3698 enum addr_type_t type = ANYCAST_ADDR; 3699 3700 return inet6_dump_addr(skb, cb, type); 3701 } 3702 3703 static int inet6_rtm_getaddr(struct sk_buff *in_skb, struct nlmsghdr* nlh, 3704 void *arg) 3705 { 3706 struct net *net = sock_net(in_skb->sk); 3707 struct ifaddrmsg *ifm; 3708 struct nlattr *tb[IFA_MAX+1]; 3709 struct in6_addr *addr = NULL; 3710 struct net_device *dev = NULL; 3711 struct inet6_ifaddr *ifa; 3712 struct sk_buff *skb; 3713 int err; 3714 3715 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFA_MAX, ifa_ipv6_policy); 3716 if (err < 0) 3717 goto errout; 3718 3719 addr = extract_addr(tb[IFA_ADDRESS], tb[IFA_LOCAL]); 3720 if (addr == NULL) { 3721 err = -EINVAL; 3722 goto errout; 3723 } 3724 3725 ifm = nlmsg_data(nlh); 3726 if (ifm->ifa_index) 3727 dev = __dev_get_by_index(net, ifm->ifa_index); 3728 3729 ifa = ipv6_get_ifaddr(net, addr, dev, 1); 3730 if (!ifa) { 3731 err = -EADDRNOTAVAIL; 3732 goto errout; 3733 } 3734 3735 skb = nlmsg_new(inet6_ifaddr_msgsize(), GFP_KERNEL); 3736 if (!skb) { 3737 err = -ENOBUFS; 3738 goto errout_ifa; 3739 } 3740 3741 err = inet6_fill_ifaddr(skb, ifa, NETLINK_CB(in_skb).pid, 3742 nlh->nlmsg_seq, RTM_NEWADDR, 0); 3743 if (err < 0) { 3744 /* -EMSGSIZE implies BUG in inet6_ifaddr_msgsize() */ 3745 WARN_ON(err == -EMSGSIZE); 3746 kfree_skb(skb); 3747 goto errout_ifa; 3748 } 3749 err = rtnl_unicast(skb, net, NETLINK_CB(in_skb).pid); 3750 errout_ifa: 3751 in6_ifa_put(ifa); 3752 errout: 3753 return err; 3754 } 3755 3756 static void inet6_ifa_notify(int event, struct inet6_ifaddr *ifa) 3757 { 3758 struct sk_buff *skb; 3759 struct net *net = dev_net(ifa->idev->dev); 3760 int err = -ENOBUFS; 3761 3762 skb = nlmsg_new(inet6_ifaddr_msgsize(), GFP_ATOMIC); 3763 if (skb == NULL) 3764 goto errout; 3765 3766 err = inet6_fill_ifaddr(skb, ifa, 0, 0, event, 0); 3767 if (err < 0) { 3768 /* -EMSGSIZE implies BUG in inet6_ifaddr_msgsize() */ 3769 WARN_ON(err == -EMSGSIZE); 3770 kfree_skb(skb); 3771 goto errout; 3772 } 3773 rtnl_notify(skb, net, 0, RTNLGRP_IPV6_IFADDR, NULL, GFP_ATOMIC); 3774 return; 3775 errout: 3776 if (err < 0) 3777 rtnl_set_sk_err(net, RTNLGRP_IPV6_IFADDR, err); 3778 } 3779 3780 static inline void ipv6_store_devconf(struct ipv6_devconf *cnf, 3781 __s32 *array, int bytes) 3782 { 3783 BUG_ON(bytes < (DEVCONF_MAX * 4)); 3784 3785 memset(array, 0, bytes); 3786 array[DEVCONF_FORWARDING] = cnf->forwarding; 3787 array[DEVCONF_HOPLIMIT] = cnf->hop_limit; 3788 array[DEVCONF_MTU6] = cnf->mtu6; 3789 array[DEVCONF_ACCEPT_RA] = cnf->accept_ra; 3790 array[DEVCONF_ACCEPT_REDIRECTS] = cnf->accept_redirects; 3791 array[DEVCONF_AUTOCONF] = cnf->autoconf; 3792 array[DEVCONF_DAD_TRANSMITS] = cnf->dad_transmits; 3793 array[DEVCONF_RTR_SOLICITS] = cnf->rtr_solicits; 3794 array[DEVCONF_RTR_SOLICIT_INTERVAL] = cnf->rtr_solicit_interval; 3795 array[DEVCONF_RTR_SOLICIT_DELAY] = cnf->rtr_solicit_delay; 3796 array[DEVCONF_FORCE_MLD_VERSION] = cnf->force_mld_version; 3797 #ifdef CONFIG_IPV6_PRIVACY 3798 array[DEVCONF_USE_TEMPADDR] = cnf->use_tempaddr; 3799 array[DEVCONF_TEMP_VALID_LFT] = cnf->temp_valid_lft; 3800 array[DEVCONF_TEMP_PREFERED_LFT] = cnf->temp_prefered_lft; 3801 array[DEVCONF_REGEN_MAX_RETRY] = cnf->regen_max_retry; 3802 array[DEVCONF_MAX_DESYNC_FACTOR] = cnf->max_desync_factor; 3803 #endif 3804 array[DEVCONF_MAX_ADDRESSES] = cnf->max_addresses; 3805 array[DEVCONF_ACCEPT_RA_DEFRTR] = cnf->accept_ra_defrtr; 3806 array[DEVCONF_ACCEPT_RA_PINFO] = cnf->accept_ra_pinfo; 3807 #ifdef CONFIG_IPV6_ROUTER_PREF 3808 array[DEVCONF_ACCEPT_RA_RTR_PREF] = cnf->accept_ra_rtr_pref; 3809 array[DEVCONF_RTR_PROBE_INTERVAL] = cnf->rtr_probe_interval; 3810 #ifdef CONFIG_IPV6_ROUTE_INFO 3811 array[DEVCONF_ACCEPT_RA_RT_INFO_MAX_PLEN] = cnf->accept_ra_rt_info_max_plen; 3812 #endif 3813 #endif 3814 array[DEVCONF_PROXY_NDP] = cnf->proxy_ndp; 3815 array[DEVCONF_ACCEPT_SOURCE_ROUTE] = cnf->accept_source_route; 3816 #ifdef CONFIG_IPV6_OPTIMISTIC_DAD 3817 array[DEVCONF_OPTIMISTIC_DAD] = cnf->optimistic_dad; 3818 #endif 3819 #ifdef CONFIG_IPV6_MROUTE 3820 array[DEVCONF_MC_FORWARDING] = cnf->mc_forwarding; 3821 #endif 3822 array[DEVCONF_DISABLE_IPV6] = cnf->disable_ipv6; 3823 array[DEVCONF_ACCEPT_DAD] = cnf->accept_dad; 3824 array[DEVCONF_FORCE_TLLAO] = cnf->force_tllao; 3825 } 3826 3827 static inline size_t inet6_if_nlmsg_size(void) 3828 { 3829 return NLMSG_ALIGN(sizeof(struct ifinfomsg)) 3830 + nla_total_size(IFNAMSIZ) /* IFLA_IFNAME */ 3831 + nla_total_size(MAX_ADDR_LEN) /* IFLA_ADDRESS */ 3832 + nla_total_size(4) /* IFLA_MTU */ 3833 + nla_total_size(4) /* IFLA_LINK */ 3834 + nla_total_size( /* IFLA_PROTINFO */ 3835 nla_total_size(4) /* IFLA_INET6_FLAGS */ 3836 + nla_total_size(sizeof(struct ifla_cacheinfo)) 3837 + nla_total_size(DEVCONF_MAX * 4) /* IFLA_INET6_CONF */ 3838 + nla_total_size(IPSTATS_MIB_MAX * 8) /* IFLA_INET6_STATS */ 3839 + nla_total_size(ICMP6_MIB_MAX * 8) /* IFLA_INET6_ICMP6STATS */ 3840 ); 3841 } 3842 3843 static inline void __snmp6_fill_stats(u64 *stats, void __percpu **mib, 3844 int items, int bytes) 3845 { 3846 int i; 3847 int pad = bytes - sizeof(u64) * items; 3848 BUG_ON(pad < 0); 3849 3850 /* Use put_unaligned() because stats may not be aligned for u64. */ 3851 put_unaligned(items, &stats[0]); 3852 for (i = 1; i < items; i++) 3853 put_unaligned(snmp_fold_field(mib, i), &stats[i]); 3854 3855 memset(&stats[items], 0, pad); 3856 } 3857 3858 static void snmp6_fill_stats(u64 *stats, struct inet6_dev *idev, int attrtype, 3859 int bytes) 3860 { 3861 switch (attrtype) { 3862 case IFLA_INET6_STATS: 3863 __snmp6_fill_stats(stats, (void __percpu **)idev->stats.ipv6, IPSTATS_MIB_MAX, bytes); 3864 break; 3865 case IFLA_INET6_ICMP6STATS: 3866 __snmp6_fill_stats(stats, (void __percpu **)idev->stats.icmpv6, ICMP6_MIB_MAX, bytes); 3867 break; 3868 } 3869 } 3870 3871 static int inet6_fill_ifinfo(struct sk_buff *skb, struct inet6_dev *idev, 3872 u32 pid, u32 seq, int event, unsigned int flags) 3873 { 3874 struct net_device *dev = idev->dev; 3875 struct nlattr *nla; 3876 struct ifinfomsg *hdr; 3877 struct nlmsghdr *nlh; 3878 void *protoinfo; 3879 struct ifla_cacheinfo ci; 3880 3881 nlh = nlmsg_put(skb, pid, seq, event, sizeof(*hdr), flags); 3882 if (nlh == NULL) 3883 return -EMSGSIZE; 3884 3885 hdr = nlmsg_data(nlh); 3886 hdr->ifi_family = AF_INET6; 3887 hdr->__ifi_pad = 0; 3888 hdr->ifi_type = dev->type; 3889 hdr->ifi_index = dev->ifindex; 3890 hdr->ifi_flags = dev_get_flags(dev); 3891 hdr->ifi_change = 0; 3892 3893 NLA_PUT_STRING(skb, IFLA_IFNAME, dev->name); 3894 3895 if (dev->addr_len) 3896 NLA_PUT(skb, IFLA_ADDRESS, dev->addr_len, dev->dev_addr); 3897 3898 NLA_PUT_U32(skb, IFLA_MTU, dev->mtu); 3899 if (dev->ifindex != dev->iflink) 3900 NLA_PUT_U32(skb, IFLA_LINK, dev->iflink); 3901 3902 protoinfo = nla_nest_start(skb, IFLA_PROTINFO); 3903 if (protoinfo == NULL) 3904 goto nla_put_failure; 3905 3906 NLA_PUT_U32(skb, IFLA_INET6_FLAGS, idev->if_flags); 3907 3908 ci.max_reasm_len = IPV6_MAXPLEN; 3909 ci.tstamp = (__u32)(TIME_DELTA(idev->tstamp, INITIAL_JIFFIES) / HZ * 100 3910 + TIME_DELTA(idev->tstamp, INITIAL_JIFFIES) % HZ * 100 / HZ); 3911 ci.reachable_time = idev->nd_parms->reachable_time; 3912 ci.retrans_time = idev->nd_parms->retrans_time; 3913 NLA_PUT(skb, IFLA_INET6_CACHEINFO, sizeof(ci), &ci); 3914 3915 nla = nla_reserve(skb, IFLA_INET6_CONF, DEVCONF_MAX * sizeof(s32)); 3916 if (nla == NULL) 3917 goto nla_put_failure; 3918 ipv6_store_devconf(&idev->cnf, nla_data(nla), nla_len(nla)); 3919 3920 /* XXX - MC not implemented */ 3921 3922 nla = nla_reserve(skb, IFLA_INET6_STATS, IPSTATS_MIB_MAX * sizeof(u64)); 3923 if (nla == NULL) 3924 goto nla_put_failure; 3925 snmp6_fill_stats(nla_data(nla), idev, IFLA_INET6_STATS, nla_len(nla)); 3926 3927 nla = nla_reserve(skb, IFLA_INET6_ICMP6STATS, ICMP6_MIB_MAX * sizeof(u64)); 3928 if (nla == NULL) 3929 goto nla_put_failure; 3930 snmp6_fill_stats(nla_data(nla), idev, IFLA_INET6_ICMP6STATS, nla_len(nla)); 3931 3932 nla_nest_end(skb, protoinfo); 3933 return nlmsg_end(skb, nlh); 3934 3935 nla_put_failure: 3936 nlmsg_cancel(skb, nlh); 3937 return -EMSGSIZE; 3938 } 3939 3940 static int inet6_dump_ifinfo(struct sk_buff *skb, struct netlink_callback *cb) 3941 { 3942 struct net *net = sock_net(skb->sk); 3943 int h, s_h; 3944 int idx = 0, s_idx; 3945 struct net_device *dev; 3946 struct inet6_dev *idev; 3947 struct hlist_head *head; 3948 struct hlist_node *node; 3949 3950 s_h = cb->args[0]; 3951 s_idx = cb->args[1]; 3952 3953 rcu_read_lock(); 3954 for (h = s_h; h < NETDEV_HASHENTRIES; h++, s_idx = 0) { 3955 idx = 0; 3956 head = &net->dev_index_head[h]; 3957 hlist_for_each_entry_rcu(dev, node, head, index_hlist) { 3958 if (idx < s_idx) 3959 goto cont; 3960 idev = __in6_dev_get(dev); 3961 if (!idev) 3962 goto cont; 3963 if (inet6_fill_ifinfo(skb, idev, 3964 NETLINK_CB(cb->skb).pid, 3965 cb->nlh->nlmsg_seq, 3966 RTM_NEWLINK, NLM_F_MULTI) <= 0) 3967 goto out; 3968 cont: 3969 idx++; 3970 } 3971 } 3972 out: 3973 rcu_read_unlock(); 3974 cb->args[1] = idx; 3975 cb->args[0] = h; 3976 3977 return skb->len; 3978 } 3979 3980 void inet6_ifinfo_notify(int event, struct inet6_dev *idev) 3981 { 3982 struct sk_buff *skb; 3983 struct net *net = dev_net(idev->dev); 3984 int err = -ENOBUFS; 3985 3986 skb = nlmsg_new(inet6_if_nlmsg_size(), GFP_ATOMIC); 3987 if (skb == NULL) 3988 goto errout; 3989 3990 err = inet6_fill_ifinfo(skb, idev, 0, 0, event, 0); 3991 if (err < 0) { 3992 /* -EMSGSIZE implies BUG in inet6_if_nlmsg_size() */ 3993 WARN_ON(err == -EMSGSIZE); 3994 kfree_skb(skb); 3995 goto errout; 3996 } 3997 rtnl_notify(skb, net, 0, RTNLGRP_IPV6_IFADDR, NULL, GFP_ATOMIC); 3998 return; 3999 errout: 4000 if (err < 0) 4001 rtnl_set_sk_err(net, RTNLGRP_IPV6_IFADDR, err); 4002 } 4003 4004 static inline size_t inet6_prefix_nlmsg_size(void) 4005 { 4006 return NLMSG_ALIGN(sizeof(struct prefixmsg)) 4007 + nla_total_size(sizeof(struct in6_addr)) 4008 + nla_total_size(sizeof(struct prefix_cacheinfo)); 4009 } 4010 4011 static int inet6_fill_prefix(struct sk_buff *skb, struct inet6_dev *idev, 4012 struct prefix_info *pinfo, u32 pid, u32 seq, 4013 int event, unsigned int flags) 4014 { 4015 struct prefixmsg *pmsg; 4016 struct nlmsghdr *nlh; 4017 struct prefix_cacheinfo ci; 4018 4019 nlh = nlmsg_put(skb, pid, seq, event, sizeof(*pmsg), flags); 4020 if (nlh == NULL) 4021 return -EMSGSIZE; 4022 4023 pmsg = nlmsg_data(nlh); 4024 pmsg->prefix_family = AF_INET6; 4025 pmsg->prefix_pad1 = 0; 4026 pmsg->prefix_pad2 = 0; 4027 pmsg->prefix_ifindex = idev->dev->ifindex; 4028 pmsg->prefix_len = pinfo->prefix_len; 4029 pmsg->prefix_type = pinfo->type; 4030 pmsg->prefix_pad3 = 0; 4031 pmsg->prefix_flags = 0; 4032 if (pinfo->onlink) 4033 pmsg->prefix_flags |= IF_PREFIX_ONLINK; 4034 if (pinfo->autoconf) 4035 pmsg->prefix_flags |= IF_PREFIX_AUTOCONF; 4036 4037 NLA_PUT(skb, PREFIX_ADDRESS, sizeof(pinfo->prefix), &pinfo->prefix); 4038 4039 ci.preferred_time = ntohl(pinfo->prefered); 4040 ci.valid_time = ntohl(pinfo->valid); 4041 NLA_PUT(skb, PREFIX_CACHEINFO, sizeof(ci), &ci); 4042 4043 return nlmsg_end(skb, nlh); 4044 4045 nla_put_failure: 4046 nlmsg_cancel(skb, nlh); 4047 return -EMSGSIZE; 4048 } 4049 4050 static void inet6_prefix_notify(int event, struct inet6_dev *idev, 4051 struct prefix_info *pinfo) 4052 { 4053 struct sk_buff *skb; 4054 struct net *net = dev_net(idev->dev); 4055 int err = -ENOBUFS; 4056 4057 skb = nlmsg_new(inet6_prefix_nlmsg_size(), GFP_ATOMIC); 4058 if (skb == NULL) 4059 goto errout; 4060 4061 err = inet6_fill_prefix(skb, idev, pinfo, 0, 0, event, 0); 4062 if (err < 0) { 4063 /* -EMSGSIZE implies BUG in inet6_prefix_nlmsg_size() */ 4064 WARN_ON(err == -EMSGSIZE); 4065 kfree_skb(skb); 4066 goto errout; 4067 } 4068 rtnl_notify(skb, net, 0, RTNLGRP_IPV6_PREFIX, NULL, GFP_ATOMIC); 4069 return; 4070 errout: 4071 if (err < 0) 4072 rtnl_set_sk_err(net, RTNLGRP_IPV6_PREFIX, err); 4073 } 4074 4075 static void __ipv6_ifa_notify(int event, struct inet6_ifaddr *ifp) 4076 { 4077 inet6_ifa_notify(event ? : RTM_NEWADDR, ifp); 4078 4079 switch (event) { 4080 case RTM_NEWADDR: 4081 /* 4082 * If the address was optimistic 4083 * we inserted the route at the start of 4084 * our DAD process, so we don't need 4085 * to do it again 4086 */ 4087 if (!(ifp->rt->rt6i_node)) 4088 ip6_ins_rt(ifp->rt); 4089 if (ifp->idev->cnf.forwarding) 4090 addrconf_join_anycast(ifp); 4091 break; 4092 case RTM_DELADDR: 4093 if (ifp->idev->cnf.forwarding) 4094 addrconf_leave_anycast(ifp); 4095 addrconf_leave_solict(ifp->idev, &ifp->addr); 4096 dst_hold(&ifp->rt->u.dst); 4097 4098 if (ifp->state == INET6_IFADDR_STATE_DEAD && 4099 ip6_del_rt(ifp->rt)) 4100 dst_free(&ifp->rt->u.dst); 4101 break; 4102 } 4103 } 4104 4105 static void ipv6_ifa_notify(int event, struct inet6_ifaddr *ifp) 4106 { 4107 rcu_read_lock_bh(); 4108 if (likely(ifp->idev->dead == 0)) 4109 __ipv6_ifa_notify(event, ifp); 4110 rcu_read_unlock_bh(); 4111 } 4112 4113 #ifdef CONFIG_SYSCTL 4114 4115 static 4116 int addrconf_sysctl_forward(ctl_table *ctl, int write, 4117 void __user *buffer, size_t *lenp, loff_t *ppos) 4118 { 4119 int *valp = ctl->data; 4120 int val = *valp; 4121 loff_t pos = *ppos; 4122 int ret; 4123 4124 ret = proc_dointvec(ctl, write, buffer, lenp, ppos); 4125 4126 if (write) 4127 ret = addrconf_fixup_forwarding(ctl, valp, val); 4128 if (ret) 4129 *ppos = pos; 4130 return ret; 4131 } 4132 4133 static void dev_disable_change(struct inet6_dev *idev) 4134 { 4135 if (!idev || !idev->dev) 4136 return; 4137 4138 if (idev->cnf.disable_ipv6) 4139 addrconf_notify(NULL, NETDEV_DOWN, idev->dev); 4140 else 4141 addrconf_notify(NULL, NETDEV_UP, idev->dev); 4142 } 4143 4144 static void addrconf_disable_change(struct net *net, __s32 newf) 4145 { 4146 struct net_device *dev; 4147 struct inet6_dev *idev; 4148 4149 rcu_read_lock(); 4150 for_each_netdev_rcu(net, dev) { 4151 idev = __in6_dev_get(dev); 4152 if (idev) { 4153 int changed = (!idev->cnf.disable_ipv6) ^ (!newf); 4154 idev->cnf.disable_ipv6 = newf; 4155 if (changed) 4156 dev_disable_change(idev); 4157 } 4158 } 4159 rcu_read_unlock(); 4160 } 4161 4162 static int addrconf_disable_ipv6(struct ctl_table *table, int *p, int old) 4163 { 4164 struct net *net; 4165 4166 net = (struct net *)table->extra2; 4167 4168 if (p == &net->ipv6.devconf_dflt->disable_ipv6) 4169 return 0; 4170 4171 if (!rtnl_trylock()) { 4172 /* Restore the original values before restarting */ 4173 *p = old; 4174 return restart_syscall(); 4175 } 4176 4177 if (p == &net->ipv6.devconf_all->disable_ipv6) { 4178 __s32 newf = net->ipv6.devconf_all->disable_ipv6; 4179 net->ipv6.devconf_dflt->disable_ipv6 = newf; 4180 addrconf_disable_change(net, newf); 4181 } else if ((!*p) ^ (!old)) 4182 dev_disable_change((struct inet6_dev *)table->extra1); 4183 4184 rtnl_unlock(); 4185 return 0; 4186 } 4187 4188 static 4189 int addrconf_sysctl_disable(ctl_table *ctl, int write, 4190 void __user *buffer, size_t *lenp, loff_t *ppos) 4191 { 4192 int *valp = ctl->data; 4193 int val = *valp; 4194 loff_t pos = *ppos; 4195 int ret; 4196 4197 ret = proc_dointvec(ctl, write, buffer, lenp, ppos); 4198 4199 if (write) 4200 ret = addrconf_disable_ipv6(ctl, valp, val); 4201 if (ret) 4202 *ppos = pos; 4203 return ret; 4204 } 4205 4206 static struct addrconf_sysctl_table 4207 { 4208 struct ctl_table_header *sysctl_header; 4209 ctl_table addrconf_vars[DEVCONF_MAX+1]; 4210 char *dev_name; 4211 } addrconf_sysctl __read_mostly = { 4212 .sysctl_header = NULL, 4213 .addrconf_vars = { 4214 { 4215 .procname = "forwarding", 4216 .data = &ipv6_devconf.forwarding, 4217 .maxlen = sizeof(int), 4218 .mode = 0644, 4219 .proc_handler = addrconf_sysctl_forward, 4220 }, 4221 { 4222 .procname = "hop_limit", 4223 .data = &ipv6_devconf.hop_limit, 4224 .maxlen = sizeof(int), 4225 .mode = 0644, 4226 .proc_handler = proc_dointvec, 4227 }, 4228 { 4229 .procname = "mtu", 4230 .data = &ipv6_devconf.mtu6, 4231 .maxlen = sizeof(int), 4232 .mode = 0644, 4233 .proc_handler = proc_dointvec, 4234 }, 4235 { 4236 .procname = "accept_ra", 4237 .data = &ipv6_devconf.accept_ra, 4238 .maxlen = sizeof(int), 4239 .mode = 0644, 4240 .proc_handler = proc_dointvec, 4241 }, 4242 { 4243 .procname = "accept_redirects", 4244 .data = &ipv6_devconf.accept_redirects, 4245 .maxlen = sizeof(int), 4246 .mode = 0644, 4247 .proc_handler = proc_dointvec, 4248 }, 4249 { 4250 .procname = "autoconf", 4251 .data = &ipv6_devconf.autoconf, 4252 .maxlen = sizeof(int), 4253 .mode = 0644, 4254 .proc_handler = proc_dointvec, 4255 }, 4256 { 4257 .procname = "dad_transmits", 4258 .data = &ipv6_devconf.dad_transmits, 4259 .maxlen = sizeof(int), 4260 .mode = 0644, 4261 .proc_handler = proc_dointvec, 4262 }, 4263 { 4264 .procname = "router_solicitations", 4265 .data = &ipv6_devconf.rtr_solicits, 4266 .maxlen = sizeof(int), 4267 .mode = 0644, 4268 .proc_handler = proc_dointvec, 4269 }, 4270 { 4271 .procname = "router_solicitation_interval", 4272 .data = &ipv6_devconf.rtr_solicit_interval, 4273 .maxlen = sizeof(int), 4274 .mode = 0644, 4275 .proc_handler = proc_dointvec_jiffies, 4276 }, 4277 { 4278 .procname = "router_solicitation_delay", 4279 .data = &ipv6_devconf.rtr_solicit_delay, 4280 .maxlen = sizeof(int), 4281 .mode = 0644, 4282 .proc_handler = proc_dointvec_jiffies, 4283 }, 4284 { 4285 .procname = "force_mld_version", 4286 .data = &ipv6_devconf.force_mld_version, 4287 .maxlen = sizeof(int), 4288 .mode = 0644, 4289 .proc_handler = proc_dointvec, 4290 }, 4291 #ifdef CONFIG_IPV6_PRIVACY 4292 { 4293 .procname = "use_tempaddr", 4294 .data = &ipv6_devconf.use_tempaddr, 4295 .maxlen = sizeof(int), 4296 .mode = 0644, 4297 .proc_handler = proc_dointvec, 4298 }, 4299 { 4300 .procname = "temp_valid_lft", 4301 .data = &ipv6_devconf.temp_valid_lft, 4302 .maxlen = sizeof(int), 4303 .mode = 0644, 4304 .proc_handler = proc_dointvec, 4305 }, 4306 { 4307 .procname = "temp_prefered_lft", 4308 .data = &ipv6_devconf.temp_prefered_lft, 4309 .maxlen = sizeof(int), 4310 .mode = 0644, 4311 .proc_handler = proc_dointvec, 4312 }, 4313 { 4314 .procname = "regen_max_retry", 4315 .data = &ipv6_devconf.regen_max_retry, 4316 .maxlen = sizeof(int), 4317 .mode = 0644, 4318 .proc_handler = proc_dointvec, 4319 }, 4320 { 4321 .procname = "max_desync_factor", 4322 .data = &ipv6_devconf.max_desync_factor, 4323 .maxlen = sizeof(int), 4324 .mode = 0644, 4325 .proc_handler = proc_dointvec, 4326 }, 4327 #endif 4328 { 4329 .procname = "max_addresses", 4330 .data = &ipv6_devconf.max_addresses, 4331 .maxlen = sizeof(int), 4332 .mode = 0644, 4333 .proc_handler = proc_dointvec, 4334 }, 4335 { 4336 .procname = "accept_ra_defrtr", 4337 .data = &ipv6_devconf.accept_ra_defrtr, 4338 .maxlen = sizeof(int), 4339 .mode = 0644, 4340 .proc_handler = proc_dointvec, 4341 }, 4342 { 4343 .procname = "accept_ra_pinfo", 4344 .data = &ipv6_devconf.accept_ra_pinfo, 4345 .maxlen = sizeof(int), 4346 .mode = 0644, 4347 .proc_handler = proc_dointvec, 4348 }, 4349 #ifdef CONFIG_IPV6_ROUTER_PREF 4350 { 4351 .procname = "accept_ra_rtr_pref", 4352 .data = &ipv6_devconf.accept_ra_rtr_pref, 4353 .maxlen = sizeof(int), 4354 .mode = 0644, 4355 .proc_handler = proc_dointvec, 4356 }, 4357 { 4358 .procname = "router_probe_interval", 4359 .data = &ipv6_devconf.rtr_probe_interval, 4360 .maxlen = sizeof(int), 4361 .mode = 0644, 4362 .proc_handler = proc_dointvec_jiffies, 4363 }, 4364 #ifdef CONFIG_IPV6_ROUTE_INFO 4365 { 4366 .procname = "accept_ra_rt_info_max_plen", 4367 .data = &ipv6_devconf.accept_ra_rt_info_max_plen, 4368 .maxlen = sizeof(int), 4369 .mode = 0644, 4370 .proc_handler = proc_dointvec, 4371 }, 4372 #endif 4373 #endif 4374 { 4375 .procname = "proxy_ndp", 4376 .data = &ipv6_devconf.proxy_ndp, 4377 .maxlen = sizeof(int), 4378 .mode = 0644, 4379 .proc_handler = proc_dointvec, 4380 }, 4381 { 4382 .procname = "accept_source_route", 4383 .data = &ipv6_devconf.accept_source_route, 4384 .maxlen = sizeof(int), 4385 .mode = 0644, 4386 .proc_handler = proc_dointvec, 4387 }, 4388 #ifdef CONFIG_IPV6_OPTIMISTIC_DAD 4389 { 4390 .procname = "optimistic_dad", 4391 .data = &ipv6_devconf.optimistic_dad, 4392 .maxlen = sizeof(int), 4393 .mode = 0644, 4394 .proc_handler = proc_dointvec, 4395 4396 }, 4397 #endif 4398 #ifdef CONFIG_IPV6_MROUTE 4399 { 4400 .procname = "mc_forwarding", 4401 .data = &ipv6_devconf.mc_forwarding, 4402 .maxlen = sizeof(int), 4403 .mode = 0444, 4404 .proc_handler = proc_dointvec, 4405 }, 4406 #endif 4407 { 4408 .procname = "disable_ipv6", 4409 .data = &ipv6_devconf.disable_ipv6, 4410 .maxlen = sizeof(int), 4411 .mode = 0644, 4412 .proc_handler = addrconf_sysctl_disable, 4413 }, 4414 { 4415 .procname = "accept_dad", 4416 .data = &ipv6_devconf.accept_dad, 4417 .maxlen = sizeof(int), 4418 .mode = 0644, 4419 .proc_handler = proc_dointvec, 4420 }, 4421 { 4422 .procname = "force_tllao", 4423 .data = &ipv6_devconf.force_tllao, 4424 .maxlen = sizeof(int), 4425 .mode = 0644, 4426 .proc_handler = proc_dointvec 4427 }, 4428 { 4429 /* sentinel */ 4430 } 4431 }, 4432 }; 4433 4434 static int __addrconf_sysctl_register(struct net *net, char *dev_name, 4435 struct inet6_dev *idev, struct ipv6_devconf *p) 4436 { 4437 int i; 4438 struct addrconf_sysctl_table *t; 4439 4440 #define ADDRCONF_CTL_PATH_DEV 3 4441 4442 struct ctl_path addrconf_ctl_path[] = { 4443 { .procname = "net", }, 4444 { .procname = "ipv6", }, 4445 { .procname = "conf", }, 4446 { /* to be set */ }, 4447 { }, 4448 }; 4449 4450 4451 t = kmemdup(&addrconf_sysctl, sizeof(*t), GFP_KERNEL); 4452 if (t == NULL) 4453 goto out; 4454 4455 for (i = 0; t->addrconf_vars[i].data; i++) { 4456 t->addrconf_vars[i].data += (char *)p - (char *)&ipv6_devconf; 4457 t->addrconf_vars[i].extra1 = idev; /* embedded; no ref */ 4458 t->addrconf_vars[i].extra2 = net; 4459 } 4460 4461 /* 4462 * Make a copy of dev_name, because '.procname' is regarded as const 4463 * by sysctl and we wouldn't want anyone to change it under our feet 4464 * (see SIOCSIFNAME). 4465 */ 4466 t->dev_name = kstrdup(dev_name, GFP_KERNEL); 4467 if (!t->dev_name) 4468 goto free; 4469 4470 addrconf_ctl_path[ADDRCONF_CTL_PATH_DEV].procname = t->dev_name; 4471 4472 t->sysctl_header = register_net_sysctl_table(net, addrconf_ctl_path, 4473 t->addrconf_vars); 4474 if (t->sysctl_header == NULL) 4475 goto free_procname; 4476 4477 p->sysctl = t; 4478 return 0; 4479 4480 free_procname: 4481 kfree(t->dev_name); 4482 free: 4483 kfree(t); 4484 out: 4485 return -ENOBUFS; 4486 } 4487 4488 static void __addrconf_sysctl_unregister(struct ipv6_devconf *p) 4489 { 4490 struct addrconf_sysctl_table *t; 4491 4492 if (p->sysctl == NULL) 4493 return; 4494 4495 t = p->sysctl; 4496 p->sysctl = NULL; 4497 unregister_sysctl_table(t->sysctl_header); 4498 kfree(t->dev_name); 4499 kfree(t); 4500 } 4501 4502 static void addrconf_sysctl_register(struct inet6_dev *idev) 4503 { 4504 neigh_sysctl_register(idev->dev, idev->nd_parms, "ipv6", 4505 &ndisc_ifinfo_sysctl_change); 4506 __addrconf_sysctl_register(dev_net(idev->dev), idev->dev->name, 4507 idev, &idev->cnf); 4508 } 4509 4510 static void addrconf_sysctl_unregister(struct inet6_dev *idev) 4511 { 4512 __addrconf_sysctl_unregister(&idev->cnf); 4513 neigh_sysctl_unregister(idev->nd_parms); 4514 } 4515 4516 4517 #endif 4518 4519 static int __net_init addrconf_init_net(struct net *net) 4520 { 4521 int err; 4522 struct ipv6_devconf *all, *dflt; 4523 4524 err = -ENOMEM; 4525 all = &ipv6_devconf; 4526 dflt = &ipv6_devconf_dflt; 4527 4528 if (!net_eq(net, &init_net)) { 4529 all = kmemdup(all, sizeof(ipv6_devconf), GFP_KERNEL); 4530 if (all == NULL) 4531 goto err_alloc_all; 4532 4533 dflt = kmemdup(dflt, sizeof(ipv6_devconf_dflt), GFP_KERNEL); 4534 if (dflt == NULL) 4535 goto err_alloc_dflt; 4536 } else { 4537 /* these will be inherited by all namespaces */ 4538 dflt->autoconf = ipv6_defaults.autoconf; 4539 dflt->disable_ipv6 = ipv6_defaults.disable_ipv6; 4540 } 4541 4542 net->ipv6.devconf_all = all; 4543 net->ipv6.devconf_dflt = dflt; 4544 4545 #ifdef CONFIG_SYSCTL 4546 err = __addrconf_sysctl_register(net, "all", NULL, all); 4547 if (err < 0) 4548 goto err_reg_all; 4549 4550 err = __addrconf_sysctl_register(net, "default", NULL, dflt); 4551 if (err < 0) 4552 goto err_reg_dflt; 4553 #endif 4554 return 0; 4555 4556 #ifdef CONFIG_SYSCTL 4557 err_reg_dflt: 4558 __addrconf_sysctl_unregister(all); 4559 err_reg_all: 4560 kfree(dflt); 4561 #endif 4562 err_alloc_dflt: 4563 kfree(all); 4564 err_alloc_all: 4565 return err; 4566 } 4567 4568 static void __net_exit addrconf_exit_net(struct net *net) 4569 { 4570 #ifdef CONFIG_SYSCTL 4571 __addrconf_sysctl_unregister(net->ipv6.devconf_dflt); 4572 __addrconf_sysctl_unregister(net->ipv6.devconf_all); 4573 #endif 4574 if (!net_eq(net, &init_net)) { 4575 kfree(net->ipv6.devconf_dflt); 4576 kfree(net->ipv6.devconf_all); 4577 } 4578 } 4579 4580 static struct pernet_operations addrconf_ops = { 4581 .init = addrconf_init_net, 4582 .exit = addrconf_exit_net, 4583 }; 4584 4585 /* 4586 * Device notifier 4587 */ 4588 4589 int register_inet6addr_notifier(struct notifier_block *nb) 4590 { 4591 return atomic_notifier_chain_register(&inet6addr_chain, nb); 4592 } 4593 EXPORT_SYMBOL(register_inet6addr_notifier); 4594 4595 int unregister_inet6addr_notifier(struct notifier_block *nb) 4596 { 4597 return atomic_notifier_chain_unregister(&inet6addr_chain, nb); 4598 } 4599 EXPORT_SYMBOL(unregister_inet6addr_notifier); 4600 4601 /* 4602 * Init / cleanup code 4603 */ 4604 4605 int __init addrconf_init(void) 4606 { 4607 int i, err; 4608 4609 err = ipv6_addr_label_init(); 4610 if (err < 0) { 4611 printk(KERN_CRIT "IPv6 Addrconf:" 4612 " cannot initialize default policy table: %d.\n", err); 4613 return err; 4614 } 4615 4616 register_pernet_subsys(&addrconf_ops); 4617 4618 /* The addrconf netdev notifier requires that loopback_dev 4619 * has it's ipv6 private information allocated and setup 4620 * before it can bring up and give link-local addresses 4621 * to other devices which are up. 4622 * 4623 * Unfortunately, loopback_dev is not necessarily the first 4624 * entry in the global dev_base list of net devices. In fact, 4625 * it is likely to be the very last entry on that list. 4626 * So this causes the notifier registry below to try and 4627 * give link-local addresses to all devices besides loopback_dev 4628 * first, then loopback_dev, which cases all the non-loopback_dev 4629 * devices to fail to get a link-local address. 4630 * 4631 * So, as a temporary fix, allocate the ipv6 structure for 4632 * loopback_dev first by hand. 4633 * Longer term, all of the dependencies ipv6 has upon the loopback 4634 * device and it being up should be removed. 4635 */ 4636 rtnl_lock(); 4637 if (!ipv6_add_dev(init_net.loopback_dev)) 4638 err = -ENOMEM; 4639 rtnl_unlock(); 4640 if (err) 4641 goto errlo; 4642 4643 for (i = 0; i < IN6_ADDR_HSIZE; i++) 4644 INIT_HLIST_HEAD(&inet6_addr_lst[i]); 4645 4646 register_netdevice_notifier(&ipv6_dev_notf); 4647 4648 addrconf_verify(0); 4649 4650 err = __rtnl_register(PF_INET6, RTM_GETLINK, NULL, inet6_dump_ifinfo); 4651 if (err < 0) 4652 goto errout; 4653 4654 /* Only the first call to __rtnl_register can fail */ 4655 __rtnl_register(PF_INET6, RTM_NEWADDR, inet6_rtm_newaddr, NULL); 4656 __rtnl_register(PF_INET6, RTM_DELADDR, inet6_rtm_deladdr, NULL); 4657 __rtnl_register(PF_INET6, RTM_GETADDR, inet6_rtm_getaddr, inet6_dump_ifaddr); 4658 __rtnl_register(PF_INET6, RTM_GETMULTICAST, NULL, inet6_dump_ifmcaddr); 4659 __rtnl_register(PF_INET6, RTM_GETANYCAST, NULL, inet6_dump_ifacaddr); 4660 4661 ipv6_addr_label_rtnl_register(); 4662 4663 return 0; 4664 errout: 4665 unregister_netdevice_notifier(&ipv6_dev_notf); 4666 errlo: 4667 unregister_pernet_subsys(&addrconf_ops); 4668 4669 return err; 4670 } 4671 4672 void addrconf_cleanup(void) 4673 { 4674 struct net_device *dev; 4675 int i; 4676 4677 unregister_netdevice_notifier(&ipv6_dev_notf); 4678 unregister_pernet_subsys(&addrconf_ops); 4679 4680 rtnl_lock(); 4681 4682 /* clean dev list */ 4683 for_each_netdev(&init_net, dev) { 4684 if (__in6_dev_get(dev) == NULL) 4685 continue; 4686 addrconf_ifdown(dev, 1); 4687 } 4688 addrconf_ifdown(init_net.loopback_dev, 2); 4689 4690 /* 4691 * Check hash table. 4692 */ 4693 spin_lock_bh(&addrconf_hash_lock); 4694 for (i = 0; i < IN6_ADDR_HSIZE; i++) 4695 WARN_ON(!hlist_empty(&inet6_addr_lst[i])); 4696 spin_unlock_bh(&addrconf_hash_lock); 4697 4698 del_timer(&addr_chk_timer); 4699 rtnl_unlock(); 4700 } 4701