1 /* 2 * inet_diag.c Module for monitoring INET transport protocols sockets. 3 * 4 * Authors: Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru> 5 * 6 * This program is free software; you can redistribute it and/or 7 * modify it under the terms of the GNU General Public License 8 * as published by the Free Software Foundation; either version 9 * 2 of the License, or (at your option) any later version. 10 */ 11 12 #include <linux/kernel.h> 13 #include <linux/module.h> 14 #include <linux/types.h> 15 #include <linux/fcntl.h> 16 #include <linux/random.h> 17 #include <linux/slab.h> 18 #include <linux/cache.h> 19 #include <linux/init.h> 20 #include <linux/time.h> 21 22 #include <net/icmp.h> 23 #include <net/tcp.h> 24 #include <net/ipv6.h> 25 #include <net/inet_common.h> 26 #include <net/inet_connection_sock.h> 27 #include <net/inet_hashtables.h> 28 #include <net/inet_timewait_sock.h> 29 #include <net/inet6_hashtables.h> 30 #include <net/netlink.h> 31 32 #include <linux/inet.h> 33 #include <linux/stddef.h> 34 35 #include <linux/inet_diag.h> 36 #include <linux/sock_diag.h> 37 38 static const struct inet_diag_handler **inet_diag_table; 39 40 struct inet_diag_entry { 41 __be32 *saddr; 42 __be32 *daddr; 43 u16 sport; 44 u16 dport; 45 u16 family; 46 u16 userlocks; 47 #if IS_ENABLED(CONFIG_IPV6) 48 struct in6_addr saddr_storage; /* for IPv4-mapped-IPv6 addresses */ 49 struct in6_addr daddr_storage; /* for IPv4-mapped-IPv6 addresses */ 50 #endif 51 }; 52 53 static DEFINE_MUTEX(inet_diag_table_mutex); 54 55 static const struct inet_diag_handler *inet_diag_lock_handler(int proto) 56 { 57 if (!inet_diag_table[proto]) 58 request_module("net-pf-%d-proto-%d-type-%d-%d", PF_NETLINK, 59 NETLINK_SOCK_DIAG, AF_INET, proto); 60 61 mutex_lock(&inet_diag_table_mutex); 62 if (!inet_diag_table[proto]) 63 return ERR_PTR(-ENOENT); 64 65 return inet_diag_table[proto]; 66 } 67 68 static inline void inet_diag_unlock_handler( 69 const struct inet_diag_handler *handler) 70 { 71 mutex_unlock(&inet_diag_table_mutex); 72 } 73 74 int inet_sk_diag_fill(struct sock *sk, struct inet_connection_sock *icsk, 75 struct sk_buff *skb, struct inet_diag_req_v2 *req, 76 struct user_namespace *user_ns, 77 u32 portid, u32 seq, u16 nlmsg_flags, 78 const struct nlmsghdr *unlh) 79 { 80 const struct inet_sock *inet = inet_sk(sk); 81 struct inet_diag_msg *r; 82 struct nlmsghdr *nlh; 83 struct nlattr *attr; 84 void *info = NULL; 85 const struct inet_diag_handler *handler; 86 int ext = req->idiag_ext; 87 88 handler = inet_diag_table[req->sdiag_protocol]; 89 BUG_ON(handler == NULL); 90 91 nlh = nlmsg_put(skb, portid, seq, unlh->nlmsg_type, sizeof(*r), 92 nlmsg_flags); 93 if (!nlh) 94 return -EMSGSIZE; 95 96 r = nlmsg_data(nlh); 97 BUG_ON(sk->sk_state == TCP_TIME_WAIT); 98 99 r->idiag_family = sk->sk_family; 100 r->idiag_state = sk->sk_state; 101 r->idiag_timer = 0; 102 r->idiag_retrans = 0; 103 104 r->id.idiag_if = sk->sk_bound_dev_if; 105 sock_diag_save_cookie(sk, r->id.idiag_cookie); 106 107 r->id.idiag_sport = inet->inet_sport; 108 r->id.idiag_dport = inet->inet_dport; 109 110 memset(&r->id.idiag_src, 0, sizeof(r->id.idiag_src)); 111 memset(&r->id.idiag_dst, 0, sizeof(r->id.idiag_dst)); 112 113 r->id.idiag_src[0] = inet->inet_rcv_saddr; 114 r->id.idiag_dst[0] = inet->inet_daddr; 115 116 if (nla_put_u8(skb, INET_DIAG_SHUTDOWN, sk->sk_shutdown)) 117 goto errout; 118 119 /* IPv6 dual-stack sockets use inet->tos for IPv4 connections, 120 * hence this needs to be included regardless of socket family. 121 */ 122 if (ext & (1 << (INET_DIAG_TOS - 1))) 123 if (nla_put_u8(skb, INET_DIAG_TOS, inet->tos) < 0) 124 goto errout; 125 126 #if IS_ENABLED(CONFIG_IPV6) 127 if (r->idiag_family == AF_INET6) { 128 129 *(struct in6_addr *)r->id.idiag_src = sk->sk_v6_rcv_saddr; 130 *(struct in6_addr *)r->id.idiag_dst = sk->sk_v6_daddr; 131 132 if (ext & (1 << (INET_DIAG_TCLASS - 1))) 133 if (nla_put_u8(skb, INET_DIAG_TCLASS, 134 inet6_sk(sk)->tclass) < 0) 135 goto errout; 136 } 137 #endif 138 139 r->idiag_uid = from_kuid_munged(user_ns, sock_i_uid(sk)); 140 r->idiag_inode = sock_i_ino(sk); 141 142 if (ext & (1 << (INET_DIAG_MEMINFO - 1))) { 143 struct inet_diag_meminfo minfo = { 144 .idiag_rmem = sk_rmem_alloc_get(sk), 145 .idiag_wmem = sk->sk_wmem_queued, 146 .idiag_fmem = sk->sk_forward_alloc, 147 .idiag_tmem = sk_wmem_alloc_get(sk), 148 }; 149 150 if (nla_put(skb, INET_DIAG_MEMINFO, sizeof(minfo), &minfo) < 0) 151 goto errout; 152 } 153 154 if (ext & (1 << (INET_DIAG_SKMEMINFO - 1))) 155 if (sock_diag_put_meminfo(sk, skb, INET_DIAG_SKMEMINFO)) 156 goto errout; 157 158 if (icsk == NULL) { 159 handler->idiag_get_info(sk, r, NULL); 160 goto out; 161 } 162 163 #define EXPIRES_IN_MS(tmo) DIV_ROUND_UP((tmo - jiffies) * 1000, HZ) 164 165 if (icsk->icsk_pending == ICSK_TIME_RETRANS || 166 icsk->icsk_pending == ICSK_TIME_EARLY_RETRANS || 167 icsk->icsk_pending == ICSK_TIME_LOSS_PROBE) { 168 r->idiag_timer = 1; 169 r->idiag_retrans = icsk->icsk_retransmits; 170 r->idiag_expires = EXPIRES_IN_MS(icsk->icsk_timeout); 171 } else if (icsk->icsk_pending == ICSK_TIME_PROBE0) { 172 r->idiag_timer = 4; 173 r->idiag_retrans = icsk->icsk_probes_out; 174 r->idiag_expires = EXPIRES_IN_MS(icsk->icsk_timeout); 175 } else if (timer_pending(&sk->sk_timer)) { 176 r->idiag_timer = 2; 177 r->idiag_retrans = icsk->icsk_probes_out; 178 r->idiag_expires = EXPIRES_IN_MS(sk->sk_timer.expires); 179 } else { 180 r->idiag_timer = 0; 181 r->idiag_expires = 0; 182 } 183 #undef EXPIRES_IN_MS 184 185 if (ext & (1 << (INET_DIAG_INFO - 1))) { 186 attr = nla_reserve(skb, INET_DIAG_INFO, 187 sizeof(struct tcp_info)); 188 if (!attr) 189 goto errout; 190 191 info = nla_data(attr); 192 } 193 194 if ((ext & (1 << (INET_DIAG_CONG - 1))) && icsk->icsk_ca_ops) 195 if (nla_put_string(skb, INET_DIAG_CONG, 196 icsk->icsk_ca_ops->name) < 0) 197 goto errout; 198 199 handler->idiag_get_info(sk, r, info); 200 201 if (sk->sk_state < TCP_TIME_WAIT && 202 icsk->icsk_ca_ops && icsk->icsk_ca_ops->get_info) 203 icsk->icsk_ca_ops->get_info(sk, ext, skb); 204 205 out: 206 nlmsg_end(skb, nlh); 207 return 0; 208 209 errout: 210 nlmsg_cancel(skb, nlh); 211 return -EMSGSIZE; 212 } 213 EXPORT_SYMBOL_GPL(inet_sk_diag_fill); 214 215 static int inet_csk_diag_fill(struct sock *sk, 216 struct sk_buff *skb, struct inet_diag_req_v2 *req, 217 struct user_namespace *user_ns, 218 u32 portid, u32 seq, u16 nlmsg_flags, 219 const struct nlmsghdr *unlh) 220 { 221 return inet_sk_diag_fill(sk, inet_csk(sk), 222 skb, req, user_ns, portid, seq, nlmsg_flags, unlh); 223 } 224 225 static int inet_twsk_diag_fill(struct inet_timewait_sock *tw, 226 struct sk_buff *skb, struct inet_diag_req_v2 *req, 227 u32 portid, u32 seq, u16 nlmsg_flags, 228 const struct nlmsghdr *unlh) 229 { 230 s32 tmo; 231 struct inet_diag_msg *r; 232 struct nlmsghdr *nlh; 233 234 nlh = nlmsg_put(skb, portid, seq, unlh->nlmsg_type, sizeof(*r), 235 nlmsg_flags); 236 if (!nlh) 237 return -EMSGSIZE; 238 239 r = nlmsg_data(nlh); 240 BUG_ON(tw->tw_state != TCP_TIME_WAIT); 241 242 tmo = tw->tw_ttd - inet_tw_time_stamp(); 243 if (tmo < 0) 244 tmo = 0; 245 246 r->idiag_family = tw->tw_family; 247 r->idiag_retrans = 0; 248 249 r->id.idiag_if = tw->tw_bound_dev_if; 250 sock_diag_save_cookie(tw, r->id.idiag_cookie); 251 252 r->id.idiag_sport = tw->tw_sport; 253 r->id.idiag_dport = tw->tw_dport; 254 255 memset(&r->id.idiag_src, 0, sizeof(r->id.idiag_src)); 256 memset(&r->id.idiag_dst, 0, sizeof(r->id.idiag_dst)); 257 258 r->id.idiag_src[0] = tw->tw_rcv_saddr; 259 r->id.idiag_dst[0] = tw->tw_daddr; 260 261 r->idiag_state = tw->tw_substate; 262 r->idiag_timer = 3; 263 r->idiag_expires = jiffies_to_msecs(tmo); 264 r->idiag_rqueue = 0; 265 r->idiag_wqueue = 0; 266 r->idiag_uid = 0; 267 r->idiag_inode = 0; 268 #if IS_ENABLED(CONFIG_IPV6) 269 if (tw->tw_family == AF_INET6) { 270 *(struct in6_addr *)r->id.idiag_src = tw->tw_v6_rcv_saddr; 271 *(struct in6_addr *)r->id.idiag_dst = tw->tw_v6_daddr; 272 } 273 #endif 274 275 nlmsg_end(skb, nlh); 276 return 0; 277 } 278 279 static int sk_diag_fill(struct sock *sk, struct sk_buff *skb, 280 struct inet_diag_req_v2 *r, 281 struct user_namespace *user_ns, 282 u32 portid, u32 seq, u16 nlmsg_flags, 283 const struct nlmsghdr *unlh) 284 { 285 if (sk->sk_state == TCP_TIME_WAIT) 286 return inet_twsk_diag_fill(inet_twsk(sk), skb, r, portid, seq, 287 nlmsg_flags, unlh); 288 289 return inet_csk_diag_fill(sk, skb, r, user_ns, portid, seq, 290 nlmsg_flags, unlh); 291 } 292 293 int inet_diag_dump_one_icsk(struct inet_hashinfo *hashinfo, struct sk_buff *in_skb, 294 const struct nlmsghdr *nlh, struct inet_diag_req_v2 *req) 295 { 296 int err; 297 struct sock *sk; 298 struct sk_buff *rep; 299 struct net *net = sock_net(in_skb->sk); 300 301 err = -EINVAL; 302 if (req->sdiag_family == AF_INET) { 303 sk = inet_lookup(net, hashinfo, req->id.idiag_dst[0], 304 req->id.idiag_dport, req->id.idiag_src[0], 305 req->id.idiag_sport, req->id.idiag_if); 306 } 307 #if IS_ENABLED(CONFIG_IPV6) 308 else if (req->sdiag_family == AF_INET6) { 309 sk = inet6_lookup(net, hashinfo, 310 (struct in6_addr *)req->id.idiag_dst, 311 req->id.idiag_dport, 312 (struct in6_addr *)req->id.idiag_src, 313 req->id.idiag_sport, 314 req->id.idiag_if); 315 } 316 #endif 317 else { 318 goto out_nosk; 319 } 320 321 err = -ENOENT; 322 if (sk == NULL) 323 goto out_nosk; 324 325 err = sock_diag_check_cookie(sk, req->id.idiag_cookie); 326 if (err) 327 goto out; 328 329 rep = nlmsg_new(sizeof(struct inet_diag_msg) + 330 sizeof(struct inet_diag_meminfo) + 331 sizeof(struct tcp_info) + 64, GFP_KERNEL); 332 if (!rep) { 333 err = -ENOMEM; 334 goto out; 335 } 336 337 err = sk_diag_fill(sk, rep, req, 338 sk_user_ns(NETLINK_CB(in_skb).sk), 339 NETLINK_CB(in_skb).portid, 340 nlh->nlmsg_seq, 0, nlh); 341 if (err < 0) { 342 WARN_ON(err == -EMSGSIZE); 343 nlmsg_free(rep); 344 goto out; 345 } 346 err = netlink_unicast(net->diag_nlsk, rep, NETLINK_CB(in_skb).portid, 347 MSG_DONTWAIT); 348 if (err > 0) 349 err = 0; 350 351 out: 352 if (sk) 353 sock_gen_put(sk); 354 355 out_nosk: 356 return err; 357 } 358 EXPORT_SYMBOL_GPL(inet_diag_dump_one_icsk); 359 360 static int inet_diag_get_exact(struct sk_buff *in_skb, 361 const struct nlmsghdr *nlh, 362 struct inet_diag_req_v2 *req) 363 { 364 const struct inet_diag_handler *handler; 365 int err; 366 367 handler = inet_diag_lock_handler(req->sdiag_protocol); 368 if (IS_ERR(handler)) 369 err = PTR_ERR(handler); 370 else 371 err = handler->dump_one(in_skb, nlh, req); 372 inet_diag_unlock_handler(handler); 373 374 return err; 375 } 376 377 static int bitstring_match(const __be32 *a1, const __be32 *a2, int bits) 378 { 379 int words = bits >> 5; 380 381 bits &= 0x1f; 382 383 if (words) { 384 if (memcmp(a1, a2, words << 2)) 385 return 0; 386 } 387 if (bits) { 388 __be32 w1, w2; 389 __be32 mask; 390 391 w1 = a1[words]; 392 w2 = a2[words]; 393 394 mask = htonl((0xffffffff) << (32 - bits)); 395 396 if ((w1 ^ w2) & mask) 397 return 0; 398 } 399 400 return 1; 401 } 402 403 404 static int inet_diag_bc_run(const struct nlattr *_bc, 405 const struct inet_diag_entry *entry) 406 { 407 const void *bc = nla_data(_bc); 408 int len = nla_len(_bc); 409 410 while (len > 0) { 411 int yes = 1; 412 const struct inet_diag_bc_op *op = bc; 413 414 switch (op->code) { 415 case INET_DIAG_BC_NOP: 416 break; 417 case INET_DIAG_BC_JMP: 418 yes = 0; 419 break; 420 case INET_DIAG_BC_S_GE: 421 yes = entry->sport >= op[1].no; 422 break; 423 case INET_DIAG_BC_S_LE: 424 yes = entry->sport <= op[1].no; 425 break; 426 case INET_DIAG_BC_D_GE: 427 yes = entry->dport >= op[1].no; 428 break; 429 case INET_DIAG_BC_D_LE: 430 yes = entry->dport <= op[1].no; 431 break; 432 case INET_DIAG_BC_AUTO: 433 yes = !(entry->userlocks & SOCK_BINDPORT_LOCK); 434 break; 435 case INET_DIAG_BC_S_COND: 436 case INET_DIAG_BC_D_COND: { 437 struct inet_diag_hostcond *cond; 438 __be32 *addr; 439 440 cond = (struct inet_diag_hostcond *)(op + 1); 441 if (cond->port != -1 && 442 cond->port != (op->code == INET_DIAG_BC_S_COND ? 443 entry->sport : entry->dport)) { 444 yes = 0; 445 break; 446 } 447 448 if (op->code == INET_DIAG_BC_S_COND) 449 addr = entry->saddr; 450 else 451 addr = entry->daddr; 452 453 if (cond->family != AF_UNSPEC && 454 cond->family != entry->family) { 455 if (entry->family == AF_INET6 && 456 cond->family == AF_INET) { 457 if (addr[0] == 0 && addr[1] == 0 && 458 addr[2] == htonl(0xffff) && 459 bitstring_match(addr + 3, 460 cond->addr, 461 cond->prefix_len)) 462 break; 463 } 464 yes = 0; 465 break; 466 } 467 468 if (cond->prefix_len == 0) 469 break; 470 if (bitstring_match(addr, cond->addr, 471 cond->prefix_len)) 472 break; 473 yes = 0; 474 break; 475 } 476 } 477 478 if (yes) { 479 len -= op->yes; 480 bc += op->yes; 481 } else { 482 len -= op->no; 483 bc += op->no; 484 } 485 } 486 return len == 0; 487 } 488 489 int inet_diag_bc_sk(const struct nlattr *bc, struct sock *sk) 490 { 491 struct inet_diag_entry entry; 492 struct inet_sock *inet = inet_sk(sk); 493 494 if (bc == NULL) 495 return 1; 496 497 entry.family = sk->sk_family; 498 #if IS_ENABLED(CONFIG_IPV6) 499 if (entry.family == AF_INET6) { 500 501 entry.saddr = sk->sk_v6_rcv_saddr.s6_addr32; 502 entry.daddr = sk->sk_v6_daddr.s6_addr32; 503 } else 504 #endif 505 { 506 entry.saddr = &inet->inet_rcv_saddr; 507 entry.daddr = &inet->inet_daddr; 508 } 509 entry.sport = inet->inet_num; 510 entry.dport = ntohs(inet->inet_dport); 511 entry.userlocks = (sk->sk_state != TCP_TIME_WAIT) ? sk->sk_userlocks : 0; 512 513 return inet_diag_bc_run(bc, &entry); 514 } 515 EXPORT_SYMBOL_GPL(inet_diag_bc_sk); 516 517 static int valid_cc(const void *bc, int len, int cc) 518 { 519 while (len >= 0) { 520 const struct inet_diag_bc_op *op = bc; 521 522 if (cc > len) 523 return 0; 524 if (cc == len) 525 return 1; 526 if (op->yes < 4 || op->yes & 3) 527 return 0; 528 len -= op->yes; 529 bc += op->yes; 530 } 531 return 0; 532 } 533 534 /* Validate an inet_diag_hostcond. */ 535 static bool valid_hostcond(const struct inet_diag_bc_op *op, int len, 536 int *min_len) 537 { 538 int addr_len; 539 struct inet_diag_hostcond *cond; 540 541 /* Check hostcond space. */ 542 *min_len += sizeof(struct inet_diag_hostcond); 543 if (len < *min_len) 544 return false; 545 cond = (struct inet_diag_hostcond *)(op + 1); 546 547 /* Check address family and address length. */ 548 switch (cond->family) { 549 case AF_UNSPEC: 550 addr_len = 0; 551 break; 552 case AF_INET: 553 addr_len = sizeof(struct in_addr); 554 break; 555 case AF_INET6: 556 addr_len = sizeof(struct in6_addr); 557 break; 558 default: 559 return false; 560 } 561 *min_len += addr_len; 562 if (len < *min_len) 563 return false; 564 565 /* Check prefix length (in bits) vs address length (in bytes). */ 566 if (cond->prefix_len > 8 * addr_len) 567 return false; 568 569 return true; 570 } 571 572 /* Validate a port comparison operator. */ 573 static inline bool valid_port_comparison(const struct inet_diag_bc_op *op, 574 int len, int *min_len) 575 { 576 /* Port comparisons put the port in a follow-on inet_diag_bc_op. */ 577 *min_len += sizeof(struct inet_diag_bc_op); 578 if (len < *min_len) 579 return false; 580 return true; 581 } 582 583 static int inet_diag_bc_audit(const void *bytecode, int bytecode_len) 584 { 585 const void *bc = bytecode; 586 int len = bytecode_len; 587 588 while (len > 0) { 589 const struct inet_diag_bc_op *op = bc; 590 int min_len = sizeof(struct inet_diag_bc_op); 591 592 //printk("BC: %d %d %d {%d} / %d\n", op->code, op->yes, op->no, op[1].no, len); 593 switch (op->code) { 594 case INET_DIAG_BC_S_COND: 595 case INET_DIAG_BC_D_COND: 596 if (!valid_hostcond(bc, len, &min_len)) 597 return -EINVAL; 598 break; 599 case INET_DIAG_BC_S_GE: 600 case INET_DIAG_BC_S_LE: 601 case INET_DIAG_BC_D_GE: 602 case INET_DIAG_BC_D_LE: 603 if (!valid_port_comparison(bc, len, &min_len)) 604 return -EINVAL; 605 break; 606 case INET_DIAG_BC_AUTO: 607 case INET_DIAG_BC_JMP: 608 case INET_DIAG_BC_NOP: 609 break; 610 default: 611 return -EINVAL; 612 } 613 614 if (op->code != INET_DIAG_BC_NOP) { 615 if (op->no < min_len || op->no > len + 4 || op->no & 3) 616 return -EINVAL; 617 if (op->no < len && 618 !valid_cc(bytecode, bytecode_len, len - op->no)) 619 return -EINVAL; 620 } 621 622 if (op->yes < min_len || op->yes > len + 4 || op->yes & 3) 623 return -EINVAL; 624 bc += op->yes; 625 len -= op->yes; 626 } 627 return len == 0 ? 0 : -EINVAL; 628 } 629 630 static int inet_csk_diag_dump(struct sock *sk, 631 struct sk_buff *skb, 632 struct netlink_callback *cb, 633 struct inet_diag_req_v2 *r, 634 const struct nlattr *bc) 635 { 636 if (!inet_diag_bc_sk(bc, sk)) 637 return 0; 638 639 return inet_csk_diag_fill(sk, skb, r, 640 sk_user_ns(NETLINK_CB(cb->skb).sk), 641 NETLINK_CB(cb->skb).portid, 642 cb->nlh->nlmsg_seq, NLM_F_MULTI, cb->nlh); 643 } 644 645 static void twsk_build_assert(void) 646 { 647 BUILD_BUG_ON(offsetof(struct inet_timewait_sock, tw_family) != 648 offsetof(struct sock, sk_family)); 649 650 BUILD_BUG_ON(offsetof(struct inet_timewait_sock, tw_num) != 651 offsetof(struct inet_sock, inet_num)); 652 653 BUILD_BUG_ON(offsetof(struct inet_timewait_sock, tw_dport) != 654 offsetof(struct inet_sock, inet_dport)); 655 656 BUILD_BUG_ON(offsetof(struct inet_timewait_sock, tw_rcv_saddr) != 657 offsetof(struct inet_sock, inet_rcv_saddr)); 658 659 BUILD_BUG_ON(offsetof(struct inet_timewait_sock, tw_daddr) != 660 offsetof(struct inet_sock, inet_daddr)); 661 662 #if IS_ENABLED(CONFIG_IPV6) 663 BUILD_BUG_ON(offsetof(struct inet_timewait_sock, tw_v6_rcv_saddr) != 664 offsetof(struct sock, sk_v6_rcv_saddr)); 665 666 BUILD_BUG_ON(offsetof(struct inet_timewait_sock, tw_v6_daddr) != 667 offsetof(struct sock, sk_v6_daddr)); 668 #endif 669 } 670 671 static int inet_twsk_diag_dump(struct sock *sk, 672 struct sk_buff *skb, 673 struct netlink_callback *cb, 674 struct inet_diag_req_v2 *r, 675 const struct nlattr *bc) 676 { 677 twsk_build_assert(); 678 679 if (!inet_diag_bc_sk(bc, sk)) 680 return 0; 681 682 return inet_twsk_diag_fill(inet_twsk(sk), skb, r, 683 NETLINK_CB(cb->skb).portid, 684 cb->nlh->nlmsg_seq, NLM_F_MULTI, cb->nlh); 685 } 686 687 /* Get the IPv4, IPv6, or IPv4-mapped-IPv6 local and remote addresses 688 * from a request_sock. For IPv4-mapped-IPv6 we must map IPv4 to IPv6. 689 */ 690 static inline void inet_diag_req_addrs(const struct sock *sk, 691 const struct request_sock *req, 692 struct inet_diag_entry *entry) 693 { 694 struct inet_request_sock *ireq = inet_rsk(req); 695 696 #if IS_ENABLED(CONFIG_IPV6) 697 if (sk->sk_family == AF_INET6) { 698 if (req->rsk_ops->family == AF_INET6) { 699 entry->saddr = ireq->ir_v6_loc_addr.s6_addr32; 700 entry->daddr = ireq->ir_v6_rmt_addr.s6_addr32; 701 } else if (req->rsk_ops->family == AF_INET) { 702 ipv6_addr_set_v4mapped(ireq->ir_loc_addr, 703 &entry->saddr_storage); 704 ipv6_addr_set_v4mapped(ireq->ir_rmt_addr, 705 &entry->daddr_storage); 706 entry->saddr = entry->saddr_storage.s6_addr32; 707 entry->daddr = entry->daddr_storage.s6_addr32; 708 } 709 } else 710 #endif 711 { 712 entry->saddr = &ireq->ir_loc_addr; 713 entry->daddr = &ireq->ir_rmt_addr; 714 } 715 } 716 717 static int inet_diag_fill_req(struct sk_buff *skb, struct sock *sk, 718 struct request_sock *req, 719 struct user_namespace *user_ns, 720 u32 portid, u32 seq, 721 const struct nlmsghdr *unlh) 722 { 723 const struct inet_request_sock *ireq = inet_rsk(req); 724 struct inet_sock *inet = inet_sk(sk); 725 struct inet_diag_msg *r; 726 struct nlmsghdr *nlh; 727 long tmo; 728 729 nlh = nlmsg_put(skb, portid, seq, unlh->nlmsg_type, sizeof(*r), 730 NLM_F_MULTI); 731 if (!nlh) 732 return -EMSGSIZE; 733 734 r = nlmsg_data(nlh); 735 r->idiag_family = sk->sk_family; 736 r->idiag_state = TCP_SYN_RECV; 737 r->idiag_timer = 1; 738 r->idiag_retrans = req->num_retrans; 739 740 r->id.idiag_if = sk->sk_bound_dev_if; 741 sock_diag_save_cookie(req, r->id.idiag_cookie); 742 743 tmo = req->expires - jiffies; 744 if (tmo < 0) 745 tmo = 0; 746 747 r->id.idiag_sport = inet->inet_sport; 748 r->id.idiag_dport = ireq->ir_rmt_port; 749 750 memset(&r->id.idiag_src, 0, sizeof(r->id.idiag_src)); 751 memset(&r->id.idiag_dst, 0, sizeof(r->id.idiag_dst)); 752 753 r->id.idiag_src[0] = ireq->ir_loc_addr; 754 r->id.idiag_dst[0] = ireq->ir_rmt_addr; 755 756 r->idiag_expires = jiffies_to_msecs(tmo); 757 r->idiag_rqueue = 0; 758 r->idiag_wqueue = 0; 759 r->idiag_uid = from_kuid_munged(user_ns, sock_i_uid(sk)); 760 r->idiag_inode = 0; 761 #if IS_ENABLED(CONFIG_IPV6) 762 if (r->idiag_family == AF_INET6) { 763 struct inet_diag_entry entry; 764 inet_diag_req_addrs(sk, req, &entry); 765 memcpy(r->id.idiag_src, entry.saddr, sizeof(struct in6_addr)); 766 memcpy(r->id.idiag_dst, entry.daddr, sizeof(struct in6_addr)); 767 } 768 #endif 769 770 nlmsg_end(skb, nlh); 771 return 0; 772 } 773 774 static int inet_diag_dump_reqs(struct sk_buff *skb, struct sock *sk, 775 struct netlink_callback *cb, 776 struct inet_diag_req_v2 *r, 777 const struct nlattr *bc) 778 { 779 struct inet_diag_entry entry; 780 struct inet_connection_sock *icsk = inet_csk(sk); 781 struct listen_sock *lopt; 782 struct inet_sock *inet = inet_sk(sk); 783 int j, s_j; 784 int reqnum, s_reqnum; 785 int err = 0; 786 787 s_j = cb->args[3]; 788 s_reqnum = cb->args[4]; 789 790 if (s_j > 0) 791 s_j--; 792 793 entry.family = sk->sk_family; 794 795 read_lock_bh(&icsk->icsk_accept_queue.syn_wait_lock); 796 797 lopt = icsk->icsk_accept_queue.listen_opt; 798 if (!lopt || !lopt->qlen) 799 goto out; 800 801 if (bc != NULL) { 802 entry.sport = inet->inet_num; 803 entry.userlocks = sk->sk_userlocks; 804 } 805 806 for (j = s_j; j < lopt->nr_table_entries; j++) { 807 struct request_sock *req, *head = lopt->syn_table[j]; 808 809 reqnum = 0; 810 for (req = head; req; reqnum++, req = req->dl_next) { 811 struct inet_request_sock *ireq = inet_rsk(req); 812 813 if (reqnum < s_reqnum) 814 continue; 815 if (r->id.idiag_dport != ireq->ir_rmt_port && 816 r->id.idiag_dport) 817 continue; 818 819 if (bc) { 820 inet_diag_req_addrs(sk, req, &entry); 821 entry.dport = ntohs(ireq->ir_rmt_port); 822 823 if (!inet_diag_bc_run(bc, &entry)) 824 continue; 825 } 826 827 err = inet_diag_fill_req(skb, sk, req, 828 sk_user_ns(NETLINK_CB(cb->skb).sk), 829 NETLINK_CB(cb->skb).portid, 830 cb->nlh->nlmsg_seq, cb->nlh); 831 if (err < 0) { 832 cb->args[3] = j + 1; 833 cb->args[4] = reqnum; 834 goto out; 835 } 836 } 837 838 s_reqnum = 0; 839 } 840 841 out: 842 read_unlock_bh(&icsk->icsk_accept_queue.syn_wait_lock); 843 844 return err; 845 } 846 847 void inet_diag_dump_icsk(struct inet_hashinfo *hashinfo, struct sk_buff *skb, 848 struct netlink_callback *cb, struct inet_diag_req_v2 *r, struct nlattr *bc) 849 { 850 int i, num; 851 int s_i, s_num; 852 struct net *net = sock_net(skb->sk); 853 854 s_i = cb->args[1]; 855 s_num = num = cb->args[2]; 856 857 if (cb->args[0] == 0) { 858 if (!(r->idiag_states & (TCPF_LISTEN | TCPF_SYN_RECV))) 859 goto skip_listen_ht; 860 861 for (i = s_i; i < INET_LHTABLE_SIZE; i++) { 862 struct sock *sk; 863 struct hlist_nulls_node *node; 864 struct inet_listen_hashbucket *ilb; 865 866 num = 0; 867 ilb = &hashinfo->listening_hash[i]; 868 spin_lock_bh(&ilb->lock); 869 sk_nulls_for_each(sk, node, &ilb->head) { 870 struct inet_sock *inet = inet_sk(sk); 871 872 if (!net_eq(sock_net(sk), net)) 873 continue; 874 875 if (num < s_num) { 876 num++; 877 continue; 878 } 879 880 if (r->sdiag_family != AF_UNSPEC && 881 sk->sk_family != r->sdiag_family) 882 goto next_listen; 883 884 if (r->id.idiag_sport != inet->inet_sport && 885 r->id.idiag_sport) 886 goto next_listen; 887 888 if (!(r->idiag_states & TCPF_LISTEN) || 889 r->id.idiag_dport || 890 cb->args[3] > 0) 891 goto syn_recv; 892 893 if (inet_csk_diag_dump(sk, skb, cb, r, bc) < 0) { 894 spin_unlock_bh(&ilb->lock); 895 goto done; 896 } 897 898 syn_recv: 899 if (!(r->idiag_states & TCPF_SYN_RECV)) 900 goto next_listen; 901 902 if (inet_diag_dump_reqs(skb, sk, cb, r, bc) < 0) { 903 spin_unlock_bh(&ilb->lock); 904 goto done; 905 } 906 907 next_listen: 908 cb->args[3] = 0; 909 cb->args[4] = 0; 910 ++num; 911 } 912 spin_unlock_bh(&ilb->lock); 913 914 s_num = 0; 915 cb->args[3] = 0; 916 cb->args[4] = 0; 917 } 918 skip_listen_ht: 919 cb->args[0] = 1; 920 s_i = num = s_num = 0; 921 } 922 923 if (!(r->idiag_states & ~(TCPF_LISTEN | TCPF_SYN_RECV))) 924 goto out; 925 926 for (i = s_i; i <= hashinfo->ehash_mask; i++) { 927 struct inet_ehash_bucket *head = &hashinfo->ehash[i]; 928 spinlock_t *lock = inet_ehash_lockp(hashinfo, i); 929 struct sock *sk; 930 struct hlist_nulls_node *node; 931 932 num = 0; 933 934 if (hlist_nulls_empty(&head->chain)) 935 continue; 936 937 if (i > s_i) 938 s_num = 0; 939 940 spin_lock_bh(lock); 941 sk_nulls_for_each(sk, node, &head->chain) { 942 int res; 943 int state; 944 945 if (!net_eq(sock_net(sk), net)) 946 continue; 947 if (num < s_num) 948 goto next_normal; 949 state = (sk->sk_state == TCP_TIME_WAIT) ? 950 inet_twsk(sk)->tw_substate : sk->sk_state; 951 if (!(r->idiag_states & (1 << state))) 952 goto next_normal; 953 if (r->sdiag_family != AF_UNSPEC && 954 sk->sk_family != r->sdiag_family) 955 goto next_normal; 956 if (r->id.idiag_sport != htons(sk->sk_num) && 957 r->id.idiag_sport) 958 goto next_normal; 959 if (r->id.idiag_dport != sk->sk_dport && 960 r->id.idiag_dport) 961 goto next_normal; 962 if (sk->sk_state == TCP_TIME_WAIT) 963 res = inet_twsk_diag_dump(sk, skb, cb, r, bc); 964 else 965 res = inet_csk_diag_dump(sk, skb, cb, r, bc); 966 if (res < 0) { 967 spin_unlock_bh(lock); 968 goto done; 969 } 970 next_normal: 971 ++num; 972 } 973 974 spin_unlock_bh(lock); 975 } 976 977 done: 978 cb->args[1] = i; 979 cb->args[2] = num; 980 out: 981 ; 982 } 983 EXPORT_SYMBOL_GPL(inet_diag_dump_icsk); 984 985 static int __inet_diag_dump(struct sk_buff *skb, struct netlink_callback *cb, 986 struct inet_diag_req_v2 *r, struct nlattr *bc) 987 { 988 const struct inet_diag_handler *handler; 989 int err = 0; 990 991 handler = inet_diag_lock_handler(r->sdiag_protocol); 992 if (!IS_ERR(handler)) 993 handler->dump(skb, cb, r, bc); 994 else 995 err = PTR_ERR(handler); 996 inet_diag_unlock_handler(handler); 997 998 return err ? : skb->len; 999 } 1000 1001 static int inet_diag_dump(struct sk_buff *skb, struct netlink_callback *cb) 1002 { 1003 struct nlattr *bc = NULL; 1004 int hdrlen = sizeof(struct inet_diag_req_v2); 1005 1006 if (nlmsg_attrlen(cb->nlh, hdrlen)) 1007 bc = nlmsg_find_attr(cb->nlh, hdrlen, INET_DIAG_REQ_BYTECODE); 1008 1009 return __inet_diag_dump(skb, cb, nlmsg_data(cb->nlh), bc); 1010 } 1011 1012 static inline int inet_diag_type2proto(int type) 1013 { 1014 switch (type) { 1015 case TCPDIAG_GETSOCK: 1016 return IPPROTO_TCP; 1017 case DCCPDIAG_GETSOCK: 1018 return IPPROTO_DCCP; 1019 default: 1020 return 0; 1021 } 1022 } 1023 1024 static int inet_diag_dump_compat(struct sk_buff *skb, struct netlink_callback *cb) 1025 { 1026 struct inet_diag_req *rc = nlmsg_data(cb->nlh); 1027 struct inet_diag_req_v2 req; 1028 struct nlattr *bc = NULL; 1029 int hdrlen = sizeof(struct inet_diag_req); 1030 1031 req.sdiag_family = AF_UNSPEC; /* compatibility */ 1032 req.sdiag_protocol = inet_diag_type2proto(cb->nlh->nlmsg_type); 1033 req.idiag_ext = rc->idiag_ext; 1034 req.idiag_states = rc->idiag_states; 1035 req.id = rc->id; 1036 1037 if (nlmsg_attrlen(cb->nlh, hdrlen)) 1038 bc = nlmsg_find_attr(cb->nlh, hdrlen, INET_DIAG_REQ_BYTECODE); 1039 1040 return __inet_diag_dump(skb, cb, &req, bc); 1041 } 1042 1043 static int inet_diag_get_exact_compat(struct sk_buff *in_skb, 1044 const struct nlmsghdr *nlh) 1045 { 1046 struct inet_diag_req *rc = nlmsg_data(nlh); 1047 struct inet_diag_req_v2 req; 1048 1049 req.sdiag_family = rc->idiag_family; 1050 req.sdiag_protocol = inet_diag_type2proto(nlh->nlmsg_type); 1051 req.idiag_ext = rc->idiag_ext; 1052 req.idiag_states = rc->idiag_states; 1053 req.id = rc->id; 1054 1055 return inet_diag_get_exact(in_skb, nlh, &req); 1056 } 1057 1058 static int inet_diag_rcv_msg_compat(struct sk_buff *skb, struct nlmsghdr *nlh) 1059 { 1060 int hdrlen = sizeof(struct inet_diag_req); 1061 struct net *net = sock_net(skb->sk); 1062 1063 if (nlh->nlmsg_type >= INET_DIAG_GETSOCK_MAX || 1064 nlmsg_len(nlh) < hdrlen) 1065 return -EINVAL; 1066 1067 if (nlh->nlmsg_flags & NLM_F_DUMP) { 1068 if (nlmsg_attrlen(nlh, hdrlen)) { 1069 struct nlattr *attr; 1070 1071 attr = nlmsg_find_attr(nlh, hdrlen, 1072 INET_DIAG_REQ_BYTECODE); 1073 if (attr == NULL || 1074 nla_len(attr) < sizeof(struct inet_diag_bc_op) || 1075 inet_diag_bc_audit(nla_data(attr), nla_len(attr))) 1076 return -EINVAL; 1077 } 1078 { 1079 struct netlink_dump_control c = { 1080 .dump = inet_diag_dump_compat, 1081 }; 1082 return netlink_dump_start(net->diag_nlsk, skb, nlh, &c); 1083 } 1084 } 1085 1086 return inet_diag_get_exact_compat(skb, nlh); 1087 } 1088 1089 static int inet_diag_handler_dump(struct sk_buff *skb, struct nlmsghdr *h) 1090 { 1091 int hdrlen = sizeof(struct inet_diag_req_v2); 1092 struct net *net = sock_net(skb->sk); 1093 1094 if (nlmsg_len(h) < hdrlen) 1095 return -EINVAL; 1096 1097 if (h->nlmsg_flags & NLM_F_DUMP) { 1098 if (nlmsg_attrlen(h, hdrlen)) { 1099 struct nlattr *attr; 1100 attr = nlmsg_find_attr(h, hdrlen, 1101 INET_DIAG_REQ_BYTECODE); 1102 if (attr == NULL || 1103 nla_len(attr) < sizeof(struct inet_diag_bc_op) || 1104 inet_diag_bc_audit(nla_data(attr), nla_len(attr))) 1105 return -EINVAL; 1106 } 1107 { 1108 struct netlink_dump_control c = { 1109 .dump = inet_diag_dump, 1110 }; 1111 return netlink_dump_start(net->diag_nlsk, skb, h, &c); 1112 } 1113 } 1114 1115 return inet_diag_get_exact(skb, h, nlmsg_data(h)); 1116 } 1117 1118 static const struct sock_diag_handler inet_diag_handler = { 1119 .family = AF_INET, 1120 .dump = inet_diag_handler_dump, 1121 }; 1122 1123 static const struct sock_diag_handler inet6_diag_handler = { 1124 .family = AF_INET6, 1125 .dump = inet_diag_handler_dump, 1126 }; 1127 1128 int inet_diag_register(const struct inet_diag_handler *h) 1129 { 1130 const __u16 type = h->idiag_type; 1131 int err = -EINVAL; 1132 1133 if (type >= IPPROTO_MAX) 1134 goto out; 1135 1136 mutex_lock(&inet_diag_table_mutex); 1137 err = -EEXIST; 1138 if (inet_diag_table[type] == NULL) { 1139 inet_diag_table[type] = h; 1140 err = 0; 1141 } 1142 mutex_unlock(&inet_diag_table_mutex); 1143 out: 1144 return err; 1145 } 1146 EXPORT_SYMBOL_GPL(inet_diag_register); 1147 1148 void inet_diag_unregister(const struct inet_diag_handler *h) 1149 { 1150 const __u16 type = h->idiag_type; 1151 1152 if (type >= IPPROTO_MAX) 1153 return; 1154 1155 mutex_lock(&inet_diag_table_mutex); 1156 inet_diag_table[type] = NULL; 1157 mutex_unlock(&inet_diag_table_mutex); 1158 } 1159 EXPORT_SYMBOL_GPL(inet_diag_unregister); 1160 1161 static int __init inet_diag_init(void) 1162 { 1163 const int inet_diag_table_size = (IPPROTO_MAX * 1164 sizeof(struct inet_diag_handler *)); 1165 int err = -ENOMEM; 1166 1167 inet_diag_table = kzalloc(inet_diag_table_size, GFP_KERNEL); 1168 if (!inet_diag_table) 1169 goto out; 1170 1171 err = sock_diag_register(&inet_diag_handler); 1172 if (err) 1173 goto out_free_nl; 1174 1175 err = sock_diag_register(&inet6_diag_handler); 1176 if (err) 1177 goto out_free_inet; 1178 1179 sock_diag_register_inet_compat(inet_diag_rcv_msg_compat); 1180 out: 1181 return err; 1182 1183 out_free_inet: 1184 sock_diag_unregister(&inet_diag_handler); 1185 out_free_nl: 1186 kfree(inet_diag_table); 1187 goto out; 1188 } 1189 1190 static void __exit inet_diag_exit(void) 1191 { 1192 sock_diag_unregister(&inet6_diag_handler); 1193 sock_diag_unregister(&inet_diag_handler); 1194 sock_diag_unregister_inet_compat(inet_diag_rcv_msg_compat); 1195 kfree(inet_diag_table); 1196 } 1197 1198 module_init(inet_diag_init); 1199 module_exit(inet_diag_exit); 1200 MODULE_LICENSE("GPL"); 1201 MODULE_ALIAS_NET_PF_PROTO_TYPE(PF_NETLINK, NETLINK_SOCK_DIAG, 2 /* AF_INET */); 1202 MODULE_ALIAS_NET_PF_PROTO_TYPE(PF_NETLINK, NETLINK_SOCK_DIAG, 10 /* AF_INET6 */); 1203