1 /* incoming call handling 2 * 3 * Copyright (C) 2007 Red Hat, Inc. All Rights Reserved. 4 * Written by David Howells (dhowells@redhat.com) 5 * 6 * This program is free software; you can redistribute it and/or 7 * modify it under the terms of the GNU General Public License 8 * as published by the Free Software Foundation; either version 9 * 2 of the License, or (at your option) any later version. 10 */ 11 12 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt 13 14 #include <linux/module.h> 15 #include <linux/net.h> 16 #include <linux/skbuff.h> 17 #include <linux/errqueue.h> 18 #include <linux/udp.h> 19 #include <linux/in.h> 20 #include <linux/in6.h> 21 #include <linux/icmp.h> 22 #include <linux/gfp.h> 23 #include <linux/circ_buf.h> 24 #include <net/sock.h> 25 #include <net/af_rxrpc.h> 26 #include <net/ip.h> 27 #include "ar-internal.h" 28 29 /* 30 * Preallocate a single service call, connection and peer and, if possible, 31 * give them a user ID and attach the user's side of the ID to them. 32 */ 33 static int rxrpc_service_prealloc_one(struct rxrpc_sock *rx, 34 struct rxrpc_backlog *b, 35 rxrpc_notify_rx_t notify_rx, 36 rxrpc_user_attach_call_t user_attach_call, 37 unsigned long user_call_ID, gfp_t gfp) 38 { 39 const void *here = __builtin_return_address(0); 40 struct rxrpc_call *call; 41 int max, tmp; 42 unsigned int size = RXRPC_BACKLOG_MAX; 43 unsigned int head, tail, call_head, call_tail; 44 45 max = rx->sk.sk_max_ack_backlog; 46 tmp = rx->sk.sk_ack_backlog; 47 if (tmp >= max) { 48 _leave(" = -ENOBUFS [full %u]", max); 49 return -ENOBUFS; 50 } 51 max -= tmp; 52 53 /* We don't need more conns and peers than we have calls, but on the 54 * other hand, we shouldn't ever use more peers than conns or conns 55 * than calls. 56 */ 57 call_head = b->call_backlog_head; 58 call_tail = READ_ONCE(b->call_backlog_tail); 59 tmp = CIRC_CNT(call_head, call_tail, size); 60 if (tmp >= max) { 61 _leave(" = -ENOBUFS [enough %u]", tmp); 62 return -ENOBUFS; 63 } 64 max = tmp + 1; 65 66 head = b->peer_backlog_head; 67 tail = READ_ONCE(b->peer_backlog_tail); 68 if (CIRC_CNT(head, tail, size) < max) { 69 struct rxrpc_peer *peer = rxrpc_alloc_peer(rx->local, gfp); 70 if (!peer) 71 return -ENOMEM; 72 b->peer_backlog[head] = peer; 73 smp_store_release(&b->peer_backlog_head, 74 (head + 1) & (size - 1)); 75 } 76 77 head = b->conn_backlog_head; 78 tail = READ_ONCE(b->conn_backlog_tail); 79 if (CIRC_CNT(head, tail, size) < max) { 80 struct rxrpc_connection *conn; 81 82 conn = rxrpc_prealloc_service_connection(gfp); 83 if (!conn) 84 return -ENOMEM; 85 b->conn_backlog[head] = conn; 86 smp_store_release(&b->conn_backlog_head, 87 (head + 1) & (size - 1)); 88 89 trace_rxrpc_conn(conn, rxrpc_conn_new_service, 90 atomic_read(&conn->usage), here); 91 } 92 93 /* Now it gets complicated, because calls get registered with the 94 * socket here, particularly if a user ID is preassigned by the user. 95 */ 96 call = rxrpc_alloc_call(gfp); 97 if (!call) 98 return -ENOMEM; 99 call->flags |= (1 << RXRPC_CALL_IS_SERVICE); 100 call->state = RXRPC_CALL_SERVER_PREALLOC; 101 102 trace_rxrpc_call(call, rxrpc_call_new_service, 103 atomic_read(&call->usage), 104 here, (const void *)user_call_ID); 105 106 write_lock(&rx->call_lock); 107 if (user_attach_call) { 108 struct rxrpc_call *xcall; 109 struct rb_node *parent, **pp; 110 111 /* Check the user ID isn't already in use */ 112 pp = &rx->calls.rb_node; 113 parent = NULL; 114 while (*pp) { 115 parent = *pp; 116 xcall = rb_entry(parent, struct rxrpc_call, sock_node); 117 if (user_call_ID < call->user_call_ID) 118 pp = &(*pp)->rb_left; 119 else if (user_call_ID > call->user_call_ID) 120 pp = &(*pp)->rb_right; 121 else 122 goto id_in_use; 123 } 124 125 call->user_call_ID = user_call_ID; 126 call->notify_rx = notify_rx; 127 rxrpc_get_call(call, rxrpc_call_got_kernel); 128 user_attach_call(call, user_call_ID); 129 rxrpc_get_call(call, rxrpc_call_got_userid); 130 rb_link_node(&call->sock_node, parent, pp); 131 rb_insert_color(&call->sock_node, &rx->calls); 132 set_bit(RXRPC_CALL_HAS_USERID, &call->flags); 133 } 134 135 list_add(&call->sock_link, &rx->sock_calls); 136 137 write_unlock(&rx->call_lock); 138 139 write_lock(&rxrpc_call_lock); 140 list_add_tail(&call->link, &rxrpc_calls); 141 write_unlock(&rxrpc_call_lock); 142 143 b->call_backlog[call_head] = call; 144 smp_store_release(&b->call_backlog_head, (call_head + 1) & (size - 1)); 145 _leave(" = 0 [%d -> %lx]", call->debug_id, user_call_ID); 146 return 0; 147 148 id_in_use: 149 write_unlock(&rx->call_lock); 150 rxrpc_cleanup_call(call); 151 _leave(" = -EBADSLT"); 152 return -EBADSLT; 153 } 154 155 /* 156 * Preallocate sufficient service connections, calls and peers to cover the 157 * entire backlog of a socket. When a new call comes in, if we don't have 158 * sufficient of each available, the call gets rejected as busy or ignored. 159 * 160 * The backlog is replenished when a connection is accepted or rejected. 161 */ 162 int rxrpc_service_prealloc(struct rxrpc_sock *rx, gfp_t gfp) 163 { 164 struct rxrpc_backlog *b = rx->backlog; 165 166 if (!b) { 167 b = kzalloc(sizeof(struct rxrpc_backlog), gfp); 168 if (!b) 169 return -ENOMEM; 170 rx->backlog = b; 171 } 172 173 if (rx->discard_new_call) 174 return 0; 175 176 while (rxrpc_service_prealloc_one(rx, b, NULL, NULL, 0, gfp) == 0) 177 ; 178 179 return 0; 180 } 181 182 /* 183 * Discard the preallocation on a service. 184 */ 185 void rxrpc_discard_prealloc(struct rxrpc_sock *rx) 186 { 187 struct rxrpc_backlog *b = rx->backlog; 188 unsigned int size = RXRPC_BACKLOG_MAX, head, tail; 189 190 if (!b) 191 return; 192 rx->backlog = NULL; 193 194 /* Make sure that there aren't any incoming calls in progress before we 195 * clear the preallocation buffers. 196 */ 197 spin_lock_bh(&rx->incoming_lock); 198 spin_unlock_bh(&rx->incoming_lock); 199 200 head = b->peer_backlog_head; 201 tail = b->peer_backlog_tail; 202 while (CIRC_CNT(head, tail, size) > 0) { 203 struct rxrpc_peer *peer = b->peer_backlog[tail]; 204 kfree(peer); 205 tail = (tail + 1) & (size - 1); 206 } 207 208 head = b->conn_backlog_head; 209 tail = b->conn_backlog_tail; 210 while (CIRC_CNT(head, tail, size) > 0) { 211 struct rxrpc_connection *conn = b->conn_backlog[tail]; 212 write_lock(&rxrpc_connection_lock); 213 list_del(&conn->link); 214 list_del(&conn->proc_link); 215 write_unlock(&rxrpc_connection_lock); 216 kfree(conn); 217 tail = (tail + 1) & (size - 1); 218 } 219 220 head = b->call_backlog_head; 221 tail = b->call_backlog_tail; 222 while (CIRC_CNT(head, tail, size) > 0) { 223 struct rxrpc_call *call = b->call_backlog[tail]; 224 if (rx->discard_new_call) { 225 _debug("discard %lx", call->user_call_ID); 226 rx->discard_new_call(call, call->user_call_ID); 227 rxrpc_put_call(call, rxrpc_call_put_kernel); 228 } 229 rxrpc_call_completed(call); 230 rxrpc_release_call(rx, call); 231 rxrpc_put_call(call, rxrpc_call_put); 232 tail = (tail + 1) & (size - 1); 233 } 234 235 kfree(b); 236 } 237 238 /* 239 * Allocate a new incoming call from the prealloc pool, along with a connection 240 * and a peer as necessary. 241 */ 242 static struct rxrpc_call *rxrpc_alloc_incoming_call(struct rxrpc_sock *rx, 243 struct rxrpc_local *local, 244 struct rxrpc_connection *conn, 245 struct sk_buff *skb) 246 { 247 struct rxrpc_backlog *b = rx->backlog; 248 struct rxrpc_peer *peer, *xpeer; 249 struct rxrpc_call *call; 250 unsigned short call_head, conn_head, peer_head; 251 unsigned short call_tail, conn_tail, peer_tail; 252 unsigned short call_count, conn_count; 253 254 /* #calls >= #conns >= #peers must hold true. */ 255 call_head = smp_load_acquire(&b->call_backlog_head); 256 call_tail = b->call_backlog_tail; 257 call_count = CIRC_CNT(call_head, call_tail, RXRPC_BACKLOG_MAX); 258 conn_head = smp_load_acquire(&b->conn_backlog_head); 259 conn_tail = b->conn_backlog_tail; 260 conn_count = CIRC_CNT(conn_head, conn_tail, RXRPC_BACKLOG_MAX); 261 ASSERTCMP(conn_count, >=, call_count); 262 peer_head = smp_load_acquire(&b->peer_backlog_head); 263 peer_tail = b->peer_backlog_tail; 264 ASSERTCMP(CIRC_CNT(peer_head, peer_tail, RXRPC_BACKLOG_MAX), >=, 265 conn_count); 266 267 if (call_count == 0) 268 return NULL; 269 270 if (!conn) { 271 /* No connection. We're going to need a peer to start off 272 * with. If one doesn't yet exist, use a spare from the 273 * preallocation set. We dump the address into the spare in 274 * anticipation - and to save on stack space. 275 */ 276 xpeer = b->peer_backlog[peer_tail]; 277 if (rxrpc_extract_addr_from_skb(&xpeer->srx, skb) < 0) 278 return NULL; 279 280 peer = rxrpc_lookup_incoming_peer(local, xpeer); 281 if (peer == xpeer) { 282 b->peer_backlog[peer_tail] = NULL; 283 smp_store_release(&b->peer_backlog_tail, 284 (peer_tail + 1) & 285 (RXRPC_BACKLOG_MAX - 1)); 286 } 287 288 /* Now allocate and set up the connection */ 289 conn = b->conn_backlog[conn_tail]; 290 b->conn_backlog[conn_tail] = NULL; 291 smp_store_release(&b->conn_backlog_tail, 292 (conn_tail + 1) & (RXRPC_BACKLOG_MAX - 1)); 293 rxrpc_get_local(local); 294 conn->params.local = local; 295 conn->params.peer = peer; 296 rxrpc_see_connection(conn); 297 rxrpc_new_incoming_connection(conn, skb); 298 } else { 299 rxrpc_get_connection(conn); 300 } 301 302 /* And now we can allocate and set up a new call */ 303 call = b->call_backlog[call_tail]; 304 b->call_backlog[call_tail] = NULL; 305 smp_store_release(&b->call_backlog_tail, 306 (call_tail + 1) & (RXRPC_BACKLOG_MAX - 1)); 307 308 rxrpc_see_call(call); 309 call->conn = conn; 310 call->peer = rxrpc_get_peer(conn->params.peer); 311 return call; 312 } 313 314 /* 315 * Set up a new incoming call. Called in BH context with the RCU read lock 316 * held. 317 * 318 * If this is for a kernel service, when we allocate the call, it will have 319 * three refs on it: (1) the kernel service, (2) the user_call_ID tree, (3) the 320 * retainer ref obtained from the backlog buffer. Prealloc calls for userspace 321 * services only have the ref from the backlog buffer. We want to pass this 322 * ref to non-BH context to dispose of. 323 * 324 * If we want to report an error, we mark the skb with the packet type and 325 * abort code and return NULL. 326 */ 327 struct rxrpc_call *rxrpc_new_incoming_call(struct rxrpc_local *local, 328 struct rxrpc_connection *conn, 329 struct sk_buff *skb) 330 { 331 struct rxrpc_skb_priv *sp = rxrpc_skb(skb); 332 struct rxrpc_sock *rx; 333 struct rxrpc_call *call; 334 u16 service_id = sp->hdr.serviceId; 335 336 _enter(""); 337 338 /* Get the socket providing the service */ 339 rx = rcu_dereference(local->service); 340 if (rx && service_id == rx->srx.srx_service) 341 goto found_service; 342 343 trace_rxrpc_abort("INV", sp->hdr.cid, sp->hdr.callNumber, sp->hdr.seq, 344 RX_INVALID_OPERATION, EOPNOTSUPP); 345 skb->mark = RXRPC_SKB_MARK_LOCAL_ABORT; 346 skb->priority = RX_INVALID_OPERATION; 347 _leave(" = NULL [service]"); 348 return NULL; 349 350 found_service: 351 spin_lock(&rx->incoming_lock); 352 if (rx->sk.sk_state == RXRPC_SERVER_LISTEN_DISABLED || 353 rx->sk.sk_state == RXRPC_CLOSE) { 354 trace_rxrpc_abort("CLS", sp->hdr.cid, sp->hdr.callNumber, 355 sp->hdr.seq, RX_INVALID_OPERATION, ESHUTDOWN); 356 skb->mark = RXRPC_SKB_MARK_LOCAL_ABORT; 357 skb->priority = RX_INVALID_OPERATION; 358 _leave(" = NULL [close]"); 359 call = NULL; 360 goto out; 361 } 362 363 call = rxrpc_alloc_incoming_call(rx, local, conn, skb); 364 if (!call) { 365 skb->mark = RXRPC_SKB_MARK_BUSY; 366 _leave(" = NULL [busy]"); 367 call = NULL; 368 goto out; 369 } 370 371 trace_rxrpc_receive(call, rxrpc_receive_incoming, 372 sp->hdr.serial, sp->hdr.seq); 373 374 /* Make the call live. */ 375 rxrpc_incoming_call(rx, call, skb); 376 conn = call->conn; 377 378 if (rx->notify_new_call) 379 rx->notify_new_call(&rx->sk, call, call->user_call_ID); 380 else 381 sk_acceptq_added(&rx->sk); 382 383 spin_lock(&conn->state_lock); 384 switch (conn->state) { 385 case RXRPC_CONN_SERVICE_UNSECURED: 386 conn->state = RXRPC_CONN_SERVICE_CHALLENGING; 387 set_bit(RXRPC_CONN_EV_CHALLENGE, &call->conn->events); 388 rxrpc_queue_conn(call->conn); 389 break; 390 391 case RXRPC_CONN_SERVICE: 392 write_lock(&call->state_lock); 393 if (rx->discard_new_call) 394 call->state = RXRPC_CALL_SERVER_RECV_REQUEST; 395 else 396 call->state = RXRPC_CALL_SERVER_ACCEPTING; 397 write_unlock(&call->state_lock); 398 break; 399 400 case RXRPC_CONN_REMOTELY_ABORTED: 401 rxrpc_set_call_completion(call, RXRPC_CALL_REMOTELY_ABORTED, 402 conn->remote_abort, ECONNABORTED); 403 break; 404 case RXRPC_CONN_LOCALLY_ABORTED: 405 rxrpc_abort_call("CON", call, sp->hdr.seq, 406 conn->local_abort, ECONNABORTED); 407 break; 408 default: 409 BUG(); 410 } 411 spin_unlock(&conn->state_lock); 412 413 if (call->state == RXRPC_CALL_SERVER_ACCEPTING) 414 rxrpc_notify_socket(call); 415 416 /* We have to discard the prealloc queue's ref here and rely on a 417 * combination of the RCU read lock and refs held either by the socket 418 * (recvmsg queue, to-be-accepted queue or user ID tree) or the kernel 419 * service to prevent the call from being deallocated too early. 420 */ 421 rxrpc_put_call(call, rxrpc_call_put); 422 423 _leave(" = %p{%d}", call, call->debug_id); 424 out: 425 spin_unlock(&rx->incoming_lock); 426 return call; 427 } 428 429 /* 430 * handle acceptance of a call by userspace 431 * - assign the user call ID to the call at the front of the queue 432 */ 433 struct rxrpc_call *rxrpc_accept_call(struct rxrpc_sock *rx, 434 unsigned long user_call_ID, 435 rxrpc_notify_rx_t notify_rx) 436 { 437 struct rxrpc_call *call; 438 struct rb_node *parent, **pp; 439 int ret; 440 441 _enter(",%lx", user_call_ID); 442 443 ASSERT(!irqs_disabled()); 444 445 write_lock(&rx->call_lock); 446 447 if (list_empty(&rx->to_be_accepted)) { 448 write_unlock(&rx->call_lock); 449 kleave(" = -ENODATA [empty]"); 450 return ERR_PTR(-ENODATA); 451 } 452 453 /* check the user ID isn't already in use */ 454 pp = &rx->calls.rb_node; 455 parent = NULL; 456 while (*pp) { 457 parent = *pp; 458 call = rb_entry(parent, struct rxrpc_call, sock_node); 459 460 if (user_call_ID < call->user_call_ID) 461 pp = &(*pp)->rb_left; 462 else if (user_call_ID > call->user_call_ID) 463 pp = &(*pp)->rb_right; 464 else 465 goto id_in_use; 466 } 467 468 /* Dequeue the first call and check it's still valid. We gain 469 * responsibility for the queue's reference. 470 */ 471 call = list_entry(rx->to_be_accepted.next, 472 struct rxrpc_call, accept_link); 473 list_del_init(&call->accept_link); 474 sk_acceptq_removed(&rx->sk); 475 rxrpc_see_call(call); 476 477 write_lock_bh(&call->state_lock); 478 switch (call->state) { 479 case RXRPC_CALL_SERVER_ACCEPTING: 480 call->state = RXRPC_CALL_SERVER_RECV_REQUEST; 481 break; 482 case RXRPC_CALL_COMPLETE: 483 ret = call->error; 484 goto out_release; 485 default: 486 BUG(); 487 } 488 489 /* formalise the acceptance */ 490 call->notify_rx = notify_rx; 491 call->user_call_ID = user_call_ID; 492 rxrpc_get_call(call, rxrpc_call_got_userid); 493 rb_link_node(&call->sock_node, parent, pp); 494 rb_insert_color(&call->sock_node, &rx->calls); 495 if (test_and_set_bit(RXRPC_CALL_HAS_USERID, &call->flags)) 496 BUG(); 497 498 write_unlock_bh(&call->state_lock); 499 write_unlock(&rx->call_lock); 500 rxrpc_notify_socket(call); 501 rxrpc_service_prealloc(rx, GFP_KERNEL); 502 _leave(" = %p{%d}", call, call->debug_id); 503 return call; 504 505 out_release: 506 _debug("release %p", call); 507 write_unlock_bh(&call->state_lock); 508 write_unlock(&rx->call_lock); 509 rxrpc_release_call(rx, call); 510 rxrpc_put_call(call, rxrpc_call_put); 511 goto out; 512 513 id_in_use: 514 ret = -EBADSLT; 515 write_unlock(&rx->call_lock); 516 out: 517 rxrpc_service_prealloc(rx, GFP_KERNEL); 518 _leave(" = %d", ret); 519 return ERR_PTR(ret); 520 } 521 522 /* 523 * Handle rejection of a call by userspace 524 * - reject the call at the front of the queue 525 */ 526 int rxrpc_reject_call(struct rxrpc_sock *rx) 527 { 528 struct rxrpc_call *call; 529 bool abort = false; 530 int ret; 531 532 _enter(""); 533 534 ASSERT(!irqs_disabled()); 535 536 write_lock(&rx->call_lock); 537 538 if (list_empty(&rx->to_be_accepted)) { 539 write_unlock(&rx->call_lock); 540 return -ENODATA; 541 } 542 543 /* Dequeue the first call and check it's still valid. We gain 544 * responsibility for the queue's reference. 545 */ 546 call = list_entry(rx->to_be_accepted.next, 547 struct rxrpc_call, accept_link); 548 list_del_init(&call->accept_link); 549 sk_acceptq_removed(&rx->sk); 550 rxrpc_see_call(call); 551 552 write_lock_bh(&call->state_lock); 553 switch (call->state) { 554 case RXRPC_CALL_SERVER_ACCEPTING: 555 __rxrpc_abort_call("REJ", call, 1, RX_USER_ABORT, ECONNABORTED); 556 abort = true; 557 /* fall through */ 558 case RXRPC_CALL_COMPLETE: 559 ret = call->error; 560 goto out_discard; 561 default: 562 BUG(); 563 } 564 565 out_discard: 566 write_unlock_bh(&call->state_lock); 567 write_unlock(&rx->call_lock); 568 if (abort) { 569 rxrpc_send_abort_packet(call); 570 rxrpc_release_call(rx, call); 571 rxrpc_put_call(call, rxrpc_call_put); 572 } 573 rxrpc_service_prealloc(rx, GFP_KERNEL); 574 _leave(" = %d", ret); 575 return ret; 576 } 577 578 /* 579 * rxrpc_kernel_charge_accept - Charge up socket with preallocated calls 580 * @sock: The socket on which to preallocate 581 * @notify_rx: Event notification function for the call 582 * @user_attach_call: Func to attach call to user_call_ID 583 * @user_call_ID: The tag to attach to the preallocated call 584 * @gfp: The allocation conditions. 585 * 586 * Charge up the socket with preallocated calls, each with a user ID. A 587 * function should be provided to effect the attachment from the user's side. 588 * The user is given a ref to hold on the call. 589 * 590 * Note that the call may be come connected before this function returns. 591 */ 592 int rxrpc_kernel_charge_accept(struct socket *sock, 593 rxrpc_notify_rx_t notify_rx, 594 rxrpc_user_attach_call_t user_attach_call, 595 unsigned long user_call_ID, gfp_t gfp) 596 { 597 struct rxrpc_sock *rx = rxrpc_sk(sock->sk); 598 struct rxrpc_backlog *b = rx->backlog; 599 600 if (sock->sk->sk_state == RXRPC_CLOSE) 601 return -ESHUTDOWN; 602 603 return rxrpc_service_prealloc_one(rx, b, notify_rx, 604 user_attach_call, user_call_ID, 605 gfp); 606 } 607 EXPORT_SYMBOL(rxrpc_kernel_charge_accept); 608