1 /* 2 * fs/nfs/nfs4state.c 3 * 4 * Client-side XDR for NFSv4. 5 * 6 * Copyright (c) 2002 The Regents of the University of Michigan. 7 * All rights reserved. 8 * 9 * Kendrick Smith <kmsmith@umich.edu> 10 * 11 * Redistribution and use in source and binary forms, with or without 12 * modification, are permitted provided that the following conditions 13 * are met: 14 * 15 * 1. Redistributions of source code must retain the above copyright 16 * notice, this list of conditions and the following disclaimer. 17 * 2. Redistributions in binary form must reproduce the above copyright 18 * notice, this list of conditions and the following disclaimer in the 19 * documentation and/or other materials provided with the distribution. 20 * 3. Neither the name of the University nor the names of its 21 * contributors may be used to endorse or promote products derived 22 * from this software without specific prior written permission. 23 * 24 * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED 25 * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF 26 * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE 27 * DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 28 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR 29 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF 30 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR 31 * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF 32 * LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING 33 * NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS 34 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 35 * 36 * Implementation of the NFSv4 state model. For the time being, 37 * this is minimal, but will be made much more complex in a 38 * subsequent patch. 39 */ 40 41 #include <linux/kernel.h> 42 #include <linux/slab.h> 43 #include <linux/fs.h> 44 #include <linux/nfs_fs.h> 45 #include <linux/kthread.h> 46 #include <linux/module.h> 47 #include <linux/random.h> 48 #include <linux/ratelimit.h> 49 #include <linux/workqueue.h> 50 #include <linux/bitops.h> 51 #include <linux/jiffies.h> 52 53 #include <linux/sunrpc/clnt.h> 54 55 #include "nfs4_fs.h" 56 #include "callback.h" 57 #include "delegation.h" 58 #include "internal.h" 59 #include "nfs4idmap.h" 60 #include "nfs4session.h" 61 #include "pnfs.h" 62 #include "netns.h" 63 64 #define NFSDBG_FACILITY NFSDBG_STATE 65 66 #define OPENOWNER_POOL_SIZE 8 67 68 const nfs4_stateid zero_stateid = { 69 .data = { 0 }, 70 .type = NFS4_SPECIAL_STATEID_TYPE, 71 }; 72 static DEFINE_MUTEX(nfs_clid_init_mutex); 73 74 int nfs4_init_clientid(struct nfs_client *clp, struct rpc_cred *cred) 75 { 76 struct nfs4_setclientid_res clid = { 77 .clientid = clp->cl_clientid, 78 .confirm = clp->cl_confirm, 79 }; 80 unsigned short port; 81 int status; 82 struct nfs_net *nn = net_generic(clp->cl_net, nfs_net_id); 83 84 if (test_bit(NFS4CLNT_LEASE_CONFIRM, &clp->cl_state)) 85 goto do_confirm; 86 port = nn->nfs_callback_tcpport; 87 if (clp->cl_addr.ss_family == AF_INET6) 88 port = nn->nfs_callback_tcpport6; 89 90 status = nfs4_proc_setclientid(clp, NFS4_CALLBACK, port, cred, &clid); 91 if (status != 0) 92 goto out; 93 clp->cl_clientid = clid.clientid; 94 clp->cl_confirm = clid.confirm; 95 set_bit(NFS4CLNT_LEASE_CONFIRM, &clp->cl_state); 96 do_confirm: 97 status = nfs4_proc_setclientid_confirm(clp, &clid, cred); 98 if (status != 0) 99 goto out; 100 clear_bit(NFS4CLNT_LEASE_CONFIRM, &clp->cl_state); 101 nfs4_schedule_state_renewal(clp); 102 out: 103 return status; 104 } 105 106 /** 107 * nfs40_discover_server_trunking - Detect server IP address trunking (mv0) 108 * 109 * @clp: nfs_client under test 110 * @result: OUT: found nfs_client, or clp 111 * @cred: credential to use for trunking test 112 * 113 * Returns zero, a negative errno, or a negative NFS4ERR status. 114 * If zero is returned, an nfs_client pointer is planted in 115 * "result". 116 * 117 * Note: The returned client may not yet be marked ready. 118 */ 119 int nfs40_discover_server_trunking(struct nfs_client *clp, 120 struct nfs_client **result, 121 struct rpc_cred *cred) 122 { 123 struct nfs4_setclientid_res clid = { 124 .clientid = clp->cl_clientid, 125 .confirm = clp->cl_confirm, 126 }; 127 struct nfs_net *nn = net_generic(clp->cl_net, nfs_net_id); 128 unsigned short port; 129 int status; 130 131 port = nn->nfs_callback_tcpport; 132 if (clp->cl_addr.ss_family == AF_INET6) 133 port = nn->nfs_callback_tcpport6; 134 135 status = nfs4_proc_setclientid(clp, NFS4_CALLBACK, port, cred, &clid); 136 if (status != 0) 137 goto out; 138 clp->cl_clientid = clid.clientid; 139 clp->cl_confirm = clid.confirm; 140 141 status = nfs40_walk_client_list(clp, result, cred); 142 if (status == 0) { 143 /* Sustain the lease, even if it's empty. If the clientid4 144 * goes stale it's of no use for trunking discovery. */ 145 nfs4_schedule_state_renewal(*result); 146 } 147 out: 148 return status; 149 } 150 151 struct rpc_cred *nfs4_get_machine_cred_locked(struct nfs_client *clp) 152 { 153 struct rpc_cred *cred = NULL; 154 155 if (clp->cl_machine_cred != NULL) 156 cred = get_rpccred(clp->cl_machine_cred); 157 return cred; 158 } 159 160 static void nfs4_root_machine_cred(struct nfs_client *clp) 161 { 162 struct rpc_cred *cred, *new; 163 164 new = rpc_lookup_machine_cred(NULL); 165 spin_lock(&clp->cl_lock); 166 cred = clp->cl_machine_cred; 167 clp->cl_machine_cred = new; 168 spin_unlock(&clp->cl_lock); 169 if (cred != NULL) 170 put_rpccred(cred); 171 } 172 173 static struct rpc_cred * 174 nfs4_get_renew_cred_server_locked(struct nfs_server *server) 175 { 176 struct rpc_cred *cred = NULL; 177 struct nfs4_state_owner *sp; 178 struct rb_node *pos; 179 180 for (pos = rb_first(&server->state_owners); 181 pos != NULL; 182 pos = rb_next(pos)) { 183 sp = rb_entry(pos, struct nfs4_state_owner, so_server_node); 184 if (list_empty(&sp->so_states)) 185 continue; 186 cred = get_rpccred(sp->so_cred); 187 break; 188 } 189 return cred; 190 } 191 192 /** 193 * nfs4_get_renew_cred_locked - Acquire credential for a renew operation 194 * @clp: client state handle 195 * 196 * Returns an rpc_cred with reference count bumped, or NULL. 197 * Caller must hold clp->cl_lock. 198 */ 199 struct rpc_cred *nfs4_get_renew_cred_locked(struct nfs_client *clp) 200 { 201 struct rpc_cred *cred = NULL; 202 struct nfs_server *server; 203 204 /* Use machine credentials if available */ 205 cred = nfs4_get_machine_cred_locked(clp); 206 if (cred != NULL) 207 goto out; 208 209 rcu_read_lock(); 210 list_for_each_entry_rcu(server, &clp->cl_superblocks, client_link) { 211 cred = nfs4_get_renew_cred_server_locked(server); 212 if (cred != NULL) 213 break; 214 } 215 rcu_read_unlock(); 216 217 out: 218 return cred; 219 } 220 221 static void nfs4_end_drain_slot_table(struct nfs4_slot_table *tbl) 222 { 223 if (test_and_clear_bit(NFS4_SLOT_TBL_DRAINING, &tbl->slot_tbl_state)) { 224 spin_lock(&tbl->slot_tbl_lock); 225 nfs41_wake_slot_table(tbl); 226 spin_unlock(&tbl->slot_tbl_lock); 227 } 228 } 229 230 static void nfs4_end_drain_session(struct nfs_client *clp) 231 { 232 struct nfs4_session *ses = clp->cl_session; 233 234 if (clp->cl_slot_tbl) { 235 nfs4_end_drain_slot_table(clp->cl_slot_tbl); 236 return; 237 } 238 239 if (ses != NULL) { 240 nfs4_end_drain_slot_table(&ses->bc_slot_table); 241 nfs4_end_drain_slot_table(&ses->fc_slot_table); 242 } 243 } 244 245 static int nfs4_drain_slot_tbl(struct nfs4_slot_table *tbl) 246 { 247 set_bit(NFS4_SLOT_TBL_DRAINING, &tbl->slot_tbl_state); 248 spin_lock(&tbl->slot_tbl_lock); 249 if (tbl->highest_used_slotid != NFS4_NO_SLOT) { 250 reinit_completion(&tbl->complete); 251 spin_unlock(&tbl->slot_tbl_lock); 252 return wait_for_completion_interruptible(&tbl->complete); 253 } 254 spin_unlock(&tbl->slot_tbl_lock); 255 return 0; 256 } 257 258 static int nfs4_begin_drain_session(struct nfs_client *clp) 259 { 260 struct nfs4_session *ses = clp->cl_session; 261 int ret = 0; 262 263 if (clp->cl_slot_tbl) 264 return nfs4_drain_slot_tbl(clp->cl_slot_tbl); 265 266 /* back channel */ 267 ret = nfs4_drain_slot_tbl(&ses->bc_slot_table); 268 if (ret) 269 return ret; 270 /* fore channel */ 271 return nfs4_drain_slot_tbl(&ses->fc_slot_table); 272 } 273 274 #if defined(CONFIG_NFS_V4_1) 275 276 static int nfs41_setup_state_renewal(struct nfs_client *clp) 277 { 278 int status; 279 struct nfs_fsinfo fsinfo; 280 281 if (!test_bit(NFS_CS_CHECK_LEASE_TIME, &clp->cl_res_state)) { 282 nfs4_schedule_state_renewal(clp); 283 return 0; 284 } 285 286 status = nfs4_proc_get_lease_time(clp, &fsinfo); 287 if (status == 0) { 288 /* Update lease time and schedule renewal */ 289 spin_lock(&clp->cl_lock); 290 clp->cl_lease_time = fsinfo.lease_time * HZ; 291 clp->cl_last_renewal = jiffies; 292 spin_unlock(&clp->cl_lock); 293 294 nfs4_schedule_state_renewal(clp); 295 } 296 297 return status; 298 } 299 300 static void nfs41_finish_session_reset(struct nfs_client *clp) 301 { 302 clear_bit(NFS4CLNT_LEASE_CONFIRM, &clp->cl_state); 303 clear_bit(NFS4CLNT_SESSION_RESET, &clp->cl_state); 304 /* create_session negotiated new slot table */ 305 clear_bit(NFS4CLNT_BIND_CONN_TO_SESSION, &clp->cl_state); 306 nfs41_setup_state_renewal(clp); 307 } 308 309 int nfs41_init_clientid(struct nfs_client *clp, struct rpc_cred *cred) 310 { 311 int status; 312 313 if (test_bit(NFS4CLNT_LEASE_CONFIRM, &clp->cl_state)) 314 goto do_confirm; 315 status = nfs4_proc_exchange_id(clp, cred); 316 if (status != 0) 317 goto out; 318 set_bit(NFS4CLNT_LEASE_CONFIRM, &clp->cl_state); 319 do_confirm: 320 status = nfs4_proc_create_session(clp, cred); 321 if (status != 0) 322 goto out; 323 nfs41_finish_session_reset(clp); 324 nfs_mark_client_ready(clp, NFS_CS_READY); 325 out: 326 return status; 327 } 328 329 /** 330 * nfs41_discover_server_trunking - Detect server IP address trunking (mv1) 331 * 332 * @clp: nfs_client under test 333 * @result: OUT: found nfs_client, or clp 334 * @cred: credential to use for trunking test 335 * 336 * Returns NFS4_OK, a negative errno, or a negative NFS4ERR status. 337 * If NFS4_OK is returned, an nfs_client pointer is planted in 338 * "result". 339 * 340 * Note: The returned client may not yet be marked ready. 341 */ 342 int nfs41_discover_server_trunking(struct nfs_client *clp, 343 struct nfs_client **result, 344 struct rpc_cred *cred) 345 { 346 int status; 347 348 status = nfs4_proc_exchange_id(clp, cred); 349 if (status != NFS4_OK) 350 return status; 351 352 status = nfs41_walk_client_list(clp, result, cred); 353 if (status < 0) 354 return status; 355 if (clp != *result) 356 return 0; 357 358 /* Purge state if the client id was established in a prior instance */ 359 if (clp->cl_exchange_flags & EXCHGID4_FLAG_CONFIRMED_R) 360 set_bit(NFS4CLNT_PURGE_STATE, &clp->cl_state); 361 else 362 set_bit(NFS4CLNT_LEASE_CONFIRM, &clp->cl_state); 363 nfs4_schedule_state_manager(clp); 364 status = nfs_wait_client_init_complete(clp); 365 if (status < 0) 366 nfs_put_client(clp); 367 return status; 368 } 369 370 #endif /* CONFIG_NFS_V4_1 */ 371 372 /** 373 * nfs4_get_clid_cred - Acquire credential for a setclientid operation 374 * @clp: client state handle 375 * 376 * Returns an rpc_cred with reference count bumped, or NULL. 377 */ 378 struct rpc_cred *nfs4_get_clid_cred(struct nfs_client *clp) 379 { 380 struct rpc_cred *cred; 381 382 spin_lock(&clp->cl_lock); 383 cred = nfs4_get_machine_cred_locked(clp); 384 spin_unlock(&clp->cl_lock); 385 return cred; 386 } 387 388 static struct nfs4_state_owner * 389 nfs4_find_state_owner_locked(struct nfs_server *server, struct rpc_cred *cred) 390 { 391 struct rb_node **p = &server->state_owners.rb_node, 392 *parent = NULL; 393 struct nfs4_state_owner *sp; 394 395 while (*p != NULL) { 396 parent = *p; 397 sp = rb_entry(parent, struct nfs4_state_owner, so_server_node); 398 399 if (cred < sp->so_cred) 400 p = &parent->rb_left; 401 else if (cred > sp->so_cred) 402 p = &parent->rb_right; 403 else { 404 if (!list_empty(&sp->so_lru)) 405 list_del_init(&sp->so_lru); 406 atomic_inc(&sp->so_count); 407 return sp; 408 } 409 } 410 return NULL; 411 } 412 413 static struct nfs4_state_owner * 414 nfs4_insert_state_owner_locked(struct nfs4_state_owner *new) 415 { 416 struct nfs_server *server = new->so_server; 417 struct rb_node **p = &server->state_owners.rb_node, 418 *parent = NULL; 419 struct nfs4_state_owner *sp; 420 int err; 421 422 while (*p != NULL) { 423 parent = *p; 424 sp = rb_entry(parent, struct nfs4_state_owner, so_server_node); 425 426 if (new->so_cred < sp->so_cred) 427 p = &parent->rb_left; 428 else if (new->so_cred > sp->so_cred) 429 p = &parent->rb_right; 430 else { 431 if (!list_empty(&sp->so_lru)) 432 list_del_init(&sp->so_lru); 433 atomic_inc(&sp->so_count); 434 return sp; 435 } 436 } 437 err = ida_get_new(&server->openowner_id, &new->so_seqid.owner_id); 438 if (err) 439 return ERR_PTR(err); 440 rb_link_node(&new->so_server_node, parent, p); 441 rb_insert_color(&new->so_server_node, &server->state_owners); 442 return new; 443 } 444 445 static void 446 nfs4_remove_state_owner_locked(struct nfs4_state_owner *sp) 447 { 448 struct nfs_server *server = sp->so_server; 449 450 if (!RB_EMPTY_NODE(&sp->so_server_node)) 451 rb_erase(&sp->so_server_node, &server->state_owners); 452 ida_remove(&server->openowner_id, sp->so_seqid.owner_id); 453 } 454 455 static void 456 nfs4_init_seqid_counter(struct nfs_seqid_counter *sc) 457 { 458 sc->create_time = ktime_get(); 459 sc->flags = 0; 460 sc->counter = 0; 461 spin_lock_init(&sc->lock); 462 INIT_LIST_HEAD(&sc->list); 463 rpc_init_wait_queue(&sc->wait, "Seqid_waitqueue"); 464 } 465 466 static void 467 nfs4_destroy_seqid_counter(struct nfs_seqid_counter *sc) 468 { 469 rpc_destroy_wait_queue(&sc->wait); 470 } 471 472 /* 473 * nfs4_alloc_state_owner(): this is called on the OPEN or CREATE path to 474 * create a new state_owner. 475 * 476 */ 477 static struct nfs4_state_owner * 478 nfs4_alloc_state_owner(struct nfs_server *server, 479 struct rpc_cred *cred, 480 gfp_t gfp_flags) 481 { 482 struct nfs4_state_owner *sp; 483 484 sp = kzalloc(sizeof(*sp), gfp_flags); 485 if (!sp) 486 return NULL; 487 sp->so_server = server; 488 sp->so_cred = get_rpccred(cred); 489 spin_lock_init(&sp->so_lock); 490 INIT_LIST_HEAD(&sp->so_states); 491 nfs4_init_seqid_counter(&sp->so_seqid); 492 atomic_set(&sp->so_count, 1); 493 INIT_LIST_HEAD(&sp->so_lru); 494 seqcount_init(&sp->so_reclaim_seqcount); 495 mutex_init(&sp->so_delegreturn_mutex); 496 return sp; 497 } 498 499 static void 500 nfs4_drop_state_owner(struct nfs4_state_owner *sp) 501 { 502 struct rb_node *rb_node = &sp->so_server_node; 503 504 if (!RB_EMPTY_NODE(rb_node)) { 505 struct nfs_server *server = sp->so_server; 506 struct nfs_client *clp = server->nfs_client; 507 508 spin_lock(&clp->cl_lock); 509 if (!RB_EMPTY_NODE(rb_node)) { 510 rb_erase(rb_node, &server->state_owners); 511 RB_CLEAR_NODE(rb_node); 512 } 513 spin_unlock(&clp->cl_lock); 514 } 515 } 516 517 static void nfs4_free_state_owner(struct nfs4_state_owner *sp) 518 { 519 nfs4_destroy_seqid_counter(&sp->so_seqid); 520 put_rpccred(sp->so_cred); 521 kfree(sp); 522 } 523 524 static void nfs4_gc_state_owners(struct nfs_server *server) 525 { 526 struct nfs_client *clp = server->nfs_client; 527 struct nfs4_state_owner *sp, *tmp; 528 unsigned long time_min, time_max; 529 LIST_HEAD(doomed); 530 531 spin_lock(&clp->cl_lock); 532 time_max = jiffies; 533 time_min = (long)time_max - (long)clp->cl_lease_time; 534 list_for_each_entry_safe(sp, tmp, &server->state_owners_lru, so_lru) { 535 /* NB: LRU is sorted so that oldest is at the head */ 536 if (time_in_range(sp->so_expires, time_min, time_max)) 537 break; 538 list_move(&sp->so_lru, &doomed); 539 nfs4_remove_state_owner_locked(sp); 540 } 541 spin_unlock(&clp->cl_lock); 542 543 list_for_each_entry_safe(sp, tmp, &doomed, so_lru) { 544 list_del(&sp->so_lru); 545 nfs4_free_state_owner(sp); 546 } 547 } 548 549 /** 550 * nfs4_get_state_owner - Look up a state owner given a credential 551 * @server: nfs_server to search 552 * @cred: RPC credential to match 553 * 554 * Returns a pointer to an instantiated nfs4_state_owner struct, or NULL. 555 */ 556 struct nfs4_state_owner *nfs4_get_state_owner(struct nfs_server *server, 557 struct rpc_cred *cred, 558 gfp_t gfp_flags) 559 { 560 struct nfs_client *clp = server->nfs_client; 561 struct nfs4_state_owner *sp, *new; 562 563 spin_lock(&clp->cl_lock); 564 sp = nfs4_find_state_owner_locked(server, cred); 565 spin_unlock(&clp->cl_lock); 566 if (sp != NULL) 567 goto out; 568 new = nfs4_alloc_state_owner(server, cred, gfp_flags); 569 if (new == NULL) 570 goto out; 571 do { 572 if (ida_pre_get(&server->openowner_id, gfp_flags) == 0) 573 break; 574 spin_lock(&clp->cl_lock); 575 sp = nfs4_insert_state_owner_locked(new); 576 spin_unlock(&clp->cl_lock); 577 } while (sp == ERR_PTR(-EAGAIN)); 578 if (sp != new) 579 nfs4_free_state_owner(new); 580 out: 581 nfs4_gc_state_owners(server); 582 return sp; 583 } 584 585 /** 586 * nfs4_put_state_owner - Release a nfs4_state_owner 587 * @sp: state owner data to release 588 * 589 * Note that we keep released state owners on an LRU 590 * list. 591 * This caches valid state owners so that they can be 592 * reused, to avoid the OPEN_CONFIRM on minor version 0. 593 * It also pins the uniquifier of dropped state owners for 594 * a while, to ensure that those state owner names are 595 * never reused. 596 */ 597 void nfs4_put_state_owner(struct nfs4_state_owner *sp) 598 { 599 struct nfs_server *server = sp->so_server; 600 struct nfs_client *clp = server->nfs_client; 601 602 if (!atomic_dec_and_lock(&sp->so_count, &clp->cl_lock)) 603 return; 604 605 sp->so_expires = jiffies; 606 list_add_tail(&sp->so_lru, &server->state_owners_lru); 607 spin_unlock(&clp->cl_lock); 608 } 609 610 /** 611 * nfs4_purge_state_owners - Release all cached state owners 612 * @server: nfs_server with cached state owners to release 613 * 614 * Called at umount time. Remaining state owners will be on 615 * the LRU with ref count of zero. 616 */ 617 void nfs4_purge_state_owners(struct nfs_server *server) 618 { 619 struct nfs_client *clp = server->nfs_client; 620 struct nfs4_state_owner *sp, *tmp; 621 LIST_HEAD(doomed); 622 623 spin_lock(&clp->cl_lock); 624 list_for_each_entry_safe(sp, tmp, &server->state_owners_lru, so_lru) { 625 list_move(&sp->so_lru, &doomed); 626 nfs4_remove_state_owner_locked(sp); 627 } 628 spin_unlock(&clp->cl_lock); 629 630 list_for_each_entry_safe(sp, tmp, &doomed, so_lru) { 631 list_del(&sp->so_lru); 632 nfs4_free_state_owner(sp); 633 } 634 } 635 636 static struct nfs4_state * 637 nfs4_alloc_open_state(void) 638 { 639 struct nfs4_state *state; 640 641 state = kzalloc(sizeof(*state), GFP_NOFS); 642 if (!state) 643 return NULL; 644 atomic_set(&state->count, 1); 645 INIT_LIST_HEAD(&state->lock_states); 646 spin_lock_init(&state->state_lock); 647 seqlock_init(&state->seqlock); 648 return state; 649 } 650 651 void 652 nfs4_state_set_mode_locked(struct nfs4_state *state, fmode_t fmode) 653 { 654 if (state->state == fmode) 655 return; 656 /* NB! List reordering - see the reclaim code for why. */ 657 if ((fmode & FMODE_WRITE) != (state->state & FMODE_WRITE)) { 658 if (fmode & FMODE_WRITE) 659 list_move(&state->open_states, &state->owner->so_states); 660 else 661 list_move_tail(&state->open_states, &state->owner->so_states); 662 } 663 state->state = fmode; 664 } 665 666 static struct nfs4_state * 667 __nfs4_find_state_byowner(struct inode *inode, struct nfs4_state_owner *owner) 668 { 669 struct nfs_inode *nfsi = NFS_I(inode); 670 struct nfs4_state *state; 671 672 list_for_each_entry(state, &nfsi->open_states, inode_states) { 673 if (state->owner != owner) 674 continue; 675 if (!nfs4_valid_open_stateid(state)) 676 continue; 677 if (atomic_inc_not_zero(&state->count)) 678 return state; 679 } 680 return NULL; 681 } 682 683 static void 684 nfs4_free_open_state(struct nfs4_state *state) 685 { 686 kfree(state); 687 } 688 689 struct nfs4_state * 690 nfs4_get_open_state(struct inode *inode, struct nfs4_state_owner *owner) 691 { 692 struct nfs4_state *state, *new; 693 struct nfs_inode *nfsi = NFS_I(inode); 694 695 spin_lock(&inode->i_lock); 696 state = __nfs4_find_state_byowner(inode, owner); 697 spin_unlock(&inode->i_lock); 698 if (state) 699 goto out; 700 new = nfs4_alloc_open_state(); 701 spin_lock(&owner->so_lock); 702 spin_lock(&inode->i_lock); 703 state = __nfs4_find_state_byowner(inode, owner); 704 if (state == NULL && new != NULL) { 705 state = new; 706 state->owner = owner; 707 atomic_inc(&owner->so_count); 708 list_add(&state->inode_states, &nfsi->open_states); 709 ihold(inode); 710 state->inode = inode; 711 spin_unlock(&inode->i_lock); 712 /* Note: The reclaim code dictates that we add stateless 713 * and read-only stateids to the end of the list */ 714 list_add_tail(&state->open_states, &owner->so_states); 715 spin_unlock(&owner->so_lock); 716 } else { 717 spin_unlock(&inode->i_lock); 718 spin_unlock(&owner->so_lock); 719 if (new) 720 nfs4_free_open_state(new); 721 } 722 out: 723 return state; 724 } 725 726 void nfs4_put_open_state(struct nfs4_state *state) 727 { 728 struct inode *inode = state->inode; 729 struct nfs4_state_owner *owner = state->owner; 730 731 if (!atomic_dec_and_lock(&state->count, &owner->so_lock)) 732 return; 733 spin_lock(&inode->i_lock); 734 list_del(&state->inode_states); 735 list_del(&state->open_states); 736 spin_unlock(&inode->i_lock); 737 spin_unlock(&owner->so_lock); 738 iput(inode); 739 nfs4_free_open_state(state); 740 nfs4_put_state_owner(owner); 741 } 742 743 /* 744 * Close the current file. 745 */ 746 static void __nfs4_close(struct nfs4_state *state, 747 fmode_t fmode, gfp_t gfp_mask, int wait) 748 { 749 struct nfs4_state_owner *owner = state->owner; 750 int call_close = 0; 751 fmode_t newstate; 752 753 atomic_inc(&owner->so_count); 754 /* Protect against nfs4_find_state() */ 755 spin_lock(&owner->so_lock); 756 switch (fmode & (FMODE_READ | FMODE_WRITE)) { 757 case FMODE_READ: 758 state->n_rdonly--; 759 break; 760 case FMODE_WRITE: 761 state->n_wronly--; 762 break; 763 case FMODE_READ|FMODE_WRITE: 764 state->n_rdwr--; 765 } 766 newstate = FMODE_READ|FMODE_WRITE; 767 if (state->n_rdwr == 0) { 768 if (state->n_rdonly == 0) { 769 newstate &= ~FMODE_READ; 770 call_close |= test_bit(NFS_O_RDONLY_STATE, &state->flags); 771 call_close |= test_bit(NFS_O_RDWR_STATE, &state->flags); 772 } 773 if (state->n_wronly == 0) { 774 newstate &= ~FMODE_WRITE; 775 call_close |= test_bit(NFS_O_WRONLY_STATE, &state->flags); 776 call_close |= test_bit(NFS_O_RDWR_STATE, &state->flags); 777 } 778 if (newstate == 0) 779 clear_bit(NFS_DELEGATED_STATE, &state->flags); 780 } 781 nfs4_state_set_mode_locked(state, newstate); 782 spin_unlock(&owner->so_lock); 783 784 if (!call_close) { 785 nfs4_put_open_state(state); 786 nfs4_put_state_owner(owner); 787 } else 788 nfs4_do_close(state, gfp_mask, wait); 789 } 790 791 void nfs4_close_state(struct nfs4_state *state, fmode_t fmode) 792 { 793 __nfs4_close(state, fmode, GFP_NOFS, 0); 794 } 795 796 void nfs4_close_sync(struct nfs4_state *state, fmode_t fmode) 797 { 798 __nfs4_close(state, fmode, GFP_KERNEL, 1); 799 } 800 801 /* 802 * Search the state->lock_states for an existing lock_owner 803 * that is compatible with current->files 804 */ 805 static struct nfs4_lock_state * 806 __nfs4_find_lock_state(struct nfs4_state *state, fl_owner_t fl_owner) 807 { 808 struct nfs4_lock_state *pos; 809 list_for_each_entry(pos, &state->lock_states, ls_locks) { 810 if (pos->ls_owner != fl_owner) 811 continue; 812 atomic_inc(&pos->ls_count); 813 return pos; 814 } 815 return NULL; 816 } 817 818 /* 819 * Return a compatible lock_state. If no initialized lock_state structure 820 * exists, return an uninitialized one. 821 * 822 */ 823 static struct nfs4_lock_state *nfs4_alloc_lock_state(struct nfs4_state *state, fl_owner_t fl_owner) 824 { 825 struct nfs4_lock_state *lsp; 826 struct nfs_server *server = state->owner->so_server; 827 828 lsp = kzalloc(sizeof(*lsp), GFP_NOFS); 829 if (lsp == NULL) 830 return NULL; 831 nfs4_init_seqid_counter(&lsp->ls_seqid); 832 atomic_set(&lsp->ls_count, 1); 833 lsp->ls_state = state; 834 lsp->ls_owner = fl_owner; 835 lsp->ls_seqid.owner_id = ida_simple_get(&server->lockowner_id, 0, 0, GFP_NOFS); 836 if (lsp->ls_seqid.owner_id < 0) 837 goto out_free; 838 INIT_LIST_HEAD(&lsp->ls_locks); 839 return lsp; 840 out_free: 841 kfree(lsp); 842 return NULL; 843 } 844 845 void nfs4_free_lock_state(struct nfs_server *server, struct nfs4_lock_state *lsp) 846 { 847 ida_simple_remove(&server->lockowner_id, lsp->ls_seqid.owner_id); 848 nfs4_destroy_seqid_counter(&lsp->ls_seqid); 849 kfree(lsp); 850 } 851 852 /* 853 * Return a compatible lock_state. If no initialized lock_state structure 854 * exists, return an uninitialized one. 855 * 856 */ 857 static struct nfs4_lock_state *nfs4_get_lock_state(struct nfs4_state *state, fl_owner_t owner) 858 { 859 struct nfs4_lock_state *lsp, *new = NULL; 860 861 for(;;) { 862 spin_lock(&state->state_lock); 863 lsp = __nfs4_find_lock_state(state, owner); 864 if (lsp != NULL) 865 break; 866 if (new != NULL) { 867 list_add(&new->ls_locks, &state->lock_states); 868 set_bit(LK_STATE_IN_USE, &state->flags); 869 lsp = new; 870 new = NULL; 871 break; 872 } 873 spin_unlock(&state->state_lock); 874 new = nfs4_alloc_lock_state(state, owner); 875 if (new == NULL) 876 return NULL; 877 } 878 spin_unlock(&state->state_lock); 879 if (new != NULL) 880 nfs4_free_lock_state(state->owner->so_server, new); 881 return lsp; 882 } 883 884 /* 885 * Release reference to lock_state, and free it if we see that 886 * it is no longer in use 887 */ 888 void nfs4_put_lock_state(struct nfs4_lock_state *lsp) 889 { 890 struct nfs_server *server; 891 struct nfs4_state *state; 892 893 if (lsp == NULL) 894 return; 895 state = lsp->ls_state; 896 if (!atomic_dec_and_lock(&lsp->ls_count, &state->state_lock)) 897 return; 898 list_del(&lsp->ls_locks); 899 if (list_empty(&state->lock_states)) 900 clear_bit(LK_STATE_IN_USE, &state->flags); 901 spin_unlock(&state->state_lock); 902 server = state->owner->so_server; 903 if (test_bit(NFS_LOCK_INITIALIZED, &lsp->ls_flags)) { 904 struct nfs_client *clp = server->nfs_client; 905 906 clp->cl_mvops->free_lock_state(server, lsp); 907 } else 908 nfs4_free_lock_state(server, lsp); 909 } 910 911 static void nfs4_fl_copy_lock(struct file_lock *dst, struct file_lock *src) 912 { 913 struct nfs4_lock_state *lsp = src->fl_u.nfs4_fl.owner; 914 915 dst->fl_u.nfs4_fl.owner = lsp; 916 atomic_inc(&lsp->ls_count); 917 } 918 919 static void nfs4_fl_release_lock(struct file_lock *fl) 920 { 921 nfs4_put_lock_state(fl->fl_u.nfs4_fl.owner); 922 } 923 924 static const struct file_lock_operations nfs4_fl_lock_ops = { 925 .fl_copy_lock = nfs4_fl_copy_lock, 926 .fl_release_private = nfs4_fl_release_lock, 927 }; 928 929 int nfs4_set_lock_state(struct nfs4_state *state, struct file_lock *fl) 930 { 931 struct nfs4_lock_state *lsp; 932 933 if (fl->fl_ops != NULL) 934 return 0; 935 lsp = nfs4_get_lock_state(state, fl->fl_owner); 936 if (lsp == NULL) 937 return -ENOMEM; 938 fl->fl_u.nfs4_fl.owner = lsp; 939 fl->fl_ops = &nfs4_fl_lock_ops; 940 return 0; 941 } 942 943 static int nfs4_copy_lock_stateid(nfs4_stateid *dst, 944 struct nfs4_state *state, 945 const struct nfs_lockowner *lockowner) 946 { 947 struct nfs4_lock_state *lsp; 948 fl_owner_t fl_owner; 949 int ret = -ENOENT; 950 951 952 if (lockowner == NULL) 953 goto out; 954 955 if (test_bit(LK_STATE_IN_USE, &state->flags) == 0) 956 goto out; 957 958 fl_owner = lockowner->l_owner; 959 spin_lock(&state->state_lock); 960 lsp = __nfs4_find_lock_state(state, fl_owner); 961 if (lsp && test_bit(NFS_LOCK_LOST, &lsp->ls_flags)) 962 ret = -EIO; 963 else if (lsp != NULL && test_bit(NFS_LOCK_INITIALIZED, &lsp->ls_flags) != 0) { 964 nfs4_stateid_copy(dst, &lsp->ls_stateid); 965 ret = 0; 966 } 967 spin_unlock(&state->state_lock); 968 nfs4_put_lock_state(lsp); 969 out: 970 return ret; 971 } 972 973 static void nfs4_copy_open_stateid(nfs4_stateid *dst, struct nfs4_state *state) 974 { 975 const nfs4_stateid *src; 976 int seq; 977 978 do { 979 src = &zero_stateid; 980 seq = read_seqbegin(&state->seqlock); 981 if (test_bit(NFS_OPEN_STATE, &state->flags)) 982 src = &state->open_stateid; 983 nfs4_stateid_copy(dst, src); 984 } while (read_seqretry(&state->seqlock, seq)); 985 } 986 987 /* 988 * Byte-range lock aware utility to initialize the stateid of read/write 989 * requests. 990 */ 991 int nfs4_select_rw_stateid(nfs4_stateid *dst, struct nfs4_state *state, 992 fmode_t fmode, const struct nfs_lockowner *lockowner) 993 { 994 int ret = nfs4_copy_lock_stateid(dst, state, lockowner); 995 if (ret == -EIO) 996 /* A lost lock - don't even consider delegations */ 997 goto out; 998 /* returns true if delegation stateid found and copied */ 999 if (nfs4_copy_delegation_stateid(dst, state->inode, fmode)) { 1000 ret = 0; 1001 goto out; 1002 } 1003 if (ret != -ENOENT) 1004 /* nfs4_copy_delegation_stateid() didn't over-write 1005 * dst, so it still has the lock stateid which we now 1006 * choose to use. 1007 */ 1008 goto out; 1009 nfs4_copy_open_stateid(dst, state); 1010 ret = 0; 1011 out: 1012 if (nfs_server_capable(state->inode, NFS_CAP_STATEID_NFSV41)) 1013 dst->seqid = 0; 1014 return ret; 1015 } 1016 1017 struct nfs_seqid *nfs_alloc_seqid(struct nfs_seqid_counter *counter, gfp_t gfp_mask) 1018 { 1019 struct nfs_seqid *new; 1020 1021 new = kmalloc(sizeof(*new), gfp_mask); 1022 if (new == NULL) 1023 return ERR_PTR(-ENOMEM); 1024 new->sequence = counter; 1025 INIT_LIST_HEAD(&new->list); 1026 new->task = NULL; 1027 return new; 1028 } 1029 1030 void nfs_release_seqid(struct nfs_seqid *seqid) 1031 { 1032 struct nfs_seqid_counter *sequence; 1033 1034 if (seqid == NULL || list_empty(&seqid->list)) 1035 return; 1036 sequence = seqid->sequence; 1037 spin_lock(&sequence->lock); 1038 list_del_init(&seqid->list); 1039 if (!list_empty(&sequence->list)) { 1040 struct nfs_seqid *next; 1041 1042 next = list_first_entry(&sequence->list, 1043 struct nfs_seqid, list); 1044 rpc_wake_up_queued_task(&sequence->wait, next->task); 1045 } 1046 spin_unlock(&sequence->lock); 1047 } 1048 1049 void nfs_free_seqid(struct nfs_seqid *seqid) 1050 { 1051 nfs_release_seqid(seqid); 1052 kfree(seqid); 1053 } 1054 1055 /* 1056 * Increment the seqid if the OPEN/OPEN_DOWNGRADE/CLOSE succeeded, or 1057 * failed with a seqid incrementing error - 1058 * see comments nfs4.h:seqid_mutating_error() 1059 */ 1060 static void nfs_increment_seqid(int status, struct nfs_seqid *seqid) 1061 { 1062 switch (status) { 1063 case 0: 1064 break; 1065 case -NFS4ERR_BAD_SEQID: 1066 if (seqid->sequence->flags & NFS_SEQID_CONFIRMED) 1067 return; 1068 pr_warn_ratelimited("NFS: v4 server returned a bad" 1069 " sequence-id error on an" 1070 " unconfirmed sequence %p!\n", 1071 seqid->sequence); 1072 case -NFS4ERR_STALE_CLIENTID: 1073 case -NFS4ERR_STALE_STATEID: 1074 case -NFS4ERR_BAD_STATEID: 1075 case -NFS4ERR_BADXDR: 1076 case -NFS4ERR_RESOURCE: 1077 case -NFS4ERR_NOFILEHANDLE: 1078 /* Non-seqid mutating errors */ 1079 return; 1080 }; 1081 /* 1082 * Note: no locking needed as we are guaranteed to be first 1083 * on the sequence list 1084 */ 1085 seqid->sequence->counter++; 1086 } 1087 1088 void nfs_increment_open_seqid(int status, struct nfs_seqid *seqid) 1089 { 1090 struct nfs4_state_owner *sp; 1091 1092 if (seqid == NULL) 1093 return; 1094 1095 sp = container_of(seqid->sequence, struct nfs4_state_owner, so_seqid); 1096 if (status == -NFS4ERR_BAD_SEQID) 1097 nfs4_drop_state_owner(sp); 1098 if (!nfs4_has_session(sp->so_server->nfs_client)) 1099 nfs_increment_seqid(status, seqid); 1100 } 1101 1102 /* 1103 * Increment the seqid if the LOCK/LOCKU succeeded, or 1104 * failed with a seqid incrementing error - 1105 * see comments nfs4.h:seqid_mutating_error() 1106 */ 1107 void nfs_increment_lock_seqid(int status, struct nfs_seqid *seqid) 1108 { 1109 if (seqid != NULL) 1110 nfs_increment_seqid(status, seqid); 1111 } 1112 1113 int nfs_wait_on_sequence(struct nfs_seqid *seqid, struct rpc_task *task) 1114 { 1115 struct nfs_seqid_counter *sequence; 1116 int status = 0; 1117 1118 if (seqid == NULL) 1119 goto out; 1120 sequence = seqid->sequence; 1121 spin_lock(&sequence->lock); 1122 seqid->task = task; 1123 if (list_empty(&seqid->list)) 1124 list_add_tail(&seqid->list, &sequence->list); 1125 if (list_first_entry(&sequence->list, struct nfs_seqid, list) == seqid) 1126 goto unlock; 1127 rpc_sleep_on(&sequence->wait, task, NULL); 1128 status = -EAGAIN; 1129 unlock: 1130 spin_unlock(&sequence->lock); 1131 out: 1132 return status; 1133 } 1134 1135 static int nfs4_run_state_manager(void *); 1136 1137 static void nfs4_clear_state_manager_bit(struct nfs_client *clp) 1138 { 1139 smp_mb__before_atomic(); 1140 clear_bit(NFS4CLNT_MANAGER_RUNNING, &clp->cl_state); 1141 smp_mb__after_atomic(); 1142 wake_up_bit(&clp->cl_state, NFS4CLNT_MANAGER_RUNNING); 1143 rpc_wake_up(&clp->cl_rpcwaitq); 1144 } 1145 1146 /* 1147 * Schedule the nfs_client asynchronous state management routine 1148 */ 1149 void nfs4_schedule_state_manager(struct nfs_client *clp) 1150 { 1151 struct task_struct *task; 1152 char buf[INET6_ADDRSTRLEN + sizeof("-manager") + 1]; 1153 1154 if (test_and_set_bit(NFS4CLNT_MANAGER_RUNNING, &clp->cl_state) != 0) 1155 return; 1156 __module_get(THIS_MODULE); 1157 atomic_inc(&clp->cl_count); 1158 1159 /* The rcu_read_lock() is not strictly necessary, as the state 1160 * manager is the only thread that ever changes the rpc_xprt 1161 * after it's initialized. At this point, we're single threaded. */ 1162 rcu_read_lock(); 1163 snprintf(buf, sizeof(buf), "%s-manager", 1164 rpc_peeraddr2str(clp->cl_rpcclient, RPC_DISPLAY_ADDR)); 1165 rcu_read_unlock(); 1166 task = kthread_run(nfs4_run_state_manager, clp, "%s", buf); 1167 if (IS_ERR(task)) { 1168 printk(KERN_ERR "%s: kthread_run: %ld\n", 1169 __func__, PTR_ERR(task)); 1170 nfs4_clear_state_manager_bit(clp); 1171 nfs_put_client(clp); 1172 module_put(THIS_MODULE); 1173 } 1174 } 1175 1176 /* 1177 * Schedule a lease recovery attempt 1178 */ 1179 void nfs4_schedule_lease_recovery(struct nfs_client *clp) 1180 { 1181 if (!clp) 1182 return; 1183 if (!test_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state)) 1184 set_bit(NFS4CLNT_CHECK_LEASE, &clp->cl_state); 1185 dprintk("%s: scheduling lease recovery for server %s\n", __func__, 1186 clp->cl_hostname); 1187 nfs4_schedule_state_manager(clp); 1188 } 1189 EXPORT_SYMBOL_GPL(nfs4_schedule_lease_recovery); 1190 1191 /** 1192 * nfs4_schedule_migration_recovery - trigger migration recovery 1193 * 1194 * @server: FSID that is migrating 1195 * 1196 * Returns zero if recovery has started, otherwise a negative NFS4ERR 1197 * value is returned. 1198 */ 1199 int nfs4_schedule_migration_recovery(const struct nfs_server *server) 1200 { 1201 struct nfs_client *clp = server->nfs_client; 1202 1203 if (server->fh_expire_type != NFS4_FH_PERSISTENT) { 1204 pr_err("NFS: volatile file handles not supported (server %s)\n", 1205 clp->cl_hostname); 1206 return -NFS4ERR_IO; 1207 } 1208 1209 if (test_bit(NFS_MIG_FAILED, &server->mig_status)) 1210 return -NFS4ERR_IO; 1211 1212 dprintk("%s: scheduling migration recovery for (%llx:%llx) on %s\n", 1213 __func__, 1214 (unsigned long long)server->fsid.major, 1215 (unsigned long long)server->fsid.minor, 1216 clp->cl_hostname); 1217 1218 set_bit(NFS_MIG_IN_TRANSITION, 1219 &((struct nfs_server *)server)->mig_status); 1220 set_bit(NFS4CLNT_MOVED, &clp->cl_state); 1221 1222 nfs4_schedule_state_manager(clp); 1223 return 0; 1224 } 1225 EXPORT_SYMBOL_GPL(nfs4_schedule_migration_recovery); 1226 1227 /** 1228 * nfs4_schedule_lease_moved_recovery - start lease-moved recovery 1229 * 1230 * @clp: server to check for moved leases 1231 * 1232 */ 1233 void nfs4_schedule_lease_moved_recovery(struct nfs_client *clp) 1234 { 1235 dprintk("%s: scheduling lease-moved recovery for client ID %llx on %s\n", 1236 __func__, clp->cl_clientid, clp->cl_hostname); 1237 1238 set_bit(NFS4CLNT_LEASE_MOVED, &clp->cl_state); 1239 nfs4_schedule_state_manager(clp); 1240 } 1241 EXPORT_SYMBOL_GPL(nfs4_schedule_lease_moved_recovery); 1242 1243 int nfs4_wait_clnt_recover(struct nfs_client *clp) 1244 { 1245 int res; 1246 1247 might_sleep(); 1248 1249 atomic_inc(&clp->cl_count); 1250 res = wait_on_bit_action(&clp->cl_state, NFS4CLNT_MANAGER_RUNNING, 1251 nfs_wait_bit_killable, TASK_KILLABLE); 1252 if (res) 1253 goto out; 1254 if (clp->cl_cons_state < 0) 1255 res = clp->cl_cons_state; 1256 out: 1257 nfs_put_client(clp); 1258 return res; 1259 } 1260 1261 int nfs4_client_recover_expired_lease(struct nfs_client *clp) 1262 { 1263 unsigned int loop; 1264 int ret; 1265 1266 for (loop = NFS4_MAX_LOOP_ON_RECOVER; loop != 0; loop--) { 1267 ret = nfs4_wait_clnt_recover(clp); 1268 if (ret != 0) 1269 break; 1270 if (!test_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state) && 1271 !test_bit(NFS4CLNT_CHECK_LEASE,&clp->cl_state)) 1272 break; 1273 nfs4_schedule_state_manager(clp); 1274 ret = -EIO; 1275 } 1276 return ret; 1277 } 1278 1279 /* 1280 * nfs40_handle_cb_pathdown - return all delegations after NFS4ERR_CB_PATH_DOWN 1281 * @clp: client to process 1282 * 1283 * Set the NFS4CLNT_LEASE_EXPIRED state in order to force a 1284 * resend of the SETCLIENTID and hence re-establish the 1285 * callback channel. Then return all existing delegations. 1286 */ 1287 static void nfs40_handle_cb_pathdown(struct nfs_client *clp) 1288 { 1289 set_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state); 1290 nfs_expire_all_delegations(clp); 1291 dprintk("%s: handling CB_PATHDOWN recovery for server %s\n", __func__, 1292 clp->cl_hostname); 1293 } 1294 1295 void nfs4_schedule_path_down_recovery(struct nfs_client *clp) 1296 { 1297 nfs40_handle_cb_pathdown(clp); 1298 nfs4_schedule_state_manager(clp); 1299 } 1300 1301 static int nfs4_state_mark_reclaim_reboot(struct nfs_client *clp, struct nfs4_state *state) 1302 { 1303 1304 set_bit(NFS_STATE_RECLAIM_REBOOT, &state->flags); 1305 /* Don't recover state that expired before the reboot */ 1306 if (test_bit(NFS_STATE_RECLAIM_NOGRACE, &state->flags)) { 1307 clear_bit(NFS_STATE_RECLAIM_REBOOT, &state->flags); 1308 return 0; 1309 } 1310 set_bit(NFS_OWNER_RECLAIM_REBOOT, &state->owner->so_flags); 1311 set_bit(NFS4CLNT_RECLAIM_REBOOT, &clp->cl_state); 1312 return 1; 1313 } 1314 1315 int nfs4_state_mark_reclaim_nograce(struct nfs_client *clp, struct nfs4_state *state) 1316 { 1317 set_bit(NFS_STATE_RECLAIM_NOGRACE, &state->flags); 1318 clear_bit(NFS_STATE_RECLAIM_REBOOT, &state->flags); 1319 set_bit(NFS_OWNER_RECLAIM_NOGRACE, &state->owner->so_flags); 1320 set_bit(NFS4CLNT_RECLAIM_NOGRACE, &clp->cl_state); 1321 return 1; 1322 } 1323 1324 int nfs4_schedule_stateid_recovery(const struct nfs_server *server, struct nfs4_state *state) 1325 { 1326 struct nfs_client *clp = server->nfs_client; 1327 1328 if (!nfs4_valid_open_stateid(state)) 1329 return -EBADF; 1330 nfs4_state_mark_reclaim_nograce(clp, state); 1331 dprintk("%s: scheduling stateid recovery for server %s\n", __func__, 1332 clp->cl_hostname); 1333 nfs4_schedule_state_manager(clp); 1334 return 0; 1335 } 1336 EXPORT_SYMBOL_GPL(nfs4_schedule_stateid_recovery); 1337 1338 void nfs_inode_find_state_and_recover(struct inode *inode, 1339 const nfs4_stateid *stateid) 1340 { 1341 struct nfs_client *clp = NFS_SERVER(inode)->nfs_client; 1342 struct nfs_inode *nfsi = NFS_I(inode); 1343 struct nfs_open_context *ctx; 1344 struct nfs4_state *state; 1345 bool found = false; 1346 1347 spin_lock(&inode->i_lock); 1348 list_for_each_entry(ctx, &nfsi->open_files, list) { 1349 state = ctx->state; 1350 if (state == NULL) 1351 continue; 1352 if (!test_bit(NFS_DELEGATED_STATE, &state->flags)) 1353 continue; 1354 if (!nfs4_stateid_match(&state->stateid, stateid)) 1355 continue; 1356 nfs4_state_mark_reclaim_nograce(clp, state); 1357 found = true; 1358 } 1359 spin_unlock(&inode->i_lock); 1360 if (found) 1361 nfs4_schedule_state_manager(clp); 1362 } 1363 1364 static void nfs4_state_mark_open_context_bad(struct nfs4_state *state) 1365 { 1366 struct inode *inode = state->inode; 1367 struct nfs_inode *nfsi = NFS_I(inode); 1368 struct nfs_open_context *ctx; 1369 1370 spin_lock(&inode->i_lock); 1371 list_for_each_entry(ctx, &nfsi->open_files, list) { 1372 if (ctx->state != state) 1373 continue; 1374 set_bit(NFS_CONTEXT_BAD, &ctx->flags); 1375 } 1376 spin_unlock(&inode->i_lock); 1377 } 1378 1379 static void nfs4_state_mark_recovery_failed(struct nfs4_state *state, int error) 1380 { 1381 set_bit(NFS_STATE_RECOVERY_FAILED, &state->flags); 1382 nfs4_state_mark_open_context_bad(state); 1383 } 1384 1385 1386 static int nfs4_reclaim_locks(struct nfs4_state *state, const struct nfs4_state_recovery_ops *ops) 1387 { 1388 struct inode *inode = state->inode; 1389 struct nfs_inode *nfsi = NFS_I(inode); 1390 struct file_lock *fl; 1391 int status = 0; 1392 struct file_lock_context *flctx = inode->i_flctx; 1393 struct list_head *list; 1394 1395 if (flctx == NULL) 1396 return 0; 1397 1398 list = &flctx->flc_posix; 1399 1400 /* Guard against delegation returns and new lock/unlock calls */ 1401 down_write(&nfsi->rwsem); 1402 spin_lock(&flctx->flc_lock); 1403 restart: 1404 list_for_each_entry(fl, list, fl_list) { 1405 if (nfs_file_open_context(fl->fl_file)->state != state) 1406 continue; 1407 spin_unlock(&flctx->flc_lock); 1408 status = ops->recover_lock(state, fl); 1409 switch (status) { 1410 case 0: 1411 break; 1412 case -ESTALE: 1413 case -NFS4ERR_ADMIN_REVOKED: 1414 case -NFS4ERR_STALE_STATEID: 1415 case -NFS4ERR_BAD_STATEID: 1416 case -NFS4ERR_EXPIRED: 1417 case -NFS4ERR_NO_GRACE: 1418 case -NFS4ERR_STALE_CLIENTID: 1419 case -NFS4ERR_BADSESSION: 1420 case -NFS4ERR_BADSLOT: 1421 case -NFS4ERR_BAD_HIGH_SLOT: 1422 case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION: 1423 goto out; 1424 default: 1425 pr_err("NFS: %s: unhandled error %d\n", 1426 __func__, status); 1427 case -ENOMEM: 1428 case -NFS4ERR_DENIED: 1429 case -NFS4ERR_RECLAIM_BAD: 1430 case -NFS4ERR_RECLAIM_CONFLICT: 1431 /* kill_proc(fl->fl_pid, SIGLOST, 1); */ 1432 status = 0; 1433 } 1434 spin_lock(&flctx->flc_lock); 1435 } 1436 if (list == &flctx->flc_posix) { 1437 list = &flctx->flc_flock; 1438 goto restart; 1439 } 1440 spin_unlock(&flctx->flc_lock); 1441 out: 1442 up_write(&nfsi->rwsem); 1443 return status; 1444 } 1445 1446 static int nfs4_reclaim_open_state(struct nfs4_state_owner *sp, const struct nfs4_state_recovery_ops *ops) 1447 { 1448 struct nfs4_state *state; 1449 struct nfs4_lock_state *lock; 1450 int status = 0; 1451 1452 /* Note: we rely on the sp->so_states list being ordered 1453 * so that we always reclaim open(O_RDWR) and/or open(O_WRITE) 1454 * states first. 1455 * This is needed to ensure that the server won't give us any 1456 * read delegations that we have to return if, say, we are 1457 * recovering after a network partition or a reboot from a 1458 * server that doesn't support a grace period. 1459 */ 1460 spin_lock(&sp->so_lock); 1461 raw_write_seqcount_begin(&sp->so_reclaim_seqcount); 1462 restart: 1463 list_for_each_entry(state, &sp->so_states, open_states) { 1464 if (!test_and_clear_bit(ops->state_flag_bit, &state->flags)) 1465 continue; 1466 if (!nfs4_valid_open_stateid(state)) 1467 continue; 1468 if (state->state == 0) 1469 continue; 1470 atomic_inc(&state->count); 1471 spin_unlock(&sp->so_lock); 1472 status = ops->recover_open(sp, state); 1473 if (status >= 0) { 1474 status = nfs4_reclaim_locks(state, ops); 1475 if (status >= 0) { 1476 if (!test_bit(NFS_DELEGATED_STATE, &state->flags)) { 1477 spin_lock(&state->state_lock); 1478 list_for_each_entry(lock, &state->lock_states, ls_locks) { 1479 if (!test_bit(NFS_LOCK_INITIALIZED, &lock->ls_flags)) 1480 pr_warn_ratelimited("NFS: " 1481 "%s: Lock reclaim " 1482 "failed!\n", __func__); 1483 } 1484 spin_unlock(&state->state_lock); 1485 } 1486 nfs4_put_open_state(state); 1487 clear_bit(NFS_STATE_RECLAIM_NOGRACE, 1488 &state->flags); 1489 spin_lock(&sp->so_lock); 1490 goto restart; 1491 } 1492 } 1493 switch (status) { 1494 default: 1495 printk(KERN_ERR "NFS: %s: unhandled error %d\n", 1496 __func__, status); 1497 case -ENOENT: 1498 case -ENOMEM: 1499 case -ESTALE: 1500 /* Open state on this file cannot be recovered */ 1501 nfs4_state_mark_recovery_failed(state, status); 1502 break; 1503 case -EAGAIN: 1504 ssleep(1); 1505 case -NFS4ERR_ADMIN_REVOKED: 1506 case -NFS4ERR_STALE_STATEID: 1507 case -NFS4ERR_BAD_STATEID: 1508 case -NFS4ERR_RECLAIM_BAD: 1509 case -NFS4ERR_RECLAIM_CONFLICT: 1510 nfs4_state_mark_reclaim_nograce(sp->so_server->nfs_client, state); 1511 break; 1512 case -NFS4ERR_EXPIRED: 1513 case -NFS4ERR_NO_GRACE: 1514 nfs4_state_mark_reclaim_nograce(sp->so_server->nfs_client, state); 1515 case -NFS4ERR_STALE_CLIENTID: 1516 case -NFS4ERR_BADSESSION: 1517 case -NFS4ERR_BADSLOT: 1518 case -NFS4ERR_BAD_HIGH_SLOT: 1519 case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION: 1520 goto out_err; 1521 } 1522 nfs4_put_open_state(state); 1523 spin_lock(&sp->so_lock); 1524 goto restart; 1525 } 1526 raw_write_seqcount_end(&sp->so_reclaim_seqcount); 1527 spin_unlock(&sp->so_lock); 1528 return 0; 1529 out_err: 1530 nfs4_put_open_state(state); 1531 spin_lock(&sp->so_lock); 1532 raw_write_seqcount_end(&sp->so_reclaim_seqcount); 1533 spin_unlock(&sp->so_lock); 1534 return status; 1535 } 1536 1537 static void nfs4_clear_open_state(struct nfs4_state *state) 1538 { 1539 struct nfs4_lock_state *lock; 1540 1541 clear_bit(NFS_DELEGATED_STATE, &state->flags); 1542 clear_bit(NFS_O_RDONLY_STATE, &state->flags); 1543 clear_bit(NFS_O_WRONLY_STATE, &state->flags); 1544 clear_bit(NFS_O_RDWR_STATE, &state->flags); 1545 spin_lock(&state->state_lock); 1546 list_for_each_entry(lock, &state->lock_states, ls_locks) { 1547 lock->ls_seqid.flags = 0; 1548 clear_bit(NFS_LOCK_INITIALIZED, &lock->ls_flags); 1549 } 1550 spin_unlock(&state->state_lock); 1551 } 1552 1553 static void nfs4_reset_seqids(struct nfs_server *server, 1554 int (*mark_reclaim)(struct nfs_client *clp, struct nfs4_state *state)) 1555 { 1556 struct nfs_client *clp = server->nfs_client; 1557 struct nfs4_state_owner *sp; 1558 struct rb_node *pos; 1559 struct nfs4_state *state; 1560 1561 spin_lock(&clp->cl_lock); 1562 for (pos = rb_first(&server->state_owners); 1563 pos != NULL; 1564 pos = rb_next(pos)) { 1565 sp = rb_entry(pos, struct nfs4_state_owner, so_server_node); 1566 sp->so_seqid.flags = 0; 1567 spin_lock(&sp->so_lock); 1568 list_for_each_entry(state, &sp->so_states, open_states) { 1569 if (mark_reclaim(clp, state)) 1570 nfs4_clear_open_state(state); 1571 } 1572 spin_unlock(&sp->so_lock); 1573 } 1574 spin_unlock(&clp->cl_lock); 1575 } 1576 1577 static void nfs4_state_mark_reclaim_helper(struct nfs_client *clp, 1578 int (*mark_reclaim)(struct nfs_client *clp, struct nfs4_state *state)) 1579 { 1580 struct nfs_server *server; 1581 1582 rcu_read_lock(); 1583 list_for_each_entry_rcu(server, &clp->cl_superblocks, client_link) 1584 nfs4_reset_seqids(server, mark_reclaim); 1585 rcu_read_unlock(); 1586 } 1587 1588 static void nfs4_state_start_reclaim_reboot(struct nfs_client *clp) 1589 { 1590 /* Mark all delegations for reclaim */ 1591 nfs_delegation_mark_reclaim(clp); 1592 nfs4_state_mark_reclaim_helper(clp, nfs4_state_mark_reclaim_reboot); 1593 } 1594 1595 static void nfs4_reclaim_complete(struct nfs_client *clp, 1596 const struct nfs4_state_recovery_ops *ops, 1597 struct rpc_cred *cred) 1598 { 1599 /* Notify the server we're done reclaiming our state */ 1600 if (ops->reclaim_complete) 1601 (void)ops->reclaim_complete(clp, cred); 1602 } 1603 1604 static void nfs4_clear_reclaim_server(struct nfs_server *server) 1605 { 1606 struct nfs_client *clp = server->nfs_client; 1607 struct nfs4_state_owner *sp; 1608 struct rb_node *pos; 1609 struct nfs4_state *state; 1610 1611 spin_lock(&clp->cl_lock); 1612 for (pos = rb_first(&server->state_owners); 1613 pos != NULL; 1614 pos = rb_next(pos)) { 1615 sp = rb_entry(pos, struct nfs4_state_owner, so_server_node); 1616 spin_lock(&sp->so_lock); 1617 list_for_each_entry(state, &sp->so_states, open_states) { 1618 if (!test_and_clear_bit(NFS_STATE_RECLAIM_REBOOT, 1619 &state->flags)) 1620 continue; 1621 nfs4_state_mark_reclaim_nograce(clp, state); 1622 } 1623 spin_unlock(&sp->so_lock); 1624 } 1625 spin_unlock(&clp->cl_lock); 1626 } 1627 1628 static int nfs4_state_clear_reclaim_reboot(struct nfs_client *clp) 1629 { 1630 struct nfs_server *server; 1631 1632 if (!test_and_clear_bit(NFS4CLNT_RECLAIM_REBOOT, &clp->cl_state)) 1633 return 0; 1634 1635 rcu_read_lock(); 1636 list_for_each_entry_rcu(server, &clp->cl_superblocks, client_link) 1637 nfs4_clear_reclaim_server(server); 1638 rcu_read_unlock(); 1639 1640 nfs_delegation_reap_unclaimed(clp); 1641 return 1; 1642 } 1643 1644 static void nfs4_state_end_reclaim_reboot(struct nfs_client *clp) 1645 { 1646 const struct nfs4_state_recovery_ops *ops; 1647 struct rpc_cred *cred; 1648 1649 if (!nfs4_state_clear_reclaim_reboot(clp)) 1650 return; 1651 ops = clp->cl_mvops->reboot_recovery_ops; 1652 cred = nfs4_get_clid_cred(clp); 1653 nfs4_reclaim_complete(clp, ops, cred); 1654 put_rpccred(cred); 1655 } 1656 1657 static void nfs_delegation_clear_all(struct nfs_client *clp) 1658 { 1659 nfs_delegation_mark_reclaim(clp); 1660 nfs_delegation_reap_unclaimed(clp); 1661 } 1662 1663 static void nfs4_state_start_reclaim_nograce(struct nfs_client *clp) 1664 { 1665 nfs_delegation_clear_all(clp); 1666 nfs4_state_mark_reclaim_helper(clp, nfs4_state_mark_reclaim_nograce); 1667 } 1668 1669 static int nfs4_recovery_handle_error(struct nfs_client *clp, int error) 1670 { 1671 switch (error) { 1672 case 0: 1673 break; 1674 case -NFS4ERR_CB_PATH_DOWN: 1675 nfs40_handle_cb_pathdown(clp); 1676 break; 1677 case -NFS4ERR_NO_GRACE: 1678 nfs4_state_end_reclaim_reboot(clp); 1679 break; 1680 case -NFS4ERR_STALE_CLIENTID: 1681 set_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state); 1682 nfs4_state_clear_reclaim_reboot(clp); 1683 nfs4_state_start_reclaim_reboot(clp); 1684 break; 1685 case -NFS4ERR_EXPIRED: 1686 set_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state); 1687 nfs4_state_start_reclaim_nograce(clp); 1688 break; 1689 case -NFS4ERR_BADSESSION: 1690 case -NFS4ERR_BADSLOT: 1691 case -NFS4ERR_BAD_HIGH_SLOT: 1692 case -NFS4ERR_DEADSESSION: 1693 case -NFS4ERR_SEQ_FALSE_RETRY: 1694 case -NFS4ERR_SEQ_MISORDERED: 1695 set_bit(NFS4CLNT_SESSION_RESET, &clp->cl_state); 1696 /* Zero session reset errors */ 1697 break; 1698 case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION: 1699 set_bit(NFS4CLNT_BIND_CONN_TO_SESSION, &clp->cl_state); 1700 break; 1701 default: 1702 dprintk("%s: failed to handle error %d for server %s\n", 1703 __func__, error, clp->cl_hostname); 1704 return error; 1705 } 1706 dprintk("%s: handled error %d for server %s\n", __func__, error, 1707 clp->cl_hostname); 1708 return 0; 1709 } 1710 1711 static int nfs4_do_reclaim(struct nfs_client *clp, const struct nfs4_state_recovery_ops *ops) 1712 { 1713 struct nfs4_state_owner *sp; 1714 struct nfs_server *server; 1715 struct rb_node *pos; 1716 int status = 0; 1717 1718 restart: 1719 rcu_read_lock(); 1720 list_for_each_entry_rcu(server, &clp->cl_superblocks, client_link) { 1721 nfs4_purge_state_owners(server); 1722 spin_lock(&clp->cl_lock); 1723 for (pos = rb_first(&server->state_owners); 1724 pos != NULL; 1725 pos = rb_next(pos)) { 1726 sp = rb_entry(pos, 1727 struct nfs4_state_owner, so_server_node); 1728 if (!test_and_clear_bit(ops->owner_flag_bit, 1729 &sp->so_flags)) 1730 continue; 1731 if (!atomic_inc_not_zero(&sp->so_count)) 1732 continue; 1733 spin_unlock(&clp->cl_lock); 1734 rcu_read_unlock(); 1735 1736 status = nfs4_reclaim_open_state(sp, ops); 1737 if (status < 0) { 1738 set_bit(ops->owner_flag_bit, &sp->so_flags); 1739 nfs4_put_state_owner(sp); 1740 status = nfs4_recovery_handle_error(clp, status); 1741 return (status != 0) ? status : -EAGAIN; 1742 } 1743 1744 nfs4_put_state_owner(sp); 1745 goto restart; 1746 } 1747 spin_unlock(&clp->cl_lock); 1748 } 1749 rcu_read_unlock(); 1750 return 0; 1751 } 1752 1753 static int nfs4_check_lease(struct nfs_client *clp) 1754 { 1755 struct rpc_cred *cred; 1756 const struct nfs4_state_maintenance_ops *ops = 1757 clp->cl_mvops->state_renewal_ops; 1758 int status; 1759 1760 /* Is the client already known to have an expired lease? */ 1761 if (test_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state)) 1762 return 0; 1763 spin_lock(&clp->cl_lock); 1764 cred = ops->get_state_renewal_cred_locked(clp); 1765 spin_unlock(&clp->cl_lock); 1766 if (cred == NULL) { 1767 cred = nfs4_get_clid_cred(clp); 1768 status = -ENOKEY; 1769 if (cred == NULL) 1770 goto out; 1771 } 1772 status = ops->renew_lease(clp, cred); 1773 put_rpccred(cred); 1774 if (status == -ETIMEDOUT) { 1775 set_bit(NFS4CLNT_CHECK_LEASE, &clp->cl_state); 1776 return 0; 1777 } 1778 out: 1779 return nfs4_recovery_handle_error(clp, status); 1780 } 1781 1782 /* Set NFS4CLNT_LEASE_EXPIRED and reclaim reboot state for all v4.0 errors 1783 * and for recoverable errors on EXCHANGE_ID for v4.1 1784 */ 1785 static int nfs4_handle_reclaim_lease_error(struct nfs_client *clp, int status) 1786 { 1787 switch (status) { 1788 case -NFS4ERR_SEQ_MISORDERED: 1789 if (test_and_set_bit(NFS4CLNT_PURGE_STATE, &clp->cl_state)) 1790 return -ESERVERFAULT; 1791 /* Lease confirmation error: retry after purging the lease */ 1792 ssleep(1); 1793 clear_bit(NFS4CLNT_LEASE_CONFIRM, &clp->cl_state); 1794 break; 1795 case -NFS4ERR_STALE_CLIENTID: 1796 clear_bit(NFS4CLNT_LEASE_CONFIRM, &clp->cl_state); 1797 nfs4_state_start_reclaim_reboot(clp); 1798 break; 1799 case -NFS4ERR_CLID_INUSE: 1800 pr_err("NFS: Server %s reports our clientid is in use\n", 1801 clp->cl_hostname); 1802 nfs_mark_client_ready(clp, -EPERM); 1803 clear_bit(NFS4CLNT_LEASE_CONFIRM, &clp->cl_state); 1804 return -EPERM; 1805 case -EACCES: 1806 case -NFS4ERR_DELAY: 1807 case -ETIMEDOUT: 1808 case -EAGAIN: 1809 ssleep(1); 1810 break; 1811 1812 case -NFS4ERR_MINOR_VERS_MISMATCH: 1813 if (clp->cl_cons_state == NFS_CS_SESSION_INITING) 1814 nfs_mark_client_ready(clp, -EPROTONOSUPPORT); 1815 dprintk("%s: exit with error %d for server %s\n", 1816 __func__, -EPROTONOSUPPORT, clp->cl_hostname); 1817 return -EPROTONOSUPPORT; 1818 case -NFS4ERR_NOT_SAME: /* FixMe: implement recovery 1819 * in nfs4_exchange_id */ 1820 default: 1821 dprintk("%s: exit with error %d for server %s\n", __func__, 1822 status, clp->cl_hostname); 1823 return status; 1824 } 1825 set_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state); 1826 dprintk("%s: handled error %d for server %s\n", __func__, status, 1827 clp->cl_hostname); 1828 return 0; 1829 } 1830 1831 static int nfs4_establish_lease(struct nfs_client *clp) 1832 { 1833 struct rpc_cred *cred; 1834 const struct nfs4_state_recovery_ops *ops = 1835 clp->cl_mvops->reboot_recovery_ops; 1836 int status; 1837 1838 nfs4_begin_drain_session(clp); 1839 cred = nfs4_get_clid_cred(clp); 1840 if (cred == NULL) 1841 return -ENOENT; 1842 status = ops->establish_clid(clp, cred); 1843 put_rpccred(cred); 1844 if (status != 0) 1845 return status; 1846 pnfs_destroy_all_layouts(clp); 1847 return 0; 1848 } 1849 1850 /* 1851 * Returns zero or a negative errno. NFS4ERR values are converted 1852 * to local errno values. 1853 */ 1854 static int nfs4_reclaim_lease(struct nfs_client *clp) 1855 { 1856 int status; 1857 1858 status = nfs4_establish_lease(clp); 1859 if (status < 0) 1860 return nfs4_handle_reclaim_lease_error(clp, status); 1861 if (test_and_clear_bit(NFS4CLNT_SERVER_SCOPE_MISMATCH, &clp->cl_state)) 1862 nfs4_state_start_reclaim_nograce(clp); 1863 if (!test_bit(NFS4CLNT_RECLAIM_NOGRACE, &clp->cl_state)) 1864 set_bit(NFS4CLNT_RECLAIM_REBOOT, &clp->cl_state); 1865 clear_bit(NFS4CLNT_CHECK_LEASE, &clp->cl_state); 1866 clear_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state); 1867 return 0; 1868 } 1869 1870 static int nfs4_purge_lease(struct nfs_client *clp) 1871 { 1872 int status; 1873 1874 status = nfs4_establish_lease(clp); 1875 if (status < 0) 1876 return nfs4_handle_reclaim_lease_error(clp, status); 1877 clear_bit(NFS4CLNT_PURGE_STATE, &clp->cl_state); 1878 set_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state); 1879 nfs4_state_start_reclaim_nograce(clp); 1880 return 0; 1881 } 1882 1883 /* 1884 * Try remote migration of one FSID from a source server to a 1885 * destination server. The source server provides a list of 1886 * potential destinations. 1887 * 1888 * Returns zero or a negative NFS4ERR status code. 1889 */ 1890 static int nfs4_try_migration(struct nfs_server *server, struct rpc_cred *cred) 1891 { 1892 struct nfs_client *clp = server->nfs_client; 1893 struct nfs4_fs_locations *locations = NULL; 1894 struct inode *inode; 1895 struct page *page; 1896 int status, result; 1897 1898 dprintk("--> %s: FSID %llx:%llx on \"%s\"\n", __func__, 1899 (unsigned long long)server->fsid.major, 1900 (unsigned long long)server->fsid.minor, 1901 clp->cl_hostname); 1902 1903 result = 0; 1904 page = alloc_page(GFP_KERNEL); 1905 locations = kmalloc(sizeof(struct nfs4_fs_locations), GFP_KERNEL); 1906 if (page == NULL || locations == NULL) { 1907 dprintk("<-- %s: no memory\n", __func__); 1908 goto out; 1909 } 1910 1911 inode = d_inode(server->super->s_root); 1912 result = nfs4_proc_get_locations(inode, locations, page, cred); 1913 if (result) { 1914 dprintk("<-- %s: failed to retrieve fs_locations: %d\n", 1915 __func__, result); 1916 goto out; 1917 } 1918 1919 result = -NFS4ERR_NXIO; 1920 if (!(locations->fattr.valid & NFS_ATTR_FATTR_V4_LOCATIONS)) { 1921 dprintk("<-- %s: No fs_locations data, migration skipped\n", 1922 __func__); 1923 goto out; 1924 } 1925 1926 nfs4_begin_drain_session(clp); 1927 1928 status = nfs4_replace_transport(server, locations); 1929 if (status != 0) { 1930 dprintk("<-- %s: failed to replace transport: %d\n", 1931 __func__, status); 1932 goto out; 1933 } 1934 1935 result = 0; 1936 dprintk("<-- %s: migration succeeded\n", __func__); 1937 1938 out: 1939 if (page != NULL) 1940 __free_page(page); 1941 kfree(locations); 1942 if (result) { 1943 pr_err("NFS: migration recovery failed (server %s)\n", 1944 clp->cl_hostname); 1945 set_bit(NFS_MIG_FAILED, &server->mig_status); 1946 } 1947 return result; 1948 } 1949 1950 /* 1951 * Returns zero or a negative NFS4ERR status code. 1952 */ 1953 static int nfs4_handle_migration(struct nfs_client *clp) 1954 { 1955 const struct nfs4_state_maintenance_ops *ops = 1956 clp->cl_mvops->state_renewal_ops; 1957 struct nfs_server *server; 1958 struct rpc_cred *cred; 1959 1960 dprintk("%s: migration reported on \"%s\"\n", __func__, 1961 clp->cl_hostname); 1962 1963 spin_lock(&clp->cl_lock); 1964 cred = ops->get_state_renewal_cred_locked(clp); 1965 spin_unlock(&clp->cl_lock); 1966 if (cred == NULL) 1967 return -NFS4ERR_NOENT; 1968 1969 clp->cl_mig_gen++; 1970 restart: 1971 rcu_read_lock(); 1972 list_for_each_entry_rcu(server, &clp->cl_superblocks, client_link) { 1973 int status; 1974 1975 if (server->mig_gen == clp->cl_mig_gen) 1976 continue; 1977 server->mig_gen = clp->cl_mig_gen; 1978 1979 if (!test_and_clear_bit(NFS_MIG_IN_TRANSITION, 1980 &server->mig_status)) 1981 continue; 1982 1983 rcu_read_unlock(); 1984 status = nfs4_try_migration(server, cred); 1985 if (status < 0) { 1986 put_rpccred(cred); 1987 return status; 1988 } 1989 goto restart; 1990 } 1991 rcu_read_unlock(); 1992 put_rpccred(cred); 1993 return 0; 1994 } 1995 1996 /* 1997 * Test each nfs_server on the clp's cl_superblocks list to see 1998 * if it's moved to another server. Stop when the server no longer 1999 * returns NFS4ERR_LEASE_MOVED. 2000 */ 2001 static int nfs4_handle_lease_moved(struct nfs_client *clp) 2002 { 2003 const struct nfs4_state_maintenance_ops *ops = 2004 clp->cl_mvops->state_renewal_ops; 2005 struct nfs_server *server; 2006 struct rpc_cred *cred; 2007 2008 dprintk("%s: lease moved reported on \"%s\"\n", __func__, 2009 clp->cl_hostname); 2010 2011 spin_lock(&clp->cl_lock); 2012 cred = ops->get_state_renewal_cred_locked(clp); 2013 spin_unlock(&clp->cl_lock); 2014 if (cred == NULL) 2015 return -NFS4ERR_NOENT; 2016 2017 clp->cl_mig_gen++; 2018 restart: 2019 rcu_read_lock(); 2020 list_for_each_entry_rcu(server, &clp->cl_superblocks, client_link) { 2021 struct inode *inode; 2022 int status; 2023 2024 if (server->mig_gen == clp->cl_mig_gen) 2025 continue; 2026 server->mig_gen = clp->cl_mig_gen; 2027 2028 rcu_read_unlock(); 2029 2030 inode = d_inode(server->super->s_root); 2031 status = nfs4_proc_fsid_present(inode, cred); 2032 if (status != -NFS4ERR_MOVED) 2033 goto restart; /* wasn't this one */ 2034 if (nfs4_try_migration(server, cred) == -NFS4ERR_LEASE_MOVED) 2035 goto restart; /* there are more */ 2036 goto out; 2037 } 2038 rcu_read_unlock(); 2039 2040 out: 2041 put_rpccred(cred); 2042 return 0; 2043 } 2044 2045 /** 2046 * nfs4_discover_server_trunking - Detect server IP address trunking 2047 * 2048 * @clp: nfs_client under test 2049 * @result: OUT: found nfs_client, or clp 2050 * 2051 * Returns zero or a negative errno. If zero is returned, 2052 * an nfs_client pointer is planted in "result". 2053 * 2054 * Note: since we are invoked in process context, and 2055 * not from inside the state manager, we cannot use 2056 * nfs4_handle_reclaim_lease_error(). 2057 */ 2058 int nfs4_discover_server_trunking(struct nfs_client *clp, 2059 struct nfs_client **result) 2060 { 2061 const struct nfs4_state_recovery_ops *ops = 2062 clp->cl_mvops->reboot_recovery_ops; 2063 struct rpc_clnt *clnt; 2064 struct rpc_cred *cred; 2065 int i, status; 2066 2067 dprintk("NFS: %s: testing '%s'\n", __func__, clp->cl_hostname); 2068 2069 clnt = clp->cl_rpcclient; 2070 i = 0; 2071 2072 mutex_lock(&nfs_clid_init_mutex); 2073 again: 2074 status = -ENOENT; 2075 cred = nfs4_get_clid_cred(clp); 2076 if (cred == NULL) 2077 goto out_unlock; 2078 2079 status = ops->detect_trunking(clp, result, cred); 2080 put_rpccred(cred); 2081 switch (status) { 2082 case 0: 2083 break; 2084 case -ETIMEDOUT: 2085 if (clnt->cl_softrtry) 2086 break; 2087 case -NFS4ERR_DELAY: 2088 case -EAGAIN: 2089 ssleep(1); 2090 case -NFS4ERR_STALE_CLIENTID: 2091 dprintk("NFS: %s after status %d, retrying\n", 2092 __func__, status); 2093 goto again; 2094 case -EACCES: 2095 if (i++ == 0) { 2096 nfs4_root_machine_cred(clp); 2097 goto again; 2098 } 2099 if (clnt->cl_auth->au_flavor == RPC_AUTH_UNIX) 2100 break; 2101 case -NFS4ERR_CLID_INUSE: 2102 case -NFS4ERR_WRONGSEC: 2103 /* No point in retrying if we already used RPC_AUTH_UNIX */ 2104 if (clnt->cl_auth->au_flavor == RPC_AUTH_UNIX) { 2105 status = -EPERM; 2106 break; 2107 } 2108 clnt = rpc_clone_client_set_auth(clnt, RPC_AUTH_UNIX); 2109 if (IS_ERR(clnt)) { 2110 status = PTR_ERR(clnt); 2111 break; 2112 } 2113 /* Note: this is safe because we haven't yet marked the 2114 * client as ready, so we are the only user of 2115 * clp->cl_rpcclient 2116 */ 2117 clnt = xchg(&clp->cl_rpcclient, clnt); 2118 rpc_shutdown_client(clnt); 2119 clnt = clp->cl_rpcclient; 2120 goto again; 2121 2122 case -NFS4ERR_MINOR_VERS_MISMATCH: 2123 status = -EPROTONOSUPPORT; 2124 break; 2125 2126 case -EKEYEXPIRED: 2127 case -NFS4ERR_NOT_SAME: /* FixMe: implement recovery 2128 * in nfs4_exchange_id */ 2129 status = -EKEYEXPIRED; 2130 break; 2131 default: 2132 pr_warn("NFS: %s unhandled error %d. Exiting with error EIO\n", 2133 __func__, status); 2134 status = -EIO; 2135 } 2136 2137 out_unlock: 2138 mutex_unlock(&nfs_clid_init_mutex); 2139 dprintk("NFS: %s: status = %d\n", __func__, status); 2140 return status; 2141 } 2142 2143 #ifdef CONFIG_NFS_V4_1 2144 void nfs4_schedule_session_recovery(struct nfs4_session *session, int err) 2145 { 2146 struct nfs_client *clp = session->clp; 2147 2148 switch (err) { 2149 default: 2150 set_bit(NFS4CLNT_SESSION_RESET, &clp->cl_state); 2151 break; 2152 case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION: 2153 set_bit(NFS4CLNT_BIND_CONN_TO_SESSION, &clp->cl_state); 2154 } 2155 nfs4_schedule_lease_recovery(clp); 2156 } 2157 EXPORT_SYMBOL_GPL(nfs4_schedule_session_recovery); 2158 2159 void nfs41_notify_server(struct nfs_client *clp) 2160 { 2161 /* Use CHECK_LEASE to ping the server with a SEQUENCE */ 2162 set_bit(NFS4CLNT_CHECK_LEASE, &clp->cl_state); 2163 nfs4_schedule_state_manager(clp); 2164 } 2165 2166 static void nfs4_reset_all_state(struct nfs_client *clp) 2167 { 2168 if (test_and_set_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state) == 0) { 2169 set_bit(NFS4CLNT_PURGE_STATE, &clp->cl_state); 2170 clear_bit(NFS4CLNT_LEASE_CONFIRM, &clp->cl_state); 2171 nfs4_state_start_reclaim_nograce(clp); 2172 dprintk("%s: scheduling reset of all state for server %s!\n", 2173 __func__, clp->cl_hostname); 2174 nfs4_schedule_state_manager(clp); 2175 } 2176 } 2177 2178 static void nfs41_handle_server_reboot(struct nfs_client *clp) 2179 { 2180 if (test_and_set_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state) == 0) { 2181 nfs4_state_start_reclaim_reboot(clp); 2182 dprintk("%s: server %s rebooted!\n", __func__, 2183 clp->cl_hostname); 2184 nfs4_schedule_state_manager(clp); 2185 } 2186 } 2187 2188 static void nfs41_handle_all_state_revoked(struct nfs_client *clp) 2189 { 2190 nfs4_reset_all_state(clp); 2191 dprintk("%s: state revoked on server %s\n", __func__, clp->cl_hostname); 2192 } 2193 2194 static void nfs41_handle_some_state_revoked(struct nfs_client *clp) 2195 { 2196 nfs4_state_mark_reclaim_helper(clp, nfs4_state_mark_reclaim_nograce); 2197 nfs4_schedule_state_manager(clp); 2198 2199 dprintk("%s: state revoked on server %s\n", __func__, clp->cl_hostname); 2200 } 2201 2202 static void nfs41_handle_recallable_state_revoked(struct nfs_client *clp) 2203 { 2204 /* FIXME: For now, we destroy all layouts. */ 2205 pnfs_destroy_all_layouts(clp); 2206 /* FIXME: For now, we test all delegations+open state+locks. */ 2207 nfs41_handle_some_state_revoked(clp); 2208 dprintk("%s: Recallable state revoked on server %s!\n", __func__, 2209 clp->cl_hostname); 2210 } 2211 2212 static void nfs41_handle_backchannel_fault(struct nfs_client *clp) 2213 { 2214 set_bit(NFS4CLNT_SESSION_RESET, &clp->cl_state); 2215 nfs4_schedule_state_manager(clp); 2216 2217 dprintk("%s: server %s declared a backchannel fault\n", __func__, 2218 clp->cl_hostname); 2219 } 2220 2221 static void nfs41_handle_cb_path_down(struct nfs_client *clp) 2222 { 2223 if (test_and_set_bit(NFS4CLNT_BIND_CONN_TO_SESSION, 2224 &clp->cl_state) == 0) 2225 nfs4_schedule_state_manager(clp); 2226 } 2227 2228 void nfs41_handle_sequence_flag_errors(struct nfs_client *clp, u32 flags) 2229 { 2230 if (!flags) 2231 return; 2232 2233 dprintk("%s: \"%s\" (client ID %llx) flags=0x%08x\n", 2234 __func__, clp->cl_hostname, clp->cl_clientid, flags); 2235 2236 if (flags & SEQ4_STATUS_RESTART_RECLAIM_NEEDED) 2237 nfs41_handle_server_reboot(clp); 2238 if (flags & (SEQ4_STATUS_EXPIRED_ALL_STATE_REVOKED)) 2239 nfs41_handle_all_state_revoked(clp); 2240 if (flags & (SEQ4_STATUS_EXPIRED_SOME_STATE_REVOKED | 2241 SEQ4_STATUS_ADMIN_STATE_REVOKED)) 2242 nfs41_handle_some_state_revoked(clp); 2243 if (flags & SEQ4_STATUS_LEASE_MOVED) 2244 nfs4_schedule_lease_moved_recovery(clp); 2245 if (flags & SEQ4_STATUS_RECALLABLE_STATE_REVOKED) 2246 nfs41_handle_recallable_state_revoked(clp); 2247 if (flags & SEQ4_STATUS_BACKCHANNEL_FAULT) 2248 nfs41_handle_backchannel_fault(clp); 2249 else if (flags & (SEQ4_STATUS_CB_PATH_DOWN | 2250 SEQ4_STATUS_CB_PATH_DOWN_SESSION)) 2251 nfs41_handle_cb_path_down(clp); 2252 } 2253 2254 static int nfs4_reset_session(struct nfs_client *clp) 2255 { 2256 struct rpc_cred *cred; 2257 int status; 2258 2259 if (!nfs4_has_session(clp)) 2260 return 0; 2261 nfs4_begin_drain_session(clp); 2262 cred = nfs4_get_clid_cred(clp); 2263 status = nfs4_proc_destroy_session(clp->cl_session, cred); 2264 switch (status) { 2265 case 0: 2266 case -NFS4ERR_BADSESSION: 2267 case -NFS4ERR_DEADSESSION: 2268 break; 2269 case -NFS4ERR_BACK_CHAN_BUSY: 2270 case -NFS4ERR_DELAY: 2271 set_bit(NFS4CLNT_SESSION_RESET, &clp->cl_state); 2272 status = 0; 2273 ssleep(1); 2274 goto out; 2275 default: 2276 status = nfs4_recovery_handle_error(clp, status); 2277 goto out; 2278 } 2279 2280 memset(clp->cl_session->sess_id.data, 0, NFS4_MAX_SESSIONID_LEN); 2281 status = nfs4_proc_create_session(clp, cred); 2282 if (status) { 2283 dprintk("%s: session reset failed with status %d for server %s!\n", 2284 __func__, status, clp->cl_hostname); 2285 status = nfs4_handle_reclaim_lease_error(clp, status); 2286 goto out; 2287 } 2288 nfs41_finish_session_reset(clp); 2289 dprintk("%s: session reset was successful for server %s!\n", 2290 __func__, clp->cl_hostname); 2291 out: 2292 if (cred) 2293 put_rpccred(cred); 2294 return status; 2295 } 2296 2297 static int nfs4_bind_conn_to_session(struct nfs_client *clp) 2298 { 2299 struct rpc_cred *cred; 2300 int ret; 2301 2302 if (!nfs4_has_session(clp)) 2303 return 0; 2304 nfs4_begin_drain_session(clp); 2305 cred = nfs4_get_clid_cred(clp); 2306 ret = nfs4_proc_bind_conn_to_session(clp, cred); 2307 if (cred) 2308 put_rpccred(cred); 2309 clear_bit(NFS4CLNT_BIND_CONN_TO_SESSION, &clp->cl_state); 2310 switch (ret) { 2311 case 0: 2312 dprintk("%s: bind_conn_to_session was successful for server %s!\n", 2313 __func__, clp->cl_hostname); 2314 break; 2315 case -NFS4ERR_DELAY: 2316 ssleep(1); 2317 set_bit(NFS4CLNT_BIND_CONN_TO_SESSION, &clp->cl_state); 2318 break; 2319 default: 2320 return nfs4_recovery_handle_error(clp, ret); 2321 } 2322 return 0; 2323 } 2324 #else /* CONFIG_NFS_V4_1 */ 2325 static int nfs4_reset_session(struct nfs_client *clp) { return 0; } 2326 2327 static int nfs4_bind_conn_to_session(struct nfs_client *clp) 2328 { 2329 return 0; 2330 } 2331 #endif /* CONFIG_NFS_V4_1 */ 2332 2333 static void nfs4_state_manager(struct nfs_client *clp) 2334 { 2335 int status = 0; 2336 const char *section = "", *section_sep = ""; 2337 2338 /* Ensure exclusive access to NFSv4 state */ 2339 do { 2340 if (test_bit(NFS4CLNT_PURGE_STATE, &clp->cl_state)) { 2341 section = "purge state"; 2342 status = nfs4_purge_lease(clp); 2343 if (status < 0) 2344 goto out_error; 2345 continue; 2346 } 2347 2348 if (test_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state)) { 2349 section = "lease expired"; 2350 /* We're going to have to re-establish a clientid */ 2351 status = nfs4_reclaim_lease(clp); 2352 if (status < 0) 2353 goto out_error; 2354 continue; 2355 } 2356 2357 /* Initialize or reset the session */ 2358 if (test_and_clear_bit(NFS4CLNT_SESSION_RESET, &clp->cl_state)) { 2359 section = "reset session"; 2360 status = nfs4_reset_session(clp); 2361 if (test_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state)) 2362 continue; 2363 if (status < 0) 2364 goto out_error; 2365 } 2366 2367 /* Send BIND_CONN_TO_SESSION */ 2368 if (test_and_clear_bit(NFS4CLNT_BIND_CONN_TO_SESSION, 2369 &clp->cl_state)) { 2370 section = "bind conn to session"; 2371 status = nfs4_bind_conn_to_session(clp); 2372 if (status < 0) 2373 goto out_error; 2374 continue; 2375 } 2376 2377 if (test_and_clear_bit(NFS4CLNT_CHECK_LEASE, &clp->cl_state)) { 2378 section = "check lease"; 2379 status = nfs4_check_lease(clp); 2380 if (status < 0) 2381 goto out_error; 2382 continue; 2383 } 2384 2385 if (test_and_clear_bit(NFS4CLNT_MOVED, &clp->cl_state)) { 2386 section = "migration"; 2387 status = nfs4_handle_migration(clp); 2388 if (status < 0) 2389 goto out_error; 2390 } 2391 2392 if (test_and_clear_bit(NFS4CLNT_LEASE_MOVED, &clp->cl_state)) { 2393 section = "lease moved"; 2394 status = nfs4_handle_lease_moved(clp); 2395 if (status < 0) 2396 goto out_error; 2397 } 2398 2399 /* First recover reboot state... */ 2400 if (test_bit(NFS4CLNT_RECLAIM_REBOOT, &clp->cl_state)) { 2401 section = "reclaim reboot"; 2402 status = nfs4_do_reclaim(clp, 2403 clp->cl_mvops->reboot_recovery_ops); 2404 if (status == -EAGAIN) 2405 continue; 2406 if (status < 0) 2407 goto out_error; 2408 nfs4_state_end_reclaim_reboot(clp); 2409 } 2410 2411 /* Now recover expired state... */ 2412 if (test_and_clear_bit(NFS4CLNT_RECLAIM_NOGRACE, &clp->cl_state)) { 2413 section = "reclaim nograce"; 2414 status = nfs4_do_reclaim(clp, 2415 clp->cl_mvops->nograce_recovery_ops); 2416 if (status == -EAGAIN) 2417 continue; 2418 if (status < 0) 2419 goto out_error; 2420 } 2421 2422 nfs4_end_drain_session(clp); 2423 if (test_and_clear_bit(NFS4CLNT_DELEGRETURN, &clp->cl_state)) { 2424 nfs_client_return_marked_delegations(clp); 2425 continue; 2426 } 2427 2428 nfs4_clear_state_manager_bit(clp); 2429 /* Did we race with an attempt to give us more work? */ 2430 if (clp->cl_state == 0) 2431 break; 2432 if (test_and_set_bit(NFS4CLNT_MANAGER_RUNNING, &clp->cl_state) != 0) 2433 break; 2434 } while (atomic_read(&clp->cl_count) > 1); 2435 return; 2436 out_error: 2437 if (strlen(section)) 2438 section_sep = ": "; 2439 pr_warn_ratelimited("NFS: state manager%s%s failed on NFSv4 server %s" 2440 " with error %d\n", section_sep, section, 2441 clp->cl_hostname, -status); 2442 ssleep(1); 2443 nfs4_end_drain_session(clp); 2444 nfs4_clear_state_manager_bit(clp); 2445 } 2446 2447 static int nfs4_run_state_manager(void *ptr) 2448 { 2449 struct nfs_client *clp = ptr; 2450 2451 allow_signal(SIGKILL); 2452 nfs4_state_manager(clp); 2453 nfs_put_client(clp); 2454 module_put_and_exit(0); 2455 return 0; 2456 } 2457 2458 /* 2459 * Local variables: 2460 * c-basic-offset: 8 2461 * End: 2462 */ 2463