xref: /openbmc/linux/fs/nfsd/nfs4recover.c (revision 8bd1369b)
1 /*
2 *  Copyright (c) 2004 The Regents of the University of Michigan.
3 *  Copyright (c) 2012 Jeff Layton <jlayton@redhat.com>
4 *  All rights reserved.
5 *
6 *  Andy Adamson <andros@citi.umich.edu>
7 *
8 *  Redistribution and use in source and binary forms, with or without
9 *  modification, are permitted provided that the following conditions
10 *  are met:
11 *
12 *  1. Redistributions of source code must retain the above copyright
13 *     notice, this list of conditions and the following disclaimer.
14 *  2. Redistributions in binary form must reproduce the above copyright
15 *     notice, this list of conditions and the following disclaimer in the
16 *     documentation and/or other materials provided with the distribution.
17 *  3. Neither the name of the University nor the names of its
18 *     contributors may be used to endorse or promote products derived
19 *     from this software without specific prior written permission.
20 *
21 *  THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
22 *  WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
23 *  MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
24 *  DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
25 *  FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
26 *  CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
27 *  SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
28 *  BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
29 *  LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
30 *  NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
31 *  SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
32 *
33 */
34 
35 #include <crypto/hash.h>
36 #include <linux/file.h>
37 #include <linux/slab.h>
38 #include <linux/namei.h>
39 #include <linux/sched.h>
40 #include <linux/fs.h>
41 #include <linux/module.h>
42 #include <net/net_namespace.h>
43 #include <linux/sunrpc/rpc_pipe_fs.h>
44 #include <linux/sunrpc/clnt.h>
45 #include <linux/nfsd/cld.h>
46 
47 #include "nfsd.h"
48 #include "state.h"
49 #include "vfs.h"
50 #include "netns.h"
51 
52 #define NFSDDBG_FACILITY                NFSDDBG_PROC
53 
54 /* Declarations */
/*
 * Method table for one client-tracking backend. This file defines two
 * instances: nfsd4_legacy_tracking_ops and nfsd4_cld_tracking_ops.
 */
struct nfsd4_client_tracking_ops {
	/* set up the backend for a net namespace; 0 or negative errno */
	int (*init)(struct net *);
	/* tear down whatever init() set up */
	void (*exit)(struct net *);
	/* record a client on stable storage */
	void (*create)(struct nfs4_client *);
	/* remove a client's record from stable storage */
	void (*remove)(struct nfs4_client *);
	/* look for a client's record; 0 if found, negative errno otherwise */
	int (*check)(struct nfs4_client *);
	/* called when the grace period is over */
	void (*grace_done)(struct nfsd_net *);
};
63 
/* Globals */
/*
 * Path of the legacy recovery directory. Overwritten by
 * nfs4_reset_recoverydir() and handed out by nfs4_recoverydir().
 */
static char user_recovery_dirname[PATH_MAX] = "/var/lib/nfs/v4recovery";
66 
67 static int
68 nfs4_save_creds(const struct cred **original_creds)
69 {
70 	struct cred *new;
71 
72 	new = prepare_creds();
73 	if (!new)
74 		return -ENOMEM;
75 
76 	new->fsuid = GLOBAL_ROOT_UID;
77 	new->fsgid = GLOBAL_ROOT_GID;
78 	*original_creds = override_creds(new);
79 	put_cred(new);
80 	return 0;
81 }
82 
/*
 * Counterpart of nfs4_save_creds(): pass the credentials it stored back
 * to revert_creds().
 */
static void
nfs4_reset_creds(const struct cred *original)
{
	revert_creds(original);
}
88 
/*
 * Write the 16 bytes at md5 to out as 32 lowercase hexadecimal digits
 * followed by a terminating NUL. out must have room for 33 bytes.
 */
static void
md5_to_hex(char *out, char *md5)
{
	static const char digits[] = "0123456789abcdef";
	int pos;

	for (pos = 0; pos < 16; pos++) {
		unsigned char byte = md5[pos];

		out[2 * pos] = digits[byte >> 4];
		out[2 * pos + 1] = digits[byte & 0x0f];
	}
	out[32] = '\0';
}
102 
103 static int
104 nfs4_make_rec_clidname(char *dname, const struct xdr_netobj *clname)
105 {
106 	struct xdr_netobj cksum;
107 	struct crypto_shash *tfm;
108 	int status;
109 
110 	dprintk("NFSD: nfs4_make_rec_clidname for %.*s\n",
111 			clname->len, clname->data);
112 	tfm = crypto_alloc_shash("md5", 0, 0);
113 	if (IS_ERR(tfm)) {
114 		status = PTR_ERR(tfm);
115 		goto out_no_tfm;
116 	}
117 
118 	cksum.len = crypto_shash_digestsize(tfm);
119 	cksum.data = kmalloc(cksum.len, GFP_KERNEL);
120 	if (cksum.data == NULL) {
121 		status = -ENOMEM;
122  		goto out;
123 	}
124 
125 	{
126 		SHASH_DESC_ON_STACK(desc, tfm);
127 
128 		desc->tfm = tfm;
129 		desc->flags = CRYPTO_TFM_REQ_MAY_SLEEP;
130 
131 		status = crypto_shash_digest(desc, clname->data, clname->len,
132 					     cksum.data);
133 		shash_desc_zero(desc);
134 	}
135 
136 	if (status)
137 		goto out;
138 
139 	md5_to_hex(dname, cksum.data);
140 
141 	status = 0;
142 out:
143 	kfree(cksum.data);
144 	crypto_free_shash(tfm);
145 out_no_tfm:
146 	return status;
147 }
148 
149 /*
150  * If we had an error generating the recdir name for the legacy tracker
151  * then warn the admin. If the error doesn't appear to be transient,
152  * then disable recovery tracking.
153  */
154 static void
155 legacy_recdir_name_error(struct nfs4_client *clp, int error)
156 {
157 	printk(KERN_ERR "NFSD: unable to generate recoverydir "
158 			"name (%d).\n", error);
159 
160 	/*
161 	 * if the algorithm just doesn't exist, then disable the recovery
162 	 * tracker altogether. The crypto libs will generally return this if
163 	 * FIPS is enabled as well.
164 	 */
165 	if (error == -ENOENT) {
166 		printk(KERN_ERR "NFSD: disabling legacy clientid tracking. "
167 			"Reboot recovery will not function correctly!\n");
168 		nfsd4_client_tracking_exit(clp->net);
169 	}
170 }
171 
172 static void
173 nfsd4_create_clid_dir(struct nfs4_client *clp)
174 {
175 	const struct cred *original_cred;
176 	char dname[HEXDIR_LEN];
177 	struct dentry *dir, *dentry;
178 	struct nfs4_client_reclaim *crp;
179 	int status;
180 	struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
181 
182 	if (test_and_set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
183 		return;
184 	if (!nn->rec_file)
185 		return;
186 
187 	status = nfs4_make_rec_clidname(dname, &clp->cl_name);
188 	if (status)
189 		return legacy_recdir_name_error(clp, status);
190 
191 	status = nfs4_save_creds(&original_cred);
192 	if (status < 0)
193 		return;
194 
195 	status = mnt_want_write_file(nn->rec_file);
196 	if (status)
197 		goto out_creds;
198 
199 	dir = nn->rec_file->f_path.dentry;
200 	/* lock the parent */
201 	inode_lock(d_inode(dir));
202 
203 	dentry = lookup_one_len(dname, dir, HEXDIR_LEN-1);
204 	if (IS_ERR(dentry)) {
205 		status = PTR_ERR(dentry);
206 		goto out_unlock;
207 	}
208 	if (d_really_is_positive(dentry))
209 		/*
210 		 * In the 4.1 case, where we're called from
211 		 * reclaim_complete(), records from the previous reboot
212 		 * may still be left, so this is OK.
213 		 *
214 		 * In the 4.0 case, we should never get here; but we may
215 		 * as well be forgiving and just succeed silently.
216 		 */
217 		goto out_put;
218 	status = vfs_mkdir(d_inode(dir), dentry, S_IRWXU);
219 out_put:
220 	dput(dentry);
221 out_unlock:
222 	inode_unlock(d_inode(dir));
223 	if (status == 0) {
224 		if (nn->in_grace) {
225 			crp = nfs4_client_to_reclaim(dname, nn);
226 			if (crp)
227 				crp->cr_clp = clp;
228 		}
229 		vfs_fsync(nn->rec_file, 0);
230 	} else {
231 		printk(KERN_ERR "NFSD: failed to write recovery record"
232 				" (err %d); please check that %s exists"
233 				" and is writeable", status,
234 				user_recovery_dirname);
235 	}
236 	mnt_drop_write_file(nn->rec_file);
237 out_creds:
238 	nfs4_reset_creds(original_cred);
239 }
240 
/*
 * Callback applied by nfsd4_list_rec_dir() to every collected entry. It
 * is called as f(recovery directory dentry, entry dentry, nn); a
 * non-zero return stops further callbacks.
 */
typedef int (recdir_func)(struct dentry *, struct dentry *, struct nfsd_net *);

/* One directory-entry name collected by nfsd4_build_namelist(). */
struct name_list {
	char name[HEXDIR_LEN];
	struct list_head list;
};

/* Wraps a dir_context so the actor can reach the list of collected names. */
struct nfs4_dir_ctx {
	struct dir_context ctx;
	struct list_head names;
};
252 
253 static int
254 nfsd4_build_namelist(struct dir_context *__ctx, const char *name, int namlen,
255 		loff_t offset, u64 ino, unsigned int d_type)
256 {
257 	struct nfs4_dir_ctx *ctx =
258 		container_of(__ctx, struct nfs4_dir_ctx, ctx);
259 	struct name_list *entry;
260 
261 	if (namlen != HEXDIR_LEN - 1)
262 		return 0;
263 	entry = kmalloc(sizeof(struct name_list), GFP_KERNEL);
264 	if (entry == NULL)
265 		return -ENOMEM;
266 	memcpy(entry->name, name, HEXDIR_LEN - 1);
267 	entry->name[HEXDIR_LEN - 1] = '\0';
268 	list_add(&entry->list, &ctx->names);
269 	return 0;
270 }
271 
/*
 * Apply f to every suitably-named entry of the recovery directory.
 *
 * The names are first collected with iterate_dir() (see
 * nfsd4_build_namelist()). Then, with the directory inode locked, each
 * name is looked up and passed to f. The whole operation runs under the
 * credentials installed by nfs4_save_creds().
 *
 * Returns 0, or the first error from nfs4_save_creds(), vfs_llseek(),
 * iterate_dir(), lookup_one_len() or f.
 */
static int
nfsd4_list_rec_dir(recdir_func *f, struct nfsd_net *nn)
{
	const struct cred *original_cred;
	struct dentry *dir = nn->rec_file->f_path.dentry;
	struct nfs4_dir_ctx ctx = {
		.ctx.actor = nfsd4_build_namelist,
		.names = LIST_HEAD_INIT(ctx.names)
	};
	struct name_list *entry, *tmp;
	int status;

	status = nfs4_save_creds(&original_cred);
	if (status < 0)
		return status;

	/* rewind so the directory is read from its start */
	status = vfs_llseek(nn->rec_file, 0, SEEK_SET);
	if (status < 0) {
		nfs4_reset_creds(original_cred);
		return status;
	}

	status = iterate_dir(nn->rec_file, &ctx.ctx);
	inode_lock_nested(d_inode(dir), I_MUTEX_PARENT);

	list_for_each_entry_safe(entry, tmp, &ctx.names, list) {
		/* once status is non-zero, entries are only freed, not processed */
		if (!status) {
			struct dentry *dentry;
			dentry = lookup_one_len(entry->name, dir, HEXDIR_LEN-1);
			if (IS_ERR(dentry)) {
				status = PTR_ERR(dentry);
				/* this and later entries are freed by the loop below */
				break;
			}
			status = f(dir, dentry, nn);
			dput(dentry);
		}
		list_del(&entry->list);
		kfree(entry);
	}
	inode_unlock(d_inode(dir));
	nfs4_reset_creds(original_cred);

	/* free whatever is still listed after an early break above */
	list_for_each_entry_safe(entry, tmp, &ctx.names, list) {
		dprintk("NFSD: %s. Left entry %s\n", __func__, entry->name);
		list_del(&entry->list);
		kfree(entry);
	}
	return status;
}
321 
322 static int
323 nfsd4_unlink_clid_dir(char *name, int namlen, struct nfsd_net *nn)
324 {
325 	struct dentry *dir, *dentry;
326 	int status;
327 
328 	dprintk("NFSD: nfsd4_unlink_clid_dir. name %.*s\n", namlen, name);
329 
330 	dir = nn->rec_file->f_path.dentry;
331 	inode_lock_nested(d_inode(dir), I_MUTEX_PARENT);
332 	dentry = lookup_one_len(name, dir, namlen);
333 	if (IS_ERR(dentry)) {
334 		status = PTR_ERR(dentry);
335 		goto out_unlock;
336 	}
337 	status = -ENOENT;
338 	if (d_really_is_negative(dentry))
339 		goto out;
340 	status = vfs_rmdir(d_inode(dir), dentry);
341 out:
342 	dput(dentry);
343 out_unlock:
344 	inode_unlock(d_inode(dir));
345 	return status;
346 }
347 
348 static void
349 nfsd4_remove_clid_dir(struct nfs4_client *clp)
350 {
351 	const struct cred *original_cred;
352 	struct nfs4_client_reclaim *crp;
353 	char dname[HEXDIR_LEN];
354 	int status;
355 	struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
356 
357 	if (!nn->rec_file || !test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
358 		return;
359 
360 	status = nfs4_make_rec_clidname(dname, &clp->cl_name);
361 	if (status)
362 		return legacy_recdir_name_error(clp, status);
363 
364 	status = mnt_want_write_file(nn->rec_file);
365 	if (status)
366 		goto out;
367 	clear_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
368 
369 	status = nfs4_save_creds(&original_cred);
370 	if (status < 0)
371 		goto out_drop_write;
372 
373 	status = nfsd4_unlink_clid_dir(dname, HEXDIR_LEN-1, nn);
374 	nfs4_reset_creds(original_cred);
375 	if (status == 0) {
376 		vfs_fsync(nn->rec_file, 0);
377 		if (nn->in_grace) {
378 			/* remove reclaim record */
379 			crp = nfsd4_find_reclaim_client(dname, nn);
380 			if (crp)
381 				nfs4_remove_reclaim_record(crp, nn);
382 		}
383 	}
384 out_drop_write:
385 	mnt_drop_write_file(nn->rec_file);
386 out:
387 	if (status)
388 		printk("NFSD: Failed to remove expired client state directory"
389 				" %.*s\n", HEXDIR_LEN, dname);
390 }
391 
392 static int
393 purge_old(struct dentry *parent, struct dentry *child, struct nfsd_net *nn)
394 {
395 	int status;
396 
397 	if (nfs4_has_reclaimed_state(child->d_name.name, nn))
398 		return 0;
399 
400 	status = vfs_rmdir(d_inode(parent), child);
401 	if (status)
402 		printk("failed to remove client recovery directory %pd\n",
403 				child);
404 	/* Keep trying, success or failure: */
405 	return 0;
406 }
407 
408 static void
409 nfsd4_recdir_purge_old(struct nfsd_net *nn)
410 {
411 	int status;
412 
413 	nn->in_grace = false;
414 	if (!nn->rec_file)
415 		return;
416 	status = mnt_want_write_file(nn->rec_file);
417 	if (status)
418 		goto out;
419 	status = nfsd4_list_rec_dir(purge_old, nn);
420 	if (status == 0)
421 		vfs_fsync(nn->rec_file, 0);
422 	mnt_drop_write_file(nn->rec_file);
423 out:
424 	nfs4_release_reclaim(nn);
425 	if (status)
426 		printk("nfsd4: failed to purge old clients from recovery"
427 			" directory %pD\n", nn->rec_file);
428 }
429 
430 static int
431 load_recdir(struct dentry *parent, struct dentry *child, struct nfsd_net *nn)
432 {
433 	if (child->d_name.len != HEXDIR_LEN - 1) {
434 		printk("nfsd4: illegal name %pd in recovery directory\n",
435 				child);
436 		/* Keep trying; maybe the others are OK: */
437 		return 0;
438 	}
439 	nfs4_client_to_reclaim(child->d_name.name, nn);
440 	return 0;
441 }
442 
443 static int
444 nfsd4_recdir_load(struct net *net) {
445 	int status;
446 	struct nfsd_net *nn =  net_generic(net, nfsd_net_id);
447 
448 	if (!nn->rec_file)
449 		return 0;
450 
451 	status = nfsd4_list_rec_dir(load_recdir, nn);
452 	if (status)
453 		printk("nfsd4: failed loading clients from recovery"
454 			" directory %pD\n", nn->rec_file);
455 	return status;
456 }
457 
458 /*
459  * Hold reference to the recovery directory.
460  */
461 
462 static int
463 nfsd4_init_recdir(struct net *net)
464 {
465 	struct nfsd_net *nn = net_generic(net, nfsd_net_id);
466 	const struct cred *original_cred;
467 	int status;
468 
469 	printk("NFSD: Using %s as the NFSv4 state recovery directory\n",
470 			user_recovery_dirname);
471 
472 	BUG_ON(nn->rec_file);
473 
474 	status = nfs4_save_creds(&original_cred);
475 	if (status < 0) {
476 		printk("NFSD: Unable to change credentials to find recovery"
477 		       " directory: error %d\n",
478 		       status);
479 		return status;
480 	}
481 
482 	nn->rec_file = filp_open(user_recovery_dirname, O_RDONLY | O_DIRECTORY, 0);
483 	if (IS_ERR(nn->rec_file)) {
484 		printk("NFSD: unable to find recovery directory %s\n",
485 				user_recovery_dirname);
486 		status = PTR_ERR(nn->rec_file);
487 		nn->rec_file = NULL;
488 	}
489 
490 	nfs4_reset_creds(original_cred);
491 	if (!status)
492 		nn->in_grace = true;
493 	return status;
494 }
495 
496 static void
497 nfsd4_shutdown_recdir(struct net *net)
498 {
499 	struct nfsd_net *nn = net_generic(net, nfsd_net_id);
500 
501 	if (!nn->rec_file)
502 		return;
503 	fput(nn->rec_file);
504 	nn->rec_file = NULL;
505 }
506 
507 static int
508 nfs4_legacy_state_init(struct net *net)
509 {
510 	struct nfsd_net *nn = net_generic(net, nfsd_net_id);
511 	int i;
512 
513 	nn->reclaim_str_hashtbl = kmalloc_array(CLIENT_HASH_SIZE,
514 						sizeof(struct list_head),
515 						GFP_KERNEL);
516 	if (!nn->reclaim_str_hashtbl)
517 		return -ENOMEM;
518 
519 	for (i = 0; i < CLIENT_HASH_SIZE; i++)
520 		INIT_LIST_HEAD(&nn->reclaim_str_hashtbl[i]);
521 	nn->reclaim_str_hashtbl_size = 0;
522 
523 	return 0;
524 }
525 
/*
 * Free the reclaim hash table allocated by nfs4_legacy_state_init().
 * Only the bucket array is freed here; entries are not walked.
 */
static void
nfs4_legacy_state_shutdown(struct net *net)
{
	struct nfsd_net *nn = net_generic(net, nfsd_net_id);

	kfree(nn->reclaim_str_hashtbl);
}
533 
/*
 * Open the recovery directory and load its entries. If loading fails
 * the directory is closed again.
 *
 * Returns 0 or the first error encountered.
 */
static int
nfsd4_load_reboot_recovery_data(struct net *net)
{
	int err = nfsd4_init_recdir(net);

	if (!err) {
		err = nfsd4_recdir_load(net);
		if (err)
			nfsd4_shutdown_recdir(net);
	}
	return err;
}
549 
550 static int
551 nfsd4_legacy_tracking_init(struct net *net)
552 {
553 	int status;
554 
555 	/* XXX: The legacy code won't work in a container */
556 	if (net != &init_net) {
557 		pr_warn("NFSD: attempt to initialize legacy client tracking in a container ignored.\n");
558 		return -EINVAL;
559 	}
560 
561 	status = nfs4_legacy_state_init(net);
562 	if (status)
563 		return status;
564 
565 	status = nfsd4_load_reboot_recovery_data(net);
566 	if (status)
567 		goto err;
568 	return 0;
569 
570 err:
571 	nfs4_legacy_state_shutdown(net);
572 	return status;
573 }
574 
/*
 * Legacy ->exit method: release the reclaim records, close the recovery
 * directory, then free the reclaim hash table.
 */
static void
nfsd4_legacy_tracking_exit(struct net *net)
{
	struct nfsd_net *nn = net_generic(net, nfsd_net_id);

	nfs4_release_reclaim(nn);
	nfsd4_shutdown_recdir(net);
	nfs4_legacy_state_shutdown(net);
}
584 
585 /*
586  * Change the NFSv4 recovery directory to recdir.
587  */
588 int
589 nfs4_reset_recoverydir(char *recdir)
590 {
591 	int status;
592 	struct path path;
593 
594 	status = kern_path(recdir, LOOKUP_FOLLOW, &path);
595 	if (status)
596 		return status;
597 	status = -ENOTDIR;
598 	if (d_is_dir(path.dentry)) {
599 		strcpy(user_recovery_dirname, recdir);
600 		status = 0;
601 	}
602 	path_put(&path);
603 	return status;
604 }
605 
/*
 * Return the current recovery directory path. The result points at the
 * file-scope buffer user_recovery_dirname, not at a copy.
 */
char *
nfs4_recoverydir(void)
{
	return user_recovery_dirname;
}
611 
612 static int
613 nfsd4_check_legacy_client(struct nfs4_client *clp)
614 {
615 	int status;
616 	char dname[HEXDIR_LEN];
617 	struct nfs4_client_reclaim *crp;
618 	struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
619 
620 	/* did we already find that this client is stable? */
621 	if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
622 		return 0;
623 
624 	status = nfs4_make_rec_clidname(dname, &clp->cl_name);
625 	if (status) {
626 		legacy_recdir_name_error(clp, status);
627 		return status;
628 	}
629 
630 	/* look for it in the reclaim hashtable otherwise */
631 	crp = nfsd4_find_reclaim_client(dname, nn);
632 	if (crp) {
633 		set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
634 		crp->cr_clp = clp;
635 		return 0;
636 	}
637 
638 	return -ENOENT;
639 }
640 
/* Client tracking backed by directories inside the recovery directory. */
static const struct nfsd4_client_tracking_ops nfsd4_legacy_tracking_ops = {
	.init		= nfsd4_legacy_tracking_init,
	.exit		= nfsd4_legacy_tracking_exit,
	.create		= nfsd4_create_clid_dir,
	.remove		= nfsd4_remove_clid_dir,
	.check		= nfsd4_check_legacy_client,
	.grace_done	= nfsd4_recdir_purge_old,
};
649 
/*
 * Names used by nfsd4_cld_register_sb(): the directory looked up with
 * rpc_d_lookup_sb() and the pipe created inside it.
 */
#define NFSD_PIPE_DIR		"nfsd"
#define NFSD_CLD_PIPE		"cld"
653 
/* per-net-ns structure for holding cld upcall info */
struct cld_net {
	struct rpc_pipe		*cn_pipe;	/* pipe the upcalls are queued on */
	spinlock_t		 cn_lock;	/* taken around cn_list and cn_xid accesses */
	struct list_head	 cn_list;	/* upcalls in flight (struct cld_upcall) */
	unsigned int		 cn_xid;	/* next xid candidate, see alloc_cld_upcall() */
};
661 
/* One upcall in flight, linked on its cld_net's cn_list. */
struct cld_upcall {
	struct list_head	 cu_list;	/* entry in cld_net.cn_list */
	struct cld_net		*cu_net;	/* owning cld_net */
	struct task_struct	*cu_task;	/* task to wake when the upcall completes */
	struct cld_msg		 cu_msg;	/* message sent up, overwritten by the downcall */
};
668 
/*
 * Queue cmsg on pipe and sleep until woken by cld_pipe_downcall() or
 * cld_pipe_destroy_msg().
 *
 * Returns the negative error from rpc_queue_upcall() if queueing fails,
 * a negative msg.errno if one was set while waiting, and otherwise the
 * (non-negative) value rpc_queue_upcall() returned.
 */
static int
__cld_pipe_upcall(struct rpc_pipe *pipe, struct cld_msg *cmsg)
{
	int ret;
	struct rpc_pipe_msg msg;

	memset(&msg, 0, sizeof(msg));
	msg.data = cmsg;
	msg.len = sizeof(*cmsg);

	/*
	 * Set task state before we queue the upcall. That prevents
	 * wake_up_process in the downcall from racing with schedule.
	 */
	set_current_state(TASK_UNINTERRUPTIBLE);
	ret = rpc_queue_upcall(pipe, &msg);
	if (ret < 0) {
		/* nothing was queued, so nobody will wake us: undo the state change */
		set_current_state(TASK_RUNNING);
		goto out;
	}

	schedule();

	if (msg.errno < 0)
		ret = msg.errno;
out:
	return ret;
}
697 
698 static int
699 cld_pipe_upcall(struct rpc_pipe *pipe, struct cld_msg *cmsg)
700 {
701 	int ret;
702 
703 	/*
704 	 * -EAGAIN occurs when pipe is closed and reopened while there are
705 	 *  upcalls queued.
706 	 */
707 	do {
708 		ret = __cld_pipe_upcall(pipe, cmsg);
709 	} while (ret == -EAGAIN);
710 
711 	return ret;
712 }
713 
714 static ssize_t
715 cld_pipe_downcall(struct file *filp, const char __user *src, size_t mlen)
716 {
717 	struct cld_upcall *tmp, *cup;
718 	struct cld_msg __user *cmsg = (struct cld_msg __user *)src;
719 	uint32_t xid;
720 	struct nfsd_net *nn = net_generic(file_inode(filp)->i_sb->s_fs_info,
721 						nfsd_net_id);
722 	struct cld_net *cn = nn->cld_net;
723 
724 	if (mlen != sizeof(*cmsg)) {
725 		dprintk("%s: got %zu bytes, expected %zu\n", __func__, mlen,
726 			sizeof(*cmsg));
727 		return -EINVAL;
728 	}
729 
730 	/* copy just the xid so we can try to find that */
731 	if (copy_from_user(&xid, &cmsg->cm_xid, sizeof(xid)) != 0) {
732 		dprintk("%s: error when copying xid from userspace", __func__);
733 		return -EFAULT;
734 	}
735 
736 	/* walk the list and find corresponding xid */
737 	cup = NULL;
738 	spin_lock(&cn->cn_lock);
739 	list_for_each_entry(tmp, &cn->cn_list, cu_list) {
740 		if (get_unaligned(&tmp->cu_msg.cm_xid) == xid) {
741 			cup = tmp;
742 			list_del_init(&cup->cu_list);
743 			break;
744 		}
745 	}
746 	spin_unlock(&cn->cn_lock);
747 
748 	/* couldn't find upcall? */
749 	if (!cup) {
750 		dprintk("%s: couldn't find upcall -- xid=%u\n", __func__, xid);
751 		return -EINVAL;
752 	}
753 
754 	if (copy_from_user(&cup->cu_msg, src, mlen) != 0)
755 		return -EFAULT;
756 
757 	wake_up_process(cup->cu_task);
758 	return mlen;
759 }
760 
761 static void
762 cld_pipe_destroy_msg(struct rpc_pipe_msg *msg)
763 {
764 	struct cld_msg *cmsg = msg->data;
765 	struct cld_upcall *cup = container_of(cmsg, struct cld_upcall,
766 						 cu_msg);
767 
768 	/* errno >= 0 means we got a downcall */
769 	if (msg->errno >= 0)
770 		return;
771 
772 	wake_up_process(cup->cu_task);
773 }
774 
/* Pipe operations passed to rpc_mkpipe_data() in nfsd4_init_cld_pipe(). */
static const struct rpc_pipe_ops cld_upcall_ops = {
	.upcall		= rpc_pipe_generic_upcall,
	.downcall	= cld_pipe_downcall,
	.destroy_msg	= cld_pipe_destroy_msg,
};
780 
781 static struct dentry *
782 nfsd4_cld_register_sb(struct super_block *sb, struct rpc_pipe *pipe)
783 {
784 	struct dentry *dir, *dentry;
785 
786 	dir = rpc_d_lookup_sb(sb, NFSD_PIPE_DIR);
787 	if (dir == NULL)
788 		return ERR_PTR(-ENOENT);
789 	dentry = rpc_mkpipe_dentry(dir, NFSD_CLD_PIPE, NULL, pipe);
790 	dput(dir);
791 	return dentry;
792 }
793 
/* Unlink the pipe's dentry, if it has one. */
static void
nfsd4_cld_unregister_sb(struct rpc_pipe *pipe)
{
	if (pipe->dentry)
		rpc_unlink(pipe->dentry);
}
800 
801 static struct dentry *
802 nfsd4_cld_register_net(struct net *net, struct rpc_pipe *pipe)
803 {
804 	struct super_block *sb;
805 	struct dentry *dentry;
806 
807 	sb = rpc_get_sb_net(net);
808 	if (!sb)
809 		return NULL;
810 	dentry = nfsd4_cld_register_sb(sb, pipe);
811 	rpc_put_sb_net(net);
812 	return dentry;
813 }
814 
/*
 * Unlink the pipe's dentry, but only if rpc_get_sb_net() returns a
 * superblock for this net namespace.
 */
static void
nfsd4_cld_unregister_net(struct net *net, struct rpc_pipe *pipe)
{
	struct super_block *sb = rpc_get_sb_net(net);

	if (!sb)
		return;

	nfsd4_cld_unregister_sb(pipe);
	rpc_put_sb_net(net);
}
826 
827 /* Initialize rpc_pipefs pipe for communication with client tracking daemon */
828 static int
829 nfsd4_init_cld_pipe(struct net *net)
830 {
831 	int ret;
832 	struct dentry *dentry;
833 	struct nfsd_net *nn = net_generic(net, nfsd_net_id);
834 	struct cld_net *cn;
835 
836 	if (nn->cld_net)
837 		return 0;
838 
839 	cn = kzalloc(sizeof(*cn), GFP_KERNEL);
840 	if (!cn) {
841 		ret = -ENOMEM;
842 		goto err;
843 	}
844 
845 	cn->cn_pipe = rpc_mkpipe_data(&cld_upcall_ops, RPC_PIPE_WAIT_FOR_OPEN);
846 	if (IS_ERR(cn->cn_pipe)) {
847 		ret = PTR_ERR(cn->cn_pipe);
848 		goto err;
849 	}
850 	spin_lock_init(&cn->cn_lock);
851 	INIT_LIST_HEAD(&cn->cn_list);
852 
853 	dentry = nfsd4_cld_register_net(net, cn->cn_pipe);
854 	if (IS_ERR(dentry)) {
855 		ret = PTR_ERR(dentry);
856 		goto err_destroy_data;
857 	}
858 
859 	cn->cn_pipe->dentry = dentry;
860 	nn->cld_net = cn;
861 	return 0;
862 
863 err_destroy_data:
864 	rpc_destroy_pipe_data(cn->cn_pipe);
865 err:
866 	kfree(cn);
867 	printk(KERN_ERR "NFSD: unable to create nfsdcld upcall pipe (%d)\n",
868 			ret);
869 	return ret;
870 }
871 
872 static void
873 nfsd4_remove_cld_pipe(struct net *net)
874 {
875 	struct nfsd_net *nn = net_generic(net, nfsd_net_id);
876 	struct cld_net *cn = nn->cld_net;
877 
878 	nfsd4_cld_unregister_net(net, cn->cn_pipe);
879 	rpc_destroy_pipe_data(cn->cn_pipe);
880 	kfree(nn->cld_net);
881 	nn->cld_net = NULL;
882 }
883 
/*
 * Allocate an upcall for the current task, give it an xid that no upcall
 * currently on cn_list is using, and add it to cn_list.
 *
 * Returns the new upcall, or NULL if the allocation fails. The caller
 * releases it with free_cld_upcall().
 */
static struct cld_upcall *
alloc_cld_upcall(struct cld_net *cn)
{
	struct cld_upcall *new, *tmp;

	new = kzalloc(sizeof(*new), GFP_KERNEL);
	if (!new)
		return new;

	/* FIXME: hard cap on number in flight? */
restart_search:
	spin_lock(&cn->cn_lock);
	list_for_each_entry(tmp, &cn->cn_list, cu_list) {
		/* candidate xid is taken: try the next one, rescanning from the top */
		if (tmp->cu_msg.cm_xid == cn->cn_xid) {
			cn->cn_xid++;
			spin_unlock(&cn->cn_lock);
			goto restart_search;
		}
	}
	/* still holding cn_lock: claim the xid and publish the upcall */
	new->cu_task = current;
	new->cu_msg.cm_vers = CLD_UPCALL_VERSION;
	put_unaligned(cn->cn_xid++, &new->cu_msg.cm_xid);
	new->cu_net = cn;
	list_add(&new->cu_list, &cn->cn_list);
	spin_unlock(&cn->cn_lock);

	dprintk("%s: allocated xid %u\n", __func__, new->cu_msg.cm_xid);

	return new;
}
914 
/*
 * Unlink an upcall from its cld_net's list under cn_lock and free it.
 * cld_pipe_downcall() may already have removed it with list_del_init().
 */
static void
free_cld_upcall(struct cld_upcall *victim)
{
	struct cld_net *cn = victim->cu_net;

	spin_lock(&cn->cn_lock);
	list_del(&victim->cu_list);
	spin_unlock(&cn->cn_lock);
	kfree(victim);
}
925 
926 /* Ask daemon to create a new record */
927 static void
928 nfsd4_cld_create(struct nfs4_client *clp)
929 {
930 	int ret;
931 	struct cld_upcall *cup;
932 	struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
933 	struct cld_net *cn = nn->cld_net;
934 
935 	/* Don't upcall if it's already stored */
936 	if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
937 		return;
938 
939 	cup = alloc_cld_upcall(cn);
940 	if (!cup) {
941 		ret = -ENOMEM;
942 		goto out_err;
943 	}
944 
945 	cup->cu_msg.cm_cmd = Cld_Create;
946 	cup->cu_msg.cm_u.cm_name.cn_len = clp->cl_name.len;
947 	memcpy(cup->cu_msg.cm_u.cm_name.cn_id, clp->cl_name.data,
948 			clp->cl_name.len);
949 
950 	ret = cld_pipe_upcall(cn->cn_pipe, &cup->cu_msg);
951 	if (!ret) {
952 		ret = cup->cu_msg.cm_status;
953 		set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
954 	}
955 
956 	free_cld_upcall(cup);
957 out_err:
958 	if (ret)
959 		printk(KERN_ERR "NFSD: Unable to create client "
960 				"record on stable storage: %d\n", ret);
961 }
962 
/*
 * Ask daemon to remove an existing record.
 *
 * Skipped when the client is not flagged NFSD4_CLIENT_STABLE. Any
 * non-zero outcome (allocation failure, upcall error, or the status the
 * daemon reports) is logged.
 */
static void
nfsd4_cld_remove(struct nfs4_client *clp)
{
	int ret;
	struct cld_upcall *cup;
	struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
	struct cld_net *cn = nn->cld_net;

	/* Don't upcall if it's already removed */
	if (!test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
		return;

	cup = alloc_cld_upcall(cn);
	if (!cup) {
		ret = -ENOMEM;
		goto out_err;
	}

	cup->cu_msg.cm_cmd = Cld_Remove;
	cup->cu_msg.cm_u.cm_name.cn_len = clp->cl_name.len;
	memcpy(cup->cu_msg.cm_u.cm_name.cn_id, clp->cl_name.data,
			clp->cl_name.len);

	ret = cld_pipe_upcall(cn->cn_pipe, &cup->cu_msg);
	if (!ret) {
		/* the flag is cleared once the upcall itself succeeded */
		ret = cup->cu_msg.cm_status;
		clear_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
	}

	free_cld_upcall(cup);
out_err:
	if (ret)
		printk(KERN_ERR "NFSD: Unable to remove client "
				"record from stable storage: %d\n", ret);
}
999 
1000 /* Check for presence of a record, and update its timestamp */
1001 static int
1002 nfsd4_cld_check(struct nfs4_client *clp)
1003 {
1004 	int ret;
1005 	struct cld_upcall *cup;
1006 	struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
1007 	struct cld_net *cn = nn->cld_net;
1008 
1009 	/* Don't upcall if one was already stored during this grace pd */
1010 	if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
1011 		return 0;
1012 
1013 	cup = alloc_cld_upcall(cn);
1014 	if (!cup) {
1015 		printk(KERN_ERR "NFSD: Unable to check client record on "
1016 				"stable storage: %d\n", -ENOMEM);
1017 		return -ENOMEM;
1018 	}
1019 
1020 	cup->cu_msg.cm_cmd = Cld_Check;
1021 	cup->cu_msg.cm_u.cm_name.cn_len = clp->cl_name.len;
1022 	memcpy(cup->cu_msg.cm_u.cm_name.cn_id, clp->cl_name.data,
1023 			clp->cl_name.len);
1024 
1025 	ret = cld_pipe_upcall(cn->cn_pipe, &cup->cu_msg);
1026 	if (!ret) {
1027 		ret = cup->cu_msg.cm_status;
1028 		set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
1029 	}
1030 
1031 	free_cld_upcall(cup);
1032 	return ret;
1033 }
1034 
1035 static void
1036 nfsd4_cld_grace_done(struct nfsd_net *nn)
1037 {
1038 	int ret;
1039 	struct cld_upcall *cup;
1040 	struct cld_net *cn = nn->cld_net;
1041 
1042 	cup = alloc_cld_upcall(cn);
1043 	if (!cup) {
1044 		ret = -ENOMEM;
1045 		goto out_err;
1046 	}
1047 
1048 	cup->cu_msg.cm_cmd = Cld_GraceDone;
1049 	cup->cu_msg.cm_u.cm_gracetime = (int64_t)nn->boot_time;
1050 	ret = cld_pipe_upcall(cn->cn_pipe, &cup->cu_msg);
1051 	if (!ret)
1052 		ret = cup->cu_msg.cm_status;
1053 
1054 	free_cld_upcall(cup);
1055 out_err:
1056 	if (ret)
1057 		printk(KERN_ERR "NFSD: Unable to end grace period: %d\n", ret);
1058 }
1059 
/* Client tracking backed by upcalls to a daemon over the cld pipe. */
static const struct nfsd4_client_tracking_ops nfsd4_cld_tracking_ops = {
	.init		= nfsd4_init_cld_pipe,
	.exit		= nfsd4_remove_cld_pipe,
	.create		= nfsd4_cld_create,
	.remove		= nfsd4_cld_remove,
	.check		= nfsd4_cld_check,
	.grace_done	= nfsd4_cld_grace_done,
};
1068 
/* upcall via usermodehelper */
/*
 * Program run by nfsd4_umh_cltrack_upcall(). An empty string disables
 * the upcall; that function blanks it itself on -ENOENT/-EACCES.
 */
static char cltrack_prog[PATH_MAX] = "/sbin/nfsdcltrack";
module_param_string(cltrack_prog, cltrack_prog, sizeof(cltrack_prog),
			S_IRUGO|S_IWUSR);
MODULE_PARM_DESC(cltrack_prog, "Path to the nfsdcltrack upcall program");

/* When set, the legacy topdir/recdir environment strings are not built. */
static bool cltrack_legacy_disable;
module_param(cltrack_legacy_disable, bool, S_IRUGO|S_IWUSR);
MODULE_PARM_DESC(cltrack_legacy_disable,
		"Disable legacy recoverydir conversion. Default: false");
1079 
/* Prefixes of the "NAME=value" strings built by the nfsd4_cltrack_*() helpers. */
#define LEGACY_TOPDIR_ENV_PREFIX "NFSDCLTRACK_LEGACY_TOPDIR="
#define LEGACY_RECDIR_ENV_PREFIX "NFSDCLTRACK_LEGACY_RECDIR="
#define HAS_SESSION_ENV_PREFIX "NFSDCLTRACK_CLIENT_HAS_SESSION="
#define GRACE_START_ENV_PREFIX "NFSDCLTRACK_GRACE_START="
1084 
1085 static char *
1086 nfsd4_cltrack_legacy_topdir(void)
1087 {
1088 	int copied;
1089 	size_t len;
1090 	char *result;
1091 
1092 	if (cltrack_legacy_disable)
1093 		return NULL;
1094 
1095 	len = strlen(LEGACY_TOPDIR_ENV_PREFIX) +
1096 		strlen(nfs4_recoverydir()) + 1;
1097 
1098 	result = kmalloc(len, GFP_KERNEL);
1099 	if (!result)
1100 		return result;
1101 
1102 	copied = snprintf(result, len, LEGACY_TOPDIR_ENV_PREFIX "%s",
1103 				nfs4_recoverydir());
1104 	if (copied >= len) {
1105 		/* just return nothing if output was truncated */
1106 		kfree(result);
1107 		return NULL;
1108 	}
1109 
1110 	return result;
1111 }
1112 
1113 static char *
1114 nfsd4_cltrack_legacy_recdir(const struct xdr_netobj *name)
1115 {
1116 	int copied;
1117 	size_t len;
1118 	char *result;
1119 
1120 	if (cltrack_legacy_disable)
1121 		return NULL;
1122 
1123 	/* +1 is for '/' between "topdir" and "recdir" */
1124 	len = strlen(LEGACY_RECDIR_ENV_PREFIX) +
1125 		strlen(nfs4_recoverydir()) + 1 + HEXDIR_LEN;
1126 
1127 	result = kmalloc(len, GFP_KERNEL);
1128 	if (!result)
1129 		return result;
1130 
1131 	copied = snprintf(result, len, LEGACY_RECDIR_ENV_PREFIX "%s/",
1132 				nfs4_recoverydir());
1133 	if (copied > (len - HEXDIR_LEN)) {
1134 		/* just return nothing if output will be truncated */
1135 		kfree(result);
1136 		return NULL;
1137 	}
1138 
1139 	copied = nfs4_make_rec_clidname(result + copied, name);
1140 	if (copied) {
1141 		kfree(result);
1142 		return NULL;
1143 	}
1144 
1145 	return result;
1146 }
1147 
1148 static char *
1149 nfsd4_cltrack_client_has_session(struct nfs4_client *clp)
1150 {
1151 	int copied;
1152 	size_t len;
1153 	char *result;
1154 
1155 	/* prefix + Y/N character + terminating NULL */
1156 	len = strlen(HAS_SESSION_ENV_PREFIX) + 1 + 1;
1157 
1158 	result = kmalloc(len, GFP_KERNEL);
1159 	if (!result)
1160 		return result;
1161 
1162 	copied = snprintf(result, len, HAS_SESSION_ENV_PREFIX "%c",
1163 				clp->cl_minorversion ? 'Y' : 'N');
1164 	if (copied >= len) {
1165 		/* just return nothing if output was truncated */
1166 		kfree(result);
1167 		return NULL;
1168 	}
1169 
1170 	return result;
1171 }
1172 
1173 static char *
1174 nfsd4_cltrack_grace_start(time_t grace_start)
1175 {
1176 	int copied;
1177 	size_t len;
1178 	char *result;
1179 
1180 	/* prefix + max width of int64_t string + terminating NULL */
1181 	len = strlen(GRACE_START_ENV_PREFIX) + 22 + 1;
1182 
1183 	result = kmalloc(len, GFP_KERNEL);
1184 	if (!result)
1185 		return result;
1186 
1187 	copied = snprintf(result, len, GRACE_START_ENV_PREFIX "%ld",
1188 				grace_start);
1189 	if (copied >= len) {
1190 		/* just return nothing if output was truncated */
1191 		kfree(result);
1192 		return NULL;
1193 	}
1194 
1195 	return result;
1196 }
1197 
1198 static int
1199 nfsd4_umh_cltrack_upcall(char *cmd, char *arg, char *env0, char *env1)
1200 {
1201 	char *envp[3];
1202 	char *argv[4];
1203 	int ret;
1204 
1205 	if (unlikely(!cltrack_prog[0])) {
1206 		dprintk("%s: cltrack_prog is disabled\n", __func__);
1207 		return -EACCES;
1208 	}
1209 
1210 	dprintk("%s: cmd: %s\n", __func__, cmd);
1211 	dprintk("%s: arg: %s\n", __func__, arg ? arg : "(null)");
1212 	dprintk("%s: env0: %s\n", __func__, env0 ? env0 : "(null)");
1213 	dprintk("%s: env1: %s\n", __func__, env1 ? env1 : "(null)");
1214 
1215 	envp[0] = env0;
1216 	envp[1] = env1;
1217 	envp[2] = NULL;
1218 
1219 	argv[0] = (char *)cltrack_prog;
1220 	argv[1] = cmd;
1221 	argv[2] = arg;
1222 	argv[3] = NULL;
1223 
1224 	ret = call_usermodehelper(argv[0], argv, envp, UMH_WAIT_PROC);
1225 	/*
1226 	 * Disable the upcall mechanism if we're getting an ENOENT or EACCES
1227 	 * error. The admin can re-enable it on the fly by using sysfs
1228 	 * once the problem has been fixed.
1229 	 */
1230 	if (ret == -ENOENT || ret == -EACCES) {
1231 		dprintk("NFSD: %s was not found or isn't executable (%d). "
1232 			"Setting cltrack_prog to blank string!",
1233 			cltrack_prog, ret);
1234 		cltrack_prog[0] = '\0';
1235 	}
1236 	dprintk("%s: %s return value: %d\n", __func__, cltrack_prog, ret);
1237 
1238 	return ret;
1239 }
1240 
1241 static char *
1242 bin_to_hex_dup(const unsigned char *src, int srclen)
1243 {
1244 	int i;
1245 	char *buf, *hex;
1246 
1247 	/* +1 for terminating NULL */
1248 	buf = kmalloc((srclen * 2) + 1, GFP_KERNEL);
1249 	if (!buf)
1250 		return buf;
1251 
1252 	hex = buf;
1253 	for (i = 0; i < srclen; i++) {
1254 		sprintf(hex, "%2.2x", *src++);
1255 		hex += 2;
1256 	}
1257 	return buf;
1258 }
1259 
1260 static int
1261 nfsd4_umh_cltrack_init(struct net *net)
1262 {
1263 	int ret;
1264 	struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1265 	char *grace_start = nfsd4_cltrack_grace_start(nn->boot_time);
1266 
1267 	/* XXX: The usermode helper s not working in container yet. */
1268 	if (net != &init_net) {
1269 		pr_warn("NFSD: attempt to initialize umh client tracking in a container ignored.\n");
1270 		kfree(grace_start);
1271 		return -EINVAL;
1272 	}
1273 
1274 	ret = nfsd4_umh_cltrack_upcall("init", NULL, grace_start, NULL);
1275 	kfree(grace_start);
1276 	return ret;
1277 }
1278 
/*
 * Take the per-client upcall lock: wait, uninterruptibly, until the
 * NFSD4_CLIENT_UPCALL_LOCK bit in clp->cl_flags can be acquired.
 * The create, remove and check upcalls in this file run between this and
 * nfsd4_cltrack_upcall_unlock().
 */
static void
nfsd4_cltrack_upcall_lock(struct nfs4_client *clp)
{
	wait_on_bit_lock(&clp->cl_flags, NFSD4_CLIENT_UPCALL_LOCK,
			 TASK_UNINTERRUPTIBLE);
}
1285 
/*
 * Release the per-client upcall lock: clear the NFSD4_CLIENT_UPCALL_LOCK
 * bit in clp->cl_flags and wake anyone waiting on it.
 */
static void
nfsd4_cltrack_upcall_unlock(struct nfs4_client *clp)
{
	/* barriers on both sides of the clear, issued before waking waiters */
	smp_mb__before_atomic();
	clear_bit(NFSD4_CLIENT_UPCALL_LOCK, &clp->cl_flags);
	smp_mb__after_atomic();
	wake_up_bit(&clp->cl_flags, NFSD4_CLIENT_UPCALL_LOCK);
}
1294 
1295 static void
1296 nfsd4_umh_cltrack_create(struct nfs4_client *clp)
1297 {
1298 	char *hexid, *has_session, *grace_start;
1299 	struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
1300 
1301 	/*
1302 	 * With v4.0 clients, there's little difference in outcome between a
1303 	 * create and check operation, and we can end up calling into this
1304 	 * function multiple times per client (once for each openowner). So,
1305 	 * for v4.0 clients skip upcalling once the client has been recorded
1306 	 * on stable storage.
1307 	 *
1308 	 * For v4.1+ clients, the outcome of the two operations is different,
1309 	 * so we must ensure that we upcall for the create operation. v4.1+
1310 	 * clients call this on RECLAIM_COMPLETE though, so we should only end
1311 	 * up doing a single create upcall per client.
1312 	 */
1313 	if (clp->cl_minorversion == 0 &&
1314 	    test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
1315 		return;
1316 
1317 	hexid = bin_to_hex_dup(clp->cl_name.data, clp->cl_name.len);
1318 	if (!hexid) {
1319 		dprintk("%s: can't allocate memory for upcall!\n", __func__);
1320 		return;
1321 	}
1322 
1323 	has_session = nfsd4_cltrack_client_has_session(clp);
1324 	grace_start = nfsd4_cltrack_grace_start(nn->boot_time);
1325 
1326 	nfsd4_cltrack_upcall_lock(clp);
1327 	if (!nfsd4_umh_cltrack_upcall("create", hexid, has_session, grace_start))
1328 		set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
1329 	nfsd4_cltrack_upcall_unlock(clp);
1330 
1331 	kfree(has_session);
1332 	kfree(grace_start);
1333 	kfree(hexid);
1334 }
1335 
1336 static void
1337 nfsd4_umh_cltrack_remove(struct nfs4_client *clp)
1338 {
1339 	char *hexid;
1340 
1341 	if (!test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
1342 		return;
1343 
1344 	hexid = bin_to_hex_dup(clp->cl_name.data, clp->cl_name.len);
1345 	if (!hexid) {
1346 		dprintk("%s: can't allocate memory for upcall!\n", __func__);
1347 		return;
1348 	}
1349 
1350 	nfsd4_cltrack_upcall_lock(clp);
1351 	if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags) &&
1352 	    nfsd4_umh_cltrack_upcall("remove", hexid, NULL, NULL) == 0)
1353 		clear_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
1354 	nfsd4_cltrack_upcall_unlock(clp);
1355 
1356 	kfree(hexid);
1357 }
1358 
1359 static int
1360 nfsd4_umh_cltrack_check(struct nfs4_client *clp)
1361 {
1362 	int ret;
1363 	char *hexid, *has_session, *legacy;
1364 
1365 	if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
1366 		return 0;
1367 
1368 	hexid = bin_to_hex_dup(clp->cl_name.data, clp->cl_name.len);
1369 	if (!hexid) {
1370 		dprintk("%s: can't allocate memory for upcall!\n", __func__);
1371 		return -ENOMEM;
1372 	}
1373 
1374 	has_session = nfsd4_cltrack_client_has_session(clp);
1375 	legacy = nfsd4_cltrack_legacy_recdir(&clp->cl_name);
1376 
1377 	nfsd4_cltrack_upcall_lock(clp);
1378 	if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags)) {
1379 		ret = 0;
1380 	} else {
1381 		ret = nfsd4_umh_cltrack_upcall("check", hexid, has_session, legacy);
1382 		if (ret == 0)
1383 			set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
1384 	}
1385 	nfsd4_cltrack_upcall_unlock(clp);
1386 	kfree(has_session);
1387 	kfree(legacy);
1388 	kfree(hexid);
1389 
1390 	return ret;
1391 }
1392 
1393 static void
1394 nfsd4_umh_cltrack_grace_done(struct nfsd_net *nn)
1395 {
1396 	char *legacy;
1397 	char timestr[22]; /* FIXME: better way to determine max size? */
1398 
1399 	sprintf(timestr, "%ld", nn->boot_time);
1400 	legacy = nfsd4_cltrack_legacy_topdir();
1401 	nfsd4_umh_cltrack_upcall("gracedone", timestr, legacy, NULL);
1402 	kfree(legacy);
1403 }
1404 
/*
 * Client tracking operations backed by the usermode helper upcall.
 * There is no exit hook; nfsd4_client_tracking_exit() skips a NULL .exit.
 */
static const struct nfsd4_client_tracking_ops nfsd4_umh_tracking_ops = {
	.init		= nfsd4_umh_cltrack_init,
	.exit		= NULL,
	.create		= nfsd4_umh_cltrack_create,
	.remove		= nfsd4_umh_cltrack_remove,
	.check		= nfsd4_umh_cltrack_check,
	.grace_done	= nfsd4_umh_cltrack_grace_done,
};
1413 
1414 int
1415 nfsd4_client_tracking_init(struct net *net)
1416 {
1417 	int status;
1418 	struct path path;
1419 	struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1420 
1421 	/* just run the init if it the method is already decided */
1422 	if (nn->client_tracking_ops)
1423 		goto do_init;
1424 
1425 	/*
1426 	 * First, try a UMH upcall. It should succeed or fail quickly, so
1427 	 * there's little harm in trying that first.
1428 	 */
1429 	nn->client_tracking_ops = &nfsd4_umh_tracking_ops;
1430 	status = nn->client_tracking_ops->init(net);
1431 	if (!status)
1432 		return status;
1433 
1434 	/*
1435 	 * See if the recoverydir exists and is a directory. If it is,
1436 	 * then use the legacy ops.
1437 	 */
1438 	nn->client_tracking_ops = &nfsd4_legacy_tracking_ops;
1439 	status = kern_path(nfs4_recoverydir(), LOOKUP_FOLLOW, &path);
1440 	if (!status) {
1441 		status = d_is_dir(path.dentry);
1442 		path_put(&path);
1443 		if (status)
1444 			goto do_init;
1445 	}
1446 
1447 	/* Finally, try to use nfsdcld */
1448 	nn->client_tracking_ops = &nfsd4_cld_tracking_ops;
1449 	printk(KERN_WARNING "NFSD: the nfsdcld client tracking upcall will be "
1450 			"removed in 3.10. Please transition to using "
1451 			"nfsdcltrack.\n");
1452 do_init:
1453 	status = nn->client_tracking_ops->init(net);
1454 	if (status) {
1455 		printk(KERN_WARNING "NFSD: Unable to initialize client "
1456 				    "recovery tracking! (%d)\n", status);
1457 		nn->client_tracking_ops = NULL;
1458 	}
1459 	return status;
1460 }
1461 
1462 void
1463 nfsd4_client_tracking_exit(struct net *net)
1464 {
1465 	struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1466 
1467 	if (nn->client_tracking_ops) {
1468 		if (nn->client_tracking_ops->exit)
1469 			nn->client_tracking_ops->exit(net);
1470 		nn->client_tracking_ops = NULL;
1471 	}
1472 }
1473 
1474 void
1475 nfsd4_client_record_create(struct nfs4_client *clp)
1476 {
1477 	struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
1478 
1479 	if (nn->client_tracking_ops)
1480 		nn->client_tracking_ops->create(clp);
1481 }
1482 
1483 void
1484 nfsd4_client_record_remove(struct nfs4_client *clp)
1485 {
1486 	struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
1487 
1488 	if (nn->client_tracking_ops)
1489 		nn->client_tracking_ops->remove(clp);
1490 }
1491 
1492 int
1493 nfsd4_client_record_check(struct nfs4_client *clp)
1494 {
1495 	struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
1496 
1497 	if (nn->client_tracking_ops)
1498 		return nn->client_tracking_ops->check(clp);
1499 
1500 	return -EOPNOTSUPP;
1501 }
1502 
1503 void
1504 nfsd4_record_grace_done(struct nfsd_net *nn)
1505 {
1506 	if (nn->client_tracking_ops)
1507 		nn->client_tracking_ops->grace_done(nn);
1508 }
1509 
1510 static int
1511 rpc_pipefs_event(struct notifier_block *nb, unsigned long event, void *ptr)
1512 {
1513 	struct super_block *sb = ptr;
1514 	struct net *net = sb->s_fs_info;
1515 	struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1516 	struct cld_net *cn = nn->cld_net;
1517 	struct dentry *dentry;
1518 	int ret = 0;
1519 
1520 	if (!try_module_get(THIS_MODULE))
1521 		return 0;
1522 
1523 	if (!cn) {
1524 		module_put(THIS_MODULE);
1525 		return 0;
1526 	}
1527 
1528 	switch (event) {
1529 	case RPC_PIPEFS_MOUNT:
1530 		dentry = nfsd4_cld_register_sb(sb, cn->cn_pipe);
1531 		if (IS_ERR(dentry)) {
1532 			ret = PTR_ERR(dentry);
1533 			break;
1534 		}
1535 		cn->cn_pipe->dentry = dentry;
1536 		break;
1537 	case RPC_PIPEFS_UMOUNT:
1538 		if (cn->cn_pipe->dentry)
1539 			nfsd4_cld_unregister_sb(cn->cn_pipe);
1540 		break;
1541 	default:
1542 		ret = -ENOTSUPP;
1543 		break;
1544 	}
1545 	module_put(THIS_MODULE);
1546 	return ret;
1547 }
1548 
/* Notifier block that routes rpc_pipefs events to rpc_pipefs_event(). */
static struct notifier_block nfsd4_cld_block = {
	.notifier_call = rpc_pipefs_event,
};
1552 
/*
 * Register nfsd4_cld_block with the rpc_pipefs notifier chain.
 * Returns the result of rpc_pipefs_notifier_register().
 */
int
register_cld_notifier(void)
{
	return rpc_pipefs_notifier_register(&nfsd4_cld_block);
}
1558 
/* Remove nfsd4_cld_block from the rpc_pipefs notifier chain. */
void
unregister_cld_notifier(void)
{
	rpc_pipefs_notifier_unregister(&nfsd4_cld_block);
}
1564