Linux 3.12.28
[linux/fpc-iii.git] / fs / nfsd / nfs4recover.c
blobe0a65a9e37e97ac1a8702a48487349d599be4aab
1 /*
2 * Copyright (c) 2004 The Regents of the University of Michigan.
3 * Copyright (c) 2012 Jeff Layton <jlayton@redhat.com>
4 * All rights reserved.
6 * Andy Adamson <andros@citi.umich.edu>
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
10 * are met:
12 * 1. Redistributions of source code must retain the above copyright
13 * notice, this list of conditions and the following disclaimer.
14 * 2. Redistributions in binary form must reproduce the above copyright
15 * notice, this list of conditions and the following disclaimer in the
16 * documentation and/or other materials provided with the distribution.
17 * 3. Neither the name of the University nor the names of its
18 * contributors may be used to endorse or promote products derived
19 * from this software without specific prior written permission.
21 * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
22 * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
23 * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
24 * DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
25 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
26 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
27 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
28 * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
29 * LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
30 * NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
31 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
35 #include <linux/file.h>
36 #include <linux/slab.h>
37 #include <linux/namei.h>
38 #include <linux/crypto.h>
39 #include <linux/sched.h>
40 #include <linux/fs.h>
41 #include <linux/module.h>
42 #include <net/net_namespace.h>
43 #include <linux/sunrpc/rpc_pipe_fs.h>
44 #include <linux/sunrpc/clnt.h>
45 #include <linux/nfsd/cld.h>
47 #include "nfsd.h"
48 #include "state.h"
49 #include "vfs.h"
50 #include "netns.h"
52 #define NFSDDBG_FACILITY NFSDDBG_PROC
54 /* Declarations */
55 struct nfsd4_client_tracking_ops {
56 int (*init)(struct net *);
57 void (*exit)(struct net *);
58 void (*create)(struct nfs4_client *);
59 void (*remove)(struct nfs4_client *);
60 int (*check)(struct nfs4_client *);
61 void (*grace_done)(struct nfsd_net *, time_t);
64 /* Globals */
65 static char user_recovery_dirname[PATH_MAX] = "/var/lib/nfs/v4recovery";
67 static int
68 nfs4_save_creds(const struct cred **original_creds)
70 struct cred *new;
72 new = prepare_creds();
73 if (!new)
74 return -ENOMEM;
76 new->fsuid = GLOBAL_ROOT_UID;
77 new->fsgid = GLOBAL_ROOT_GID;
78 *original_creds = override_creds(new);
79 put_cred(new);
80 return 0;
/*
 * Restore the credentials that nfs4_save_creds() returned in its
 * original_creds argument.
 */
static void
nfs4_reset_creds(const struct cred *original)
{
	revert_creds(original);
}
/*
 * Render the 16 bytes at @md5 as 32 lowercase hexadecimal characters
 * followed by a terminating NUL.  @out must have room for 33 bytes.
 */
static void
md5_to_hex(char *out, char *md5)
{
	static const char hexdigits[] = "0123456789abcdef";
	int idx;

	for (idx = 0; idx < 16; idx++) {
		unsigned char byte = md5[idx];

		*out++ = hexdigits[byte >> 4];
		*out++ = hexdigits[byte & 0x0f];
	}
	*out = '\0';
}
103 static int
104 nfs4_make_rec_clidname(char *dname, const struct xdr_netobj *clname)
106 struct xdr_netobj cksum;
107 struct hash_desc desc;
108 struct scatterlist sg;
109 int status;
111 dprintk("NFSD: nfs4_make_rec_clidname for %.*s\n",
112 clname->len, clname->data);
113 desc.flags = CRYPTO_TFM_REQ_MAY_SLEEP;
114 desc.tfm = crypto_alloc_hash("md5", 0, CRYPTO_ALG_ASYNC);
115 if (IS_ERR(desc.tfm)) {
116 status = PTR_ERR(desc.tfm);
117 goto out_no_tfm;
120 cksum.len = crypto_hash_digestsize(desc.tfm);
121 cksum.data = kmalloc(cksum.len, GFP_KERNEL);
122 if (cksum.data == NULL) {
123 status = -ENOMEM;
124 goto out;
127 sg_init_one(&sg, clname->data, clname->len);
129 status = crypto_hash_digest(&desc, &sg, sg.length, cksum.data);
130 if (status)
131 goto out;
133 md5_to_hex(dname, cksum.data);
135 status = 0;
136 out:
137 kfree(cksum.data);
138 crypto_free_hash(desc.tfm);
139 out_no_tfm:
140 return status;
144 * If we had an error generating the recdir name for the legacy tracker
145 * then warn the admin. If the error doesn't appear to be transient,
146 * then disable recovery tracking.
148 static void
149 legacy_recdir_name_error(struct nfs4_client *clp, int error)
151 printk(KERN_ERR "NFSD: unable to generate recoverydir "
152 "name (%d).\n", error);
155 * if the algorithm just doesn't exist, then disable the recovery
156 * tracker altogether. The crypto libs will generally return this if
157 * FIPS is enabled as well.
159 if (error == -ENOENT) {
160 printk(KERN_ERR "NFSD: disabling legacy clientid tracking. "
161 "Reboot recovery will not function correctly!\n");
162 nfsd4_client_tracking_exit(clp->net);
166 static void
167 nfsd4_create_clid_dir(struct nfs4_client *clp)
169 const struct cred *original_cred;
170 char dname[HEXDIR_LEN];
171 struct dentry *dir, *dentry;
172 struct nfs4_client_reclaim *crp;
173 int status;
174 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
176 if (test_and_set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
177 return;
178 if (!nn->rec_file)
179 return;
181 status = nfs4_make_rec_clidname(dname, &clp->cl_name);
182 if (status)
183 return legacy_recdir_name_error(clp, status);
185 status = nfs4_save_creds(&original_cred);
186 if (status < 0)
187 return;
189 status = mnt_want_write_file(nn->rec_file);
190 if (status)
191 return;
193 dir = nn->rec_file->f_path.dentry;
194 /* lock the parent */
195 mutex_lock(&dir->d_inode->i_mutex);
197 dentry = lookup_one_len(dname, dir, HEXDIR_LEN-1);
198 if (IS_ERR(dentry)) {
199 status = PTR_ERR(dentry);
200 goto out_unlock;
202 if (dentry->d_inode)
204 * In the 4.1 case, where we're called from
205 * reclaim_complete(), records from the previous reboot
206 * may still be left, so this is OK.
208 * In the 4.0 case, we should never get here; but we may
209 * as well be forgiving and just succeed silently.
211 goto out_put;
212 status = vfs_mkdir(dir->d_inode, dentry, S_IRWXU);
213 out_put:
214 dput(dentry);
215 out_unlock:
216 mutex_unlock(&dir->d_inode->i_mutex);
217 if (status == 0) {
218 if (nn->in_grace) {
219 crp = nfs4_client_to_reclaim(dname, nn);
220 if (crp)
221 crp->cr_clp = clp;
223 vfs_fsync(nn->rec_file, 0);
224 } else {
225 printk(KERN_ERR "NFSD: failed to write recovery record"
226 " (err %d); please check that %s exists"
227 " and is writeable", status,
228 user_recovery_dirname);
230 mnt_drop_write_file(nn->rec_file);
231 nfs4_reset_creds(original_cred);
/*
 * Callback invoked by nfsd4_list_rec_dir() for each recovery directory
 * entry: (parent dentry, child dentry, per-net nfsd state).  A non-zero
 * return stops further callbacks.
 */
typedef int (recdir_func)(struct dentry *, struct dentry *, struct nfsd_net *);
236 struct name_list {
237 char name[HEXDIR_LEN];
238 struct list_head list;
241 struct nfs4_dir_ctx {
242 struct dir_context ctx;
243 struct list_head names;
246 static int
247 nfsd4_build_namelist(void *arg, const char *name, int namlen,
248 loff_t offset, u64 ino, unsigned int d_type)
250 struct nfs4_dir_ctx *ctx = arg;
251 struct name_list *entry;
253 if (namlen != HEXDIR_LEN - 1)
254 return 0;
255 entry = kmalloc(sizeof(struct name_list), GFP_KERNEL);
256 if (entry == NULL)
257 return -ENOMEM;
258 memcpy(entry->name, name, HEXDIR_LEN - 1);
259 entry->name[HEXDIR_LEN - 1] = '\0';
260 list_add(&entry->list, &ctx->names);
261 return 0;
264 static int
265 nfsd4_list_rec_dir(recdir_func *f, struct nfsd_net *nn)
267 const struct cred *original_cred;
268 struct dentry *dir = nn->rec_file->f_path.dentry;
269 struct nfs4_dir_ctx ctx = {
270 .ctx.actor = nfsd4_build_namelist,
271 .names = LIST_HEAD_INIT(ctx.names)
273 int status;
275 status = nfs4_save_creds(&original_cred);
276 if (status < 0)
277 return status;
279 status = vfs_llseek(nn->rec_file, 0, SEEK_SET);
280 if (status < 0) {
281 nfs4_reset_creds(original_cred);
282 return status;
285 status = iterate_dir(nn->rec_file, &ctx.ctx);
286 mutex_lock_nested(&dir->d_inode->i_mutex, I_MUTEX_PARENT);
287 while (!list_empty(&ctx.names)) {
288 struct name_list *entry;
289 entry = list_entry(ctx.names.next, struct name_list, list);
290 if (!status) {
291 struct dentry *dentry;
292 dentry = lookup_one_len(entry->name, dir, HEXDIR_LEN-1);
293 if (IS_ERR(dentry)) {
294 status = PTR_ERR(dentry);
295 break;
297 status = f(dir, dentry, nn);
298 dput(dentry);
300 list_del(&entry->list);
301 kfree(entry);
303 mutex_unlock(&dir->d_inode->i_mutex);
304 nfs4_reset_creds(original_cred);
305 return status;
308 static int
309 nfsd4_unlink_clid_dir(char *name, int namlen, struct nfsd_net *nn)
311 struct dentry *dir, *dentry;
312 int status;
314 dprintk("NFSD: nfsd4_unlink_clid_dir. name %.*s\n", namlen, name);
316 dir = nn->rec_file->f_path.dentry;
317 mutex_lock_nested(&dir->d_inode->i_mutex, I_MUTEX_PARENT);
318 dentry = lookup_one_len(name, dir, namlen);
319 if (IS_ERR(dentry)) {
320 status = PTR_ERR(dentry);
321 goto out_unlock;
323 status = -ENOENT;
324 if (!dentry->d_inode)
325 goto out;
326 status = vfs_rmdir(dir->d_inode, dentry);
327 out:
328 dput(dentry);
329 out_unlock:
330 mutex_unlock(&dir->d_inode->i_mutex);
331 return status;
334 static void
335 nfsd4_remove_clid_dir(struct nfs4_client *clp)
337 const struct cred *original_cred;
338 struct nfs4_client_reclaim *crp;
339 char dname[HEXDIR_LEN];
340 int status;
341 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
343 if (!nn->rec_file || !test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
344 return;
346 status = nfs4_make_rec_clidname(dname, &clp->cl_name);
347 if (status)
348 return legacy_recdir_name_error(clp, status);
350 status = mnt_want_write_file(nn->rec_file);
351 if (status)
352 goto out;
353 clear_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
355 status = nfs4_save_creds(&original_cred);
356 if (status < 0)
357 goto out_drop_write;
359 status = nfsd4_unlink_clid_dir(dname, HEXDIR_LEN-1, nn);
360 nfs4_reset_creds(original_cred);
361 if (status == 0) {
362 vfs_fsync(nn->rec_file, 0);
363 if (nn->in_grace) {
364 /* remove reclaim record */
365 crp = nfsd4_find_reclaim_client(dname, nn);
366 if (crp)
367 nfs4_remove_reclaim_record(crp, nn);
370 out_drop_write:
371 mnt_drop_write_file(nn->rec_file);
372 out:
373 if (status)
374 printk("NFSD: Failed to remove expired client state directory"
375 " %.*s\n", HEXDIR_LEN, dname);
378 static int
379 purge_old(struct dentry *parent, struct dentry *child, struct nfsd_net *nn)
381 int status;
383 if (nfs4_has_reclaimed_state(child->d_name.name, nn))
384 return 0;
386 status = vfs_rmdir(parent->d_inode, child);
387 if (status)
388 printk("failed to remove client recovery directory %s\n",
389 child->d_name.name);
390 /* Keep trying, success or failure: */
391 return 0;
394 static void
395 nfsd4_recdir_purge_old(struct nfsd_net *nn, time_t boot_time)
397 int status;
399 nn->in_grace = false;
400 if (!nn->rec_file)
401 return;
402 status = mnt_want_write_file(nn->rec_file);
403 if (status)
404 goto out;
405 status = nfsd4_list_rec_dir(purge_old, nn);
406 if (status == 0)
407 vfs_fsync(nn->rec_file, 0);
408 mnt_drop_write_file(nn->rec_file);
409 out:
410 nfs4_release_reclaim(nn);
411 if (status)
412 printk("nfsd4: failed to purge old clients from recovery"
413 " directory %s\n", nn->rec_file->f_path.dentry->d_name.name);
416 static int
417 load_recdir(struct dentry *parent, struct dentry *child, struct nfsd_net *nn)
419 if (child->d_name.len != HEXDIR_LEN - 1) {
420 printk("nfsd4: illegal name %s in recovery directory\n",
421 child->d_name.name);
422 /* Keep trying; maybe the others are OK: */
423 return 0;
425 nfs4_client_to_reclaim(child->d_name.name, nn);
426 return 0;
429 static int
430 nfsd4_recdir_load(struct net *net) {
431 int status;
432 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
434 if (!nn->rec_file)
435 return 0;
437 status = nfsd4_list_rec_dir(load_recdir, nn);
438 if (status)
439 printk("nfsd4: failed loading clients from recovery"
440 " directory %s\n", nn->rec_file->f_path.dentry->d_name.name);
441 return status;
445 * Hold reference to the recovery directory.
448 static int
449 nfsd4_init_recdir(struct net *net)
451 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
452 const struct cred *original_cred;
453 int status;
455 printk("NFSD: Using %s as the NFSv4 state recovery directory\n",
456 user_recovery_dirname);
458 BUG_ON(nn->rec_file);
460 status = nfs4_save_creds(&original_cred);
461 if (status < 0) {
462 printk("NFSD: Unable to change credentials to find recovery"
463 " directory: error %d\n",
464 status);
465 return status;
468 nn->rec_file = filp_open(user_recovery_dirname, O_RDONLY | O_DIRECTORY, 0);
469 if (IS_ERR(nn->rec_file)) {
470 printk("NFSD: unable to find recovery directory %s\n",
471 user_recovery_dirname);
472 status = PTR_ERR(nn->rec_file);
473 nn->rec_file = NULL;
476 nfs4_reset_creds(original_cred);
477 if (!status)
478 nn->in_grace = true;
479 return status;
483 static int
484 nfs4_legacy_state_init(struct net *net)
486 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
487 int i;
489 nn->reclaim_str_hashtbl = kmalloc(sizeof(struct list_head) *
490 CLIENT_HASH_SIZE, GFP_KERNEL);
491 if (!nn->reclaim_str_hashtbl)
492 return -ENOMEM;
494 for (i = 0; i < CLIENT_HASH_SIZE; i++)
495 INIT_LIST_HEAD(&nn->reclaim_str_hashtbl[i]);
496 nn->reclaim_str_hashtbl_size = 0;
498 return 0;
501 static void
502 nfs4_legacy_state_shutdown(struct net *net)
504 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
506 kfree(nn->reclaim_str_hashtbl);
509 static int
510 nfsd4_load_reboot_recovery_data(struct net *net)
512 int status;
514 status = nfsd4_init_recdir(net);
515 if (!status)
516 status = nfsd4_recdir_load(net);
517 if (status)
518 printk(KERN_ERR "NFSD: Failure reading reboot recovery data\n");
519 return status;
522 static int
523 nfsd4_legacy_tracking_init(struct net *net)
525 int status;
527 /* XXX: The legacy code won't work in a container */
528 if (net != &init_net) {
529 WARN(1, KERN_ERR "NFSD: attempt to initialize legacy client "
530 "tracking in a container!\n");
531 return -EINVAL;
534 status = nfs4_legacy_state_init(net);
535 if (status)
536 return status;
538 status = nfsd4_load_reboot_recovery_data(net);
539 if (status)
540 goto err;
541 return 0;
543 err:
544 nfs4_legacy_state_shutdown(net);
545 return status;
548 static void
549 nfsd4_shutdown_recdir(struct nfsd_net *nn)
551 if (!nn->rec_file)
552 return;
553 fput(nn->rec_file);
554 nn->rec_file = NULL;
557 static void
558 nfsd4_legacy_tracking_exit(struct net *net)
560 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
562 nfs4_release_reclaim(nn);
563 nfsd4_shutdown_recdir(nn);
564 nfs4_legacy_state_shutdown(net);
568 * Change the NFSv4 recovery directory to recdir.
571 nfs4_reset_recoverydir(char *recdir)
573 int status;
574 struct path path;
576 status = kern_path(recdir, LOOKUP_FOLLOW, &path);
577 if (status)
578 return status;
579 status = -ENOTDIR;
580 if (S_ISDIR(path.dentry->d_inode->i_mode)) {
581 strcpy(user_recovery_dirname, recdir);
582 status = 0;
584 path_put(&path);
585 return status;
588 char *
589 nfs4_recoverydir(void)
591 return user_recovery_dirname;
594 static int
595 nfsd4_check_legacy_client(struct nfs4_client *clp)
597 int status;
598 char dname[HEXDIR_LEN];
599 struct nfs4_client_reclaim *crp;
600 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
602 /* did we already find that this client is stable? */
603 if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
604 return 0;
606 status = nfs4_make_rec_clidname(dname, &clp->cl_name);
607 if (status) {
608 legacy_recdir_name_error(clp, status);
609 return status;
612 /* look for it in the reclaim hashtable otherwise */
613 crp = nfsd4_find_reclaim_client(dname, nn);
614 if (crp) {
615 set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
616 crp->cr_clp = clp;
617 return 0;
620 return -ENOENT;
623 static struct nfsd4_client_tracking_ops nfsd4_legacy_tracking_ops = {
624 .init = nfsd4_legacy_tracking_init,
625 .exit = nfsd4_legacy_tracking_exit,
626 .create = nfsd4_create_clid_dir,
627 .remove = nfsd4_remove_clid_dir,
628 .check = nfsd4_check_legacy_client,
629 .grace_done = nfsd4_recdir_purge_old,
/* Globals */

/* rpc_pipefs directory and pipe names used for the nfsdcld upcall */
#define NFSD_PIPE_DIR		"nfsd"
#define NFSD_CLD_PIPE		"cld"
636 /* per-net-ns structure for holding cld upcall info */
637 struct cld_net {
638 struct rpc_pipe *cn_pipe;
639 spinlock_t cn_lock;
640 struct list_head cn_list;
641 unsigned int cn_xid;
644 struct cld_upcall {
645 struct list_head cu_list;
646 struct cld_net *cu_net;
647 struct task_struct *cu_task;
648 struct cld_msg cu_msg;
651 static int
652 __cld_pipe_upcall(struct rpc_pipe *pipe, struct cld_msg *cmsg)
654 int ret;
655 struct rpc_pipe_msg msg;
657 memset(&msg, 0, sizeof(msg));
658 msg.data = cmsg;
659 msg.len = sizeof(*cmsg);
662 * Set task state before we queue the upcall. That prevents
663 * wake_up_process in the downcall from racing with schedule.
665 set_current_state(TASK_UNINTERRUPTIBLE);
666 ret = rpc_queue_upcall(pipe, &msg);
667 if (ret < 0) {
668 set_current_state(TASK_RUNNING);
669 goto out;
672 schedule();
673 set_current_state(TASK_RUNNING);
675 if (msg.errno < 0)
676 ret = msg.errno;
677 out:
678 return ret;
681 static int
682 cld_pipe_upcall(struct rpc_pipe *pipe, struct cld_msg *cmsg)
684 int ret;
687 * -EAGAIN occurs when pipe is closed and reopened while there are
688 * upcalls queued.
690 do {
691 ret = __cld_pipe_upcall(pipe, cmsg);
692 } while (ret == -EAGAIN);
694 return ret;
697 static ssize_t
698 cld_pipe_downcall(struct file *filp, const char __user *src, size_t mlen)
700 struct cld_upcall *tmp, *cup;
701 struct cld_msg __user *cmsg = (struct cld_msg __user *)src;
702 uint32_t xid;
703 struct nfsd_net *nn = net_generic(filp->f_dentry->d_sb->s_fs_info,
704 nfsd_net_id);
705 struct cld_net *cn = nn->cld_net;
707 if (mlen != sizeof(*cmsg)) {
708 dprintk("%s: got %zu bytes, expected %zu\n", __func__, mlen,
709 sizeof(*cmsg));
710 return -EINVAL;
713 /* copy just the xid so we can try to find that */
714 if (copy_from_user(&xid, &cmsg->cm_xid, sizeof(xid)) != 0) {
715 dprintk("%s: error when copying xid from userspace", __func__);
716 return -EFAULT;
719 /* walk the list and find corresponding xid */
720 cup = NULL;
721 spin_lock(&cn->cn_lock);
722 list_for_each_entry(tmp, &cn->cn_list, cu_list) {
723 if (get_unaligned(&tmp->cu_msg.cm_xid) == xid) {
724 cup = tmp;
725 list_del_init(&cup->cu_list);
726 break;
729 spin_unlock(&cn->cn_lock);
731 /* couldn't find upcall? */
732 if (!cup) {
733 dprintk("%s: couldn't find upcall -- xid=%u\n", __func__, xid);
734 return -EINVAL;
737 if (copy_from_user(&cup->cu_msg, src, mlen) != 0)
738 return -EFAULT;
740 wake_up_process(cup->cu_task);
741 return mlen;
744 static void
745 cld_pipe_destroy_msg(struct rpc_pipe_msg *msg)
747 struct cld_msg *cmsg = msg->data;
748 struct cld_upcall *cup = container_of(cmsg, struct cld_upcall,
749 cu_msg);
751 /* errno >= 0 means we got a downcall */
752 if (msg->errno >= 0)
753 return;
755 wake_up_process(cup->cu_task);
758 static const struct rpc_pipe_ops cld_upcall_ops = {
759 .upcall = rpc_pipe_generic_upcall,
760 .downcall = cld_pipe_downcall,
761 .destroy_msg = cld_pipe_destroy_msg,
764 static struct dentry *
765 nfsd4_cld_register_sb(struct super_block *sb, struct rpc_pipe *pipe)
767 struct dentry *dir, *dentry;
769 dir = rpc_d_lookup_sb(sb, NFSD_PIPE_DIR);
770 if (dir == NULL)
771 return ERR_PTR(-ENOENT);
772 dentry = rpc_mkpipe_dentry(dir, NFSD_CLD_PIPE, NULL, pipe);
773 dput(dir);
774 return dentry;
777 static void
778 nfsd4_cld_unregister_sb(struct rpc_pipe *pipe)
780 if (pipe->dentry)
781 rpc_unlink(pipe->dentry);
784 static struct dentry *
785 nfsd4_cld_register_net(struct net *net, struct rpc_pipe *pipe)
787 struct super_block *sb;
788 struct dentry *dentry;
790 sb = rpc_get_sb_net(net);
791 if (!sb)
792 return NULL;
793 dentry = nfsd4_cld_register_sb(sb, pipe);
794 rpc_put_sb_net(net);
795 return dentry;
798 static void
799 nfsd4_cld_unregister_net(struct net *net, struct rpc_pipe *pipe)
801 struct super_block *sb;
803 sb = rpc_get_sb_net(net);
804 if (sb) {
805 nfsd4_cld_unregister_sb(pipe);
806 rpc_put_sb_net(net);
810 /* Initialize rpc_pipefs pipe for communication with client tracking daemon */
811 static int
812 nfsd4_init_cld_pipe(struct net *net)
814 int ret;
815 struct dentry *dentry;
816 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
817 struct cld_net *cn;
819 if (nn->cld_net)
820 return 0;
822 cn = kzalloc(sizeof(*cn), GFP_KERNEL);
823 if (!cn) {
824 ret = -ENOMEM;
825 goto err;
828 cn->cn_pipe = rpc_mkpipe_data(&cld_upcall_ops, RPC_PIPE_WAIT_FOR_OPEN);
829 if (IS_ERR(cn->cn_pipe)) {
830 ret = PTR_ERR(cn->cn_pipe);
831 goto err;
833 spin_lock_init(&cn->cn_lock);
834 INIT_LIST_HEAD(&cn->cn_list);
836 dentry = nfsd4_cld_register_net(net, cn->cn_pipe);
837 if (IS_ERR(dentry)) {
838 ret = PTR_ERR(dentry);
839 goto err_destroy_data;
842 cn->cn_pipe->dentry = dentry;
843 nn->cld_net = cn;
844 return 0;
846 err_destroy_data:
847 rpc_destroy_pipe_data(cn->cn_pipe);
848 err:
849 kfree(cn);
850 printk(KERN_ERR "NFSD: unable to create nfsdcld upcall pipe (%d)\n",
851 ret);
852 return ret;
855 static void
856 nfsd4_remove_cld_pipe(struct net *net)
858 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
859 struct cld_net *cn = nn->cld_net;
861 nfsd4_cld_unregister_net(net, cn->cn_pipe);
862 rpc_destroy_pipe_data(cn->cn_pipe);
863 kfree(nn->cld_net);
864 nn->cld_net = NULL;
867 static struct cld_upcall *
868 alloc_cld_upcall(struct cld_net *cn)
870 struct cld_upcall *new, *tmp;
872 new = kzalloc(sizeof(*new), GFP_KERNEL);
873 if (!new)
874 return new;
876 /* FIXME: hard cap on number in flight? */
877 restart_search:
878 spin_lock(&cn->cn_lock);
879 list_for_each_entry(tmp, &cn->cn_list, cu_list) {
880 if (tmp->cu_msg.cm_xid == cn->cn_xid) {
881 cn->cn_xid++;
882 spin_unlock(&cn->cn_lock);
883 goto restart_search;
886 new->cu_task = current;
887 new->cu_msg.cm_vers = CLD_UPCALL_VERSION;
888 put_unaligned(cn->cn_xid++, &new->cu_msg.cm_xid);
889 new->cu_net = cn;
890 list_add(&new->cu_list, &cn->cn_list);
891 spin_unlock(&cn->cn_lock);
893 dprintk("%s: allocated xid %u\n", __func__, new->cu_msg.cm_xid);
895 return new;
898 static void
899 free_cld_upcall(struct cld_upcall *victim)
901 struct cld_net *cn = victim->cu_net;
903 spin_lock(&cn->cn_lock);
904 list_del(&victim->cu_list);
905 spin_unlock(&cn->cn_lock);
906 kfree(victim);
909 /* Ask daemon to create a new record */
910 static void
911 nfsd4_cld_create(struct nfs4_client *clp)
913 int ret;
914 struct cld_upcall *cup;
915 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
916 struct cld_net *cn = nn->cld_net;
918 /* Don't upcall if it's already stored */
919 if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
920 return;
922 cup = alloc_cld_upcall(cn);
923 if (!cup) {
924 ret = -ENOMEM;
925 goto out_err;
928 cup->cu_msg.cm_cmd = Cld_Create;
929 cup->cu_msg.cm_u.cm_name.cn_len = clp->cl_name.len;
930 memcpy(cup->cu_msg.cm_u.cm_name.cn_id, clp->cl_name.data,
931 clp->cl_name.len);
933 ret = cld_pipe_upcall(cn->cn_pipe, &cup->cu_msg);
934 if (!ret) {
935 ret = cup->cu_msg.cm_status;
936 set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
939 free_cld_upcall(cup);
940 out_err:
941 if (ret)
942 printk(KERN_ERR "NFSD: Unable to create client "
943 "record on stable storage: %d\n", ret);
946 /* Ask daemon to create a new record */
947 static void
948 nfsd4_cld_remove(struct nfs4_client *clp)
950 int ret;
951 struct cld_upcall *cup;
952 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
953 struct cld_net *cn = nn->cld_net;
955 /* Don't upcall if it's already removed */
956 if (!test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
957 return;
959 cup = alloc_cld_upcall(cn);
960 if (!cup) {
961 ret = -ENOMEM;
962 goto out_err;
965 cup->cu_msg.cm_cmd = Cld_Remove;
966 cup->cu_msg.cm_u.cm_name.cn_len = clp->cl_name.len;
967 memcpy(cup->cu_msg.cm_u.cm_name.cn_id, clp->cl_name.data,
968 clp->cl_name.len);
970 ret = cld_pipe_upcall(cn->cn_pipe, &cup->cu_msg);
971 if (!ret) {
972 ret = cup->cu_msg.cm_status;
973 clear_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
976 free_cld_upcall(cup);
977 out_err:
978 if (ret)
979 printk(KERN_ERR "NFSD: Unable to remove client "
980 "record from stable storage: %d\n", ret);
983 /* Check for presence of a record, and update its timestamp */
984 static int
985 nfsd4_cld_check(struct nfs4_client *clp)
987 int ret;
988 struct cld_upcall *cup;
989 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
990 struct cld_net *cn = nn->cld_net;
992 /* Don't upcall if one was already stored during this grace pd */
993 if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
994 return 0;
996 cup = alloc_cld_upcall(cn);
997 if (!cup) {
998 printk(KERN_ERR "NFSD: Unable to check client record on "
999 "stable storage: %d\n", -ENOMEM);
1000 return -ENOMEM;
1003 cup->cu_msg.cm_cmd = Cld_Check;
1004 cup->cu_msg.cm_u.cm_name.cn_len = clp->cl_name.len;
1005 memcpy(cup->cu_msg.cm_u.cm_name.cn_id, clp->cl_name.data,
1006 clp->cl_name.len);
1008 ret = cld_pipe_upcall(cn->cn_pipe, &cup->cu_msg);
1009 if (!ret) {
1010 ret = cup->cu_msg.cm_status;
1011 set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
1014 free_cld_upcall(cup);
1015 return ret;
1018 static void
1019 nfsd4_cld_grace_done(struct nfsd_net *nn, time_t boot_time)
1021 int ret;
1022 struct cld_upcall *cup;
1023 struct cld_net *cn = nn->cld_net;
1025 cup = alloc_cld_upcall(cn);
1026 if (!cup) {
1027 ret = -ENOMEM;
1028 goto out_err;
1031 cup->cu_msg.cm_cmd = Cld_GraceDone;
1032 cup->cu_msg.cm_u.cm_gracetime = (int64_t)boot_time;
1033 ret = cld_pipe_upcall(cn->cn_pipe, &cup->cu_msg);
1034 if (!ret)
1035 ret = cup->cu_msg.cm_status;
1037 free_cld_upcall(cup);
1038 out_err:
1039 if (ret)
1040 printk(KERN_ERR "NFSD: Unable to end grace period: %d\n", ret);
1043 static struct nfsd4_client_tracking_ops nfsd4_cld_tracking_ops = {
1044 .init = nfsd4_init_cld_pipe,
1045 .exit = nfsd4_remove_cld_pipe,
1046 .create = nfsd4_cld_create,
1047 .remove = nfsd4_cld_remove,
1048 .check = nfsd4_cld_check,
1049 .grace_done = nfsd4_cld_grace_done,
1052 /* upcall via usermodehelper */
1053 static char cltrack_prog[PATH_MAX] = "/sbin/nfsdcltrack";
1054 module_param_string(cltrack_prog, cltrack_prog, sizeof(cltrack_prog),
1055 S_IRUGO|S_IWUSR);
1056 MODULE_PARM_DESC(cltrack_prog, "Path to the nfsdcltrack upcall program");
1058 static bool cltrack_legacy_disable;
1059 module_param(cltrack_legacy_disable, bool, S_IRUGO|S_IWUSR);
1060 MODULE_PARM_DESC(cltrack_legacy_disable,
1061 "Disable legacy recoverydir conversion. Default: false");
1063 #define LEGACY_TOPDIR_ENV_PREFIX "NFSDCLTRACK_LEGACY_TOPDIR="
1064 #define LEGACY_RECDIR_ENV_PREFIX "NFSDCLTRACK_LEGACY_RECDIR="
1066 static char *
1067 nfsd4_cltrack_legacy_topdir(void)
1069 int copied;
1070 size_t len;
1071 char *result;
1073 if (cltrack_legacy_disable)
1074 return NULL;
1076 len = strlen(LEGACY_TOPDIR_ENV_PREFIX) +
1077 strlen(nfs4_recoverydir()) + 1;
1079 result = kmalloc(len, GFP_KERNEL);
1080 if (!result)
1081 return result;
1083 copied = snprintf(result, len, LEGACY_TOPDIR_ENV_PREFIX "%s",
1084 nfs4_recoverydir());
1085 if (copied >= len) {
1086 /* just return nothing if output was truncated */
1087 kfree(result);
1088 return NULL;
1091 return result;
1094 static char *
1095 nfsd4_cltrack_legacy_recdir(const struct xdr_netobj *name)
1097 int copied;
1098 size_t len;
1099 char *result;
1101 if (cltrack_legacy_disable)
1102 return NULL;
1104 /* +1 is for '/' between "topdir" and "recdir" */
1105 len = strlen(LEGACY_RECDIR_ENV_PREFIX) +
1106 strlen(nfs4_recoverydir()) + 1 + HEXDIR_LEN;
1108 result = kmalloc(len, GFP_KERNEL);
1109 if (!result)
1110 return result;
1112 copied = snprintf(result, len, LEGACY_RECDIR_ENV_PREFIX "%s/",
1113 nfs4_recoverydir());
1114 if (copied > (len - HEXDIR_LEN)) {
1115 /* just return nothing if output will be truncated */
1116 kfree(result);
1117 return NULL;
1120 copied = nfs4_make_rec_clidname(result + copied, name);
1121 if (copied) {
1122 kfree(result);
1123 return NULL;
1126 return result;
1129 static int
1130 nfsd4_umh_cltrack_upcall(char *cmd, char *arg, char *legacy)
1132 char *envp[2];
1133 char *argv[4];
1134 int ret;
1136 if (unlikely(!cltrack_prog[0])) {
1137 dprintk("%s: cltrack_prog is disabled\n", __func__);
1138 return -EACCES;
1141 dprintk("%s: cmd: %s\n", __func__, cmd);
1142 dprintk("%s: arg: %s\n", __func__, arg ? arg : "(null)");
1143 dprintk("%s: legacy: %s\n", __func__, legacy ? legacy : "(null)");
1145 envp[0] = legacy;
1146 envp[1] = NULL;
1148 argv[0] = (char *)cltrack_prog;
1149 argv[1] = cmd;
1150 argv[2] = arg;
1151 argv[3] = NULL;
1153 ret = call_usermodehelper(argv[0], argv, envp, UMH_WAIT_PROC);
1155 * Disable the upcall mechanism if we're getting an ENOENT or EACCES
1156 * error. The admin can re-enable it on the fly by using sysfs
1157 * once the problem has been fixed.
1159 if (ret == -ENOENT || ret == -EACCES) {
1160 dprintk("NFSD: %s was not found or isn't executable (%d). "
1161 "Setting cltrack_prog to blank string!",
1162 cltrack_prog, ret);
1163 cltrack_prog[0] = '\0';
1165 dprintk("%s: %s return value: %d\n", __func__, cltrack_prog, ret);
1167 return ret;
1170 static char *
1171 bin_to_hex_dup(const unsigned char *src, int srclen)
1173 int i;
1174 char *buf, *hex;
1176 /* +1 for terminating NULL */
1177 buf = kmalloc((srclen * 2) + 1, GFP_KERNEL);
1178 if (!buf)
1179 return buf;
1181 hex = buf;
1182 for (i = 0; i < srclen; i++) {
1183 sprintf(hex, "%2.2x", *src++);
1184 hex += 2;
1186 return buf;
1189 static int
1190 nfsd4_umh_cltrack_init(struct net __attribute__((unused)) *net)
1192 /* XXX: The usermode helper s not working in container yet. */
1193 if (net != &init_net) {
1194 WARN(1, KERN_ERR "NFSD: attempt to initialize umh client "
1195 "tracking in a container!\n");
1196 return -EINVAL;
1198 return nfsd4_umh_cltrack_upcall("init", NULL, NULL);
1201 static void
1202 nfsd4_umh_cltrack_create(struct nfs4_client *clp)
1204 char *hexid;
1206 hexid = bin_to_hex_dup(clp->cl_name.data, clp->cl_name.len);
1207 if (!hexid) {
1208 dprintk("%s: can't allocate memory for upcall!\n", __func__);
1209 return;
1211 nfsd4_umh_cltrack_upcall("create", hexid, NULL);
1212 kfree(hexid);
1215 static void
1216 nfsd4_umh_cltrack_remove(struct nfs4_client *clp)
1218 char *hexid;
1220 hexid = bin_to_hex_dup(clp->cl_name.data, clp->cl_name.len);
1221 if (!hexid) {
1222 dprintk("%s: can't allocate memory for upcall!\n", __func__);
1223 return;
1225 nfsd4_umh_cltrack_upcall("remove", hexid, NULL);
1226 kfree(hexid);
1229 static int
1230 nfsd4_umh_cltrack_check(struct nfs4_client *clp)
1232 int ret;
1233 char *hexid, *legacy;
1235 hexid = bin_to_hex_dup(clp->cl_name.data, clp->cl_name.len);
1236 if (!hexid) {
1237 dprintk("%s: can't allocate memory for upcall!\n", __func__);
1238 return -ENOMEM;
1240 legacy = nfsd4_cltrack_legacy_recdir(&clp->cl_name);
1241 ret = nfsd4_umh_cltrack_upcall("check", hexid, legacy);
1242 kfree(legacy);
1243 kfree(hexid);
1244 return ret;
1247 static void
1248 nfsd4_umh_cltrack_grace_done(struct nfsd_net __attribute__((unused)) *nn,
1249 time_t boot_time)
1251 char *legacy;
1252 char timestr[22]; /* FIXME: better way to determine max size? */
1254 sprintf(timestr, "%ld", boot_time);
1255 legacy = nfsd4_cltrack_legacy_topdir();
1256 nfsd4_umh_cltrack_upcall("gracedone", timestr, legacy);
1257 kfree(legacy);
1260 static struct nfsd4_client_tracking_ops nfsd4_umh_tracking_ops = {
1261 .init = nfsd4_umh_cltrack_init,
1262 .exit = NULL,
1263 .create = nfsd4_umh_cltrack_create,
1264 .remove = nfsd4_umh_cltrack_remove,
1265 .check = nfsd4_umh_cltrack_check,
1266 .grace_done = nfsd4_umh_cltrack_grace_done,
1270 nfsd4_client_tracking_init(struct net *net)
1272 int status;
1273 struct path path;
1274 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1276 /* just run the init if it the method is already decided */
1277 if (nn->client_tracking_ops)
1278 goto do_init;
1281 * First, try a UMH upcall. It should succeed or fail quickly, so
1282 * there's little harm in trying that first.
1284 nn->client_tracking_ops = &nfsd4_umh_tracking_ops;
1285 status = nn->client_tracking_ops->init(net);
1286 if (!status)
1287 return status;
1290 * See if the recoverydir exists and is a directory. If it is,
1291 * then use the legacy ops.
1293 nn->client_tracking_ops = &nfsd4_legacy_tracking_ops;
1294 status = kern_path(nfs4_recoverydir(), LOOKUP_FOLLOW, &path);
1295 if (!status) {
1296 status = S_ISDIR(path.dentry->d_inode->i_mode);
1297 path_put(&path);
1298 if (status)
1299 goto do_init;
1302 /* Finally, try to use nfsdcld */
1303 nn->client_tracking_ops = &nfsd4_cld_tracking_ops;
1304 printk(KERN_WARNING "NFSD: the nfsdcld client tracking upcall will be "
1305 "removed in 3.10. Please transition to using "
1306 "nfsdcltrack.\n");
1307 do_init:
1308 status = nn->client_tracking_ops->init(net);
1309 if (status) {
1310 printk(KERN_WARNING "NFSD: Unable to initialize client "
1311 "recovery tracking! (%d)\n", status);
1312 nn->client_tracking_ops = NULL;
1314 return status;
1317 void
1318 nfsd4_client_tracking_exit(struct net *net)
1320 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1322 if (nn->client_tracking_ops) {
1323 if (nn->client_tracking_ops->exit)
1324 nn->client_tracking_ops->exit(net);
1325 nn->client_tracking_ops = NULL;
1329 void
1330 nfsd4_client_record_create(struct nfs4_client *clp)
1332 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
1334 if (nn->client_tracking_ops)
1335 nn->client_tracking_ops->create(clp);
1338 void
1339 nfsd4_client_record_remove(struct nfs4_client *clp)
1341 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
1343 if (nn->client_tracking_ops)
1344 nn->client_tracking_ops->remove(clp);
1348 nfsd4_client_record_check(struct nfs4_client *clp)
1350 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
1352 if (nn->client_tracking_ops)
1353 return nn->client_tracking_ops->check(clp);
1355 return -EOPNOTSUPP;
1358 void
1359 nfsd4_record_grace_done(struct nfsd_net *nn, time_t boot_time)
1361 if (nn->client_tracking_ops)
1362 nn->client_tracking_ops->grace_done(nn, boot_time);
1365 static int
1366 rpc_pipefs_event(struct notifier_block *nb, unsigned long event, void *ptr)
1368 struct super_block *sb = ptr;
1369 struct net *net = sb->s_fs_info;
1370 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1371 struct cld_net *cn = nn->cld_net;
1372 struct dentry *dentry;
1373 int ret = 0;
1375 if (!try_module_get(THIS_MODULE))
1376 return 0;
1378 if (!cn) {
1379 module_put(THIS_MODULE);
1380 return 0;
1383 switch (event) {
1384 case RPC_PIPEFS_MOUNT:
1385 dentry = nfsd4_cld_register_sb(sb, cn->cn_pipe);
1386 if (IS_ERR(dentry)) {
1387 ret = PTR_ERR(dentry);
1388 break;
1390 cn->cn_pipe->dentry = dentry;
1391 break;
1392 case RPC_PIPEFS_UMOUNT:
1393 if (cn->cn_pipe->dentry)
1394 nfsd4_cld_unregister_sb(cn->cn_pipe);
1395 break;
1396 default:
1397 ret = -ENOTSUPP;
1398 break;
1400 module_put(THIS_MODULE);
1401 return ret;
1404 static struct notifier_block nfsd4_cld_block = {
1405 .notifier_call = rpc_pipefs_event,
1409 register_cld_notifier(void)
1411 return rpc_pipefs_notifier_register(&nfsd4_cld_block);
1414 void
1415 unregister_cld_notifier(void)
1417 rpc_pipefs_notifier_unregister(&nfsd4_cld_block);