2 * Copyright (c) 2004 The Regents of the University of Michigan.
3 * Copyright (c) 2012 Jeff Layton <jlayton@redhat.com>
6 * Andy Adamson <andros@citi.umich.edu>
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
12 * 1. Redistributions of source code must retain the above copyright
13 * notice, this list of conditions and the following disclaimer.
14 * 2. Redistributions in binary form must reproduce the above copyright
15 * notice, this list of conditions and the following disclaimer in the
16 * documentation and/or other materials provided with the distribution.
17 * 3. Neither the name of the University nor the names of its
18 * contributors may be used to endorse or promote products derived
19 * from this software without specific prior written permission.
21 * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
22 * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
23 * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
24 * DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
25 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
26 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
27 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
28 * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
29 * LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
30 * NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
31 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
35 #include <linux/file.h>
36 #include <linux/slab.h>
37 #include <linux/namei.h>
38 #include <linux/crypto.h>
39 #include <linux/sched.h>
41 #include <linux/module.h>
42 #include <net/net_namespace.h>
43 #include <linux/sunrpc/rpc_pipe_fs.h>
44 #include <linux/sunrpc/clnt.h>
45 #include <linux/nfsd/cld.h>
52 #define NFSDDBG_FACILITY NFSDDBG_PROC
55 struct nfsd4_client_tracking_ops
{
56 int (*init
)(struct net
*);
57 void (*exit
)(struct net
*);
58 void (*create
)(struct nfs4_client
*);
59 void (*remove
)(struct nfs4_client
*);
60 int (*check
)(struct nfs4_client
*);
61 void (*grace_done
)(struct nfsd_net
*);
65 static char user_recovery_dirname
[PATH_MAX
] = "/var/lib/nfs/v4recovery";
68 nfs4_save_creds(const struct cred
**original_creds
)
72 new = prepare_creds();
76 new->fsuid
= GLOBAL_ROOT_UID
;
77 new->fsgid
= GLOBAL_ROOT_GID
;
78 *original_creds
= override_creds(new);
84 nfs4_reset_creds(const struct cred
*original
)
86 revert_creds(original
);
90 md5_to_hex(char *out
, char *md5
)
94 for (i
=0; i
<16; i
++) {
95 unsigned char c
= md5
[i
];
97 *out
++ = '0' + ((c
&0xf0)>>4) + (c
>=0xa0)*('a'-'9'-1);
98 *out
++ = '0' + (c
&0x0f) + ((c
&0x0f)>=0x0a)*('a'-'9'-1);
104 nfs4_make_rec_clidname(char *dname
, const struct xdr_netobj
*clname
)
106 struct xdr_netobj cksum
;
107 struct hash_desc desc
;
108 struct scatterlist sg
;
111 dprintk("NFSD: nfs4_make_rec_clidname for %.*s\n",
112 clname
->len
, clname
->data
);
113 desc
.flags
= CRYPTO_TFM_REQ_MAY_SLEEP
;
114 desc
.tfm
= crypto_alloc_hash("md5", 0, CRYPTO_ALG_ASYNC
);
115 if (IS_ERR(desc
.tfm
)) {
116 status
= PTR_ERR(desc
.tfm
);
120 cksum
.len
= crypto_hash_digestsize(desc
.tfm
);
121 cksum
.data
= kmalloc(cksum
.len
, GFP_KERNEL
);
122 if (cksum
.data
== NULL
) {
127 sg_init_one(&sg
, clname
->data
, clname
->len
);
129 status
= crypto_hash_digest(&desc
, &sg
, sg
.length
, cksum
.data
);
133 md5_to_hex(dname
, cksum
.data
);
138 crypto_free_hash(desc
.tfm
);
144 * If we had an error generating the recdir name for the legacy tracker
145 * then warn the admin. If the error doesn't appear to be transient,
146 * then disable recovery tracking.
149 legacy_recdir_name_error(struct nfs4_client
*clp
, int error
)
151 printk(KERN_ERR
"NFSD: unable to generate recoverydir "
152 "name (%d).\n", error
);
155 * if the algorithm just doesn't exist, then disable the recovery
156 * tracker altogether. The crypto libs will generally return this if
157 * FIPS is enabled as well.
159 if (error
== -ENOENT
) {
160 printk(KERN_ERR
"NFSD: disabling legacy clientid tracking. "
161 "Reboot recovery will not function correctly!\n");
162 nfsd4_client_tracking_exit(clp
->net
);
167 nfsd4_create_clid_dir(struct nfs4_client
*clp
)
169 const struct cred
*original_cred
;
170 char dname
[HEXDIR_LEN
];
171 struct dentry
*dir
, *dentry
;
172 struct nfs4_client_reclaim
*crp
;
174 struct nfsd_net
*nn
= net_generic(clp
->net
, nfsd_net_id
);
176 if (test_and_set_bit(NFSD4_CLIENT_STABLE
, &clp
->cl_flags
))
181 status
= nfs4_make_rec_clidname(dname
, &clp
->cl_name
);
183 return legacy_recdir_name_error(clp
, status
);
185 status
= nfs4_save_creds(&original_cred
);
189 status
= mnt_want_write_file(nn
->rec_file
);
193 dir
= nn
->rec_file
->f_path
.dentry
;
194 /* lock the parent */
195 mutex_lock(&d_inode(dir
)->i_mutex
);
197 dentry
= lookup_one_len(dname
, dir
, HEXDIR_LEN
-1);
198 if (IS_ERR(dentry
)) {
199 status
= PTR_ERR(dentry
);
202 if (d_really_is_positive(dentry
))
204 * In the 4.1 case, where we're called from
205 * reclaim_complete(), records from the previous reboot
206 * may still be left, so this is OK.
208 * In the 4.0 case, we should never get here; but we may
209 * as well be forgiving and just succeed silently.
212 status
= vfs_mkdir(d_inode(dir
), dentry
, S_IRWXU
);
216 mutex_unlock(&d_inode(dir
)->i_mutex
);
219 crp
= nfs4_client_to_reclaim(dname
, nn
);
223 vfs_fsync(nn
->rec_file
, 0);
225 printk(KERN_ERR
"NFSD: failed to write recovery record"
226 " (err %d); please check that %s exists"
227 " and is writeable", status
,
228 user_recovery_dirname
);
230 mnt_drop_write_file(nn
->rec_file
);
232 nfs4_reset_creds(original_cred
);
235 typedef int (recdir_func
)(struct dentry
*, struct dentry
*, struct nfsd_net
*);
238 char name
[HEXDIR_LEN
];
239 struct list_head list
;
242 struct nfs4_dir_ctx
{
243 struct dir_context ctx
;
244 struct list_head names
;
248 nfsd4_build_namelist(struct dir_context
*__ctx
, const char *name
, int namlen
,
249 loff_t offset
, u64 ino
, unsigned int d_type
)
251 struct nfs4_dir_ctx
*ctx
=
252 container_of(__ctx
, struct nfs4_dir_ctx
, ctx
);
253 struct name_list
*entry
;
255 if (namlen
!= HEXDIR_LEN
- 1)
257 entry
= kmalloc(sizeof(struct name_list
), GFP_KERNEL
);
260 memcpy(entry
->name
, name
, HEXDIR_LEN
- 1);
261 entry
->name
[HEXDIR_LEN
- 1] = '\0';
262 list_add(&entry
->list
, &ctx
->names
);
267 nfsd4_list_rec_dir(recdir_func
*f
, struct nfsd_net
*nn
)
269 const struct cred
*original_cred
;
270 struct dentry
*dir
= nn
->rec_file
->f_path
.dentry
;
271 struct nfs4_dir_ctx ctx
= {
272 .ctx
.actor
= nfsd4_build_namelist
,
273 .names
= LIST_HEAD_INIT(ctx
.names
)
275 struct name_list
*entry
, *tmp
;
278 status
= nfs4_save_creds(&original_cred
);
282 status
= vfs_llseek(nn
->rec_file
, 0, SEEK_SET
);
284 nfs4_reset_creds(original_cred
);
288 status
= iterate_dir(nn
->rec_file
, &ctx
.ctx
);
289 mutex_lock_nested(&d_inode(dir
)->i_mutex
, I_MUTEX_PARENT
);
291 list_for_each_entry_safe(entry
, tmp
, &ctx
.names
, list
) {
293 struct dentry
*dentry
;
294 dentry
= lookup_one_len(entry
->name
, dir
, HEXDIR_LEN
-1);
295 if (IS_ERR(dentry
)) {
296 status
= PTR_ERR(dentry
);
299 status
= f(dir
, dentry
, nn
);
302 list_del(&entry
->list
);
305 mutex_unlock(&d_inode(dir
)->i_mutex
);
306 nfs4_reset_creds(original_cred
);
308 list_for_each_entry_safe(entry
, tmp
, &ctx
.names
, list
) {
309 dprintk("NFSD: %s. Left entry %s\n", __func__
, entry
->name
);
310 list_del(&entry
->list
);
317 nfsd4_unlink_clid_dir(char *name
, int namlen
, struct nfsd_net
*nn
)
319 struct dentry
*dir
, *dentry
;
322 dprintk("NFSD: nfsd4_unlink_clid_dir. name %.*s\n", namlen
, name
);
324 dir
= nn
->rec_file
->f_path
.dentry
;
325 mutex_lock_nested(&d_inode(dir
)->i_mutex
, I_MUTEX_PARENT
);
326 dentry
= lookup_one_len(name
, dir
, namlen
);
327 if (IS_ERR(dentry
)) {
328 status
= PTR_ERR(dentry
);
332 if (d_really_is_negative(dentry
))
334 status
= vfs_rmdir(d_inode(dir
), dentry
);
338 mutex_unlock(&d_inode(dir
)->i_mutex
);
343 nfsd4_remove_clid_dir(struct nfs4_client
*clp
)
345 const struct cred
*original_cred
;
346 struct nfs4_client_reclaim
*crp
;
347 char dname
[HEXDIR_LEN
];
349 struct nfsd_net
*nn
= net_generic(clp
->net
, nfsd_net_id
);
351 if (!nn
->rec_file
|| !test_bit(NFSD4_CLIENT_STABLE
, &clp
->cl_flags
))
354 status
= nfs4_make_rec_clidname(dname
, &clp
->cl_name
);
356 return legacy_recdir_name_error(clp
, status
);
358 status
= mnt_want_write_file(nn
->rec_file
);
361 clear_bit(NFSD4_CLIENT_STABLE
, &clp
->cl_flags
);
363 status
= nfs4_save_creds(&original_cred
);
367 status
= nfsd4_unlink_clid_dir(dname
, HEXDIR_LEN
-1, nn
);
368 nfs4_reset_creds(original_cred
);
370 vfs_fsync(nn
->rec_file
, 0);
372 /* remove reclaim record */
373 crp
= nfsd4_find_reclaim_client(dname
, nn
);
375 nfs4_remove_reclaim_record(crp
, nn
);
379 mnt_drop_write_file(nn
->rec_file
);
382 printk("NFSD: Failed to remove expired client state directory"
383 " %.*s\n", HEXDIR_LEN
, dname
);
387 purge_old(struct dentry
*parent
, struct dentry
*child
, struct nfsd_net
*nn
)
391 if (nfs4_has_reclaimed_state(child
->d_name
.name
, nn
))
394 status
= vfs_rmdir(d_inode(parent
), child
);
396 printk("failed to remove client recovery directory %pd\n",
398 /* Keep trying, success or failure: */
403 nfsd4_recdir_purge_old(struct nfsd_net
*nn
)
407 nn
->in_grace
= false;
410 status
= mnt_want_write_file(nn
->rec_file
);
413 status
= nfsd4_list_rec_dir(purge_old
, nn
);
415 vfs_fsync(nn
->rec_file
, 0);
416 mnt_drop_write_file(nn
->rec_file
);
418 nfs4_release_reclaim(nn
);
420 printk("nfsd4: failed to purge old clients from recovery"
421 " directory %pD\n", nn
->rec_file
);
425 load_recdir(struct dentry
*parent
, struct dentry
*child
, struct nfsd_net
*nn
)
427 if (child
->d_name
.len
!= HEXDIR_LEN
- 1) {
428 printk("nfsd4: illegal name %pd in recovery directory\n",
430 /* Keep trying; maybe the others are OK: */
433 nfs4_client_to_reclaim(child
->d_name
.name
, nn
);
438 nfsd4_recdir_load(struct net
*net
) {
440 struct nfsd_net
*nn
= net_generic(net
, nfsd_net_id
);
445 status
= nfsd4_list_rec_dir(load_recdir
, nn
);
447 printk("nfsd4: failed loading clients from recovery"
448 " directory %pD\n", nn
->rec_file
);
453 * Hold reference to the recovery directory.
457 nfsd4_init_recdir(struct net
*net
)
459 struct nfsd_net
*nn
= net_generic(net
, nfsd_net_id
);
460 const struct cred
*original_cred
;
463 printk("NFSD: Using %s as the NFSv4 state recovery directory\n",
464 user_recovery_dirname
);
466 BUG_ON(nn
->rec_file
);
468 status
= nfs4_save_creds(&original_cred
);
470 printk("NFSD: Unable to change credentials to find recovery"
471 " directory: error %d\n",
476 nn
->rec_file
= filp_open(user_recovery_dirname
, O_RDONLY
| O_DIRECTORY
, 0);
477 if (IS_ERR(nn
->rec_file
)) {
478 printk("NFSD: unable to find recovery directory %s\n",
479 user_recovery_dirname
);
480 status
= PTR_ERR(nn
->rec_file
);
484 nfs4_reset_creds(original_cred
);
491 nfsd4_shutdown_recdir(struct net
*net
)
493 struct nfsd_net
*nn
= net_generic(net
, nfsd_net_id
);
502 nfs4_legacy_state_init(struct net
*net
)
504 struct nfsd_net
*nn
= net_generic(net
, nfsd_net_id
);
507 nn
->reclaim_str_hashtbl
= kmalloc(sizeof(struct list_head
) *
508 CLIENT_HASH_SIZE
, GFP_KERNEL
);
509 if (!nn
->reclaim_str_hashtbl
)
512 for (i
= 0; i
< CLIENT_HASH_SIZE
; i
++)
513 INIT_LIST_HEAD(&nn
->reclaim_str_hashtbl
[i
]);
514 nn
->reclaim_str_hashtbl_size
= 0;
520 nfs4_legacy_state_shutdown(struct net
*net
)
522 struct nfsd_net
*nn
= net_generic(net
, nfsd_net_id
);
524 kfree(nn
->reclaim_str_hashtbl
);
528 nfsd4_load_reboot_recovery_data(struct net
*net
)
532 status
= nfsd4_init_recdir(net
);
536 status
= nfsd4_recdir_load(net
);
538 nfsd4_shutdown_recdir(net
);
544 nfsd4_legacy_tracking_init(struct net
*net
)
548 /* XXX: The legacy code won't work in a container */
549 if (net
!= &init_net
) {
550 pr_warn("NFSD: attempt to initialize legacy client tracking in a container ignored.\n");
554 status
= nfs4_legacy_state_init(net
);
558 status
= nfsd4_load_reboot_recovery_data(net
);
564 nfs4_legacy_state_shutdown(net
);
569 nfsd4_legacy_tracking_exit(struct net
*net
)
571 struct nfsd_net
*nn
= net_generic(net
, nfsd_net_id
);
573 nfs4_release_reclaim(nn
);
574 nfsd4_shutdown_recdir(net
);
575 nfs4_legacy_state_shutdown(net
);
579 * Change the NFSv4 recovery directory to recdir.
582 nfs4_reset_recoverydir(char *recdir
)
587 status
= kern_path(recdir
, LOOKUP_FOLLOW
, &path
);
591 if (d_is_dir(path
.dentry
)) {
592 strcpy(user_recovery_dirname
, recdir
);
600 nfs4_recoverydir(void)
602 return user_recovery_dirname
;
606 nfsd4_check_legacy_client(struct nfs4_client
*clp
)
609 char dname
[HEXDIR_LEN
];
610 struct nfs4_client_reclaim
*crp
;
611 struct nfsd_net
*nn
= net_generic(clp
->net
, nfsd_net_id
);
613 /* did we already find that this client is stable? */
614 if (test_bit(NFSD4_CLIENT_STABLE
, &clp
->cl_flags
))
617 status
= nfs4_make_rec_clidname(dname
, &clp
->cl_name
);
619 legacy_recdir_name_error(clp
, status
);
623 /* look for it in the reclaim hashtable otherwise */
624 crp
= nfsd4_find_reclaim_client(dname
, nn
);
626 set_bit(NFSD4_CLIENT_STABLE
, &clp
->cl_flags
);
634 static struct nfsd4_client_tracking_ops nfsd4_legacy_tracking_ops
= {
635 .init
= nfsd4_legacy_tracking_init
,
636 .exit
= nfsd4_legacy_tracking_exit
,
637 .create
= nfsd4_create_clid_dir
,
638 .remove
= nfsd4_remove_clid_dir
,
639 .check
= nfsd4_check_legacy_client
,
640 .grace_done
= nfsd4_recdir_purge_old
,
644 #define NFSD_PIPE_DIR "nfsd"
645 #define NFSD_CLD_PIPE "cld"
647 /* per-net-ns structure for holding cld upcall info */
649 struct rpc_pipe
*cn_pipe
;
651 struct list_head cn_list
;
656 struct list_head cu_list
;
657 struct cld_net
*cu_net
;
658 struct completion cu_done
;
659 struct cld_msg cu_msg
;
663 __cld_pipe_upcall(struct rpc_pipe
*pipe
, struct cld_msg
*cmsg
)
666 struct rpc_pipe_msg msg
;
667 struct cld_upcall
*cup
= container_of(cmsg
, struct cld_upcall
, cu_msg
);
669 memset(&msg
, 0, sizeof(msg
));
671 msg
.len
= sizeof(*cmsg
);
673 ret
= rpc_queue_upcall(pipe
, &msg
);
678 wait_for_completion(&cup
->cu_done
);
687 cld_pipe_upcall(struct rpc_pipe
*pipe
, struct cld_msg
*cmsg
)
692 * -EAGAIN occurs when pipe is closed and reopened while there are
696 ret
= __cld_pipe_upcall(pipe
, cmsg
);
697 } while (ret
== -EAGAIN
);
703 cld_pipe_downcall(struct file
*filp
, const char __user
*src
, size_t mlen
)
705 struct cld_upcall
*tmp
, *cup
;
706 struct cld_msg __user
*cmsg
= (struct cld_msg __user
*)src
;
708 struct nfsd_net
*nn
= net_generic(file_inode(filp
)->i_sb
->s_fs_info
,
710 struct cld_net
*cn
= nn
->cld_net
;
712 if (mlen
!= sizeof(*cmsg
)) {
713 dprintk("%s: got %zu bytes, expected %zu\n", __func__
, mlen
,
718 /* copy just the xid so we can try to find that */
719 if (copy_from_user(&xid
, &cmsg
->cm_xid
, sizeof(xid
)) != 0) {
720 dprintk("%s: error when copying xid from userspace", __func__
);
724 /* walk the list and find corresponding xid */
726 spin_lock(&cn
->cn_lock
);
727 list_for_each_entry(tmp
, &cn
->cn_list
, cu_list
) {
728 if (get_unaligned(&tmp
->cu_msg
.cm_xid
) == xid
) {
730 list_del_init(&cup
->cu_list
);
734 spin_unlock(&cn
->cn_lock
);
736 /* couldn't find upcall? */
738 dprintk("%s: couldn't find upcall -- xid=%u\n", __func__
, xid
);
742 if (copy_from_user(&cup
->cu_msg
, src
, mlen
) != 0)
745 complete(&cup
->cu_done
);
750 cld_pipe_destroy_msg(struct rpc_pipe_msg
*msg
)
752 struct cld_msg
*cmsg
= msg
->data
;
753 struct cld_upcall
*cup
= container_of(cmsg
, struct cld_upcall
,
756 /* errno >= 0 means we got a downcall */
760 complete(&cup
->cu_done
);
763 static const struct rpc_pipe_ops cld_upcall_ops
= {
764 .upcall
= rpc_pipe_generic_upcall
,
765 .downcall
= cld_pipe_downcall
,
766 .destroy_msg
= cld_pipe_destroy_msg
,
769 static struct dentry
*
770 nfsd4_cld_register_sb(struct super_block
*sb
, struct rpc_pipe
*pipe
)
772 struct dentry
*dir
, *dentry
;
774 dir
= rpc_d_lookup_sb(sb
, NFSD_PIPE_DIR
);
776 return ERR_PTR(-ENOENT
);
777 dentry
= rpc_mkpipe_dentry(dir
, NFSD_CLD_PIPE
, NULL
, pipe
);
783 nfsd4_cld_unregister_sb(struct rpc_pipe
*pipe
)
786 rpc_unlink(pipe
->dentry
);
789 static struct dentry
*
790 nfsd4_cld_register_net(struct net
*net
, struct rpc_pipe
*pipe
)
792 struct super_block
*sb
;
793 struct dentry
*dentry
;
795 sb
= rpc_get_sb_net(net
);
798 dentry
= nfsd4_cld_register_sb(sb
, pipe
);
804 nfsd4_cld_unregister_net(struct net
*net
, struct rpc_pipe
*pipe
)
806 struct super_block
*sb
;
808 sb
= rpc_get_sb_net(net
);
810 nfsd4_cld_unregister_sb(pipe
);
815 /* Initialize rpc_pipefs pipe for communication with client tracking daemon */
817 nfsd4_init_cld_pipe(struct net
*net
)
820 struct dentry
*dentry
;
821 struct nfsd_net
*nn
= net_generic(net
, nfsd_net_id
);
827 cn
= kzalloc(sizeof(*cn
), GFP_KERNEL
);
833 cn
->cn_pipe
= rpc_mkpipe_data(&cld_upcall_ops
, RPC_PIPE_WAIT_FOR_OPEN
);
834 if (IS_ERR(cn
->cn_pipe
)) {
835 ret
= PTR_ERR(cn
->cn_pipe
);
838 spin_lock_init(&cn
->cn_lock
);
839 INIT_LIST_HEAD(&cn
->cn_list
);
841 dentry
= nfsd4_cld_register_net(net
, cn
->cn_pipe
);
842 if (IS_ERR(dentry
)) {
843 ret
= PTR_ERR(dentry
);
844 goto err_destroy_data
;
847 cn
->cn_pipe
->dentry
= dentry
;
852 rpc_destroy_pipe_data(cn
->cn_pipe
);
855 printk(KERN_ERR
"NFSD: unable to create nfsdcld upcall pipe (%d)\n",
861 nfsd4_remove_cld_pipe(struct net
*net
)
863 struct nfsd_net
*nn
= net_generic(net
, nfsd_net_id
);
864 struct cld_net
*cn
= nn
->cld_net
;
866 nfsd4_cld_unregister_net(net
, cn
->cn_pipe
);
867 rpc_destroy_pipe_data(cn
->cn_pipe
);
872 static struct cld_upcall
*
873 alloc_cld_upcall(struct cld_net
*cn
)
875 struct cld_upcall
*new, *tmp
;
877 new = kzalloc(sizeof(*new), GFP_KERNEL
);
881 /* FIXME: hard cap on number in flight? */
883 spin_lock(&cn
->cn_lock
);
884 list_for_each_entry(tmp
, &cn
->cn_list
, cu_list
) {
885 if (tmp
->cu_msg
.cm_xid
== cn
->cn_xid
) {
887 spin_unlock(&cn
->cn_lock
);
891 init_completion(&new->cu_done
);
892 new->cu_msg
.cm_vers
= CLD_UPCALL_VERSION
;
893 put_unaligned(cn
->cn_xid
++, &new->cu_msg
.cm_xid
);
895 list_add(&new->cu_list
, &cn
->cn_list
);
896 spin_unlock(&cn
->cn_lock
);
898 dprintk("%s: allocated xid %u\n", __func__
, new->cu_msg
.cm_xid
);
904 free_cld_upcall(struct cld_upcall
*victim
)
906 struct cld_net
*cn
= victim
->cu_net
;
908 spin_lock(&cn
->cn_lock
);
909 list_del(&victim
->cu_list
);
910 spin_unlock(&cn
->cn_lock
);
914 /* Ask daemon to create a new record */
916 nfsd4_cld_create(struct nfs4_client
*clp
)
919 struct cld_upcall
*cup
;
920 struct nfsd_net
*nn
= net_generic(clp
->net
, nfsd_net_id
);
921 struct cld_net
*cn
= nn
->cld_net
;
923 /* Don't upcall if it's already stored */
924 if (test_bit(NFSD4_CLIENT_STABLE
, &clp
->cl_flags
))
927 cup
= alloc_cld_upcall(cn
);
933 cup
->cu_msg
.cm_cmd
= Cld_Create
;
934 cup
->cu_msg
.cm_u
.cm_name
.cn_len
= clp
->cl_name
.len
;
935 memcpy(cup
->cu_msg
.cm_u
.cm_name
.cn_id
, clp
->cl_name
.data
,
938 ret
= cld_pipe_upcall(cn
->cn_pipe
, &cup
->cu_msg
);
940 ret
= cup
->cu_msg
.cm_status
;
941 set_bit(NFSD4_CLIENT_STABLE
, &clp
->cl_flags
);
944 free_cld_upcall(cup
);
947 printk(KERN_ERR
"NFSD: Unable to create client "
948 "record on stable storage: %d\n", ret
);
951 /* Ask daemon to remove a record */
953 nfsd4_cld_remove(struct nfs4_client
*clp
)
956 struct cld_upcall
*cup
;
957 struct nfsd_net
*nn
= net_generic(clp
->net
, nfsd_net_id
);
958 struct cld_net
*cn
= nn
->cld_net
;
960 /* Don't upcall if it's already removed */
961 if (!test_bit(NFSD4_CLIENT_STABLE
, &clp
->cl_flags
))
964 cup
= alloc_cld_upcall(cn
);
970 cup
->cu_msg
.cm_cmd
= Cld_Remove
;
971 cup
->cu_msg
.cm_u
.cm_name
.cn_len
= clp
->cl_name
.len
;
972 memcpy(cup
->cu_msg
.cm_u
.cm_name
.cn_id
, clp
->cl_name
.data
,
975 ret
= cld_pipe_upcall(cn
->cn_pipe
, &cup
->cu_msg
);
977 ret
= cup
->cu_msg
.cm_status
;
978 clear_bit(NFSD4_CLIENT_STABLE
, &clp
->cl_flags
);
981 free_cld_upcall(cup
);
984 printk(KERN_ERR
"NFSD: Unable to remove client "
985 "record from stable storage: %d\n", ret
);
988 /* Check for presence of a record, and update its timestamp */
990 nfsd4_cld_check(struct nfs4_client
*clp
)
993 struct cld_upcall
*cup
;
994 struct nfsd_net
*nn
= net_generic(clp
->net
, nfsd_net_id
);
995 struct cld_net
*cn
= nn
->cld_net
;
997 /* Don't upcall if one was already stored during this grace period */
998 if (test_bit(NFSD4_CLIENT_STABLE
, &clp
->cl_flags
))
1001 cup
= alloc_cld_upcall(cn
);
1003 printk(KERN_ERR
"NFSD: Unable to check client record on "
1004 "stable storage: %d\n", -ENOMEM
);
1008 cup
->cu_msg
.cm_cmd
= Cld_Check
;
1009 cup
->cu_msg
.cm_u
.cm_name
.cn_len
= clp
->cl_name
.len
;
1010 memcpy(cup
->cu_msg
.cm_u
.cm_name
.cn_id
, clp
->cl_name
.data
,
1013 ret
= cld_pipe_upcall(cn
->cn_pipe
, &cup
->cu_msg
);
1015 ret
= cup
->cu_msg
.cm_status
;
1016 set_bit(NFSD4_CLIENT_STABLE
, &clp
->cl_flags
);
1019 free_cld_upcall(cup
);
1024 nfsd4_cld_grace_done(struct nfsd_net
*nn
)
1027 struct cld_upcall
*cup
;
1028 struct cld_net
*cn
= nn
->cld_net
;
1030 cup
= alloc_cld_upcall(cn
);
1036 cup
->cu_msg
.cm_cmd
= Cld_GraceDone
;
1037 cup
->cu_msg
.cm_u
.cm_gracetime
= (int64_t)nn
->boot_time
;
1038 ret
= cld_pipe_upcall(cn
->cn_pipe
, &cup
->cu_msg
);
1040 ret
= cup
->cu_msg
.cm_status
;
1042 free_cld_upcall(cup
);
1045 printk(KERN_ERR
"NFSD: Unable to end grace period: %d\n", ret
);
1048 static struct nfsd4_client_tracking_ops nfsd4_cld_tracking_ops
= {
1049 .init
= nfsd4_init_cld_pipe
,
1050 .exit
= nfsd4_remove_cld_pipe
,
1051 .create
= nfsd4_cld_create
,
1052 .remove
= nfsd4_cld_remove
,
1053 .check
= nfsd4_cld_check
,
1054 .grace_done
= nfsd4_cld_grace_done
,
1057 /* upcall via usermodehelper */
1058 static char cltrack_prog
[PATH_MAX
] = "/sbin/nfsdcltrack";
1059 module_param_string(cltrack_prog
, cltrack_prog
, sizeof(cltrack_prog
),
1061 MODULE_PARM_DESC(cltrack_prog
, "Path to the nfsdcltrack upcall program");
1063 static bool cltrack_legacy_disable
;
1064 module_param(cltrack_legacy_disable
, bool, S_IRUGO
|S_IWUSR
);
1065 MODULE_PARM_DESC(cltrack_legacy_disable
,
1066 "Disable legacy recoverydir conversion. Default: false");
1068 #define LEGACY_TOPDIR_ENV_PREFIX "NFSDCLTRACK_LEGACY_TOPDIR="
1069 #define LEGACY_RECDIR_ENV_PREFIX "NFSDCLTRACK_LEGACY_RECDIR="
1070 #define HAS_SESSION_ENV_PREFIX "NFSDCLTRACK_CLIENT_HAS_SESSION="
1071 #define GRACE_START_ENV_PREFIX "NFSDCLTRACK_GRACE_START="
1074 nfsd4_cltrack_legacy_topdir(void)
1080 if (cltrack_legacy_disable
)
1083 len
= strlen(LEGACY_TOPDIR_ENV_PREFIX
) +
1084 strlen(nfs4_recoverydir()) + 1;
1086 result
= kmalloc(len
, GFP_KERNEL
);
1090 copied
= snprintf(result
, len
, LEGACY_TOPDIR_ENV_PREFIX
"%s",
1091 nfs4_recoverydir());
1092 if (copied
>= len
) {
1093 /* just return nothing if output was truncated */
1102 nfsd4_cltrack_legacy_recdir(const struct xdr_netobj
*name
)
1108 if (cltrack_legacy_disable
)
1111 /* +1 is for '/' between "topdir" and "recdir" */
1112 len
= strlen(LEGACY_RECDIR_ENV_PREFIX
) +
1113 strlen(nfs4_recoverydir()) + 1 + HEXDIR_LEN
;
1115 result
= kmalloc(len
, GFP_KERNEL
);
1119 copied
= snprintf(result
, len
, LEGACY_RECDIR_ENV_PREFIX
"%s/",
1120 nfs4_recoverydir());
1121 if (copied
> (len
- HEXDIR_LEN
)) {
1122 /* just return nothing if output will be truncated */
1127 copied
= nfs4_make_rec_clidname(result
+ copied
, name
);
1137 nfsd4_cltrack_client_has_session(struct nfs4_client
*clp
)
1143 /* prefix + Y/N character + terminating NUL */
1144 len
= strlen(HAS_SESSION_ENV_PREFIX
) + 1 + 1;
1146 result
= kmalloc(len
, GFP_KERNEL
);
1150 copied
= snprintf(result
, len
, HAS_SESSION_ENV_PREFIX
"%c",
1151 clp
->cl_minorversion
? 'Y' : 'N');
1152 if (copied
>= len
) {
1153 /* just return nothing if output was truncated */
1162 nfsd4_cltrack_grace_start(time_t grace_start
)
1168 /* prefix + max width of int64_t string + terminating NUL */
1169 len
= strlen(GRACE_START_ENV_PREFIX
) + 22 + 1;
1171 result
= kmalloc(len
, GFP_KERNEL
);
1175 copied
= snprintf(result
, len
, GRACE_START_ENV_PREFIX
"%ld",
1177 if (copied
>= len
) {
1178 /* just return nothing if output was truncated */
1187 nfsd4_umh_cltrack_upcall(char *cmd
, char *arg
, char *env0
, char *env1
)
1193 if (unlikely(!cltrack_prog
[0])) {
1194 dprintk("%s: cltrack_prog is disabled\n", __func__
);
1198 dprintk("%s: cmd: %s\n", __func__
, cmd
);
1199 dprintk("%s: arg: %s\n", __func__
, arg
? arg
: "(null)");
1200 dprintk("%s: env0: %s\n", __func__
, env0
? env0
: "(null)");
1201 dprintk("%s: env1: %s\n", __func__
, env1
? env1
: "(null)");
1207 argv
[0] = (char *)cltrack_prog
;
1212 ret
= call_usermodehelper(argv
[0], argv
, envp
, UMH_WAIT_PROC
);
1214 * Disable the upcall mechanism if we're getting an ENOENT or EACCES
1215 * error. The admin can re-enable it on the fly by using sysfs
1216 * once the problem has been fixed.
1218 if (ret
== -ENOENT
|| ret
== -EACCES
) {
1219 dprintk("NFSD: %s was not found or isn't executable (%d). "
1220 "Setting cltrack_prog to blank string!",
1222 cltrack_prog
[0] = '\0';
1224 dprintk("%s: %s return value: %d\n", __func__
, cltrack_prog
, ret
);
1230 bin_to_hex_dup(const unsigned char *src
, int srclen
)
1235 /* +1 for terminating NUL */
1236 buf
= kmalloc((srclen
* 2) + 1, GFP_KERNEL
);
1241 for (i
= 0; i
< srclen
; i
++) {
1242 sprintf(hex
, "%2.2x", *src
++);
1249 nfsd4_umh_cltrack_init(struct net
*net
)
1252 struct nfsd_net
*nn
= net_generic(net
, nfsd_net_id
);
1253 char *grace_start
= nfsd4_cltrack_grace_start(nn
->boot_time
);
1255 /* XXX: The usermode helper is not working in a container yet. */
1256 if (net
!= &init_net
) {
1257 pr_warn("NFSD: attempt to initialize umh client tracking in a container ignored.\n");
1261 ret
= nfsd4_umh_cltrack_upcall("init", NULL
, grace_start
, NULL
);
1267 nfsd4_cltrack_upcall_lock(struct nfs4_client
*clp
)
1269 wait_on_bit_lock(&clp
->cl_flags
, NFSD4_CLIENT_UPCALL_LOCK
,
1270 TASK_UNINTERRUPTIBLE
);
1274 nfsd4_cltrack_upcall_unlock(struct nfs4_client
*clp
)
1276 smp_mb__before_atomic();
1277 clear_bit(NFSD4_CLIENT_UPCALL_LOCK
, &clp
->cl_flags
);
1278 smp_mb__after_atomic();
1279 wake_up_bit(&clp
->cl_flags
, NFSD4_CLIENT_UPCALL_LOCK
);
1283 nfsd4_umh_cltrack_create(struct nfs4_client
*clp
)
1285 char *hexid
, *has_session
, *grace_start
;
1286 struct nfsd_net
*nn
= net_generic(clp
->net
, nfsd_net_id
);
1289 * With v4.0 clients, there's little difference in outcome between a
1290 * create and check operation, and we can end up calling into this
1291 * function multiple times per client (once for each openowner). So,
1292 * for v4.0 clients skip upcalling once the client has been recorded
1293 * on stable storage.
1295 * For v4.1+ clients, the outcome of the two operations is different,
1296 * so we must ensure that we upcall for the create operation. v4.1+
1297 * clients call this on RECLAIM_COMPLETE though, so we should only end
1298 * up doing a single create upcall per client.
1300 if (clp
->cl_minorversion
== 0 &&
1301 test_bit(NFSD4_CLIENT_STABLE
, &clp
->cl_flags
))
1304 hexid
= bin_to_hex_dup(clp
->cl_name
.data
, clp
->cl_name
.len
);
1306 dprintk("%s: can't allocate memory for upcall!\n", __func__
);
1310 has_session
= nfsd4_cltrack_client_has_session(clp
);
1311 grace_start
= nfsd4_cltrack_grace_start(nn
->boot_time
);
1313 nfsd4_cltrack_upcall_lock(clp
);
1314 if (!nfsd4_umh_cltrack_upcall("create", hexid
, has_session
, grace_start
))
1315 set_bit(NFSD4_CLIENT_STABLE
, &clp
->cl_flags
);
1316 nfsd4_cltrack_upcall_unlock(clp
);
1324 nfsd4_umh_cltrack_remove(struct nfs4_client
*clp
)
1328 if (!test_bit(NFSD4_CLIENT_STABLE
, &clp
->cl_flags
))
1331 hexid
= bin_to_hex_dup(clp
->cl_name
.data
, clp
->cl_name
.len
);
1333 dprintk("%s: can't allocate memory for upcall!\n", __func__
);
1337 nfsd4_cltrack_upcall_lock(clp
);
1338 if (test_bit(NFSD4_CLIENT_STABLE
, &clp
->cl_flags
) &&
1339 nfsd4_umh_cltrack_upcall("remove", hexid
, NULL
, NULL
) == 0)
1340 clear_bit(NFSD4_CLIENT_STABLE
, &clp
->cl_flags
);
1341 nfsd4_cltrack_upcall_unlock(clp
);
1347 nfsd4_umh_cltrack_check(struct nfs4_client
*clp
)
1350 char *hexid
, *has_session
, *legacy
;
1352 if (test_bit(NFSD4_CLIENT_STABLE
, &clp
->cl_flags
))
1355 hexid
= bin_to_hex_dup(clp
->cl_name
.data
, clp
->cl_name
.len
);
1357 dprintk("%s: can't allocate memory for upcall!\n", __func__
);
1361 has_session
= nfsd4_cltrack_client_has_session(clp
);
1362 legacy
= nfsd4_cltrack_legacy_recdir(&clp
->cl_name
);
1364 nfsd4_cltrack_upcall_lock(clp
);
1365 if (test_bit(NFSD4_CLIENT_STABLE
, &clp
->cl_flags
)) {
1368 ret
= nfsd4_umh_cltrack_upcall("check", hexid
, has_session
, legacy
);
1370 set_bit(NFSD4_CLIENT_STABLE
, &clp
->cl_flags
);
1372 nfsd4_cltrack_upcall_unlock(clp
);
1381 nfsd4_umh_cltrack_grace_done(struct nfsd_net
*nn
)
1384 char timestr
[22]; /* FIXME: better way to determine max size? */
1386 sprintf(timestr
, "%ld", nn
->boot_time
);
1387 legacy
= nfsd4_cltrack_legacy_topdir();
1388 nfsd4_umh_cltrack_upcall("gracedone", timestr
, legacy
, NULL
);
1392 static struct nfsd4_client_tracking_ops nfsd4_umh_tracking_ops
= {
1393 .init
= nfsd4_umh_cltrack_init
,
1395 .create
= nfsd4_umh_cltrack_create
,
1396 .remove
= nfsd4_umh_cltrack_remove
,
1397 .check
= nfsd4_umh_cltrack_check
,
1398 .grace_done
= nfsd4_umh_cltrack_grace_done
,
1402 nfsd4_client_tracking_init(struct net
*net
)
1406 struct nfsd_net
*nn
= net_generic(net
, nfsd_net_id
);
1408 /* just run the init if the method is already decided */
1409 if (nn
->client_tracking_ops
)
1413 * First, try a UMH upcall. It should succeed or fail quickly, so
1414 * there's little harm in trying that first.
1416 nn
->client_tracking_ops
= &nfsd4_umh_tracking_ops
;
1417 status
= nn
->client_tracking_ops
->init(net
);
1422 * See if the recoverydir exists and is a directory. If it is,
1423 * then use the legacy ops.
1425 nn
->client_tracking_ops
= &nfsd4_legacy_tracking_ops
;
1426 status
= kern_path(nfs4_recoverydir(), LOOKUP_FOLLOW
, &path
);
1428 status
= d_is_dir(path
.dentry
);
1434 /* Finally, try to use nfsdcld */
1435 nn
->client_tracking_ops
= &nfsd4_cld_tracking_ops
;
1436 printk(KERN_WARNING
"NFSD: the nfsdcld client tracking upcall will be "
1437 "removed in 3.10. Please transition to using "
1440 status
= nn
->client_tracking_ops
->init(net
);
1442 printk(KERN_WARNING
"NFSD: Unable to initialize client "
1443 "recovery tracking! (%d)\n", status
);
1444 nn
->client_tracking_ops
= NULL
;
1450 nfsd4_client_tracking_exit(struct net
*net
)
1452 struct nfsd_net
*nn
= net_generic(net
, nfsd_net_id
);
1454 if (nn
->client_tracking_ops
) {
1455 if (nn
->client_tracking_ops
->exit
)
1456 nn
->client_tracking_ops
->exit(net
);
1457 nn
->client_tracking_ops
= NULL
;
1462 nfsd4_client_record_create(struct nfs4_client
*clp
)
1464 struct nfsd_net
*nn
= net_generic(clp
->net
, nfsd_net_id
);
1466 if (nn
->client_tracking_ops
)
1467 nn
->client_tracking_ops
->create(clp
);
1471 nfsd4_client_record_remove(struct nfs4_client
*clp
)
1473 struct nfsd_net
*nn
= net_generic(clp
->net
, nfsd_net_id
);
1475 if (nn
->client_tracking_ops
)
1476 nn
->client_tracking_ops
->remove(clp
);
1480 nfsd4_client_record_check(struct nfs4_client
*clp
)
1482 struct nfsd_net
*nn
= net_generic(clp
->net
, nfsd_net_id
);
1484 if (nn
->client_tracking_ops
)
1485 return nn
->client_tracking_ops
->check(clp
);
1491 nfsd4_record_grace_done(struct nfsd_net
*nn
)
1493 if (nn
->client_tracking_ops
)
1494 nn
->client_tracking_ops
->grace_done(nn
);
1498 rpc_pipefs_event(struct notifier_block
*nb
, unsigned long event
, void *ptr
)
1500 struct super_block
*sb
= ptr
;
1501 struct net
*net
= sb
->s_fs_info
;
1502 struct nfsd_net
*nn
= net_generic(net
, nfsd_net_id
);
1503 struct cld_net
*cn
= nn
->cld_net
;
1504 struct dentry
*dentry
;
1507 if (!try_module_get(THIS_MODULE
))
1511 module_put(THIS_MODULE
);
1516 case RPC_PIPEFS_MOUNT
:
1517 dentry
= nfsd4_cld_register_sb(sb
, cn
->cn_pipe
);
1518 if (IS_ERR(dentry
)) {
1519 ret
= PTR_ERR(dentry
);
1522 cn
->cn_pipe
->dentry
= dentry
;
1524 case RPC_PIPEFS_UMOUNT
:
1525 if (cn
->cn_pipe
->dentry
)
1526 nfsd4_cld_unregister_sb(cn
->cn_pipe
);
1532 module_put(THIS_MODULE
);
1536 static struct notifier_block nfsd4_cld_block
= {
1537 .notifier_call
= rpc_pipefs_event
,
1541 register_cld_notifier(void)
1543 return rpc_pipefs_notifier_register(&nfsd4_cld_block
);
1547 unregister_cld_notifier(void)
1549 rpc_pipefs_notifier_unregister(&nfsd4_cld_block
);