4f8cc6ba7c28ea979678439b9a1b8e7ac62cc03a
[GitHub/mt8127/android_kernel_alcatel_ttab.git] / fs / nfsd / nfs4recover.c
1 /*
2 * Copyright (c) 2004 The Regents of the University of Michigan.
3 * Copyright (c) 2012 Jeff Layton <jlayton@redhat.com>
4 * All rights reserved.
5 *
6 * Andy Adamson <andros@citi.umich.edu>
7 *
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
10 * are met:
11 *
12 * 1. Redistributions of source code must retain the above copyright
13 * notice, this list of conditions and the following disclaimer.
14 * 2. Redistributions in binary form must reproduce the above copyright
15 * notice, this list of conditions and the following disclaimer in the
16 * documentation and/or other materials provided with the distribution.
17 * 3. Neither the name of the University nor the names of its
18 * contributors may be used to endorse or promote products derived
19 * from this software without specific prior written permission.
20 *
21 * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
22 * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
23 * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
24 * DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
25 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
26 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
27 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
28 * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
29 * LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
30 * NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
31 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
32 *
33 */
34
35 #include <linux/file.h>
36 #include <linux/slab.h>
37 #include <linux/namei.h>
38 #include <linux/crypto.h>
39 #include <linux/sched.h>
40 #include <linux/fs.h>
41 #include <linux/module.h>
42 #include <net/net_namespace.h>
43 #include <linux/sunrpc/rpc_pipe_fs.h>
44 #include <linux/sunrpc/clnt.h>
45 #include <linux/nfsd/cld.h>
46
47 #include "nfsd.h"
48 #include "state.h"
49 #include "vfs.h"
50 #include "netns.h"
51
52 #define NFSDDBG_FACILITY NFSDDBG_PROC
53
54 /* Declarations */
55 struct nfsd4_client_tracking_ops {
56 int (*init)(struct net *);
57 void (*exit)(struct net *);
58 void (*create)(struct nfs4_client *);
59 void (*remove)(struct nfs4_client *);
60 int (*check)(struct nfs4_client *);
61 void (*grace_done)(struct nfsd_net *, time_t);
62 };
63
64 /* Globals */
65 static char user_recovery_dirname[PATH_MAX] = "/var/lib/nfs/v4recovery";
66
67 static int
68 nfs4_save_creds(const struct cred **original_creds)
69 {
70 struct cred *new;
71
72 new = prepare_creds();
73 if (!new)
74 return -ENOMEM;
75
76 new->fsuid = GLOBAL_ROOT_UID;
77 new->fsgid = GLOBAL_ROOT_GID;
78 *original_creds = override_creds(new);
79 put_cred(new);
80 return 0;
81 }
82
/* Counterpart of nfs4_save_creds(): revert to the credentials it returned. */
static void
nfs4_reset_creds(const struct cred *original)
{
	revert_creds(original);
}
88
/*
 * Render the 16 bytes at md5 as 32 lowercase hexadecimal digits in out,
 * followed by a terminating NUL; out therefore needs room for 33 bytes.
 */
static void
md5_to_hex(char *out, char *md5)
{
	static const char digits[] = "0123456789abcdef";
	const unsigned char *src = (const unsigned char *)md5;
	const unsigned char *end = src + 16;

	while (src < end) {
		*out++ = digits[*src >> 4];
		*out++ = digits[*src & 0x0f];
		src++;
	}
	*out = '\0';
}
102
103 static int
104 nfs4_make_rec_clidname(char *dname, const struct xdr_netobj *clname)
105 {
106 struct xdr_netobj cksum;
107 struct hash_desc desc;
108 struct scatterlist sg;
109 int status;
110
111 dprintk("NFSD: nfs4_make_rec_clidname for %.*s\n",
112 clname->len, clname->data);
113 desc.flags = CRYPTO_TFM_REQ_MAY_SLEEP;
114 desc.tfm = crypto_alloc_hash("md5", 0, CRYPTO_ALG_ASYNC);
115 if (IS_ERR(desc.tfm)) {
116 status = PTR_ERR(desc.tfm);
117 goto out_no_tfm;
118 }
119
120 cksum.len = crypto_hash_digestsize(desc.tfm);
121 cksum.data = kmalloc(cksum.len, GFP_KERNEL);
122 if (cksum.data == NULL) {
123 status = -ENOMEM;
124 goto out;
125 }
126
127 sg_init_one(&sg, clname->data, clname->len);
128
129 status = crypto_hash_digest(&desc, &sg, sg.length, cksum.data);
130 if (status)
131 goto out;
132
133 md5_to_hex(dname, cksum.data);
134
135 status = 0;
136 out:
137 kfree(cksum.data);
138 crypto_free_hash(desc.tfm);
139 out_no_tfm:
140 return status;
141 }
142
143 /*
144 * If we had an error generating the recdir name for the legacy tracker
145 * then warn the admin. If the error doesn't appear to be transient,
146 * then disable recovery tracking.
147 */
148 static void
149 legacy_recdir_name_error(struct nfs4_client *clp, int error)
150 {
151 printk(KERN_ERR "NFSD: unable to generate recoverydir "
152 "name (%d).\n", error);
153
154 /*
155 * if the algorithm just doesn't exist, then disable the recovery
156 * tracker altogether. The crypto libs will generally return this if
157 * FIPS is enabled as well.
158 */
159 if (error == -ENOENT) {
160 printk(KERN_ERR "NFSD: disabling legacy clientid tracking. "
161 "Reboot recovery will not function correctly!\n");
162 nfsd4_client_tracking_exit(clp->net);
163 }
164 }
165
166 static void
167 nfsd4_create_clid_dir(struct nfs4_client *clp)
168 {
169 const struct cred *original_cred;
170 char dname[HEXDIR_LEN];
171 struct dentry *dir, *dentry;
172 struct nfs4_client_reclaim *crp;
173 int status;
174 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
175
176 dprintk("NFSD: nfsd4_create_clid_dir for \"%s\"\n", dname);
177
178 if (test_and_set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
179 return;
180 if (!nn->rec_file)
181 return;
182
183 status = nfs4_make_rec_clidname(dname, &clp->cl_name);
184 if (status)
185 return legacy_recdir_name_error(clp, status);
186
187 status = nfs4_save_creds(&original_cred);
188 if (status < 0)
189 return;
190
191 status = mnt_want_write_file(nn->rec_file);
192 if (status)
193 return;
194
195 dir = nn->rec_file->f_path.dentry;
196 /* lock the parent */
197 mutex_lock(&dir->d_inode->i_mutex);
198
199 dentry = lookup_one_len(dname, dir, HEXDIR_LEN-1);
200 if (IS_ERR(dentry)) {
201 status = PTR_ERR(dentry);
202 goto out_unlock;
203 }
204 if (dentry->d_inode)
205 /*
206 * In the 4.1 case, where we're called from
207 * reclaim_complete(), records from the previous reboot
208 * may still be left, so this is OK.
209 *
210 * In the 4.0 case, we should never get here; but we may
211 * as well be forgiving and just succeed silently.
212 */
213 goto out_put;
214 status = vfs_mkdir(dir->d_inode, dentry, S_IRWXU);
215 out_put:
216 dput(dentry);
217 out_unlock:
218 mutex_unlock(&dir->d_inode->i_mutex);
219 if (status == 0) {
220 if (nn->in_grace) {
221 crp = nfs4_client_to_reclaim(dname, nn);
222 if (crp)
223 crp->cr_clp = clp;
224 }
225 vfs_fsync(nn->rec_file, 0);
226 } else {
227 printk(KERN_ERR "NFSD: failed to write recovery record"
228 " (err %d); please check that %s exists"
229 " and is writeable", status,
230 user_recovery_dirname);
231 }
232 mnt_drop_write_file(nn->rec_file);
233 nfs4_reset_creds(original_cred);
234 }
235
/*
 * Callback run by nfsd4_list_rec_dir() on each entry it looked up: it is
 * given the recovery directory dentry, the entry's dentry and the per-net
 * nfsd state.
 */
typedef int (recdir_func)(struct dentry *parent, struct dentry *child,
			  struct nfsd_net *nn);
237
238 struct name_list {
239 char name[HEXDIR_LEN];
240 struct list_head list;
241 };
242
243 static int
244 nfsd4_build_namelist(void *arg, const char *name, int namlen,
245 loff_t offset, u64 ino, unsigned int d_type)
246 {
247 struct list_head *names = arg;
248 struct name_list *entry;
249
250 if (namlen != HEXDIR_LEN - 1)
251 return 0;
252 entry = kmalloc(sizeof(struct name_list), GFP_KERNEL);
253 if (entry == NULL)
254 return -ENOMEM;
255 memcpy(entry->name, name, HEXDIR_LEN - 1);
256 entry->name[HEXDIR_LEN - 1] = '\0';
257 list_add(&entry->list, names);
258 return 0;
259 }
260
261 static int
262 nfsd4_list_rec_dir(recdir_func *f, struct nfsd_net *nn)
263 {
264 const struct cred *original_cred;
265 struct dentry *dir = nn->rec_file->f_path.dentry;
266 struct {
267 struct dir_context ctx;
268 struct list_head names;
269 } ctx;
270 int status;
271
272 status = nfs4_save_creds(&original_cred);
273 if (status < 0)
274 return status;
275
276 status = vfs_llseek(nn->rec_file, 0, SEEK_SET);
277 if (status < 0) {
278 nfs4_reset_creds(original_cred);
279 return status;
280 }
281
282 INIT_LIST_HEAD(&ctx.names);
283 ctx.ctx.actor = nfsd4_build_namelist;
284 status = iterate_dir(nn->rec_file, &ctx.ctx);
285 mutex_lock_nested(&dir->d_inode->i_mutex, I_MUTEX_PARENT);
286 while (!list_empty(&ctx.names)) {
287 struct name_list *entry;
288 entry = list_entry(ctx.names.next, struct name_list, list);
289 if (!status) {
290 struct dentry *dentry;
291 dentry = lookup_one_len(entry->name, dir, HEXDIR_LEN-1);
292 if (IS_ERR(dentry)) {
293 status = PTR_ERR(dentry);
294 break;
295 }
296 status = f(dir, dentry, nn);
297 dput(dentry);
298 }
299 list_del(&entry->list);
300 kfree(entry);
301 }
302 mutex_unlock(&dir->d_inode->i_mutex);
303 nfs4_reset_creds(original_cred);
304 return status;
305 }
306
307 static int
308 nfsd4_unlink_clid_dir(char *name, int namlen, struct nfsd_net *nn)
309 {
310 struct dentry *dir, *dentry;
311 int status;
312
313 dprintk("NFSD: nfsd4_unlink_clid_dir. name %.*s\n", namlen, name);
314
315 dir = nn->rec_file->f_path.dentry;
316 mutex_lock_nested(&dir->d_inode->i_mutex, I_MUTEX_PARENT);
317 dentry = lookup_one_len(name, dir, namlen);
318 if (IS_ERR(dentry)) {
319 status = PTR_ERR(dentry);
320 goto out_unlock;
321 }
322 status = -ENOENT;
323 if (!dentry->d_inode)
324 goto out;
325 status = vfs_rmdir(dir->d_inode, dentry);
326 out:
327 dput(dentry);
328 out_unlock:
329 mutex_unlock(&dir->d_inode->i_mutex);
330 return status;
331 }
332
333 static void
334 nfsd4_remove_clid_dir(struct nfs4_client *clp)
335 {
336 const struct cred *original_cred;
337 struct nfs4_client_reclaim *crp;
338 char dname[HEXDIR_LEN];
339 int status;
340 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
341
342 if (!nn->rec_file || !test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
343 return;
344
345 status = nfs4_make_rec_clidname(dname, &clp->cl_name);
346 if (status)
347 return legacy_recdir_name_error(clp, status);
348
349 status = mnt_want_write_file(nn->rec_file);
350 if (status)
351 goto out;
352 clear_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
353
354 status = nfs4_save_creds(&original_cred);
355 if (status < 0)
356 goto out_drop_write;
357
358 status = nfsd4_unlink_clid_dir(dname, HEXDIR_LEN-1, nn);
359 nfs4_reset_creds(original_cred);
360 if (status == 0) {
361 vfs_fsync(nn->rec_file, 0);
362 if (nn->in_grace) {
363 /* remove reclaim record */
364 crp = nfsd4_find_reclaim_client(dname, nn);
365 if (crp)
366 nfs4_remove_reclaim_record(crp, nn);
367 }
368 }
369 out_drop_write:
370 mnt_drop_write_file(nn->rec_file);
371 out:
372 if (status)
373 printk("NFSD: Failed to remove expired client state directory"
374 " %.*s\n", HEXDIR_LEN, dname);
375 }
376
377 static int
378 purge_old(struct dentry *parent, struct dentry *child, struct nfsd_net *nn)
379 {
380 int status;
381
382 if (nfs4_has_reclaimed_state(child->d_name.name, nn))
383 return 0;
384
385 status = vfs_rmdir(parent->d_inode, child);
386 if (status)
387 printk("failed to remove client recovery directory %s\n",
388 child->d_name.name);
389 /* Keep trying, success or failure: */
390 return 0;
391 }
392
393 static void
394 nfsd4_recdir_purge_old(struct nfsd_net *nn, time_t boot_time)
395 {
396 int status;
397
398 nn->in_grace = false;
399 if (!nn->rec_file)
400 return;
401 status = mnt_want_write_file(nn->rec_file);
402 if (status)
403 goto out;
404 status = nfsd4_list_rec_dir(purge_old, nn);
405 if (status == 0)
406 vfs_fsync(nn->rec_file, 0);
407 mnt_drop_write_file(nn->rec_file);
408 out:
409 nfs4_release_reclaim(nn);
410 if (status)
411 printk("nfsd4: failed to purge old clients from recovery"
412 " directory %s\n", nn->rec_file->f_path.dentry->d_name.name);
413 }
414
415 static int
416 load_recdir(struct dentry *parent, struct dentry *child, struct nfsd_net *nn)
417 {
418 if (child->d_name.len != HEXDIR_LEN - 1) {
419 printk("nfsd4: illegal name %s in recovery directory\n",
420 child->d_name.name);
421 /* Keep trying; maybe the others are OK: */
422 return 0;
423 }
424 nfs4_client_to_reclaim(child->d_name.name, nn);
425 return 0;
426 }
427
428 static int
429 nfsd4_recdir_load(struct net *net) {
430 int status;
431 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
432
433 if (!nn->rec_file)
434 return 0;
435
436 status = nfsd4_list_rec_dir(load_recdir, nn);
437 if (status)
438 printk("nfsd4: failed loading clients from recovery"
439 " directory %s\n", nn->rec_file->f_path.dentry->d_name.name);
440 return status;
441 }
442
443 /*
444 * Hold reference to the recovery directory.
445 */
446
447 static int
448 nfsd4_init_recdir(struct net *net)
449 {
450 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
451 const struct cred *original_cred;
452 int status;
453
454 printk("NFSD: Using %s as the NFSv4 state recovery directory\n",
455 user_recovery_dirname);
456
457 BUG_ON(nn->rec_file);
458
459 status = nfs4_save_creds(&original_cred);
460 if (status < 0) {
461 printk("NFSD: Unable to change credentials to find recovery"
462 " directory: error %d\n",
463 status);
464 return status;
465 }
466
467 nn->rec_file = filp_open(user_recovery_dirname, O_RDONLY | O_DIRECTORY, 0);
468 if (IS_ERR(nn->rec_file)) {
469 printk("NFSD: unable to find recovery directory %s\n",
470 user_recovery_dirname);
471 status = PTR_ERR(nn->rec_file);
472 nn->rec_file = NULL;
473 }
474
475 nfs4_reset_creds(original_cred);
476 if (!status)
477 nn->in_grace = true;
478 return status;
479 }
480
481
482 static int
483 nfs4_legacy_state_init(struct net *net)
484 {
485 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
486 int i;
487
488 nn->reclaim_str_hashtbl = kmalloc(sizeof(struct list_head) *
489 CLIENT_HASH_SIZE, GFP_KERNEL);
490 if (!nn->reclaim_str_hashtbl)
491 return -ENOMEM;
492
493 for (i = 0; i < CLIENT_HASH_SIZE; i++)
494 INIT_LIST_HEAD(&nn->reclaim_str_hashtbl[i]);
495 nn->reclaim_str_hashtbl_size = 0;
496
497 return 0;
498 }
499
500 static void
501 nfs4_legacy_state_shutdown(struct net *net)
502 {
503 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
504
505 kfree(nn->reclaim_str_hashtbl);
506 }
507
508 static int
509 nfsd4_load_reboot_recovery_data(struct net *net)
510 {
511 int status;
512
513 status = nfsd4_init_recdir(net);
514 if (!status)
515 status = nfsd4_recdir_load(net);
516 if (status)
517 printk(KERN_ERR "NFSD: Failure reading reboot recovery data\n");
518 return status;
519 }
520
521 static int
522 nfsd4_legacy_tracking_init(struct net *net)
523 {
524 int status;
525
526 /* XXX: The legacy code won't work in a container */
527 if (net != &init_net) {
528 WARN(1, KERN_ERR "NFSD: attempt to initialize legacy client "
529 "tracking in a container!\n");
530 return -EINVAL;
531 }
532
533 status = nfs4_legacy_state_init(net);
534 if (status)
535 return status;
536
537 status = nfsd4_load_reboot_recovery_data(net);
538 if (status)
539 goto err;
540 return 0;
541
542 err:
543 nfs4_legacy_state_shutdown(net);
544 return status;
545 }
546
547 static void
548 nfsd4_shutdown_recdir(struct nfsd_net *nn)
549 {
550 if (!nn->rec_file)
551 return;
552 fput(nn->rec_file);
553 nn->rec_file = NULL;
554 }
555
556 static void
557 nfsd4_legacy_tracking_exit(struct net *net)
558 {
559 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
560
561 nfs4_release_reclaim(nn);
562 nfsd4_shutdown_recdir(nn);
563 nfs4_legacy_state_shutdown(net);
564 }
565
566 /*
567 * Change the NFSv4 recovery directory to recdir.
568 */
569 int
570 nfs4_reset_recoverydir(char *recdir)
571 {
572 int status;
573 struct path path;
574
575 status = kern_path(recdir, LOOKUP_FOLLOW, &path);
576 if (status)
577 return status;
578 status = -ENOTDIR;
579 if (S_ISDIR(path.dentry->d_inode->i_mode)) {
580 strcpy(user_recovery_dirname, recdir);
581 status = 0;
582 }
583 path_put(&path);
584 return status;
585 }
586
587 char *
588 nfs4_recoverydir(void)
589 {
590 return user_recovery_dirname;
591 }
592
593 static int
594 nfsd4_check_legacy_client(struct nfs4_client *clp)
595 {
596 int status;
597 char dname[HEXDIR_LEN];
598 struct nfs4_client_reclaim *crp;
599 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
600
601 /* did we already find that this client is stable? */
602 if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
603 return 0;
604
605 status = nfs4_make_rec_clidname(dname, &clp->cl_name);
606 if (status) {
607 legacy_recdir_name_error(clp, status);
608 return status;
609 }
610
611 /* look for it in the reclaim hashtable otherwise */
612 crp = nfsd4_find_reclaim_client(dname, nn);
613 if (crp) {
614 set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
615 crp->cr_clp = clp;
616 return 0;
617 }
618
619 return -ENOENT;
620 }
621
622 static struct nfsd4_client_tracking_ops nfsd4_legacy_tracking_ops = {
623 .init = nfsd4_legacy_tracking_init,
624 .exit = nfsd4_legacy_tracking_exit,
625 .create = nfsd4_create_clid_dir,
626 .remove = nfsd4_remove_clid_dir,
627 .check = nfsd4_check_legacy_client,
628 .grace_done = nfsd4_recdir_purge_old,
629 };
630
/*
 * Names used when registering the upcall pipe: the directory looked up
 * in the pipefs superblock, and the pipe created inside it.
 */
#define NFSD_PIPE_DIR	"nfsd"
#define NFSD_CLD_PIPE	"cld"
634
635 /* per-net-ns structure for holding cld upcall info */
636 struct cld_net {
637 struct rpc_pipe *cn_pipe;
638 spinlock_t cn_lock;
639 struct list_head cn_list;
640 unsigned int cn_xid;
641 };
642
643 struct cld_upcall {
644 struct list_head cu_list;
645 struct cld_net *cu_net;
646 struct task_struct *cu_task;
647 struct cld_msg cu_msg;
648 };
649
650 static int
651 __cld_pipe_upcall(struct rpc_pipe *pipe, struct cld_msg *cmsg)
652 {
653 int ret;
654 struct rpc_pipe_msg msg;
655
656 memset(&msg, 0, sizeof(msg));
657 msg.data = cmsg;
658 msg.len = sizeof(*cmsg);
659
660 /*
661 * Set task state before we queue the upcall. That prevents
662 * wake_up_process in the downcall from racing with schedule.
663 */
664 set_current_state(TASK_UNINTERRUPTIBLE);
665 ret = rpc_queue_upcall(pipe, &msg);
666 if (ret < 0) {
667 set_current_state(TASK_RUNNING);
668 goto out;
669 }
670
671 schedule();
672 set_current_state(TASK_RUNNING);
673
674 if (msg.errno < 0)
675 ret = msg.errno;
676 out:
677 return ret;
678 }
679
680 static int
681 cld_pipe_upcall(struct rpc_pipe *pipe, struct cld_msg *cmsg)
682 {
683 int ret;
684
685 /*
686 * -EAGAIN occurs when pipe is closed and reopened while there are
687 * upcalls queued.
688 */
689 do {
690 ret = __cld_pipe_upcall(pipe, cmsg);
691 } while (ret == -EAGAIN);
692
693 return ret;
694 }
695
696 static ssize_t
697 cld_pipe_downcall(struct file *filp, const char __user *src, size_t mlen)
698 {
699 struct cld_upcall *tmp, *cup;
700 struct cld_msg __user *cmsg = (struct cld_msg __user *)src;
701 uint32_t xid;
702 struct nfsd_net *nn = net_generic(filp->f_dentry->d_sb->s_fs_info,
703 nfsd_net_id);
704 struct cld_net *cn = nn->cld_net;
705
706 if (mlen != sizeof(*cmsg)) {
707 dprintk("%s: got %zu bytes, expected %zu\n", __func__, mlen,
708 sizeof(*cmsg));
709 return -EINVAL;
710 }
711
712 /* copy just the xid so we can try to find that */
713 if (copy_from_user(&xid, &cmsg->cm_xid, sizeof(xid)) != 0) {
714 dprintk("%s: error when copying xid from userspace", __func__);
715 return -EFAULT;
716 }
717
718 /* walk the list and find corresponding xid */
719 cup = NULL;
720 spin_lock(&cn->cn_lock);
721 list_for_each_entry(tmp, &cn->cn_list, cu_list) {
722 if (get_unaligned(&tmp->cu_msg.cm_xid) == xid) {
723 cup = tmp;
724 list_del_init(&cup->cu_list);
725 break;
726 }
727 }
728 spin_unlock(&cn->cn_lock);
729
730 /* couldn't find upcall? */
731 if (!cup) {
732 dprintk("%s: couldn't find upcall -- xid=%u\n", __func__, xid);
733 return -EINVAL;
734 }
735
736 if (copy_from_user(&cup->cu_msg, src, mlen) != 0)
737 return -EFAULT;
738
739 wake_up_process(cup->cu_task);
740 return mlen;
741 }
742
743 static void
744 cld_pipe_destroy_msg(struct rpc_pipe_msg *msg)
745 {
746 struct cld_msg *cmsg = msg->data;
747 struct cld_upcall *cup = container_of(cmsg, struct cld_upcall,
748 cu_msg);
749
750 /* errno >= 0 means we got a downcall */
751 if (msg->errno >= 0)
752 return;
753
754 wake_up_process(cup->cu_task);
755 }
756
757 static const struct rpc_pipe_ops cld_upcall_ops = {
758 .upcall = rpc_pipe_generic_upcall,
759 .downcall = cld_pipe_downcall,
760 .destroy_msg = cld_pipe_destroy_msg,
761 };
762
763 static struct dentry *
764 nfsd4_cld_register_sb(struct super_block *sb, struct rpc_pipe *pipe)
765 {
766 struct dentry *dir, *dentry;
767
768 dir = rpc_d_lookup_sb(sb, NFSD_PIPE_DIR);
769 if (dir == NULL)
770 return ERR_PTR(-ENOENT);
771 dentry = rpc_mkpipe_dentry(dir, NFSD_CLD_PIPE, NULL, pipe);
772 dput(dir);
773 return dentry;
774 }
775
776 static void
777 nfsd4_cld_unregister_sb(struct rpc_pipe *pipe)
778 {
779 if (pipe->dentry)
780 rpc_unlink(pipe->dentry);
781 }
782
783 static struct dentry *
784 nfsd4_cld_register_net(struct net *net, struct rpc_pipe *pipe)
785 {
786 struct super_block *sb;
787 struct dentry *dentry;
788
789 sb = rpc_get_sb_net(net);
790 if (!sb)
791 return NULL;
792 dentry = nfsd4_cld_register_sb(sb, pipe);
793 rpc_put_sb_net(net);
794 return dentry;
795 }
796
/*
 * Unregister pipe, provided rpc_get_sb_net() returns a superblock for
 * net; otherwise nothing is done.
 */
static void
nfsd4_cld_unregister_net(struct net *net, struct rpc_pipe *pipe)
{
	struct super_block *sb = rpc_get_sb_net(net);

	if (!sb)
		return;

	nfsd4_cld_unregister_sb(pipe);
	rpc_put_sb_net(net);
}
808
809 /* Initialize rpc_pipefs pipe for communication with client tracking daemon */
810 static int
811 nfsd4_init_cld_pipe(struct net *net)
812 {
813 int ret;
814 struct dentry *dentry;
815 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
816 struct cld_net *cn;
817
818 if (nn->cld_net)
819 return 0;
820
821 cn = kzalloc(sizeof(*cn), GFP_KERNEL);
822 if (!cn) {
823 ret = -ENOMEM;
824 goto err;
825 }
826
827 cn->cn_pipe = rpc_mkpipe_data(&cld_upcall_ops, RPC_PIPE_WAIT_FOR_OPEN);
828 if (IS_ERR(cn->cn_pipe)) {
829 ret = PTR_ERR(cn->cn_pipe);
830 goto err;
831 }
832 spin_lock_init(&cn->cn_lock);
833 INIT_LIST_HEAD(&cn->cn_list);
834
835 dentry = nfsd4_cld_register_net(net, cn->cn_pipe);
836 if (IS_ERR(dentry)) {
837 ret = PTR_ERR(dentry);
838 goto err_destroy_data;
839 }
840
841 cn->cn_pipe->dentry = dentry;
842 nn->cld_net = cn;
843 return 0;
844
845 err_destroy_data:
846 rpc_destroy_pipe_data(cn->cn_pipe);
847 err:
848 kfree(cn);
849 printk(KERN_ERR "NFSD: unable to create nfsdcld upcall pipe (%d)\n",
850 ret);
851 return ret;
852 }
853
854 static void
855 nfsd4_remove_cld_pipe(struct net *net)
856 {
857 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
858 struct cld_net *cn = nn->cld_net;
859
860 nfsd4_cld_unregister_net(net, cn->cn_pipe);
861 rpc_destroy_pipe_data(cn->cn_pipe);
862 kfree(nn->cld_net);
863 nn->cld_net = NULL;
864 }
865
866 static struct cld_upcall *
867 alloc_cld_upcall(struct cld_net *cn)
868 {
869 struct cld_upcall *new, *tmp;
870
871 new = kzalloc(sizeof(*new), GFP_KERNEL);
872 if (!new)
873 return new;
874
875 /* FIXME: hard cap on number in flight? */
876 restart_search:
877 spin_lock(&cn->cn_lock);
878 list_for_each_entry(tmp, &cn->cn_list, cu_list) {
879 if (tmp->cu_msg.cm_xid == cn->cn_xid) {
880 cn->cn_xid++;
881 spin_unlock(&cn->cn_lock);
882 goto restart_search;
883 }
884 }
885 new->cu_task = current;
886 new->cu_msg.cm_vers = CLD_UPCALL_VERSION;
887 put_unaligned(cn->cn_xid++, &new->cu_msg.cm_xid);
888 new->cu_net = cn;
889 list_add(&new->cu_list, &cn->cn_list);
890 spin_unlock(&cn->cn_lock);
891
892 dprintk("%s: allocated xid %u\n", __func__, new->cu_msg.cm_xid);
893
894 return new;
895 }
896
897 static void
898 free_cld_upcall(struct cld_upcall *victim)
899 {
900 struct cld_net *cn = victim->cu_net;
901
902 spin_lock(&cn->cn_lock);
903 list_del(&victim->cu_list);
904 spin_unlock(&cn->cn_lock);
905 kfree(victim);
906 }
907
908 /* Ask daemon to create a new record */
909 static void
910 nfsd4_cld_create(struct nfs4_client *clp)
911 {
912 int ret;
913 struct cld_upcall *cup;
914 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
915 struct cld_net *cn = nn->cld_net;
916
917 /* Don't upcall if it's already stored */
918 if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
919 return;
920
921 cup = alloc_cld_upcall(cn);
922 if (!cup) {
923 ret = -ENOMEM;
924 goto out_err;
925 }
926
927 cup->cu_msg.cm_cmd = Cld_Create;
928 cup->cu_msg.cm_u.cm_name.cn_len = clp->cl_name.len;
929 memcpy(cup->cu_msg.cm_u.cm_name.cn_id, clp->cl_name.data,
930 clp->cl_name.len);
931
932 ret = cld_pipe_upcall(cn->cn_pipe, &cup->cu_msg);
933 if (!ret) {
934 ret = cup->cu_msg.cm_status;
935 set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
936 }
937
938 free_cld_upcall(cup);
939 out_err:
940 if (ret)
941 printk(KERN_ERR "NFSD: Unable to create client "
942 "record on stable storage: %d\n", ret);
943 }
944
945 /* Ask daemon to create a new record */
946 static void
947 nfsd4_cld_remove(struct nfs4_client *clp)
948 {
949 int ret;
950 struct cld_upcall *cup;
951 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
952 struct cld_net *cn = nn->cld_net;
953
954 /* Don't upcall if it's already removed */
955 if (!test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
956 return;
957
958 cup = alloc_cld_upcall(cn);
959 if (!cup) {
960 ret = -ENOMEM;
961 goto out_err;
962 }
963
964 cup->cu_msg.cm_cmd = Cld_Remove;
965 cup->cu_msg.cm_u.cm_name.cn_len = clp->cl_name.len;
966 memcpy(cup->cu_msg.cm_u.cm_name.cn_id, clp->cl_name.data,
967 clp->cl_name.len);
968
969 ret = cld_pipe_upcall(cn->cn_pipe, &cup->cu_msg);
970 if (!ret) {
971 ret = cup->cu_msg.cm_status;
972 clear_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
973 }
974
975 free_cld_upcall(cup);
976 out_err:
977 if (ret)
978 printk(KERN_ERR "NFSD: Unable to remove client "
979 "record from stable storage: %d\n", ret);
980 }
981
982 /* Check for presence of a record, and update its timestamp */
983 static int
984 nfsd4_cld_check(struct nfs4_client *clp)
985 {
986 int ret;
987 struct cld_upcall *cup;
988 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
989 struct cld_net *cn = nn->cld_net;
990
991 /* Don't upcall if one was already stored during this grace pd */
992 if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
993 return 0;
994
995 cup = alloc_cld_upcall(cn);
996 if (!cup) {
997 printk(KERN_ERR "NFSD: Unable to check client record on "
998 "stable storage: %d\n", -ENOMEM);
999 return -ENOMEM;
1000 }
1001
1002 cup->cu_msg.cm_cmd = Cld_Check;
1003 cup->cu_msg.cm_u.cm_name.cn_len = clp->cl_name.len;
1004 memcpy(cup->cu_msg.cm_u.cm_name.cn_id, clp->cl_name.data,
1005 clp->cl_name.len);
1006
1007 ret = cld_pipe_upcall(cn->cn_pipe, &cup->cu_msg);
1008 if (!ret) {
1009 ret = cup->cu_msg.cm_status;
1010 set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
1011 }
1012
1013 free_cld_upcall(cup);
1014 return ret;
1015 }
1016
1017 static void
1018 nfsd4_cld_grace_done(struct nfsd_net *nn, time_t boot_time)
1019 {
1020 int ret;
1021 struct cld_upcall *cup;
1022 struct cld_net *cn = nn->cld_net;
1023
1024 cup = alloc_cld_upcall(cn);
1025 if (!cup) {
1026 ret = -ENOMEM;
1027 goto out_err;
1028 }
1029
1030 cup->cu_msg.cm_cmd = Cld_GraceDone;
1031 cup->cu_msg.cm_u.cm_gracetime = (int64_t)boot_time;
1032 ret = cld_pipe_upcall(cn->cn_pipe, &cup->cu_msg);
1033 if (!ret)
1034 ret = cup->cu_msg.cm_status;
1035
1036 free_cld_upcall(cup);
1037 out_err:
1038 if (ret)
1039 printk(KERN_ERR "NFSD: Unable to end grace period: %d\n", ret);
1040 }
1041
1042 static struct nfsd4_client_tracking_ops nfsd4_cld_tracking_ops = {
1043 .init = nfsd4_init_cld_pipe,
1044 .exit = nfsd4_remove_cld_pipe,
1045 .create = nfsd4_cld_create,
1046 .remove = nfsd4_cld_remove,
1047 .check = nfsd4_cld_check,
1048 .grace_done = nfsd4_cld_grace_done,
1049 };
1050
1051 /* upcall via usermodehelper */
1052 static char cltrack_prog[PATH_MAX] = "/sbin/nfsdcltrack";
1053 module_param_string(cltrack_prog, cltrack_prog, sizeof(cltrack_prog),
1054 S_IRUGO|S_IWUSR);
1055 MODULE_PARM_DESC(cltrack_prog, "Path to the nfsdcltrack upcall program");
1056
1057 static bool cltrack_legacy_disable;
1058 module_param(cltrack_legacy_disable, bool, S_IRUGO|S_IWUSR);
1059 MODULE_PARM_DESC(cltrack_legacy_disable,
1060 "Disable legacy recoverydir conversion. Default: false");
1061
1062 #define LEGACY_TOPDIR_ENV_PREFIX "NFSDCLTRACK_LEGACY_TOPDIR="
1063 #define LEGACY_RECDIR_ENV_PREFIX "NFSDCLTRACK_LEGACY_RECDIR="
1064
1065 static char *
1066 nfsd4_cltrack_legacy_topdir(void)
1067 {
1068 int copied;
1069 size_t len;
1070 char *result;
1071
1072 if (cltrack_legacy_disable)
1073 return NULL;
1074
1075 len = strlen(LEGACY_TOPDIR_ENV_PREFIX) +
1076 strlen(nfs4_recoverydir()) + 1;
1077
1078 result = kmalloc(len, GFP_KERNEL);
1079 if (!result)
1080 return result;
1081
1082 copied = snprintf(result, len, LEGACY_TOPDIR_ENV_PREFIX "%s",
1083 nfs4_recoverydir());
1084 if (copied >= len) {
1085 /* just return nothing if output was truncated */
1086 kfree(result);
1087 return NULL;
1088 }
1089
1090 return result;
1091 }
1092
1093 static char *
1094 nfsd4_cltrack_legacy_recdir(const struct xdr_netobj *name)
1095 {
1096 int copied;
1097 size_t len;
1098 char *result;
1099
1100 if (cltrack_legacy_disable)
1101 return NULL;
1102
1103 /* +1 is for '/' between "topdir" and "recdir" */
1104 len = strlen(LEGACY_RECDIR_ENV_PREFIX) +
1105 strlen(nfs4_recoverydir()) + 1 + HEXDIR_LEN;
1106
1107 result = kmalloc(len, GFP_KERNEL);
1108 if (!result)
1109 return result;
1110
1111 copied = snprintf(result, len, LEGACY_RECDIR_ENV_PREFIX "%s/",
1112 nfs4_recoverydir());
1113 if (copied > (len - HEXDIR_LEN)) {
1114 /* just return nothing if output will be truncated */
1115 kfree(result);
1116 return NULL;
1117 }
1118
1119 copied = nfs4_make_rec_clidname(result + copied, name);
1120 if (copied) {
1121 kfree(result);
1122 return NULL;
1123 }
1124
1125 return result;
1126 }
1127
1128 static int
1129 nfsd4_umh_cltrack_upcall(char *cmd, char *arg, char *legacy)
1130 {
1131 char *envp[2];
1132 char *argv[4];
1133 int ret;
1134
1135 if (unlikely(!cltrack_prog[0])) {
1136 dprintk("%s: cltrack_prog is disabled\n", __func__);
1137 return -EACCES;
1138 }
1139
1140 dprintk("%s: cmd: %s\n", __func__, cmd);
1141 dprintk("%s: arg: %s\n", __func__, arg ? arg : "(null)");
1142 dprintk("%s: legacy: %s\n", __func__, legacy ? legacy : "(null)");
1143
1144 envp[0] = legacy;
1145 envp[1] = NULL;
1146
1147 argv[0] = (char *)cltrack_prog;
1148 argv[1] = cmd;
1149 argv[2] = arg;
1150 argv[3] = NULL;
1151
1152 ret = call_usermodehelper(argv[0], argv, envp, UMH_WAIT_PROC);
1153 /*
1154 * Disable the upcall mechanism if we're getting an ENOENT or EACCES
1155 * error. The admin can re-enable it on the fly by using sysfs
1156 * once the problem has been fixed.
1157 */
1158 if (ret == -ENOENT || ret == -EACCES) {
1159 dprintk("NFSD: %s was not found or isn't executable (%d). "
1160 "Setting cltrack_prog to blank string!",
1161 cltrack_prog, ret);
1162 cltrack_prog[0] = '\0';
1163 }
1164 dprintk("%s: %s return value: %d\n", __func__, cltrack_prog, ret);
1165
1166 return ret;
1167 }
1168
1169 static char *
1170 bin_to_hex_dup(const unsigned char *src, int srclen)
1171 {
1172 int i;
1173 char *buf, *hex;
1174
1175 /* +1 for terminating NULL */
1176 buf = kmalloc((srclen * 2) + 1, GFP_KERNEL);
1177 if (!buf)
1178 return buf;
1179
1180 hex = buf;
1181 for (i = 0; i < srclen; i++) {
1182 sprintf(hex, "%2.2x", *src++);
1183 hex += 2;
1184 }
1185 return buf;
1186 }
1187
1188 static int
1189 nfsd4_umh_cltrack_init(struct net __attribute__((unused)) *net)
1190 {
1191 /* XXX: The usermode helper s not working in container yet. */
1192 if (net != &init_net) {
1193 WARN(1, KERN_ERR "NFSD: attempt to initialize umh client "
1194 "tracking in a container!\n");
1195 return -EINVAL;
1196 }
1197 return nfsd4_umh_cltrack_upcall("init", NULL, NULL);
1198 }
1199
1200 static void
1201 nfsd4_umh_cltrack_create(struct nfs4_client *clp)
1202 {
1203 char *hexid;
1204
1205 hexid = bin_to_hex_dup(clp->cl_name.data, clp->cl_name.len);
1206 if (!hexid) {
1207 dprintk("%s: can't allocate memory for upcall!\n", __func__);
1208 return;
1209 }
1210 nfsd4_umh_cltrack_upcall("create", hexid, NULL);
1211 kfree(hexid);
1212 }
1213
1214 static void
1215 nfsd4_umh_cltrack_remove(struct nfs4_client *clp)
1216 {
1217 char *hexid;
1218
1219 hexid = bin_to_hex_dup(clp->cl_name.data, clp->cl_name.len);
1220 if (!hexid) {
1221 dprintk("%s: can't allocate memory for upcall!\n", __func__);
1222 return;
1223 }
1224 nfsd4_umh_cltrack_upcall("remove", hexid, NULL);
1225 kfree(hexid);
1226 }
1227
1228 static int
1229 nfsd4_umh_cltrack_check(struct nfs4_client *clp)
1230 {
1231 int ret;
1232 char *hexid, *legacy;
1233
1234 hexid = bin_to_hex_dup(clp->cl_name.data, clp->cl_name.len);
1235 if (!hexid) {
1236 dprintk("%s: can't allocate memory for upcall!\n", __func__);
1237 return -ENOMEM;
1238 }
1239 legacy = nfsd4_cltrack_legacy_recdir(&clp->cl_name);
1240 ret = nfsd4_umh_cltrack_upcall("check", hexid, legacy);
1241 kfree(legacy);
1242 kfree(hexid);
1243 return ret;
1244 }
1245
/*
 * Issue the "gracedone" upcall, passing @boot_time formatted as a
 * decimal string together with the result of
 * nfsd4_cltrack_legacy_topdir(). The upcall's return value is not
 * examined. @nn is unused.
 */
static void
nfsd4_umh_cltrack_grace_done(struct nfsd_net __attribute__((unused)) *nn,
				time_t boot_time)
{
	char *legacy;
	/*
	 * 22 bytes covers a sign, the digits of a 64-bit value and the
	 * terminating NUL.
	 * FIXME: better way to determine max size?
	 */
	char timestr[22];

	/* bounded write: the output can never run past timestr */
	snprintf(timestr, sizeof(timestr), "%ld", boot_time);
	legacy = nfsd4_cltrack_legacy_topdir();
	nfsd4_umh_cltrack_upcall("gracedone", timestr, legacy);
	kfree(legacy);
}
1258
1259 static struct nfsd4_client_tracking_ops nfsd4_umh_tracking_ops = {
1260 .init = nfsd4_umh_cltrack_init,
1261 .exit = NULL,
1262 .create = nfsd4_umh_cltrack_create,
1263 .remove = nfsd4_umh_cltrack_remove,
1264 .check = nfsd4_umh_cltrack_check,
1265 .grace_done = nfsd4_umh_cltrack_grace_done,
1266 };
1267
1268 int
1269 nfsd4_client_tracking_init(struct net *net)
1270 {
1271 int status;
1272 struct path path;
1273 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1274
1275 /* just run the init if it the method is already decided */
1276 if (nn->client_tracking_ops)
1277 goto do_init;
1278
1279 /*
1280 * First, try a UMH upcall. It should succeed or fail quickly, so
1281 * there's little harm in trying that first.
1282 */
1283 nn->client_tracking_ops = &nfsd4_umh_tracking_ops;
1284 status = nn->client_tracking_ops->init(net);
1285 if (!status)
1286 return status;
1287
1288 /*
1289 * See if the recoverydir exists and is a directory. If it is,
1290 * then use the legacy ops.
1291 */
1292 nn->client_tracking_ops = &nfsd4_legacy_tracking_ops;
1293 status = kern_path(nfs4_recoverydir(), LOOKUP_FOLLOW, &path);
1294 if (!status) {
1295 status = S_ISDIR(path.dentry->d_inode->i_mode);
1296 path_put(&path);
1297 if (status)
1298 goto do_init;
1299 }
1300
1301 /* Finally, try to use nfsdcld */
1302 nn->client_tracking_ops = &nfsd4_cld_tracking_ops;
1303 printk(KERN_WARNING "NFSD: the nfsdcld client tracking upcall will be "
1304 "removed in 3.10. Please transition to using "
1305 "nfsdcltrack.\n");
1306 do_init:
1307 status = nn->client_tracking_ops->init(net);
1308 if (status) {
1309 printk(KERN_WARNING "NFSD: Unable to initialize client "
1310 "recovery tracking! (%d)\n", status);
1311 nn->client_tracking_ops = NULL;
1312 }
1313 return status;
1314 }
1315
1316 void
1317 nfsd4_client_tracking_exit(struct net *net)
1318 {
1319 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1320
1321 if (nn->client_tracking_ops) {
1322 if (nn->client_tracking_ops->exit)
1323 nn->client_tracking_ops->exit(net);
1324 nn->client_tracking_ops = NULL;
1325 }
1326 }
1327
1328 void
1329 nfsd4_client_record_create(struct nfs4_client *clp)
1330 {
1331 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
1332
1333 if (nn->client_tracking_ops)
1334 nn->client_tracking_ops->create(clp);
1335 }
1336
1337 void
1338 nfsd4_client_record_remove(struct nfs4_client *clp)
1339 {
1340 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
1341
1342 if (nn->client_tracking_ops)
1343 nn->client_tracking_ops->remove(clp);
1344 }
1345
1346 int
1347 nfsd4_client_record_check(struct nfs4_client *clp)
1348 {
1349 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
1350
1351 if (nn->client_tracking_ops)
1352 return nn->client_tracking_ops->check(clp);
1353
1354 return -EOPNOTSUPP;
1355 }
1356
1357 void
1358 nfsd4_record_grace_done(struct nfsd_net *nn, time_t boot_time)
1359 {
1360 if (nn->client_tracking_ops)
1361 nn->client_tracking_ops->grace_done(nn, boot_time);
1362 }
1363
1364 static int
1365 rpc_pipefs_event(struct notifier_block *nb, unsigned long event, void *ptr)
1366 {
1367 struct super_block *sb = ptr;
1368 struct net *net = sb->s_fs_info;
1369 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1370 struct cld_net *cn = nn->cld_net;
1371 struct dentry *dentry;
1372 int ret = 0;
1373
1374 if (!try_module_get(THIS_MODULE))
1375 return 0;
1376
1377 if (!cn) {
1378 module_put(THIS_MODULE);
1379 return 0;
1380 }
1381
1382 switch (event) {
1383 case RPC_PIPEFS_MOUNT:
1384 dentry = nfsd4_cld_register_sb(sb, cn->cn_pipe);
1385 if (IS_ERR(dentry)) {
1386 ret = PTR_ERR(dentry);
1387 break;
1388 }
1389 cn->cn_pipe->dentry = dentry;
1390 break;
1391 case RPC_PIPEFS_UMOUNT:
1392 if (cn->cn_pipe->dentry)
1393 nfsd4_cld_unregister_sb(cn->cn_pipe);
1394 break;
1395 default:
1396 ret = -ENOTSUPP;
1397 break;
1398 }
1399 module_put(THIS_MODULE);
1400 return ret;
1401 }
1402
1403 static struct notifier_block nfsd4_cld_block = {
1404 .notifier_call = rpc_pipefs_event,
1405 };
1406
1407 int
1408 register_cld_notifier(void)
1409 {
1410 return rpc_pipefs_notifier_register(&nfsd4_cld_block);
1411 }
1412
1413 void
1414 unregister_cld_notifier(void)
1415 {
1416 rpc_pipefs_notifier_unregister(&nfsd4_cld_block);
1417 }