45509c23c7a049c979c0d545b644cde414290293
[GitHub/mt8127/android_kernel_alcatel_ttab.git] / fs / nfsd / nfs4recover.c
1 /*
2 * Copyright (c) 2004 The Regents of the University of Michigan.
3 * Copyright (c) 2012 Jeff Layton <jlayton@redhat.com>
4 * All rights reserved.
5 *
6 * Andy Adamson <andros@citi.umich.edu>
7 *
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
10 * are met:
11 *
12 * 1. Redistributions of source code must retain the above copyright
13 * notice, this list of conditions and the following disclaimer.
14 * 2. Redistributions in binary form must reproduce the above copyright
15 * notice, this list of conditions and the following disclaimer in the
16 * documentation and/or other materials provided with the distribution.
17 * 3. Neither the name of the University nor the names of its
18 * contributors may be used to endorse or promote products derived
19 * from this software without specific prior written permission.
20 *
21 * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
22 * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
23 * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
24 * DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
25 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
26 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
27 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
28 * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
29 * LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
30 * NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
31 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
32 *
33 */
34
35 #include <linux/file.h>
36 #include <linux/slab.h>
37 #include <linux/namei.h>
38 #include <linux/crypto.h>
39 #include <linux/sched.h>
40 #include <linux/fs.h>
41 #include <linux/module.h>
42 #include <net/net_namespace.h>
43 #include <linux/sunrpc/rpc_pipe_fs.h>
44 #include <linux/sunrpc/clnt.h>
45 #include <linux/nfsd/cld.h>
46
47 #include "nfsd.h"
48 #include "state.h"
49 #include "vfs.h"
50 #include "netns.h"
51
52 #define NFSDDBG_FACILITY NFSDDBG_PROC
53
54 /* Declarations */
/*
 * Operations implemented by a client-tracking backend.  This file fills
 * in one table per backend (legacy recovery directory, nfsdcld pipe,
 * usermode helper).
 */
struct nfsd4_client_tracking_ops {
	/* set the backend up for a network namespace; 0 or negative errno */
	int (*init)(struct net *);
	/* tear the backend down; the usermode-helper table leaves this NULL */
	void (*exit)(struct net *);
	/* record a client on stable storage */
	void (*create)(struct nfs4_client *);
	/* remove a client's stable-storage record */
	void (*remove)(struct nfs4_client *);
	/* look for a client's record; 0 if found, otherwise an error */
	int (*check)(struct nfs4_client *);
	/* called with the boot time once the grace period is over */
	void (*grace_done)(struct nfsd_net *, time_t);
};
63
/*
 * Path of the legacy recovery directory.  Replaced by
 * nfs4_reset_recoverydir() and exposed through nfs4_recoverydir().
 */
static char user_recovery_dirname[PATH_MAX] = "/var/lib/nfs/v4recovery";
66
67 static int
68 nfs4_save_creds(const struct cred **original_creds)
69 {
70 struct cred *new;
71
72 new = prepare_creds();
73 if (!new)
74 return -ENOMEM;
75
76 new->fsuid = GLOBAL_ROOT_UID;
77 new->fsgid = GLOBAL_ROOT_GID;
78 *original_creds = override_creds(new);
79 put_cred(new);
80 return 0;
81 }
82
/*
 * Undo nfs4_save_creds(): reinstate the credentials it handed back in
 * @original.
 */
static void
nfs4_reset_creds(const struct cred *original)
{
	revert_creds(original);
}
88
/*
 * Write the 16 bytes at @md5 to @out as 32 lowercase hex digits followed
 * by a terminating NUL, so @out must have room for 33 bytes.
 */
static void
md5_to_hex(char *out, char *md5)
{
	/* distance to add so that digit values 10..15 land on 'a'..'f' */
	const int alpha_gap = 'a' - '9' - 1;
	int pos;

	for (pos = 0; pos < 16; pos++) {
		unsigned char byte = md5[pos];
		unsigned char hi = (byte & 0xf0) >> 4;
		unsigned char lo = byte & 0x0f;

		out[2 * pos] = '0' + hi + (hi >= 0x0a) * alpha_gap;
		out[2 * pos + 1] = '0' + lo + (lo >= 0x0a) * alpha_gap;
	}
	out[32] = '\0';
}
102
103 static int
104 nfs4_make_rec_clidname(char *dname, const struct xdr_netobj *clname)
105 {
106 struct xdr_netobj cksum;
107 struct hash_desc desc;
108 struct scatterlist sg;
109 int status;
110
111 dprintk("NFSD: nfs4_make_rec_clidname for %.*s\n",
112 clname->len, clname->data);
113 desc.flags = CRYPTO_TFM_REQ_MAY_SLEEP;
114 desc.tfm = crypto_alloc_hash("md5", 0, CRYPTO_ALG_ASYNC);
115 if (IS_ERR(desc.tfm)) {
116 status = PTR_ERR(desc.tfm);
117 goto out_no_tfm;
118 }
119
120 cksum.len = crypto_hash_digestsize(desc.tfm);
121 cksum.data = kmalloc(cksum.len, GFP_KERNEL);
122 if (cksum.data == NULL) {
123 status = -ENOMEM;
124 goto out;
125 }
126
127 sg_init_one(&sg, clname->data, clname->len);
128
129 status = crypto_hash_digest(&desc, &sg, sg.length, cksum.data);
130 if (status)
131 goto out;
132
133 md5_to_hex(dname, cksum.data);
134
135 status = 0;
136 out:
137 kfree(cksum.data);
138 crypto_free_hash(desc.tfm);
139 out_no_tfm:
140 return status;
141 }
142
143 /*
144 * If we had an error generating the recdir name for the legacy tracker
145 * then warn the admin. If the error doesn't appear to be transient,
146 * then disable recovery tracking.
147 */
148 static void
149 legacy_recdir_name_error(struct nfs4_client *clp, int error)
150 {
151 printk(KERN_ERR "NFSD: unable to generate recoverydir "
152 "name (%d).\n", error);
153
154 /*
155 * if the algorithm just doesn't exist, then disable the recovery
156 * tracker altogether. The crypto libs will generally return this if
157 * FIPS is enabled as well.
158 */
159 if (error == -ENOENT) {
160 printk(KERN_ERR "NFSD: disabling legacy clientid tracking. "
161 "Reboot recovery will not function correctly!\n");
162 nfsd4_client_tracking_exit(clp->net);
163 }
164 }
165
166 static void
167 nfsd4_create_clid_dir(struct nfs4_client *clp)
168 {
169 const struct cred *original_cred;
170 char dname[HEXDIR_LEN];
171 struct dentry *dir, *dentry;
172 struct nfs4_client_reclaim *crp;
173 int status;
174 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
175
176 dprintk("NFSD: nfsd4_create_clid_dir for \"%s\"\n", dname);
177
178 if (test_and_set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
179 return;
180 if (!nn->rec_file)
181 return;
182
183 status = nfs4_make_rec_clidname(dname, &clp->cl_name);
184 if (status)
185 return legacy_recdir_name_error(clp, status);
186
187 status = nfs4_save_creds(&original_cred);
188 if (status < 0)
189 return;
190
191 status = mnt_want_write_file(nn->rec_file);
192 if (status)
193 return;
194
195 dir = nn->rec_file->f_path.dentry;
196 /* lock the parent */
197 mutex_lock(&dir->d_inode->i_mutex);
198
199 dentry = lookup_one_len(dname, dir, HEXDIR_LEN-1);
200 if (IS_ERR(dentry)) {
201 status = PTR_ERR(dentry);
202 goto out_unlock;
203 }
204 if (dentry->d_inode)
205 /*
206 * In the 4.1 case, where we're called from
207 * reclaim_complete(), records from the previous reboot
208 * may still be left, so this is OK.
209 *
210 * In the 4.0 case, we should never get here; but we may
211 * as well be forgiving and just succeed silently.
212 */
213 goto out_put;
214 status = vfs_mkdir(dir->d_inode, dentry, S_IRWXU);
215 out_put:
216 dput(dentry);
217 out_unlock:
218 mutex_unlock(&dir->d_inode->i_mutex);
219 if (status == 0) {
220 if (nn->in_grace) {
221 crp = nfs4_client_to_reclaim(dname, nn);
222 if (crp)
223 crp->cr_clp = clp;
224 }
225 vfs_fsync(nn->rec_file, 0);
226 } else {
227 printk(KERN_ERR "NFSD: failed to write recovery record"
228 " (err %d); please check that %s exists"
229 " and is writeable", status,
230 user_recovery_dirname);
231 }
232 mnt_drop_write_file(nn->rec_file);
233 nfs4_reset_creds(original_cred);
234 }
235
/*
 * Callback applied by nfsd4_list_rec_dir() to each entry of the recovery
 * directory: (recovery dir dentry, entry dentry, per-net nfsd state).
 */
typedef int (recdir_func)(struct dentry *, struct dentry *, struct nfsd_net *);

/* one directory entry name collected by nfsd4_build_namelist() */
struct name_list {
	char name[HEXDIR_LEN];
	struct list_head list;
};

/*
 * Directory-iteration context handed to iterate_dir(), extended with the
 * list that collects the entry names.
 */
struct nfs4_dir_ctx {
	struct dir_context ctx;
	struct list_head names;
};
247
248 static int
249 nfsd4_build_namelist(void *arg, const char *name, int namlen,
250 loff_t offset, u64 ino, unsigned int d_type)
251 {
252 struct list_head *names = arg;
253 struct name_list *entry;
254
255 if (namlen != HEXDIR_LEN - 1)
256 return 0;
257 entry = kmalloc(sizeof(struct name_list), GFP_KERNEL);
258 if (entry == NULL)
259 return -ENOMEM;
260 memcpy(entry->name, name, HEXDIR_LEN - 1);
261 entry->name[HEXDIR_LEN - 1] = '\0';
262 list_add(&entry->list, &ctx->names);
263 return 0;
264 }
265
266 static int
267 nfsd4_list_rec_dir(recdir_func *f, struct nfsd_net *nn)
268 {
269 const struct cred *original_cred;
270 struct dentry *dir = nn->rec_file->f_path.dentry;
271 struct nfs4_dir_ctx ctx;
272 int status;
273
274 status = nfs4_save_creds(&original_cred);
275 if (status < 0)
276 return status;
277
278 status = vfs_llseek(nn->rec_file, 0, SEEK_SET);
279 if (status < 0) {
280 nfs4_reset_creds(original_cred);
281 return status;
282 }
283
284 INIT_LIST_HEAD(&ctx.names);
285 ctx.ctx.actor = nfsd4_build_namelist;
286 status = iterate_dir(nn->rec_file, &ctx.ctx);
287 mutex_lock_nested(&dir->d_inode->i_mutex, I_MUTEX_PARENT);
288 while (!list_empty(&ctx.names)) {
289 struct name_list *entry;
290 entry = list_entry(ctx.names.next, struct name_list, list);
291 if (!status) {
292 struct dentry *dentry;
293 dentry = lookup_one_len(entry->name, dir, HEXDIR_LEN-1);
294 if (IS_ERR(dentry)) {
295 status = PTR_ERR(dentry);
296 break;
297 }
298 status = f(dir, dentry, nn);
299 dput(dentry);
300 }
301 list_del(&entry->list);
302 kfree(entry);
303 }
304 mutex_unlock(&dir->d_inode->i_mutex);
305 nfs4_reset_creds(original_cred);
306 return status;
307 }
308
309 static int
310 nfsd4_unlink_clid_dir(char *name, int namlen, struct nfsd_net *nn)
311 {
312 struct dentry *dir, *dentry;
313 int status;
314
315 dprintk("NFSD: nfsd4_unlink_clid_dir. name %.*s\n", namlen, name);
316
317 dir = nn->rec_file->f_path.dentry;
318 mutex_lock_nested(&dir->d_inode->i_mutex, I_MUTEX_PARENT);
319 dentry = lookup_one_len(name, dir, namlen);
320 if (IS_ERR(dentry)) {
321 status = PTR_ERR(dentry);
322 goto out_unlock;
323 }
324 status = -ENOENT;
325 if (!dentry->d_inode)
326 goto out;
327 status = vfs_rmdir(dir->d_inode, dentry);
328 out:
329 dput(dentry);
330 out_unlock:
331 mutex_unlock(&dir->d_inode->i_mutex);
332 return status;
333 }
334
335 static void
336 nfsd4_remove_clid_dir(struct nfs4_client *clp)
337 {
338 const struct cred *original_cred;
339 struct nfs4_client_reclaim *crp;
340 char dname[HEXDIR_LEN];
341 int status;
342 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
343
344 if (!nn->rec_file || !test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
345 return;
346
347 status = nfs4_make_rec_clidname(dname, &clp->cl_name);
348 if (status)
349 return legacy_recdir_name_error(clp, status);
350
351 status = mnt_want_write_file(nn->rec_file);
352 if (status)
353 goto out;
354 clear_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
355
356 status = nfs4_save_creds(&original_cred);
357 if (status < 0)
358 goto out_drop_write;
359
360 status = nfsd4_unlink_clid_dir(dname, HEXDIR_LEN-1, nn);
361 nfs4_reset_creds(original_cred);
362 if (status == 0) {
363 vfs_fsync(nn->rec_file, 0);
364 if (nn->in_grace) {
365 /* remove reclaim record */
366 crp = nfsd4_find_reclaim_client(dname, nn);
367 if (crp)
368 nfs4_remove_reclaim_record(crp, nn);
369 }
370 }
371 out_drop_write:
372 mnt_drop_write_file(nn->rec_file);
373 out:
374 if (status)
375 printk("NFSD: Failed to remove expired client state directory"
376 " %.*s\n", HEXDIR_LEN, dname);
377 }
378
379 static int
380 purge_old(struct dentry *parent, struct dentry *child, struct nfsd_net *nn)
381 {
382 int status;
383
384 if (nfs4_has_reclaimed_state(child->d_name.name, nn))
385 return 0;
386
387 status = vfs_rmdir(parent->d_inode, child);
388 if (status)
389 printk("failed to remove client recovery directory %s\n",
390 child->d_name.name);
391 /* Keep trying, success or failure: */
392 return 0;
393 }
394
395 static void
396 nfsd4_recdir_purge_old(struct nfsd_net *nn, time_t boot_time)
397 {
398 int status;
399
400 nn->in_grace = false;
401 if (!nn->rec_file)
402 return;
403 status = mnt_want_write_file(nn->rec_file);
404 if (status)
405 goto out;
406 status = nfsd4_list_rec_dir(purge_old, nn);
407 if (status == 0)
408 vfs_fsync(nn->rec_file, 0);
409 mnt_drop_write_file(nn->rec_file);
410 out:
411 nfs4_release_reclaim(nn);
412 if (status)
413 printk("nfsd4: failed to purge old clients from recovery"
414 " directory %s\n", nn->rec_file->f_path.dentry->d_name.name);
415 }
416
417 static int
418 load_recdir(struct dentry *parent, struct dentry *child, struct nfsd_net *nn)
419 {
420 if (child->d_name.len != HEXDIR_LEN - 1) {
421 printk("nfsd4: illegal name %s in recovery directory\n",
422 child->d_name.name);
423 /* Keep trying; maybe the others are OK: */
424 return 0;
425 }
426 nfs4_client_to_reclaim(child->d_name.name, nn);
427 return 0;
428 }
429
430 static int
431 nfsd4_recdir_load(struct net *net) {
432 int status;
433 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
434
435 if (!nn->rec_file)
436 return 0;
437
438 status = nfsd4_list_rec_dir(load_recdir, nn);
439 if (status)
440 printk("nfsd4: failed loading clients from recovery"
441 " directory %s\n", nn->rec_file->f_path.dentry->d_name.name);
442 return status;
443 }
444
445 /*
446 * Hold reference to the recovery directory.
447 */
448
449 static int
450 nfsd4_init_recdir(struct net *net)
451 {
452 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
453 const struct cred *original_cred;
454 int status;
455
456 printk("NFSD: Using %s as the NFSv4 state recovery directory\n",
457 user_recovery_dirname);
458
459 BUG_ON(nn->rec_file);
460
461 status = nfs4_save_creds(&original_cred);
462 if (status < 0) {
463 printk("NFSD: Unable to change credentials to find recovery"
464 " directory: error %d\n",
465 status);
466 return status;
467 }
468
469 nn->rec_file = filp_open(user_recovery_dirname, O_RDONLY | O_DIRECTORY, 0);
470 if (IS_ERR(nn->rec_file)) {
471 printk("NFSD: unable to find recovery directory %s\n",
472 user_recovery_dirname);
473 status = PTR_ERR(nn->rec_file);
474 nn->rec_file = NULL;
475 }
476
477 nfs4_reset_creds(original_cred);
478 if (!status)
479 nn->in_grace = true;
480 return status;
481 }
482
483
484 static int
485 nfs4_legacy_state_init(struct net *net)
486 {
487 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
488 int i;
489
490 nn->reclaim_str_hashtbl = kmalloc(sizeof(struct list_head) *
491 CLIENT_HASH_SIZE, GFP_KERNEL);
492 if (!nn->reclaim_str_hashtbl)
493 return -ENOMEM;
494
495 for (i = 0; i < CLIENT_HASH_SIZE; i++)
496 INIT_LIST_HEAD(&nn->reclaim_str_hashtbl[i]);
497 nn->reclaim_str_hashtbl_size = 0;
498
499 return 0;
500 }
501
502 static void
503 nfs4_legacy_state_shutdown(struct net *net)
504 {
505 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
506
507 kfree(nn->reclaim_str_hashtbl);
508 }
509
510 static int
511 nfsd4_load_reboot_recovery_data(struct net *net)
512 {
513 int status;
514
515 status = nfsd4_init_recdir(net);
516 if (!status)
517 status = nfsd4_recdir_load(net);
518 if (status)
519 printk(KERN_ERR "NFSD: Failure reading reboot recovery data\n");
520 return status;
521 }
522
523 static int
524 nfsd4_legacy_tracking_init(struct net *net)
525 {
526 int status;
527
528 /* XXX: The legacy code won't work in a container */
529 if (net != &init_net) {
530 WARN(1, KERN_ERR "NFSD: attempt to initialize legacy client "
531 "tracking in a container!\n");
532 return -EINVAL;
533 }
534
535 status = nfs4_legacy_state_init(net);
536 if (status)
537 return status;
538
539 status = nfsd4_load_reboot_recovery_data(net);
540 if (status)
541 goto err;
542 return 0;
543
544 err:
545 nfs4_legacy_state_shutdown(net);
546 return status;
547 }
548
549 static void
550 nfsd4_shutdown_recdir(struct nfsd_net *nn)
551 {
552 if (!nn->rec_file)
553 return;
554 fput(nn->rec_file);
555 nn->rec_file = NULL;
556 }
557
558 static void
559 nfsd4_legacy_tracking_exit(struct net *net)
560 {
561 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
562
563 nfs4_release_reclaim(nn);
564 nfsd4_shutdown_recdir(nn);
565 nfs4_legacy_state_shutdown(net);
566 }
567
568 /*
569 * Change the NFSv4 recovery directory to recdir.
570 */
571 int
572 nfs4_reset_recoverydir(char *recdir)
573 {
574 int status;
575 struct path path;
576
577 status = kern_path(recdir, LOOKUP_FOLLOW, &path);
578 if (status)
579 return status;
580 status = -ENOTDIR;
581 if (S_ISDIR(path.dentry->d_inode->i_mode)) {
582 strcpy(user_recovery_dirname, recdir);
583 status = 0;
584 }
585 path_put(&path);
586 return status;
587 }
588
589 char *
590 nfs4_recoverydir(void)
591 {
592 return user_recovery_dirname;
593 }
594
595 static int
596 nfsd4_check_legacy_client(struct nfs4_client *clp)
597 {
598 int status;
599 char dname[HEXDIR_LEN];
600 struct nfs4_client_reclaim *crp;
601 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
602
603 /* did we already find that this client is stable? */
604 if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
605 return 0;
606
607 status = nfs4_make_rec_clidname(dname, &clp->cl_name);
608 if (status) {
609 legacy_recdir_name_error(clp, status);
610 return status;
611 }
612
613 /* look for it in the reclaim hashtable otherwise */
614 crp = nfsd4_find_reclaim_client(dname, nn);
615 if (crp) {
616 set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
617 crp->cr_clp = clp;
618 return 0;
619 }
620
621 return -ENOENT;
622 }
623
/* Tracking backend that keeps one directory per client in the recovery dir */
static struct nfsd4_client_tracking_ops nfsd4_legacy_tracking_ops = {
	.init		= nfsd4_legacy_tracking_init,
	.exit		= nfsd4_legacy_tracking_exit,
	.create		= nfsd4_create_clid_dir,
	.remove		= nfsd4_remove_clid_dir,
	.check		= nfsd4_check_legacy_client,
	.grace_done	= nfsd4_recdir_purge_old,
};
632
/* rpc_pipefs directory and pipe name used for the client tracking upcall */
#define NFSD_PIPE_DIR		"nfsd"
#define NFSD_CLD_PIPE		"cld"
636
/* per-net-ns structure for holding cld upcall info */
struct cld_net {
	struct rpc_pipe		*cn_pipe;	/* pipe the upcalls are queued on */
	spinlock_t		 cn_lock;	/* taken around cn_list / cn_xid use */
	struct list_head	 cn_list;	/* upcalls currently allocated */
	unsigned int		 cn_xid;	/* next xid candidate for an upcall */
};
644
/* one upcall to the client tracking daemon */
struct cld_upcall {
	struct list_head	 cu_list;	/* linkage on cld_net.cn_list */
	struct cld_net		*cu_net;	/* cld_net this upcall belongs to */
	struct task_struct	*cu_task;	/* task woken when the upcall is answered */
	struct cld_msg		 cu_msg;	/* message exchanged with the daemon */
};
651
652 static int
653 __cld_pipe_upcall(struct rpc_pipe *pipe, struct cld_msg *cmsg)
654 {
655 int ret;
656 struct rpc_pipe_msg msg;
657
658 memset(&msg, 0, sizeof(msg));
659 msg.data = cmsg;
660 msg.len = sizeof(*cmsg);
661
662 /*
663 * Set task state before we queue the upcall. That prevents
664 * wake_up_process in the downcall from racing with schedule.
665 */
666 set_current_state(TASK_UNINTERRUPTIBLE);
667 ret = rpc_queue_upcall(pipe, &msg);
668 if (ret < 0) {
669 set_current_state(TASK_RUNNING);
670 goto out;
671 }
672
673 schedule();
674 set_current_state(TASK_RUNNING);
675
676 if (msg.errno < 0)
677 ret = msg.errno;
678 out:
679 return ret;
680 }
681
682 static int
683 cld_pipe_upcall(struct rpc_pipe *pipe, struct cld_msg *cmsg)
684 {
685 int ret;
686
687 /*
688 * -EAGAIN occurs when pipe is closed and reopened while there are
689 * upcalls queued.
690 */
691 do {
692 ret = __cld_pipe_upcall(pipe, cmsg);
693 } while (ret == -EAGAIN);
694
695 return ret;
696 }
697
698 static ssize_t
699 cld_pipe_downcall(struct file *filp, const char __user *src, size_t mlen)
700 {
701 struct cld_upcall *tmp, *cup;
702 struct cld_msg __user *cmsg = (struct cld_msg __user *)src;
703 uint32_t xid;
704 struct nfsd_net *nn = net_generic(filp->f_dentry->d_sb->s_fs_info,
705 nfsd_net_id);
706 struct cld_net *cn = nn->cld_net;
707
708 if (mlen != sizeof(*cmsg)) {
709 dprintk("%s: got %zu bytes, expected %zu\n", __func__, mlen,
710 sizeof(*cmsg));
711 return -EINVAL;
712 }
713
714 /* copy just the xid so we can try to find that */
715 if (copy_from_user(&xid, &cmsg->cm_xid, sizeof(xid)) != 0) {
716 dprintk("%s: error when copying xid from userspace", __func__);
717 return -EFAULT;
718 }
719
720 /* walk the list and find corresponding xid */
721 cup = NULL;
722 spin_lock(&cn->cn_lock);
723 list_for_each_entry(tmp, &cn->cn_list, cu_list) {
724 if (get_unaligned(&tmp->cu_msg.cm_xid) == xid) {
725 cup = tmp;
726 list_del_init(&cup->cu_list);
727 break;
728 }
729 }
730 spin_unlock(&cn->cn_lock);
731
732 /* couldn't find upcall? */
733 if (!cup) {
734 dprintk("%s: couldn't find upcall -- xid=%u\n", __func__, xid);
735 return -EINVAL;
736 }
737
738 if (copy_from_user(&cup->cu_msg, src, mlen) != 0)
739 return -EFAULT;
740
741 wake_up_process(cup->cu_task);
742 return mlen;
743 }
744
745 static void
746 cld_pipe_destroy_msg(struct rpc_pipe_msg *msg)
747 {
748 struct cld_msg *cmsg = msg->data;
749 struct cld_upcall *cup = container_of(cmsg, struct cld_upcall,
750 cu_msg);
751
752 /* errno >= 0 means we got a downcall */
753 if (msg->errno >= 0)
754 return;
755
756 wake_up_process(cup->cu_task);
757 }
758
/* pipe operations for the cld pipe; handed to rpc_mkpipe_data() */
static const struct rpc_pipe_ops cld_upcall_ops = {
	.upcall		= rpc_pipe_generic_upcall,
	.downcall	= cld_pipe_downcall,
	.destroy_msg	= cld_pipe_destroy_msg,
};
764
765 static struct dentry *
766 nfsd4_cld_register_sb(struct super_block *sb, struct rpc_pipe *pipe)
767 {
768 struct dentry *dir, *dentry;
769
770 dir = rpc_d_lookup_sb(sb, NFSD_PIPE_DIR);
771 if (dir == NULL)
772 return ERR_PTR(-ENOENT);
773 dentry = rpc_mkpipe_dentry(dir, NFSD_CLD_PIPE, NULL, pipe);
774 dput(dir);
775 return dentry;
776 }
777
778 static void
779 nfsd4_cld_unregister_sb(struct rpc_pipe *pipe)
780 {
781 if (pipe->dentry)
782 rpc_unlink(pipe->dentry);
783 }
784
785 static struct dentry *
786 nfsd4_cld_register_net(struct net *net, struct rpc_pipe *pipe)
787 {
788 struct super_block *sb;
789 struct dentry *dentry;
790
791 sb = rpc_get_sb_net(net);
792 if (!sb)
793 return NULL;
794 dentry = nfsd4_cld_register_sb(sb, pipe);
795 rpc_put_sb_net(net);
796 return dentry;
797 }
798
799 static void
800 nfsd4_cld_unregister_net(struct net *net, struct rpc_pipe *pipe)
801 {
802 struct super_block *sb;
803
804 sb = rpc_get_sb_net(net);
805 if (sb) {
806 nfsd4_cld_unregister_sb(pipe);
807 rpc_put_sb_net(net);
808 }
809 }
810
811 /* Initialize rpc_pipefs pipe for communication with client tracking daemon */
812 static int
813 nfsd4_init_cld_pipe(struct net *net)
814 {
815 int ret;
816 struct dentry *dentry;
817 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
818 struct cld_net *cn;
819
820 if (nn->cld_net)
821 return 0;
822
823 cn = kzalloc(sizeof(*cn), GFP_KERNEL);
824 if (!cn) {
825 ret = -ENOMEM;
826 goto err;
827 }
828
829 cn->cn_pipe = rpc_mkpipe_data(&cld_upcall_ops, RPC_PIPE_WAIT_FOR_OPEN);
830 if (IS_ERR(cn->cn_pipe)) {
831 ret = PTR_ERR(cn->cn_pipe);
832 goto err;
833 }
834 spin_lock_init(&cn->cn_lock);
835 INIT_LIST_HEAD(&cn->cn_list);
836
837 dentry = nfsd4_cld_register_net(net, cn->cn_pipe);
838 if (IS_ERR(dentry)) {
839 ret = PTR_ERR(dentry);
840 goto err_destroy_data;
841 }
842
843 cn->cn_pipe->dentry = dentry;
844 nn->cld_net = cn;
845 return 0;
846
847 err_destroy_data:
848 rpc_destroy_pipe_data(cn->cn_pipe);
849 err:
850 kfree(cn);
851 printk(KERN_ERR "NFSD: unable to create nfsdcld upcall pipe (%d)\n",
852 ret);
853 return ret;
854 }
855
856 static void
857 nfsd4_remove_cld_pipe(struct net *net)
858 {
859 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
860 struct cld_net *cn = nn->cld_net;
861
862 nfsd4_cld_unregister_net(net, cn->cn_pipe);
863 rpc_destroy_pipe_data(cn->cn_pipe);
864 kfree(nn->cld_net);
865 nn->cld_net = NULL;
866 }
867
868 static struct cld_upcall *
869 alloc_cld_upcall(struct cld_net *cn)
870 {
871 struct cld_upcall *new, *tmp;
872
873 new = kzalloc(sizeof(*new), GFP_KERNEL);
874 if (!new)
875 return new;
876
877 /* FIXME: hard cap on number in flight? */
878 restart_search:
879 spin_lock(&cn->cn_lock);
880 list_for_each_entry(tmp, &cn->cn_list, cu_list) {
881 if (tmp->cu_msg.cm_xid == cn->cn_xid) {
882 cn->cn_xid++;
883 spin_unlock(&cn->cn_lock);
884 goto restart_search;
885 }
886 }
887 new->cu_task = current;
888 new->cu_msg.cm_vers = CLD_UPCALL_VERSION;
889 put_unaligned(cn->cn_xid++, &new->cu_msg.cm_xid);
890 new->cu_net = cn;
891 list_add(&new->cu_list, &cn->cn_list);
892 spin_unlock(&cn->cn_lock);
893
894 dprintk("%s: allocated xid %u\n", __func__, new->cu_msg.cm_xid);
895
896 return new;
897 }
898
899 static void
900 free_cld_upcall(struct cld_upcall *victim)
901 {
902 struct cld_net *cn = victim->cu_net;
903
904 spin_lock(&cn->cn_lock);
905 list_del(&victim->cu_list);
906 spin_unlock(&cn->cn_lock);
907 kfree(victim);
908 }
909
910 /* Ask daemon to create a new record */
911 static void
912 nfsd4_cld_create(struct nfs4_client *clp)
913 {
914 int ret;
915 struct cld_upcall *cup;
916 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
917 struct cld_net *cn = nn->cld_net;
918
919 /* Don't upcall if it's already stored */
920 if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
921 return;
922
923 cup = alloc_cld_upcall(cn);
924 if (!cup) {
925 ret = -ENOMEM;
926 goto out_err;
927 }
928
929 cup->cu_msg.cm_cmd = Cld_Create;
930 cup->cu_msg.cm_u.cm_name.cn_len = clp->cl_name.len;
931 memcpy(cup->cu_msg.cm_u.cm_name.cn_id, clp->cl_name.data,
932 clp->cl_name.len);
933
934 ret = cld_pipe_upcall(cn->cn_pipe, &cup->cu_msg);
935 if (!ret) {
936 ret = cup->cu_msg.cm_status;
937 set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
938 }
939
940 free_cld_upcall(cup);
941 out_err:
942 if (ret)
943 printk(KERN_ERR "NFSD: Unable to create client "
944 "record on stable storage: %d\n", ret);
945 }
946
947 /* Ask daemon to create a new record */
948 static void
949 nfsd4_cld_remove(struct nfs4_client *clp)
950 {
951 int ret;
952 struct cld_upcall *cup;
953 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
954 struct cld_net *cn = nn->cld_net;
955
956 /* Don't upcall if it's already removed */
957 if (!test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
958 return;
959
960 cup = alloc_cld_upcall(cn);
961 if (!cup) {
962 ret = -ENOMEM;
963 goto out_err;
964 }
965
966 cup->cu_msg.cm_cmd = Cld_Remove;
967 cup->cu_msg.cm_u.cm_name.cn_len = clp->cl_name.len;
968 memcpy(cup->cu_msg.cm_u.cm_name.cn_id, clp->cl_name.data,
969 clp->cl_name.len);
970
971 ret = cld_pipe_upcall(cn->cn_pipe, &cup->cu_msg);
972 if (!ret) {
973 ret = cup->cu_msg.cm_status;
974 clear_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
975 }
976
977 free_cld_upcall(cup);
978 out_err:
979 if (ret)
980 printk(KERN_ERR "NFSD: Unable to remove client "
981 "record from stable storage: %d\n", ret);
982 }
983
984 /* Check for presence of a record, and update its timestamp */
985 static int
986 nfsd4_cld_check(struct nfs4_client *clp)
987 {
988 int ret;
989 struct cld_upcall *cup;
990 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
991 struct cld_net *cn = nn->cld_net;
992
993 /* Don't upcall if one was already stored during this grace pd */
994 if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
995 return 0;
996
997 cup = alloc_cld_upcall(cn);
998 if (!cup) {
999 printk(KERN_ERR "NFSD: Unable to check client record on "
1000 "stable storage: %d\n", -ENOMEM);
1001 return -ENOMEM;
1002 }
1003
1004 cup->cu_msg.cm_cmd = Cld_Check;
1005 cup->cu_msg.cm_u.cm_name.cn_len = clp->cl_name.len;
1006 memcpy(cup->cu_msg.cm_u.cm_name.cn_id, clp->cl_name.data,
1007 clp->cl_name.len);
1008
1009 ret = cld_pipe_upcall(cn->cn_pipe, &cup->cu_msg);
1010 if (!ret) {
1011 ret = cup->cu_msg.cm_status;
1012 set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
1013 }
1014
1015 free_cld_upcall(cup);
1016 return ret;
1017 }
1018
1019 static void
1020 nfsd4_cld_grace_done(struct nfsd_net *nn, time_t boot_time)
1021 {
1022 int ret;
1023 struct cld_upcall *cup;
1024 struct cld_net *cn = nn->cld_net;
1025
1026 cup = alloc_cld_upcall(cn);
1027 if (!cup) {
1028 ret = -ENOMEM;
1029 goto out_err;
1030 }
1031
1032 cup->cu_msg.cm_cmd = Cld_GraceDone;
1033 cup->cu_msg.cm_u.cm_gracetime = (int64_t)boot_time;
1034 ret = cld_pipe_upcall(cn->cn_pipe, &cup->cu_msg);
1035 if (!ret)
1036 ret = cup->cu_msg.cm_status;
1037
1038 free_cld_upcall(cup);
1039 out_err:
1040 if (ret)
1041 printk(KERN_ERR "NFSD: Unable to end grace period: %d\n", ret);
1042 }
1043
/* Tracking backend that talks to the tracking daemon over the cld pipe */
static struct nfsd4_client_tracking_ops nfsd4_cld_tracking_ops = {
	.init		= nfsd4_init_cld_pipe,
	.exit		= nfsd4_remove_cld_pipe,
	.create		= nfsd4_cld_create,
	.remove		= nfsd4_cld_remove,
	.check		= nfsd4_cld_check,
	.grace_done	= nfsd4_cld_grace_done,
};
1052
/* upcall via usermodehelper */

/*
 * Program run for each upcall.  nfsd4_umh_cltrack_upcall() blanks the
 * string when the program cannot be found or executed; an empty string
 * disables the upcall.
 */
static char cltrack_prog[PATH_MAX] = "/sbin/nfsdcltrack";
module_param_string(cltrack_prog, cltrack_prog, sizeof(cltrack_prog),
			S_IRUGO|S_IWUSR);
MODULE_PARM_DESC(cltrack_prog, "Path to the nfsdcltrack upcall program");

/* when set, no legacy recovery directory info is passed to the program */
static bool cltrack_legacy_disable;
module_param(cltrack_legacy_disable, bool, S_IRUGO|S_IWUSR);
MODULE_PARM_DESC(cltrack_legacy_disable,
		"Disable legacy recoverydir conversion. Default: false");

/* prefixes of the environment strings built for the upcall program */
#define LEGACY_TOPDIR_ENV_PREFIX "NFSDCLTRACK_LEGACY_TOPDIR="
#define LEGACY_RECDIR_ENV_PREFIX "NFSDCLTRACK_LEGACY_RECDIR="
1066
1067 static char *
1068 nfsd4_cltrack_legacy_topdir(void)
1069 {
1070 int copied;
1071 size_t len;
1072 char *result;
1073
1074 if (cltrack_legacy_disable)
1075 return NULL;
1076
1077 len = strlen(LEGACY_TOPDIR_ENV_PREFIX) +
1078 strlen(nfs4_recoverydir()) + 1;
1079
1080 result = kmalloc(len, GFP_KERNEL);
1081 if (!result)
1082 return result;
1083
1084 copied = snprintf(result, len, LEGACY_TOPDIR_ENV_PREFIX "%s",
1085 nfs4_recoverydir());
1086 if (copied >= len) {
1087 /* just return nothing if output was truncated */
1088 kfree(result);
1089 return NULL;
1090 }
1091
1092 return result;
1093 }
1094
1095 static char *
1096 nfsd4_cltrack_legacy_recdir(const struct xdr_netobj *name)
1097 {
1098 int copied;
1099 size_t len;
1100 char *result;
1101
1102 if (cltrack_legacy_disable)
1103 return NULL;
1104
1105 /* +1 is for '/' between "topdir" and "recdir" */
1106 len = strlen(LEGACY_RECDIR_ENV_PREFIX) +
1107 strlen(nfs4_recoverydir()) + 1 + HEXDIR_LEN;
1108
1109 result = kmalloc(len, GFP_KERNEL);
1110 if (!result)
1111 return result;
1112
1113 copied = snprintf(result, len, LEGACY_RECDIR_ENV_PREFIX "%s/",
1114 nfs4_recoverydir());
1115 if (copied > (len - HEXDIR_LEN)) {
1116 /* just return nothing if output will be truncated */
1117 kfree(result);
1118 return NULL;
1119 }
1120
1121 copied = nfs4_make_rec_clidname(result + copied, name);
1122 if (copied) {
1123 kfree(result);
1124 return NULL;
1125 }
1126
1127 return result;
1128 }
1129
1130 static int
1131 nfsd4_umh_cltrack_upcall(char *cmd, char *arg, char *legacy)
1132 {
1133 char *envp[2];
1134 char *argv[4];
1135 int ret;
1136
1137 if (unlikely(!cltrack_prog[0])) {
1138 dprintk("%s: cltrack_prog is disabled\n", __func__);
1139 return -EACCES;
1140 }
1141
1142 dprintk("%s: cmd: %s\n", __func__, cmd);
1143 dprintk("%s: arg: %s\n", __func__, arg ? arg : "(null)");
1144 dprintk("%s: legacy: %s\n", __func__, legacy ? legacy : "(null)");
1145
1146 envp[0] = legacy;
1147 envp[1] = NULL;
1148
1149 argv[0] = (char *)cltrack_prog;
1150 argv[1] = cmd;
1151 argv[2] = arg;
1152 argv[3] = NULL;
1153
1154 ret = call_usermodehelper(argv[0], argv, envp, UMH_WAIT_PROC);
1155 /*
1156 * Disable the upcall mechanism if we're getting an ENOENT or EACCES
1157 * error. The admin can re-enable it on the fly by using sysfs
1158 * once the problem has been fixed.
1159 */
1160 if (ret == -ENOENT || ret == -EACCES) {
1161 dprintk("NFSD: %s was not found or isn't executable (%d). "
1162 "Setting cltrack_prog to blank string!",
1163 cltrack_prog, ret);
1164 cltrack_prog[0] = '\0';
1165 }
1166 dprintk("%s: %s return value: %d\n", __func__, cltrack_prog, ret);
1167
1168 return ret;
1169 }
1170
1171 static char *
1172 bin_to_hex_dup(const unsigned char *src, int srclen)
1173 {
1174 int i;
1175 char *buf, *hex;
1176
1177 /* +1 for terminating NULL */
1178 buf = kmalloc((srclen * 2) + 1, GFP_KERNEL);
1179 if (!buf)
1180 return buf;
1181
1182 hex = buf;
1183 for (i = 0; i < srclen; i++) {
1184 sprintf(hex, "%2.2x", *src++);
1185 hex += 2;
1186 }
1187 return buf;
1188 }
1189
1190 static int
1191 nfsd4_umh_cltrack_init(struct net __attribute__((unused)) *net)
1192 {
1193 /* XXX: The usermode helper s not working in container yet. */
1194 if (net != &init_net) {
1195 WARN(1, KERN_ERR "NFSD: attempt to initialize umh client "
1196 "tracking in a container!\n");
1197 return -EINVAL;
1198 }
1199 return nfsd4_umh_cltrack_upcall("init", NULL, NULL);
1200 }
1201
1202 static void
1203 nfsd4_umh_cltrack_create(struct nfs4_client *clp)
1204 {
1205 char *hexid;
1206
1207 hexid = bin_to_hex_dup(clp->cl_name.data, clp->cl_name.len);
1208 if (!hexid) {
1209 dprintk("%s: can't allocate memory for upcall!\n", __func__);
1210 return;
1211 }
1212 nfsd4_umh_cltrack_upcall("create", hexid, NULL);
1213 kfree(hexid);
1214 }
1215
1216 static void
1217 nfsd4_umh_cltrack_remove(struct nfs4_client *clp)
1218 {
1219 char *hexid;
1220
1221 hexid = bin_to_hex_dup(clp->cl_name.data, clp->cl_name.len);
1222 if (!hexid) {
1223 dprintk("%s: can't allocate memory for upcall!\n", __func__);
1224 return;
1225 }
1226 nfsd4_umh_cltrack_upcall("remove", hexid, NULL);
1227 kfree(hexid);
1228 }
1229
1230 static int
1231 nfsd4_umh_cltrack_check(struct nfs4_client *clp)
1232 {
1233 int ret;
1234 char *hexid, *legacy;
1235
1236 hexid = bin_to_hex_dup(clp->cl_name.data, clp->cl_name.len);
1237 if (!hexid) {
1238 dprintk("%s: can't allocate memory for upcall!\n", __func__);
1239 return -ENOMEM;
1240 }
1241 legacy = nfsd4_cltrack_legacy_recdir(&clp->cl_name);
1242 ret = nfsd4_umh_cltrack_upcall("check", hexid, legacy);
1243 kfree(legacy);
1244 kfree(hexid);
1245 return ret;
1246 }
1247
/*
 * Issue a "gracedone" upcall, passing @boot_time rendered as a decimal
 * string together with the string from nfsd4_cltrack_legacy_topdir().
 *
 * @nn is not used. The upcall's return value is not examined.
 */
static void
nfsd4_umh_cltrack_grace_done(struct nfsd_net __attribute__((unused)) *nn,
				time_t boot_time)
{
	/*
	 * A 64-bit signed value needs at most a sign, 19 digits and the
	 * terminating NUL (21 bytes), so 22 is enough for "%ld".
	 */
	char boot_str[22];
	char *topdir;

	snprintf(boot_str, sizeof(boot_str), "%ld", boot_time);
	topdir = nfsd4_cltrack_legacy_topdir();
	nfsd4_umh_cltrack_upcall("gracedone", boot_str, topdir);
	kfree(topdir);
}
1260
/*
 * Client tracking operations implemented with the usermode-helper
 * upcall functions above.
 */
static struct nfsd4_client_tracking_ops nfsd4_umh_tracking_ops = {
	.init		= nfsd4_umh_cltrack_init,
	/* no exit hook; nfsd4_client_tracking_exit() tests for NULL */
	.exit		= NULL,
	.create		= nfsd4_umh_cltrack_create,
	.remove		= nfsd4_umh_cltrack_remove,
	.check		= nfsd4_umh_cltrack_check,
	.grace_done	= nfsd4_umh_cltrack_grace_done,
};
1269
1270 int
1271 nfsd4_client_tracking_init(struct net *net)
1272 {
1273 int status;
1274 struct path path;
1275 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1276
1277 /* just run the init if it the method is already decided */
1278 if (nn->client_tracking_ops)
1279 goto do_init;
1280
1281 /*
1282 * First, try a UMH upcall. It should succeed or fail quickly, so
1283 * there's little harm in trying that first.
1284 */
1285 nn->client_tracking_ops = &nfsd4_umh_tracking_ops;
1286 status = nn->client_tracking_ops->init(net);
1287 if (!status)
1288 return status;
1289
1290 /*
1291 * See if the recoverydir exists and is a directory. If it is,
1292 * then use the legacy ops.
1293 */
1294 nn->client_tracking_ops = &nfsd4_legacy_tracking_ops;
1295 status = kern_path(nfs4_recoverydir(), LOOKUP_FOLLOW, &path);
1296 if (!status) {
1297 status = S_ISDIR(path.dentry->d_inode->i_mode);
1298 path_put(&path);
1299 if (status)
1300 goto do_init;
1301 }
1302
1303 /* Finally, try to use nfsdcld */
1304 nn->client_tracking_ops = &nfsd4_cld_tracking_ops;
1305 printk(KERN_WARNING "NFSD: the nfsdcld client tracking upcall will be "
1306 "removed in 3.10. Please transition to using "
1307 "nfsdcltrack.\n");
1308 do_init:
1309 status = nn->client_tracking_ops->init(net);
1310 if (status) {
1311 printk(KERN_WARNING "NFSD: Unable to initialize client "
1312 "recovery tracking! (%d)\n", status);
1313 nn->client_tracking_ops = NULL;
1314 }
1315 return status;
1316 }
1317
1318 void
1319 nfsd4_client_tracking_exit(struct net *net)
1320 {
1321 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1322
1323 if (nn->client_tracking_ops) {
1324 if (nn->client_tracking_ops->exit)
1325 nn->client_tracking_ops->exit(net);
1326 nn->client_tracking_ops = NULL;
1327 }
1328 }
1329
1330 void
1331 nfsd4_client_record_create(struct nfs4_client *clp)
1332 {
1333 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
1334
1335 if (nn->client_tracking_ops)
1336 nn->client_tracking_ops->create(clp);
1337 }
1338
1339 void
1340 nfsd4_client_record_remove(struct nfs4_client *clp)
1341 {
1342 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
1343
1344 if (nn->client_tracking_ops)
1345 nn->client_tracking_ops->remove(clp);
1346 }
1347
1348 int
1349 nfsd4_client_record_check(struct nfs4_client *clp)
1350 {
1351 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
1352
1353 if (nn->client_tracking_ops)
1354 return nn->client_tracking_ops->check(clp);
1355
1356 return -EOPNOTSUPP;
1357 }
1358
1359 void
1360 nfsd4_record_grace_done(struct nfsd_net *nn, time_t boot_time)
1361 {
1362 if (nn->client_tracking_ops)
1363 nn->client_tracking_ops->grace_done(nn, boot_time);
1364 }
1365
1366 static int
1367 rpc_pipefs_event(struct notifier_block *nb, unsigned long event, void *ptr)
1368 {
1369 struct super_block *sb = ptr;
1370 struct net *net = sb->s_fs_info;
1371 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1372 struct cld_net *cn = nn->cld_net;
1373 struct dentry *dentry;
1374 int ret = 0;
1375
1376 if (!try_module_get(THIS_MODULE))
1377 return 0;
1378
1379 if (!cn) {
1380 module_put(THIS_MODULE);
1381 return 0;
1382 }
1383
1384 switch (event) {
1385 case RPC_PIPEFS_MOUNT:
1386 dentry = nfsd4_cld_register_sb(sb, cn->cn_pipe);
1387 if (IS_ERR(dentry)) {
1388 ret = PTR_ERR(dentry);
1389 break;
1390 }
1391 cn->cn_pipe->dentry = dentry;
1392 break;
1393 case RPC_PIPEFS_UMOUNT:
1394 if (cn->cn_pipe->dentry)
1395 nfsd4_cld_unregister_sb(cn->cn_pipe);
1396 break;
1397 default:
1398 ret = -ENOTSUPP;
1399 break;
1400 }
1401 module_put(THIS_MODULE);
1402 return ret;
1403 }
1404
/*
 * Notifier block whose callback is rpc_pipefs_event(); it is registered
 * and unregistered by register_cld_notifier()/unregister_cld_notifier().
 */
static struct notifier_block nfsd4_cld_block = {
	.notifier_call = rpc_pipefs_event,
};
1408
/*
 * Register nfsd4_cld_block through rpc_pipefs_notifier_register().
 *
 * Returns whatever rpc_pipefs_notifier_register() returns.
 */
int
register_cld_notifier(void)
{
	return rpc_pipefs_notifier_register(&nfsd4_cld_block);
}
1414
/*
 * Unregister nfsd4_cld_block through rpc_pipefs_notifier_unregister().
 */
void
unregister_cld_notifier(void)
{
	rpc_pipefs_notifier_unregister(&nfsd4_cld_block);
}