nfsd4: fix crash on writing v4_end_grace before nfsd startup
[linux-2.6-block.git] / fs / nfsd / nfs4recover.c
CommitLineData
a55370a3 1/*
a55370a3 2* Copyright (c) 2004 The Regents of the University of Michigan.
f3f80148 3* Copyright (c) 2012 Jeff Layton <jlayton@redhat.com>
a55370a3
N
4* All rights reserved.
5*
6* Andy Adamson <andros@citi.umich.edu>
7*
8* Redistribution and use in source and binary forms, with or without
9* modification, are permitted provided that the following conditions
10* are met:
11*
12* 1. Redistributions of source code must retain the above copyright
13* notice, this list of conditions and the following disclaimer.
14* 2. Redistributions in binary form must reproduce the above copyright
15* notice, this list of conditions and the following disclaimer in the
16* documentation and/or other materials provided with the distribution.
17* 3. Neither the name of the University nor the names of its
18* contributors may be used to endorse or promote products derived
19* from this software without specific prior written permission.
20*
21* THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
22* WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
23* MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
24* DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
25* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
26* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
27* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
28* BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
29* LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
30* NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
31* SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
32*
33*/
34
1edb82d2 35#include <crypto/hash.h>
190e4fbf 36#include <linux/file.h>
5a0e3ad6 37#include <linux/slab.h>
190e4fbf 38#include <linux/namei.h>
e8edc6e0 39#include <linux/sched.h>
f3f80148 40#include <linux/fs.h>
813fd320 41#include <linux/module.h>
f3f80148
JL
42#include <net/net_namespace.h>
43#include <linux/sunrpc/rpc_pipe_fs.h>
44#include <linux/sunrpc/clnt.h>
45#include <linux/nfsd/cld.h>
9a74af21
BH
46
47#include "nfsd.h"
48#include "state.h"
0a3adade 49#include "vfs.h"
f3f80148 50#include "netns.h"
a55370a3
N
51
52#define NFSDDBG_FACILITY NFSDDBG_PROC
53
2a4317c5
JL
54/* Declarations */
/*
 * Method table implemented by each client-tracking backend in this file
 * (see nfsd4_legacy_tracking_ops and nfsd4_cld_tracking_ops).
 */
struct nfsd4_client_tracking_ops {
	/* per-net setup; returns 0 or a negative errno */
	int (*init)(struct net *);
	/* per-net teardown */
	void (*exit)(struct net *);
	/* record a client */
	void (*create)(struct nfs4_client *);
	/* drop a client's record */
	void (*remove)(struct nfs4_client *);
	/* look a client up; 0 when a record is found */
	int (*check)(struct nfs4_client *);
	/* called with the per-net state when the grace period is over */
	void (*grace_done)(struct nfsd_net *);
};
63
190e4fbf 64/* Globals */
48483bf2 65static char user_recovery_dirname[PATH_MAX] = "/var/lib/nfs/v4recovery";
190e4fbf 66
d84f4f99
DH
67static int
68nfs4_save_creds(const struct cred **original_creds)
190e4fbf 69{
d84f4f99
DH
70 struct cred *new;
71
72 new = prepare_creds();
73 if (!new)
74 return -ENOMEM;
75
6fab8779
EB
76 new->fsuid = GLOBAL_ROOT_UID;
77 new->fsgid = GLOBAL_ROOT_GID;
d84f4f99
DH
78 *original_creds = override_creds(new);
79 put_cred(new);
80 return 0;
190e4fbf
N
81}
82
/*
 * Counterpart of nfs4_save_creds(): put back the credentials that were
 * handed out through its @original_creds argument.
 */
static void
nfs4_reset_creds(const struct cred *original)
{
	revert_creds(original);
}
88
a55370a3
N
/*
 * Render the 16 bytes at @md5 as 32 lower-case hexadecimal digits in
 * @out, followed by a terminating NUL (33 bytes written in total).
 */
static void
md5_to_hex(char *out, char *md5)
{
	static const char hexdigits[] = "0123456789abcdef";
	const unsigned char *src = (const unsigned char *)md5;
	char *dst = out;
	int n;

	for (n = 0; n < 16; n++) {
		*dst++ = hexdigits[src[n] >> 4];	/* high nibble */
		*dst++ = hexdigits[src[n] & 0x0f];	/* low nibble */
	}
	*dst = '\0';
}
102
2216d449
JL
103static int
104nfs4_make_rec_clidname(char *dname, const struct xdr_netobj *clname)
a55370a3
N
105{
106 struct xdr_netobj cksum;
1edb82d2 107 struct crypto_shash *tfm;
2216d449 108 int status;
a55370a3
N
109
110 dprintk("NFSD: nfs4_make_rec_clidname for %.*s\n",
111 clname->len, clname->data);
1edb82d2
HX
112 tfm = crypto_alloc_shash("md5", 0, 0);
113 if (IS_ERR(tfm)) {
114 status = PTR_ERR(tfm);
35058687 115 goto out_no_tfm;
2216d449
JL
116 }
117
1edb82d2 118 cksum.len = crypto_shash_digestsize(tfm);
a55370a3 119 cksum.data = kmalloc(cksum.len, GFP_KERNEL);
2216d449
JL
120 if (cksum.data == NULL) {
121 status = -ENOMEM;
a55370a3 122 goto out;
2216d449 123 }
a55370a3 124
1edb82d2
HX
125 {
126 SHASH_DESC_ON_STACK(desc, tfm);
127
128 desc->tfm = tfm;
129 desc->flags = CRYPTO_TFM_REQ_MAY_SLEEP;
130
131 status = crypto_shash_digest(desc, clname->data, clname->len,
132 cksum.data);
133 shash_desc_zero(desc);
134 }
a55370a3 135
2216d449 136 if (status)
35058687 137 goto out;
a55370a3
N
138
139 md5_to_hex(dname, cksum.data);
140
2216d449 141 status = 0;
a55370a3 142out:
2bd9e7b6 143 kfree(cksum.data);
1edb82d2 144 crypto_free_shash(tfm);
35058687 145out_no_tfm:
a55370a3
N
146 return status;
147}
190e4fbf 148
2216d449
JL
149/*
150 * If we had an error generating the recdir name for the legacy tracker
151 * then warn the admin. If the error doesn't appear to be transient,
152 * then disable recovery tracking.
153 */
154static void
7255e716 155legacy_recdir_name_error(struct nfs4_client *clp, int error)
2216d449
JL
156{
157 printk(KERN_ERR "NFSD: unable to generate recoverydir "
158 "name (%d).\n", error);
159
160 /*
161 * if the algorithm just doesn't exist, then disable the recovery
162 * tracker altogether. The crypto libs will generally return this if
163 * FIPS is enabled as well.
164 */
165 if (error == -ENOENT) {
166 printk(KERN_ERR "NFSD: disabling legacy clientid tracking. "
167 "Reboot recovery will not function correctly!\n");
7255e716 168 nfsd4_client_tracking_exit(clp->net);
2216d449
JL
169 }
170}
171
2a4317c5
JL
172static void
173nfsd4_create_clid_dir(struct nfs4_client *clp)
c7b9a459 174{
d84f4f99 175 const struct cred *original_cred;
2216d449 176 char dname[HEXDIR_LEN];
e970a573 177 struct dentry *dir, *dentry;
0ce0c2b5 178 struct nfs4_client_reclaim *crp;
c7b9a459 179 int status;
52e19c09 180 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
c7b9a459 181
a52d726b 182 if (test_and_set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
7a6ef8c7 183 return;
3a073369 184 if (!nn->rec_file)
7a6ef8c7 185 return;
2216d449
JL
186
187 status = nfs4_make_rec_clidname(dname, &clp->cl_name);
188 if (status)
7255e716 189 return legacy_recdir_name_error(clp, status);
2216d449 190
d84f4f99
DH
191 status = nfs4_save_creds(&original_cred);
192 if (status < 0)
7a6ef8c7 193 return;
c7b9a459 194
3a073369 195 status = mnt_want_write_file(nn->rec_file);
4a55c101 196 if (status)
c2236f14 197 goto out_creds;
4a55c101 198
3a073369 199 dir = nn->rec_file->f_path.dentry;
c7b9a459 200 /* lock the parent */
5955102c 201 inode_lock(d_inode(dir));
c7b9a459 202
e970a573 203 dentry = lookup_one_len(dname, dir, HEXDIR_LEN-1);
c7b9a459
N
204 if (IS_ERR(dentry)) {
205 status = PTR_ERR(dentry);
206 goto out_unlock;
207 }
2b0143b5 208 if (d_really_is_positive(dentry))
aec39680
BF
209 /*
210 * In the 4.1 case, where we're called from
211 * reclaim_complete(), records from the previous reboot
212 * may still be left, so this is OK.
213 *
214 * In the 4.0 case, we should never get here; but we may
215 * as well be forgiving and just succeed silently.
216 */
c7b9a459 217 goto out_put;
2b0143b5 218 status = vfs_mkdir(d_inode(dir), dentry, S_IRWXU);
c7b9a459
N
219out_put:
220 dput(dentry);
221out_unlock:
5955102c 222 inode_unlock(d_inode(dir));
0ce0c2b5 223 if (status == 0) {
f141f79d 224 if (nn->in_grace) {
52e19c09 225 crp = nfs4_client_to_reclaim(dname, nn);
0ce0c2b5
JL
226 if (crp)
227 crp->cr_clp = clp;
228 }
3a073369 229 vfs_fsync(nn->rec_file, 0);
0ce0c2b5 230 } else {
6577aac0
BH
231 printk(KERN_ERR "NFSD: failed to write recovery record"
232 " (err %d); please check that %s exists"
233 " and is writeable", status,
234 user_recovery_dirname);
0ce0c2b5 235 }
3a073369 236 mnt_drop_write_file(nn->rec_file);
c2236f14 237out_creds:
d84f4f99 238 nfs4_reset_creds(original_cred);
c7b9a459
N
239}
240
/*
 * Callback invoked by nfsd4_list_rec_dir() for each collected entry:
 * (recovery directory dentry, entry dentry, per-net nfsd state).
 * A non-zero return value is passed back as the status of the walk.
 */
typedef int (recdir_func)(struct dentry *, struct dentry *, struct nfsd_net *);
190e4fbf 242
05f4f678
BF
243struct name_list {
244 char name[HEXDIR_LEN];
190e4fbf
N
245 struct list_head list;
246};
247
bb6f619b
AV
248struct nfs4_dir_ctx {
249 struct dir_context ctx;
250 struct list_head names;
251};
252
190e4fbf 253static int
ac7576f4 254nfsd4_build_namelist(struct dir_context *__ctx, const char *name, int namlen,
afefdbb2 255 loff_t offset, u64 ino, unsigned int d_type)
190e4fbf 256{
ac7576f4
MS
257 struct nfs4_dir_ctx *ctx =
258 container_of(__ctx, struct nfs4_dir_ctx, ctx);
05f4f678 259 struct name_list *entry;
190e4fbf 260
05f4f678 261 if (namlen != HEXDIR_LEN - 1)
b37ad28b 262 return 0;
05f4f678
BF
263 entry = kmalloc(sizeof(struct name_list), GFP_KERNEL);
264 if (entry == NULL)
190e4fbf 265 return -ENOMEM;
05f4f678
BF
266 memcpy(entry->name, name, HEXDIR_LEN - 1);
267 entry->name[HEXDIR_LEN - 1] = '\0';
bb6f619b 268 list_add(&entry->list, &ctx->names);
190e4fbf
N
269 return 0;
270}
271
272static int
52e19c09 273nfsd4_list_rec_dir(recdir_func *f, struct nfsd_net *nn)
190e4fbf 274{
d84f4f99 275 const struct cred *original_cred;
3a073369 276 struct dentry *dir = nn->rec_file->f_path.dentry;
ac6614b7
AV
277 struct nfs4_dir_ctx ctx = {
278 .ctx.actor = nfsd4_build_namelist,
279 .names = LIST_HEAD_INIT(ctx.names)
280 };
4691b271 281 struct name_list *entry, *tmp;
190e4fbf
N
282 int status;
283
d84f4f99
DH
284 status = nfs4_save_creds(&original_cred);
285 if (status < 0)
286 return status;
190e4fbf 287
3a073369 288 status = vfs_llseek(nn->rec_file, 0, SEEK_SET);
5b4b299c
AV
289 if (status < 0) {
290 nfs4_reset_creds(original_cred);
291 return status;
292 }
293
5c0ba4e0 294 status = iterate_dir(nn->rec_file, &ctx.ctx);
5955102c 295 inode_lock_nested(d_inode(dir), I_MUTEX_PARENT);
4691b271
KM
296
297 list_for_each_entry_safe(entry, tmp, &ctx.names, list) {
5b4b299c
AV
298 if (!status) {
299 struct dentry *dentry;
300 dentry = lookup_one_len(entry->name, dir, HEXDIR_LEN-1);
301 if (IS_ERR(dentry)) {
302 status = PTR_ERR(dentry);
303 break;
304 }
52e19c09 305 status = f(dir, dentry, nn);
5b4b299c 306 dput(dentry);
05f4f678 307 }
05f4f678
BF
308 list_del(&entry->list);
309 kfree(entry);
190e4fbf 310 }
5955102c 311 inode_unlock(d_inode(dir));
d84f4f99 312 nfs4_reset_creds(original_cred);
4691b271
KM
313
314 list_for_each_entry_safe(entry, tmp, &ctx.names, list) {
315 dprintk("NFSD: %s. Left entry %s\n", __func__, entry->name);
316 list_del(&entry->list);
317 kfree(entry);
318 }
190e4fbf
N
319 return status;
320}
321
c7b9a459 322static int
3a073369 323nfsd4_unlink_clid_dir(char *name, int namlen, struct nfsd_net *nn)
c7b9a459 324{
e970a573 325 struct dentry *dir, *dentry;
c7b9a459
N
326 int status;
327
328 dprintk("NFSD: nfsd4_unlink_clid_dir. name %.*s\n", namlen, name);
329
3a073369 330 dir = nn->rec_file->f_path.dentry;
5955102c 331 inode_lock_nested(d_inode(dir), I_MUTEX_PARENT);
e970a573 332 dentry = lookup_one_len(name, dir, namlen);
c7b9a459
N
333 if (IS_ERR(dentry)) {
334 status = PTR_ERR(dentry);
2f9092e1 335 goto out_unlock;
c7b9a459
N
336 }
337 status = -ENOENT;
2b0143b5 338 if (d_really_is_negative(dentry))
c7b9a459 339 goto out;
2b0143b5 340 status = vfs_rmdir(d_inode(dir), dentry);
c7b9a459
N
341out:
342 dput(dentry);
2f9092e1 343out_unlock:
5955102c 344 inode_unlock(d_inode(dir));
c7b9a459
N
345 return status;
346}
347
2a4317c5 348static void
c7b9a459
N
349nfsd4_remove_clid_dir(struct nfs4_client *clp)
350{
d84f4f99 351 const struct cred *original_cred;
0ce0c2b5 352 struct nfs4_client_reclaim *crp;
2216d449 353 char dname[HEXDIR_LEN];
c7b9a459 354 int status;
52e19c09 355 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
c7b9a459 356
3a073369 357 if (!nn->rec_file || !test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
c7b9a459
N
358 return;
359
2216d449
JL
360 status = nfs4_make_rec_clidname(dname, &clp->cl_name);
361 if (status)
7255e716 362 return legacy_recdir_name_error(clp, status);
2216d449 363
3a073369 364 status = mnt_want_write_file(nn->rec_file);
0622753b
DH
365 if (status)
366 goto out;
a52d726b 367 clear_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
d84f4f99
DH
368
369 status = nfs4_save_creds(&original_cred);
370 if (status < 0)
698d8d87 371 goto out_drop_write;
d84f4f99 372
3a073369 373 status = nfsd4_unlink_clid_dir(dname, HEXDIR_LEN-1, nn);
d84f4f99 374 nfs4_reset_creds(original_cred);
0ce0c2b5 375 if (status == 0) {
3a073369 376 vfs_fsync(nn->rec_file, 0);
f141f79d 377 if (nn->in_grace) {
0ce0c2b5 378 /* remove reclaim record */
52e19c09 379 crp = nfsd4_find_reclaim_client(dname, nn);
0ce0c2b5 380 if (crp)
52e19c09 381 nfs4_remove_reclaim_record(crp, nn);
0ce0c2b5
JL
382 }
383 }
698d8d87 384out_drop_write:
3a073369 385 mnt_drop_write_file(nn->rec_file);
0622753b 386out:
c7b9a459
N
387 if (status)
388 printk("NFSD: Failed to remove expired client state directory"
2216d449 389 " %.*s\n", HEXDIR_LEN, dname);
c7b9a459
N
390}
391
392static int
52e19c09 393purge_old(struct dentry *parent, struct dentry *child, struct nfsd_net *nn)
c7b9a459
N
394{
395 int status;
396
52e19c09 397 if (nfs4_has_reclaimed_state(child->d_name.name, nn))
b37ad28b 398 return 0;
c7b9a459 399
2b0143b5 400 status = vfs_rmdir(d_inode(parent), child);
c7b9a459 401 if (status)
a6a9f18f
AV
402 printk("failed to remove client recovery directory %pd\n",
403 child);
c7b9a459 404 /* Keep trying, success or failure: */
b37ad28b 405 return 0;
c7b9a459
N
406}
407
2a4317c5 408static void
919b8049 409nfsd4_recdir_purge_old(struct nfsd_net *nn)
2a4317c5 410{
c7b9a459
N
411 int status;
412
f141f79d 413 nn->in_grace = false;
3a073369 414 if (!nn->rec_file)
c7b9a459 415 return;
3a073369 416 status = mnt_want_write_file(nn->rec_file);
0622753b
DH
417 if (status)
418 goto out;
52e19c09 419 status = nfsd4_list_rec_dir(purge_old, nn);
c7b9a459 420 if (status == 0)
3a073369
SK
421 vfs_fsync(nn->rec_file, 0);
422 mnt_drop_write_file(nn->rec_file);
0622753b 423out:
52e19c09 424 nfs4_release_reclaim(nn);
c7b9a459
N
425 if (status)
426 printk("nfsd4: failed to purge old clients from recovery"
a6a9f18f 427 " directory %pD\n", nn->rec_file);
c7b9a459
N
428}
429
190e4fbf 430static int
52e19c09 431load_recdir(struct dentry *parent, struct dentry *child, struct nfsd_net *nn)
190e4fbf
N
432{
433 if (child->d_name.len != HEXDIR_LEN - 1) {
a6a9f18f
AV
434 printk("nfsd4: illegal name %pd in recovery directory\n",
435 child);
190e4fbf 436 /* Keep trying; maybe the others are OK: */
b37ad28b 437 return 0;
190e4fbf 438 }
52e19c09 439 nfs4_client_to_reclaim(child->d_name.name, nn);
b37ad28b 440 return 0;
190e4fbf
N
441}
442
2a4317c5 443static int
52e19c09 444nfsd4_recdir_load(struct net *net) {
190e4fbf 445 int status;
52e19c09 446 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
190e4fbf 447
3a073369 448 if (!nn->rec_file)
e970a573
CH
449 return 0;
450
52e19c09 451 status = nfsd4_list_rec_dir(load_recdir, nn);
190e4fbf
N
452 if (status)
453 printk("nfsd4: failed loading clients from recovery"
a6a9f18f 454 " directory %pD\n", nn->rec_file);
190e4fbf
N
455 return status;
456}
457
458/*
459 * Hold reference to the recovery directory.
460 */
461
2a4317c5 462static int
3a073369 463nfsd4_init_recdir(struct net *net)
190e4fbf 464{
3a073369 465 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
d84f4f99
DH
466 const struct cred *original_cred;
467 int status;
190e4fbf
N
468
469 printk("NFSD: Using %s as the NFSv4 state recovery directory\n",
48483bf2 470 user_recovery_dirname);
190e4fbf 471
3a073369 472 BUG_ON(nn->rec_file);
190e4fbf 473
d84f4f99
DH
474 status = nfs4_save_creds(&original_cred);
475 if (status < 0) {
476 printk("NFSD: Unable to change credentials to find recovery"
477 " directory: error %d\n",
478 status);
2a4317c5 479 return status;
d84f4f99 480 }
190e4fbf 481
3a073369
SK
482 nn->rec_file = filp_open(user_recovery_dirname, O_RDONLY | O_DIRECTORY, 0);
483 if (IS_ERR(nn->rec_file)) {
c2642ab0 484 printk("NFSD: unable to find recovery directory %s\n",
48483bf2 485 user_recovery_dirname);
3a073369
SK
486 status = PTR_ERR(nn->rec_file);
487 nn->rec_file = NULL;
e970a573 488 }
190e4fbf 489
d84f4f99 490 nfs4_reset_creds(original_cred);
0ce0c2b5 491 if (!status)
f141f79d 492 nn->in_grace = true;
2a4317c5 493 return status;
190e4fbf
N
494}
495
15d176c1
KM
496static void
497nfsd4_shutdown_recdir(struct net *net)
498{
499 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
500
501 if (!nn->rec_file)
502 return;
503 fput(nn->rec_file);
504 nn->rec_file = NULL;
505}
52e19c09
SK
506
507static int
508nfs4_legacy_state_init(struct net *net)
509{
510 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
511 int i;
512
6da2ec56
KC
513 nn->reclaim_str_hashtbl = kmalloc_array(CLIENT_HASH_SIZE,
514 sizeof(struct list_head),
515 GFP_KERNEL);
52e19c09
SK
516 if (!nn->reclaim_str_hashtbl)
517 return -ENOMEM;
518
519 for (i = 0; i < CLIENT_HASH_SIZE; i++)
520 INIT_LIST_HEAD(&nn->reclaim_str_hashtbl[i]);
521 nn->reclaim_str_hashtbl_size = 0;
522
523 return 0;
524}
525
526static void
527nfs4_legacy_state_shutdown(struct net *net)
528{
529 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
530
531 kfree(nn->reclaim_str_hashtbl);
532}
533
2a4317c5
JL
/*
 * Open the recovery directory of @net and load its entries. If loading
 * fails the directory is closed again.
 *
 * Returns 0 or the first error from nfsd4_init_recdir() /
 * nfsd4_recdir_load().
 */
static int
nfsd4_load_reboot_recovery_data(struct net *net)
{
	int status = nfsd4_init_recdir(net);

	if (!status) {
		status = nfsd4_recdir_load(net);
		if (status)
			nfsd4_shutdown_recdir(net);
	}
	return status;
}
549
550static int
551nfsd4_legacy_tracking_init(struct net *net)
552{
553 int status;
554
cc27e0d4
JL
555 /* XXX: The legacy code won't work in a container */
556 if (net != &init_net) {
46cc8ba3 557 pr_warn("NFSD: attempt to initialize legacy client tracking in a container ignored.\n");
cc27e0d4
JL
558 return -EINVAL;
559 }
560
52e19c09 561 status = nfs4_legacy_state_init(net);
2a4317c5 562 if (status)
52e19c09
SK
563 return status;
564
565 status = nfsd4_load_reboot_recovery_data(net);
566 if (status)
567 goto err;
568 return 0;
569
570err:
571 nfs4_legacy_state_shutdown(net);
2a4317c5
JL
572 return status;
573}
574
2a4317c5
JL
575static void
576nfsd4_legacy_tracking_exit(struct net *net)
577{
52e19c09
SK
578 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
579
580 nfs4_release_reclaim(nn);
15d176c1 581 nfsd4_shutdown_recdir(net);
52e19c09 582 nfs4_legacy_state_shutdown(net);
2a4317c5
JL
583}
584
48483bf2
BF
585/*
586 * Change the NFSv4 recovery directory to recdir.
587 */
588int
589nfs4_reset_recoverydir(char *recdir)
590{
591 int status;
592 struct path path;
593
594 status = kern_path(recdir, LOOKUP_FOLLOW, &path);
595 if (status)
596 return status;
597 status = -ENOTDIR;
e36cb0b8 598 if (d_is_dir(path.dentry)) {
48483bf2
BF
599 strcpy(user_recovery_dirname, recdir);
600 status = 0;
601 }
602 path_put(&path);
603 return status;
604}
605
606char *
607nfs4_recoverydir(void)
608{
609 return user_recovery_dirname;
610}
2a4317c5
JL
611
612static int
613nfsd4_check_legacy_client(struct nfs4_client *clp)
614{
2216d449
JL
615 int status;
616 char dname[HEXDIR_LEN];
0ce0c2b5 617 struct nfs4_client_reclaim *crp;
52e19c09 618 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
0ce0c2b5 619
2a4317c5
JL
620 /* did we already find that this client is stable? */
621 if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
622 return 0;
623
2216d449
JL
624 status = nfs4_make_rec_clidname(dname, &clp->cl_name);
625 if (status) {
7255e716 626 legacy_recdir_name_error(clp, status);
2216d449
JL
627 return status;
628 }
629
2a4317c5 630 /* look for it in the reclaim hashtable otherwise */
52e19c09 631 crp = nfsd4_find_reclaim_client(dname, nn);
0ce0c2b5 632 if (crp) {
2a4317c5 633 set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
0ce0c2b5 634 crp->cr_clp = clp;
2a4317c5
JL
635 return 0;
636 }
637
638 return -ENOENT;
639}
640
7c582e4f 641static const struct nfsd4_client_tracking_ops nfsd4_legacy_tracking_ops = {
52e19c09 642 .init = nfsd4_legacy_tracking_init,
2a4317c5
JL
643 .exit = nfsd4_legacy_tracking_exit,
644 .create = nfsd4_create_clid_dir,
645 .remove = nfsd4_remove_clid_dir,
646 .check = nfsd4_check_legacy_client,
647 .grace_done = nfsd4_recdir_purge_old,
648};
649
f3f80148
JL
/* Globals */

/* rpc_pipefs directory looked up by nfsd4_cld_register_sb() */
#define NFSD_PIPE_DIR		"nfsd"
/* name of the pipe created inside that directory */
#define NFSD_CLD_PIPE		"cld"
653
654/* per-net-ns structure for holding cld upcall info */
655struct cld_net {
656 struct rpc_pipe *cn_pipe;
657 spinlock_t cn_lock;
658 struct list_head cn_list;
659 unsigned int cn_xid;
660};
661
662struct cld_upcall {
663 struct list_head cu_list;
664 struct cld_net *cu_net;
665 struct task_struct *cu_task;
666 struct cld_msg cu_msg;
667};
668
669static int
670__cld_pipe_upcall(struct rpc_pipe *pipe, struct cld_msg *cmsg)
671{
672 int ret;
673 struct rpc_pipe_msg msg;
674
675 memset(&msg, 0, sizeof(msg));
676 msg.data = cmsg;
677 msg.len = sizeof(*cmsg);
678
679 /*
680 * Set task state before we queue the upcall. That prevents
681 * wake_up_process in the downcall from racing with schedule.
682 */
683 set_current_state(TASK_UNINTERRUPTIBLE);
684 ret = rpc_queue_upcall(pipe, &msg);
685 if (ret < 0) {
686 set_current_state(TASK_RUNNING);
687 goto out;
688 }
689
690 schedule();
f3f80148
JL
691
692 if (msg.errno < 0)
693 ret = msg.errno;
694out:
695 return ret;
696}
697
698static int
699cld_pipe_upcall(struct rpc_pipe *pipe, struct cld_msg *cmsg)
700{
701 int ret;
702
703 /*
704 * -EAGAIN occurs when pipe is closed and reopened while there are
705 * upcalls queued.
706 */
707 do {
708 ret = __cld_pipe_upcall(pipe, cmsg);
709 } while (ret == -EAGAIN);
710
711 return ret;
712}
713
714static ssize_t
715cld_pipe_downcall(struct file *filp, const char __user *src, size_t mlen)
716{
717 struct cld_upcall *tmp, *cup;
bc1b542b 718 struct cld_msg __user *cmsg = (struct cld_msg __user *)src;
f3f80148 719 uint32_t xid;
ef8a1a10 720 struct nfsd_net *nn = net_generic(file_inode(filp)->i_sb->s_fs_info,
f3f80148
JL
721 nfsd_net_id);
722 struct cld_net *cn = nn->cld_net;
723
724 if (mlen != sizeof(*cmsg)) {
8a7dc4b0 725 dprintk("%s: got %zu bytes, expected %zu\n", __func__, mlen,
f3f80148
JL
726 sizeof(*cmsg));
727 return -EINVAL;
728 }
729
730 /* copy just the xid so we can try to find that */
731 if (copy_from_user(&xid, &cmsg->cm_xid, sizeof(xid)) != 0) {
732 dprintk("%s: error when copying xid from userspace", __func__);
733 return -EFAULT;
734 }
735
736 /* walk the list and find corresponding xid */
737 cup = NULL;
738 spin_lock(&cn->cn_lock);
739 list_for_each_entry(tmp, &cn->cn_list, cu_list) {
740 if (get_unaligned(&tmp->cu_msg.cm_xid) == xid) {
741 cup = tmp;
742 list_del_init(&cup->cu_list);
743 break;
744 }
745 }
746 spin_unlock(&cn->cn_lock);
747
748 /* couldn't find upcall? */
749 if (!cup) {
21f72c9f 750 dprintk("%s: couldn't find upcall -- xid=%u\n", __func__, xid);
f3f80148
JL
751 return -EINVAL;
752 }
753
754 if (copy_from_user(&cup->cu_msg, src, mlen) != 0)
755 return -EFAULT;
756
757 wake_up_process(cup->cu_task);
758 return mlen;
759}
760
761static void
762cld_pipe_destroy_msg(struct rpc_pipe_msg *msg)
763{
764 struct cld_msg *cmsg = msg->data;
765 struct cld_upcall *cup = container_of(cmsg, struct cld_upcall,
766 cu_msg);
767
768 /* errno >= 0 means we got a downcall */
769 if (msg->errno >= 0)
770 return;
771
772 wake_up_process(cup->cu_task);
773}
774
775static const struct rpc_pipe_ops cld_upcall_ops = {
776 .upcall = rpc_pipe_generic_upcall,
777 .downcall = cld_pipe_downcall,
778 .destroy_msg = cld_pipe_destroy_msg,
779};
780
781static struct dentry *
782nfsd4_cld_register_sb(struct super_block *sb, struct rpc_pipe *pipe)
783{
784 struct dentry *dir, *dentry;
785
786 dir = rpc_d_lookup_sb(sb, NFSD_PIPE_DIR);
787 if (dir == NULL)
788 return ERR_PTR(-ENOENT);
789 dentry = rpc_mkpipe_dentry(dir, NFSD_CLD_PIPE, NULL, pipe);
790 dput(dir);
791 return dentry;
792}
793
794static void
795nfsd4_cld_unregister_sb(struct rpc_pipe *pipe)
796{
797 if (pipe->dentry)
798 rpc_unlink(pipe->dentry);
799}
800
801static struct dentry *
802nfsd4_cld_register_net(struct net *net, struct rpc_pipe *pipe)
803{
804 struct super_block *sb;
805 struct dentry *dentry;
806
807 sb = rpc_get_sb_net(net);
808 if (!sb)
809 return NULL;
810 dentry = nfsd4_cld_register_sb(sb, pipe);
811 rpc_put_sb_net(net);
812 return dentry;
813}
814
/*
 * Remove @pipe from rpc_pipefs. Nothing is done when rpc_get_sb_net()
 * yields no superblock for @net.
 */
static void
nfsd4_cld_unregister_net(struct net *net, struct rpc_pipe *pipe)
{
	if (!rpc_get_sb_net(net))
		return;

	nfsd4_cld_unregister_sb(pipe);
	rpc_put_sb_net(net);
}
826
827/* Initialize rpc_pipefs pipe for communication with client tracking daemon */
828static int
829nfsd4_init_cld_pipe(struct net *net)
830{
831 int ret;
832 struct dentry *dentry;
833 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
834 struct cld_net *cn;
835
836 if (nn->cld_net)
837 return 0;
838
839 cn = kzalloc(sizeof(*cn), GFP_KERNEL);
840 if (!cn) {
841 ret = -ENOMEM;
842 goto err;
843 }
844
845 cn->cn_pipe = rpc_mkpipe_data(&cld_upcall_ops, RPC_PIPE_WAIT_FOR_OPEN);
846 if (IS_ERR(cn->cn_pipe)) {
847 ret = PTR_ERR(cn->cn_pipe);
848 goto err;
849 }
850 spin_lock_init(&cn->cn_lock);
851 INIT_LIST_HEAD(&cn->cn_list);
852
853 dentry = nfsd4_cld_register_net(net, cn->cn_pipe);
854 if (IS_ERR(dentry)) {
855 ret = PTR_ERR(dentry);
856 goto err_destroy_data;
857 }
858
859 cn->cn_pipe->dentry = dentry;
860 nn->cld_net = cn;
861 return 0;
862
863err_destroy_data:
864 rpc_destroy_pipe_data(cn->cn_pipe);
865err:
866 kfree(cn);
867 printk(KERN_ERR "NFSD: unable to create nfsdcld upcall pipe (%d)\n",
868 ret);
869 return ret;
870}
871
872static void
873nfsd4_remove_cld_pipe(struct net *net)
874{
875 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
876 struct cld_net *cn = nn->cld_net;
877
878 nfsd4_cld_unregister_net(net, cn->cn_pipe);
879 rpc_destroy_pipe_data(cn->cn_pipe);
880 kfree(nn->cld_net);
881 nn->cld_net = NULL;
882}
883
884static struct cld_upcall *
885alloc_cld_upcall(struct cld_net *cn)
886{
887 struct cld_upcall *new, *tmp;
888
889 new = kzalloc(sizeof(*new), GFP_KERNEL);
890 if (!new)
891 return new;
892
893 /* FIXME: hard cap on number in flight? */
894restart_search:
895 spin_lock(&cn->cn_lock);
896 list_for_each_entry(tmp, &cn->cn_list, cu_list) {
897 if (tmp->cu_msg.cm_xid == cn->cn_xid) {
898 cn->cn_xid++;
899 spin_unlock(&cn->cn_lock);
900 goto restart_search;
901 }
902 }
903 new->cu_task = current;
904 new->cu_msg.cm_vers = CLD_UPCALL_VERSION;
905 put_unaligned(cn->cn_xid++, &new->cu_msg.cm_xid);
906 new->cu_net = cn;
907 list_add(&new->cu_list, &cn->cn_list);
908 spin_unlock(&cn->cn_lock);
909
910 dprintk("%s: allocated xid %u\n", __func__, new->cu_msg.cm_xid);
911
912 return new;
913}
914
915static void
916free_cld_upcall(struct cld_upcall *victim)
917{
918 struct cld_net *cn = victim->cu_net;
919
920 spin_lock(&cn->cn_lock);
921 list_del(&victim->cu_list);
922 spin_unlock(&cn->cn_lock);
923 kfree(victim);
924}
925
926/* Ask daemon to create a new record */
927static void
928nfsd4_cld_create(struct nfs4_client *clp)
929{
930 int ret;
931 struct cld_upcall *cup;
c212cecf 932 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
f3f80148
JL
933 struct cld_net *cn = nn->cld_net;
934
935 /* Don't upcall if it's already stored */
936 if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
937 return;
938
939 cup = alloc_cld_upcall(cn);
940 if (!cup) {
941 ret = -ENOMEM;
942 goto out_err;
943 }
944
945 cup->cu_msg.cm_cmd = Cld_Create;
946 cup->cu_msg.cm_u.cm_name.cn_len = clp->cl_name.len;
947 memcpy(cup->cu_msg.cm_u.cm_name.cn_id, clp->cl_name.data,
948 clp->cl_name.len);
949
950 ret = cld_pipe_upcall(cn->cn_pipe, &cup->cu_msg);
951 if (!ret) {
952 ret = cup->cu_msg.cm_status;
953 set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
954 }
955
956 free_cld_upcall(cup);
957out_err:
958 if (ret)
959 printk(KERN_ERR "NFSD: Unable to create client "
960 "record on stable storage: %d\n", ret);
961}
962
963/* Ask daemon to remove an existing record */
964static void
965nfsd4_cld_remove(struct nfs4_client *clp)
966{
967 int ret;
968 struct cld_upcall *cup;
c212cecf 969 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
f3f80148
JL
970 struct cld_net *cn = nn->cld_net;
971
972 /* Don't upcall if it's already removed */
973 if (!test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
974 return;
975
976 cup = alloc_cld_upcall(cn);
977 if (!cup) {
978 ret = -ENOMEM;
979 goto out_err;
980 }
981
982 cup->cu_msg.cm_cmd = Cld_Remove;
983 cup->cu_msg.cm_u.cm_name.cn_len = clp->cl_name.len;
984 memcpy(cup->cu_msg.cm_u.cm_name.cn_id, clp->cl_name.data,
985 clp->cl_name.len);
986
987 ret = cld_pipe_upcall(cn->cn_pipe, &cup->cu_msg);
988 if (!ret) {
989 ret = cup->cu_msg.cm_status;
990 clear_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
991 }
992
993 free_cld_upcall(cup);
994out_err:
995 if (ret)
996 printk(KERN_ERR "NFSD: Unable to remove client "
997 "record from stable storage: %d\n", ret);
998}
999
1000/* Check for presence of a record, and update its timestamp */
1001static int
1002nfsd4_cld_check(struct nfs4_client *clp)
1003{
1004 int ret;
1005 struct cld_upcall *cup;
c212cecf 1006 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
f3f80148
JL
1007 struct cld_net *cn = nn->cld_net;
1008
1009 /* Don't upcall if one was already stored during this grace pd */
1010 if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
1011 return 0;
1012
1013 cup = alloc_cld_upcall(cn);
1014 if (!cup) {
1015 printk(KERN_ERR "NFSD: Unable to check client record on "
1016 "stable storage: %d\n", -ENOMEM);
1017 return -ENOMEM;
1018 }
1019
1020 cup->cu_msg.cm_cmd = Cld_Check;
1021 cup->cu_msg.cm_u.cm_name.cn_len = clp->cl_name.len;
1022 memcpy(cup->cu_msg.cm_u.cm_name.cn_id, clp->cl_name.data,
1023 clp->cl_name.len);
1024
1025 ret = cld_pipe_upcall(cn->cn_pipe, &cup->cu_msg);
1026 if (!ret) {
1027 ret = cup->cu_msg.cm_status;
1028 set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
1029 }
1030
1031 free_cld_upcall(cup);
1032 return ret;
1033}
1034
1035static void
919b8049 1036nfsd4_cld_grace_done(struct nfsd_net *nn)
f3f80148
JL
1037{
1038 int ret;
1039 struct cld_upcall *cup;
f3f80148
JL
1040 struct cld_net *cn = nn->cld_net;
1041
1042 cup = alloc_cld_upcall(cn);
1043 if (!cup) {
1044 ret = -ENOMEM;
1045 goto out_err;
1046 }
1047
1048 cup->cu_msg.cm_cmd = Cld_GraceDone;
919b8049 1049 cup->cu_msg.cm_u.cm_gracetime = (int64_t)nn->boot_time;
f3f80148
JL
1050 ret = cld_pipe_upcall(cn->cn_pipe, &cup->cu_msg);
1051 if (!ret)
1052 ret = cup->cu_msg.cm_status;
1053
1054 free_cld_upcall(cup);
1055out_err:
1056 if (ret)
1057 printk(KERN_ERR "NFSD: Unable to end grace period: %d\n", ret);
1058}
1059
7c582e4f 1060static const struct nfsd4_client_tracking_ops nfsd4_cld_tracking_ops = {
f3f80148
JL
1061 .init = nfsd4_init_cld_pipe,
1062 .exit = nfsd4_remove_cld_pipe,
1063 .create = nfsd4_cld_create,
1064 .remove = nfsd4_cld_remove,
1065 .check = nfsd4_cld_check,
1066 .grace_done = nfsd4_cld_grace_done,
1067};
1068
2873d214
JL
1069/* upcall via usermodehelper */
1070static char cltrack_prog[PATH_MAX] = "/sbin/nfsdcltrack";
1071module_param_string(cltrack_prog, cltrack_prog, sizeof(cltrack_prog),
1072 S_IRUGO|S_IWUSR);
1073MODULE_PARM_DESC(cltrack_prog, "Path to the nfsdcltrack upcall program");
1074
f3aa7e24
JL
1075static bool cltrack_legacy_disable;
1076module_param(cltrack_legacy_disable, bool, S_IRUGO|S_IWUSR);
1077MODULE_PARM_DESC(cltrack_legacy_disable,
1078 "Disable legacy recoverydir conversion. Default: false");
1079
/* "NAME=" prefixes of the environment strings built by the helpers below */
#define LEGACY_TOPDIR_ENV_PREFIX	"NFSDCLTRACK_LEGACY_TOPDIR="
#define LEGACY_RECDIR_ENV_PREFIX	"NFSDCLTRACK_LEGACY_RECDIR="
#define HAS_SESSION_ENV_PREFIX		"NFSDCLTRACK_CLIENT_HAS_SESSION="
#define GRACE_START_ENV_PREFIX		"NFSDCLTRACK_GRACE_START="
f3aa7e24
JL
1084
1085static char *
1086nfsd4_cltrack_legacy_topdir(void)
1087{
1088 int copied;
1089 size_t len;
1090 char *result;
1091
1092 if (cltrack_legacy_disable)
1093 return NULL;
1094
1095 len = strlen(LEGACY_TOPDIR_ENV_PREFIX) +
1096 strlen(nfs4_recoverydir()) + 1;
1097
1098 result = kmalloc(len, GFP_KERNEL);
1099 if (!result)
1100 return result;
1101
1102 copied = snprintf(result, len, LEGACY_TOPDIR_ENV_PREFIX "%s",
1103 nfs4_recoverydir());
1104 if (copied >= len) {
1105 /* just return nothing if output was truncated */
1106 kfree(result);
1107 return NULL;
1108 }
1109
1110 return result;
1111}
1112
1113static char *
2216d449 1114nfsd4_cltrack_legacy_recdir(const struct xdr_netobj *name)
f3aa7e24
JL
1115{
1116 int copied;
1117 size_t len;
1118 char *result;
1119
1120 if (cltrack_legacy_disable)
1121 return NULL;
1122
1123 /* +1 is for '/' between "topdir" and "recdir" */
1124 len = strlen(LEGACY_RECDIR_ENV_PREFIX) +
1125 strlen(nfs4_recoverydir()) + 1 + HEXDIR_LEN;
1126
1127 result = kmalloc(len, GFP_KERNEL);
1128 if (!result)
1129 return result;
1130
2216d449
JL
1131 copied = snprintf(result, len, LEGACY_RECDIR_ENV_PREFIX "%s/",
1132 nfs4_recoverydir());
1133 if (copied > (len - HEXDIR_LEN)) {
1134 /* just return nothing if output will be truncated */
1135 kfree(result);
1136 return NULL;
1137 }
1138
1139 copied = nfs4_make_rec_clidname(result + copied, name);
1140 if (copied) {
f3aa7e24
JL
1141 kfree(result);
1142 return NULL;
1143 }
1144
1145 return result;
1146}
1147
d4318acd
JL
1148static char *
1149nfsd4_cltrack_client_has_session(struct nfs4_client *clp)
1150{
1151 int copied;
1152 size_t len;
1153 char *result;
1154
1155 /* prefix + Y/N character + terminating NULL */
1156 len = strlen(HAS_SESSION_ENV_PREFIX) + 1 + 1;
1157
1158 result = kmalloc(len, GFP_KERNEL);
1159 if (!result)
1160 return result;
1161
1162 copied = snprintf(result, len, HAS_SESSION_ENV_PREFIX "%c",
1163 clp->cl_minorversion ? 'Y' : 'N');
1164 if (copied >= len) {
1165 /* just return nothing if output was truncated */
1166 kfree(result);
1167 return NULL;
1168 }
1169
1170 return result;
1171}
1172
1173static char *
1174nfsd4_cltrack_grace_start(time_t grace_start)
1175{
1176 int copied;
1177 size_t len;
1178 char *result;
1179
1180 /* prefix + max width of int64_t string + terminating NULL */
1181 len = strlen(GRACE_START_ENV_PREFIX) + 22 + 1;
1182
1183 result = kmalloc(len, GFP_KERNEL);
1184 if (!result)
1185 return result;
1186
1187 copied = snprintf(result, len, GRACE_START_ENV_PREFIX "%ld",
1188 grace_start);
1189 if (copied >= len) {
1190 /* just return nothing if output was truncated */
1191 kfree(result);
1192 return NULL;
1193 }
1194
1195 return result;
1196}
1197
2873d214 1198static int
d4318acd 1199nfsd4_umh_cltrack_upcall(char *cmd, char *arg, char *env0, char *env1)
2873d214 1200{
d4318acd 1201 char *envp[3];
2873d214
JL
1202 char *argv[4];
1203 int ret;
1204
1205 if (unlikely(!cltrack_prog[0])) {
1206 dprintk("%s: cltrack_prog is disabled\n", __func__);
1207 return -EACCES;
1208 }
1209
1210 dprintk("%s: cmd: %s\n", __func__, cmd);
1211 dprintk("%s: arg: %s\n", __func__, arg ? arg : "(null)");
d4318acd
JL
1212 dprintk("%s: env0: %s\n", __func__, env0 ? env0 : "(null)");
1213 dprintk("%s: env1: %s\n", __func__, env1 ? env1 : "(null)");
f3aa7e24 1214
d4318acd
JL
1215 envp[0] = env0;
1216 envp[1] = env1;
1217 envp[2] = NULL;
2873d214
JL
1218
1219 argv[0] = (char *)cltrack_prog;
1220 argv[1] = cmd;
1221 argv[2] = arg;
1222 argv[3] = NULL;
1223
1224 ret = call_usermodehelper(argv[0], argv, envp, UMH_WAIT_PROC);
1225 /*
1226 * Disable the upcall mechanism if we're getting an ENOENT or EACCES
1227 * error. The admin can re-enable it on the fly by using sysfs
1228 * once the problem has been fixed.
1229 */
1230 if (ret == -ENOENT || ret == -EACCES) {
1231 dprintk("NFSD: %s was not found or isn't executable (%d). "
1232 "Setting cltrack_prog to blank string!",
1233 cltrack_prog, ret);
1234 cltrack_prog[0] = '\0';
1235 }
1236 dprintk("%s: %s return value: %d\n", __func__, cltrack_prog, ret);
1237
1238 return ret;
1239}
1240
1241static char *
1242bin_to_hex_dup(const unsigned char *src, int srclen)
1243{
1244 int i;
1245 char *buf, *hex;
1246
1247 /* +1 for terminating NULL */
1248 buf = kmalloc((srclen * 2) + 1, GFP_KERNEL);
1249 if (!buf)
1250 return buf;
1251
1252 hex = buf;
1253 for (i = 0; i < srclen; i++) {
1254 sprintf(hex, "%2.2x", *src++);
1255 hex += 2;
1256 }
1257 return buf;
1258}
1259
1260static int
d4318acd 1261nfsd4_umh_cltrack_init(struct net *net)
2873d214 1262{
d4318acd
JL
1263 int ret;
1264 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1265 char *grace_start = nfsd4_cltrack_grace_start(nn->boot_time);
1266
71a50306
SK
1267 /* XXX: The usermode helper s not working in container yet. */
1268 if (net != &init_net) {
46cc8ba3 1269 pr_warn("NFSD: attempt to initialize umh client tracking in a container ignored.\n");
956ccef3 1270 kfree(grace_start);
71a50306
SK
1271 return -EINVAL;
1272 }
d4318acd
JL
1273
1274 ret = nfsd4_umh_cltrack_upcall("init", NULL, grace_start, NULL);
1275 kfree(grace_start);
1276 return ret;
2873d214
JL
1277}
1278
d682e750
JL
1279static void
1280nfsd4_cltrack_upcall_lock(struct nfs4_client *clp)
1281{
1282 wait_on_bit_lock(&clp->cl_flags, NFSD4_CLIENT_UPCALL_LOCK,
1283 TASK_UNINTERRUPTIBLE);
1284}
1285
1286static void
1287nfsd4_cltrack_upcall_unlock(struct nfs4_client *clp)
1288{
1289 smp_mb__before_atomic();
1290 clear_bit(NFSD4_CLIENT_UPCALL_LOCK, &clp->cl_flags);
1291 smp_mb__after_atomic();
1292 wake_up_bit(&clp->cl_flags, NFSD4_CLIENT_UPCALL_LOCK);
1293}
1294
2873d214
JL
1295static void
1296nfsd4_umh_cltrack_create(struct nfs4_client *clp)
1297{
d4318acd
JL
1298 char *hexid, *has_session, *grace_start;
1299 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
2873d214 1300
65decb65
JL
1301 /*
1302 * With v4.0 clients, there's little difference in outcome between a
1303 * create and check operation, and we can end up calling into this
1304 * function multiple times per client (once for each openowner). So,
1305 * for v4.0 clients skip upcalling once the client has been recorded
1306 * on stable storage.
1307 *
1308 * For v4.1+ clients, the outcome of the two operations is different,
1309 * so we must ensure that we upcall for the create operation. v4.1+
1310 * clients call this on RECLAIM_COMPLETE though, so we should only end
1311 * up doing a single create upcall per client.
1312 */
1313 if (clp->cl_minorversion == 0 &&
1314 test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
1315 return;
1316
2873d214
JL
1317 hexid = bin_to_hex_dup(clp->cl_name.data, clp->cl_name.len);
1318 if (!hexid) {
1319 dprintk("%s: can't allocate memory for upcall!\n", __func__);
1320 return;
1321 }
d682e750 1322
d4318acd
JL
1323 has_session = nfsd4_cltrack_client_has_session(clp);
1324 grace_start = nfsd4_cltrack_grace_start(nn->boot_time);
d682e750
JL
1325
1326 nfsd4_cltrack_upcall_lock(clp);
788a7914
JL
1327 if (!nfsd4_umh_cltrack_upcall("create", hexid, has_session, grace_start))
1328 set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
d682e750
JL
1329 nfsd4_cltrack_upcall_unlock(clp);
1330
d4318acd
JL
1331 kfree(has_session);
1332 kfree(grace_start);
2873d214
JL
1333 kfree(hexid);
1334}
1335
1336static void
1337nfsd4_umh_cltrack_remove(struct nfs4_client *clp)
1338{
1339 char *hexid;
1340
788a7914
JL
1341 if (!test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
1342 return;
1343
2873d214
JL
1344 hexid = bin_to_hex_dup(clp->cl_name.data, clp->cl_name.len);
1345 if (!hexid) {
1346 dprintk("%s: can't allocate memory for upcall!\n", __func__);
1347 return;
1348 }
d682e750
JL
1349
1350 nfsd4_cltrack_upcall_lock(clp);
788a7914
JL
1351 if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags) &&
1352 nfsd4_umh_cltrack_upcall("remove", hexid, NULL, NULL) == 0)
1353 clear_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
d682e750
JL
1354 nfsd4_cltrack_upcall_unlock(clp);
1355
2873d214
JL
1356 kfree(hexid);
1357}
1358
1359static int
1360nfsd4_umh_cltrack_check(struct nfs4_client *clp)
1361{
1362 int ret;
d4318acd 1363 char *hexid, *has_session, *legacy;
2873d214 1364
788a7914
JL
1365 if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
1366 return 0;
1367
2873d214
JL
1368 hexid = bin_to_hex_dup(clp->cl_name.data, clp->cl_name.len);
1369 if (!hexid) {
1370 dprintk("%s: can't allocate memory for upcall!\n", __func__);
1371 return -ENOMEM;
1372 }
d4318acd
JL
1373
1374 has_session = nfsd4_cltrack_client_has_session(clp);
2216d449 1375 legacy = nfsd4_cltrack_legacy_recdir(&clp->cl_name);
d682e750
JL
1376
1377 nfsd4_cltrack_upcall_lock(clp);
788a7914
JL
1378 if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags)) {
1379 ret = 0;
1380 } else {
1381 ret = nfsd4_umh_cltrack_upcall("check", hexid, has_session, legacy);
1382 if (ret == 0)
1383 set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
1384 }
d682e750 1385 nfsd4_cltrack_upcall_unlock(clp);
d4318acd 1386 kfree(has_session);
f3aa7e24 1387 kfree(legacy);
2873d214 1388 kfree(hexid);
d4318acd 1389
2873d214
JL
1390 return ret;
1391}
1392
1393static void
919b8049 1394nfsd4_umh_cltrack_grace_done(struct nfsd_net *nn)
2873d214 1395{
f3aa7e24 1396 char *legacy;
2873d214
JL
1397 char timestr[22]; /* FIXME: better way to determine max size? */
1398
919b8049 1399 sprintf(timestr, "%ld", nn->boot_time);
f3aa7e24 1400 legacy = nfsd4_cltrack_legacy_topdir();
d4318acd 1401 nfsd4_umh_cltrack_upcall("gracedone", timestr, legacy, NULL);
f3aa7e24 1402 kfree(legacy);
2873d214
JL
1403}
1404
7c582e4f 1405static const struct nfsd4_client_tracking_ops nfsd4_umh_tracking_ops = {
2873d214
JL
1406 .init = nfsd4_umh_cltrack_init,
1407 .exit = NULL,
1408 .create = nfsd4_umh_cltrack_create,
1409 .remove = nfsd4_umh_cltrack_remove,
1410 .check = nfsd4_umh_cltrack_check,
1411 .grace_done = nfsd4_umh_cltrack_grace_done,
1412};
1413
2a4317c5
JL
1414int
1415nfsd4_client_tracking_init(struct net *net)
1416{
1417 int status;
f3f80148 1418 struct path path;
9a9c6478 1419 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
2a4317c5 1420
2d77bf0a 1421 /* just run the init if it the method is already decided */
9a9c6478 1422 if (nn->client_tracking_ops)
2d77bf0a
JL
1423 goto do_init;
1424
1425 /*
1426 * First, try a UMH upcall. It should succeed or fail quickly, so
1427 * there's little harm in trying that first.
1428 */
9a9c6478
SK
1429 nn->client_tracking_ops = &nfsd4_umh_tracking_ops;
1430 status = nn->client_tracking_ops->init(net);
2d77bf0a
JL
1431 if (!status)
1432 return status;
1433
1434 /*
1435 * See if the recoverydir exists and is a directory. If it is,
1436 * then use the legacy ops.
1437 */
9a9c6478 1438 nn->client_tracking_ops = &nfsd4_legacy_tracking_ops;
2d77bf0a
JL
1439 status = kern_path(nfs4_recoverydir(), LOOKUP_FOLLOW, &path);
1440 if (!status) {
e36cb0b8 1441 status = d_is_dir(path.dentry);
2d77bf0a
JL
1442 path_put(&path);
1443 if (status)
1444 goto do_init;
f3f80148 1445 }
2a4317c5 1446
2d77bf0a 1447 /* Finally, try to use nfsdcld */
9a9c6478 1448 nn->client_tracking_ops = &nfsd4_cld_tracking_ops;
8b0554e9
JL
1449 printk(KERN_WARNING "NFSD: the nfsdcld client tracking upcall will be "
1450 "removed in 3.10. Please transition to using "
1451 "nfsdcltrack.\n");
2d77bf0a 1452do_init:
9a9c6478 1453 status = nn->client_tracking_ops->init(net);
2a4317c5
JL
1454 if (status) {
1455 printk(KERN_WARNING "NFSD: Unable to initialize client "
1456 "recovery tracking! (%d)\n", status);
9a9c6478 1457 nn->client_tracking_ops = NULL;
2a4317c5
JL
1458 }
1459 return status;
1460}
1461
1462void
1463nfsd4_client_tracking_exit(struct net *net)
1464{
9a9c6478
SK
1465 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1466
1467 if (nn->client_tracking_ops) {
1468 if (nn->client_tracking_ops->exit)
1469 nn->client_tracking_ops->exit(net);
1470 nn->client_tracking_ops = NULL;
2a4317c5
JL
1471 }
1472}
1473
1474void
1475nfsd4_client_record_create(struct nfs4_client *clp)
1476{
9a9c6478
SK
1477 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
1478
1479 if (nn->client_tracking_ops)
1480 nn->client_tracking_ops->create(clp);
2a4317c5
JL
1481}
1482
1483void
1484nfsd4_client_record_remove(struct nfs4_client *clp)
1485{
9a9c6478
SK
1486 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
1487
1488 if (nn->client_tracking_ops)
1489 nn->client_tracking_ops->remove(clp);
2a4317c5
JL
1490}
1491
1492int
1493nfsd4_client_record_check(struct nfs4_client *clp)
1494{
9a9c6478
SK
1495 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
1496
1497 if (nn->client_tracking_ops)
1498 return nn->client_tracking_ops->check(clp);
2a4317c5
JL
1499
1500 return -EOPNOTSUPP;
1501}
1502
1503void
919b8049 1504nfsd4_record_grace_done(struct nfsd_net *nn)
2a4317c5 1505{
9a9c6478 1506 if (nn->client_tracking_ops)
919b8049 1507 nn->client_tracking_ops->grace_done(nn);
2a4317c5 1508}
813fd320
JL
1509
1510static int
1511rpc_pipefs_event(struct notifier_block *nb, unsigned long event, void *ptr)
1512{
1513 struct super_block *sb = ptr;
1514 struct net *net = sb->s_fs_info;
1515 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1516 struct cld_net *cn = nn->cld_net;
1517 struct dentry *dentry;
1518 int ret = 0;
1519
1520 if (!try_module_get(THIS_MODULE))
1521 return 0;
1522
1523 if (!cn) {
1524 module_put(THIS_MODULE);
1525 return 0;
1526 }
1527
1528 switch (event) {
1529 case RPC_PIPEFS_MOUNT:
1530 dentry = nfsd4_cld_register_sb(sb, cn->cn_pipe);
1531 if (IS_ERR(dentry)) {
1532 ret = PTR_ERR(dentry);
1533 break;
1534 }
1535 cn->cn_pipe->dentry = dentry;
1536 break;
1537 case RPC_PIPEFS_UMOUNT:
1538 if (cn->cn_pipe->dentry)
1539 nfsd4_cld_unregister_sb(cn->cn_pipe);
1540 break;
1541 default:
1542 ret = -ENOTSUPP;
1543 break;
1544 }
1545 module_put(THIS_MODULE);
1546 return ret;
1547}
1548
2355c596 1549static struct notifier_block nfsd4_cld_block = {
813fd320
JL
1550 .notifier_call = rpc_pipefs_event,
1551};
797a9d79
JL
1552
1553int
1554register_cld_notifier(void)
1555{
1556 return rpc_pipefs_notifier_register(&nfsd4_cld_block);
1557}
1558
1559void
1560unregister_cld_notifier(void)
1561{
1562 rpc_pipefs_notifier_unregister(&nfsd4_cld_block);
1563}