wrappers for ->i_mutex access
[linux-2.6-block.git] / fs / nfsd / nfs4recover.c
CommitLineData
a55370a3 1/*
a55370a3 2* Copyright (c) 2004 The Regents of the University of Michigan.
f3f80148 3* Copyright (c) 2012 Jeff Layton <jlayton@redhat.com>
a55370a3
N
4* All rights reserved.
5*
6* Andy Adamson <andros@citi.umich.edu>
7*
8* Redistribution and use in source and binary forms, with or without
9* modification, are permitted provided that the following conditions
10* are met:
11*
12* 1. Redistributions of source code must retain the above copyright
13* notice, this list of conditions and the following disclaimer.
14* 2. Redistributions in binary form must reproduce the above copyright
15* notice, this list of conditions and the following disclaimer in the
16* documentation and/or other materials provided with the distribution.
17* 3. Neither the name of the University nor the names of its
18* contributors may be used to endorse or promote products derived
19* from this software without specific prior written permission.
20*
21* THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
22* WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
23* MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
24* DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
25* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
26* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
27* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
28* BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
29* LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
30* NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
31* SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
32*
33*/
34
190e4fbf 35#include <linux/file.h>
5a0e3ad6 36#include <linux/slab.h>
190e4fbf 37#include <linux/namei.h>
a55370a3 38#include <linux/crypto.h>
e8edc6e0 39#include <linux/sched.h>
f3f80148 40#include <linux/fs.h>
813fd320 41#include <linux/module.h>
f3f80148
JL
42#include <net/net_namespace.h>
43#include <linux/sunrpc/rpc_pipe_fs.h>
44#include <linux/sunrpc/clnt.h>
45#include <linux/nfsd/cld.h>
9a74af21
BH
46
47#include "nfsd.h"
48#include "state.h"
0a3adade 49#include "vfs.h"
f3f80148 50#include "netns.h"
a55370a3
N
51
52#define NFSDDBG_FACILITY NFSDDBG_PROC
53
2a4317c5
JL
/* Declarations */

/*
 * Callback table implemented by each client-tracking backend defined in
 * this file (see nfsd4_legacy_tracking_ops and nfsd4_cld_tracking_ops).
 */
struct nfsd4_client_tracking_ops {
	/* set up / tear down the backend for one network namespace */
	int (*init)(struct net *);
	void (*exit)(struct net *);
	/* add / drop the stable-storage record for a client */
	void (*create)(struct nfs4_client *);
	void (*remove)(struct nfs4_client *);
	/* look for an existing record; returns 0 or a negative errno */
	int (*check)(struct nfs4_client *);
	/* invoked with the per-net nfsd state to finish the grace period */
	void (*grace_done)(struct nfsd_net *);
};
63
190e4fbf 64/* Globals */
48483bf2 65static char user_recovery_dirname[PATH_MAX] = "/var/lib/nfs/v4recovery";
190e4fbf 66
d84f4f99
DH
67static int
68nfs4_save_creds(const struct cred **original_creds)
190e4fbf 69{
d84f4f99
DH
70 struct cred *new;
71
72 new = prepare_creds();
73 if (!new)
74 return -ENOMEM;
75
6fab8779
EB
76 new->fsuid = GLOBAL_ROOT_UID;
77 new->fsgid = GLOBAL_ROOT_GID;
d84f4f99
DH
78 *original_creds = override_creds(new);
79 put_cred(new);
80 return 0;
190e4fbf
N
81}
82
/*
 * Undo nfs4_save_creds(): hand the credentials it returned back to
 * revert_creds().
 */
static void
nfs4_reset_creds(const struct cred *original)
{
	revert_creds(original);
}
88
a55370a3
N
/*
 * Render a 16-byte MD5 digest as a lowercase hexadecimal string.
 *
 * @out: destination buffer; receives 32 hex digits followed by a
 *       terminating NUL, so it must be at least 33 bytes long
 * @md5: the 16 digest bytes to encode (not modified)
 */
static void
md5_to_hex(char *out, const char *md5)
{
	static const char hex_digits[] = "0123456789abcdef";
	int i;

	for (i = 0; i < 16; i++) {
		/* go through unsigned char so bytes >= 0x80 index correctly */
		unsigned char c = md5[i];

		*out++ = hex_digits[c >> 4];
		*out++ = hex_digits[c & 0x0f];
	}
	*out = '\0';
}
102
2216d449
JL
103static int
104nfs4_make_rec_clidname(char *dname, const struct xdr_netobj *clname)
a55370a3
N
105{
106 struct xdr_netobj cksum;
35058687 107 struct hash_desc desc;
60c74f81 108 struct scatterlist sg;
2216d449 109 int status;
a55370a3
N
110
111 dprintk("NFSD: nfs4_make_rec_clidname for %.*s\n",
112 clname->len, clname->data);
35058687
HX
113 desc.flags = CRYPTO_TFM_REQ_MAY_SLEEP;
114 desc.tfm = crypto_alloc_hash("md5", 0, CRYPTO_ALG_ASYNC);
2216d449
JL
115 if (IS_ERR(desc.tfm)) {
116 status = PTR_ERR(desc.tfm);
35058687 117 goto out_no_tfm;
2216d449
JL
118 }
119
35058687 120 cksum.len = crypto_hash_digestsize(desc.tfm);
a55370a3 121 cksum.data = kmalloc(cksum.len, GFP_KERNEL);
2216d449
JL
122 if (cksum.data == NULL) {
123 status = -ENOMEM;
a55370a3 124 goto out;
2216d449 125 }
a55370a3 126
60c74f81 127 sg_init_one(&sg, clname->data, clname->len);
a55370a3 128
2216d449
JL
129 status = crypto_hash_digest(&desc, &sg, sg.length, cksum.data);
130 if (status)
35058687 131 goto out;
a55370a3
N
132
133 md5_to_hex(dname, cksum.data);
134
2216d449 135 status = 0;
a55370a3 136out:
2bd9e7b6 137 kfree(cksum.data);
35058687
HX
138 crypto_free_hash(desc.tfm);
139out_no_tfm:
a55370a3
N
140 return status;
141}
190e4fbf 142
2216d449
JL
143/*
144 * If we had an error generating the recdir name for the legacy tracker
145 * then warn the admin. If the error doesn't appear to be transient,
146 * then disable recovery tracking.
147 */
148static void
7255e716 149legacy_recdir_name_error(struct nfs4_client *clp, int error)
2216d449
JL
150{
151 printk(KERN_ERR "NFSD: unable to generate recoverydir "
152 "name (%d).\n", error);
153
154 /*
155 * if the algorithm just doesn't exist, then disable the recovery
156 * tracker altogether. The crypto libs will generally return this if
157 * FIPS is enabled as well.
158 */
159 if (error == -ENOENT) {
160 printk(KERN_ERR "NFSD: disabling legacy clientid tracking. "
161 "Reboot recovery will not function correctly!\n");
7255e716 162 nfsd4_client_tracking_exit(clp->net);
2216d449
JL
163 }
164}
165
2a4317c5
JL
166static void
167nfsd4_create_clid_dir(struct nfs4_client *clp)
c7b9a459 168{
d84f4f99 169 const struct cred *original_cred;
2216d449 170 char dname[HEXDIR_LEN];
e970a573 171 struct dentry *dir, *dentry;
0ce0c2b5 172 struct nfs4_client_reclaim *crp;
c7b9a459 173 int status;
52e19c09 174 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
c7b9a459 175
a52d726b 176 if (test_and_set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
7a6ef8c7 177 return;
3a073369 178 if (!nn->rec_file)
7a6ef8c7 179 return;
2216d449
JL
180
181 status = nfs4_make_rec_clidname(dname, &clp->cl_name);
182 if (status)
7255e716 183 return legacy_recdir_name_error(clp, status);
2216d449 184
d84f4f99
DH
185 status = nfs4_save_creds(&original_cred);
186 if (status < 0)
7a6ef8c7 187 return;
c7b9a459 188
3a073369 189 status = mnt_want_write_file(nn->rec_file);
4a55c101 190 if (status)
c2236f14 191 goto out_creds;
4a55c101 192
3a073369 193 dir = nn->rec_file->f_path.dentry;
c7b9a459 194 /* lock the parent */
5955102c 195 inode_lock(d_inode(dir));
c7b9a459 196
e970a573 197 dentry = lookup_one_len(dname, dir, HEXDIR_LEN-1);
c7b9a459
N
198 if (IS_ERR(dentry)) {
199 status = PTR_ERR(dentry);
200 goto out_unlock;
201 }
2b0143b5 202 if (d_really_is_positive(dentry))
aec39680
BF
203 /*
204 * In the 4.1 case, where we're called from
205 * reclaim_complete(), records from the previous reboot
206 * may still be left, so this is OK.
207 *
208 * In the 4.0 case, we should never get here; but we may
209 * as well be forgiving and just succeed silently.
210 */
c7b9a459 211 goto out_put;
2b0143b5 212 status = vfs_mkdir(d_inode(dir), dentry, S_IRWXU);
c7b9a459
N
213out_put:
214 dput(dentry);
215out_unlock:
5955102c 216 inode_unlock(d_inode(dir));
0ce0c2b5 217 if (status == 0) {
f141f79d 218 if (nn->in_grace) {
52e19c09 219 crp = nfs4_client_to_reclaim(dname, nn);
0ce0c2b5
JL
220 if (crp)
221 crp->cr_clp = clp;
222 }
3a073369 223 vfs_fsync(nn->rec_file, 0);
0ce0c2b5 224 } else {
6577aac0
BH
225 printk(KERN_ERR "NFSD: failed to write recovery record"
226 " (err %d); please check that %s exists"
227 " and is writeable", status,
228 user_recovery_dirname);
0ce0c2b5 229 }
3a073369 230 mnt_drop_write_file(nn->rec_file);
c2236f14 231out_creds:
d84f4f99 232 nfs4_reset_creds(original_cred);
c7b9a459
N
233}
234
/*
 * Callback applied by nfsd4_list_rec_dir() to each entry it looks up in
 * the recovery directory: (parent dentry, child dentry, per-net state).
 */
typedef int (recdir_func)(struct dentry *, struct dentry *, struct nfsd_net *);
190e4fbf 236
05f4f678
BF
237struct name_list {
238 char name[HEXDIR_LEN];
190e4fbf
N
239 struct list_head list;
240};
241
bb6f619b
AV
242struct nfs4_dir_ctx {
243 struct dir_context ctx;
244 struct list_head names;
245};
246
190e4fbf 247static int
ac7576f4 248nfsd4_build_namelist(struct dir_context *__ctx, const char *name, int namlen,
afefdbb2 249 loff_t offset, u64 ino, unsigned int d_type)
190e4fbf 250{
ac7576f4
MS
251 struct nfs4_dir_ctx *ctx =
252 container_of(__ctx, struct nfs4_dir_ctx, ctx);
05f4f678 253 struct name_list *entry;
190e4fbf 254
05f4f678 255 if (namlen != HEXDIR_LEN - 1)
b37ad28b 256 return 0;
05f4f678
BF
257 entry = kmalloc(sizeof(struct name_list), GFP_KERNEL);
258 if (entry == NULL)
190e4fbf 259 return -ENOMEM;
05f4f678
BF
260 memcpy(entry->name, name, HEXDIR_LEN - 1);
261 entry->name[HEXDIR_LEN - 1] = '\0';
bb6f619b 262 list_add(&entry->list, &ctx->names);
190e4fbf
N
263 return 0;
264}
265
266static int
52e19c09 267nfsd4_list_rec_dir(recdir_func *f, struct nfsd_net *nn)
190e4fbf 268{
d84f4f99 269 const struct cred *original_cred;
3a073369 270 struct dentry *dir = nn->rec_file->f_path.dentry;
ac6614b7
AV
271 struct nfs4_dir_ctx ctx = {
272 .ctx.actor = nfsd4_build_namelist,
273 .names = LIST_HEAD_INIT(ctx.names)
274 };
4691b271 275 struct name_list *entry, *tmp;
190e4fbf
N
276 int status;
277
d84f4f99
DH
278 status = nfs4_save_creds(&original_cred);
279 if (status < 0)
280 return status;
190e4fbf 281
3a073369 282 status = vfs_llseek(nn->rec_file, 0, SEEK_SET);
5b4b299c
AV
283 if (status < 0) {
284 nfs4_reset_creds(original_cred);
285 return status;
286 }
287
5c0ba4e0 288 status = iterate_dir(nn->rec_file, &ctx.ctx);
5955102c 289 inode_lock_nested(d_inode(dir), I_MUTEX_PARENT);
4691b271
KM
290
291 list_for_each_entry_safe(entry, tmp, &ctx.names, list) {
5b4b299c
AV
292 if (!status) {
293 struct dentry *dentry;
294 dentry = lookup_one_len(entry->name, dir, HEXDIR_LEN-1);
295 if (IS_ERR(dentry)) {
296 status = PTR_ERR(dentry);
297 break;
298 }
52e19c09 299 status = f(dir, dentry, nn);
5b4b299c 300 dput(dentry);
05f4f678 301 }
05f4f678
BF
302 list_del(&entry->list);
303 kfree(entry);
190e4fbf 304 }
5955102c 305 inode_unlock(d_inode(dir));
d84f4f99 306 nfs4_reset_creds(original_cred);
4691b271
KM
307
308 list_for_each_entry_safe(entry, tmp, &ctx.names, list) {
309 dprintk("NFSD: %s. Left entry %s\n", __func__, entry->name);
310 list_del(&entry->list);
311 kfree(entry);
312 }
190e4fbf
N
313 return status;
314}
315
c7b9a459 316static int
3a073369 317nfsd4_unlink_clid_dir(char *name, int namlen, struct nfsd_net *nn)
c7b9a459 318{
e970a573 319 struct dentry *dir, *dentry;
c7b9a459
N
320 int status;
321
322 dprintk("NFSD: nfsd4_unlink_clid_dir. name %.*s\n", namlen, name);
323
3a073369 324 dir = nn->rec_file->f_path.dentry;
5955102c 325 inode_lock_nested(d_inode(dir), I_MUTEX_PARENT);
e970a573 326 dentry = lookup_one_len(name, dir, namlen);
c7b9a459
N
327 if (IS_ERR(dentry)) {
328 status = PTR_ERR(dentry);
2f9092e1 329 goto out_unlock;
c7b9a459
N
330 }
331 status = -ENOENT;
2b0143b5 332 if (d_really_is_negative(dentry))
c7b9a459 333 goto out;
2b0143b5 334 status = vfs_rmdir(d_inode(dir), dentry);
c7b9a459
N
335out:
336 dput(dentry);
2f9092e1 337out_unlock:
5955102c 338 inode_unlock(d_inode(dir));
c7b9a459
N
339 return status;
340}
341
2a4317c5 342static void
c7b9a459
N
343nfsd4_remove_clid_dir(struct nfs4_client *clp)
344{
d84f4f99 345 const struct cred *original_cred;
0ce0c2b5 346 struct nfs4_client_reclaim *crp;
2216d449 347 char dname[HEXDIR_LEN];
c7b9a459 348 int status;
52e19c09 349 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
c7b9a459 350
3a073369 351 if (!nn->rec_file || !test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
c7b9a459
N
352 return;
353
2216d449
JL
354 status = nfs4_make_rec_clidname(dname, &clp->cl_name);
355 if (status)
7255e716 356 return legacy_recdir_name_error(clp, status);
2216d449 357
3a073369 358 status = mnt_want_write_file(nn->rec_file);
0622753b
DH
359 if (status)
360 goto out;
a52d726b 361 clear_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
d84f4f99
DH
362
363 status = nfs4_save_creds(&original_cred);
364 if (status < 0)
698d8d87 365 goto out_drop_write;
d84f4f99 366
3a073369 367 status = nfsd4_unlink_clid_dir(dname, HEXDIR_LEN-1, nn);
d84f4f99 368 nfs4_reset_creds(original_cred);
0ce0c2b5 369 if (status == 0) {
3a073369 370 vfs_fsync(nn->rec_file, 0);
f141f79d 371 if (nn->in_grace) {
0ce0c2b5 372 /* remove reclaim record */
52e19c09 373 crp = nfsd4_find_reclaim_client(dname, nn);
0ce0c2b5 374 if (crp)
52e19c09 375 nfs4_remove_reclaim_record(crp, nn);
0ce0c2b5
JL
376 }
377 }
698d8d87 378out_drop_write:
3a073369 379 mnt_drop_write_file(nn->rec_file);
0622753b 380out:
c7b9a459
N
381 if (status)
382 printk("NFSD: Failed to remove expired client state directory"
2216d449 383 " %.*s\n", HEXDIR_LEN, dname);
c7b9a459
N
384}
385
386static int
52e19c09 387purge_old(struct dentry *parent, struct dentry *child, struct nfsd_net *nn)
c7b9a459
N
388{
389 int status;
390
52e19c09 391 if (nfs4_has_reclaimed_state(child->d_name.name, nn))
b37ad28b 392 return 0;
c7b9a459 393
2b0143b5 394 status = vfs_rmdir(d_inode(parent), child);
c7b9a459 395 if (status)
a6a9f18f
AV
396 printk("failed to remove client recovery directory %pd\n",
397 child);
c7b9a459 398 /* Keep trying, success or failure: */
b37ad28b 399 return 0;
c7b9a459
N
400}
401
2a4317c5 402static void
919b8049 403nfsd4_recdir_purge_old(struct nfsd_net *nn)
2a4317c5 404{
c7b9a459
N
405 int status;
406
f141f79d 407 nn->in_grace = false;
3a073369 408 if (!nn->rec_file)
c7b9a459 409 return;
3a073369 410 status = mnt_want_write_file(nn->rec_file);
0622753b
DH
411 if (status)
412 goto out;
52e19c09 413 status = nfsd4_list_rec_dir(purge_old, nn);
c7b9a459 414 if (status == 0)
3a073369
SK
415 vfs_fsync(nn->rec_file, 0);
416 mnt_drop_write_file(nn->rec_file);
0622753b 417out:
52e19c09 418 nfs4_release_reclaim(nn);
c7b9a459
N
419 if (status)
420 printk("nfsd4: failed to purge old clients from recovery"
a6a9f18f 421 " directory %pD\n", nn->rec_file);
c7b9a459
N
422}
423
190e4fbf 424static int
52e19c09 425load_recdir(struct dentry *parent, struct dentry *child, struct nfsd_net *nn)
190e4fbf
N
426{
427 if (child->d_name.len != HEXDIR_LEN - 1) {
a6a9f18f
AV
428 printk("nfsd4: illegal name %pd in recovery directory\n",
429 child);
190e4fbf 430 /* Keep trying; maybe the others are OK: */
b37ad28b 431 return 0;
190e4fbf 432 }
52e19c09 433 nfs4_client_to_reclaim(child->d_name.name, nn);
b37ad28b 434 return 0;
190e4fbf
N
435}
436
2a4317c5 437static int
52e19c09 438nfsd4_recdir_load(struct net *net) {
190e4fbf 439 int status;
52e19c09 440 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
190e4fbf 441
3a073369 442 if (!nn->rec_file)
e970a573
CH
443 return 0;
444
52e19c09 445 status = nfsd4_list_rec_dir(load_recdir, nn);
190e4fbf
N
446 if (status)
447 printk("nfsd4: failed loading clients from recovery"
a6a9f18f 448 " directory %pD\n", nn->rec_file);
190e4fbf
N
449 return status;
450}
451
452/*
453 * Hold reference to the recovery directory.
454 */
455
2a4317c5 456static int
3a073369 457nfsd4_init_recdir(struct net *net)
190e4fbf 458{
3a073369 459 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
d84f4f99
DH
460 const struct cred *original_cred;
461 int status;
190e4fbf
N
462
463 printk("NFSD: Using %s as the NFSv4 state recovery directory\n",
48483bf2 464 user_recovery_dirname);
190e4fbf 465
3a073369 466 BUG_ON(nn->rec_file);
190e4fbf 467
d84f4f99
DH
468 status = nfs4_save_creds(&original_cred);
469 if (status < 0) {
470 printk("NFSD: Unable to change credentials to find recovery"
471 " directory: error %d\n",
472 status);
2a4317c5 473 return status;
d84f4f99 474 }
190e4fbf 475
3a073369
SK
476 nn->rec_file = filp_open(user_recovery_dirname, O_RDONLY | O_DIRECTORY, 0);
477 if (IS_ERR(nn->rec_file)) {
c2642ab0 478 printk("NFSD: unable to find recovery directory %s\n",
48483bf2 479 user_recovery_dirname);
3a073369
SK
480 status = PTR_ERR(nn->rec_file);
481 nn->rec_file = NULL;
e970a573 482 }
190e4fbf 483
d84f4f99 484 nfs4_reset_creds(original_cred);
0ce0c2b5 485 if (!status)
f141f79d 486 nn->in_grace = true;
2a4317c5 487 return status;
190e4fbf
N
488}
489
15d176c1
KM
490static void
491nfsd4_shutdown_recdir(struct net *net)
492{
493 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
494
495 if (!nn->rec_file)
496 return;
497 fput(nn->rec_file);
498 nn->rec_file = NULL;
499}
52e19c09
SK
500
501static int
502nfs4_legacy_state_init(struct net *net)
503{
504 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
505 int i;
506
507 nn->reclaim_str_hashtbl = kmalloc(sizeof(struct list_head) *
508 CLIENT_HASH_SIZE, GFP_KERNEL);
509 if (!nn->reclaim_str_hashtbl)
510 return -ENOMEM;
511
512 for (i = 0; i < CLIENT_HASH_SIZE; i++)
513 INIT_LIST_HEAD(&nn->reclaim_str_hashtbl[i]);
514 nn->reclaim_str_hashtbl_size = 0;
515
516 return 0;
517}
518
519static void
520nfs4_legacy_state_shutdown(struct net *net)
521{
522 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
523
524 kfree(nn->reclaim_str_hashtbl);
525}
526
2a4317c5
JL
/*
 * Open the recovery directory for @net and load its contents.  If the
 * load fails the directory is closed again.
 *
 * Returns 0 on success or the error from either step.
 */
static int
nfsd4_load_reboot_recovery_data(struct net *net)
{
	int err = nfsd4_init_recdir(net);

	if (err)
		return err;

	err = nfsd4_recdir_load(net);
	if (err)
		nfsd4_shutdown_recdir(net);

	return err;
}
542
543static int
544nfsd4_legacy_tracking_init(struct net *net)
545{
546 int status;
547
cc27e0d4
JL
548 /* XXX: The legacy code won't work in a container */
549 if (net != &init_net) {
46cc8ba3 550 pr_warn("NFSD: attempt to initialize legacy client tracking in a container ignored.\n");
cc27e0d4
JL
551 return -EINVAL;
552 }
553
52e19c09 554 status = nfs4_legacy_state_init(net);
2a4317c5 555 if (status)
52e19c09
SK
556 return status;
557
558 status = nfsd4_load_reboot_recovery_data(net);
559 if (status)
560 goto err;
561 return 0;
562
563err:
564 nfs4_legacy_state_shutdown(net);
2a4317c5
JL
565 return status;
566}
567
2a4317c5
JL
568static void
569nfsd4_legacy_tracking_exit(struct net *net)
570{
52e19c09
SK
571 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
572
573 nfs4_release_reclaim(nn);
15d176c1 574 nfsd4_shutdown_recdir(net);
52e19c09 575 nfs4_legacy_state_shutdown(net);
2a4317c5
JL
576}
577
48483bf2
BF
578/*
579 * Change the NFSv4 recovery directory to recdir.
580 */
581int
582nfs4_reset_recoverydir(char *recdir)
583{
584 int status;
585 struct path path;
586
587 status = kern_path(recdir, LOOKUP_FOLLOW, &path);
588 if (status)
589 return status;
590 status = -ENOTDIR;
e36cb0b8 591 if (d_is_dir(path.dentry)) {
48483bf2
BF
592 strcpy(user_recovery_dirname, recdir);
593 status = 0;
594 }
595 path_put(&path);
596 return status;
597}
598
599char *
600nfs4_recoverydir(void)
601{
602 return user_recovery_dirname;
603}
2a4317c5
JL
604
605static int
606nfsd4_check_legacy_client(struct nfs4_client *clp)
607{
2216d449
JL
608 int status;
609 char dname[HEXDIR_LEN];
0ce0c2b5 610 struct nfs4_client_reclaim *crp;
52e19c09 611 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
0ce0c2b5 612
2a4317c5
JL
613 /* did we already find that this client is stable? */
614 if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
615 return 0;
616
2216d449
JL
617 status = nfs4_make_rec_clidname(dname, &clp->cl_name);
618 if (status) {
7255e716 619 legacy_recdir_name_error(clp, status);
2216d449
JL
620 return status;
621 }
622
2a4317c5 623 /* look for it in the reclaim hashtable otherwise */
52e19c09 624 crp = nfsd4_find_reclaim_client(dname, nn);
0ce0c2b5 625 if (crp) {
2a4317c5 626 set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
0ce0c2b5 627 crp->cr_clp = clp;
2a4317c5
JL
628 return 0;
629 }
630
631 return -ENOENT;
632}
633
7c582e4f 634static const struct nfsd4_client_tracking_ops nfsd4_legacy_tracking_ops = {
52e19c09 635 .init = nfsd4_legacy_tracking_init,
2a4317c5
JL
636 .exit = nfsd4_legacy_tracking_exit,
637 .create = nfsd4_create_clid_dir,
638 .remove = nfsd4_remove_clid_dir,
639 .check = nfsd4_check_legacy_client,
640 .grace_done = nfsd4_recdir_purge_old,
641};
642
f3f80148
JL
/* Globals */

/* rpc_pipefs directory and pipe name used by nfsd4_cld_register_sb() */
#define NFSD_PIPE_DIR		"nfsd"
#define NFSD_CLD_PIPE		"cld"
646
647/* per-net-ns structure for holding cld upcall info */
648struct cld_net {
649 struct rpc_pipe *cn_pipe;
650 spinlock_t cn_lock;
651 struct list_head cn_list;
652 unsigned int cn_xid;
653};
654
655struct cld_upcall {
656 struct list_head cu_list;
657 struct cld_net *cu_net;
658 struct task_struct *cu_task;
659 struct cld_msg cu_msg;
660};
661
662static int
663__cld_pipe_upcall(struct rpc_pipe *pipe, struct cld_msg *cmsg)
664{
665 int ret;
666 struct rpc_pipe_msg msg;
667
668 memset(&msg, 0, sizeof(msg));
669 msg.data = cmsg;
670 msg.len = sizeof(*cmsg);
671
672 /*
673 * Set task state before we queue the upcall. That prevents
674 * wake_up_process in the downcall from racing with schedule.
675 */
676 set_current_state(TASK_UNINTERRUPTIBLE);
677 ret = rpc_queue_upcall(pipe, &msg);
678 if (ret < 0) {
679 set_current_state(TASK_RUNNING);
680 goto out;
681 }
682
683 schedule();
f3f80148
JL
684
685 if (msg.errno < 0)
686 ret = msg.errno;
687out:
688 return ret;
689}
690
691static int
692cld_pipe_upcall(struct rpc_pipe *pipe, struct cld_msg *cmsg)
693{
694 int ret;
695
696 /*
697 * -EAGAIN occurs when pipe is closed and reopened while there are
698 * upcalls queued.
699 */
700 do {
701 ret = __cld_pipe_upcall(pipe, cmsg);
702 } while (ret == -EAGAIN);
703
704 return ret;
705}
706
707static ssize_t
708cld_pipe_downcall(struct file *filp, const char __user *src, size_t mlen)
709{
710 struct cld_upcall *tmp, *cup;
bc1b542b 711 struct cld_msg __user *cmsg = (struct cld_msg __user *)src;
f3f80148 712 uint32_t xid;
ef8a1a10 713 struct nfsd_net *nn = net_generic(file_inode(filp)->i_sb->s_fs_info,
f3f80148
JL
714 nfsd_net_id);
715 struct cld_net *cn = nn->cld_net;
716
717 if (mlen != sizeof(*cmsg)) {
8a7dc4b0 718 dprintk("%s: got %zu bytes, expected %zu\n", __func__, mlen,
f3f80148
JL
719 sizeof(*cmsg));
720 return -EINVAL;
721 }
722
723 /* copy just the xid so we can try to find that */
724 if (copy_from_user(&xid, &cmsg->cm_xid, sizeof(xid)) != 0) {
725 dprintk("%s: error when copying xid from userspace", __func__);
726 return -EFAULT;
727 }
728
729 /* walk the list and find corresponding xid */
730 cup = NULL;
731 spin_lock(&cn->cn_lock);
732 list_for_each_entry(tmp, &cn->cn_list, cu_list) {
733 if (get_unaligned(&tmp->cu_msg.cm_xid) == xid) {
734 cup = tmp;
735 list_del_init(&cup->cu_list);
736 break;
737 }
738 }
739 spin_unlock(&cn->cn_lock);
740
741 /* couldn't find upcall? */
742 if (!cup) {
21f72c9f 743 dprintk("%s: couldn't find upcall -- xid=%u\n", __func__, xid);
f3f80148
JL
744 return -EINVAL;
745 }
746
747 if (copy_from_user(&cup->cu_msg, src, mlen) != 0)
748 return -EFAULT;
749
750 wake_up_process(cup->cu_task);
751 return mlen;
752}
753
754static void
755cld_pipe_destroy_msg(struct rpc_pipe_msg *msg)
756{
757 struct cld_msg *cmsg = msg->data;
758 struct cld_upcall *cup = container_of(cmsg, struct cld_upcall,
759 cu_msg);
760
761 /* errno >= 0 means we got a downcall */
762 if (msg->errno >= 0)
763 return;
764
765 wake_up_process(cup->cu_task);
766}
767
768static const struct rpc_pipe_ops cld_upcall_ops = {
769 .upcall = rpc_pipe_generic_upcall,
770 .downcall = cld_pipe_downcall,
771 .destroy_msg = cld_pipe_destroy_msg,
772};
773
774static struct dentry *
775nfsd4_cld_register_sb(struct super_block *sb, struct rpc_pipe *pipe)
776{
777 struct dentry *dir, *dentry;
778
779 dir = rpc_d_lookup_sb(sb, NFSD_PIPE_DIR);
780 if (dir == NULL)
781 return ERR_PTR(-ENOENT);
782 dentry = rpc_mkpipe_dentry(dir, NFSD_CLD_PIPE, NULL, pipe);
783 dput(dir);
784 return dentry;
785}
786
787static void
788nfsd4_cld_unregister_sb(struct rpc_pipe *pipe)
789{
790 if (pipe->dentry)
791 rpc_unlink(pipe->dentry);
792}
793
794static struct dentry *
795nfsd4_cld_register_net(struct net *net, struct rpc_pipe *pipe)
796{
797 struct super_block *sb;
798 struct dentry *dentry;
799
800 sb = rpc_get_sb_net(net);
801 if (!sb)
802 return NULL;
803 dentry = nfsd4_cld_register_sb(sb, pipe);
804 rpc_put_sb_net(net);
805 return dentry;
806}
807
/*
 * Unregister @pipe from rpc_pipefs, provided rpc_get_sb_net() yields a
 * superblock for @net.
 */
static void
nfsd4_cld_unregister_net(struct net *net, struct rpc_pipe *pipe)
{
	struct super_block *sb = rpc_get_sb_net(net);

	if (!sb)
		return;

	nfsd4_cld_unregister_sb(pipe);
	rpc_put_sb_net(net);
}
819
820/* Initialize rpc_pipefs pipe for communication with client tracking daemon */
821static int
822nfsd4_init_cld_pipe(struct net *net)
823{
824 int ret;
825 struct dentry *dentry;
826 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
827 struct cld_net *cn;
828
829 if (nn->cld_net)
830 return 0;
831
832 cn = kzalloc(sizeof(*cn), GFP_KERNEL);
833 if (!cn) {
834 ret = -ENOMEM;
835 goto err;
836 }
837
838 cn->cn_pipe = rpc_mkpipe_data(&cld_upcall_ops, RPC_PIPE_WAIT_FOR_OPEN);
839 if (IS_ERR(cn->cn_pipe)) {
840 ret = PTR_ERR(cn->cn_pipe);
841 goto err;
842 }
843 spin_lock_init(&cn->cn_lock);
844 INIT_LIST_HEAD(&cn->cn_list);
845
846 dentry = nfsd4_cld_register_net(net, cn->cn_pipe);
847 if (IS_ERR(dentry)) {
848 ret = PTR_ERR(dentry);
849 goto err_destroy_data;
850 }
851
852 cn->cn_pipe->dentry = dentry;
853 nn->cld_net = cn;
854 return 0;
855
856err_destroy_data:
857 rpc_destroy_pipe_data(cn->cn_pipe);
858err:
859 kfree(cn);
860 printk(KERN_ERR "NFSD: unable to create nfsdcld upcall pipe (%d)\n",
861 ret);
862 return ret;
863}
864
865static void
866nfsd4_remove_cld_pipe(struct net *net)
867{
868 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
869 struct cld_net *cn = nn->cld_net;
870
871 nfsd4_cld_unregister_net(net, cn->cn_pipe);
872 rpc_destroy_pipe_data(cn->cn_pipe);
873 kfree(nn->cld_net);
874 nn->cld_net = NULL;
875}
876
877static struct cld_upcall *
878alloc_cld_upcall(struct cld_net *cn)
879{
880 struct cld_upcall *new, *tmp;
881
882 new = kzalloc(sizeof(*new), GFP_KERNEL);
883 if (!new)
884 return new;
885
886 /* FIXME: hard cap on number in flight? */
887restart_search:
888 spin_lock(&cn->cn_lock);
889 list_for_each_entry(tmp, &cn->cn_list, cu_list) {
890 if (tmp->cu_msg.cm_xid == cn->cn_xid) {
891 cn->cn_xid++;
892 spin_unlock(&cn->cn_lock);
893 goto restart_search;
894 }
895 }
896 new->cu_task = current;
897 new->cu_msg.cm_vers = CLD_UPCALL_VERSION;
898 put_unaligned(cn->cn_xid++, &new->cu_msg.cm_xid);
899 new->cu_net = cn;
900 list_add(&new->cu_list, &cn->cn_list);
901 spin_unlock(&cn->cn_lock);
902
903 dprintk("%s: allocated xid %u\n", __func__, new->cu_msg.cm_xid);
904
905 return new;
906}
907
908static void
909free_cld_upcall(struct cld_upcall *victim)
910{
911 struct cld_net *cn = victim->cu_net;
912
913 spin_lock(&cn->cn_lock);
914 list_del(&victim->cu_list);
915 spin_unlock(&cn->cn_lock);
916 kfree(victim);
917}
918
919/* Ask daemon to create a new record */
920static void
921nfsd4_cld_create(struct nfs4_client *clp)
922{
923 int ret;
924 struct cld_upcall *cup;
c212cecf 925 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
f3f80148
JL
926 struct cld_net *cn = nn->cld_net;
927
928 /* Don't upcall if it's already stored */
929 if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
930 return;
931
932 cup = alloc_cld_upcall(cn);
933 if (!cup) {
934 ret = -ENOMEM;
935 goto out_err;
936 }
937
938 cup->cu_msg.cm_cmd = Cld_Create;
939 cup->cu_msg.cm_u.cm_name.cn_len = clp->cl_name.len;
940 memcpy(cup->cu_msg.cm_u.cm_name.cn_id, clp->cl_name.data,
941 clp->cl_name.len);
942
943 ret = cld_pipe_upcall(cn->cn_pipe, &cup->cu_msg);
944 if (!ret) {
945 ret = cup->cu_msg.cm_status;
946 set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
947 }
948
949 free_cld_upcall(cup);
950out_err:
951 if (ret)
952 printk(KERN_ERR "NFSD: Unable to create client "
953 "record on stable storage: %d\n", ret);
954}
955
956/* Ask daemon to create a new record */
957static void
958nfsd4_cld_remove(struct nfs4_client *clp)
959{
960 int ret;
961 struct cld_upcall *cup;
c212cecf 962 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
f3f80148
JL
963 struct cld_net *cn = nn->cld_net;
964
965 /* Don't upcall if it's already removed */
966 if (!test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
967 return;
968
969 cup = alloc_cld_upcall(cn);
970 if (!cup) {
971 ret = -ENOMEM;
972 goto out_err;
973 }
974
975 cup->cu_msg.cm_cmd = Cld_Remove;
976 cup->cu_msg.cm_u.cm_name.cn_len = clp->cl_name.len;
977 memcpy(cup->cu_msg.cm_u.cm_name.cn_id, clp->cl_name.data,
978 clp->cl_name.len);
979
980 ret = cld_pipe_upcall(cn->cn_pipe, &cup->cu_msg);
981 if (!ret) {
982 ret = cup->cu_msg.cm_status;
983 clear_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
984 }
985
986 free_cld_upcall(cup);
987out_err:
988 if (ret)
989 printk(KERN_ERR "NFSD: Unable to remove client "
990 "record from stable storage: %d\n", ret);
991}
992
993/* Check for presence of a record, and update its timestamp */
994static int
995nfsd4_cld_check(struct nfs4_client *clp)
996{
997 int ret;
998 struct cld_upcall *cup;
c212cecf 999 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
f3f80148
JL
1000 struct cld_net *cn = nn->cld_net;
1001
1002 /* Don't upcall if one was already stored during this grace pd */
1003 if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
1004 return 0;
1005
1006 cup = alloc_cld_upcall(cn);
1007 if (!cup) {
1008 printk(KERN_ERR "NFSD: Unable to check client record on "
1009 "stable storage: %d\n", -ENOMEM);
1010 return -ENOMEM;
1011 }
1012
1013 cup->cu_msg.cm_cmd = Cld_Check;
1014 cup->cu_msg.cm_u.cm_name.cn_len = clp->cl_name.len;
1015 memcpy(cup->cu_msg.cm_u.cm_name.cn_id, clp->cl_name.data,
1016 clp->cl_name.len);
1017
1018 ret = cld_pipe_upcall(cn->cn_pipe, &cup->cu_msg);
1019 if (!ret) {
1020 ret = cup->cu_msg.cm_status;
1021 set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
1022 }
1023
1024 free_cld_upcall(cup);
1025 return ret;
1026}
1027
1028static void
919b8049 1029nfsd4_cld_grace_done(struct nfsd_net *nn)
f3f80148
JL
1030{
1031 int ret;
1032 struct cld_upcall *cup;
f3f80148
JL
1033 struct cld_net *cn = nn->cld_net;
1034
1035 cup = alloc_cld_upcall(cn);
1036 if (!cup) {
1037 ret = -ENOMEM;
1038 goto out_err;
1039 }
1040
1041 cup->cu_msg.cm_cmd = Cld_GraceDone;
919b8049 1042 cup->cu_msg.cm_u.cm_gracetime = (int64_t)nn->boot_time;
f3f80148
JL
1043 ret = cld_pipe_upcall(cn->cn_pipe, &cup->cu_msg);
1044 if (!ret)
1045 ret = cup->cu_msg.cm_status;
1046
1047 free_cld_upcall(cup);
1048out_err:
1049 if (ret)
1050 printk(KERN_ERR "NFSD: Unable to end grace period: %d\n", ret);
1051}
1052
7c582e4f 1053static const struct nfsd4_client_tracking_ops nfsd4_cld_tracking_ops = {
f3f80148
JL
1054 .init = nfsd4_init_cld_pipe,
1055 .exit = nfsd4_remove_cld_pipe,
1056 .create = nfsd4_cld_create,
1057 .remove = nfsd4_cld_remove,
1058 .check = nfsd4_cld_check,
1059 .grace_done = nfsd4_cld_grace_done,
1060};
1061
2873d214
JL
1062/* upcall via usermodehelper */
1063static char cltrack_prog[PATH_MAX] = "/sbin/nfsdcltrack";
1064module_param_string(cltrack_prog, cltrack_prog, sizeof(cltrack_prog),
1065 S_IRUGO|S_IWUSR);
1066MODULE_PARM_DESC(cltrack_prog, "Path to the nfsdcltrack upcall program");
1067
f3aa7e24
JL
1068static bool cltrack_legacy_disable;
1069module_param(cltrack_legacy_disable, bool, S_IRUGO|S_IWUSR);
1070MODULE_PARM_DESC(cltrack_legacy_disable,
1071 "Disable legacy recoverydir conversion. Default: false");
1072
1073#define LEGACY_TOPDIR_ENV_PREFIX "NFSDCLTRACK_LEGACY_TOPDIR="
1074#define LEGACY_RECDIR_ENV_PREFIX "NFSDCLTRACK_LEGACY_RECDIR="
d4318acd
JL
1075#define HAS_SESSION_ENV_PREFIX "NFSDCLTRACK_CLIENT_HAS_SESSION="
1076#define GRACE_START_ENV_PREFIX "NFSDCLTRACK_GRACE_START="
f3aa7e24
JL
1077
1078static char *
1079nfsd4_cltrack_legacy_topdir(void)
1080{
1081 int copied;
1082 size_t len;
1083 char *result;
1084
1085 if (cltrack_legacy_disable)
1086 return NULL;
1087
1088 len = strlen(LEGACY_TOPDIR_ENV_PREFIX) +
1089 strlen(nfs4_recoverydir()) + 1;
1090
1091 result = kmalloc(len, GFP_KERNEL);
1092 if (!result)
1093 return result;
1094
1095 copied = snprintf(result, len, LEGACY_TOPDIR_ENV_PREFIX "%s",
1096 nfs4_recoverydir());
1097 if (copied >= len) {
1098 /* just return nothing if output was truncated */
1099 kfree(result);
1100 return NULL;
1101 }
1102
1103 return result;
1104}
1105
1106static char *
2216d449 1107nfsd4_cltrack_legacy_recdir(const struct xdr_netobj *name)
f3aa7e24
JL
1108{
1109 int copied;
1110 size_t len;
1111 char *result;
1112
1113 if (cltrack_legacy_disable)
1114 return NULL;
1115
1116 /* +1 is for '/' between "topdir" and "recdir" */
1117 len = strlen(LEGACY_RECDIR_ENV_PREFIX) +
1118 strlen(nfs4_recoverydir()) + 1 + HEXDIR_LEN;
1119
1120 result = kmalloc(len, GFP_KERNEL);
1121 if (!result)
1122 return result;
1123
2216d449
JL
1124 copied = snprintf(result, len, LEGACY_RECDIR_ENV_PREFIX "%s/",
1125 nfs4_recoverydir());
1126 if (copied > (len - HEXDIR_LEN)) {
1127 /* just return nothing if output will be truncated */
1128 kfree(result);
1129 return NULL;
1130 }
1131
1132 copied = nfs4_make_rec_clidname(result + copied, name);
1133 if (copied) {
f3aa7e24
JL
1134 kfree(result);
1135 return NULL;
1136 }
1137
1138 return result;
1139}
1140
d4318acd
JL
1141static char *
1142nfsd4_cltrack_client_has_session(struct nfs4_client *clp)
1143{
1144 int copied;
1145 size_t len;
1146 char *result;
1147
1148 /* prefix + Y/N character + terminating NULL */
1149 len = strlen(HAS_SESSION_ENV_PREFIX) + 1 + 1;
1150
1151 result = kmalloc(len, GFP_KERNEL);
1152 if (!result)
1153 return result;
1154
1155 copied = snprintf(result, len, HAS_SESSION_ENV_PREFIX "%c",
1156 clp->cl_minorversion ? 'Y' : 'N');
1157 if (copied >= len) {
1158 /* just return nothing if output was truncated */
1159 kfree(result);
1160 return NULL;
1161 }
1162
1163 return result;
1164}
1165
1166static char *
1167nfsd4_cltrack_grace_start(time_t grace_start)
1168{
1169 int copied;
1170 size_t len;
1171 char *result;
1172
1173 /* prefix + max width of int64_t string + terminating NULL */
1174 len = strlen(GRACE_START_ENV_PREFIX) + 22 + 1;
1175
1176 result = kmalloc(len, GFP_KERNEL);
1177 if (!result)
1178 return result;
1179
1180 copied = snprintf(result, len, GRACE_START_ENV_PREFIX "%ld",
1181 grace_start);
1182 if (copied >= len) {
1183 /* just return nothing if output was truncated */
1184 kfree(result);
1185 return NULL;
1186 }
1187
1188 return result;
1189}
1190
2873d214 1191static int
d4318acd 1192nfsd4_umh_cltrack_upcall(char *cmd, char *arg, char *env0, char *env1)
2873d214 1193{
d4318acd 1194 char *envp[3];
2873d214
JL
1195 char *argv[4];
1196 int ret;
1197
1198 if (unlikely(!cltrack_prog[0])) {
1199 dprintk("%s: cltrack_prog is disabled\n", __func__);
1200 return -EACCES;
1201 }
1202
1203 dprintk("%s: cmd: %s\n", __func__, cmd);
1204 dprintk("%s: arg: %s\n", __func__, arg ? arg : "(null)");
d4318acd
JL
1205 dprintk("%s: env0: %s\n", __func__, env0 ? env0 : "(null)");
1206 dprintk("%s: env1: %s\n", __func__, env1 ? env1 : "(null)");
f3aa7e24 1207
d4318acd
JL
1208 envp[0] = env0;
1209 envp[1] = env1;
1210 envp[2] = NULL;
2873d214
JL
1211
1212 argv[0] = (char *)cltrack_prog;
1213 argv[1] = cmd;
1214 argv[2] = arg;
1215 argv[3] = NULL;
1216
1217 ret = call_usermodehelper(argv[0], argv, envp, UMH_WAIT_PROC);
1218 /*
1219 * Disable the upcall mechanism if we're getting an ENOENT or EACCES
1220 * error. The admin can re-enable it on the fly by using sysfs
1221 * once the problem has been fixed.
1222 */
1223 if (ret == -ENOENT || ret == -EACCES) {
1224 dprintk("NFSD: %s was not found or isn't executable (%d). "
1225 "Setting cltrack_prog to blank string!",
1226 cltrack_prog, ret);
1227 cltrack_prog[0] = '\0';
1228 }
1229 dprintk("%s: %s return value: %d\n", __func__, cltrack_prog, ret);
1230
1231 return ret;
1232}
1233
1234static char *
1235bin_to_hex_dup(const unsigned char *src, int srclen)
1236{
1237 int i;
1238 char *buf, *hex;
1239
1240 /* +1 for terminating NULL */
1241 buf = kmalloc((srclen * 2) + 1, GFP_KERNEL);
1242 if (!buf)
1243 return buf;
1244
1245 hex = buf;
1246 for (i = 0; i < srclen; i++) {
1247 sprintf(hex, "%2.2x", *src++);
1248 hex += 2;
1249 }
1250 return buf;
1251}
1252
1253static int
d4318acd 1254nfsd4_umh_cltrack_init(struct net *net)
2873d214 1255{
d4318acd
JL
1256 int ret;
1257 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1258 char *grace_start = nfsd4_cltrack_grace_start(nn->boot_time);
1259
71a50306
SK
1260 /* XXX: The usermode helper s not working in container yet. */
1261 if (net != &init_net) {
46cc8ba3 1262 pr_warn("NFSD: attempt to initialize umh client tracking in a container ignored.\n");
71a50306
SK
1263 return -EINVAL;
1264 }
d4318acd
JL
1265
1266 ret = nfsd4_umh_cltrack_upcall("init", NULL, grace_start, NULL);
1267 kfree(grace_start);
1268 return ret;
2873d214
JL
1269}
1270
d682e750
JL
1271static void
1272nfsd4_cltrack_upcall_lock(struct nfs4_client *clp)
1273{
1274 wait_on_bit_lock(&clp->cl_flags, NFSD4_CLIENT_UPCALL_LOCK,
1275 TASK_UNINTERRUPTIBLE);
1276}
1277
1278static void
1279nfsd4_cltrack_upcall_unlock(struct nfs4_client *clp)
1280{
1281 smp_mb__before_atomic();
1282 clear_bit(NFSD4_CLIENT_UPCALL_LOCK, &clp->cl_flags);
1283 smp_mb__after_atomic();
1284 wake_up_bit(&clp->cl_flags, NFSD4_CLIENT_UPCALL_LOCK);
1285}
1286
2873d214
JL
1287static void
1288nfsd4_umh_cltrack_create(struct nfs4_client *clp)
1289{
d4318acd
JL
1290 char *hexid, *has_session, *grace_start;
1291 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
2873d214 1292
65decb65
JL
1293 /*
1294 * With v4.0 clients, there's little difference in outcome between a
1295 * create and check operation, and we can end up calling into this
1296 * function multiple times per client (once for each openowner). So,
1297 * for v4.0 clients skip upcalling once the client has been recorded
1298 * on stable storage.
1299 *
1300 * For v4.1+ clients, the outcome of the two operations is different,
1301 * so we must ensure that we upcall for the create operation. v4.1+
1302 * clients call this on RECLAIM_COMPLETE though, so we should only end
1303 * up doing a single create upcall per client.
1304 */
1305 if (clp->cl_minorversion == 0 &&
1306 test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
1307 return;
1308
2873d214
JL
1309 hexid = bin_to_hex_dup(clp->cl_name.data, clp->cl_name.len);
1310 if (!hexid) {
1311 dprintk("%s: can't allocate memory for upcall!\n", __func__);
1312 return;
1313 }
d682e750 1314
d4318acd
JL
1315 has_session = nfsd4_cltrack_client_has_session(clp);
1316 grace_start = nfsd4_cltrack_grace_start(nn->boot_time);
d682e750
JL
1317
1318 nfsd4_cltrack_upcall_lock(clp);
788a7914
JL
1319 if (!nfsd4_umh_cltrack_upcall("create", hexid, has_session, grace_start))
1320 set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
d682e750
JL
1321 nfsd4_cltrack_upcall_unlock(clp);
1322
d4318acd
JL
1323 kfree(has_session);
1324 kfree(grace_start);
2873d214
JL
1325 kfree(hexid);
1326}
1327
1328static void
1329nfsd4_umh_cltrack_remove(struct nfs4_client *clp)
1330{
1331 char *hexid;
1332
788a7914
JL
1333 if (!test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
1334 return;
1335
2873d214
JL
1336 hexid = bin_to_hex_dup(clp->cl_name.data, clp->cl_name.len);
1337 if (!hexid) {
1338 dprintk("%s: can't allocate memory for upcall!\n", __func__);
1339 return;
1340 }
d682e750
JL
1341
1342 nfsd4_cltrack_upcall_lock(clp);
788a7914
JL
1343 if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags) &&
1344 nfsd4_umh_cltrack_upcall("remove", hexid, NULL, NULL) == 0)
1345 clear_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
d682e750
JL
1346 nfsd4_cltrack_upcall_unlock(clp);
1347
2873d214
JL
1348 kfree(hexid);
1349}
1350
1351static int
1352nfsd4_umh_cltrack_check(struct nfs4_client *clp)
1353{
1354 int ret;
d4318acd 1355 char *hexid, *has_session, *legacy;
2873d214 1356
788a7914
JL
1357 if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags))
1358 return 0;
1359
2873d214
JL
1360 hexid = bin_to_hex_dup(clp->cl_name.data, clp->cl_name.len);
1361 if (!hexid) {
1362 dprintk("%s: can't allocate memory for upcall!\n", __func__);
1363 return -ENOMEM;
1364 }
d4318acd
JL
1365
1366 has_session = nfsd4_cltrack_client_has_session(clp);
2216d449 1367 legacy = nfsd4_cltrack_legacy_recdir(&clp->cl_name);
d682e750
JL
1368
1369 nfsd4_cltrack_upcall_lock(clp);
788a7914
JL
1370 if (test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags)) {
1371 ret = 0;
1372 } else {
1373 ret = nfsd4_umh_cltrack_upcall("check", hexid, has_session, legacy);
1374 if (ret == 0)
1375 set_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
1376 }
d682e750 1377 nfsd4_cltrack_upcall_unlock(clp);
d4318acd 1378 kfree(has_session);
f3aa7e24 1379 kfree(legacy);
2873d214 1380 kfree(hexid);
d4318acd 1381
2873d214
JL
1382 return ret;
1383}
1384
1385static void
919b8049 1386nfsd4_umh_cltrack_grace_done(struct nfsd_net *nn)
2873d214 1387{
f3aa7e24 1388 char *legacy;
2873d214
JL
1389 char timestr[22]; /* FIXME: better way to determine max size? */
1390
919b8049 1391 sprintf(timestr, "%ld", nn->boot_time);
f3aa7e24 1392 legacy = nfsd4_cltrack_legacy_topdir();
d4318acd 1393 nfsd4_umh_cltrack_upcall("gracedone", timestr, legacy, NULL);
f3aa7e24 1394 kfree(legacy);
2873d214
JL
1395}
1396
7c582e4f 1397static const struct nfsd4_client_tracking_ops nfsd4_umh_tracking_ops = {
2873d214
JL
1398 .init = nfsd4_umh_cltrack_init,
1399 .exit = NULL,
1400 .create = nfsd4_umh_cltrack_create,
1401 .remove = nfsd4_umh_cltrack_remove,
1402 .check = nfsd4_umh_cltrack_check,
1403 .grace_done = nfsd4_umh_cltrack_grace_done,
1404};
1405
2a4317c5
JL
1406int
1407nfsd4_client_tracking_init(struct net *net)
1408{
1409 int status;
f3f80148 1410 struct path path;
9a9c6478 1411 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
2a4317c5 1412
2d77bf0a 1413 /* just run the init if it the method is already decided */
9a9c6478 1414 if (nn->client_tracking_ops)
2d77bf0a
JL
1415 goto do_init;
1416
1417 /*
1418 * First, try a UMH upcall. It should succeed or fail quickly, so
1419 * there's little harm in trying that first.
1420 */
9a9c6478
SK
1421 nn->client_tracking_ops = &nfsd4_umh_tracking_ops;
1422 status = nn->client_tracking_ops->init(net);
2d77bf0a
JL
1423 if (!status)
1424 return status;
1425
1426 /*
1427 * See if the recoverydir exists and is a directory. If it is,
1428 * then use the legacy ops.
1429 */
9a9c6478 1430 nn->client_tracking_ops = &nfsd4_legacy_tracking_ops;
2d77bf0a
JL
1431 status = kern_path(nfs4_recoverydir(), LOOKUP_FOLLOW, &path);
1432 if (!status) {
e36cb0b8 1433 status = d_is_dir(path.dentry);
2d77bf0a
JL
1434 path_put(&path);
1435 if (status)
1436 goto do_init;
f3f80148 1437 }
2a4317c5 1438
2d77bf0a 1439 /* Finally, try to use nfsdcld */
9a9c6478 1440 nn->client_tracking_ops = &nfsd4_cld_tracking_ops;
8b0554e9
JL
1441 printk(KERN_WARNING "NFSD: the nfsdcld client tracking upcall will be "
1442 "removed in 3.10. Please transition to using "
1443 "nfsdcltrack.\n");
2d77bf0a 1444do_init:
9a9c6478 1445 status = nn->client_tracking_ops->init(net);
2a4317c5
JL
1446 if (status) {
1447 printk(KERN_WARNING "NFSD: Unable to initialize client "
1448 "recovery tracking! (%d)\n", status);
9a9c6478 1449 nn->client_tracking_ops = NULL;
2a4317c5
JL
1450 }
1451 return status;
1452}
1453
1454void
1455nfsd4_client_tracking_exit(struct net *net)
1456{
9a9c6478
SK
1457 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1458
1459 if (nn->client_tracking_ops) {
1460 if (nn->client_tracking_ops->exit)
1461 nn->client_tracking_ops->exit(net);
1462 nn->client_tracking_ops = NULL;
2a4317c5
JL
1463 }
1464}
1465
1466void
1467nfsd4_client_record_create(struct nfs4_client *clp)
1468{
9a9c6478
SK
1469 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
1470
1471 if (nn->client_tracking_ops)
1472 nn->client_tracking_ops->create(clp);
2a4317c5
JL
1473}
1474
1475void
1476nfsd4_client_record_remove(struct nfs4_client *clp)
1477{
9a9c6478
SK
1478 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
1479
1480 if (nn->client_tracking_ops)
1481 nn->client_tracking_ops->remove(clp);
2a4317c5
JL
1482}
1483
1484int
1485nfsd4_client_record_check(struct nfs4_client *clp)
1486{
9a9c6478
SK
1487 struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
1488
1489 if (nn->client_tracking_ops)
1490 return nn->client_tracking_ops->check(clp);
2a4317c5
JL
1491
1492 return -EOPNOTSUPP;
1493}
1494
1495void
919b8049 1496nfsd4_record_grace_done(struct nfsd_net *nn)
2a4317c5 1497{
9a9c6478 1498 if (nn->client_tracking_ops)
919b8049 1499 nn->client_tracking_ops->grace_done(nn);
2a4317c5 1500}
813fd320
JL
1501
1502static int
1503rpc_pipefs_event(struct notifier_block *nb, unsigned long event, void *ptr)
1504{
1505 struct super_block *sb = ptr;
1506 struct net *net = sb->s_fs_info;
1507 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1508 struct cld_net *cn = nn->cld_net;
1509 struct dentry *dentry;
1510 int ret = 0;
1511
1512 if (!try_module_get(THIS_MODULE))
1513 return 0;
1514
1515 if (!cn) {
1516 module_put(THIS_MODULE);
1517 return 0;
1518 }
1519
1520 switch (event) {
1521 case RPC_PIPEFS_MOUNT:
1522 dentry = nfsd4_cld_register_sb(sb, cn->cn_pipe);
1523 if (IS_ERR(dentry)) {
1524 ret = PTR_ERR(dentry);
1525 break;
1526 }
1527 cn->cn_pipe->dentry = dentry;
1528 break;
1529 case RPC_PIPEFS_UMOUNT:
1530 if (cn->cn_pipe->dentry)
1531 nfsd4_cld_unregister_sb(cn->cn_pipe);
1532 break;
1533 default:
1534 ret = -ENOTSUPP;
1535 break;
1536 }
1537 module_put(THIS_MODULE);
1538 return ret;
1539}
1540
2355c596 1541static struct notifier_block nfsd4_cld_block = {
813fd320
JL
1542 .notifier_call = rpc_pipefs_event,
1543};
797a9d79
JL
1544
1545int
1546register_cld_notifier(void)
1547{
1548 return rpc_pipefs_notifier_register(&nfsd4_cld_block);
1549}
1550
1551void
1552unregister_cld_notifier(void)
1553{
1554 rpc_pipefs_notifier_unregister(&nfsd4_cld_block);
1555}