Merge tag 'locking-core-2023-05-05' of git://git.kernel.org/pub/scm/linux/kernel...
[linux-block.git] / fs / nfs / unlink.c
CommitLineData
b2441318 1// SPDX-License-Identifier: GPL-2.0
1da177e4
LT
2/*
3 * linux/fs/nfs/unlink.c
4 *
5 * nfs sillydelete handling
6 *
1da177e4
LT
7 */
8
9#include <linux/slab.h>
10#include <linux/string.h>
11#include <linux/dcache.h>
12#include <linux/sunrpc/sched.h>
13#include <linux/sunrpc/clnt.h>
14#include <linux/nfs_fs.h>
b35e7041
LT
15#include <linux/sched.h>
16#include <linux/wait.h>
779c5179 17#include <linux/namei.h>
f7be7284 18#include <linux/fsnotify.h>
1da177e4 19
ef818a28 20#include "internal.h"
472cfbd9 21#include "nfs4_fs.h"
779c5179
JL
22#include "iostat.h"
23#include "delegation.h"
ef818a28 24
70ded201
TM
25#include "nfstrace.h"
26
1da177e4 27/**
e4eff1a6 28 * nfs_free_unlinkdata - release data from a sillydelete operation.
1da177e4
LT
29 * @data: pointer to unlink structure.
30 */
31static void
e4eff1a6 32nfs_free_unlinkdata(struct nfs_unlinkdata *data)
1da177e4 33{
a52458b4 34 put_cred(data->cred);
e4eff1a6
TM
35 kfree(data->args.name.name);
36 kfree(data);
1da177e4
LT
37}
38
1da177e4
LT
39/**
40 * nfs_async_unlink_done - Sillydelete post-processing
41 * @task: rpc_task of the sillydelete
302fad7b 42 * @calldata: pointer to nfs_unlinkdata
1da177e4
LT
43 *
44 * Do the directory attribute update.
45 */
963d8fe5 46static void nfs_async_unlink_done(struct rpc_task *task, void *calldata)
1da177e4 47{
e4eff1a6 48 struct nfs_unlinkdata *data = calldata;
884be175 49 struct inode *dir = d_inode(data->dentry->d_parent);
e4eff1a6 50
70ded201 51 trace_nfs_sillyrename_unlink(data, task->tk_status);
e4eff1a6 52 if (!NFS_PROTO(dir)->unlink_done(task, dir))
d00c5d43 53 rpc_restart_call_prepare(task);
1da177e4
LT
54}
55
56/**
57 * nfs_async_unlink_release - Release the sillydelete data.
302fad7b 58 * @calldata: struct nfs_unlinkdata to release
1da177e4
LT
59 *
60 * We need to call nfs_put_unlinkdata as a 'tk_release' task since the
61 * rpc_task would be freed too.
62 */
963d8fe5 63static void nfs_async_unlink_release(void *calldata)
1da177e4 64{
963d8fe5 65 struct nfs_unlinkdata *data = calldata;
884be175
AV
66 struct dentry *dentry = data->dentry;
67 struct super_block *sb = dentry->d_sb;
565277f6 68
884be175
AV
69 up_read_non_owner(&NFS_I(d_inode(dentry->d_parent))->rmdir_sem);
70 d_lookup_done(dentry);
e4eff1a6 71 nfs_free_unlinkdata(data);
884be175 72 dput(dentry);
322b2b90 73 nfs_sb_deactive(sb);
1da177e4
LT
74}
75
17280175 76static void nfs_unlink_prepare(struct rpc_task *task, void *calldata)
472cfbd9
AA
77{
78 struct nfs_unlinkdata *data = calldata;
884be175
AV
79 struct inode *dir = d_inode(data->dentry->d_parent);
80 NFS_PROTO(dir)->unlink_rpc_prepare(task, data);
472cfbd9 81}
472cfbd9 82
963d8fe5
TM
83static const struct rpc_call_ops nfs_unlink_ops = {
84 .rpc_call_done = nfs_async_unlink_done,
85 .rpc_release = nfs_async_unlink_release,
472cfbd9 86 .rpc_call_prepare = nfs_unlink_prepare,
963d8fe5
TM
87};
88
ed7e9ad0 89static void nfs_do_call_unlink(struct inode *inode, struct nfs_unlinkdata *data)
e4eff1a6 90{
5138fde0
TM
91 struct rpc_message msg = {
92 .rpc_argp = &data->args,
93 .rpc_resp = &data->res,
94 .rpc_cred = data->cred,
95 };
c970aa85 96 struct rpc_task_setup task_setup_data = {
5138fde0 97 .rpc_message = &msg,
c970aa85
TM
98 .callback_ops = &nfs_unlink_ops,
99 .callback_data = data,
1daef0a8 100 .workqueue = nfsiod_workqueue,
49cd3254 101 .flags = RPC_TASK_ASYNC | RPC_TASK_CRED_NOREF,
c970aa85 102 };
e4eff1a6 103 struct rpc_task *task;
884be175 104 struct inode *dir = d_inode(data->dentry->d_parent);
118f09ed
OK
105
106 if (nfs_server_capable(inode, NFS_CAP_MOVEABLE))
107 task_setup_data.flags |= RPC_TASK_MOVEABLE;
108
884be175
AV
109 nfs_sb_active(dir->i_sb);
110 data->args.fh = NFS_FH(dir);
111 nfs_fattr_init(data->res.dir_attr);
112
ed7e9ad0 113 NFS_PROTO(dir)->unlink_setup(&msg, data->dentry, inode);
884be175
AV
114
115 task_setup_data.rpc_client = NFS_CLIENT(dir);
116 task = rpc_run_task(&task_setup_data);
117 if (!IS_ERR(task))
118 rpc_put_task_async(task);
119}
120
ed7e9ad0 121static int nfs_call_unlink(struct dentry *dentry, struct inode *inode, struct nfs_unlinkdata *data)
884be175
AV
122{
123 struct inode *dir = d_inode(dentry->d_parent);
565277f6
TM
124 struct dentry *alias;
125
884be175
AV
126 down_read_non_owner(&NFS_I(dir)->rmdir_sem);
127 alias = d_alloc_parallel(dentry->d_parent, &data->args.name, &data->wq);
128 if (IS_ERR(alias)) {
129 up_read_non_owner(&NFS_I(dir)->rmdir_sem);
130 return 0;
131 }
132 if (!d_in_lookup(alias)) {
73ca1001 133 int ret;
b1942c5f 134 void *devname_garbage = NULL;
609005c3 135
565277f6
TM
136 /*
137 * Hey, we raced with lookup... See if we need to transfer
138 * the sillyrename information to the aliased dentry.
139 */
565277f6 140 spin_lock(&alias->d_lock);
884be175 141 if (d_really_is_positive(alias) &&
5776a9cd 142 !nfs_compare_fh(NFS_FH(inode), NFS_FH(d_inode(alias))) &&
609005c3 143 !(alias->d_flags & DCACHE_NFSFS_RENAMED)) {
b1942c5f 144 devname_garbage = alias->d_fsdata;
565277f6 145 alias->d_fsdata = data;
fccca7fc 146 alias->d_flags |= DCACHE_NFSFS_RENAMED;
565277f6 147 ret = 1;
73ca1001
JL
148 } else
149 ret = 0;
565277f6 150 spin_unlock(&alias->d_lock);
565277f6 151 dput(alias);
884be175 152 up_read_non_owner(&NFS_I(dir)->rmdir_sem);
b1942c5f
AV
153 /*
154 * If we'd displaced old cached devname, free it. At that
155 * point dentry is definitely not a root, so we won't need
156 * that anymore.
157 */
73ca1001 158 kfree(devname_garbage);
565277f6
TM
159 return ret;
160 }
884be175 161 data->dentry = alias;
ed7e9ad0 162 nfs_do_call_unlink(inode, data);
565277f6
TM
163 return 1;
164}
165
1da177e4
LT
166/**
167 * nfs_async_unlink - asynchronous unlinking of a file
302fad7b
TM
168 * @dentry: parent directory of dentry
169 * @name: name of dentry to unlink
1da177e4 170 */
779c5179 171static int
beffb8fe 172nfs_async_unlink(struct dentry *dentry, const struct qstr *name)
1da177e4 173{
e4eff1a6
TM
174 struct nfs_unlinkdata *data;
175 int status = -ENOMEM;
b1942c5f 176 void *devname_garbage = NULL;
1da177e4 177
bd647545 178 data = kzalloc(sizeof(*data), GFP_KERNEL);
e4eff1a6 179 if (data == NULL)
1da177e4 180 goto out;
884be175
AV
181 data->args.name.name = kstrdup(name->name, GFP_KERNEL);
182 if (!data->args.name.name)
183 goto out_free;
184 data->args.name.len = name->len;
1da177e4 185
a52458b4 186 data->cred = get_current_cred();
d346890b 187 data->res.dir_attr = &data->dir_attr;
884be175 188 init_waitqueue_head(&data->wq);
1da177e4 189
e4eff1a6 190 status = -EBUSY;
1da177e4 191 spin_lock(&dentry->d_lock);
e4eff1a6
TM
192 if (dentry->d_flags & DCACHE_NFSFS_RENAMED)
193 goto out_unlock;
1da177e4 194 dentry->d_flags |= DCACHE_NFSFS_RENAMED;
b1942c5f 195 devname_garbage = dentry->d_fsdata;
e4eff1a6 196 dentry->d_fsdata = data;
1da177e4 197 spin_unlock(&dentry->d_lock);
b1942c5f
AV
198 /*
199 * If we'd displaced old cached devname, free it. At that
200 * point dentry is definitely not a root, so we won't need
201 * that anymore.
202 */
96aa1549 203 kfree(devname_garbage);
e4eff1a6
TM
204 return 0;
205out_unlock:
206 spin_unlock(&dentry->d_lock);
a52458b4 207 put_cred(data->cred);
884be175 208 kfree(data->args.name.name);
1da177e4
LT
209out_free:
210 kfree(data);
e4eff1a6 211out:
1da177e4
LT
212 return status;
213}
214
215/**
216 * nfs_complete_unlink - Initialize completion of the sillydelete
217 * @dentry: dentry to delete
e4eff1a6 218 * @inode: inode
1da177e4
LT
219 *
220 * Since we're most likely to be called by dentry_iput(), we
221 * only use the dentry to find the sillydelete. We then copy the name
222 * into the qstr.
223 */
224void
e4eff1a6 225nfs_complete_unlink(struct dentry *dentry, struct inode *inode)
1da177e4 226{
884be175 227 struct nfs_unlinkdata *data;
1da177e4 228
1da177e4 229 spin_lock(&dentry->d_lock);
884be175
AV
230 dentry->d_flags &= ~DCACHE_NFSFS_RENAMED;
231 data = dentry->d_fsdata;
232 dentry->d_fsdata = NULL;
1da177e4 233 spin_unlock(&dentry->d_lock);
e4eff1a6 234
ed7e9ad0 235 if (NFS_STALE(inode) || !nfs_call_unlink(dentry, inode, data))
e4eff1a6 236 nfs_free_unlinkdata(data);
1da177e4 237}
779c5179 238
d3d4152a
JL
239/* Cancel a queued async unlink. Called when a sillyrename run fails. */
240static void
241nfs_cancel_async_unlink(struct dentry *dentry)
242{
243 spin_lock(&dentry->d_lock);
244 if (dentry->d_flags & DCACHE_NFSFS_RENAMED) {
245 struct nfs_unlinkdata *data = dentry->d_fsdata;
246
247 dentry->d_flags &= ~DCACHE_NFSFS_RENAMED;
b1942c5f 248 dentry->d_fsdata = NULL;
d3d4152a
JL
249 spin_unlock(&dentry->d_lock);
250 nfs_free_unlinkdata(data);
251 return;
252 }
253 spin_unlock(&dentry->d_lock);
254}
255
d3d4152a
JL
256/**
257 * nfs_async_rename_done - Sillyrename post-processing
258 * @task: rpc_task of the sillyrename
259 * @calldata: nfs_renamedata for the sillyrename
260 *
261 * Do the directory attribute updates and the d_move
262 */
263static void nfs_async_rename_done(struct rpc_task *task, void *calldata)
264{
265 struct nfs_renamedata *data = calldata;
266 struct inode *old_dir = data->old_dir;
267 struct inode *new_dir = data->new_dir;
73ca1001 268 struct dentry *old_dentry = data->old_dentry;
d3d4152a 269
70ded201
TM
270 trace_nfs_sillyrename_rename(old_dir, old_dentry,
271 new_dir, data->new_dentry, task->tk_status);
d3d4152a 272 if (!NFS_PROTO(old_dir)->rename_done(task, old_dir, new_dir)) {
d00c5d43 273 rpc_restart_call_prepare(task);
d3d4152a
JL
274 return;
275 }
276
96f9d8c0
JL
277 if (data->complete)
278 data->complete(task, data);
d3d4152a
JL
279}
280
281/**
282 * nfs_async_rename_release - Release the sillyrename data.
283 * @calldata: the struct nfs_renamedata to be released
284 */
285static void nfs_async_rename_release(void *calldata)
286{
287 struct nfs_renamedata *data = calldata;
288 struct super_block *sb = data->old_dir->i_sb;
289
2b0143b5
DH
290 if (d_really_is_positive(data->old_dentry))
291 nfs_mark_for_revalidate(d_inode(data->old_dentry));
d3d4152a 292
818a8dbe
BC
293 /* The result of the rename is unknown. Play it safe by
294 * forcing a new lookup */
295 if (data->cancelled) {
296 spin_lock(&data->old_dir->i_lock);
297 nfs_force_lookup_revalidate(data->old_dir);
298 spin_unlock(&data->old_dir->i_lock);
299 if (data->new_dir != data->old_dir) {
300 spin_lock(&data->new_dir->i_lock);
301 nfs_force_lookup_revalidate(data->new_dir);
302 spin_unlock(&data->new_dir->i_lock);
303 }
304 }
305
d3d4152a
JL
306 dput(data->old_dentry);
307 dput(data->new_dentry);
308 iput(data->old_dir);
309 iput(data->new_dir);
310 nfs_sb_deactive(sb);
a52458b4 311 put_cred(data->cred);
d3d4152a
JL
312 kfree(data);
313}
314
d3d4152a
JL
315static void nfs_rename_prepare(struct rpc_task *task, void *calldata)
316{
317 struct nfs_renamedata *data = calldata;
c6bfa1a1 318 NFS_PROTO(data->old_dir)->rename_rpc_prepare(task, data);
d3d4152a 319}
d3d4152a
JL
320
321static const struct rpc_call_ops nfs_rename_ops = {
322 .rpc_call_done = nfs_async_rename_done,
323 .rpc_release = nfs_async_rename_release,
d3d4152a 324 .rpc_call_prepare = nfs_rename_prepare,
d3d4152a
JL
325};
326
327/**
328 * nfs_async_rename - perform an asynchronous rename operation
329 * @old_dir: directory that currently holds the dentry to be renamed
330 * @new_dir: target directory for the rename
331 * @old_dentry: original dentry to be renamed
332 * @new_dentry: dentry to which the old_dentry should be renamed
302fad7b 333 * @complete: Function to run on successful completion
d3d4152a
JL
334 *
335 * It's expected that valid references to the dentries and inodes are held
336 */
0e862a40 337struct rpc_task *
d3d4152a 338nfs_async_rename(struct inode *old_dir, struct inode *new_dir,
96f9d8c0
JL
339 struct dentry *old_dentry, struct dentry *new_dentry,
340 void (*complete)(struct rpc_task *, struct nfs_renamedata *))
d3d4152a
JL
341{
342 struct nfs_renamedata *data;
343 struct rpc_message msg = { };
344 struct rpc_task_setup task_setup_data = {
345 .rpc_message = &msg,
346 .callback_ops = &nfs_rename_ops,
347 .workqueue = nfsiod_workqueue,
348 .rpc_client = NFS_CLIENT(old_dir),
49cd3254 349 .flags = RPC_TASK_ASYNC | RPC_TASK_CRED_NOREF,
d3d4152a 350 };
d3d4152a 351
118f09ed
OK
352 if (nfs_server_capable(old_dir, NFS_CAP_MOVEABLE) &&
353 nfs_server_capable(new_dir, NFS_CAP_MOVEABLE))
354 task_setup_data.flags |= RPC_TASK_MOVEABLE;
355
dfb4f309 356 data = kzalloc(sizeof(*data), GFP_KERNEL);
d3d4152a
JL
357 if (data == NULL)
358 return ERR_PTR(-ENOMEM);
88dee0cc 359 task_setup_data.task = &data->task;
1174dd1f 360 task_setup_data.callback_data = data;
d3d4152a 361
a52458b4 362 data->cred = get_current_cred();
d3d4152a
JL
363
364 msg.rpc_argp = &data->args;
365 msg.rpc_resp = &data->res;
366 msg.rpc_cred = data->cred;
367
368 /* set up nfs_renamedata */
369 data->old_dir = old_dir;
a4118ee1 370 ihold(old_dir);
d3d4152a 371 data->new_dir = new_dir;
a4118ee1 372 ihold(new_dir);
d3d4152a
JL
373 data->old_dentry = dget(old_dentry);
374 data->new_dentry = dget(new_dentry);
375 nfs_fattr_init(&data->old_fattr);
376 nfs_fattr_init(&data->new_fattr);
96f9d8c0 377 data->complete = complete;
d3d4152a
JL
378
379 /* set up nfs_renameargs */
380 data->args.old_dir = NFS_FH(old_dir);
381 data->args.old_name = &old_dentry->d_name;
382 data->args.new_dir = NFS_FH(new_dir);
383 data->args.new_name = &new_dentry->d_name;
384
385 /* set up nfs_renameres */
386 data->res.old_fattr = &data->old_fattr;
387 data->res.new_fattr = &data->new_fattr;
388
389 nfs_sb_active(old_dir->i_sb);
390
f2c2c552 391 NFS_PROTO(data->old_dir)->rename_setup(&msg, old_dentry, new_dentry);
d3d4152a 392
f7732d65 393 return rpc_run_task(&task_setup_data);
d3d4152a
JL
394}
395
96f9d8c0
JL
396/*
397 * Perform tasks needed when a sillyrename is done such as cancelling the
398 * queued async unlink if it failed.
399 */
400static void
401nfs_complete_sillyrename(struct rpc_task *task, struct nfs_renamedata *data)
402{
f7be7284
JL
403 struct dentry *dentry = data->old_dentry;
404
405 if (task->tk_status != 0) {
406 nfs_cancel_async_unlink(dentry);
407 return;
408 }
96f9d8c0
JL
409}
410
c2dd1378
TM
/*
 * Layout of a silly name: the ".nfs" prefix, then the file id and a
 * counter, each printed as zero-padded hex (two characters per byte).
 */
#define SILLYNAME_PREFIX	".nfs"
#define SILLYNAME_PREFIX_LEN	((unsigned)sizeof(SILLYNAME_PREFIX) - 1)
#define SILLYNAME_FILEID_LEN	(2 * (unsigned)sizeof(u64))
#define SILLYNAME_COUNTER_LEN	(2 * (unsigned)sizeof(unsigned int))
#define SILLYNAME_LEN		(SILLYNAME_PREFIX_LEN + \
				 SILLYNAME_FILEID_LEN + \
				 SILLYNAME_COUNTER_LEN)
418
779c5179
JL
419/**
420 * nfs_sillyrename - Perform a silly-rename of a dentry
421 * @dir: inode of directory that contains dentry
422 * @dentry: dentry to be sillyrenamed
423 *
424 * NFSv2/3 is stateless and the server doesn't know when the client is
425 * holding a file open. To prevent application problems when a file is
426 * unlinked while it's still open, the client performs a "silly-rename".
427 * That is, it renames the file to a hidden file in the same directory,
428 * and only performs the unlink once the last reference to it is put.
429 *
430 * The final cleanup is done during dentry_iput.
674e405b
BF
431 *
432 * (Note: NFSv4 is stateful, and has opens, so in theory an NFSv4 server
433 * could take responsibility for keeping open files referenced. The server
434 * would also need to ensure that opened-but-deleted files were kept over
435 * reboots. However, we may not assume a server does so. (RFC 5661
436 * does provide an OPEN4_RESULT_PRESERVE_UNLINKED flag that a server can
437 * use to advertise that it does this; some day we may take advantage of
438 * it.))
779c5179
JL
439 */
440int
441nfs_sillyrename(struct inode *dir, struct dentry *dentry)
442{
443 static unsigned int sillycounter;
c2dd1378
TM
444 unsigned char silly[SILLYNAME_LEN + 1];
445 unsigned long long fileid;
779c5179 446 struct dentry *sdentry;
3cb3fd6d 447 struct inode *inode = d_inode(dentry);
d3d4152a 448 struct rpc_task *task;
4f5829d7 449 int error = -EBUSY;
779c5179 450
6de1472f
AV
451 dfprintk(VFS, "NFS: silly-rename(%pd2, ct=%d)\n",
452 dentry, d_count(dentry));
779c5179
JL
453 nfs_inc_stats(dir, NFSIOS_SILLYRENAME);
454
455 /*
456 * We don't allow a dentry to be silly-renamed twice.
457 */
779c5179
JL
458 if (dentry->d_flags & DCACHE_NFSFS_RENAMED)
459 goto out;
460
2b0143b5 461 fileid = NFS_FILEID(d_inode(dentry));
779c5179 462
779c5179
JL
463 sdentry = NULL;
464 do {
c2dd1378 465 int slen;
779c5179
JL
466 dput(sdentry);
467 sillycounter++;
c2dd1378
TM
468 slen = scnprintf(silly, sizeof(silly),
469 SILLYNAME_PREFIX "%0*llx%0*x",
470 SILLYNAME_FILEID_LEN, fileid,
471 SILLYNAME_COUNTER_LEN, sillycounter);
779c5179 472
6de1472f
AV
473 dfprintk(VFS, "NFS: trying to rename %pd to %s\n",
474 dentry, silly);
779c5179
JL
475
476 sdentry = lookup_one_len(silly, dentry->d_parent, slen);
477 /*
478 * N.B. Better to return EBUSY here ... it could be
479 * dangerous to delete the file while it's in use.
480 */
481 if (IS_ERR(sdentry))
482 goto out;
2b0143b5 483 } while (d_inode(sdentry) != NULL); /* need negative lookup */
779c5179 484
3cb3fd6d
TM
485 ihold(inode);
486
d3d4152a
JL
487 /* queue unlink first. Can't do this from rpc_release as it
488 * has to allocate memory
489 */
884be175 490 error = nfs_async_unlink(dentry, &sdentry->d_name);
d3d4152a
JL
491 if (error)
492 goto out_dput;
493
494 /* run the rename task, undo unlink if it fails */
96f9d8c0
JL
495 task = nfs_async_rename(dir, dir, dentry, sdentry,
496 nfs_complete_sillyrename);
d3d4152a
JL
497 if (IS_ERR(task)) {
498 error = -EBUSY;
499 nfs_cancel_async_unlink(dentry);
500 goto out_dput;
779c5179 501 }
d3d4152a
JL
502
503 /* wait for the RPC task to complete, unless a SIGKILL intervenes */
504 error = rpc_wait_for_completion_task(task);
505 if (error == 0)
506 error = task->tk_status;
5a7a613a
TM
507 switch (error) {
508 case 0:
509 /* The rename succeeded */
510 nfs_set_verifier(dentry, nfs_save_change_attribute(dir));
3cb3fd6d
TM
511 spin_lock(&inode->i_lock);
512 NFS_I(inode)->attr_gencount = nfs_inc_attr_generation_counter();
ac46b3d7
TM
513 nfs_set_cache_invalid(inode, NFS_INO_INVALID_CHANGE |
514 NFS_INO_INVALID_CTIME |
515 NFS_INO_REVAL_FORCED);
3cb3fd6d 516 spin_unlock(&inode->i_lock);
5a7a613a
TM
517 d_move(dentry, sdentry);
518 break;
519 case -ERESTARTSYS:
520 /* The result of the rename is unknown. Play it safe by
521 * forcing a new lookup */
522 d_drop(dentry);
523 d_drop(sdentry);
524 }
d3d4152a
JL
525 rpc_put_task(task);
526out_dput:
3cb3fd6d 527 iput(inode);
779c5179
JL
528 dput(sdentry);
529out:
530 return error;
531}