]> git.proxmox.com Git - mirror_ubuntu-artful-kernel.git/blame - fs/nfs/unlink.c
RDMA: Increasing RPCRDMA_MAX_DATA_SEGS
[mirror_ubuntu-artful-kernel.git] / fs / nfs / unlink.c
CommitLineData
1da177e4
LT
1/*
2 * linux/fs/nfs/unlink.c
3 *
4 * nfs sillydelete handling
5 *
1da177e4
LT
6 */
7
8#include <linux/slab.h>
9#include <linux/string.h>
10#include <linux/dcache.h>
11#include <linux/sunrpc/sched.h>
12#include <linux/sunrpc/clnt.h>
13#include <linux/nfs_fs.h>
b35e7041
LT
14#include <linux/sched.h>
15#include <linux/wait.h>
779c5179 16#include <linux/namei.h>
1da177e4 17
ef818a28 18#include "internal.h"
472cfbd9 19#include "nfs4_fs.h"
779c5179
JL
20#include "iostat.h"
21#include "delegation.h"
ef818a28 22
1da177e4 23struct nfs_unlinkdata {
565277f6 24 struct hlist_node list;
e4eff1a6
TM
25 struct nfs_removeargs args;
26 struct nfs_removeres res;
27 struct inode *dir;
1da177e4 28 struct rpc_cred *cred;
d346890b 29 struct nfs_fattr dir_attr;
1da177e4
LT
30};
31
1da177e4 32/**
e4eff1a6 33 * nfs_free_unlinkdata - release data from a sillydelete operation.
1da177e4
LT
34 * @data: pointer to unlink structure.
35 */
36static void
e4eff1a6 37nfs_free_unlinkdata(struct nfs_unlinkdata *data)
1da177e4 38{
e4eff1a6
TM
39 iput(data->dir);
40 put_rpccred(data->cred);
41 kfree(data->args.name.name);
42 kfree(data);
1da177e4
LT
43}
44
45#define NAME_ALLOC_LEN(len) ((len+16) & ~15)
46/**
47 * nfs_copy_dname - copy dentry name to data structure
48 * @dentry: pointer to dentry
49 * @data: nfs_unlinkdata
50 */
e4eff1a6 51static int nfs_copy_dname(struct dentry *dentry, struct nfs_unlinkdata *data)
1da177e4
LT
52{
53 char *str;
54 int len = dentry->d_name.len;
55
e4eff1a6 56 str = kmemdup(dentry->d_name.name, NAME_ALLOC_LEN(len), GFP_KERNEL);
1da177e4 57 if (!str)
e4eff1a6
TM
58 return -ENOMEM;
59 data->args.name.len = len;
60 data->args.name.name = str;
61 return 0;
1da177e4
LT
62}
63
565277f6
TM
64static void nfs_free_dname(struct nfs_unlinkdata *data)
65{
66 kfree(data->args.name.name);
67 data->args.name.name = NULL;
68 data->args.name.len = 0;
69}
70
71static void nfs_dec_sillycount(struct inode *dir)
72{
73 struct nfs_inode *nfsi = NFS_I(dir);
74 if (atomic_dec_return(&nfsi->silly_count) == 1)
75 wake_up(&nfsi->waitqueue);
76}
77
1da177e4
LT
78/**
79 * nfs_async_unlink_done - Sillydelete post-processing
80 * @task: rpc_task of the sillydelete
81 *
82 * Do the directory attribute update.
83 */
963d8fe5 84static void nfs_async_unlink_done(struct rpc_task *task, void *calldata)
1da177e4 85{
e4eff1a6
TM
86 struct nfs_unlinkdata *data = calldata;
87 struct inode *dir = data->dir;
88
89 if (!NFS_PROTO(dir)->unlink_done(task, dir))
0110ee15 90 nfs_restart_rpc(task, NFS_SERVER(dir)->nfs_client);
1da177e4
LT
91}
92
93/**
94 * nfs_async_unlink_release - Release the sillydelete data.
95 * @task: rpc_task of the sillydelete
96 *
97 * We need to call nfs_put_unlinkdata as a 'tk_release' task since the
98 * rpc_task would be freed too.
99 */
963d8fe5 100static void nfs_async_unlink_release(void *calldata)
1da177e4 101{
963d8fe5 102 struct nfs_unlinkdata *data = calldata;
744d18db 103 struct super_block *sb = data->dir->i_sb;
565277f6
TM
104
105 nfs_dec_sillycount(data->dir);
e4eff1a6 106 nfs_free_unlinkdata(data);
1daef0a8 107 nfs_sb_deactive(sb);
1da177e4
LT
108}
109
472cfbd9
AA
#if defined(CONFIG_NFS_V4_1)
/*
 * rpc_call_prepare callback for the sillydelete: set up the NFSv4.1
 * sequence for the call and start the RPC only if that setup returned
 * zero.
 */
void nfs_unlink_prepare(struct rpc_task *task, void *calldata)
{
	struct nfs_unlinkdata *data = calldata;
	struct nfs_server *server = NFS_SERVER(data->dir);

	if (nfs4_setup_sequence(server, &data->args.seq_args,
				&data->res.seq_res, 1, task) == 0)
		rpc_call_start(task);
}
#endif /* CONFIG_NFS_V4_1 */
122
963d8fe5
TM
123static const struct rpc_call_ops nfs_unlink_ops = {
124 .rpc_call_done = nfs_async_unlink_done,
125 .rpc_release = nfs_async_unlink_release,
472cfbd9
AA
126#if defined(CONFIG_NFS_V4_1)
127 .rpc_call_prepare = nfs_unlink_prepare,
128#endif /* CONFIG_NFS_V4_1 */
963d8fe5
TM
129};
130
565277f6 131static int nfs_do_call_unlink(struct dentry *parent, struct inode *dir, struct nfs_unlinkdata *data)
e4eff1a6 132{
5138fde0
TM
133 struct rpc_message msg = {
134 .rpc_argp = &data->args,
135 .rpc_resp = &data->res,
136 .rpc_cred = data->cred,
137 };
c970aa85 138 struct rpc_task_setup task_setup_data = {
5138fde0 139 .rpc_message = &msg,
c970aa85
TM
140 .callback_ops = &nfs_unlink_ops,
141 .callback_data = data,
1daef0a8 142 .workqueue = nfsiod_workqueue,
c970aa85
TM
143 .flags = RPC_TASK_ASYNC,
144 };
e4eff1a6 145 struct rpc_task *task;
565277f6
TM
146 struct dentry *alias;
147
148 alias = d_lookup(parent, &data->args.name);
149 if (alias != NULL) {
150 int ret = 0;
b1942c5f 151 void *devname_garbage = NULL;
609005c3 152
565277f6
TM
153 /*
154 * Hey, we raced with lookup... See if we need to transfer
155 * the sillyrename information to the aliased dentry.
156 */
157 nfs_free_dname(data);
158 spin_lock(&alias->d_lock);
609005c3
TM
159 if (alias->d_inode != NULL &&
160 !(alias->d_flags & DCACHE_NFSFS_RENAMED)) {
b1942c5f 161 devname_garbage = alias->d_fsdata;
565277f6 162 alias->d_fsdata = data;
fccca7fc 163 alias->d_flags |= DCACHE_NFSFS_RENAMED;
565277f6
TM
164 ret = 1;
165 }
166 spin_unlock(&alias->d_lock);
167 nfs_dec_sillycount(dir);
168 dput(alias);
b1942c5f
AV
169 /*
170 * If we'd displaced old cached devname, free it. At that
171 * point dentry is definitely not a root, so we won't need
172 * that anymore.
173 */
174 if (devname_garbage)
175 kfree(devname_garbage);
565277f6
TM
176 return ret;
177 }
178 data->dir = igrab(dir);
179 if (!data->dir) {
180 nfs_dec_sillycount(dir);
181 return 0;
182 }
1daef0a8 183 nfs_sb_active(dir->i_sb);
565277f6 184 data->args.fh = NFS_FH(dir);
d346890b 185 nfs_fattr_init(data->res.dir_attr);
565277f6 186
5138fde0 187 NFS_PROTO(dir)->unlink_setup(&msg, dir);
c970aa85 188
5138fde0 189 task_setup_data.rpc_client = NFS_CLIENT(dir);
c970aa85 190 task = rpc_run_task(&task_setup_data);
565277f6 191 if (!IS_ERR(task))
bf294b41 192 rpc_put_task_async(task);
565277f6
TM
193 return 1;
194}
195
196static int nfs_call_unlink(struct dentry *dentry, struct nfs_unlinkdata *data)
197{
e4eff1a6
TM
198 struct dentry *parent;
199 struct inode *dir;
565277f6 200 int ret = 0;
e4eff1a6 201
e4eff1a6
TM
202
203 parent = dget_parent(dentry);
204 if (parent == NULL)
205 goto out_free;
565277f6 206 dir = parent->d_inode;
55b70a03 207 if (nfs_copy_dname(dentry, data) != 0)
565277f6
TM
208 goto out_dput;
209 /* Non-exclusive lock protects against concurrent lookup() calls */
210 spin_lock(&dir->i_lock);
211 if (atomic_inc_not_zero(&NFS_I(dir)->silly_count) == 0) {
212 /* Deferred delete */
213 hlist_add_head(&data->list, &NFS_I(dir)->silly_list);
214 spin_unlock(&dir->i_lock);
215 ret = 1;
216 goto out_dput;
217 }
218 spin_unlock(&dir->i_lock);
219 ret = nfs_do_call_unlink(parent, dir, data);
220out_dput:
e4eff1a6 221 dput(parent);
565277f6
TM
222out_free:
223 return ret;
224}
e4eff1a6 225
565277f6
TM
226void nfs_block_sillyrename(struct dentry *dentry)
227{
228 struct nfs_inode *nfsi = NFS_I(dentry->d_inode);
e4eff1a6 229
565277f6
TM
230 wait_event(nfsi->waitqueue, atomic_cmpxchg(&nfsi->silly_count, 1, 0) == 1);
231}
232
233void nfs_unblock_sillyrename(struct dentry *dentry)
234{
235 struct inode *dir = dentry->d_inode;
236 struct nfs_inode *nfsi = NFS_I(dir);
237 struct nfs_unlinkdata *data;
238
239 atomic_inc(&nfsi->silly_count);
240 spin_lock(&dir->i_lock);
241 while (!hlist_empty(&nfsi->silly_list)) {
242 if (!atomic_inc_not_zero(&nfsi->silly_count))
243 break;
244 data = hlist_entry(nfsi->silly_list.first, struct nfs_unlinkdata, list);
245 hlist_del(&data->list);
246 spin_unlock(&dir->i_lock);
247 if (nfs_do_call_unlink(dentry, dir, data) == 0)
248 nfs_free_unlinkdata(data);
249 spin_lock(&dir->i_lock);
250 }
251 spin_unlock(&dir->i_lock);
e4eff1a6
TM
252}
253
1da177e4
LT
254/**
255 * nfs_async_unlink - asynchronous unlinking of a file
e4eff1a6 256 * @dir: parent directory of dentry
1da177e4
LT
257 * @dentry: dentry to unlink
258 */
779c5179 259static int
e4eff1a6 260nfs_async_unlink(struct inode *dir, struct dentry *dentry)
1da177e4 261{
e4eff1a6
TM
262 struct nfs_unlinkdata *data;
263 int status = -ENOMEM;
b1942c5f 264 void *devname_garbage = NULL;
1da177e4 265
bd647545 266 data = kzalloc(sizeof(*data), GFP_KERNEL);
e4eff1a6 267 if (data == NULL)
1da177e4 268 goto out;
1da177e4 269
98a8e323 270 data->cred = rpc_lookup_cred();
1da177e4
LT
271 if (IS_ERR(data->cred)) {
272 status = PTR_ERR(data->cred);
273 goto out_free;
274 }
d346890b 275 data->res.dir_attr = &data->dir_attr;
1da177e4 276
e4eff1a6 277 status = -EBUSY;
1da177e4 278 spin_lock(&dentry->d_lock);
e4eff1a6
TM
279 if (dentry->d_flags & DCACHE_NFSFS_RENAMED)
280 goto out_unlock;
1da177e4 281 dentry->d_flags |= DCACHE_NFSFS_RENAMED;
b1942c5f 282 devname_garbage = dentry->d_fsdata;
e4eff1a6 283 dentry->d_fsdata = data;
1da177e4 284 spin_unlock(&dentry->d_lock);
b1942c5f
AV
285 /*
286 * If we'd displaced old cached devname, free it. At that
287 * point dentry is definitely not a root, so we won't need
288 * that anymore.
289 */
290 if (devname_garbage)
291 kfree(devname_garbage);
e4eff1a6
TM
292 return 0;
293out_unlock:
294 spin_unlock(&dentry->d_lock);
295 put_rpccred(data->cred);
1da177e4
LT
296out_free:
297 kfree(data);
e4eff1a6 298out:
1da177e4
LT
299 return status;
300}
301
302/**
303 * nfs_complete_unlink - Initialize completion of the sillydelete
304 * @dentry: dentry to delete
e4eff1a6 305 * @inode: inode
1da177e4
LT
306 *
307 * Since we're most likely to be called by dentry_iput(), we
308 * only use the dentry to find the sillydelete. We then copy the name
309 * into the qstr.
310 */
311void
e4eff1a6 312nfs_complete_unlink(struct dentry *dentry, struct inode *inode)
1da177e4 313{
e4eff1a6 314 struct nfs_unlinkdata *data = NULL;
1da177e4 315
1da177e4 316 spin_lock(&dentry->d_lock);
e4eff1a6
TM
317 if (dentry->d_flags & DCACHE_NFSFS_RENAMED) {
318 dentry->d_flags &= ~DCACHE_NFSFS_RENAMED;
319 data = dentry->d_fsdata;
b1942c5f 320 dentry->d_fsdata = NULL;
e4eff1a6 321 }
1da177e4 322 spin_unlock(&dentry->d_lock);
e4eff1a6
TM
323
324 if (data != NULL && (NFS_STALE(inode) || !nfs_call_unlink(dentry, data)))
325 nfs_free_unlinkdata(data);
1da177e4 326}
779c5179 327
d3d4152a
JL
328/* Cancel a queued async unlink. Called when a sillyrename run fails. */
329static void
330nfs_cancel_async_unlink(struct dentry *dentry)
331{
332 spin_lock(&dentry->d_lock);
333 if (dentry->d_flags & DCACHE_NFSFS_RENAMED) {
334 struct nfs_unlinkdata *data = dentry->d_fsdata;
335
336 dentry->d_flags &= ~DCACHE_NFSFS_RENAMED;
b1942c5f 337 dentry->d_fsdata = NULL;
d3d4152a
JL
338 spin_unlock(&dentry->d_lock);
339 nfs_free_unlinkdata(data);
340 return;
341 }
342 spin_unlock(&dentry->d_lock);
343}
344
345struct nfs_renamedata {
346 struct nfs_renameargs args;
347 struct nfs_renameres res;
348 struct rpc_cred *cred;
349 struct inode *old_dir;
350 struct dentry *old_dentry;
351 struct nfs_fattr old_fattr;
352 struct inode *new_dir;
353 struct dentry *new_dentry;
354 struct nfs_fattr new_fattr;
355};
356
357/**
358 * nfs_async_rename_done - Sillyrename post-processing
359 * @task: rpc_task of the sillyrename
360 * @calldata: nfs_renamedata for the sillyrename
361 *
362 * Do the directory attribute updates and the d_move
363 */
364static void nfs_async_rename_done(struct rpc_task *task, void *calldata)
365{
366 struct nfs_renamedata *data = calldata;
367 struct inode *old_dir = data->old_dir;
368 struct inode *new_dir = data->new_dir;
369
370 if (!NFS_PROTO(old_dir)->rename_done(task, old_dir, new_dir)) {
371 nfs_restart_rpc(task, NFS_SERVER(old_dir)->nfs_client);
372 return;
373 }
374
375 if (task->tk_status != 0) {
376 nfs_cancel_async_unlink(data->old_dentry);
377 return;
378 }
379
380 nfs_set_verifier(data->old_dentry, nfs_save_change_attribute(old_dir));
381 d_move(data->old_dentry, data->new_dentry);
382}
383
384/**
385 * nfs_async_rename_release - Release the sillyrename data.
386 * @calldata: the struct nfs_renamedata to be released
387 */
388static void nfs_async_rename_release(void *calldata)
389{
390 struct nfs_renamedata *data = calldata;
391 struct super_block *sb = data->old_dir->i_sb;
392
393 if (data->old_dentry->d_inode)
394 nfs_mark_for_revalidate(data->old_dentry->d_inode);
395
396 dput(data->old_dentry);
397 dput(data->new_dentry);
398 iput(data->old_dir);
399 iput(data->new_dir);
400 nfs_sb_deactive(sb);
401 put_rpccred(data->cred);
402 kfree(data);
403}
404
#if defined(CONFIG_NFS_V4_1)
/*
 * rpc_call_prepare callback for the sillyrename: set up the NFSv4.1
 * sequence for the call and start the RPC only if that setup returned
 * zero.
 */
static void nfs_rename_prepare(struct rpc_task *task, void *calldata)
{
	struct nfs_renamedata *data = calldata;
	struct nfs_server *server = NFS_SERVER(data->old_dir);

	if (nfs4_setup_sequence(server, &data->args.seq_args,
				&data->res.seq_res, 1, task) == 0)
		rpc_call_start(task);
}
#endif /* CONFIG_NFS_V4_1 */
417
418static const struct rpc_call_ops nfs_rename_ops = {
419 .rpc_call_done = nfs_async_rename_done,
420 .rpc_release = nfs_async_rename_release,
421#if defined(CONFIG_NFS_V4_1)
422 .rpc_call_prepare = nfs_rename_prepare,
423#endif /* CONFIG_NFS_V4_1 */
424};
425
426/**
427 * nfs_async_rename - perform an asynchronous rename operation
428 * @old_dir: directory that currently holds the dentry to be renamed
429 * @new_dir: target directory for the rename
430 * @old_dentry: original dentry to be renamed
431 * @new_dentry: dentry to which the old_dentry should be renamed
432 *
433 * It's expected that valid references to the dentries and inodes are held
434 */
435static struct rpc_task *
436nfs_async_rename(struct inode *old_dir, struct inode *new_dir,
437 struct dentry *old_dentry, struct dentry *new_dentry)
438{
439 struct nfs_renamedata *data;
440 struct rpc_message msg = { };
441 struct rpc_task_setup task_setup_data = {
442 .rpc_message = &msg,
443 .callback_ops = &nfs_rename_ops,
444 .workqueue = nfsiod_workqueue,
445 .rpc_client = NFS_CLIENT(old_dir),
446 .flags = RPC_TASK_ASYNC,
447 };
d3d4152a 448
dfb4f309 449 data = kzalloc(sizeof(*data), GFP_KERNEL);
d3d4152a
JL
450 if (data == NULL)
451 return ERR_PTR(-ENOMEM);
1174dd1f 452 task_setup_data.callback_data = data;
d3d4152a
JL
453
454 data->cred = rpc_lookup_cred();
455 if (IS_ERR(data->cred)) {
f7732d65 456 struct rpc_task *task = ERR_CAST(data->cred);
d3d4152a
JL
457 kfree(data);
458 return task;
459 }
460
461 msg.rpc_argp = &data->args;
462 msg.rpc_resp = &data->res;
463 msg.rpc_cred = data->cred;
464
465 /* set up nfs_renamedata */
466 data->old_dir = old_dir;
a4118ee1 467 ihold(old_dir);
d3d4152a 468 data->new_dir = new_dir;
a4118ee1 469 ihold(new_dir);
d3d4152a
JL
470 data->old_dentry = dget(old_dentry);
471 data->new_dentry = dget(new_dentry);
472 nfs_fattr_init(&data->old_fattr);
473 nfs_fattr_init(&data->new_fattr);
474
475 /* set up nfs_renameargs */
476 data->args.old_dir = NFS_FH(old_dir);
477 data->args.old_name = &old_dentry->d_name;
478 data->args.new_dir = NFS_FH(new_dir);
479 data->args.new_name = &new_dentry->d_name;
480
481 /* set up nfs_renameres */
482 data->res.old_fattr = &data->old_fattr;
483 data->res.new_fattr = &data->new_fattr;
484
485 nfs_sb_active(old_dir->i_sb);
486
487 NFS_PROTO(data->old_dir)->rename_setup(&msg, old_dir);
488
f7732d65 489 return rpc_run_task(&task_setup_data);
d3d4152a
JL
490}
491
779c5179
JL
492/**
493 * nfs_sillyrename - Perform a silly-rename of a dentry
494 * @dir: inode of directory that contains dentry
495 * @dentry: dentry to be sillyrenamed
496 *
497 * NFSv2/3 is stateless and the server doesn't know when the client is
498 * holding a file open. To prevent application problems when a file is
499 * unlinked while it's still open, the client performs a "silly-rename".
500 * That is, it renames the file to a hidden file in the same directory,
501 * and only performs the unlink once the last reference to it is put.
502 *
503 * The final cleanup is done during dentry_iput.
674e405b
BF
504 *
505 * (Note: NFSv4 is stateful, and has opens, so in theory an NFSv4 server
506 * could take responsibility for keeping open files referenced. The server
507 * would also need to ensure that opened-but-deleted files were kept over
508 * reboots. However, we may not assume a server does so. (RFC 5661
509 * does provide an OPEN4_RESULT_PRESERVE_UNLINKED flag that a server can
510 * use to advertise that it does this; some day we may take advantage of
511 * it.))
779c5179
JL
512 */
513int
514nfs_sillyrename(struct inode *dir, struct dentry *dentry)
515{
516 static unsigned int sillycounter;
517 const int fileidsize = sizeof(NFS_FILEID(dentry->d_inode))*2;
518 const int countersize = sizeof(sillycounter)*2;
519 const int slen = sizeof(".nfs")+fileidsize+countersize-1;
520 char silly[slen+1];
779c5179 521 struct dentry *sdentry;
d3d4152a 522 struct rpc_task *task;
779c5179
JL
523 int error = -EIO;
524
525 dfprintk(VFS, "NFS: silly-rename(%s/%s, ct=%d)\n",
526 dentry->d_parent->d_name.name, dentry->d_name.name,
b7ab39f6 527 dentry->d_count);
779c5179
JL
528 nfs_inc_stats(dir, NFSIOS_SILLYRENAME);
529
530 /*
531 * We don't allow a dentry to be silly-renamed twice.
532 */
533 error = -EBUSY;
534 if (dentry->d_flags & DCACHE_NFSFS_RENAMED)
535 goto out;
536
537 sprintf(silly, ".nfs%*.*Lx",
538 fileidsize, fileidsize,
539 (unsigned long long)NFS_FILEID(dentry->d_inode));
540
541 /* Return delegation in anticipation of the rename */
542 nfs_inode_return_delegation(dentry->d_inode);
543
544 sdentry = NULL;
545 do {
546 char *suffix = silly + slen - countersize;
547
548 dput(sdentry);
549 sillycounter++;
550 sprintf(suffix, "%*.*x", countersize, countersize, sillycounter);
551
552 dfprintk(VFS, "NFS: trying to rename %s to %s\n",
553 dentry->d_name.name, silly);
554
555 sdentry = lookup_one_len(silly, dentry->d_parent, slen);
556 /*
557 * N.B. Better to return EBUSY here ... it could be
558 * dangerous to delete the file while it's in use.
559 */
560 if (IS_ERR(sdentry))
561 goto out;
562 } while (sdentry->d_inode != NULL); /* need negative lookup */
563
d3d4152a
JL
564 /* queue unlink first. Can't do this from rpc_release as it
565 * has to allocate memory
566 */
567 error = nfs_async_unlink(dir, dentry);
568 if (error)
569 goto out_dput;
570
571 /* run the rename task, undo unlink if it fails */
572 task = nfs_async_rename(dir, dir, dentry, sdentry);
573 if (IS_ERR(task)) {
574 error = -EBUSY;
575 nfs_cancel_async_unlink(dentry);
576 goto out_dput;
779c5179 577 }
d3d4152a
JL
578
579 /* wait for the RPC task to complete, unless a SIGKILL intervenes */
580 error = rpc_wait_for_completion_task(task);
581 if (error == 0)
582 error = task->tk_status;
583 rpc_put_task(task);
584out_dput:
779c5179
JL
585 dput(sdentry);
586out:
587 return error;
588}