1 /* 2 * linux/fs/nfs/unlink.c 3 * 4 * nfs sillydelete handling 5 * 6 */ 7 8 #include <linux/slab.h> 9 #include <linux/string.h> 10 #include <linux/dcache.h> 11 #include <linux/sunrpc/sched.h> 12 #include <linux/sunrpc/clnt.h> 13 #include <linux/nfs_fs.h> 14 #include <linux/sched.h> 15 #include <linux/wait.h> 16 #include <linux/namei.h> 17 #include <linux/fsnotify.h> 18 19 #include "internal.h" 20 #include "nfs4_fs.h" 21 #include "iostat.h" 22 #include "delegation.h" 23 24 #include "nfstrace.h" 25 26 /** 27 * nfs_free_unlinkdata - release data from a sillydelete operation. 28 * @data: pointer to unlink structure. 29 */ 30 static void 31 nfs_free_unlinkdata(struct nfs_unlinkdata *data) 32 { 33 iput(data->dir); 34 put_rpccred(data->cred); 35 kfree(data->args.name.name); 36 kfree(data); 37 } 38 39 #define NAME_ALLOC_LEN(len) ((len+16) & ~15) 40 /** 41 * nfs_copy_dname - copy dentry name to data structure 42 * @dentry: pointer to dentry 43 * @data: nfs_unlinkdata 44 */ 45 static int nfs_copy_dname(struct dentry *dentry, struct nfs_unlinkdata *data) 46 { 47 char *str; 48 int len = dentry->d_name.len; 49 50 str = kmemdup(dentry->d_name.name, NAME_ALLOC_LEN(len), GFP_KERNEL); 51 if (!str) 52 return -ENOMEM; 53 data->args.name.len = len; 54 data->args.name.name = str; 55 return 0; 56 } 57 58 static void nfs_free_dname(struct nfs_unlinkdata *data) 59 { 60 kfree(data->args.name.name); 61 data->args.name.name = NULL; 62 data->args.name.len = 0; 63 } 64 65 static void nfs_dec_sillycount(struct inode *dir) 66 { 67 struct nfs_inode *nfsi = NFS_I(dir); 68 if (atomic_dec_return(&nfsi->silly_count) == 1) 69 wake_up(&nfsi->waitqueue); 70 } 71 72 /** 73 * nfs_async_unlink_done - Sillydelete post-processing 74 * @task: rpc_task of the sillydelete 75 * 76 * Do the directory attribute update. 77 */ 78 static void nfs_async_unlink_done(struct rpc_task *task, void *calldata) 79 { 80 struct nfs_unlinkdata *data = calldata; 81 struct inode *dir = data->dir; 82 83 trace_nfs_sillyrename_unlink(data, task->tk_status); 84 if (!NFS_PROTO(dir)->unlink_done(task, dir)) 85 rpc_restart_call_prepare(task); 86 } 87 88 /** 89 * nfs_async_unlink_release - Release the sillydelete data. 90 * @task: rpc_task of the sillydelete 91 * 92 * We need to call nfs_put_unlinkdata as a 'tk_release' task since the 93 * rpc_task would be freed too. 94 */ 95 static void nfs_async_unlink_release(void *calldata) 96 { 97 struct nfs_unlinkdata *data = calldata; 98 struct super_block *sb = data->dir->i_sb; 99 100 nfs_dec_sillycount(data->dir); 101 nfs_free_unlinkdata(data); 102 nfs_sb_deactive(sb); 103 } 104 105 static void nfs_unlink_prepare(struct rpc_task *task, void *calldata) 106 { 107 struct nfs_unlinkdata *data = calldata; 108 NFS_PROTO(data->dir)->unlink_rpc_prepare(task, data); 109 } 110 111 static const struct rpc_call_ops nfs_unlink_ops = { 112 .rpc_call_done = nfs_async_unlink_done, 113 .rpc_release = nfs_async_unlink_release, 114 .rpc_call_prepare = nfs_unlink_prepare, 115 }; 116 117 static int nfs_do_call_unlink(struct dentry *parent, struct inode *dir, struct nfs_unlinkdata *data) 118 { 119 struct rpc_message msg = { 120 .rpc_argp = &data->args, 121 .rpc_resp = &data->res, 122 .rpc_cred = data->cred, 123 }; 124 struct rpc_task_setup task_setup_data = { 125 .rpc_message = &msg, 126 .callback_ops = &nfs_unlink_ops, 127 .callback_data = data, 128 .workqueue = nfsiod_workqueue, 129 .flags = RPC_TASK_ASYNC, 130 }; 131 struct rpc_task *task; 132 struct dentry *alias; 133 134 alias = d_lookup(parent, &data->args.name); 135 if (alias != NULL) { 136 int ret; 137 void *devname_garbage = NULL; 138 139 /* 140 * Hey, we raced with lookup... See if we need to transfer 141 * the sillyrename information to the aliased dentry. 142 */ 143 nfs_free_dname(data); 144 ret = nfs_copy_dname(alias, data); 145 spin_lock(&alias->d_lock); 146 if (ret == 0 && alias->d_inode != NULL && 147 !(alias->d_flags & DCACHE_NFSFS_RENAMED)) { 148 devname_garbage = alias->d_fsdata; 149 alias->d_fsdata = data; 150 alias->d_flags |= DCACHE_NFSFS_RENAMED; 151 ret = 1; 152 } else 153 ret = 0; 154 spin_unlock(&alias->d_lock); 155 nfs_dec_sillycount(dir); 156 dput(alias); 157 /* 158 * If we'd displaced old cached devname, free it. At that 159 * point dentry is definitely not a root, so we won't need 160 * that anymore. 161 */ 162 kfree(devname_garbage); 163 return ret; 164 } 165 data->dir = igrab(dir); 166 if (!data->dir) { 167 nfs_dec_sillycount(dir); 168 return 0; 169 } 170 nfs_sb_active(dir->i_sb); 171 data->args.fh = NFS_FH(dir); 172 nfs_fattr_init(data->res.dir_attr); 173 174 NFS_PROTO(dir)->unlink_setup(&msg, dir); 175 176 task_setup_data.rpc_client = NFS_CLIENT(dir); 177 task = rpc_run_task(&task_setup_data); 178 if (!IS_ERR(task)) 179 rpc_put_task_async(task); 180 return 1; 181 } 182 183 static int nfs_call_unlink(struct dentry *dentry, struct nfs_unlinkdata *data) 184 { 185 struct dentry *parent; 186 struct inode *dir; 187 int ret = 0; 188 189 190 parent = dget_parent(dentry); 191 if (parent == NULL) 192 goto out_free; 193 dir = parent->d_inode; 194 /* Non-exclusive lock protects against concurrent lookup() calls */ 195 spin_lock(&dir->i_lock); 196 if (atomic_inc_not_zero(&NFS_I(dir)->silly_count) == 0) { 197 /* Deferred delete */ 198 hlist_add_head(&data->list, &NFS_I(dir)->silly_list); 199 spin_unlock(&dir->i_lock); 200 ret = 1; 201 goto out_dput; 202 } 203 spin_unlock(&dir->i_lock); 204 ret = nfs_do_call_unlink(parent, dir, data); 205 out_dput: 206 dput(parent); 207 out_free: 208 return ret; 209 } 210 211 void nfs_wait_on_sillyrename(struct dentry *dentry) 212 { 213 struct nfs_inode *nfsi = NFS_I(dentry->d_inode); 214 215 wait_event(nfsi->waitqueue, atomic_read(&nfsi->silly_count) <= 1); 216 } 217 218 void nfs_block_sillyrename(struct dentry *dentry) 219 { 220 struct nfs_inode *nfsi = NFS_I(dentry->d_inode); 221 222 wait_event(nfsi->waitqueue, atomic_cmpxchg(&nfsi->silly_count, 1, 0) == 1); 223 } 224 225 void nfs_unblock_sillyrename(struct dentry *dentry) 226 { 227 struct inode *dir = dentry->d_inode; 228 struct nfs_inode *nfsi = NFS_I(dir); 229 struct nfs_unlinkdata *data; 230 231 atomic_inc(&nfsi->silly_count); 232 spin_lock(&dir->i_lock); 233 while (!hlist_empty(&nfsi->silly_list)) { 234 if (!atomic_inc_not_zero(&nfsi->silly_count)) 235 break; 236 data = hlist_entry(nfsi->silly_list.first, struct nfs_unlinkdata, list); 237 hlist_del(&data->list); 238 spin_unlock(&dir->i_lock); 239 if (nfs_do_call_unlink(dentry, dir, data) == 0) 240 nfs_free_unlinkdata(data); 241 spin_lock(&dir->i_lock); 242 } 243 spin_unlock(&dir->i_lock); 244 } 245 246 /** 247 * nfs_async_unlink - asynchronous unlinking of a file 248 * @dir: parent directory of dentry 249 * @dentry: dentry to unlink 250 */ 251 static int 252 nfs_async_unlink(struct inode *dir, struct dentry *dentry) 253 { 254 struct nfs_unlinkdata *data; 255 int status = -ENOMEM; 256 void *devname_garbage = NULL; 257 258 data = kzalloc(sizeof(*data), GFP_KERNEL); 259 if (data == NULL) 260 goto out; 261 262 data->cred = rpc_lookup_cred(); 263 if (IS_ERR(data->cred)) { 264 status = PTR_ERR(data->cred); 265 goto out_free; 266 } 267 data->res.dir_attr = &data->dir_attr; 268 269 status = -EBUSY; 270 spin_lock(&dentry->d_lock); 271 if (dentry->d_flags & DCACHE_NFSFS_RENAMED) 272 goto out_unlock; 273 dentry->d_flags |= DCACHE_NFSFS_RENAMED; 274 devname_garbage = dentry->d_fsdata; 275 dentry->d_fsdata = data; 276 spin_unlock(&dentry->d_lock); 277 /* 278 * If we'd displaced old cached devname, free it. At that 279 * point dentry is definitely not a root, so we won't need 280 * that anymore. 281 */ 282 kfree(devname_garbage); 283 return 0; 284 out_unlock: 285 spin_unlock(&dentry->d_lock); 286 put_rpccred(data->cred); 287 out_free: 288 kfree(data); 289 out: 290 return status; 291 } 292 293 /** 294 * nfs_complete_unlink - Initialize completion of the sillydelete 295 * @dentry: dentry to delete 296 * @inode: inode 297 * 298 * Since we're most likely to be called by dentry_iput(), we 299 * only use the dentry to find the sillydelete. We then copy the name 300 * into the qstr. 301 */ 302 void 303 nfs_complete_unlink(struct dentry *dentry, struct inode *inode) 304 { 305 struct nfs_unlinkdata *data = NULL; 306 307 spin_lock(&dentry->d_lock); 308 if (dentry->d_flags & DCACHE_NFSFS_RENAMED) { 309 dentry->d_flags &= ~DCACHE_NFSFS_RENAMED; 310 data = dentry->d_fsdata; 311 dentry->d_fsdata = NULL; 312 } 313 spin_unlock(&dentry->d_lock); 314 315 if (data != NULL && (NFS_STALE(inode) || !nfs_call_unlink(dentry, data))) 316 nfs_free_unlinkdata(data); 317 } 318 319 /* Cancel a queued async unlink. Called when a sillyrename run fails. */ 320 static void 321 nfs_cancel_async_unlink(struct dentry *dentry) 322 { 323 spin_lock(&dentry->d_lock); 324 if (dentry->d_flags & DCACHE_NFSFS_RENAMED) { 325 struct nfs_unlinkdata *data = dentry->d_fsdata; 326 327 dentry->d_flags &= ~DCACHE_NFSFS_RENAMED; 328 dentry->d_fsdata = NULL; 329 spin_unlock(&dentry->d_lock); 330 nfs_free_unlinkdata(data); 331 return; 332 } 333 spin_unlock(&dentry->d_lock); 334 } 335 336 /** 337 * nfs_async_rename_done - Sillyrename post-processing 338 * @task: rpc_task of the sillyrename 339 * @calldata: nfs_renamedata for the sillyrename 340 * 341 * Do the directory attribute updates and the d_move 342 */ 343 static void nfs_async_rename_done(struct rpc_task *task, void *calldata) 344 { 345 struct nfs_renamedata *data = calldata; 346 struct inode *old_dir = data->old_dir; 347 struct inode *new_dir = data->new_dir; 348 struct dentry *old_dentry = data->old_dentry; 349 350 trace_nfs_sillyrename_rename(old_dir, old_dentry, 351 new_dir, data->new_dentry, task->tk_status); 352 if (!NFS_PROTO(old_dir)->rename_done(task, old_dir, new_dir)) { 353 rpc_restart_call_prepare(task); 354 return; 355 } 356 357 if (data->complete) 358 data->complete(task, data); 359 } 360 361 /** 362 * nfs_async_rename_release - Release the sillyrename data. 363 * @calldata: the struct nfs_renamedata to be released 364 */ 365 static void nfs_async_rename_release(void *calldata) 366 { 367 struct nfs_renamedata *data = calldata; 368 struct super_block *sb = data->old_dir->i_sb; 369 370 if (data->old_dentry->d_inode) 371 nfs_mark_for_revalidate(data->old_dentry->d_inode); 372 373 dput(data->old_dentry); 374 dput(data->new_dentry); 375 iput(data->old_dir); 376 iput(data->new_dir); 377 nfs_sb_deactive(sb); 378 put_rpccred(data->cred); 379 kfree(data); 380 } 381 382 static void nfs_rename_prepare(struct rpc_task *task, void *calldata) 383 { 384 struct nfs_renamedata *data = calldata; 385 NFS_PROTO(data->old_dir)->rename_rpc_prepare(task, data); 386 } 387 388 static const struct rpc_call_ops nfs_rename_ops = { 389 .rpc_call_done = nfs_async_rename_done, 390 .rpc_release = nfs_async_rename_release, 391 .rpc_call_prepare = nfs_rename_prepare, 392 }; 393 394 /** 395 * nfs_async_rename - perform an asynchronous rename operation 396 * @old_dir: directory that currently holds the dentry to be renamed 397 * @new_dir: target directory for the rename 398 * @old_dentry: original dentry to be renamed 399 * @new_dentry: dentry to which the old_dentry should be renamed 400 * 401 * It's expected that valid references to the dentries and inodes are held 402 */ 403 struct rpc_task * 404 nfs_async_rename(struct inode *old_dir, struct inode *new_dir, 405 struct dentry *old_dentry, struct dentry *new_dentry, 406 void (*complete)(struct rpc_task *, struct nfs_renamedata *)) 407 { 408 struct nfs_renamedata *data; 409 struct rpc_message msg = { }; 410 struct rpc_task_setup task_setup_data = { 411 .rpc_message = &msg, 412 .callback_ops = &nfs_rename_ops, 413 .workqueue = nfsiod_workqueue, 414 .rpc_client = NFS_CLIENT(old_dir), 415 .flags = RPC_TASK_ASYNC, 416 }; 417 418 data = kzalloc(sizeof(*data), GFP_KERNEL); 419 if (data == NULL) 420 return ERR_PTR(-ENOMEM); 421 task_setup_data.callback_data = data; 422 423 data->cred = rpc_lookup_cred(); 424 if (IS_ERR(data->cred)) { 425 struct rpc_task *task = ERR_CAST(data->cred); 426 kfree(data); 427 return task; 428 } 429 430 msg.rpc_argp = &data->args; 431 msg.rpc_resp = &data->res; 432 msg.rpc_cred = data->cred; 433 434 /* set up nfs_renamedata */ 435 data->old_dir = old_dir; 436 ihold(old_dir); 437 data->new_dir = new_dir; 438 ihold(new_dir); 439 data->old_dentry = dget(old_dentry); 440 data->new_dentry = dget(new_dentry); 441 nfs_fattr_init(&data->old_fattr); 442 nfs_fattr_init(&data->new_fattr); 443 data->complete = complete; 444 445 /* set up nfs_renameargs */ 446 data->args.old_dir = NFS_FH(old_dir); 447 data->args.old_name = &old_dentry->d_name; 448 data->args.new_dir = NFS_FH(new_dir); 449 data->args.new_name = &new_dentry->d_name; 450 451 /* set up nfs_renameres */ 452 data->res.old_fattr = &data->old_fattr; 453 data->res.new_fattr = &data->new_fattr; 454 455 nfs_sb_active(old_dir->i_sb); 456 457 NFS_PROTO(data->old_dir)->rename_setup(&msg, old_dir); 458 459 return rpc_run_task(&task_setup_data); 460 } 461 462 /* 463 * Perform tasks needed when a sillyrename is done such as cancelling the 464 * queued async unlink if it failed. 465 */ 466 static void 467 nfs_complete_sillyrename(struct rpc_task *task, struct nfs_renamedata *data) 468 { 469 struct dentry *dentry = data->old_dentry; 470 471 if (task->tk_status != 0) { 472 nfs_cancel_async_unlink(dentry); 473 return; 474 } 475 476 /* 477 * vfs_unlink and the like do not issue this when a file is 478 * sillyrenamed, so do it here. 479 */ 480 fsnotify_nameremove(dentry, 0); 481 } 482 483 #define SILLYNAME_PREFIX ".nfs" 484 #define SILLYNAME_PREFIX_LEN ((unsigned)sizeof(SILLYNAME_PREFIX) - 1) 485 #define SILLYNAME_FILEID_LEN ((unsigned)sizeof(u64) << 1) 486 #define SILLYNAME_COUNTER_LEN ((unsigned)sizeof(unsigned int) << 1) 487 #define SILLYNAME_LEN (SILLYNAME_PREFIX_LEN + \ 488 SILLYNAME_FILEID_LEN + \ 489 SILLYNAME_COUNTER_LEN) 490 491 /** 492 * nfs_sillyrename - Perform a silly-rename of a dentry 493 * @dir: inode of directory that contains dentry 494 * @dentry: dentry to be sillyrenamed 495 * 496 * NFSv2/3 is stateless and the server doesn't know when the client is 497 * holding a file open. To prevent application problems when a file is 498 * unlinked while it's still open, the client performs a "silly-rename". 499 * That is, it renames the file to a hidden file in the same directory, 500 * and only performs the unlink once the last reference to it is put. 501 * 502 * The final cleanup is done during dentry_iput. 503 * 504 * (Note: NFSv4 is stateful, and has opens, so in theory an NFSv4 server 505 * could take responsibility for keeping open files referenced. The server 506 * would also need to ensure that opened-but-deleted files were kept over 507 * reboots. However, we may not assume a server does so. (RFC 5661 508 * does provide an OPEN4_RESULT_PRESERVE_UNLINKED flag that a server can 509 * use to advertise that it does this; some day we may take advantage of 510 * it.)) 511 */ 512 int 513 nfs_sillyrename(struct inode *dir, struct dentry *dentry) 514 { 515 static unsigned int sillycounter; 516 unsigned char silly[SILLYNAME_LEN + 1]; 517 unsigned long long fileid; 518 struct dentry *sdentry; 519 struct rpc_task *task; 520 int error = -EBUSY; 521 522 dfprintk(VFS, "NFS: silly-rename(%pd2, ct=%d)\n", 523 dentry, d_count(dentry)); 524 nfs_inc_stats(dir, NFSIOS_SILLYRENAME); 525 526 /* 527 * We don't allow a dentry to be silly-renamed twice. 528 */ 529 if (dentry->d_flags & DCACHE_NFSFS_RENAMED) 530 goto out; 531 532 fileid = NFS_FILEID(dentry->d_inode); 533 534 /* Return delegation in anticipation of the rename */ 535 NFS_PROTO(dentry->d_inode)->return_delegation(dentry->d_inode); 536 537 sdentry = NULL; 538 do { 539 int slen; 540 dput(sdentry); 541 sillycounter++; 542 slen = scnprintf(silly, sizeof(silly), 543 SILLYNAME_PREFIX "%0*llx%0*x", 544 SILLYNAME_FILEID_LEN, fileid, 545 SILLYNAME_COUNTER_LEN, sillycounter); 546 547 dfprintk(VFS, "NFS: trying to rename %pd to %s\n", 548 dentry, silly); 549 550 sdentry = lookup_one_len(silly, dentry->d_parent, slen); 551 /* 552 * N.B. Better to return EBUSY here ... it could be 553 * dangerous to delete the file while it's in use. 554 */ 555 if (IS_ERR(sdentry)) 556 goto out; 557 } while (sdentry->d_inode != NULL); /* need negative lookup */ 558 559 /* queue unlink first. Can't do this from rpc_release as it 560 * has to allocate memory 561 */ 562 error = nfs_async_unlink(dir, dentry); 563 if (error) 564 goto out_dput; 565 566 /* populate unlinkdata with the right dname */ 567 error = nfs_copy_dname(sdentry, 568 (struct nfs_unlinkdata *)dentry->d_fsdata); 569 if (error) { 570 nfs_cancel_async_unlink(dentry); 571 goto out_dput; 572 } 573 574 /* run the rename task, undo unlink if it fails */ 575 task = nfs_async_rename(dir, dir, dentry, sdentry, 576 nfs_complete_sillyrename); 577 if (IS_ERR(task)) { 578 error = -EBUSY; 579 nfs_cancel_async_unlink(dentry); 580 goto out_dput; 581 } 582 583 /* wait for the RPC task to complete, unless a SIGKILL intervenes */ 584 error = rpc_wait_for_completion_task(task); 585 if (error == 0) 586 error = task->tk_status; 587 switch (error) { 588 case 0: 589 /* The rename succeeded */ 590 nfs_set_verifier(dentry, nfs_save_change_attribute(dir)); 591 d_move(dentry, sdentry); 592 break; 593 case -ERESTARTSYS: 594 /* The result of the rename is unknown. Play it safe by 595 * forcing a new lookup */ 596 d_drop(dentry); 597 d_drop(sdentry); 598 } 599 rpc_put_task(task); 600 out_dput: 601 dput(sdentry); 602 out: 603 return error; 604 } 605