1 /* 2 FUSE: Filesystem in Userspace 3 Copyright (C) 2001-2008 Miklos Szeredi <miklos@szeredi.hu> 4 5 This program can be distributed under the terms of the GNU GPL. 6 See the file COPYING. 7 */ 8 9 #include "fuse_i.h" 10 11 #include <linux/pagemap.h> 12 #include <linux/file.h> 13 #include <linux/sched.h> 14 #include <linux/namei.h> 15 #include <linux/slab.h> 16 17 static bool fuse_use_readdirplus(struct inode *dir, struct dir_context *ctx) 18 { 19 struct fuse_conn *fc = get_fuse_conn(dir); 20 struct fuse_inode *fi = get_fuse_inode(dir); 21 22 if (!fc->do_readdirplus) 23 return false; 24 if (!fc->readdirplus_auto) 25 return true; 26 if (test_and_clear_bit(FUSE_I_ADVISE_RDPLUS, &fi->state)) 27 return true; 28 if (ctx->pos == 0) 29 return true; 30 return false; 31 } 32 33 static void fuse_advise_use_readdirplus(struct inode *dir) 34 { 35 struct fuse_inode *fi = get_fuse_inode(dir); 36 37 set_bit(FUSE_I_ADVISE_RDPLUS, &fi->state); 38 } 39 40 #if BITS_PER_LONG >= 64 41 static inline void fuse_dentry_settime(struct dentry *entry, u64 time) 42 { 43 entry->d_time = time; 44 } 45 46 static inline u64 fuse_dentry_time(struct dentry *entry) 47 { 48 return entry->d_time; 49 } 50 #else 51 /* 52 * On 32 bit archs store the high 32 bits of time in d_fsdata 53 */ 54 static void fuse_dentry_settime(struct dentry *entry, u64 time) 55 { 56 entry->d_time = time; 57 entry->d_fsdata = (void *) (unsigned long) (time >> 32); 58 } 59 60 static u64 fuse_dentry_time(struct dentry *entry) 61 { 62 return (u64) entry->d_time + 63 ((u64) (unsigned long) entry->d_fsdata << 32); 64 } 65 #endif 66 67 /* 68 * FUSE caches dentries and attributes with separate timeout. The 69 * time in jiffies until the dentry/attributes are valid is stored in 70 * dentry->d_time and fuse_inode->i_time respectively. 71 */ 72 73 /* 74 * Calculate the time in jiffies until a dentry/attributes are valid 75 */ 76 static u64 time_to_jiffies(unsigned long sec, unsigned long nsec) 77 { 78 if (sec || nsec) { 79 struct timespec ts = {sec, nsec}; 80 return get_jiffies_64() + timespec_to_jiffies(&ts); 81 } else 82 return 0; 83 } 84 85 /* 86 * Set dentry and possibly attribute timeouts from the lookup/mk* 87 * replies 88 */ 89 static void fuse_change_entry_timeout(struct dentry *entry, 90 struct fuse_entry_out *o) 91 { 92 fuse_dentry_settime(entry, 93 time_to_jiffies(o->entry_valid, o->entry_valid_nsec)); 94 } 95 96 static u64 attr_timeout(struct fuse_attr_out *o) 97 { 98 return time_to_jiffies(o->attr_valid, o->attr_valid_nsec); 99 } 100 101 static u64 entry_attr_timeout(struct fuse_entry_out *o) 102 { 103 return time_to_jiffies(o->attr_valid, o->attr_valid_nsec); 104 } 105 106 /* 107 * Mark the attributes as stale, so that at the next call to 108 * ->getattr() they will be fetched from userspace 109 */ 110 void fuse_invalidate_attr(struct inode *inode) 111 { 112 get_fuse_inode(inode)->i_time = 0; 113 } 114 115 /** 116 * Mark the attributes as stale due to an atime change. Avoid the invalidate if 117 * atime is not used. 118 */ 119 void fuse_invalidate_atime(struct inode *inode) 120 { 121 if (!IS_RDONLY(inode)) 122 fuse_invalidate_attr(inode); 123 } 124 125 /* 126 * Just mark the entry as stale, so that a next attempt to look it up 127 * will result in a new lookup call to userspace 128 * 129 * This is called when a dentry is about to become negative and the 130 * timeout is unknown (unlink, rmdir, rename and in some cases 131 * lookup) 132 */ 133 void fuse_invalidate_entry_cache(struct dentry *entry) 134 { 135 fuse_dentry_settime(entry, 0); 136 } 137 138 /* 139 * Same as fuse_invalidate_entry_cache(), but also try to remove the 140 * dentry from the hash 141 */ 142 static void fuse_invalidate_entry(struct dentry *entry) 143 { 144 d_invalidate(entry); 145 fuse_invalidate_entry_cache(entry); 146 } 147 148 static void fuse_lookup_init(struct fuse_conn *fc, struct fuse_args *args, 149 u64 nodeid, const struct qstr *name, 150 struct fuse_entry_out *outarg) 151 { 152 memset(outarg, 0, sizeof(struct fuse_entry_out)); 153 args->in.h.opcode = FUSE_LOOKUP; 154 args->in.h.nodeid = nodeid; 155 args->in.numargs = 1; 156 args->in.args[0].size = name->len + 1; 157 args->in.args[0].value = name->name; 158 args->out.numargs = 1; 159 args->out.args[0].size = sizeof(struct fuse_entry_out); 160 args->out.args[0].value = outarg; 161 } 162 163 u64 fuse_get_attr_version(struct fuse_conn *fc) 164 { 165 u64 curr_version; 166 167 /* 168 * The spin lock isn't actually needed on 64bit archs, but we 169 * don't yet care too much about such optimizations. 170 */ 171 spin_lock(&fc->lock); 172 curr_version = fc->attr_version; 173 spin_unlock(&fc->lock); 174 175 return curr_version; 176 } 177 178 /* 179 * Check whether the dentry is still valid 180 * 181 * If the entry validity timeout has expired and the dentry is 182 * positive, try to redo the lookup. If the lookup results in a 183 * different inode, then let the VFS invalidate the dentry and redo 184 * the lookup once more. If the lookup results in the same inode, 185 * then refresh the attributes, timeouts and mark the dentry valid. 186 */ 187 static int fuse_dentry_revalidate(struct dentry *entry, unsigned int flags) 188 { 189 struct inode *inode; 190 struct dentry *parent; 191 struct fuse_conn *fc; 192 struct fuse_inode *fi; 193 int ret; 194 195 inode = d_inode_rcu(entry); 196 if (inode && is_bad_inode(inode)) 197 goto invalid; 198 else if (time_before64(fuse_dentry_time(entry), get_jiffies_64()) || 199 (flags & LOOKUP_REVAL)) { 200 struct fuse_entry_out outarg; 201 FUSE_ARGS(args); 202 struct fuse_forget_link *forget; 203 u64 attr_version; 204 205 /* For negative dentries, always do a fresh lookup */ 206 if (!inode) 207 goto invalid; 208 209 ret = -ECHILD; 210 if (flags & LOOKUP_RCU) 211 goto out; 212 213 fc = get_fuse_conn(inode); 214 215 forget = fuse_alloc_forget(); 216 ret = -ENOMEM; 217 if (!forget) 218 goto out; 219 220 attr_version = fuse_get_attr_version(fc); 221 222 parent = dget_parent(entry); 223 fuse_lookup_init(fc, &args, get_node_id(d_inode(parent)), 224 &entry->d_name, &outarg); 225 ret = fuse_simple_request(fc, &args); 226 dput(parent); 227 /* Zero nodeid is same as -ENOENT */ 228 if (!ret && !outarg.nodeid) 229 ret = -ENOENT; 230 if (!ret) { 231 fi = get_fuse_inode(inode); 232 if (outarg.nodeid != get_node_id(inode)) { 233 fuse_queue_forget(fc, forget, outarg.nodeid, 1); 234 goto invalid; 235 } 236 spin_lock(&fc->lock); 237 fi->nlookup++; 238 spin_unlock(&fc->lock); 239 } 240 kfree(forget); 241 if (ret == -ENOMEM) 242 goto out; 243 if (ret || (outarg.attr.mode ^ inode->i_mode) & S_IFMT) 244 goto invalid; 245 246 fuse_change_attributes(inode, &outarg.attr, 247 entry_attr_timeout(&outarg), 248 attr_version); 249 fuse_change_entry_timeout(entry, &outarg); 250 } else if (inode) { 251 fi = get_fuse_inode(inode); 252 if (flags & LOOKUP_RCU) { 253 if (test_bit(FUSE_I_INIT_RDPLUS, &fi->state)) 254 return -ECHILD; 255 } else if (test_and_clear_bit(FUSE_I_INIT_RDPLUS, &fi->state)) { 256 parent = dget_parent(entry); 257 fuse_advise_use_readdirplus(d_inode(parent)); 258 dput(parent); 259 } 260 } 261 ret = 1; 262 out: 263 return ret; 264 265 invalid: 266 ret = 0; 267 goto out; 268 } 269 270 static int invalid_nodeid(u64 nodeid) 271 { 272 return !nodeid || nodeid == FUSE_ROOT_ID; 273 } 274 275 const struct dentry_operations fuse_dentry_operations = { 276 .d_revalidate = fuse_dentry_revalidate, 277 }; 278 279 int fuse_valid_type(int m) 280 { 281 return S_ISREG(m) || S_ISDIR(m) || S_ISLNK(m) || S_ISCHR(m) || 282 S_ISBLK(m) || S_ISFIFO(m) || S_ISSOCK(m); 283 } 284 285 int fuse_lookup_name(struct super_block *sb, u64 nodeid, const struct qstr *name, 286 struct fuse_entry_out *outarg, struct inode **inode) 287 { 288 struct fuse_conn *fc = get_fuse_conn_super(sb); 289 FUSE_ARGS(args); 290 struct fuse_forget_link *forget; 291 u64 attr_version; 292 int err; 293 294 *inode = NULL; 295 err = -ENAMETOOLONG; 296 if (name->len > FUSE_NAME_MAX) 297 goto out; 298 299 300 forget = fuse_alloc_forget(); 301 err = -ENOMEM; 302 if (!forget) 303 goto out; 304 305 attr_version = fuse_get_attr_version(fc); 306 307 fuse_lookup_init(fc, &args, nodeid, name, outarg); 308 err = fuse_simple_request(fc, &args); 309 /* Zero nodeid is same as -ENOENT, but with valid timeout */ 310 if (err || !outarg->nodeid) 311 goto out_put_forget; 312 313 err = -EIO; 314 if (!outarg->nodeid) 315 goto out_put_forget; 316 if (!fuse_valid_type(outarg->attr.mode)) 317 goto out_put_forget; 318 319 *inode = fuse_iget(sb, outarg->nodeid, outarg->generation, 320 &outarg->attr, entry_attr_timeout(outarg), 321 attr_version); 322 err = -ENOMEM; 323 if (!*inode) { 324 fuse_queue_forget(fc, forget, outarg->nodeid, 1); 325 goto out; 326 } 327 err = 0; 328 329 out_put_forget: 330 kfree(forget); 331 out: 332 return err; 333 } 334 335 static struct dentry *fuse_lookup(struct inode *dir, struct dentry *entry, 336 unsigned int flags) 337 { 338 int err; 339 struct fuse_entry_out outarg; 340 struct inode *inode; 341 struct dentry *newent; 342 bool outarg_valid = true; 343 344 fuse_lock_inode(dir); 345 err = fuse_lookup_name(dir->i_sb, get_node_id(dir), &entry->d_name, 346 &outarg, &inode); 347 fuse_unlock_inode(dir); 348 if (err == -ENOENT) { 349 outarg_valid = false; 350 err = 0; 351 } 352 if (err) 353 goto out_err; 354 355 err = -EIO; 356 if (inode && get_node_id(inode) == FUSE_ROOT_ID) 357 goto out_iput; 358 359 newent = d_splice_alias(inode, entry); 360 err = PTR_ERR(newent); 361 if (IS_ERR(newent)) 362 goto out_err; 363 364 entry = newent ? newent : entry; 365 if (outarg_valid) 366 fuse_change_entry_timeout(entry, &outarg); 367 else 368 fuse_invalidate_entry_cache(entry); 369 370 fuse_advise_use_readdirplus(dir); 371 return newent; 372 373 out_iput: 374 iput(inode); 375 out_err: 376 return ERR_PTR(err); 377 } 378 379 /* 380 * Atomic create+open operation 381 * 382 * If the filesystem doesn't support this, then fall back to separate 383 * 'mknod' + 'open' requests. 384 */ 385 static int fuse_create_open(struct inode *dir, struct dentry *entry, 386 struct file *file, unsigned flags, 387 umode_t mode, int *opened) 388 { 389 int err; 390 struct inode *inode; 391 struct fuse_conn *fc = get_fuse_conn(dir); 392 FUSE_ARGS(args); 393 struct fuse_forget_link *forget; 394 struct fuse_create_in inarg; 395 struct fuse_open_out outopen; 396 struct fuse_entry_out outentry; 397 struct fuse_file *ff; 398 399 /* Userspace expects S_IFREG in create mode */ 400 BUG_ON((mode & S_IFMT) != S_IFREG); 401 402 forget = fuse_alloc_forget(); 403 err = -ENOMEM; 404 if (!forget) 405 goto out_err; 406 407 err = -ENOMEM; 408 ff = fuse_file_alloc(fc); 409 if (!ff) 410 goto out_put_forget_req; 411 412 if (!fc->dont_mask) 413 mode &= ~current_umask(); 414 415 flags &= ~O_NOCTTY; 416 memset(&inarg, 0, sizeof(inarg)); 417 memset(&outentry, 0, sizeof(outentry)); 418 inarg.flags = flags; 419 inarg.mode = mode; 420 inarg.umask = current_umask(); 421 args.in.h.opcode = FUSE_CREATE; 422 args.in.h.nodeid = get_node_id(dir); 423 args.in.numargs = 2; 424 args.in.args[0].size = sizeof(inarg); 425 args.in.args[0].value = &inarg; 426 args.in.args[1].size = entry->d_name.len + 1; 427 args.in.args[1].value = entry->d_name.name; 428 args.out.numargs = 2; 429 args.out.args[0].size = sizeof(outentry); 430 args.out.args[0].value = &outentry; 431 args.out.args[1].size = sizeof(outopen); 432 args.out.args[1].value = &outopen; 433 err = fuse_simple_request(fc, &args); 434 if (err) 435 goto out_free_ff; 436 437 err = -EIO; 438 if (!S_ISREG(outentry.attr.mode) || invalid_nodeid(outentry.nodeid)) 439 goto out_free_ff; 440 441 ff->fh = outopen.fh; 442 ff->nodeid = outentry.nodeid; 443 ff->open_flags = outopen.open_flags; 444 inode = fuse_iget(dir->i_sb, outentry.nodeid, outentry.generation, 445 &outentry.attr, entry_attr_timeout(&outentry), 0); 446 if (!inode) { 447 flags &= ~(O_CREAT | O_EXCL | O_TRUNC); 448 fuse_sync_release(ff, flags); 449 fuse_queue_forget(fc, forget, outentry.nodeid, 1); 450 err = -ENOMEM; 451 goto out_err; 452 } 453 kfree(forget); 454 d_instantiate(entry, inode); 455 fuse_change_entry_timeout(entry, &outentry); 456 fuse_invalidate_attr(dir); 457 err = finish_open(file, entry, generic_file_open, opened); 458 if (err) { 459 fuse_sync_release(ff, flags); 460 } else { 461 file->private_data = fuse_file_get(ff); 462 fuse_finish_open(inode, file); 463 } 464 return err; 465 466 out_free_ff: 467 fuse_file_free(ff); 468 out_put_forget_req: 469 kfree(forget); 470 out_err: 471 return err; 472 } 473 474 static int fuse_mknod(struct inode *, struct dentry *, umode_t, dev_t); 475 static int fuse_atomic_open(struct inode *dir, struct dentry *entry, 476 struct file *file, unsigned flags, 477 umode_t mode, int *opened) 478 { 479 int err; 480 struct fuse_conn *fc = get_fuse_conn(dir); 481 struct dentry *res = NULL; 482 483 if (d_in_lookup(entry)) { 484 res = fuse_lookup(dir, entry, 0); 485 if (IS_ERR(res)) 486 return PTR_ERR(res); 487 488 if (res) 489 entry = res; 490 } 491 492 if (!(flags & O_CREAT) || d_really_is_positive(entry)) 493 goto no_open; 494 495 /* Only creates */ 496 *opened |= FILE_CREATED; 497 498 if (fc->no_create) 499 goto mknod; 500 501 err = fuse_create_open(dir, entry, file, flags, mode, opened); 502 if (err == -ENOSYS) { 503 fc->no_create = 1; 504 goto mknod; 505 } 506 out_dput: 507 dput(res); 508 return err; 509 510 mknod: 511 err = fuse_mknod(dir, entry, mode, 0); 512 if (err) 513 goto out_dput; 514 no_open: 515 return finish_no_open(file, res); 516 } 517 518 /* 519 * Code shared between mknod, mkdir, symlink and link 520 */ 521 static int create_new_entry(struct fuse_conn *fc, struct fuse_args *args, 522 struct inode *dir, struct dentry *entry, 523 umode_t mode) 524 { 525 struct fuse_entry_out outarg; 526 struct inode *inode; 527 int err; 528 struct fuse_forget_link *forget; 529 530 forget = fuse_alloc_forget(); 531 if (!forget) 532 return -ENOMEM; 533 534 memset(&outarg, 0, sizeof(outarg)); 535 args->in.h.nodeid = get_node_id(dir); 536 args->out.numargs = 1; 537 args->out.args[0].size = sizeof(outarg); 538 args->out.args[0].value = &outarg; 539 err = fuse_simple_request(fc, args); 540 if (err) 541 goto out_put_forget_req; 542 543 err = -EIO; 544 if (invalid_nodeid(outarg.nodeid)) 545 goto out_put_forget_req; 546 547 if ((outarg.attr.mode ^ mode) & S_IFMT) 548 goto out_put_forget_req; 549 550 inode = fuse_iget(dir->i_sb, outarg.nodeid, outarg.generation, 551 &outarg.attr, entry_attr_timeout(&outarg), 0); 552 if (!inode) { 553 fuse_queue_forget(fc, forget, outarg.nodeid, 1); 554 return -ENOMEM; 555 } 556 kfree(forget); 557 558 err = d_instantiate_no_diralias(entry, inode); 559 if (err) 560 return err; 561 562 fuse_change_entry_timeout(entry, &outarg); 563 fuse_invalidate_attr(dir); 564 return 0; 565 566 out_put_forget_req: 567 kfree(forget); 568 return err; 569 } 570 571 static int fuse_mknod(struct inode *dir, struct dentry *entry, umode_t mode, 572 dev_t rdev) 573 { 574 struct fuse_mknod_in inarg; 575 struct fuse_conn *fc = get_fuse_conn(dir); 576 FUSE_ARGS(args); 577 578 if (!fc->dont_mask) 579 mode &= ~current_umask(); 580 581 memset(&inarg, 0, sizeof(inarg)); 582 inarg.mode = mode; 583 inarg.rdev = new_encode_dev(rdev); 584 inarg.umask = current_umask(); 585 args.in.h.opcode = FUSE_MKNOD; 586 args.in.numargs = 2; 587 args.in.args[0].size = sizeof(inarg); 588 args.in.args[0].value = &inarg; 589 args.in.args[1].size = entry->d_name.len + 1; 590 args.in.args[1].value = entry->d_name.name; 591 return create_new_entry(fc, &args, dir, entry, mode); 592 } 593 594 static int fuse_create(struct inode *dir, struct dentry *entry, umode_t mode, 595 bool excl) 596 { 597 return fuse_mknod(dir, entry, mode, 0); 598 } 599 600 static int fuse_mkdir(struct inode *dir, struct dentry *entry, umode_t mode) 601 { 602 struct fuse_mkdir_in inarg; 603 struct fuse_conn *fc = get_fuse_conn(dir); 604 FUSE_ARGS(args); 605 606 if (!fc->dont_mask) 607 mode &= ~current_umask(); 608 609 memset(&inarg, 0, sizeof(inarg)); 610 inarg.mode = mode; 611 inarg.umask = current_umask(); 612 args.in.h.opcode = FUSE_MKDIR; 613 args.in.numargs = 2; 614 args.in.args[0].size = sizeof(inarg); 615 args.in.args[0].value = &inarg; 616 args.in.args[1].size = entry->d_name.len + 1; 617 args.in.args[1].value = entry->d_name.name; 618 return create_new_entry(fc, &args, dir, entry, S_IFDIR); 619 } 620 621 static int fuse_symlink(struct inode *dir, struct dentry *entry, 622 const char *link) 623 { 624 struct fuse_conn *fc = get_fuse_conn(dir); 625 unsigned len = strlen(link) + 1; 626 FUSE_ARGS(args); 627 628 args.in.h.opcode = FUSE_SYMLINK; 629 args.in.numargs = 2; 630 args.in.args[0].size = entry->d_name.len + 1; 631 args.in.args[0].value = entry->d_name.name; 632 args.in.args[1].size = len; 633 args.in.args[1].value = link; 634 return create_new_entry(fc, &args, dir, entry, S_IFLNK); 635 } 636 637 static inline void fuse_update_ctime(struct inode *inode) 638 { 639 if (!IS_NOCMTIME(inode)) { 640 inode->i_ctime = current_fs_time(inode->i_sb); 641 mark_inode_dirty_sync(inode); 642 } 643 } 644 645 static int fuse_unlink(struct inode *dir, struct dentry *entry) 646 { 647 int err; 648 struct fuse_conn *fc = get_fuse_conn(dir); 649 FUSE_ARGS(args); 650 651 args.in.h.opcode = FUSE_UNLINK; 652 args.in.h.nodeid = get_node_id(dir); 653 args.in.numargs = 1; 654 args.in.args[0].size = entry->d_name.len + 1; 655 args.in.args[0].value = entry->d_name.name; 656 err = fuse_simple_request(fc, &args); 657 if (!err) { 658 struct inode *inode = d_inode(entry); 659 struct fuse_inode *fi = get_fuse_inode(inode); 660 661 spin_lock(&fc->lock); 662 fi->attr_version = ++fc->attr_version; 663 /* 664 * If i_nlink == 0 then unlink doesn't make sense, yet this can 665 * happen if userspace filesystem is careless. It would be 666 * difficult to enforce correct nlink usage so just ignore this 667 * condition here 668 */ 669 if (inode->i_nlink > 0) 670 drop_nlink(inode); 671 spin_unlock(&fc->lock); 672 fuse_invalidate_attr(inode); 673 fuse_invalidate_attr(dir); 674 fuse_invalidate_entry_cache(entry); 675 fuse_update_ctime(inode); 676 } else if (err == -EINTR) 677 fuse_invalidate_entry(entry); 678 return err; 679 } 680 681 static int fuse_rmdir(struct inode *dir, struct dentry *entry) 682 { 683 int err; 684 struct fuse_conn *fc = get_fuse_conn(dir); 685 FUSE_ARGS(args); 686 687 args.in.h.opcode = FUSE_RMDIR; 688 args.in.h.nodeid = get_node_id(dir); 689 args.in.numargs = 1; 690 args.in.args[0].size = entry->d_name.len + 1; 691 args.in.args[0].value = entry->d_name.name; 692 err = fuse_simple_request(fc, &args); 693 if (!err) { 694 clear_nlink(d_inode(entry)); 695 fuse_invalidate_attr(dir); 696 fuse_invalidate_entry_cache(entry); 697 } else if (err == -EINTR) 698 fuse_invalidate_entry(entry); 699 return err; 700 } 701 702 static int fuse_rename_common(struct inode *olddir, struct dentry *oldent, 703 struct inode *newdir, struct dentry *newent, 704 unsigned int flags, int opcode, size_t argsize) 705 { 706 int err; 707 struct fuse_rename2_in inarg; 708 struct fuse_conn *fc = get_fuse_conn(olddir); 709 FUSE_ARGS(args); 710 711 memset(&inarg, 0, argsize); 712 inarg.newdir = get_node_id(newdir); 713 inarg.flags = flags; 714 args.in.h.opcode = opcode; 715 args.in.h.nodeid = get_node_id(olddir); 716 args.in.numargs = 3; 717 args.in.args[0].size = argsize; 718 args.in.args[0].value = &inarg; 719 args.in.args[1].size = oldent->d_name.len + 1; 720 args.in.args[1].value = oldent->d_name.name; 721 args.in.args[2].size = newent->d_name.len + 1; 722 args.in.args[2].value = newent->d_name.name; 723 err = fuse_simple_request(fc, &args); 724 if (!err) { 725 /* ctime changes */ 726 fuse_invalidate_attr(d_inode(oldent)); 727 fuse_update_ctime(d_inode(oldent)); 728 729 if (flags & RENAME_EXCHANGE) { 730 fuse_invalidate_attr(d_inode(newent)); 731 fuse_update_ctime(d_inode(newent)); 732 } 733 734 fuse_invalidate_attr(olddir); 735 if (olddir != newdir) 736 fuse_invalidate_attr(newdir); 737 738 /* newent will end up negative */ 739 if (!(flags & RENAME_EXCHANGE) && d_really_is_positive(newent)) { 740 fuse_invalidate_attr(d_inode(newent)); 741 fuse_invalidate_entry_cache(newent); 742 fuse_update_ctime(d_inode(newent)); 743 } 744 } else if (err == -EINTR) { 745 /* If request was interrupted, DEITY only knows if the 746 rename actually took place. If the invalidation 747 fails (e.g. some process has CWD under the renamed 748 directory), then there can be inconsistency between 749 the dcache and the real filesystem. Tough luck. */ 750 fuse_invalidate_entry(oldent); 751 if (d_really_is_positive(newent)) 752 fuse_invalidate_entry(newent); 753 } 754 755 return err; 756 } 757 758 static int fuse_rename2(struct inode *olddir, struct dentry *oldent, 759 struct inode *newdir, struct dentry *newent, 760 unsigned int flags) 761 { 762 struct fuse_conn *fc = get_fuse_conn(olddir); 763 int err; 764 765 if (flags & ~(RENAME_NOREPLACE | RENAME_EXCHANGE)) 766 return -EINVAL; 767 768 if (flags) { 769 if (fc->no_rename2 || fc->minor < 23) 770 return -EINVAL; 771 772 err = fuse_rename_common(olddir, oldent, newdir, newent, flags, 773 FUSE_RENAME2, 774 sizeof(struct fuse_rename2_in)); 775 if (err == -ENOSYS) { 776 fc->no_rename2 = 1; 777 err = -EINVAL; 778 } 779 } else { 780 err = fuse_rename_common(olddir, oldent, newdir, newent, 0, 781 FUSE_RENAME, 782 sizeof(struct fuse_rename_in)); 783 } 784 785 return err; 786 } 787 788 static int fuse_link(struct dentry *entry, struct inode *newdir, 789 struct dentry *newent) 790 { 791 int err; 792 struct fuse_link_in inarg; 793 struct inode *inode = d_inode(entry); 794 struct fuse_conn *fc = get_fuse_conn(inode); 795 FUSE_ARGS(args); 796 797 memset(&inarg, 0, sizeof(inarg)); 798 inarg.oldnodeid = get_node_id(inode); 799 args.in.h.opcode = FUSE_LINK; 800 args.in.numargs = 2; 801 args.in.args[0].size = sizeof(inarg); 802 args.in.args[0].value = &inarg; 803 args.in.args[1].size = newent->d_name.len + 1; 804 args.in.args[1].value = newent->d_name.name; 805 err = create_new_entry(fc, &args, newdir, newent, inode->i_mode); 806 /* Contrary to "normal" filesystems it can happen that link 807 makes two "logical" inodes point to the same "physical" 808 inode. We invalidate the attributes of the old one, so it 809 will reflect changes in the backing inode (link count, 810 etc.) 811 */ 812 if (!err) { 813 struct fuse_inode *fi = get_fuse_inode(inode); 814 815 spin_lock(&fc->lock); 816 fi->attr_version = ++fc->attr_version; 817 inc_nlink(inode); 818 spin_unlock(&fc->lock); 819 fuse_invalidate_attr(inode); 820 fuse_update_ctime(inode); 821 } else if (err == -EINTR) { 822 fuse_invalidate_attr(inode); 823 } 824 return err; 825 } 826 827 static void fuse_fillattr(struct inode *inode, struct fuse_attr *attr, 828 struct kstat *stat) 829 { 830 unsigned int blkbits; 831 struct fuse_conn *fc = get_fuse_conn(inode); 832 833 /* see the comment in fuse_change_attributes() */ 834 if (fc->writeback_cache && S_ISREG(inode->i_mode)) { 835 attr->size = i_size_read(inode); 836 attr->mtime = inode->i_mtime.tv_sec; 837 attr->mtimensec = inode->i_mtime.tv_nsec; 838 attr->ctime = inode->i_ctime.tv_sec; 839 attr->ctimensec = inode->i_ctime.tv_nsec; 840 } 841 842 stat->dev = inode->i_sb->s_dev; 843 stat->ino = attr->ino; 844 stat->mode = (inode->i_mode & S_IFMT) | (attr->mode & 07777); 845 stat->nlink = attr->nlink; 846 stat->uid = make_kuid(&init_user_ns, attr->uid); 847 stat->gid = make_kgid(&init_user_ns, attr->gid); 848 stat->rdev = inode->i_rdev; 849 stat->atime.tv_sec = attr->atime; 850 stat->atime.tv_nsec = attr->atimensec; 851 stat->mtime.tv_sec = attr->mtime; 852 stat->mtime.tv_nsec = attr->mtimensec; 853 stat->ctime.tv_sec = attr->ctime; 854 stat->ctime.tv_nsec = attr->ctimensec; 855 stat->size = attr->size; 856 stat->blocks = attr->blocks; 857 858 if (attr->blksize != 0) 859 blkbits = ilog2(attr->blksize); 860 else 861 blkbits = inode->i_sb->s_blocksize_bits; 862 863 stat->blksize = 1 << blkbits; 864 } 865 866 static int fuse_do_getattr(struct inode *inode, struct kstat *stat, 867 struct file *file) 868 { 869 int err; 870 struct fuse_getattr_in inarg; 871 struct fuse_attr_out outarg; 872 struct fuse_conn *fc = get_fuse_conn(inode); 873 FUSE_ARGS(args); 874 u64 attr_version; 875 876 attr_version = fuse_get_attr_version(fc); 877 878 memset(&inarg, 0, sizeof(inarg)); 879 memset(&outarg, 0, sizeof(outarg)); 880 /* Directories have separate file-handle space */ 881 if (file && S_ISREG(inode->i_mode)) { 882 struct fuse_file *ff = file->private_data; 883 884 inarg.getattr_flags |= FUSE_GETATTR_FH; 885 inarg.fh = ff->fh; 886 } 887 args.in.h.opcode = FUSE_GETATTR; 888 args.in.h.nodeid = get_node_id(inode); 889 args.in.numargs = 1; 890 args.in.args[0].size = sizeof(inarg); 891 args.in.args[0].value = &inarg; 892 args.out.numargs = 1; 893 args.out.args[0].size = sizeof(outarg); 894 args.out.args[0].value = &outarg; 895 err = fuse_simple_request(fc, &args); 896 if (!err) { 897 if ((inode->i_mode ^ outarg.attr.mode) & S_IFMT) { 898 make_bad_inode(inode); 899 err = -EIO; 900 } else { 901 fuse_change_attributes(inode, &outarg.attr, 902 attr_timeout(&outarg), 903 attr_version); 904 if (stat) 905 fuse_fillattr(inode, &outarg.attr, stat); 906 } 907 } 908 return err; 909 } 910 911 int fuse_update_attributes(struct inode *inode, struct kstat *stat, 912 struct file *file, bool *refreshed) 913 { 914 struct fuse_inode *fi = get_fuse_inode(inode); 915 int err; 916 bool r; 917 918 if (time_before64(fi->i_time, get_jiffies_64())) { 919 r = true; 920 err = fuse_do_getattr(inode, stat, file); 921 } else { 922 r = false; 923 err = 0; 924 if (stat) { 925 generic_fillattr(inode, stat); 926 stat->mode = fi->orig_i_mode; 927 stat->ino = fi->orig_ino; 928 } 929 } 930 931 if (refreshed != NULL) 932 *refreshed = r; 933 934 return err; 935 } 936 937 int fuse_reverse_inval_entry(struct super_block *sb, u64 parent_nodeid, 938 u64 child_nodeid, struct qstr *name) 939 { 940 int err = -ENOTDIR; 941 struct inode *parent; 942 struct dentry *dir; 943 struct dentry *entry; 944 945 parent = ilookup5(sb, parent_nodeid, fuse_inode_eq, &parent_nodeid); 946 if (!parent) 947 return -ENOENT; 948 949 inode_lock(parent); 950 if (!S_ISDIR(parent->i_mode)) 951 goto unlock; 952 953 err = -ENOENT; 954 dir = d_find_alias(parent); 955 if (!dir) 956 goto unlock; 957 958 name->hash = full_name_hash(dir, name->name, name->len); 959 entry = d_lookup(dir, name); 960 dput(dir); 961 if (!entry) 962 goto unlock; 963 964 fuse_invalidate_attr(parent); 965 fuse_invalidate_entry(entry); 966 967 if (child_nodeid != 0 && d_really_is_positive(entry)) { 968 inode_lock(d_inode(entry)); 969 if (get_node_id(d_inode(entry)) != child_nodeid) { 970 err = -ENOENT; 971 goto badentry; 972 } 973 if (d_mountpoint(entry)) { 974 err = -EBUSY; 975 goto badentry; 976 } 977 if (d_is_dir(entry)) { 978 shrink_dcache_parent(entry); 979 if (!simple_empty(entry)) { 980 err = -ENOTEMPTY; 981 goto badentry; 982 } 983 d_inode(entry)->i_flags |= S_DEAD; 984 } 985 dont_mount(entry); 986 clear_nlink(d_inode(entry)); 987 err = 0; 988 badentry: 989 inode_unlock(d_inode(entry)); 990 if (!err) 991 d_delete(entry); 992 } else { 993 err = 0; 994 } 995 dput(entry); 996 997 unlock: 998 inode_unlock(parent); 999 iput(parent); 1000 return err; 1001 } 1002 1003 /* 1004 * Calling into a user-controlled filesystem gives the filesystem 1005 * daemon ptrace-like capabilities over the current process. This 1006 * means, that the filesystem daemon is able to record the exact 1007 * filesystem operations performed, and can also control the behavior 1008 * of the requester process in otherwise impossible ways. For example 1009 * it can delay the operation for arbitrary length of time allowing 1010 * DoS against the requester. 1011 * 1012 * For this reason only those processes can call into the filesystem, 1013 * for which the owner of the mount has ptrace privilege. This 1014 * excludes processes started by other users, suid or sgid processes. 1015 */ 1016 int fuse_allow_current_process(struct fuse_conn *fc) 1017 { 1018 const struct cred *cred; 1019 1020 if (fc->flags & FUSE_ALLOW_OTHER) 1021 return 1; 1022 1023 cred = current_cred(); 1024 if (uid_eq(cred->euid, fc->user_id) && 1025 uid_eq(cred->suid, fc->user_id) && 1026 uid_eq(cred->uid, fc->user_id) && 1027 gid_eq(cred->egid, fc->group_id) && 1028 gid_eq(cred->sgid, fc->group_id) && 1029 gid_eq(cred->gid, fc->group_id)) 1030 return 1; 1031 1032 return 0; 1033 } 1034 1035 static int fuse_access(struct inode *inode, int mask) 1036 { 1037 struct fuse_conn *fc = get_fuse_conn(inode); 1038 FUSE_ARGS(args); 1039 struct fuse_access_in inarg; 1040 int err; 1041 1042 BUG_ON(mask & MAY_NOT_BLOCK); 1043 1044 if (fc->no_access) 1045 return 0; 1046 1047 memset(&inarg, 0, sizeof(inarg)); 1048 inarg.mask = mask & (MAY_READ | MAY_WRITE | MAY_EXEC); 1049 args.in.h.opcode = FUSE_ACCESS; 1050 args.in.h.nodeid = get_node_id(inode); 1051 args.in.numargs = 1; 1052 args.in.args[0].size = sizeof(inarg); 1053 args.in.args[0].value = &inarg; 1054 err = fuse_simple_request(fc, &args); 1055 if (err == -ENOSYS) { 1056 fc->no_access = 1; 1057 err = 0; 1058 } 1059 return err; 1060 } 1061 1062 static int fuse_perm_getattr(struct inode *inode, int mask) 1063 { 1064 if (mask & MAY_NOT_BLOCK) 1065 return -ECHILD; 1066 1067 return fuse_do_getattr(inode, NULL, NULL); 1068 } 1069 1070 /* 1071 * Check permission. The two basic access models of FUSE are: 1072 * 1073 * 1) Local access checking ('default_permissions' mount option) based 1074 * on file mode. This is the plain old disk filesystem permission 1075 * modell. 1076 * 1077 * 2) "Remote" access checking, where server is responsible for 1078 * checking permission in each inode operation. An exception to this 1079 * is if ->permission() was invoked from sys_access() in which case an 1080 * access request is sent. Execute permission is still checked 1081 * locally based on file mode. 1082 */ 1083 static int fuse_permission(struct inode *inode, int mask) 1084 { 1085 struct fuse_conn *fc = get_fuse_conn(inode); 1086 bool refreshed = false; 1087 int err = 0; 1088 1089 if (!fuse_allow_current_process(fc)) 1090 return -EACCES; 1091 1092 /* 1093 * If attributes are needed, refresh them before proceeding 1094 */ 1095 if ((fc->flags & FUSE_DEFAULT_PERMISSIONS) || 1096 ((mask & MAY_EXEC) && S_ISREG(inode->i_mode))) { 1097 struct fuse_inode *fi = get_fuse_inode(inode); 1098 1099 if (time_before64(fi->i_time, get_jiffies_64())) { 1100 refreshed = true; 1101 1102 err = fuse_perm_getattr(inode, mask); 1103 if (err) 1104 return err; 1105 } 1106 } 1107 1108 if (fc->flags & FUSE_DEFAULT_PERMISSIONS) { 1109 err = generic_permission(inode, mask); 1110 1111 /* If permission is denied, try to refresh file 1112 attributes. This is also needed, because the root 1113 node will at first have no permissions */ 1114 if (err == -EACCES && !refreshed) { 1115 err = fuse_perm_getattr(inode, mask); 1116 if (!err) 1117 err = generic_permission(inode, mask); 1118 } 1119 1120 /* Note: the opposite of the above test does not 1121 exist. So if permissions are revoked this won't be 1122 noticed immediately, only after the attribute 1123 timeout has expired */ 1124 } else if (mask & (MAY_ACCESS | MAY_CHDIR)) { 1125 err = fuse_access(inode, mask); 1126 } else if ((mask & MAY_EXEC) && S_ISREG(inode->i_mode)) { 1127 if (!(inode->i_mode & S_IXUGO)) { 1128 if (refreshed) 1129 return -EACCES; 1130 1131 err = fuse_perm_getattr(inode, mask); 1132 if (!err && !(inode->i_mode & S_IXUGO)) 1133 return -EACCES; 1134 } 1135 } 1136 return err; 1137 } 1138 1139 static int parse_dirfile(char *buf, size_t nbytes, struct file *file, 1140 struct dir_context *ctx) 1141 { 1142 while (nbytes >= FUSE_NAME_OFFSET) { 1143 struct fuse_dirent *dirent = (struct fuse_dirent *) buf; 1144 size_t reclen = FUSE_DIRENT_SIZE(dirent); 1145 if (!dirent->namelen || dirent->namelen > FUSE_NAME_MAX) 1146 return -EIO; 1147 if (reclen > nbytes) 1148 break; 1149 if (memchr(dirent->name, '/', dirent->namelen) != NULL) 1150 return -EIO; 1151 1152 if (!dir_emit(ctx, dirent->name, dirent->namelen, 1153 dirent->ino, dirent->type)) 1154 break; 1155 1156 buf += reclen; 1157 nbytes -= reclen; 1158 ctx->pos = dirent->off; 1159 } 1160 1161 return 0; 1162 } 1163 1164 static int fuse_direntplus_link(struct file *file, 1165 struct fuse_direntplus *direntplus, 1166 u64 attr_version) 1167 { 1168 struct fuse_entry_out *o = &direntplus->entry_out; 1169 struct fuse_dirent *dirent = &direntplus->dirent; 1170 struct dentry *parent = file->f_path.dentry; 1171 struct qstr name = QSTR_INIT(dirent->name, dirent->namelen); 1172 struct dentry *dentry; 1173 struct dentry *alias; 1174 struct inode *dir = d_inode(parent); 1175 struct fuse_conn *fc; 1176 struct inode *inode; 1177 DECLARE_WAIT_QUEUE_HEAD_ONSTACK(wq); 1178 1179 if (!o->nodeid) { 1180 /* 1181 * Unlike in the case of fuse_lookup, zero nodeid does not mean 1182 * ENOENT. Instead, it only means the userspace filesystem did 1183 * not want to return attributes/handle for this entry. 1184 * 1185 * So do nothing. 1186 */ 1187 return 0; 1188 } 1189 1190 if (name.name[0] == '.') { 1191 /* 1192 * We could potentially refresh the attributes of the directory 1193 * and its parent? 1194 */ 1195 if (name.len == 1) 1196 return 0; 1197 if (name.name[1] == '.' && name.len == 2) 1198 return 0; 1199 } 1200 1201 if (invalid_nodeid(o->nodeid)) 1202 return -EIO; 1203 if (!fuse_valid_type(o->attr.mode)) 1204 return -EIO; 1205 1206 fc = get_fuse_conn(dir); 1207 1208 name.hash = full_name_hash(parent, name.name, name.len); 1209 dentry = d_lookup(parent, &name); 1210 if (!dentry) { 1211 retry: 1212 dentry = d_alloc_parallel(parent, &name, &wq); 1213 if (IS_ERR(dentry)) 1214 return PTR_ERR(dentry); 1215 } 1216 if (!d_in_lookup(dentry)) { 1217 struct fuse_inode *fi; 1218 inode = d_inode(dentry); 1219 if (!inode || 1220 get_node_id(inode) != o->nodeid || 1221 ((o->attr.mode ^ inode->i_mode) & S_IFMT)) { 1222 d_invalidate(dentry); 1223 dput(dentry); 1224 goto retry; 1225 } 1226 if (is_bad_inode(inode)) { 1227 dput(dentry); 1228 return -EIO; 1229 } 1230 1231 fi = get_fuse_inode(inode); 1232 spin_lock(&fc->lock); 1233 fi->nlookup++; 1234 spin_unlock(&fc->lock); 1235 1236 fuse_change_attributes(inode, &o->attr, 1237 entry_attr_timeout(o), 1238 attr_version); 1239 /* 1240 * The other branch comes via fuse_iget() 1241 * which bumps nlookup inside 1242 */ 1243 } else { 1244 inode = fuse_iget(dir->i_sb, o->nodeid, o->generation, 1245 &o->attr, entry_attr_timeout(o), 1246 attr_version); 1247 if (!inode) 1248 inode = ERR_PTR(-ENOMEM); 1249 1250 alias = d_splice_alias(inode, dentry); 1251 d_lookup_done(dentry); 1252 if (alias) { 1253 dput(dentry); 1254 dentry = alias; 1255 } 1256 if (IS_ERR(dentry)) 1257 return PTR_ERR(dentry); 1258 } 1259 if (fc->readdirplus_auto) 1260 set_bit(FUSE_I_INIT_RDPLUS, &get_fuse_inode(inode)->state); 1261 fuse_change_entry_timeout(dentry, o); 1262 1263 dput(dentry); 1264 return 0; 1265 } 1266 1267 static int parse_dirplusfile(char *buf, size_t nbytes, struct file *file, 1268 struct dir_context *ctx, u64 attr_version) 1269 { 1270 struct fuse_direntplus *direntplus; 1271 struct fuse_dirent *dirent; 1272 size_t reclen; 1273 int over = 0; 1274 int ret; 1275 1276 while (nbytes >= FUSE_NAME_OFFSET_DIRENTPLUS) { 1277 direntplus = (struct fuse_direntplus *) buf; 1278 dirent = &direntplus->dirent; 1279 reclen = FUSE_DIRENTPLUS_SIZE(direntplus); 1280 1281 if (!dirent->namelen || dirent->namelen > FUSE_NAME_MAX) 1282 return -EIO; 1283 if (reclen > nbytes) 1284 break; 1285 if (memchr(dirent->name, '/', dirent->namelen) != NULL) 1286 return -EIO; 1287 1288 if (!over) { 1289 /* We fill entries into dstbuf only as much as 1290 it can hold. But we still continue iterating 1291 over remaining entries to link them. If not, 1292 we need to send a FORGET for each of those 1293 which we did not link. 1294 */ 1295 over = !dir_emit(ctx, dirent->name, dirent->namelen, 1296 dirent->ino, dirent->type); 1297 ctx->pos = dirent->off; 1298 } 1299 1300 buf += reclen; 1301 nbytes -= reclen; 1302 1303 ret = fuse_direntplus_link(file, direntplus, attr_version); 1304 if (ret) 1305 fuse_force_forget(file, direntplus->entry_out.nodeid); 1306 } 1307 1308 return 0; 1309 } 1310 1311 static int fuse_readdir(struct file *file, struct dir_context *ctx) 1312 { 1313 int plus, err; 1314 size_t nbytes; 1315 struct page *page; 1316 struct inode *inode = file_inode(file); 1317 struct fuse_conn *fc = get_fuse_conn(inode); 1318 struct fuse_req *req; 1319 u64 attr_version = 0; 1320 1321 if (is_bad_inode(inode)) 1322 return -EIO; 1323 1324 req = fuse_get_req(fc, 1); 1325 if (IS_ERR(req)) 1326 return PTR_ERR(req); 1327 1328 page = alloc_page(GFP_KERNEL); 1329 if (!page) { 1330 fuse_put_request(fc, req); 1331 return -ENOMEM; 1332 } 1333 1334 plus = fuse_use_readdirplus(inode, ctx); 1335 req->out.argpages = 1; 1336 req->num_pages = 1; 1337 req->pages[0] = page; 1338 req->page_descs[0].length = PAGE_SIZE; 1339 if (plus) { 1340 attr_version = fuse_get_attr_version(fc); 1341 fuse_read_fill(req, file, ctx->pos, PAGE_SIZE, 1342 FUSE_READDIRPLUS); 1343 } else { 1344 fuse_read_fill(req, file, ctx->pos, PAGE_SIZE, 1345 FUSE_READDIR); 1346 } 1347 fuse_lock_inode(inode); 1348 fuse_request_send(fc, req); 1349 fuse_unlock_inode(inode); 1350 nbytes = req->out.args[0].size; 1351 err = req->out.h.error; 1352 fuse_put_request(fc, req); 1353 if (!err) { 1354 if (plus) { 1355 err = parse_dirplusfile(page_address(page), nbytes, 1356 file, ctx, 1357 attr_version); 1358 } else { 1359 err = parse_dirfile(page_address(page), nbytes, file, 1360 ctx); 1361 } 1362 } 1363 1364 __free_page(page); 1365 fuse_invalidate_atime(inode); 1366 return err; 1367 } 1368 1369 static const char *fuse_get_link(struct dentry *dentry, 1370 struct inode *inode, 1371 struct delayed_call *done) 1372 { 1373 struct fuse_conn *fc = get_fuse_conn(inode); 1374 FUSE_ARGS(args); 1375 char *link; 1376 ssize_t ret; 1377 1378 if (!dentry) 1379 return ERR_PTR(-ECHILD); 1380 1381 link = kmalloc(PAGE_SIZE, GFP_KERNEL); 1382 if (!link) 1383 return ERR_PTR(-ENOMEM); 1384 1385 args.in.h.opcode = FUSE_READLINK; 1386 args.in.h.nodeid = get_node_id(inode); 1387 args.out.argvar = 1; 1388 args.out.numargs = 1; 1389 args.out.args[0].size = PAGE_SIZE - 1; 1390 args.out.args[0].value = link; 1391 ret = fuse_simple_request(fc, &args); 1392 if (ret < 0) { 1393 kfree(link); 1394 link = ERR_PTR(ret); 1395 } else { 1396 link[ret] = '\0'; 1397 set_delayed_call(done, kfree_link, link); 1398 } 1399 fuse_invalidate_atime(inode); 1400 return link; 1401 } 1402 1403 static int fuse_dir_open(struct inode *inode, struct file *file) 1404 { 1405 return fuse_open_common(inode, file, true); 1406 } 1407 1408 static int fuse_dir_release(struct inode *inode, struct file *file) 1409 { 1410 fuse_release_common(file, FUSE_RELEASEDIR); 1411 1412 return 0; 1413 } 1414 1415 static int fuse_dir_fsync(struct file *file, loff_t start, loff_t end, 1416 int datasync) 1417 { 1418 return fuse_fsync_common(file, start, end, datasync, 1); 1419 } 1420 1421 static long fuse_dir_ioctl(struct file *file, unsigned int cmd, 1422 unsigned long arg) 1423 { 1424 struct fuse_conn *fc = get_fuse_conn(file->f_mapping->host); 1425 1426 /* FUSE_IOCTL_DIR only supported for API version >= 7.18 */ 1427 if (fc->minor < 18) 1428 return -ENOTTY; 1429 1430 return fuse_ioctl_common(file, cmd, arg, FUSE_IOCTL_DIR); 1431 } 1432 1433 static long fuse_dir_compat_ioctl(struct file *file, unsigned int cmd, 1434 unsigned long arg) 1435 { 1436 struct fuse_conn *fc = get_fuse_conn(file->f_mapping->host); 1437 1438 if (fc->minor < 18) 1439 return -ENOTTY; 1440 1441 return fuse_ioctl_common(file, cmd, arg, 1442 FUSE_IOCTL_COMPAT | FUSE_IOCTL_DIR); 1443 } 1444 1445 static bool update_mtime(unsigned ivalid, bool trust_local_mtime) 1446 { 1447 /* Always update if mtime is explicitly set */ 1448 if (ivalid & ATTR_MTIME_SET) 1449 return true; 1450 1451 /* Or if kernel i_mtime is the official one */ 1452 if (trust_local_mtime) 1453 return true; 1454 1455 /* If it's an open(O_TRUNC) or an ftruncate(), don't update */ 1456 if ((ivalid & ATTR_SIZE) && (ivalid & (ATTR_OPEN | ATTR_FILE))) 1457 return false; 1458 1459 /* In all other cases update */ 1460 return true; 1461 } 1462 1463 static void iattr_to_fattr(struct iattr *iattr, struct fuse_setattr_in *arg, 1464 bool trust_local_cmtime) 1465 { 1466 unsigned ivalid = iattr->ia_valid; 1467 1468 if (ivalid & ATTR_MODE) 1469 arg->valid |= FATTR_MODE, arg->mode = iattr->ia_mode; 1470 if (ivalid & ATTR_UID) 1471 arg->valid |= FATTR_UID, arg->uid = from_kuid(&init_user_ns, iattr->ia_uid); 1472 if (ivalid & ATTR_GID) 1473 arg->valid |= FATTR_GID, arg->gid = from_kgid(&init_user_ns, iattr->ia_gid); 1474 if (ivalid & ATTR_SIZE) 1475 arg->valid |= FATTR_SIZE, arg->size = iattr->ia_size; 1476 if (ivalid & ATTR_ATIME) { 1477 arg->valid |= FATTR_ATIME; 1478 arg->atime = iattr->ia_atime.tv_sec; 1479 arg->atimensec = iattr->ia_atime.tv_nsec; 1480 if (!(ivalid & ATTR_ATIME_SET)) 1481 arg->valid |= FATTR_ATIME_NOW; 1482 } 1483 if ((ivalid & ATTR_MTIME) && update_mtime(ivalid, trust_local_cmtime)) { 1484 arg->valid |= FATTR_MTIME; 1485 arg->mtime = iattr->ia_mtime.tv_sec; 1486 arg->mtimensec = iattr->ia_mtime.tv_nsec; 1487 if (!(ivalid & ATTR_MTIME_SET) && !trust_local_cmtime) 1488 arg->valid |= FATTR_MTIME_NOW; 1489 } 1490 if ((ivalid & ATTR_CTIME) && trust_local_cmtime) { 1491 arg->valid |= FATTR_CTIME; 1492 arg->ctime = iattr->ia_ctime.tv_sec; 1493 arg->ctimensec = iattr->ia_ctime.tv_nsec; 1494 } 1495 } 1496 1497 /* 1498 * Prevent concurrent writepages on inode 1499 * 1500 * This is done by adding a negative bias to the inode write counter 1501 * and waiting for all pending writes to finish. 1502 */ 1503 void fuse_set_nowrite(struct inode *inode) 1504 { 1505 struct fuse_conn *fc = get_fuse_conn(inode); 1506 struct fuse_inode *fi = get_fuse_inode(inode); 1507 1508 BUG_ON(!inode_is_locked(inode)); 1509 1510 spin_lock(&fc->lock); 1511 BUG_ON(fi->writectr < 0); 1512 fi->writectr += FUSE_NOWRITE; 1513 spin_unlock(&fc->lock); 1514 wait_event(fi->page_waitq, fi->writectr == FUSE_NOWRITE); 1515 } 1516 1517 /* 1518 * Allow writepages on inode 1519 * 1520 * Remove the bias from the writecounter and send any queued 1521 * writepages. 1522 */ 1523 static void __fuse_release_nowrite(struct inode *inode) 1524 { 1525 struct fuse_inode *fi = get_fuse_inode(inode); 1526 1527 BUG_ON(fi->writectr != FUSE_NOWRITE); 1528 fi->writectr = 0; 1529 fuse_flush_writepages(inode); 1530 } 1531 1532 void fuse_release_nowrite(struct inode *inode) 1533 { 1534 struct fuse_conn *fc = get_fuse_conn(inode); 1535 1536 spin_lock(&fc->lock); 1537 __fuse_release_nowrite(inode); 1538 spin_unlock(&fc->lock); 1539 } 1540 1541 static void fuse_setattr_fill(struct fuse_conn *fc, struct fuse_args *args, 1542 struct inode *inode, 1543 struct fuse_setattr_in *inarg_p, 1544 struct fuse_attr_out *outarg_p) 1545 { 1546 args->in.h.opcode = FUSE_SETATTR; 1547 args->in.h.nodeid = get_node_id(inode); 1548 args->in.numargs = 1; 1549 args->in.args[0].size = sizeof(*inarg_p); 1550 args->in.args[0].value = inarg_p; 1551 args->out.numargs = 1; 1552 args->out.args[0].size = sizeof(*outarg_p); 1553 args->out.args[0].value = outarg_p; 1554 } 1555 1556 /* 1557 * Flush inode->i_mtime to the server 1558 */ 1559 int fuse_flush_times(struct inode *inode, struct fuse_file *ff) 1560 { 1561 struct fuse_conn *fc = get_fuse_conn(inode); 1562 FUSE_ARGS(args); 1563 struct fuse_setattr_in inarg; 1564 struct fuse_attr_out outarg; 1565 1566 memset(&inarg, 0, sizeof(inarg)); 1567 memset(&outarg, 0, sizeof(outarg)); 1568 1569 inarg.valid = FATTR_MTIME; 1570 inarg.mtime = inode->i_mtime.tv_sec; 1571 inarg.mtimensec = inode->i_mtime.tv_nsec; 1572 if (fc->minor >= 23) { 1573 inarg.valid |= FATTR_CTIME; 1574 inarg.ctime = inode->i_ctime.tv_sec; 1575 inarg.ctimensec = inode->i_ctime.tv_nsec; 1576 } 1577 if (ff) { 1578 inarg.valid |= FATTR_FH; 1579 inarg.fh = ff->fh; 1580 } 1581 fuse_setattr_fill(fc, &args, inode, &inarg, &outarg); 1582 1583 return fuse_simple_request(fc, &args); 1584 } 1585 1586 /* 1587 * Set attributes, and at the same time refresh them. 1588 * 1589 * Truncation is slightly complicated, because the 'truncate' request 1590 * may fail, in which case we don't want to touch the mapping. 1591 * vmtruncate() doesn't allow for this case, so do the rlimit checking 1592 * and the actual truncation by hand. 1593 */ 1594 int fuse_do_setattr(struct inode *inode, struct iattr *attr, 1595 struct file *file) 1596 { 1597 struct fuse_conn *fc = get_fuse_conn(inode); 1598 struct fuse_inode *fi = get_fuse_inode(inode); 1599 FUSE_ARGS(args); 1600 struct fuse_setattr_in inarg; 1601 struct fuse_attr_out outarg; 1602 bool is_truncate = false; 1603 bool is_wb = fc->writeback_cache; 1604 loff_t oldsize; 1605 int err; 1606 bool trust_local_cmtime = is_wb && S_ISREG(inode->i_mode); 1607 1608 if (!(fc->flags & FUSE_DEFAULT_PERMISSIONS)) 1609 attr->ia_valid |= ATTR_FORCE; 1610 1611 err = inode_change_ok(inode, attr); 1612 if (err) 1613 return err; 1614 1615 if (attr->ia_valid & ATTR_OPEN) { 1616 if (fc->atomic_o_trunc) 1617 return 0; 1618 file = NULL; 1619 } 1620 1621 if (attr->ia_valid & ATTR_SIZE) 1622 is_truncate = true; 1623 1624 if (is_truncate) { 1625 fuse_set_nowrite(inode); 1626 set_bit(FUSE_I_SIZE_UNSTABLE, &fi->state); 1627 if (trust_local_cmtime && attr->ia_size != inode->i_size) 1628 attr->ia_valid |= ATTR_MTIME | ATTR_CTIME; 1629 } 1630 1631 memset(&inarg, 0, sizeof(inarg)); 1632 memset(&outarg, 0, sizeof(outarg)); 1633 iattr_to_fattr(attr, &inarg, trust_local_cmtime); 1634 if (file) { 1635 struct fuse_file *ff = file->private_data; 1636 inarg.valid |= FATTR_FH; 1637 inarg.fh = ff->fh; 1638 } 1639 if (attr->ia_valid & ATTR_SIZE) { 1640 /* For mandatory locking in truncate */ 1641 inarg.valid |= FATTR_LOCKOWNER; 1642 inarg.lock_owner = fuse_lock_owner_id(fc, current->files); 1643 } 1644 fuse_setattr_fill(fc, &args, inode, &inarg, &outarg); 1645 err = fuse_simple_request(fc, &args); 1646 if (err) { 1647 if (err == -EINTR) 1648 fuse_invalidate_attr(inode); 1649 goto error; 1650 } 1651 1652 if ((inode->i_mode ^ outarg.attr.mode) & S_IFMT) { 1653 make_bad_inode(inode); 1654 err = -EIO; 1655 goto error; 1656 } 1657 1658 spin_lock(&fc->lock); 1659 /* the kernel maintains i_mtime locally */ 1660 if (trust_local_cmtime) { 1661 if (attr->ia_valid & ATTR_MTIME) 1662 inode->i_mtime = attr->ia_mtime; 1663 if (attr->ia_valid & ATTR_CTIME) 1664 inode->i_ctime = attr->ia_ctime; 1665 /* FIXME: clear I_DIRTY_SYNC? */ 1666 } 1667 1668 fuse_change_attributes_common(inode, &outarg.attr, 1669 attr_timeout(&outarg)); 1670 oldsize = inode->i_size; 1671 /* see the comment in fuse_change_attributes() */ 1672 if (!is_wb || is_truncate || !S_ISREG(inode->i_mode)) 1673 i_size_write(inode, outarg.attr.size); 1674 1675 if (is_truncate) { 1676 /* NOTE: this may release/reacquire fc->lock */ 1677 __fuse_release_nowrite(inode); 1678 } 1679 spin_unlock(&fc->lock); 1680 1681 /* 1682 * Only call invalidate_inode_pages2() after removing 1683 * FUSE_NOWRITE, otherwise fuse_launder_page() would deadlock. 1684 */ 1685 if ((is_truncate || !is_wb) && 1686 S_ISREG(inode->i_mode) && oldsize != outarg.attr.size) { 1687 truncate_pagecache(inode, outarg.attr.size); 1688 invalidate_inode_pages2(inode->i_mapping); 1689 } 1690 1691 clear_bit(FUSE_I_SIZE_UNSTABLE, &fi->state); 1692 return 0; 1693 1694 error: 1695 if (is_truncate) 1696 fuse_release_nowrite(inode); 1697 1698 clear_bit(FUSE_I_SIZE_UNSTABLE, &fi->state); 1699 return err; 1700 } 1701 1702 static int fuse_setattr(struct dentry *entry, struct iattr *attr) 1703 { 1704 struct inode *inode = d_inode(entry); 1705 1706 if (!fuse_allow_current_process(get_fuse_conn(inode))) 1707 return -EACCES; 1708 1709 if (attr->ia_valid & ATTR_FILE) 1710 return fuse_do_setattr(inode, attr, attr->ia_file); 1711 else 1712 return fuse_do_setattr(inode, attr, NULL); 1713 } 1714 1715 static int fuse_getattr(struct vfsmount *mnt, struct dentry *entry, 1716 struct kstat *stat) 1717 { 1718 struct inode *inode = d_inode(entry); 1719 struct fuse_conn *fc = get_fuse_conn(inode); 1720 1721 if (!fuse_allow_current_process(fc)) 1722 return -EACCES; 1723 1724 return fuse_update_attributes(inode, stat, NULL, NULL); 1725 } 1726 1727 static int fuse_setxattr(struct dentry *unused, struct inode *inode, 1728 const char *name, const void *value, 1729 size_t size, int flags) 1730 { 1731 struct fuse_conn *fc = get_fuse_conn(inode); 1732 FUSE_ARGS(args); 1733 struct fuse_setxattr_in inarg; 1734 int err; 1735 1736 if (fc->no_setxattr) 1737 return -EOPNOTSUPP; 1738 1739 memset(&inarg, 0, sizeof(inarg)); 1740 inarg.size = size; 1741 inarg.flags = flags; 1742 args.in.h.opcode = FUSE_SETXATTR; 1743 args.in.h.nodeid = get_node_id(inode); 1744 args.in.numargs = 3; 1745 args.in.args[0].size = sizeof(inarg); 1746 args.in.args[0].value = &inarg; 1747 args.in.args[1].size = strlen(name) + 1; 1748 args.in.args[1].value = name; 1749 args.in.args[2].size = size; 1750 args.in.args[2].value = value; 1751 err = fuse_simple_request(fc, &args); 1752 if (err == -ENOSYS) { 1753 fc->no_setxattr = 1; 1754 err = -EOPNOTSUPP; 1755 } 1756 if (!err) { 1757 fuse_invalidate_attr(inode); 1758 fuse_update_ctime(inode); 1759 } 1760 return err; 1761 } 1762 1763 static ssize_t fuse_getxattr(struct dentry *entry, struct inode *inode, 1764 const char *name, void *value, size_t size) 1765 { 1766 struct fuse_conn *fc = get_fuse_conn(inode); 1767 FUSE_ARGS(args); 1768 struct fuse_getxattr_in inarg; 1769 struct fuse_getxattr_out outarg; 1770 ssize_t ret; 1771 1772 if (fc->no_getxattr) 1773 return -EOPNOTSUPP; 1774 1775 memset(&inarg, 0, sizeof(inarg)); 1776 inarg.size = size; 1777 args.in.h.opcode = FUSE_GETXATTR; 1778 args.in.h.nodeid = get_node_id(inode); 1779 args.in.numargs = 2; 1780 args.in.args[0].size = sizeof(inarg); 1781 args.in.args[0].value = &inarg; 1782 args.in.args[1].size = strlen(name) + 1; 1783 args.in.args[1].value = name; 1784 /* This is really two different operations rolled into one */ 1785 args.out.numargs = 1; 1786 if (size) { 1787 args.out.argvar = 1; 1788 args.out.args[0].size = size; 1789 args.out.args[0].value = value; 1790 } else { 1791 args.out.args[0].size = sizeof(outarg); 1792 args.out.args[0].value = &outarg; 1793 } 1794 ret = fuse_simple_request(fc, &args); 1795 if (!ret && !size) 1796 ret = outarg.size; 1797 if (ret == -ENOSYS) { 1798 fc->no_getxattr = 1; 1799 ret = -EOPNOTSUPP; 1800 } 1801 return ret; 1802 } 1803 1804 static ssize_t fuse_listxattr(struct dentry *entry, char *list, size_t size) 1805 { 1806 struct inode *inode = d_inode(entry); 1807 struct fuse_conn *fc = get_fuse_conn(inode); 1808 FUSE_ARGS(args); 1809 struct fuse_getxattr_in inarg; 1810 struct fuse_getxattr_out outarg; 1811 ssize_t ret; 1812 1813 if (!fuse_allow_current_process(fc)) 1814 return -EACCES; 1815 1816 if (fc->no_listxattr) 1817 return -EOPNOTSUPP; 1818 1819 memset(&inarg, 0, sizeof(inarg)); 1820 inarg.size = size; 1821 args.in.h.opcode = FUSE_LISTXATTR; 1822 args.in.h.nodeid = get_node_id(inode); 1823 args.in.numargs = 1; 1824 args.in.args[0].size = sizeof(inarg); 1825 args.in.args[0].value = &inarg; 1826 /* This is really two different operations rolled into one */ 1827 args.out.numargs = 1; 1828 if (size) { 1829 args.out.argvar = 1; 1830 args.out.args[0].size = size; 1831 args.out.args[0].value = list; 1832 } else { 1833 args.out.args[0].size = sizeof(outarg); 1834 args.out.args[0].value = &outarg; 1835 } 1836 ret = fuse_simple_request(fc, &args); 1837 if (!ret && !size) 1838 ret = outarg.size; 1839 if (ret == -ENOSYS) { 1840 fc->no_listxattr = 1; 1841 ret = -EOPNOTSUPP; 1842 } 1843 return ret; 1844 } 1845 1846 static int fuse_removexattr(struct dentry *entry, const char *name) 1847 { 1848 struct inode *inode = d_inode(entry); 1849 struct fuse_conn *fc = get_fuse_conn(inode); 1850 FUSE_ARGS(args); 1851 int err; 1852 1853 if (fc->no_removexattr) 1854 return -EOPNOTSUPP; 1855 1856 args.in.h.opcode = FUSE_REMOVEXATTR; 1857 args.in.h.nodeid = get_node_id(inode); 1858 args.in.numargs = 1; 1859 args.in.args[0].size = strlen(name) + 1; 1860 args.in.args[0].value = name; 1861 err = fuse_simple_request(fc, &args); 1862 if (err == -ENOSYS) { 1863 fc->no_removexattr = 1; 1864 err = -EOPNOTSUPP; 1865 } 1866 if (!err) { 1867 fuse_invalidate_attr(inode); 1868 fuse_update_ctime(inode); 1869 } 1870 return err; 1871 } 1872 1873 static const struct inode_operations fuse_dir_inode_operations = { 1874 .lookup = fuse_lookup, 1875 .mkdir = fuse_mkdir, 1876 .symlink = fuse_symlink, 1877 .unlink = fuse_unlink, 1878 .rmdir = fuse_rmdir, 1879 .rename2 = fuse_rename2, 1880 .link = fuse_link, 1881 .setattr = fuse_setattr, 1882 .create = fuse_create, 1883 .atomic_open = fuse_atomic_open, 1884 .mknod = fuse_mknod, 1885 .permission = fuse_permission, 1886 .getattr = fuse_getattr, 1887 .setxattr = fuse_setxattr, 1888 .getxattr = fuse_getxattr, 1889 .listxattr = fuse_listxattr, 1890 .removexattr = fuse_removexattr, 1891 }; 1892 1893 static const struct file_operations fuse_dir_operations = { 1894 .llseek = generic_file_llseek, 1895 .read = generic_read_dir, 1896 .iterate_shared = fuse_readdir, 1897 .open = fuse_dir_open, 1898 .release = fuse_dir_release, 1899 .fsync = fuse_dir_fsync, 1900 .unlocked_ioctl = fuse_dir_ioctl, 1901 .compat_ioctl = fuse_dir_compat_ioctl, 1902 }; 1903 1904 static const struct inode_operations fuse_common_inode_operations = { 1905 .setattr = fuse_setattr, 1906 .permission = fuse_permission, 1907 .getattr = fuse_getattr, 1908 .setxattr = fuse_setxattr, 1909 .getxattr = fuse_getxattr, 1910 .listxattr = fuse_listxattr, 1911 .removexattr = fuse_removexattr, 1912 }; 1913 1914 static const struct inode_operations fuse_symlink_inode_operations = { 1915 .setattr = fuse_setattr, 1916 .get_link = fuse_get_link, 1917 .readlink = generic_readlink, 1918 .getattr = fuse_getattr, 1919 .setxattr = fuse_setxattr, 1920 .getxattr = fuse_getxattr, 1921 .listxattr = fuse_listxattr, 1922 .removexattr = fuse_removexattr, 1923 }; 1924 1925 void fuse_init_common(struct inode *inode) 1926 { 1927 inode->i_op = &fuse_common_inode_operations; 1928 } 1929 1930 void fuse_init_dir(struct inode *inode) 1931 { 1932 inode->i_op = &fuse_dir_inode_operations; 1933 inode->i_fop = &fuse_dir_operations; 1934 } 1935 1936 void fuse_init_symlink(struct inode *inode) 1937 { 1938 inode->i_op = &fuse_symlink_inode_operations; 1939 } 1940