/*-
 * SPDX-License-Identifier: BSD-3-Clause
 *
 * Copyright (c) 1989, 1993
 *	The Regents of the University of California.  All rights reserved.
 *
 * This code is derived from software contributed
 * to Berkeley by John Heidemann of the UCLA Ficus project.
 *
 * Source: * @(#)i405_init.c 2.10 92/04/27 UCLA Ficus project
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. Neither the name of the University nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */

#include <sys/cdefs.h>
__FBSDID("$FreeBSD$");

#include <sys/param.h>
#include <sys/systm.h>
#include <sys/bio.h>
#include <sys/buf.h>
#include <sys/conf.h>
#include <sys/event.h>
#include <sys/kernel.h>
#include <sys/limits.h>
#include <sys/lock.h>
#include <sys/lockf.h>
#include <sys/malloc.h>
#include <sys/mount.h>
#include <sys/namei.h>
#include <sys/rwlock.h>
#include <sys/fcntl.h>
#include <sys/unistd.h>
#include <sys/vnode.h>
#include <sys/dirent.h>
#include <sys/poll.h>

#include <security/mac/mac_framework.h>

#include <vm/vm.h>
#include <vm/vm_object.h>
#include <vm/vm_extern.h>
#include <vm/pmap.h>
#include <vm/vm_map.h>
#include <vm/vm_page.h>
#include <vm/vm_pager.h>
#include <vm/vnode_pager.h>

static int	vop_nolookup(struct vop_lookup_args *);
static int	vop_norename(struct vop_rename_args *);
static int	vop_nostrategy(struct vop_strategy_args *);
static int	get_next_dirent(struct vnode *vp, struct dirent **dpp,
				char *dirbuf, int dirbuflen, off_t *off,
				char **cpos, int *len, int *eofflag,
				struct thread *td);
static int	dirent_exists(struct vnode *vp, const char *dirname,
			      struct thread *td);

#define DIRENT_MINSIZE (sizeof(struct dirent) - (MAXNAMLEN+1) + 4)

static int vop_stdis_text(struct vop_is_text_args *ap);
static int vop_stdunset_text(struct vop_unset_text_args *ap);
static int vop_stdadd_writecount(struct vop_add_writecount_args *ap);
static int vop_stdfdatasync(struct vop_fdatasync_args *ap);
static int vop_stdgetpages_async(struct vop_getpages_async_args *ap);

/*
 * This vnode table stores what we want to do if the filesystem doesn't
 * implement a particular VOP.
 *
 * If there is no specific entry here, we will return EOPNOTSUPP.
 *
 * Note that every filesystem has to implement either vop_access
 * or vop_accessx; failing to do so will result in an immediate crash
 * due to stack overflow, as vop_stdaccess() calls vop_stdaccessx(),
 * which calls vop_stdaccess() etc.
 */

struct vop_vector default_vnodeops = {
	.vop_default =		NULL,
	.vop_bypass =		VOP_EOPNOTSUPP,

	.vop_access =		vop_stdaccess,
	.vop_accessx =		vop_stdaccessx,
	.vop_advise =		vop_stdadvise,
	.vop_advlock =		vop_stdadvlock,
	.vop_advlockasync =	vop_stdadvlockasync,
	.vop_advlockpurge =	vop_stdadvlockpurge,
	.vop_allocate =		vop_stdallocate,
	.vop_bmap =		vop_stdbmap,
	.vop_close =		VOP_NULL,
	.vop_fsync =		VOP_NULL,
	.vop_fdatasync =	vop_stdfdatasync,
	.vop_getpages =		vop_stdgetpages,
	.vop_getpages_async =	vop_stdgetpages_async,
	.vop_getwritemount =	vop_stdgetwritemount,
	.vop_inactive =		VOP_NULL,
	.vop_ioctl =		VOP_ENOTTY,
	.vop_kqfilter =		vop_stdkqfilter,
	.vop_islocked =		vop_stdislocked,
	.vop_lock1 =		vop_stdlock,
	.vop_lookup =		vop_nolookup,
	.vop_open =		VOP_NULL,
	.vop_pathconf =		VOP_EINVAL,
	.vop_poll =		vop_nopoll,
	.vop_putpages =		vop_stdputpages,
	.vop_readlink =		VOP_EINVAL,
	.vop_rename =		vop_norename,
	.vop_revoke =		VOP_PANIC,
	.vop_strategy =		vop_nostrategy,
	.vop_unlock =		vop_stdunlock,
	.vop_vptocnp =		vop_stdvptocnp,
	.vop_vptofh =		vop_stdvptofh,
	.vop_unp_bind =		vop_stdunp_bind,
	.vop_unp_connect =	vop_stdunp_connect,
	.vop_unp_detach =	vop_stdunp_detach,
	.vop_is_text =		vop_stdis_text,
	.vop_set_text =		vop_stdset_text,
	.vop_unset_text =	vop_stdunset_text,
	.vop_add_writecount =	vop_stdadd_writecount,
};
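/*
 * Illustrative sketch (not part of this file) of how a filesystem plugs
 * into the defaults above: any VOP it leaves unset is resolved through
 * .vop_default into default_vnodeops.  The "examplefs" names below are
 * hypothetical.
 */
#if 0
static struct vop_vector examplefs_vnodeops = {
	.vop_default =	&default_vnodeops,	/* fall back for unset VOPs */
	.vop_lookup =	examplefs_lookup,	/* hypothetical */
	.vop_getattr =	examplefs_getattr,	/* hypothetical */
};
#endif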
/*
 * Series of placeholder functions for various error returns for
 * VOPs.
 */

int
vop_eopnotsupp(struct vop_generic_args *ap)
{
	/*
	printf("vop_notsupp[%s]\n", ap->a_desc->vdesc_name);
	*/

	return (EOPNOTSUPP);
}

int
vop_ebadf(struct vop_generic_args *ap)
{

	return (EBADF);
}

int
vop_enotty(struct vop_generic_args *ap)
{

	return (ENOTTY);
}

int
vop_einval(struct vop_generic_args *ap)
{

	return (EINVAL);
}

int
vop_enoent(struct vop_generic_args *ap)
{

	return (ENOENT);
}

int
vop_null(struct vop_generic_args *ap)
{

	return (0);
}

/*
 * Helper function to panic on some bad VOPs in some filesystems.
 */
int
vop_panic(struct vop_generic_args *ap)
{

	panic("filesystem goof: vop_panic[%s]", ap->a_desc->vdesc_name);
}
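/*
 * The VOP_EOPNOTSUPP, VOP_NULL, VOP_PANIC, etc. entries used in
 * default_vnodeops above are, as declared in sys/vnode.h, the
 * placeholder functions here cast to the appropriate vop type, along
 * the lines of:
 *
 *	#define VOP_NULL	((void *)(uintptr_t)vop_null)
 */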
/*
 * vop_std<something> and vop_no<something> are default functions for use by
 * filesystems that need the "default reasonable" implementation for a
 * particular operation.
 *
 * The documentation for the operations they implement exists (if it exists)
 * in the VOP_<SOMETHING>(9) manpage (all uppercase).
 */

/*
 * Default vop for filesystems that do not support name lookup
 */
static int
vop_nolookup(ap)
	struct vop_lookup_args /* {
		struct vnode *a_dvp;
		struct vnode **a_vpp;
		struct componentname *a_cnp;
	} */ *ap;
{

	*ap->a_vpp = NULL;
	return (ENOTDIR);
}

/*
 * vop_norename:
 *
 * Handle unlock and reference counting for arguments of vop_rename
 * for filesystems that do not implement the rename operation.
 */
static int
vop_norename(struct vop_rename_args *ap)
{

	vop_rename_fail(ap);
	return (EOPNOTSUPP);
}

/*
 * vop_nostrategy:
 *
 *	Strategy routine for VFS devices that have none.
 *
 *	BIO_ERROR and B_INVAL must be cleared prior to calling any strategy
 *	routine.  Typically this is done for a BIO_READ strategy call.
 *	Typically B_INVAL is assumed to already be clear prior to a write
 *	and should not be cleared manually unless you just made the buffer
 *	invalid.  BIO_ERROR should be cleared either way.
 */

static int
vop_nostrategy (struct vop_strategy_args *ap)
{
	printf("No strategy for buffer at %p\n", ap->a_bp);
	vn_printf(ap->a_vp, "vnode ");
	ap->a_bp->b_ioflags |= BIO_ERROR;
	ap->a_bp->b_error = EOPNOTSUPP;
	bufdone(ap->a_bp);
	return (EOPNOTSUPP);
}

static int
get_next_dirent(struct vnode *vp, struct dirent **dpp, char *dirbuf,
		int dirbuflen, off_t *off, char **cpos, int *len,
		int *eofflag, struct thread *td)
{
	int error, reclen;
	struct uio uio;
	struct iovec iov;
	struct dirent *dp;

	KASSERT(VOP_ISLOCKED(vp), ("vp %p is not locked", vp));
	KASSERT(vp->v_type == VDIR, ("vp %p is not a directory", vp));

	if (*len == 0) {
		iov.iov_base = dirbuf;
		iov.iov_len = dirbuflen;

		uio.uio_iov = &iov;
		uio.uio_iovcnt = 1;
		uio.uio_offset = *off;
		uio.uio_resid = dirbuflen;
		uio.uio_segflg = UIO_SYSSPACE;
		uio.uio_rw = UIO_READ;
		uio.uio_td = td;

		*eofflag = 0;

#ifdef MAC
		error = mac_vnode_check_readdir(td->td_ucred, vp);
		if (error == 0)
#endif
			error = VOP_READDIR(vp, &uio, td->td_ucred, eofflag,
			    NULL, NULL);
		if (error)
			return (error);

		*off = uio.uio_offset;

		*cpos = dirbuf;
		*len = (dirbuflen - uio.uio_resid);

		if (*len == 0)
			return (ENOENT);
	}

	dp = (struct dirent *)(*cpos);
	reclen = dp->d_reclen;
	*dpp = dp;

	/* check for malformed directory.. */
	if (reclen < DIRENT_MINSIZE)
		return (EINVAL);

	*cpos += reclen;
	*len -= reclen;

	return (0);
}
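/*
 * Usage pattern for get_next_dirent(), for reference: callers start
 * with *off == 0 and *len == 0 so that the first call refills dirbuf
 * via VOP_READDIR(), and keep calling until an error is returned or
 * *len reaches 0 with *eofflag set, as dirent_exists() below does.
 */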
/*
 * Check if a named file exists in a given directory vnode.
 */
static int
dirent_exists(struct vnode *vp, const char *dirname, struct thread *td)
{
	char *dirbuf, *cpos;
	int error, eofflag, dirbuflen, len, found;
	off_t off;
	struct dirent *dp;
	struct vattr va;

	KASSERT(VOP_ISLOCKED(vp), ("vp %p is not locked", vp));
	KASSERT(vp->v_type == VDIR, ("vp %p is not a directory", vp));

	found = 0;

	error = VOP_GETATTR(vp, &va, td->td_ucred);
	if (error)
		return (found);

	dirbuflen = DEV_BSIZE;
	if (dirbuflen < va.va_blocksize)
		dirbuflen = va.va_blocksize;
	dirbuf = (char *)malloc(dirbuflen, M_TEMP, M_WAITOK);

	off = 0;
	len = 0;
	do {
		error = get_next_dirent(vp, &dp, dirbuf, dirbuflen, &off,
					&cpos, &len, &eofflag, td);
		if (error)
			goto out;

		if (dp->d_type != DT_WHT && dp->d_fileno != 0 &&
		    strcmp(dp->d_name, dirname) == 0) {
			found = 1;
			goto out;
		}
	} while (len > 0 || !eofflag);

out:
	free(dirbuf, M_TEMP);
	return (found);
}

int
vop_stdaccess(struct vop_access_args *ap)
{

	KASSERT((ap->a_accmode & ~(VEXEC | VWRITE | VREAD | VADMIN |
	    VAPPEND)) == 0, ("invalid bit in accmode"));

	return (VOP_ACCESSX(ap->a_vp, ap->a_accmode, ap->a_cred, ap->a_td));
}

int
vop_stdaccessx(struct vop_accessx_args *ap)
{
	int error;
	accmode_t accmode = ap->a_accmode;

	error = vfs_unixify_accmode(&accmode);
	if (error != 0)
		return (error);

	if (accmode == 0)
		return (0);

	return (VOP_ACCESS(ap->a_vp, accmode, ap->a_cred, ap->a_td));
}

/*
 * Advisory record locking support
 */
int
vop_stdadvlock(struct vop_advlock_args *ap)
{
	struct vnode *vp;
	struct vattr vattr;
	int error;

	vp = ap->a_vp;
	if (ap->a_fl->l_whence == SEEK_END) {
		/*
		 * The NFSv4 server must avoid doing a vn_lock() here, since it
		 * can deadlock the nfsd threads, due to a LOR.  Fortunately
		 * the NFSv4 server always uses SEEK_SET and this code is
		 * only required for the SEEK_END case.
		 */
		vn_lock(vp, LK_SHARED | LK_RETRY);
		error = VOP_GETATTR(vp, &vattr, curthread->td_ucred);
		VOP_UNLOCK(vp, 0);
		if (error)
			return (error);
	} else
		vattr.va_size = 0;

	return (lf_advlock(ap, &(vp->v_lockf), vattr.va_size));
}

int
vop_stdadvlockasync(struct vop_advlockasync_args *ap)
{
	struct vnode *vp;
	struct vattr vattr;
	int error;

	vp = ap->a_vp;
	if (ap->a_fl->l_whence == SEEK_END) {
		/* The size argument is only needed for SEEK_END. */
		vn_lock(vp, LK_SHARED | LK_RETRY);
		error = VOP_GETATTR(vp, &vattr, curthread->td_ucred);
		VOP_UNLOCK(vp, 0);
		if (error)
			return (error);
	} else
		vattr.va_size = 0;

	return (lf_advlockasync(ap, &(vp->v_lockf), vattr.va_size));
}

int
vop_stdadvlockpurge(struct vop_advlockpurge_args *ap)
{
	struct vnode *vp;

	vp = ap->a_vp;
	lf_purgelocks(vp, &vp->v_lockf);
	return (0);
}

/*
 * vop_stdpathconf:
 *
 * Standard implementation of POSIX pathconf, to get information about limits
 * for a filesystem.
 * Override per filesystem for the case where the filesystem has smaller
 * limits.
 */
int
vop_stdpathconf(ap)
	struct vop_pathconf_args /* {
		struct vnode *a_vp;
		int a_name;
		int *a_retval;
	} */ *ap;
{

	switch (ap->a_name) {
	case _PC_ASYNC_IO:
		*ap->a_retval = _POSIX_ASYNCHRONOUS_IO;
		return (0);
	case _PC_PATH_MAX:
		*ap->a_retval = PATH_MAX;
		return (0);
	case _PC_ACL_EXTENDED:
	case _PC_ACL_NFS4:
	case _PC_CAP_PRESENT:
	case _PC_INF_PRESENT:
	case _PC_MAC_PRESENT:
		*ap->a_retval = 0;
		return (0);
	default:
		return (EINVAL);
	}
	/* NOTREACHED */
}
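/*
 * Sketch of how a filesystem with tighter limits would override the
 * default above: special-case what it knows and defer the rest to
 * vop_stdpathconf().  The "myfs" name is hypothetical.
 */
#if 0
static int
myfs_pathconf(struct vop_pathconf_args *ap)
{

	switch (ap->a_name) {
	case _PC_NAME_MAX:
		*ap->a_retval = 255;	/* assumed on-disk name limit */
		return (0);
	default:
		return (vop_stdpathconf(ap));
	}
}
#endif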
/*
 * Standard lock, unlock and islocked functions.
 */
int
vop_stdlock(ap)
	struct vop_lock1_args /* {
		struct vnode *a_vp;
		int a_flags;
		char *file;
		int line;
	} */ *ap;
{
	struct vnode *vp = ap->a_vp;
	struct mtx *ilk;

	ilk = VI_MTX(vp);
	return (lockmgr_lock_fast_path(vp->v_vnlock, ap->a_flags,
	    &ilk->lock_object, ap->a_file, ap->a_line));
}

/* See above. */
int
vop_stdunlock(ap)
	struct vop_unlock_args /* {
		struct vnode *a_vp;
		int a_flags;
	} */ *ap;
{
	struct vnode *vp = ap->a_vp;
	struct mtx *ilk;

	ilk = VI_MTX(vp);
	return (lockmgr_unlock_fast_path(vp->v_vnlock, ap->a_flags,
	    &ilk->lock_object));
}

/* See above. */
int
vop_stdislocked(ap)
	struct vop_islocked_args /* {
		struct vnode *a_vp;
	} */ *ap;
{

	return (lockstatus(ap->a_vp->v_vnlock));
}

/*
 * Return true for select/poll.
 */
int
vop_nopoll(ap)
	struct vop_poll_args /* {
		struct vnode *a_vp;
		int a_events;
		struct ucred *a_cred;
		struct thread *a_td;
	} */ *ap;
{

	return (poll_no_poll(ap->a_events));
}

/*
 * Implement poll for local filesystems that support it.
 */
int
vop_stdpoll(ap)
	struct vop_poll_args /* {
		struct vnode *a_vp;
		int a_events;
		struct ucred *a_cred;
		struct thread *a_td;
	} */ *ap;
{
	if (ap->a_events & ~POLLSTANDARD)
		return (vn_pollrecord(ap->a_vp, ap->a_td, ap->a_events));
	return (ap->a_events & (POLLIN | POLLOUT | POLLRDNORM | POLLWRNORM));
}

/*
 * Return our mount point, as we will take charge of the writes.
 */
int
vop_stdgetwritemount(ap)
	struct vop_getwritemount_args /* {
		struct vnode *a_vp;
		struct mount **a_mpp;
	} */ *ap;
{
	struct mount *mp;

	/*
	 * XXX Since this is called unlocked we may be recycled while
	 * attempting to ref the mount.  If this is the case our mountpoint
	 * will be set to NULL.  We only have to prevent this call from
	 * returning with a ref to an incorrect mountpoint.  It is not
	 * harmful to return with a ref to our previous mountpoint.
	 */
	mp = ap->a_vp->v_mount;
	if (mp != NULL) {
		vfs_ref(mp);
		if (mp != ap->a_vp->v_mount) {
			vfs_rel(mp);
			mp = NULL;
		}
	}
	*(ap->a_mpp) = mp;
	return (0);
}

/*
 * If the file system doesn't implement VOP_BMAP, then return sensible defaults:
 * - Return the vnode's bufobj instead of any underlying device's bufobj
 * - Calculate the physical block number as if there were equal size
 *   consecutive blocks, but
 * - Report no contiguous runs of blocks.
 */
int
vop_stdbmap(ap)
	struct vop_bmap_args /* {
		struct vnode *a_vp;
		daddr_t a_bn;
		struct bufobj **a_bop;
		daddr_t *a_bnp;
		int *a_runp;
		int *a_runb;
	} */ *ap;
{

	if (ap->a_bop != NULL)
		*ap->a_bop = &ap->a_vp->v_bufobj;
	if (ap->a_bnp != NULL)
		*ap->a_bnp = ap->a_bn * btodb(ap->a_vp->v_mount->mnt_stat.f_iosize);
	if (ap->a_runp != NULL)
		*ap->a_runp = 0;
	if (ap->a_runb != NULL)
		*ap->a_runb = 0;
	return (0);
}
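/*
 * Worked example of the mapping above: with f_iosize = 32768 and
 * DEV_BSIZE = 512, btodb(32768) == 64, so logical block 10 is reported
 * as "physical" block 640 on the vnode's own bufobj, with zero-length
 * runs in both directions.
 */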
int
vop_stdfsync(ap)
	struct vop_fsync_args /* {
		struct vnode *a_vp;
		int a_waitfor;
		struct thread *a_td;
	} */ *ap;
{

	return (vn_fsync_buf(ap->a_vp, ap->a_waitfor));
}

static int
vop_stdfdatasync(struct vop_fdatasync_args *ap)
{

	return (VOP_FSYNC(ap->a_vp, MNT_WAIT, ap->a_td));
}

int
vop_stdfdatasync_buf(struct vop_fdatasync_args *ap)
{

	return (vn_fsync_buf(ap->a_vp, MNT_WAIT));
}

/* XXX Needs good comment and more info in the manpage (VOP_GETPAGES(9)). */
int
vop_stdgetpages(ap)
	struct vop_getpages_args /* {
		struct vnode *a_vp;
		vm_page_t *a_m;
		int a_count;
		int *a_rbehind;
		int *a_rahead;
	} */ *ap;
{

	return vnode_pager_generic_getpages(ap->a_vp, ap->a_m,
	    ap->a_count, ap->a_rbehind, ap->a_rahead, NULL, NULL);
}

static int
vop_stdgetpages_async(struct vop_getpages_async_args *ap)
{
	int error;

	error = VOP_GETPAGES(ap->a_vp, ap->a_m, ap->a_count, ap->a_rbehind,
	    ap->a_rahead);
	ap->a_iodone(ap->a_arg, ap->a_m, ap->a_count, error);
	return (error);
}

int
vop_stdkqfilter(struct vop_kqfilter_args *ap)
{
	return vfs_kqfilter(ap);
}
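/*
 * Note on the pager defaults here: vop_stdgetpages() above and
 * vop_stdputpages() below simply hand the request to the generic vnode
 * pager, which (to a first approximation) translates file offsets with
 * VOP_BMAP() and performs the I/O through the buffer cache /
 * VOP_STRATEGY() path, so a filesystem whose blocks are addressable
 * that way gets paging support for free.
 */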
/* XXX Needs good comment and more info in the manpage (VOP_PUTPAGES(9)). */
int
vop_stdputpages(ap)
	struct vop_putpages_args /* {
		struct vnode *a_vp;
		vm_page_t *a_m;
		int a_count;
		int a_sync;
		int *a_rtvals;
	} */ *ap;
{

	return vnode_pager_generic_putpages(ap->a_vp, ap->a_m, ap->a_count,
	    ap->a_sync, ap->a_rtvals);
}

int
vop_stdvptofh(struct vop_vptofh_args *ap)
{
	return (EOPNOTSUPP);
}

int
vop_stdvptocnp(struct vop_vptocnp_args *ap)
{
	struct vnode *vp = ap->a_vp;
	struct vnode **dvp = ap->a_vpp;
	struct ucred *cred = ap->a_cred;
	char *buf = ap->a_buf;
	int *buflen = ap->a_buflen;
	char *dirbuf, *cpos;
	int i, error, eofflag, dirbuflen, flags, locked, len, covered;
	off_t off;
	ino_t fileno;
	struct vattr va;
	struct nameidata nd;
	struct thread *td;
	struct dirent *dp;
	struct vnode *mvp;

	i = *buflen;
	error = 0;
	covered = 0;
	td = curthread;

	if (vp->v_type != VDIR)
		return (ENOENT);

	error = VOP_GETATTR(vp, &va, cred);
	if (error)
		return (error);

	VREF(vp);
	locked = VOP_ISLOCKED(vp);
	VOP_UNLOCK(vp, 0);
	NDINIT_ATVP(&nd, LOOKUP, FOLLOW | LOCKSHARED | LOCKLEAF, UIO_SYSSPACE,
	    "..", vp, td);
	flags = FREAD;
	error = vn_open_cred(&nd, &flags, 0, VN_OPEN_NOAUDIT, cred, NULL);
	if (error) {
		vn_lock(vp, locked | LK_RETRY);
		return (error);
	}
	NDFREE(&nd, NDF_ONLY_PNBUF);

	mvp = *dvp = nd.ni_vp;

	if (vp->v_mount != (*dvp)->v_mount &&
	    ((*dvp)->v_vflag & VV_ROOT) &&
	    ((*dvp)->v_mount->mnt_flag & MNT_UNION)) {
		*dvp = (*dvp)->v_mount->mnt_vnodecovered;
		VREF(mvp);
		VOP_UNLOCK(mvp, 0);
		vn_close(mvp, FREAD, cred, td);
		VREF(*dvp);
		vn_lock(*dvp, LK_SHARED | LK_RETRY);
		covered = 1;
	}

	fileno = va.va_fileid;

	dirbuflen = DEV_BSIZE;
	if (dirbuflen < va.va_blocksize)
		dirbuflen = va.va_blocksize;
	dirbuf = (char *)malloc(dirbuflen, M_TEMP, M_WAITOK);

	if ((*dvp)->v_type != VDIR) {
		error = ENOENT;
		goto out;
	}

	off = 0;
	len = 0;
	do {
		/* call VOP_READDIR of parent */
		error = get_next_dirent(*dvp, &dp, dirbuf, dirbuflen, &off,
					&cpos, &len, &eofflag, td);
		if (error)
			goto out;

		if ((dp->d_type != DT_WHT) &&
		    (dp->d_fileno == fileno)) {
			if (covered) {
				VOP_UNLOCK(*dvp, 0);
				vn_lock(mvp, LK_SHARED | LK_RETRY);
				if (dirent_exists(mvp, dp->d_name, td)) {
					error = ENOENT;
					VOP_UNLOCK(mvp, 0);
					vn_lock(*dvp, LK_SHARED | LK_RETRY);
					goto out;
				}
				VOP_UNLOCK(mvp, 0);
				vn_lock(*dvp, LK_SHARED | LK_RETRY);
			}
			i -= dp->d_namlen;

			if (i < 0) {
				error = ENOMEM;
				goto out;
			}
			if (dp->d_namlen == 1 && dp->d_name[0] == '.') {
				error = ENOENT;
			} else {
				bcopy(dp->d_name, buf + i, dp->d_namlen);
				error = 0;
			}
			goto out;
		}
	} while (len > 0 || !eofflag);
	error = ENOENT;

out:
	free(dirbuf, M_TEMP);
	if (!error) {
		*buflen = i;
		vref(*dvp);
	}
	if (covered) {
		vput(*dvp);
		vrele(mvp);
	} else {
		VOP_UNLOCK(mvp, 0);
		vn_close(mvp, FREAD, cred, td);
	}
	vn_lock(vp, locked | LK_RETRY);
	return (error);
}
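/*
 * Buffer convention used above, for reference: the name is copied in
 * from the tail of the caller's buffer, so on success *buflen becomes
 * the offset of its first byte.  E.g. a 4-byte name in a 64-byte
 * buffer comes back with *buflen == 60 and buf[60..63] holding the
 * name, without a terminating NUL.
 */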
int
vop_stdallocate(struct vop_allocate_args *ap)
{
#ifdef __notyet__
	struct statfs *sfs;
	off_t maxfilesize = 0;
#endif
	struct iovec aiov;
	struct vattr vattr, *vap;
	struct uio auio;
	off_t fsize, len, cur, offset;
	uint8_t *buf;
	struct thread *td;
	struct vnode *vp;
	size_t iosize;
	int error;

	buf = NULL;
	error = 0;
	td = curthread;
	vap = &vattr;
	vp = ap->a_vp;
	len = *ap->a_len;
	offset = *ap->a_offset;

	error = VOP_GETATTR(vp, vap, td->td_ucred);
	if (error != 0)
		goto out;
	fsize = vap->va_size;
	iosize = vap->va_blocksize;
	if (iosize == 0)
		iosize = BLKDEV_IOSIZE;
	if (iosize > MAXPHYS)
		iosize = MAXPHYS;
	buf = malloc(iosize, M_TEMP, M_WAITOK);

#ifdef __notyet__
	/*
	 * Check if the filesystem sets f_maxfilesize; if not use
	 * VOP_SETATTR to perform the check.
	 */
	sfs = malloc(sizeof(struct statfs), M_STATFS, M_WAITOK);
	error = VFS_STATFS(vp->v_mount, sfs, td);
	if (error == 0)
		maxfilesize = sfs->f_maxfilesize;
	free(sfs, M_STATFS);
	if (error != 0)
		goto out;
	if (maxfilesize) {
		if (offset > maxfilesize || len > maxfilesize ||
		    offset + len > maxfilesize) {
			error = EFBIG;
			goto out;
		}
	} else
#endif
	if (offset + len > vap->va_size) {
		/*
		 * Test offset + len against the filesystem's maxfilesize.
		 */
		VATTR_NULL(vap);
		vap->va_size = offset + len;
		error = VOP_SETATTR(vp, vap, td->td_ucred);
		if (error != 0)
			goto out;
		VATTR_NULL(vap);
		vap->va_size = fsize;
		error = VOP_SETATTR(vp, vap, td->td_ucred);
		if (error != 0)
			goto out;
	}

	for (;;) {
		/*
		 * Read and write back anything below the nominal file
		 * size.  There's currently no way outside the filesystem
		 * to know whether this area is sparse or not.
		 */
		cur = iosize;
		if ((offset % iosize) != 0)
			cur -= (offset % iosize);
		if (cur > len)
			cur = len;
		if (offset < fsize) {
			aiov.iov_base = buf;
			aiov.iov_len = cur;
			auio.uio_iov = &aiov;
			auio.uio_iovcnt = 1;
			auio.uio_offset = offset;
			auio.uio_resid = cur;
			auio.uio_segflg = UIO_SYSSPACE;
			auio.uio_rw = UIO_READ;
			auio.uio_td = td;
			error = VOP_READ(vp, &auio, 0, td->td_ucred);
			if (error != 0)
				break;
			if (auio.uio_resid > 0) {
				bzero(buf + cur - auio.uio_resid,
				    auio.uio_resid);
			}
		} else {
			bzero(buf, cur);
		}

		aiov.iov_base = buf;
		aiov.iov_len = cur;
		auio.uio_iov = &aiov;
		auio.uio_iovcnt = 1;
		auio.uio_offset = offset;
		auio.uio_resid = cur;
		auio.uio_segflg = UIO_SYSSPACE;
		auio.uio_rw = UIO_WRITE;
		auio.uio_td = td;

		error = VOP_WRITE(vp, &auio, 0, td->td_ucred);
		if (error != 0)
			break;

		len -= cur;
		offset += cur;
		if (len == 0)
			break;
		if (should_yield())
			break;
	}

out:
	*ap->a_len = len;
	*ap->a_offset = offset;
	free(buf, M_TEMP);
	return (error);
}
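/*
 * Hypothetical sketch of a caller's loop around VOP_ALLOCATE(): because
 * vop_stdallocate() above may return early with len still nonzero when
 * should_yield() is true, callers are expected to keep reinvoking it
 * until the remaining length reaches zero or an error comes back.
 */
#if 0
	do {
		error = VOP_ALLOCATE(vp, &offset, &len);
	} while (error == 0 && len != 0);
#endif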
int
vop_stdadvise(struct vop_advise_args *ap)
{
	struct vnode *vp;
	struct bufobj *bo;
	daddr_t startn, endn;
	off_t bstart, bend, start, end;
	int bsize, error;

	vp = ap->a_vp;
	switch (ap->a_advice) {
	case POSIX_FADV_WILLNEED:
		/*
		 * Do nothing for now.  Filesystems should provide a
		 * custom method which starts an asynchronous read of
		 * the requested region.
		 */
		error = 0;
		break;
	case POSIX_FADV_DONTNEED:
		error = 0;
		vn_lock(vp, LK_EXCLUSIVE | LK_RETRY);
		if (vp->v_iflag & VI_DOOMED) {
			VOP_UNLOCK(vp, 0);
			break;
		}

		/*
		 * Round to block boundaries (and later possibly further to
		 * page boundaries).  Applications cannot reasonably be aware
		 * of the boundaries, and the rounding must be to expand at
		 * both extremities to cover enough.  It still doesn't cover
		 * read-ahead.  For partial blocks, this gives unnecessary
		 * discarding of buffers but is efficient enough since the
		 * pages usually remain in VMIO for some time.
		 */
		bsize = vp->v_bufobj.bo_bsize;
		bstart = rounddown(ap->a_start, bsize);
		bend = roundup(ap->a_end, bsize);

		/*
		 * Deactivate pages in the specified range from the backing VM
		 * object.  Pages that are resident in the buffer cache will
		 * remain wired until their corresponding buffers are released
		 * below.
		 */
		if (vp->v_object != NULL) {
			start = trunc_page(bstart);
			end = round_page(bend);
			VM_OBJECT_RLOCK(vp->v_object);
			vm_object_page_noreuse(vp->v_object, OFF_TO_IDX(start),
			    OFF_TO_IDX(end));
			VM_OBJECT_RUNLOCK(vp->v_object);
		}

		bo = &vp->v_bufobj;
		BO_RLOCK(bo);
		startn = bstart / bsize;
		endn = bend / bsize;
		error = bnoreuselist(&bo->bo_clean, bo, startn, endn);
		if (error == 0)
			error = bnoreuselist(&bo->bo_dirty, bo, startn, endn);
		BO_RUNLOCK(bo);
		VOP_UNLOCK(vp, 0);
		break;
	default:
		error = EINVAL;
		break;
	}
	return (error);
}

int
vop_stdunp_bind(struct vop_unp_bind_args *ap)
{

	ap->a_vp->v_unpcb = ap->a_unpcb;
	return (0);
}

int
vop_stdunp_connect(struct vop_unp_connect_args *ap)
{

	*ap->a_unpcb = ap->a_vp->v_unpcb;
	return (0);
}

int
vop_stdunp_detach(struct vop_unp_detach_args *ap)
{

	ap->a_vp->v_unpcb = NULL;
	return (0);
}

static int
vop_stdis_text(struct vop_is_text_args *ap)
{

	return (ap->a_vp->v_writecount < 0);
}

int
vop_stdset_text(struct vop_set_text_args *ap)
{
	struct vnode *vp;
	int error;

	vp = ap->a_vp;
	VI_LOCK(vp);
	if (vp->v_writecount > 0) {
		error = ETXTBSY;
	} else {
		vp->v_writecount--;
		error = 0;
	}
	VI_UNLOCK(vp);
	return (error);
}

static int
vop_stdunset_text(struct vop_unset_text_args *ap)
{
	struct vnode *vp;
	int error;

	vp = ap->a_vp;
	VI_LOCK(vp);
	if (vp->v_writecount < 0) {
		vp->v_writecount++;
		error = 0;
	} else {
		error = EINVAL;
	}
	VI_UNLOCK(vp);
	return (error);
}

static int
vop_stdadd_writecount(struct vop_add_writecount_args *ap)
{
	struct vnode *vp;
	int error;

	vp = ap->a_vp;
	VI_LOCK_FLAGS(vp, MTX_DUPOK);
	if (vp->v_writecount < 0) {
		error = ETXTBSY;
	} else {
		VNASSERT(vp->v_writecount + ap->a_inc >= 0, vp,
		    ("neg writecount increment %d", ap->a_inc));
		vp->v_writecount += ap->a_inc;
		error = 0;
	}
	VI_UNLOCK(vp);
	return (error);
}
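/*
 * Summary of the v_writecount convention implemented above:
 * v_writecount > 0 counts opens for writing, while v_writecount < 0
 * counts VOP_SET_TEXT() callers (executable mappings).  The two states
 * are mutually exclusive, which is why vop_stdset_text() fails with
 * ETXTBSY while writers exist and vop_stdadd_writecount() fails with
 * ETXTBSY while the vnode is in use as text.
 */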
/*
 * vfs default ops
 * used to fill the vfs function table to get reasonable default return values.
 */
int
vfs_stdroot (mp, flags, vpp)
	struct mount *mp;
	int flags;
	struct vnode **vpp;
{

	return (EOPNOTSUPP);
}

int
vfs_stdstatfs (mp, sbp)
	struct mount *mp;
	struct statfs *sbp;
{

	return (EOPNOTSUPP);
}

int
vfs_stdquotactl (mp, cmds, uid, arg)
	struct mount *mp;
	int cmds;
	uid_t uid;
	void *arg;
{

	return (EOPNOTSUPP);
}

int
vfs_stdsync(mp, waitfor)
	struct mount *mp;
	int waitfor;
{
	struct vnode *vp, *mvp;
	struct thread *td;
	int error, lockreq, allerror = 0;

	td = curthread;
	lockreq = LK_EXCLUSIVE | LK_INTERLOCK;
	if (waitfor != MNT_WAIT)
		lockreq |= LK_NOWAIT;
	/*
	 * Force stale buffer cache information to be flushed.
	 */
loop:
	MNT_VNODE_FOREACH_ALL(vp, mp, mvp) {
		if (vp->v_bufobj.bo_dirty.bv_cnt == 0) {
			VI_UNLOCK(vp);
			continue;
		}
		if ((error = vget(vp, lockreq, td)) != 0) {
			if (error == ENOENT) {
				MNT_VNODE_FOREACH_ALL_ABORT(mp, mvp);
				goto loop;
			}
			continue;
		}
		error = VOP_FSYNC(vp, waitfor, td);
		if (error)
			allerror = error;
		vput(vp);
	}
	return (allerror);
}

int
vfs_stdnosync (mp, waitfor)
	struct mount *mp;
	int waitfor;
{

	return (0);
}

int
vfs_stdvget (mp, ino, flags, vpp)
	struct mount *mp;
	ino_t ino;
	int flags;
	struct vnode **vpp;
{

	return (EOPNOTSUPP);
}

int
vfs_stdfhtovp (mp, fhp, flags, vpp)
	struct mount *mp;
	struct fid *fhp;
	int flags;
	struct vnode **vpp;
{

	return (EOPNOTSUPP);
}

int
vfs_stdinit (vfsp)
	struct vfsconf *vfsp;
{

	return (0);
}

int
vfs_stduninit (vfsp)
	struct vfsconf *vfsp;
{

	return (0);
}

int
vfs_stdextattrctl(mp, cmd, filename_vp, attrnamespace, attrname)
	struct mount *mp;
	int cmd;
	struct vnode *filename_vp;
	int attrnamespace;
	const char *attrname;
{

	if (filename_vp != NULL)
		VOP_UNLOCK(filename_vp, 0);
	return (EOPNOTSUPP);
}

int
vfs_stdsysctl(mp, op, req)
	struct mount *mp;
	fsctlop_t op;
	struct sysctl_req *req;
{

	return (EOPNOTSUPP);
}

static vop_bypass_t *
bp_by_off(struct vop_vector *vop, struct vop_generic_args *a)
{

	return (*(vop_bypass_t **)((char *)vop + a->a_desc->vdesc_vop_offset));
}

int
vop_sigdefer(struct vop_vector *vop, struct vop_generic_args *a)
{
	vop_bypass_t *bp;
	int prev_stops, rc;

	for (; vop != NULL; vop = vop->vop_default) {
		bp = bp_by_off(vop, a);
		if (bp != NULL)
			break;

		/*
		 * Bypass is not really supported.  It is done for
		 * fallback to unimplemented vops in the default
		 * vector.
		 */
		bp = vop->vop_bypass;
		if (bp != NULL)
			break;
	}
	MPASS(bp != NULL);

	prev_stops = sigdeferstop(SIGDEFERSTOP_SILENT);
	rc = bp(a);
	sigallowstop(prev_stops);
	return (rc);
}
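/*
 * Sketch (with hypothetical names) of how a filesystem is expected to
 * use vop_sigdefer(): each entry in its public vop_vector is a thin
 * wrapper that defers stop signals around the real implementation
 * looked up in a private vector.
 */
#if 0
static int
examplefs_read_wrapper(struct vop_read_args *ap)
{

	return (vop_sigdefer(&examplefs_real_vnodeops, &ap->a_gen));
}
#endif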