160727d8bSWarner Losh /*- 251369649SPedro F. Giffuni * SPDX-License-Identifier: BSD-3-Clause 351369649SPedro F. Giffuni * 4df8bae1dSRodney W. Grimes * Copyright (c) 1989, 1991, 1993, 1994 5df8bae1dSRodney W. Grimes * The Regents of the University of California. All rights reserved. 6df8bae1dSRodney W. Grimes * 7df8bae1dSRodney W. Grimes * Redistribution and use in source and binary forms, with or without 8df8bae1dSRodney W. Grimes * modification, are permitted provided that the following conditions 9df8bae1dSRodney W. Grimes * are met: 10df8bae1dSRodney W. Grimes * 1. Redistributions of source code must retain the above copyright 11df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer. 12df8bae1dSRodney W. Grimes * 2. Redistributions in binary form must reproduce the above copyright 13df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer in the 14df8bae1dSRodney W. Grimes * documentation and/or other materials provided with the distribution. 15fbbd9655SWarner Losh * 3. Neither the name of the University nor the names of its contributors 16df8bae1dSRodney W. Grimes * may be used to endorse or promote products derived from this software 17df8bae1dSRodney W. Grimes * without specific prior written permission. 18df8bae1dSRodney W. Grimes * 19df8bae1dSRodney W. Grimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 20df8bae1dSRodney W. Grimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 21df8bae1dSRodney W. Grimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 22df8bae1dSRodney W. Grimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 23df8bae1dSRodney W. Grimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 24df8bae1dSRodney W. Grimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 25df8bae1dSRodney W. Grimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 26df8bae1dSRodney W. Grimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 27df8bae1dSRodney W. Grimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 28df8bae1dSRodney W. Grimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 29df8bae1dSRodney W. Grimes * SUCH DAMAGE. 30df8bae1dSRodney W. Grimes * 31996c772fSJohn Dyson * @(#)ffs_vfsops.c 8.31 (Berkeley) 5/20/95 32df8bae1dSRodney W. Grimes */ 33df8bae1dSRodney W. Grimes 34f4636c59SDavid E. O'Brien #include <sys/cdefs.h> 35f4636c59SDavid E. O'Brien __FBSDID("$FreeBSD$"); 36f4636c59SDavid E. O'Brien 3701733a9bSGarrett Wollman #include "opt_quota.h" 38516081f2SRobert Watson #include "opt_ufs.h" 396e77a041SPoul-Henning Kamp #include "opt_ffs.h" 4052dfc8d7SKonstantin Belousov #include "opt_ddb.h" 4101733a9bSGarrett Wollman 42df8bae1dSRodney W. Grimes #include <sys/param.h> 43f89d2072SXin LI #include <sys/gsb_crc32.h> 44df8bae1dSRodney W. Grimes #include <sys/systm.h> 45df8bae1dSRodney W. Grimes #include <sys/namei.h> 46acd3428bSRobert Watson #include <sys/priv.h> 47df8bae1dSRodney W. Grimes #include <sys/proc.h> 48c79dff0fSKonstantin Belousov #include <sys/taskqueue.h> 49df8bae1dSRodney W. Grimes #include <sys/kernel.h> 50daec9284SConrad Meyer #include <sys/ktr.h> 51df8bae1dSRodney W. Grimes #include <sys/vnode.h> 52df8bae1dSRodney W. Grimes #include <sys/mount.h> 539626b608SPoul-Henning Kamp #include <sys/bio.h> 54df8bae1dSRodney W. Grimes #include <sys/buf.h> 5581bca6ddSKATO Takenori #include <sys/conf.h> 563ac4d1efSBruce Evans #include <sys/fcntl.h> 571848286aSEdward Tomasz Napierala #include <sys/ioccom.h> 58df8bae1dSRodney W. Grimes #include <sys/malloc.h> 591b367556SJason Evans #include <sys/mutex.h> 6022a72260SJeff Roberson #include <sys/rwlock.h> 61d79ff54bSChuck Silvers #include <sys/sysctl.h> 629ed01c32SGleb Smirnoff #include <sys/vmmeter.h> 63a18b1f1dSJason Evans 64aed55708SRobert Watson #include <security/mac/mac_framework.h> 65aed55708SRobert Watson 66a96da1c3SConrad Meyer #include <ufs/ufs/dir.h> 67a64ed089SRobert Watson #include <ufs/ufs/extattr.h> 681a60c7fcSPawel Jakub Dawidek #include <ufs/ufs/gjournal.h> 69df8bae1dSRodney W. Grimes #include <ufs/ufs/quota.h> 70df8bae1dSRodney W. Grimes #include <ufs/ufs/ufsmount.h> 71df8bae1dSRodney W. Grimes #include <ufs/ufs/inode.h> 72df8bae1dSRodney W. Grimes #include <ufs/ufs/ufs_extern.h> 73df8bae1dSRodney W. Grimes 74df8bae1dSRodney W. Grimes #include <ufs/ffs/fs.h> 75df8bae1dSRodney W. Grimes #include <ufs/ffs/ffs_extern.h> 76df8bae1dSRodney W. Grimes 77f6b04d2bSDavid Greenman #include <vm/vm.h> 78aa4d7a8aSPoul-Henning Kamp #include <vm/uma.h> 79f6b04d2bSDavid Greenman #include <vm/vm_page.h> 80f6b04d2bSDavid Greenman 8143920011SPoul-Henning Kamp #include <geom/geom.h> 8243920011SPoul-Henning Kamp #include <geom/geom_vfs.h> 8343920011SPoul-Henning Kamp 8452dfc8d7SKonstantin Belousov #include <ddb/ddb.h> 8552dfc8d7SKonstantin Belousov 86adf41577SPoul-Henning Kamp static uma_zone_t uma_inode, uma_ufs1, uma_ufs2; 879d5a594fSMateusz Guzik VFS_SMR_DECLARE; 8855166637SPoul-Henning Kamp 89975512a9SPoul-Henning Kamp static int ffs_mountfs(struct vnode *, struct mount *, struct thread *); 901c85e6a3SKirk McKusick static void ffs_oldfscompat_read(struct fs *, struct ufsmount *, 911c85e6a3SKirk McKusick ufs2_daddr_t); 92975512a9SPoul-Henning Kamp static void ffs_ifree(struct ufsmount *ump, struct inode *ip); 93a988a5c6SKonstantin Belousov static int ffs_sync_lazy(struct mount *mp); 94dffce215SKirk McKusick static int ffs_use_bread(void *devfd, off_t loc, void **bufp, int size); 95dffce215SKirk McKusick static int ffs_use_bwrite(void *devfd, off_t loc, void *buf, int size); 96a988a5c6SKonstantin Belousov 979bf1a756SPoul-Henning Kamp static vfs_init_t ffs_init; 989bf1a756SPoul-Henning Kamp static vfs_uninit_t ffs_uninit; 99d6fe88e4SPoul-Henning Kamp static vfs_extattrctl_t ffs_extattrctl; 10020a92a18SPoul-Henning Kamp static vfs_cmount_t ffs_cmount; 101adf41577SPoul-Henning Kamp static vfs_unmount_t ffs_unmount; 10220a92a18SPoul-Henning Kamp static vfs_mount_t ffs_mount; 103adf41577SPoul-Henning Kamp static vfs_statfs_t ffs_statfs; 104adf41577SPoul-Henning Kamp static vfs_fhtovp_t ffs_fhtovp; 105adf41577SPoul-Henning Kamp static vfs_sync_t ffs_sync; 106df8bae1dSRodney W. Grimes 107303b270bSEivind Eklund static struct vfsops ufs_vfsops = { 1087652131bSPoul-Henning Kamp .vfs_extattrctl = ffs_extattrctl, 1097652131bSPoul-Henning Kamp .vfs_fhtovp = ffs_fhtovp, 1107652131bSPoul-Henning Kamp .vfs_init = ffs_init, 11120a92a18SPoul-Henning Kamp .vfs_mount = ffs_mount, 11220a92a18SPoul-Henning Kamp .vfs_cmount = ffs_cmount, 1137652131bSPoul-Henning Kamp .vfs_quotactl = ufs_quotactl, 114e35cd9e3SMateusz Guzik .vfs_root = vfs_cache_root, 115e35cd9e3SMateusz Guzik .vfs_cachedroot = ufs_root, 1167652131bSPoul-Henning Kamp .vfs_statfs = ffs_statfs, 1177652131bSPoul-Henning Kamp .vfs_sync = ffs_sync, 1187652131bSPoul-Henning Kamp .vfs_uninit = ffs_uninit, 1197652131bSPoul-Henning Kamp .vfs_unmount = ffs_unmount, 1207652131bSPoul-Henning Kamp .vfs_vget = ffs_vget, 1212814d5baSKonstantin Belousov .vfs_susp_clean = process_deferred_inactive, 122df8bae1dSRodney W. Grimes }; 123df8bae1dSRodney W. Grimes 1248994ca3cSBruce Evans VFS_SET(ufs_vfsops, ufs, 0); 1255fe6d2beSPawel Jakub Dawidek MODULE_VERSION(ufs, 1); 126c901836cSGarrett Wollman 1276e77a041SPoul-Henning Kamp static b_strategy_t ffs_geom_strategy; 128dd19a799SPoul-Henning Kamp static b_write_t ffs_bufwrite; 1296e77a041SPoul-Henning Kamp 1306e77a041SPoul-Henning Kamp static struct buf_ops ffs_ops = { 1316e77a041SPoul-Henning Kamp .bop_name = "FFS", 132dd19a799SPoul-Henning Kamp .bop_write = ffs_bufwrite, 1336e77a041SPoul-Henning Kamp .bop_strategy = ffs_geom_strategy, 1346ef8480aSPoul-Henning Kamp .bop_sync = bufsync, 1352cc7d26fSKonstantin Belousov #ifdef NO_FFS_SNAPSHOT 1362cc7d26fSKonstantin Belousov .bop_bdflush = bufbdflush, 1372cc7d26fSKonstantin Belousov #else 1382cc7d26fSKonstantin Belousov .bop_bdflush = ffs_bdflush, 1392cc7d26fSKonstantin Belousov #endif 1406e77a041SPoul-Henning Kamp }; 1416e77a041SPoul-Henning Kamp 1420b962648SAndriy Gapon /* 1430b962648SAndriy Gapon * Note that userquota and groupquota options are not currently used 1440b962648SAndriy Gapon * by UFS/FFS code and generally mount(8) does not pass those options 1450b962648SAndriy Gapon * from userland, but they can be passed by loader(8) via 1460b962648SAndriy Gapon * vfs.root.mountfrom.options. 1470b962648SAndriy Gapon */ 148d952ba1bSJohn Baldwin static const char *ffs_opts[] = { "acls", "async", "noatime", "noclusterr", 1490b962648SAndriy Gapon "noclusterw", "noexec", "export", "force", "from", "groupquota", 150927a12aeSKirk McKusick "multilabel", "nfsv4acls", "fsckpid", "snapshot", "nosuid", "suiddir", 151daba4da8SKirk McKusick "nosymfollow", "sync", "union", "userquota", "untrusted", NULL }; 15220a92a18SPoul-Henning Kamp 153d79ff54bSChuck Silvers static int ffs_enxio_enable = 1; 154d79ff54bSChuck Silvers SYSCTL_DECL(_vfs_ffs); 155d79ff54bSChuck Silvers SYSCTL_INT(_vfs_ffs, OID_AUTO, enxio_enable, CTLFLAG_RWTUN, 156d79ff54bSChuck Silvers &ffs_enxio_enable, 0, 157d79ff54bSChuck Silvers "enable mapping of other disk I/O errors to ENXIO"); 158d79ff54bSChuck Silvers 159d9a8abf6SChuck Silvers /* 160d9a8abf6SChuck Silvers * Return buffer with the contents of block "offset" from the beginning of 161d9a8abf6SChuck Silvers * directory "ip". If "res" is non-zero, fill it in with a pointer to the 162d9a8abf6SChuck Silvers * remaining space in the directory. 163d9a8abf6SChuck Silvers */ 164d9a8abf6SChuck Silvers static int 165d9a8abf6SChuck Silvers ffs_blkatoff(struct vnode *vp, off_t offset, char **res, struct buf **bpp) 166d9a8abf6SChuck Silvers { 167d9a8abf6SChuck Silvers struct inode *ip; 168d9a8abf6SChuck Silvers struct fs *fs; 169d9a8abf6SChuck Silvers struct buf *bp; 170d9a8abf6SChuck Silvers ufs_lbn_t lbn; 171d9a8abf6SChuck Silvers int bsize, error; 172d9a8abf6SChuck Silvers 173d9a8abf6SChuck Silvers ip = VTOI(vp); 174d9a8abf6SChuck Silvers fs = ITOFS(ip); 175d9a8abf6SChuck Silvers lbn = lblkno(fs, offset); 176d9a8abf6SChuck Silvers bsize = blksize(fs, ip, lbn); 177d9a8abf6SChuck Silvers 178d9a8abf6SChuck Silvers *bpp = NULL; 179d9a8abf6SChuck Silvers error = bread(vp, lbn, bsize, NOCRED, &bp); 180d9a8abf6SChuck Silvers if (error) { 181d9a8abf6SChuck Silvers return (error); 182d9a8abf6SChuck Silvers } 183d9a8abf6SChuck Silvers if (res) 184d9a8abf6SChuck Silvers *res = (char *)bp->b_data + blkoff(fs, offset); 185d9a8abf6SChuck Silvers *bpp = bp; 186d9a8abf6SChuck Silvers return (0); 187d9a8abf6SChuck Silvers } 188d9a8abf6SChuck Silvers 189d9a8abf6SChuck Silvers /* 190d9a8abf6SChuck Silvers * Load up the contents of an inode and copy the appropriate pieces 191d9a8abf6SChuck Silvers * to the incore copy. 192d9a8abf6SChuck Silvers */ 193d9a8abf6SChuck Silvers static int 194d9a8abf6SChuck Silvers ffs_load_inode(struct buf *bp, struct inode *ip, struct fs *fs, ino_t ino) 195d9a8abf6SChuck Silvers { 196d9a8abf6SChuck Silvers struct ufs1_dinode *dip1; 197d9a8abf6SChuck Silvers struct ufs2_dinode *dip2; 198d9a8abf6SChuck Silvers int error; 199d9a8abf6SChuck Silvers 200d9a8abf6SChuck Silvers if (I_IS_UFS1(ip)) { 201d9a8abf6SChuck Silvers dip1 = ip->i_din1; 202d9a8abf6SChuck Silvers *dip1 = 203d9a8abf6SChuck Silvers *((struct ufs1_dinode *)bp->b_data + ino_to_fsbo(fs, ino)); 204d9a8abf6SChuck Silvers ip->i_mode = dip1->di_mode; 205d9a8abf6SChuck Silvers ip->i_nlink = dip1->di_nlink; 206d9a8abf6SChuck Silvers ip->i_effnlink = dip1->di_nlink; 207d9a8abf6SChuck Silvers ip->i_size = dip1->di_size; 208d9a8abf6SChuck Silvers ip->i_flags = dip1->di_flags; 209d9a8abf6SChuck Silvers ip->i_gen = dip1->di_gen; 210d9a8abf6SChuck Silvers ip->i_uid = dip1->di_uid; 211d9a8abf6SChuck Silvers ip->i_gid = dip1->di_gid; 212d9a8abf6SChuck Silvers return (0); 213d9a8abf6SChuck Silvers } 214d9a8abf6SChuck Silvers dip2 = ((struct ufs2_dinode *)bp->b_data + ino_to_fsbo(fs, ino)); 215d9a8abf6SChuck Silvers if ((error = ffs_verify_dinode_ckhash(fs, dip2)) != 0 && 216d9a8abf6SChuck Silvers !ffs_fsfail_cleanup(ITOUMP(ip), error)) { 217d9a8abf6SChuck Silvers printf("%s: inode %jd: check-hash failed\n", fs->fs_fsmnt, 218d9a8abf6SChuck Silvers (intmax_t)ino); 219d9a8abf6SChuck Silvers return (error); 220d9a8abf6SChuck Silvers } 221d9a8abf6SChuck Silvers *ip->i_din2 = *dip2; 222d9a8abf6SChuck Silvers dip2 = ip->i_din2; 223d9a8abf6SChuck Silvers ip->i_mode = dip2->di_mode; 224d9a8abf6SChuck Silvers ip->i_nlink = dip2->di_nlink; 225d9a8abf6SChuck Silvers ip->i_effnlink = dip2->di_nlink; 226d9a8abf6SChuck Silvers ip->i_size = dip2->di_size; 227d9a8abf6SChuck Silvers ip->i_flags = dip2->di_flags; 228d9a8abf6SChuck Silvers ip->i_gen = dip2->di_gen; 229d9a8abf6SChuck Silvers ip->i_uid = dip2->di_uid; 230d9a8abf6SChuck Silvers ip->i_gid = dip2->di_gid; 231d9a8abf6SChuck Silvers return (0); 232d9a8abf6SChuck Silvers } 233d9a8abf6SChuck Silvers 234d9a8abf6SChuck Silvers /* 235d9a8abf6SChuck Silvers * Verify that a filesystem block number is a valid data block. 236d9a8abf6SChuck Silvers * This routine is only called on untrusted filesystems. 237d9a8abf6SChuck Silvers */ 238d9a8abf6SChuck Silvers static int 239d9a8abf6SChuck Silvers ffs_check_blkno(struct mount *mp, ino_t inum, ufs2_daddr_t daddr, int blksize) 240d9a8abf6SChuck Silvers { 241d9a8abf6SChuck Silvers struct fs *fs; 242d9a8abf6SChuck Silvers struct ufsmount *ump; 243d9a8abf6SChuck Silvers ufs2_daddr_t end_daddr; 244d9a8abf6SChuck Silvers int cg, havemtx; 245d9a8abf6SChuck Silvers 246d9a8abf6SChuck Silvers KASSERT((mp->mnt_flag & MNT_UNTRUSTED) != 0, 247d9a8abf6SChuck Silvers ("ffs_check_blkno called on a trusted file system")); 248d9a8abf6SChuck Silvers ump = VFSTOUFS(mp); 249d9a8abf6SChuck Silvers fs = ump->um_fs; 250d9a8abf6SChuck Silvers cg = dtog(fs, daddr); 251d9a8abf6SChuck Silvers end_daddr = daddr + numfrags(fs, blksize); 252d9a8abf6SChuck Silvers /* 253d9a8abf6SChuck Silvers * Verify that the block number is a valid data block. Also check 254d9a8abf6SChuck Silvers * that it does not point to an inode block or a superblock. Accept 255d9a8abf6SChuck Silvers * blocks that are unalloacted (0) or part of snapshot metadata 256d9a8abf6SChuck Silvers * (BLK_NOCOPY or BLK_SNAP). 257d9a8abf6SChuck Silvers * 258d9a8abf6SChuck Silvers * Thus, the block must be in a valid range for the filesystem and 259d9a8abf6SChuck Silvers * either in the space before a backup superblock (except the first 260d9a8abf6SChuck Silvers * cylinder group where that space is used by the bootstrap code) or 261d9a8abf6SChuck Silvers * after the inode blocks and before the end of the cylinder group. 262d9a8abf6SChuck Silvers */ 263d9a8abf6SChuck Silvers if ((uint64_t)daddr <= BLK_SNAP || 264d9a8abf6SChuck Silvers ((uint64_t)end_daddr <= fs->fs_size && 265d9a8abf6SChuck Silvers ((cg > 0 && end_daddr <= cgsblock(fs, cg)) || 266d9a8abf6SChuck Silvers (daddr >= cgdmin(fs, cg) && 267d9a8abf6SChuck Silvers end_daddr <= cgbase(fs, cg) + fs->fs_fpg)))) 268d9a8abf6SChuck Silvers return (0); 269d9a8abf6SChuck Silvers if ((havemtx = mtx_owned(UFS_MTX(ump))) == 0) 270d9a8abf6SChuck Silvers UFS_LOCK(ump); 271d9a8abf6SChuck Silvers if (ppsratecheck(&ump->um_last_integritymsg, 272d9a8abf6SChuck Silvers &ump->um_secs_integritymsg, 1)) { 273d9a8abf6SChuck Silvers UFS_UNLOCK(ump); 274d9a8abf6SChuck Silvers uprintf("\n%s: inode %jd, out-of-range indirect block " 275d9a8abf6SChuck Silvers "number %jd\n", mp->mnt_stat.f_mntonname, inum, daddr); 276d9a8abf6SChuck Silvers if (havemtx) 277d9a8abf6SChuck Silvers UFS_LOCK(ump); 278d9a8abf6SChuck Silvers } else if (!havemtx) 279d9a8abf6SChuck Silvers UFS_UNLOCK(ump); 280d9a8abf6SChuck Silvers return (EINTEGRITY); 281d9a8abf6SChuck Silvers } 282d9a8abf6SChuck Silvers 283d9a8abf6SChuck Silvers /* 284d9a8abf6SChuck Silvers * Initiate a forcible unmount. 285d9a8abf6SChuck Silvers * Used to unmount filesystems whose underlying media has gone away. 286d9a8abf6SChuck Silvers */ 287d9a8abf6SChuck Silvers static void 288d9a8abf6SChuck Silvers ffs_fsfail_unmount(void *v, int pending) 289d9a8abf6SChuck Silvers { 290d9a8abf6SChuck Silvers struct fsfail_task *etp; 291d9a8abf6SChuck Silvers struct mount *mp; 292d9a8abf6SChuck Silvers 293d9a8abf6SChuck Silvers etp = v; 294d9a8abf6SChuck Silvers 295d9a8abf6SChuck Silvers /* 296d9a8abf6SChuck Silvers * Find our mount and get a ref on it, then try to unmount. 297d9a8abf6SChuck Silvers */ 298d9a8abf6SChuck Silvers mp = vfs_getvfs(&etp->fsid); 299d9a8abf6SChuck Silvers if (mp != NULL) 300d9a8abf6SChuck Silvers dounmount(mp, MNT_FORCE, curthread); 301d9a8abf6SChuck Silvers free(etp, M_UFSMNT); 302d9a8abf6SChuck Silvers } 303d9a8abf6SChuck Silvers 304d9a8abf6SChuck Silvers /* 305d9a8abf6SChuck Silvers * On first ENXIO error, start a task that forcibly unmounts the filesystem. 306d9a8abf6SChuck Silvers * 307d9a8abf6SChuck Silvers * Return true if a cleanup is in progress. 308d9a8abf6SChuck Silvers */ 309d9a8abf6SChuck Silvers int 310d9a8abf6SChuck Silvers ffs_fsfail_cleanup(struct ufsmount *ump, int error) 311d9a8abf6SChuck Silvers { 312d9a8abf6SChuck Silvers int retval; 313d9a8abf6SChuck Silvers 314d9a8abf6SChuck Silvers UFS_LOCK(ump); 315d9a8abf6SChuck Silvers retval = ffs_fsfail_cleanup_locked(ump, error); 316d9a8abf6SChuck Silvers UFS_UNLOCK(ump); 317d9a8abf6SChuck Silvers return (retval); 318d9a8abf6SChuck Silvers } 319d9a8abf6SChuck Silvers 320d9a8abf6SChuck Silvers int 321d9a8abf6SChuck Silvers ffs_fsfail_cleanup_locked(struct ufsmount *ump, int error) 322d9a8abf6SChuck Silvers { 323d9a8abf6SChuck Silvers struct fsfail_task *etp; 324d9a8abf6SChuck Silvers struct task *tp; 325d9a8abf6SChuck Silvers 326d9a8abf6SChuck Silvers mtx_assert(UFS_MTX(ump), MA_OWNED); 327d9a8abf6SChuck Silvers if (error == ENXIO && (ump->um_flags & UM_FSFAIL_CLEANUP) == 0) { 328d9a8abf6SChuck Silvers ump->um_flags |= UM_FSFAIL_CLEANUP; 329d9a8abf6SChuck Silvers /* 330d9a8abf6SChuck Silvers * Queue an async forced unmount. 331d9a8abf6SChuck Silvers */ 332d9a8abf6SChuck Silvers etp = ump->um_fsfail_task; 333d9a8abf6SChuck Silvers ump->um_fsfail_task = NULL; 334d9a8abf6SChuck Silvers if (etp != NULL) { 335d9a8abf6SChuck Silvers tp = &etp->task; 336d9a8abf6SChuck Silvers TASK_INIT(tp, 0, ffs_fsfail_unmount, etp); 337d9a8abf6SChuck Silvers taskqueue_enqueue(taskqueue_thread, tp); 338d9a8abf6SChuck Silvers printf("UFS: forcibly unmounting %s from %s\n", 339d9a8abf6SChuck Silvers ump->um_mountp->mnt_stat.f_mntfromname, 340d9a8abf6SChuck Silvers ump->um_mountp->mnt_stat.f_mntonname); 341d9a8abf6SChuck Silvers } 342d9a8abf6SChuck Silvers } 343d9a8abf6SChuck Silvers return ((ump->um_flags & UM_FSFAIL_CLEANUP) != 0); 344d9a8abf6SChuck Silvers } 345d9a8abf6SChuck Silvers 346d9a8abf6SChuck Silvers /* 347d9a8abf6SChuck Silvers * Wrapper used during ENXIO cleanup to allocate empty buffers when 348d9a8abf6SChuck Silvers * the kernel is unable to read the real one. They are needed so that 349d9a8abf6SChuck Silvers * the soft updates code can use them to unwind its dependencies. 350d9a8abf6SChuck Silvers */ 351d9a8abf6SChuck Silvers int 352d9a8abf6SChuck Silvers ffs_breadz(struct ufsmount *ump, struct vnode *vp, daddr_t lblkno, 353d9a8abf6SChuck Silvers daddr_t dblkno, int size, daddr_t *rablkno, int *rabsize, int cnt, 354d9a8abf6SChuck Silvers struct ucred *cred, int flags, void (*ckhashfunc)(struct buf *), 355d9a8abf6SChuck Silvers struct buf **bpp) 356d9a8abf6SChuck Silvers { 357d9a8abf6SChuck Silvers int error; 358d9a8abf6SChuck Silvers 359d9a8abf6SChuck Silvers flags |= GB_CVTENXIO; 360d9a8abf6SChuck Silvers error = breadn_flags(vp, lblkno, dblkno, size, rablkno, rabsize, cnt, 361d9a8abf6SChuck Silvers cred, flags, ckhashfunc, bpp); 362d9a8abf6SChuck Silvers if (error != 0 && ffs_fsfail_cleanup(ump, error)) { 363d9a8abf6SChuck Silvers error = getblkx(vp, lblkno, dblkno, size, 0, 0, flags, bpp); 364d9a8abf6SChuck Silvers KASSERT(error == 0, ("getblkx failed")); 365d9a8abf6SChuck Silvers vfs_bio_bzero_buf(*bpp, 0, size); 366d9a8abf6SChuck Silvers } 367d9a8abf6SChuck Silvers return (error); 368d9a8abf6SChuck Silvers } 369d9a8abf6SChuck Silvers 3705e8c582aSPoul-Henning Kamp static int 371dfd233edSAttilio Rao ffs_mount(struct mount *mp) 372df8bae1dSRodney W. Grimes { 373f15ccf88SChuck Silvers struct vnode *devvp, *odevvp; 374dfd233edSAttilio Rao struct thread *td; 375f7a3729cSKevin Lo struct ufsmount *ump = NULL; 37605f4ff5dSPoul-Henning Kamp struct fs *fs; 377927a12aeSKirk McKusick pid_t fsckpid = 0; 378714b7df5SKonstantin Belousov int error, error1, flags; 3795ffc99e2SKonstantin Belousov uint64_t mntorflags, saved_mnt_flag; 38015bc6b2bSEdward Tomasz Napierala accmode_t accmode; 3815e8c582aSPoul-Henning Kamp struct nameidata ndp; 38220a92a18SPoul-Henning Kamp char *fspec; 383df8bae1dSRodney W. Grimes 384dfd233edSAttilio Rao td = curthread; 38520a92a18SPoul-Henning Kamp if (vfs_filteropt(mp->mnt_optnew, ffs_opts)) 38620a92a18SPoul-Henning Kamp return (EINVAL); 387aa4d7a8aSPoul-Henning Kamp if (uma_inode == NULL) { 388aa4d7a8aSPoul-Henning Kamp uma_inode = uma_zcreate("FFS inode", 389aa4d7a8aSPoul-Henning Kamp sizeof(struct inode), NULL, NULL, NULL, NULL, 390aa4d7a8aSPoul-Henning Kamp UMA_ALIGN_PTR, 0); 391aa4d7a8aSPoul-Henning Kamp uma_ufs1 = uma_zcreate("FFS1 dinode", 392aa4d7a8aSPoul-Henning Kamp sizeof(struct ufs1_dinode), NULL, NULL, NULL, NULL, 393aa4d7a8aSPoul-Henning Kamp UMA_ALIGN_PTR, 0); 394aa4d7a8aSPoul-Henning Kamp uma_ufs2 = uma_zcreate("FFS2 dinode", 395aa4d7a8aSPoul-Henning Kamp sizeof(struct ufs2_dinode), NULL, NULL, NULL, NULL, 396aa4d7a8aSPoul-Henning Kamp UMA_ALIGN_PTR, 0); 3979d5a594fSMateusz Guzik VFS_SMR_ZONE_SET(uma_inode); 398aa4d7a8aSPoul-Henning Kamp } 3998d02a378SPawel Jakub Dawidek 4000b962648SAndriy Gapon vfs_deleteopt(mp->mnt_optnew, "groupquota"); 4010b962648SAndriy Gapon vfs_deleteopt(mp->mnt_optnew, "userquota"); 4020b962648SAndriy Gapon 40320a92a18SPoul-Henning Kamp fspec = vfs_getopts(mp->mnt_optnew, "from", &error); 40451ac12abSPoul-Henning Kamp if (error) 405f2a2857bSKirk McKusick return (error); 4062b14f991SJulian Elischer 4075da56ddbSTor Egge mntorflags = 0; 408daba4da8SKirk McKusick if (vfs_getopt(mp->mnt_optnew, "untrusted", NULL, NULL) == 0) 409daba4da8SKirk McKusick mntorflags |= MNT_UNTRUSTED; 410daba4da8SKirk McKusick 41126f59b64SCraig Rodrigues if (vfs_getopt(mp->mnt_optnew, "acls", NULL, NULL) == 0) 4125da56ddbSTor Egge mntorflags |= MNT_ACLS; 41326f59b64SCraig Rodrigues 414fb77e0afSCraig Rodrigues if (vfs_getopt(mp->mnt_optnew, "snapshot", NULL, NULL) == 0) { 4155da56ddbSTor Egge mntorflags |= MNT_SNAPSHOT; 416fb77e0afSCraig Rodrigues /* 417fb77e0afSCraig Rodrigues * Once we have set the MNT_SNAPSHOT flag, do not 418fb77e0afSCraig Rodrigues * persist "snapshot" in the options list. 419fb77e0afSCraig Rodrigues */ 420fb77e0afSCraig Rodrigues vfs_deleteopt(mp->mnt_optnew, "snapshot"); 421fb77e0afSCraig Rodrigues vfs_deleteopt(mp->mnt_opt, "snapshot"); 422fb77e0afSCraig Rodrigues } 42326f59b64SCraig Rodrigues 424927a12aeSKirk McKusick if (vfs_getopt(mp->mnt_optnew, "fsckpid", NULL, NULL) == 0 && 425927a12aeSKirk McKusick vfs_scanopt(mp->mnt_optnew, "fsckpid", "%d", &fsckpid) == 1) { 426927a12aeSKirk McKusick /* 427927a12aeSKirk McKusick * Once we have set the restricted PID, do not 428927a12aeSKirk McKusick * persist "fsckpid" in the options list. 429927a12aeSKirk McKusick */ 430927a12aeSKirk McKusick vfs_deleteopt(mp->mnt_optnew, "fsckpid"); 431927a12aeSKirk McKusick vfs_deleteopt(mp->mnt_opt, "fsckpid"); 432927a12aeSKirk McKusick if (mp->mnt_flag & MNT_UPDATE) { 433927a12aeSKirk McKusick if (VFSTOUFS(mp)->um_fs->fs_ronly == 0 && 434927a12aeSKirk McKusick vfs_flagopt(mp->mnt_optnew, "ro", NULL, 0) == 0) { 435b60ee81eSKirk McKusick vfs_mount_error(mp, 436b60ee81eSKirk McKusick "Checker enable: Must be read-only"); 437927a12aeSKirk McKusick return (EINVAL); 438927a12aeSKirk McKusick } 439927a12aeSKirk McKusick } else if (vfs_flagopt(mp->mnt_optnew, "ro", NULL, 0) == 0) { 440b60ee81eSKirk McKusick vfs_mount_error(mp, 441b60ee81eSKirk McKusick "Checker enable: Must be read-only"); 442927a12aeSKirk McKusick return (EINVAL); 443927a12aeSKirk McKusick } 444927a12aeSKirk McKusick /* Set to -1 if we are done */ 445927a12aeSKirk McKusick if (fsckpid == 0) 446927a12aeSKirk McKusick fsckpid = -1; 447927a12aeSKirk McKusick } 448927a12aeSKirk McKusick 4499340fc72SEdward Tomasz Napierala if (vfs_getopt(mp->mnt_optnew, "nfsv4acls", NULL, NULL) == 0) { 4509340fc72SEdward Tomasz Napierala if (mntorflags & MNT_ACLS) { 451b60ee81eSKirk McKusick vfs_mount_error(mp, 452b60ee81eSKirk McKusick "\"acls\" and \"nfsv4acls\" options " 453b60ee81eSKirk McKusick "are mutually exclusive"); 4549340fc72SEdward Tomasz Napierala return (EINVAL); 4559340fc72SEdward Tomasz Napierala } 4569340fc72SEdward Tomasz Napierala mntorflags |= MNT_NFS4ACLS; 4579340fc72SEdward Tomasz Napierala } 4589340fc72SEdward Tomasz Napierala 4595da56ddbSTor Egge MNT_ILOCK(mp); 4609d5a594fSMateusz Guzik mp->mnt_kern_flag &= ~MNTK_FPLOOKUP; 46161996181SEdward Tomasz Napierala mp->mnt_flag |= mntorflags; 4625da56ddbSTor Egge MNT_IUNLOCK(mp); 463df8bae1dSRodney W. Grimes /* 464df8bae1dSRodney W. Grimes * If updating, check whether changing from read-only to 465df8bae1dSRodney W. Grimes * read/write; if there is no device name, that's all we do. 466df8bae1dSRodney W. Grimes */ 467df8bae1dSRodney W. Grimes if (mp->mnt_flag & MNT_UPDATE) { 468df8bae1dSRodney W. Grimes ump = VFSTOUFS(mp); 469df8bae1dSRodney W. Grimes fs = ump->um_fs; 470f15ccf88SChuck Silvers odevvp = ump->um_odevvp; 47126cf9c3bSPeter Wemm devvp = ump->um_devvp; 472927a12aeSKirk McKusick if (fsckpid == -1 && ump->um_fsckpid > 0) { 473927a12aeSKirk McKusick if ((error = ffs_flushfiles(mp, WRITECLOSE, td)) != 0 || 474927a12aeSKirk McKusick (error = ffs_sbupdate(ump, MNT_WAIT, 0)) != 0) 475927a12aeSKirk McKusick return (error); 476927a12aeSKirk McKusick g_topology_lock(); 477927a12aeSKirk McKusick /* 478927a12aeSKirk McKusick * Return to normal read-only mode. 479927a12aeSKirk McKusick */ 480927a12aeSKirk McKusick error = g_access(ump->um_cp, 0, -1, 0); 481927a12aeSKirk McKusick g_topology_unlock(); 482927a12aeSKirk McKusick ump->um_fsckpid = 0; 483927a12aeSKirk McKusick } 48420a92a18SPoul-Henning Kamp if (fs->fs_ronly == 0 && 48520a92a18SPoul-Henning Kamp vfs_flagopt(mp->mnt_optnew, "ro", NULL, 0)) { 4866fecb4e4SKonstantin Belousov /* 4876fecb4e4SKonstantin Belousov * Flush any dirty data and suspend filesystem. 4886fecb4e4SKonstantin Belousov */ 489f2a2857bSKirk McKusick if ((error = vn_start_write(NULL, &mp, V_WAIT)) != 0) 490f2a2857bSKirk McKusick return (error); 491895b3782SKonstantin Belousov error = vfs_write_suspend_umnt(mp); 492895b3782SKonstantin Belousov if (error != 0) 4939ab73fd1SKirk McKusick return (error); 494cd600596SKirk McKusick /* 495cd600596SKirk McKusick * Check for and optionally get rid of files open 496cd600596SKirk McKusick * for writing. 497cd600596SKirk McKusick */ 498df8bae1dSRodney W. Grimes flags = WRITECLOSE; 499df8bae1dSRodney W. Grimes if (mp->mnt_flag & MNT_FORCE) 500df8bae1dSRodney W. Grimes flags |= FORCECLOSE; 501fddf7baeSKirk McKusick if (MOUNTEDSOFTDEP(mp)) { 502b40ce416SJulian Elischer error = softdep_flushfiles(mp, flags, td); 503b1897c19SJulian Elischer } else { 504b40ce416SJulian Elischer error = ffs_flushfiles(mp, flags, td); 505df8bae1dSRodney W. Grimes } 506f2a2857bSKirk McKusick if (error) { 507ddd6b3fcSKonstantin Belousov vfs_write_resume(mp, 0); 508f2a2857bSKirk McKusick return (error); 509b1897c19SJulian Elischer } 5109ccb939eSKirk McKusick if (fs->fs_pendingblocks != 0 || 5119ccb939eSKirk McKusick fs->fs_pendinginodes != 0) { 512b60ee81eSKirk McKusick printf("WARNING: %s Update error: blocks %jd " 513b60ee81eSKirk McKusick "files %d\n", fs->fs_fsmnt, 5141c85e6a3SKirk McKusick (intmax_t)fs->fs_pendingblocks, 5159ccb939eSKirk McKusick fs->fs_pendinginodes); 5169ccb939eSKirk McKusick fs->fs_pendingblocks = 0; 5179ccb939eSKirk McKusick fs->fs_pendinginodes = 0; 5189ccb939eSKirk McKusick } 5191a6a6610SKirk McKusick if ((fs->fs_flags & (FS_UNCLEAN | FS_NEEDSFSCK)) == 0) 520f2a2857bSKirk McKusick fs->fs_clean = 1; 521791dd2faSTor Egge if ((error = ffs_sbupdate(ump, MNT_WAIT, 0)) != 0) { 522f2a2857bSKirk McKusick fs->fs_ronly = 0; 523f2a2857bSKirk McKusick fs->fs_clean = 0; 524ddd6b3fcSKonstantin Belousov vfs_write_resume(mp, 0); 525f2a2857bSKirk McKusick return (error); 5262b14f991SJulian Elischer } 527fddf7baeSKirk McKusick if (MOUNTEDSOFTDEP(mp)) 5289420dc62SKirk McKusick softdep_unmount(mp); 52943920011SPoul-Henning Kamp g_topology_lock(); 5308795189cSKirk McKusick /* 5318795189cSKirk McKusick * Drop our write and exclusive access. 5328795189cSKirk McKusick */ 5338795189cSKirk McKusick g_access(ump->um_cp, 0, -1, -1); 53443920011SPoul-Henning Kamp g_topology_unlock(); 53520a92a18SPoul-Henning Kamp fs->fs_ronly = 1; 5365da56ddbSTor Egge MNT_ILOCK(mp); 53720a92a18SPoul-Henning Kamp mp->mnt_flag |= MNT_RDONLY; 5385da56ddbSTor Egge MNT_IUNLOCK(mp); 5396fecb4e4SKonstantin Belousov /* 5406fecb4e4SKonstantin Belousov * Allow the writers to note that filesystem 5416fecb4e4SKonstantin Belousov * is ro now. 5426fecb4e4SKonstantin Belousov */ 543ddd6b3fcSKonstantin Belousov vfs_write_resume(mp, 0); 544f2a2857bSKirk McKusick } 545f2a2857bSKirk McKusick if ((mp->mnt_flag & MNT_RELOAD) && 5461848286aSEdward Tomasz Napierala (error = ffs_reload(mp, td, 0)) != 0) 547f2a2857bSKirk McKusick return (error); 54820a92a18SPoul-Henning Kamp if (fs->fs_ronly && 54920a92a18SPoul-Henning Kamp !vfs_flagopt(mp->mnt_optnew, "ro", NULL, 0)) { 550c9b99213SBruce Evans /* 551927a12aeSKirk McKusick * If we are running a checker, do not allow upgrade. 552927a12aeSKirk McKusick */ 553927a12aeSKirk McKusick if (ump->um_fsckpid > 0) { 554b60ee81eSKirk McKusick vfs_mount_error(mp, 555b60ee81eSKirk McKusick "Active checker, cannot upgrade to write"); 556927a12aeSKirk McKusick return (EINVAL); 557927a12aeSKirk McKusick } 558927a12aeSKirk McKusick /* 559c9b99213SBruce Evans * If upgrade to read-write by non-root, then verify 560c9b99213SBruce Evans * that user has necessary permissions on the device. 561c9b99213SBruce Evans */ 562f15ccf88SChuck Silvers vn_lock(odevvp, LK_EXCLUSIVE | LK_RETRY); 563f15ccf88SChuck Silvers error = VOP_ACCESS(odevvp, VREAD | VWRITE, 564acd3428bSRobert Watson td->td_ucred, td); 565acd3428bSRobert Watson if (error) 566acd3428bSRobert Watson error = priv_check(td, PRIV_VFS_MOUNT_PERM); 567f15ccf88SChuck Silvers VOP_UNLOCK(odevvp); 568acd3428bSRobert Watson if (error) { 569c9b99213SBruce Evans return (error); 570c9b99213SBruce Evans } 5717e58bfacSBruce Evans fs->fs_flags &= ~FS_UNCLEAN; 5720922cce6SBruce Evans if (fs->fs_clean == 0) { 5737e58bfacSBruce Evans fs->fs_flags |= FS_UNCLEAN; 574812b1d41SKirk McKusick if ((mp->mnt_flag & MNT_FORCE) || 575113db2ddSJeff Roberson ((fs->fs_flags & 576113db2ddSJeff Roberson (FS_SUJ | FS_NEEDSFSCK)) == 0 && 5771a6a6610SKirk McKusick (fs->fs_flags & FS_DOSOFTDEP))) { 578b60ee81eSKirk McKusick printf("WARNING: %s was not properly " 579b60ee81eSKirk McKusick "dismounted\n", fs->fs_fsmnt); 5800922cce6SBruce Evans } else { 581b60ee81eSKirk McKusick vfs_mount_error(mp, 582b60ee81eSKirk McKusick "R/W mount of %s denied. %s.%s", 583b60ee81eSKirk McKusick fs->fs_fsmnt, 584b60ee81eSKirk McKusick "Filesystem is not clean - run fsck", 585b60ee81eSKirk McKusick (fs->fs_flags & FS_SUJ) == 0 ? "" : 586b60ee81eSKirk McKusick " Forced mount will invalidate" 587b60ee81eSKirk McKusick " journal contents"); 588f2a2857bSKirk McKusick return (EPERM); 5890922cce6SBruce Evans } 5900922cce6SBruce Evans } 59140c340aaSPoul-Henning Kamp g_topology_lock(); 59240c340aaSPoul-Henning Kamp /* 5938795189cSKirk McKusick * Request exclusive write access. 59440c340aaSPoul-Henning Kamp */ 59540c340aaSPoul-Henning Kamp error = g_access(ump->um_cp, 0, 1, 1); 59640c340aaSPoul-Henning Kamp g_topology_unlock(); 59740c340aaSPoul-Henning Kamp if (error) 59840c340aaSPoul-Henning Kamp return (error); 599f2a2857bSKirk McKusick if ((error = vn_start_write(NULL, &mp, V_WAIT)) != 0) 600f2a2857bSKirk McKusick return (error); 6015ffc99e2SKonstantin Belousov error = vfs_write_suspend_umnt(mp); 6025ffc99e2SKonstantin Belousov if (error != 0) 6035ffc99e2SKonstantin Belousov return (error); 604f2a2857bSKirk McKusick fs->fs_ronly = 0; 6055da56ddbSTor Egge MNT_ILOCK(mp); 6065ffc99e2SKonstantin Belousov saved_mnt_flag = MNT_RDONLY; 6075ffc99e2SKonstantin Belousov if (MOUNTEDSOFTDEP(mp) && (mp->mnt_flag & 6085ffc99e2SKonstantin Belousov MNT_ASYNC) != 0) 6095ffc99e2SKonstantin Belousov saved_mnt_flag |= MNT_ASYNC; 6105ffc99e2SKonstantin Belousov mp->mnt_flag &= ~saved_mnt_flag; 6115da56ddbSTor Egge MNT_IUNLOCK(mp); 612113db2ddSJeff Roberson fs->fs_mtime = time_second; 61326cf9c3bSPeter Wemm /* check to see if we need to start softdep */ 614f2a2857bSKirk McKusick if ((fs->fs_flags & FS_DOSOFTDEP) && 615a854ed98SJohn Baldwin (error = softdep_mount(devvp, mp, fs, td->td_ucred))){ 6165ffc99e2SKonstantin Belousov fs->fs_ronly = 1; 6175ffc99e2SKonstantin Belousov MNT_ILOCK(mp); 6185ffc99e2SKonstantin Belousov mp->mnt_flag |= saved_mnt_flag; 6195ffc99e2SKonstantin Belousov MNT_IUNLOCK(mp); 6205ffc99e2SKonstantin Belousov vfs_write_resume(mp, 0); 621f2a2857bSKirk McKusick return (error); 62226cf9c3bSPeter Wemm } 623113db2ddSJeff Roberson fs->fs_clean = 0; 624113db2ddSJeff Roberson if ((error = ffs_sbupdate(ump, MNT_WAIT, 0)) != 0) { 6255ffc99e2SKonstantin Belousov fs->fs_ronly = 1; 6265ffc99e2SKonstantin Belousov MNT_ILOCK(mp); 6275ffc99e2SKonstantin Belousov mp->mnt_flag |= saved_mnt_flag; 6285ffc99e2SKonstantin Belousov MNT_IUNLOCK(mp); 6295ffc99e2SKonstantin Belousov vfs_write_resume(mp, 0); 630113db2ddSJeff Roberson return (error); 631113db2ddSJeff Roberson } 632f2a2857bSKirk McKusick if (fs->fs_snapinum[0] != 0) 633f2a2857bSKirk McKusick ffs_snapshot_mount(mp); 6345ffc99e2SKonstantin Belousov vfs_write_resume(mp, 0); 6351469eec8SDavid Greenman } 636c11d2981SJulian Elischer /* 637c11d2981SJulian Elischer * Soft updates is incompatible with "async", 638c11d2981SJulian Elischer * so if we are doing softupdates stop the user 639c11d2981SJulian Elischer * from setting the async flag in an update. 640c11d2981SJulian Elischer * Softdep_mount() clears it in an initial mount 641c11d2981SJulian Elischer * or ro->rw remount. 642c11d2981SJulian Elischer */ 643fddf7baeSKirk McKusick if (MOUNTEDSOFTDEP(mp)) { 6445da56ddbSTor Egge /* XXX: Reset too late ? */ 6455da56ddbSTor Egge MNT_ILOCK(mp); 646c11d2981SJulian Elischer mp->mnt_flag &= ~MNT_ASYNC; 6475da56ddbSTor Egge MNT_IUNLOCK(mp); 6485da56ddbSTor Egge } 649df8bae1dSRodney W. Grimes /* 65039cfb239SPawel Jakub Dawidek * Keep MNT_ACLS flag if it is stored in superblock. 65139cfb239SPawel Jakub Dawidek */ 6525da56ddbSTor Egge if ((fs->fs_flags & FS_ACLS) != 0) { 6535da56ddbSTor Egge /* XXX: Set too late ? */ 6545da56ddbSTor Egge MNT_ILOCK(mp); 65539cfb239SPawel Jakub Dawidek mp->mnt_flag |= MNT_ACLS; 6565da56ddbSTor Egge MNT_IUNLOCK(mp); 6575da56ddbSTor Egge } 658cea90362SCraig Rodrigues 6599340fc72SEdward Tomasz Napierala if ((fs->fs_flags & FS_NFS4ACLS) != 0) { 6609340fc72SEdward Tomasz Napierala /* XXX: Set too late ? */ 6619340fc72SEdward Tomasz Napierala MNT_ILOCK(mp); 6629340fc72SEdward Tomasz Napierala mp->mnt_flag |= MNT_NFS4ACLS; 6639340fc72SEdward Tomasz Napierala MNT_IUNLOCK(mp); 6649340fc72SEdward Tomasz Napierala } 665927a12aeSKirk McKusick /* 666927a12aeSKirk McKusick * If this is a request from fsck to clean up the filesystem, 667927a12aeSKirk McKusick * then allow the specified pid to proceed. 668927a12aeSKirk McKusick */ 669927a12aeSKirk McKusick if (fsckpid > 0) { 670927a12aeSKirk McKusick if (ump->um_fsckpid != 0) { 671b60ee81eSKirk McKusick vfs_mount_error(mp, 672b60ee81eSKirk McKusick "Active checker already running on %s", 673927a12aeSKirk McKusick fs->fs_fsmnt); 674927a12aeSKirk McKusick return (EINVAL); 675927a12aeSKirk McKusick } 676fddf7baeSKirk McKusick KASSERT(MOUNTEDSOFTDEP(mp) == 0, 677927a12aeSKirk McKusick ("soft updates enabled on read-only file system")); 678927a12aeSKirk McKusick g_topology_lock(); 679927a12aeSKirk McKusick /* 680927a12aeSKirk McKusick * Request write access. 681927a12aeSKirk McKusick */ 682927a12aeSKirk McKusick error = g_access(ump->um_cp, 0, 1, 0); 683927a12aeSKirk McKusick g_topology_unlock(); 684927a12aeSKirk McKusick if (error) { 685b60ee81eSKirk McKusick vfs_mount_error(mp, 686b60ee81eSKirk McKusick "Checker activation failed on %s", 687927a12aeSKirk McKusick fs->fs_fsmnt); 688927a12aeSKirk McKusick return (error); 689927a12aeSKirk McKusick } 690927a12aeSKirk McKusick ump->um_fsckpid = fsckpid; 691927a12aeSKirk McKusick if (fs->fs_snapinum[0] != 0) 692927a12aeSKirk McKusick ffs_snapshot_mount(mp); 693927a12aeSKirk McKusick fs->fs_mtime = time_second; 694927a12aeSKirk McKusick fs->fs_fmod = 1; 695927a12aeSKirk McKusick fs->fs_clean = 0; 696927a12aeSKirk McKusick (void) ffs_sbupdate(ump, MNT_WAIT, 0); 697927a12aeSKirk McKusick } 6989340fc72SEdward Tomasz Napierala 699f2a2857bSKirk McKusick /* 700f2a2857bSKirk McKusick * If this is a snapshot request, take the snapshot. 701f2a2857bSKirk McKusick */ 702f2a2857bSKirk McKusick if (mp->mnt_flag & MNT_SNAPSHOT) 70320a92a18SPoul-Henning Kamp return (ffs_snapshot(mp, fspec)); 704714b7df5SKonstantin Belousov 705714b7df5SKonstantin Belousov /* 706714b7df5SKonstantin Belousov * Must not call namei() while owning busy ref. 707714b7df5SKonstantin Belousov */ 708714b7df5SKonstantin Belousov vfs_unbusy(mp); 709df8bae1dSRodney W. Grimes } 7102b14f991SJulian Elischer 711df8bae1dSRodney W. Grimes /* 712df8bae1dSRodney W. Grimes * Not an update, or updating the name: look up the name 713e9827c6dSBruce Evans * and verify that it refers to a sensible disk device. 714df8bae1dSRodney W. Grimes */ 715fdedad76SSuleiman Souhlal NDINIT(&ndp, LOOKUP, FOLLOW | LOCKLEAF, UIO_SYSSPACE, fspec, td); 716714b7df5SKonstantin Belousov error = namei(&ndp); 717714b7df5SKonstantin Belousov if ((mp->mnt_flag & MNT_UPDATE) != 0) { 718714b7df5SKonstantin Belousov /* 719714b7df5SKonstantin Belousov * Unmount does not start if MNT_UPDATE is set. Mount 720714b7df5SKonstantin Belousov * update busies mp before setting MNT_UPDATE. We 721714b7df5SKonstantin Belousov * must be able to retain our busy ref succesfully, 722714b7df5SKonstantin Belousov * without sleep. 723714b7df5SKonstantin Belousov */ 724714b7df5SKonstantin Belousov error1 = vfs_busy(mp, MBF_NOWAIT); 725714b7df5SKonstantin Belousov MPASS(error1 == 0); 726714b7df5SKonstantin Belousov } 727714b7df5SKonstantin Belousov if (error != 0) 728f2a2857bSKirk McKusick return (error); 7295e8c582aSPoul-Henning Kamp NDFREE(&ndp, NDF_ONLY_PNBUF); 7305e8c582aSPoul-Henning Kamp devvp = ndp.ni_vp; 7317ad2a82dSMateusz Guzik if (!vn_isdisk_error(devvp, &error)) { 732fdedad76SSuleiman Souhlal vput(devvp); 733f2a2857bSKirk McKusick return (error); 734f2a2857bSKirk McKusick } 735c9b99213SBruce Evans 736c9b99213SBruce Evans /* 737c9b99213SBruce Evans * If mount by non-root, then verify that user has necessary 738c9b99213SBruce Evans * permissions on the device. 739c9b99213SBruce Evans */ 74015bc6b2bSEdward Tomasz Napierala accmode = VREAD; 741c9b99213SBruce Evans if ((mp->mnt_flag & MNT_RDONLY) == 0) 74215bc6b2bSEdward Tomasz Napierala accmode |= VWRITE; 74315bc6b2bSEdward Tomasz Napierala error = VOP_ACCESS(devvp, accmode, td->td_ucred, td); 744acd3428bSRobert Watson if (error) 745acd3428bSRobert Watson error = priv_check(td, PRIV_VFS_MOUNT_PERM); 746acd3428bSRobert Watson if (error) { 747c9b99213SBruce Evans vput(devvp); 748c9b99213SBruce Evans return (error); 749c9b99213SBruce Evans } 750c9b99213SBruce Evans 7512b14f991SJulian Elischer if (mp->mnt_flag & MNT_UPDATE) { 7522b14f991SJulian Elischer /* 753f2a2857bSKirk McKusick * Update only 754f2a2857bSKirk McKusick * 7553e425b96SJulian Elischer * If it's not the same vnode, or at least the same device 7563e425b96SJulian Elischer * then it's not correct. 7572b14f991SJulian Elischer */ 7582b14f991SJulian Elischer 75943920011SPoul-Henning Kamp if (devvp->v_rdev != ump->um_devvp->v_rdev) 760f2a2857bSKirk McKusick error = EINVAL; /* needs translation */ 761fdedad76SSuleiman Souhlal vput(devvp); 762f2a2857bSKirk McKusick if (error) 763f2a2857bSKirk McKusick return (error); 7642b14f991SJulian Elischer } else { 7652b14f991SJulian Elischer /* 766f2a2857bSKirk McKusick * New mount 7672b14f991SJulian Elischer * 768f2a2857bSKirk McKusick * We need the name for the mount point (also used for 769f2a2857bSKirk McKusick * "last mounted on") copied in. If an error occurs, 770f2a2857bSKirk McKusick * the mount point is discarded by the upper level code. 77198cbffd7SKonstantin Belousov * Note that vfs_mount_alloc() populates f_mntonname for us. 772f2a2857bSKirk McKusick */ 773975512a9SPoul-Henning Kamp if ((error = ffs_mountfs(devvp, mp, td)) != 0) { 774f2a2857bSKirk McKusick vrele(devvp); 775f2a2857bSKirk McKusick return (error); 776f2a2857bSKirk McKusick } 777927a12aeSKirk McKusick if (fsckpid > 0) { 778fddf7baeSKirk McKusick KASSERT(MOUNTEDSOFTDEP(mp) == 0, 779927a12aeSKirk McKusick ("soft updates enabled on read-only file system")); 780927a12aeSKirk McKusick ump = VFSTOUFS(mp); 781927a12aeSKirk McKusick fs = ump->um_fs; 782927a12aeSKirk McKusick g_topology_lock(); 783927a12aeSKirk McKusick /* 784927a12aeSKirk McKusick * Request write access. 785927a12aeSKirk McKusick */ 786927a12aeSKirk McKusick error = g_access(ump->um_cp, 0, 1, 0); 787927a12aeSKirk McKusick g_topology_unlock(); 788927a12aeSKirk McKusick if (error) { 789b60ee81eSKirk McKusick printf("WARNING: %s: Checker activation " 790b60ee81eSKirk McKusick "failed\n", fs->fs_fsmnt); 791927a12aeSKirk McKusick } else { 792927a12aeSKirk McKusick ump->um_fsckpid = fsckpid; 793927a12aeSKirk McKusick if (fs->fs_snapinum[0] != 0) 794927a12aeSKirk McKusick ffs_snapshot_mount(mp); 795927a12aeSKirk McKusick fs->fs_mtime = time_second; 796927a12aeSKirk McKusick fs->fs_clean = 0; 797927a12aeSKirk McKusick (void) ffs_sbupdate(ump, MNT_WAIT, 0); 798927a12aeSKirk McKusick } 799927a12aeSKirk McKusick } 800f2a2857bSKirk McKusick } 8019d5a594fSMateusz Guzik 8029d5a594fSMateusz Guzik MNT_ILOCK(mp); 8039d5a594fSMateusz Guzik /* 8049d5a594fSMateusz Guzik * This is racy versus lookup, see ufs_fplookup_vexec for details. 8059d5a594fSMateusz Guzik */ 8069d5a594fSMateusz Guzik if ((mp->mnt_kern_flag & MNTK_FPLOOKUP) != 0) 8079d5a594fSMateusz Guzik panic("MNTK_FPLOOKUP set on mount %p when it should not be", mp); 80803337743SMateusz Guzik if ((mp->mnt_flag & (MNT_ACLS | MNT_NFS4ACLS | MNT_UNION)) == 0) 8099d5a594fSMateusz Guzik mp->mnt_kern_flag |= MNTK_FPLOOKUP; 8109d5a594fSMateusz Guzik MNT_IUNLOCK(mp); 8119d5a594fSMateusz Guzik 81220a92a18SPoul-Henning Kamp vfs_mountedfrom(mp, fspec); 813f2a2857bSKirk McKusick return (0); 8142b14f991SJulian Elischer } 8152b14f991SJulian Elischer 816df8bae1dSRodney W. Grimes /* 81720a92a18SPoul-Henning Kamp * Compatibility with old mount system call. 81820a92a18SPoul-Henning Kamp */ 81920a92a18SPoul-Henning Kamp 82020a92a18SPoul-Henning Kamp static int 821cc672d35SKirk McKusick ffs_cmount(struct mntarg *ma, void *data, uint64_t flags) 82220a92a18SPoul-Henning Kamp { 82320a92a18SPoul-Henning Kamp struct ufs_args args; 82420a92a18SPoul-Henning Kamp int error; 82520a92a18SPoul-Henning Kamp 82620a92a18SPoul-Henning Kamp if (data == NULL) 82720a92a18SPoul-Henning Kamp return (EINVAL); 82820a92a18SPoul-Henning Kamp error = copyin(data, &args, sizeof args); 82920a92a18SPoul-Henning Kamp if (error) 83020a92a18SPoul-Henning Kamp return (error); 83120a92a18SPoul-Henning Kamp 83220a92a18SPoul-Henning Kamp ma = mount_argsu(ma, "from", args.fspec, MAXPATHLEN); 8331f7104d7SRick Macklem ma = mount_arg(ma, "export", &args.export, sizeof(args.export)); 83420a92a18SPoul-Henning Kamp error = kernel_mount(ma, flags); 83520a92a18SPoul-Henning Kamp 83620a92a18SPoul-Henning Kamp return (error); 83720a92a18SPoul-Henning Kamp } 83820a92a18SPoul-Henning Kamp 83920a92a18SPoul-Henning Kamp /* 840df8bae1dSRodney W. Grimes * Reload all incore data for a filesystem (used after running fsck on 8411848286aSEdward Tomasz Napierala * the root filesystem and finding things to fix). If the 'force' flag 8421848286aSEdward Tomasz Napierala * is 0, the filesystem must be mounted read-only. 843df8bae1dSRodney W. Grimes * 844df8bae1dSRodney W. Grimes * Things to do to update the mount: 845df8bae1dSRodney W. Grimes * 1) invalidate all cached meta-data. 846df8bae1dSRodney W. Grimes * 2) re-read superblock from disk. 847df8bae1dSRodney W. Grimes * 3) re-read summary information from disk. 848df8bae1dSRodney W. Grimes * 4) invalidate all inactive vnodes. 849df426577SKonstantin Belousov * 5) clear MNTK_SUSPEND2 and MNTK_SUSPENDED flags, allowing secondary 850df426577SKonstantin Belousov * writers, if requested. 851df426577SKonstantin Belousov * 6) invalidate all cached file data. 852df426577SKonstantin Belousov * 7) re-read inode data for all active vnodes. 853df8bae1dSRodney W. Grimes */ 8541848286aSEdward Tomasz Napierala int 855df426577SKonstantin Belousov ffs_reload(struct mount *mp, struct thread *td, int flags) 856df8bae1dSRodney W. Grimes { 85782be0a5aSTor Egge struct vnode *vp, *mvp, *devvp; 858df8bae1dSRodney W. Grimes struct inode *ip; 859f55ff3f3SIan Dowse void *space; 860df8bae1dSRodney W. Grimes struct buf *bp; 861996c772fSJohn Dyson struct fs *fs, *newfs; 8623ba649d7SJeff Roberson struct ufsmount *ump; 8631c85e6a3SKirk McKusick ufs2_daddr_t sblockloc; 864ad544726SKirk McKusick int i, blks, error; 865ad544726SKirk McKusick u_long size; 866996c772fSJohn Dyson int32_t *lp; 867df8bae1dSRodney W. Grimes 8683ba649d7SJeff Roberson ump = VFSTOUFS(mp); 8691848286aSEdward Tomasz Napierala 8701848286aSEdward Tomasz Napierala MNT_ILOCK(mp); 871df426577SKonstantin Belousov if ((mp->mnt_flag & MNT_RDONLY) == 0 && (flags & FFSR_FORCE) == 0) { 8721848286aSEdward Tomasz Napierala MNT_IUNLOCK(mp); 8731848286aSEdward Tomasz Napierala return (EINVAL); 8741848286aSEdward Tomasz Napierala } 8751848286aSEdward Tomasz Napierala MNT_IUNLOCK(mp); 8761848286aSEdward Tomasz Napierala 877df8bae1dSRodney W. Grimes /* 878df8bae1dSRodney W. Grimes * Step 1: invalidate all cached meta-data. 879df8bae1dSRodney W. Grimes */ 8802b14f991SJulian Elischer devvp = VFSTOUFS(mp)->um_devvp; 881cb05b60aSAttilio Rao vn_lock(devvp, LK_EXCLUSIVE | LK_RETRY); 8820d7935fdSAttilio Rao if (vinvalbuf(devvp, 0, 0, 0) != 0) 883df8bae1dSRodney W. Grimes panic("ffs_reload: dirty1"); 884b249ce48SMateusz Guzik VOP_UNLOCK(devvp); 88595e5e988SJohn Dyson 886df8bae1dSRodney W. Grimes /* 887df8bae1dSRodney W. Grimes * Step 2: re-read superblock from disk. 888df8bae1dSRodney W. Grimes */ 8891c85e6a3SKirk McKusick fs = VFSTOUFS(mp)->um_fs; 890ada981b2SKirk McKusick if ((error = bread(devvp, btodb(fs->fs_sblockloc), fs->fs_sbsize, 8911c85e6a3SKirk McKusick NOCRED, &bp)) != 0) 892df8bae1dSRodney W. Grimes return (error); 893996c772fSJohn Dyson newfs = (struct fs *)bp->b_data; 8941c85e6a3SKirk McKusick if ((newfs->fs_magic != FS_UFS1_MAGIC && 8951c85e6a3SKirk McKusick newfs->fs_magic != FS_UFS2_MAGIC) || 8961c85e6a3SKirk McKusick newfs->fs_bsize > MAXBSIZE || 897996c772fSJohn Dyson newfs->fs_bsize < sizeof(struct fs)) { 898df8bae1dSRodney W. Grimes brelse(bp); 899df8bae1dSRodney W. Grimes return (EIO); /* XXX needs translation */ 900df8bae1dSRodney W. Grimes } 901996c772fSJohn Dyson /* 90234816cb9SKirk McKusick * Preserve the summary information, read-only status, and 90334816cb9SKirk McKusick * superblock location by copying these fields into our new 90434816cb9SKirk McKusick * superblock before using it to update the existing superblock. 905996c772fSJohn Dyson */ 90634816cb9SKirk McKusick newfs->fs_si = fs->fs_si; 9071848286aSEdward Tomasz Napierala newfs->fs_ronly = fs->fs_ronly; 9081c85e6a3SKirk McKusick sblockloc = fs->fs_sblockloc; 909996c772fSJohn Dyson bcopy(newfs, fs, (u_int)fs->fs_sbsize); 910df8bae1dSRodney W. Grimes brelse(bp); 911996c772fSJohn Dyson mp->mnt_maxsymlinklen = fs->fs_maxsymlinklen; 9121c85e6a3SKirk McKusick ffs_oldfscompat_read(fs, VFSTOUFS(mp), sblockloc); 9133ba649d7SJeff Roberson UFS_LOCK(ump); 9149ccb939eSKirk McKusick if (fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) { 915b60ee81eSKirk McKusick printf("WARNING: %s: reload pending error: blocks %jd " 916b60ee81eSKirk McKusick "files %d\n", fs->fs_fsmnt, (intmax_t)fs->fs_pendingblocks, 9171c85e6a3SKirk McKusick fs->fs_pendinginodes); 9189ccb939eSKirk McKusick fs->fs_pendingblocks = 0; 9199ccb939eSKirk McKusick fs->fs_pendinginodes = 0; 9209ccb939eSKirk McKusick } 9213ba649d7SJeff Roberson UFS_UNLOCK(ump); 922996c772fSJohn Dyson 923df8bae1dSRodney W. Grimes /* 924df8bae1dSRodney W. Grimes * Step 3: re-read summary information from disk. 925df8bae1dSRodney W. Grimes */ 9262b028c25SEdward Tomasz Napierala size = fs->fs_cssize; 9272b028c25SEdward Tomasz Napierala blks = howmany(size, fs->fs_fsize); 9282b028c25SEdward Tomasz Napierala if (fs->fs_contigsumsize > 0) 9292b028c25SEdward Tomasz Napierala size += fs->fs_ncg * sizeof(int32_t); 9302b028c25SEdward Tomasz Napierala size += fs->fs_ncg * sizeof(u_int8_t); 9312b028c25SEdward Tomasz Napierala free(fs->fs_csp, M_UFSMNT); 932ad544726SKirk McKusick space = malloc(size, M_UFSMNT, M_WAITOK); 9332b028c25SEdward Tomasz Napierala fs->fs_csp = space; 934df8bae1dSRodney W. Grimes for (i = 0; i < blks; i += fs->fs_frag) { 935df8bae1dSRodney W. Grimes size = fs->fs_bsize; 936df8bae1dSRodney W. Grimes if (i + fs->fs_frag > blks) 937df8bae1dSRodney W. Grimes size = (blks - i) * fs->fs_fsize; 938c9671602SPoul-Henning Kamp error = bread(devvp, fsbtodb(fs, fs->fs_csaddr + i), size, 939c9671602SPoul-Henning Kamp NOCRED, &bp); 940c9671602SPoul-Henning Kamp if (error) 941df8bae1dSRodney W. Grimes return (error); 942f55ff3f3SIan Dowse bcopy(bp->b_data, space, (u_int)size); 943f55ff3f3SIan Dowse space = (char *)space + size; 944df8bae1dSRodney W. Grimes brelse(bp); 945df8bae1dSRodney W. Grimes } 946996c772fSJohn Dyson /* 947996c772fSJohn Dyson * We no longer know anything about clusters per cylinder group. 948996c772fSJohn Dyson */ 949996c772fSJohn Dyson if (fs->fs_contigsumsize > 0) { 95072b8ff1cSEdward Tomasz Napierala fs->fs_maxcluster = lp = space; 951996c772fSJohn Dyson for (i = 0; i < fs->fs_ncg; i++) 952996c772fSJohn Dyson *lp++ = fs->fs_contigsumsize; 95372b8ff1cSEdward Tomasz Napierala space = lp; 954996c772fSJohn Dyson } 95572b8ff1cSEdward Tomasz Napierala size = fs->fs_ncg * sizeof(u_int8_t); 95672b8ff1cSEdward Tomasz Napierala fs->fs_contigdirs = (u_int8_t *)space; 95772b8ff1cSEdward Tomasz Napierala bzero(fs->fs_contigdirs, size); 958df426577SKonstantin Belousov if ((flags & FFSR_UNSUSPEND) != 0) { 959df426577SKonstantin Belousov MNT_ILOCK(mp); 960df426577SKonstantin Belousov mp->mnt_kern_flag &= ~(MNTK_SUSPENDED | MNTK_SUSPEND2); 961df426577SKonstantin Belousov wakeup(&mp->mnt_flag); 962df426577SKonstantin Belousov MNT_IUNLOCK(mp); 963df426577SKonstantin Belousov } 964996c772fSJohn Dyson 965df8bae1dSRodney W. Grimes loop: 96671469bb3SKirk McKusick MNT_VNODE_FOREACH_ALL(vp, mp, mvp) { 967df8bae1dSRodney W. Grimes /* 9681848286aSEdward Tomasz Napierala * Skip syncer vnode. 9691848286aSEdward Tomasz Napierala */ 9701848286aSEdward Tomasz Napierala if (vp->v_type == VNON) { 9711848286aSEdward Tomasz Napierala VI_UNLOCK(vp); 9721848286aSEdward Tomasz Napierala continue; 9731848286aSEdward Tomasz Napierala } 9741848286aSEdward Tomasz Napierala /* 975fe68abe2SJeff Roberson * Step 4: invalidate all cached file data. 976df8bae1dSRodney W. Grimes */ 977a92a971bSMateusz Guzik if (vget(vp, LK_EXCLUSIVE | LK_INTERLOCK)) { 97871469bb3SKirk McKusick MNT_VNODE_FOREACH_ALL_ABORT(mp, mvp); 979df8bae1dSRodney W. Grimes goto loop; 980996c772fSJohn Dyson } 9810d7935fdSAttilio Rao if (vinvalbuf(vp, 0, 0, 0)) 982df8bae1dSRodney W. Grimes panic("ffs_reload: dirty2"); 983df8bae1dSRodney W. Grimes /* 984fe68abe2SJeff Roberson * Step 5: re-read inode data for all active vnodes. 985df8bae1dSRodney W. Grimes */ 986df8bae1dSRodney W. Grimes ip = VTOI(vp); 987c9671602SPoul-Henning Kamp error = 988df8bae1dSRodney W. Grimes bread(devvp, fsbtodb(fs, ino_to_fsba(fs, ip->i_number)), 989c9671602SPoul-Henning Kamp (int)fs->fs_bsize, NOCRED, &bp); 990c9671602SPoul-Henning Kamp if (error) { 9919fc5d538SKirk McKusick vput(vp); 99271469bb3SKirk McKusick MNT_VNODE_FOREACH_ALL_ABORT(mp, mvp); 993df8bae1dSRodney W. Grimes return (error); 994df8bae1dSRodney W. Grimes } 9959fc5d538SKirk McKusick if ((error = ffs_load_inode(bp, ip, fs, ip->i_number)) != 0) { 9969fc5d538SKirk McKusick brelse(bp); 9979fc5d538SKirk McKusick vput(vp); 9989fc5d538SKirk McKusick MNT_VNODE_FOREACH_ALL_ABORT(mp, mvp); 9999fc5d538SKirk McKusick return (error); 10009fc5d538SKirk McKusick } 1001b1897c19SJulian Elischer ip->i_effnlink = ip->i_nlink; 1002df8bae1dSRodney W. Grimes brelse(bp); 10039fc5d538SKirk McKusick vput(vp); 1004df8bae1dSRodney W. Grimes } 1005df8bae1dSRodney W. Grimes return (0); 1006df8bae1dSRodney W. Grimes } 1007df8bae1dSRodney W. Grimes 10081c85e6a3SKirk McKusick /* 1009df8bae1dSRodney W. Grimes * Common code for mount and mountroot 1010df8bae1dSRodney W. Grimes */ 1011975512a9SPoul-Henning Kamp static int 1012f15ccf88SChuck Silvers ffs_mountfs(odevvp, mp, td) 1013f15ccf88SChuck Silvers struct vnode *odevvp; 1014df8bae1dSRodney W. Grimes struct mount *mp; 1015b40ce416SJulian Elischer struct thread *td; 1016df8bae1dSRodney W. Grimes { 101705f4ff5dSPoul-Henning Kamp struct ufsmount *ump; 101805f4ff5dSPoul-Henning Kamp struct fs *fs; 101989c9c53dSPoul-Henning Kamp struct cdev *dev; 1020dffce215SKirk McKusick int error, i, len, ronly; 1021996c772fSJohn Dyson struct ucred *cred; 102243920011SPoul-Henning Kamp struct g_consumer *cp; 10233bbd6d8aSJeff Roberson struct mount *nmp; 1024f15ccf88SChuck Silvers struct vnode *devvp; 1025d79ff54bSChuck Silvers struct fsfail_task *etp; 102613532153SScott Long int candelete, canspeedup; 1027fb14e73cSKirk McKusick off_t loc; 1028df8bae1dSRodney W. Grimes 1029dffce215SKirk McKusick fs = NULL; 1030ee445a69SJohn Baldwin ump = NULL; 1031a854ed98SJohn Baldwin cred = td ? td->td_ucred : NOCRED; 103243920011SPoul-Henning Kamp ronly = (mp->mnt_flag & MNT_RDONLY) != 0; 1033ee445a69SJohn Baldwin 1034f15ccf88SChuck Silvers devvp = mntfs_allocvp(mp, odevvp); 1035f15ccf88SChuck Silvers VOP_UNLOCK(odevvp); 1036c70b3cd2SKonstantin Belousov KASSERT(devvp->v_type == VCHR, ("reclaimed devvp")); 1037ee445a69SJohn Baldwin dev = devvp->v_rdev; 1038c70b3cd2SKonstantin Belousov if (atomic_cmpset_acq_ptr((uintptr_t *)&dev->si_mountpt, 0, 1039c70b3cd2SKonstantin Belousov (uintptr_t)mp) == 0) { 1040f15ccf88SChuck Silvers mntfs_freevp(devvp); 1041c70b3cd2SKonstantin Belousov return (EBUSY); 1042c70b3cd2SKonstantin Belousov } 104343920011SPoul-Henning Kamp g_topology_lock(); 104443920011SPoul-Henning Kamp error = g_vfs_open(devvp, &cp, "ffs", ronly ? 0 : 1); 104543920011SPoul-Henning Kamp g_topology_unlock(); 1046c70b3cd2SKonstantin Belousov if (error != 0) { 1047c70b3cd2SKonstantin Belousov atomic_store_rel_ptr((uintptr_t *)&dev->si_mountpt, 0); 1048f15ccf88SChuck Silvers mntfs_freevp(devvp); 1049c70b3cd2SKonstantin Belousov return (error); 1050c70b3cd2SKonstantin Belousov } 1051c70b3cd2SKonstantin Belousov dev_ref(dev); 1052c70b3cd2SKonstantin Belousov devvp->v_bufobj.bo_ops = &ffs_ops; 1053f15ccf88SChuck Silvers BO_LOCK(&odevvp->v_bufobj); 1054f15ccf88SChuck Silvers odevvp->v_bufobj.bo_flag |= BO_NOBUFS; 1055f15ccf88SChuck Silvers BO_UNLOCK(&odevvp->v_bufobj); 1056c70b3cd2SKonstantin Belousov if (dev->si_iosize_max != 0) 1057c70b3cd2SKonstantin Belousov mp->mnt_iosize_max = dev->si_iosize_max; 1058*cd853791SKonstantin Belousov if (mp->mnt_iosize_max > maxphys) 1059*cd853791SKonstantin Belousov mp->mnt_iosize_max = maxphys; 106071ac2d7cSCraig Rodrigues if ((SBLOCKSIZE % cp->provider->sectorsize) != 0) { 106171ac2d7cSCraig Rodrigues error = EINVAL; 106271ac2d7cSCraig Rodrigues vfs_mount_error(mp, 106371ac2d7cSCraig Rodrigues "Invalid sectorsize %d for superblock size %d", 106471ac2d7cSCraig Rodrigues cp->provider->sectorsize, SBLOCKSIZE); 106571ac2d7cSCraig Rodrigues goto out; 106671ac2d7cSCraig Rodrigues } 1067dffce215SKirk McKusick /* fetch the superblock and summary information */ 1068fb14e73cSKirk McKusick loc = STDSB; 1069fb14e73cSKirk McKusick if ((mp->mnt_flag & MNT_ROOTFS) != 0) 1070fb14e73cSKirk McKusick loc = STDSB_NOHASHFAIL; 1071fb14e73cSKirk McKusick if ((error = ffs_sbget(devvp, &fs, loc, M_UFSMNT, ffs_use_bread)) != 0) 1072df8bae1dSRodney W. Grimes goto out; 10730922cce6SBruce Evans fs->fs_flags &= ~FS_UNCLEAN; 10740922cce6SBruce Evans if (fs->fs_clean == 0) { 10750922cce6SBruce Evans fs->fs_flags |= FS_UNCLEAN; 1076812b1d41SKirk McKusick if (ronly || (mp->mnt_flag & MNT_FORCE) || 1077113db2ddSJeff Roberson ((fs->fs_flags & (FS_SUJ | FS_NEEDSFSCK)) == 0 && 10781a6a6610SKirk McKusick (fs->fs_flags & FS_DOSOFTDEP))) { 107959b3a4ebSDavid E. O'Brien printf("WARNING: %s was not properly dismounted\n", 10800922cce6SBruce Evans fs->fs_fsmnt); 10811469eec8SDavid Greenman } else { 1082b60ee81eSKirk McKusick vfs_mount_error(mp, "R/W mount of %s denied. %s%s", 1083b60ee81eSKirk McKusick fs->fs_fsmnt, "Filesystem is not clean - run fsck.", 1084b60ee81eSKirk McKusick (fs->fs_flags & FS_SUJ) == 0 ? "" : 1085b60ee81eSKirk McKusick " Forced mount will invalidate journal contents"); 10861469eec8SDavid Greenman error = EPERM; 10871469eec8SDavid Greenman goto out; 10881469eec8SDavid Greenman } 10891c85e6a3SKirk McKusick if ((fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) && 10901c85e6a3SKirk McKusick (mp->mnt_flag & MNT_FORCE)) { 1091b60ee81eSKirk McKusick printf("WARNING: %s: lost blocks %jd files %d\n", 1092b60ee81eSKirk McKusick fs->fs_fsmnt, (intmax_t)fs->fs_pendingblocks, 10931c85e6a3SKirk McKusick fs->fs_pendinginodes); 10949ccb939eSKirk McKusick fs->fs_pendingblocks = 0; 10959ccb939eSKirk McKusick fs->fs_pendinginodes = 0; 10969ccb939eSKirk McKusick } 10979ccb939eSKirk McKusick } 10989ccb939eSKirk McKusick if (fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) { 1099b60ee81eSKirk McKusick printf("WARNING: %s: mount pending error: blocks %jd " 1100b60ee81eSKirk McKusick "files %d\n", fs->fs_fsmnt, (intmax_t)fs->fs_pendingblocks, 11011c85e6a3SKirk McKusick fs->fs_pendinginodes); 11029ccb939eSKirk McKusick fs->fs_pendingblocks = 0; 11039ccb939eSKirk McKusick fs->fs_pendinginodes = 0; 11041469eec8SDavid Greenman } 11051a60c7fcSPawel Jakub Dawidek if ((fs->fs_flags & FS_GJOURNAL) != 0) { 11061a60c7fcSPawel Jakub Dawidek #ifdef UFS_GJOURNAL 11071a60c7fcSPawel Jakub Dawidek /* 11081a60c7fcSPawel Jakub Dawidek * Get journal provider name. 11091a60c7fcSPawel Jakub Dawidek */ 1110ad544726SKirk McKusick len = 1024; 1111ad544726SKirk McKusick mp->mnt_gjprovider = malloc((u_long)len, M_UFSMNT, M_WAITOK); 1112ad544726SKirk McKusick if (g_io_getattr("GJOURNAL::provider", cp, &len, 11131a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider) == 0) { 1114ad544726SKirk McKusick mp->mnt_gjprovider = realloc(mp->mnt_gjprovider, len, 11151a60c7fcSPawel Jakub Dawidek M_UFSMNT, M_WAITOK); 11161a60c7fcSPawel Jakub Dawidek MNT_ILOCK(mp); 11171a60c7fcSPawel Jakub Dawidek mp->mnt_flag |= MNT_GJOURNAL; 11181a60c7fcSPawel Jakub Dawidek MNT_IUNLOCK(mp); 11191a60c7fcSPawel Jakub Dawidek } else { 1120b60ee81eSKirk McKusick printf("WARNING: %s: GJOURNAL flag on fs " 1121b60ee81eSKirk McKusick "but no gjournal provider below\n", 11221a60c7fcSPawel Jakub Dawidek mp->mnt_stat.f_mntonname); 11231a60c7fcSPawel Jakub Dawidek free(mp->mnt_gjprovider, M_UFSMNT); 11241a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider = NULL; 11251a60c7fcSPawel Jakub Dawidek } 11261a60c7fcSPawel Jakub Dawidek #else 1127b60ee81eSKirk McKusick printf("WARNING: %s: GJOURNAL flag on fs but no " 1128b60ee81eSKirk McKusick "UFS_GJOURNAL support\n", mp->mnt_stat.f_mntonname); 11291a60c7fcSPawel Jakub Dawidek #endif 11301a60c7fcSPawel Jakub Dawidek } else { 11311a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider = NULL; 11321a60c7fcSPawel Jakub Dawidek } 1133a163d034SWarner Losh ump = malloc(sizeof *ump, M_UFSMNT, M_WAITOK | M_ZERO); 113443920011SPoul-Henning Kamp ump->um_cp = cp; 113543920011SPoul-Henning Kamp ump->um_bo = &devvp->v_bufobj; 1136dffce215SKirk McKusick ump->um_fs = fs; 11371c85e6a3SKirk McKusick if (fs->fs_magic == FS_UFS1_MAGIC) { 11381c85e6a3SKirk McKusick ump->um_fstype = UFS1; 11391c85e6a3SKirk McKusick ump->um_balloc = ffs_balloc_ufs1; 11401c85e6a3SKirk McKusick } else { 11411c85e6a3SKirk McKusick ump->um_fstype = UFS2; 11421c85e6a3SKirk McKusick ump->um_balloc = ffs_balloc_ufs2; 11431c85e6a3SKirk McKusick } 1144cec0f20cSPoul-Henning Kamp ump->um_blkatoff = ffs_blkatoff; 1145cec0f20cSPoul-Henning Kamp ump->um_truncate = ffs_truncate; 1146987f5696SPoul-Henning Kamp ump->um_update = ffs_update; 1147cec0f20cSPoul-Henning Kamp ump->um_valloc = ffs_valloc; 1148cec0f20cSPoul-Henning Kamp ump->um_vfree = ffs_vfree; 1149975512a9SPoul-Henning Kamp ump->um_ifree = ffs_ifree; 115090446e36SKonstantin Belousov ump->um_rdonly = ffs_rdonly; 115116b1f68dSKonstantin Belousov ump->um_snapgone = ffs_snapgone; 1152fdf34aa3SKirk McKusick if ((mp->mnt_flag & MNT_UNTRUSTED) != 0) 1153fdf34aa3SKirk McKusick ump->um_check_blkno = ffs_check_blkno; 1154fdf34aa3SKirk McKusick else 1155fdf34aa3SKirk McKusick ump->um_check_blkno = NULL; 11563ba649d7SJeff Roberson mtx_init(UFS_MTX(ump), "FFS", "FFS Lock", MTX_DEF); 1157dffce215SKirk McKusick ffs_oldfscompat_read(fs, ump, fs->fs_sblockloc); 1158df8bae1dSRodney W. Grimes fs->fs_ronly = ronly; 1159143a5346SIan Dowse fs->fs_active = NULL; 116077465d93SAlfred Perlstein mp->mnt_data = ump; 116168de329eSPoul-Henning Kamp mp->mnt_stat.f_fsid.val[0] = fs->fs_id[0]; 11628f89943eSGuido van Rooij mp->mnt_stat.f_fsid.val[1] = fs->fs_id[1]; 11633bbd6d8aSJeff Roberson nmp = NULL; 116468de329eSPoul-Henning Kamp if (fs->fs_id[0] == 0 || fs->fs_id[1] == 0 || 11653bbd6d8aSJeff Roberson (nmp = vfs_getvfs(&mp->mnt_stat.f_fsid))) { 11663bbd6d8aSJeff Roberson if (nmp) 11673bbd6d8aSJeff Roberson vfs_rel(nmp); 116868de329eSPoul-Henning Kamp vfs_getnewfsid(mp); 11693bbd6d8aSJeff Roberson } 1170df8bae1dSRodney W. Grimes mp->mnt_maxsymlinklen = fs->fs_maxsymlinklen; 11715da56ddbSTor Egge MNT_ILOCK(mp); 1172cc9d8990SPeter Wemm mp->mnt_flag |= MNT_LOCAL; 11735da56ddbSTor Egge MNT_IUNLOCK(mp); 11745da56ddbSTor Egge if ((fs->fs_flags & FS_MULTILABEL) != 0) { 11757b3f1bbdSTom Rhodes #ifdef MAC 11765da56ddbSTor Egge MNT_ILOCK(mp); 117780830407SRobert Watson mp->mnt_flag |= MNT_MULTILABEL; 11785da56ddbSTor Egge MNT_IUNLOCK(mp); 11797b3f1bbdSTom Rhodes #else 1180b60ee81eSKirk McKusick printf("WARNING: %s: multilabel flag on fs but " 1181b60ee81eSKirk McKusick "no MAC support\n", mp->mnt_stat.f_mntonname); 11827b3f1bbdSTom Rhodes #endif 11835da56ddbSTor Egge } 11845da56ddbSTor Egge if ((fs->fs_flags & FS_ACLS) != 0) { 11857b3f1bbdSTom Rhodes #ifdef UFS_ACL 11865da56ddbSTor Egge MNT_ILOCK(mp); 11879340fc72SEdward Tomasz Napierala 11889340fc72SEdward Tomasz Napierala if (mp->mnt_flag & MNT_NFS4ACLS) 1189b60ee81eSKirk McKusick printf("WARNING: %s: ACLs flag on fs conflicts with " 1190b60ee81eSKirk McKusick "\"nfsv4acls\" mount option; option ignored\n", 1191b60ee81eSKirk McKusick mp->mnt_stat.f_mntonname); 11929340fc72SEdward Tomasz Napierala mp->mnt_flag &= ~MNT_NFS4ACLS; 119380830407SRobert Watson mp->mnt_flag |= MNT_ACLS; 11949340fc72SEdward Tomasz Napierala 11955da56ddbSTor Egge MNT_IUNLOCK(mp); 11967b3f1bbdSTom Rhodes #else 119759b3a4ebSDavid E. O'Brien printf("WARNING: %s: ACLs flag on fs but no ACLs support\n", 1198946478fcSPawel Jakub Dawidek mp->mnt_stat.f_mntonname); 11997b3f1bbdSTom Rhodes #endif 12005da56ddbSTor Egge } 12019340fc72SEdward Tomasz Napierala if ((fs->fs_flags & FS_NFS4ACLS) != 0) { 12029340fc72SEdward Tomasz Napierala #ifdef UFS_ACL 12039340fc72SEdward Tomasz Napierala MNT_ILOCK(mp); 12049340fc72SEdward Tomasz Napierala 12059340fc72SEdward Tomasz Napierala if (mp->mnt_flag & MNT_ACLS) 1206b60ee81eSKirk McKusick printf("WARNING: %s: NFSv4 ACLs flag on fs conflicts " 1207b60ee81eSKirk McKusick "with \"acls\" mount option; option ignored\n", 1208b60ee81eSKirk McKusick mp->mnt_stat.f_mntonname); 12099340fc72SEdward Tomasz Napierala mp->mnt_flag &= ~MNT_ACLS; 12109340fc72SEdward Tomasz Napierala mp->mnt_flag |= MNT_NFS4ACLS; 12119340fc72SEdward Tomasz Napierala 12129340fc72SEdward Tomasz Napierala MNT_IUNLOCK(mp); 12139340fc72SEdward Tomasz Napierala #else 1214b60ee81eSKirk McKusick printf("WARNING: %s: NFSv4 ACLs flag on fs but no " 1215b60ee81eSKirk McKusick "ACLs support\n", mp->mnt_stat.f_mntonname); 12169340fc72SEdward Tomasz Napierala #endif 12179340fc72SEdward Tomasz Napierala } 12188c2a54deSKonstantin Belousov if ((fs->fs_flags & FS_TRIM) != 0) { 1219ad544726SKirk McKusick len = sizeof(int); 1220ad544726SKirk McKusick if (g_io_getattr("GEOM::candelete", cp, &len, 1221ab0bcb60SKirk McKusick &candelete) == 0) { 1222ab0bcb60SKirk McKusick if (candelete) 1223ab0bcb60SKirk McKusick ump->um_flags |= UM_CANDELETE; 1224ab0bcb60SKirk McKusick else 1225b60ee81eSKirk McKusick printf("WARNING: %s: TRIM flag on fs but disk " 1226b60ee81eSKirk McKusick "does not support TRIM\n", 12278c2a54deSKonstantin Belousov mp->mnt_stat.f_mntonname); 12288c2a54deSKonstantin Belousov } else { 1229b60ee81eSKirk McKusick printf("WARNING: %s: TRIM flag on fs but disk does " 1230b60ee81eSKirk McKusick "not confirm that it supports TRIM\n", 12318c2a54deSKonstantin Belousov mp->mnt_stat.f_mntonname); 12328c2a54deSKonstantin Belousov } 1233ab0bcb60SKirk McKusick if (((ump->um_flags) & UM_CANDELETE) != 0) { 1234c79dff0fSKonstantin Belousov ump->um_trim_tq = taskqueue_create("trim", M_WAITOK, 1235c79dff0fSKonstantin Belousov taskqueue_thread_enqueue, &ump->um_trim_tq); 1236c79dff0fSKonstantin Belousov taskqueue_start_threads(&ump->um_trim_tq, 1, PVFS, 1237c79dff0fSKonstantin Belousov "%s trim", mp->mnt_stat.f_mntonname); 12387e038bc2SKirk McKusick ump->um_trimhash = hashinit(MAXTRIMIO, M_TRIM, 12397e038bc2SKirk McKusick &ump->um_trimlisthashsize); 1240c79dff0fSKonstantin Belousov } 12418c2a54deSKonstantin Belousov } 12429340fc72SEdward Tomasz Napierala 124313532153SScott Long len = sizeof(int); 124413532153SScott Long if (g_io_getattr("GEOM::canspeedup", cp, &len, &canspeedup) == 0) { 124513532153SScott Long if (canspeedup) 124613532153SScott Long ump->um_flags |= UM_CANSPEEDUP; 124713532153SScott Long } 124813532153SScott Long 1249df8bae1dSRodney W. Grimes ump->um_mountp = mp; 1250df8bae1dSRodney W. Grimes ump->um_dev = dev; 1251df8bae1dSRodney W. Grimes ump->um_devvp = devvp; 1252f15ccf88SChuck Silvers ump->um_odevvp = odevvp; 1253df8bae1dSRodney W. Grimes ump->um_nindir = fs->fs_nindir; 1254df8bae1dSRodney W. Grimes ump->um_bptrtodb = fs->fs_fsbtodb; 1255df8bae1dSRodney W. Grimes ump->um_seqinc = fs->fs_frag; 1256df8bae1dSRodney W. Grimes for (i = 0; i < MAXQUOTAS; i++) 1257df8bae1dSRodney W. Grimes ump->um_quotas[i] = NULLVP; 1258516081f2SRobert Watson #ifdef UFS_EXTATTR 1259a64ed089SRobert Watson ufs_extattr_uepm_init(&ump->um_extattr); 1260a64ed089SRobert Watson #endif 12612b14f991SJulian Elischer /* 12622b14f991SJulian Elischer * Set FS local "last mounted on" information (NULL pad) 12632b14f991SJulian Elischer */ 126493373c42SSuleiman Souhlal bzero(fs->fs_fsmnt, MAXMNTLEN); 126593373c42SSuleiman Souhlal strlcpy(fs->fs_fsmnt, mp->mnt_stat.f_mntonname, MAXMNTLEN); 1266113db2ddSJeff Roberson mp->mnt_stat.f_iosize = fs->fs_bsize; 12672b14f991SJulian Elischer 12682b14f991SJulian Elischer if (mp->mnt_flag & MNT_ROOTFS) { 12692b14f991SJulian Elischer /* 12702b14f991SJulian Elischer * Root mount; update timestamp in mount structure. 12712b14f991SJulian Elischer * this will be used by the common root mount code 12722b14f991SJulian Elischer * to update the system clock. 12732b14f991SJulian Elischer */ 12742b14f991SJulian Elischer mp->mnt_time = fs->fs_time; 12752b14f991SJulian Elischer } 1276996c772fSJohn Dyson 1277996c772fSJohn Dyson if (ronly == 0) { 1278113db2ddSJeff Roberson fs->fs_mtime = time_second; 1279b1897c19SJulian Elischer if ((fs->fs_flags & FS_DOSOFTDEP) && 1280b1897c19SJulian Elischer (error = softdep_mount(devvp, mp, fs, cred)) != 0) { 1281fddd463dSKonstantin Belousov ffs_flushfiles(mp, FORCECLOSE, td); 1282b1897c19SJulian Elischer goto out; 1283b1897c19SJulian Elischer } 1284f2a2857bSKirk McKusick if (fs->fs_snapinum[0] != 0) 1285f2a2857bSKirk McKusick ffs_snapshot_mount(mp); 1286cf60e8e4SKirk McKusick fs->fs_fmod = 1; 1287996c772fSJohn Dyson fs->fs_clean = 0; 1288791dd2faSTor Egge (void) ffs_sbupdate(ump, MNT_WAIT, 0); 1289996c772fSJohn Dyson } 1290d8d3d415SPoul-Henning Kamp /* 129198cbffd7SKonstantin Belousov * Initialize filesystem state information in mount struct. 1292d8d3d415SPoul-Henning Kamp */ 12936cf7bc60SRobert Watson MNT_ILOCK(mp); 1294bc2258daSAttilio Rao mp->mnt_kern_flag |= MNTK_LOOKUP_SHARED | MNTK_EXTENDED_SHARED | 12955f34e93cSMark Johnston MNTK_NO_IOPF | MNTK_UNMAPPED_BUFS | MNTK_USES_BCACHE; 12966cf7bc60SRobert Watson MNT_IUNLOCK(mp); 1297516081f2SRobert Watson #ifdef UFS_EXTATTR 1298516081f2SRobert Watson #ifdef UFS_EXTATTR_AUTOSTART 12999de54ba5SRobert Watson /* 13009de54ba5SRobert Watson * 1301f5161237SRobert Watson * Auto-starting does the following: 13029de54ba5SRobert Watson * - check for /.attribute in the fs, and extattr_start if so 13039de54ba5SRobert Watson * - for each file in .attribute, enable that file with 13049de54ba5SRobert Watson * an attribute of the same name. 13059de54ba5SRobert Watson * Not clear how to report errors -- probably eat them. 13069de54ba5SRobert Watson * This would all happen while the filesystem was busy/not 13079de54ba5SRobert Watson * available, so would effectively be "atomic". 13089de54ba5SRobert Watson */ 1309b40ce416SJulian Elischer (void) ufs_extattr_autostart(mp, td); 1310516081f2SRobert Watson #endif /* !UFS_EXTATTR_AUTOSTART */ 1311516081f2SRobert Watson #endif /* !UFS_EXTATTR */ 1312d79ff54bSChuck Silvers etp = malloc(sizeof *ump->um_fsfail_task, M_UFSMNT, M_WAITOK | M_ZERO); 1313d79ff54bSChuck Silvers etp->fsid = mp->mnt_stat.f_fsid; 1314d79ff54bSChuck Silvers ump->um_fsfail_task = etp; 1315df8bae1dSRodney W. Grimes return (0); 1316df8bae1dSRodney W. Grimes out: 1317dffce215SKirk McKusick if (fs != NULL) { 1318dffce215SKirk McKusick free(fs->fs_csp, M_UFSMNT); 131934816cb9SKirk McKusick free(fs->fs_si, M_UFSMNT); 1320dffce215SKirk McKusick free(fs, M_UFSMNT); 1321dffce215SKirk McKusick } 132243920011SPoul-Henning Kamp if (cp != NULL) { 132343920011SPoul-Henning Kamp g_topology_lock(); 13240d7935fdSAttilio Rao g_vfs_close(cp); 132543920011SPoul-Henning Kamp g_topology_unlock(); 132643920011SPoul-Henning Kamp } 1327df8bae1dSRodney W. Grimes if (ump) { 13283ba649d7SJeff Roberson mtx_destroy(UFS_MTX(ump)); 13291a60c7fcSPawel Jakub Dawidek if (mp->mnt_gjprovider != NULL) { 13301a60c7fcSPawel Jakub Dawidek free(mp->mnt_gjprovider, M_UFSMNT); 13311a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider = NULL; 13321a60c7fcSPawel Jakub Dawidek } 1333df8bae1dSRodney W. Grimes free(ump, M_UFSMNT); 133477465d93SAlfred Perlstein mp->mnt_data = NULL; 1335df8bae1dSRodney W. Grimes } 1336f15ccf88SChuck Silvers BO_LOCK(&odevvp->v_bufobj); 1337f15ccf88SChuck Silvers odevvp->v_bufobj.bo_flag &= ~BO_NOBUFS; 1338f15ccf88SChuck Silvers BO_UNLOCK(&odevvp->v_bufobj); 1339c70b3cd2SKonstantin Belousov atomic_store_rel_ptr((uintptr_t *)&dev->si_mountpt, 0); 1340f15ccf88SChuck Silvers mntfs_freevp(devvp); 134149c4791cSEdward Tomasz Napierala dev_rel(dev); 1342df8bae1dSRodney W. Grimes return (error); 1343df8bae1dSRodney W. Grimes } 1344df8bae1dSRodney W. Grimes 1345dffce215SKirk McKusick /* 1346dffce215SKirk McKusick * A read function for use by filesystem-layer routines. 1347dffce215SKirk McKusick */ 1348dffce215SKirk McKusick static int 1349dffce215SKirk McKusick ffs_use_bread(void *devfd, off_t loc, void **bufp, int size) 1350dffce215SKirk McKusick { 1351dffce215SKirk McKusick struct buf *bp; 1352dffce215SKirk McKusick int error; 1353dffce215SKirk McKusick 1354efbf3964SKirk McKusick KASSERT(*bufp == NULL, ("ffs_use_bread: non-NULL *bufp %p\n", *bufp)); 1355dffce215SKirk McKusick *bufp = malloc(size, M_UFSMNT, M_WAITOK); 1356dffce215SKirk McKusick if ((error = bread((struct vnode *)devfd, btodb(loc), size, NOCRED, 1357efbf3964SKirk McKusick &bp)) != 0) 1358dffce215SKirk McKusick return (error); 1359dffce215SKirk McKusick bcopy(bp->b_data, *bufp, size); 1360dffce215SKirk McKusick bp->b_flags |= B_INVAL | B_NOCACHE; 1361dffce215SKirk McKusick brelse(bp); 1362dffce215SKirk McKusick return (0); 1363dffce215SKirk McKusick } 1364dffce215SKirk McKusick 1365adf41577SPoul-Henning Kamp static int bigcgs = 0; 13661c85e6a3SKirk McKusick SYSCTL_INT(_debug, OID_AUTO, bigcgs, CTLFLAG_RW, &bigcgs, 0, ""); 13671c85e6a3SKirk McKusick 1368df8bae1dSRodney W. Grimes /* 13691c85e6a3SKirk McKusick * Sanity checks for loading old filesystem superblocks. 13701c85e6a3SKirk McKusick * See ffs_oldfscompat_write below for unwound actions. 1371df8bae1dSRodney W. Grimes * 13721c85e6a3SKirk McKusick * XXX - Parts get retired eventually. 13731c85e6a3SKirk McKusick * Unfortunately new bits get added. 1374df8bae1dSRodney W. Grimes */ 13751c85e6a3SKirk McKusick static void 13761c85e6a3SKirk McKusick ffs_oldfscompat_read(fs, ump, sblockloc) 1377df8bae1dSRodney W. Grimes struct fs *fs; 13781c85e6a3SKirk McKusick struct ufsmount *ump; 13791c85e6a3SKirk McKusick ufs2_daddr_t sblockloc; 13801c85e6a3SKirk McKusick { 13811c85e6a3SKirk McKusick off_t maxfilesize; 13821c85e6a3SKirk McKusick 13831c85e6a3SKirk McKusick /* 1384ada981b2SKirk McKusick * If not yet done, update fs_flags location and value of fs_sblockloc. 1385ada981b2SKirk McKusick */ 1386ada981b2SKirk McKusick if ((fs->fs_old_flags & FS_FLAGS_UPDATED) == 0) { 1387ada981b2SKirk McKusick fs->fs_flags = fs->fs_old_flags; 1388ada981b2SKirk McKusick fs->fs_old_flags |= FS_FLAGS_UPDATED; 1389ada981b2SKirk McKusick fs->fs_sblockloc = sblockloc; 1390ada981b2SKirk McKusick } 1391ada981b2SKirk McKusick /* 13921c85e6a3SKirk McKusick * If not yet done, update UFS1 superblock with new wider fields. 13931c85e6a3SKirk McKusick */ 139474f3809aSKirk McKusick if (fs->fs_magic == FS_UFS1_MAGIC && fs->fs_maxbsize != fs->fs_bsize) { 13951c85e6a3SKirk McKusick fs->fs_maxbsize = fs->fs_bsize; 13961c85e6a3SKirk McKusick fs->fs_time = fs->fs_old_time; 13971c85e6a3SKirk McKusick fs->fs_size = fs->fs_old_size; 13981c85e6a3SKirk McKusick fs->fs_dsize = fs->fs_old_dsize; 13991c85e6a3SKirk McKusick fs->fs_csaddr = fs->fs_old_csaddr; 14001c85e6a3SKirk McKusick fs->fs_cstotal.cs_ndir = fs->fs_old_cstotal.cs_ndir; 14011c85e6a3SKirk McKusick fs->fs_cstotal.cs_nbfree = fs->fs_old_cstotal.cs_nbfree; 14021c85e6a3SKirk McKusick fs->fs_cstotal.cs_nifree = fs->fs_old_cstotal.cs_nifree; 14031c85e6a3SKirk McKusick fs->fs_cstotal.cs_nffree = fs->fs_old_cstotal.cs_nffree; 14041c85e6a3SKirk McKusick } 14051c85e6a3SKirk McKusick if (fs->fs_magic == FS_UFS1_MAGIC && 14061c85e6a3SKirk McKusick fs->fs_old_inodefmt < FS_44INODEFMT) { 14078680d698SNate Lawson fs->fs_maxfilesize = ((uint64_t)1 << 31) - 1; 14081c85e6a3SKirk McKusick fs->fs_qbmask = ~fs->fs_bmask; 14091c85e6a3SKirk McKusick fs->fs_qfmask = ~fs->fs_fmask; 14101c85e6a3SKirk McKusick } 14118f42fb8fSIan Dowse if (fs->fs_magic == FS_UFS1_MAGIC) { 14121c85e6a3SKirk McKusick ump->um_savedmaxfilesize = fs->fs_maxfilesize; 14138680d698SNate Lawson maxfilesize = (uint64_t)0x80000000 * fs->fs_bsize - 1; 14141c85e6a3SKirk McKusick if (fs->fs_maxfilesize > maxfilesize) 14151c85e6a3SKirk McKusick fs->fs_maxfilesize = maxfilesize; 14168f42fb8fSIan Dowse } 14171c85e6a3SKirk McKusick /* Compatibility for old filesystems */ 14181c85e6a3SKirk McKusick if (fs->fs_avgfilesize <= 0) 14191c85e6a3SKirk McKusick fs->fs_avgfilesize = AVFILESIZ; 14201c85e6a3SKirk McKusick if (fs->fs_avgfpdir <= 0) 14211c85e6a3SKirk McKusick fs->fs_avgfpdir = AFPDIR; 14221c85e6a3SKirk McKusick if (bigcgs) { 14231c85e6a3SKirk McKusick fs->fs_save_cgsize = fs->fs_cgsize; 14241c85e6a3SKirk McKusick fs->fs_cgsize = fs->fs_bsize; 14251c85e6a3SKirk McKusick } 14261c85e6a3SKirk McKusick } 14271c85e6a3SKirk McKusick 14281c85e6a3SKirk McKusick /* 14291c85e6a3SKirk McKusick * Unwinding superblock updates for old filesystems. 14301c85e6a3SKirk McKusick * See ffs_oldfscompat_read above for details. 14311c85e6a3SKirk McKusick * 14321c85e6a3SKirk McKusick * XXX - Parts get retired eventually. 14331c85e6a3SKirk McKusick * Unfortunately new bits get added. 14341c85e6a3SKirk McKusick */ 1435113db2ddSJeff Roberson void 14361c85e6a3SKirk McKusick ffs_oldfscompat_write(fs, ump) 14371c85e6a3SKirk McKusick struct fs *fs; 14381c85e6a3SKirk McKusick struct ufsmount *ump; 1439df8bae1dSRodney W. Grimes { 1440df8bae1dSRodney W. Grimes 14411c85e6a3SKirk McKusick /* 14421c85e6a3SKirk McKusick * Copy back UFS2 updated fields that UFS1 inspects. 14431c85e6a3SKirk McKusick */ 14441c85e6a3SKirk McKusick if (fs->fs_magic == FS_UFS1_MAGIC) { 14451c85e6a3SKirk McKusick fs->fs_old_time = fs->fs_time; 14461c85e6a3SKirk McKusick fs->fs_old_cstotal.cs_ndir = fs->fs_cstotal.cs_ndir; 14471c85e6a3SKirk McKusick fs->fs_old_cstotal.cs_nbfree = fs->fs_cstotal.cs_nbfree; 14481c85e6a3SKirk McKusick fs->fs_old_cstotal.cs_nifree = fs->fs_cstotal.cs_nifree; 14491c85e6a3SKirk McKusick fs->fs_old_cstotal.cs_nffree = fs->fs_cstotal.cs_nffree; 14501c85e6a3SKirk McKusick fs->fs_maxfilesize = ump->um_savedmaxfilesize; 14518f42fb8fSIan Dowse } 14521c85e6a3SKirk McKusick if (bigcgs) { 14531c85e6a3SKirk McKusick fs->fs_cgsize = fs->fs_save_cgsize; 14541c85e6a3SKirk McKusick fs->fs_save_cgsize = 0; 14551c85e6a3SKirk McKusick } 1456df8bae1dSRodney W. Grimes } 1457df8bae1dSRodney W. Grimes 1458df8bae1dSRodney W. Grimes /* 1459df8bae1dSRodney W. Grimes * unmount system call 1460df8bae1dSRodney W. Grimes */ 1461adf41577SPoul-Henning Kamp static int 1462dfd233edSAttilio Rao ffs_unmount(mp, mntflags) 1463df8bae1dSRodney W. Grimes struct mount *mp; 1464df8bae1dSRodney W. Grimes int mntflags; 1465df8bae1dSRodney W. Grimes { 1466dfd233edSAttilio Rao struct thread *td; 146705f4ff5dSPoul-Henning Kamp struct ufsmount *ump = VFSTOUFS(mp); 146805f4ff5dSPoul-Henning Kamp struct fs *fs; 14696fecb4e4SKonstantin Belousov int error, flags, susp; 1470df86ccf6SKonstantin Belousov #ifdef UFS_EXTATTR 1471df86ccf6SKonstantin Belousov int e_restart; 1472df86ccf6SKonstantin Belousov #endif 1473df8bae1dSRodney W. Grimes 1474df8bae1dSRodney W. Grimes flags = 0; 1475dfd233edSAttilio Rao td = curthread; 14766fecb4e4SKonstantin Belousov fs = ump->um_fs; 147771f26429SKonstantin Belousov if (mntflags & MNT_FORCE) 1478df8bae1dSRodney W. Grimes flags |= FORCECLOSE; 14794ce90426SKonstantin Belousov susp = fs->fs_ronly == 0; 1480516081f2SRobert Watson #ifdef UFS_EXTATTR 1481b40ce416SJulian Elischer if ((error = ufs_extattr_stop(mp, td))) { 1482b2b0497aSRobert Watson if (error != EOPNOTSUPP) 1483b60ee81eSKirk McKusick printf("WARNING: unmount %s: ufs_extattr_stop " 1484b60ee81eSKirk McKusick "returned errno %d\n", mp->mnt_stat.f_mntonname, 1485b2b0497aSRobert Watson error); 1486df86ccf6SKonstantin Belousov e_restart = 0; 14877df97b61SRobert Watson } else { 14889de54ba5SRobert Watson ufs_extattr_uepm_destroy(&ump->um_extattr); 1489df86ccf6SKonstantin Belousov e_restart = 1; 14907df97b61SRobert Watson } 1491a64ed089SRobert Watson #endif 14926fecb4e4SKonstantin Belousov if (susp) { 1493895b3782SKonstantin Belousov error = vfs_write_suspend_umnt(mp); 1494895b3782SKonstantin Belousov if (error != 0) 1495895b3782SKonstantin Belousov goto fail1; 14966fecb4e4SKonstantin Belousov } 1497fddf7baeSKirk McKusick if (MOUNTEDSOFTDEP(mp)) 14983c140b2dSEdward Tomasz Napierala error = softdep_flushfiles(mp, flags, td); 14993c140b2dSEdward Tomasz Napierala else 15003c140b2dSEdward Tomasz Napierala error = ffs_flushfiles(mp, flags, td); 1501d79ff54bSChuck Silvers if (error != 0 && !ffs_fsfail_cleanup(ump, error)) 15026fecb4e4SKonstantin Belousov goto fail; 15033c140b2dSEdward Tomasz Napierala 15043ba649d7SJeff Roberson UFS_LOCK(ump); 15059ccb939eSKirk McKusick if (fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) { 1506b60ee81eSKirk McKusick printf("WARNING: unmount %s: pending error: blocks %jd " 1507b60ee81eSKirk McKusick "files %d\n", fs->fs_fsmnt, (intmax_t)fs->fs_pendingblocks, 15081c85e6a3SKirk McKusick fs->fs_pendinginodes); 15099ccb939eSKirk McKusick fs->fs_pendingblocks = 0; 15109ccb939eSKirk McKusick fs->fs_pendinginodes = 0; 15119ccb939eSKirk McKusick } 15123ba649d7SJeff Roberson UFS_UNLOCK(ump); 1513519e3c3bSKirk McKusick if (MOUNTEDSOFTDEP(mp)) 1514113db2ddSJeff Roberson softdep_unmount(mp); 1515927a12aeSKirk McKusick if (fs->fs_ronly == 0 || ump->um_fsckpid > 0) { 15161a6a6610SKirk McKusick fs->fs_clean = fs->fs_flags & (FS_UNCLEAN|FS_NEEDSFSCK) ? 0 : 1; 1517791dd2faSTor Egge error = ffs_sbupdate(ump, MNT_WAIT, 0); 1518d79ff54bSChuck Silvers if (ffs_fsfail_cleanup(ump, error)) 1519d79ff54bSChuck Silvers error = 0; 1520d79ff54bSChuck Silvers if (error != 0 && !ffs_fsfail_cleanup(ump, error)) { 1521996c772fSJohn Dyson fs->fs_clean = 0; 15226fecb4e4SKonstantin Belousov goto fail; 1523996c772fSJohn Dyson } 1524e0e9c421SDavid Greenman } 1525ddd6b3fcSKonstantin Belousov if (susp) 1526ddd6b3fcSKonstantin Belousov vfs_write_resume(mp, VR_START_WRITE); 1527c79dff0fSKonstantin Belousov if (ump->um_trim_tq != NULL) { 1528c79dff0fSKonstantin Belousov while (ump->um_trim_inflight != 0) 1529c79dff0fSKonstantin Belousov pause("ufsutr", hz); 1530c79dff0fSKonstantin Belousov taskqueue_drain_all(ump->um_trim_tq); 1531c79dff0fSKonstantin Belousov taskqueue_free(ump->um_trim_tq); 15327e038bc2SKirk McKusick free (ump->um_trimhash, M_TRIM); 1533c79dff0fSKonstantin Belousov } 153443920011SPoul-Henning Kamp g_topology_lock(); 1535927a12aeSKirk McKusick if (ump->um_fsckpid > 0) { 1536927a12aeSKirk McKusick /* 1537927a12aeSKirk McKusick * Return to normal read-only mode. 1538927a12aeSKirk McKusick */ 1539927a12aeSKirk McKusick error = g_access(ump->um_cp, 0, -1, 0); 1540927a12aeSKirk McKusick ump->um_fsckpid = 0; 1541927a12aeSKirk McKusick } 15420d7935fdSAttilio Rao g_vfs_close(ump->um_cp); 154343920011SPoul-Henning Kamp g_topology_unlock(); 1544f15ccf88SChuck Silvers BO_LOCK(&ump->um_odevvp->v_bufobj); 1545f15ccf88SChuck Silvers ump->um_odevvp->v_bufobj.bo_flag &= ~BO_NOBUFS; 1546f15ccf88SChuck Silvers BO_UNLOCK(&ump->um_odevvp->v_bufobj); 1547c70b3cd2SKonstantin Belousov atomic_store_rel_ptr((uintptr_t *)&ump->um_dev->si_mountpt, 0); 1548f15ccf88SChuck Silvers mntfs_freevp(ump->um_devvp); 1549f15ccf88SChuck Silvers vrele(ump->um_odevvp); 155049c4791cSEdward Tomasz Napierala dev_rel(ump->um_dev); 15513ba649d7SJeff Roberson mtx_destroy(UFS_MTX(ump)); 15521a60c7fcSPawel Jakub Dawidek if (mp->mnt_gjprovider != NULL) { 15531a60c7fcSPawel Jakub Dawidek free(mp->mnt_gjprovider, M_UFSMNT); 15541a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider = NULL; 15551a60c7fcSPawel Jakub Dawidek } 1556f55ff3f3SIan Dowse free(fs->fs_csp, M_UFSMNT); 155734816cb9SKirk McKusick free(fs->fs_si, M_UFSMNT); 1558df8bae1dSRodney W. Grimes free(fs, M_UFSMNT); 1559d79ff54bSChuck Silvers if (ump->um_fsfail_task != NULL) 1560d79ff54bSChuck Silvers free(ump->um_fsfail_task, M_UFSMNT); 1561df8bae1dSRodney W. Grimes free(ump, M_UFSMNT); 156277465d93SAlfred Perlstein mp->mnt_data = NULL; 15635da56ddbSTor Egge MNT_ILOCK(mp); 1564cc9d8990SPeter Wemm mp->mnt_flag &= ~MNT_LOCAL; 15655da56ddbSTor Egge MNT_IUNLOCK(mp); 15664cbc378cSKonstantin Belousov if (td->td_su == mp) { 15674cbc378cSKonstantin Belousov td->td_su = NULL; 15684cbc378cSKonstantin Belousov vfs_rel(mp); 15694cbc378cSKonstantin Belousov } 1570df8bae1dSRodney W. Grimes return (error); 15716fecb4e4SKonstantin Belousov 15726fecb4e4SKonstantin Belousov fail: 1573ddd6b3fcSKonstantin Belousov if (susp) 1574ddd6b3fcSKonstantin Belousov vfs_write_resume(mp, VR_START_WRITE); 1575895b3782SKonstantin Belousov fail1: 1576df86ccf6SKonstantin Belousov #ifdef UFS_EXTATTR 1577df86ccf6SKonstantin Belousov if (e_restart) { 1578df86ccf6SKonstantin Belousov ufs_extattr_uepm_init(&ump->um_extattr); 1579df86ccf6SKonstantin Belousov #ifdef UFS_EXTATTR_AUTOSTART 1580df86ccf6SKonstantin Belousov (void) ufs_extattr_autostart(mp, td); 1581df86ccf6SKonstantin Belousov #endif 1582df86ccf6SKonstantin Belousov } 1583df86ccf6SKonstantin Belousov #endif 1584df86ccf6SKonstantin Belousov 15856fecb4e4SKonstantin Belousov return (error); 1586df8bae1dSRodney W. Grimes } 1587df8bae1dSRodney W. Grimes 1588df8bae1dSRodney W. Grimes /* 1589df8bae1dSRodney W. Grimes * Flush out all the files in a filesystem. 1590df8bae1dSRodney W. Grimes */ 159126f9a767SRodney W. Grimes int 1592b40ce416SJulian Elischer ffs_flushfiles(mp, flags, td) 159305f4ff5dSPoul-Henning Kamp struct mount *mp; 1594df8bae1dSRodney W. Grimes int flags; 1595b40ce416SJulian Elischer struct thread *td; 1596df8bae1dSRodney W. Grimes { 159705f4ff5dSPoul-Henning Kamp struct ufsmount *ump; 1598ba05dec5SKonstantin Belousov int qerror, error; 1599df8bae1dSRodney W. Grimes 1600df8bae1dSRodney W. Grimes ump = VFSTOUFS(mp); 1601ba05dec5SKonstantin Belousov qerror = 0; 1602df8bae1dSRodney W. Grimes #ifdef QUOTA 1603df8bae1dSRodney W. Grimes if (mp->mnt_flag & MNT_QUOTA) { 1604c1d9efcbSPoul-Henning Kamp int i; 1605f257b7a5SAlfred Perlstein error = vflush(mp, 0, SKIPSYSTEM|flags, td); 1606c1d9efcbSPoul-Henning Kamp if (error) 1607df8bae1dSRodney W. Grimes return (error); 1608df8bae1dSRodney W. Grimes for (i = 0; i < MAXQUOTAS; i++) { 1609ba05dec5SKonstantin Belousov error = quotaoff(td, mp, i); 1610ba05dec5SKonstantin Belousov if (error != 0) { 1611ba05dec5SKonstantin Belousov if ((flags & EARLYFLUSH) == 0) 1612ba05dec5SKonstantin Belousov return (error); 1613ba05dec5SKonstantin Belousov else 1614ba05dec5SKonstantin Belousov qerror = error; 1615df8bae1dSRodney W. Grimes } 1616ba05dec5SKonstantin Belousov } 1617ba05dec5SKonstantin Belousov 1618df8bae1dSRodney W. Grimes /* 1619ba05dec5SKonstantin Belousov * Here we fall through to vflush again to ensure that 1620ba05dec5SKonstantin Belousov * we have gotten rid of all the system vnodes, unless 1621ba05dec5SKonstantin Belousov * quotas must not be closed. 1622df8bae1dSRodney W. Grimes */ 1623df8bae1dSRodney W. Grimes } 1624df8bae1dSRodney W. Grimes #endif 1625e6e370a7SJeff Roberson ASSERT_VOP_LOCKED(ump->um_devvp, "ffs_flushfiles"); 1626e6e370a7SJeff Roberson if (ump->um_devvp->v_vflag & VV_COPYONWRITE) { 1627f257b7a5SAlfred Perlstein if ((error = vflush(mp, 0, SKIPSYSTEM | flags, td)) != 0) 1628f2a2857bSKirk McKusick return (error); 1629f2a2857bSKirk McKusick ffs_snapshot_unmount(mp); 163095e7a3c3STor Egge flags |= FORCECLOSE; 1631f2a2857bSKirk McKusick /* 1632f2a2857bSKirk McKusick * Here we fall through to vflush again to ensure 1633f2a2857bSKirk McKusick * that we have gotten rid of all the system vnodes. 1634f2a2857bSKirk McKusick */ 1635f2a2857bSKirk McKusick } 1636ba05dec5SKonstantin Belousov 1637b1897c19SJulian Elischer /* 1638ba05dec5SKonstantin Belousov * Do not close system files if quotas were not closed, to be 1639ba05dec5SKonstantin Belousov * able to sync the remaining dquots. The freeblks softupdate 1640ba05dec5SKonstantin Belousov * workitems might hold a reference on a dquot, preventing 1641ba05dec5SKonstantin Belousov * quotaoff() from completing. Next round of 1642ba05dec5SKonstantin Belousov * softdep_flushworklist() iteration should process the 1643ba05dec5SKonstantin Belousov * blockers, allowing the next run of quotaoff() to finally 1644ba05dec5SKonstantin Belousov * flush held dquots. 1645ba05dec5SKonstantin Belousov * 1646ba05dec5SKonstantin Belousov * Otherwise, flush all the files. 1647b1897c19SJulian Elischer */ 1648ba05dec5SKonstantin Belousov if (qerror == 0 && (error = vflush(mp, 0, flags, td)) != 0) 1649b1897c19SJulian Elischer return (error); 1650ba05dec5SKonstantin Belousov 1651b1897c19SJulian Elischer /* 1652b1897c19SJulian Elischer * Flush filesystem metadata. 1653b1897c19SJulian Elischer */ 1654cb05b60aSAttilio Rao vn_lock(ump->um_devvp, LK_EXCLUSIVE | LK_RETRY); 16558df6bac4SPoul-Henning Kamp error = VOP_FSYNC(ump->um_devvp, MNT_WAIT, td); 1656b249ce48SMateusz Guzik VOP_UNLOCK(ump->um_devvp); 1657df8bae1dSRodney W. Grimes return (error); 1658df8bae1dSRodney W. Grimes } 1659df8bae1dSRodney W. Grimes 1660df8bae1dSRodney W. Grimes /* 1661df8bae1dSRodney W. Grimes * Get filesystem statistics. 1662df8bae1dSRodney W. Grimes */ 1663adf41577SPoul-Henning Kamp static int 1664dfd233edSAttilio Rao ffs_statfs(mp, sbp) 1665df8bae1dSRodney W. Grimes struct mount *mp; 166605f4ff5dSPoul-Henning Kamp struct statfs *sbp; 1667df8bae1dSRodney W. Grimes { 166805f4ff5dSPoul-Henning Kamp struct ufsmount *ump; 166905f4ff5dSPoul-Henning Kamp struct fs *fs; 1670df8bae1dSRodney W. Grimes 1671df8bae1dSRodney W. Grimes ump = VFSTOUFS(mp); 1672df8bae1dSRodney W. Grimes fs = ump->um_fs; 16731c85e6a3SKirk McKusick if (fs->fs_magic != FS_UFS1_MAGIC && fs->fs_magic != FS_UFS2_MAGIC) 1674df8bae1dSRodney W. Grimes panic("ffs_statfs"); 1675fde81c7dSKirk McKusick sbp->f_version = STATFS_VERSION; 1676df8bae1dSRodney W. Grimes sbp->f_bsize = fs->fs_fsize; 1677df8bae1dSRodney W. Grimes sbp->f_iosize = fs->fs_bsize; 1678df8bae1dSRodney W. Grimes sbp->f_blocks = fs->fs_dsize; 16793ba649d7SJeff Roberson UFS_LOCK(ump); 1680df8bae1dSRodney W. Grimes sbp->f_bfree = fs->fs_cstotal.cs_nbfree * fs->fs_frag + 16819ccb939eSKirk McKusick fs->fs_cstotal.cs_nffree + dbtofsb(fs, fs->fs_pendingblocks); 16829ccb939eSKirk McKusick sbp->f_bavail = freespace(fs, fs->fs_minfree) + 16839ccb939eSKirk McKusick dbtofsb(fs, fs->fs_pendingblocks); 16841dc349abSEd Maste sbp->f_files = fs->fs_ncg * fs->fs_ipg - UFS_ROOTINO; 16859ccb939eSKirk McKusick sbp->f_ffree = fs->fs_cstotal.cs_nifree + fs->fs_pendinginodes; 16863ba649d7SJeff Roberson UFS_UNLOCK(ump); 1687a96da1c3SConrad Meyer sbp->f_namemax = UFS_MAXNAMLEN; 1688df8bae1dSRodney W. Grimes return (0); 1689df8bae1dSRodney W. Grimes } 1690df8bae1dSRodney W. Grimes 16911eabd967SKonstantin Belousov static bool 16921eabd967SKonstantin Belousov sync_doupdate(struct inode *ip) 16931eabd967SKonstantin Belousov { 16941eabd967SKonstantin Belousov 16951eabd967SKonstantin Belousov return ((ip->i_flag & (IN_ACCESS | IN_CHANGE | IN_MODIFIED | 16961eabd967SKonstantin Belousov IN_UPDATE)) != 0); 16971eabd967SKonstantin Belousov } 16981eabd967SKonstantin Belousov 169980663cadSMateusz Guzik static int 170080663cadSMateusz Guzik ffs_sync_lazy_filter(struct vnode *vp, void *arg __unused) 170180663cadSMateusz Guzik { 170280663cadSMateusz Guzik struct inode *ip; 170380663cadSMateusz Guzik 170480663cadSMateusz Guzik /* 170580663cadSMateusz Guzik * Flags are safe to access because ->v_data invalidation 170680663cadSMateusz Guzik * is held off by listmtx. 170780663cadSMateusz Guzik */ 170880663cadSMateusz Guzik if (vp->v_type == VNON) 170980663cadSMateusz Guzik return (false); 171080663cadSMateusz Guzik ip = VTOI(vp); 171180663cadSMateusz Guzik if (!sync_doupdate(ip) && (vp->v_iflag & VI_OWEINACT) == 0) 171280663cadSMateusz Guzik return (false); 171380663cadSMateusz Guzik return (true); 171480663cadSMateusz Guzik } 171580663cadSMateusz Guzik 1716df8bae1dSRodney W. Grimes /* 1717a988a5c6SKonstantin Belousov * For a lazy sync, we only care about access times, quotas and the 1718a988a5c6SKonstantin Belousov * superblock. Other filesystem changes are already converted to 1719a988a5c6SKonstantin Belousov * cylinder group blocks or inode blocks updates and are written to 1720a988a5c6SKonstantin Belousov * disk by syncer. 1721a988a5c6SKonstantin Belousov */ 1722a988a5c6SKonstantin Belousov static int 1723a988a5c6SKonstantin Belousov ffs_sync_lazy(mp) 1724a988a5c6SKonstantin Belousov struct mount *mp; 1725a988a5c6SKonstantin Belousov { 1726a988a5c6SKonstantin Belousov struct vnode *mvp, *vp; 1727a988a5c6SKonstantin Belousov struct inode *ip; 1728a988a5c6SKonstantin Belousov struct thread *td; 1729a988a5c6SKonstantin Belousov int allerror, error; 1730a988a5c6SKonstantin Belousov 1731a988a5c6SKonstantin Belousov allerror = 0; 1732a988a5c6SKonstantin Belousov td = curthread; 17330297c138SKirk McKusick if ((mp->mnt_flag & MNT_NOATIME) != 0) { 17340297c138SKirk McKusick #ifdef QUOTA 17350297c138SKirk McKusick qsync(mp); 17360297c138SKirk McKusick #endif 17370297c138SKirk McKusick goto sbupdate; 17380297c138SKirk McKusick } 173980663cadSMateusz Guzik MNT_VNODE_FOREACH_LAZY(vp, mp, mvp, ffs_sync_lazy_filter, NULL) { 174071469bb3SKirk McKusick if (vp->v_type == VNON) { 1741a988a5c6SKonstantin Belousov VI_UNLOCK(vp); 1742a988a5c6SKonstantin Belousov continue; 1743a988a5c6SKonstantin Belousov } 1744a988a5c6SKonstantin Belousov ip = VTOI(vp); 1745a988a5c6SKonstantin Belousov 1746a988a5c6SKonstantin Belousov /* 1747a988a5c6SKonstantin Belousov * The IN_ACCESS flag is converted to IN_MODIFIED by 1748a988a5c6SKonstantin Belousov * ufs_close() and ufs_getattr() by the calls to 1749ea573a50SKonstantin Belousov * ufs_itimes_locked(), without subsequent UFS_UPDATE(). 1750ea573a50SKonstantin Belousov * Test also all the other timestamp flags too, to pick up 1751ea573a50SKonstantin Belousov * any other cases that could be missed. 1752a988a5c6SKonstantin Belousov */ 17531eabd967SKonstantin Belousov if (!sync_doupdate(ip) && (vp->v_iflag & VI_OWEINACT) == 0) { 1754a988a5c6SKonstantin Belousov VI_UNLOCK(vp); 1755a988a5c6SKonstantin Belousov continue; 1756a988a5c6SKonstantin Belousov } 1757a92a971bSMateusz Guzik if ((error = vget(vp, LK_EXCLUSIVE | LK_NOWAIT | LK_INTERLOCK)) != 0) 1758a988a5c6SKonstantin Belousov continue; 17590297c138SKirk McKusick #ifdef QUOTA 17600297c138SKirk McKusick qsyncvp(vp); 17610297c138SKirk McKusick #endif 17621eabd967SKonstantin Belousov if (sync_doupdate(ip)) 1763a988a5c6SKonstantin Belousov error = ffs_update(vp, 0); 1764a988a5c6SKonstantin Belousov if (error != 0) 1765a988a5c6SKonstantin Belousov allerror = error; 1766a988a5c6SKonstantin Belousov vput(vp); 1767a988a5c6SKonstantin Belousov } 17680297c138SKirk McKusick sbupdate: 1769a988a5c6SKonstantin Belousov if (VFSTOUFS(mp)->um_fs->fs_fmod != 0 && 1770a988a5c6SKonstantin Belousov (error = ffs_sbupdate(VFSTOUFS(mp), MNT_LAZY, 0)) != 0) 1771a988a5c6SKonstantin Belousov allerror = error; 1772a988a5c6SKonstantin Belousov return (allerror); 1773a988a5c6SKonstantin Belousov } 1774a988a5c6SKonstantin Belousov 1775a988a5c6SKonstantin Belousov /* 1776df8bae1dSRodney W. Grimes * Go through the disk queues to initiate sandbagged IO; 1777df8bae1dSRodney W. Grimes * go through the inodes to write those that have been modified; 1778df8bae1dSRodney W. Grimes * initiate the writing of the super block if it has been modified. 1779df8bae1dSRodney W. Grimes * 1780a988a5c6SKonstantin Belousov * Note: we are always called with the filesystem marked busy using 1781a988a5c6SKonstantin Belousov * vfs_busy(). 1782df8bae1dSRodney W. Grimes */ 1783adf41577SPoul-Henning Kamp static int 1784dfd233edSAttilio Rao ffs_sync(mp, waitfor) 1785df8bae1dSRodney W. Grimes struct mount *mp; 1786df8bae1dSRodney W. Grimes int waitfor; 1787df8bae1dSRodney W. Grimes { 178882be0a5aSTor Egge struct vnode *mvp, *vp, *devvp; 1789dfd233edSAttilio Rao struct thread *td; 1790996c772fSJohn Dyson struct inode *ip; 1791996c772fSJohn Dyson struct ufsmount *ump = VFSTOUFS(mp); 1792996c772fSJohn Dyson struct fs *fs; 179369baeadcSKonstantin Belousov int error, count, lockreq, allerror = 0; 1794791dd2faSTor Egge int suspend; 1795791dd2faSTor Egge int suspended; 1796791dd2faSTor Egge int secondary_writes; 1797791dd2faSTor Egge int secondary_accwrites; 1798791dd2faSTor Egge int softdep_deps; 1799791dd2faSTor Egge int softdep_accdeps; 1800156cb265SPoul-Henning Kamp struct bufobj *bo; 1801df8bae1dSRodney W. Grimes 180219c87af0SKirk McKusick suspend = 0; 180319c87af0SKirk McKusick suspended = 0; 1804dfd233edSAttilio Rao td = curthread; 1805df8bae1dSRodney W. Grimes fs = ump->um_fs; 1806b60ee81eSKirk McKusick if (fs->fs_fmod != 0 && fs->fs_ronly != 0 && ump->um_fsckpid == 0) 1807b60ee81eSKirk McKusick panic("%s: ffs_sync: modification on read-only filesystem", 1808b60ee81eSKirk McKusick fs->fs_fsmnt); 18094af9f77eSKonstantin Belousov if (waitfor == MNT_LAZY) { 18104af9f77eSKonstantin Belousov if (!rebooting) 1811a988a5c6SKonstantin Belousov return (ffs_sync_lazy(mp)); 18124af9f77eSKonstantin Belousov waitfor = MNT_NOWAIT; 18134af9f77eSKonstantin Belousov } 1814a988a5c6SKonstantin Belousov 181519c87af0SKirk McKusick /* 1816df8bae1dSRodney W. Grimes * Write back each (modified) inode. 1817df8bae1dSRodney W. Grimes */ 1818245df27cSMatthew Dillon lockreq = LK_EXCLUSIVE | LK_NOWAIT; 1819791dd2faSTor Egge if (waitfor == MNT_SUSPEND) { 1820791dd2faSTor Egge suspend = 1; 1821791dd2faSTor Egge waitfor = MNT_WAIT; 1822791dd2faSTor Egge } 182369baeadcSKonstantin Belousov if (waitfor == MNT_WAIT) 1824245df27cSMatthew Dillon lockreq = LK_EXCLUSIVE; 182541d4783dSJeff Roberson lockreq |= LK_INTERLOCK | LK_SLEEPFAIL; 1826df8bae1dSRodney W. Grimes loop: 1827791dd2faSTor Egge /* Grab snapshot of secondary write counts */ 182871469bb3SKirk McKusick MNT_ILOCK(mp); 1829791dd2faSTor Egge secondary_writes = mp->mnt_secondary_writes; 1830791dd2faSTor Egge secondary_accwrites = mp->mnt_secondary_accwrites; 183171469bb3SKirk McKusick MNT_IUNLOCK(mp); 1832791dd2faSTor Egge 1833791dd2faSTor Egge /* Grab snapshot of softdep dependency counts */ 1834791dd2faSTor Egge softdep_get_depcounts(mp, &softdep_deps, &softdep_accdeps); 1835791dd2faSTor Egge 183671469bb3SKirk McKusick MNT_VNODE_FOREACH_ALL(vp, mp, mvp) { 1837245df27cSMatthew Dillon /* 1838e0c17408SKonstantin Belousov * Depend on the vnode interlock to keep things stable enough 1839245df27cSMatthew Dillon * for a quick test. Since there might be hundreds of 1840245df27cSMatthew Dillon * thousands of vnodes, we cannot afford even a subroutine 1841245df27cSMatthew Dillon * call unless there's a good chance that we have work to do. 1842245df27cSMatthew Dillon */ 184371469bb3SKirk McKusick if (vp->v_type == VNON) { 18442f05568aSJeff Roberson VI_UNLOCK(vp); 18452f05568aSJeff Roberson continue; 18462f05568aSJeff Roberson } 1847df8bae1dSRodney W. Grimes ip = VTOI(vp); 184871469bb3SKirk McKusick if ((ip->i_flag & 1849cf60e8e4SKirk McKusick (IN_ACCESS | IN_CHANGE | IN_MODIFIED | IN_UPDATE)) == 0 && 185071469bb3SKirk McKusick vp->v_bufobj.bo_dirty.bv_cnt == 0) { 18512f05568aSJeff Roberson VI_UNLOCK(vp); 1852df8bae1dSRodney W. Grimes continue; 1853996c772fSJohn Dyson } 1854a92a971bSMateusz Guzik if ((error = vget(vp, lockreq)) != 0) { 185582be0a5aSTor Egge if (error == ENOENT || error == ENOLCK) { 185671469bb3SKirk McKusick MNT_VNODE_FOREACH_ALL_ABORT(mp, mvp); 1857df8bae1dSRodney W. Grimes goto loop; 185882be0a5aSTor Egge } 18592f05568aSJeff Roberson continue; 18602f05568aSJeff Roberson } 18610297c138SKirk McKusick #ifdef QUOTA 18620297c138SKirk McKusick qsyncvp(vp); 18630297c138SKirk McKusick #endif 18648a1509e4SKonstantin Belousov for (;;) { 18658a1509e4SKonstantin Belousov error = ffs_syncvnode(vp, waitfor, 0); 18668a1509e4SKonstantin Belousov if (error == ERELOOKUP) 18678a1509e4SKonstantin Belousov continue; 18688a1509e4SKonstantin Belousov if (error != 0) 1869df8bae1dSRodney W. Grimes allerror = error; 18708a1509e4SKonstantin Belousov break; 18718a1509e4SKonstantin Belousov } 187241d4783dSJeff Roberson vput(vp); 1873245df27cSMatthew Dillon } 1874df8bae1dSRodney W. Grimes /* 1875df8bae1dSRodney W. Grimes * Force stale filesystem control information to be flushed. 1876df8bae1dSRodney W. Grimes */ 18774af9f77eSKonstantin Belousov if (waitfor == MNT_WAIT || rebooting) { 1878b40ce416SJulian Elischer if ((error = softdep_flushworklist(ump->um_mountp, &count, td))) 18799b971133SKirk McKusick allerror = error; 1880d79ff54bSChuck Silvers if (ffs_fsfail_cleanup(ump, allerror)) 1881d79ff54bSChuck Silvers allerror = 0; 18829b971133SKirk McKusick /* Flushed work items may create new vnodes to clean */ 188371469bb3SKirk McKusick if (allerror == 0 && count) 18849b971133SKirk McKusick goto loop; 18859b971133SKirk McKusick } 188619c87af0SKirk McKusick 1887112f7372SKirk McKusick devvp = ump->um_devvp; 1888156cb265SPoul-Henning Kamp bo = &devvp->v_bufobj; 1889698b1a66SJeff Roberson BO_LOCK(bo); 189019c87af0SKirk McKusick if (bo->bo_numoutput > 0 || bo->bo_dirty.bv_cnt > 0) { 1891698b1a66SJeff Roberson BO_UNLOCK(bo); 1892698b1a66SJeff Roberson vn_lock(devvp, LK_EXCLUSIVE | LK_RETRY); 18934af9f77eSKonstantin Belousov error = VOP_FSYNC(devvp, waitfor, td); 1894b249ce48SMateusz Guzik VOP_UNLOCK(devvp); 18954af9f77eSKonstantin Belousov if (MOUNTEDSOFTDEP(mp) && (error == 0 || error == EAGAIN)) 18964af9f77eSKonstantin Belousov error = ffs_sbupdate(ump, waitfor, 0); 18974af9f77eSKonstantin Belousov if (error != 0) 18984af9f77eSKonstantin Belousov allerror = error; 1899d79ff54bSChuck Silvers if (ffs_fsfail_cleanup(ump, allerror)) 1900d79ff54bSChuck Silvers allerror = 0; 190171469bb3SKirk McKusick if (allerror == 0 && waitfor == MNT_WAIT) 1902112f7372SKirk McKusick goto loop; 1903791dd2faSTor Egge } else if (suspend != 0) { 1904791dd2faSTor Egge if (softdep_check_suspend(mp, 1905791dd2faSTor Egge devvp, 1906791dd2faSTor Egge softdep_deps, 1907791dd2faSTor Egge softdep_accdeps, 1908791dd2faSTor Egge secondary_writes, 190971469bb3SKirk McKusick secondary_accwrites) != 0) { 191071469bb3SKirk McKusick MNT_IUNLOCK(mp); 1911791dd2faSTor Egge goto loop; /* More work needed */ 191271469bb3SKirk McKusick } 1913791dd2faSTor Egge mtx_assert(MNT_MTX(mp), MA_OWNED); 1914ca2fa807STor Egge mp->mnt_kern_flag |= MNTK_SUSPEND2 | MNTK_SUSPENDED; 1915791dd2faSTor Egge MNT_IUNLOCK(mp); 1916791dd2faSTor Egge suspended = 1; 1917112f7372SKirk McKusick } else 1918698b1a66SJeff Roberson BO_UNLOCK(bo); 1919996c772fSJohn Dyson /* 1920996c772fSJohn Dyson * Write back modified superblock. 1921996c772fSJohn Dyson */ 1922791dd2faSTor Egge if (fs->fs_fmod != 0 && 1923791dd2faSTor Egge (error = ffs_sbupdate(ump, waitfor, suspended)) != 0) 1924996c772fSJohn Dyson allerror = error; 1925d79ff54bSChuck Silvers if (ffs_fsfail_cleanup(ump, allerror)) 1926d79ff54bSChuck Silvers allerror = 0; 1927df8bae1dSRodney W. Grimes return (allerror); 1928df8bae1dSRodney W. Grimes } 1929df8bae1dSRodney W. Grimes 1930df8bae1dSRodney W. Grimes int 1931a0595d02SKirk McKusick ffs_vget(mp, ino, flags, vpp) 1932df8bae1dSRodney W. Grimes struct mount *mp; 1933df8bae1dSRodney W. Grimes ino_t ino; 1934a0595d02SKirk McKusick int flags; 1935df8bae1dSRodney W. Grimes struct vnode **vpp; 1936df8bae1dSRodney W. Grimes { 19377b7ed832SKonstantin Belousov return (ffs_vgetf(mp, ino, flags, vpp, 0)); 19387b7ed832SKonstantin Belousov } 19397b7ed832SKonstantin Belousov 19407b7ed832SKonstantin Belousov int 19417b7ed832SKonstantin Belousov ffs_vgetf(mp, ino, flags, vpp, ffs_flags) 19427b7ed832SKonstantin Belousov struct mount *mp; 19437b7ed832SKonstantin Belousov ino_t ino; 19447b7ed832SKonstantin Belousov int flags; 19457b7ed832SKonstantin Belousov struct vnode **vpp; 19467b7ed832SKonstantin Belousov int ffs_flags; 19477b7ed832SKonstantin Belousov { 1948996c772fSJohn Dyson struct fs *fs; 1949996c772fSJohn Dyson struct inode *ip; 1950df8bae1dSRodney W. Grimes struct ufsmount *ump; 1951df8bae1dSRodney W. Grimes struct buf *bp; 1952df8bae1dSRodney W. Grimes struct vnode *vp; 1953d79ff54bSChuck Silvers daddr_t dbn; 1954f576a00dSSemen Ustimenko int error; 1955df8bae1dSRodney W. Grimes 195616040222SKonstantin Belousov MPASS((ffs_flags & FFSV_REPLACE) == 0 || (flags & LK_EXCLUSIVE) != 0); 195716040222SKonstantin Belousov 195851f5ce0cSPoul-Henning Kamp error = vfs_hash_get(mp, ino, flags, curthread, vpp, NULL, NULL); 195916040222SKonstantin Belousov if (error != 0) 196014bc0685SPoul-Henning Kamp return (error); 196116040222SKonstantin Belousov if (*vpp != NULL) { 196216040222SKonstantin Belousov if ((ffs_flags & FFSV_REPLACE) == 0) 196316040222SKonstantin Belousov return (0); 196416040222SKonstantin Belousov vgone(*vpp); 196516040222SKonstantin Belousov vput(*vpp); 196616040222SKonstantin Belousov } 1967f576a00dSSemen Ustimenko 1968f576a00dSSemen Ustimenko /* 1969d6919865SJeff Roberson * We must promote to an exclusive lock for vnode creation. This 1970d6919865SJeff Roberson * can happen if lookup is passed LOCKSHARED. 1971d6919865SJeff Roberson */ 1972d6919865SJeff Roberson if ((flags & LK_TYPE_MASK) == LK_SHARED) { 1973d6919865SJeff Roberson flags &= ~LK_TYPE_MASK; 1974d6919865SJeff Roberson flags |= LK_EXCLUSIVE; 1975d6919865SJeff Roberson } 1976d6919865SJeff Roberson 1977d6919865SJeff Roberson /* 197813866b3fSSemen Ustimenko * We do not lock vnode creation as it is believed to be too 1979f576a00dSSemen Ustimenko * expensive for such rare case as simultaneous creation of vnode 1980f576a00dSSemen Ustimenko * for same ino by different processes. We just allow them to race 1981f576a00dSSemen Ustimenko * and check later to decide who wins. Let the race begin! 1982f576a00dSSemen Ustimenko */ 198314bc0685SPoul-Henning Kamp 198414bc0685SPoul-Henning Kamp ump = VFSTOUFS(mp); 198514bc0685SPoul-Henning Kamp fs = ump->um_fs; 19869d5a594fSMateusz Guzik ip = uma_zalloc_smr(uma_inode, M_WAITOK | M_ZERO); 19872f9bae59SDavid Greenman 1988df8bae1dSRodney W. Grimes /* Allocate a new vnode/inode. */ 198943a993bbSKirk McKusick error = getnewvnode("ufs", mp, fs->fs_magic == FS_UFS1_MAGIC ? 199043a993bbSKirk McKusick &ffs_vnodeops1 : &ffs_vnodeops2, &vp); 1991c9671602SPoul-Henning Kamp if (error) { 1992df8bae1dSRodney W. Grimes *vpp = NULL; 19939d5a594fSMateusz Guzik uma_zfree_smr(uma_inode, ip); 1994df8bae1dSRodney W. Grimes return (error); 1995df8bae1dSRodney W. Grimes } 199667e87166SBoris Popov /* 199733fc3625SJohn Baldwin * FFS supports recursive locking. 199867e87166SBoris Popov */ 19993634d5b2SJohn Baldwin lockmgr(vp->v_vnlock, LK_EXCLUSIVE, NULL); 2000628f51d2SAttilio Rao VN_LOCK_AREC(vp); 2001df8bae1dSRodney W. Grimes vp->v_data = ip; 20025d9d81e7SPoul-Henning Kamp vp->v_bufobj.bo_bsize = fs->fs_bsize; 2003df8bae1dSRodney W. Grimes ip->i_vnode = vp; 20041c85e6a3SKirk McKusick ip->i_ump = ump; 2005df8bae1dSRodney W. Grimes ip->i_number = ino; 2006e65f5a4eSKonstantin Belousov ip->i_ea_refs = 0; 200774a87c38SKirk McKusick ip->i_nextclustercg = -1; 2008e1db6897SKonstantin Belousov ip->i_flag = fs->fs_magic == FS_UFS1_MAGIC ? 0 : IN_UFS2; 200972d28f97SKirk McKusick ip->i_mode = 0; /* ensure error cases below throw away vnode */ 201061846fc4SKonstantin Belousov #ifdef DIAGNOSTIC 201161846fc4SKonstantin Belousov ufs_init_trackers(ip); 201261846fc4SKonstantin Belousov #endif 2013df8bae1dSRodney W. Grimes #ifdef QUOTA 2014c1d9efcbSPoul-Henning Kamp { 2015c1d9efcbSPoul-Henning Kamp int i; 2016df8bae1dSRodney W. Grimes for (i = 0; i < MAXQUOTAS; i++) 2017df8bae1dSRodney W. Grimes ip->i_dquot[i] = NODQUOT; 2018c1d9efcbSPoul-Henning Kamp } 2019df8bae1dSRodney W. Grimes #endif 2020df8bae1dSRodney W. Grimes 20217b7ed832SKonstantin Belousov if (ffs_flags & FFSV_FORCEINSMQ) 20227b7ed832SKonstantin Belousov vp->v_vflag |= VV_FORCEINSMQ; 202361b9d89fSTor Egge error = insmntque(vp, mp); 202461b9d89fSTor Egge if (error != 0) { 20259d5a594fSMateusz Guzik uma_zfree_smr(uma_inode, ip); 202661b9d89fSTor Egge *vpp = NULL; 202761b9d89fSTor Egge return (error); 202861b9d89fSTor Egge } 20297b7ed832SKonstantin Belousov vp->v_vflag &= ~VV_FORCEINSMQ; 2030a80d8caaSPawel Jakub Dawidek error = vfs_hash_insert(vp, ino, flags, curthread, vpp, NULL, NULL); 203116040222SKonstantin Belousov if (error != 0) 2032f576a00dSSemen Ustimenko return (error); 203316040222SKonstantin Belousov if (*vpp != NULL) { 203416040222SKonstantin Belousov /* 203516040222SKonstantin Belousov * Calls from ffs_valloc() (i.e. FFSV_REPLACE set) 203616040222SKonstantin Belousov * operate on empty inode, which must not be found by 203716040222SKonstantin Belousov * other threads until fully filled. Vnode for empty 203816040222SKonstantin Belousov * inode must be not re-inserted on the hash by other 203916040222SKonstantin Belousov * thread, after removal by us at the beginning. 204016040222SKonstantin Belousov */ 204116040222SKonstantin Belousov MPASS((ffs_flags & FFSV_REPLACE) == 0); 204216040222SKonstantin Belousov return (0); 204316040222SKonstantin Belousov } 2044f576a00dSSemen Ustimenko 2045df8bae1dSRodney W. Grimes /* Read in the disk contents for the inode, copy into the inode. */ 2046d79ff54bSChuck Silvers dbn = fsbtodb(fs, ino_to_fsba(fs, ino)); 2047d79ff54bSChuck Silvers error = ffs_breadz(ump, ump->um_devvp, dbn, dbn, (int)fs->fs_bsize, 2048d79ff54bSChuck Silvers NULL, NULL, 0, NOCRED, 0, NULL, &bp); 2049d79ff54bSChuck Silvers if (error != 0) { 2050df8bae1dSRodney W. Grimes /* 2051df8bae1dSRodney W. Grimes * The inode does not contain anything useful, so it would 2052df8bae1dSRodney W. Grimes * be misleading to leave it on its hash chain. With mode 2053df8bae1dSRodney W. Grimes * still zero, it will be unlinked and returned to the free 2054df8bae1dSRodney W. Grimes * list by vput(). 2055df8bae1dSRodney W. Grimes */ 20566c44a3e0SMateusz Guzik vgone(vp); 2057bd7e5f99SJohn Dyson vput(vp); 2058df8bae1dSRodney W. Grimes *vpp = NULL; 2059df8bae1dSRodney W. Grimes return (error); 2060df8bae1dSRodney W. Grimes } 2061e1db6897SKonstantin Belousov if (I_IS_UFS1(ip)) 2062a163d034SWarner Losh ip->i_din1 = uma_zalloc(uma_ufs1, M_WAITOK); 2063de6ba7c0SPoul-Henning Kamp else 2064a163d034SWarner Losh ip->i_din2 = uma_zalloc(uma_ufs2, M_WAITOK); 20659fc5d538SKirk McKusick if ((error = ffs_load_inode(bp, ip, fs, ino)) != 0) { 20669fc5d538SKirk McKusick bqrelse(bp); 20676c44a3e0SMateusz Guzik vgone(vp); 20689fc5d538SKirk McKusick vput(vp); 20699fc5d538SKirk McKusick *vpp = NULL; 20709fc5d538SKirk McKusick return (error); 20719fc5d538SKirk McKusick } 2072b1897c19SJulian Elischer if (DOINGSOFTDEP(vp)) 2073b1897c19SJulian Elischer softdep_load_inodeblock(ip); 2074b1897c19SJulian Elischer else 2075b1897c19SJulian Elischer ip->i_effnlink = ip->i_nlink; 2076bd7e5f99SJohn Dyson bqrelse(bp); 2077df8bae1dSRodney W. Grimes 2078df8bae1dSRodney W. Grimes /* 2079df8bae1dSRodney W. Grimes * Initialize the vnode from the inode, check for aliases. 2080df8bae1dSRodney W. Grimes * Note that the underlying vnode may have changed. 2081df8bae1dSRodney W. Grimes */ 2082e1db6897SKonstantin Belousov error = ufs_vinit(mp, I_IS_UFS1(ip) ? &ffs_fifoops1 : &ffs_fifoops2, 2083e1db6897SKonstantin Belousov &vp); 2084c9671602SPoul-Henning Kamp if (error) { 20856c44a3e0SMateusz Guzik vgone(vp); 2086df8bae1dSRodney W. Grimes vput(vp); 2087df8bae1dSRodney W. Grimes *vpp = NULL; 2088df8bae1dSRodney W. Grimes return (error); 2089df8bae1dSRodney W. Grimes } 2090de68347bSPoul-Henning Kamp 2091df8bae1dSRodney W. Grimes /* 20925c24d6eeSPoul-Henning Kamp * Finish inode initialization. 2093df8bae1dSRodney W. Grimes */ 209433fc3625SJohn Baldwin if (vp->v_type != VFIFO) { 209533fc3625SJohn Baldwin /* FFS supports shared locking for all files except fifos. */ 209633fc3625SJohn Baldwin VN_LOCK_ASHARE(vp); 209733fc3625SJohn Baldwin } 2098de68347bSPoul-Henning Kamp 2099df8bae1dSRodney W. Grimes /* 2100df8bae1dSRodney W. Grimes * Set up a generation number for this inode if it does not 2101df8bae1dSRodney W. Grimes * already have one. This should only happen on old filesystems. 2102df8bae1dSRodney W. Grimes */ 2103df8bae1dSRodney W. Grimes if (ip->i_gen == 0) { 210457d2ac2fSKevin Lo while (ip->i_gen == 0) 210557d2ac2fSKevin Lo ip->i_gen = arc4random(); 21061c85e6a3SKirk McKusick if ((vp->v_mount->mnt_flag & MNT_RDONLY) == 0) { 2107ac4ec141SMateusz Guzik UFS_INODE_SET_FLAG(ip, IN_MODIFIED); 2108b403319bSAlexander Kabaev DIP_SET(ip, i_gen, ip->i_gen); 21091c85e6a3SKirk McKusick } 2110df8bae1dSRodney W. Grimes } 2111763bbd2fSRobert Watson #ifdef MAC 2112763bbd2fSRobert Watson if ((mp->mnt_flag & MNT_MULTILABEL) && ip->i_mode) { 2113763bbd2fSRobert Watson /* 2114763bbd2fSRobert Watson * If this vnode is already allocated, and we're running 2115763bbd2fSRobert Watson * multi-label, attempt to perform a label association 2116763bbd2fSRobert Watson * from the extended attributes on the inode. 2117763bbd2fSRobert Watson */ 211830d239bcSRobert Watson error = mac_vnode_associate_extattr(mp, vp); 2119763bbd2fSRobert Watson if (error) { 2120763bbd2fSRobert Watson /* ufs_inactive will release ip->i_devvp ref. */ 21216c44a3e0SMateusz Guzik vgone(vp); 2122763bbd2fSRobert Watson vput(vp); 2123763bbd2fSRobert Watson *vpp = NULL; 2124763bbd2fSRobert Watson return (error); 2125763bbd2fSRobert Watson } 2126763bbd2fSRobert Watson } 2127763bbd2fSRobert Watson #endif 2128763bbd2fSRobert Watson 2129df8bae1dSRodney W. Grimes *vpp = vp; 2130df8bae1dSRodney W. Grimes return (0); 2131df8bae1dSRodney W. Grimes } 2132df8bae1dSRodney W. Grimes 2133df8bae1dSRodney W. Grimes /* 2134df8bae1dSRodney W. Grimes * File handle to vnode 2135df8bae1dSRodney W. Grimes * 2136df8bae1dSRodney W. Grimes * Have to be really careful about stale file handles: 2137df8bae1dSRodney W. Grimes * - check that the inode number is valid 2138abe53f7eSKirk McKusick * - for UFS2 check that the inode number is initialized 2139df8bae1dSRodney W. Grimes * - call ffs_vget() to get the locked inode 2140df8bae1dSRodney W. Grimes * - check for an unallocated inode (i_mode == 0) 2141df8bae1dSRodney W. Grimes * - check that the given client host has export rights and return 2142df8bae1dSRodney W. Grimes * those rights via. exflagsp and credanonp 2143df8bae1dSRodney W. Grimes */ 2144adf41577SPoul-Henning Kamp static int 2145694a586aSRick Macklem ffs_fhtovp(mp, fhp, flags, vpp) 214605f4ff5dSPoul-Henning Kamp struct mount *mp; 2147df8bae1dSRodney W. Grimes struct fid *fhp; 2148694a586aSRick Macklem int flags; 2149df8bae1dSRodney W. Grimes struct vnode **vpp; 2150df8bae1dSRodney W. Grimes { 215105f4ff5dSPoul-Henning Kamp struct ufid *ufhp; 2152abe53f7eSKirk McKusick struct ufsmount *ump; 2153df8bae1dSRodney W. Grimes struct fs *fs; 2154abe53f7eSKirk McKusick struct cg *cgp; 2155abe53f7eSKirk McKusick struct buf *bp; 2156abe53f7eSKirk McKusick ino_t ino; 2157abe53f7eSKirk McKusick u_int cg; 2158abe53f7eSKirk McKusick int error; 2159df8bae1dSRodney W. Grimes 2160df8bae1dSRodney W. Grimes ufhp = (struct ufid *)fhp; 2161abe53f7eSKirk McKusick ino = ufhp->ufid_ino; 2162abe53f7eSKirk McKusick ump = VFSTOUFS(mp); 2163abe53f7eSKirk McKusick fs = ump->um_fs; 21641dc349abSEd Maste if (ino < UFS_ROOTINO || ino >= fs->fs_ncg * fs->fs_ipg) 2165df8bae1dSRodney W. Grimes return (ESTALE); 2166abe53f7eSKirk McKusick /* 2167abe53f7eSKirk McKusick * Need to check if inode is initialized because UFS2 does lazy 2168abe53f7eSKirk McKusick * initialization and nfs_fhtovp can offer arbitrary inode numbers. 2169abe53f7eSKirk McKusick */ 2170abe53f7eSKirk McKusick if (fs->fs_magic != FS_UFS2_MAGIC) 2171abe53f7eSKirk McKusick return (ufs_fhtovp(mp, ufhp, flags, vpp)); 2172abe53f7eSKirk McKusick cg = ino_to_cg(fs, ino); 217344d37182SKirk McKusick if ((error = ffs_getcg(fs, ump->um_devvp, cg, 0, &bp, &cgp)) != 0) 2174abe53f7eSKirk McKusick return (error); 21759c4f551eSKirk McKusick if (ino >= cg * fs->fs_ipg + cgp->cg_initediblk) { 2176abe53f7eSKirk McKusick brelse(bp); 2177abe53f7eSKirk McKusick return (ESTALE); 2178abe53f7eSKirk McKusick } 2179abe53f7eSKirk McKusick brelse(bp); 2180694a586aSRick Macklem return (ufs_fhtovp(mp, ufhp, flags, vpp)); 2181df8bae1dSRodney W. Grimes } 2182df8bae1dSRodney W. Grimes 2183df8bae1dSRodney W. Grimes /* 21845346934fSIan Dowse * Initialize the filesystem. 2185996c772fSJohn Dyson */ 2186996c772fSJohn Dyson static int 2187996c772fSJohn Dyson ffs_init(vfsp) 2188996c772fSJohn Dyson struct vfsconf *vfsp; 2189996c772fSJohn Dyson { 2190996c772fSJohn Dyson 21911848286aSEdward Tomasz Napierala ffs_susp_initialize(); 2192b1897c19SJulian Elischer softdep_initialize(); 2193996c772fSJohn Dyson return (ufs_init(vfsp)); 2194996c772fSJohn Dyson } 2195996c772fSJohn Dyson 2196996c772fSJohn Dyson /* 21975346934fSIan Dowse * Undo the work of ffs_init(). 21985346934fSIan Dowse */ 21995346934fSIan Dowse static int 22005346934fSIan Dowse ffs_uninit(vfsp) 22015346934fSIan Dowse struct vfsconf *vfsp; 22025346934fSIan Dowse { 22035346934fSIan Dowse int ret; 22045346934fSIan Dowse 22055346934fSIan Dowse ret = ufs_uninit(vfsp); 22065346934fSIan Dowse softdep_uninitialize(); 22071848286aSEdward Tomasz Napierala ffs_susp_uninitialize(); 2208d79ff54bSChuck Silvers taskqueue_drain_all(taskqueue_thread); 22095346934fSIan Dowse return (ret); 22105346934fSIan Dowse } 22115346934fSIan Dowse 22125346934fSIan Dowse /* 2213dffce215SKirk McKusick * Structure used to pass information from ffs_sbupdate to its 2214dffce215SKirk McKusick * helper routine ffs_use_bwrite. 2215dffce215SKirk McKusick */ 2216dffce215SKirk McKusick struct devfd { 2217dffce215SKirk McKusick struct ufsmount *ump; 2218dffce215SKirk McKusick struct buf *sbbp; 2219dffce215SKirk McKusick int waitfor; 2220dffce215SKirk McKusick int suspended; 2221dffce215SKirk McKusick int error; 2222dffce215SKirk McKusick }; 2223dffce215SKirk McKusick 2224dffce215SKirk McKusick /* 2225df8bae1dSRodney W. Grimes * Write a superblock and associated information back to disk. 2226df8bae1dSRodney W. Grimes */ 22271a60c7fcSPawel Jakub Dawidek int 2228927a12aeSKirk McKusick ffs_sbupdate(ump, waitfor, suspended) 2229927a12aeSKirk McKusick struct ufsmount *ump; 2230df8bae1dSRodney W. Grimes int waitfor; 2231791dd2faSTor Egge int suspended; 2232df8bae1dSRodney W. Grimes { 2233dffce215SKirk McKusick struct fs *fs; 22343ba649d7SJeff Roberson struct buf *sbbp; 2235dffce215SKirk McKusick struct devfd devfd; 2236df8bae1dSRodney W. Grimes 2237dffce215SKirk McKusick fs = ump->um_fs; 223874f3809aSKirk McKusick if (fs->fs_ronly == 1 && 2239927a12aeSKirk McKusick (ump->um_mountp->mnt_flag & (MNT_RDONLY | MNT_UPDATE)) != 2240927a12aeSKirk McKusick (MNT_RDONLY | MNT_UPDATE) && ump->um_fsckpid == 0) 224174f3809aSKirk McKusick panic("ffs_sbupdate: write read-only filesystem"); 2242996c772fSJohn Dyson /* 22433ba649d7SJeff Roberson * We use the superblock's buf to serialize calls to ffs_sbupdate(). 22443ba649d7SJeff Roberson */ 2245927a12aeSKirk McKusick sbbp = getblk(ump->um_devvp, btodb(fs->fs_sblockloc), 2246927a12aeSKirk McKusick (int)fs->fs_sbsize, 0, 0, 0); 22473ba649d7SJeff Roberson /* 2248dffce215SKirk McKusick * Initialize info needed for write function. 2249996c772fSJohn Dyson */ 2250dffce215SKirk McKusick devfd.ump = ump; 2251dffce215SKirk McKusick devfd.sbbp = sbbp; 2252dffce215SKirk McKusick devfd.waitfor = waitfor; 2253dffce215SKirk McKusick devfd.suspended = suspended; 2254dffce215SKirk McKusick devfd.error = 0; 2255dffce215SKirk McKusick return (ffs_sbput(&devfd, fs, fs->fs_sblockloc, ffs_use_bwrite)); 2256dffce215SKirk McKusick } 2257dffce215SKirk McKusick 2258dffce215SKirk McKusick /* 2259dffce215SKirk McKusick * Write function for use by filesystem-layer routines. 2260dffce215SKirk McKusick */ 2261dffce215SKirk McKusick static int 2262dffce215SKirk McKusick ffs_use_bwrite(void *devfd, off_t loc, void *buf, int size) 2263dffce215SKirk McKusick { 2264dffce215SKirk McKusick struct devfd *devfdp; 2265dffce215SKirk McKusick struct ufsmount *ump; 2266dffce215SKirk McKusick struct buf *bp; 2267dffce215SKirk McKusick struct fs *fs; 2268dffce215SKirk McKusick int error; 2269dffce215SKirk McKusick 2270dffce215SKirk McKusick devfdp = devfd; 2271dffce215SKirk McKusick ump = devfdp->ump; 2272dffce215SKirk McKusick fs = ump->um_fs; 2273dffce215SKirk McKusick /* 2274dffce215SKirk McKusick * Writing the superblock summary information. 2275dffce215SKirk McKusick */ 2276dffce215SKirk McKusick if (loc != fs->fs_sblockloc) { 2277dffce215SKirk McKusick bp = getblk(ump->um_devvp, btodb(loc), size, 0, 0, 0); 2278dffce215SKirk McKusick bcopy(buf, bp->b_data, (u_int)size); 2279dffce215SKirk McKusick if (devfdp->suspended) 2280791dd2faSTor Egge bp->b_flags |= B_VALIDSUSPWRT; 2281dffce215SKirk McKusick if (devfdp->waitfor != MNT_WAIT) 2282df8bae1dSRodney W. Grimes bawrite(bp); 22838aef1712SMatthew Dillon else if ((error = bwrite(bp)) != 0) 2284dffce215SKirk McKusick devfdp->error = error; 2285dffce215SKirk McKusick return (0); 2286df8bae1dSRodney W. Grimes } 2287996c772fSJohn Dyson /* 2288dffce215SKirk McKusick * Writing the superblock itself. We need to do special checks for it. 2289996c772fSJohn Dyson */ 2290dffce215SKirk McKusick bp = devfdp->sbbp; 2291d79ff54bSChuck Silvers if (ffs_fsfail_cleanup(ump, devfdp->error)) 2292d79ff54bSChuck Silvers devfdp->error = 0; 2293dffce215SKirk McKusick if (devfdp->error != 0) { 2294dffce215SKirk McKusick brelse(bp); 2295dffce215SKirk McKusick return (devfdp->error); 22963ba649d7SJeff Roberson } 229731574422SKirk McKusick if (fs->fs_magic == FS_UFS1_MAGIC && fs->fs_sblockloc != SBLOCK_UFS1 && 2298e9838c11SJohn-Mark Gurney (fs->fs_old_flags & FS_FLAGS_UPDATED) == 0) { 2299b60ee81eSKirk McKusick printf("WARNING: %s: correcting fs_sblockloc from %jd to %d\n", 2300fa5d33e2SKirk McKusick fs->fs_fsmnt, fs->fs_sblockloc, SBLOCK_UFS1); 2301fa5d33e2SKirk McKusick fs->fs_sblockloc = SBLOCK_UFS1; 2302fa5d33e2SKirk McKusick } 230331574422SKirk McKusick if (fs->fs_magic == FS_UFS2_MAGIC && fs->fs_sblockloc != SBLOCK_UFS2 && 2304e9838c11SJohn-Mark Gurney (fs->fs_old_flags & FS_FLAGS_UPDATED) == 0) { 2305b60ee81eSKirk McKusick printf("WARNING: %s: correcting fs_sblockloc from %jd to %d\n", 2306fa5d33e2SKirk McKusick fs->fs_fsmnt, fs->fs_sblockloc, SBLOCK_UFS2); 2307fa5d33e2SKirk McKusick fs->fs_sblockloc = SBLOCK_UFS2; 2308fa5d33e2SKirk McKusick } 2309519e3c3bSKirk McKusick if (MOUNTEDSOFTDEP(ump->um_mountp)) 2310927a12aeSKirk McKusick softdep_setup_sbupdate(ump, (struct fs *)bp->b_data, bp); 2311996c772fSJohn Dyson bcopy((caddr_t)fs, bp->b_data, (u_int)fs->fs_sbsize); 23129454b4fdSKirk McKusick fs = (struct fs *)bp->b_data; 23139454b4fdSKirk McKusick ffs_oldfscompat_write(fs, ump); 231493440bbeSKirk McKusick fs->fs_si = NULL; 231534816cb9SKirk McKusick /* Recalculate the superblock hash */ 23169454b4fdSKirk McKusick fs->fs_ckhash = ffs_calc_sbhash(fs); 2317dffce215SKirk McKusick if (devfdp->suspended) 2318791dd2faSTor Egge bp->b_flags |= B_VALIDSUSPWRT; 2319dffce215SKirk McKusick if (devfdp->waitfor != MNT_WAIT) 2320996c772fSJohn Dyson bawrite(bp); 23218aef1712SMatthew Dillon else if ((error = bwrite(bp)) != 0) 2322dffce215SKirk McKusick devfdp->error = error; 2323dffce215SKirk McKusick return (devfdp->error); 2324df8bae1dSRodney W. Grimes } 2325d6fe88e4SPoul-Henning Kamp 2326d6fe88e4SPoul-Henning Kamp static int 2327d6fe88e4SPoul-Henning Kamp ffs_extattrctl(struct mount *mp, int cmd, struct vnode *filename_vp, 2328dfd233edSAttilio Rao int attrnamespace, const char *attrname) 2329d6fe88e4SPoul-Henning Kamp { 2330d6fe88e4SPoul-Henning Kamp 2331d6fe88e4SPoul-Henning Kamp #ifdef UFS_EXTATTR 2332d6fe88e4SPoul-Henning Kamp return (ufs_extattrctl(mp, cmd, filename_vp, attrnamespace, 2333dfd233edSAttilio Rao attrname)); 2334d6fe88e4SPoul-Henning Kamp #else 2335d6fe88e4SPoul-Henning Kamp return (vfs_stdextattrctl(mp, cmd, filename_vp, attrnamespace, 2336dfd233edSAttilio Rao attrname)); 2337d6fe88e4SPoul-Henning Kamp #endif 2338d6fe88e4SPoul-Henning Kamp } 2339975512a9SPoul-Henning Kamp 2340975512a9SPoul-Henning Kamp static void 2341975512a9SPoul-Henning Kamp ffs_ifree(struct ufsmount *ump, struct inode *ip) 2342975512a9SPoul-Henning Kamp { 2343975512a9SPoul-Henning Kamp 234436329289STim J. Robbins if (ump->um_fstype == UFS1 && ip->i_din1 != NULL) 2345aa4d7a8aSPoul-Henning Kamp uma_zfree(uma_ufs1, ip->i_din1); 234636329289STim J. Robbins else if (ip->i_din2 != NULL) 23478d721e87STim J. Robbins uma_zfree(uma_ufs2, ip->i_din2); 23489d5a594fSMateusz Guzik uma_zfree_smr(uma_inode, ip); 2349975512a9SPoul-Henning Kamp } 23506e77a041SPoul-Henning Kamp 2351dd19a799SPoul-Henning Kamp static int dobkgrdwrite = 1; 2352dd19a799SPoul-Henning Kamp SYSCTL_INT(_debug, OID_AUTO, dobkgrdwrite, CTLFLAG_RW, &dobkgrdwrite, 0, 2353dd19a799SPoul-Henning Kamp "Do background writes (honoring the BV_BKGRDWRITE flag)?"); 2354dd19a799SPoul-Henning Kamp 2355dd19a799SPoul-Henning Kamp /* 2356dd19a799SPoul-Henning Kamp * Complete a background write started from bwrite. 2357dd19a799SPoul-Henning Kamp */ 2358dd19a799SPoul-Henning Kamp static void 2359dd19a799SPoul-Henning Kamp ffs_backgroundwritedone(struct buf *bp) 2360dd19a799SPoul-Henning Kamp { 2361204ec66dSJeff Roberson struct bufobj *bufobj; 2362dd19a799SPoul-Henning Kamp struct buf *origbp; 2363dd19a799SPoul-Henning Kamp 2364d79ff54bSChuck Silvers #ifdef SOFTUPDATES 2365d79ff54bSChuck Silvers if (!LIST_EMPTY(&bp->b_dep) && (bp->b_ioflags & BIO_ERROR) != 0) 2366d79ff54bSChuck Silvers softdep_handle_error(bp); 2367d79ff54bSChuck Silvers #endif 2368d79ff54bSChuck Silvers 2369dd19a799SPoul-Henning Kamp /* 2370dd19a799SPoul-Henning Kamp * Find the original buffer that we are writing. 2371dd19a799SPoul-Henning Kamp */ 2372204ec66dSJeff Roberson bufobj = bp->b_bufobj; 2373204ec66dSJeff Roberson BO_LOCK(bufobj); 2374dd19a799SPoul-Henning Kamp if ((origbp = gbincore(bp->b_bufobj, bp->b_lblkno)) == NULL) 2375dd19a799SPoul-Henning Kamp panic("backgroundwritedone: lost buffer"); 2376b2c3df84SKonstantin Belousov 2377b2c3df84SKonstantin Belousov /* 2378b2c3df84SKonstantin Belousov * We should mark the cylinder group buffer origbp as 2379d79ff54bSChuck Silvers * dirty, to not lose the failed write. 2380b2c3df84SKonstantin Belousov */ 2381b2c3df84SKonstantin Belousov if ((bp->b_ioflags & BIO_ERROR) != 0) 2382b2c3df84SKonstantin Belousov origbp->b_vflags |= BV_BKGRDERR; 2383204ec66dSJeff Roberson BO_UNLOCK(bufobj); 2384dd19a799SPoul-Henning Kamp /* 2385dd19a799SPoul-Henning Kamp * Process dependencies then return any unfinished ones. 2386dd19a799SPoul-Henning Kamp */ 2387b2c3df84SKonstantin Belousov if (!LIST_EMPTY(&bp->b_dep) && (bp->b_ioflags & BIO_ERROR) == 0) 2388dd19a799SPoul-Henning Kamp buf_complete(bp); 2389dd19a799SPoul-Henning Kamp #ifdef SOFTUPDATES 239004533fc6SXin LI if (!LIST_EMPTY(&bp->b_dep)) 2391dd19a799SPoul-Henning Kamp softdep_move_dependencies(bp, origbp); 2392dd19a799SPoul-Henning Kamp #endif 2393dd19a799SPoul-Henning Kamp /* 2394204ec66dSJeff Roberson * This buffer is marked B_NOCACHE so when it is released 2395204ec66dSJeff Roberson * by biodone it will be tossed. 2396dd19a799SPoul-Henning Kamp */ 2397dd19a799SPoul-Henning Kamp bp->b_flags |= B_NOCACHE; 2398ec9c9e73SAlan Cox bp->b_flags &= ~B_CACHE; 2399377f88fbSKonstantin Belousov pbrelvp(bp); 2400b2c3df84SKonstantin Belousov 2401b2c3df84SKonstantin Belousov /* 2402b2c3df84SKonstantin Belousov * Prevent brelse() from trying to keep and re-dirtying bp on 2403b2c3df84SKonstantin Belousov * errors. It causes b_bufobj dereference in 2404b2c3df84SKonstantin Belousov * bdirty()/reassignbuf(), and b_bufobj was cleared in 2405b2c3df84SKonstantin Belousov * pbrelvp() above. 2406b2c3df84SKonstantin Belousov */ 2407b2c3df84SKonstantin Belousov if ((bp->b_ioflags & BIO_ERROR) != 0) 2408b2c3df84SKonstantin Belousov bp->b_flags |= B_INVAL; 2409dd19a799SPoul-Henning Kamp bufdone(bp); 2410204ec66dSJeff Roberson BO_LOCK(bufobj); 2411dd19a799SPoul-Henning Kamp /* 2412dd19a799SPoul-Henning Kamp * Clear the BV_BKGRDINPROG flag in the original buffer 2413dd19a799SPoul-Henning Kamp * and awaken it if it is waiting for the write to complete. 2414dd19a799SPoul-Henning Kamp * If BV_BKGRDINPROG is not set in the original buffer it must 2415dd19a799SPoul-Henning Kamp * have been released and re-instantiated - which is not legal. 2416dd19a799SPoul-Henning Kamp */ 2417dd19a799SPoul-Henning Kamp KASSERT((origbp->b_vflags & BV_BKGRDINPROG), 2418dd19a799SPoul-Henning Kamp ("backgroundwritedone: lost buffer2")); 2419dd19a799SPoul-Henning Kamp origbp->b_vflags &= ~BV_BKGRDINPROG; 2420dd19a799SPoul-Henning Kamp if (origbp->b_vflags & BV_BKGRDWAIT) { 2421dd19a799SPoul-Henning Kamp origbp->b_vflags &= ~BV_BKGRDWAIT; 2422dd19a799SPoul-Henning Kamp wakeup(&origbp->b_xflags); 2423dd19a799SPoul-Henning Kamp } 2424204ec66dSJeff Roberson BO_UNLOCK(bufobj); 2425dd19a799SPoul-Henning Kamp } 2426dd19a799SPoul-Henning Kamp 2427dd19a799SPoul-Henning Kamp /* 2428dd19a799SPoul-Henning Kamp * Write, release buffer on completion. (Done by iodone 2429dd19a799SPoul-Henning Kamp * if async). Do not bother writing anything if the buffer 2430dd19a799SPoul-Henning Kamp * is invalid. 2431dd19a799SPoul-Henning Kamp * 2432dd19a799SPoul-Henning Kamp * Note that we set B_CACHE here, indicating that buffer is 2433dd19a799SPoul-Henning Kamp * fully valid and thus cacheable. This is true even of NFS 2434dd19a799SPoul-Henning Kamp * now so we set it generally. This could be set either here 2435dd19a799SPoul-Henning Kamp * or in biodone() since the I/O is synchronous. We put it 2436dd19a799SPoul-Henning Kamp * here. 2437dd19a799SPoul-Henning Kamp */ 2438dd19a799SPoul-Henning Kamp static int 2439dd19a799SPoul-Henning Kamp ffs_bufwrite(struct buf *bp) 2440dd19a799SPoul-Henning Kamp { 2441dd19a799SPoul-Henning Kamp struct buf *newbp; 244247806d1bSKirk McKusick struct cg *cgp; 2443dd19a799SPoul-Henning Kamp 2444dd19a799SPoul-Henning Kamp CTR3(KTR_BUF, "bufwrite(%p) vp %p flags %X", bp, bp->b_vp, bp->b_flags); 2445dd19a799SPoul-Henning Kamp if (bp->b_flags & B_INVAL) { 2446dd19a799SPoul-Henning Kamp brelse(bp); 2447dd19a799SPoul-Henning Kamp return (0); 2448dd19a799SPoul-Henning Kamp } 2449dd19a799SPoul-Henning Kamp 2450d638e093SAttilio Rao if (!BUF_ISLOCKED(bp)) 2451dd19a799SPoul-Henning Kamp panic("bufwrite: buffer is not busy???"); 2452dd19a799SPoul-Henning Kamp /* 2453dd19a799SPoul-Henning Kamp * If a background write is already in progress, delay 2454dd19a799SPoul-Henning Kamp * writing this block if it is asynchronous. Otherwise 2455dd19a799SPoul-Henning Kamp * wait for the background write to complete. 2456dd19a799SPoul-Henning Kamp */ 2457dd19a799SPoul-Henning Kamp BO_LOCK(bp->b_bufobj); 2458dd19a799SPoul-Henning Kamp if (bp->b_vflags & BV_BKGRDINPROG) { 2459dd19a799SPoul-Henning Kamp if (bp->b_flags & B_ASYNC) { 2460dd19a799SPoul-Henning Kamp BO_UNLOCK(bp->b_bufobj); 2461dd19a799SPoul-Henning Kamp bdwrite(bp); 2462dd19a799SPoul-Henning Kamp return (0); 2463dd19a799SPoul-Henning Kamp } 2464dd19a799SPoul-Henning Kamp bp->b_vflags |= BV_BKGRDWAIT; 246522a72260SJeff Roberson msleep(&bp->b_xflags, BO_LOCKPTR(bp->b_bufobj), PRIBIO, 246622a72260SJeff Roberson "bwrbg", 0); 2467dd19a799SPoul-Henning Kamp if (bp->b_vflags & BV_BKGRDINPROG) 2468dd19a799SPoul-Henning Kamp panic("bufwrite: still writing"); 2469dd19a799SPoul-Henning Kamp } 2470b2c3df84SKonstantin Belousov bp->b_vflags &= ~BV_BKGRDERR; 2471dd19a799SPoul-Henning Kamp BO_UNLOCK(bp->b_bufobj); 2472dd19a799SPoul-Henning Kamp 2473dd19a799SPoul-Henning Kamp /* 2474dd19a799SPoul-Henning Kamp * If this buffer is marked for background writing and we 2475dd19a799SPoul-Henning Kamp * do not have to wait for it, make a copy and write the 2476dd19a799SPoul-Henning Kamp * copy so as to leave this buffer ready for further use. 2477dd19a799SPoul-Henning Kamp * 2478dd19a799SPoul-Henning Kamp * This optimization eats a lot of memory. If we have a page 2479dd19a799SPoul-Henning Kamp * or buffer shortfall we can't do it. 2480dd19a799SPoul-Henning Kamp */ 2481dd19a799SPoul-Henning Kamp if (dobkgrdwrite && (bp->b_xflags & BX_BKGRDWRITE) && 2482dd19a799SPoul-Henning Kamp (bp->b_flags & B_ASYNC) && 2483dd19a799SPoul-Henning Kamp !vm_page_count_severe() && 2484dd19a799SPoul-Henning Kamp !buf_dirty_count_severe()) { 2485dd19a799SPoul-Henning Kamp KASSERT(bp->b_iodone == NULL, 2486dd19a799SPoul-Henning Kamp ("bufwrite: needs chained iodone (%p)", bp->b_iodone)); 2487dd19a799SPoul-Henning Kamp 2488dd19a799SPoul-Henning Kamp /* get a new block */ 2489c1d8b5e8SKonstantin Belousov newbp = geteblk(bp->b_bufsize, GB_NOWAIT_BD); 2490c1d8b5e8SKonstantin Belousov if (newbp == NULL) 2491c1d8b5e8SKonstantin Belousov goto normal_write; 2492dd19a799SPoul-Henning Kamp 2493fade8dd7SJeff Roberson KASSERT(buf_mapped(bp), ("Unmapped cg")); 2494dd19a799SPoul-Henning Kamp memcpy(newbp->b_data, bp->b_data, bp->b_bufsize); 2495dd19a799SPoul-Henning Kamp BO_LOCK(bp->b_bufobj); 2496dd19a799SPoul-Henning Kamp bp->b_vflags |= BV_BKGRDINPROG; 2497dd19a799SPoul-Henning Kamp BO_UNLOCK(bp->b_bufobj); 249875e3597aSKirk McKusick newbp->b_xflags |= 249975e3597aSKirk McKusick (bp->b_xflags & BX_FSPRIV) | BX_BKGRDMARKER; 250026089666SJeff Roberson newbp->b_lblkno = bp->b_lblkno; 2501dd19a799SPoul-Henning Kamp newbp->b_blkno = bp->b_blkno; 2502dd19a799SPoul-Henning Kamp newbp->b_offset = bp->b_offset; 2503dd19a799SPoul-Henning Kamp newbp->b_iodone = ffs_backgroundwritedone; 2504dd19a799SPoul-Henning Kamp newbp->b_flags |= B_ASYNC; 2505dd19a799SPoul-Henning Kamp newbp->b_flags &= ~B_INVAL; 250626089666SJeff Roberson pbgetvp(bp->b_vp, newbp); 2507dd19a799SPoul-Henning Kamp 2508dd19a799SPoul-Henning Kamp #ifdef SOFTUPDATES 2509113db2ddSJeff Roberson /* 2510113db2ddSJeff Roberson * Move over the dependencies. If there are rollbacks, 2511113db2ddSJeff Roberson * leave the parent buffer dirtied as it will need to 2512113db2ddSJeff Roberson * be written again. 2513113db2ddSJeff Roberson */ 2514113db2ddSJeff Roberson if (LIST_EMPTY(&bp->b_dep) || 2515113db2ddSJeff Roberson softdep_move_dependencies(bp, newbp) == 0) 2516113db2ddSJeff Roberson bundirty(bp); 2517113db2ddSJeff Roberson #else 2518113db2ddSJeff Roberson bundirty(bp); 2519dd19a799SPoul-Henning Kamp #endif 2520dd19a799SPoul-Henning Kamp 2521dd19a799SPoul-Henning Kamp /* 252226089666SJeff Roberson * Initiate write on the copy, release the original. The 252326089666SJeff Roberson * BKGRDINPROG flag prevents it from going away until 252447806d1bSKirk McKusick * the background write completes. We have to recalculate 252547806d1bSKirk McKusick * its check hash in case the buffer gets freed and then 252647806d1bSKirk McKusick * reconstituted from the buffer cache during a later read. 2527dd19a799SPoul-Henning Kamp */ 252847806d1bSKirk McKusick if ((bp->b_xflags & BX_CYLGRP) != 0) { 252947806d1bSKirk McKusick cgp = (struct cg *)bp->b_data; 253047806d1bSKirk McKusick cgp->cg_ckhash = 0; 253147806d1bSKirk McKusick cgp->cg_ckhash = 253247806d1bSKirk McKusick calculate_crc32c(~0L, bp->b_data, bp->b_bcount); 253347806d1bSKirk McKusick } 2534dd19a799SPoul-Henning Kamp bqrelse(bp); 2535dd19a799SPoul-Henning Kamp bp = newbp; 2536113db2ddSJeff Roberson } else 2537113db2ddSJeff Roberson /* Mark the buffer clean */ 2538113db2ddSJeff Roberson bundirty(bp); 2539113db2ddSJeff Roberson 2540dd19a799SPoul-Henning Kamp /* Let the normal bufwrite do the rest for us */ 2541c1d8b5e8SKonstantin Belousov normal_write: 254247806d1bSKirk McKusick /* 254347806d1bSKirk McKusick * If we are writing a cylinder group, update its time. 254447806d1bSKirk McKusick */ 254547806d1bSKirk McKusick if ((bp->b_xflags & BX_CYLGRP) != 0) { 254647806d1bSKirk McKusick cgp = (struct cg *)bp->b_data; 254747806d1bSKirk McKusick cgp->cg_old_time = cgp->cg_time = time_second; 254847806d1bSKirk McKusick } 25499248a827STor Egge return (bufwrite(bp)); 2550dd19a799SPoul-Henning Kamp } 2551dd19a799SPoul-Henning Kamp 25528dd56505SPoul-Henning Kamp static void 25536e77a041SPoul-Henning Kamp ffs_geom_strategy(struct bufobj *bo, struct buf *bp) 25546e77a041SPoul-Henning Kamp { 2555153910e0SJeff Roberson struct vnode *vp; 25567de3839dSTor Egge struct buf *tbp; 255775e3597aSKirk McKusick int error, nocopy; 25586e77a041SPoul-Henning Kamp 2559f15ccf88SChuck Silvers /* 2560f15ccf88SChuck Silvers * This is the bufobj strategy for the private VCHR vnodes 2561f15ccf88SChuck Silvers * used by FFS to access the underlying storage device. 2562f15ccf88SChuck Silvers * We override the default bufobj strategy and thus bypass 2563f15ccf88SChuck Silvers * VOP_STRATEGY() for these vnodes. 2564f15ccf88SChuck Silvers */ 25658660b707SMateusz Guzik vp = bo2vnode(bo); 2566f15ccf88SChuck Silvers KASSERT(bp->b_vp == NULL || bp->b_vp->v_type != VCHR || 2567f15ccf88SChuck Silvers bp->b_vp->v_rdev == NULL || 2568f15ccf88SChuck Silvers bp->b_vp->v_rdev->si_mountpt == NULL || 2569f15ccf88SChuck Silvers VFSTOUFS(bp->b_vp->v_rdev->si_mountpt) == NULL || 2570f15ccf88SChuck Silvers vp == VFSTOUFS(bp->b_vp->v_rdev->si_mountpt)->um_devvp, 2571f15ccf88SChuck Silvers ("ffs_geom_strategy() with wrong vp")); 2572153910e0SJeff Roberson if (bp->b_iocmd == BIO_WRITE) { 2573153910e0SJeff Roberson if ((bp->b_flags & B_VALIDSUSPWRT) == 0 && 2574153910e0SJeff Roberson bp->b_vp != NULL && bp->b_vp->v_mount != NULL && 2575153910e0SJeff Roberson (bp->b_vp->v_mount->mnt_kern_flag & MNTK_SUSPENDED) != 0) 2576153910e0SJeff Roberson panic("ffs_geom_strategy: bad I/O"); 2577113db2ddSJeff Roberson nocopy = bp->b_flags & B_NOCOPY; 2578113db2ddSJeff Roberson bp->b_flags &= ~(B_VALIDSUSPWRT | B_NOCOPY); 2579113db2ddSJeff Roberson if ((vp->v_vflag & VV_COPYONWRITE) && nocopy == 0 && 25807de3839dSTor Egge vp->v_rdev->si_snapdata != NULL) { 25817de3839dSTor Egge if ((bp->b_flags & B_CLUSTER) != 0) { 2582868bb88fSTor Egge runningbufwakeup(bp); 25837de3839dSTor Egge TAILQ_FOREACH(tbp, &bp->b_cluster.cluster_head, 25847de3839dSTor Egge b_cluster.cluster_entry) { 25857de3839dSTor Egge error = ffs_copyonwrite(vp, tbp); 25867de3839dSTor Egge if (error != 0 && 2587153910e0SJeff Roberson error != EOPNOTSUPP) { 2588153910e0SJeff Roberson bp->b_error = error; 2589153910e0SJeff Roberson bp->b_ioflags |= BIO_ERROR; 2590e1ef4c29SKonstantin Belousov bp->b_flags &= ~B_BARRIER; 2591153910e0SJeff Roberson bufdone(bp); 2592153910e0SJeff Roberson return; 2593153910e0SJeff Roberson } 2594153910e0SJeff Roberson } 2595868bb88fSTor Egge bp->b_runningbufspace = bp->b_bufsize; 25965bd65606SJohn Baldwin atomic_add_long(&runningbufspace, 2597868bb88fSTor Egge bp->b_runningbufspace); 25987de3839dSTor Egge } else { 25997de3839dSTor Egge error = ffs_copyonwrite(vp, bp); 26007de3839dSTor Egge if (error != 0 && error != EOPNOTSUPP) { 26017de3839dSTor Egge bp->b_error = error; 26027de3839dSTor Egge bp->b_ioflags |= BIO_ERROR; 2603e1ef4c29SKonstantin Belousov bp->b_flags &= ~B_BARRIER; 26047de3839dSTor Egge bufdone(bp); 26057de3839dSTor Egge return; 26067de3839dSTor Egge } 26077de3839dSTor Egge } 26087de3839dSTor Egge } 26097de3839dSTor Egge #ifdef SOFTUPDATES 26107de3839dSTor Egge if ((bp->b_flags & B_CLUSTER) != 0) { 26117de3839dSTor Egge TAILQ_FOREACH(tbp, &bp->b_cluster.cluster_head, 26127de3839dSTor Egge b_cluster.cluster_entry) { 261304533fc6SXin LI if (!LIST_EMPTY(&tbp->b_dep)) 26147de3839dSTor Egge buf_start(tbp); 26157de3839dSTor Egge } 26167de3839dSTor Egge } else { 261704533fc6SXin LI if (!LIST_EMPTY(&bp->b_dep)) 26187de3839dSTor Egge buf_start(bp); 26197de3839dSTor Egge } 26207de3839dSTor Egge 26217de3839dSTor Egge #endif 262275e3597aSKirk McKusick /* 262375e3597aSKirk McKusick * Check for metadata that needs check-hashes and update them. 262475e3597aSKirk McKusick */ 262575e3597aSKirk McKusick switch (bp->b_xflags & BX_FSPRIV) { 262675e3597aSKirk McKusick case BX_CYLGRP: 262775e3597aSKirk McKusick ((struct cg *)bp->b_data)->cg_ckhash = 0; 262875e3597aSKirk McKusick ((struct cg *)bp->b_data)->cg_ckhash = 262975e3597aSKirk McKusick calculate_crc32c(~0L, bp->b_data, bp->b_bcount); 263075e3597aSKirk McKusick break; 263175e3597aSKirk McKusick 263275e3597aSKirk McKusick case BX_SUPERBLOCK: 263375e3597aSKirk McKusick case BX_INODE: 263475e3597aSKirk McKusick case BX_INDIR: 263575e3597aSKirk McKusick case BX_DIR: 263675e3597aSKirk McKusick printf("Check-hash write is unimplemented!!!\n"); 263775e3597aSKirk McKusick break; 263875e3597aSKirk McKusick 263975e3597aSKirk McKusick case 0: 264075e3597aSKirk McKusick break; 264175e3597aSKirk McKusick 264275e3597aSKirk McKusick default: 264375e3597aSKirk McKusick printf("multiple buffer types 0x%b\n", 264475e3597aSKirk McKusick (u_int)(bp->b_xflags & BX_FSPRIV), 264575e3597aSKirk McKusick PRINT_UFS_BUF_XFLAGS); 264675e3597aSKirk McKusick break; 264775e3597aSKirk McKusick } 26487de3839dSTor Egge } 2649d79ff54bSChuck Silvers if (bp->b_iocmd != BIO_READ && ffs_enxio_enable) 2650d79ff54bSChuck Silvers bp->b_xflags |= BX_CVTENXIO; 265143920011SPoul-Henning Kamp g_vfs_strategy(bo, bp); 26526e77a041SPoul-Henning Kamp } 265352dfc8d7SKonstantin Belousov 26541848286aSEdward Tomasz Napierala int 26551848286aSEdward Tomasz Napierala ffs_own_mount(const struct mount *mp) 26561848286aSEdward Tomasz Napierala { 26571848286aSEdward Tomasz Napierala 26581848286aSEdward Tomasz Napierala if (mp->mnt_op == &ufs_vfsops) 26591848286aSEdward Tomasz Napierala return (1); 26601848286aSEdward Tomasz Napierala return (0); 26611848286aSEdward Tomasz Napierala } 26621848286aSEdward Tomasz Napierala 266352dfc8d7SKonstantin Belousov #ifdef DDB 2664cf058082SBrooks Davis #ifdef SOFTUPDATES 266552dfc8d7SKonstantin Belousov 2666519e3c3bSKirk McKusick /* defined in ffs_softdep.c */ 2667519e3c3bSKirk McKusick extern void db_print_ffs(struct ufsmount *ump); 266852dfc8d7SKonstantin Belousov 266952dfc8d7SKonstantin Belousov DB_SHOW_COMMAND(ffs, db_show_ffs) 267052dfc8d7SKonstantin Belousov { 267152dfc8d7SKonstantin Belousov struct mount *mp; 267252dfc8d7SKonstantin Belousov struct ufsmount *ump; 267352dfc8d7SKonstantin Belousov 267452dfc8d7SKonstantin Belousov if (have_addr) { 267552dfc8d7SKonstantin Belousov ump = VFSTOUFS((struct mount *)addr); 267652dfc8d7SKonstantin Belousov db_print_ffs(ump); 267752dfc8d7SKonstantin Belousov return; 267852dfc8d7SKonstantin Belousov } 267952dfc8d7SKonstantin Belousov 268052dfc8d7SKonstantin Belousov TAILQ_FOREACH(mp, &mountlist, mnt_list) { 268152dfc8d7SKonstantin Belousov if (!strcmp(mp->mnt_stat.f_fstypename, ufs_vfsconf.vfc_name)) 268252dfc8d7SKonstantin Belousov db_print_ffs(VFSTOUFS(mp)); 268352dfc8d7SKonstantin Belousov } 268452dfc8d7SKonstantin Belousov } 268552dfc8d7SKonstantin Belousov 2686cf058082SBrooks Davis #endif /* SOFTUPDATES */ 268752dfc8d7SKonstantin Belousov #endif /* DDB */ 2688