160727d8bSWarner Losh /*- 251369649SPedro F. Giffuni * SPDX-License-Identifier: BSD-3-Clause 351369649SPedro F. Giffuni * 4df8bae1dSRodney W. Grimes * Copyright (c) 1989, 1991, 1993, 1994 5df8bae1dSRodney W. Grimes * The Regents of the University of California. All rights reserved. 6df8bae1dSRodney W. Grimes * 7df8bae1dSRodney W. Grimes * Redistribution and use in source and binary forms, with or without 8df8bae1dSRodney W. Grimes * modification, are permitted provided that the following conditions 9df8bae1dSRodney W. Grimes * are met: 10df8bae1dSRodney W. Grimes * 1. Redistributions of source code must retain the above copyright 11df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer. 12df8bae1dSRodney W. Grimes * 2. Redistributions in binary form must reproduce the above copyright 13df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer in the 14df8bae1dSRodney W. Grimes * documentation and/or other materials provided with the distribution. 15fbbd9655SWarner Losh * 3. Neither the name of the University nor the names of its contributors 16df8bae1dSRodney W. Grimes * may be used to endorse or promote products derived from this software 17df8bae1dSRodney W. Grimes * without specific prior written permission. 18df8bae1dSRodney W. Grimes * 19df8bae1dSRodney W. Grimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 20df8bae1dSRodney W. Grimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 21df8bae1dSRodney W. Grimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 22df8bae1dSRodney W. Grimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 23df8bae1dSRodney W. Grimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 24df8bae1dSRodney W. Grimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 25df8bae1dSRodney W. 
Grimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 26df8bae1dSRodney W. Grimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 27df8bae1dSRodney W. Grimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 28df8bae1dSRodney W. Grimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 29df8bae1dSRodney W. Grimes * SUCH DAMAGE. 30df8bae1dSRodney W. Grimes */ 31df8bae1dSRodney W. Grimes 32f4636c59SDavid E. O'Brien #include <sys/cdefs.h> 3301733a9bSGarrett Wollman #include "opt_quota.h" 34516081f2SRobert Watson #include "opt_ufs.h" 356e77a041SPoul-Henning Kamp #include "opt_ffs.h" 3652dfc8d7SKonstantin Belousov #include "opt_ddb.h" 3701733a9bSGarrett Wollman 38df8bae1dSRodney W. Grimes #include <sys/param.h> 39f89d2072SXin LI #include <sys/gsb_crc32.h> 40df8bae1dSRodney W. Grimes #include <sys/systm.h> 41df8bae1dSRodney W. Grimes #include <sys/namei.h> 42acd3428bSRobert Watson #include <sys/priv.h> 43df8bae1dSRodney W. Grimes #include <sys/proc.h> 44c79dff0fSKonstantin Belousov #include <sys/taskqueue.h> 45df8bae1dSRodney W. Grimes #include <sys/kernel.h> 46daec9284SConrad Meyer #include <sys/ktr.h> 47df8bae1dSRodney W. Grimes #include <sys/vnode.h> 48df8bae1dSRodney W. Grimes #include <sys/mount.h> 499626b608SPoul-Henning Kamp #include <sys/bio.h> 50df8bae1dSRodney W. Grimes #include <sys/buf.h> 5181bca6ddSKATO Takenori #include <sys/conf.h> 523ac4d1efSBruce Evans #include <sys/fcntl.h> 531848286aSEdward Tomasz Napierala #include <sys/ioccom.h> 54df8bae1dSRodney W. 
Grimes #include <sys/malloc.h> 551b367556SJason Evans #include <sys/mutex.h> 5622a72260SJeff Roberson #include <sys/rwlock.h> 57d79ff54bSChuck Silvers #include <sys/sysctl.h> 589ed01c32SGleb Smirnoff #include <sys/vmmeter.h> 59a18b1f1dSJason Evans 60aed55708SRobert Watson #include <security/mac/mac_framework.h> 61aed55708SRobert Watson 62a96da1c3SConrad Meyer #include <ufs/ufs/dir.h> 63a64ed089SRobert Watson #include <ufs/ufs/extattr.h> 641a60c7fcSPawel Jakub Dawidek #include <ufs/ufs/gjournal.h> 65df8bae1dSRodney W. Grimes #include <ufs/ufs/quota.h> 66df8bae1dSRodney W. Grimes #include <ufs/ufs/ufsmount.h> 67df8bae1dSRodney W. Grimes #include <ufs/ufs/inode.h> 68df8bae1dSRodney W. Grimes #include <ufs/ufs/ufs_extern.h> 69df8bae1dSRodney W. Grimes 70df8bae1dSRodney W. Grimes #include <ufs/ffs/fs.h> 71df8bae1dSRodney W. Grimes #include <ufs/ffs/ffs_extern.h> 72df8bae1dSRodney W. Grimes 73f6b04d2bSDavid Greenman #include <vm/vm.h> 74aa4d7a8aSPoul-Henning Kamp #include <vm/uma.h> 75f6b04d2bSDavid Greenman #include <vm/vm_page.h> 76f6b04d2bSDavid Greenman 7743920011SPoul-Henning Kamp #include <geom/geom.h> 7843920011SPoul-Henning Kamp #include <geom/geom_vfs.h> 7943920011SPoul-Henning Kamp 8052dfc8d7SKonstantin Belousov #include <ddb/ddb.h> 8152dfc8d7SKonstantin Belousov 82adf41577SPoul-Henning Kamp static uma_zone_t uma_inode, uma_ufs1, uma_ufs2; 839d5a594fSMateusz Guzik VFS_SMR_DECLARE; 8455166637SPoul-Henning Kamp 85975512a9SPoul-Henning Kamp static int ffs_mountfs(struct vnode *, struct mount *, struct thread *); 861c85e6a3SKirk McKusick static void ffs_oldfscompat_read(struct fs *, struct ufsmount *, 871c85e6a3SKirk McKusick ufs2_daddr_t); 88975512a9SPoul-Henning Kamp static void ffs_ifree(struct ufsmount *ump, struct inode *ip); 89a988a5c6SKonstantin Belousov static int ffs_sync_lazy(struct mount *mp); 90dffce215SKirk McKusick static int ffs_use_bread(void *devfd, off_t loc, void **bufp, int size); 91dffce215SKirk McKusick static int ffs_use_bwrite(void *devfd, 
off_t loc, void *buf, int size); 92a988a5c6SKonstantin Belousov 939bf1a756SPoul-Henning Kamp static vfs_init_t ffs_init; 949bf1a756SPoul-Henning Kamp static vfs_uninit_t ffs_uninit; 95d6fe88e4SPoul-Henning Kamp static vfs_extattrctl_t ffs_extattrctl; 9620a92a18SPoul-Henning Kamp static vfs_cmount_t ffs_cmount; 97adf41577SPoul-Henning Kamp static vfs_unmount_t ffs_unmount; 9820a92a18SPoul-Henning Kamp static vfs_mount_t ffs_mount; 99adf41577SPoul-Henning Kamp static vfs_statfs_t ffs_statfs; 100adf41577SPoul-Henning Kamp static vfs_fhtovp_t ffs_fhtovp; 101adf41577SPoul-Henning Kamp static vfs_sync_t ffs_sync; 102df8bae1dSRodney W. Grimes 103303b270bSEivind Eklund static struct vfsops ufs_vfsops = { 1047652131bSPoul-Henning Kamp .vfs_extattrctl = ffs_extattrctl, 1057652131bSPoul-Henning Kamp .vfs_fhtovp = ffs_fhtovp, 1067652131bSPoul-Henning Kamp .vfs_init = ffs_init, 10720a92a18SPoul-Henning Kamp .vfs_mount = ffs_mount, 10820a92a18SPoul-Henning Kamp .vfs_cmount = ffs_cmount, 1097652131bSPoul-Henning Kamp .vfs_quotactl = ufs_quotactl, 110e35cd9e3SMateusz Guzik .vfs_root = vfs_cache_root, 111e35cd9e3SMateusz Guzik .vfs_cachedroot = ufs_root, 1127652131bSPoul-Henning Kamp .vfs_statfs = ffs_statfs, 1137652131bSPoul-Henning Kamp .vfs_sync = ffs_sync, 1147652131bSPoul-Henning Kamp .vfs_uninit = ffs_uninit, 1157652131bSPoul-Henning Kamp .vfs_unmount = ffs_unmount, 1167652131bSPoul-Henning Kamp .vfs_vget = ffs_vget, 1172814d5baSKonstantin Belousov .vfs_susp_clean = process_deferred_inactive, 118df8bae1dSRodney W. Grimes }; 119df8bae1dSRodney W. 
Grimes 120*1cd455f3SRick Macklem VFS_SET(ufs_vfsops, ufs, VFCF_FILEREVINC); 1215fe6d2beSPawel Jakub Dawidek MODULE_VERSION(ufs, 1); 122c901836cSGarrett Wollman 1236e77a041SPoul-Henning Kamp static b_strategy_t ffs_geom_strategy; 124dd19a799SPoul-Henning Kamp static b_write_t ffs_bufwrite; 1256e77a041SPoul-Henning Kamp 1266e77a041SPoul-Henning Kamp static struct buf_ops ffs_ops = { 1276e77a041SPoul-Henning Kamp .bop_name = "FFS", 128dd19a799SPoul-Henning Kamp .bop_write = ffs_bufwrite, 1296e77a041SPoul-Henning Kamp .bop_strategy = ffs_geom_strategy, 1306ef8480aSPoul-Henning Kamp .bop_sync = bufsync, 1312cc7d26fSKonstantin Belousov #ifdef NO_FFS_SNAPSHOT 1322cc7d26fSKonstantin Belousov .bop_bdflush = bufbdflush, 1332cc7d26fSKonstantin Belousov #else 1342cc7d26fSKonstantin Belousov .bop_bdflush = ffs_bdflush, 1352cc7d26fSKonstantin Belousov #endif 1366e77a041SPoul-Henning Kamp }; 1376e77a041SPoul-Henning Kamp 1380b962648SAndriy Gapon /* 1390b962648SAndriy Gapon * Note that userquota and groupquota options are not currently used 1400b962648SAndriy Gapon * by UFS/FFS code and generally mount(8) does not pass those options 1410b962648SAndriy Gapon * from userland, but they can be passed by loader(8) via 1420b962648SAndriy Gapon * vfs.root.mountfrom.options. 
1430b962648SAndriy Gapon */ 144d952ba1bSJohn Baldwin static const char *ffs_opts[] = { "acls", "async", "noatime", "noclusterr", 1450b962648SAndriy Gapon "noclusterw", "noexec", "export", "force", "from", "groupquota", 1469acea164SRobert Wing "multilabel", "nfsv4acls", "snapshot", "nosuid", "suiddir", 147daba4da8SKirk McKusick "nosymfollow", "sync", "union", "userquota", "untrusted", NULL }; 14820a92a18SPoul-Henning Kamp 149d79ff54bSChuck Silvers static int ffs_enxio_enable = 1; 150d79ff54bSChuck Silvers SYSCTL_DECL(_vfs_ffs); 151d79ff54bSChuck Silvers SYSCTL_INT(_vfs_ffs, OID_AUTO, enxio_enable, CTLFLAG_RWTUN, 152d79ff54bSChuck Silvers &ffs_enxio_enable, 0, 153d79ff54bSChuck Silvers "enable mapping of other disk I/O errors to ENXIO"); 154d79ff54bSChuck Silvers 155d9a8abf6SChuck Silvers /* 156d9a8abf6SChuck Silvers * Return buffer with the contents of block "offset" from the beginning of 157d9a8abf6SChuck Silvers * directory "ip". If "res" is non-zero, fill it in with a pointer to the 158d9a8abf6SChuck Silvers * remaining space in the directory. 
159d9a8abf6SChuck Silvers */ 160d9a8abf6SChuck Silvers static int 161d9a8abf6SChuck Silvers ffs_blkatoff(struct vnode *vp, off_t offset, char **res, struct buf **bpp) 162d9a8abf6SChuck Silvers { 163d9a8abf6SChuck Silvers struct inode *ip; 164d9a8abf6SChuck Silvers struct fs *fs; 165d9a8abf6SChuck Silvers struct buf *bp; 166d9a8abf6SChuck Silvers ufs_lbn_t lbn; 167d9a8abf6SChuck Silvers int bsize, error; 168d9a8abf6SChuck Silvers 169d9a8abf6SChuck Silvers ip = VTOI(vp); 170d9a8abf6SChuck Silvers fs = ITOFS(ip); 171d9a8abf6SChuck Silvers lbn = lblkno(fs, offset); 172d9a8abf6SChuck Silvers bsize = blksize(fs, ip, lbn); 173d9a8abf6SChuck Silvers 174d9a8abf6SChuck Silvers *bpp = NULL; 175d9a8abf6SChuck Silvers error = bread(vp, lbn, bsize, NOCRED, &bp); 176d9a8abf6SChuck Silvers if (error) { 177d9a8abf6SChuck Silvers return (error); 178d9a8abf6SChuck Silvers } 179d9a8abf6SChuck Silvers if (res) 180d9a8abf6SChuck Silvers *res = (char *)bp->b_data + blkoff(fs, offset); 181d9a8abf6SChuck Silvers *bpp = bp; 182d9a8abf6SChuck Silvers return (0); 183d9a8abf6SChuck Silvers } 184d9a8abf6SChuck Silvers 185d9a8abf6SChuck Silvers /* 186d9a8abf6SChuck Silvers * Load up the contents of an inode and copy the appropriate pieces 187d9a8abf6SChuck Silvers * to the incore copy. 
188d9a8abf6SChuck Silvers */ 189d9a8abf6SChuck Silvers static int 190d9a8abf6SChuck Silvers ffs_load_inode(struct buf *bp, struct inode *ip, struct fs *fs, ino_t ino) 191d9a8abf6SChuck Silvers { 192d9a8abf6SChuck Silvers struct ufs1_dinode *dip1; 193d9a8abf6SChuck Silvers struct ufs2_dinode *dip2; 194d9a8abf6SChuck Silvers int error; 195d9a8abf6SChuck Silvers 196d9a8abf6SChuck Silvers if (I_IS_UFS1(ip)) { 197d9a8abf6SChuck Silvers dip1 = ip->i_din1; 198d9a8abf6SChuck Silvers *dip1 = 199d9a8abf6SChuck Silvers *((struct ufs1_dinode *)bp->b_data + ino_to_fsbo(fs, ino)); 200d9a8abf6SChuck Silvers ip->i_mode = dip1->di_mode; 201d9a8abf6SChuck Silvers ip->i_nlink = dip1->di_nlink; 202d9a8abf6SChuck Silvers ip->i_effnlink = dip1->di_nlink; 203d9a8abf6SChuck Silvers ip->i_size = dip1->di_size; 204d9a8abf6SChuck Silvers ip->i_flags = dip1->di_flags; 205d9a8abf6SChuck Silvers ip->i_gen = dip1->di_gen; 206d9a8abf6SChuck Silvers ip->i_uid = dip1->di_uid; 207d9a8abf6SChuck Silvers ip->i_gid = dip1->di_gid; 208d9a8abf6SChuck Silvers return (0); 209d9a8abf6SChuck Silvers } 210d9a8abf6SChuck Silvers dip2 = ((struct ufs2_dinode *)bp->b_data + ino_to_fsbo(fs, ino)); 211d9a8abf6SChuck Silvers if ((error = ffs_verify_dinode_ckhash(fs, dip2)) != 0 && 212d9a8abf6SChuck Silvers !ffs_fsfail_cleanup(ITOUMP(ip), error)) { 213d9a8abf6SChuck Silvers printf("%s: inode %jd: check-hash failed\n", fs->fs_fsmnt, 214d9a8abf6SChuck Silvers (intmax_t)ino); 215d9a8abf6SChuck Silvers return (error); 216d9a8abf6SChuck Silvers } 217d9a8abf6SChuck Silvers *ip->i_din2 = *dip2; 218d9a8abf6SChuck Silvers dip2 = ip->i_din2; 219d9a8abf6SChuck Silvers ip->i_mode = dip2->di_mode; 220d9a8abf6SChuck Silvers ip->i_nlink = dip2->di_nlink; 221d9a8abf6SChuck Silvers ip->i_effnlink = dip2->di_nlink; 222d9a8abf6SChuck Silvers ip->i_size = dip2->di_size; 223d9a8abf6SChuck Silvers ip->i_flags = dip2->di_flags; 224d9a8abf6SChuck Silvers ip->i_gen = dip2->di_gen; 225d9a8abf6SChuck Silvers ip->i_uid = dip2->di_uid; 
226d9a8abf6SChuck Silvers ip->i_gid = dip2->di_gid; 227d9a8abf6SChuck Silvers return (0); 228d9a8abf6SChuck Silvers } 229d9a8abf6SChuck Silvers 230d9a8abf6SChuck Silvers /* 231d9a8abf6SChuck Silvers * Verify that a filesystem block number is a valid data block. 232d9a8abf6SChuck Silvers * This routine is only called on untrusted filesystems. 233d9a8abf6SChuck Silvers */ 234d9a8abf6SChuck Silvers static int 235d9a8abf6SChuck Silvers ffs_check_blkno(struct mount *mp, ino_t inum, ufs2_daddr_t daddr, int blksize) 236d9a8abf6SChuck Silvers { 237d9a8abf6SChuck Silvers struct fs *fs; 238d9a8abf6SChuck Silvers struct ufsmount *ump; 239d9a8abf6SChuck Silvers ufs2_daddr_t end_daddr; 240d9a8abf6SChuck Silvers int cg, havemtx; 241d9a8abf6SChuck Silvers 242d9a8abf6SChuck Silvers KASSERT((mp->mnt_flag & MNT_UNTRUSTED) != 0, 243d9a8abf6SChuck Silvers ("ffs_check_blkno called on a trusted file system")); 244d9a8abf6SChuck Silvers ump = VFSTOUFS(mp); 245d9a8abf6SChuck Silvers fs = ump->um_fs; 246d9a8abf6SChuck Silvers cg = dtog(fs, daddr); 247d9a8abf6SChuck Silvers end_daddr = daddr + numfrags(fs, blksize); 248d9a8abf6SChuck Silvers /* 249d9a8abf6SChuck Silvers * Verify that the block number is a valid data block. Also check 250d9a8abf6SChuck Silvers * that it does not point to an inode block or a superblock. Accept 251d9a8abf6SChuck Silvers * blocks that are unalloacted (0) or part of snapshot metadata 252d9a8abf6SChuck Silvers * (BLK_NOCOPY or BLK_SNAP). 253d9a8abf6SChuck Silvers * 254d9a8abf6SChuck Silvers * Thus, the block must be in a valid range for the filesystem and 255d9a8abf6SChuck Silvers * either in the space before a backup superblock (except the first 256d9a8abf6SChuck Silvers * cylinder group where that space is used by the bootstrap code) or 257d9a8abf6SChuck Silvers * after the inode blocks and before the end of the cylinder group. 
258d9a8abf6SChuck Silvers */ 259d9a8abf6SChuck Silvers if ((uint64_t)daddr <= BLK_SNAP || 260d9a8abf6SChuck Silvers ((uint64_t)end_daddr <= fs->fs_size && 261d9a8abf6SChuck Silvers ((cg > 0 && end_daddr <= cgsblock(fs, cg)) || 262d9a8abf6SChuck Silvers (daddr >= cgdmin(fs, cg) && 263d9a8abf6SChuck Silvers end_daddr <= cgbase(fs, cg) + fs->fs_fpg)))) 264d9a8abf6SChuck Silvers return (0); 265d9a8abf6SChuck Silvers if ((havemtx = mtx_owned(UFS_MTX(ump))) == 0) 266d9a8abf6SChuck Silvers UFS_LOCK(ump); 267d9a8abf6SChuck Silvers if (ppsratecheck(&ump->um_last_integritymsg, 268d9a8abf6SChuck Silvers &ump->um_secs_integritymsg, 1)) { 269d9a8abf6SChuck Silvers UFS_UNLOCK(ump); 270d9a8abf6SChuck Silvers uprintf("\n%s: inode %jd, out-of-range indirect block " 271d9a8abf6SChuck Silvers "number %jd\n", mp->mnt_stat.f_mntonname, inum, daddr); 272d9a8abf6SChuck Silvers if (havemtx) 273d9a8abf6SChuck Silvers UFS_LOCK(ump); 274d9a8abf6SChuck Silvers } else if (!havemtx) 275d9a8abf6SChuck Silvers UFS_UNLOCK(ump); 276d9a8abf6SChuck Silvers return (EINTEGRITY); 277d9a8abf6SChuck Silvers } 278d9a8abf6SChuck Silvers 279d9a8abf6SChuck Silvers /* 280211ec9b7SJason A. Harmening * On first ENXIO error, initiate an asynchronous forcible unmount. 281d9a8abf6SChuck Silvers * Used to unmount filesystems whose underlying media has gone away. 282d9a8abf6SChuck Silvers * 283d9a8abf6SChuck Silvers * Return true if a cleanup is in progress. 
284d9a8abf6SChuck Silvers */ 285d9a8abf6SChuck Silvers int 286d9a8abf6SChuck Silvers ffs_fsfail_cleanup(struct ufsmount *ump, int error) 287d9a8abf6SChuck Silvers { 288d9a8abf6SChuck Silvers int retval; 289d9a8abf6SChuck Silvers 290d9a8abf6SChuck Silvers UFS_LOCK(ump); 291d9a8abf6SChuck Silvers retval = ffs_fsfail_cleanup_locked(ump, error); 292d9a8abf6SChuck Silvers UFS_UNLOCK(ump); 293d9a8abf6SChuck Silvers return (retval); 294d9a8abf6SChuck Silvers } 295d9a8abf6SChuck Silvers 296d9a8abf6SChuck Silvers int 297d9a8abf6SChuck Silvers ffs_fsfail_cleanup_locked(struct ufsmount *ump, int error) 298d9a8abf6SChuck Silvers { 299d9a8abf6SChuck Silvers mtx_assert(UFS_MTX(ump), MA_OWNED); 300d9a8abf6SChuck Silvers if (error == ENXIO && (ump->um_flags & UM_FSFAIL_CLEANUP) == 0) { 301d9a8abf6SChuck Silvers ump->um_flags |= UM_FSFAIL_CLEANUP; 30260a41168SChuck Silvers if (ump->um_mountp == rootvnode->v_mount) 30360a41168SChuck Silvers panic("UFS: root fs would be forcibly unmounted"); 30460a41168SChuck Silvers 305d9a8abf6SChuck Silvers /* 306d9a8abf6SChuck Silvers * Queue an async forced unmount. 307d9a8abf6SChuck Silvers */ 308211ec9b7SJason A. Harmening vfs_ref(ump->um_mountp); 309211ec9b7SJason A. Harmening dounmount(ump->um_mountp, 310211ec9b7SJason A. Harmening MNT_FORCE | MNT_RECURSE | MNT_DEFERRED, curthread); 311d9a8abf6SChuck Silvers printf("UFS: forcibly unmounting %s from %s\n", 312d9a8abf6SChuck Silvers ump->um_mountp->mnt_stat.f_mntfromname, 313d9a8abf6SChuck Silvers ump->um_mountp->mnt_stat.f_mntonname); 314d9a8abf6SChuck Silvers } 315d9a8abf6SChuck Silvers return ((ump->um_flags & UM_FSFAIL_CLEANUP) != 0); 316d9a8abf6SChuck Silvers } 317d9a8abf6SChuck Silvers 318d9a8abf6SChuck Silvers /* 319d9a8abf6SChuck Silvers * Wrapper used during ENXIO cleanup to allocate empty buffers when 320d9a8abf6SChuck Silvers * the kernel is unable to read the real one. They are needed so that 321d9a8abf6SChuck Silvers * the soft updates code can use them to unwind its dependencies. 
322d9a8abf6SChuck Silvers */ 323d9a8abf6SChuck Silvers int 324d9a8abf6SChuck Silvers ffs_breadz(struct ufsmount *ump, struct vnode *vp, daddr_t lblkno, 325d9a8abf6SChuck Silvers daddr_t dblkno, int size, daddr_t *rablkno, int *rabsize, int cnt, 326d9a8abf6SChuck Silvers struct ucred *cred, int flags, void (*ckhashfunc)(struct buf *), 327d9a8abf6SChuck Silvers struct buf **bpp) 328d9a8abf6SChuck Silvers { 329d9a8abf6SChuck Silvers int error; 330d9a8abf6SChuck Silvers 331d9a8abf6SChuck Silvers flags |= GB_CVTENXIO; 332d9a8abf6SChuck Silvers error = breadn_flags(vp, lblkno, dblkno, size, rablkno, rabsize, cnt, 333d9a8abf6SChuck Silvers cred, flags, ckhashfunc, bpp); 334d9a8abf6SChuck Silvers if (error != 0 && ffs_fsfail_cleanup(ump, error)) { 335d9a8abf6SChuck Silvers error = getblkx(vp, lblkno, dblkno, size, 0, 0, flags, bpp); 336d9a8abf6SChuck Silvers KASSERT(error == 0, ("getblkx failed")); 337d9a8abf6SChuck Silvers vfs_bio_bzero_buf(*bpp, 0, size); 338d9a8abf6SChuck Silvers } 339d9a8abf6SChuck Silvers return (error); 340d9a8abf6SChuck Silvers } 341d9a8abf6SChuck Silvers 3425e8c582aSPoul-Henning Kamp static int 343dfd233edSAttilio Rao ffs_mount(struct mount *mp) 344df8bae1dSRodney W. Grimes { 345f15ccf88SChuck Silvers struct vnode *devvp, *odevvp; 346dfd233edSAttilio Rao struct thread *td; 347f7a3729cSKevin Lo struct ufsmount *ump = NULL; 34805f4ff5dSPoul-Henning Kamp struct fs *fs; 3492030ee0eSKonstantin Belousov int error, flags; 3502030ee0eSKonstantin Belousov int error1 __diagused; 3515ffc99e2SKonstantin Belousov uint64_t mntorflags, saved_mnt_flag; 35215bc6b2bSEdward Tomasz Napierala accmode_t accmode; 3535e8c582aSPoul-Henning Kamp struct nameidata ndp; 35420a92a18SPoul-Henning Kamp char *fspec; 3557c7a6681SKonstantin Belousov bool mounted_softdep; 356df8bae1dSRodney W. 
Grimes 357dfd233edSAttilio Rao td = curthread; 35820a92a18SPoul-Henning Kamp if (vfs_filteropt(mp->mnt_optnew, ffs_opts)) 35920a92a18SPoul-Henning Kamp return (EINVAL); 360aa4d7a8aSPoul-Henning Kamp if (uma_inode == NULL) { 361aa4d7a8aSPoul-Henning Kamp uma_inode = uma_zcreate("FFS inode", 362aa4d7a8aSPoul-Henning Kamp sizeof(struct inode), NULL, NULL, NULL, NULL, 363aa4d7a8aSPoul-Henning Kamp UMA_ALIGN_PTR, 0); 364aa4d7a8aSPoul-Henning Kamp uma_ufs1 = uma_zcreate("FFS1 dinode", 365aa4d7a8aSPoul-Henning Kamp sizeof(struct ufs1_dinode), NULL, NULL, NULL, NULL, 366aa4d7a8aSPoul-Henning Kamp UMA_ALIGN_PTR, 0); 367aa4d7a8aSPoul-Henning Kamp uma_ufs2 = uma_zcreate("FFS2 dinode", 368aa4d7a8aSPoul-Henning Kamp sizeof(struct ufs2_dinode), NULL, NULL, NULL, NULL, 369aa4d7a8aSPoul-Henning Kamp UMA_ALIGN_PTR, 0); 3709d5a594fSMateusz Guzik VFS_SMR_ZONE_SET(uma_inode); 371aa4d7a8aSPoul-Henning Kamp } 3728d02a378SPawel Jakub Dawidek 3730b962648SAndriy Gapon vfs_deleteopt(mp->mnt_optnew, "groupquota"); 3740b962648SAndriy Gapon vfs_deleteopt(mp->mnt_optnew, "userquota"); 3750b962648SAndriy Gapon 37620a92a18SPoul-Henning Kamp fspec = vfs_getopts(mp->mnt_optnew, "from", &error); 37751ac12abSPoul-Henning Kamp if (error) 378f2a2857bSKirk McKusick return (error); 3792b14f991SJulian Elischer 3805da56ddbSTor Egge mntorflags = 0; 381daba4da8SKirk McKusick if (vfs_getopt(mp->mnt_optnew, "untrusted", NULL, NULL) == 0) 382daba4da8SKirk McKusick mntorflags |= MNT_UNTRUSTED; 383daba4da8SKirk McKusick 38426f59b64SCraig Rodrigues if (vfs_getopt(mp->mnt_optnew, "acls", NULL, NULL) == 0) 3855da56ddbSTor Egge mntorflags |= MNT_ACLS; 38626f59b64SCraig Rodrigues 387fb77e0afSCraig Rodrigues if (vfs_getopt(mp->mnt_optnew, "snapshot", NULL, NULL) == 0) { 3885da56ddbSTor Egge mntorflags |= MNT_SNAPSHOT; 389fb77e0afSCraig Rodrigues /* 390fb77e0afSCraig Rodrigues * Once we have set the MNT_SNAPSHOT flag, do not 391fb77e0afSCraig Rodrigues * persist "snapshot" in the options list. 
392fb77e0afSCraig Rodrigues */ 393fb77e0afSCraig Rodrigues vfs_deleteopt(mp->mnt_optnew, "snapshot"); 394fb77e0afSCraig Rodrigues vfs_deleteopt(mp->mnt_opt, "snapshot"); 395fb77e0afSCraig Rodrigues } 39626f59b64SCraig Rodrigues 3979340fc72SEdward Tomasz Napierala if (vfs_getopt(mp->mnt_optnew, "nfsv4acls", NULL, NULL) == 0) { 3989340fc72SEdward Tomasz Napierala if (mntorflags & MNT_ACLS) { 399b60ee81eSKirk McKusick vfs_mount_error(mp, 400b60ee81eSKirk McKusick "\"acls\" and \"nfsv4acls\" options " 401b60ee81eSKirk McKusick "are mutually exclusive"); 4029340fc72SEdward Tomasz Napierala return (EINVAL); 4039340fc72SEdward Tomasz Napierala } 4049340fc72SEdward Tomasz Napierala mntorflags |= MNT_NFS4ACLS; 4059340fc72SEdward Tomasz Napierala } 4069340fc72SEdward Tomasz Napierala 4075da56ddbSTor Egge MNT_ILOCK(mp); 4089d5a594fSMateusz Guzik mp->mnt_kern_flag &= ~MNTK_FPLOOKUP; 40961996181SEdward Tomasz Napierala mp->mnt_flag |= mntorflags; 4105da56ddbSTor Egge MNT_IUNLOCK(mp); 4110455cc71SRobert Wing 412df8bae1dSRodney W. Grimes /* 413ab2dbd9bSRobert Wing * If this is a snapshot request, take the snapshot. 414ab2dbd9bSRobert Wing */ 41527d673fbSKirk McKusick if (mp->mnt_flag & MNT_SNAPSHOT) { 41627d673fbSKirk McKusick if ((mp->mnt_flag & MNT_UPDATE) == 0) 41727d673fbSKirk McKusick return (EINVAL); 418ab2dbd9bSRobert Wing return (ffs_snapshot(mp, fspec)); 41927d673fbSKirk McKusick } 420ab2dbd9bSRobert Wing 421ab2dbd9bSRobert Wing /* 4220455cc71SRobert Wing * Must not call namei() while owning busy ref. 4230455cc71SRobert Wing */ 4240455cc71SRobert Wing if (mp->mnt_flag & MNT_UPDATE) 4250455cc71SRobert Wing vfs_unbusy(mp); 4260455cc71SRobert Wing 4270455cc71SRobert Wing /* 4280455cc71SRobert Wing * Not an update, or updating the name: look up the name 4290455cc71SRobert Wing * and verify that it refers to a sensible disk device. 
4300455cc71SRobert Wing */ 4310455cc71SRobert Wing NDINIT(&ndp, LOOKUP, FOLLOW | LOCKLEAF, UIO_SYSSPACE, fspec); 4320455cc71SRobert Wing error = namei(&ndp); 4330455cc71SRobert Wing if ((mp->mnt_flag & MNT_UPDATE) != 0) { 4340455cc71SRobert Wing /* 4350455cc71SRobert Wing * Unmount does not start if MNT_UPDATE is set. Mount 4360455cc71SRobert Wing * update busies mp before setting MNT_UPDATE. We 4370455cc71SRobert Wing * must be able to retain our busy ref successfully, 4380455cc71SRobert Wing * without sleep. 4390455cc71SRobert Wing */ 4400455cc71SRobert Wing error1 = vfs_busy(mp, MBF_NOWAIT); 4410455cc71SRobert Wing MPASS(error1 == 0); 4420455cc71SRobert Wing } 4430455cc71SRobert Wing if (error != 0) 4440455cc71SRobert Wing return (error); 445bb92cd7bSMateusz Guzik NDFREE_PNBUF(&ndp); 4460455cc71SRobert Wing if (!vn_isdisk_error(ndp.ni_vp, &error)) { 4470455cc71SRobert Wing vput(ndp.ni_vp); 4480455cc71SRobert Wing return (error); 4490455cc71SRobert Wing } 4500455cc71SRobert Wing 4510455cc71SRobert Wing /* 4520455cc71SRobert Wing * If mount by non-root, then verify that user has necessary 4530455cc71SRobert Wing * permissions on the device. 4540455cc71SRobert Wing */ 4550455cc71SRobert Wing accmode = VREAD; 4560455cc71SRobert Wing if ((mp->mnt_flag & MNT_RDONLY) == 0) 4570455cc71SRobert Wing accmode |= VWRITE; 4580455cc71SRobert Wing error = VOP_ACCESS(ndp.ni_vp, accmode, td->td_ucred, td); 4590455cc71SRobert Wing if (error) 4600455cc71SRobert Wing error = priv_check(td, PRIV_VFS_MOUNT_PERM); 4610455cc71SRobert Wing if (error) { 4620455cc71SRobert Wing vput(ndp.ni_vp); 4630455cc71SRobert Wing return (error); 4640455cc71SRobert Wing } 4650455cc71SRobert Wing 4660455cc71SRobert Wing /* 4670455cc71SRobert Wing * New mount 4680455cc71SRobert Wing * 4690455cc71SRobert Wing * We need the name for the mount point (also used for 4700455cc71SRobert Wing * "last mounted on") copied in. 
If an error occurs, 4710455cc71SRobert Wing * the mount point is discarded by the upper level code. 4720455cc71SRobert Wing * Note that vfs_mount_alloc() populates f_mntonname for us. 4730455cc71SRobert Wing */ 4740455cc71SRobert Wing if ((mp->mnt_flag & MNT_UPDATE) == 0) { 4750455cc71SRobert Wing if ((error = ffs_mountfs(ndp.ni_vp, mp, td)) != 0) { 4760455cc71SRobert Wing vrele(ndp.ni_vp); 4770455cc71SRobert Wing return (error); 4780455cc71SRobert Wing } 4790455cc71SRobert Wing } else { 4800455cc71SRobert Wing /* 4810455cc71SRobert Wing * When updating, check whether changing from read-only to 482df8bae1dSRodney W. Grimes * read/write; if there is no device name, that's all we do. 483df8bae1dSRodney W. Grimes */ 484df8bae1dSRodney W. Grimes ump = VFSTOUFS(mp); 485df8bae1dSRodney W. Grimes fs = ump->um_fs; 486f15ccf88SChuck Silvers odevvp = ump->um_odevvp; 48726cf9c3bSPeter Wemm devvp = ump->um_devvp; 4880455cc71SRobert Wing 4890455cc71SRobert Wing /* 4900455cc71SRobert Wing * If it's not the same vnode, or at least the same device 4910455cc71SRobert Wing * then it's not correct. 4920455cc71SRobert Wing */ 4930455cc71SRobert Wing if (ndp.ni_vp->v_rdev != ump->um_odevvp->v_rdev) 4940455cc71SRobert Wing error = EINVAL; /* needs translation */ 4950455cc71SRobert Wing vput(ndp.ni_vp); 4960455cc71SRobert Wing if (error) 4970455cc71SRobert Wing return (error); 49820a92a18SPoul-Henning Kamp if (fs->fs_ronly == 0 && 49920a92a18SPoul-Henning Kamp vfs_flagopt(mp->mnt_optnew, "ro", NULL, 0)) { 5006fecb4e4SKonstantin Belousov /* 5016fecb4e4SKonstantin Belousov * Flush any dirty data and suspend filesystem. 
5026fecb4e4SKonstantin Belousov */ 503f2a2857bSKirk McKusick if ((error = vn_start_write(NULL, &mp, V_WAIT)) != 0) 504f2a2857bSKirk McKusick return (error); 505895b3782SKonstantin Belousov error = vfs_write_suspend_umnt(mp); 506895b3782SKonstantin Belousov if (error != 0) 5079ab73fd1SKirk McKusick return (error); 5087c7a6681SKonstantin Belousov 5097c7a6681SKonstantin Belousov fs->fs_ronly = 1; 5107c7a6681SKonstantin Belousov if (MOUNTEDSOFTDEP(mp)) { 5117c7a6681SKonstantin Belousov MNT_ILOCK(mp); 5127c7a6681SKonstantin Belousov mp->mnt_flag &= ~MNT_SOFTDEP; 5137c7a6681SKonstantin Belousov MNT_IUNLOCK(mp); 5147c7a6681SKonstantin Belousov mounted_softdep = true; 5157c7a6681SKonstantin Belousov } else 5167c7a6681SKonstantin Belousov mounted_softdep = false; 5177c7a6681SKonstantin Belousov 518cd600596SKirk McKusick /* 519cd600596SKirk McKusick * Check for and optionally get rid of files open 520cd600596SKirk McKusick * for writing. 521cd600596SKirk McKusick */ 522df8bae1dSRodney W. Grimes flags = WRITECLOSE; 523df8bae1dSRodney W. Grimes if (mp->mnt_flag & MNT_FORCE) 524df8bae1dSRodney W. Grimes flags |= FORCECLOSE; 5257c7a6681SKonstantin Belousov if (mounted_softdep) { 526b40ce416SJulian Elischer error = softdep_flushfiles(mp, flags, td); 527b1897c19SJulian Elischer } else { 528b40ce416SJulian Elischer error = ffs_flushfiles(mp, flags, td); 529df8bae1dSRodney W. 
Grimes } 530f2a2857bSKirk McKusick if (error) { 5317c7a6681SKonstantin Belousov fs->fs_ronly = 0; 5327c7a6681SKonstantin Belousov if (mounted_softdep) { 5337c7a6681SKonstantin Belousov MNT_ILOCK(mp); 5347c7a6681SKonstantin Belousov mp->mnt_flag |= MNT_SOFTDEP; 5357c7a6681SKonstantin Belousov MNT_IUNLOCK(mp); 5367c7a6681SKonstantin Belousov } 537ddd6b3fcSKonstantin Belousov vfs_write_resume(mp, 0); 538f2a2857bSKirk McKusick return (error); 539b1897c19SJulian Elischer } 5407c7a6681SKonstantin Belousov 5419ccb939eSKirk McKusick if (fs->fs_pendingblocks != 0 || 5429ccb939eSKirk McKusick fs->fs_pendinginodes != 0) { 543b60ee81eSKirk McKusick printf("WARNING: %s Update error: blocks %jd " 544b60ee81eSKirk McKusick "files %d\n", fs->fs_fsmnt, 5451c85e6a3SKirk McKusick (intmax_t)fs->fs_pendingblocks, 5469ccb939eSKirk McKusick fs->fs_pendinginodes); 5479ccb939eSKirk McKusick fs->fs_pendingblocks = 0; 5489ccb939eSKirk McKusick fs->fs_pendinginodes = 0; 5499ccb939eSKirk McKusick } 5501a6a6610SKirk McKusick if ((fs->fs_flags & (FS_UNCLEAN | FS_NEEDSFSCK)) == 0) 551f2a2857bSKirk McKusick fs->fs_clean = 1; 552791dd2faSTor Egge if ((error = ffs_sbupdate(ump, MNT_WAIT, 0)) != 0) { 553f2a2857bSKirk McKusick fs->fs_ronly = 0; 554f2a2857bSKirk McKusick fs->fs_clean = 0; 5557c7a6681SKonstantin Belousov if (mounted_softdep) { 5567c7a6681SKonstantin Belousov MNT_ILOCK(mp); 5577c7a6681SKonstantin Belousov mp->mnt_flag |= MNT_SOFTDEP; 5587c7a6681SKonstantin Belousov MNT_IUNLOCK(mp); 5597c7a6681SKonstantin Belousov } 560ddd6b3fcSKonstantin Belousov vfs_write_resume(mp, 0); 561f2a2857bSKirk McKusick return (error); 5622b14f991SJulian Elischer } 5637c7a6681SKonstantin Belousov if (mounted_softdep) 5649420dc62SKirk McKusick softdep_unmount(mp); 56543920011SPoul-Henning Kamp g_topology_lock(); 5668795189cSKirk McKusick /* 5678795189cSKirk McKusick * Drop our write and exclusive access. 
5688795189cSKirk McKusick */ 5698795189cSKirk McKusick g_access(ump->um_cp, 0, -1, -1); 57043920011SPoul-Henning Kamp g_topology_unlock(); 5715da56ddbSTor Egge MNT_ILOCK(mp); 57220a92a18SPoul-Henning Kamp mp->mnt_flag |= MNT_RDONLY; 5735da56ddbSTor Egge MNT_IUNLOCK(mp); 5746fecb4e4SKonstantin Belousov /* 5756fecb4e4SKonstantin Belousov * Allow the writers to note that filesystem 5766fecb4e4SKonstantin Belousov * is ro now. 5776fecb4e4SKonstantin Belousov */ 578ddd6b3fcSKonstantin Belousov vfs_write_resume(mp, 0); 579f2a2857bSKirk McKusick } 580f2a2857bSKirk McKusick if ((mp->mnt_flag & MNT_RELOAD) && 581440320b6SRobert Wing (error = ffs_reload(mp, 0)) != 0) 582f2a2857bSKirk McKusick return (error); 58320a92a18SPoul-Henning Kamp if (fs->fs_ronly && 58420a92a18SPoul-Henning Kamp !vfs_flagopt(mp->mnt_optnew, "ro", NULL, 0)) { 585c9b99213SBruce Evans /* 586c9b99213SBruce Evans * If upgrade to read-write by non-root, then verify 587c9b99213SBruce Evans * that user has necessary permissions on the device. 
588c9b99213SBruce Evans */ 589f15ccf88SChuck Silvers vn_lock(odevvp, LK_EXCLUSIVE | LK_RETRY); 590f15ccf88SChuck Silvers error = VOP_ACCESS(odevvp, VREAD | VWRITE, 591acd3428bSRobert Watson td->td_ucred, td); 592acd3428bSRobert Watson if (error) 593acd3428bSRobert Watson error = priv_check(td, PRIV_VFS_MOUNT_PERM); 594f15ccf88SChuck Silvers VOP_UNLOCK(odevvp); 595acd3428bSRobert Watson if (error) { 596c9b99213SBruce Evans return (error); 597c9b99213SBruce Evans } 5987e58bfacSBruce Evans fs->fs_flags &= ~FS_UNCLEAN; 5990922cce6SBruce Evans if (fs->fs_clean == 0) { 6007e58bfacSBruce Evans fs->fs_flags |= FS_UNCLEAN; 601812b1d41SKirk McKusick if ((mp->mnt_flag & MNT_FORCE) || 602113db2ddSJeff Roberson ((fs->fs_flags & 603113db2ddSJeff Roberson (FS_SUJ | FS_NEEDSFSCK)) == 0 && 6041a6a6610SKirk McKusick (fs->fs_flags & FS_DOSOFTDEP))) { 605b60ee81eSKirk McKusick printf("WARNING: %s was not properly " 60608e5f519SKirk McKusick "dismounted\n", 60708e5f519SKirk McKusick mp->mnt_stat.f_mntonname); 6080922cce6SBruce Evans } else { 609b60ee81eSKirk McKusick vfs_mount_error(mp, 610b60ee81eSKirk McKusick "R/W mount of %s denied. %s.%s", 61108e5f519SKirk McKusick mp->mnt_stat.f_mntonname, 612b60ee81eSKirk McKusick "Filesystem is not clean - run fsck", 613b60ee81eSKirk McKusick (fs->fs_flags & FS_SUJ) == 0 ? "" : 614b60ee81eSKirk McKusick " Forced mount will invalidate" 615b60ee81eSKirk McKusick " journal contents"); 616f2a2857bSKirk McKusick return (EPERM); 6170922cce6SBruce Evans } 6180922cce6SBruce Evans } 61940c340aaSPoul-Henning Kamp g_topology_lock(); 62040c340aaSPoul-Henning Kamp /* 6218795189cSKirk McKusick * Request exclusive write access. 
62240c340aaSPoul-Henning Kamp */ 62340c340aaSPoul-Henning Kamp error = g_access(ump->um_cp, 0, 1, 1); 62440c340aaSPoul-Henning Kamp g_topology_unlock(); 62540c340aaSPoul-Henning Kamp if (error) 62640c340aaSPoul-Henning Kamp return (error); 627f2a2857bSKirk McKusick if ((error = vn_start_write(NULL, &mp, V_WAIT)) != 0) 628f2a2857bSKirk McKusick return (error); 6295ffc99e2SKonstantin Belousov error = vfs_write_suspend_umnt(mp); 6305ffc99e2SKonstantin Belousov if (error != 0) 6315ffc99e2SKonstantin Belousov return (error); 632f2a2857bSKirk McKusick fs->fs_ronly = 0; 6335da56ddbSTor Egge MNT_ILOCK(mp); 6345ffc99e2SKonstantin Belousov saved_mnt_flag = MNT_RDONLY; 6355ffc99e2SKonstantin Belousov if (MOUNTEDSOFTDEP(mp) && (mp->mnt_flag & 6365ffc99e2SKonstantin Belousov MNT_ASYNC) != 0) 6375ffc99e2SKonstantin Belousov saved_mnt_flag |= MNT_ASYNC; 6385ffc99e2SKonstantin Belousov mp->mnt_flag &= ~saved_mnt_flag; 6395da56ddbSTor Egge MNT_IUNLOCK(mp); 640113db2ddSJeff Roberson fs->fs_mtime = time_second; 64126cf9c3bSPeter Wemm /* check to see if we need to start softdep */ 642f2a2857bSKirk McKusick if ((fs->fs_flags & FS_DOSOFTDEP) && 643a854ed98SJohn Baldwin (error = softdep_mount(devvp, mp, fs, td->td_ucred))){ 6445ffc99e2SKonstantin Belousov fs->fs_ronly = 1; 6455ffc99e2SKonstantin Belousov MNT_ILOCK(mp); 6465ffc99e2SKonstantin Belousov mp->mnt_flag |= saved_mnt_flag; 6475ffc99e2SKonstantin Belousov MNT_IUNLOCK(mp); 6485ffc99e2SKonstantin Belousov vfs_write_resume(mp, 0); 649f2a2857bSKirk McKusick return (error); 65026cf9c3bSPeter Wemm } 651113db2ddSJeff Roberson fs->fs_clean = 0; 652113db2ddSJeff Roberson if ((error = ffs_sbupdate(ump, MNT_WAIT, 0)) != 0) { 6535ffc99e2SKonstantin Belousov fs->fs_ronly = 1; 654f776c54cSKonstantin Belousov if ((fs->fs_flags & FS_DOSOFTDEP) != 0) 655f776c54cSKonstantin Belousov softdep_unmount(mp); 6565ffc99e2SKonstantin Belousov MNT_ILOCK(mp); 6575ffc99e2SKonstantin Belousov mp->mnt_flag |= saved_mnt_flag; 6585ffc99e2SKonstantin Belousov 
MNT_IUNLOCK(mp); 6595ffc99e2SKonstantin Belousov vfs_write_resume(mp, 0); 660113db2ddSJeff Roberson return (error); 661113db2ddSJeff Roberson } 662f2a2857bSKirk McKusick if (fs->fs_snapinum[0] != 0) 663f2a2857bSKirk McKusick ffs_snapshot_mount(mp); 6645ffc99e2SKonstantin Belousov vfs_write_resume(mp, 0); 6651469eec8SDavid Greenman } 666c11d2981SJulian Elischer /* 667c11d2981SJulian Elischer * Soft updates is incompatible with "async", 668c11d2981SJulian Elischer * so if we are doing softupdates stop the user 669c11d2981SJulian Elischer * from setting the async flag in an update. 670c11d2981SJulian Elischer * Softdep_mount() clears it in an initial mount 671c11d2981SJulian Elischer * or ro->rw remount. 672c11d2981SJulian Elischer */ 673fddf7baeSKirk McKusick if (MOUNTEDSOFTDEP(mp)) { 6745da56ddbSTor Egge /* XXX: Reset too late ? */ 6755da56ddbSTor Egge MNT_ILOCK(mp); 676c11d2981SJulian Elischer mp->mnt_flag &= ~MNT_ASYNC; 6775da56ddbSTor Egge MNT_IUNLOCK(mp); 6785da56ddbSTor Egge } 679df8bae1dSRodney W. Grimes /* 68039cfb239SPawel Jakub Dawidek * Keep MNT_ACLS flag if it is stored in superblock. 68139cfb239SPawel Jakub Dawidek */ 6825da56ddbSTor Egge if ((fs->fs_flags & FS_ACLS) != 0) { 6835da56ddbSTor Egge /* XXX: Set too late ? */ 6845da56ddbSTor Egge MNT_ILOCK(mp); 68539cfb239SPawel Jakub Dawidek mp->mnt_flag |= MNT_ACLS; 6865da56ddbSTor Egge MNT_IUNLOCK(mp); 6875da56ddbSTor Egge } 688cea90362SCraig Rodrigues 6899340fc72SEdward Tomasz Napierala if ((fs->fs_flags & FS_NFS4ACLS) != 0) { 6909340fc72SEdward Tomasz Napierala /* XXX: Set too late ? 
*/ 6919340fc72SEdward Tomasz Napierala MNT_ILOCK(mp); 6929340fc72SEdward Tomasz Napierala mp->mnt_flag |= MNT_NFS4ACLS; 6939340fc72SEdward Tomasz Napierala MNT_IUNLOCK(mp); 6949340fc72SEdward Tomasz Napierala } 6959340fc72SEdward Tomasz Napierala 696f2a2857bSKirk McKusick } 6979d5a594fSMateusz Guzik 6989d5a594fSMateusz Guzik MNT_ILOCK(mp); 6999d5a594fSMateusz Guzik /* 7009d5a594fSMateusz Guzik * This is racy versus lookup, see ufs_fplookup_vexec for details. 7019d5a594fSMateusz Guzik */ 7029d5a594fSMateusz Guzik if ((mp->mnt_kern_flag & MNTK_FPLOOKUP) != 0) 7039d5a594fSMateusz Guzik panic("MNTK_FPLOOKUP set on mount %p when it should not be", mp); 70403337743SMateusz Guzik if ((mp->mnt_flag & (MNT_ACLS | MNT_NFS4ACLS | MNT_UNION)) == 0) 7059d5a594fSMateusz Guzik mp->mnt_kern_flag |= MNTK_FPLOOKUP; 7069d5a594fSMateusz Guzik MNT_IUNLOCK(mp); 7079d5a594fSMateusz Guzik 70820a92a18SPoul-Henning Kamp vfs_mountedfrom(mp, fspec); 709f2a2857bSKirk McKusick return (0); 7102b14f991SJulian Elischer } 7112b14f991SJulian Elischer 712df8bae1dSRodney W. Grimes /* 71320a92a18SPoul-Henning Kamp * Compatibility with old mount system call. 
71420a92a18SPoul-Henning Kamp */ 71520a92a18SPoul-Henning Kamp 71620a92a18SPoul-Henning Kamp static int 717cc672d35SKirk McKusick ffs_cmount(struct mntarg *ma, void *data, uint64_t flags) 71820a92a18SPoul-Henning Kamp { 71920a92a18SPoul-Henning Kamp struct ufs_args args; 72020a92a18SPoul-Henning Kamp int error; 72120a92a18SPoul-Henning Kamp 72220a92a18SPoul-Henning Kamp if (data == NULL) 72320a92a18SPoul-Henning Kamp return (EINVAL); 72420a92a18SPoul-Henning Kamp error = copyin(data, &args, sizeof args); 72520a92a18SPoul-Henning Kamp if (error) 72620a92a18SPoul-Henning Kamp return (error); 72720a92a18SPoul-Henning Kamp 72820a92a18SPoul-Henning Kamp ma = mount_argsu(ma, "from", args.fspec, MAXPATHLEN); 7291f7104d7SRick Macklem ma = mount_arg(ma, "export", &args.export, sizeof(args.export)); 73020a92a18SPoul-Henning Kamp error = kernel_mount(ma, flags); 73120a92a18SPoul-Henning Kamp 73220a92a18SPoul-Henning Kamp return (error); 73320a92a18SPoul-Henning Kamp } 73420a92a18SPoul-Henning Kamp 73520a92a18SPoul-Henning Kamp /* 736df8bae1dSRodney W. Grimes * Reload all incore data for a filesystem (used after running fsck on 7371848286aSEdward Tomasz Napierala * the root filesystem and finding things to fix). If the 'force' flag 7381848286aSEdward Tomasz Napierala * is 0, the filesystem must be mounted read-only. 739df8bae1dSRodney W. Grimes * 740df8bae1dSRodney W. Grimes * Things to do to update the mount: 741df8bae1dSRodney W. Grimes * 1) invalidate all cached meta-data. 742df8bae1dSRodney W. Grimes * 2) re-read superblock from disk. 743df8bae1dSRodney W. Grimes * 3) re-read summary information from disk. 744df8bae1dSRodney W. Grimes * 4) invalidate all inactive vnodes. 745df426577SKonstantin Belousov * 5) clear MNTK_SUSPEND2 and MNTK_SUSPENDED flags, allowing secondary 746df426577SKonstantin Belousov * writers, if requested. 747df426577SKonstantin Belousov * 6) invalidate all cached file data. 748df426577SKonstantin Belousov * 7) re-read inode data for all active vnodes. 
749df8bae1dSRodney W. Grimes */ 7501848286aSEdward Tomasz Napierala int 751440320b6SRobert Wing ffs_reload(struct mount *mp, int flags) 752df8bae1dSRodney W. Grimes { 75382be0a5aSTor Egge struct vnode *vp, *mvp, *devvp; 754df8bae1dSRodney W. Grimes struct inode *ip; 755f55ff3f3SIan Dowse void *space; 756df8bae1dSRodney W. Grimes struct buf *bp; 757996c772fSJohn Dyson struct fs *fs, *newfs; 7583ba649d7SJeff Roberson struct ufsmount *ump; 7591c85e6a3SKirk McKusick ufs2_daddr_t sblockloc; 760ad544726SKirk McKusick int i, blks, error; 761831b1ff7SKirk McKusick uint64_t size; 762996c772fSJohn Dyson int32_t *lp; 763df8bae1dSRodney W. Grimes 7643ba649d7SJeff Roberson ump = VFSTOUFS(mp); 7651848286aSEdward Tomasz Napierala 7661848286aSEdward Tomasz Napierala MNT_ILOCK(mp); 767df426577SKonstantin Belousov if ((mp->mnt_flag & MNT_RDONLY) == 0 && (flags & FFSR_FORCE) == 0) { 7681848286aSEdward Tomasz Napierala MNT_IUNLOCK(mp); 7691848286aSEdward Tomasz Napierala return (EINVAL); 7701848286aSEdward Tomasz Napierala } 7711848286aSEdward Tomasz Napierala MNT_IUNLOCK(mp); 7721848286aSEdward Tomasz Napierala 773df8bae1dSRodney W. Grimes /* 774df8bae1dSRodney W. Grimes * Step 1: invalidate all cached meta-data. 775df8bae1dSRodney W. Grimes */ 7762b14f991SJulian Elischer devvp = VFSTOUFS(mp)->um_devvp; 777cb05b60aSAttilio Rao vn_lock(devvp, LK_EXCLUSIVE | LK_RETRY); 7780d7935fdSAttilio Rao if (vinvalbuf(devvp, 0, 0, 0) != 0) 779df8bae1dSRodney W. Grimes panic("ffs_reload: dirty1"); 780b249ce48SMateusz Guzik VOP_UNLOCK(devvp); 78195e5e988SJohn Dyson 782df8bae1dSRodney W. Grimes /* 783df8bae1dSRodney W. Grimes * Step 2: re-read superblock from disk. 784df8bae1dSRodney W. Grimes */ 7851c85e6a3SKirk McKusick fs = VFSTOUFS(mp)->um_fs; 786ada981b2SKirk McKusick if ((error = bread(devvp, btodb(fs->fs_sblockloc), fs->fs_sbsize, 7871c85e6a3SKirk McKusick NOCRED, &bp)) != 0) 788df8bae1dSRodney W. 
Grimes return (error); 789996c772fSJohn Dyson newfs = (struct fs *)bp->b_data; 7901c85e6a3SKirk McKusick if ((newfs->fs_magic != FS_UFS1_MAGIC && 7911c85e6a3SKirk McKusick newfs->fs_magic != FS_UFS2_MAGIC) || 7921c85e6a3SKirk McKusick newfs->fs_bsize > MAXBSIZE || 793996c772fSJohn Dyson newfs->fs_bsize < sizeof(struct fs)) { 794df8bae1dSRodney W. Grimes brelse(bp); 795886fd36eSKirk McKusick return (EINTEGRITY); 796df8bae1dSRodney W. Grimes } 797996c772fSJohn Dyson /* 79834816cb9SKirk McKusick * Preserve the summary information, read-only status, and 79934816cb9SKirk McKusick * superblock location by copying these fields into our new 80034816cb9SKirk McKusick * superblock before using it to update the existing superblock. 801996c772fSJohn Dyson */ 80234816cb9SKirk McKusick newfs->fs_si = fs->fs_si; 8031848286aSEdward Tomasz Napierala newfs->fs_ronly = fs->fs_ronly; 8041c85e6a3SKirk McKusick sblockloc = fs->fs_sblockloc; 805831b1ff7SKirk McKusick bcopy(newfs, fs, (uint64_t)fs->fs_sbsize); 806df8bae1dSRodney W. Grimes brelse(bp); 807f1b4324bSChuck Silvers ump->um_bsize = fs->fs_bsize; 808f784da88SKonstantin Belousov ump->um_maxsymlinklen = fs->fs_maxsymlinklen; 8091c85e6a3SKirk McKusick ffs_oldfscompat_read(fs, VFSTOUFS(mp), sblockloc); 8103ba649d7SJeff Roberson UFS_LOCK(ump); 8119ccb939eSKirk McKusick if (fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) { 812b60ee81eSKirk McKusick printf("WARNING: %s: reload pending error: blocks %jd " 81308e5f519SKirk McKusick "files %d\n", mp->mnt_stat.f_mntonname, 81408e5f519SKirk McKusick (intmax_t)fs->fs_pendingblocks, fs->fs_pendinginodes); 8159ccb939eSKirk McKusick fs->fs_pendingblocks = 0; 8169ccb939eSKirk McKusick fs->fs_pendinginodes = 0; 8179ccb939eSKirk McKusick } 8183ba649d7SJeff Roberson UFS_UNLOCK(ump); 819996c772fSJohn Dyson 820df8bae1dSRodney W. Grimes /* 821df8bae1dSRodney W. Grimes * Step 3: re-read summary information from disk. 822df8bae1dSRodney W. 
Grimes */ 8232b028c25SEdward Tomasz Napierala size = fs->fs_cssize; 8242b028c25SEdward Tomasz Napierala blks = howmany(size, fs->fs_fsize); 8252b028c25SEdward Tomasz Napierala if (fs->fs_contigsumsize > 0) 8262b028c25SEdward Tomasz Napierala size += fs->fs_ncg * sizeof(int32_t); 827831b1ff7SKirk McKusick size += fs->fs_ncg * sizeof(uint8_t); 8282b028c25SEdward Tomasz Napierala free(fs->fs_csp, M_UFSMNT); 829ad544726SKirk McKusick space = malloc(size, M_UFSMNT, M_WAITOK); 8302b028c25SEdward Tomasz Napierala fs->fs_csp = space; 831df8bae1dSRodney W. Grimes for (i = 0; i < blks; i += fs->fs_frag) { 832df8bae1dSRodney W. Grimes size = fs->fs_bsize; 833df8bae1dSRodney W. Grimes if (i + fs->fs_frag > blks) 834df8bae1dSRodney W. Grimes size = (blks - i) * fs->fs_fsize; 835c9671602SPoul-Henning Kamp error = bread(devvp, fsbtodb(fs, fs->fs_csaddr + i), size, 836c9671602SPoul-Henning Kamp NOCRED, &bp); 837c9671602SPoul-Henning Kamp if (error) 838df8bae1dSRodney W. Grimes return (error); 839831b1ff7SKirk McKusick bcopy(bp->b_data, space, (uint64_t)size); 840f55ff3f3SIan Dowse space = (char *)space + size; 841df8bae1dSRodney W. Grimes brelse(bp); 842df8bae1dSRodney W. Grimes } 843996c772fSJohn Dyson /* 844996c772fSJohn Dyson * We no longer know anything about clusters per cylinder group. 
845996c772fSJohn Dyson */ 846996c772fSJohn Dyson if (fs->fs_contigsumsize > 0) { 84772b8ff1cSEdward Tomasz Napierala fs->fs_maxcluster = lp = space; 848996c772fSJohn Dyson for (i = 0; i < fs->fs_ncg; i++) 849996c772fSJohn Dyson *lp++ = fs->fs_contigsumsize; 85072b8ff1cSEdward Tomasz Napierala space = lp; 851996c772fSJohn Dyson } 852831b1ff7SKirk McKusick size = fs->fs_ncg * sizeof(uint8_t); 853831b1ff7SKirk McKusick fs->fs_contigdirs = (uint8_t *)space; 85472b8ff1cSEdward Tomasz Napierala bzero(fs->fs_contigdirs, size); 855df426577SKonstantin Belousov if ((flags & FFSR_UNSUSPEND) != 0) { 856df426577SKonstantin Belousov MNT_ILOCK(mp); 857df426577SKonstantin Belousov mp->mnt_kern_flag &= ~(MNTK_SUSPENDED | MNTK_SUSPEND2); 858df426577SKonstantin Belousov wakeup(&mp->mnt_flag); 859df426577SKonstantin Belousov MNT_IUNLOCK(mp); 860df426577SKonstantin Belousov } 861996c772fSJohn Dyson 862df8bae1dSRodney W. Grimes loop: 86371469bb3SKirk McKusick MNT_VNODE_FOREACH_ALL(vp, mp, mvp) { 864df8bae1dSRodney W. Grimes /* 8651848286aSEdward Tomasz Napierala * Skip syncer vnode. 8661848286aSEdward Tomasz Napierala */ 8671848286aSEdward Tomasz Napierala if (vp->v_type == VNON) { 8681848286aSEdward Tomasz Napierala VI_UNLOCK(vp); 8691848286aSEdward Tomasz Napierala continue; 8701848286aSEdward Tomasz Napierala } 8711848286aSEdward Tomasz Napierala /* 872fe68abe2SJeff Roberson * Step 4: invalidate all cached file data. 873df8bae1dSRodney W. Grimes */ 874a92a971bSMateusz Guzik if (vget(vp, LK_EXCLUSIVE | LK_INTERLOCK)) { 87571469bb3SKirk McKusick MNT_VNODE_FOREACH_ALL_ABORT(mp, mvp); 876df8bae1dSRodney W. Grimes goto loop; 877996c772fSJohn Dyson } 8780d7935fdSAttilio Rao if (vinvalbuf(vp, 0, 0, 0)) 879df8bae1dSRodney W. Grimes panic("ffs_reload: dirty2"); 880df8bae1dSRodney W. Grimes /* 881fe68abe2SJeff Roberson * Step 5: re-read inode data for all active vnodes. 882df8bae1dSRodney W. Grimes */ 883df8bae1dSRodney W. 
Grimes ip = VTOI(vp); 884c9671602SPoul-Henning Kamp error = 885df8bae1dSRodney W. Grimes bread(devvp, fsbtodb(fs, ino_to_fsba(fs, ip->i_number)), 886c9671602SPoul-Henning Kamp (int)fs->fs_bsize, NOCRED, &bp); 887c9671602SPoul-Henning Kamp if (error) { 8889fc5d538SKirk McKusick vput(vp); 88971469bb3SKirk McKusick MNT_VNODE_FOREACH_ALL_ABORT(mp, mvp); 890df8bae1dSRodney W. Grimes return (error); 891df8bae1dSRodney W. Grimes } 8929fc5d538SKirk McKusick if ((error = ffs_load_inode(bp, ip, fs, ip->i_number)) != 0) { 8939fc5d538SKirk McKusick brelse(bp); 8949fc5d538SKirk McKusick vput(vp); 8959fc5d538SKirk McKusick MNT_VNODE_FOREACH_ALL_ABORT(mp, mvp); 8969fc5d538SKirk McKusick return (error); 8979fc5d538SKirk McKusick } 898b1897c19SJulian Elischer ip->i_effnlink = ip->i_nlink; 899df8bae1dSRodney W. Grimes brelse(bp); 9009fc5d538SKirk McKusick vput(vp); 901df8bae1dSRodney W. Grimes } 902df8bae1dSRodney W. Grimes return (0); 903df8bae1dSRodney W. Grimes } 904df8bae1dSRodney W. Grimes 9051c85e6a3SKirk McKusick /* 906df8bae1dSRodney W. Grimes * Common code for mount and mountroot 907df8bae1dSRodney W. Grimes */ 908975512a9SPoul-Henning Kamp static int 909064e6b43SKirk McKusick ffs_mountfs(struct vnode *odevvp, struct mount *mp, struct thread *td) 910df8bae1dSRodney W. Grimes { 91105f4ff5dSPoul-Henning Kamp struct ufsmount *ump; 91205f4ff5dSPoul-Henning Kamp struct fs *fs; 91389c9c53dSPoul-Henning Kamp struct cdev *dev; 914dffce215SKirk McKusick int error, i, len, ronly; 915996c772fSJohn Dyson struct ucred *cred; 91643920011SPoul-Henning Kamp struct g_consumer *cp; 9173bbd6d8aSJeff Roberson struct mount *nmp; 918f15ccf88SChuck Silvers struct vnode *devvp; 919e6886616SKirk McKusick int candelete, canspeedup; 920df8bae1dSRodney W. Grimes 921dffce215SKirk McKusick fs = NULL; 922ee445a69SJohn Baldwin ump = NULL; 923a854ed98SJohn Baldwin cred = td ? 
td->td_ucred : NOCRED; 92443920011SPoul-Henning Kamp ronly = (mp->mnt_flag & MNT_RDONLY) != 0; 925ee445a69SJohn Baldwin 926f15ccf88SChuck Silvers devvp = mntfs_allocvp(mp, odevvp); 927c70b3cd2SKonstantin Belousov KASSERT(devvp->v_type == VCHR, ("reclaimed devvp")); 928ee445a69SJohn Baldwin dev = devvp->v_rdev; 92979a5c790SKirk McKusick KASSERT(dev->si_snapdata == NULL, ("non-NULL snapshot data")); 930c70b3cd2SKonstantin Belousov if (atomic_cmpset_acq_ptr((uintptr_t *)&dev->si_mountpt, 0, 931c70b3cd2SKonstantin Belousov (uintptr_t)mp) == 0) { 932f15ccf88SChuck Silvers mntfs_freevp(devvp); 933c70b3cd2SKonstantin Belousov return (EBUSY); 934c70b3cd2SKonstantin Belousov } 93543920011SPoul-Henning Kamp g_topology_lock(); 93643920011SPoul-Henning Kamp error = g_vfs_open(devvp, &cp, "ffs", ronly ? 0 : 1); 93743920011SPoul-Henning Kamp g_topology_unlock(); 938c70b3cd2SKonstantin Belousov if (error != 0) { 939c70b3cd2SKonstantin Belousov atomic_store_rel_ptr((uintptr_t *)&dev->si_mountpt, 0); 940f15ccf88SChuck Silvers mntfs_freevp(devvp); 941c70b3cd2SKonstantin Belousov return (error); 942c70b3cd2SKonstantin Belousov } 943c70b3cd2SKonstantin Belousov dev_ref(dev); 944c70b3cd2SKonstantin Belousov devvp->v_bufobj.bo_ops = &ffs_ops; 945f15ccf88SChuck Silvers BO_LOCK(&odevvp->v_bufobj); 946f15ccf88SChuck Silvers odevvp->v_bufobj.bo_flag |= BO_NOBUFS; 947f15ccf88SChuck Silvers BO_UNLOCK(&odevvp->v_bufobj); 94825809a01SKonstantin Belousov VOP_UNLOCK(devvp); 949c70b3cd2SKonstantin Belousov if (dev->si_iosize_max != 0) 950c70b3cd2SKonstantin Belousov mp->mnt_iosize_max = dev->si_iosize_max; 951cd853791SKonstantin Belousov if (mp->mnt_iosize_max > maxphys) 952cd853791SKonstantin Belousov mp->mnt_iosize_max = maxphys; 95371ac2d7cSCraig Rodrigues if ((SBLOCKSIZE % cp->provider->sectorsize) != 0) { 95471ac2d7cSCraig Rodrigues error = EINVAL; 95571ac2d7cSCraig Rodrigues vfs_mount_error(mp, 95671ac2d7cSCraig Rodrigues "Invalid sectorsize %d for superblock size %d", 95771ac2d7cSCraig 
Rodrigues cp->provider->sectorsize, SBLOCKSIZE); 95871ac2d7cSCraig Rodrigues goto out; 95971ac2d7cSCraig Rodrigues } 960dffce215SKirk McKusick /* fetch the superblock and summary information */ 9619e9dcac9SKirk McKusick if ((mp->mnt_flag & (MNT_ROOTFS | MNT_FORCE)) != 0) 962e6886616SKirk McKusick error = ffs_sbsearch(devvp, &fs, 0, M_UFSMNT, ffs_use_bread); 963e6886616SKirk McKusick else 964e6886616SKirk McKusick error = ffs_sbget(devvp, &fs, UFS_STDSB, 0, M_UFSMNT, 965e6886616SKirk McKusick ffs_use_bread); 966e6886616SKirk McKusick if (error != 0) 967df8bae1dSRodney W. Grimes goto out; 9680922cce6SBruce Evans fs->fs_flags &= ~FS_UNCLEAN; 9690922cce6SBruce Evans if (fs->fs_clean == 0) { 9700922cce6SBruce Evans fs->fs_flags |= FS_UNCLEAN; 971812b1d41SKirk McKusick if (ronly || (mp->mnt_flag & MNT_FORCE) || 972113db2ddSJeff Roberson ((fs->fs_flags & (FS_SUJ | FS_NEEDSFSCK)) == 0 && 9731a6a6610SKirk McKusick (fs->fs_flags & FS_DOSOFTDEP))) { 97459b3a4ebSDavid E. O'Brien printf("WARNING: %s was not properly dismounted\n", 97508e5f519SKirk McKusick mp->mnt_stat.f_mntonname); 9761469eec8SDavid Greenman } else { 97708e5f519SKirk McKusick vfs_mount_error(mp, "R/W mount on %s denied. " 97808e5f519SKirk McKusick "Filesystem is not clean - run fsck.%s", 97908e5f519SKirk McKusick mp->mnt_stat.f_mntonname, 980b60ee81eSKirk McKusick (fs->fs_flags & FS_SUJ) == 0 ? 
"" : 981b60ee81eSKirk McKusick " Forced mount will invalidate journal contents"); 9821469eec8SDavid Greenman error = EPERM; 9831469eec8SDavid Greenman goto out; 9841469eec8SDavid Greenman } 9851c85e6a3SKirk McKusick if ((fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) && 9861c85e6a3SKirk McKusick (mp->mnt_flag & MNT_FORCE)) { 987b60ee81eSKirk McKusick printf("WARNING: %s: lost blocks %jd files %d\n", 98808e5f519SKirk McKusick mp->mnt_stat.f_mntonname, 98908e5f519SKirk McKusick (intmax_t)fs->fs_pendingblocks, 9901c85e6a3SKirk McKusick fs->fs_pendinginodes); 9919ccb939eSKirk McKusick fs->fs_pendingblocks = 0; 9929ccb939eSKirk McKusick fs->fs_pendinginodes = 0; 9939ccb939eSKirk McKusick } 9949ccb939eSKirk McKusick } 9959ccb939eSKirk McKusick if (fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) { 996b60ee81eSKirk McKusick printf("WARNING: %s: mount pending error: blocks %jd " 99708e5f519SKirk McKusick "files %d\n", mp->mnt_stat.f_mntonname, 99808e5f519SKirk McKusick (intmax_t)fs->fs_pendingblocks, fs->fs_pendinginodes); 9999ccb939eSKirk McKusick fs->fs_pendingblocks = 0; 10009ccb939eSKirk McKusick fs->fs_pendinginodes = 0; 10011469eec8SDavid Greenman } 10021a60c7fcSPawel Jakub Dawidek if ((fs->fs_flags & FS_GJOURNAL) != 0) { 10031a60c7fcSPawel Jakub Dawidek #ifdef UFS_GJOURNAL 10041a60c7fcSPawel Jakub Dawidek /* 10051a60c7fcSPawel Jakub Dawidek * Get journal provider name. 
10061a60c7fcSPawel Jakub Dawidek */ 1007ad544726SKirk McKusick len = 1024; 1008831b1ff7SKirk McKusick mp->mnt_gjprovider = malloc((uint64_t)len, M_UFSMNT, M_WAITOK); 1009ad544726SKirk McKusick if (g_io_getattr("GJOURNAL::provider", cp, &len, 10101a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider) == 0) { 1011ad544726SKirk McKusick mp->mnt_gjprovider = realloc(mp->mnt_gjprovider, len, 10121a60c7fcSPawel Jakub Dawidek M_UFSMNT, M_WAITOK); 10131a60c7fcSPawel Jakub Dawidek MNT_ILOCK(mp); 10141a60c7fcSPawel Jakub Dawidek mp->mnt_flag |= MNT_GJOURNAL; 10151a60c7fcSPawel Jakub Dawidek MNT_IUNLOCK(mp); 10161a60c7fcSPawel Jakub Dawidek } else { 10171fbcaa13SKirk McKusick if ((mp->mnt_flag & MNT_RDONLY) == 0) 1018b60ee81eSKirk McKusick printf("WARNING: %s: GJOURNAL flag on fs " 1019b60ee81eSKirk McKusick "but no gjournal provider below\n", 10201a60c7fcSPawel Jakub Dawidek mp->mnt_stat.f_mntonname); 10211a60c7fcSPawel Jakub Dawidek free(mp->mnt_gjprovider, M_UFSMNT); 10221a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider = NULL; 10231a60c7fcSPawel Jakub Dawidek } 10241a60c7fcSPawel Jakub Dawidek #else 1025b60ee81eSKirk McKusick printf("WARNING: %s: GJOURNAL flag on fs but no " 1026b60ee81eSKirk McKusick "UFS_GJOURNAL support\n", mp->mnt_stat.f_mntonname); 10271a60c7fcSPawel Jakub Dawidek #endif 10281a60c7fcSPawel Jakub Dawidek } else { 10291a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider = NULL; 10301a60c7fcSPawel Jakub Dawidek } 1031a163d034SWarner Losh ump = malloc(sizeof *ump, M_UFSMNT, M_WAITOK | M_ZERO); 103243920011SPoul-Henning Kamp ump->um_cp = cp; 103343920011SPoul-Henning Kamp ump->um_bo = &devvp->v_bufobj; 1034dffce215SKirk McKusick ump->um_fs = fs; 10351c85e6a3SKirk McKusick if (fs->fs_magic == FS_UFS1_MAGIC) { 10361c85e6a3SKirk McKusick ump->um_fstype = UFS1; 10371c85e6a3SKirk McKusick ump->um_balloc = ffs_balloc_ufs1; 10381c85e6a3SKirk McKusick } else { 10391c85e6a3SKirk McKusick ump->um_fstype = UFS2; 10401c85e6a3SKirk McKusick ump->um_balloc = ffs_balloc_ufs2; 
10411c85e6a3SKirk McKusick } 1042cec0f20cSPoul-Henning Kamp ump->um_blkatoff = ffs_blkatoff; 1043cec0f20cSPoul-Henning Kamp ump->um_truncate = ffs_truncate; 1044987f5696SPoul-Henning Kamp ump->um_update = ffs_update; 1045cec0f20cSPoul-Henning Kamp ump->um_valloc = ffs_valloc; 1046cec0f20cSPoul-Henning Kamp ump->um_vfree = ffs_vfree; 1047975512a9SPoul-Henning Kamp ump->um_ifree = ffs_ifree; 104890446e36SKonstantin Belousov ump->um_rdonly = ffs_rdonly; 104916b1f68dSKonstantin Belousov ump->um_snapgone = ffs_snapgone; 1050fdf34aa3SKirk McKusick if ((mp->mnt_flag & MNT_UNTRUSTED) != 0) 1051fdf34aa3SKirk McKusick ump->um_check_blkno = ffs_check_blkno; 1052fdf34aa3SKirk McKusick else 1053fdf34aa3SKirk McKusick ump->um_check_blkno = NULL; 10543ba649d7SJeff Roberson mtx_init(UFS_MTX(ump), "FFS", "FFS Lock", MTX_DEF); 10558df4bc48SKonstantin Belousov sx_init(&ump->um_checkpath_lock, "uchpth"); 1056dffce215SKirk McKusick ffs_oldfscompat_read(fs, ump, fs->fs_sblockloc); 1057df8bae1dSRodney W. Grimes fs->fs_ronly = ronly; 1058143a5346SIan Dowse fs->fs_active = NULL; 105977465d93SAlfred Perlstein mp->mnt_data = ump; 106068de329eSPoul-Henning Kamp mp->mnt_stat.f_fsid.val[0] = fs->fs_id[0]; 10618f89943eSGuido van Rooij mp->mnt_stat.f_fsid.val[1] = fs->fs_id[1]; 10623bbd6d8aSJeff Roberson nmp = NULL; 106368de329eSPoul-Henning Kamp if (fs->fs_id[0] == 0 || fs->fs_id[1] == 0 || 10643bbd6d8aSJeff Roberson (nmp = vfs_getvfs(&mp->mnt_stat.f_fsid))) { 10653bbd6d8aSJeff Roberson if (nmp) 10663bbd6d8aSJeff Roberson vfs_rel(nmp); 106768de329eSPoul-Henning Kamp vfs_getnewfsid(mp); 10683bbd6d8aSJeff Roberson } 1069f1b4324bSChuck Silvers ump->um_bsize = fs->fs_bsize; 1070f784da88SKonstantin Belousov ump->um_maxsymlinklen = fs->fs_maxsymlinklen; 10715da56ddbSTor Egge MNT_ILOCK(mp); 1072cc9d8990SPeter Wemm mp->mnt_flag |= MNT_LOCAL; 10735da56ddbSTor Egge MNT_IUNLOCK(mp); 10745da56ddbSTor Egge if ((fs->fs_flags & FS_MULTILABEL) != 0) { 10757b3f1bbdSTom Rhodes #ifdef MAC 10765da56ddbSTor Egge 
MNT_ILOCK(mp); 107780830407SRobert Watson mp->mnt_flag |= MNT_MULTILABEL; 10785da56ddbSTor Egge MNT_IUNLOCK(mp); 10797b3f1bbdSTom Rhodes #else 1080b60ee81eSKirk McKusick printf("WARNING: %s: multilabel flag on fs but " 1081b60ee81eSKirk McKusick "no MAC support\n", mp->mnt_stat.f_mntonname); 10827b3f1bbdSTom Rhodes #endif 10835da56ddbSTor Egge } 10845da56ddbSTor Egge if ((fs->fs_flags & FS_ACLS) != 0) { 10857b3f1bbdSTom Rhodes #ifdef UFS_ACL 10865da56ddbSTor Egge MNT_ILOCK(mp); 10879340fc72SEdward Tomasz Napierala 10889340fc72SEdward Tomasz Napierala if (mp->mnt_flag & MNT_NFS4ACLS) 1089b60ee81eSKirk McKusick printf("WARNING: %s: ACLs flag on fs conflicts with " 1090b60ee81eSKirk McKusick "\"nfsv4acls\" mount option; option ignored\n", 1091b60ee81eSKirk McKusick mp->mnt_stat.f_mntonname); 10929340fc72SEdward Tomasz Napierala mp->mnt_flag &= ~MNT_NFS4ACLS; 109380830407SRobert Watson mp->mnt_flag |= MNT_ACLS; 10949340fc72SEdward Tomasz Napierala 10955da56ddbSTor Egge MNT_IUNLOCK(mp); 10967b3f1bbdSTom Rhodes #else 109759b3a4ebSDavid E. 
O'Brien printf("WARNING: %s: ACLs flag on fs but no ACLs support\n", 1098946478fcSPawel Jakub Dawidek mp->mnt_stat.f_mntonname); 10997b3f1bbdSTom Rhodes #endif 11005da56ddbSTor Egge } 11019340fc72SEdward Tomasz Napierala if ((fs->fs_flags & FS_NFS4ACLS) != 0) { 11029340fc72SEdward Tomasz Napierala #ifdef UFS_ACL 11039340fc72SEdward Tomasz Napierala MNT_ILOCK(mp); 11049340fc72SEdward Tomasz Napierala 11059340fc72SEdward Tomasz Napierala if (mp->mnt_flag & MNT_ACLS) 1106b60ee81eSKirk McKusick printf("WARNING: %s: NFSv4 ACLs flag on fs conflicts " 1107b60ee81eSKirk McKusick "with \"acls\" mount option; option ignored\n", 1108b60ee81eSKirk McKusick mp->mnt_stat.f_mntonname); 11099340fc72SEdward Tomasz Napierala mp->mnt_flag &= ~MNT_ACLS; 11109340fc72SEdward Tomasz Napierala mp->mnt_flag |= MNT_NFS4ACLS; 11119340fc72SEdward Tomasz Napierala 11129340fc72SEdward Tomasz Napierala MNT_IUNLOCK(mp); 11139340fc72SEdward Tomasz Napierala #else 1114b60ee81eSKirk McKusick printf("WARNING: %s: NFSv4 ACLs flag on fs but no " 1115b60ee81eSKirk McKusick "ACLs support\n", mp->mnt_stat.f_mntonname); 11169340fc72SEdward Tomasz Napierala #endif 11179340fc72SEdward Tomasz Napierala } 11188c2a54deSKonstantin Belousov if ((fs->fs_flags & FS_TRIM) != 0) { 1119ad544726SKirk McKusick len = sizeof(int); 1120ad544726SKirk McKusick if (g_io_getattr("GEOM::candelete", cp, &len, 1121ab0bcb60SKirk McKusick &candelete) == 0) { 1122ab0bcb60SKirk McKusick if (candelete) 1123ab0bcb60SKirk McKusick ump->um_flags |= UM_CANDELETE; 1124ab0bcb60SKirk McKusick else 1125b60ee81eSKirk McKusick printf("WARNING: %s: TRIM flag on fs but disk " 1126b60ee81eSKirk McKusick "does not support TRIM\n", 11278c2a54deSKonstantin Belousov mp->mnt_stat.f_mntonname); 11288c2a54deSKonstantin Belousov } else { 1129b60ee81eSKirk McKusick printf("WARNING: %s: TRIM flag on fs but disk does " 1130b60ee81eSKirk McKusick "not confirm that it supports TRIM\n", 11318c2a54deSKonstantin Belousov mp->mnt_stat.f_mntonname); 
11328c2a54deSKonstantin Belousov } 1133ab0bcb60SKirk McKusick if (((ump->um_flags) & UM_CANDELETE) != 0) { 1134c79dff0fSKonstantin Belousov ump->um_trim_tq = taskqueue_create("trim", M_WAITOK, 1135c79dff0fSKonstantin Belousov taskqueue_thread_enqueue, &ump->um_trim_tq); 1136c79dff0fSKonstantin Belousov taskqueue_start_threads(&ump->um_trim_tq, 1, PVFS, 1137c79dff0fSKonstantin Belousov "%s trim", mp->mnt_stat.f_mntonname); 11387e038bc2SKirk McKusick ump->um_trimhash = hashinit(MAXTRIMIO, M_TRIM, 11397e038bc2SKirk McKusick &ump->um_trimlisthashsize); 1140c79dff0fSKonstantin Belousov } 11418c2a54deSKonstantin Belousov } 11429340fc72SEdward Tomasz Napierala 114313532153SScott Long len = sizeof(int); 114413532153SScott Long if (g_io_getattr("GEOM::canspeedup", cp, &len, &canspeedup) == 0) { 114513532153SScott Long if (canspeedup) 114613532153SScott Long ump->um_flags |= UM_CANSPEEDUP; 114713532153SScott Long } 114813532153SScott Long 1149df8bae1dSRodney W. Grimes ump->um_mountp = mp; 1150df8bae1dSRodney W. Grimes ump->um_dev = dev; 1151df8bae1dSRodney W. Grimes ump->um_devvp = devvp; 1152f15ccf88SChuck Silvers ump->um_odevvp = odevvp; 1153df8bae1dSRodney W. Grimes ump->um_nindir = fs->fs_nindir; 1154df8bae1dSRodney W. Grimes ump->um_bptrtodb = fs->fs_fsbtodb; 1155df8bae1dSRodney W. Grimes ump->um_seqinc = fs->fs_frag; 1156df8bae1dSRodney W. Grimes for (i = 0; i < MAXQUOTAS; i++) 1157df8bae1dSRodney W. 
Grimes ump->um_quotas[i] = NULLVP; 1158516081f2SRobert Watson #ifdef UFS_EXTATTR 1159a64ed089SRobert Watson ufs_extattr_uepm_init(&ump->um_extattr); 1160a64ed089SRobert Watson #endif 11612b14f991SJulian Elischer /* 11622b14f991SJulian Elischer * Set FS local "last mounted on" information (NULL pad) 11632b14f991SJulian Elischer */ 116493373c42SSuleiman Souhlal bzero(fs->fs_fsmnt, MAXMNTLEN); 116593373c42SSuleiman Souhlal strlcpy(fs->fs_fsmnt, mp->mnt_stat.f_mntonname, MAXMNTLEN); 1166113db2ddSJeff Roberson mp->mnt_stat.f_iosize = fs->fs_bsize; 11672b14f991SJulian Elischer 11682b14f991SJulian Elischer if (mp->mnt_flag & MNT_ROOTFS) { 11692b14f991SJulian Elischer /* 11702b14f991SJulian Elischer * Root mount; update timestamp in mount structure. 11712b14f991SJulian Elischer * this will be used by the common root mount code 11722b14f991SJulian Elischer * to update the system clock. 11732b14f991SJulian Elischer */ 11742b14f991SJulian Elischer mp->mnt_time = fs->fs_time; 11752b14f991SJulian Elischer } 1176996c772fSJohn Dyson 1177996c772fSJohn Dyson if (ronly == 0) { 1178113db2ddSJeff Roberson fs->fs_mtime = time_second; 1179b1897c19SJulian Elischer if ((fs->fs_flags & FS_DOSOFTDEP) && 1180b1897c19SJulian Elischer (error = softdep_mount(devvp, mp, fs, cred)) != 0) { 1181fddd463dSKonstantin Belousov ffs_flushfiles(mp, FORCECLOSE, td); 1182b1897c19SJulian Elischer goto out; 1183b1897c19SJulian Elischer } 1184f2a2857bSKirk McKusick if (fs->fs_snapinum[0] != 0) 1185f2a2857bSKirk McKusick ffs_snapshot_mount(mp); 1186cf60e8e4SKirk McKusick fs->fs_fmod = 1; 1187996c772fSJohn Dyson fs->fs_clean = 0; 1188791dd2faSTor Egge (void) ffs_sbupdate(ump, MNT_WAIT, 0); 1189996c772fSJohn Dyson } 1190d8d3d415SPoul-Henning Kamp /* 119198cbffd7SKonstantin Belousov * Initialize filesystem state information in mount struct. 
1192d8d3d415SPoul-Henning Kamp */ 11936cf7bc60SRobert Watson MNT_ILOCK(mp); 1194bc2258daSAttilio Rao mp->mnt_kern_flag |= MNTK_LOOKUP_SHARED | MNTK_EXTENDED_SHARED | 11955f34e93cSMark Johnston MNTK_NO_IOPF | MNTK_UNMAPPED_BUFS | MNTK_USES_BCACHE; 11966cf7bc60SRobert Watson MNT_IUNLOCK(mp); 1197516081f2SRobert Watson #ifdef UFS_EXTATTR 1198516081f2SRobert Watson #ifdef UFS_EXTATTR_AUTOSTART 11999de54ba5SRobert Watson /* 12009de54ba5SRobert Watson * 1201f5161237SRobert Watson * Auto-starting does the following: 12029de54ba5SRobert Watson * - check for /.attribute in the fs, and extattr_start if so 12039de54ba5SRobert Watson * - for each file in .attribute, enable that file with 12049de54ba5SRobert Watson * an attribute of the same name. 12059de54ba5SRobert Watson * Not clear how to report errors -- probably eat them. 12069de54ba5SRobert Watson * This would all happen while the filesystem was busy/not 12079de54ba5SRobert Watson * available, so would effectively be "atomic". 12089de54ba5SRobert Watson */ 1209b40ce416SJulian Elischer (void) ufs_extattr_autostart(mp, td); 1210516081f2SRobert Watson #endif /* !UFS_EXTATTR_AUTOSTART */ 1211516081f2SRobert Watson #endif /* !UFS_EXTATTR */ 1212df8bae1dSRodney W. Grimes return (0); 1213df8bae1dSRodney W. 
Grimes out: 1214dffce215SKirk McKusick if (fs != NULL) { 1215dffce215SKirk McKusick free(fs->fs_csp, M_UFSMNT); 121634816cb9SKirk McKusick free(fs->fs_si, M_UFSMNT); 1217dffce215SKirk McKusick free(fs, M_UFSMNT); 1218dffce215SKirk McKusick } 121943920011SPoul-Henning Kamp if (cp != NULL) { 122043920011SPoul-Henning Kamp g_topology_lock(); 12210d7935fdSAttilio Rao g_vfs_close(cp); 122243920011SPoul-Henning Kamp g_topology_unlock(); 122343920011SPoul-Henning Kamp } 12248df4bc48SKonstantin Belousov if (ump != NULL) { 12253ba649d7SJeff Roberson mtx_destroy(UFS_MTX(ump)); 12268df4bc48SKonstantin Belousov sx_destroy(&ump->um_checkpath_lock); 12271a60c7fcSPawel Jakub Dawidek if (mp->mnt_gjprovider != NULL) { 12281a60c7fcSPawel Jakub Dawidek free(mp->mnt_gjprovider, M_UFSMNT); 12291a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider = NULL; 12301a60c7fcSPawel Jakub Dawidek } 12312af934ccSKonstantin Belousov MPASS(ump->um_softdep == NULL); 1232df8bae1dSRodney W. Grimes free(ump, M_UFSMNT); 123377465d93SAlfred Perlstein mp->mnt_data = NULL; 1234df8bae1dSRodney W. Grimes } 1235f15ccf88SChuck Silvers BO_LOCK(&odevvp->v_bufobj); 1236f15ccf88SChuck Silvers odevvp->v_bufobj.bo_flag &= ~BO_NOBUFS; 1237f15ccf88SChuck Silvers BO_UNLOCK(&odevvp->v_bufobj); 1238c70b3cd2SKonstantin Belousov atomic_store_rel_ptr((uintptr_t *)&dev->si_mountpt, 0); 123925809a01SKonstantin Belousov vn_lock(devvp, LK_EXCLUSIVE | LK_RETRY); 1240f15ccf88SChuck Silvers mntfs_freevp(devvp); 124149c4791cSEdward Tomasz Napierala dev_rel(dev); 1242df8bae1dSRodney W. Grimes return (error); 1243df8bae1dSRodney W. Grimes } 1244df8bae1dSRodney W. Grimes 1245dffce215SKirk McKusick /* 1246dffce215SKirk McKusick * A read function for use by filesystem-layer routines. 
1247dffce215SKirk McKusick */ 1248dffce215SKirk McKusick static int 1249dffce215SKirk McKusick ffs_use_bread(void *devfd, off_t loc, void **bufp, int size) 1250dffce215SKirk McKusick { 1251dffce215SKirk McKusick struct buf *bp; 1252dffce215SKirk McKusick int error; 1253dffce215SKirk McKusick 1254efbf3964SKirk McKusick KASSERT(*bufp == NULL, ("ffs_use_bread: non-NULL *bufp %p\n", *bufp)); 1255dffce215SKirk McKusick *bufp = malloc(size, M_UFSMNT, M_WAITOK); 1256dffce215SKirk McKusick if ((error = bread((struct vnode *)devfd, btodb(loc), size, NOCRED, 1257efbf3964SKirk McKusick &bp)) != 0) 1258dffce215SKirk McKusick return (error); 1259dffce215SKirk McKusick bcopy(bp->b_data, *bufp, size); 1260dffce215SKirk McKusick bp->b_flags |= B_INVAL | B_NOCACHE; 1261dffce215SKirk McKusick brelse(bp); 1262dffce215SKirk McKusick return (0); 1263dffce215SKirk McKusick } 1264dffce215SKirk McKusick 1265adf41577SPoul-Henning Kamp static int bigcgs = 0; 12661c85e6a3SKirk McKusick SYSCTL_INT(_debug, OID_AUTO, bigcgs, CTLFLAG_RW, &bigcgs, 0, ""); 12671c85e6a3SKirk McKusick 1268df8bae1dSRodney W. Grimes /* 12691c85e6a3SKirk McKusick * Sanity checks for loading old filesystem superblocks. 12701c85e6a3SKirk McKusick * See ffs_oldfscompat_write below for unwound actions. 1271df8bae1dSRodney W. Grimes * 12721c85e6a3SKirk McKusick * XXX - Parts get retired eventually. 12731c85e6a3SKirk McKusick * Unfortunately new bits get added. 1274df8bae1dSRodney W. Grimes */ 12751c85e6a3SKirk McKusick static void 1276064e6b43SKirk McKusick ffs_oldfscompat_read(struct fs *fs, 1277064e6b43SKirk McKusick struct ufsmount *ump, 1278064e6b43SKirk McKusick ufs2_daddr_t sblockloc) 12791c85e6a3SKirk McKusick { 12801c85e6a3SKirk McKusick off_t maxfilesize; 12811c85e6a3SKirk McKusick 12821c85e6a3SKirk McKusick /* 1283ada981b2SKirk McKusick * If not yet done, update fs_flags location and value of fs_sblockloc. 
1284ada981b2SKirk McKusick */ 1285ada981b2SKirk McKusick if ((fs->fs_old_flags & FS_FLAGS_UPDATED) == 0) { 1286ada981b2SKirk McKusick fs->fs_flags = fs->fs_old_flags; 1287ada981b2SKirk McKusick fs->fs_old_flags |= FS_FLAGS_UPDATED; 1288ada981b2SKirk McKusick fs->fs_sblockloc = sblockloc; 1289ada981b2SKirk McKusick } 1290ada981b2SKirk McKusick /* 12911c85e6a3SKirk McKusick * If not yet done, update UFS1 superblock with new wider fields. 12921c85e6a3SKirk McKusick */ 129374f3809aSKirk McKusick if (fs->fs_magic == FS_UFS1_MAGIC && fs->fs_maxbsize != fs->fs_bsize) { 12941c85e6a3SKirk McKusick fs->fs_maxbsize = fs->fs_bsize; 12951c85e6a3SKirk McKusick fs->fs_time = fs->fs_old_time; 12961c85e6a3SKirk McKusick fs->fs_size = fs->fs_old_size; 12971c85e6a3SKirk McKusick fs->fs_dsize = fs->fs_old_dsize; 12981c85e6a3SKirk McKusick fs->fs_csaddr = fs->fs_old_csaddr; 12991c85e6a3SKirk McKusick fs->fs_cstotal.cs_ndir = fs->fs_old_cstotal.cs_ndir; 13001c85e6a3SKirk McKusick fs->fs_cstotal.cs_nbfree = fs->fs_old_cstotal.cs_nbfree; 13011c85e6a3SKirk McKusick fs->fs_cstotal.cs_nifree = fs->fs_old_cstotal.cs_nifree; 13021c85e6a3SKirk McKusick fs->fs_cstotal.cs_nffree = fs->fs_old_cstotal.cs_nffree; 13031c85e6a3SKirk McKusick } 13041c85e6a3SKirk McKusick if (fs->fs_magic == FS_UFS1_MAGIC && 13051c85e6a3SKirk McKusick fs->fs_old_inodefmt < FS_44INODEFMT) { 13068680d698SNate Lawson fs->fs_maxfilesize = ((uint64_t)1 << 31) - 1; 13071c85e6a3SKirk McKusick fs->fs_qbmask = ~fs->fs_bmask; 13081c85e6a3SKirk McKusick fs->fs_qfmask = ~fs->fs_fmask; 13091c85e6a3SKirk McKusick } 13108f42fb8fSIan Dowse if (fs->fs_magic == FS_UFS1_MAGIC) { 13111c85e6a3SKirk McKusick ump->um_savedmaxfilesize = fs->fs_maxfilesize; 13128680d698SNate Lawson maxfilesize = (uint64_t)0x80000000 * fs->fs_bsize - 1; 13131c85e6a3SKirk McKusick if (fs->fs_maxfilesize > maxfilesize) 13141c85e6a3SKirk McKusick fs->fs_maxfilesize = maxfilesize; 13158f42fb8fSIan Dowse } 13161c85e6a3SKirk McKusick /* Compatibility for old 
filesystems */ 13171c85e6a3SKirk McKusick if (fs->fs_avgfilesize <= 0) 13181c85e6a3SKirk McKusick fs->fs_avgfilesize = AVFILESIZ; 13191c85e6a3SKirk McKusick if (fs->fs_avgfpdir <= 0) 13201c85e6a3SKirk McKusick fs->fs_avgfpdir = AFPDIR; 13211c85e6a3SKirk McKusick if (bigcgs) { 13221c85e6a3SKirk McKusick fs->fs_save_cgsize = fs->fs_cgsize; 13231c85e6a3SKirk McKusick fs->fs_cgsize = fs->fs_bsize; 13241c85e6a3SKirk McKusick } 13251c85e6a3SKirk McKusick } 13261c85e6a3SKirk McKusick 13271c85e6a3SKirk McKusick /* 13281c85e6a3SKirk McKusick * Unwinding superblock updates for old filesystems. 13291c85e6a3SKirk McKusick * See ffs_oldfscompat_read above for details. 13301c85e6a3SKirk McKusick * 13311c85e6a3SKirk McKusick * XXX - Parts get retired eventually. 13321c85e6a3SKirk McKusick * Unfortunately new bits get added. 13331c85e6a3SKirk McKusick */ 1334113db2ddSJeff Roberson void 1335064e6b43SKirk McKusick ffs_oldfscompat_write(struct fs *fs, struct ufsmount *ump) 1336df8bae1dSRodney W. Grimes { 1337df8bae1dSRodney W. Grimes 13381c85e6a3SKirk McKusick /* 13391c85e6a3SKirk McKusick * Copy back UFS2 updated fields that UFS1 inspects. 13401c85e6a3SKirk McKusick */ 13411c85e6a3SKirk McKusick if (fs->fs_magic == FS_UFS1_MAGIC) { 13421c85e6a3SKirk McKusick fs->fs_old_time = fs->fs_time; 13431c85e6a3SKirk McKusick fs->fs_old_cstotal.cs_ndir = fs->fs_cstotal.cs_ndir; 13441c85e6a3SKirk McKusick fs->fs_old_cstotal.cs_nbfree = fs->fs_cstotal.cs_nbfree; 13451c85e6a3SKirk McKusick fs->fs_old_cstotal.cs_nifree = fs->fs_cstotal.cs_nifree; 13461c85e6a3SKirk McKusick fs->fs_old_cstotal.cs_nffree = fs->fs_cstotal.cs_nffree; 13471c85e6a3SKirk McKusick fs->fs_maxfilesize = ump->um_savedmaxfilesize; 13488f42fb8fSIan Dowse } 13491c85e6a3SKirk McKusick if (bigcgs) { 13501c85e6a3SKirk McKusick fs->fs_cgsize = fs->fs_save_cgsize; 13511c85e6a3SKirk McKusick fs->fs_save_cgsize = 0; 13521c85e6a3SKirk McKusick } 1353df8bae1dSRodney W. Grimes } 1354df8bae1dSRodney W. Grimes 1355df8bae1dSRodney W. 
Grimes /* 1356df8bae1dSRodney W. Grimes * unmount system call 1357df8bae1dSRodney W. Grimes */ 1358adf41577SPoul-Henning Kamp static int 1359064e6b43SKirk McKusick ffs_unmount(struct mount *mp, int mntflags) 1360df8bae1dSRodney W. Grimes { 1361dfd233edSAttilio Rao struct thread *td; 136205f4ff5dSPoul-Henning Kamp struct ufsmount *ump = VFSTOUFS(mp); 136305f4ff5dSPoul-Henning Kamp struct fs *fs; 13646fecb4e4SKonstantin Belousov int error, flags, susp; 1365df86ccf6SKonstantin Belousov #ifdef UFS_EXTATTR 1366df86ccf6SKonstantin Belousov int e_restart; 1367df86ccf6SKonstantin Belousov #endif 1368df8bae1dSRodney W. Grimes 1369df8bae1dSRodney W. Grimes flags = 0; 1370dfd233edSAttilio Rao td = curthread; 13716fecb4e4SKonstantin Belousov fs = ump->um_fs; 137271f26429SKonstantin Belousov if (mntflags & MNT_FORCE) 1373df8bae1dSRodney W. Grimes flags |= FORCECLOSE; 13744ce90426SKonstantin Belousov susp = fs->fs_ronly == 0; 1375516081f2SRobert Watson #ifdef UFS_EXTATTR 1376b40ce416SJulian Elischer if ((error = ufs_extattr_stop(mp, td))) { 1377b2b0497aSRobert Watson if (error != EOPNOTSUPP) 1378b60ee81eSKirk McKusick printf("WARNING: unmount %s: ufs_extattr_stop " 1379b60ee81eSKirk McKusick "returned errno %d\n", mp->mnt_stat.f_mntonname, 1380b2b0497aSRobert Watson error); 1381df86ccf6SKonstantin Belousov e_restart = 0; 13827df97b61SRobert Watson } else { 13839de54ba5SRobert Watson ufs_extattr_uepm_destroy(&ump->um_extattr); 1384df86ccf6SKonstantin Belousov e_restart = 1; 13857df97b61SRobert Watson } 1386a64ed089SRobert Watson #endif 13876fecb4e4SKonstantin Belousov if (susp) { 1388895b3782SKonstantin Belousov error = vfs_write_suspend_umnt(mp); 1389895b3782SKonstantin Belousov if (error != 0) 1390895b3782SKonstantin Belousov goto fail1; 13916fecb4e4SKonstantin Belousov } 1392fddf7baeSKirk McKusick if (MOUNTEDSOFTDEP(mp)) 13933c140b2dSEdward Tomasz Napierala error = softdep_flushfiles(mp, flags, td); 13943c140b2dSEdward Tomasz Napierala else 13953c140b2dSEdward Tomasz Napierala 
error = ffs_flushfiles(mp, flags, td); 1396d79ff54bSChuck Silvers if (error != 0 && !ffs_fsfail_cleanup(ump, error)) 13976fecb4e4SKonstantin Belousov goto fail; 13983c140b2dSEdward Tomasz Napierala 13993ba649d7SJeff Roberson UFS_LOCK(ump); 14009ccb939eSKirk McKusick if (fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) { 1401b60ee81eSKirk McKusick printf("WARNING: unmount %s: pending error: blocks %jd " 1402b60ee81eSKirk McKusick "files %d\n", fs->fs_fsmnt, (intmax_t)fs->fs_pendingblocks, 14031c85e6a3SKirk McKusick fs->fs_pendinginodes); 14049ccb939eSKirk McKusick fs->fs_pendingblocks = 0; 14059ccb939eSKirk McKusick fs->fs_pendinginodes = 0; 14069ccb939eSKirk McKusick } 14073ba649d7SJeff Roberson UFS_UNLOCK(ump); 1408519e3c3bSKirk McKusick if (MOUNTEDSOFTDEP(mp)) 1409113db2ddSJeff Roberson softdep_unmount(mp); 14102af934ccSKonstantin Belousov MPASS(ump->um_softdep == NULL); 14119acea164SRobert Wing if (fs->fs_ronly == 0) { 14121a6a6610SKirk McKusick fs->fs_clean = fs->fs_flags & (FS_UNCLEAN|FS_NEEDSFSCK) ? 
0 : 1; 1413791dd2faSTor Egge error = ffs_sbupdate(ump, MNT_WAIT, 0); 1414d79ff54bSChuck Silvers if (ffs_fsfail_cleanup(ump, error)) 1415d79ff54bSChuck Silvers error = 0; 1416d79ff54bSChuck Silvers if (error != 0 && !ffs_fsfail_cleanup(ump, error)) { 1417996c772fSJohn Dyson fs->fs_clean = 0; 14186fecb4e4SKonstantin Belousov goto fail; 1419996c772fSJohn Dyson } 1420e0e9c421SDavid Greenman } 1421ddd6b3fcSKonstantin Belousov if (susp) 1422ddd6b3fcSKonstantin Belousov vfs_write_resume(mp, VR_START_WRITE); 1423c79dff0fSKonstantin Belousov if (ump->um_trim_tq != NULL) { 14243dc5f8e1SChuck Silvers MPASS(ump->um_trim_inflight == 0); 1425c79dff0fSKonstantin Belousov taskqueue_free(ump->um_trim_tq); 14267e038bc2SKirk McKusick free (ump->um_trimhash, M_TRIM); 1427c79dff0fSKonstantin Belousov } 1428c34a5148SKonstantin Belousov vn_lock(ump->um_devvp, LK_EXCLUSIVE | LK_RETRY); 142943920011SPoul-Henning Kamp g_topology_lock(); 14300d7935fdSAttilio Rao g_vfs_close(ump->um_cp); 143143920011SPoul-Henning Kamp g_topology_unlock(); 1432f15ccf88SChuck Silvers BO_LOCK(&ump->um_odevvp->v_bufobj); 1433f15ccf88SChuck Silvers ump->um_odevvp->v_bufobj.bo_flag &= ~BO_NOBUFS; 1434f15ccf88SChuck Silvers BO_UNLOCK(&ump->um_odevvp->v_bufobj); 1435c70b3cd2SKonstantin Belousov atomic_store_rel_ptr((uintptr_t *)&ump->um_dev->si_mountpt, 0); 1436f15ccf88SChuck Silvers mntfs_freevp(ump->um_devvp); 1437f15ccf88SChuck Silvers vrele(ump->um_odevvp); 143849c4791cSEdward Tomasz Napierala dev_rel(ump->um_dev); 14393ba649d7SJeff Roberson mtx_destroy(UFS_MTX(ump)); 14408df4bc48SKonstantin Belousov sx_destroy(&ump->um_checkpath_lock); 14411a60c7fcSPawel Jakub Dawidek if (mp->mnt_gjprovider != NULL) { 14421a60c7fcSPawel Jakub Dawidek free(mp->mnt_gjprovider, M_UFSMNT); 14431a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider = NULL; 14441a60c7fcSPawel Jakub Dawidek } 1445f55ff3f3SIan Dowse free(fs->fs_csp, M_UFSMNT); 144634816cb9SKirk McKusick free(fs->fs_si, M_UFSMNT); 1447df8bae1dSRodney W. 
Grimes free(fs, M_UFSMNT); 1448df8bae1dSRodney W. Grimes free(ump, M_UFSMNT); 144977465d93SAlfred Perlstein mp->mnt_data = NULL; 14504cbc378cSKonstantin Belousov if (td->td_su == mp) { 14514cbc378cSKonstantin Belousov td->td_su = NULL; 14524cbc378cSKonstantin Belousov vfs_rel(mp); 14534cbc378cSKonstantin Belousov } 1454df8bae1dSRodney W. Grimes return (error); 14556fecb4e4SKonstantin Belousov 14566fecb4e4SKonstantin Belousov fail: 1457ddd6b3fcSKonstantin Belousov if (susp) 1458ddd6b3fcSKonstantin Belousov vfs_write_resume(mp, VR_START_WRITE); 1459895b3782SKonstantin Belousov fail1: 1460df86ccf6SKonstantin Belousov #ifdef UFS_EXTATTR 1461df86ccf6SKonstantin Belousov if (e_restart) { 1462df86ccf6SKonstantin Belousov ufs_extattr_uepm_init(&ump->um_extattr); 1463df86ccf6SKonstantin Belousov #ifdef UFS_EXTATTR_AUTOSTART 1464df86ccf6SKonstantin Belousov (void) ufs_extattr_autostart(mp, td); 1465df86ccf6SKonstantin Belousov #endif 1466df86ccf6SKonstantin Belousov } 1467df86ccf6SKonstantin Belousov #endif 1468df86ccf6SKonstantin Belousov 14696fecb4e4SKonstantin Belousov return (error); 1470df8bae1dSRodney W. Grimes } 1471df8bae1dSRodney W. Grimes 1472df8bae1dSRodney W. Grimes /* 1473df8bae1dSRodney W. Grimes * Flush out all the files in a filesystem. 1474df8bae1dSRodney W. Grimes */ 147526f9a767SRodney W. Grimes int 1476064e6b43SKirk McKusick ffs_flushfiles(struct mount *mp, int flags, struct thread *td) 1477df8bae1dSRodney W. Grimes { 147805f4ff5dSPoul-Henning Kamp struct ufsmount *ump; 1479ba05dec5SKonstantin Belousov int qerror, error; 1480df8bae1dSRodney W. Grimes 1481df8bae1dSRodney W. Grimes ump = VFSTOUFS(mp); 1482ba05dec5SKonstantin Belousov qerror = 0; 1483df8bae1dSRodney W. Grimes #ifdef QUOTA 1484df8bae1dSRodney W. Grimes if (mp->mnt_flag & MNT_QUOTA) { 1485c1d9efcbSPoul-Henning Kamp int i; 1486f257b7a5SAlfred Perlstein error = vflush(mp, 0, SKIPSYSTEM|flags, td); 1487c1d9efcbSPoul-Henning Kamp if (error) 1488df8bae1dSRodney W. 
Grimes return (error); 1489df8bae1dSRodney W. Grimes for (i = 0; i < MAXQUOTAS; i++) { 1490ba05dec5SKonstantin Belousov error = quotaoff(td, mp, i); 1491ba05dec5SKonstantin Belousov if (error != 0) { 1492ba05dec5SKonstantin Belousov if ((flags & EARLYFLUSH) == 0) 1493ba05dec5SKonstantin Belousov return (error); 1494ba05dec5SKonstantin Belousov else 1495ba05dec5SKonstantin Belousov qerror = error; 1496df8bae1dSRodney W. Grimes } 1497ba05dec5SKonstantin Belousov } 1498ba05dec5SKonstantin Belousov 1499df8bae1dSRodney W. Grimes /* 1500ba05dec5SKonstantin Belousov * Here we fall through to vflush again to ensure that 1501ba05dec5SKonstantin Belousov * we have gotten rid of all the system vnodes, unless 1502ba05dec5SKonstantin Belousov * quotas must not be closed. 1503df8bae1dSRodney W. Grimes */ 1504df8bae1dSRodney W. Grimes } 1505df8bae1dSRodney W. Grimes #endif 150676b05e3eSKonstantin Belousov /* devvp is not locked there */ 1507e6e370a7SJeff Roberson if (ump->um_devvp->v_vflag & VV_COPYONWRITE) { 1508f257b7a5SAlfred Perlstein if ((error = vflush(mp, 0, SKIPSYSTEM | flags, td)) != 0) 1509f2a2857bSKirk McKusick return (error); 1510f2a2857bSKirk McKusick ffs_snapshot_unmount(mp); 151195e7a3c3STor Egge flags |= FORCECLOSE; 1512f2a2857bSKirk McKusick /* 1513f2a2857bSKirk McKusick * Here we fall through to vflush again to ensure 1514f2a2857bSKirk McKusick * that we have gotten rid of all the system vnodes. 1515f2a2857bSKirk McKusick */ 1516f2a2857bSKirk McKusick } 1517ba05dec5SKonstantin Belousov 1518b1897c19SJulian Elischer /* 1519ba05dec5SKonstantin Belousov * Do not close system files if quotas were not closed, to be 1520ba05dec5SKonstantin Belousov * able to sync the remaining dquots. The freeblks softupdate 1521ba05dec5SKonstantin Belousov * workitems might hold a reference on a dquot, preventing 1522ba05dec5SKonstantin Belousov * quotaoff() from completing. 
Next round of 1523ba05dec5SKonstantin Belousov * softdep_flushworklist() iteration should process the 1524ba05dec5SKonstantin Belousov * blockers, allowing the next run of quotaoff() to finally 1525ba05dec5SKonstantin Belousov * flush held dquots. 1526ba05dec5SKonstantin Belousov * 1527ba05dec5SKonstantin Belousov * Otherwise, flush all the files. 1528b1897c19SJulian Elischer */ 1529ba05dec5SKonstantin Belousov if (qerror == 0 && (error = vflush(mp, 0, flags, td)) != 0) 1530b1897c19SJulian Elischer return (error); 1531ba05dec5SKonstantin Belousov 1532b1897c19SJulian Elischer /* 15333dc5f8e1SChuck Silvers * If this is a forcible unmount and there were any files that 15343dc5f8e1SChuck Silvers * were unlinked but still open, then vflush() will have 15353dc5f8e1SChuck Silvers * truncated and freed those files, which might have started 15363dc5f8e1SChuck Silvers * some trim work. Wait here for any trims to complete 15373dc5f8e1SChuck Silvers * and process the blkfrees which follow the trims. 15383dc5f8e1SChuck Silvers * This may create more dirty devvp buffers and softdep deps. 15393dc5f8e1SChuck Silvers */ 15403dc5f8e1SChuck Silvers if (ump->um_trim_tq != NULL) { 15413dc5f8e1SChuck Silvers while (ump->um_trim_inflight != 0) 15423dc5f8e1SChuck Silvers pause("ufsutr", hz); 15433dc5f8e1SChuck Silvers taskqueue_drain_all(ump->um_trim_tq); 15443dc5f8e1SChuck Silvers } 15453dc5f8e1SChuck Silvers 15463dc5f8e1SChuck Silvers /* 1547b1897c19SJulian Elischer * Flush filesystem metadata. 1548b1897c19SJulian Elischer */ 1549cb05b60aSAttilio Rao vn_lock(ump->um_devvp, LK_EXCLUSIVE | LK_RETRY); 15508df6bac4SPoul-Henning Kamp error = VOP_FSYNC(ump->um_devvp, MNT_WAIT, td); 1551b249ce48SMateusz Guzik VOP_UNLOCK(ump->um_devvp); 1552df8bae1dSRodney W. Grimes return (error); 1553df8bae1dSRodney W. Grimes } 1554df8bae1dSRodney W. Grimes 1555df8bae1dSRodney W. Grimes /* 1556df8bae1dSRodney W. Grimes * Get filesystem statistics. 1557df8bae1dSRodney W. 
*/
static int
ffs_statfs(struct mount *mp, struct statfs *sbp)
{
	struct ufsmount *ump = VFSTOUFS(mp);
	struct fs *fs = ump->um_fs;

	/* Only UFS1 and UFS2 superblocks are acceptable here. */
	switch (fs->fs_magic) {
	case FS_UFS1_MAGIC:
	case FS_UFS2_MAGIC:
		break;
	default:
		panic("ffs_statfs");
	}

	/* Values filled in without taking the UFS lock. */
	sbp->f_version = STATFS_VERSION;
	sbp->f_bsize = fs->fs_fsize;
	sbp->f_iosize = fs->fs_bsize;
	sbp->f_blocks = fs->fs_dsize;

	/*
	 * Free-space and free-inode figures are read under the UFS lock;
	 * each adds in the pending block or inode count.
	 */
	UFS_LOCK(ump);
	sbp->f_bfree = fs->fs_cstotal.cs_nbfree * fs->fs_frag +
	    fs->fs_cstotal.cs_nffree + dbtofsb(fs, fs->fs_pendingblocks);
	sbp->f_bavail = freespace(fs, fs->fs_minfree) +
	    dbtofsb(fs, fs->fs_pendingblocks);
	sbp->f_files = fs->fs_ncg * fs->fs_ipg - UFS_ROOTINO;
	sbp->f_ffree = fs->fs_cstotal.cs_nifree + fs->fs_pendinginodes;
	UFS_UNLOCK(ump);

	sbp->f_namemax = UFS_MAXNAMLEN;
	return (0);
}
Grimes 15841eabd967SKonstantin Belousov static bool 15851eabd967SKonstantin Belousov sync_doupdate(struct inode *ip) 15861eabd967SKonstantin Belousov { 15871eabd967SKonstantin Belousov 15881eabd967SKonstantin Belousov return ((ip->i_flag & (IN_ACCESS | IN_CHANGE | IN_MODIFIED | 15891eabd967SKonstantin Belousov IN_UPDATE)) != 0); 15901eabd967SKonstantin Belousov } 15911eabd967SKonstantin Belousov 159280663cadSMateusz Guzik static int 159380663cadSMateusz Guzik ffs_sync_lazy_filter(struct vnode *vp, void *arg __unused) 159480663cadSMateusz Guzik { 159580663cadSMateusz Guzik struct inode *ip; 159680663cadSMateusz Guzik 159780663cadSMateusz Guzik /* 159880663cadSMateusz Guzik * Flags are safe to access because ->v_data invalidation 159980663cadSMateusz Guzik * is held off by listmtx. 160080663cadSMateusz Guzik */ 160180663cadSMateusz Guzik if (vp->v_type == VNON) 160280663cadSMateusz Guzik return (false); 160380663cadSMateusz Guzik ip = VTOI(vp); 160480663cadSMateusz Guzik if (!sync_doupdate(ip) && (vp->v_iflag & VI_OWEINACT) == 0) 160580663cadSMateusz Guzik return (false); 160680663cadSMateusz Guzik return (true); 160780663cadSMateusz Guzik } 160880663cadSMateusz Guzik 1609df8bae1dSRodney W. Grimes /* 1610a988a5c6SKonstantin Belousov * For a lazy sync, we only care about access times, quotas and the 1611a988a5c6SKonstantin Belousov * superblock. Other filesystem changes are already converted to 1612a988a5c6SKonstantin Belousov * cylinder group blocks or inode blocks updates and are written to 1613a988a5c6SKonstantin Belousov * disk by syncer. 
1614a988a5c6SKonstantin Belousov */ 1615a988a5c6SKonstantin Belousov static int 1616064e6b43SKirk McKusick ffs_sync_lazy(struct mount *mp) 1617a988a5c6SKonstantin Belousov { 1618a988a5c6SKonstantin Belousov struct vnode *mvp, *vp; 1619a988a5c6SKonstantin Belousov struct inode *ip; 1620a988a5c6SKonstantin Belousov int allerror, error; 1621a988a5c6SKonstantin Belousov 1622a988a5c6SKonstantin Belousov allerror = 0; 16230297c138SKirk McKusick if ((mp->mnt_flag & MNT_NOATIME) != 0) { 16240297c138SKirk McKusick #ifdef QUOTA 16250297c138SKirk McKusick qsync(mp); 16260297c138SKirk McKusick #endif 16270297c138SKirk McKusick goto sbupdate; 16280297c138SKirk McKusick } 162980663cadSMateusz Guzik MNT_VNODE_FOREACH_LAZY(vp, mp, mvp, ffs_sync_lazy_filter, NULL) { 163071469bb3SKirk McKusick if (vp->v_type == VNON) { 1631a988a5c6SKonstantin Belousov VI_UNLOCK(vp); 1632a988a5c6SKonstantin Belousov continue; 1633a988a5c6SKonstantin Belousov } 1634a988a5c6SKonstantin Belousov ip = VTOI(vp); 1635a988a5c6SKonstantin Belousov 1636a988a5c6SKonstantin Belousov /* 1637a988a5c6SKonstantin Belousov * The IN_ACCESS flag is converted to IN_MODIFIED by 1638a988a5c6SKonstantin Belousov * ufs_close() and ufs_getattr() by the calls to 1639ea573a50SKonstantin Belousov * ufs_itimes_locked(), without subsequent UFS_UPDATE(). 1640ea573a50SKonstantin Belousov * Test also all the other timestamp flags too, to pick up 1641ea573a50SKonstantin Belousov * any other cases that could be missed. 
1642a988a5c6SKonstantin Belousov */ 16431eabd967SKonstantin Belousov if (!sync_doupdate(ip) && (vp->v_iflag & VI_OWEINACT) == 0) { 1644a988a5c6SKonstantin Belousov VI_UNLOCK(vp); 1645a988a5c6SKonstantin Belousov continue; 1646a988a5c6SKonstantin Belousov } 1647a92a971bSMateusz Guzik if ((error = vget(vp, LK_EXCLUSIVE | LK_NOWAIT | LK_INTERLOCK)) != 0) 1648a988a5c6SKonstantin Belousov continue; 16490297c138SKirk McKusick #ifdef QUOTA 16500297c138SKirk McKusick qsyncvp(vp); 16510297c138SKirk McKusick #endif 16521eabd967SKonstantin Belousov if (sync_doupdate(ip)) 1653a988a5c6SKonstantin Belousov error = ffs_update(vp, 0); 1654a988a5c6SKonstantin Belousov if (error != 0) 1655a988a5c6SKonstantin Belousov allerror = error; 1656a988a5c6SKonstantin Belousov vput(vp); 1657a988a5c6SKonstantin Belousov } 16580297c138SKirk McKusick sbupdate: 1659a988a5c6SKonstantin Belousov if (VFSTOUFS(mp)->um_fs->fs_fmod != 0 && 1660a988a5c6SKonstantin Belousov (error = ffs_sbupdate(VFSTOUFS(mp), MNT_LAZY, 0)) != 0) 1661a988a5c6SKonstantin Belousov allerror = error; 1662a988a5c6SKonstantin Belousov return (allerror); 1663a988a5c6SKonstantin Belousov } 1664a988a5c6SKonstantin Belousov 1665a988a5c6SKonstantin Belousov /* 1666df8bae1dSRodney W. Grimes * Go through the disk queues to initiate sandbagged IO; 1667df8bae1dSRodney W. Grimes * go through the inodes to write those that have been modified; 1668df8bae1dSRodney W. Grimes * initiate the writing of the super block if it has been modified. 1669df8bae1dSRodney W. Grimes * 1670a988a5c6SKonstantin Belousov * Note: we are always called with the filesystem marked busy using 1671a988a5c6SKonstantin Belousov * vfs_busy(). 1672df8bae1dSRodney W. Grimes */ 1673adf41577SPoul-Henning Kamp static int 1674064e6b43SKirk McKusick ffs_sync(struct mount *mp, int waitfor) 1675df8bae1dSRodney W. 
Grimes { 167682be0a5aSTor Egge struct vnode *mvp, *vp, *devvp; 1677dfd233edSAttilio Rao struct thread *td; 1678996c772fSJohn Dyson struct inode *ip; 1679996c772fSJohn Dyson struct ufsmount *ump = VFSTOUFS(mp); 1680996c772fSJohn Dyson struct fs *fs; 168169baeadcSKonstantin Belousov int error, count, lockreq, allerror = 0; 1682791dd2faSTor Egge int suspend; 1683791dd2faSTor Egge int suspended; 1684791dd2faSTor Egge int secondary_writes; 1685791dd2faSTor Egge int secondary_accwrites; 1686791dd2faSTor Egge int softdep_deps; 1687791dd2faSTor Egge int softdep_accdeps; 1688156cb265SPoul-Henning Kamp struct bufobj *bo; 1689df8bae1dSRodney W. Grimes 169019c87af0SKirk McKusick suspend = 0; 169119c87af0SKirk McKusick suspended = 0; 1692dfd233edSAttilio Rao td = curthread; 1693df8bae1dSRodney W. Grimes fs = ump->um_fs; 16949acea164SRobert Wing if (fs->fs_fmod != 0 && fs->fs_ronly != 0) 1695b60ee81eSKirk McKusick panic("%s: ffs_sync: modification on read-only filesystem", 1696b60ee81eSKirk McKusick fs->fs_fsmnt); 16974af9f77eSKonstantin Belousov if (waitfor == MNT_LAZY) { 16984af9f77eSKonstantin Belousov if (!rebooting) 1699a988a5c6SKonstantin Belousov return (ffs_sync_lazy(mp)); 17004af9f77eSKonstantin Belousov waitfor = MNT_NOWAIT; 17014af9f77eSKonstantin Belousov } 1702a988a5c6SKonstantin Belousov 170319c87af0SKirk McKusick /* 1704df8bae1dSRodney W. Grimes * Write back each (modified) inode. 1705df8bae1dSRodney W. Grimes */ 1706245df27cSMatthew Dillon lockreq = LK_EXCLUSIVE | LK_NOWAIT; 1707791dd2faSTor Egge if (waitfor == MNT_SUSPEND) { 1708791dd2faSTor Egge suspend = 1; 1709791dd2faSTor Egge waitfor = MNT_WAIT; 1710791dd2faSTor Egge } 171169baeadcSKonstantin Belousov if (waitfor == MNT_WAIT) 1712245df27cSMatthew Dillon lockreq = LK_EXCLUSIVE; 17134d9b2ed3SMateusz Guzik lockreq |= LK_INTERLOCK; 1714df8bae1dSRodney W. 
Grimes loop: 1715791dd2faSTor Egge /* Grab snapshot of secondary write counts */ 171671469bb3SKirk McKusick MNT_ILOCK(mp); 1717791dd2faSTor Egge secondary_writes = mp->mnt_secondary_writes; 1718791dd2faSTor Egge secondary_accwrites = mp->mnt_secondary_accwrites; 171971469bb3SKirk McKusick MNT_IUNLOCK(mp); 1720791dd2faSTor Egge 1721791dd2faSTor Egge /* Grab snapshot of softdep dependency counts */ 1722791dd2faSTor Egge softdep_get_depcounts(mp, &softdep_deps, &softdep_accdeps); 1723791dd2faSTor Egge 172471469bb3SKirk McKusick MNT_VNODE_FOREACH_ALL(vp, mp, mvp) { 1725245df27cSMatthew Dillon /* 1726e0c17408SKonstantin Belousov * Depend on the vnode interlock to keep things stable enough 1727245df27cSMatthew Dillon * for a quick test. Since there might be hundreds of 1728245df27cSMatthew Dillon * thousands of vnodes, we cannot afford even a subroutine 1729245df27cSMatthew Dillon * call unless there's a good chance that we have work to do. 1730245df27cSMatthew Dillon */ 173171469bb3SKirk McKusick if (vp->v_type == VNON) { 17322f05568aSJeff Roberson VI_UNLOCK(vp); 17332f05568aSJeff Roberson continue; 17342f05568aSJeff Roberson } 1735df8bae1dSRodney W. Grimes ip = VTOI(vp); 173671469bb3SKirk McKusick if ((ip->i_flag & 1737cf60e8e4SKirk McKusick (IN_ACCESS | IN_CHANGE | IN_MODIFIED | IN_UPDATE)) == 0 && 173871469bb3SKirk McKusick vp->v_bufobj.bo_dirty.bv_cnt == 0) { 17392f05568aSJeff Roberson VI_UNLOCK(vp); 1740df8bae1dSRodney W. Grimes continue; 1741996c772fSJohn Dyson } 1742a92a971bSMateusz Guzik if ((error = vget(vp, lockreq)) != 0) { 17434d9b2ed3SMateusz Guzik if (error == ENOENT) { 174471469bb3SKirk McKusick MNT_VNODE_FOREACH_ALL_ABORT(mp, mvp); 1745df8bae1dSRodney W. 
Grimes goto loop; 174682be0a5aSTor Egge } 17472f05568aSJeff Roberson continue; 17482f05568aSJeff Roberson } 17490297c138SKirk McKusick #ifdef QUOTA 17500297c138SKirk McKusick qsyncvp(vp); 17510297c138SKirk McKusick #endif 17528a1509e4SKonstantin Belousov for (;;) { 17538a1509e4SKonstantin Belousov error = ffs_syncvnode(vp, waitfor, 0); 17548a1509e4SKonstantin Belousov if (error == ERELOOKUP) 17558a1509e4SKonstantin Belousov continue; 17568a1509e4SKonstantin Belousov if (error != 0) 1757df8bae1dSRodney W. Grimes allerror = error; 17588a1509e4SKonstantin Belousov break; 17598a1509e4SKonstantin Belousov } 176041d4783dSJeff Roberson vput(vp); 1761245df27cSMatthew Dillon } 1762df8bae1dSRodney W. Grimes /* 1763df8bae1dSRodney W. Grimes * Force stale filesystem control information to be flushed. 1764df8bae1dSRodney W. Grimes */ 17654af9f77eSKonstantin Belousov if (waitfor == MNT_WAIT || rebooting) { 1766b40ce416SJulian Elischer if ((error = softdep_flushworklist(ump->um_mountp, &count, td))) 17679b971133SKirk McKusick allerror = error; 1768d79ff54bSChuck Silvers if (ffs_fsfail_cleanup(ump, allerror)) 1769d79ff54bSChuck Silvers allerror = 0; 17709b971133SKirk McKusick /* Flushed work items may create new vnodes to clean */ 177171469bb3SKirk McKusick if (allerror == 0 && count) 17729b971133SKirk McKusick goto loop; 17739b971133SKirk McKusick } 177419c87af0SKirk McKusick 1775112f7372SKirk McKusick devvp = ump->um_devvp; 1776156cb265SPoul-Henning Kamp bo = &devvp->v_bufobj; 1777698b1a66SJeff Roberson BO_LOCK(bo); 177819c87af0SKirk McKusick if (bo->bo_numoutput > 0 || bo->bo_dirty.bv_cnt > 0) { 1779698b1a66SJeff Roberson BO_UNLOCK(bo); 1780698b1a66SJeff Roberson vn_lock(devvp, LK_EXCLUSIVE | LK_RETRY); 17814af9f77eSKonstantin Belousov error = VOP_FSYNC(devvp, waitfor, td); 1782b249ce48SMateusz Guzik VOP_UNLOCK(devvp); 17834af9f77eSKonstantin Belousov if (MOUNTEDSOFTDEP(mp) && (error == 0 || error == EAGAIN)) 17844af9f77eSKonstantin Belousov error = ffs_sbupdate(ump, waitfor, 
0); 17854af9f77eSKonstantin Belousov if (error != 0) 17864af9f77eSKonstantin Belousov allerror = error; 1787d79ff54bSChuck Silvers if (ffs_fsfail_cleanup(ump, allerror)) 1788d79ff54bSChuck Silvers allerror = 0; 178971469bb3SKirk McKusick if (allerror == 0 && waitfor == MNT_WAIT) 1790112f7372SKirk McKusick goto loop; 1791791dd2faSTor Egge } else if (suspend != 0) { 1792791dd2faSTor Egge if (softdep_check_suspend(mp, 1793791dd2faSTor Egge devvp, 1794791dd2faSTor Egge softdep_deps, 1795791dd2faSTor Egge softdep_accdeps, 1796791dd2faSTor Egge secondary_writes, 179771469bb3SKirk McKusick secondary_accwrites) != 0) { 179871469bb3SKirk McKusick MNT_IUNLOCK(mp); 1799791dd2faSTor Egge goto loop; /* More work needed */ 180071469bb3SKirk McKusick } 1801791dd2faSTor Egge mtx_assert(MNT_MTX(mp), MA_OWNED); 1802ca2fa807STor Egge mp->mnt_kern_flag |= MNTK_SUSPEND2 | MNTK_SUSPENDED; 1803791dd2faSTor Egge MNT_IUNLOCK(mp); 1804791dd2faSTor Egge suspended = 1; 1805112f7372SKirk McKusick } else 1806698b1a66SJeff Roberson BO_UNLOCK(bo); 1807996c772fSJohn Dyson /* 1808996c772fSJohn Dyson * Write back modified superblock. 1809996c772fSJohn Dyson */ 1810791dd2faSTor Egge if (fs->fs_fmod != 0 && 1811791dd2faSTor Egge (error = ffs_sbupdate(ump, waitfor, suspended)) != 0) 1812996c772fSJohn Dyson allerror = error; 1813d79ff54bSChuck Silvers if (ffs_fsfail_cleanup(ump, allerror)) 1814d79ff54bSChuck Silvers allerror = 0; 1815df8bae1dSRodney W. Grimes return (allerror); 1816df8bae1dSRodney W. Grimes } 1817df8bae1dSRodney W. Grimes 1818df8bae1dSRodney W. Grimes int 1819064e6b43SKirk McKusick ffs_vget(struct mount *mp, ino_t ino, int flags, struct vnode **vpp) 1820df8bae1dSRodney W. 
Grimes { 18217b7ed832SKonstantin Belousov return (ffs_vgetf(mp, ino, flags, vpp, 0)); 18227b7ed832SKonstantin Belousov } 18237b7ed832SKonstantin Belousov 18247b7ed832SKonstantin Belousov int 1825064e6b43SKirk McKusick ffs_vgetf(struct mount *mp, 1826064e6b43SKirk McKusick ino_t ino, 1827064e6b43SKirk McKusick int flags, 1828064e6b43SKirk McKusick struct vnode **vpp, 1829064e6b43SKirk McKusick int ffs_flags) 18307b7ed832SKonstantin Belousov { 1831996c772fSJohn Dyson struct fs *fs; 1832996c772fSJohn Dyson struct inode *ip; 1833df8bae1dSRodney W. Grimes struct ufsmount *ump; 1834df8bae1dSRodney W. Grimes struct buf *bp; 1835df8bae1dSRodney W. Grimes struct vnode *vp; 1836d79ff54bSChuck Silvers daddr_t dbn; 1837f576a00dSSemen Ustimenko int error; 1838df8bae1dSRodney W. Grimes 1839f16c26b1SKonstantin Belousov MPASS((ffs_flags & (FFSV_REPLACE | FFSV_REPLACE_DOOMED)) == 0 || 1840f16c26b1SKonstantin Belousov (flags & LK_EXCLUSIVE) != 0); 184116040222SKonstantin Belousov 184251f5ce0cSPoul-Henning Kamp error = vfs_hash_get(mp, ino, flags, curthread, vpp, NULL, NULL); 184316040222SKonstantin Belousov if (error != 0) 184414bc0685SPoul-Henning Kamp return (error); 184516040222SKonstantin Belousov if (*vpp != NULL) { 1846f16c26b1SKonstantin Belousov if ((ffs_flags & FFSV_REPLACE) == 0 || 1847f16c26b1SKonstantin Belousov ((ffs_flags & FFSV_REPLACE_DOOMED) == 0 || 1848f16c26b1SKonstantin Belousov !VN_IS_DOOMED(*vpp))) 184916040222SKonstantin Belousov return (0); 185016040222SKonstantin Belousov vgone(*vpp); 185116040222SKonstantin Belousov vput(*vpp); 185216040222SKonstantin Belousov } 1853f576a00dSSemen Ustimenko 1854f576a00dSSemen Ustimenko /* 1855d6919865SJeff Roberson * We must promote to an exclusive lock for vnode creation. This 1856d6919865SJeff Roberson * can happen if lookup is passed LOCKSHARED. 
1857d6919865SJeff Roberson */ 1858d6919865SJeff Roberson if ((flags & LK_TYPE_MASK) == LK_SHARED) { 1859d6919865SJeff Roberson flags &= ~LK_TYPE_MASK; 1860d6919865SJeff Roberson flags |= LK_EXCLUSIVE; 1861d6919865SJeff Roberson } 1862d6919865SJeff Roberson 1863d6919865SJeff Roberson /* 186413866b3fSSemen Ustimenko * We do not lock vnode creation as it is believed to be too 1865f576a00dSSemen Ustimenko * expensive for such rare case as simultaneous creation of vnode 1866f576a00dSSemen Ustimenko * for same ino by different processes. We just allow them to race 1867f576a00dSSemen Ustimenko * and check later to decide who wins. Let the race begin! 1868f576a00dSSemen Ustimenko */ 186914bc0685SPoul-Henning Kamp 187014bc0685SPoul-Henning Kamp ump = VFSTOUFS(mp); 187114bc0685SPoul-Henning Kamp fs = ump->um_fs; 18729d5a594fSMateusz Guzik ip = uma_zalloc_smr(uma_inode, M_WAITOK | M_ZERO); 18732f9bae59SDavid Greenman 1874df8bae1dSRodney W. Grimes /* Allocate a new vnode/inode. */ 187543a993bbSKirk McKusick error = getnewvnode("ufs", mp, fs->fs_magic == FS_UFS1_MAGIC ? 187643a993bbSKirk McKusick &ffs_vnodeops1 : &ffs_vnodeops2, &vp); 1877c9671602SPoul-Henning Kamp if (error) { 1878df8bae1dSRodney W. Grimes *vpp = NULL; 18799d5a594fSMateusz Guzik uma_zfree_smr(uma_inode, ip); 1880df8bae1dSRodney W. Grimes return (error); 1881df8bae1dSRodney W. Grimes } 188267e87166SBoris Popov /* 188333fc3625SJohn Baldwin * FFS supports recursive locking. 188467e87166SBoris Popov */ 1885303d3ae7SKonstantin Belousov lockmgr(vp->v_vnlock, LK_EXCLUSIVE | LK_NOWITNESS, NULL); 1886628f51d2SAttilio Rao VN_LOCK_AREC(vp); 1887df8bae1dSRodney W. Grimes vp->v_data = ip; 18885d9d81e7SPoul-Henning Kamp vp->v_bufobj.bo_bsize = fs->fs_bsize; 1889df8bae1dSRodney W. Grimes ip->i_vnode = vp; 18901c85e6a3SKirk McKusick ip->i_ump = ump; 1891df8bae1dSRodney W. 
Grimes ip->i_number = ino; 1892e65f5a4eSKonstantin Belousov ip->i_ea_refs = 0; 189374a87c38SKirk McKusick ip->i_nextclustercg = -1; 1894e1db6897SKonstantin Belousov ip->i_flag = fs->fs_magic == FS_UFS1_MAGIC ? 0 : IN_UFS2; 189572d28f97SKirk McKusick ip->i_mode = 0; /* ensure error cases below throw away vnode */ 18962bfd8992SKonstantin Belousov cluster_init_vn(&ip->i_clusterw); 189761846fc4SKonstantin Belousov #ifdef DIAGNOSTIC 189861846fc4SKonstantin Belousov ufs_init_trackers(ip); 189961846fc4SKonstantin Belousov #endif 1900df8bae1dSRodney W. Grimes #ifdef QUOTA 1901c1d9efcbSPoul-Henning Kamp { 1902c1d9efcbSPoul-Henning Kamp int i; 1903df8bae1dSRodney W. Grimes for (i = 0; i < MAXQUOTAS; i++) 1904df8bae1dSRodney W. Grimes ip->i_dquot[i] = NODQUOT; 1905c1d9efcbSPoul-Henning Kamp } 1906df8bae1dSRodney W. Grimes #endif 1907df8bae1dSRodney W. Grimes 19087b7ed832SKonstantin Belousov if (ffs_flags & FFSV_FORCEINSMQ) 19097b7ed832SKonstantin Belousov vp->v_vflag |= VV_FORCEINSMQ; 191061b9d89fSTor Egge error = insmntque(vp, mp); 191161b9d89fSTor Egge if (error != 0) { 19129d5a594fSMateusz Guzik uma_zfree_smr(uma_inode, ip); 191361b9d89fSTor Egge *vpp = NULL; 191461b9d89fSTor Egge return (error); 191561b9d89fSTor Egge } 19167b7ed832SKonstantin Belousov vp->v_vflag &= ~VV_FORCEINSMQ; 1917a80d8caaSPawel Jakub Dawidek error = vfs_hash_insert(vp, ino, flags, curthread, vpp, NULL, NULL); 191816040222SKonstantin Belousov if (error != 0) 1919f576a00dSSemen Ustimenko return (error); 192016040222SKonstantin Belousov if (*vpp != NULL) { 192116040222SKonstantin Belousov /* 192216040222SKonstantin Belousov * Calls from ffs_valloc() (i.e. FFSV_REPLACE set) 192316040222SKonstantin Belousov * operate on empty inode, which must not be found by 192416040222SKonstantin Belousov * other threads until fully filled. 
Vnode for empty 192516040222SKonstantin Belousov * inode must be not re-inserted on the hash by other 192616040222SKonstantin Belousov * thread, after removal by us at the beginning. 192716040222SKonstantin Belousov */ 192816040222SKonstantin Belousov MPASS((ffs_flags & FFSV_REPLACE) == 0); 192916040222SKonstantin Belousov return (0); 193016040222SKonstantin Belousov } 19316b9d4fbbSKirk McKusick if (I_IS_UFS1(ip)) 19326b9d4fbbSKirk McKusick ip->i_din1 = uma_zalloc(uma_ufs1, M_WAITOK); 19336b9d4fbbSKirk McKusick else 19346b9d4fbbSKirk McKusick ip->i_din2 = uma_zalloc(uma_ufs2, M_WAITOK); 1935f576a00dSSemen Ustimenko 19366b9d4fbbSKirk McKusick if ((ffs_flags & FFSV_NEWINODE) != 0) { 19376b9d4fbbSKirk McKusick /* New inode, just zero out its contents. */ 19386b9d4fbbSKirk McKusick if (I_IS_UFS1(ip)) 19396b9d4fbbSKirk McKusick memset(ip->i_din1, 0, sizeof(struct ufs1_dinode)); 19406b9d4fbbSKirk McKusick else 19416b9d4fbbSKirk McKusick memset(ip->i_din2, 0, sizeof(struct ufs2_dinode)); 19426b9d4fbbSKirk McKusick } else { 19436b9d4fbbSKirk McKusick /* Read the disk contents for the inode, copy into the inode. */ 1944d79ff54bSChuck Silvers dbn = fsbtodb(fs, ino_to_fsba(fs, ino)); 19456b9d4fbbSKirk McKusick error = ffs_breadz(ump, ump->um_devvp, dbn, dbn, 19466b9d4fbbSKirk McKusick (int)fs->fs_bsize, NULL, NULL, 0, NOCRED, 0, NULL, &bp); 1947d79ff54bSChuck Silvers if (error != 0) { 1948df8bae1dSRodney W. Grimes /* 19496b9d4fbbSKirk McKusick * The inode does not contain anything useful, so it 19506b9d4fbbSKirk McKusick * would be misleading to leave it on its hash chain. 19516b9d4fbbSKirk McKusick * With mode still zero, it will be unlinked and 19526b9d4fbbSKirk McKusick * returned to the free list by vput(). 1953df8bae1dSRodney W. Grimes */ 19546c44a3e0SMateusz Guzik vgone(vp); 1955bd7e5f99SJohn Dyson vput(vp); 1956df8bae1dSRodney W. Grimes *vpp = NULL; 1957df8bae1dSRodney W. Grimes return (error); 1958df8bae1dSRodney W. 
Grimes } 19599fc5d538SKirk McKusick if ((error = ffs_load_inode(bp, ip, fs, ino)) != 0) { 19609fc5d538SKirk McKusick bqrelse(bp); 19616c44a3e0SMateusz Guzik vgone(vp); 19629fc5d538SKirk McKusick vput(vp); 19639fc5d538SKirk McKusick *vpp = NULL; 19649fc5d538SKirk McKusick return (error); 19659fc5d538SKirk McKusick } 19666b9d4fbbSKirk McKusick bqrelse(bp); 19676b9d4fbbSKirk McKusick } 1968fd97fa64SKonstantin Belousov if (DOINGSOFTDEP(vp) && (!fs->fs_ronly || 1969fd97fa64SKonstantin Belousov (ffs_flags & FFSV_FORCEINODEDEP) != 0)) 1970b1897c19SJulian Elischer softdep_load_inodeblock(ip); 1971b1897c19SJulian Elischer else 1972b1897c19SJulian Elischer ip->i_effnlink = ip->i_nlink; 1973df8bae1dSRodney W. Grimes 1974df8bae1dSRodney W. Grimes /* 1975df8bae1dSRodney W. Grimes * Initialize the vnode from the inode, check for aliases. 1976df8bae1dSRodney W. Grimes * Note that the underlying vnode may have changed. 1977df8bae1dSRodney W. Grimes */ 1978e1db6897SKonstantin Belousov error = ufs_vinit(mp, I_IS_UFS1(ip) ? &ffs_fifoops1 : &ffs_fifoops2, 1979e1db6897SKonstantin Belousov &vp); 1980c9671602SPoul-Henning Kamp if (error) { 19816c44a3e0SMateusz Guzik vgone(vp); 1982df8bae1dSRodney W. Grimes vput(vp); 1983df8bae1dSRodney W. Grimes *vpp = NULL; 1984df8bae1dSRodney W. Grimes return (error); 1985df8bae1dSRodney W. Grimes } 1986de68347bSPoul-Henning Kamp 1987df8bae1dSRodney W. Grimes /* 19885c24d6eeSPoul-Henning Kamp * Finish inode initialization. 1989df8bae1dSRodney W. Grimes */ 199033fc3625SJohn Baldwin if (vp->v_type != VFIFO) { 199133fc3625SJohn Baldwin /* FFS supports shared locking for all files except fifos. */ 199233fc3625SJohn Baldwin VN_LOCK_ASHARE(vp); 199333fc3625SJohn Baldwin } 1994de68347bSPoul-Henning Kamp 1995df8bae1dSRodney W. Grimes /* 1996df8bae1dSRodney W. Grimes * Set up a generation number for this inode if it does not 1997df8bae1dSRodney W. Grimes * already have one. This should only happen on old filesystems. 1998df8bae1dSRodney W. 
Grimes */ 1999df8bae1dSRodney W. Grimes if (ip->i_gen == 0) { 200057d2ac2fSKevin Lo while (ip->i_gen == 0) 200157d2ac2fSKevin Lo ip->i_gen = arc4random(); 20021c85e6a3SKirk McKusick if ((vp->v_mount->mnt_flag & MNT_RDONLY) == 0) { 2003ac4ec141SMateusz Guzik UFS_INODE_SET_FLAG(ip, IN_MODIFIED); 2004b403319bSAlexander Kabaev DIP_SET(ip, i_gen, ip->i_gen); 20051c85e6a3SKirk McKusick } 2006df8bae1dSRodney W. Grimes } 2007763bbd2fSRobert Watson #ifdef MAC 2008763bbd2fSRobert Watson if ((mp->mnt_flag & MNT_MULTILABEL) && ip->i_mode) { 2009763bbd2fSRobert Watson /* 2010763bbd2fSRobert Watson * If this vnode is already allocated, and we're running 2011763bbd2fSRobert Watson * multi-label, attempt to perform a label association 2012763bbd2fSRobert Watson * from the extended attributes on the inode. 2013763bbd2fSRobert Watson */ 201430d239bcSRobert Watson error = mac_vnode_associate_extattr(mp, vp); 2015763bbd2fSRobert Watson if (error) { 2016763bbd2fSRobert Watson /* ufs_inactive will release ip->i_devvp ref. */ 20176c44a3e0SMateusz Guzik vgone(vp); 2018763bbd2fSRobert Watson vput(vp); 2019763bbd2fSRobert Watson *vpp = NULL; 2020763bbd2fSRobert Watson return (error); 2021763bbd2fSRobert Watson } 2022763bbd2fSRobert Watson } 2023763bbd2fSRobert Watson #endif 2024763bbd2fSRobert Watson 2025829f0bcbSMateusz Guzik vn_set_state(vp, VSTATE_CONSTRUCTED); 2026df8bae1dSRodney W. Grimes *vpp = vp; 2027df8bae1dSRodney W. Grimes return (0); 2028df8bae1dSRodney W. Grimes } 2029df8bae1dSRodney W. Grimes 2030df8bae1dSRodney W. Grimes /* 2031df8bae1dSRodney W. Grimes * File handle to vnode 2032df8bae1dSRodney W. Grimes * 2033df8bae1dSRodney W. Grimes * Have to be really careful about stale file handles: 2034df8bae1dSRodney W. Grimes * - check that the inode number is valid 2035abe53f7eSKirk McKusick * - for UFS2 check that the inode number is initialized 2036df8bae1dSRodney W. Grimes * - call ffs_vget() to get the locked inode 2037df8bae1dSRodney W. 
Grimes * - check for an unallocated inode (i_mode == 0) 2038df8bae1dSRodney W. Grimes * - check that the given client host has export rights and return 2039df8bae1dSRodney W. Grimes * those rights via. exflagsp and credanonp 2040df8bae1dSRodney W. Grimes */ 2041adf41577SPoul-Henning Kamp static int 2042064e6b43SKirk McKusick ffs_fhtovp(struct mount *mp, struct fid *fhp, int flags, struct vnode **vpp) 2043df8bae1dSRodney W. Grimes { 204405f4ff5dSPoul-Henning Kamp struct ufid *ufhp; 20455952c86cSKonstantin Belousov 20465952c86cSKonstantin Belousov ufhp = (struct ufid *)fhp; 20475952c86cSKonstantin Belousov return (ffs_inotovp(mp, ufhp->ufid_ino, ufhp->ufid_gen, flags, 20485952c86cSKonstantin Belousov vpp, 0)); 20495952c86cSKonstantin Belousov } 20505952c86cSKonstantin Belousov 2051886fd36eSKirk McKusick /* 2052886fd36eSKirk McKusick * Return a vnode from a mounted filesystem for inode with specified 2053886fd36eSKirk McKusick * generation number. Return ESTALE if the inode with given generation 2054886fd36eSKirk McKusick * number no longer exists on that filesystem. 2055886fd36eSKirk McKusick */ 20565952c86cSKonstantin Belousov int 2057064e6b43SKirk McKusick ffs_inotovp(struct mount *mp, 2058064e6b43SKirk McKusick ino_t ino, 2059831b1ff7SKirk McKusick uint64_t gen, 2060064e6b43SKirk McKusick int lflags, 2061064e6b43SKirk McKusick struct vnode **vpp, 2062064e6b43SKirk McKusick int ffs_flags) 20635952c86cSKonstantin Belousov { 2064abe53f7eSKirk McKusick struct ufsmount *ump; 20655952c86cSKonstantin Belousov struct vnode *nvp; 206689fd61d9SKonstantin Belousov struct inode *ip; 2067df8bae1dSRodney W. Grimes struct fs *fs; 2068abe53f7eSKirk McKusick struct cg *cgp; 2069abe53f7eSKirk McKusick struct buf *bp; 2070831b1ff7SKirk McKusick uint64_t cg; 2071df8bae1dSRodney W. 
Grimes 2072abe53f7eSKirk McKusick ump = VFSTOUFS(mp); 2073abe53f7eSKirk McKusick fs = ump->um_fs; 207489fd61d9SKonstantin Belousov *vpp = NULL; 207589fd61d9SKonstantin Belousov 20761dc349abSEd Maste if (ino < UFS_ROOTINO || ino >= fs->fs_ncg * fs->fs_ipg) 2077df8bae1dSRodney W. Grimes return (ESTALE); 20785952c86cSKonstantin Belousov 2079abe53f7eSKirk McKusick /* 2080abe53f7eSKirk McKusick * Need to check if inode is initialized because UFS2 does lazy 2081abe53f7eSKirk McKusick * initialization and nfs_fhtovp can offer arbitrary inode numbers. 2082abe53f7eSKirk McKusick */ 20835952c86cSKonstantin Belousov if (fs->fs_magic == FS_UFS2_MAGIC) { 2084abe53f7eSKirk McKusick cg = ino_to_cg(fs, ino); 2085886fd36eSKirk McKusick if (ffs_getcg(fs, ump->um_devvp, cg, 0, &bp, &cgp) != 0) 2086886fd36eSKirk McKusick return (ESTALE); 20879c4f551eSKirk McKusick if (ino >= cg * fs->fs_ipg + cgp->cg_initediblk) { 2088abe53f7eSKirk McKusick brelse(bp); 2089abe53f7eSKirk McKusick return (ESTALE); 2090abe53f7eSKirk McKusick } 2091abe53f7eSKirk McKusick brelse(bp); 20925952c86cSKonstantin Belousov } 20935952c86cSKonstantin Belousov 2094886fd36eSKirk McKusick if (ffs_vgetf(mp, ino, lflags, &nvp, ffs_flags) != 0) 2095886fd36eSKirk McKusick return (ESTALE); 209689fd61d9SKonstantin Belousov 209789fd61d9SKonstantin Belousov ip = VTOI(nvp); 209889fd61d9SKonstantin Belousov if (ip->i_mode == 0 || ip->i_gen != gen || ip->i_effnlink <= 0) { 209989fd61d9SKonstantin Belousov if (ip->i_mode == 0) 210089fd61d9SKonstantin Belousov vgone(nvp); 210189fd61d9SKonstantin Belousov vput(nvp); 210289fd61d9SKonstantin Belousov return (ESTALE); 210389fd61d9SKonstantin Belousov } 210489fd61d9SKonstantin Belousov 210589fd61d9SKonstantin Belousov vnode_create_vobject(nvp, DIP(ip, i_size), curthread); 210689fd61d9SKonstantin Belousov *vpp = nvp; 210789fd61d9SKonstantin Belousov return (0); 2108df8bae1dSRodney W. Grimes } 2109df8bae1dSRodney W. Grimes 2110df8bae1dSRodney W. 
Grimes /* 21115346934fSIan Dowse * Initialize the filesystem. 2112996c772fSJohn Dyson */ 2113996c772fSJohn Dyson static int 2114064e6b43SKirk McKusick ffs_init(struct vfsconf *vfsp) 2115996c772fSJohn Dyson { 2116996c772fSJohn Dyson 21171848286aSEdward Tomasz Napierala ffs_susp_initialize(); 2118b1897c19SJulian Elischer softdep_initialize(); 2119996c772fSJohn Dyson return (ufs_init(vfsp)); 2120996c772fSJohn Dyson } 2121996c772fSJohn Dyson 2122996c772fSJohn Dyson /* 21235346934fSIan Dowse * Undo the work of ffs_init(). 21245346934fSIan Dowse */ 21255346934fSIan Dowse static int 2126064e6b43SKirk McKusick ffs_uninit(struct vfsconf *vfsp) 21275346934fSIan Dowse { 21285346934fSIan Dowse int ret; 21295346934fSIan Dowse 21305346934fSIan Dowse ret = ufs_uninit(vfsp); 21315346934fSIan Dowse softdep_uninitialize(); 21321848286aSEdward Tomasz Napierala ffs_susp_uninitialize(); 2133d79ff54bSChuck Silvers taskqueue_drain_all(taskqueue_thread); 21345346934fSIan Dowse return (ret); 21355346934fSIan Dowse } 21365346934fSIan Dowse 21375346934fSIan Dowse /* 2138dffce215SKirk McKusick * Structure used to pass information from ffs_sbupdate to its 2139dffce215SKirk McKusick * helper routine ffs_use_bwrite. 2140dffce215SKirk McKusick */ 2141dffce215SKirk McKusick struct devfd { 2142dffce215SKirk McKusick struct ufsmount *ump; 2143dffce215SKirk McKusick struct buf *sbbp; 2144dffce215SKirk McKusick int waitfor; 2145dffce215SKirk McKusick int suspended; 2146dffce215SKirk McKusick int error; 2147dffce215SKirk McKusick }; 2148dffce215SKirk McKusick 2149dffce215SKirk McKusick /* 2150df8bae1dSRodney W. Grimes * Write a superblock and associated information back to disk. 2151df8bae1dSRodney W. Grimes */ 21521a60c7fcSPawel Jakub Dawidek int 2153064e6b43SKirk McKusick ffs_sbupdate(struct ufsmount *ump, int waitfor, int suspended) 2154df8bae1dSRodney W. 
Grimes { 2155dffce215SKirk McKusick struct fs *fs; 21563ba649d7SJeff Roberson struct buf *sbbp; 2157dffce215SKirk McKusick struct devfd devfd; 2158df8bae1dSRodney W. Grimes 2159dffce215SKirk McKusick fs = ump->um_fs; 216074f3809aSKirk McKusick if (fs->fs_ronly == 1 && 2161927a12aeSKirk McKusick (ump->um_mountp->mnt_flag & (MNT_RDONLY | MNT_UPDATE)) != 21629acea164SRobert Wing (MNT_RDONLY | MNT_UPDATE)) 216374f3809aSKirk McKusick panic("ffs_sbupdate: write read-only filesystem"); 2164996c772fSJohn Dyson /* 21653ba649d7SJeff Roberson * We use the superblock's buf to serialize calls to ffs_sbupdate(). 21663ba649d7SJeff Roberson */ 2167927a12aeSKirk McKusick sbbp = getblk(ump->um_devvp, btodb(fs->fs_sblockloc), 2168927a12aeSKirk McKusick (int)fs->fs_sbsize, 0, 0, 0); 21693ba649d7SJeff Roberson /* 2170dffce215SKirk McKusick * Initialize info needed for write function. 2171996c772fSJohn Dyson */ 2172dffce215SKirk McKusick devfd.ump = ump; 2173dffce215SKirk McKusick devfd.sbbp = sbbp; 2174dffce215SKirk McKusick devfd.waitfor = waitfor; 2175dffce215SKirk McKusick devfd.suspended = suspended; 2176dffce215SKirk McKusick devfd.error = 0; 2177dffce215SKirk McKusick return (ffs_sbput(&devfd, fs, fs->fs_sblockloc, ffs_use_bwrite)); 2178dffce215SKirk McKusick } 2179dffce215SKirk McKusick 2180dffce215SKirk McKusick /* 2181dffce215SKirk McKusick * Write function for use by filesystem-layer routines. 
2182dffce215SKirk McKusick */ 2183dffce215SKirk McKusick static int 2184dffce215SKirk McKusick ffs_use_bwrite(void *devfd, off_t loc, void *buf, int size) 2185dffce215SKirk McKusick { 2186dffce215SKirk McKusick struct devfd *devfdp; 2187dffce215SKirk McKusick struct ufsmount *ump; 2188dffce215SKirk McKusick struct buf *bp; 2189dffce215SKirk McKusick struct fs *fs; 2190dffce215SKirk McKusick int error; 2191dffce215SKirk McKusick 2192dffce215SKirk McKusick devfdp = devfd; 2193dffce215SKirk McKusick ump = devfdp->ump; 2194dffce215SKirk McKusick fs = ump->um_fs; 2195dffce215SKirk McKusick /* 2196dffce215SKirk McKusick * Writing the superblock summary information. 2197dffce215SKirk McKusick */ 2198dffce215SKirk McKusick if (loc != fs->fs_sblockloc) { 2199dffce215SKirk McKusick bp = getblk(ump->um_devvp, btodb(loc), size, 0, 0, 0); 2200831b1ff7SKirk McKusick bcopy(buf, bp->b_data, (uint64_t)size); 2201dffce215SKirk McKusick if (devfdp->suspended) 2202791dd2faSTor Egge bp->b_flags |= B_VALIDSUSPWRT; 2203dffce215SKirk McKusick if (devfdp->waitfor != MNT_WAIT) 2204df8bae1dSRodney W. Grimes bawrite(bp); 22058aef1712SMatthew Dillon else if ((error = bwrite(bp)) != 0) 2206dffce215SKirk McKusick devfdp->error = error; 2207dffce215SKirk McKusick return (0); 2208df8bae1dSRodney W. Grimes } 2209996c772fSJohn Dyson /* 2210dffce215SKirk McKusick * Writing the superblock itself. We need to do special checks for it. 
2211996c772fSJohn Dyson */ 2212dffce215SKirk McKusick bp = devfdp->sbbp; 2213d79ff54bSChuck Silvers if (ffs_fsfail_cleanup(ump, devfdp->error)) 2214d79ff54bSChuck Silvers devfdp->error = 0; 2215dffce215SKirk McKusick if (devfdp->error != 0) { 2216dffce215SKirk McKusick brelse(bp); 2217dffce215SKirk McKusick return (devfdp->error); 22183ba649d7SJeff Roberson } 221931574422SKirk McKusick if (fs->fs_magic == FS_UFS1_MAGIC && fs->fs_sblockloc != SBLOCK_UFS1 && 2220e9838c11SJohn-Mark Gurney (fs->fs_old_flags & FS_FLAGS_UPDATED) == 0) { 2221b60ee81eSKirk McKusick printf("WARNING: %s: correcting fs_sblockloc from %jd to %d\n", 2222fa5d33e2SKirk McKusick fs->fs_fsmnt, fs->fs_sblockloc, SBLOCK_UFS1); 2223fa5d33e2SKirk McKusick fs->fs_sblockloc = SBLOCK_UFS1; 2224fa5d33e2SKirk McKusick } 222531574422SKirk McKusick if (fs->fs_magic == FS_UFS2_MAGIC && fs->fs_sblockloc != SBLOCK_UFS2 && 2226e9838c11SJohn-Mark Gurney (fs->fs_old_flags & FS_FLAGS_UPDATED) == 0) { 2227b60ee81eSKirk McKusick printf("WARNING: %s: correcting fs_sblockloc from %jd to %d\n", 2228fa5d33e2SKirk McKusick fs->fs_fsmnt, fs->fs_sblockloc, SBLOCK_UFS2); 2229fa5d33e2SKirk McKusick fs->fs_sblockloc = SBLOCK_UFS2; 2230fa5d33e2SKirk McKusick } 2231519e3c3bSKirk McKusick if (MOUNTEDSOFTDEP(ump->um_mountp)) 2232927a12aeSKirk McKusick softdep_setup_sbupdate(ump, (struct fs *)bp->b_data, bp); 22334ac2df8fSKonstantin Belousov UFS_LOCK(ump); 2234831b1ff7SKirk McKusick bcopy((caddr_t)fs, bp->b_data, (uint64_t)fs->fs_sbsize); 22354ac2df8fSKonstantin Belousov UFS_UNLOCK(ump); 22369454b4fdSKirk McKusick fs = (struct fs *)bp->b_data; 2237ca7c2d2eSKonstantin Belousov fs->fs_fmod = 0; 22389454b4fdSKirk McKusick ffs_oldfscompat_write(fs, ump); 223993440bbeSKirk McKusick fs->fs_si = NULL; 224034816cb9SKirk McKusick /* Recalculate the superblock hash */ 22419454b4fdSKirk McKusick fs->fs_ckhash = ffs_calc_sbhash(fs); 2242dffce215SKirk McKusick if (devfdp->suspended) 2243791dd2faSTor Egge bp->b_flags |= B_VALIDSUSPWRT; 
2244dffce215SKirk McKusick if (devfdp->waitfor != MNT_WAIT) 2245996c772fSJohn Dyson bawrite(bp); 22468aef1712SMatthew Dillon else if ((error = bwrite(bp)) != 0) 2247dffce215SKirk McKusick devfdp->error = error; 2248dffce215SKirk McKusick return (devfdp->error); 2249df8bae1dSRodney W. Grimes } 2250d6fe88e4SPoul-Henning Kamp 2251d6fe88e4SPoul-Henning Kamp static int 2252d6fe88e4SPoul-Henning Kamp ffs_extattrctl(struct mount *mp, int cmd, struct vnode *filename_vp, 2253dfd233edSAttilio Rao int attrnamespace, const char *attrname) 2254d6fe88e4SPoul-Henning Kamp { 2255d6fe88e4SPoul-Henning Kamp 2256d6fe88e4SPoul-Henning Kamp #ifdef UFS_EXTATTR 2257d6fe88e4SPoul-Henning Kamp return (ufs_extattrctl(mp, cmd, filename_vp, attrnamespace, 2258dfd233edSAttilio Rao attrname)); 2259d6fe88e4SPoul-Henning Kamp #else 2260d6fe88e4SPoul-Henning Kamp return (vfs_stdextattrctl(mp, cmd, filename_vp, attrnamespace, 2261dfd233edSAttilio Rao attrname)); 2262d6fe88e4SPoul-Henning Kamp #endif 2263d6fe88e4SPoul-Henning Kamp } 2264975512a9SPoul-Henning Kamp 2265975512a9SPoul-Henning Kamp static void 2266975512a9SPoul-Henning Kamp ffs_ifree(struct ufsmount *ump, struct inode *ip) 2267975512a9SPoul-Henning Kamp { 2268975512a9SPoul-Henning Kamp 226936329289STim J. Robbins if (ump->um_fstype == UFS1 && ip->i_din1 != NULL) 2270aa4d7a8aSPoul-Henning Kamp uma_zfree(uma_ufs1, ip->i_din1); 227136329289STim J. Robbins else if (ip->i_din2 != NULL) 22728d721e87STim J. 
Robbins uma_zfree(uma_ufs2, ip->i_din2); 22739d5a594fSMateusz Guzik uma_zfree_smr(uma_inode, ip); 2274975512a9SPoul-Henning Kamp } 22756e77a041SPoul-Henning Kamp 2276dd19a799SPoul-Henning Kamp static int dobkgrdwrite = 1; 2277dd19a799SPoul-Henning Kamp SYSCTL_INT(_debug, OID_AUTO, dobkgrdwrite, CTLFLAG_RW, &dobkgrdwrite, 0, 2278dd19a799SPoul-Henning Kamp "Do background writes (honoring the BV_BKGRDWRITE flag)?"); 2279dd19a799SPoul-Henning Kamp 2280dd19a799SPoul-Henning Kamp /* 2281dd19a799SPoul-Henning Kamp * Complete a background write started from bwrite. 2282dd19a799SPoul-Henning Kamp */ 2283dd19a799SPoul-Henning Kamp static void 2284dd19a799SPoul-Henning Kamp ffs_backgroundwritedone(struct buf *bp) 2285dd19a799SPoul-Henning Kamp { 2286204ec66dSJeff Roberson struct bufobj *bufobj; 2287dd19a799SPoul-Henning Kamp struct buf *origbp; 2288dd19a799SPoul-Henning Kamp 2289d79ff54bSChuck Silvers #ifdef SOFTUPDATES 2290d79ff54bSChuck Silvers if (!LIST_EMPTY(&bp->b_dep) && (bp->b_ioflags & BIO_ERROR) != 0) 2291d79ff54bSChuck Silvers softdep_handle_error(bp); 2292d79ff54bSChuck Silvers #endif 2293d79ff54bSChuck Silvers 2294dd19a799SPoul-Henning Kamp /* 2295dd19a799SPoul-Henning Kamp * Find the original buffer that we are writing. 2296dd19a799SPoul-Henning Kamp */ 2297204ec66dSJeff Roberson bufobj = bp->b_bufobj; 2298204ec66dSJeff Roberson BO_LOCK(bufobj); 2299dd19a799SPoul-Henning Kamp if ((origbp = gbincore(bp->b_bufobj, bp->b_lblkno)) == NULL) 2300dd19a799SPoul-Henning Kamp panic("backgroundwritedone: lost buffer"); 2301b2c3df84SKonstantin Belousov 2302b2c3df84SKonstantin Belousov /* 2303b2c3df84SKonstantin Belousov * We should mark the cylinder group buffer origbp as 2304d79ff54bSChuck Silvers * dirty, to not lose the failed write. 
2305b2c3df84SKonstantin Belousov */ 2306b2c3df84SKonstantin Belousov if ((bp->b_ioflags & BIO_ERROR) != 0) 2307b2c3df84SKonstantin Belousov origbp->b_vflags |= BV_BKGRDERR; 2308204ec66dSJeff Roberson BO_UNLOCK(bufobj); 2309dd19a799SPoul-Henning Kamp /* 2310dd19a799SPoul-Henning Kamp * Process dependencies then return any unfinished ones. 2311dd19a799SPoul-Henning Kamp */ 2312b2c3df84SKonstantin Belousov if (!LIST_EMPTY(&bp->b_dep) && (bp->b_ioflags & BIO_ERROR) == 0) 2313dd19a799SPoul-Henning Kamp buf_complete(bp); 2314dd19a799SPoul-Henning Kamp #ifdef SOFTUPDATES 231504533fc6SXin LI if (!LIST_EMPTY(&bp->b_dep)) 2316dd19a799SPoul-Henning Kamp softdep_move_dependencies(bp, origbp); 2317dd19a799SPoul-Henning Kamp #endif 2318dd19a799SPoul-Henning Kamp /* 2319204ec66dSJeff Roberson * This buffer is marked B_NOCACHE so when it is released 2320bf0db193SKonstantin Belousov * by biodone it will be tossed. Clear B_IOSTARTED in case of error. 2321dd19a799SPoul-Henning Kamp */ 2322dd19a799SPoul-Henning Kamp bp->b_flags |= B_NOCACHE; 2323bf0db193SKonstantin Belousov bp->b_flags &= ~(B_CACHE | B_IOSTARTED); 2324377f88fbSKonstantin Belousov pbrelvp(bp); 2325b2c3df84SKonstantin Belousov 2326b2c3df84SKonstantin Belousov /* 2327b2c3df84SKonstantin Belousov * Prevent brelse() from trying to keep and re-dirtying bp on 2328b2c3df84SKonstantin Belousov * errors. It causes b_bufobj dereference in 2329b2c3df84SKonstantin Belousov * bdirty()/reassignbuf(), and b_bufobj was cleared in 2330b2c3df84SKonstantin Belousov * pbrelvp() above. 2331b2c3df84SKonstantin Belousov */ 2332b2c3df84SKonstantin Belousov if ((bp->b_ioflags & BIO_ERROR) != 0) 2333b2c3df84SKonstantin Belousov bp->b_flags |= B_INVAL; 2334dd19a799SPoul-Henning Kamp bufdone(bp); 2335204ec66dSJeff Roberson BO_LOCK(bufobj); 2336dd19a799SPoul-Henning Kamp /* 2337dd19a799SPoul-Henning Kamp * Clear the BV_BKGRDINPROG flag in the original buffer 2338dd19a799SPoul-Henning Kamp * and awaken it if it is waiting for the write to complete. 
2339dd19a799SPoul-Henning Kamp * If BV_BKGRDINPROG is not set in the original buffer it must 2340dd19a799SPoul-Henning Kamp * have been released and re-instantiated - which is not legal. 2341dd19a799SPoul-Henning Kamp */ 2342dd19a799SPoul-Henning Kamp KASSERT((origbp->b_vflags & BV_BKGRDINPROG), 2343dd19a799SPoul-Henning Kamp ("backgroundwritedone: lost buffer2")); 2344dd19a799SPoul-Henning Kamp origbp->b_vflags &= ~BV_BKGRDINPROG; 2345dd19a799SPoul-Henning Kamp if (origbp->b_vflags & BV_BKGRDWAIT) { 2346dd19a799SPoul-Henning Kamp origbp->b_vflags &= ~BV_BKGRDWAIT; 2347dd19a799SPoul-Henning Kamp wakeup(&origbp->b_xflags); 2348dd19a799SPoul-Henning Kamp } 2349204ec66dSJeff Roberson BO_UNLOCK(bufobj); 2350dd19a799SPoul-Henning Kamp } 2351dd19a799SPoul-Henning Kamp 2352dd19a799SPoul-Henning Kamp /* 2353dd19a799SPoul-Henning Kamp * Write, release buffer on completion. (Done by iodone 2354dd19a799SPoul-Henning Kamp * if async). Do not bother writing anything if the buffer 2355dd19a799SPoul-Henning Kamp * is invalid. 2356dd19a799SPoul-Henning Kamp * 2357dd19a799SPoul-Henning Kamp * Note that we set B_CACHE here, indicating that buffer is 2358dd19a799SPoul-Henning Kamp * fully valid and thus cacheable. This is true even of NFS 2359dd19a799SPoul-Henning Kamp * now so we set it generally. This could be set either here 2360dd19a799SPoul-Henning Kamp * or in biodone() since the I/O is synchronous. We put it 2361dd19a799SPoul-Henning Kamp * here. 
2362dd19a799SPoul-Henning Kamp */ 2363dd19a799SPoul-Henning Kamp static int 2364dd19a799SPoul-Henning Kamp ffs_bufwrite(struct buf *bp) 2365dd19a799SPoul-Henning Kamp { 2366dd19a799SPoul-Henning Kamp struct buf *newbp; 236747806d1bSKirk McKusick struct cg *cgp; 2368dd19a799SPoul-Henning Kamp 2369dd19a799SPoul-Henning Kamp CTR3(KTR_BUF, "bufwrite(%p) vp %p flags %X", bp, bp->b_vp, bp->b_flags); 2370dd19a799SPoul-Henning Kamp if (bp->b_flags & B_INVAL) { 2371dd19a799SPoul-Henning Kamp brelse(bp); 2372dd19a799SPoul-Henning Kamp return (0); 2373dd19a799SPoul-Henning Kamp } 2374dd19a799SPoul-Henning Kamp 2375d638e093SAttilio Rao if (!BUF_ISLOCKED(bp)) 2376dd19a799SPoul-Henning Kamp panic("bufwrite: buffer is not busy???"); 2377dd19a799SPoul-Henning Kamp /* 2378dd19a799SPoul-Henning Kamp * If a background write is already in progress, delay 2379dd19a799SPoul-Henning Kamp * writing this block if it is asynchronous. Otherwise 2380dd19a799SPoul-Henning Kamp * wait for the background write to complete. 
2381dd19a799SPoul-Henning Kamp */ 2382dd19a799SPoul-Henning Kamp BO_LOCK(bp->b_bufobj); 2383dd19a799SPoul-Henning Kamp if (bp->b_vflags & BV_BKGRDINPROG) { 2384dd19a799SPoul-Henning Kamp if (bp->b_flags & B_ASYNC) { 2385dd19a799SPoul-Henning Kamp BO_UNLOCK(bp->b_bufobj); 2386dd19a799SPoul-Henning Kamp bdwrite(bp); 2387dd19a799SPoul-Henning Kamp return (0); 2388dd19a799SPoul-Henning Kamp } 2389dd19a799SPoul-Henning Kamp bp->b_vflags |= BV_BKGRDWAIT; 239022a72260SJeff Roberson msleep(&bp->b_xflags, BO_LOCKPTR(bp->b_bufobj), PRIBIO, 239122a72260SJeff Roberson "bwrbg", 0); 2392dd19a799SPoul-Henning Kamp if (bp->b_vflags & BV_BKGRDINPROG) 2393dd19a799SPoul-Henning Kamp panic("bufwrite: still writing"); 2394dd19a799SPoul-Henning Kamp } 2395b2c3df84SKonstantin Belousov bp->b_vflags &= ~BV_BKGRDERR; 2396dd19a799SPoul-Henning Kamp BO_UNLOCK(bp->b_bufobj); 2397dd19a799SPoul-Henning Kamp 2398dd19a799SPoul-Henning Kamp /* 2399dd19a799SPoul-Henning Kamp * If this buffer is marked for background writing and we 2400dd19a799SPoul-Henning Kamp * do not have to wait for it, make a copy and write the 2401dd19a799SPoul-Henning Kamp * copy so as to leave this buffer ready for further use. 2402dd19a799SPoul-Henning Kamp * 2403dd19a799SPoul-Henning Kamp * This optimization eats a lot of memory. If we have a page 2404dd19a799SPoul-Henning Kamp * or buffer shortfall we can't do it. 
2405dd19a799SPoul-Henning Kamp */ 2406dd19a799SPoul-Henning Kamp if (dobkgrdwrite && (bp->b_xflags & BX_BKGRDWRITE) && 2407dd19a799SPoul-Henning Kamp (bp->b_flags & B_ASYNC) && 2408dd19a799SPoul-Henning Kamp !vm_page_count_severe() && 2409dd19a799SPoul-Henning Kamp !buf_dirty_count_severe()) { 2410dd19a799SPoul-Henning Kamp KASSERT(bp->b_iodone == NULL, 2411dd19a799SPoul-Henning Kamp ("bufwrite: needs chained iodone (%p)", bp->b_iodone)); 2412dd19a799SPoul-Henning Kamp 2413dd19a799SPoul-Henning Kamp /* get a new block */ 2414c1d8b5e8SKonstantin Belousov newbp = geteblk(bp->b_bufsize, GB_NOWAIT_BD); 2415c1d8b5e8SKonstantin Belousov if (newbp == NULL) 2416c1d8b5e8SKonstantin Belousov goto normal_write; 2417dd19a799SPoul-Henning Kamp 2418fade8dd7SJeff Roberson KASSERT(buf_mapped(bp), ("Unmapped cg")); 2419dd19a799SPoul-Henning Kamp memcpy(newbp->b_data, bp->b_data, bp->b_bufsize); 2420dd19a799SPoul-Henning Kamp BO_LOCK(bp->b_bufobj); 2421dd19a799SPoul-Henning Kamp bp->b_vflags |= BV_BKGRDINPROG; 2422dd19a799SPoul-Henning Kamp BO_UNLOCK(bp->b_bufobj); 242375e3597aSKirk McKusick newbp->b_xflags |= 242475e3597aSKirk McKusick (bp->b_xflags & BX_FSPRIV) | BX_BKGRDMARKER; 242526089666SJeff Roberson newbp->b_lblkno = bp->b_lblkno; 2426dd19a799SPoul-Henning Kamp newbp->b_blkno = bp->b_blkno; 2427dd19a799SPoul-Henning Kamp newbp->b_offset = bp->b_offset; 2428dd19a799SPoul-Henning Kamp newbp->b_iodone = ffs_backgroundwritedone; 2429dd19a799SPoul-Henning Kamp newbp->b_flags |= B_ASYNC; 2430dd19a799SPoul-Henning Kamp newbp->b_flags &= ~B_INVAL; 243126089666SJeff Roberson pbgetvp(bp->b_vp, newbp); 2432dd19a799SPoul-Henning Kamp 2433dd19a799SPoul-Henning Kamp #ifdef SOFTUPDATES 2434113db2ddSJeff Roberson /* 2435113db2ddSJeff Roberson * Move over the dependencies. If there are rollbacks, 2436113db2ddSJeff Roberson * leave the parent buffer dirtied as it will need to 2437113db2ddSJeff Roberson * be written again. 
2438113db2ddSJeff Roberson */ 2439113db2ddSJeff Roberson if (LIST_EMPTY(&bp->b_dep) || 2440113db2ddSJeff Roberson softdep_move_dependencies(bp, newbp) == 0) 2441113db2ddSJeff Roberson bundirty(bp); 2442113db2ddSJeff Roberson #else 2443113db2ddSJeff Roberson bundirty(bp); 2444dd19a799SPoul-Henning Kamp #endif 2445dd19a799SPoul-Henning Kamp 2446dd19a799SPoul-Henning Kamp /* 244726089666SJeff Roberson * Initiate write on the copy, release the original. The 244826089666SJeff Roberson * BKGRDINPROG flag prevents it from going away until 244947806d1bSKirk McKusick * the background write completes. We have to recalculate 245047806d1bSKirk McKusick * its check hash in case the buffer gets freed and then 245147806d1bSKirk McKusick * reconstituted from the buffer cache during a later read. 2452dd19a799SPoul-Henning Kamp */ 245347806d1bSKirk McKusick if ((bp->b_xflags & BX_CYLGRP) != 0) { 245447806d1bSKirk McKusick cgp = (struct cg *)bp->b_data; 245547806d1bSKirk McKusick cgp->cg_ckhash = 0; 245647806d1bSKirk McKusick cgp->cg_ckhash = 245747806d1bSKirk McKusick calculate_crc32c(~0L, bp->b_data, bp->b_bcount); 245847806d1bSKirk McKusick } 2459dd19a799SPoul-Henning Kamp bqrelse(bp); 2460dd19a799SPoul-Henning Kamp bp = newbp; 2461113db2ddSJeff Roberson } else 2462113db2ddSJeff Roberson /* Mark the buffer clean */ 2463113db2ddSJeff Roberson bundirty(bp); 2464113db2ddSJeff Roberson 2465dd19a799SPoul-Henning Kamp /* Let the normal bufwrite do the rest for us */ 2466c1d8b5e8SKonstantin Belousov normal_write: 246747806d1bSKirk McKusick /* 246847806d1bSKirk McKusick * If we are writing a cylinder group, update its time. 
246947806d1bSKirk McKusick */ 247047806d1bSKirk McKusick if ((bp->b_xflags & BX_CYLGRP) != 0) { 247147806d1bSKirk McKusick cgp = (struct cg *)bp->b_data; 247247806d1bSKirk McKusick cgp->cg_old_time = cgp->cg_time = time_second; 247347806d1bSKirk McKusick } 24749248a827STor Egge return (bufwrite(bp)); 2475dd19a799SPoul-Henning Kamp } 2476dd19a799SPoul-Henning Kamp 24778dd56505SPoul-Henning Kamp static void 24786e77a041SPoul-Henning Kamp ffs_geom_strategy(struct bufobj *bo, struct buf *bp) 24796e77a041SPoul-Henning Kamp { 2480153910e0SJeff Roberson struct vnode *vp; 24817de3839dSTor Egge struct buf *tbp; 248275e3597aSKirk McKusick int error, nocopy; 24836e77a041SPoul-Henning Kamp 2484f15ccf88SChuck Silvers /* 2485f15ccf88SChuck Silvers * This is the bufobj strategy for the private VCHR vnodes 2486f15ccf88SChuck Silvers * used by FFS to access the underlying storage device. 2487f15ccf88SChuck Silvers * We override the default bufobj strategy and thus bypass 2488f15ccf88SChuck Silvers * VOP_STRATEGY() for these vnodes. 
2489f15ccf88SChuck Silvers */ 24908660b707SMateusz Guzik vp = bo2vnode(bo); 2491f15ccf88SChuck Silvers KASSERT(bp->b_vp == NULL || bp->b_vp->v_type != VCHR || 2492f15ccf88SChuck Silvers bp->b_vp->v_rdev == NULL || 2493f15ccf88SChuck Silvers bp->b_vp->v_rdev->si_mountpt == NULL || 2494f15ccf88SChuck Silvers VFSTOUFS(bp->b_vp->v_rdev->si_mountpt) == NULL || 2495f15ccf88SChuck Silvers vp == VFSTOUFS(bp->b_vp->v_rdev->si_mountpt)->um_devvp, 2496f15ccf88SChuck Silvers ("ffs_geom_strategy() with wrong vp")); 2497153910e0SJeff Roberson if (bp->b_iocmd == BIO_WRITE) { 2498153910e0SJeff Roberson if ((bp->b_flags & B_VALIDSUSPWRT) == 0 && 2499153910e0SJeff Roberson bp->b_vp != NULL && bp->b_vp->v_mount != NULL && 2500153910e0SJeff Roberson (bp->b_vp->v_mount->mnt_kern_flag & MNTK_SUSPENDED) != 0) 2501153910e0SJeff Roberson panic("ffs_geom_strategy: bad I/O"); 2502113db2ddSJeff Roberson nocopy = bp->b_flags & B_NOCOPY; 2503113db2ddSJeff Roberson bp->b_flags &= ~(B_VALIDSUSPWRT | B_NOCOPY); 2504113db2ddSJeff Roberson if ((vp->v_vflag & VV_COPYONWRITE) && nocopy == 0 && 25057de3839dSTor Egge vp->v_rdev->si_snapdata != NULL) { 25067de3839dSTor Egge if ((bp->b_flags & B_CLUSTER) != 0) { 2507868bb88fSTor Egge runningbufwakeup(bp); 25087de3839dSTor Egge TAILQ_FOREACH(tbp, &bp->b_cluster.cluster_head, 25097de3839dSTor Egge b_cluster.cluster_entry) { 25107de3839dSTor Egge error = ffs_copyonwrite(vp, tbp); 25117de3839dSTor Egge if (error != 0 && 2512153910e0SJeff Roberson error != EOPNOTSUPP) { 2513153910e0SJeff Roberson bp->b_error = error; 2514153910e0SJeff Roberson bp->b_ioflags |= BIO_ERROR; 2515e1ef4c29SKonstantin Belousov bp->b_flags &= ~B_BARRIER; 2516153910e0SJeff Roberson bufdone(bp); 2517153910e0SJeff Roberson return; 2518153910e0SJeff Roberson } 2519153910e0SJeff Roberson } 25204efe531cSMark Johnston (void)runningbufclaim(bp, bp->b_bufsize); 25217de3839dSTor Egge } else { 25227de3839dSTor Egge error = ffs_copyonwrite(vp, bp); 25237de3839dSTor Egge if (error != 0 && error != 
EOPNOTSUPP) { 25247de3839dSTor Egge bp->b_error = error; 25257de3839dSTor Egge bp->b_ioflags |= BIO_ERROR; 2526e1ef4c29SKonstantin Belousov bp->b_flags &= ~B_BARRIER; 25277de3839dSTor Egge bufdone(bp); 25287de3839dSTor Egge return; 25297de3839dSTor Egge } 25307de3839dSTor Egge } 25317de3839dSTor Egge } 25327de3839dSTor Egge #ifdef SOFTUPDATES 25337de3839dSTor Egge if ((bp->b_flags & B_CLUSTER) != 0) { 25347de3839dSTor Egge TAILQ_FOREACH(tbp, &bp->b_cluster.cluster_head, 25357de3839dSTor Egge b_cluster.cluster_entry) { 253604533fc6SXin LI if (!LIST_EMPTY(&tbp->b_dep)) 25377de3839dSTor Egge buf_start(tbp); 25387de3839dSTor Egge } 25397de3839dSTor Egge } else { 254004533fc6SXin LI if (!LIST_EMPTY(&bp->b_dep)) 25417de3839dSTor Egge buf_start(bp); 25427de3839dSTor Egge } 25437de3839dSTor Egge 25447de3839dSTor Egge #endif 254575e3597aSKirk McKusick /* 254675e3597aSKirk McKusick * Check for metadata that needs check-hashes and update them. 254775e3597aSKirk McKusick */ 254875e3597aSKirk McKusick switch (bp->b_xflags & BX_FSPRIV) { 254975e3597aSKirk McKusick case BX_CYLGRP: 255075e3597aSKirk McKusick ((struct cg *)bp->b_data)->cg_ckhash = 0; 255175e3597aSKirk McKusick ((struct cg *)bp->b_data)->cg_ckhash = 255275e3597aSKirk McKusick calculate_crc32c(~0L, bp->b_data, bp->b_bcount); 255375e3597aSKirk McKusick break; 255475e3597aSKirk McKusick 255575e3597aSKirk McKusick case BX_SUPERBLOCK: 255675e3597aSKirk McKusick case BX_INODE: 255775e3597aSKirk McKusick case BX_INDIR: 255875e3597aSKirk McKusick case BX_DIR: 255975e3597aSKirk McKusick printf("Check-hash write is unimplemented!!!\n"); 256075e3597aSKirk McKusick break; 256175e3597aSKirk McKusick 256275e3597aSKirk McKusick case 0: 256375e3597aSKirk McKusick break; 256475e3597aSKirk McKusick 256575e3597aSKirk McKusick default: 256675e3597aSKirk McKusick printf("multiple buffer types 0x%b\n", 2567831b1ff7SKirk McKusick (bp->b_xflags & BX_FSPRIV), PRINT_UFS_BUF_XFLAGS); 256875e3597aSKirk McKusick break; 256975e3597aSKirk 
McKusick } 25707de3839dSTor Egge } 2571d79ff54bSChuck Silvers if (bp->b_iocmd != BIO_READ && ffs_enxio_enable) 2572d79ff54bSChuck Silvers bp->b_xflags |= BX_CVTENXIO; 257343920011SPoul-Henning Kamp g_vfs_strategy(bo, bp); 25746e77a041SPoul-Henning Kamp } 257552dfc8d7SKonstantin Belousov 25761848286aSEdward Tomasz Napierala int 25771848286aSEdward Tomasz Napierala ffs_own_mount(const struct mount *mp) 25781848286aSEdward Tomasz Napierala { 25791848286aSEdward Tomasz Napierala 25801848286aSEdward Tomasz Napierala if (mp->mnt_op == &ufs_vfsops) 25811848286aSEdward Tomasz Napierala return (1); 25821848286aSEdward Tomasz Napierala return (0); 25831848286aSEdward Tomasz Napierala } 25841848286aSEdward Tomasz Napierala 258552dfc8d7SKonstantin Belousov #ifdef DDB 2586cf058082SBrooks Davis #ifdef SOFTUPDATES 258752dfc8d7SKonstantin Belousov 2588519e3c3bSKirk McKusick /* defined in ffs_softdep.c */ 2589519e3c3bSKirk McKusick extern void db_print_ffs(struct ufsmount *ump); 259052dfc8d7SKonstantin Belousov 259152dfc8d7SKonstantin Belousov DB_SHOW_COMMAND(ffs, db_show_ffs) 259252dfc8d7SKonstantin Belousov { 259352dfc8d7SKonstantin Belousov struct mount *mp; 259452dfc8d7SKonstantin Belousov struct ufsmount *ump; 259552dfc8d7SKonstantin Belousov 259652dfc8d7SKonstantin Belousov if (have_addr) { 259752dfc8d7SKonstantin Belousov ump = VFSTOUFS((struct mount *)addr); 259852dfc8d7SKonstantin Belousov db_print_ffs(ump); 259952dfc8d7SKonstantin Belousov return; 260052dfc8d7SKonstantin Belousov } 260152dfc8d7SKonstantin Belousov 260252dfc8d7SKonstantin Belousov TAILQ_FOREACH(mp, &mountlist, mnt_list) { 260352dfc8d7SKonstantin Belousov if (!strcmp(mp->mnt_stat.f_fstypename, ufs_vfsconf.vfc_name)) 260452dfc8d7SKonstantin Belousov db_print_ffs(VFSTOUFS(mp)); 260552dfc8d7SKonstantin Belousov } 260652dfc8d7SKonstantin Belousov } 260752dfc8d7SKonstantin Belousov 2608cf058082SBrooks Davis #endif /* SOFTUPDATES */ 260952dfc8d7SKonstantin Belousov #endif /* DDB */ 2610