160727d8bSWarner Losh /*- 2df8bae1dSRodney W. Grimes * Copyright (c) 1989, 1991, 1993, 1994 3df8bae1dSRodney W. Grimes * The Regents of the University of California. All rights reserved. 4df8bae1dSRodney W. Grimes * 5df8bae1dSRodney W. Grimes * Redistribution and use in source and binary forms, with or without 6df8bae1dSRodney W. Grimes * modification, are permitted provided that the following conditions 7df8bae1dSRodney W. Grimes * are met: 8df8bae1dSRodney W. Grimes * 1. Redistributions of source code must retain the above copyright 9df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer. 10df8bae1dSRodney W. Grimes * 2. Redistributions in binary form must reproduce the above copyright 11df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer in the 12df8bae1dSRodney W. Grimes * documentation and/or other materials provided with the distribution. 13df8bae1dSRodney W. Grimes * 4. Neither the name of the University nor the names of its contributors 14df8bae1dSRodney W. Grimes * may be used to endorse or promote products derived from this software 15df8bae1dSRodney W. Grimes * without specific prior written permission. 16df8bae1dSRodney W. Grimes * 17df8bae1dSRodney W. Grimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 18df8bae1dSRodney W. Grimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 19df8bae1dSRodney W. Grimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 20df8bae1dSRodney W. Grimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 21df8bae1dSRodney W. Grimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 22df8bae1dSRodney W. Grimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 23df8bae1dSRodney W. Grimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 24df8bae1dSRodney W. Grimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 25df8bae1dSRodney W. Grimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 26df8bae1dSRodney W. Grimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 27df8bae1dSRodney W. Grimes * SUCH DAMAGE. 28df8bae1dSRodney W. Grimes * 29996c772fSJohn Dyson * @(#)ffs_vfsops.c 8.31 (Berkeley) 5/20/95 30df8bae1dSRodney W. Grimes */ 31df8bae1dSRodney W. Grimes 32f4636c59SDavid E. O'Brien #include <sys/cdefs.h> 33f4636c59SDavid E. O'Brien __FBSDID("$FreeBSD$"); 34f4636c59SDavid E. O'Brien 3501733a9bSGarrett Wollman #include "opt_quota.h" 36516081f2SRobert Watson #include "opt_ufs.h" 376e77a041SPoul-Henning Kamp #include "opt_ffs.h" 3852dfc8d7SKonstantin Belousov #include "opt_ddb.h" 3901733a9bSGarrett Wollman 40df8bae1dSRodney W. Grimes #include <sys/param.h> 41df8bae1dSRodney W. Grimes #include <sys/systm.h> 42df8bae1dSRodney W. Grimes #include <sys/namei.h> 43acd3428bSRobert Watson #include <sys/priv.h> 44df8bae1dSRodney W. Grimes #include <sys/proc.h> 45c79dff0fSKonstantin Belousov #include <sys/taskqueue.h> 46df8bae1dSRodney W. Grimes #include <sys/kernel.h> 47df8bae1dSRodney W. Grimes #include <sys/vnode.h> 48df8bae1dSRodney W. Grimes #include <sys/mount.h> 499626b608SPoul-Henning Kamp #include <sys/bio.h> 50df8bae1dSRodney W. Grimes #include <sys/buf.h> 5181bca6ddSKATO Takenori #include <sys/conf.h> 523ac4d1efSBruce Evans #include <sys/fcntl.h> 531848286aSEdward Tomasz Napierala #include <sys/ioccom.h> 54df8bae1dSRodney W. Grimes #include <sys/malloc.h> 551b367556SJason Evans #include <sys/mutex.h> 5622a72260SJeff Roberson #include <sys/rwlock.h> 57a18b1f1dSJason Evans 58aed55708SRobert Watson #include <security/mac/mac_framework.h> 59aed55708SRobert Watson 60a64ed089SRobert Watson #include <ufs/ufs/extattr.h> 611a60c7fcSPawel Jakub Dawidek #include <ufs/ufs/gjournal.h> 62df8bae1dSRodney W. Grimes #include <ufs/ufs/quota.h> 63df8bae1dSRodney W. Grimes #include <ufs/ufs/ufsmount.h> 64df8bae1dSRodney W. Grimes #include <ufs/ufs/inode.h> 65df8bae1dSRodney W. Grimes #include <ufs/ufs/ufs_extern.h> 66df8bae1dSRodney W. Grimes 67df8bae1dSRodney W. Grimes #include <ufs/ffs/fs.h> 68df8bae1dSRodney W. Grimes #include <ufs/ffs/ffs_extern.h> 69df8bae1dSRodney W. Grimes 70f6b04d2bSDavid Greenman #include <vm/vm.h> 71aa4d7a8aSPoul-Henning Kamp #include <vm/uma.h> 72f6b04d2bSDavid Greenman #include <vm/vm_page.h> 73f6b04d2bSDavid Greenman 7443920011SPoul-Henning Kamp #include <geom/geom.h> 7543920011SPoul-Henning Kamp #include <geom/geom_vfs.h> 7643920011SPoul-Henning Kamp 7752dfc8d7SKonstantin Belousov #include <ddb/ddb.h> 7852dfc8d7SKonstantin Belousov 79adf41577SPoul-Henning Kamp static uma_zone_t uma_inode, uma_ufs1, uma_ufs2; 8055166637SPoul-Henning Kamp 81975512a9SPoul-Henning Kamp static int ffs_mountfs(struct vnode *, struct mount *, struct thread *); 821c85e6a3SKirk McKusick static void ffs_oldfscompat_read(struct fs *, struct ufsmount *, 831c85e6a3SKirk McKusick ufs2_daddr_t); 84975512a9SPoul-Henning Kamp static void ffs_ifree(struct ufsmount *ump, struct inode *ip); 85a988a5c6SKonstantin Belousov static int ffs_sync_lazy(struct mount *mp); 86a988a5c6SKonstantin Belousov 879bf1a756SPoul-Henning Kamp static vfs_init_t ffs_init; 889bf1a756SPoul-Henning Kamp static vfs_uninit_t ffs_uninit; 89d6fe88e4SPoul-Henning Kamp static vfs_extattrctl_t ffs_extattrctl; 9020a92a18SPoul-Henning Kamp static vfs_cmount_t ffs_cmount; 91adf41577SPoul-Henning Kamp static vfs_unmount_t ffs_unmount; 9220a92a18SPoul-Henning Kamp static vfs_mount_t ffs_mount; 93adf41577SPoul-Henning Kamp static vfs_statfs_t ffs_statfs; 94adf41577SPoul-Henning Kamp static vfs_fhtovp_t ffs_fhtovp; 95adf41577SPoul-Henning Kamp static vfs_sync_t ffs_sync; 96df8bae1dSRodney W. Grimes 97303b270bSEivind Eklund static struct vfsops ufs_vfsops = { 987652131bSPoul-Henning Kamp .vfs_extattrctl = ffs_extattrctl, 997652131bSPoul-Henning Kamp .vfs_fhtovp = ffs_fhtovp, 1007652131bSPoul-Henning Kamp .vfs_init = ffs_init, 10120a92a18SPoul-Henning Kamp .vfs_mount = ffs_mount, 10220a92a18SPoul-Henning Kamp .vfs_cmount = ffs_cmount, 1037652131bSPoul-Henning Kamp .vfs_quotactl = ufs_quotactl, 1047652131bSPoul-Henning Kamp .vfs_root = ufs_root, 1057652131bSPoul-Henning Kamp .vfs_statfs = ffs_statfs, 1067652131bSPoul-Henning Kamp .vfs_sync = ffs_sync, 1077652131bSPoul-Henning Kamp .vfs_uninit = ffs_uninit, 1087652131bSPoul-Henning Kamp .vfs_unmount = ffs_unmount, 1097652131bSPoul-Henning Kamp .vfs_vget = ffs_vget, 1102814d5baSKonstantin Belousov .vfs_susp_clean = process_deferred_inactive, 111df8bae1dSRodney W. Grimes }; 112df8bae1dSRodney W. Grimes 1138994ca3cSBruce Evans VFS_SET(ufs_vfsops, ufs, 0); 1145fe6d2beSPawel Jakub Dawidek MODULE_VERSION(ufs, 1); 115c901836cSGarrett Wollman 1166e77a041SPoul-Henning Kamp static b_strategy_t ffs_geom_strategy; 117dd19a799SPoul-Henning Kamp static b_write_t ffs_bufwrite; 1186e77a041SPoul-Henning Kamp 1196e77a041SPoul-Henning Kamp static struct buf_ops ffs_ops = { 1206e77a041SPoul-Henning Kamp .bop_name = "FFS", 121dd19a799SPoul-Henning Kamp .bop_write = ffs_bufwrite, 1226e77a041SPoul-Henning Kamp .bop_strategy = ffs_geom_strategy, 1236ef8480aSPoul-Henning Kamp .bop_sync = bufsync, 1242cc7d26fSKonstantin Belousov #ifdef NO_FFS_SNAPSHOT 1252cc7d26fSKonstantin Belousov .bop_bdflush = bufbdflush, 1262cc7d26fSKonstantin Belousov #else 1272cc7d26fSKonstantin Belousov .bop_bdflush = ffs_bdflush, 1282cc7d26fSKonstantin Belousov #endif 1296e77a041SPoul-Henning Kamp }; 1306e77a041SPoul-Henning Kamp 1310b962648SAndriy Gapon /* 1320b962648SAndriy Gapon * Note that userquota and groupquota options are not currently used 1330b962648SAndriy Gapon * by UFS/FFS code and generally mount(8) does not pass those options 1340b962648SAndriy Gapon * from userland, but they can be passed by loader(8) via 1350b962648SAndriy Gapon * vfs.root.mountfrom.options. 1360b962648SAndriy Gapon */ 137d952ba1bSJohn Baldwin static const char *ffs_opts[] = { "acls", "async", "noatime", "noclusterr", 1380b962648SAndriy Gapon "noclusterw", "noexec", "export", "force", "from", "groupquota", 139927a12aeSKirk McKusick "multilabel", "nfsv4acls", "fsckpid", "snapshot", "nosuid", "suiddir", 140927a12aeSKirk McKusick "nosymfollow", "sync", "union", "userquota", NULL }; 14120a92a18SPoul-Henning Kamp 1425e8c582aSPoul-Henning Kamp static int 143dfd233edSAttilio Rao ffs_mount(struct mount *mp) 144df8bae1dSRodney W. Grimes { 14520a92a18SPoul-Henning Kamp struct vnode *devvp; 146dfd233edSAttilio Rao struct thread *td; 147f7a3729cSKevin Lo struct ufsmount *ump = NULL; 14805f4ff5dSPoul-Henning Kamp struct fs *fs; 149927a12aeSKirk McKusick pid_t fsckpid = 0; 150f2a2857bSKirk McKusick int error, flags; 151cc672d35SKirk McKusick uint64_t mntorflags; 15215bc6b2bSEdward Tomasz Napierala accmode_t accmode; 1535e8c582aSPoul-Henning Kamp struct nameidata ndp; 15420a92a18SPoul-Henning Kamp char *fspec; 155df8bae1dSRodney W. Grimes 156dfd233edSAttilio Rao td = curthread; 15720a92a18SPoul-Henning Kamp if (vfs_filteropt(mp->mnt_optnew, ffs_opts)) 15820a92a18SPoul-Henning Kamp return (EINVAL); 159aa4d7a8aSPoul-Henning Kamp if (uma_inode == NULL) { 160aa4d7a8aSPoul-Henning Kamp uma_inode = uma_zcreate("FFS inode", 161aa4d7a8aSPoul-Henning Kamp sizeof(struct inode), NULL, NULL, NULL, NULL, 162aa4d7a8aSPoul-Henning Kamp UMA_ALIGN_PTR, 0); 163aa4d7a8aSPoul-Henning Kamp uma_ufs1 = uma_zcreate("FFS1 dinode", 164aa4d7a8aSPoul-Henning Kamp sizeof(struct ufs1_dinode), NULL, NULL, NULL, NULL, 165aa4d7a8aSPoul-Henning Kamp UMA_ALIGN_PTR, 0); 166aa4d7a8aSPoul-Henning Kamp uma_ufs2 = uma_zcreate("FFS2 dinode", 167aa4d7a8aSPoul-Henning Kamp sizeof(struct ufs2_dinode), NULL, NULL, NULL, NULL, 168aa4d7a8aSPoul-Henning Kamp UMA_ALIGN_PTR, 0); 169aa4d7a8aSPoul-Henning Kamp } 1708d02a378SPawel Jakub Dawidek 1710b962648SAndriy Gapon vfs_deleteopt(mp->mnt_optnew, "groupquota"); 1720b962648SAndriy Gapon vfs_deleteopt(mp->mnt_optnew, "userquota"); 1730b962648SAndriy Gapon 17420a92a18SPoul-Henning Kamp fspec = vfs_getopts(mp->mnt_optnew, "from", &error); 17551ac12abSPoul-Henning Kamp if (error) 176f2a2857bSKirk McKusick return (error); 1772b14f991SJulian Elischer 1785da56ddbSTor Egge mntorflags = 0; 17926f59b64SCraig Rodrigues if (vfs_getopt(mp->mnt_optnew, "acls", NULL, NULL) == 0) 1805da56ddbSTor Egge mntorflags |= MNT_ACLS; 18126f59b64SCraig Rodrigues 182fb77e0afSCraig Rodrigues if (vfs_getopt(mp->mnt_optnew, "snapshot", NULL, NULL) == 0) { 1835da56ddbSTor Egge mntorflags |= MNT_SNAPSHOT; 184fb77e0afSCraig Rodrigues /* 185fb77e0afSCraig Rodrigues * Once we have set the MNT_SNAPSHOT flag, do not 186fb77e0afSCraig Rodrigues * persist "snapshot" in the options list. 187fb77e0afSCraig Rodrigues */ 188fb77e0afSCraig Rodrigues vfs_deleteopt(mp->mnt_optnew, "snapshot"); 189fb77e0afSCraig Rodrigues vfs_deleteopt(mp->mnt_opt, "snapshot"); 190fb77e0afSCraig Rodrigues } 19126f59b64SCraig Rodrigues 192927a12aeSKirk McKusick if (vfs_getopt(mp->mnt_optnew, "fsckpid", NULL, NULL) == 0 && 193927a12aeSKirk McKusick vfs_scanopt(mp->mnt_optnew, "fsckpid", "%d", &fsckpid) == 1) { 194927a12aeSKirk McKusick /* 195927a12aeSKirk McKusick * Once we have set the restricted PID, do not 196927a12aeSKirk McKusick * persist "fsckpid" in the options list. 197927a12aeSKirk McKusick */ 198927a12aeSKirk McKusick vfs_deleteopt(mp->mnt_optnew, "fsckpid"); 199927a12aeSKirk McKusick vfs_deleteopt(mp->mnt_opt, "fsckpid"); 200927a12aeSKirk McKusick if (mp->mnt_flag & MNT_UPDATE) { 201927a12aeSKirk McKusick if (VFSTOUFS(mp)->um_fs->fs_ronly == 0 && 202927a12aeSKirk McKusick vfs_flagopt(mp->mnt_optnew, "ro", NULL, 0) == 0) { 203b60ee81eSKirk McKusick vfs_mount_error(mp, 204b60ee81eSKirk McKusick "Checker enable: Must be read-only"); 205927a12aeSKirk McKusick return (EINVAL); 206927a12aeSKirk McKusick } 207927a12aeSKirk McKusick } else if (vfs_flagopt(mp->mnt_optnew, "ro", NULL, 0) == 0) { 208b60ee81eSKirk McKusick vfs_mount_error(mp, 209b60ee81eSKirk McKusick "Checker enable: Must be read-only"); 210927a12aeSKirk McKusick return (EINVAL); 211927a12aeSKirk McKusick } 212927a12aeSKirk McKusick /* Set to -1 if we are done */ 213927a12aeSKirk McKusick if (fsckpid == 0) 214927a12aeSKirk McKusick fsckpid = -1; 215927a12aeSKirk McKusick } 216927a12aeSKirk McKusick 2179340fc72SEdward Tomasz Napierala if (vfs_getopt(mp->mnt_optnew, "nfsv4acls", NULL, NULL) == 0) { 2189340fc72SEdward Tomasz Napierala if (mntorflags & MNT_ACLS) { 219b60ee81eSKirk McKusick vfs_mount_error(mp, 220b60ee81eSKirk McKusick "\"acls\" and \"nfsv4acls\" options " 221b60ee81eSKirk McKusick "are mutually exclusive"); 2229340fc72SEdward Tomasz Napierala return (EINVAL); 2239340fc72SEdward Tomasz Napierala } 2249340fc72SEdward Tomasz Napierala mntorflags |= MNT_NFS4ACLS; 2259340fc72SEdward Tomasz Napierala } 2269340fc72SEdward Tomasz Napierala 2275da56ddbSTor Egge MNT_ILOCK(mp); 22861996181SEdward Tomasz Napierala mp->mnt_flag |= mntorflags; 2295da56ddbSTor Egge MNT_IUNLOCK(mp); 230df8bae1dSRodney W. Grimes /* 231df8bae1dSRodney W. Grimes * If updating, check whether changing from read-only to 232df8bae1dSRodney W. Grimes * read/write; if there is no device name, that's all we do. 233df8bae1dSRodney W. Grimes */ 234df8bae1dSRodney W. Grimes if (mp->mnt_flag & MNT_UPDATE) { 235df8bae1dSRodney W. Grimes ump = VFSTOUFS(mp); 236df8bae1dSRodney W. Grimes fs = ump->um_fs; 23726cf9c3bSPeter Wemm devvp = ump->um_devvp; 238927a12aeSKirk McKusick if (fsckpid == -1 && ump->um_fsckpid > 0) { 239927a12aeSKirk McKusick if ((error = ffs_flushfiles(mp, WRITECLOSE, td)) != 0 || 240927a12aeSKirk McKusick (error = ffs_sbupdate(ump, MNT_WAIT, 0)) != 0) 241927a12aeSKirk McKusick return (error); 242927a12aeSKirk McKusick g_topology_lock(); 243927a12aeSKirk McKusick /* 244927a12aeSKirk McKusick * Return to normal read-only mode. 245927a12aeSKirk McKusick */ 246927a12aeSKirk McKusick error = g_access(ump->um_cp, 0, -1, 0); 247927a12aeSKirk McKusick g_topology_unlock(); 248927a12aeSKirk McKusick ump->um_fsckpid = 0; 249927a12aeSKirk McKusick } 25020a92a18SPoul-Henning Kamp if (fs->fs_ronly == 0 && 25120a92a18SPoul-Henning Kamp vfs_flagopt(mp->mnt_optnew, "ro", NULL, 0)) { 2526fecb4e4SKonstantin Belousov /* 2536fecb4e4SKonstantin Belousov * Flush any dirty data and suspend filesystem. 2546fecb4e4SKonstantin Belousov */ 255f2a2857bSKirk McKusick if ((error = vn_start_write(NULL, &mp, V_WAIT)) != 0) 256f2a2857bSKirk McKusick return (error); 257895b3782SKonstantin Belousov error = vfs_write_suspend_umnt(mp); 258895b3782SKonstantin Belousov if (error != 0) 2599ab73fd1SKirk McKusick return (error); 260cd600596SKirk McKusick /* 261cd600596SKirk McKusick * Check for and optionally get rid of files open 262cd600596SKirk McKusick * for writing. 263cd600596SKirk McKusick */ 264df8bae1dSRodney W. Grimes flags = WRITECLOSE; 265df8bae1dSRodney W. Grimes if (mp->mnt_flag & MNT_FORCE) 266df8bae1dSRodney W. Grimes flags |= FORCECLOSE; 267fddf7baeSKirk McKusick if (MOUNTEDSOFTDEP(mp)) { 268b40ce416SJulian Elischer error = softdep_flushfiles(mp, flags, td); 269b1897c19SJulian Elischer } else { 270b40ce416SJulian Elischer error = ffs_flushfiles(mp, flags, td); 271df8bae1dSRodney W. Grimes } 272f2a2857bSKirk McKusick if (error) { 273ddd6b3fcSKonstantin Belousov vfs_write_resume(mp, 0); 274f2a2857bSKirk McKusick return (error); 275b1897c19SJulian Elischer } 2769ccb939eSKirk McKusick if (fs->fs_pendingblocks != 0 || 2779ccb939eSKirk McKusick fs->fs_pendinginodes != 0) { 278b60ee81eSKirk McKusick printf("WARNING: %s Update error: blocks %jd " 279b60ee81eSKirk McKusick "files %d\n", fs->fs_fsmnt, 2801c85e6a3SKirk McKusick (intmax_t)fs->fs_pendingblocks, 2819ccb939eSKirk McKusick fs->fs_pendinginodes); 2829ccb939eSKirk McKusick fs->fs_pendingblocks = 0; 2839ccb939eSKirk McKusick fs->fs_pendinginodes = 0; 2849ccb939eSKirk McKusick } 2851a6a6610SKirk McKusick if ((fs->fs_flags & (FS_UNCLEAN | FS_NEEDSFSCK)) == 0) 286f2a2857bSKirk McKusick fs->fs_clean = 1; 287791dd2faSTor Egge if ((error = ffs_sbupdate(ump, MNT_WAIT, 0)) != 0) { 288f2a2857bSKirk McKusick fs->fs_ronly = 0; 289f2a2857bSKirk McKusick fs->fs_clean = 0; 290ddd6b3fcSKonstantin Belousov vfs_write_resume(mp, 0); 291f2a2857bSKirk McKusick return (error); 2922b14f991SJulian Elischer } 293fddf7baeSKirk McKusick if (MOUNTEDSOFTDEP(mp)) 2949420dc62SKirk McKusick softdep_unmount(mp); 29543920011SPoul-Henning Kamp g_topology_lock(); 2968795189cSKirk McKusick /* 2978795189cSKirk McKusick * Drop our write and exclusive access. 2988795189cSKirk McKusick */ 2998795189cSKirk McKusick g_access(ump->um_cp, 0, -1, -1); 30043920011SPoul-Henning Kamp g_topology_unlock(); 30120a92a18SPoul-Henning Kamp fs->fs_ronly = 1; 3025da56ddbSTor Egge MNT_ILOCK(mp); 30320a92a18SPoul-Henning Kamp mp->mnt_flag |= MNT_RDONLY; 3045da56ddbSTor Egge MNT_IUNLOCK(mp); 3056fecb4e4SKonstantin Belousov /* 3066fecb4e4SKonstantin Belousov * Allow the writers to note that filesystem 3076fecb4e4SKonstantin Belousov * is ro now. 3086fecb4e4SKonstantin Belousov */ 309ddd6b3fcSKonstantin Belousov vfs_write_resume(mp, 0); 310f2a2857bSKirk McKusick } 311f2a2857bSKirk McKusick if ((mp->mnt_flag & MNT_RELOAD) && 3121848286aSEdward Tomasz Napierala (error = ffs_reload(mp, td, 0)) != 0) 313f2a2857bSKirk McKusick return (error); 31420a92a18SPoul-Henning Kamp if (fs->fs_ronly && 31520a92a18SPoul-Henning Kamp !vfs_flagopt(mp->mnt_optnew, "ro", NULL, 0)) { 316c9b99213SBruce Evans /* 317927a12aeSKirk McKusick * If we are running a checker, do not allow upgrade. 318927a12aeSKirk McKusick */ 319927a12aeSKirk McKusick if (ump->um_fsckpid > 0) { 320b60ee81eSKirk McKusick vfs_mount_error(mp, 321b60ee81eSKirk McKusick "Active checker, cannot upgrade to write"); 322927a12aeSKirk McKusick return (EINVAL); 323927a12aeSKirk McKusick } 324927a12aeSKirk McKusick /* 325c9b99213SBruce Evans * If upgrade to read-write by non-root, then verify 326c9b99213SBruce Evans * that user has necessary permissions on the device. 327c9b99213SBruce Evans */ 328cb05b60aSAttilio Rao vn_lock(devvp, LK_EXCLUSIVE | LK_RETRY); 329acd3428bSRobert Watson error = VOP_ACCESS(devvp, VREAD | VWRITE, 330acd3428bSRobert Watson td->td_ucred, td); 331acd3428bSRobert Watson if (error) 332acd3428bSRobert Watson error = priv_check(td, PRIV_VFS_MOUNT_PERM); 333acd3428bSRobert Watson if (error) { 33422db15c0SAttilio Rao VOP_UNLOCK(devvp, 0); 335c9b99213SBruce Evans return (error); 336c9b99213SBruce Evans } 33722db15c0SAttilio Rao VOP_UNLOCK(devvp, 0); 3387e58bfacSBruce Evans fs->fs_flags &= ~FS_UNCLEAN; 3390922cce6SBruce Evans if (fs->fs_clean == 0) { 3407e58bfacSBruce Evans fs->fs_flags |= FS_UNCLEAN; 341812b1d41SKirk McKusick if ((mp->mnt_flag & MNT_FORCE) || 342113db2ddSJeff Roberson ((fs->fs_flags & 343113db2ddSJeff Roberson (FS_SUJ | FS_NEEDSFSCK)) == 0 && 3441a6a6610SKirk McKusick (fs->fs_flags & FS_DOSOFTDEP))) { 345b60ee81eSKirk McKusick printf("WARNING: %s was not properly " 346b60ee81eSKirk McKusick "dismounted\n", fs->fs_fsmnt); 3470922cce6SBruce Evans } else { 348b60ee81eSKirk McKusick vfs_mount_error(mp, 349b60ee81eSKirk McKusick "R/W mount of %s denied. %s.%s", 350b60ee81eSKirk McKusick fs->fs_fsmnt, 351b60ee81eSKirk McKusick "Filesystem is not clean - run fsck", 352b60ee81eSKirk McKusick (fs->fs_flags & FS_SUJ) == 0 ? "" : 353b60ee81eSKirk McKusick " Forced mount will invalidate" 354b60ee81eSKirk McKusick " journal contents"); 355f2a2857bSKirk McKusick return (EPERM); 3560922cce6SBruce Evans } 3570922cce6SBruce Evans } 35840c340aaSPoul-Henning Kamp g_topology_lock(); 35940c340aaSPoul-Henning Kamp /* 3608795189cSKirk McKusick * Request exclusive write access. 36140c340aaSPoul-Henning Kamp */ 36240c340aaSPoul-Henning Kamp error = g_access(ump->um_cp, 0, 1, 1); 36340c340aaSPoul-Henning Kamp g_topology_unlock(); 36440c340aaSPoul-Henning Kamp if (error) 36540c340aaSPoul-Henning Kamp return (error); 366f2a2857bSKirk McKusick if ((error = vn_start_write(NULL, &mp, V_WAIT)) != 0) 367f2a2857bSKirk McKusick return (error); 368f2a2857bSKirk McKusick fs->fs_ronly = 0; 3695da56ddbSTor Egge MNT_ILOCK(mp); 37020a92a18SPoul-Henning Kamp mp->mnt_flag &= ~MNT_RDONLY; 3715da56ddbSTor Egge MNT_IUNLOCK(mp); 372113db2ddSJeff Roberson fs->fs_mtime = time_second; 37326cf9c3bSPeter Wemm /* check to see if we need to start softdep */ 374f2a2857bSKirk McKusick if ((fs->fs_flags & FS_DOSOFTDEP) && 375a854ed98SJohn Baldwin (error = softdep_mount(devvp, mp, fs, td->td_ucred))){ 376f2a2857bSKirk McKusick vn_finished_write(mp); 377f2a2857bSKirk McKusick return (error); 37826cf9c3bSPeter Wemm } 379113db2ddSJeff Roberson fs->fs_clean = 0; 380113db2ddSJeff Roberson if ((error = ffs_sbupdate(ump, MNT_WAIT, 0)) != 0) { 381113db2ddSJeff Roberson vn_finished_write(mp); 382113db2ddSJeff Roberson return (error); 383113db2ddSJeff Roberson } 384f2a2857bSKirk McKusick if (fs->fs_snapinum[0] != 0) 385f2a2857bSKirk McKusick ffs_snapshot_mount(mp); 386f2a2857bSKirk McKusick vn_finished_write(mp); 3871469eec8SDavid Greenman } 388c11d2981SJulian Elischer /* 389c11d2981SJulian Elischer * Soft updates is incompatible with "async", 390c11d2981SJulian Elischer * so if we are doing softupdates stop the user 391c11d2981SJulian Elischer * from setting the async flag in an update. 392c11d2981SJulian Elischer * Softdep_mount() clears it in an initial mount 393c11d2981SJulian Elischer * or ro->rw remount. 394c11d2981SJulian Elischer */ 395fddf7baeSKirk McKusick if (MOUNTEDSOFTDEP(mp)) { 3965da56ddbSTor Egge /* XXX: Reset too late ? */ 3975da56ddbSTor Egge MNT_ILOCK(mp); 398c11d2981SJulian Elischer mp->mnt_flag &= ~MNT_ASYNC; 3995da56ddbSTor Egge MNT_IUNLOCK(mp); 4005da56ddbSTor Egge } 401df8bae1dSRodney W. Grimes /* 40239cfb239SPawel Jakub Dawidek * Keep MNT_ACLS flag if it is stored in superblock. 40339cfb239SPawel Jakub Dawidek */ 4045da56ddbSTor Egge if ((fs->fs_flags & FS_ACLS) != 0) { 4055da56ddbSTor Egge /* XXX: Set too late ? */ 4065da56ddbSTor Egge MNT_ILOCK(mp); 40739cfb239SPawel Jakub Dawidek mp->mnt_flag |= MNT_ACLS; 4085da56ddbSTor Egge MNT_IUNLOCK(mp); 4095da56ddbSTor Egge } 410cea90362SCraig Rodrigues 4119340fc72SEdward Tomasz Napierala if ((fs->fs_flags & FS_NFS4ACLS) != 0) { 4129340fc72SEdward Tomasz Napierala /* XXX: Set too late ? */ 4139340fc72SEdward Tomasz Napierala MNT_ILOCK(mp); 4149340fc72SEdward Tomasz Napierala mp->mnt_flag |= MNT_NFS4ACLS; 4159340fc72SEdward Tomasz Napierala MNT_IUNLOCK(mp); 4169340fc72SEdward Tomasz Napierala } 417927a12aeSKirk McKusick /* 418927a12aeSKirk McKusick * If this is a request from fsck to clean up the filesystem, 419927a12aeSKirk McKusick * then allow the specified pid to proceed. 420927a12aeSKirk McKusick */ 421927a12aeSKirk McKusick if (fsckpid > 0) { 422927a12aeSKirk McKusick if (ump->um_fsckpid != 0) { 423b60ee81eSKirk McKusick vfs_mount_error(mp, 424b60ee81eSKirk McKusick "Active checker already running on %s", 425927a12aeSKirk McKusick fs->fs_fsmnt); 426927a12aeSKirk McKusick return (EINVAL); 427927a12aeSKirk McKusick } 428fddf7baeSKirk McKusick KASSERT(MOUNTEDSOFTDEP(mp) == 0, 429927a12aeSKirk McKusick ("soft updates enabled on read-only file system")); 430927a12aeSKirk McKusick g_topology_lock(); 431927a12aeSKirk McKusick /* 432927a12aeSKirk McKusick * Request write access. 433927a12aeSKirk McKusick */ 434927a12aeSKirk McKusick error = g_access(ump->um_cp, 0, 1, 0); 435927a12aeSKirk McKusick g_topology_unlock(); 436927a12aeSKirk McKusick if (error) { 437b60ee81eSKirk McKusick vfs_mount_error(mp, 438b60ee81eSKirk McKusick "Checker activation failed on %s", 439927a12aeSKirk McKusick fs->fs_fsmnt); 440927a12aeSKirk McKusick return (error); 441927a12aeSKirk McKusick } 442927a12aeSKirk McKusick ump->um_fsckpid = fsckpid; 443927a12aeSKirk McKusick if (fs->fs_snapinum[0] != 0) 444927a12aeSKirk McKusick ffs_snapshot_mount(mp); 445927a12aeSKirk McKusick fs->fs_mtime = time_second; 446927a12aeSKirk McKusick fs->fs_fmod = 1; 447927a12aeSKirk McKusick fs->fs_clean = 0; 448927a12aeSKirk McKusick (void) ffs_sbupdate(ump, MNT_WAIT, 0); 449927a12aeSKirk McKusick } 4509340fc72SEdward Tomasz Napierala 451f2a2857bSKirk McKusick /* 452f2a2857bSKirk McKusick * If this is a snapshot request, take the snapshot. 453f2a2857bSKirk McKusick */ 454f2a2857bSKirk McKusick if (mp->mnt_flag & MNT_SNAPSHOT) 45520a92a18SPoul-Henning Kamp return (ffs_snapshot(mp, fspec)); 456df8bae1dSRodney W. Grimes } 4572b14f991SJulian Elischer 458df8bae1dSRodney W. Grimes /* 459df8bae1dSRodney W. Grimes * Not an update, or updating the name: look up the name 460e9827c6dSBruce Evans * and verify that it refers to a sensible disk device. 461df8bae1dSRodney W. Grimes */ 462fdedad76SSuleiman Souhlal NDINIT(&ndp, LOOKUP, FOLLOW | LOCKLEAF, UIO_SYSSPACE, fspec, td); 4635e8c582aSPoul-Henning Kamp if ((error = namei(&ndp)) != 0) 464f2a2857bSKirk McKusick return (error); 4655e8c582aSPoul-Henning Kamp NDFREE(&ndp, NDF_ONLY_PNBUF); 4665e8c582aSPoul-Henning Kamp devvp = ndp.ni_vp; 467f2a2857bSKirk McKusick if (!vn_isdisk(devvp, &error)) { 468fdedad76SSuleiman Souhlal vput(devvp); 469f2a2857bSKirk McKusick return (error); 470f2a2857bSKirk McKusick } 471c9b99213SBruce Evans 472c9b99213SBruce Evans /* 473c9b99213SBruce Evans * If mount by non-root, then verify that user has necessary 474c9b99213SBruce Evans * permissions on the device. 475c9b99213SBruce Evans */ 47615bc6b2bSEdward Tomasz Napierala accmode = VREAD; 477c9b99213SBruce Evans if ((mp->mnt_flag & MNT_RDONLY) == 0) 47815bc6b2bSEdward Tomasz Napierala accmode |= VWRITE; 47915bc6b2bSEdward Tomasz Napierala error = VOP_ACCESS(devvp, accmode, td->td_ucred, td); 480acd3428bSRobert Watson if (error) 481acd3428bSRobert Watson error = priv_check(td, PRIV_VFS_MOUNT_PERM); 482acd3428bSRobert Watson if (error) { 483c9b99213SBruce Evans vput(devvp); 484c9b99213SBruce Evans return (error); 485c9b99213SBruce Evans } 486c9b99213SBruce Evans 4872b14f991SJulian Elischer if (mp->mnt_flag & MNT_UPDATE) { 4882b14f991SJulian Elischer /* 489f2a2857bSKirk McKusick * Update only 490f2a2857bSKirk McKusick * 4913e425b96SJulian Elischer * If it's not the same vnode, or at least the same device 4923e425b96SJulian Elischer * then it's not correct. 4932b14f991SJulian Elischer */ 4942b14f991SJulian Elischer 49543920011SPoul-Henning Kamp if (devvp->v_rdev != ump->um_devvp->v_rdev) 496f2a2857bSKirk McKusick error = EINVAL; /* needs translation */ 497fdedad76SSuleiman Souhlal vput(devvp); 498f2a2857bSKirk McKusick if (error) 499f2a2857bSKirk McKusick return (error); 5002b14f991SJulian Elischer } else { 5012b14f991SJulian Elischer /* 502f2a2857bSKirk McKusick * New mount 5032b14f991SJulian Elischer * 504f2a2857bSKirk McKusick * We need the name for the mount point (also used for 505f2a2857bSKirk McKusick * "last mounted on") copied in. If an error occurs, 506f2a2857bSKirk McKusick * the mount point is discarded by the upper level code. 50798cbffd7SKonstantin Belousov * Note that vfs_mount_alloc() populates f_mntonname for us. 508f2a2857bSKirk McKusick */ 509975512a9SPoul-Henning Kamp if ((error = ffs_mountfs(devvp, mp, td)) != 0) { 510f2a2857bSKirk McKusick vrele(devvp); 511f2a2857bSKirk McKusick return (error); 512f2a2857bSKirk McKusick } 513927a12aeSKirk McKusick if (fsckpid > 0) { 514fddf7baeSKirk McKusick KASSERT(MOUNTEDSOFTDEP(mp) == 0, 515927a12aeSKirk McKusick ("soft updates enabled on read-only file system")); 516927a12aeSKirk McKusick ump = VFSTOUFS(mp); 517927a12aeSKirk McKusick fs = ump->um_fs; 518927a12aeSKirk McKusick g_topology_lock(); 519927a12aeSKirk McKusick /* 520927a12aeSKirk McKusick * Request write access. 521927a12aeSKirk McKusick */ 522927a12aeSKirk McKusick error = g_access(ump->um_cp, 0, 1, 0); 523927a12aeSKirk McKusick g_topology_unlock(); 524927a12aeSKirk McKusick if (error) { 525b60ee81eSKirk McKusick printf("WARNING: %s: Checker activation " 526b60ee81eSKirk McKusick "failed\n", fs->fs_fsmnt); 527927a12aeSKirk McKusick } else { 528927a12aeSKirk McKusick ump->um_fsckpid = fsckpid; 529927a12aeSKirk McKusick if (fs->fs_snapinum[0] != 0) 530927a12aeSKirk McKusick ffs_snapshot_mount(mp); 531927a12aeSKirk McKusick fs->fs_mtime = time_second; 532927a12aeSKirk McKusick fs->fs_clean = 0; 533927a12aeSKirk McKusick (void) ffs_sbupdate(ump, MNT_WAIT, 0); 534927a12aeSKirk McKusick } 535927a12aeSKirk McKusick } 536f2a2857bSKirk McKusick } 53720a92a18SPoul-Henning Kamp vfs_mountedfrom(mp, fspec); 538f2a2857bSKirk McKusick return (0); 5392b14f991SJulian Elischer } 5402b14f991SJulian Elischer 541df8bae1dSRodney W. Grimes /* 54220a92a18SPoul-Henning Kamp * Compatibility with old mount system call. 54320a92a18SPoul-Henning Kamp */ 54420a92a18SPoul-Henning Kamp 54520a92a18SPoul-Henning Kamp static int 546cc672d35SKirk McKusick ffs_cmount(struct mntarg *ma, void *data, uint64_t flags) 54720a92a18SPoul-Henning Kamp { 54820a92a18SPoul-Henning Kamp struct ufs_args args; 549d0cc54f3SKonstantin Belousov struct export_args exp; 55020a92a18SPoul-Henning Kamp int error; 55120a92a18SPoul-Henning Kamp 55220a92a18SPoul-Henning Kamp if (data == NULL) 55320a92a18SPoul-Henning Kamp return (EINVAL); 55420a92a18SPoul-Henning Kamp error = copyin(data, &args, sizeof args); 55520a92a18SPoul-Henning Kamp if (error) 55620a92a18SPoul-Henning Kamp return (error); 557d0cc54f3SKonstantin Belousov vfs_oexport_conv(&args.export, &exp); 55820a92a18SPoul-Henning Kamp 55920a92a18SPoul-Henning Kamp ma = mount_argsu(ma, "from", args.fspec, MAXPATHLEN); 560d0cc54f3SKonstantin Belousov ma = mount_arg(ma, "export", &exp, sizeof(exp)); 56120a92a18SPoul-Henning Kamp error = kernel_mount(ma, flags); 56220a92a18SPoul-Henning Kamp 56320a92a18SPoul-Henning Kamp return (error); 56420a92a18SPoul-Henning Kamp } 56520a92a18SPoul-Henning Kamp 56620a92a18SPoul-Henning Kamp /* 567df8bae1dSRodney W. Grimes * Reload all incore data for a filesystem (used after running fsck on 5681848286aSEdward Tomasz Napierala * the root filesystem and finding things to fix). If the 'force' flag 5691848286aSEdward Tomasz Napierala * is 0, the filesystem must be mounted read-only. 570df8bae1dSRodney W. Grimes * 571df8bae1dSRodney W. Grimes * Things to do to update the mount: 572df8bae1dSRodney W. Grimes * 1) invalidate all cached meta-data. 573df8bae1dSRodney W. Grimes * 2) re-read superblock from disk. 574df8bae1dSRodney W. Grimes * 3) re-read summary information from disk. 575df8bae1dSRodney W. Grimes * 4) invalidate all inactive vnodes. 576df426577SKonstantin Belousov * 5) clear MNTK_SUSPEND2 and MNTK_SUSPENDED flags, allowing secondary 577df426577SKonstantin Belousov * writers, if requested. 578df426577SKonstantin Belousov * 6) invalidate all cached file data. 579df426577SKonstantin Belousov * 7) re-read inode data for all active vnodes. 580df8bae1dSRodney W. Grimes */ 5811848286aSEdward Tomasz Napierala int 582df426577SKonstantin Belousov ffs_reload(struct mount *mp, struct thread *td, int flags) 583df8bae1dSRodney W. Grimes { 58482be0a5aSTor Egge struct vnode *vp, *mvp, *devvp; 585df8bae1dSRodney W. Grimes struct inode *ip; 586f55ff3f3SIan Dowse void *space; 587df8bae1dSRodney W. Grimes struct buf *bp; 588996c772fSJohn Dyson struct fs *fs, *newfs; 5893ba649d7SJeff Roberson struct ufsmount *ump; 5901c85e6a3SKirk McKusick ufs2_daddr_t sblockloc; 591df8bae1dSRodney W. Grimes int i, blks, size, error; 592996c772fSJohn Dyson int32_t *lp; 593df8bae1dSRodney W. Grimes 5943ba649d7SJeff Roberson ump = VFSTOUFS(mp); 5951848286aSEdward Tomasz Napierala 5961848286aSEdward Tomasz Napierala MNT_ILOCK(mp); 597df426577SKonstantin Belousov if ((mp->mnt_flag & MNT_RDONLY) == 0 && (flags & FFSR_FORCE) == 0) { 5981848286aSEdward Tomasz Napierala MNT_IUNLOCK(mp); 5991848286aSEdward Tomasz Napierala return (EINVAL); 6001848286aSEdward Tomasz Napierala } 6011848286aSEdward Tomasz Napierala MNT_IUNLOCK(mp); 6021848286aSEdward Tomasz Napierala 603df8bae1dSRodney W. Grimes /* 604df8bae1dSRodney W. Grimes * Step 1: invalidate all cached meta-data. 605df8bae1dSRodney W. Grimes */ 6062b14f991SJulian Elischer devvp = VFSTOUFS(mp)->um_devvp; 607cb05b60aSAttilio Rao vn_lock(devvp, LK_EXCLUSIVE | LK_RETRY); 6080d7935fdSAttilio Rao if (vinvalbuf(devvp, 0, 0, 0) != 0) 609df8bae1dSRodney W. Grimes panic("ffs_reload: dirty1"); 61022db15c0SAttilio Rao VOP_UNLOCK(devvp, 0); 61195e5e988SJohn Dyson 612df8bae1dSRodney W. Grimes /* 613df8bae1dSRodney W. Grimes * Step 2: re-read superblock from disk. 614df8bae1dSRodney W. Grimes */ 6151c85e6a3SKirk McKusick fs = VFSTOUFS(mp)->um_fs; 616ada981b2SKirk McKusick if ((error = bread(devvp, btodb(fs->fs_sblockloc), fs->fs_sbsize, 6171c85e6a3SKirk McKusick NOCRED, &bp)) != 0) 618df8bae1dSRodney W. Grimes return (error); 619996c772fSJohn Dyson newfs = (struct fs *)bp->b_data; 6201c85e6a3SKirk McKusick if ((newfs->fs_magic != FS_UFS1_MAGIC && 6211c85e6a3SKirk McKusick newfs->fs_magic != FS_UFS2_MAGIC) || 6221c85e6a3SKirk McKusick newfs->fs_bsize > MAXBSIZE || 623996c772fSJohn Dyson newfs->fs_bsize < sizeof(struct fs)) { 624df8bae1dSRodney W. Grimes brelse(bp); 625df8bae1dSRodney W. Grimes return (EIO); /* XXX needs translation */ 626df8bae1dSRodney W. Grimes } 627996c772fSJohn Dyson /* 628996c772fSJohn Dyson * Copy pointer fields back into superblock before copying in XXX 629996c772fSJohn Dyson * new superblock. These should really be in the ufsmount. XXX 630996c772fSJohn Dyson * Note that important parameters (eg fs_ncg) are unchanged. 631996c772fSJohn Dyson */ 632f55ff3f3SIan Dowse newfs->fs_csp = fs->fs_csp; 633996c772fSJohn Dyson newfs->fs_maxcluster = fs->fs_maxcluster; 6345d69bac4SIan Dowse newfs->fs_contigdirs = fs->fs_contigdirs; 635143a5346SIan Dowse newfs->fs_active = fs->fs_active; 6361848286aSEdward Tomasz Napierala newfs->fs_ronly = fs->fs_ronly; 6371c85e6a3SKirk McKusick sblockloc = fs->fs_sblockloc; 638996c772fSJohn Dyson bcopy(newfs, fs, (u_int)fs->fs_sbsize); 639df8bae1dSRodney W. Grimes brelse(bp); 640996c772fSJohn Dyson mp->mnt_maxsymlinklen = fs->fs_maxsymlinklen; 6411c85e6a3SKirk McKusick ffs_oldfscompat_read(fs, VFSTOUFS(mp), sblockloc); 6423ba649d7SJeff Roberson UFS_LOCK(ump); 6439ccb939eSKirk McKusick if (fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) { 644b60ee81eSKirk McKusick printf("WARNING: %s: reload pending error: blocks %jd " 645b60ee81eSKirk McKusick "files %d\n", fs->fs_fsmnt, (intmax_t)fs->fs_pendingblocks, 6461c85e6a3SKirk McKusick fs->fs_pendinginodes); 6479ccb939eSKirk McKusick fs->fs_pendingblocks = 0; 6489ccb939eSKirk McKusick fs->fs_pendinginodes = 0; 6499ccb939eSKirk McKusick } 6503ba649d7SJeff Roberson UFS_UNLOCK(ump); 651996c772fSJohn Dyson 652df8bae1dSRodney W. Grimes /* 653df8bae1dSRodney W. Grimes * Step 3: re-read summary information from disk. 654df8bae1dSRodney W. Grimes */ 6552b028c25SEdward Tomasz Napierala size = fs->fs_cssize; 6562b028c25SEdward Tomasz Napierala blks = howmany(size, fs->fs_fsize); 6572b028c25SEdward Tomasz Napierala if (fs->fs_contigsumsize > 0) 6582b028c25SEdward Tomasz Napierala size += fs->fs_ncg * sizeof(int32_t); 6592b028c25SEdward Tomasz Napierala size += fs->fs_ncg * sizeof(u_int8_t); 6602b028c25SEdward Tomasz Napierala free(fs->fs_csp, M_UFSMNT); 6612b028c25SEdward Tomasz Napierala space = malloc((u_long)size, M_UFSMNT, M_WAITOK); 6622b028c25SEdward Tomasz Napierala fs->fs_csp = space; 663df8bae1dSRodney W. Grimes for (i = 0; i < blks; i += fs->fs_frag) { 664df8bae1dSRodney W. Grimes size = fs->fs_bsize; 665df8bae1dSRodney W. Grimes if (i + fs->fs_frag > blks) 666df8bae1dSRodney W. Grimes size = (blks - i) * fs->fs_fsize; 667c9671602SPoul-Henning Kamp error = bread(devvp, fsbtodb(fs, fs->fs_csaddr + i), size, 668c9671602SPoul-Henning Kamp NOCRED, &bp); 669c9671602SPoul-Henning Kamp if (error) 670df8bae1dSRodney W. Grimes return (error); 671f55ff3f3SIan Dowse bcopy(bp->b_data, space, (u_int)size); 672f55ff3f3SIan Dowse space = (char *)space + size; 673df8bae1dSRodney W. Grimes brelse(bp); 674df8bae1dSRodney W. Grimes } 675996c772fSJohn Dyson /* 676996c772fSJohn Dyson * We no longer know anything about clusters per cylinder group. 677996c772fSJohn Dyson */ 678996c772fSJohn Dyson if (fs->fs_contigsumsize > 0) { 67972b8ff1cSEdward Tomasz Napierala fs->fs_maxcluster = lp = space; 680996c772fSJohn Dyson for (i = 0; i < fs->fs_ncg; i++) 681996c772fSJohn Dyson *lp++ = fs->fs_contigsumsize; 68272b8ff1cSEdward Tomasz Napierala space = lp; 683996c772fSJohn Dyson } 68472b8ff1cSEdward Tomasz Napierala size = fs->fs_ncg * sizeof(u_int8_t); 68572b8ff1cSEdward Tomasz Napierala fs->fs_contigdirs = (u_int8_t *)space; 68672b8ff1cSEdward Tomasz Napierala bzero(fs->fs_contigdirs, size); 687df426577SKonstantin Belousov if ((flags & FFSR_UNSUSPEND) != 0) { 688df426577SKonstantin Belousov MNT_ILOCK(mp); 689df426577SKonstantin Belousov mp->mnt_kern_flag &= ~(MNTK_SUSPENDED | MNTK_SUSPEND2); 690df426577SKonstantin Belousov wakeup(&mp->mnt_flag); 691df426577SKonstantin Belousov MNT_IUNLOCK(mp); 692df426577SKonstantin Belousov } 693996c772fSJohn Dyson 694df8bae1dSRodney W. Grimes loop: 69571469bb3SKirk McKusick MNT_VNODE_FOREACH_ALL(vp, mp, mvp) { 696df8bae1dSRodney W. Grimes /* 6971848286aSEdward Tomasz Napierala * Skip syncer vnode. 6981848286aSEdward Tomasz Napierala */ 6991848286aSEdward Tomasz Napierala if (vp->v_type == VNON) { 7001848286aSEdward Tomasz Napierala VI_UNLOCK(vp); 7011848286aSEdward Tomasz Napierala continue; 7021848286aSEdward Tomasz Napierala } 7031848286aSEdward Tomasz Napierala /* 704fe68abe2SJeff Roberson * Step 4: invalidate all cached file data. 705df8bae1dSRodney W. Grimes */ 706b40ce416SJulian Elischer if (vget(vp, LK_EXCLUSIVE | LK_INTERLOCK, td)) { 70771469bb3SKirk McKusick MNT_VNODE_FOREACH_ALL_ABORT(mp, mvp); 708df8bae1dSRodney W. Grimes goto loop; 709996c772fSJohn Dyson } 7100d7935fdSAttilio Rao if (vinvalbuf(vp, 0, 0, 0)) 711df8bae1dSRodney W. Grimes panic("ffs_reload: dirty2"); 712df8bae1dSRodney W. Grimes /* 713fe68abe2SJeff Roberson * Step 5: re-read inode data for all active vnodes. 714df8bae1dSRodney W. Grimes */ 715df8bae1dSRodney W. Grimes ip = VTOI(vp); 716c9671602SPoul-Henning Kamp error = 717df8bae1dSRodney W. Grimes bread(devvp, fsbtodb(fs, ino_to_fsba(fs, ip->i_number)), 718c9671602SPoul-Henning Kamp (int)fs->fs_bsize, NOCRED, &bp); 719c9671602SPoul-Henning Kamp if (error) { 72022db15c0SAttilio Rao VOP_UNLOCK(vp, 0); 72145d45c6cSAlexander Kabaev vrele(vp); 72271469bb3SKirk McKusick MNT_VNODE_FOREACH_ALL_ABORT(mp, mvp); 723df8bae1dSRodney W. Grimes return (error); 724df8bae1dSRodney W. Grimes } 725de6ba7c0SPoul-Henning Kamp ffs_load_inode(bp, ip, fs, ip->i_number); 726b1897c19SJulian Elischer ip->i_effnlink = ip->i_nlink; 727df8bae1dSRodney W. Grimes brelse(bp); 72822db15c0SAttilio Rao VOP_UNLOCK(vp, 0); 729cb9ddc80SAlexander Kabaev vrele(vp); 730df8bae1dSRodney W. Grimes } 731df8bae1dSRodney W. Grimes return (0); 732df8bae1dSRodney W. Grimes } 733df8bae1dSRodney W. Grimes 7341c85e6a3SKirk McKusick /* 7351c85e6a3SKirk McKusick * Possible superblock locations ordered from most to least likely. 7361c85e6a3SKirk McKusick */ 7371c85e6a3SKirk McKusick static int sblock_try[] = SBLOCKSEARCH; 7385819ab3fSKirk McKusick 739df8bae1dSRodney W. Grimes /* 740df8bae1dSRodney W. Grimes * Common code for mount and mountroot 741df8bae1dSRodney W. Grimes */ 742975512a9SPoul-Henning Kamp static int 743975512a9SPoul-Henning Kamp ffs_mountfs(devvp, mp, td) 74405f4ff5dSPoul-Henning Kamp struct vnode *devvp; 745df8bae1dSRodney W. Grimes struct mount *mp; 746b40ce416SJulian Elischer struct thread *td; 747df8bae1dSRodney W. Grimes { 74805f4ff5dSPoul-Henning Kamp struct ufsmount *ump; 749df8bae1dSRodney W. Grimes struct buf *bp; 75005f4ff5dSPoul-Henning Kamp struct fs *fs; 75189c9c53dSPoul-Henning Kamp struct cdev *dev; 752f55ff3f3SIan Dowse void *space; 7531c85e6a3SKirk McKusick ufs2_daddr_t sblockloc; 754f5ef029eSPoul-Henning Kamp int error, i, blks, size, ronly; 755996c772fSJohn Dyson int32_t *lp; 756996c772fSJohn Dyson struct ucred *cred; 75743920011SPoul-Henning Kamp struct g_consumer *cp; 7583bbd6d8aSJeff Roberson struct mount *nmp; 759df8bae1dSRodney W. Grimes 760ee445a69SJohn Baldwin bp = NULL; 761ee445a69SJohn Baldwin ump = NULL; 762a854ed98SJohn Baldwin cred = td ? td->td_ucred : NOCRED; 76343920011SPoul-Henning Kamp ronly = (mp->mnt_flag & MNT_RDONLY) != 0; 764ee445a69SJohn Baldwin 765c70b3cd2SKonstantin Belousov KASSERT(devvp->v_type == VCHR, ("reclaimed devvp")); 766ee445a69SJohn Baldwin dev = devvp->v_rdev; 767c70b3cd2SKonstantin Belousov if (atomic_cmpset_acq_ptr((uintptr_t *)&dev->si_mountpt, 0, 768c70b3cd2SKonstantin Belousov (uintptr_t)mp) == 0) { 769c70b3cd2SKonstantin Belousov VOP_UNLOCK(devvp, 0); 770c70b3cd2SKonstantin Belousov return (EBUSY); 771c70b3cd2SKonstantin Belousov } 77243920011SPoul-Henning Kamp g_topology_lock(); 77343920011SPoul-Henning Kamp error = g_vfs_open(devvp, &cp, "ffs", ronly ? 0 : 1); 77443920011SPoul-Henning Kamp g_topology_unlock(); 775c70b3cd2SKonstantin Belousov if (error != 0) { 776c70b3cd2SKonstantin Belousov atomic_store_rel_ptr((uintptr_t *)&dev->si_mountpt, 0); 77722db15c0SAttilio Rao VOP_UNLOCK(devvp, 0); 778c70b3cd2SKonstantin Belousov return (error); 779c70b3cd2SKonstantin Belousov } 780c70b3cd2SKonstantin Belousov dev_ref(dev); 781c70b3cd2SKonstantin Belousov devvp->v_bufobj.bo_ops = &ffs_ops; 782c70b3cd2SKonstantin Belousov VOP_UNLOCK(devvp, 0); 783c70b3cd2SKonstantin Belousov if (dev->si_iosize_max != 0) 784c70b3cd2SKonstantin Belousov mp->mnt_iosize_max = dev->si_iosize_max; 7851b5464efSPoul-Henning Kamp if (mp->mnt_iosize_max > MAXPHYS) 7861b5464efSPoul-Henning Kamp mp->mnt_iosize_max = MAXPHYS; 78795e5e988SJohn Dyson 7881c85e6a3SKirk McKusick fs = NULL; 7891c85e6a3SKirk McKusick sblockloc = 0; 7901c85e6a3SKirk McKusick /* 7911c85e6a3SKirk McKusick * Try reading the superblock in each of its possible locations. 7921c85e6a3SKirk McKusick */ 7931c85e6a3SKirk McKusick for (i = 0; sblock_try[i] != -1; i++) { 79471ac2d7cSCraig Rodrigues if ((SBLOCKSIZE % cp->provider->sectorsize) != 0) { 79571ac2d7cSCraig Rodrigues error = EINVAL; 79671ac2d7cSCraig Rodrigues vfs_mount_error(mp, 79771ac2d7cSCraig Rodrigues "Invalid sectorsize %d for superblock size %d", 79871ac2d7cSCraig Rodrigues cp->provider->sectorsize, SBLOCKSIZE); 79971ac2d7cSCraig Rodrigues goto out; 80071ac2d7cSCraig Rodrigues } 80171ac2d7cSCraig Rodrigues if ((error = bread(devvp, btodb(sblock_try[i]), SBLOCKSIZE, 8021c85e6a3SKirk McKusick cred, &bp)) != 0) 803df8bae1dSRodney W. Grimes goto out; 804df8bae1dSRodney W. Grimes fs = (struct fs *)bp->b_data; 805ada981b2SKirk McKusick sblockloc = sblock_try[i]; 8061c85e6a3SKirk McKusick if ((fs->fs_magic == FS_UFS1_MAGIC || 8071c85e6a3SKirk McKusick (fs->fs_magic == FS_UFS2_MAGIC && 808ada981b2SKirk McKusick (fs->fs_sblockloc == sblockloc || 809ada981b2SKirk McKusick (fs->fs_old_flags & FS_FLAGS_UPDATED) == 0))) && 8101c85e6a3SKirk McKusick fs->fs_bsize <= MAXBSIZE && 8111c85e6a3SKirk McKusick fs->fs_bsize >= sizeof(struct fs)) 8121c85e6a3SKirk McKusick break; 8131c85e6a3SKirk McKusick brelse(bp); 8141c85e6a3SKirk McKusick bp = NULL; 8151c85e6a3SKirk McKusick } 8161c85e6a3SKirk McKusick if (sblock_try[i] == -1) { 817df8bae1dSRodney W. Grimes error = EINVAL; /* XXX needs translation */ 818df8bae1dSRodney W. Grimes goto out; 819df8bae1dSRodney W. Grimes } 8203f6f17eeSJulian Elischer fs->fs_fmod = 0; 82108e94183SPedro F. Giffuni fs->fs_flags &= ~FS_INDEXDIRS; /* no support for directory indices */ 8220922cce6SBruce Evans fs->fs_flags &= ~FS_UNCLEAN; 8230922cce6SBruce Evans if (fs->fs_clean == 0) { 8240922cce6SBruce Evans fs->fs_flags |= FS_UNCLEAN; 825812b1d41SKirk McKusick if (ronly || (mp->mnt_flag & MNT_FORCE) || 826113db2ddSJeff Roberson ((fs->fs_flags & (FS_SUJ | FS_NEEDSFSCK)) == 0 && 8271a6a6610SKirk McKusick (fs->fs_flags & FS_DOSOFTDEP))) { 82859b3a4ebSDavid E. O'Brien printf("WARNING: %s was not properly dismounted\n", 8290922cce6SBruce Evans fs->fs_fsmnt); 8301469eec8SDavid Greenman } else { 831b60ee81eSKirk McKusick vfs_mount_error(mp, "R/W mount of %s denied. %s%s", 832b60ee81eSKirk McKusick fs->fs_fsmnt, "Filesystem is not clean - run fsck.", 833b60ee81eSKirk McKusick (fs->fs_flags & FS_SUJ) == 0 ? "" : 834b60ee81eSKirk McKusick " Forced mount will invalidate journal contents"); 8351469eec8SDavid Greenman error = EPERM; 8361469eec8SDavid Greenman goto out; 8371469eec8SDavid Greenman } 8381c85e6a3SKirk McKusick if ((fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) && 8391c85e6a3SKirk McKusick (mp->mnt_flag & MNT_FORCE)) { 840b60ee81eSKirk McKusick printf("WARNING: %s: lost blocks %jd files %d\n", 841b60ee81eSKirk McKusick fs->fs_fsmnt, (intmax_t)fs->fs_pendingblocks, 8421c85e6a3SKirk McKusick fs->fs_pendinginodes); 8439ccb939eSKirk McKusick fs->fs_pendingblocks = 0; 8449ccb939eSKirk McKusick fs->fs_pendinginodes = 0; 8459ccb939eSKirk McKusick } 8469ccb939eSKirk McKusick } 8479ccb939eSKirk McKusick if (fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) { 848b60ee81eSKirk McKusick printf("WARNING: %s: mount pending error: blocks %jd " 849b60ee81eSKirk McKusick "files %d\n", fs->fs_fsmnt, (intmax_t)fs->fs_pendingblocks, 8501c85e6a3SKirk McKusick fs->fs_pendinginodes); 8519ccb939eSKirk McKusick fs->fs_pendingblocks = 0; 8529ccb939eSKirk McKusick fs->fs_pendinginodes = 0; 8531469eec8SDavid Greenman } 8541a60c7fcSPawel Jakub Dawidek if ((fs->fs_flags & FS_GJOURNAL) != 0) { 8551a60c7fcSPawel Jakub Dawidek #ifdef UFS_GJOURNAL 8561a60c7fcSPawel Jakub Dawidek /* 8571a60c7fcSPawel Jakub Dawidek * Get journal provider name. 8581a60c7fcSPawel Jakub Dawidek */ 8591a60c7fcSPawel Jakub Dawidek size = 1024; 8601a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider = malloc(size, M_UFSMNT, M_WAITOK); 8611a60c7fcSPawel Jakub Dawidek if (g_io_getattr("GJOURNAL::provider", cp, &size, 8621a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider) == 0) { 8631a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider = realloc(mp->mnt_gjprovider, size, 8641a60c7fcSPawel Jakub Dawidek M_UFSMNT, M_WAITOK); 8651a60c7fcSPawel Jakub Dawidek MNT_ILOCK(mp); 8661a60c7fcSPawel Jakub Dawidek mp->mnt_flag |= MNT_GJOURNAL; 8671a60c7fcSPawel Jakub Dawidek MNT_IUNLOCK(mp); 8681a60c7fcSPawel Jakub Dawidek } else { 869b60ee81eSKirk McKusick printf("WARNING: %s: GJOURNAL flag on fs " 870b60ee81eSKirk McKusick "but no gjournal provider below\n", 8711a60c7fcSPawel Jakub Dawidek mp->mnt_stat.f_mntonname); 8721a60c7fcSPawel Jakub Dawidek free(mp->mnt_gjprovider, M_UFSMNT); 8731a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider = NULL; 8741a60c7fcSPawel Jakub Dawidek } 8751a60c7fcSPawel Jakub Dawidek #else 876b60ee81eSKirk McKusick printf("WARNING: %s: GJOURNAL flag on fs but no " 877b60ee81eSKirk McKusick "UFS_GJOURNAL support\n", mp->mnt_stat.f_mntonname); 8781a60c7fcSPawel Jakub Dawidek #endif 8791a60c7fcSPawel Jakub Dawidek } else { 8801a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider = NULL; 8811a60c7fcSPawel Jakub Dawidek } 882a163d034SWarner Losh ump = malloc(sizeof *ump, M_UFSMNT, M_WAITOK | M_ZERO); 88343920011SPoul-Henning Kamp ump->um_cp = cp; 88443920011SPoul-Henning Kamp ump->um_bo = &devvp->v_bufobj; 8858dd56505SPoul-Henning Kamp ump->um_fs = malloc((u_long)fs->fs_sbsize, M_UFSMNT, M_WAITOK); 8861c85e6a3SKirk McKusick if (fs->fs_magic == FS_UFS1_MAGIC) { 8871c85e6a3SKirk McKusick ump->um_fstype = UFS1; 8881c85e6a3SKirk McKusick ump->um_balloc = ffs_balloc_ufs1; 8891c85e6a3SKirk McKusick } else { 8901c85e6a3SKirk McKusick ump->um_fstype = UFS2; 8911c85e6a3SKirk McKusick ump->um_balloc = ffs_balloc_ufs2; 8921c85e6a3SKirk McKusick } 893cec0f20cSPoul-Henning Kamp ump->um_blkatoff = ffs_blkatoff; 894cec0f20cSPoul-Henning Kamp ump->um_truncate = ffs_truncate; 895987f5696SPoul-Henning Kamp ump->um_update = ffs_update; 896cec0f20cSPoul-Henning Kamp ump->um_valloc = ffs_valloc; 897cec0f20cSPoul-Henning Kamp ump->um_vfree = ffs_vfree; 898975512a9SPoul-Henning Kamp ump->um_ifree = ffs_ifree; 89990446e36SKonstantin Belousov ump->um_rdonly = ffs_rdonly; 90016b1f68dSKonstantin Belousov ump->um_snapgone = ffs_snapgone; 9013ba649d7SJeff Roberson mtx_init(UFS_MTX(ump), "FFS", "FFS Lock", MTX_DEF); 902df8bae1dSRodney W. Grimes bcopy(bp->b_data, ump->um_fs, (u_int)fs->fs_sbsize); 9031c85e6a3SKirk McKusick if (fs->fs_sbsize < SBLOCKSIZE) 904f2a2857bSKirk McKusick bp->b_flags |= B_INVAL | B_NOCACHE; 905df8bae1dSRodney W. Grimes brelse(bp); 906df8bae1dSRodney W. Grimes bp = NULL; 907df8bae1dSRodney W. Grimes fs = ump->um_fs; 9081c85e6a3SKirk McKusick ffs_oldfscompat_read(fs, ump, sblockloc); 909df8bae1dSRodney W. Grimes fs->fs_ronly = ronly; 910996c772fSJohn Dyson size = fs->fs_cssize; 911996c772fSJohn Dyson blks = howmany(size, fs->fs_fsize); 912996c772fSJohn Dyson if (fs->fs_contigsumsize > 0) 913996c772fSJohn Dyson size += fs->fs_ncg * sizeof(int32_t); 914a61ab64aSKirk McKusick size += fs->fs_ncg * sizeof(u_int8_t); 915a163d034SWarner Losh space = malloc((u_long)size, M_UFSMNT, M_WAITOK); 916f55ff3f3SIan Dowse fs->fs_csp = space; 917df8bae1dSRodney W. Grimes for (i = 0; i < blks; i += fs->fs_frag) { 918df8bae1dSRodney W. Grimes size = fs->fs_bsize; 919df8bae1dSRodney W. Grimes if (i + fs->fs_frag > blks) 920df8bae1dSRodney W. Grimes size = (blks - i) * fs->fs_fsize; 9218aef1712SMatthew Dillon if ((error = bread(devvp, fsbtodb(fs, fs->fs_csaddr + i), size, 9228aef1712SMatthew Dillon cred, &bp)) != 0) { 923f55ff3f3SIan Dowse free(fs->fs_csp, M_UFSMNT); 924df8bae1dSRodney W. Grimes goto out; 925df8bae1dSRodney W. Grimes } 926df8bae1dSRodney W. Grimes bcopy(bp->b_data, space, (u_int)size); 927f55ff3f3SIan Dowse space = (char *)space + size; 928df8bae1dSRodney W. Grimes brelse(bp); 929df8bae1dSRodney W. Grimes bp = NULL; 930df8bae1dSRodney W. Grimes } 931996c772fSJohn Dyson if (fs->fs_contigsumsize > 0) { 932f55ff3f3SIan Dowse fs->fs_maxcluster = lp = space; 933996c772fSJohn Dyson for (i = 0; i < fs->fs_ncg; i++) 934996c772fSJohn Dyson *lp++ = fs->fs_contigsumsize; 9354691e9eaSIan Dowse space = lp; 936996c772fSJohn Dyson } 937a61ab64aSKirk McKusick size = fs->fs_ncg * sizeof(u_int8_t); 938a61ab64aSKirk McKusick fs->fs_contigdirs = (u_int8_t *)space; 939a61ab64aSKirk McKusick bzero(fs->fs_contigdirs, size); 940143a5346SIan Dowse fs->fs_active = NULL; 94177465d93SAlfred Perlstein mp->mnt_data = ump; 94268de329eSPoul-Henning Kamp mp->mnt_stat.f_fsid.val[0] = fs->fs_id[0]; 9438f89943eSGuido van Rooij mp->mnt_stat.f_fsid.val[1] = fs->fs_id[1]; 9443bbd6d8aSJeff Roberson nmp = NULL; 94568de329eSPoul-Henning Kamp if (fs->fs_id[0] == 0 || fs->fs_id[1] == 0 || 9463bbd6d8aSJeff Roberson (nmp = vfs_getvfs(&mp->mnt_stat.f_fsid))) { 9473bbd6d8aSJeff Roberson if (nmp) 9483bbd6d8aSJeff Roberson vfs_rel(nmp); 94968de329eSPoul-Henning Kamp vfs_getnewfsid(mp); 9503bbd6d8aSJeff Roberson } 951df8bae1dSRodney W. Grimes mp->mnt_maxsymlinklen = fs->fs_maxsymlinklen; 9525da56ddbSTor Egge MNT_ILOCK(mp); 953cc9d8990SPeter Wemm mp->mnt_flag |= MNT_LOCAL; 9545da56ddbSTor Egge MNT_IUNLOCK(mp); 9555da56ddbSTor Egge if ((fs->fs_flags & FS_MULTILABEL) != 0) { 9567b3f1bbdSTom Rhodes #ifdef MAC 9575da56ddbSTor Egge MNT_ILOCK(mp); 95880830407SRobert Watson mp->mnt_flag |= MNT_MULTILABEL; 9595da56ddbSTor Egge MNT_IUNLOCK(mp); 9607b3f1bbdSTom Rhodes #else 961b60ee81eSKirk McKusick printf("WARNING: %s: multilabel flag on fs but " 962b60ee81eSKirk McKusick "no MAC support\n", mp->mnt_stat.f_mntonname); 9637b3f1bbdSTom Rhodes #endif 9645da56ddbSTor Egge } 9655da56ddbSTor Egge if ((fs->fs_flags & FS_ACLS) != 0) { 9667b3f1bbdSTom Rhodes #ifdef UFS_ACL 9675da56ddbSTor Egge MNT_ILOCK(mp); 9689340fc72SEdward Tomasz Napierala 9699340fc72SEdward Tomasz Napierala if (mp->mnt_flag & MNT_NFS4ACLS) 970b60ee81eSKirk McKusick printf("WARNING: %s: ACLs flag on fs conflicts with " 971b60ee81eSKirk McKusick "\"nfsv4acls\" mount option; option ignored\n", 972b60ee81eSKirk McKusick mp->mnt_stat.f_mntonname); 9739340fc72SEdward Tomasz Napierala mp->mnt_flag &= ~MNT_NFS4ACLS; 97480830407SRobert Watson mp->mnt_flag |= MNT_ACLS; 9759340fc72SEdward Tomasz Napierala 9765da56ddbSTor Egge MNT_IUNLOCK(mp); 9777b3f1bbdSTom Rhodes #else 97859b3a4ebSDavid E. O'Brien printf("WARNING: %s: ACLs flag on fs but no ACLs support\n", 979946478fcSPawel Jakub Dawidek mp->mnt_stat.f_mntonname); 9807b3f1bbdSTom Rhodes #endif 9815da56ddbSTor Egge } 9829340fc72SEdward Tomasz Napierala if ((fs->fs_flags & FS_NFS4ACLS) != 0) { 9839340fc72SEdward Tomasz Napierala #ifdef UFS_ACL 9849340fc72SEdward Tomasz Napierala MNT_ILOCK(mp); 9859340fc72SEdward Tomasz Napierala 9869340fc72SEdward Tomasz Napierala if (mp->mnt_flag & MNT_ACLS) 987b60ee81eSKirk McKusick printf("WARNING: %s: NFSv4 ACLs flag on fs conflicts " 988b60ee81eSKirk McKusick "with \"acls\" mount option; option ignored\n", 989b60ee81eSKirk McKusick mp->mnt_stat.f_mntonname); 9909340fc72SEdward Tomasz Napierala mp->mnt_flag &= ~MNT_ACLS; 9919340fc72SEdward Tomasz Napierala mp->mnt_flag |= MNT_NFS4ACLS; 9929340fc72SEdward Tomasz Napierala 9939340fc72SEdward Tomasz Napierala MNT_IUNLOCK(mp); 9949340fc72SEdward Tomasz Napierala #else 995b60ee81eSKirk McKusick printf("WARNING: %s: NFSv4 ACLs flag on fs but no " 996b60ee81eSKirk McKusick "ACLs support\n", mp->mnt_stat.f_mntonname); 9979340fc72SEdward Tomasz Napierala #endif 9989340fc72SEdward Tomasz Napierala } 9998c2a54deSKonstantin Belousov if ((fs->fs_flags & FS_TRIM) != 0) { 10008c2a54deSKonstantin Belousov size = sizeof(int); 10018c2a54deSKonstantin Belousov if (g_io_getattr("GEOM::candelete", cp, &size, 10028c2a54deSKonstantin Belousov &ump->um_candelete) == 0) { 10038c2a54deSKonstantin Belousov if (!ump->um_candelete) 1004b60ee81eSKirk McKusick printf("WARNING: %s: TRIM flag on fs but disk " 1005b60ee81eSKirk McKusick "does not support TRIM\n", 10068c2a54deSKonstantin Belousov mp->mnt_stat.f_mntonname); 10078c2a54deSKonstantin Belousov } else { 1008b60ee81eSKirk McKusick printf("WARNING: %s: TRIM flag on fs but disk does " 1009b60ee81eSKirk McKusick "not confirm that it supports TRIM\n", 10108c2a54deSKonstantin Belousov mp->mnt_stat.f_mntonname); 10118c2a54deSKonstantin Belousov ump->um_candelete = 0; 10128c2a54deSKonstantin Belousov } 1013c79dff0fSKonstantin Belousov if (ump->um_candelete) { 1014c79dff0fSKonstantin Belousov ump->um_trim_tq = taskqueue_create("trim", M_WAITOK, 1015c79dff0fSKonstantin Belousov taskqueue_thread_enqueue, &ump->um_trim_tq); 1016c79dff0fSKonstantin Belousov taskqueue_start_threads(&ump->um_trim_tq, 1, PVFS, 1017c79dff0fSKonstantin Belousov "%s trim", mp->mnt_stat.f_mntonname); 1018c79dff0fSKonstantin Belousov } 10198c2a54deSKonstantin Belousov } 10209340fc72SEdward Tomasz Napierala 1021df8bae1dSRodney W. Grimes ump->um_mountp = mp; 1022df8bae1dSRodney W. Grimes ump->um_dev = dev; 1023df8bae1dSRodney W. Grimes ump->um_devvp = devvp; 1024df8bae1dSRodney W. Grimes ump->um_nindir = fs->fs_nindir; 1025df8bae1dSRodney W. Grimes ump->um_bptrtodb = fs->fs_fsbtodb; 1026df8bae1dSRodney W. Grimes ump->um_seqinc = fs->fs_frag; 1027df8bae1dSRodney W. Grimes for (i = 0; i < MAXQUOTAS; i++) 1028df8bae1dSRodney W. Grimes ump->um_quotas[i] = NULLVP; 1029516081f2SRobert Watson #ifdef UFS_EXTATTR 1030a64ed089SRobert Watson ufs_extattr_uepm_init(&ump->um_extattr); 1031a64ed089SRobert Watson #endif 10322b14f991SJulian Elischer /* 10332b14f991SJulian Elischer * Set FS local "last mounted on" information (NULL pad) 10342b14f991SJulian Elischer */ 103593373c42SSuleiman Souhlal bzero(fs->fs_fsmnt, MAXMNTLEN); 103693373c42SSuleiman Souhlal strlcpy(fs->fs_fsmnt, mp->mnt_stat.f_mntonname, MAXMNTLEN); 1037113db2ddSJeff Roberson mp->mnt_stat.f_iosize = fs->fs_bsize; 10382b14f991SJulian Elischer 10392b14f991SJulian Elischer if (mp->mnt_flag & MNT_ROOTFS) { 10402b14f991SJulian Elischer /* 10412b14f991SJulian Elischer * Root mount; update timestamp in mount structure. 10422b14f991SJulian Elischer * this will be used by the common root mount code 10432b14f991SJulian Elischer * to update the system clock. 10442b14f991SJulian Elischer */ 10452b14f991SJulian Elischer mp->mnt_time = fs->fs_time; 10462b14f991SJulian Elischer } 1047996c772fSJohn Dyson 1048996c772fSJohn Dyson if (ronly == 0) { 1049113db2ddSJeff Roberson fs->fs_mtime = time_second; 1050b1897c19SJulian Elischer if ((fs->fs_flags & FS_DOSOFTDEP) && 1051b1897c19SJulian Elischer (error = softdep_mount(devvp, mp, fs, cred)) != 0) { 1052f55ff3f3SIan Dowse free(fs->fs_csp, M_UFSMNT); 1053fddd463dSKonstantin Belousov ffs_flushfiles(mp, FORCECLOSE, td); 1054b1897c19SJulian Elischer goto out; 1055b1897c19SJulian Elischer } 1056f2a2857bSKirk McKusick if (fs->fs_snapinum[0] != 0) 1057f2a2857bSKirk McKusick ffs_snapshot_mount(mp); 1058cf60e8e4SKirk McKusick fs->fs_fmod = 1; 1059996c772fSJohn Dyson fs->fs_clean = 0; 1060791dd2faSTor Egge (void) ffs_sbupdate(ump, MNT_WAIT, 0); 1061996c772fSJohn Dyson } 1062d8d3d415SPoul-Henning Kamp /* 106398cbffd7SKonstantin Belousov * Initialize filesystem state information in mount struct. 1064d8d3d415SPoul-Henning Kamp */ 10656cf7bc60SRobert Watson MNT_ILOCK(mp); 1066bc2258daSAttilio Rao mp->mnt_kern_flag |= MNTK_LOOKUP_SHARED | MNTK_EXTENDED_SHARED | 10675f34e93cSMark Johnston MNTK_NO_IOPF | MNTK_UNMAPPED_BUFS | MNTK_USES_BCACHE; 10686cf7bc60SRobert Watson MNT_IUNLOCK(mp); 1069516081f2SRobert Watson #ifdef UFS_EXTATTR 1070516081f2SRobert Watson #ifdef UFS_EXTATTR_AUTOSTART 10719de54ba5SRobert Watson /* 10729de54ba5SRobert Watson * 1073f5161237SRobert Watson * Auto-starting does the following: 10749de54ba5SRobert Watson * - check for /.attribute in the fs, and extattr_start if so 10759de54ba5SRobert Watson * - for each file in .attribute, enable that file with 10769de54ba5SRobert Watson * an attribute of the same name. 10779de54ba5SRobert Watson * Not clear how to report errors -- probably eat them. 10789de54ba5SRobert Watson * This would all happen while the filesystem was busy/not 10799de54ba5SRobert Watson * available, so would effectively be "atomic". 10809de54ba5SRobert Watson */ 1081b40ce416SJulian Elischer (void) ufs_extattr_autostart(mp, td); 1082516081f2SRobert Watson #endif /* !UFS_EXTATTR_AUTOSTART */ 1083516081f2SRobert Watson #endif /* !UFS_EXTATTR */ 1084df8bae1dSRodney W. Grimes return (0); 1085df8bae1dSRodney W. Grimes out: 1086df8bae1dSRodney W. Grimes if (bp) 1087df8bae1dSRodney W. Grimes brelse(bp); 108843920011SPoul-Henning Kamp if (cp != NULL) { 108943920011SPoul-Henning Kamp g_topology_lock(); 10900d7935fdSAttilio Rao g_vfs_close(cp); 109143920011SPoul-Henning Kamp g_topology_unlock(); 109243920011SPoul-Henning Kamp } 1093df8bae1dSRodney W. Grimes if (ump) { 10943ba649d7SJeff Roberson mtx_destroy(UFS_MTX(ump)); 10951a60c7fcSPawel Jakub Dawidek if (mp->mnt_gjprovider != NULL) { 10961a60c7fcSPawel Jakub Dawidek free(mp->mnt_gjprovider, M_UFSMNT); 10971a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider = NULL; 10981a60c7fcSPawel Jakub Dawidek } 1099df8bae1dSRodney W. Grimes free(ump->um_fs, M_UFSMNT); 1100df8bae1dSRodney W. Grimes free(ump, M_UFSMNT); 110177465d93SAlfred Perlstein mp->mnt_data = NULL; 1102df8bae1dSRodney W. Grimes } 1103c70b3cd2SKonstantin Belousov atomic_store_rel_ptr((uintptr_t *)&dev->si_mountpt, 0); 110449c4791cSEdward Tomasz Napierala dev_rel(dev); 1105df8bae1dSRodney W. Grimes return (error); 1106df8bae1dSRodney W. Grimes } 1107df8bae1dSRodney W. Grimes 11081c85e6a3SKirk McKusick #include <sys/sysctl.h> 1109adf41577SPoul-Henning Kamp static int bigcgs = 0; 11101c85e6a3SKirk McKusick SYSCTL_INT(_debug, OID_AUTO, bigcgs, CTLFLAG_RW, &bigcgs, 0, ""); 11111c85e6a3SKirk McKusick 1112df8bae1dSRodney W. Grimes /* 11131c85e6a3SKirk McKusick * Sanity checks for loading old filesystem superblocks. 11141c85e6a3SKirk McKusick * See ffs_oldfscompat_write below for unwound actions. 1115df8bae1dSRodney W. Grimes * 11161c85e6a3SKirk McKusick * XXX - Parts get retired eventually. 11171c85e6a3SKirk McKusick * Unfortunately new bits get added. 1118df8bae1dSRodney W. Grimes */ 11191c85e6a3SKirk McKusick static void 11201c85e6a3SKirk McKusick ffs_oldfscompat_read(fs, ump, sblockloc) 1121df8bae1dSRodney W. Grimes struct fs *fs; 11221c85e6a3SKirk McKusick struct ufsmount *ump; 11231c85e6a3SKirk McKusick ufs2_daddr_t sblockloc; 11241c85e6a3SKirk McKusick { 11251c85e6a3SKirk McKusick off_t maxfilesize; 11261c85e6a3SKirk McKusick 11271c85e6a3SKirk McKusick /* 1128ada981b2SKirk McKusick * If not yet done, update fs_flags location and value of fs_sblockloc. 1129ada981b2SKirk McKusick */ 1130ada981b2SKirk McKusick if ((fs->fs_old_flags & FS_FLAGS_UPDATED) == 0) { 1131ada981b2SKirk McKusick fs->fs_flags = fs->fs_old_flags; 1132ada981b2SKirk McKusick fs->fs_old_flags |= FS_FLAGS_UPDATED; 1133ada981b2SKirk McKusick fs->fs_sblockloc = sblockloc; 1134ada981b2SKirk McKusick } 1135ada981b2SKirk McKusick /* 11361c85e6a3SKirk McKusick * If not yet done, update UFS1 superblock with new wider fields. 11371c85e6a3SKirk McKusick */ 113874f3809aSKirk McKusick if (fs->fs_magic == FS_UFS1_MAGIC && fs->fs_maxbsize != fs->fs_bsize) { 11391c85e6a3SKirk McKusick fs->fs_maxbsize = fs->fs_bsize; 11401c85e6a3SKirk McKusick fs->fs_time = fs->fs_old_time; 11411c85e6a3SKirk McKusick fs->fs_size = fs->fs_old_size; 11421c85e6a3SKirk McKusick fs->fs_dsize = fs->fs_old_dsize; 11431c85e6a3SKirk McKusick fs->fs_csaddr = fs->fs_old_csaddr; 11441c85e6a3SKirk McKusick fs->fs_cstotal.cs_ndir = fs->fs_old_cstotal.cs_ndir; 11451c85e6a3SKirk McKusick fs->fs_cstotal.cs_nbfree = fs->fs_old_cstotal.cs_nbfree; 11461c85e6a3SKirk McKusick fs->fs_cstotal.cs_nifree = fs->fs_old_cstotal.cs_nifree; 11471c85e6a3SKirk McKusick fs->fs_cstotal.cs_nffree = fs->fs_old_cstotal.cs_nffree; 11481c85e6a3SKirk McKusick } 11491c85e6a3SKirk McKusick if (fs->fs_magic == FS_UFS1_MAGIC && 11501c85e6a3SKirk McKusick fs->fs_old_inodefmt < FS_44INODEFMT) { 11518680d698SNate Lawson fs->fs_maxfilesize = ((uint64_t)1 << 31) - 1; 11521c85e6a3SKirk McKusick fs->fs_qbmask = ~fs->fs_bmask; 11531c85e6a3SKirk McKusick fs->fs_qfmask = ~fs->fs_fmask; 11541c85e6a3SKirk McKusick } 11558f42fb8fSIan Dowse if (fs->fs_magic == FS_UFS1_MAGIC) { 11561c85e6a3SKirk McKusick ump->um_savedmaxfilesize = fs->fs_maxfilesize; 11578680d698SNate Lawson maxfilesize = (uint64_t)0x80000000 * fs->fs_bsize - 1; 11581c85e6a3SKirk McKusick if (fs->fs_maxfilesize > maxfilesize) 11591c85e6a3SKirk McKusick fs->fs_maxfilesize = maxfilesize; 11608f42fb8fSIan Dowse } 11611c85e6a3SKirk McKusick /* Compatibility for old filesystems */ 11621c85e6a3SKirk McKusick if (fs->fs_avgfilesize <= 0) 11631c85e6a3SKirk McKusick fs->fs_avgfilesize = AVFILESIZ; 11641c85e6a3SKirk McKusick if (fs->fs_avgfpdir <= 0) 11651c85e6a3SKirk McKusick fs->fs_avgfpdir = AFPDIR; 11661c85e6a3SKirk McKusick if (bigcgs) { 11671c85e6a3SKirk McKusick fs->fs_save_cgsize = fs->fs_cgsize; 11681c85e6a3SKirk McKusick fs->fs_cgsize = fs->fs_bsize; 11691c85e6a3SKirk McKusick } 11701c85e6a3SKirk McKusick } 11711c85e6a3SKirk McKusick 11721c85e6a3SKirk McKusick /* 11731c85e6a3SKirk McKusick * Unwinding superblock updates for old filesystems. 11741c85e6a3SKirk McKusick * See ffs_oldfscompat_read above for details. 11751c85e6a3SKirk McKusick * 11761c85e6a3SKirk McKusick * XXX - Parts get retired eventually. 11771c85e6a3SKirk McKusick * Unfortunately new bits get added. 11781c85e6a3SKirk McKusick */ 1179113db2ddSJeff Roberson void 11801c85e6a3SKirk McKusick ffs_oldfscompat_write(fs, ump) 11811c85e6a3SKirk McKusick struct fs *fs; 11821c85e6a3SKirk McKusick struct ufsmount *ump; 1183df8bae1dSRodney W. Grimes { 1184df8bae1dSRodney W. Grimes 11851c85e6a3SKirk McKusick /* 11861c85e6a3SKirk McKusick * Copy back UFS2 updated fields that UFS1 inspects. 11871c85e6a3SKirk McKusick */ 11881c85e6a3SKirk McKusick if (fs->fs_magic == FS_UFS1_MAGIC) { 11891c85e6a3SKirk McKusick fs->fs_old_time = fs->fs_time; 11901c85e6a3SKirk McKusick fs->fs_old_cstotal.cs_ndir = fs->fs_cstotal.cs_ndir; 11911c85e6a3SKirk McKusick fs->fs_old_cstotal.cs_nbfree = fs->fs_cstotal.cs_nbfree; 11921c85e6a3SKirk McKusick fs->fs_old_cstotal.cs_nifree = fs->fs_cstotal.cs_nifree; 11931c85e6a3SKirk McKusick fs->fs_old_cstotal.cs_nffree = fs->fs_cstotal.cs_nffree; 11941c85e6a3SKirk McKusick fs->fs_maxfilesize = ump->um_savedmaxfilesize; 11958f42fb8fSIan Dowse } 11961c85e6a3SKirk McKusick if (bigcgs) { 11971c85e6a3SKirk McKusick fs->fs_cgsize = fs->fs_save_cgsize; 11981c85e6a3SKirk McKusick fs->fs_save_cgsize = 0; 11991c85e6a3SKirk McKusick } 1200df8bae1dSRodney W. Grimes } 1201df8bae1dSRodney W. Grimes 1202df8bae1dSRodney W. Grimes /* 1203df8bae1dSRodney W. Grimes * unmount system call 1204df8bae1dSRodney W. Grimes */ 1205adf41577SPoul-Henning Kamp static int 1206dfd233edSAttilio Rao ffs_unmount(mp, mntflags) 1207df8bae1dSRodney W. Grimes struct mount *mp; 1208df8bae1dSRodney W. Grimes int mntflags; 1209df8bae1dSRodney W. Grimes { 1210dfd233edSAttilio Rao struct thread *td; 121105f4ff5dSPoul-Henning Kamp struct ufsmount *ump = VFSTOUFS(mp); 121205f4ff5dSPoul-Henning Kamp struct fs *fs; 12136fecb4e4SKonstantin Belousov int error, flags, susp; 1214df86ccf6SKonstantin Belousov #ifdef UFS_EXTATTR 1215df86ccf6SKonstantin Belousov int e_restart; 1216df86ccf6SKonstantin Belousov #endif 1217df8bae1dSRodney W. Grimes 1218df8bae1dSRodney W. Grimes flags = 0; 1219dfd233edSAttilio Rao td = curthread; 12206fecb4e4SKonstantin Belousov fs = ump->um_fs; 1221b60ee81eSKirk McKusick susp = 0; 1222df8bae1dSRodney W. Grimes if (mntflags & MNT_FORCE) { 1223df8bae1dSRodney W. Grimes flags |= FORCECLOSE; 12244ce90426SKonstantin Belousov susp = fs->fs_ronly == 0; 1225b60ee81eSKirk McKusick } 1226516081f2SRobert Watson #ifdef UFS_EXTATTR 1227b40ce416SJulian Elischer if ((error = ufs_extattr_stop(mp, td))) { 1228b2b0497aSRobert Watson if (error != EOPNOTSUPP) 1229b60ee81eSKirk McKusick printf("WARNING: unmount %s: ufs_extattr_stop " 1230b60ee81eSKirk McKusick "returned errno %d\n", mp->mnt_stat.f_mntonname, 1231b2b0497aSRobert Watson error); 1232df86ccf6SKonstantin Belousov e_restart = 0; 12337df97b61SRobert Watson } else { 12349de54ba5SRobert Watson ufs_extattr_uepm_destroy(&ump->um_extattr); 1235df86ccf6SKonstantin Belousov e_restart = 1; 12367df97b61SRobert Watson } 1237a64ed089SRobert Watson #endif 12386fecb4e4SKonstantin Belousov if (susp) { 1239895b3782SKonstantin Belousov error = vfs_write_suspend_umnt(mp); 1240895b3782SKonstantin Belousov if (error != 0) 1241895b3782SKonstantin Belousov goto fail1; 12426fecb4e4SKonstantin Belousov } 1243fddf7baeSKirk McKusick if (MOUNTEDSOFTDEP(mp)) 12443c140b2dSEdward Tomasz Napierala error = softdep_flushfiles(mp, flags, td); 12453c140b2dSEdward Tomasz Napierala else 12463c140b2dSEdward Tomasz Napierala error = ffs_flushfiles(mp, flags, td); 12474f560d75SEdward Tomasz Napierala if (error != 0 && error != ENXIO) 12486fecb4e4SKonstantin Belousov goto fail; 12493c140b2dSEdward Tomasz Napierala 12503ba649d7SJeff Roberson UFS_LOCK(ump); 12519ccb939eSKirk McKusick if (fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) { 1252b60ee81eSKirk McKusick printf("WARNING: unmount %s: pending error: blocks %jd " 1253b60ee81eSKirk McKusick "files %d\n", fs->fs_fsmnt, (intmax_t)fs->fs_pendingblocks, 12541c85e6a3SKirk McKusick fs->fs_pendinginodes); 12559ccb939eSKirk McKusick fs->fs_pendingblocks = 0; 12569ccb939eSKirk McKusick fs->fs_pendinginodes = 0; 12579ccb939eSKirk McKusick } 12583ba649d7SJeff Roberson UFS_UNLOCK(ump); 1259519e3c3bSKirk McKusick if (MOUNTEDSOFTDEP(mp)) 1260113db2ddSJeff Roberson softdep_unmount(mp); 1261927a12aeSKirk McKusick if (fs->fs_ronly == 0 || ump->um_fsckpid > 0) { 12621a6a6610SKirk McKusick fs->fs_clean = fs->fs_flags & (FS_UNCLEAN|FS_NEEDSFSCK) ? 0 : 1; 1263791dd2faSTor Egge error = ffs_sbupdate(ump, MNT_WAIT, 0); 12644f560d75SEdward Tomasz Napierala if (error && error != ENXIO) { 1265996c772fSJohn Dyson fs->fs_clean = 0; 12666fecb4e4SKonstantin Belousov goto fail; 1267996c772fSJohn Dyson } 1268e0e9c421SDavid Greenman } 1269ddd6b3fcSKonstantin Belousov if (susp) 1270ddd6b3fcSKonstantin Belousov vfs_write_resume(mp, VR_START_WRITE); 1271c79dff0fSKonstantin Belousov if (ump->um_trim_tq != NULL) { 1272c79dff0fSKonstantin Belousov while (ump->um_trim_inflight != 0) 1273c79dff0fSKonstantin Belousov pause("ufsutr", hz); 1274c79dff0fSKonstantin Belousov taskqueue_drain_all(ump->um_trim_tq); 1275c79dff0fSKonstantin Belousov taskqueue_free(ump->um_trim_tq); 1276c79dff0fSKonstantin Belousov } 127743920011SPoul-Henning Kamp g_topology_lock(); 1278927a12aeSKirk McKusick if (ump->um_fsckpid > 0) { 1279927a12aeSKirk McKusick /* 1280927a12aeSKirk McKusick * Return to normal read-only mode. 1281927a12aeSKirk McKusick */ 1282927a12aeSKirk McKusick error = g_access(ump->um_cp, 0, -1, 0); 1283927a12aeSKirk McKusick ump->um_fsckpid = 0; 1284927a12aeSKirk McKusick } 12850d7935fdSAttilio Rao g_vfs_close(ump->um_cp); 128643920011SPoul-Henning Kamp g_topology_unlock(); 1287c70b3cd2SKonstantin Belousov atomic_store_rel_ptr((uintptr_t *)&ump->um_dev->si_mountpt, 0); 12886476c0d2SJohn Dyson vrele(ump->um_devvp); 128949c4791cSEdward Tomasz Napierala dev_rel(ump->um_dev); 12903ba649d7SJeff Roberson mtx_destroy(UFS_MTX(ump)); 12911a60c7fcSPawel Jakub Dawidek if (mp->mnt_gjprovider != NULL) { 12921a60c7fcSPawel Jakub Dawidek free(mp->mnt_gjprovider, M_UFSMNT); 12931a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider = NULL; 12941a60c7fcSPawel Jakub Dawidek } 1295f55ff3f3SIan Dowse free(fs->fs_csp, M_UFSMNT); 1296df8bae1dSRodney W. Grimes free(fs, M_UFSMNT); 1297df8bae1dSRodney W. Grimes free(ump, M_UFSMNT); 129877465d93SAlfred Perlstein mp->mnt_data = NULL; 12995da56ddbSTor Egge MNT_ILOCK(mp); 1300cc9d8990SPeter Wemm mp->mnt_flag &= ~MNT_LOCAL; 13015da56ddbSTor Egge MNT_IUNLOCK(mp); 1302df8bae1dSRodney W. Grimes return (error); 13036fecb4e4SKonstantin Belousov 13046fecb4e4SKonstantin Belousov fail: 1305ddd6b3fcSKonstantin Belousov if (susp) 1306ddd6b3fcSKonstantin Belousov vfs_write_resume(mp, VR_START_WRITE); 1307895b3782SKonstantin Belousov fail1: 1308df86ccf6SKonstantin Belousov #ifdef UFS_EXTATTR 1309df86ccf6SKonstantin Belousov if (e_restart) { 1310df86ccf6SKonstantin Belousov ufs_extattr_uepm_init(&ump->um_extattr); 1311df86ccf6SKonstantin Belousov #ifdef UFS_EXTATTR_AUTOSTART 1312df86ccf6SKonstantin Belousov (void) ufs_extattr_autostart(mp, td); 1313df86ccf6SKonstantin Belousov #endif 1314df86ccf6SKonstantin Belousov } 1315df86ccf6SKonstantin Belousov #endif 1316df86ccf6SKonstantin Belousov 13176fecb4e4SKonstantin Belousov return (error); 1318df8bae1dSRodney W. Grimes } 1319df8bae1dSRodney W. Grimes 1320df8bae1dSRodney W. Grimes /* 1321df8bae1dSRodney W. Grimes * Flush out all the files in a filesystem. 1322df8bae1dSRodney W. Grimes */ 132326f9a767SRodney W. Grimes int 1324b40ce416SJulian Elischer ffs_flushfiles(mp, flags, td) 132505f4ff5dSPoul-Henning Kamp struct mount *mp; 1326df8bae1dSRodney W. Grimes int flags; 1327b40ce416SJulian Elischer struct thread *td; 1328df8bae1dSRodney W. Grimes { 132905f4ff5dSPoul-Henning Kamp struct ufsmount *ump; 1330ba05dec5SKonstantin Belousov int qerror, error; 1331df8bae1dSRodney W. Grimes 1332df8bae1dSRodney W. Grimes ump = VFSTOUFS(mp); 1333ba05dec5SKonstantin Belousov qerror = 0; 1334df8bae1dSRodney W. Grimes #ifdef QUOTA 1335df8bae1dSRodney W. Grimes if (mp->mnt_flag & MNT_QUOTA) { 1336c1d9efcbSPoul-Henning Kamp int i; 1337f257b7a5SAlfred Perlstein error = vflush(mp, 0, SKIPSYSTEM|flags, td); 1338c1d9efcbSPoul-Henning Kamp if (error) 1339df8bae1dSRodney W. Grimes return (error); 1340df8bae1dSRodney W. Grimes for (i = 0; i < MAXQUOTAS; i++) { 1341ba05dec5SKonstantin Belousov error = quotaoff(td, mp, i); 1342ba05dec5SKonstantin Belousov if (error != 0) { 1343ba05dec5SKonstantin Belousov if ((flags & EARLYFLUSH) == 0) 1344ba05dec5SKonstantin Belousov return (error); 1345ba05dec5SKonstantin Belousov else 1346ba05dec5SKonstantin Belousov qerror = error; 1347df8bae1dSRodney W. Grimes } 1348ba05dec5SKonstantin Belousov } 1349ba05dec5SKonstantin Belousov 1350df8bae1dSRodney W. Grimes /* 1351ba05dec5SKonstantin Belousov * Here we fall through to vflush again to ensure that 1352ba05dec5SKonstantin Belousov * we have gotten rid of all the system vnodes, unless 1353ba05dec5SKonstantin Belousov * quotas must not be closed. 1354df8bae1dSRodney W. Grimes */ 1355df8bae1dSRodney W. Grimes } 1356df8bae1dSRodney W. Grimes #endif 1357e6e370a7SJeff Roberson ASSERT_VOP_LOCKED(ump->um_devvp, "ffs_flushfiles"); 1358e6e370a7SJeff Roberson if (ump->um_devvp->v_vflag & VV_COPYONWRITE) { 1359f257b7a5SAlfred Perlstein if ((error = vflush(mp, 0, SKIPSYSTEM | flags, td)) != 0) 1360f2a2857bSKirk McKusick return (error); 1361f2a2857bSKirk McKusick ffs_snapshot_unmount(mp); 136295e7a3c3STor Egge flags |= FORCECLOSE; 1363f2a2857bSKirk McKusick /* 1364f2a2857bSKirk McKusick * Here we fall through to vflush again to ensure 1365f2a2857bSKirk McKusick * that we have gotten rid of all the system vnodes. 1366f2a2857bSKirk McKusick */ 1367f2a2857bSKirk McKusick } 1368ba05dec5SKonstantin Belousov 1369b1897c19SJulian Elischer /* 1370ba05dec5SKonstantin Belousov * Do not close system files if quotas were not closed, to be 1371ba05dec5SKonstantin Belousov * able to sync the remaining dquots. The freeblks softupdate 1372ba05dec5SKonstantin Belousov * workitems might hold a reference on a dquot, preventing 1373ba05dec5SKonstantin Belousov * quotaoff() from completing. Next round of 1374ba05dec5SKonstantin Belousov * softdep_flushworklist() iteration should process the 1375ba05dec5SKonstantin Belousov * blockers, allowing the next run of quotaoff() to finally 1376ba05dec5SKonstantin Belousov * flush held dquots. 1377ba05dec5SKonstantin Belousov * 1378ba05dec5SKonstantin Belousov * Otherwise, flush all the files. 1379b1897c19SJulian Elischer */ 1380ba05dec5SKonstantin Belousov if (qerror == 0 && (error = vflush(mp, 0, flags, td)) != 0) 1381b1897c19SJulian Elischer return (error); 1382ba05dec5SKonstantin Belousov 1383b1897c19SJulian Elischer /* 1384b1897c19SJulian Elischer * Flush filesystem metadata. 1385b1897c19SJulian Elischer */ 1386cb05b60aSAttilio Rao vn_lock(ump->um_devvp, LK_EXCLUSIVE | LK_RETRY); 13878df6bac4SPoul-Henning Kamp error = VOP_FSYNC(ump->um_devvp, MNT_WAIT, td); 138822db15c0SAttilio Rao VOP_UNLOCK(ump->um_devvp, 0); 1389df8bae1dSRodney W. Grimes return (error); 1390df8bae1dSRodney W. Grimes } 1391df8bae1dSRodney W. Grimes 1392df8bae1dSRodney W. Grimes /* 1393df8bae1dSRodney W. Grimes * Get filesystem statistics. 1394df8bae1dSRodney W. Grimes */ 1395adf41577SPoul-Henning Kamp static int 1396dfd233edSAttilio Rao ffs_statfs(mp, sbp) 1397df8bae1dSRodney W. Grimes struct mount *mp; 139805f4ff5dSPoul-Henning Kamp struct statfs *sbp; 1399df8bae1dSRodney W. Grimes { 140005f4ff5dSPoul-Henning Kamp struct ufsmount *ump; 140105f4ff5dSPoul-Henning Kamp struct fs *fs; 1402df8bae1dSRodney W. Grimes 1403df8bae1dSRodney W. Grimes ump = VFSTOUFS(mp); 1404df8bae1dSRodney W. Grimes fs = ump->um_fs; 14051c85e6a3SKirk McKusick if (fs->fs_magic != FS_UFS1_MAGIC && fs->fs_magic != FS_UFS2_MAGIC) 1406df8bae1dSRodney W. Grimes panic("ffs_statfs"); 1407fde81c7dSKirk McKusick sbp->f_version = STATFS_VERSION; 1408df8bae1dSRodney W. Grimes sbp->f_bsize = fs->fs_fsize; 1409df8bae1dSRodney W. Grimes sbp->f_iosize = fs->fs_bsize; 1410df8bae1dSRodney W. Grimes sbp->f_blocks = fs->fs_dsize; 14113ba649d7SJeff Roberson UFS_LOCK(ump); 1412df8bae1dSRodney W. Grimes sbp->f_bfree = fs->fs_cstotal.cs_nbfree * fs->fs_frag + 14139ccb939eSKirk McKusick fs->fs_cstotal.cs_nffree + dbtofsb(fs, fs->fs_pendingblocks); 14149ccb939eSKirk McKusick sbp->f_bavail = freespace(fs, fs->fs_minfree) + 14159ccb939eSKirk McKusick dbtofsb(fs, fs->fs_pendingblocks); 1416df8bae1dSRodney W. Grimes sbp->f_files = fs->fs_ncg * fs->fs_ipg - ROOTINO; 14179ccb939eSKirk McKusick sbp->f_ffree = fs->fs_cstotal.cs_nifree + fs->fs_pendinginodes; 14183ba649d7SJeff Roberson UFS_UNLOCK(ump); 1419fde81c7dSKirk McKusick sbp->f_namemax = NAME_MAX; 1420df8bae1dSRodney W. Grimes return (0); 1421df8bae1dSRodney W. Grimes } 1422df8bae1dSRodney W. Grimes 14231eabd967SKonstantin Belousov static bool 14241eabd967SKonstantin Belousov sync_doupdate(struct inode *ip) 14251eabd967SKonstantin Belousov { 14261eabd967SKonstantin Belousov 14271eabd967SKonstantin Belousov return ((ip->i_flag & (IN_ACCESS | IN_CHANGE | IN_MODIFIED | 14281eabd967SKonstantin Belousov IN_UPDATE)) != 0); 14291eabd967SKonstantin Belousov } 14301eabd967SKonstantin Belousov 1431df8bae1dSRodney W. Grimes /* 1432a988a5c6SKonstantin Belousov * For a lazy sync, we only care about access times, quotas and the 1433a988a5c6SKonstantin Belousov * superblock. Other filesystem changes are already converted to 1434a988a5c6SKonstantin Belousov * cylinder group blocks or inode blocks updates and are written to 1435a988a5c6SKonstantin Belousov * disk by syncer. 1436a988a5c6SKonstantin Belousov */ 1437a988a5c6SKonstantin Belousov static int 1438a988a5c6SKonstantin Belousov ffs_sync_lazy(mp) 1439a988a5c6SKonstantin Belousov struct mount *mp; 1440a988a5c6SKonstantin Belousov { 1441a988a5c6SKonstantin Belousov struct vnode *mvp, *vp; 1442a988a5c6SKonstantin Belousov struct inode *ip; 1443a988a5c6SKonstantin Belousov struct thread *td; 1444a988a5c6SKonstantin Belousov int allerror, error; 1445a988a5c6SKonstantin Belousov 1446a988a5c6SKonstantin Belousov allerror = 0; 1447a988a5c6SKonstantin Belousov td = curthread; 1448a988a5c6SKonstantin Belousov if ((mp->mnt_flag & MNT_NOATIME) != 0) 1449a988a5c6SKonstantin Belousov goto qupdate; 1450dca5e0ecSKirk McKusick MNT_VNODE_FOREACH_ACTIVE(vp, mp, mvp) { 145171469bb3SKirk McKusick if (vp->v_type == VNON) { 1452a988a5c6SKonstantin Belousov VI_UNLOCK(vp); 1453a988a5c6SKonstantin Belousov continue; 1454a988a5c6SKonstantin Belousov } 1455a988a5c6SKonstantin Belousov ip = VTOI(vp); 1456a988a5c6SKonstantin Belousov 1457a988a5c6SKonstantin Belousov /* 1458a988a5c6SKonstantin Belousov * The IN_ACCESS flag is converted to IN_MODIFIED by 1459a988a5c6SKonstantin Belousov * ufs_close() and ufs_getattr() by the calls to 1460ea573a50SKonstantin Belousov * ufs_itimes_locked(), without subsequent UFS_UPDATE(). 1461ea573a50SKonstantin Belousov * Test also all the other timestamp flags too, to pick up 1462ea573a50SKonstantin Belousov * any other cases that could be missed. 1463a988a5c6SKonstantin Belousov */ 14641eabd967SKonstantin Belousov if (!sync_doupdate(ip) && (vp->v_iflag & VI_OWEINACT) == 0) { 1465a988a5c6SKonstantin Belousov VI_UNLOCK(vp); 1466a988a5c6SKonstantin Belousov continue; 1467a988a5c6SKonstantin Belousov } 1468a988a5c6SKonstantin Belousov if ((error = vget(vp, LK_EXCLUSIVE | LK_NOWAIT | LK_INTERLOCK, 146971469bb3SKirk McKusick td)) != 0) 1470a988a5c6SKonstantin Belousov continue; 14711eabd967SKonstantin Belousov if (sync_doupdate(ip)) 1472a988a5c6SKonstantin Belousov error = ffs_update(vp, 0); 1473a988a5c6SKonstantin Belousov if (error != 0) 1474a988a5c6SKonstantin Belousov allerror = error; 1475a988a5c6SKonstantin Belousov vput(vp); 1476a988a5c6SKonstantin Belousov } 1477a988a5c6SKonstantin Belousov 1478a988a5c6SKonstantin Belousov qupdate: 1479a988a5c6SKonstantin Belousov #ifdef QUOTA 1480a988a5c6SKonstantin Belousov qsync(mp); 1481a988a5c6SKonstantin Belousov #endif 1482a988a5c6SKonstantin Belousov 1483a988a5c6SKonstantin Belousov if (VFSTOUFS(mp)->um_fs->fs_fmod != 0 && 1484a988a5c6SKonstantin Belousov (error = ffs_sbupdate(VFSTOUFS(mp), MNT_LAZY, 0)) != 0) 1485a988a5c6SKonstantin Belousov allerror = error; 1486a988a5c6SKonstantin Belousov return (allerror); 1487a988a5c6SKonstantin Belousov } 1488a988a5c6SKonstantin Belousov 1489a988a5c6SKonstantin Belousov /* 1490df8bae1dSRodney W. Grimes * Go through the disk queues to initiate sandbagged IO; 1491df8bae1dSRodney W. Grimes * go through the inodes to write those that have been modified; 1492df8bae1dSRodney W. Grimes * initiate the writing of the super block if it has been modified. 1493df8bae1dSRodney W. Grimes * 1494a988a5c6SKonstantin Belousov * Note: we are always called with the filesystem marked busy using 1495a988a5c6SKonstantin Belousov * vfs_busy(). 1496df8bae1dSRodney W. Grimes */ 1497adf41577SPoul-Henning Kamp static int 1498dfd233edSAttilio Rao ffs_sync(mp, waitfor) 1499df8bae1dSRodney W. Grimes struct mount *mp; 1500df8bae1dSRodney W. Grimes int waitfor; 1501df8bae1dSRodney W. Grimes { 150282be0a5aSTor Egge struct vnode *mvp, *vp, *devvp; 1503dfd233edSAttilio Rao struct thread *td; 1504996c772fSJohn Dyson struct inode *ip; 1505996c772fSJohn Dyson struct ufsmount *ump = VFSTOUFS(mp); 1506996c772fSJohn Dyson struct fs *fs; 150769baeadcSKonstantin Belousov int error, count, lockreq, allerror = 0; 1508791dd2faSTor Egge int suspend; 1509791dd2faSTor Egge int suspended; 1510791dd2faSTor Egge int secondary_writes; 1511791dd2faSTor Egge int secondary_accwrites; 1512791dd2faSTor Egge int softdep_deps; 1513791dd2faSTor Egge int softdep_accdeps; 1514156cb265SPoul-Henning Kamp struct bufobj *bo; 1515df8bae1dSRodney W. Grimes 151619c87af0SKirk McKusick suspend = 0; 151719c87af0SKirk McKusick suspended = 0; 1518dfd233edSAttilio Rao td = curthread; 1519df8bae1dSRodney W. Grimes fs = ump->um_fs; 1520b60ee81eSKirk McKusick if (fs->fs_fmod != 0 && fs->fs_ronly != 0 && ump->um_fsckpid == 0) 1521b60ee81eSKirk McKusick panic("%s: ffs_sync: modification on read-only filesystem", 1522b60ee81eSKirk McKusick fs->fs_fsmnt); 15234af9f77eSKonstantin Belousov if (waitfor == MNT_LAZY) { 15244af9f77eSKonstantin Belousov if (!rebooting) 1525a988a5c6SKonstantin Belousov return (ffs_sync_lazy(mp)); 15264af9f77eSKonstantin Belousov waitfor = MNT_NOWAIT; 15274af9f77eSKonstantin Belousov } 1528a988a5c6SKonstantin Belousov 152919c87af0SKirk McKusick /* 1530df8bae1dSRodney W. Grimes * Write back each (modified) inode. 1531df8bae1dSRodney W. Grimes */ 1532245df27cSMatthew Dillon lockreq = LK_EXCLUSIVE | LK_NOWAIT; 1533791dd2faSTor Egge if (waitfor == MNT_SUSPEND) { 1534791dd2faSTor Egge suspend = 1; 1535791dd2faSTor Egge waitfor = MNT_WAIT; 1536791dd2faSTor Egge } 153769baeadcSKonstantin Belousov if (waitfor == MNT_WAIT) 1538245df27cSMatthew Dillon lockreq = LK_EXCLUSIVE; 153941d4783dSJeff Roberson lockreq |= LK_INTERLOCK | LK_SLEEPFAIL; 1540df8bae1dSRodney W. Grimes loop: 1541791dd2faSTor Egge /* Grab snapshot of secondary write counts */ 154271469bb3SKirk McKusick MNT_ILOCK(mp); 1543791dd2faSTor Egge secondary_writes = mp->mnt_secondary_writes; 1544791dd2faSTor Egge secondary_accwrites = mp->mnt_secondary_accwrites; 154571469bb3SKirk McKusick MNT_IUNLOCK(mp); 1546791dd2faSTor Egge 1547791dd2faSTor Egge /* Grab snapshot of softdep dependency counts */ 1548791dd2faSTor Egge softdep_get_depcounts(mp, &softdep_deps, &softdep_accdeps); 1549791dd2faSTor Egge 155071469bb3SKirk McKusick MNT_VNODE_FOREACH_ALL(vp, mp, mvp) { 1551245df27cSMatthew Dillon /* 1552e0c17408SKonstantin Belousov * Depend on the vnode interlock to keep things stable enough 1553245df27cSMatthew Dillon * for a quick test. Since there might be hundreds of 1554245df27cSMatthew Dillon * thousands of vnodes, we cannot afford even a subroutine 1555245df27cSMatthew Dillon * call unless there's a good chance that we have work to do. 1556245df27cSMatthew Dillon */ 155771469bb3SKirk McKusick if (vp->v_type == VNON) { 15582f05568aSJeff Roberson VI_UNLOCK(vp); 15592f05568aSJeff Roberson continue; 15602f05568aSJeff Roberson } 1561df8bae1dSRodney W. Grimes ip = VTOI(vp); 156271469bb3SKirk McKusick if ((ip->i_flag & 1563cf60e8e4SKirk McKusick (IN_ACCESS | IN_CHANGE | IN_MODIFIED | IN_UPDATE)) == 0 && 156471469bb3SKirk McKusick vp->v_bufobj.bo_dirty.bv_cnt == 0) { 15652f05568aSJeff Roberson VI_UNLOCK(vp); 1566df8bae1dSRodney W. Grimes continue; 1567996c772fSJohn Dyson } 1568b40ce416SJulian Elischer if ((error = vget(vp, lockreq, td)) != 0) { 156982be0a5aSTor Egge if (error == ENOENT || error == ENOLCK) { 157071469bb3SKirk McKusick MNT_VNODE_FOREACH_ALL_ABORT(mp, mvp); 1571df8bae1dSRodney W. Grimes goto loop; 157282be0a5aSTor Egge } 15732f05568aSJeff Roberson continue; 15742f05568aSJeff Roberson } 157575a58389SKirk McKusick if ((error = ffs_syncvnode(vp, waitfor, 0)) != 0) 1576df8bae1dSRodney W. Grimes allerror = error; 157741d4783dSJeff Roberson vput(vp); 1578245df27cSMatthew Dillon } 1579df8bae1dSRodney W. Grimes /* 1580df8bae1dSRodney W. Grimes * Force stale filesystem control information to be flushed. 1581df8bae1dSRodney W. Grimes */ 15824af9f77eSKonstantin Belousov if (waitfor == MNT_WAIT || rebooting) { 1583b40ce416SJulian Elischer if ((error = softdep_flushworklist(ump->um_mountp, &count, td))) 15849b971133SKirk McKusick allerror = error; 15859b971133SKirk McKusick /* Flushed work items may create new vnodes to clean */ 158671469bb3SKirk McKusick if (allerror == 0 && count) 15879b971133SKirk McKusick goto loop; 15889b971133SKirk McKusick } 1589589c7af9SKirk McKusick #ifdef QUOTA 1590589c7af9SKirk McKusick qsync(mp); 1591589c7af9SKirk McKusick #endif 159219c87af0SKirk McKusick 1593112f7372SKirk McKusick devvp = ump->um_devvp; 1594156cb265SPoul-Henning Kamp bo = &devvp->v_bufobj; 1595698b1a66SJeff Roberson BO_LOCK(bo); 159619c87af0SKirk McKusick if (bo->bo_numoutput > 0 || bo->bo_dirty.bv_cnt > 0) { 1597698b1a66SJeff Roberson BO_UNLOCK(bo); 1598698b1a66SJeff Roberson vn_lock(devvp, LK_EXCLUSIVE | LK_RETRY); 15994af9f77eSKonstantin Belousov error = VOP_FSYNC(devvp, waitfor, td); 160022db15c0SAttilio Rao VOP_UNLOCK(devvp, 0); 16014af9f77eSKonstantin Belousov if (MOUNTEDSOFTDEP(mp) && (error == 0 || error == EAGAIN)) 16024af9f77eSKonstantin Belousov error = ffs_sbupdate(ump, waitfor, 0); 16034af9f77eSKonstantin Belousov if (error != 0) 16044af9f77eSKonstantin Belousov allerror = error; 160571469bb3SKirk McKusick if (allerror == 0 && waitfor == MNT_WAIT) 1606112f7372SKirk McKusick goto loop; 1607791dd2faSTor Egge } else if (suspend != 0) { 1608791dd2faSTor Egge if (softdep_check_suspend(mp, 1609791dd2faSTor Egge devvp, 1610791dd2faSTor Egge softdep_deps, 1611791dd2faSTor Egge softdep_accdeps, 1612791dd2faSTor Egge secondary_writes, 161371469bb3SKirk McKusick secondary_accwrites) != 0) { 161471469bb3SKirk McKusick MNT_IUNLOCK(mp); 1615791dd2faSTor Egge goto loop; /* More work needed */ 161671469bb3SKirk McKusick } 1617791dd2faSTor Egge mtx_assert(MNT_MTX(mp), MA_OWNED); 1618ca2fa807STor Egge mp->mnt_kern_flag |= MNTK_SUSPEND2 | MNTK_SUSPENDED; 1619791dd2faSTor Egge MNT_IUNLOCK(mp); 1620791dd2faSTor Egge suspended = 1; 1621112f7372SKirk McKusick } else 1622698b1a66SJeff Roberson BO_UNLOCK(bo); 1623996c772fSJohn Dyson /* 1624996c772fSJohn Dyson * Write back modified superblock. 1625996c772fSJohn Dyson */ 1626791dd2faSTor Egge if (fs->fs_fmod != 0 && 1627791dd2faSTor Egge (error = ffs_sbupdate(ump, waitfor, suspended)) != 0) 1628996c772fSJohn Dyson allerror = error; 1629df8bae1dSRodney W. Grimes return (allerror); 1630df8bae1dSRodney W. Grimes } 1631df8bae1dSRodney W. Grimes 1632df8bae1dSRodney W. Grimes int 1633a0595d02SKirk McKusick ffs_vget(mp, ino, flags, vpp) 1634df8bae1dSRodney W. Grimes struct mount *mp; 1635df8bae1dSRodney W. Grimes ino_t ino; 1636a0595d02SKirk McKusick int flags; 1637df8bae1dSRodney W. Grimes struct vnode **vpp; 1638df8bae1dSRodney W. Grimes { 16397b7ed832SKonstantin Belousov return (ffs_vgetf(mp, ino, flags, vpp, 0)); 16407b7ed832SKonstantin Belousov } 16417b7ed832SKonstantin Belousov 16427b7ed832SKonstantin Belousov int 16437b7ed832SKonstantin Belousov ffs_vgetf(mp, ino, flags, vpp, ffs_flags) 16447b7ed832SKonstantin Belousov struct mount *mp; 16457b7ed832SKonstantin Belousov ino_t ino; 16467b7ed832SKonstantin Belousov int flags; 16477b7ed832SKonstantin Belousov struct vnode **vpp; 16487b7ed832SKonstantin Belousov int ffs_flags; 16497b7ed832SKonstantin Belousov { 1650996c772fSJohn Dyson struct fs *fs; 1651996c772fSJohn Dyson struct inode *ip; 1652df8bae1dSRodney W. Grimes struct ufsmount *ump; 1653df8bae1dSRodney W. Grimes struct buf *bp; 1654df8bae1dSRodney W. Grimes struct vnode *vp; 1655f576a00dSSemen Ustimenko int error; 1656df8bae1dSRodney W. Grimes 165751f5ce0cSPoul-Henning Kamp error = vfs_hash_get(mp, ino, flags, curthread, vpp, NULL, NULL); 1658e82ef95cSPoul-Henning Kamp if (error || *vpp != NULL) 165914bc0685SPoul-Henning Kamp return (error); 1660f576a00dSSemen Ustimenko 1661f576a00dSSemen Ustimenko /* 1662d6919865SJeff Roberson * We must promote to an exclusive lock for vnode creation. This 1663d6919865SJeff Roberson * can happen if lookup is passed LOCKSHARED. 1664d6919865SJeff Roberson */ 1665d6919865SJeff Roberson if ((flags & LK_TYPE_MASK) == LK_SHARED) { 1666d6919865SJeff Roberson flags &= ~LK_TYPE_MASK; 1667d6919865SJeff Roberson flags |= LK_EXCLUSIVE; 1668d6919865SJeff Roberson } 1669d6919865SJeff Roberson 1670d6919865SJeff Roberson /* 167113866b3fSSemen Ustimenko * We do not lock vnode creation as it is believed to be too 1672f576a00dSSemen Ustimenko * expensive for such rare case as simultaneous creation of vnode 1673f576a00dSSemen Ustimenko * for same ino by different processes. We just allow them to race 1674f576a00dSSemen Ustimenko * and check later to decide who wins. Let the race begin! 1675f576a00dSSemen Ustimenko */ 167614bc0685SPoul-Henning Kamp 167714bc0685SPoul-Henning Kamp ump = VFSTOUFS(mp); 167814bc0685SPoul-Henning Kamp fs = ump->um_fs; 167914bc0685SPoul-Henning Kamp ip = uma_zalloc(uma_inode, M_WAITOK | M_ZERO); 16802f9bae59SDavid Greenman 1681df8bae1dSRodney W. Grimes /* Allocate a new vnode/inode. */ 168243a993bbSKirk McKusick error = getnewvnode("ufs", mp, fs->fs_magic == FS_UFS1_MAGIC ? 168343a993bbSKirk McKusick &ffs_vnodeops1 : &ffs_vnodeops2, &vp); 1684c9671602SPoul-Henning Kamp if (error) { 1685df8bae1dSRodney W. Grimes *vpp = NULL; 1686aa4d7a8aSPoul-Henning Kamp uma_zfree(uma_inode, ip); 1687df8bae1dSRodney W. Grimes return (error); 1688df8bae1dSRodney W. Grimes } 168967e87166SBoris Popov /* 169033fc3625SJohn Baldwin * FFS supports recursive locking. 169167e87166SBoris Popov */ 16923634d5b2SJohn Baldwin lockmgr(vp->v_vnlock, LK_EXCLUSIVE, NULL); 1693628f51d2SAttilio Rao VN_LOCK_AREC(vp); 1694df8bae1dSRodney W. Grimes vp->v_data = ip; 16955d9d81e7SPoul-Henning Kamp vp->v_bufobj.bo_bsize = fs->fs_bsize; 1696df8bae1dSRodney W. Grimes ip->i_vnode = vp; 16971c85e6a3SKirk McKusick ip->i_ump = ump; 1698df8bae1dSRodney W. Grimes ip->i_number = ino; 1699e65f5a4eSKonstantin Belousov ip->i_ea_refs = 0; 170074a87c38SKirk McKusick ip->i_nextclustercg = -1; 1701*e1db6897SKonstantin Belousov ip->i_flag = fs->fs_magic == FS_UFS1_MAGIC ? 0 : IN_UFS2; 1702df8bae1dSRodney W. Grimes #ifdef QUOTA 1703c1d9efcbSPoul-Henning Kamp { 1704c1d9efcbSPoul-Henning Kamp int i; 1705df8bae1dSRodney W. Grimes for (i = 0; i < MAXQUOTAS; i++) 1706df8bae1dSRodney W. Grimes ip->i_dquot[i] = NODQUOT; 1707c1d9efcbSPoul-Henning Kamp } 1708df8bae1dSRodney W. Grimes #endif 1709df8bae1dSRodney W. Grimes 17107b7ed832SKonstantin Belousov if (ffs_flags & FFSV_FORCEINSMQ) 17117b7ed832SKonstantin Belousov vp->v_vflag |= VV_FORCEINSMQ; 171261b9d89fSTor Egge error = insmntque(vp, mp); 171361b9d89fSTor Egge if (error != 0) { 17146cc745d2SKonstantin Belousov uma_zfree(uma_inode, ip); 171561b9d89fSTor Egge *vpp = NULL; 171661b9d89fSTor Egge return (error); 171761b9d89fSTor Egge } 17187b7ed832SKonstantin Belousov vp->v_vflag &= ~VV_FORCEINSMQ; 1719a80d8caaSPawel Jakub Dawidek error = vfs_hash_insert(vp, ino, flags, curthread, vpp, NULL, NULL); 172045c26fa2SPoul-Henning Kamp if (error || *vpp != NULL) 1721f576a00dSSemen Ustimenko return (error); 1722f576a00dSSemen Ustimenko 1723df8bae1dSRodney W. Grimes /* Read in the disk contents for the inode, copy into the inode. */ 1724c9671602SPoul-Henning Kamp error = bread(ump->um_devvp, fsbtodb(fs, ino_to_fsba(fs, ino)), 1725c9671602SPoul-Henning Kamp (int)fs->fs_bsize, NOCRED, &bp); 1726c9671602SPoul-Henning Kamp if (error) { 1727df8bae1dSRodney W. Grimes /* 1728df8bae1dSRodney W. Grimes * The inode does not contain anything useful, so it would 1729df8bae1dSRodney W. Grimes * be misleading to leave it on its hash chain. With mode 1730df8bae1dSRodney W. Grimes * still zero, it will be unlinked and returned to the free 1731df8bae1dSRodney W. Grimes * list by vput(). 1732df8bae1dSRodney W. Grimes */ 1733df8bae1dSRodney W. Grimes brelse(bp); 1734bd7e5f99SJohn Dyson vput(vp); 1735df8bae1dSRodney W. Grimes *vpp = NULL; 1736df8bae1dSRodney W. Grimes return (error); 1737df8bae1dSRodney W. Grimes } 1738*e1db6897SKonstantin Belousov if (I_IS_UFS1(ip)) 1739a163d034SWarner Losh ip->i_din1 = uma_zalloc(uma_ufs1, M_WAITOK); 1740de6ba7c0SPoul-Henning Kamp else 1741a163d034SWarner Losh ip->i_din2 = uma_zalloc(uma_ufs2, M_WAITOK); 1742de6ba7c0SPoul-Henning Kamp ffs_load_inode(bp, ip, fs, ino); 1743b1897c19SJulian Elischer if (DOINGSOFTDEP(vp)) 1744b1897c19SJulian Elischer softdep_load_inodeblock(ip); 1745b1897c19SJulian Elischer else 1746b1897c19SJulian Elischer ip->i_effnlink = ip->i_nlink; 1747bd7e5f99SJohn Dyson bqrelse(bp); 1748df8bae1dSRodney W. Grimes 1749df8bae1dSRodney W. Grimes /* 1750df8bae1dSRodney W. Grimes * Initialize the vnode from the inode, check for aliases. 1751df8bae1dSRodney W. Grimes * Note that the underlying vnode may have changed. 1752df8bae1dSRodney W. Grimes */ 1753*e1db6897SKonstantin Belousov error = ufs_vinit(mp, I_IS_UFS1(ip) ? &ffs_fifoops1 : &ffs_fifoops2, 1754*e1db6897SKonstantin Belousov &vp); 1755c9671602SPoul-Henning Kamp if (error) { 1756df8bae1dSRodney W. Grimes vput(vp); 1757df8bae1dSRodney W. Grimes *vpp = NULL; 1758df8bae1dSRodney W. Grimes return (error); 1759df8bae1dSRodney W. Grimes } 1760de68347bSPoul-Henning Kamp 1761df8bae1dSRodney W. Grimes /* 17625c24d6eeSPoul-Henning Kamp * Finish inode initialization. 1763df8bae1dSRodney W. Grimes */ 176433fc3625SJohn Baldwin if (vp->v_type != VFIFO) { 176533fc3625SJohn Baldwin /* FFS supports shared locking for all files except fifos. */ 176633fc3625SJohn Baldwin VN_LOCK_ASHARE(vp); 176733fc3625SJohn Baldwin } 1768de68347bSPoul-Henning Kamp 1769df8bae1dSRodney W. Grimes /* 1770df8bae1dSRodney W. Grimes * Set up a generation number for this inode if it does not 1771df8bae1dSRodney W. Grimes * already have one. This should only happen on old filesystems. 1772df8bae1dSRodney W. Grimes */ 1773df8bae1dSRodney W. Grimes if (ip->i_gen == 0) { 177457d2ac2fSKevin Lo while (ip->i_gen == 0) 177557d2ac2fSKevin Lo ip->i_gen = arc4random(); 17761c85e6a3SKirk McKusick if ((vp->v_mount->mnt_flag & MNT_RDONLY) == 0) { 1777df8bae1dSRodney W. Grimes ip->i_flag |= IN_MODIFIED; 1778b403319bSAlexander Kabaev DIP_SET(ip, i_gen, ip->i_gen); 17791c85e6a3SKirk McKusick } 1780df8bae1dSRodney W. Grimes } 1781763bbd2fSRobert Watson #ifdef MAC 1782763bbd2fSRobert Watson if ((mp->mnt_flag & MNT_MULTILABEL) && ip->i_mode) { 1783763bbd2fSRobert Watson /* 1784763bbd2fSRobert Watson * If this vnode is already allocated, and we're running 1785763bbd2fSRobert Watson * multi-label, attempt to perform a label association 1786763bbd2fSRobert Watson * from the extended attributes on the inode. 1787763bbd2fSRobert Watson */ 178830d239bcSRobert Watson error = mac_vnode_associate_extattr(mp, vp); 1789763bbd2fSRobert Watson if (error) { 1790763bbd2fSRobert Watson /* ufs_inactive will release ip->i_devvp ref. */ 1791763bbd2fSRobert Watson vput(vp); 1792763bbd2fSRobert Watson *vpp = NULL; 1793763bbd2fSRobert Watson return (error); 1794763bbd2fSRobert Watson } 1795763bbd2fSRobert Watson } 1796763bbd2fSRobert Watson #endif 1797763bbd2fSRobert Watson 1798df8bae1dSRodney W. Grimes *vpp = vp; 1799df8bae1dSRodney W. Grimes return (0); 1800df8bae1dSRodney W. Grimes } 1801df8bae1dSRodney W. Grimes 1802df8bae1dSRodney W. Grimes /* 1803df8bae1dSRodney W. Grimes * File handle to vnode 1804df8bae1dSRodney W. Grimes * 1805df8bae1dSRodney W. Grimes * Have to be really careful about stale file handles: 1806df8bae1dSRodney W. Grimes * - check that the inode number is valid 1807abe53f7eSKirk McKusick * - for UFS2 check that the inode number is initialized 1808df8bae1dSRodney W. Grimes * - call ffs_vget() to get the locked inode 1809df8bae1dSRodney W. Grimes * - check for an unallocated inode (i_mode == 0) 1810df8bae1dSRodney W. Grimes * - check that the given client host has export rights and return 1811df8bae1dSRodney W. Grimes * those rights via. exflagsp and credanonp 1812df8bae1dSRodney W. Grimes */ 1813adf41577SPoul-Henning Kamp static int 1814694a586aSRick Macklem ffs_fhtovp(mp, fhp, flags, vpp) 181505f4ff5dSPoul-Henning Kamp struct mount *mp; 1816df8bae1dSRodney W. Grimes struct fid *fhp; 1817694a586aSRick Macklem int flags; 1818df8bae1dSRodney W. Grimes struct vnode **vpp; 1819df8bae1dSRodney W. Grimes { 182005f4ff5dSPoul-Henning Kamp struct ufid *ufhp; 1821abe53f7eSKirk McKusick struct ufsmount *ump; 1822df8bae1dSRodney W. Grimes struct fs *fs; 1823abe53f7eSKirk McKusick struct cg *cgp; 1824abe53f7eSKirk McKusick struct buf *bp; 1825abe53f7eSKirk McKusick ino_t ino; 1826abe53f7eSKirk McKusick u_int cg; 1827abe53f7eSKirk McKusick int error; 1828df8bae1dSRodney W. Grimes 1829df8bae1dSRodney W. Grimes ufhp = (struct ufid *)fhp; 1830abe53f7eSKirk McKusick ino = ufhp->ufid_ino; 1831abe53f7eSKirk McKusick ump = VFSTOUFS(mp); 1832abe53f7eSKirk McKusick fs = ump->um_fs; 1833abe53f7eSKirk McKusick if (ino < ROOTINO || ino >= fs->fs_ncg * fs->fs_ipg) 1834df8bae1dSRodney W. Grimes return (ESTALE); 1835abe53f7eSKirk McKusick /* 1836abe53f7eSKirk McKusick * Need to check if inode is initialized because UFS2 does lazy 1837abe53f7eSKirk McKusick * initialization and nfs_fhtovp can offer arbitrary inode numbers. 1838abe53f7eSKirk McKusick */ 1839abe53f7eSKirk McKusick if (fs->fs_magic != FS_UFS2_MAGIC) 1840abe53f7eSKirk McKusick return (ufs_fhtovp(mp, ufhp, flags, vpp)); 1841abe53f7eSKirk McKusick cg = ino_to_cg(fs, ino); 1842abe53f7eSKirk McKusick error = bread(ump->um_devvp, fsbtodb(fs, cgtod(fs, cg)), 1843abe53f7eSKirk McKusick (int)fs->fs_cgsize, NOCRED, &bp); 1844abe53f7eSKirk McKusick if (error) 1845abe53f7eSKirk McKusick return (error); 1846abe53f7eSKirk McKusick cgp = (struct cg *)bp->b_data; 1847abe53f7eSKirk McKusick if (!cg_chkmagic(cgp) || ino >= cg * fs->fs_ipg + cgp->cg_initediblk) { 1848abe53f7eSKirk McKusick brelse(bp); 1849abe53f7eSKirk McKusick return (ESTALE); 1850abe53f7eSKirk McKusick } 1851abe53f7eSKirk McKusick brelse(bp); 1852694a586aSRick Macklem return (ufs_fhtovp(mp, ufhp, flags, vpp)); 1853df8bae1dSRodney W. Grimes } 1854df8bae1dSRodney W. Grimes 1855df8bae1dSRodney W. Grimes /* 18565346934fSIan Dowse * Initialize the filesystem. 1857996c772fSJohn Dyson */ 1858996c772fSJohn Dyson static int 1859996c772fSJohn Dyson ffs_init(vfsp) 1860996c772fSJohn Dyson struct vfsconf *vfsp; 1861996c772fSJohn Dyson { 1862996c772fSJohn Dyson 18631848286aSEdward Tomasz Napierala ffs_susp_initialize(); 1864b1897c19SJulian Elischer softdep_initialize(); 1865996c772fSJohn Dyson return (ufs_init(vfsp)); 1866996c772fSJohn Dyson } 1867996c772fSJohn Dyson 1868996c772fSJohn Dyson /* 18695346934fSIan Dowse * Undo the work of ffs_init(). 18705346934fSIan Dowse */ 18715346934fSIan Dowse static int 18725346934fSIan Dowse ffs_uninit(vfsp) 18735346934fSIan Dowse struct vfsconf *vfsp; 18745346934fSIan Dowse { 18755346934fSIan Dowse int ret; 18765346934fSIan Dowse 18775346934fSIan Dowse ret = ufs_uninit(vfsp); 18785346934fSIan Dowse softdep_uninitialize(); 18791848286aSEdward Tomasz Napierala ffs_susp_uninitialize(); 18805346934fSIan Dowse return (ret); 18815346934fSIan Dowse } 18825346934fSIan Dowse 18835346934fSIan Dowse /* 1884df8bae1dSRodney W. Grimes * Write a superblock and associated information back to disk. 1885df8bae1dSRodney W. Grimes */ 18861a60c7fcSPawel Jakub Dawidek int 1887927a12aeSKirk McKusick ffs_sbupdate(ump, waitfor, suspended) 1888927a12aeSKirk McKusick struct ufsmount *ump; 1889df8bae1dSRodney W. Grimes int waitfor; 1890791dd2faSTor Egge int suspended; 1891df8bae1dSRodney W. Grimes { 1892927a12aeSKirk McKusick struct fs *fs = ump->um_fs; 18933ba649d7SJeff Roberson struct buf *sbbp; 189405f4ff5dSPoul-Henning Kamp struct buf *bp; 1895df8bae1dSRodney W. Grimes int blks; 1896f55ff3f3SIan Dowse void *space; 1897996c772fSJohn Dyson int i, size, error, allerror = 0; 1898df8bae1dSRodney W. Grimes 189974f3809aSKirk McKusick if (fs->fs_ronly == 1 && 1900927a12aeSKirk McKusick (ump->um_mountp->mnt_flag & (MNT_RDONLY | MNT_UPDATE)) != 1901927a12aeSKirk McKusick (MNT_RDONLY | MNT_UPDATE) && ump->um_fsckpid == 0) 190274f3809aSKirk McKusick panic("ffs_sbupdate: write read-only filesystem"); 1903996c772fSJohn Dyson /* 19043ba649d7SJeff Roberson * We use the superblock's buf to serialize calls to ffs_sbupdate(). 19053ba649d7SJeff Roberson */ 1906927a12aeSKirk McKusick sbbp = getblk(ump->um_devvp, btodb(fs->fs_sblockloc), 1907927a12aeSKirk McKusick (int)fs->fs_sbsize, 0, 0, 0); 19083ba649d7SJeff Roberson /* 1909996c772fSJohn Dyson * First write back the summary information. 1910996c772fSJohn Dyson */ 1911df8bae1dSRodney W. Grimes blks = howmany(fs->fs_cssize, fs->fs_fsize); 1912f55ff3f3SIan Dowse space = fs->fs_csp; 1913df8bae1dSRodney W. Grimes for (i = 0; i < blks; i += fs->fs_frag) { 1914df8bae1dSRodney W. Grimes size = fs->fs_bsize; 1915df8bae1dSRodney W. Grimes if (i + fs->fs_frag > blks) 1916df8bae1dSRodney W. Grimes size = (blks - i) * fs->fs_fsize; 1917927a12aeSKirk McKusick bp = getblk(ump->um_devvp, fsbtodb(fs, fs->fs_csaddr + i), 19187261f5f6SJeff Roberson size, 0, 0, 0); 1919df8bae1dSRodney W. Grimes bcopy(space, bp->b_data, (u_int)size); 1920f55ff3f3SIan Dowse space = (char *)space + size; 1921791dd2faSTor Egge if (suspended) 1922791dd2faSTor Egge bp->b_flags |= B_VALIDSUSPWRT; 1923996c772fSJohn Dyson if (waitfor != MNT_WAIT) 1924df8bae1dSRodney W. Grimes bawrite(bp); 19258aef1712SMatthew Dillon else if ((error = bwrite(bp)) != 0) 1926996c772fSJohn Dyson allerror = error; 1927df8bae1dSRodney W. Grimes } 1928996c772fSJohn Dyson /* 1929996c772fSJohn Dyson * Now write back the superblock itself. If any errors occurred 1930996c772fSJohn Dyson * up to this point, then fail so that the superblock avoids 1931996c772fSJohn Dyson * being written out as clean. 1932996c772fSJohn Dyson */ 19333ba649d7SJeff Roberson if (allerror) { 19343ba649d7SJeff Roberson brelse(sbbp); 1935996c772fSJohn Dyson return (allerror); 19363ba649d7SJeff Roberson } 19373ba649d7SJeff Roberson bp = sbbp; 193831574422SKirk McKusick if (fs->fs_magic == FS_UFS1_MAGIC && fs->fs_sblockloc != SBLOCK_UFS1 && 1939e9838c11SJohn-Mark Gurney (fs->fs_old_flags & FS_FLAGS_UPDATED) == 0) { 1940b60ee81eSKirk McKusick printf("WARNING: %s: correcting fs_sblockloc from %jd to %d\n", 1941fa5d33e2SKirk McKusick fs->fs_fsmnt, fs->fs_sblockloc, SBLOCK_UFS1); 1942fa5d33e2SKirk McKusick fs->fs_sblockloc = SBLOCK_UFS1; 1943fa5d33e2SKirk McKusick } 194431574422SKirk McKusick if (fs->fs_magic == FS_UFS2_MAGIC && fs->fs_sblockloc != SBLOCK_UFS2 && 1945e9838c11SJohn-Mark Gurney (fs->fs_old_flags & FS_FLAGS_UPDATED) == 0) { 1946b60ee81eSKirk McKusick printf("WARNING: %s: correcting fs_sblockloc from %jd to %d\n", 1947fa5d33e2SKirk McKusick fs->fs_fsmnt, fs->fs_sblockloc, SBLOCK_UFS2); 1948fa5d33e2SKirk McKusick fs->fs_sblockloc = SBLOCK_UFS2; 1949fa5d33e2SKirk McKusick } 1950b1897c19SJulian Elischer fs->fs_fmod = 0; 1951227ee8a1SPoul-Henning Kamp fs->fs_time = time_second; 1952519e3c3bSKirk McKusick if (MOUNTEDSOFTDEP(ump->um_mountp)) 1953927a12aeSKirk McKusick softdep_setup_sbupdate(ump, (struct fs *)bp->b_data, bp); 1954996c772fSJohn Dyson bcopy((caddr_t)fs, bp->b_data, (u_int)fs->fs_sbsize); 1955927a12aeSKirk McKusick ffs_oldfscompat_write((struct fs *)bp->b_data, ump); 1956791dd2faSTor Egge if (suspended) 1957791dd2faSTor Egge bp->b_flags |= B_VALIDSUSPWRT; 1958996c772fSJohn Dyson if (waitfor != MNT_WAIT) 1959996c772fSJohn Dyson bawrite(bp); 19608aef1712SMatthew Dillon else if ((error = bwrite(bp)) != 0) 1961996c772fSJohn Dyson allerror = error; 1962996c772fSJohn Dyson return (allerror); 1963df8bae1dSRodney W. Grimes } 1964d6fe88e4SPoul-Henning Kamp 1965d6fe88e4SPoul-Henning Kamp static int 1966d6fe88e4SPoul-Henning Kamp ffs_extattrctl(struct mount *mp, int cmd, struct vnode *filename_vp, 1967dfd233edSAttilio Rao int attrnamespace, const char *attrname) 1968d6fe88e4SPoul-Henning Kamp { 1969d6fe88e4SPoul-Henning Kamp 1970d6fe88e4SPoul-Henning Kamp #ifdef UFS_EXTATTR 1971d6fe88e4SPoul-Henning Kamp return (ufs_extattrctl(mp, cmd, filename_vp, attrnamespace, 1972dfd233edSAttilio Rao attrname)); 1973d6fe88e4SPoul-Henning Kamp #else 1974d6fe88e4SPoul-Henning Kamp return (vfs_stdextattrctl(mp, cmd, filename_vp, attrnamespace, 1975dfd233edSAttilio Rao attrname)); 1976d6fe88e4SPoul-Henning Kamp #endif 1977d6fe88e4SPoul-Henning Kamp } 1978975512a9SPoul-Henning Kamp 1979975512a9SPoul-Henning Kamp static void 1980975512a9SPoul-Henning Kamp ffs_ifree(struct ufsmount *ump, struct inode *ip) 1981975512a9SPoul-Henning Kamp { 1982975512a9SPoul-Henning Kamp 198336329289STim J. Robbins if (ump->um_fstype == UFS1 && ip->i_din1 != NULL) 1984aa4d7a8aSPoul-Henning Kamp uma_zfree(uma_ufs1, ip->i_din1); 198536329289STim J. Robbins else if (ip->i_din2 != NULL) 19868d721e87STim J. Robbins uma_zfree(uma_ufs2, ip->i_din2); 1987aa4d7a8aSPoul-Henning Kamp uma_zfree(uma_inode, ip); 1988975512a9SPoul-Henning Kamp } 19896e77a041SPoul-Henning Kamp 1990dd19a799SPoul-Henning Kamp static int dobkgrdwrite = 1; 1991dd19a799SPoul-Henning Kamp SYSCTL_INT(_debug, OID_AUTO, dobkgrdwrite, CTLFLAG_RW, &dobkgrdwrite, 0, 1992dd19a799SPoul-Henning Kamp "Do background writes (honoring the BV_BKGRDWRITE flag)?"); 1993dd19a799SPoul-Henning Kamp 1994dd19a799SPoul-Henning Kamp /* 1995dd19a799SPoul-Henning Kamp * Complete a background write started from bwrite. 1996dd19a799SPoul-Henning Kamp */ 1997dd19a799SPoul-Henning Kamp static void 1998dd19a799SPoul-Henning Kamp ffs_backgroundwritedone(struct buf *bp) 1999dd19a799SPoul-Henning Kamp { 2000204ec66dSJeff Roberson struct bufobj *bufobj; 2001dd19a799SPoul-Henning Kamp struct buf *origbp; 2002dd19a799SPoul-Henning Kamp 2003dd19a799SPoul-Henning Kamp /* 2004dd19a799SPoul-Henning Kamp * Find the original buffer that we are writing. 2005dd19a799SPoul-Henning Kamp */ 2006204ec66dSJeff Roberson bufobj = bp->b_bufobj; 2007204ec66dSJeff Roberson BO_LOCK(bufobj); 2008dd19a799SPoul-Henning Kamp if ((origbp = gbincore(bp->b_bufobj, bp->b_lblkno)) == NULL) 2009dd19a799SPoul-Henning Kamp panic("backgroundwritedone: lost buffer"); 2010b2c3df84SKonstantin Belousov 2011b2c3df84SKonstantin Belousov /* 2012b2c3df84SKonstantin Belousov * We should mark the cylinder group buffer origbp as 2013b2c3df84SKonstantin Belousov * dirty, to not loose the failed write. 2014b2c3df84SKonstantin Belousov */ 2015b2c3df84SKonstantin Belousov if ((bp->b_ioflags & BIO_ERROR) != 0) 2016b2c3df84SKonstantin Belousov origbp->b_vflags |= BV_BKGRDERR; 2017204ec66dSJeff Roberson BO_UNLOCK(bufobj); 2018dd19a799SPoul-Henning Kamp /* 2019dd19a799SPoul-Henning Kamp * Process dependencies then return any unfinished ones. 2020dd19a799SPoul-Henning Kamp */ 202126089666SJeff Roberson pbrelvp(bp); 2022b2c3df84SKonstantin Belousov if (!LIST_EMPTY(&bp->b_dep) && (bp->b_ioflags & BIO_ERROR) == 0) 2023dd19a799SPoul-Henning Kamp buf_complete(bp); 2024dd19a799SPoul-Henning Kamp #ifdef SOFTUPDATES 202504533fc6SXin LI if (!LIST_EMPTY(&bp->b_dep)) 2026dd19a799SPoul-Henning Kamp softdep_move_dependencies(bp, origbp); 2027dd19a799SPoul-Henning Kamp #endif 2028dd19a799SPoul-Henning Kamp /* 2029204ec66dSJeff Roberson * This buffer is marked B_NOCACHE so when it is released 2030204ec66dSJeff Roberson * by biodone it will be tossed. 2031dd19a799SPoul-Henning Kamp */ 2032dd19a799SPoul-Henning Kamp bp->b_flags |= B_NOCACHE; 2033ec9c9e73SAlan Cox bp->b_flags &= ~B_CACHE; 2034b2c3df84SKonstantin Belousov 2035b2c3df84SKonstantin Belousov /* 2036b2c3df84SKonstantin Belousov * Prevent brelse() from trying to keep and re-dirtying bp on 2037b2c3df84SKonstantin Belousov * errors. It causes b_bufobj dereference in 2038b2c3df84SKonstantin Belousov * bdirty()/reassignbuf(), and b_bufobj was cleared in 2039b2c3df84SKonstantin Belousov * pbrelvp() above. 2040b2c3df84SKonstantin Belousov */ 2041b2c3df84SKonstantin Belousov if ((bp->b_ioflags & BIO_ERROR) != 0) 2042b2c3df84SKonstantin Belousov bp->b_flags |= B_INVAL; 2043dd19a799SPoul-Henning Kamp bufdone(bp); 2044204ec66dSJeff Roberson BO_LOCK(bufobj); 2045dd19a799SPoul-Henning Kamp /* 2046dd19a799SPoul-Henning Kamp * Clear the BV_BKGRDINPROG flag in the original buffer 2047dd19a799SPoul-Henning Kamp * and awaken it if it is waiting for the write to complete. 2048dd19a799SPoul-Henning Kamp * If BV_BKGRDINPROG is not set in the original buffer it must 2049dd19a799SPoul-Henning Kamp * have been released and re-instantiated - which is not legal. 2050dd19a799SPoul-Henning Kamp */ 2051dd19a799SPoul-Henning Kamp KASSERT((origbp->b_vflags & BV_BKGRDINPROG), 2052dd19a799SPoul-Henning Kamp ("backgroundwritedone: lost buffer2")); 2053dd19a799SPoul-Henning Kamp origbp->b_vflags &= ~BV_BKGRDINPROG; 2054dd19a799SPoul-Henning Kamp if (origbp->b_vflags & BV_BKGRDWAIT) { 2055dd19a799SPoul-Henning Kamp origbp->b_vflags &= ~BV_BKGRDWAIT; 2056dd19a799SPoul-Henning Kamp wakeup(&origbp->b_xflags); 2057dd19a799SPoul-Henning Kamp } 2058204ec66dSJeff Roberson BO_UNLOCK(bufobj); 2059dd19a799SPoul-Henning Kamp } 2060dd19a799SPoul-Henning Kamp 2061dd19a799SPoul-Henning Kamp 2062dd19a799SPoul-Henning Kamp /* 2063dd19a799SPoul-Henning Kamp * Write, release buffer on completion. (Done by iodone 2064dd19a799SPoul-Henning Kamp * if async). Do not bother writing anything if the buffer 2065dd19a799SPoul-Henning Kamp * is invalid. 2066dd19a799SPoul-Henning Kamp * 2067dd19a799SPoul-Henning Kamp * Note that we set B_CACHE here, indicating that buffer is 2068dd19a799SPoul-Henning Kamp * fully valid and thus cacheable. This is true even of NFS 2069dd19a799SPoul-Henning Kamp * now so we set it generally. This could be set either here 2070dd19a799SPoul-Henning Kamp * or in biodone() since the I/O is synchronous. We put it 2071dd19a799SPoul-Henning Kamp * here. 2072dd19a799SPoul-Henning Kamp */ 2073dd19a799SPoul-Henning Kamp static int 2074dd19a799SPoul-Henning Kamp ffs_bufwrite(struct buf *bp) 2075dd19a799SPoul-Henning Kamp { 2076dd19a799SPoul-Henning Kamp struct buf *newbp; 2077dd19a799SPoul-Henning Kamp 2078dd19a799SPoul-Henning Kamp CTR3(KTR_BUF, "bufwrite(%p) vp %p flags %X", bp, bp->b_vp, bp->b_flags); 2079dd19a799SPoul-Henning Kamp if (bp->b_flags & B_INVAL) { 2080dd19a799SPoul-Henning Kamp brelse(bp); 2081dd19a799SPoul-Henning Kamp return (0); 2082dd19a799SPoul-Henning Kamp } 2083dd19a799SPoul-Henning Kamp 2084d638e093SAttilio Rao if (!BUF_ISLOCKED(bp)) 2085dd19a799SPoul-Henning Kamp panic("bufwrite: buffer is not busy???"); 2086dd19a799SPoul-Henning Kamp /* 2087dd19a799SPoul-Henning Kamp * If a background write is already in progress, delay 2088dd19a799SPoul-Henning Kamp * writing this block if it is asynchronous. Otherwise 2089dd19a799SPoul-Henning Kamp * wait for the background write to complete. 2090dd19a799SPoul-Henning Kamp */ 2091dd19a799SPoul-Henning Kamp BO_LOCK(bp->b_bufobj); 2092dd19a799SPoul-Henning Kamp if (bp->b_vflags & BV_BKGRDINPROG) { 2093dd19a799SPoul-Henning Kamp if (bp->b_flags & B_ASYNC) { 2094dd19a799SPoul-Henning Kamp BO_UNLOCK(bp->b_bufobj); 2095dd19a799SPoul-Henning Kamp bdwrite(bp); 2096dd19a799SPoul-Henning Kamp return (0); 2097dd19a799SPoul-Henning Kamp } 2098dd19a799SPoul-Henning Kamp bp->b_vflags |= BV_BKGRDWAIT; 209922a72260SJeff Roberson msleep(&bp->b_xflags, BO_LOCKPTR(bp->b_bufobj), PRIBIO, 210022a72260SJeff Roberson "bwrbg", 0); 2101dd19a799SPoul-Henning Kamp if (bp->b_vflags & BV_BKGRDINPROG) 2102dd19a799SPoul-Henning Kamp panic("bufwrite: still writing"); 2103dd19a799SPoul-Henning Kamp } 2104b2c3df84SKonstantin Belousov bp->b_vflags &= ~BV_BKGRDERR; 2105dd19a799SPoul-Henning Kamp BO_UNLOCK(bp->b_bufobj); 2106dd19a799SPoul-Henning Kamp 2107dd19a799SPoul-Henning Kamp /* 2108dd19a799SPoul-Henning Kamp * If this buffer is marked for background writing and we 2109dd19a799SPoul-Henning Kamp * do not have to wait for it, make a copy and write the 2110dd19a799SPoul-Henning Kamp * copy so as to leave this buffer ready for further use. 2111dd19a799SPoul-Henning Kamp * 2112dd19a799SPoul-Henning Kamp * This optimization eats a lot of memory. If we have a page 2113dd19a799SPoul-Henning Kamp * or buffer shortfall we can't do it. 2114dd19a799SPoul-Henning Kamp */ 2115dd19a799SPoul-Henning Kamp if (dobkgrdwrite && (bp->b_xflags & BX_BKGRDWRITE) && 2116dd19a799SPoul-Henning Kamp (bp->b_flags & B_ASYNC) && 2117dd19a799SPoul-Henning Kamp !vm_page_count_severe() && 2118dd19a799SPoul-Henning Kamp !buf_dirty_count_severe()) { 2119dd19a799SPoul-Henning Kamp KASSERT(bp->b_iodone == NULL, 2120dd19a799SPoul-Henning Kamp ("bufwrite: needs chained iodone (%p)", bp->b_iodone)); 2121dd19a799SPoul-Henning Kamp 2122dd19a799SPoul-Henning Kamp /* get a new block */ 2123c1d8b5e8SKonstantin Belousov newbp = geteblk(bp->b_bufsize, GB_NOWAIT_BD); 2124c1d8b5e8SKonstantin Belousov if (newbp == NULL) 2125c1d8b5e8SKonstantin Belousov goto normal_write; 2126dd19a799SPoul-Henning Kamp 2127fade8dd7SJeff Roberson KASSERT(buf_mapped(bp), ("Unmapped cg")); 2128dd19a799SPoul-Henning Kamp memcpy(newbp->b_data, bp->b_data, bp->b_bufsize); 2129dd19a799SPoul-Henning Kamp BO_LOCK(bp->b_bufobj); 2130dd19a799SPoul-Henning Kamp bp->b_vflags |= BV_BKGRDINPROG; 2131dd19a799SPoul-Henning Kamp BO_UNLOCK(bp->b_bufobj); 213226089666SJeff Roberson newbp->b_xflags |= BX_BKGRDMARKER; 213326089666SJeff Roberson newbp->b_lblkno = bp->b_lblkno; 2134dd19a799SPoul-Henning Kamp newbp->b_blkno = bp->b_blkno; 2135dd19a799SPoul-Henning Kamp newbp->b_offset = bp->b_offset; 2136dd19a799SPoul-Henning Kamp newbp->b_iodone = ffs_backgroundwritedone; 2137dd19a799SPoul-Henning Kamp newbp->b_flags |= B_ASYNC; 2138dd19a799SPoul-Henning Kamp newbp->b_flags &= ~B_INVAL; 213926089666SJeff Roberson pbgetvp(bp->b_vp, newbp); 2140dd19a799SPoul-Henning Kamp 2141dd19a799SPoul-Henning Kamp #ifdef SOFTUPDATES 2142113db2ddSJeff Roberson /* 2143113db2ddSJeff Roberson * Move over the dependencies. If there are rollbacks, 2144113db2ddSJeff Roberson * leave the parent buffer dirtied as it will need to 2145113db2ddSJeff Roberson * be written again. 2146113db2ddSJeff Roberson */ 2147113db2ddSJeff Roberson if (LIST_EMPTY(&bp->b_dep) || 2148113db2ddSJeff Roberson softdep_move_dependencies(bp, newbp) == 0) 2149113db2ddSJeff Roberson bundirty(bp); 2150113db2ddSJeff Roberson #else 2151113db2ddSJeff Roberson bundirty(bp); 2152dd19a799SPoul-Henning Kamp #endif 2153dd19a799SPoul-Henning Kamp 2154dd19a799SPoul-Henning Kamp /* 215526089666SJeff Roberson * Initiate write on the copy, release the original. The 215626089666SJeff Roberson * BKGRDINPROG flag prevents it from going away until 215726089666SJeff Roberson * the background write completes. 2158dd19a799SPoul-Henning Kamp */ 2159dd19a799SPoul-Henning Kamp bqrelse(bp); 2160dd19a799SPoul-Henning Kamp bp = newbp; 2161113db2ddSJeff Roberson } else 2162113db2ddSJeff Roberson /* Mark the buffer clean */ 2163113db2ddSJeff Roberson bundirty(bp); 2164113db2ddSJeff Roberson 2165dd19a799SPoul-Henning Kamp 2166dd19a799SPoul-Henning Kamp /* Let the normal bufwrite do the rest for us */ 2167c1d8b5e8SKonstantin Belousov normal_write: 21689248a827STor Egge return (bufwrite(bp)); 2169dd19a799SPoul-Henning Kamp } 2170dd19a799SPoul-Henning Kamp 2171dd19a799SPoul-Henning Kamp 21728dd56505SPoul-Henning Kamp static void 21736e77a041SPoul-Henning Kamp ffs_geom_strategy(struct bufobj *bo, struct buf *bp) 21746e77a041SPoul-Henning Kamp { 2175153910e0SJeff Roberson struct vnode *vp; 2176153910e0SJeff Roberson int error; 21777de3839dSTor Egge struct buf *tbp; 2178113db2ddSJeff Roberson int nocopy; 21796e77a041SPoul-Henning Kamp 2180153910e0SJeff Roberson vp = bo->__bo_vnode; 2181153910e0SJeff Roberson if (bp->b_iocmd == BIO_WRITE) { 2182153910e0SJeff Roberson if ((bp->b_flags & B_VALIDSUSPWRT) == 0 && 2183153910e0SJeff Roberson bp->b_vp != NULL && bp->b_vp->v_mount != NULL && 2184153910e0SJeff Roberson (bp->b_vp->v_mount->mnt_kern_flag & MNTK_SUSPENDED) != 0) 2185153910e0SJeff Roberson panic("ffs_geom_strategy: bad I/O"); 2186113db2ddSJeff Roberson nocopy = bp->b_flags & B_NOCOPY; 2187113db2ddSJeff Roberson bp->b_flags &= ~(B_VALIDSUSPWRT | B_NOCOPY); 2188113db2ddSJeff Roberson if ((vp->v_vflag & VV_COPYONWRITE) && nocopy == 0 && 21897de3839dSTor Egge vp->v_rdev->si_snapdata != NULL) { 21907de3839dSTor Egge if ((bp->b_flags & B_CLUSTER) != 0) { 2191868bb88fSTor Egge runningbufwakeup(bp); 21927de3839dSTor Egge TAILQ_FOREACH(tbp, &bp->b_cluster.cluster_head, 21937de3839dSTor Egge b_cluster.cluster_entry) { 21947de3839dSTor Egge error = ffs_copyonwrite(vp, tbp); 21957de3839dSTor Egge if (error != 0 && 2196153910e0SJeff Roberson error != EOPNOTSUPP) { 2197153910e0SJeff Roberson bp->b_error = error; 2198153910e0SJeff Roberson bp->b_ioflags |= BIO_ERROR; 2199153910e0SJeff Roberson bufdone(bp); 2200153910e0SJeff Roberson return; 2201153910e0SJeff Roberson } 2202153910e0SJeff Roberson } 2203868bb88fSTor Egge bp->b_runningbufspace = bp->b_bufsize; 22045bd65606SJohn Baldwin atomic_add_long(&runningbufspace, 2205868bb88fSTor Egge bp->b_runningbufspace); 22067de3839dSTor Egge } else { 22077de3839dSTor Egge error = ffs_copyonwrite(vp, bp); 22087de3839dSTor Egge if (error != 0 && error != EOPNOTSUPP) { 22097de3839dSTor Egge bp->b_error = error; 22107de3839dSTor Egge bp->b_ioflags |= BIO_ERROR; 22117de3839dSTor Egge bufdone(bp); 22127de3839dSTor Egge return; 22137de3839dSTor Egge } 22147de3839dSTor Egge } 22157de3839dSTor Egge } 22167de3839dSTor Egge #ifdef SOFTUPDATES 22177de3839dSTor Egge if ((bp->b_flags & B_CLUSTER) != 0) { 22187de3839dSTor Egge TAILQ_FOREACH(tbp, &bp->b_cluster.cluster_head, 22197de3839dSTor Egge b_cluster.cluster_entry) { 222004533fc6SXin LI if (!LIST_EMPTY(&tbp->b_dep)) 22217de3839dSTor Egge buf_start(tbp); 22227de3839dSTor Egge } 22237de3839dSTor Egge } else { 222404533fc6SXin LI if (!LIST_EMPTY(&bp->b_dep)) 22257de3839dSTor Egge buf_start(bp); 22267de3839dSTor Egge } 22277de3839dSTor Egge 22287de3839dSTor Egge #endif 22297de3839dSTor Egge } 223043920011SPoul-Henning Kamp g_vfs_strategy(bo, bp); 22316e77a041SPoul-Henning Kamp } 223252dfc8d7SKonstantin Belousov 22331848286aSEdward Tomasz Napierala int 22341848286aSEdward Tomasz Napierala ffs_own_mount(const struct mount *mp) 22351848286aSEdward Tomasz Napierala { 22361848286aSEdward Tomasz Napierala 22371848286aSEdward Tomasz Napierala if (mp->mnt_op == &ufs_vfsops) 22381848286aSEdward Tomasz Napierala return (1); 22391848286aSEdward Tomasz Napierala return (0); 22401848286aSEdward Tomasz Napierala } 22411848286aSEdward Tomasz Napierala 224252dfc8d7SKonstantin Belousov #ifdef DDB 2243cf058082SBrooks Davis #ifdef SOFTUPDATES 224452dfc8d7SKonstantin Belousov 2245519e3c3bSKirk McKusick /* defined in ffs_softdep.c */ 2246519e3c3bSKirk McKusick extern void db_print_ffs(struct ufsmount *ump); 224752dfc8d7SKonstantin Belousov 224852dfc8d7SKonstantin Belousov DB_SHOW_COMMAND(ffs, db_show_ffs) 224952dfc8d7SKonstantin Belousov { 225052dfc8d7SKonstantin Belousov struct mount *mp; 225152dfc8d7SKonstantin Belousov struct ufsmount *ump; 225252dfc8d7SKonstantin Belousov 225352dfc8d7SKonstantin Belousov if (have_addr) { 225452dfc8d7SKonstantin Belousov ump = VFSTOUFS((struct mount *)addr); 225552dfc8d7SKonstantin Belousov db_print_ffs(ump); 225652dfc8d7SKonstantin Belousov return; 225752dfc8d7SKonstantin Belousov } 225852dfc8d7SKonstantin Belousov 225952dfc8d7SKonstantin Belousov TAILQ_FOREACH(mp, &mountlist, mnt_list) { 226052dfc8d7SKonstantin Belousov if (!strcmp(mp->mnt_stat.f_fstypename, ufs_vfsconf.vfc_name)) 226152dfc8d7SKonstantin Belousov db_print_ffs(VFSTOUFS(mp)); 226252dfc8d7SKonstantin Belousov } 226352dfc8d7SKonstantin Belousov } 226452dfc8d7SKonstantin Belousov 2265cf058082SBrooks Davis #endif /* SOFTUPDATES */ 226652dfc8d7SKonstantin Belousov #endif /* DDB */ 2267