160727d8bSWarner Losh /*- 251369649SPedro F. Giffuni * SPDX-License-Identifier: BSD-3-Clause 351369649SPedro F. Giffuni * 4df8bae1dSRodney W. Grimes * Copyright (c) 1989, 1991, 1993, 1994 5df8bae1dSRodney W. Grimes * The Regents of the University of California. All rights reserved. 6df8bae1dSRodney W. Grimes * 7df8bae1dSRodney W. Grimes * Redistribution and use in source and binary forms, with or without 8df8bae1dSRodney W. Grimes * modification, are permitted provided that the following conditions 9df8bae1dSRodney W. Grimes * are met: 10df8bae1dSRodney W. Grimes * 1. Redistributions of source code must retain the above copyright 11df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer. 12df8bae1dSRodney W. Grimes * 2. Redistributions in binary form must reproduce the above copyright 13df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer in the 14df8bae1dSRodney W. Grimes * documentation and/or other materials provided with the distribution. 15fbbd9655SWarner Losh * 3. Neither the name of the University nor the names of its contributors 16df8bae1dSRodney W. Grimes * may be used to endorse or promote products derived from this software 17df8bae1dSRodney W. Grimes * without specific prior written permission. 18df8bae1dSRodney W. Grimes * 19df8bae1dSRodney W. Grimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 20df8bae1dSRodney W. Grimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 21df8bae1dSRodney W. Grimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 22df8bae1dSRodney W. Grimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 23df8bae1dSRodney W. Grimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 24df8bae1dSRodney W. Grimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 25df8bae1dSRodney W. Grimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 26df8bae1dSRodney W. Grimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 27df8bae1dSRodney W. Grimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 28df8bae1dSRodney W. Grimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 29df8bae1dSRodney W. Grimes * SUCH DAMAGE. 30df8bae1dSRodney W. Grimes * 31996c772fSJohn Dyson * @(#)ffs_vfsops.c 8.31 (Berkeley) 5/20/95 32df8bae1dSRodney W. Grimes */ 33df8bae1dSRodney W. Grimes 34f4636c59SDavid E. O'Brien #include <sys/cdefs.h> 35f4636c59SDavid E. O'Brien __FBSDID("$FreeBSD$"); 36f4636c59SDavid E. O'Brien 3701733a9bSGarrett Wollman #include "opt_quota.h" 38516081f2SRobert Watson #include "opt_ufs.h" 396e77a041SPoul-Henning Kamp #include "opt_ffs.h" 4052dfc8d7SKonstantin Belousov #include "opt_ddb.h" 4101733a9bSGarrett Wollman 42df8bae1dSRodney W. Grimes #include <sys/param.h> 43df8bae1dSRodney W. Grimes #include <sys/systm.h> 44df8bae1dSRodney W. Grimes #include <sys/namei.h> 45acd3428bSRobert Watson #include <sys/priv.h> 46df8bae1dSRodney W. Grimes #include <sys/proc.h> 47c79dff0fSKonstantin Belousov #include <sys/taskqueue.h> 48df8bae1dSRodney W. Grimes #include <sys/kernel.h> 49df8bae1dSRodney W. Grimes #include <sys/vnode.h> 50df8bae1dSRodney W. Grimes #include <sys/mount.h> 519626b608SPoul-Henning Kamp #include <sys/bio.h> 52df8bae1dSRodney W. Grimes #include <sys/buf.h> 5381bca6ddSKATO Takenori #include <sys/conf.h> 543ac4d1efSBruce Evans #include <sys/fcntl.h> 551848286aSEdward Tomasz Napierala #include <sys/ioccom.h> 56df8bae1dSRodney W. Grimes #include <sys/malloc.h> 571b367556SJason Evans #include <sys/mutex.h> 5822a72260SJeff Roberson #include <sys/rwlock.h> 599ed01c32SGleb Smirnoff #include <sys/vmmeter.h> 60a18b1f1dSJason Evans 61aed55708SRobert Watson #include <security/mac/mac_framework.h> 62aed55708SRobert Watson 63a96da1c3SConrad Meyer #include <ufs/ufs/dir.h> 64a64ed089SRobert Watson #include <ufs/ufs/extattr.h> 651a60c7fcSPawel Jakub Dawidek #include <ufs/ufs/gjournal.h> 66df8bae1dSRodney W. Grimes #include <ufs/ufs/quota.h> 67df8bae1dSRodney W. Grimes #include <ufs/ufs/ufsmount.h> 68df8bae1dSRodney W. Grimes #include <ufs/ufs/inode.h> 69df8bae1dSRodney W. Grimes #include <ufs/ufs/ufs_extern.h> 70df8bae1dSRodney W. Grimes 71df8bae1dSRodney W. Grimes #include <ufs/ffs/fs.h> 72df8bae1dSRodney W. Grimes #include <ufs/ffs/ffs_extern.h> 73df8bae1dSRodney W. Grimes 74f6b04d2bSDavid Greenman #include <vm/vm.h> 75aa4d7a8aSPoul-Henning Kamp #include <vm/uma.h> 76f6b04d2bSDavid Greenman #include <vm/vm_page.h> 77f6b04d2bSDavid Greenman 7843920011SPoul-Henning Kamp #include <geom/geom.h> 7943920011SPoul-Henning Kamp #include <geom/geom_vfs.h> 8043920011SPoul-Henning Kamp 8152dfc8d7SKonstantin Belousov #include <ddb/ddb.h> 8252dfc8d7SKonstantin Belousov 83adf41577SPoul-Henning Kamp static uma_zone_t uma_inode, uma_ufs1, uma_ufs2; 8455166637SPoul-Henning Kamp 85975512a9SPoul-Henning Kamp static int ffs_mountfs(struct vnode *, struct mount *, struct thread *); 861c85e6a3SKirk McKusick static void ffs_oldfscompat_read(struct fs *, struct ufsmount *, 871c85e6a3SKirk McKusick ufs2_daddr_t); 88975512a9SPoul-Henning Kamp static void ffs_ifree(struct ufsmount *ump, struct inode *ip); 89a988a5c6SKonstantin Belousov static int ffs_sync_lazy(struct mount *mp); 90a988a5c6SKonstantin Belousov 919bf1a756SPoul-Henning Kamp static vfs_init_t ffs_init; 929bf1a756SPoul-Henning Kamp static vfs_uninit_t ffs_uninit; 93d6fe88e4SPoul-Henning Kamp static vfs_extattrctl_t ffs_extattrctl; 9420a92a18SPoul-Henning Kamp static vfs_cmount_t ffs_cmount; 95adf41577SPoul-Henning Kamp static vfs_unmount_t ffs_unmount; 9620a92a18SPoul-Henning Kamp static vfs_mount_t ffs_mount; 97adf41577SPoul-Henning Kamp static vfs_statfs_t ffs_statfs; 98adf41577SPoul-Henning Kamp static vfs_fhtovp_t ffs_fhtovp; 99adf41577SPoul-Henning Kamp static vfs_sync_t ffs_sync; 100df8bae1dSRodney W. Grimes 101303b270bSEivind Eklund static struct vfsops ufs_vfsops = { 1027652131bSPoul-Henning Kamp .vfs_extattrctl = ffs_extattrctl, 1037652131bSPoul-Henning Kamp .vfs_fhtovp = ffs_fhtovp, 1047652131bSPoul-Henning Kamp .vfs_init = ffs_init, 10520a92a18SPoul-Henning Kamp .vfs_mount = ffs_mount, 10620a92a18SPoul-Henning Kamp .vfs_cmount = ffs_cmount, 1077652131bSPoul-Henning Kamp .vfs_quotactl = ufs_quotactl, 1087652131bSPoul-Henning Kamp .vfs_root = ufs_root, 1097652131bSPoul-Henning Kamp .vfs_statfs = ffs_statfs, 1107652131bSPoul-Henning Kamp .vfs_sync = ffs_sync, 1117652131bSPoul-Henning Kamp .vfs_uninit = ffs_uninit, 1127652131bSPoul-Henning Kamp .vfs_unmount = ffs_unmount, 1137652131bSPoul-Henning Kamp .vfs_vget = ffs_vget, 1142814d5baSKonstantin Belousov .vfs_susp_clean = process_deferred_inactive, 115df8bae1dSRodney W. Grimes }; 116df8bae1dSRodney W. Grimes 1178994ca3cSBruce Evans VFS_SET(ufs_vfsops, ufs, 0); 1185fe6d2beSPawel Jakub Dawidek MODULE_VERSION(ufs, 1); 119c901836cSGarrett Wollman 1206e77a041SPoul-Henning Kamp static b_strategy_t ffs_geom_strategy; 121dd19a799SPoul-Henning Kamp static b_write_t ffs_bufwrite; 1226e77a041SPoul-Henning Kamp 1236e77a041SPoul-Henning Kamp static struct buf_ops ffs_ops = { 1246e77a041SPoul-Henning Kamp .bop_name = "FFS", 125dd19a799SPoul-Henning Kamp .bop_write = ffs_bufwrite, 1266e77a041SPoul-Henning Kamp .bop_strategy = ffs_geom_strategy, 1276ef8480aSPoul-Henning Kamp .bop_sync = bufsync, 1282cc7d26fSKonstantin Belousov #ifdef NO_FFS_SNAPSHOT 1292cc7d26fSKonstantin Belousov .bop_bdflush = bufbdflush, 1302cc7d26fSKonstantin Belousov #else 1312cc7d26fSKonstantin Belousov .bop_bdflush = ffs_bdflush, 1322cc7d26fSKonstantin Belousov #endif 1336e77a041SPoul-Henning Kamp }; 1346e77a041SPoul-Henning Kamp 1350b962648SAndriy Gapon /* 1360b962648SAndriy Gapon * Note that userquota and groupquota options are not currently used 1370b962648SAndriy Gapon * by UFS/FFS code and generally mount(8) does not pass those options 1380b962648SAndriy Gapon * from userland, but they can be passed by loader(8) via 1390b962648SAndriy Gapon * vfs.root.mountfrom.options. 1400b962648SAndriy Gapon */ 141d952ba1bSJohn Baldwin static const char *ffs_opts[] = { "acls", "async", "noatime", "noclusterr", 1420b962648SAndriy Gapon "noclusterw", "noexec", "export", "force", "from", "groupquota", 143927a12aeSKirk McKusick "multilabel", "nfsv4acls", "fsckpid", "snapshot", "nosuid", "suiddir", 144927a12aeSKirk McKusick "nosymfollow", "sync", "union", "userquota", NULL }; 14520a92a18SPoul-Henning Kamp 1465e8c582aSPoul-Henning Kamp static int 147dfd233edSAttilio Rao ffs_mount(struct mount *mp) 148df8bae1dSRodney W. Grimes { 14920a92a18SPoul-Henning Kamp struct vnode *devvp; 150dfd233edSAttilio Rao struct thread *td; 151f7a3729cSKevin Lo struct ufsmount *ump = NULL; 15205f4ff5dSPoul-Henning Kamp struct fs *fs; 153927a12aeSKirk McKusick pid_t fsckpid = 0; 154714b7df5SKonstantin Belousov int error, error1, flags; 155cc672d35SKirk McKusick uint64_t mntorflags; 15615bc6b2bSEdward Tomasz Napierala accmode_t accmode; 1575e8c582aSPoul-Henning Kamp struct nameidata ndp; 15820a92a18SPoul-Henning Kamp char *fspec; 159df8bae1dSRodney W. Grimes 160dfd233edSAttilio Rao td = curthread; 16120a92a18SPoul-Henning Kamp if (vfs_filteropt(mp->mnt_optnew, ffs_opts)) 16220a92a18SPoul-Henning Kamp return (EINVAL); 163aa4d7a8aSPoul-Henning Kamp if (uma_inode == NULL) { 164aa4d7a8aSPoul-Henning Kamp uma_inode = uma_zcreate("FFS inode", 165aa4d7a8aSPoul-Henning Kamp sizeof(struct inode), NULL, NULL, NULL, NULL, 166aa4d7a8aSPoul-Henning Kamp UMA_ALIGN_PTR, 0); 167aa4d7a8aSPoul-Henning Kamp uma_ufs1 = uma_zcreate("FFS1 dinode", 168aa4d7a8aSPoul-Henning Kamp sizeof(struct ufs1_dinode), NULL, NULL, NULL, NULL, 169aa4d7a8aSPoul-Henning Kamp UMA_ALIGN_PTR, 0); 170aa4d7a8aSPoul-Henning Kamp uma_ufs2 = uma_zcreate("FFS2 dinode", 171aa4d7a8aSPoul-Henning Kamp sizeof(struct ufs2_dinode), NULL, NULL, NULL, NULL, 172aa4d7a8aSPoul-Henning Kamp UMA_ALIGN_PTR, 0); 173aa4d7a8aSPoul-Henning Kamp } 1748d02a378SPawel Jakub Dawidek 1750b962648SAndriy Gapon vfs_deleteopt(mp->mnt_optnew, "groupquota"); 1760b962648SAndriy Gapon vfs_deleteopt(mp->mnt_optnew, "userquota"); 1770b962648SAndriy Gapon 17820a92a18SPoul-Henning Kamp fspec = vfs_getopts(mp->mnt_optnew, "from", &error); 17951ac12abSPoul-Henning Kamp if (error) 180f2a2857bSKirk McKusick return (error); 1812b14f991SJulian Elischer 1825da56ddbSTor Egge mntorflags = 0; 18326f59b64SCraig Rodrigues if (vfs_getopt(mp->mnt_optnew, "acls", NULL, NULL) == 0) 1845da56ddbSTor Egge mntorflags |= MNT_ACLS; 18526f59b64SCraig Rodrigues 186fb77e0afSCraig Rodrigues if (vfs_getopt(mp->mnt_optnew, "snapshot", NULL, NULL) == 0) { 1875da56ddbSTor Egge mntorflags |= MNT_SNAPSHOT; 188fb77e0afSCraig Rodrigues /* 189fb77e0afSCraig Rodrigues * Once we have set the MNT_SNAPSHOT flag, do not 190fb77e0afSCraig Rodrigues * persist "snapshot" in the options list. 191fb77e0afSCraig Rodrigues */ 192fb77e0afSCraig Rodrigues vfs_deleteopt(mp->mnt_optnew, "snapshot"); 193fb77e0afSCraig Rodrigues vfs_deleteopt(mp->mnt_opt, "snapshot"); 194fb77e0afSCraig Rodrigues } 19526f59b64SCraig Rodrigues 196927a12aeSKirk McKusick if (vfs_getopt(mp->mnt_optnew, "fsckpid", NULL, NULL) == 0 && 197927a12aeSKirk McKusick vfs_scanopt(mp->mnt_optnew, "fsckpid", "%d", &fsckpid) == 1) { 198927a12aeSKirk McKusick /* 199927a12aeSKirk McKusick * Once we have set the restricted PID, do not 200927a12aeSKirk McKusick * persist "fsckpid" in the options list. 201927a12aeSKirk McKusick */ 202927a12aeSKirk McKusick vfs_deleteopt(mp->mnt_optnew, "fsckpid"); 203927a12aeSKirk McKusick vfs_deleteopt(mp->mnt_opt, "fsckpid"); 204927a12aeSKirk McKusick if (mp->mnt_flag & MNT_UPDATE) { 205927a12aeSKirk McKusick if (VFSTOUFS(mp)->um_fs->fs_ronly == 0 && 206927a12aeSKirk McKusick vfs_flagopt(mp->mnt_optnew, "ro", NULL, 0) == 0) { 207b60ee81eSKirk McKusick vfs_mount_error(mp, 208b60ee81eSKirk McKusick "Checker enable: Must be read-only"); 209927a12aeSKirk McKusick return (EINVAL); 210927a12aeSKirk McKusick } 211927a12aeSKirk McKusick } else if (vfs_flagopt(mp->mnt_optnew, "ro", NULL, 0) == 0) { 212b60ee81eSKirk McKusick vfs_mount_error(mp, 213b60ee81eSKirk McKusick "Checker enable: Must be read-only"); 214927a12aeSKirk McKusick return (EINVAL); 215927a12aeSKirk McKusick } 216927a12aeSKirk McKusick /* Set to -1 if we are done */ 217927a12aeSKirk McKusick if (fsckpid == 0) 218927a12aeSKirk McKusick fsckpid = -1; 219927a12aeSKirk McKusick } 220927a12aeSKirk McKusick 2219340fc72SEdward Tomasz Napierala if (vfs_getopt(mp->mnt_optnew, "nfsv4acls", NULL, NULL) == 0) { 2229340fc72SEdward Tomasz Napierala if (mntorflags & MNT_ACLS) { 223b60ee81eSKirk McKusick vfs_mount_error(mp, 224b60ee81eSKirk McKusick "\"acls\" and \"nfsv4acls\" options " 225b60ee81eSKirk McKusick "are mutually exclusive"); 2269340fc72SEdward Tomasz Napierala return (EINVAL); 2279340fc72SEdward Tomasz Napierala } 2289340fc72SEdward Tomasz Napierala mntorflags |= MNT_NFS4ACLS; 2299340fc72SEdward Tomasz Napierala } 2309340fc72SEdward Tomasz Napierala 2315da56ddbSTor Egge MNT_ILOCK(mp); 23261996181SEdward Tomasz Napierala mp->mnt_flag |= mntorflags; 2335da56ddbSTor Egge MNT_IUNLOCK(mp); 234df8bae1dSRodney W. Grimes /* 235df8bae1dSRodney W. Grimes * If updating, check whether changing from read-only to 236df8bae1dSRodney W. Grimes * read/write; if there is no device name, that's all we do. 237df8bae1dSRodney W. Grimes */ 238df8bae1dSRodney W. Grimes if (mp->mnt_flag & MNT_UPDATE) { 239df8bae1dSRodney W. Grimes ump = VFSTOUFS(mp); 240df8bae1dSRodney W. Grimes fs = ump->um_fs; 24126cf9c3bSPeter Wemm devvp = ump->um_devvp; 242927a12aeSKirk McKusick if (fsckpid == -1 && ump->um_fsckpid > 0) { 243927a12aeSKirk McKusick if ((error = ffs_flushfiles(mp, WRITECLOSE, td)) != 0 || 244927a12aeSKirk McKusick (error = ffs_sbupdate(ump, MNT_WAIT, 0)) != 0) 245927a12aeSKirk McKusick return (error); 246927a12aeSKirk McKusick g_topology_lock(); 247927a12aeSKirk McKusick /* 248927a12aeSKirk McKusick * Return to normal read-only mode. 249927a12aeSKirk McKusick */ 250927a12aeSKirk McKusick error = g_access(ump->um_cp, 0, -1, 0); 251927a12aeSKirk McKusick g_topology_unlock(); 252927a12aeSKirk McKusick ump->um_fsckpid = 0; 253927a12aeSKirk McKusick } 25420a92a18SPoul-Henning Kamp if (fs->fs_ronly == 0 && 25520a92a18SPoul-Henning Kamp vfs_flagopt(mp->mnt_optnew, "ro", NULL, 0)) { 2566fecb4e4SKonstantin Belousov /* 2576fecb4e4SKonstantin Belousov * Flush any dirty data and suspend filesystem. 2586fecb4e4SKonstantin Belousov */ 259f2a2857bSKirk McKusick if ((error = vn_start_write(NULL, &mp, V_WAIT)) != 0) 260f2a2857bSKirk McKusick return (error); 261895b3782SKonstantin Belousov error = vfs_write_suspend_umnt(mp); 262895b3782SKonstantin Belousov if (error != 0) 2639ab73fd1SKirk McKusick return (error); 264cd600596SKirk McKusick /* 265cd600596SKirk McKusick * Check for and optionally get rid of files open 266cd600596SKirk McKusick * for writing. 267cd600596SKirk McKusick */ 268df8bae1dSRodney W. Grimes flags = WRITECLOSE; 269df8bae1dSRodney W. Grimes if (mp->mnt_flag & MNT_FORCE) 270df8bae1dSRodney W. Grimes flags |= FORCECLOSE; 271fddf7baeSKirk McKusick if (MOUNTEDSOFTDEP(mp)) { 272b40ce416SJulian Elischer error = softdep_flushfiles(mp, flags, td); 273b1897c19SJulian Elischer } else { 274b40ce416SJulian Elischer error = ffs_flushfiles(mp, flags, td); 275df8bae1dSRodney W. Grimes } 276f2a2857bSKirk McKusick if (error) { 277ddd6b3fcSKonstantin Belousov vfs_write_resume(mp, 0); 278f2a2857bSKirk McKusick return (error); 279b1897c19SJulian Elischer } 2809ccb939eSKirk McKusick if (fs->fs_pendingblocks != 0 || 2819ccb939eSKirk McKusick fs->fs_pendinginodes != 0) { 282b60ee81eSKirk McKusick printf("WARNING: %s Update error: blocks %jd " 283b60ee81eSKirk McKusick "files %d\n", fs->fs_fsmnt, 2841c85e6a3SKirk McKusick (intmax_t)fs->fs_pendingblocks, 2859ccb939eSKirk McKusick fs->fs_pendinginodes); 2869ccb939eSKirk McKusick fs->fs_pendingblocks = 0; 2879ccb939eSKirk McKusick fs->fs_pendinginodes = 0; 2889ccb939eSKirk McKusick } 2891a6a6610SKirk McKusick if ((fs->fs_flags & (FS_UNCLEAN | FS_NEEDSFSCK)) == 0) 290f2a2857bSKirk McKusick fs->fs_clean = 1; 291791dd2faSTor Egge if ((error = ffs_sbupdate(ump, MNT_WAIT, 0)) != 0) { 292f2a2857bSKirk McKusick fs->fs_ronly = 0; 293f2a2857bSKirk McKusick fs->fs_clean = 0; 294ddd6b3fcSKonstantin Belousov vfs_write_resume(mp, 0); 295f2a2857bSKirk McKusick return (error); 2962b14f991SJulian Elischer } 297fddf7baeSKirk McKusick if (MOUNTEDSOFTDEP(mp)) 2989420dc62SKirk McKusick softdep_unmount(mp); 29943920011SPoul-Henning Kamp g_topology_lock(); 3008795189cSKirk McKusick /* 3018795189cSKirk McKusick * Drop our write and exclusive access. 3028795189cSKirk McKusick */ 3038795189cSKirk McKusick g_access(ump->um_cp, 0, -1, -1); 30443920011SPoul-Henning Kamp g_topology_unlock(); 30520a92a18SPoul-Henning Kamp fs->fs_ronly = 1; 3065da56ddbSTor Egge MNT_ILOCK(mp); 30720a92a18SPoul-Henning Kamp mp->mnt_flag |= MNT_RDONLY; 3085da56ddbSTor Egge MNT_IUNLOCK(mp); 3096fecb4e4SKonstantin Belousov /* 3106fecb4e4SKonstantin Belousov * Allow the writers to note that filesystem 3116fecb4e4SKonstantin Belousov * is ro now. 3126fecb4e4SKonstantin Belousov */ 313ddd6b3fcSKonstantin Belousov vfs_write_resume(mp, 0); 314f2a2857bSKirk McKusick } 315f2a2857bSKirk McKusick if ((mp->mnt_flag & MNT_RELOAD) && 3161848286aSEdward Tomasz Napierala (error = ffs_reload(mp, td, 0)) != 0) 317f2a2857bSKirk McKusick return (error); 31820a92a18SPoul-Henning Kamp if (fs->fs_ronly && 31920a92a18SPoul-Henning Kamp !vfs_flagopt(mp->mnt_optnew, "ro", NULL, 0)) { 320c9b99213SBruce Evans /* 321927a12aeSKirk McKusick * If we are running a checker, do not allow upgrade. 322927a12aeSKirk McKusick */ 323927a12aeSKirk McKusick if (ump->um_fsckpid > 0) { 324b60ee81eSKirk McKusick vfs_mount_error(mp, 325b60ee81eSKirk McKusick "Active checker, cannot upgrade to write"); 326927a12aeSKirk McKusick return (EINVAL); 327927a12aeSKirk McKusick } 328927a12aeSKirk McKusick /* 329c9b99213SBruce Evans * If upgrade to read-write by non-root, then verify 330c9b99213SBruce Evans * that user has necessary permissions on the device. 331c9b99213SBruce Evans */ 332cb05b60aSAttilio Rao vn_lock(devvp, LK_EXCLUSIVE | LK_RETRY); 333acd3428bSRobert Watson error = VOP_ACCESS(devvp, VREAD | VWRITE, 334acd3428bSRobert Watson td->td_ucred, td); 335acd3428bSRobert Watson if (error) 336acd3428bSRobert Watson error = priv_check(td, PRIV_VFS_MOUNT_PERM); 337acd3428bSRobert Watson if (error) { 33822db15c0SAttilio Rao VOP_UNLOCK(devvp, 0); 339c9b99213SBruce Evans return (error); 340c9b99213SBruce Evans } 34122db15c0SAttilio Rao VOP_UNLOCK(devvp, 0); 3427e58bfacSBruce Evans fs->fs_flags &= ~FS_UNCLEAN; 3430922cce6SBruce Evans if (fs->fs_clean == 0) { 3447e58bfacSBruce Evans fs->fs_flags |= FS_UNCLEAN; 345812b1d41SKirk McKusick if ((mp->mnt_flag & MNT_FORCE) || 346113db2ddSJeff Roberson ((fs->fs_flags & 347113db2ddSJeff Roberson (FS_SUJ | FS_NEEDSFSCK)) == 0 && 3481a6a6610SKirk McKusick (fs->fs_flags & FS_DOSOFTDEP))) { 349b60ee81eSKirk McKusick printf("WARNING: %s was not properly " 350b60ee81eSKirk McKusick "dismounted\n", fs->fs_fsmnt); 3510922cce6SBruce Evans } else { 352b60ee81eSKirk McKusick vfs_mount_error(mp, 353b60ee81eSKirk McKusick "R/W mount of %s denied. %s.%s", 354b60ee81eSKirk McKusick fs->fs_fsmnt, 355b60ee81eSKirk McKusick "Filesystem is not clean - run fsck", 356b60ee81eSKirk McKusick (fs->fs_flags & FS_SUJ) == 0 ? "" : 357b60ee81eSKirk McKusick " Forced mount will invalidate" 358b60ee81eSKirk McKusick " journal contents"); 359f2a2857bSKirk McKusick return (EPERM); 3600922cce6SBruce Evans } 3610922cce6SBruce Evans } 36240c340aaSPoul-Henning Kamp g_topology_lock(); 36340c340aaSPoul-Henning Kamp /* 3648795189cSKirk McKusick * Request exclusive write access. 36540c340aaSPoul-Henning Kamp */ 36640c340aaSPoul-Henning Kamp error = g_access(ump->um_cp, 0, 1, 1); 36740c340aaSPoul-Henning Kamp g_topology_unlock(); 36840c340aaSPoul-Henning Kamp if (error) 36940c340aaSPoul-Henning Kamp return (error); 370f2a2857bSKirk McKusick if ((error = vn_start_write(NULL, &mp, V_WAIT)) != 0) 371f2a2857bSKirk McKusick return (error); 372f2a2857bSKirk McKusick fs->fs_ronly = 0; 3735da56ddbSTor Egge MNT_ILOCK(mp); 37420a92a18SPoul-Henning Kamp mp->mnt_flag &= ~MNT_RDONLY; 3755da56ddbSTor Egge MNT_IUNLOCK(mp); 376113db2ddSJeff Roberson fs->fs_mtime = time_second; 37726cf9c3bSPeter Wemm /* check to see if we need to start softdep */ 378f2a2857bSKirk McKusick if ((fs->fs_flags & FS_DOSOFTDEP) && 379a854ed98SJohn Baldwin (error = softdep_mount(devvp, mp, fs, td->td_ucred))){ 380f2a2857bSKirk McKusick vn_finished_write(mp); 381f2a2857bSKirk McKusick return (error); 38226cf9c3bSPeter Wemm } 383113db2ddSJeff Roberson fs->fs_clean = 0; 384113db2ddSJeff Roberson if ((error = ffs_sbupdate(ump, MNT_WAIT, 0)) != 0) { 385113db2ddSJeff Roberson vn_finished_write(mp); 386113db2ddSJeff Roberson return (error); 387113db2ddSJeff Roberson } 388f2a2857bSKirk McKusick if (fs->fs_snapinum[0] != 0) 389f2a2857bSKirk McKusick ffs_snapshot_mount(mp); 390f2a2857bSKirk McKusick vn_finished_write(mp); 3911469eec8SDavid Greenman } 392c11d2981SJulian Elischer /* 393c11d2981SJulian Elischer * Soft updates is incompatible with "async", 394c11d2981SJulian Elischer * so if we are doing softupdates stop the user 395c11d2981SJulian Elischer * from setting the async flag in an update. 396c11d2981SJulian Elischer * Softdep_mount() clears it in an initial mount 397c11d2981SJulian Elischer * or ro->rw remount. 398c11d2981SJulian Elischer */ 399fddf7baeSKirk McKusick if (MOUNTEDSOFTDEP(mp)) { 4005da56ddbSTor Egge /* XXX: Reset too late ? */ 4015da56ddbSTor Egge MNT_ILOCK(mp); 402c11d2981SJulian Elischer mp->mnt_flag &= ~MNT_ASYNC; 4035da56ddbSTor Egge MNT_IUNLOCK(mp); 4045da56ddbSTor Egge } 405df8bae1dSRodney W. Grimes /* 40639cfb239SPawel Jakub Dawidek * Keep MNT_ACLS flag if it is stored in superblock. 40739cfb239SPawel Jakub Dawidek */ 4085da56ddbSTor Egge if ((fs->fs_flags & FS_ACLS) != 0) { 4095da56ddbSTor Egge /* XXX: Set too late ? */ 4105da56ddbSTor Egge MNT_ILOCK(mp); 41139cfb239SPawel Jakub Dawidek mp->mnt_flag |= MNT_ACLS; 4125da56ddbSTor Egge MNT_IUNLOCK(mp); 4135da56ddbSTor Egge } 414cea90362SCraig Rodrigues 4159340fc72SEdward Tomasz Napierala if ((fs->fs_flags & FS_NFS4ACLS) != 0) { 4169340fc72SEdward Tomasz Napierala /* XXX: Set too late ? */ 4179340fc72SEdward Tomasz Napierala MNT_ILOCK(mp); 4189340fc72SEdward Tomasz Napierala mp->mnt_flag |= MNT_NFS4ACLS; 4199340fc72SEdward Tomasz Napierala MNT_IUNLOCK(mp); 4209340fc72SEdward Tomasz Napierala } 421927a12aeSKirk McKusick /* 422927a12aeSKirk McKusick * If this is a request from fsck to clean up the filesystem, 423927a12aeSKirk McKusick * then allow the specified pid to proceed. 424927a12aeSKirk McKusick */ 425927a12aeSKirk McKusick if (fsckpid > 0) { 426927a12aeSKirk McKusick if (ump->um_fsckpid != 0) { 427b60ee81eSKirk McKusick vfs_mount_error(mp, 428b60ee81eSKirk McKusick "Active checker already running on %s", 429927a12aeSKirk McKusick fs->fs_fsmnt); 430927a12aeSKirk McKusick return (EINVAL); 431927a12aeSKirk McKusick } 432fddf7baeSKirk McKusick KASSERT(MOUNTEDSOFTDEP(mp) == 0, 433927a12aeSKirk McKusick ("soft updates enabled on read-only file system")); 434927a12aeSKirk McKusick g_topology_lock(); 435927a12aeSKirk McKusick /* 436927a12aeSKirk McKusick * Request write access. 437927a12aeSKirk McKusick */ 438927a12aeSKirk McKusick error = g_access(ump->um_cp, 0, 1, 0); 439927a12aeSKirk McKusick g_topology_unlock(); 440927a12aeSKirk McKusick if (error) { 441b60ee81eSKirk McKusick vfs_mount_error(mp, 442b60ee81eSKirk McKusick "Checker activation failed on %s", 443927a12aeSKirk McKusick fs->fs_fsmnt); 444927a12aeSKirk McKusick return (error); 445927a12aeSKirk McKusick } 446927a12aeSKirk McKusick ump->um_fsckpid = fsckpid; 447927a12aeSKirk McKusick if (fs->fs_snapinum[0] != 0) 448927a12aeSKirk McKusick ffs_snapshot_mount(mp); 449927a12aeSKirk McKusick fs->fs_mtime = time_second; 450927a12aeSKirk McKusick fs->fs_fmod = 1; 451927a12aeSKirk McKusick fs->fs_clean = 0; 452927a12aeSKirk McKusick (void) ffs_sbupdate(ump, MNT_WAIT, 0); 453927a12aeSKirk McKusick } 4549340fc72SEdward Tomasz Napierala 455f2a2857bSKirk McKusick /* 456f2a2857bSKirk McKusick * If this is a snapshot request, take the snapshot. 457f2a2857bSKirk McKusick */ 458f2a2857bSKirk McKusick if (mp->mnt_flag & MNT_SNAPSHOT) 45920a92a18SPoul-Henning Kamp return (ffs_snapshot(mp, fspec)); 460714b7df5SKonstantin Belousov 461714b7df5SKonstantin Belousov /* 462714b7df5SKonstantin Belousov * Must not call namei() while owning busy ref. 463714b7df5SKonstantin Belousov */ 464714b7df5SKonstantin Belousov vfs_unbusy(mp); 465df8bae1dSRodney W. Grimes } 4662b14f991SJulian Elischer 467df8bae1dSRodney W. Grimes /* 468df8bae1dSRodney W. Grimes * Not an update, or updating the name: look up the name 469e9827c6dSBruce Evans * and verify that it refers to a sensible disk device. 470df8bae1dSRodney W. Grimes */ 471fdedad76SSuleiman Souhlal NDINIT(&ndp, LOOKUP, FOLLOW | LOCKLEAF, UIO_SYSSPACE, fspec, td); 472714b7df5SKonstantin Belousov error = namei(&ndp); 473714b7df5SKonstantin Belousov if ((mp->mnt_flag & MNT_UPDATE) != 0) { 474714b7df5SKonstantin Belousov /* 475714b7df5SKonstantin Belousov * Unmount does not start if MNT_UPDATE is set. Mount 476714b7df5SKonstantin Belousov * update busies mp before setting MNT_UPDATE. We 477714b7df5SKonstantin Belousov * must be able to retain our busy ref succesfully, 478714b7df5SKonstantin Belousov * without sleep. 479714b7df5SKonstantin Belousov */ 480714b7df5SKonstantin Belousov error1 = vfs_busy(mp, MBF_NOWAIT); 481714b7df5SKonstantin Belousov MPASS(error1 == 0); 482714b7df5SKonstantin Belousov } 483714b7df5SKonstantin Belousov if (error != 0) 484f2a2857bSKirk McKusick return (error); 4855e8c582aSPoul-Henning Kamp NDFREE(&ndp, NDF_ONLY_PNBUF); 4865e8c582aSPoul-Henning Kamp devvp = ndp.ni_vp; 487f2a2857bSKirk McKusick if (!vn_isdisk(devvp, &error)) { 488fdedad76SSuleiman Souhlal vput(devvp); 489f2a2857bSKirk McKusick return (error); 490f2a2857bSKirk McKusick } 491c9b99213SBruce Evans 492c9b99213SBruce Evans /* 493c9b99213SBruce Evans * If mount by non-root, then verify that user has necessary 494c9b99213SBruce Evans * permissions on the device. 495c9b99213SBruce Evans */ 49615bc6b2bSEdward Tomasz Napierala accmode = VREAD; 497c9b99213SBruce Evans if ((mp->mnt_flag & MNT_RDONLY) == 0) 49815bc6b2bSEdward Tomasz Napierala accmode |= VWRITE; 49915bc6b2bSEdward Tomasz Napierala error = VOP_ACCESS(devvp, accmode, td->td_ucred, td); 500acd3428bSRobert Watson if (error) 501acd3428bSRobert Watson error = priv_check(td, PRIV_VFS_MOUNT_PERM); 502acd3428bSRobert Watson if (error) { 503c9b99213SBruce Evans vput(devvp); 504c9b99213SBruce Evans return (error); 505c9b99213SBruce Evans } 506c9b99213SBruce Evans 5072b14f991SJulian Elischer if (mp->mnt_flag & MNT_UPDATE) { 5082b14f991SJulian Elischer /* 509f2a2857bSKirk McKusick * Update only 510f2a2857bSKirk McKusick * 5113e425b96SJulian Elischer * If it's not the same vnode, or at least the same device 5123e425b96SJulian Elischer * then it's not correct. 5132b14f991SJulian Elischer */ 5142b14f991SJulian Elischer 51543920011SPoul-Henning Kamp if (devvp->v_rdev != ump->um_devvp->v_rdev) 516f2a2857bSKirk McKusick error = EINVAL; /* needs translation */ 517fdedad76SSuleiman Souhlal vput(devvp); 518f2a2857bSKirk McKusick if (error) 519f2a2857bSKirk McKusick return (error); 5202b14f991SJulian Elischer } else { 5212b14f991SJulian Elischer /* 522f2a2857bSKirk McKusick * New mount 5232b14f991SJulian Elischer * 524f2a2857bSKirk McKusick * We need the name for the mount point (also used for 525f2a2857bSKirk McKusick * "last mounted on") copied in. If an error occurs, 526f2a2857bSKirk McKusick * the mount point is discarded by the upper level code. 52798cbffd7SKonstantin Belousov * Note that vfs_mount_alloc() populates f_mntonname for us. 528f2a2857bSKirk McKusick */ 529975512a9SPoul-Henning Kamp if ((error = ffs_mountfs(devvp, mp, td)) != 0) { 530f2a2857bSKirk McKusick vrele(devvp); 531f2a2857bSKirk McKusick return (error); 532f2a2857bSKirk McKusick } 533927a12aeSKirk McKusick if (fsckpid > 0) { 534fddf7baeSKirk McKusick KASSERT(MOUNTEDSOFTDEP(mp) == 0, 535927a12aeSKirk McKusick ("soft updates enabled on read-only file system")); 536927a12aeSKirk McKusick ump = VFSTOUFS(mp); 537927a12aeSKirk McKusick fs = ump->um_fs; 538927a12aeSKirk McKusick g_topology_lock(); 539927a12aeSKirk McKusick /* 540927a12aeSKirk McKusick * Request write access. 541927a12aeSKirk McKusick */ 542927a12aeSKirk McKusick error = g_access(ump->um_cp, 0, 1, 0); 543927a12aeSKirk McKusick g_topology_unlock(); 544927a12aeSKirk McKusick if (error) { 545b60ee81eSKirk McKusick printf("WARNING: %s: Checker activation " 546b60ee81eSKirk McKusick "failed\n", fs->fs_fsmnt); 547927a12aeSKirk McKusick } else { 548927a12aeSKirk McKusick ump->um_fsckpid = fsckpid; 549927a12aeSKirk McKusick if (fs->fs_snapinum[0] != 0) 550927a12aeSKirk McKusick ffs_snapshot_mount(mp); 551927a12aeSKirk McKusick fs->fs_mtime = time_second; 552927a12aeSKirk McKusick fs->fs_clean = 0; 553927a12aeSKirk McKusick (void) ffs_sbupdate(ump, MNT_WAIT, 0); 554927a12aeSKirk McKusick } 555927a12aeSKirk McKusick } 556f2a2857bSKirk McKusick } 55720a92a18SPoul-Henning Kamp vfs_mountedfrom(mp, fspec); 558f2a2857bSKirk McKusick return (0); 5592b14f991SJulian Elischer } 5602b14f991SJulian Elischer 561df8bae1dSRodney W. Grimes /* 56220a92a18SPoul-Henning Kamp * Compatibility with old mount system call. 56320a92a18SPoul-Henning Kamp */ 56420a92a18SPoul-Henning Kamp 56520a92a18SPoul-Henning Kamp static int 566cc672d35SKirk McKusick ffs_cmount(struct mntarg *ma, void *data, uint64_t flags) 56720a92a18SPoul-Henning Kamp { 56820a92a18SPoul-Henning Kamp struct ufs_args args; 569d0cc54f3SKonstantin Belousov struct export_args exp; 57020a92a18SPoul-Henning Kamp int error; 57120a92a18SPoul-Henning Kamp 57220a92a18SPoul-Henning Kamp if (data == NULL) 57320a92a18SPoul-Henning Kamp return (EINVAL); 57420a92a18SPoul-Henning Kamp error = copyin(data, &args, sizeof args); 57520a92a18SPoul-Henning Kamp if (error) 57620a92a18SPoul-Henning Kamp return (error); 577d0cc54f3SKonstantin Belousov vfs_oexport_conv(&args.export, &exp); 57820a92a18SPoul-Henning Kamp 57920a92a18SPoul-Henning Kamp ma = mount_argsu(ma, "from", args.fspec, MAXPATHLEN); 580d0cc54f3SKonstantin Belousov ma = mount_arg(ma, "export", &exp, sizeof(exp)); 58120a92a18SPoul-Henning Kamp error = kernel_mount(ma, flags); 58220a92a18SPoul-Henning Kamp 58320a92a18SPoul-Henning Kamp return (error); 58420a92a18SPoul-Henning Kamp } 58520a92a18SPoul-Henning Kamp 58620a92a18SPoul-Henning Kamp /* 587df8bae1dSRodney W. Grimes * Reload all incore data for a filesystem (used after running fsck on 5881848286aSEdward Tomasz Napierala * the root filesystem and finding things to fix). If the 'force' flag 5891848286aSEdward Tomasz Napierala * is 0, the filesystem must be mounted read-only. 590df8bae1dSRodney W. Grimes * 591df8bae1dSRodney W. Grimes * Things to do to update the mount: 592df8bae1dSRodney W. Grimes * 1) invalidate all cached meta-data. 593df8bae1dSRodney W. Grimes * 2) re-read superblock from disk. 594df8bae1dSRodney W. Grimes * 3) re-read summary information from disk. 595df8bae1dSRodney W. Grimes * 4) invalidate all inactive vnodes. 596df426577SKonstantin Belousov * 5) clear MNTK_SUSPEND2 and MNTK_SUSPENDED flags, allowing secondary 597df426577SKonstantin Belousov * writers, if requested. 598df426577SKonstantin Belousov * 6) invalidate all cached file data. 599df426577SKonstantin Belousov * 7) re-read inode data for all active vnodes. 600df8bae1dSRodney W. Grimes */ 6011848286aSEdward Tomasz Napierala int 602df426577SKonstantin Belousov ffs_reload(struct mount *mp, struct thread *td, int flags) 603df8bae1dSRodney W. Grimes { 60482be0a5aSTor Egge struct vnode *vp, *mvp, *devvp; 605df8bae1dSRodney W. Grimes struct inode *ip; 606f55ff3f3SIan Dowse void *space; 607df8bae1dSRodney W. Grimes struct buf *bp; 608996c772fSJohn Dyson struct fs *fs, *newfs; 6093ba649d7SJeff Roberson struct ufsmount *ump; 6101c85e6a3SKirk McKusick ufs2_daddr_t sblockloc; 611ad544726SKirk McKusick int i, blks, error; 612ad544726SKirk McKusick u_long size; 613996c772fSJohn Dyson int32_t *lp; 614df8bae1dSRodney W. Grimes 6153ba649d7SJeff Roberson ump = VFSTOUFS(mp); 6161848286aSEdward Tomasz Napierala 6171848286aSEdward Tomasz Napierala MNT_ILOCK(mp); 618df426577SKonstantin Belousov if ((mp->mnt_flag & MNT_RDONLY) == 0 && (flags & FFSR_FORCE) == 0) { 6191848286aSEdward Tomasz Napierala MNT_IUNLOCK(mp); 6201848286aSEdward Tomasz Napierala return (EINVAL); 6211848286aSEdward Tomasz Napierala } 6221848286aSEdward Tomasz Napierala MNT_IUNLOCK(mp); 6231848286aSEdward Tomasz Napierala 624df8bae1dSRodney W. Grimes /* 625df8bae1dSRodney W. Grimes * Step 1: invalidate all cached meta-data. 626df8bae1dSRodney W. Grimes */ 6272b14f991SJulian Elischer devvp = VFSTOUFS(mp)->um_devvp; 628cb05b60aSAttilio Rao vn_lock(devvp, LK_EXCLUSIVE | LK_RETRY); 6290d7935fdSAttilio Rao if (vinvalbuf(devvp, 0, 0, 0) != 0) 630df8bae1dSRodney W. Grimes panic("ffs_reload: dirty1"); 63122db15c0SAttilio Rao VOP_UNLOCK(devvp, 0); 63295e5e988SJohn Dyson 633df8bae1dSRodney W. Grimes /* 634df8bae1dSRodney W. Grimes * Step 2: re-read superblock from disk. 635df8bae1dSRodney W. Grimes */ 6361c85e6a3SKirk McKusick fs = VFSTOUFS(mp)->um_fs; 637ada981b2SKirk McKusick if ((error = bread(devvp, btodb(fs->fs_sblockloc), fs->fs_sbsize, 6381c85e6a3SKirk McKusick NOCRED, &bp)) != 0) 639df8bae1dSRodney W. Grimes return (error); 640996c772fSJohn Dyson newfs = (struct fs *)bp->b_data; 6411c85e6a3SKirk McKusick if ((newfs->fs_magic != FS_UFS1_MAGIC && 6421c85e6a3SKirk McKusick newfs->fs_magic != FS_UFS2_MAGIC) || 6431c85e6a3SKirk McKusick newfs->fs_bsize > MAXBSIZE || 644996c772fSJohn Dyson newfs->fs_bsize < sizeof(struct fs)) { 645df8bae1dSRodney W. Grimes brelse(bp); 646df8bae1dSRodney W. Grimes return (EIO); /* XXX needs translation */ 647df8bae1dSRodney W. Grimes } 648996c772fSJohn Dyson /* 649996c772fSJohn Dyson * Copy pointer fields back into superblock before copying in XXX 650996c772fSJohn Dyson * new superblock. These should really be in the ufsmount. XXX 651996c772fSJohn Dyson * Note that important parameters (eg fs_ncg) are unchanged. 652996c772fSJohn Dyson */ 653f55ff3f3SIan Dowse newfs->fs_csp = fs->fs_csp; 654996c772fSJohn Dyson newfs->fs_maxcluster = fs->fs_maxcluster; 6555d69bac4SIan Dowse newfs->fs_contigdirs = fs->fs_contigdirs; 656143a5346SIan Dowse newfs->fs_active = fs->fs_active; 6571848286aSEdward Tomasz Napierala newfs->fs_ronly = fs->fs_ronly; 6581c85e6a3SKirk McKusick sblockloc = fs->fs_sblockloc; 659996c772fSJohn Dyson bcopy(newfs, fs, (u_int)fs->fs_sbsize); 660df8bae1dSRodney W. Grimes brelse(bp); 661996c772fSJohn Dyson mp->mnt_maxsymlinklen = fs->fs_maxsymlinklen; 6621c85e6a3SKirk McKusick ffs_oldfscompat_read(fs, VFSTOUFS(mp), sblockloc); 6633ba649d7SJeff Roberson UFS_LOCK(ump); 6649ccb939eSKirk McKusick if (fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) { 665b60ee81eSKirk McKusick printf("WARNING: %s: reload pending error: blocks %jd " 666b60ee81eSKirk McKusick "files %d\n", fs->fs_fsmnt, (intmax_t)fs->fs_pendingblocks, 6671c85e6a3SKirk McKusick fs->fs_pendinginodes); 6689ccb939eSKirk McKusick fs->fs_pendingblocks = 0; 6699ccb939eSKirk McKusick fs->fs_pendinginodes = 0; 6709ccb939eSKirk McKusick } 6713ba649d7SJeff Roberson UFS_UNLOCK(ump); 672996c772fSJohn Dyson 673df8bae1dSRodney W. Grimes /* 674df8bae1dSRodney W. Grimes * Step 3: re-read summary information from disk. 675df8bae1dSRodney W. Grimes */ 6762b028c25SEdward Tomasz Napierala size = fs->fs_cssize; 6772b028c25SEdward Tomasz Napierala blks = howmany(size, fs->fs_fsize); 6782b028c25SEdward Tomasz Napierala if (fs->fs_contigsumsize > 0) 6792b028c25SEdward Tomasz Napierala size += fs->fs_ncg * sizeof(int32_t); 6802b028c25SEdward Tomasz Napierala size += fs->fs_ncg * sizeof(u_int8_t); 6812b028c25SEdward Tomasz Napierala free(fs->fs_csp, M_UFSMNT); 682ad544726SKirk McKusick space = malloc(size, M_UFSMNT, M_WAITOK); 6832b028c25SEdward Tomasz Napierala fs->fs_csp = space; 684df8bae1dSRodney W. Grimes for (i = 0; i < blks; i += fs->fs_frag) { 685df8bae1dSRodney W. Grimes size = fs->fs_bsize; 686df8bae1dSRodney W. Grimes if (i + fs->fs_frag > blks) 687df8bae1dSRodney W. Grimes size = (blks - i) * fs->fs_fsize; 688c9671602SPoul-Henning Kamp error = bread(devvp, fsbtodb(fs, fs->fs_csaddr + i), size, 689c9671602SPoul-Henning Kamp NOCRED, &bp); 690c9671602SPoul-Henning Kamp if (error) 691df8bae1dSRodney W. Grimes return (error); 692f55ff3f3SIan Dowse bcopy(bp->b_data, space, (u_int)size); 693f55ff3f3SIan Dowse space = (char *)space + size; 694df8bae1dSRodney W. Grimes brelse(bp); 695df8bae1dSRodney W. Grimes } 696996c772fSJohn Dyson /* 697996c772fSJohn Dyson * We no longer know anything about clusters per cylinder group. 698996c772fSJohn Dyson */ 699996c772fSJohn Dyson if (fs->fs_contigsumsize > 0) { 70072b8ff1cSEdward Tomasz Napierala fs->fs_maxcluster = lp = space; 701996c772fSJohn Dyson for (i = 0; i < fs->fs_ncg; i++) 702996c772fSJohn Dyson *lp++ = fs->fs_contigsumsize; 70372b8ff1cSEdward Tomasz Napierala space = lp; 704996c772fSJohn Dyson } 70572b8ff1cSEdward Tomasz Napierala size = fs->fs_ncg * sizeof(u_int8_t); 70672b8ff1cSEdward Tomasz Napierala fs->fs_contigdirs = (u_int8_t *)space; 70772b8ff1cSEdward Tomasz Napierala bzero(fs->fs_contigdirs, size); 708df426577SKonstantin Belousov if ((flags & FFSR_UNSUSPEND) != 0) { 709df426577SKonstantin Belousov MNT_ILOCK(mp); 710df426577SKonstantin Belousov mp->mnt_kern_flag &= ~(MNTK_SUSPENDED | MNTK_SUSPEND2); 711df426577SKonstantin Belousov wakeup(&mp->mnt_flag); 712df426577SKonstantin Belousov MNT_IUNLOCK(mp); 713df426577SKonstantin Belousov } 714996c772fSJohn Dyson 715df8bae1dSRodney W. Grimes loop: 71671469bb3SKirk McKusick MNT_VNODE_FOREACH_ALL(vp, mp, mvp) { 717df8bae1dSRodney W. Grimes /* 7181848286aSEdward Tomasz Napierala * Skip syncer vnode. 7191848286aSEdward Tomasz Napierala */ 7201848286aSEdward Tomasz Napierala if (vp->v_type == VNON) { 7211848286aSEdward Tomasz Napierala VI_UNLOCK(vp); 7221848286aSEdward Tomasz Napierala continue; 7231848286aSEdward Tomasz Napierala } 7241848286aSEdward Tomasz Napierala /* 725fe68abe2SJeff Roberson * Step 4: invalidate all cached file data. 726df8bae1dSRodney W. Grimes */ 727b40ce416SJulian Elischer if (vget(vp, LK_EXCLUSIVE | LK_INTERLOCK, td)) { 72871469bb3SKirk McKusick MNT_VNODE_FOREACH_ALL_ABORT(mp, mvp); 729df8bae1dSRodney W. Grimes goto loop; 730996c772fSJohn Dyson } 7310d7935fdSAttilio Rao if (vinvalbuf(vp, 0, 0, 0)) 732df8bae1dSRodney W. Grimes panic("ffs_reload: dirty2"); 733df8bae1dSRodney W. Grimes /* 734fe68abe2SJeff Roberson * Step 5: re-read inode data for all active vnodes. 735df8bae1dSRodney W. Grimes */ 736df8bae1dSRodney W. Grimes ip = VTOI(vp); 737c9671602SPoul-Henning Kamp error = 738df8bae1dSRodney W. Grimes bread(devvp, fsbtodb(fs, ino_to_fsba(fs, ip->i_number)), 739c9671602SPoul-Henning Kamp (int)fs->fs_bsize, NOCRED, &bp); 740c9671602SPoul-Henning Kamp if (error) { 74122db15c0SAttilio Rao VOP_UNLOCK(vp, 0); 74245d45c6cSAlexander Kabaev vrele(vp); 74371469bb3SKirk McKusick MNT_VNODE_FOREACH_ALL_ABORT(mp, mvp); 744df8bae1dSRodney W. Grimes return (error); 745df8bae1dSRodney W. Grimes } 746de6ba7c0SPoul-Henning Kamp ffs_load_inode(bp, ip, fs, ip->i_number); 747b1897c19SJulian Elischer ip->i_effnlink = ip->i_nlink; 748df8bae1dSRodney W. Grimes brelse(bp); 74922db15c0SAttilio Rao VOP_UNLOCK(vp, 0); 750cb9ddc80SAlexander Kabaev vrele(vp); 751df8bae1dSRodney W. Grimes } 752df8bae1dSRodney W. Grimes return (0); 753df8bae1dSRodney W. Grimes } 754df8bae1dSRodney W. Grimes 7551c85e6a3SKirk McKusick /* 7561c85e6a3SKirk McKusick * Possible superblock locations ordered from most to least likely. 7571c85e6a3SKirk McKusick */ 7581c85e6a3SKirk McKusick static int sblock_try[] = SBLOCKSEARCH; 7595819ab3fSKirk McKusick 760df8bae1dSRodney W. Grimes /* 761df8bae1dSRodney W. Grimes * Common code for mount and mountroot 762df8bae1dSRodney W. Grimes */ 763975512a9SPoul-Henning Kamp static int 764975512a9SPoul-Henning Kamp ffs_mountfs(devvp, mp, td) 76505f4ff5dSPoul-Henning Kamp struct vnode *devvp; 766df8bae1dSRodney W. Grimes struct mount *mp; 767b40ce416SJulian Elischer struct thread *td; 768df8bae1dSRodney W. Grimes { 76905f4ff5dSPoul-Henning Kamp struct ufsmount *ump; 770df8bae1dSRodney W. Grimes struct buf *bp; 77105f4ff5dSPoul-Henning Kamp struct fs *fs; 77289c9c53dSPoul-Henning Kamp struct cdev *dev; 773f55ff3f3SIan Dowse void *space; 7741c85e6a3SKirk McKusick ufs2_daddr_t sblockloc; 775ad544726SKirk McKusick int error, i, blks, len, ronly; 776ad544726SKirk McKusick u_long size; 777996c772fSJohn Dyson int32_t *lp; 778996c772fSJohn Dyson struct ucred *cred; 77943920011SPoul-Henning Kamp struct g_consumer *cp; 7803bbd6d8aSJeff Roberson struct mount *nmp; 781df8bae1dSRodney W. Grimes 782ee445a69SJohn Baldwin bp = NULL; 783ee445a69SJohn Baldwin ump = NULL; 784a854ed98SJohn Baldwin cred = td ? td->td_ucred : NOCRED; 78543920011SPoul-Henning Kamp ronly = (mp->mnt_flag & MNT_RDONLY) != 0; 786ee445a69SJohn Baldwin 787c70b3cd2SKonstantin Belousov KASSERT(devvp->v_type == VCHR, ("reclaimed devvp")); 788ee445a69SJohn Baldwin dev = devvp->v_rdev; 789c70b3cd2SKonstantin Belousov if (atomic_cmpset_acq_ptr((uintptr_t *)&dev->si_mountpt, 0, 790c70b3cd2SKonstantin Belousov (uintptr_t)mp) == 0) { 791c70b3cd2SKonstantin Belousov VOP_UNLOCK(devvp, 0); 792c70b3cd2SKonstantin Belousov return (EBUSY); 793c70b3cd2SKonstantin Belousov } 79443920011SPoul-Henning Kamp g_topology_lock(); 79543920011SPoul-Henning Kamp error = g_vfs_open(devvp, &cp, "ffs", ronly ? 0 : 1); 79643920011SPoul-Henning Kamp g_topology_unlock(); 797c70b3cd2SKonstantin Belousov if (error != 0) { 798c70b3cd2SKonstantin Belousov atomic_store_rel_ptr((uintptr_t *)&dev->si_mountpt, 0); 79922db15c0SAttilio Rao VOP_UNLOCK(devvp, 0); 800c70b3cd2SKonstantin Belousov return (error); 801c70b3cd2SKonstantin Belousov } 802c70b3cd2SKonstantin Belousov dev_ref(dev); 803c70b3cd2SKonstantin Belousov devvp->v_bufobj.bo_ops = &ffs_ops; 804c70b3cd2SKonstantin Belousov VOP_UNLOCK(devvp, 0); 805c70b3cd2SKonstantin Belousov if (dev->si_iosize_max != 0) 806c70b3cd2SKonstantin Belousov mp->mnt_iosize_max = dev->si_iosize_max; 8071b5464efSPoul-Henning Kamp if (mp->mnt_iosize_max > MAXPHYS) 8081b5464efSPoul-Henning Kamp mp->mnt_iosize_max = MAXPHYS; 80995e5e988SJohn Dyson 8101c85e6a3SKirk McKusick fs = NULL; 8111c85e6a3SKirk McKusick sblockloc = 0; 8121c85e6a3SKirk McKusick /* 8131c85e6a3SKirk McKusick * Try reading the superblock in each of its possible locations. 8141c85e6a3SKirk McKusick */ 8151c85e6a3SKirk McKusick for (i = 0; sblock_try[i] != -1; i++) { 81671ac2d7cSCraig Rodrigues if ((SBLOCKSIZE % cp->provider->sectorsize) != 0) { 81771ac2d7cSCraig Rodrigues error = EINVAL; 81871ac2d7cSCraig Rodrigues vfs_mount_error(mp, 81971ac2d7cSCraig Rodrigues "Invalid sectorsize %d for superblock size %d", 82071ac2d7cSCraig Rodrigues cp->provider->sectorsize, SBLOCKSIZE); 82171ac2d7cSCraig Rodrigues goto out; 82271ac2d7cSCraig Rodrigues } 82371ac2d7cSCraig Rodrigues if ((error = bread(devvp, btodb(sblock_try[i]), SBLOCKSIZE, 8241c85e6a3SKirk McKusick cred, &bp)) != 0) 825df8bae1dSRodney W. Grimes goto out; 826df8bae1dSRodney W. Grimes fs = (struct fs *)bp->b_data; 827ada981b2SKirk McKusick sblockloc = sblock_try[i]; 8281c85e6a3SKirk McKusick if ((fs->fs_magic == FS_UFS1_MAGIC || 8291c85e6a3SKirk McKusick (fs->fs_magic == FS_UFS2_MAGIC && 830ada981b2SKirk McKusick (fs->fs_sblockloc == sblockloc || 831ada981b2SKirk McKusick (fs->fs_old_flags & FS_FLAGS_UPDATED) == 0))) && 8321c85e6a3SKirk McKusick fs->fs_bsize <= MAXBSIZE && 8331c85e6a3SKirk McKusick fs->fs_bsize >= sizeof(struct fs)) 8341c85e6a3SKirk McKusick break; 8351c85e6a3SKirk McKusick brelse(bp); 8361c85e6a3SKirk McKusick bp = NULL; 8371c85e6a3SKirk McKusick } 8381c85e6a3SKirk McKusick if (sblock_try[i] == -1) { 839df8bae1dSRodney W. Grimes error = EINVAL; /* XXX needs translation */ 840df8bae1dSRodney W. Grimes goto out; 841df8bae1dSRodney W. Grimes } 8423f6f17eeSJulian Elischer fs->fs_fmod = 0; 84375e3597aSKirk McKusick /* none of these types of check-hashes are maintained */ 84475e3597aSKirk McKusick fs->fs_metackhash &= ~(CK_SUPERBLOCK | CK_INODE | CK_INDIR | CK_DIR); 84575e3597aSKirk McKusick /* no support for directory indices or any other undefined flags */ 84675e3597aSKirk McKusick fs->fs_flags &= ~FS_INDEXDIRS; 84775e3597aSKirk McKusick fs->fs_flags &= FS_SUPPORTED; 8480922cce6SBruce Evans fs->fs_flags &= ~FS_UNCLEAN; 8490922cce6SBruce Evans if (fs->fs_clean == 0) { 8500922cce6SBruce Evans fs->fs_flags |= FS_UNCLEAN; 851812b1d41SKirk McKusick if (ronly || (mp->mnt_flag & MNT_FORCE) || 852113db2ddSJeff Roberson ((fs->fs_flags & (FS_SUJ | FS_NEEDSFSCK)) == 0 && 8531a6a6610SKirk McKusick (fs->fs_flags & FS_DOSOFTDEP))) { 85459b3a4ebSDavid E. O'Brien printf("WARNING: %s was not properly dismounted\n", 8550922cce6SBruce Evans fs->fs_fsmnt); 8561469eec8SDavid Greenman } else { 857b60ee81eSKirk McKusick vfs_mount_error(mp, "R/W mount of %s denied. %s%s", 858b60ee81eSKirk McKusick fs->fs_fsmnt, "Filesystem is not clean - run fsck.", 859b60ee81eSKirk McKusick (fs->fs_flags & FS_SUJ) == 0 ? "" : 860b60ee81eSKirk McKusick " Forced mount will invalidate journal contents"); 8611469eec8SDavid Greenman error = EPERM; 8621469eec8SDavid Greenman goto out; 8631469eec8SDavid Greenman } 8641c85e6a3SKirk McKusick if ((fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) && 8651c85e6a3SKirk McKusick (mp->mnt_flag & MNT_FORCE)) { 866b60ee81eSKirk McKusick printf("WARNING: %s: lost blocks %jd files %d\n", 867b60ee81eSKirk McKusick fs->fs_fsmnt, (intmax_t)fs->fs_pendingblocks, 8681c85e6a3SKirk McKusick fs->fs_pendinginodes); 8699ccb939eSKirk McKusick fs->fs_pendingblocks = 0; 8709ccb939eSKirk McKusick fs->fs_pendinginodes = 0; 8719ccb939eSKirk McKusick } 8729ccb939eSKirk McKusick } 8739ccb939eSKirk McKusick if (fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) { 874b60ee81eSKirk McKusick printf("WARNING: %s: mount pending error: blocks %jd " 875b60ee81eSKirk McKusick "files %d\n", fs->fs_fsmnt, (intmax_t)fs->fs_pendingblocks, 8761c85e6a3SKirk McKusick fs->fs_pendinginodes); 8779ccb939eSKirk McKusick fs->fs_pendingblocks = 0; 8789ccb939eSKirk McKusick fs->fs_pendinginodes = 0; 8791469eec8SDavid Greenman } 8801a60c7fcSPawel Jakub Dawidek if ((fs->fs_flags & FS_GJOURNAL) != 0) { 8811a60c7fcSPawel Jakub Dawidek #ifdef UFS_GJOURNAL 8821a60c7fcSPawel Jakub Dawidek /* 8831a60c7fcSPawel Jakub Dawidek * Get journal provider name. 8841a60c7fcSPawel Jakub Dawidek */ 885ad544726SKirk McKusick len = 1024; 886ad544726SKirk McKusick mp->mnt_gjprovider = malloc((u_long)len, M_UFSMNT, M_WAITOK); 887ad544726SKirk McKusick if (g_io_getattr("GJOURNAL::provider", cp, &len, 8881a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider) == 0) { 889ad544726SKirk McKusick mp->mnt_gjprovider = realloc(mp->mnt_gjprovider, len, 8901a60c7fcSPawel Jakub Dawidek M_UFSMNT, M_WAITOK); 8911a60c7fcSPawel Jakub Dawidek MNT_ILOCK(mp); 8921a60c7fcSPawel Jakub Dawidek mp->mnt_flag |= MNT_GJOURNAL; 8931a60c7fcSPawel Jakub Dawidek MNT_IUNLOCK(mp); 8941a60c7fcSPawel Jakub Dawidek } else { 895b60ee81eSKirk McKusick printf("WARNING: %s: GJOURNAL flag on fs " 896b60ee81eSKirk McKusick "but no gjournal provider below\n", 8971a60c7fcSPawel Jakub Dawidek mp->mnt_stat.f_mntonname); 8981a60c7fcSPawel Jakub Dawidek free(mp->mnt_gjprovider, M_UFSMNT); 8991a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider = NULL; 9001a60c7fcSPawel Jakub Dawidek } 9011a60c7fcSPawel Jakub Dawidek #else 902b60ee81eSKirk McKusick printf("WARNING: %s: GJOURNAL flag on fs but no " 903b60ee81eSKirk McKusick "UFS_GJOURNAL support\n", mp->mnt_stat.f_mntonname); 9041a60c7fcSPawel Jakub Dawidek #endif 9051a60c7fcSPawel Jakub Dawidek } else { 9061a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider = NULL; 9071a60c7fcSPawel Jakub Dawidek } 908a163d034SWarner Losh ump = malloc(sizeof *ump, M_UFSMNT, M_WAITOK | M_ZERO); 90943920011SPoul-Henning Kamp ump->um_cp = cp; 91043920011SPoul-Henning Kamp ump->um_bo = &devvp->v_bufobj; 9118dd56505SPoul-Henning Kamp ump->um_fs = malloc((u_long)fs->fs_sbsize, M_UFSMNT, M_WAITOK); 9121c85e6a3SKirk McKusick if (fs->fs_magic == FS_UFS1_MAGIC) { 9131c85e6a3SKirk McKusick ump->um_fstype = UFS1; 9141c85e6a3SKirk McKusick ump->um_balloc = ffs_balloc_ufs1; 9151c85e6a3SKirk McKusick } else { 9161c85e6a3SKirk McKusick ump->um_fstype = UFS2; 9171c85e6a3SKirk McKusick ump->um_balloc = ffs_balloc_ufs2; 9181c85e6a3SKirk McKusick } 919cec0f20cSPoul-Henning Kamp ump->um_blkatoff = ffs_blkatoff; 920cec0f20cSPoul-Henning Kamp ump->um_truncate = ffs_truncate; 921987f5696SPoul-Henning Kamp ump->um_update = ffs_update; 922cec0f20cSPoul-Henning Kamp ump->um_valloc = ffs_valloc; 923cec0f20cSPoul-Henning Kamp ump->um_vfree = ffs_vfree; 924975512a9SPoul-Henning Kamp ump->um_ifree = ffs_ifree; 92590446e36SKonstantin Belousov ump->um_rdonly = ffs_rdonly; 92616b1f68dSKonstantin Belousov ump->um_snapgone = ffs_snapgone; 9273ba649d7SJeff Roberson mtx_init(UFS_MTX(ump), "FFS", "FFS Lock", MTX_DEF); 928df8bae1dSRodney W. Grimes bcopy(bp->b_data, ump->um_fs, (u_int)fs->fs_sbsize); 9291c85e6a3SKirk McKusick if (fs->fs_sbsize < SBLOCKSIZE) 930f2a2857bSKirk McKusick bp->b_flags |= B_INVAL | B_NOCACHE; 931df8bae1dSRodney W. Grimes brelse(bp); 932df8bae1dSRodney W. Grimes bp = NULL; 933df8bae1dSRodney W. Grimes fs = ump->um_fs; 9341c85e6a3SKirk McKusick ffs_oldfscompat_read(fs, ump, sblockloc); 935df8bae1dSRodney W. Grimes fs->fs_ronly = ronly; 936996c772fSJohn Dyson size = fs->fs_cssize; 937996c772fSJohn Dyson blks = howmany(size, fs->fs_fsize); 938996c772fSJohn Dyson if (fs->fs_contigsumsize > 0) 939996c772fSJohn Dyson size += fs->fs_ncg * sizeof(int32_t); 940a61ab64aSKirk McKusick size += fs->fs_ncg * sizeof(u_int8_t); 941ad544726SKirk McKusick space = malloc(size, M_UFSMNT, M_WAITOK); 942f55ff3f3SIan Dowse fs->fs_csp = space; 943df8bae1dSRodney W. Grimes for (i = 0; i < blks; i += fs->fs_frag) { 944df8bae1dSRodney W. Grimes size = fs->fs_bsize; 945df8bae1dSRodney W. Grimes if (i + fs->fs_frag > blks) 946df8bae1dSRodney W. Grimes size = (blks - i) * fs->fs_fsize; 9478aef1712SMatthew Dillon if ((error = bread(devvp, fsbtodb(fs, fs->fs_csaddr + i), size, 9488aef1712SMatthew Dillon cred, &bp)) != 0) { 949f55ff3f3SIan Dowse free(fs->fs_csp, M_UFSMNT); 950df8bae1dSRodney W. Grimes goto out; 951df8bae1dSRodney W. Grimes } 952df8bae1dSRodney W. Grimes bcopy(bp->b_data, space, (u_int)size); 953f55ff3f3SIan Dowse space = (char *)space + size; 954df8bae1dSRodney W. Grimes brelse(bp); 955df8bae1dSRodney W. Grimes bp = NULL; 956df8bae1dSRodney W. Grimes } 957996c772fSJohn Dyson if (fs->fs_contigsumsize > 0) { 958f55ff3f3SIan Dowse fs->fs_maxcluster = lp = space; 959996c772fSJohn Dyson for (i = 0; i < fs->fs_ncg; i++) 960996c772fSJohn Dyson *lp++ = fs->fs_contigsumsize; 9614691e9eaSIan Dowse space = lp; 962996c772fSJohn Dyson } 963a61ab64aSKirk McKusick size = fs->fs_ncg * sizeof(u_int8_t); 964a61ab64aSKirk McKusick fs->fs_contigdirs = (u_int8_t *)space; 965a61ab64aSKirk McKusick bzero(fs->fs_contigdirs, size); 966143a5346SIan Dowse fs->fs_active = NULL; 96777465d93SAlfred Perlstein mp->mnt_data = ump; 96868de329eSPoul-Henning Kamp mp->mnt_stat.f_fsid.val[0] = fs->fs_id[0]; 9698f89943eSGuido van Rooij mp->mnt_stat.f_fsid.val[1] = fs->fs_id[1]; 9703bbd6d8aSJeff Roberson nmp = NULL; 97168de329eSPoul-Henning Kamp if (fs->fs_id[0] == 0 || fs->fs_id[1] == 0 || 9723bbd6d8aSJeff Roberson (nmp = vfs_getvfs(&mp->mnt_stat.f_fsid))) { 9733bbd6d8aSJeff Roberson if (nmp) 9743bbd6d8aSJeff Roberson vfs_rel(nmp); 97568de329eSPoul-Henning Kamp vfs_getnewfsid(mp); 9763bbd6d8aSJeff Roberson } 977df8bae1dSRodney W. Grimes mp->mnt_maxsymlinklen = fs->fs_maxsymlinklen; 9785da56ddbSTor Egge MNT_ILOCK(mp); 979cc9d8990SPeter Wemm mp->mnt_flag |= MNT_LOCAL; 9805da56ddbSTor Egge MNT_IUNLOCK(mp); 9815da56ddbSTor Egge if ((fs->fs_flags & FS_MULTILABEL) != 0) { 9827b3f1bbdSTom Rhodes #ifdef MAC 9835da56ddbSTor Egge MNT_ILOCK(mp); 98480830407SRobert Watson mp->mnt_flag |= MNT_MULTILABEL; 9855da56ddbSTor Egge MNT_IUNLOCK(mp); 9867b3f1bbdSTom Rhodes #else 987b60ee81eSKirk McKusick printf("WARNING: %s: multilabel flag on fs but " 988b60ee81eSKirk McKusick "no MAC support\n", mp->mnt_stat.f_mntonname); 9897b3f1bbdSTom Rhodes #endif 9905da56ddbSTor Egge } 9915da56ddbSTor Egge if ((fs->fs_flags & FS_ACLS) != 0) { 9927b3f1bbdSTom Rhodes #ifdef UFS_ACL 9935da56ddbSTor Egge MNT_ILOCK(mp); 9949340fc72SEdward Tomasz Napierala 9959340fc72SEdward Tomasz Napierala if (mp->mnt_flag & MNT_NFS4ACLS) 996b60ee81eSKirk McKusick printf("WARNING: %s: ACLs flag on fs conflicts with " 997b60ee81eSKirk McKusick "\"nfsv4acls\" mount option; option ignored\n", 998b60ee81eSKirk McKusick mp->mnt_stat.f_mntonname); 9999340fc72SEdward Tomasz Napierala mp->mnt_flag &= ~MNT_NFS4ACLS; 100080830407SRobert Watson mp->mnt_flag |= MNT_ACLS; 10019340fc72SEdward Tomasz Napierala 10025da56ddbSTor Egge MNT_IUNLOCK(mp); 10037b3f1bbdSTom Rhodes #else 100459b3a4ebSDavid E. O'Brien printf("WARNING: %s: ACLs flag on fs but no ACLs support\n", 1005946478fcSPawel Jakub Dawidek mp->mnt_stat.f_mntonname); 10067b3f1bbdSTom Rhodes #endif 10075da56ddbSTor Egge } 10089340fc72SEdward Tomasz Napierala if ((fs->fs_flags & FS_NFS4ACLS) != 0) { 10099340fc72SEdward Tomasz Napierala #ifdef UFS_ACL 10109340fc72SEdward Tomasz Napierala MNT_ILOCK(mp); 10119340fc72SEdward Tomasz Napierala 10129340fc72SEdward Tomasz Napierala if (mp->mnt_flag & MNT_ACLS) 1013b60ee81eSKirk McKusick printf("WARNING: %s: NFSv4 ACLs flag on fs conflicts " 1014b60ee81eSKirk McKusick "with \"acls\" mount option; option ignored\n", 1015b60ee81eSKirk McKusick mp->mnt_stat.f_mntonname); 10169340fc72SEdward Tomasz Napierala mp->mnt_flag &= ~MNT_ACLS; 10179340fc72SEdward Tomasz Napierala mp->mnt_flag |= MNT_NFS4ACLS; 10189340fc72SEdward Tomasz Napierala 10199340fc72SEdward Tomasz Napierala MNT_IUNLOCK(mp); 10209340fc72SEdward Tomasz Napierala #else 1021b60ee81eSKirk McKusick printf("WARNING: %s: NFSv4 ACLs flag on fs but no " 1022b60ee81eSKirk McKusick "ACLs support\n", mp->mnt_stat.f_mntonname); 10239340fc72SEdward Tomasz Napierala #endif 10249340fc72SEdward Tomasz Napierala } 10258c2a54deSKonstantin Belousov if ((fs->fs_flags & FS_TRIM) != 0) { 1026ad544726SKirk McKusick len = sizeof(int); 1027ad544726SKirk McKusick if (g_io_getattr("GEOM::candelete", cp, &len, 10288c2a54deSKonstantin Belousov &ump->um_candelete) == 0) { 10298c2a54deSKonstantin Belousov if (!ump->um_candelete) 1030b60ee81eSKirk McKusick printf("WARNING: %s: TRIM flag on fs but disk " 1031b60ee81eSKirk McKusick "does not support TRIM\n", 10328c2a54deSKonstantin Belousov mp->mnt_stat.f_mntonname); 10338c2a54deSKonstantin Belousov } else { 1034b60ee81eSKirk McKusick printf("WARNING: %s: TRIM flag on fs but disk does " 1035b60ee81eSKirk McKusick "not confirm that it supports TRIM\n", 10368c2a54deSKonstantin Belousov mp->mnt_stat.f_mntonname); 10378c2a54deSKonstantin Belousov ump->um_candelete = 0; 10388c2a54deSKonstantin Belousov } 1039c79dff0fSKonstantin Belousov if (ump->um_candelete) { 1040c79dff0fSKonstantin Belousov ump->um_trim_tq = taskqueue_create("trim", M_WAITOK, 1041c79dff0fSKonstantin Belousov taskqueue_thread_enqueue, &ump->um_trim_tq); 1042c79dff0fSKonstantin Belousov taskqueue_start_threads(&ump->um_trim_tq, 1, PVFS, 1043c79dff0fSKonstantin Belousov "%s trim", mp->mnt_stat.f_mntonname); 1044c79dff0fSKonstantin Belousov } 10458c2a54deSKonstantin Belousov } 10469340fc72SEdward Tomasz Napierala 1047df8bae1dSRodney W. Grimes ump->um_mountp = mp; 1048df8bae1dSRodney W. Grimes ump->um_dev = dev; 1049df8bae1dSRodney W. Grimes ump->um_devvp = devvp; 1050df8bae1dSRodney W. Grimes ump->um_nindir = fs->fs_nindir; 1051df8bae1dSRodney W. Grimes ump->um_bptrtodb = fs->fs_fsbtodb; 1052df8bae1dSRodney W. Grimes ump->um_seqinc = fs->fs_frag; 1053df8bae1dSRodney W. Grimes for (i = 0; i < MAXQUOTAS; i++) 1054df8bae1dSRodney W. Grimes ump->um_quotas[i] = NULLVP; 1055516081f2SRobert Watson #ifdef UFS_EXTATTR 1056a64ed089SRobert Watson ufs_extattr_uepm_init(&ump->um_extattr); 1057a64ed089SRobert Watson #endif 10582b14f991SJulian Elischer /* 10592b14f991SJulian Elischer * Set FS local "last mounted on" information (NULL pad) 10602b14f991SJulian Elischer */ 106193373c42SSuleiman Souhlal bzero(fs->fs_fsmnt, MAXMNTLEN); 106293373c42SSuleiman Souhlal strlcpy(fs->fs_fsmnt, mp->mnt_stat.f_mntonname, MAXMNTLEN); 1063113db2ddSJeff Roberson mp->mnt_stat.f_iosize = fs->fs_bsize; 10642b14f991SJulian Elischer 10652b14f991SJulian Elischer if (mp->mnt_flag & MNT_ROOTFS) { 10662b14f991SJulian Elischer /* 10672b14f991SJulian Elischer * Root mount; update timestamp in mount structure. 10682b14f991SJulian Elischer * this will be used by the common root mount code 10692b14f991SJulian Elischer * to update the system clock. 10702b14f991SJulian Elischer */ 10712b14f991SJulian Elischer mp->mnt_time = fs->fs_time; 10722b14f991SJulian Elischer } 1073996c772fSJohn Dyson 1074996c772fSJohn Dyson if (ronly == 0) { 1075113db2ddSJeff Roberson fs->fs_mtime = time_second; 1076b1897c19SJulian Elischer if ((fs->fs_flags & FS_DOSOFTDEP) && 1077b1897c19SJulian Elischer (error = softdep_mount(devvp, mp, fs, cred)) != 0) { 1078f55ff3f3SIan Dowse free(fs->fs_csp, M_UFSMNT); 1079fddd463dSKonstantin Belousov ffs_flushfiles(mp, FORCECLOSE, td); 1080b1897c19SJulian Elischer goto out; 1081b1897c19SJulian Elischer } 1082f2a2857bSKirk McKusick if (fs->fs_snapinum[0] != 0) 1083f2a2857bSKirk McKusick ffs_snapshot_mount(mp); 1084cf60e8e4SKirk McKusick fs->fs_fmod = 1; 1085996c772fSJohn Dyson fs->fs_clean = 0; 1086791dd2faSTor Egge (void) ffs_sbupdate(ump, MNT_WAIT, 0); 1087996c772fSJohn Dyson } 1088d8d3d415SPoul-Henning Kamp /* 108998cbffd7SKonstantin Belousov * Initialize filesystem state information in mount struct. 1090d8d3d415SPoul-Henning Kamp */ 10916cf7bc60SRobert Watson MNT_ILOCK(mp); 1092bc2258daSAttilio Rao mp->mnt_kern_flag |= MNTK_LOOKUP_SHARED | MNTK_EXTENDED_SHARED | 10935f34e93cSMark Johnston MNTK_NO_IOPF | MNTK_UNMAPPED_BUFS | MNTK_USES_BCACHE; 10946cf7bc60SRobert Watson MNT_IUNLOCK(mp); 1095516081f2SRobert Watson #ifdef UFS_EXTATTR 1096516081f2SRobert Watson #ifdef UFS_EXTATTR_AUTOSTART 10979de54ba5SRobert Watson /* 10989de54ba5SRobert Watson * 1099f5161237SRobert Watson * Auto-starting does the following: 11009de54ba5SRobert Watson * - check for /.attribute in the fs, and extattr_start if so 11019de54ba5SRobert Watson * - for each file in .attribute, enable that file with 11029de54ba5SRobert Watson * an attribute of the same name. 11039de54ba5SRobert Watson * Not clear how to report errors -- probably eat them. 11049de54ba5SRobert Watson * This would all happen while the filesystem was busy/not 11059de54ba5SRobert Watson * available, so would effectively be "atomic". 11069de54ba5SRobert Watson */ 1107b40ce416SJulian Elischer (void) ufs_extattr_autostart(mp, td); 1108516081f2SRobert Watson #endif /* !UFS_EXTATTR_AUTOSTART */ 1109516081f2SRobert Watson #endif /* !UFS_EXTATTR */ 1110df8bae1dSRodney W. Grimes return (0); 1111df8bae1dSRodney W. Grimes out: 1112df8bae1dSRodney W. Grimes if (bp) 1113df8bae1dSRodney W. Grimes brelse(bp); 111443920011SPoul-Henning Kamp if (cp != NULL) { 111543920011SPoul-Henning Kamp g_topology_lock(); 11160d7935fdSAttilio Rao g_vfs_close(cp); 111743920011SPoul-Henning Kamp g_topology_unlock(); 111843920011SPoul-Henning Kamp } 1119df8bae1dSRodney W. Grimes if (ump) { 11203ba649d7SJeff Roberson mtx_destroy(UFS_MTX(ump)); 11211a60c7fcSPawel Jakub Dawidek if (mp->mnt_gjprovider != NULL) { 11221a60c7fcSPawel Jakub Dawidek free(mp->mnt_gjprovider, M_UFSMNT); 11231a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider = NULL; 11241a60c7fcSPawel Jakub Dawidek } 1125df8bae1dSRodney W. Grimes free(ump->um_fs, M_UFSMNT); 1126df8bae1dSRodney W. Grimes free(ump, M_UFSMNT); 112777465d93SAlfred Perlstein mp->mnt_data = NULL; 1128df8bae1dSRodney W. Grimes } 1129c70b3cd2SKonstantin Belousov atomic_store_rel_ptr((uintptr_t *)&dev->si_mountpt, 0); 113049c4791cSEdward Tomasz Napierala dev_rel(dev); 1131df8bae1dSRodney W. Grimes return (error); 1132df8bae1dSRodney W. Grimes } 1133df8bae1dSRodney W. Grimes 11341c85e6a3SKirk McKusick #include <sys/sysctl.h> 1135adf41577SPoul-Henning Kamp static int bigcgs = 0; 11361c85e6a3SKirk McKusick SYSCTL_INT(_debug, OID_AUTO, bigcgs, CTLFLAG_RW, &bigcgs, 0, ""); 11371c85e6a3SKirk McKusick 1138df8bae1dSRodney W. Grimes /* 11391c85e6a3SKirk McKusick * Sanity checks for loading old filesystem superblocks. 11401c85e6a3SKirk McKusick * See ffs_oldfscompat_write below for unwound actions. 1141df8bae1dSRodney W. Grimes * 11421c85e6a3SKirk McKusick * XXX - Parts get retired eventually. 11431c85e6a3SKirk McKusick * Unfortunately new bits get added. 1144df8bae1dSRodney W. Grimes */ 11451c85e6a3SKirk McKusick static void 11461c85e6a3SKirk McKusick ffs_oldfscompat_read(fs, ump, sblockloc) 1147df8bae1dSRodney W. Grimes struct fs *fs; 11481c85e6a3SKirk McKusick struct ufsmount *ump; 11491c85e6a3SKirk McKusick ufs2_daddr_t sblockloc; 11501c85e6a3SKirk McKusick { 11511c85e6a3SKirk McKusick off_t maxfilesize; 11521c85e6a3SKirk McKusick 11531c85e6a3SKirk McKusick /* 1154ada981b2SKirk McKusick * If not yet done, update fs_flags location and value of fs_sblockloc. 1155ada981b2SKirk McKusick */ 1156ada981b2SKirk McKusick if ((fs->fs_old_flags & FS_FLAGS_UPDATED) == 0) { 1157ada981b2SKirk McKusick fs->fs_flags = fs->fs_old_flags; 1158ada981b2SKirk McKusick fs->fs_old_flags |= FS_FLAGS_UPDATED; 1159ada981b2SKirk McKusick fs->fs_sblockloc = sblockloc; 1160ada981b2SKirk McKusick } 1161ada981b2SKirk McKusick /* 11621c85e6a3SKirk McKusick * If not yet done, update UFS1 superblock with new wider fields. 11631c85e6a3SKirk McKusick */ 116474f3809aSKirk McKusick if (fs->fs_magic == FS_UFS1_MAGIC && fs->fs_maxbsize != fs->fs_bsize) { 11651c85e6a3SKirk McKusick fs->fs_maxbsize = fs->fs_bsize; 11661c85e6a3SKirk McKusick fs->fs_time = fs->fs_old_time; 11671c85e6a3SKirk McKusick fs->fs_size = fs->fs_old_size; 11681c85e6a3SKirk McKusick fs->fs_dsize = fs->fs_old_dsize; 11691c85e6a3SKirk McKusick fs->fs_csaddr = fs->fs_old_csaddr; 11701c85e6a3SKirk McKusick fs->fs_cstotal.cs_ndir = fs->fs_old_cstotal.cs_ndir; 11711c85e6a3SKirk McKusick fs->fs_cstotal.cs_nbfree = fs->fs_old_cstotal.cs_nbfree; 11721c85e6a3SKirk McKusick fs->fs_cstotal.cs_nifree = fs->fs_old_cstotal.cs_nifree; 11731c85e6a3SKirk McKusick fs->fs_cstotal.cs_nffree = fs->fs_old_cstotal.cs_nffree; 11741c85e6a3SKirk McKusick } 11751c85e6a3SKirk McKusick if (fs->fs_magic == FS_UFS1_MAGIC && 11761c85e6a3SKirk McKusick fs->fs_old_inodefmt < FS_44INODEFMT) { 11778680d698SNate Lawson fs->fs_maxfilesize = ((uint64_t)1 << 31) - 1; 11781c85e6a3SKirk McKusick fs->fs_qbmask = ~fs->fs_bmask; 11791c85e6a3SKirk McKusick fs->fs_qfmask = ~fs->fs_fmask; 11801c85e6a3SKirk McKusick } 11818f42fb8fSIan Dowse if (fs->fs_magic == FS_UFS1_MAGIC) { 11821c85e6a3SKirk McKusick ump->um_savedmaxfilesize = fs->fs_maxfilesize; 11838680d698SNate Lawson maxfilesize = (uint64_t)0x80000000 * fs->fs_bsize - 1; 11841c85e6a3SKirk McKusick if (fs->fs_maxfilesize > maxfilesize) 11851c85e6a3SKirk McKusick fs->fs_maxfilesize = maxfilesize; 11868f42fb8fSIan Dowse } 11871c85e6a3SKirk McKusick /* Compatibility for old filesystems */ 11881c85e6a3SKirk McKusick if (fs->fs_avgfilesize <= 0) 11891c85e6a3SKirk McKusick fs->fs_avgfilesize = AVFILESIZ; 11901c85e6a3SKirk McKusick if (fs->fs_avgfpdir <= 0) 11911c85e6a3SKirk McKusick fs->fs_avgfpdir = AFPDIR; 11921c85e6a3SKirk McKusick if (bigcgs) { 11931c85e6a3SKirk McKusick fs->fs_save_cgsize = fs->fs_cgsize; 11941c85e6a3SKirk McKusick fs->fs_cgsize = fs->fs_bsize; 11951c85e6a3SKirk McKusick } 11961c85e6a3SKirk McKusick } 11971c85e6a3SKirk McKusick 11981c85e6a3SKirk McKusick /* 11991c85e6a3SKirk McKusick * Unwinding superblock updates for old filesystems. 12001c85e6a3SKirk McKusick * See ffs_oldfscompat_read above for details. 12011c85e6a3SKirk McKusick * 12021c85e6a3SKirk McKusick * XXX - Parts get retired eventually. 12031c85e6a3SKirk McKusick * Unfortunately new bits get added. 12041c85e6a3SKirk McKusick */ 1205113db2ddSJeff Roberson void 12061c85e6a3SKirk McKusick ffs_oldfscompat_write(fs, ump) 12071c85e6a3SKirk McKusick struct fs *fs; 12081c85e6a3SKirk McKusick struct ufsmount *ump; 1209df8bae1dSRodney W. Grimes { 1210df8bae1dSRodney W. Grimes 12111c85e6a3SKirk McKusick /* 12121c85e6a3SKirk McKusick * Copy back UFS2 updated fields that UFS1 inspects. 12131c85e6a3SKirk McKusick */ 12141c85e6a3SKirk McKusick if (fs->fs_magic == FS_UFS1_MAGIC) { 12151c85e6a3SKirk McKusick fs->fs_old_time = fs->fs_time; 12161c85e6a3SKirk McKusick fs->fs_old_cstotal.cs_ndir = fs->fs_cstotal.cs_ndir; 12171c85e6a3SKirk McKusick fs->fs_old_cstotal.cs_nbfree = fs->fs_cstotal.cs_nbfree; 12181c85e6a3SKirk McKusick fs->fs_old_cstotal.cs_nifree = fs->fs_cstotal.cs_nifree; 12191c85e6a3SKirk McKusick fs->fs_old_cstotal.cs_nffree = fs->fs_cstotal.cs_nffree; 12201c85e6a3SKirk McKusick fs->fs_maxfilesize = ump->um_savedmaxfilesize; 12218f42fb8fSIan Dowse } 12221c85e6a3SKirk McKusick if (bigcgs) { 12231c85e6a3SKirk McKusick fs->fs_cgsize = fs->fs_save_cgsize; 12241c85e6a3SKirk McKusick fs->fs_save_cgsize = 0; 12251c85e6a3SKirk McKusick } 1226df8bae1dSRodney W. Grimes } 1227df8bae1dSRodney W. Grimes 1228df8bae1dSRodney W. Grimes /* 1229df8bae1dSRodney W. Grimes * unmount system call 1230df8bae1dSRodney W. Grimes */ 1231adf41577SPoul-Henning Kamp static int 1232dfd233edSAttilio Rao ffs_unmount(mp, mntflags) 1233df8bae1dSRodney W. Grimes struct mount *mp; 1234df8bae1dSRodney W. Grimes int mntflags; 1235df8bae1dSRodney W. Grimes { 1236dfd233edSAttilio Rao struct thread *td; 123705f4ff5dSPoul-Henning Kamp struct ufsmount *ump = VFSTOUFS(mp); 123805f4ff5dSPoul-Henning Kamp struct fs *fs; 12396fecb4e4SKonstantin Belousov int error, flags, susp; 1240df86ccf6SKonstantin Belousov #ifdef UFS_EXTATTR 1241df86ccf6SKonstantin Belousov int e_restart; 1242df86ccf6SKonstantin Belousov #endif 1243df8bae1dSRodney W. Grimes 1244df8bae1dSRodney W. Grimes flags = 0; 1245dfd233edSAttilio Rao td = curthread; 12466fecb4e4SKonstantin Belousov fs = ump->um_fs; 1247b60ee81eSKirk McKusick susp = 0; 1248df8bae1dSRodney W. Grimes if (mntflags & MNT_FORCE) { 1249df8bae1dSRodney W. Grimes flags |= FORCECLOSE; 12504ce90426SKonstantin Belousov susp = fs->fs_ronly == 0; 1251b60ee81eSKirk McKusick } 1252516081f2SRobert Watson #ifdef UFS_EXTATTR 1253b40ce416SJulian Elischer if ((error = ufs_extattr_stop(mp, td))) { 1254b2b0497aSRobert Watson if (error != EOPNOTSUPP) 1255b60ee81eSKirk McKusick printf("WARNING: unmount %s: ufs_extattr_stop " 1256b60ee81eSKirk McKusick "returned errno %d\n", mp->mnt_stat.f_mntonname, 1257b2b0497aSRobert Watson error); 1258df86ccf6SKonstantin Belousov e_restart = 0; 12597df97b61SRobert Watson } else { 12609de54ba5SRobert Watson ufs_extattr_uepm_destroy(&ump->um_extattr); 1261df86ccf6SKonstantin Belousov e_restart = 1; 12627df97b61SRobert Watson } 1263a64ed089SRobert Watson #endif 12646fecb4e4SKonstantin Belousov if (susp) { 1265895b3782SKonstantin Belousov error = vfs_write_suspend_umnt(mp); 1266895b3782SKonstantin Belousov if (error != 0) 1267895b3782SKonstantin Belousov goto fail1; 12686fecb4e4SKonstantin Belousov } 1269fddf7baeSKirk McKusick if (MOUNTEDSOFTDEP(mp)) 12703c140b2dSEdward Tomasz Napierala error = softdep_flushfiles(mp, flags, td); 12713c140b2dSEdward Tomasz Napierala else 12723c140b2dSEdward Tomasz Napierala error = ffs_flushfiles(mp, flags, td); 12734f560d75SEdward Tomasz Napierala if (error != 0 && error != ENXIO) 12746fecb4e4SKonstantin Belousov goto fail; 12753c140b2dSEdward Tomasz Napierala 12763ba649d7SJeff Roberson UFS_LOCK(ump); 12779ccb939eSKirk McKusick if (fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) { 1278b60ee81eSKirk McKusick printf("WARNING: unmount %s: pending error: blocks %jd " 1279b60ee81eSKirk McKusick "files %d\n", fs->fs_fsmnt, (intmax_t)fs->fs_pendingblocks, 12801c85e6a3SKirk McKusick fs->fs_pendinginodes); 12819ccb939eSKirk McKusick fs->fs_pendingblocks = 0; 12829ccb939eSKirk McKusick fs->fs_pendinginodes = 0; 12839ccb939eSKirk McKusick } 12843ba649d7SJeff Roberson UFS_UNLOCK(ump); 1285519e3c3bSKirk McKusick if (MOUNTEDSOFTDEP(mp)) 1286113db2ddSJeff Roberson softdep_unmount(mp); 1287927a12aeSKirk McKusick if (fs->fs_ronly == 0 || ump->um_fsckpid > 0) { 12881a6a6610SKirk McKusick fs->fs_clean = fs->fs_flags & (FS_UNCLEAN|FS_NEEDSFSCK) ? 0 : 1; 1289791dd2faSTor Egge error = ffs_sbupdate(ump, MNT_WAIT, 0); 12904f560d75SEdward Tomasz Napierala if (error && error != ENXIO) { 1291996c772fSJohn Dyson fs->fs_clean = 0; 12926fecb4e4SKonstantin Belousov goto fail; 1293996c772fSJohn Dyson } 1294e0e9c421SDavid Greenman } 1295ddd6b3fcSKonstantin Belousov if (susp) 1296ddd6b3fcSKonstantin Belousov vfs_write_resume(mp, VR_START_WRITE); 1297c79dff0fSKonstantin Belousov if (ump->um_trim_tq != NULL) { 1298c79dff0fSKonstantin Belousov while (ump->um_trim_inflight != 0) 1299c79dff0fSKonstantin Belousov pause("ufsutr", hz); 1300c79dff0fSKonstantin Belousov taskqueue_drain_all(ump->um_trim_tq); 1301c79dff0fSKonstantin Belousov taskqueue_free(ump->um_trim_tq); 1302c79dff0fSKonstantin Belousov } 130343920011SPoul-Henning Kamp g_topology_lock(); 1304927a12aeSKirk McKusick if (ump->um_fsckpid > 0) { 1305927a12aeSKirk McKusick /* 1306927a12aeSKirk McKusick * Return to normal read-only mode. 1307927a12aeSKirk McKusick */ 1308927a12aeSKirk McKusick error = g_access(ump->um_cp, 0, -1, 0); 1309927a12aeSKirk McKusick ump->um_fsckpid = 0; 1310927a12aeSKirk McKusick } 13110d7935fdSAttilio Rao g_vfs_close(ump->um_cp); 131243920011SPoul-Henning Kamp g_topology_unlock(); 1313c70b3cd2SKonstantin Belousov atomic_store_rel_ptr((uintptr_t *)&ump->um_dev->si_mountpt, 0); 13146476c0d2SJohn Dyson vrele(ump->um_devvp); 131549c4791cSEdward Tomasz Napierala dev_rel(ump->um_dev); 13163ba649d7SJeff Roberson mtx_destroy(UFS_MTX(ump)); 13171a60c7fcSPawel Jakub Dawidek if (mp->mnt_gjprovider != NULL) { 13181a60c7fcSPawel Jakub Dawidek free(mp->mnt_gjprovider, M_UFSMNT); 13191a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider = NULL; 13201a60c7fcSPawel Jakub Dawidek } 1321f55ff3f3SIan Dowse free(fs->fs_csp, M_UFSMNT); 1322df8bae1dSRodney W. Grimes free(fs, M_UFSMNT); 1323df8bae1dSRodney W. Grimes free(ump, M_UFSMNT); 132477465d93SAlfred Perlstein mp->mnt_data = NULL; 13255da56ddbSTor Egge MNT_ILOCK(mp); 1326cc9d8990SPeter Wemm mp->mnt_flag &= ~MNT_LOCAL; 13275da56ddbSTor Egge MNT_IUNLOCK(mp); 13284cbc378cSKonstantin Belousov if (td->td_su == mp) { 13294cbc378cSKonstantin Belousov td->td_su = NULL; 13304cbc378cSKonstantin Belousov vfs_rel(mp); 13314cbc378cSKonstantin Belousov } 1332df8bae1dSRodney W. Grimes return (error); 13336fecb4e4SKonstantin Belousov 13346fecb4e4SKonstantin Belousov fail: 1335ddd6b3fcSKonstantin Belousov if (susp) 1336ddd6b3fcSKonstantin Belousov vfs_write_resume(mp, VR_START_WRITE); 1337895b3782SKonstantin Belousov fail1: 1338df86ccf6SKonstantin Belousov #ifdef UFS_EXTATTR 1339df86ccf6SKonstantin Belousov if (e_restart) { 1340df86ccf6SKonstantin Belousov ufs_extattr_uepm_init(&ump->um_extattr); 1341df86ccf6SKonstantin Belousov #ifdef UFS_EXTATTR_AUTOSTART 1342df86ccf6SKonstantin Belousov (void) ufs_extattr_autostart(mp, td); 1343df86ccf6SKonstantin Belousov #endif 1344df86ccf6SKonstantin Belousov } 1345df86ccf6SKonstantin Belousov #endif 1346df86ccf6SKonstantin Belousov 13476fecb4e4SKonstantin Belousov return (error); 1348df8bae1dSRodney W. Grimes } 1349df8bae1dSRodney W. Grimes 1350df8bae1dSRodney W. Grimes /* 1351df8bae1dSRodney W. Grimes * Flush out all the files in a filesystem. 1352df8bae1dSRodney W. Grimes */ 135326f9a767SRodney W. Grimes int 1354b40ce416SJulian Elischer ffs_flushfiles(mp, flags, td) 135505f4ff5dSPoul-Henning Kamp struct mount *mp; 1356df8bae1dSRodney W. Grimes int flags; 1357b40ce416SJulian Elischer struct thread *td; 1358df8bae1dSRodney W. Grimes { 135905f4ff5dSPoul-Henning Kamp struct ufsmount *ump; 1360ba05dec5SKonstantin Belousov int qerror, error; 1361df8bae1dSRodney W. Grimes 1362df8bae1dSRodney W. Grimes ump = VFSTOUFS(mp); 1363ba05dec5SKonstantin Belousov qerror = 0; 1364df8bae1dSRodney W. Grimes #ifdef QUOTA 1365df8bae1dSRodney W. Grimes if (mp->mnt_flag & MNT_QUOTA) { 1366c1d9efcbSPoul-Henning Kamp int i; 1367f257b7a5SAlfred Perlstein error = vflush(mp, 0, SKIPSYSTEM|flags, td); 1368c1d9efcbSPoul-Henning Kamp if (error) 1369df8bae1dSRodney W. Grimes return (error); 1370df8bae1dSRodney W. Grimes for (i = 0; i < MAXQUOTAS; i++) { 1371ba05dec5SKonstantin Belousov error = quotaoff(td, mp, i); 1372ba05dec5SKonstantin Belousov if (error != 0) { 1373ba05dec5SKonstantin Belousov if ((flags & EARLYFLUSH) == 0) 1374ba05dec5SKonstantin Belousov return (error); 1375ba05dec5SKonstantin Belousov else 1376ba05dec5SKonstantin Belousov qerror = error; 1377df8bae1dSRodney W. Grimes } 1378ba05dec5SKonstantin Belousov } 1379ba05dec5SKonstantin Belousov 1380df8bae1dSRodney W. Grimes /* 1381ba05dec5SKonstantin Belousov * Here we fall through to vflush again to ensure that 1382ba05dec5SKonstantin Belousov * we have gotten rid of all the system vnodes, unless 1383ba05dec5SKonstantin Belousov * quotas must not be closed. 1384df8bae1dSRodney W. Grimes */ 1385df8bae1dSRodney W. Grimes } 1386df8bae1dSRodney W. Grimes #endif 1387e6e370a7SJeff Roberson ASSERT_VOP_LOCKED(ump->um_devvp, "ffs_flushfiles"); 1388e6e370a7SJeff Roberson if (ump->um_devvp->v_vflag & VV_COPYONWRITE) { 1389f257b7a5SAlfred Perlstein if ((error = vflush(mp, 0, SKIPSYSTEM | flags, td)) != 0) 1390f2a2857bSKirk McKusick return (error); 1391f2a2857bSKirk McKusick ffs_snapshot_unmount(mp); 139295e7a3c3STor Egge flags |= FORCECLOSE; 1393f2a2857bSKirk McKusick /* 1394f2a2857bSKirk McKusick * Here we fall through to vflush again to ensure 1395f2a2857bSKirk McKusick * that we have gotten rid of all the system vnodes. 1396f2a2857bSKirk McKusick */ 1397f2a2857bSKirk McKusick } 1398ba05dec5SKonstantin Belousov 1399b1897c19SJulian Elischer /* 1400ba05dec5SKonstantin Belousov * Do not close system files if quotas were not closed, to be 1401ba05dec5SKonstantin Belousov * able to sync the remaining dquots. The freeblks softupdate 1402ba05dec5SKonstantin Belousov * workitems might hold a reference on a dquot, preventing 1403ba05dec5SKonstantin Belousov * quotaoff() from completing. Next round of 1404ba05dec5SKonstantin Belousov * softdep_flushworklist() iteration should process the 1405ba05dec5SKonstantin Belousov * blockers, allowing the next run of quotaoff() to finally 1406ba05dec5SKonstantin Belousov * flush held dquots. 1407ba05dec5SKonstantin Belousov * 1408ba05dec5SKonstantin Belousov * Otherwise, flush all the files. 1409b1897c19SJulian Elischer */ 1410ba05dec5SKonstantin Belousov if (qerror == 0 && (error = vflush(mp, 0, flags, td)) != 0) 1411b1897c19SJulian Elischer return (error); 1412ba05dec5SKonstantin Belousov 1413b1897c19SJulian Elischer /* 1414b1897c19SJulian Elischer * Flush filesystem metadata. 1415b1897c19SJulian Elischer */ 1416cb05b60aSAttilio Rao vn_lock(ump->um_devvp, LK_EXCLUSIVE | LK_RETRY); 14178df6bac4SPoul-Henning Kamp error = VOP_FSYNC(ump->um_devvp, MNT_WAIT, td); 141822db15c0SAttilio Rao VOP_UNLOCK(ump->um_devvp, 0); 1419df8bae1dSRodney W. Grimes return (error); 1420df8bae1dSRodney W. Grimes } 1421df8bae1dSRodney W. Grimes 1422df8bae1dSRodney W. Grimes /* 1423df8bae1dSRodney W. Grimes * Get filesystem statistics. 1424df8bae1dSRodney W. Grimes */ 1425adf41577SPoul-Henning Kamp static int 1426dfd233edSAttilio Rao ffs_statfs(mp, sbp) 1427df8bae1dSRodney W. Grimes struct mount *mp; 142805f4ff5dSPoul-Henning Kamp struct statfs *sbp; 1429df8bae1dSRodney W. Grimes { 143005f4ff5dSPoul-Henning Kamp struct ufsmount *ump; 143105f4ff5dSPoul-Henning Kamp struct fs *fs; 1432df8bae1dSRodney W. Grimes 1433df8bae1dSRodney W. Grimes ump = VFSTOUFS(mp); 1434df8bae1dSRodney W. Grimes fs = ump->um_fs; 14351c85e6a3SKirk McKusick if (fs->fs_magic != FS_UFS1_MAGIC && fs->fs_magic != FS_UFS2_MAGIC) 1436df8bae1dSRodney W. Grimes panic("ffs_statfs"); 1437fde81c7dSKirk McKusick sbp->f_version = STATFS_VERSION; 1438df8bae1dSRodney W. Grimes sbp->f_bsize = fs->fs_fsize; 1439df8bae1dSRodney W. Grimes sbp->f_iosize = fs->fs_bsize; 1440df8bae1dSRodney W. Grimes sbp->f_blocks = fs->fs_dsize; 14413ba649d7SJeff Roberson UFS_LOCK(ump); 1442df8bae1dSRodney W. Grimes sbp->f_bfree = fs->fs_cstotal.cs_nbfree * fs->fs_frag + 14439ccb939eSKirk McKusick fs->fs_cstotal.cs_nffree + dbtofsb(fs, fs->fs_pendingblocks); 14449ccb939eSKirk McKusick sbp->f_bavail = freespace(fs, fs->fs_minfree) + 14459ccb939eSKirk McKusick dbtofsb(fs, fs->fs_pendingblocks); 14461dc349abSEd Maste sbp->f_files = fs->fs_ncg * fs->fs_ipg - UFS_ROOTINO; 14479ccb939eSKirk McKusick sbp->f_ffree = fs->fs_cstotal.cs_nifree + fs->fs_pendinginodes; 14483ba649d7SJeff Roberson UFS_UNLOCK(ump); 1449a96da1c3SConrad Meyer sbp->f_namemax = UFS_MAXNAMLEN; 1450df8bae1dSRodney W. Grimes return (0); 1451df8bae1dSRodney W. Grimes } 1452df8bae1dSRodney W. Grimes 14531eabd967SKonstantin Belousov static bool 14541eabd967SKonstantin Belousov sync_doupdate(struct inode *ip) 14551eabd967SKonstantin Belousov { 14561eabd967SKonstantin Belousov 14571eabd967SKonstantin Belousov return ((ip->i_flag & (IN_ACCESS | IN_CHANGE | IN_MODIFIED | 14581eabd967SKonstantin Belousov IN_UPDATE)) != 0); 14591eabd967SKonstantin Belousov } 14601eabd967SKonstantin Belousov 1461df8bae1dSRodney W. Grimes /* 1462a988a5c6SKonstantin Belousov * For a lazy sync, we only care about access times, quotas and the 1463a988a5c6SKonstantin Belousov * superblock. Other filesystem changes are already converted to 1464a988a5c6SKonstantin Belousov * cylinder group blocks or inode blocks updates and are written to 1465a988a5c6SKonstantin Belousov * disk by syncer. 1466a988a5c6SKonstantin Belousov */ 1467a988a5c6SKonstantin Belousov static int 1468a988a5c6SKonstantin Belousov ffs_sync_lazy(mp) 1469a988a5c6SKonstantin Belousov struct mount *mp; 1470a988a5c6SKonstantin Belousov { 1471a988a5c6SKonstantin Belousov struct vnode *mvp, *vp; 1472a988a5c6SKonstantin Belousov struct inode *ip; 1473a988a5c6SKonstantin Belousov struct thread *td; 1474a988a5c6SKonstantin Belousov int allerror, error; 1475a988a5c6SKonstantin Belousov 1476a988a5c6SKonstantin Belousov allerror = 0; 1477a988a5c6SKonstantin Belousov td = curthread; 1478a988a5c6SKonstantin Belousov if ((mp->mnt_flag & MNT_NOATIME) != 0) 1479a988a5c6SKonstantin Belousov goto qupdate; 1480dca5e0ecSKirk McKusick MNT_VNODE_FOREACH_ACTIVE(vp, mp, mvp) { 148171469bb3SKirk McKusick if (vp->v_type == VNON) { 1482a988a5c6SKonstantin Belousov VI_UNLOCK(vp); 1483a988a5c6SKonstantin Belousov continue; 1484a988a5c6SKonstantin Belousov } 1485a988a5c6SKonstantin Belousov ip = VTOI(vp); 1486a988a5c6SKonstantin Belousov 1487a988a5c6SKonstantin Belousov /* 1488a988a5c6SKonstantin Belousov * The IN_ACCESS flag is converted to IN_MODIFIED by 1489a988a5c6SKonstantin Belousov * ufs_close() and ufs_getattr() by the calls to 1490ea573a50SKonstantin Belousov * ufs_itimes_locked(), without subsequent UFS_UPDATE(). 1491ea573a50SKonstantin Belousov * Test also all the other timestamp flags too, to pick up 1492ea573a50SKonstantin Belousov * any other cases that could be missed. 1493a988a5c6SKonstantin Belousov */ 14941eabd967SKonstantin Belousov if (!sync_doupdate(ip) && (vp->v_iflag & VI_OWEINACT) == 0) { 1495a988a5c6SKonstantin Belousov VI_UNLOCK(vp); 1496a988a5c6SKonstantin Belousov continue; 1497a988a5c6SKonstantin Belousov } 1498a988a5c6SKonstantin Belousov if ((error = vget(vp, LK_EXCLUSIVE | LK_NOWAIT | LK_INTERLOCK, 149971469bb3SKirk McKusick td)) != 0) 1500a988a5c6SKonstantin Belousov continue; 15011eabd967SKonstantin Belousov if (sync_doupdate(ip)) 1502a988a5c6SKonstantin Belousov error = ffs_update(vp, 0); 1503a988a5c6SKonstantin Belousov if (error != 0) 1504a988a5c6SKonstantin Belousov allerror = error; 1505a988a5c6SKonstantin Belousov vput(vp); 1506a988a5c6SKonstantin Belousov } 1507a988a5c6SKonstantin Belousov 1508a988a5c6SKonstantin Belousov qupdate: 1509a988a5c6SKonstantin Belousov #ifdef QUOTA 1510a988a5c6SKonstantin Belousov qsync(mp); 1511a988a5c6SKonstantin Belousov #endif 1512a988a5c6SKonstantin Belousov 1513a988a5c6SKonstantin Belousov if (VFSTOUFS(mp)->um_fs->fs_fmod != 0 && 1514a988a5c6SKonstantin Belousov (error = ffs_sbupdate(VFSTOUFS(mp), MNT_LAZY, 0)) != 0) 1515a988a5c6SKonstantin Belousov allerror = error; 1516a988a5c6SKonstantin Belousov return (allerror); 1517a988a5c6SKonstantin Belousov } 1518a988a5c6SKonstantin Belousov 1519a988a5c6SKonstantin Belousov /* 1520df8bae1dSRodney W. Grimes * Go through the disk queues to initiate sandbagged IO; 1521df8bae1dSRodney W. Grimes * go through the inodes to write those that have been modified; 1522df8bae1dSRodney W. Grimes * initiate the writing of the super block if it has been modified. 1523df8bae1dSRodney W. Grimes * 1524a988a5c6SKonstantin Belousov * Note: we are always called with the filesystem marked busy using 1525a988a5c6SKonstantin Belousov * vfs_busy(). 1526df8bae1dSRodney W. Grimes */ 1527adf41577SPoul-Henning Kamp static int 1528dfd233edSAttilio Rao ffs_sync(mp, waitfor) 1529df8bae1dSRodney W. Grimes struct mount *mp; 1530df8bae1dSRodney W. Grimes int waitfor; 1531df8bae1dSRodney W. Grimes { 153282be0a5aSTor Egge struct vnode *mvp, *vp, *devvp; 1533dfd233edSAttilio Rao struct thread *td; 1534996c772fSJohn Dyson struct inode *ip; 1535996c772fSJohn Dyson struct ufsmount *ump = VFSTOUFS(mp); 1536996c772fSJohn Dyson struct fs *fs; 153769baeadcSKonstantin Belousov int error, count, lockreq, allerror = 0; 1538791dd2faSTor Egge int suspend; 1539791dd2faSTor Egge int suspended; 1540791dd2faSTor Egge int secondary_writes; 1541791dd2faSTor Egge int secondary_accwrites; 1542791dd2faSTor Egge int softdep_deps; 1543791dd2faSTor Egge int softdep_accdeps; 1544156cb265SPoul-Henning Kamp struct bufobj *bo; 1545df8bae1dSRodney W. Grimes 154619c87af0SKirk McKusick suspend = 0; 154719c87af0SKirk McKusick suspended = 0; 1548dfd233edSAttilio Rao td = curthread; 1549df8bae1dSRodney W. Grimes fs = ump->um_fs; 1550b60ee81eSKirk McKusick if (fs->fs_fmod != 0 && fs->fs_ronly != 0 && ump->um_fsckpid == 0) 1551b60ee81eSKirk McKusick panic("%s: ffs_sync: modification on read-only filesystem", 1552b60ee81eSKirk McKusick fs->fs_fsmnt); 15534af9f77eSKonstantin Belousov if (waitfor == MNT_LAZY) { 15544af9f77eSKonstantin Belousov if (!rebooting) 1555a988a5c6SKonstantin Belousov return (ffs_sync_lazy(mp)); 15564af9f77eSKonstantin Belousov waitfor = MNT_NOWAIT; 15574af9f77eSKonstantin Belousov } 1558a988a5c6SKonstantin Belousov 155919c87af0SKirk McKusick /* 1560df8bae1dSRodney W. Grimes * Write back each (modified) inode. 1561df8bae1dSRodney W. Grimes */ 1562245df27cSMatthew Dillon lockreq = LK_EXCLUSIVE | LK_NOWAIT; 1563791dd2faSTor Egge if (waitfor == MNT_SUSPEND) { 1564791dd2faSTor Egge suspend = 1; 1565791dd2faSTor Egge waitfor = MNT_WAIT; 1566791dd2faSTor Egge } 156769baeadcSKonstantin Belousov if (waitfor == MNT_WAIT) 1568245df27cSMatthew Dillon lockreq = LK_EXCLUSIVE; 156941d4783dSJeff Roberson lockreq |= LK_INTERLOCK | LK_SLEEPFAIL; 1570df8bae1dSRodney W. Grimes loop: 1571791dd2faSTor Egge /* Grab snapshot of secondary write counts */ 157271469bb3SKirk McKusick MNT_ILOCK(mp); 1573791dd2faSTor Egge secondary_writes = mp->mnt_secondary_writes; 1574791dd2faSTor Egge secondary_accwrites = mp->mnt_secondary_accwrites; 157571469bb3SKirk McKusick MNT_IUNLOCK(mp); 1576791dd2faSTor Egge 1577791dd2faSTor Egge /* Grab snapshot of softdep dependency counts */ 1578791dd2faSTor Egge softdep_get_depcounts(mp, &softdep_deps, &softdep_accdeps); 1579791dd2faSTor Egge 158071469bb3SKirk McKusick MNT_VNODE_FOREACH_ALL(vp, mp, mvp) { 1581245df27cSMatthew Dillon /* 1582e0c17408SKonstantin Belousov * Depend on the vnode interlock to keep things stable enough 1583245df27cSMatthew Dillon * for a quick test. Since there might be hundreds of 1584245df27cSMatthew Dillon * thousands of vnodes, we cannot afford even a subroutine 1585245df27cSMatthew Dillon * call unless there's a good chance that we have work to do. 1586245df27cSMatthew Dillon */ 158771469bb3SKirk McKusick if (vp->v_type == VNON) { 15882f05568aSJeff Roberson VI_UNLOCK(vp); 15892f05568aSJeff Roberson continue; 15902f05568aSJeff Roberson } 1591df8bae1dSRodney W. Grimes ip = VTOI(vp); 159271469bb3SKirk McKusick if ((ip->i_flag & 1593cf60e8e4SKirk McKusick (IN_ACCESS | IN_CHANGE | IN_MODIFIED | IN_UPDATE)) == 0 && 159471469bb3SKirk McKusick vp->v_bufobj.bo_dirty.bv_cnt == 0) { 15952f05568aSJeff Roberson VI_UNLOCK(vp); 1596df8bae1dSRodney W. Grimes continue; 1597996c772fSJohn Dyson } 1598b40ce416SJulian Elischer if ((error = vget(vp, lockreq, td)) != 0) { 159982be0a5aSTor Egge if (error == ENOENT || error == ENOLCK) { 160071469bb3SKirk McKusick MNT_VNODE_FOREACH_ALL_ABORT(mp, mvp); 1601df8bae1dSRodney W. Grimes goto loop; 160282be0a5aSTor Egge } 16032f05568aSJeff Roberson continue; 16042f05568aSJeff Roberson } 160575a58389SKirk McKusick if ((error = ffs_syncvnode(vp, waitfor, 0)) != 0) 1606df8bae1dSRodney W. Grimes allerror = error; 160741d4783dSJeff Roberson vput(vp); 1608245df27cSMatthew Dillon } 1609df8bae1dSRodney W. Grimes /* 1610df8bae1dSRodney W. Grimes * Force stale filesystem control information to be flushed. 1611df8bae1dSRodney W. Grimes */ 16124af9f77eSKonstantin Belousov if (waitfor == MNT_WAIT || rebooting) { 1613b40ce416SJulian Elischer if ((error = softdep_flushworklist(ump->um_mountp, &count, td))) 16149b971133SKirk McKusick allerror = error; 16159b971133SKirk McKusick /* Flushed work items may create new vnodes to clean */ 161671469bb3SKirk McKusick if (allerror == 0 && count) 16179b971133SKirk McKusick goto loop; 16189b971133SKirk McKusick } 1619589c7af9SKirk McKusick #ifdef QUOTA 1620589c7af9SKirk McKusick qsync(mp); 1621589c7af9SKirk McKusick #endif 162219c87af0SKirk McKusick 1623112f7372SKirk McKusick devvp = ump->um_devvp; 1624156cb265SPoul-Henning Kamp bo = &devvp->v_bufobj; 1625698b1a66SJeff Roberson BO_LOCK(bo); 162619c87af0SKirk McKusick if (bo->bo_numoutput > 0 || bo->bo_dirty.bv_cnt > 0) { 1627698b1a66SJeff Roberson BO_UNLOCK(bo); 1628698b1a66SJeff Roberson vn_lock(devvp, LK_EXCLUSIVE | LK_RETRY); 16294af9f77eSKonstantin Belousov error = VOP_FSYNC(devvp, waitfor, td); 163022db15c0SAttilio Rao VOP_UNLOCK(devvp, 0); 16314af9f77eSKonstantin Belousov if (MOUNTEDSOFTDEP(mp) && (error == 0 || error == EAGAIN)) 16324af9f77eSKonstantin Belousov error = ffs_sbupdate(ump, waitfor, 0); 16334af9f77eSKonstantin Belousov if (error != 0) 16344af9f77eSKonstantin Belousov allerror = error; 163571469bb3SKirk McKusick if (allerror == 0 && waitfor == MNT_WAIT) 1636112f7372SKirk McKusick goto loop; 1637791dd2faSTor Egge } else if (suspend != 0) { 1638791dd2faSTor Egge if (softdep_check_suspend(mp, 1639791dd2faSTor Egge devvp, 1640791dd2faSTor Egge softdep_deps, 1641791dd2faSTor Egge softdep_accdeps, 1642791dd2faSTor Egge secondary_writes, 164371469bb3SKirk McKusick secondary_accwrites) != 0) { 164471469bb3SKirk McKusick MNT_IUNLOCK(mp); 1645791dd2faSTor Egge goto loop; /* More work needed */ 164671469bb3SKirk McKusick } 1647791dd2faSTor Egge mtx_assert(MNT_MTX(mp), MA_OWNED); 1648ca2fa807STor Egge mp->mnt_kern_flag |= MNTK_SUSPEND2 | MNTK_SUSPENDED; 1649791dd2faSTor Egge MNT_IUNLOCK(mp); 1650791dd2faSTor Egge suspended = 1; 1651112f7372SKirk McKusick } else 1652698b1a66SJeff Roberson BO_UNLOCK(bo); 1653996c772fSJohn Dyson /* 1654996c772fSJohn Dyson * Write back modified superblock. 1655996c772fSJohn Dyson */ 1656791dd2faSTor Egge if (fs->fs_fmod != 0 && 1657791dd2faSTor Egge (error = ffs_sbupdate(ump, waitfor, suspended)) != 0) 1658996c772fSJohn Dyson allerror = error; 1659df8bae1dSRodney W. Grimes return (allerror); 1660df8bae1dSRodney W. Grimes } 1661df8bae1dSRodney W. Grimes 1662df8bae1dSRodney W. Grimes int 1663a0595d02SKirk McKusick ffs_vget(mp, ino, flags, vpp) 1664df8bae1dSRodney W. Grimes struct mount *mp; 1665df8bae1dSRodney W. Grimes ino_t ino; 1666a0595d02SKirk McKusick int flags; 1667df8bae1dSRodney W. Grimes struct vnode **vpp; 1668df8bae1dSRodney W. Grimes { 16697b7ed832SKonstantin Belousov return (ffs_vgetf(mp, ino, flags, vpp, 0)); 16707b7ed832SKonstantin Belousov } 16717b7ed832SKonstantin Belousov 16727b7ed832SKonstantin Belousov int 16737b7ed832SKonstantin Belousov ffs_vgetf(mp, ino, flags, vpp, ffs_flags) 16747b7ed832SKonstantin Belousov struct mount *mp; 16757b7ed832SKonstantin Belousov ino_t ino; 16767b7ed832SKonstantin Belousov int flags; 16777b7ed832SKonstantin Belousov struct vnode **vpp; 16787b7ed832SKonstantin Belousov int ffs_flags; 16797b7ed832SKonstantin Belousov { 1680996c772fSJohn Dyson struct fs *fs; 1681996c772fSJohn Dyson struct inode *ip; 1682df8bae1dSRodney W. Grimes struct ufsmount *ump; 1683df8bae1dSRodney W. Grimes struct buf *bp; 1684df8bae1dSRodney W. Grimes struct vnode *vp; 1685f576a00dSSemen Ustimenko int error; 1686df8bae1dSRodney W. Grimes 168751f5ce0cSPoul-Henning Kamp error = vfs_hash_get(mp, ino, flags, curthread, vpp, NULL, NULL); 1688e82ef95cSPoul-Henning Kamp if (error || *vpp != NULL) 168914bc0685SPoul-Henning Kamp return (error); 1690f576a00dSSemen Ustimenko 1691f576a00dSSemen Ustimenko /* 1692d6919865SJeff Roberson * We must promote to an exclusive lock for vnode creation. This 1693d6919865SJeff Roberson * can happen if lookup is passed LOCKSHARED. 1694d6919865SJeff Roberson */ 1695d6919865SJeff Roberson if ((flags & LK_TYPE_MASK) == LK_SHARED) { 1696d6919865SJeff Roberson flags &= ~LK_TYPE_MASK; 1697d6919865SJeff Roberson flags |= LK_EXCLUSIVE; 1698d6919865SJeff Roberson } 1699d6919865SJeff Roberson 1700d6919865SJeff Roberson /* 170113866b3fSSemen Ustimenko * We do not lock vnode creation as it is believed to be too 1702f576a00dSSemen Ustimenko * expensive for such rare case as simultaneous creation of vnode 1703f576a00dSSemen Ustimenko * for same ino by different processes. We just allow them to race 1704f576a00dSSemen Ustimenko * and check later to decide who wins. Let the race begin! 1705f576a00dSSemen Ustimenko */ 170614bc0685SPoul-Henning Kamp 170714bc0685SPoul-Henning Kamp ump = VFSTOUFS(mp); 170814bc0685SPoul-Henning Kamp fs = ump->um_fs; 170914bc0685SPoul-Henning Kamp ip = uma_zalloc(uma_inode, M_WAITOK | M_ZERO); 17102f9bae59SDavid Greenman 1711df8bae1dSRodney W. Grimes /* Allocate a new vnode/inode. */ 171243a993bbSKirk McKusick error = getnewvnode("ufs", mp, fs->fs_magic == FS_UFS1_MAGIC ? 171343a993bbSKirk McKusick &ffs_vnodeops1 : &ffs_vnodeops2, &vp); 1714c9671602SPoul-Henning Kamp if (error) { 1715df8bae1dSRodney W. Grimes *vpp = NULL; 1716aa4d7a8aSPoul-Henning Kamp uma_zfree(uma_inode, ip); 1717df8bae1dSRodney W. Grimes return (error); 1718df8bae1dSRodney W. Grimes } 171967e87166SBoris Popov /* 172033fc3625SJohn Baldwin * FFS supports recursive locking. 172167e87166SBoris Popov */ 17223634d5b2SJohn Baldwin lockmgr(vp->v_vnlock, LK_EXCLUSIVE, NULL); 1723628f51d2SAttilio Rao VN_LOCK_AREC(vp); 1724df8bae1dSRodney W. Grimes vp->v_data = ip; 17255d9d81e7SPoul-Henning Kamp vp->v_bufobj.bo_bsize = fs->fs_bsize; 1726df8bae1dSRodney W. Grimes ip->i_vnode = vp; 17271c85e6a3SKirk McKusick ip->i_ump = ump; 1728df8bae1dSRodney W. Grimes ip->i_number = ino; 1729e65f5a4eSKonstantin Belousov ip->i_ea_refs = 0; 173074a87c38SKirk McKusick ip->i_nextclustercg = -1; 1731e1db6897SKonstantin Belousov ip->i_flag = fs->fs_magic == FS_UFS1_MAGIC ? 0 : IN_UFS2; 1732df8bae1dSRodney W. Grimes #ifdef QUOTA 1733c1d9efcbSPoul-Henning Kamp { 1734c1d9efcbSPoul-Henning Kamp int i; 1735df8bae1dSRodney W. Grimes for (i = 0; i < MAXQUOTAS; i++) 1736df8bae1dSRodney W. Grimes ip->i_dquot[i] = NODQUOT; 1737c1d9efcbSPoul-Henning Kamp } 1738df8bae1dSRodney W. Grimes #endif 1739df8bae1dSRodney W. Grimes 17407b7ed832SKonstantin Belousov if (ffs_flags & FFSV_FORCEINSMQ) 17417b7ed832SKonstantin Belousov vp->v_vflag |= VV_FORCEINSMQ; 174261b9d89fSTor Egge error = insmntque(vp, mp); 174361b9d89fSTor Egge if (error != 0) { 17446cc745d2SKonstantin Belousov uma_zfree(uma_inode, ip); 174561b9d89fSTor Egge *vpp = NULL; 174661b9d89fSTor Egge return (error); 174761b9d89fSTor Egge } 17487b7ed832SKonstantin Belousov vp->v_vflag &= ~VV_FORCEINSMQ; 1749a80d8caaSPawel Jakub Dawidek error = vfs_hash_insert(vp, ino, flags, curthread, vpp, NULL, NULL); 175045c26fa2SPoul-Henning Kamp if (error || *vpp != NULL) 1751f576a00dSSemen Ustimenko return (error); 1752f576a00dSSemen Ustimenko 1753df8bae1dSRodney W. Grimes /* Read in the disk contents for the inode, copy into the inode. */ 1754c9671602SPoul-Henning Kamp error = bread(ump->um_devvp, fsbtodb(fs, ino_to_fsba(fs, ino)), 1755c9671602SPoul-Henning Kamp (int)fs->fs_bsize, NOCRED, &bp); 1756c9671602SPoul-Henning Kamp if (error) { 1757df8bae1dSRodney W. Grimes /* 1758df8bae1dSRodney W. Grimes * The inode does not contain anything useful, so it would 1759df8bae1dSRodney W. Grimes * be misleading to leave it on its hash chain. With mode 1760df8bae1dSRodney W. Grimes * still zero, it will be unlinked and returned to the free 1761df8bae1dSRodney W. Grimes * list by vput(). 1762df8bae1dSRodney W. Grimes */ 1763df8bae1dSRodney W. Grimes brelse(bp); 1764bd7e5f99SJohn Dyson vput(vp); 1765df8bae1dSRodney W. Grimes *vpp = NULL; 1766df8bae1dSRodney W. Grimes return (error); 1767df8bae1dSRodney W. Grimes } 1768e1db6897SKonstantin Belousov if (I_IS_UFS1(ip)) 1769a163d034SWarner Losh ip->i_din1 = uma_zalloc(uma_ufs1, M_WAITOK); 1770de6ba7c0SPoul-Henning Kamp else 1771a163d034SWarner Losh ip->i_din2 = uma_zalloc(uma_ufs2, M_WAITOK); 1772de6ba7c0SPoul-Henning Kamp ffs_load_inode(bp, ip, fs, ino); 1773b1897c19SJulian Elischer if (DOINGSOFTDEP(vp)) 1774b1897c19SJulian Elischer softdep_load_inodeblock(ip); 1775b1897c19SJulian Elischer else 1776b1897c19SJulian Elischer ip->i_effnlink = ip->i_nlink; 1777bd7e5f99SJohn Dyson bqrelse(bp); 1778df8bae1dSRodney W. Grimes 1779df8bae1dSRodney W. Grimes /* 1780df8bae1dSRodney W. Grimes * Initialize the vnode from the inode, check for aliases. 1781df8bae1dSRodney W. Grimes * Note that the underlying vnode may have changed. 1782df8bae1dSRodney W. Grimes */ 1783e1db6897SKonstantin Belousov error = ufs_vinit(mp, I_IS_UFS1(ip) ? &ffs_fifoops1 : &ffs_fifoops2, 1784e1db6897SKonstantin Belousov &vp); 1785c9671602SPoul-Henning Kamp if (error) { 1786df8bae1dSRodney W. Grimes vput(vp); 1787df8bae1dSRodney W. Grimes *vpp = NULL; 1788df8bae1dSRodney W. Grimes return (error); 1789df8bae1dSRodney W. Grimes } 1790de68347bSPoul-Henning Kamp 1791df8bae1dSRodney W. Grimes /* 17925c24d6eeSPoul-Henning Kamp * Finish inode initialization. 1793df8bae1dSRodney W. Grimes */ 179433fc3625SJohn Baldwin if (vp->v_type != VFIFO) { 179533fc3625SJohn Baldwin /* FFS supports shared locking for all files except fifos. */ 179633fc3625SJohn Baldwin VN_LOCK_ASHARE(vp); 179733fc3625SJohn Baldwin } 1798de68347bSPoul-Henning Kamp 1799df8bae1dSRodney W. Grimes /* 1800df8bae1dSRodney W. Grimes * Set up a generation number for this inode if it does not 1801df8bae1dSRodney W. Grimes * already have one. This should only happen on old filesystems. 1802df8bae1dSRodney W. Grimes */ 1803df8bae1dSRodney W. Grimes if (ip->i_gen == 0) { 180457d2ac2fSKevin Lo while (ip->i_gen == 0) 180557d2ac2fSKevin Lo ip->i_gen = arc4random(); 18061c85e6a3SKirk McKusick if ((vp->v_mount->mnt_flag & MNT_RDONLY) == 0) { 1807df8bae1dSRodney W. Grimes ip->i_flag |= IN_MODIFIED; 1808b403319bSAlexander Kabaev DIP_SET(ip, i_gen, ip->i_gen); 18091c85e6a3SKirk McKusick } 1810df8bae1dSRodney W. Grimes } 1811763bbd2fSRobert Watson #ifdef MAC 1812763bbd2fSRobert Watson if ((mp->mnt_flag & MNT_MULTILABEL) && ip->i_mode) { 1813763bbd2fSRobert Watson /* 1814763bbd2fSRobert Watson * If this vnode is already allocated, and we're running 1815763bbd2fSRobert Watson * multi-label, attempt to perform a label association 1816763bbd2fSRobert Watson * from the extended attributes on the inode. 1817763bbd2fSRobert Watson */ 181830d239bcSRobert Watson error = mac_vnode_associate_extattr(mp, vp); 1819763bbd2fSRobert Watson if (error) { 1820763bbd2fSRobert Watson /* ufs_inactive will release ip->i_devvp ref. */ 1821763bbd2fSRobert Watson vput(vp); 1822763bbd2fSRobert Watson *vpp = NULL; 1823763bbd2fSRobert Watson return (error); 1824763bbd2fSRobert Watson } 1825763bbd2fSRobert Watson } 1826763bbd2fSRobert Watson #endif 1827763bbd2fSRobert Watson 1828df8bae1dSRodney W. Grimes *vpp = vp; 1829df8bae1dSRodney W. Grimes return (0); 1830df8bae1dSRodney W. Grimes } 1831df8bae1dSRodney W. Grimes 1832df8bae1dSRodney W. Grimes /* 1833df8bae1dSRodney W. Grimes * File handle to vnode 1834df8bae1dSRodney W. Grimes * 1835df8bae1dSRodney W. Grimes * Have to be really careful about stale file handles: 1836df8bae1dSRodney W. Grimes * - check that the inode number is valid 1837abe53f7eSKirk McKusick * - for UFS2 check that the inode number is initialized 1838df8bae1dSRodney W. Grimes * - call ffs_vget() to get the locked inode 1839df8bae1dSRodney W. Grimes * - check for an unallocated inode (i_mode == 0) 1840df8bae1dSRodney W. Grimes * - check that the given client host has export rights and return 1841df8bae1dSRodney W. Grimes * those rights via. exflagsp and credanonp 1842df8bae1dSRodney W. Grimes */ 1843adf41577SPoul-Henning Kamp static int 1844694a586aSRick Macklem ffs_fhtovp(mp, fhp, flags, vpp) 184505f4ff5dSPoul-Henning Kamp struct mount *mp; 1846df8bae1dSRodney W. Grimes struct fid *fhp; 1847694a586aSRick Macklem int flags; 1848df8bae1dSRodney W. Grimes struct vnode **vpp; 1849df8bae1dSRodney W. Grimes { 185005f4ff5dSPoul-Henning Kamp struct ufid *ufhp; 1851abe53f7eSKirk McKusick struct ufsmount *ump; 1852df8bae1dSRodney W. Grimes struct fs *fs; 1853abe53f7eSKirk McKusick struct cg *cgp; 1854abe53f7eSKirk McKusick struct buf *bp; 1855abe53f7eSKirk McKusick ino_t ino; 1856abe53f7eSKirk McKusick u_int cg; 1857abe53f7eSKirk McKusick int error; 1858df8bae1dSRodney W. Grimes 1859df8bae1dSRodney W. Grimes ufhp = (struct ufid *)fhp; 1860abe53f7eSKirk McKusick ino = ufhp->ufid_ino; 1861abe53f7eSKirk McKusick ump = VFSTOUFS(mp); 1862abe53f7eSKirk McKusick fs = ump->um_fs; 18631dc349abSEd Maste if (ino < UFS_ROOTINO || ino >= fs->fs_ncg * fs->fs_ipg) 1864df8bae1dSRodney W. Grimes return (ESTALE); 1865abe53f7eSKirk McKusick /* 1866abe53f7eSKirk McKusick * Need to check if inode is initialized because UFS2 does lazy 1867abe53f7eSKirk McKusick * initialization and nfs_fhtovp can offer arbitrary inode numbers. 1868abe53f7eSKirk McKusick */ 1869abe53f7eSKirk McKusick if (fs->fs_magic != FS_UFS2_MAGIC) 1870abe53f7eSKirk McKusick return (ufs_fhtovp(mp, ufhp, flags, vpp)); 1871abe53f7eSKirk McKusick cg = ino_to_cg(fs, ino); 18729c4f551eSKirk McKusick if ((error = ffs_getcg(fs, ump->um_devvp, cg, &bp, &cgp)) != 0) 1873abe53f7eSKirk McKusick return (error); 18749c4f551eSKirk McKusick if (ino >= cg * fs->fs_ipg + cgp->cg_initediblk) { 1875abe53f7eSKirk McKusick brelse(bp); 1876abe53f7eSKirk McKusick return (ESTALE); 1877abe53f7eSKirk McKusick } 1878abe53f7eSKirk McKusick brelse(bp); 1879694a586aSRick Macklem return (ufs_fhtovp(mp, ufhp, flags, vpp)); 1880df8bae1dSRodney W. Grimes } 1881df8bae1dSRodney W. Grimes 1882df8bae1dSRodney W. Grimes /* 18835346934fSIan Dowse * Initialize the filesystem. 1884996c772fSJohn Dyson */ 1885996c772fSJohn Dyson static int 1886996c772fSJohn Dyson ffs_init(vfsp) 1887996c772fSJohn Dyson struct vfsconf *vfsp; 1888996c772fSJohn Dyson { 1889996c772fSJohn Dyson 18901848286aSEdward Tomasz Napierala ffs_susp_initialize(); 1891b1897c19SJulian Elischer softdep_initialize(); 1892996c772fSJohn Dyson return (ufs_init(vfsp)); 1893996c772fSJohn Dyson } 1894996c772fSJohn Dyson 1895996c772fSJohn Dyson /* 18965346934fSIan Dowse * Undo the work of ffs_init(). 18975346934fSIan Dowse */ 18985346934fSIan Dowse static int 18995346934fSIan Dowse ffs_uninit(vfsp) 19005346934fSIan Dowse struct vfsconf *vfsp; 19015346934fSIan Dowse { 19025346934fSIan Dowse int ret; 19035346934fSIan Dowse 19045346934fSIan Dowse ret = ufs_uninit(vfsp); 19055346934fSIan Dowse softdep_uninitialize(); 19061848286aSEdward Tomasz Napierala ffs_susp_uninitialize(); 19075346934fSIan Dowse return (ret); 19085346934fSIan Dowse } 19095346934fSIan Dowse 19105346934fSIan Dowse /* 1911df8bae1dSRodney W. Grimes * Write a superblock and associated information back to disk. 1912df8bae1dSRodney W. Grimes */ 19131a60c7fcSPawel Jakub Dawidek int 1914927a12aeSKirk McKusick ffs_sbupdate(ump, waitfor, suspended) 1915927a12aeSKirk McKusick struct ufsmount *ump; 1916df8bae1dSRodney W. Grimes int waitfor; 1917791dd2faSTor Egge int suspended; 1918df8bae1dSRodney W. Grimes { 1919927a12aeSKirk McKusick struct fs *fs = ump->um_fs; 19203ba649d7SJeff Roberson struct buf *sbbp; 192105f4ff5dSPoul-Henning Kamp struct buf *bp; 1922df8bae1dSRodney W. Grimes int blks; 1923f55ff3f3SIan Dowse void *space; 1924996c772fSJohn Dyson int i, size, error, allerror = 0; 1925df8bae1dSRodney W. Grimes 192674f3809aSKirk McKusick if (fs->fs_ronly == 1 && 1927927a12aeSKirk McKusick (ump->um_mountp->mnt_flag & (MNT_RDONLY | MNT_UPDATE)) != 1928927a12aeSKirk McKusick (MNT_RDONLY | MNT_UPDATE) && ump->um_fsckpid == 0) 192974f3809aSKirk McKusick panic("ffs_sbupdate: write read-only filesystem"); 1930996c772fSJohn Dyson /* 19313ba649d7SJeff Roberson * We use the superblock's buf to serialize calls to ffs_sbupdate(). 19323ba649d7SJeff Roberson */ 1933927a12aeSKirk McKusick sbbp = getblk(ump->um_devvp, btodb(fs->fs_sblockloc), 1934927a12aeSKirk McKusick (int)fs->fs_sbsize, 0, 0, 0); 19353ba649d7SJeff Roberson /* 1936996c772fSJohn Dyson * First write back the summary information. 1937996c772fSJohn Dyson */ 1938df8bae1dSRodney W. Grimes blks = howmany(fs->fs_cssize, fs->fs_fsize); 1939f55ff3f3SIan Dowse space = fs->fs_csp; 1940df8bae1dSRodney W. Grimes for (i = 0; i < blks; i += fs->fs_frag) { 1941df8bae1dSRodney W. Grimes size = fs->fs_bsize; 1942df8bae1dSRodney W. Grimes if (i + fs->fs_frag > blks) 1943df8bae1dSRodney W. Grimes size = (blks - i) * fs->fs_fsize; 1944927a12aeSKirk McKusick bp = getblk(ump->um_devvp, fsbtodb(fs, fs->fs_csaddr + i), 19457261f5f6SJeff Roberson size, 0, 0, 0); 1946df8bae1dSRodney W. Grimes bcopy(space, bp->b_data, (u_int)size); 1947f55ff3f3SIan Dowse space = (char *)space + size; 1948791dd2faSTor Egge if (suspended) 1949791dd2faSTor Egge bp->b_flags |= B_VALIDSUSPWRT; 1950996c772fSJohn Dyson if (waitfor != MNT_WAIT) 1951df8bae1dSRodney W. Grimes bawrite(bp); 19528aef1712SMatthew Dillon else if ((error = bwrite(bp)) != 0) 1953996c772fSJohn Dyson allerror = error; 1954df8bae1dSRodney W. Grimes } 1955996c772fSJohn Dyson /* 1956996c772fSJohn Dyson * Now write back the superblock itself. If any errors occurred 1957996c772fSJohn Dyson * up to this point, then fail so that the superblock avoids 1958996c772fSJohn Dyson * being written out as clean. 1959996c772fSJohn Dyson */ 19603ba649d7SJeff Roberson if (allerror) { 19613ba649d7SJeff Roberson brelse(sbbp); 1962996c772fSJohn Dyson return (allerror); 19633ba649d7SJeff Roberson } 19643ba649d7SJeff Roberson bp = sbbp; 196531574422SKirk McKusick if (fs->fs_magic == FS_UFS1_MAGIC && fs->fs_sblockloc != SBLOCK_UFS1 && 1966e9838c11SJohn-Mark Gurney (fs->fs_old_flags & FS_FLAGS_UPDATED) == 0) { 1967b60ee81eSKirk McKusick printf("WARNING: %s: correcting fs_sblockloc from %jd to %d\n", 1968fa5d33e2SKirk McKusick fs->fs_fsmnt, fs->fs_sblockloc, SBLOCK_UFS1); 1969fa5d33e2SKirk McKusick fs->fs_sblockloc = SBLOCK_UFS1; 1970fa5d33e2SKirk McKusick } 197131574422SKirk McKusick if (fs->fs_magic == FS_UFS2_MAGIC && fs->fs_sblockloc != SBLOCK_UFS2 && 1972e9838c11SJohn-Mark Gurney (fs->fs_old_flags & FS_FLAGS_UPDATED) == 0) { 1973b60ee81eSKirk McKusick printf("WARNING: %s: correcting fs_sblockloc from %jd to %d\n", 1974fa5d33e2SKirk McKusick fs->fs_fsmnt, fs->fs_sblockloc, SBLOCK_UFS2); 1975fa5d33e2SKirk McKusick fs->fs_sblockloc = SBLOCK_UFS2; 1976fa5d33e2SKirk McKusick } 1977b1897c19SJulian Elischer fs->fs_fmod = 0; 1978227ee8a1SPoul-Henning Kamp fs->fs_time = time_second; 1979519e3c3bSKirk McKusick if (MOUNTEDSOFTDEP(ump->um_mountp)) 1980927a12aeSKirk McKusick softdep_setup_sbupdate(ump, (struct fs *)bp->b_data, bp); 1981996c772fSJohn Dyson bcopy((caddr_t)fs, bp->b_data, (u_int)fs->fs_sbsize); 1982927a12aeSKirk McKusick ffs_oldfscompat_write((struct fs *)bp->b_data, ump); 1983791dd2faSTor Egge if (suspended) 1984791dd2faSTor Egge bp->b_flags |= B_VALIDSUSPWRT; 1985996c772fSJohn Dyson if (waitfor != MNT_WAIT) 1986996c772fSJohn Dyson bawrite(bp); 19878aef1712SMatthew Dillon else if ((error = bwrite(bp)) != 0) 1988996c772fSJohn Dyson allerror = error; 1989996c772fSJohn Dyson return (allerror); 1990df8bae1dSRodney W. Grimes } 1991d6fe88e4SPoul-Henning Kamp 1992d6fe88e4SPoul-Henning Kamp static int 1993d6fe88e4SPoul-Henning Kamp ffs_extattrctl(struct mount *mp, int cmd, struct vnode *filename_vp, 1994dfd233edSAttilio Rao int attrnamespace, const char *attrname) 1995d6fe88e4SPoul-Henning Kamp { 1996d6fe88e4SPoul-Henning Kamp 1997d6fe88e4SPoul-Henning Kamp #ifdef UFS_EXTATTR 1998d6fe88e4SPoul-Henning Kamp return (ufs_extattrctl(mp, cmd, filename_vp, attrnamespace, 1999dfd233edSAttilio Rao attrname)); 2000d6fe88e4SPoul-Henning Kamp #else 2001d6fe88e4SPoul-Henning Kamp return (vfs_stdextattrctl(mp, cmd, filename_vp, attrnamespace, 2002dfd233edSAttilio Rao attrname)); 2003d6fe88e4SPoul-Henning Kamp #endif 2004d6fe88e4SPoul-Henning Kamp } 2005975512a9SPoul-Henning Kamp 2006975512a9SPoul-Henning Kamp static void 2007975512a9SPoul-Henning Kamp ffs_ifree(struct ufsmount *ump, struct inode *ip) 2008975512a9SPoul-Henning Kamp { 2009975512a9SPoul-Henning Kamp 201036329289STim J. Robbins if (ump->um_fstype == UFS1 && ip->i_din1 != NULL) 2011aa4d7a8aSPoul-Henning Kamp uma_zfree(uma_ufs1, ip->i_din1); 201236329289STim J. Robbins else if (ip->i_din2 != NULL) 20138d721e87STim J. Robbins uma_zfree(uma_ufs2, ip->i_din2); 2014aa4d7a8aSPoul-Henning Kamp uma_zfree(uma_inode, ip); 2015975512a9SPoul-Henning Kamp } 20166e77a041SPoul-Henning Kamp 2017dd19a799SPoul-Henning Kamp static int dobkgrdwrite = 1; 2018dd19a799SPoul-Henning Kamp SYSCTL_INT(_debug, OID_AUTO, dobkgrdwrite, CTLFLAG_RW, &dobkgrdwrite, 0, 2019dd19a799SPoul-Henning Kamp "Do background writes (honoring the BV_BKGRDWRITE flag)?"); 2020dd19a799SPoul-Henning Kamp 2021dd19a799SPoul-Henning Kamp /* 2022dd19a799SPoul-Henning Kamp * Complete a background write started from bwrite. 2023dd19a799SPoul-Henning Kamp */ 2024dd19a799SPoul-Henning Kamp static void 2025dd19a799SPoul-Henning Kamp ffs_backgroundwritedone(struct buf *bp) 2026dd19a799SPoul-Henning Kamp { 2027204ec66dSJeff Roberson struct bufobj *bufobj; 2028dd19a799SPoul-Henning Kamp struct buf *origbp; 2029dd19a799SPoul-Henning Kamp 2030dd19a799SPoul-Henning Kamp /* 2031dd19a799SPoul-Henning Kamp * Find the original buffer that we are writing. 2032dd19a799SPoul-Henning Kamp */ 2033204ec66dSJeff Roberson bufobj = bp->b_bufobj; 2034204ec66dSJeff Roberson BO_LOCK(bufobj); 2035dd19a799SPoul-Henning Kamp if ((origbp = gbincore(bp->b_bufobj, bp->b_lblkno)) == NULL) 2036dd19a799SPoul-Henning Kamp panic("backgroundwritedone: lost buffer"); 2037b2c3df84SKonstantin Belousov 2038b2c3df84SKonstantin Belousov /* 2039b2c3df84SKonstantin Belousov * We should mark the cylinder group buffer origbp as 2040b2c3df84SKonstantin Belousov * dirty, to not loose the failed write. 2041b2c3df84SKonstantin Belousov */ 2042b2c3df84SKonstantin Belousov if ((bp->b_ioflags & BIO_ERROR) != 0) 2043b2c3df84SKonstantin Belousov origbp->b_vflags |= BV_BKGRDERR; 2044204ec66dSJeff Roberson BO_UNLOCK(bufobj); 2045dd19a799SPoul-Henning Kamp /* 2046dd19a799SPoul-Henning Kamp * Process dependencies then return any unfinished ones. 2047dd19a799SPoul-Henning Kamp */ 2048b2c3df84SKonstantin Belousov if (!LIST_EMPTY(&bp->b_dep) && (bp->b_ioflags & BIO_ERROR) == 0) 2049dd19a799SPoul-Henning Kamp buf_complete(bp); 2050dd19a799SPoul-Henning Kamp #ifdef SOFTUPDATES 205104533fc6SXin LI if (!LIST_EMPTY(&bp->b_dep)) 2052dd19a799SPoul-Henning Kamp softdep_move_dependencies(bp, origbp); 2053dd19a799SPoul-Henning Kamp #endif 2054dd19a799SPoul-Henning Kamp /* 2055204ec66dSJeff Roberson * This buffer is marked B_NOCACHE so when it is released 2056204ec66dSJeff Roberson * by biodone it will be tossed. 2057dd19a799SPoul-Henning Kamp */ 2058dd19a799SPoul-Henning Kamp bp->b_flags |= B_NOCACHE; 2059ec9c9e73SAlan Cox bp->b_flags &= ~B_CACHE; 2060*377f88fbSKonstantin Belousov pbrelvp(bp); 2061b2c3df84SKonstantin Belousov 2062b2c3df84SKonstantin Belousov /* 2063b2c3df84SKonstantin Belousov * Prevent brelse() from trying to keep and re-dirtying bp on 2064b2c3df84SKonstantin Belousov * errors. It causes b_bufobj dereference in 2065b2c3df84SKonstantin Belousov * bdirty()/reassignbuf(), and b_bufobj was cleared in 2066b2c3df84SKonstantin Belousov * pbrelvp() above. 2067b2c3df84SKonstantin Belousov */ 2068b2c3df84SKonstantin Belousov if ((bp->b_ioflags & BIO_ERROR) != 0) 2069b2c3df84SKonstantin Belousov bp->b_flags |= B_INVAL; 2070dd19a799SPoul-Henning Kamp bufdone(bp); 2071204ec66dSJeff Roberson BO_LOCK(bufobj); 2072dd19a799SPoul-Henning Kamp /* 2073dd19a799SPoul-Henning Kamp * Clear the BV_BKGRDINPROG flag in the original buffer 2074dd19a799SPoul-Henning Kamp * and awaken it if it is waiting for the write to complete. 2075dd19a799SPoul-Henning Kamp * If BV_BKGRDINPROG is not set in the original buffer it must 2076dd19a799SPoul-Henning Kamp * have been released and re-instantiated - which is not legal. 2077dd19a799SPoul-Henning Kamp */ 2078dd19a799SPoul-Henning Kamp KASSERT((origbp->b_vflags & BV_BKGRDINPROG), 2079dd19a799SPoul-Henning Kamp ("backgroundwritedone: lost buffer2")); 2080dd19a799SPoul-Henning Kamp origbp->b_vflags &= ~BV_BKGRDINPROG; 2081dd19a799SPoul-Henning Kamp if (origbp->b_vflags & BV_BKGRDWAIT) { 2082dd19a799SPoul-Henning Kamp origbp->b_vflags &= ~BV_BKGRDWAIT; 2083dd19a799SPoul-Henning Kamp wakeup(&origbp->b_xflags); 2084dd19a799SPoul-Henning Kamp } 2085204ec66dSJeff Roberson BO_UNLOCK(bufobj); 2086dd19a799SPoul-Henning Kamp } 2087dd19a799SPoul-Henning Kamp 2088dd19a799SPoul-Henning Kamp 2089dd19a799SPoul-Henning Kamp /* 2090dd19a799SPoul-Henning Kamp * Write, release buffer on completion. (Done by iodone 2091dd19a799SPoul-Henning Kamp * if async). Do not bother writing anything if the buffer 2092dd19a799SPoul-Henning Kamp * is invalid. 2093dd19a799SPoul-Henning Kamp * 2094dd19a799SPoul-Henning Kamp * Note that we set B_CACHE here, indicating that buffer is 2095dd19a799SPoul-Henning Kamp * fully valid and thus cacheable. This is true even of NFS 2096dd19a799SPoul-Henning Kamp * now so we set it generally. This could be set either here 2097dd19a799SPoul-Henning Kamp * or in biodone() since the I/O is synchronous. We put it 2098dd19a799SPoul-Henning Kamp * here. 2099dd19a799SPoul-Henning Kamp */ 2100dd19a799SPoul-Henning Kamp static int 2101dd19a799SPoul-Henning Kamp ffs_bufwrite(struct buf *bp) 2102dd19a799SPoul-Henning Kamp { 2103dd19a799SPoul-Henning Kamp struct buf *newbp; 2104dd19a799SPoul-Henning Kamp 2105dd19a799SPoul-Henning Kamp CTR3(KTR_BUF, "bufwrite(%p) vp %p flags %X", bp, bp->b_vp, bp->b_flags); 2106dd19a799SPoul-Henning Kamp if (bp->b_flags & B_INVAL) { 2107dd19a799SPoul-Henning Kamp brelse(bp); 2108dd19a799SPoul-Henning Kamp return (0); 2109dd19a799SPoul-Henning Kamp } 2110dd19a799SPoul-Henning Kamp 2111d638e093SAttilio Rao if (!BUF_ISLOCKED(bp)) 2112dd19a799SPoul-Henning Kamp panic("bufwrite: buffer is not busy???"); 2113dd19a799SPoul-Henning Kamp /* 2114dd19a799SPoul-Henning Kamp * If a background write is already in progress, delay 2115dd19a799SPoul-Henning Kamp * writing this block if it is asynchronous. Otherwise 2116dd19a799SPoul-Henning Kamp * wait for the background write to complete. 2117dd19a799SPoul-Henning Kamp */ 2118dd19a799SPoul-Henning Kamp BO_LOCK(bp->b_bufobj); 2119dd19a799SPoul-Henning Kamp if (bp->b_vflags & BV_BKGRDINPROG) { 2120dd19a799SPoul-Henning Kamp if (bp->b_flags & B_ASYNC) { 2121dd19a799SPoul-Henning Kamp BO_UNLOCK(bp->b_bufobj); 2122dd19a799SPoul-Henning Kamp bdwrite(bp); 2123dd19a799SPoul-Henning Kamp return (0); 2124dd19a799SPoul-Henning Kamp } 2125dd19a799SPoul-Henning Kamp bp->b_vflags |= BV_BKGRDWAIT; 212622a72260SJeff Roberson msleep(&bp->b_xflags, BO_LOCKPTR(bp->b_bufobj), PRIBIO, 212722a72260SJeff Roberson "bwrbg", 0); 2128dd19a799SPoul-Henning Kamp if (bp->b_vflags & BV_BKGRDINPROG) 2129dd19a799SPoul-Henning Kamp panic("bufwrite: still writing"); 2130dd19a799SPoul-Henning Kamp } 2131b2c3df84SKonstantin Belousov bp->b_vflags &= ~BV_BKGRDERR; 2132dd19a799SPoul-Henning Kamp BO_UNLOCK(bp->b_bufobj); 2133dd19a799SPoul-Henning Kamp 2134dd19a799SPoul-Henning Kamp /* 2135dd19a799SPoul-Henning Kamp * If this buffer is marked for background writing and we 2136dd19a799SPoul-Henning Kamp * do not have to wait for it, make a copy and write the 2137dd19a799SPoul-Henning Kamp * copy so as to leave this buffer ready for further use. 2138dd19a799SPoul-Henning Kamp * 2139dd19a799SPoul-Henning Kamp * This optimization eats a lot of memory. If we have a page 2140dd19a799SPoul-Henning Kamp * or buffer shortfall we can't do it. 2141dd19a799SPoul-Henning Kamp */ 2142dd19a799SPoul-Henning Kamp if (dobkgrdwrite && (bp->b_xflags & BX_BKGRDWRITE) && 2143dd19a799SPoul-Henning Kamp (bp->b_flags & B_ASYNC) && 2144dd19a799SPoul-Henning Kamp !vm_page_count_severe() && 2145dd19a799SPoul-Henning Kamp !buf_dirty_count_severe()) { 2146dd19a799SPoul-Henning Kamp KASSERT(bp->b_iodone == NULL, 2147dd19a799SPoul-Henning Kamp ("bufwrite: needs chained iodone (%p)", bp->b_iodone)); 2148dd19a799SPoul-Henning Kamp 2149dd19a799SPoul-Henning Kamp /* get a new block */ 2150c1d8b5e8SKonstantin Belousov newbp = geteblk(bp->b_bufsize, GB_NOWAIT_BD); 2151c1d8b5e8SKonstantin Belousov if (newbp == NULL) 2152c1d8b5e8SKonstantin Belousov goto normal_write; 2153dd19a799SPoul-Henning Kamp 2154fade8dd7SJeff Roberson KASSERT(buf_mapped(bp), ("Unmapped cg")); 2155dd19a799SPoul-Henning Kamp memcpy(newbp->b_data, bp->b_data, bp->b_bufsize); 2156dd19a799SPoul-Henning Kamp BO_LOCK(bp->b_bufobj); 2157dd19a799SPoul-Henning Kamp bp->b_vflags |= BV_BKGRDINPROG; 2158dd19a799SPoul-Henning Kamp BO_UNLOCK(bp->b_bufobj); 215975e3597aSKirk McKusick newbp->b_xflags |= 216075e3597aSKirk McKusick (bp->b_xflags & BX_FSPRIV) | BX_BKGRDMARKER; 216126089666SJeff Roberson newbp->b_lblkno = bp->b_lblkno; 2162dd19a799SPoul-Henning Kamp newbp->b_blkno = bp->b_blkno; 2163dd19a799SPoul-Henning Kamp newbp->b_offset = bp->b_offset; 2164dd19a799SPoul-Henning Kamp newbp->b_iodone = ffs_backgroundwritedone; 2165dd19a799SPoul-Henning Kamp newbp->b_flags |= B_ASYNC; 2166dd19a799SPoul-Henning Kamp newbp->b_flags &= ~B_INVAL; 216726089666SJeff Roberson pbgetvp(bp->b_vp, newbp); 2168dd19a799SPoul-Henning Kamp 2169dd19a799SPoul-Henning Kamp #ifdef SOFTUPDATES 2170113db2ddSJeff Roberson /* 2171113db2ddSJeff Roberson * Move over the dependencies. If there are rollbacks, 2172113db2ddSJeff Roberson * leave the parent buffer dirtied as it will need to 2173113db2ddSJeff Roberson * be written again. 2174113db2ddSJeff Roberson */ 2175113db2ddSJeff Roberson if (LIST_EMPTY(&bp->b_dep) || 2176113db2ddSJeff Roberson softdep_move_dependencies(bp, newbp) == 0) 2177113db2ddSJeff Roberson bundirty(bp); 2178113db2ddSJeff Roberson #else 2179113db2ddSJeff Roberson bundirty(bp); 2180dd19a799SPoul-Henning Kamp #endif 2181dd19a799SPoul-Henning Kamp 2182dd19a799SPoul-Henning Kamp /* 218326089666SJeff Roberson * Initiate write on the copy, release the original. The 218426089666SJeff Roberson * BKGRDINPROG flag prevents it from going away until 218526089666SJeff Roberson * the background write completes. 2186dd19a799SPoul-Henning Kamp */ 2187dd19a799SPoul-Henning Kamp bqrelse(bp); 2188dd19a799SPoul-Henning Kamp bp = newbp; 2189113db2ddSJeff Roberson } else 2190113db2ddSJeff Roberson /* Mark the buffer clean */ 2191113db2ddSJeff Roberson bundirty(bp); 2192113db2ddSJeff Roberson 2193dd19a799SPoul-Henning Kamp 2194dd19a799SPoul-Henning Kamp /* Let the normal bufwrite do the rest for us */ 2195c1d8b5e8SKonstantin Belousov normal_write: 21969248a827STor Egge return (bufwrite(bp)); 2197dd19a799SPoul-Henning Kamp } 2198dd19a799SPoul-Henning Kamp 2199dd19a799SPoul-Henning Kamp 22008dd56505SPoul-Henning Kamp static void 22016e77a041SPoul-Henning Kamp ffs_geom_strategy(struct bufobj *bo, struct buf *bp) 22026e77a041SPoul-Henning Kamp { 2203153910e0SJeff Roberson struct vnode *vp; 22047de3839dSTor Egge struct buf *tbp; 220575e3597aSKirk McKusick int error, nocopy; 22066e77a041SPoul-Henning Kamp 22078660b707SMateusz Guzik vp = bo2vnode(bo); 2208153910e0SJeff Roberson if (bp->b_iocmd == BIO_WRITE) { 2209153910e0SJeff Roberson if ((bp->b_flags & B_VALIDSUSPWRT) == 0 && 2210153910e0SJeff Roberson bp->b_vp != NULL && bp->b_vp->v_mount != NULL && 2211153910e0SJeff Roberson (bp->b_vp->v_mount->mnt_kern_flag & MNTK_SUSPENDED) != 0) 2212153910e0SJeff Roberson panic("ffs_geom_strategy: bad I/O"); 2213113db2ddSJeff Roberson nocopy = bp->b_flags & B_NOCOPY; 2214113db2ddSJeff Roberson bp->b_flags &= ~(B_VALIDSUSPWRT | B_NOCOPY); 2215113db2ddSJeff Roberson if ((vp->v_vflag & VV_COPYONWRITE) && nocopy == 0 && 22167de3839dSTor Egge vp->v_rdev->si_snapdata != NULL) { 22177de3839dSTor Egge if ((bp->b_flags & B_CLUSTER) != 0) { 2218868bb88fSTor Egge runningbufwakeup(bp); 22197de3839dSTor Egge TAILQ_FOREACH(tbp, &bp->b_cluster.cluster_head, 22207de3839dSTor Egge b_cluster.cluster_entry) { 22217de3839dSTor Egge error = ffs_copyonwrite(vp, tbp); 22227de3839dSTor Egge if (error != 0 && 2223153910e0SJeff Roberson error != EOPNOTSUPP) { 2224153910e0SJeff Roberson bp->b_error = error; 2225153910e0SJeff Roberson bp->b_ioflags |= BIO_ERROR; 2226153910e0SJeff Roberson bufdone(bp); 2227153910e0SJeff Roberson return; 2228153910e0SJeff Roberson } 2229153910e0SJeff Roberson } 2230868bb88fSTor Egge bp->b_runningbufspace = bp->b_bufsize; 22315bd65606SJohn Baldwin atomic_add_long(&runningbufspace, 2232868bb88fSTor Egge bp->b_runningbufspace); 22337de3839dSTor Egge } else { 22347de3839dSTor Egge error = ffs_copyonwrite(vp, bp); 22357de3839dSTor Egge if (error != 0 && error != EOPNOTSUPP) { 22367de3839dSTor Egge bp->b_error = error; 22377de3839dSTor Egge bp->b_ioflags |= BIO_ERROR; 22387de3839dSTor Egge bufdone(bp); 22397de3839dSTor Egge return; 22407de3839dSTor Egge } 22417de3839dSTor Egge } 22427de3839dSTor Egge } 22437de3839dSTor Egge #ifdef SOFTUPDATES 22447de3839dSTor Egge if ((bp->b_flags & B_CLUSTER) != 0) { 22457de3839dSTor Egge TAILQ_FOREACH(tbp, &bp->b_cluster.cluster_head, 22467de3839dSTor Egge b_cluster.cluster_entry) { 224704533fc6SXin LI if (!LIST_EMPTY(&tbp->b_dep)) 22487de3839dSTor Egge buf_start(tbp); 22497de3839dSTor Egge } 22507de3839dSTor Egge } else { 225104533fc6SXin LI if (!LIST_EMPTY(&bp->b_dep)) 22527de3839dSTor Egge buf_start(bp); 22537de3839dSTor Egge } 22547de3839dSTor Egge 22557de3839dSTor Egge #endif 225675e3597aSKirk McKusick /* 225775e3597aSKirk McKusick * Check for metadata that needs check-hashes and update them. 225875e3597aSKirk McKusick */ 225975e3597aSKirk McKusick switch (bp->b_xflags & BX_FSPRIV) { 226075e3597aSKirk McKusick case BX_CYLGRP: 226175e3597aSKirk McKusick ((struct cg *)bp->b_data)->cg_ckhash = 0; 226275e3597aSKirk McKusick ((struct cg *)bp->b_data)->cg_ckhash = 226375e3597aSKirk McKusick calculate_crc32c(~0L, bp->b_data, bp->b_bcount); 226475e3597aSKirk McKusick break; 226575e3597aSKirk McKusick 226675e3597aSKirk McKusick case BX_SUPERBLOCK: 226775e3597aSKirk McKusick case BX_INODE: 226875e3597aSKirk McKusick case BX_INDIR: 226975e3597aSKirk McKusick case BX_DIR: 227075e3597aSKirk McKusick printf("Check-hash write is unimplemented!!!\n"); 227175e3597aSKirk McKusick break; 227275e3597aSKirk McKusick 227375e3597aSKirk McKusick case 0: 227475e3597aSKirk McKusick break; 227575e3597aSKirk McKusick 227675e3597aSKirk McKusick default: 227775e3597aSKirk McKusick printf("multiple buffer types 0x%b\n", 227875e3597aSKirk McKusick (u_int)(bp->b_xflags & BX_FSPRIV), 227975e3597aSKirk McKusick PRINT_UFS_BUF_XFLAGS); 228075e3597aSKirk McKusick break; 228175e3597aSKirk McKusick } 22827de3839dSTor Egge } 228343920011SPoul-Henning Kamp g_vfs_strategy(bo, bp); 22846e77a041SPoul-Henning Kamp } 228552dfc8d7SKonstantin Belousov 22861848286aSEdward Tomasz Napierala int 22871848286aSEdward Tomasz Napierala ffs_own_mount(const struct mount *mp) 22881848286aSEdward Tomasz Napierala { 22891848286aSEdward Tomasz Napierala 22901848286aSEdward Tomasz Napierala if (mp->mnt_op == &ufs_vfsops) 22911848286aSEdward Tomasz Napierala return (1); 22921848286aSEdward Tomasz Napierala return (0); 22931848286aSEdward Tomasz Napierala } 22941848286aSEdward Tomasz Napierala 229552dfc8d7SKonstantin Belousov #ifdef DDB 2296cf058082SBrooks Davis #ifdef SOFTUPDATES 229752dfc8d7SKonstantin Belousov 2298519e3c3bSKirk McKusick /* defined in ffs_softdep.c */ 2299519e3c3bSKirk McKusick extern void db_print_ffs(struct ufsmount *ump); 230052dfc8d7SKonstantin Belousov 230152dfc8d7SKonstantin Belousov DB_SHOW_COMMAND(ffs, db_show_ffs) 230252dfc8d7SKonstantin Belousov { 230352dfc8d7SKonstantin Belousov struct mount *mp; 230452dfc8d7SKonstantin Belousov struct ufsmount *ump; 230552dfc8d7SKonstantin Belousov 230652dfc8d7SKonstantin Belousov if (have_addr) { 230752dfc8d7SKonstantin Belousov ump = VFSTOUFS((struct mount *)addr); 230852dfc8d7SKonstantin Belousov db_print_ffs(ump); 230952dfc8d7SKonstantin Belousov return; 231052dfc8d7SKonstantin Belousov } 231152dfc8d7SKonstantin Belousov 231252dfc8d7SKonstantin Belousov TAILQ_FOREACH(mp, &mountlist, mnt_list) { 231352dfc8d7SKonstantin Belousov if (!strcmp(mp->mnt_stat.f_fstypename, ufs_vfsconf.vfc_name)) 231452dfc8d7SKonstantin Belousov db_print_ffs(VFSTOUFS(mp)); 231552dfc8d7SKonstantin Belousov } 231652dfc8d7SKonstantin Belousov } 231752dfc8d7SKonstantin Belousov 2318cf058082SBrooks Davis #endif /* SOFTUPDATES */ 231952dfc8d7SKonstantin Belousov #endif /* DDB */ 2320