160727d8bSWarner Losh /*- 2df8bae1dSRodney W. Grimes * Copyright (c) 1989, 1991, 1993, 1994 3df8bae1dSRodney W. Grimes * The Regents of the University of California. All rights reserved. 4df8bae1dSRodney W. Grimes * 5df8bae1dSRodney W. Grimes * Redistribution and use in source and binary forms, with or without 6df8bae1dSRodney W. Grimes * modification, are permitted provided that the following conditions 7df8bae1dSRodney W. Grimes * are met: 8df8bae1dSRodney W. Grimes * 1. Redistributions of source code must retain the above copyright 9df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer. 10df8bae1dSRodney W. Grimes * 2. Redistributions in binary form must reproduce the above copyright 11df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer in the 12df8bae1dSRodney W. Grimes * documentation and/or other materials provided with the distribution. 13df8bae1dSRodney W. Grimes * 4. Neither the name of the University nor the names of its contributors 14df8bae1dSRodney W. Grimes * may be used to endorse or promote products derived from this software 15df8bae1dSRodney W. Grimes * without specific prior written permission. 16df8bae1dSRodney W. Grimes * 17df8bae1dSRodney W. Grimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 18df8bae1dSRodney W. Grimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 19df8bae1dSRodney W. Grimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 20df8bae1dSRodney W. Grimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 21df8bae1dSRodney W. Grimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 22df8bae1dSRodney W. Grimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 23df8bae1dSRodney W. Grimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 24df8bae1dSRodney W. Grimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 25df8bae1dSRodney W. Grimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 26df8bae1dSRodney W. Grimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 27df8bae1dSRodney W. Grimes * SUCH DAMAGE. 28df8bae1dSRodney W. Grimes * 29996c772fSJohn Dyson * @(#)ffs_vfsops.c 8.31 (Berkeley) 5/20/95 30df8bae1dSRodney W. Grimes */ 31df8bae1dSRodney W. Grimes 32f4636c59SDavid E. O'Brien #include <sys/cdefs.h> 33f4636c59SDavid E. O'Brien __FBSDID("$FreeBSD$"); 34f4636c59SDavid E. O'Brien 3580830407SRobert Watson #include "opt_mac.h" 3601733a9bSGarrett Wollman #include "opt_quota.h" 37516081f2SRobert Watson #include "opt_ufs.h" 386e77a041SPoul-Henning Kamp #include "opt_ffs.h" 3901733a9bSGarrett Wollman 40df8bae1dSRodney W. Grimes #include <sys/param.h> 41df8bae1dSRodney W. Grimes #include <sys/systm.h> 42df8bae1dSRodney W. Grimes #include <sys/namei.h> 43acd3428bSRobert Watson #include <sys/priv.h> 44df8bae1dSRodney W. Grimes #include <sys/proc.h> 45df8bae1dSRodney W. Grimes #include <sys/kernel.h> 46df8bae1dSRodney W. Grimes #include <sys/vnode.h> 47df8bae1dSRodney W. Grimes #include <sys/mount.h> 489626b608SPoul-Henning Kamp #include <sys/bio.h> 49df8bae1dSRodney W. Grimes #include <sys/buf.h> 5081bca6ddSKATO Takenori #include <sys/conf.h> 513ac4d1efSBruce Evans #include <sys/fcntl.h> 52df8bae1dSRodney W. Grimes #include <sys/malloc.h> 531b367556SJason Evans #include <sys/mutex.h> 54a18b1f1dSJason Evans 55aed55708SRobert Watson #include <security/mac/mac_framework.h> 56aed55708SRobert Watson 57a64ed089SRobert Watson #include <ufs/ufs/extattr.h> 581a60c7fcSPawel Jakub Dawidek #include <ufs/ufs/gjournal.h> 59df8bae1dSRodney W. Grimes #include <ufs/ufs/quota.h> 60df8bae1dSRodney W. Grimes #include <ufs/ufs/ufsmount.h> 61df8bae1dSRodney W. Grimes #include <ufs/ufs/inode.h> 62df8bae1dSRodney W. Grimes #include <ufs/ufs/ufs_extern.h> 63df8bae1dSRodney W. Grimes 64df8bae1dSRodney W. Grimes #include <ufs/ffs/fs.h> 65df8bae1dSRodney W. Grimes #include <ufs/ffs/ffs_extern.h> 66df8bae1dSRodney W. Grimes 67f6b04d2bSDavid Greenman #include <vm/vm.h> 68aa4d7a8aSPoul-Henning Kamp #include <vm/uma.h> 69f6b04d2bSDavid Greenman #include <vm/vm_page.h> 70f6b04d2bSDavid Greenman 7143920011SPoul-Henning Kamp #include <geom/geom.h> 7243920011SPoul-Henning Kamp #include <geom/geom_vfs.h> 7343920011SPoul-Henning Kamp 74adf41577SPoul-Henning Kamp static uma_zone_t uma_inode, uma_ufs1, uma_ufs2; 7555166637SPoul-Henning Kamp 765e8c582aSPoul-Henning Kamp static int ffs_reload(struct mount *, struct thread *); 77975512a9SPoul-Henning Kamp static int ffs_mountfs(struct vnode *, struct mount *, struct thread *); 781c85e6a3SKirk McKusick static void ffs_oldfscompat_read(struct fs *, struct ufsmount *, 791c85e6a3SKirk McKusick ufs2_daddr_t); 801c85e6a3SKirk McKusick static void ffs_oldfscompat_write(struct fs *, struct ufsmount *); 81975512a9SPoul-Henning Kamp static void ffs_ifree(struct ufsmount *ump, struct inode *ip); 829bf1a756SPoul-Henning Kamp static vfs_init_t ffs_init; 839bf1a756SPoul-Henning Kamp static vfs_uninit_t ffs_uninit; 84d6fe88e4SPoul-Henning Kamp static vfs_extattrctl_t ffs_extattrctl; 8520a92a18SPoul-Henning Kamp static vfs_cmount_t ffs_cmount; 86adf41577SPoul-Henning Kamp static vfs_unmount_t ffs_unmount; 8720a92a18SPoul-Henning Kamp static vfs_mount_t ffs_mount; 88adf41577SPoul-Henning Kamp static vfs_statfs_t ffs_statfs; 89adf41577SPoul-Henning Kamp static vfs_fhtovp_t ffs_fhtovp; 90adf41577SPoul-Henning Kamp static vfs_sync_t ffs_sync; 91df8bae1dSRodney W. Grimes 92303b270bSEivind Eklund static struct vfsops ufs_vfsops = { 937652131bSPoul-Henning Kamp .vfs_extattrctl = ffs_extattrctl, 947652131bSPoul-Henning Kamp .vfs_fhtovp = ffs_fhtovp, 957652131bSPoul-Henning Kamp .vfs_init = ffs_init, 9620a92a18SPoul-Henning Kamp .vfs_mount = ffs_mount, 9720a92a18SPoul-Henning Kamp .vfs_cmount = ffs_cmount, 987652131bSPoul-Henning Kamp .vfs_quotactl = ufs_quotactl, 997652131bSPoul-Henning Kamp .vfs_root = ufs_root, 1007652131bSPoul-Henning Kamp .vfs_statfs = ffs_statfs, 1017652131bSPoul-Henning Kamp .vfs_sync = ffs_sync, 1027652131bSPoul-Henning Kamp .vfs_uninit = ffs_uninit, 1037652131bSPoul-Henning Kamp .vfs_unmount = ffs_unmount, 1047652131bSPoul-Henning Kamp .vfs_vget = ffs_vget, 105df8bae1dSRodney W. Grimes }; 106df8bae1dSRodney W. Grimes 1078994ca3cSBruce Evans VFS_SET(ufs_vfsops, ufs, 0); 1085fe6d2beSPawel Jakub Dawidek MODULE_VERSION(ufs, 1); 109c901836cSGarrett Wollman 1106e77a041SPoul-Henning Kamp static b_strategy_t ffs_geom_strategy; 111dd19a799SPoul-Henning Kamp static b_write_t ffs_bufwrite; 1126e77a041SPoul-Henning Kamp 1136e77a041SPoul-Henning Kamp static struct buf_ops ffs_ops = { 1146e77a041SPoul-Henning Kamp .bop_name = "FFS", 115dd19a799SPoul-Henning Kamp .bop_write = ffs_bufwrite, 1166e77a041SPoul-Henning Kamp .bop_strategy = ffs_geom_strategy, 1176ef8480aSPoul-Henning Kamp .bop_sync = bufsync, 1182cc7d26fSKonstantin Belousov #ifdef NO_FFS_SNAPSHOT 1192cc7d26fSKonstantin Belousov .bop_bdflush = bufbdflush, 1202cc7d26fSKonstantin Belousov #else 1212cc7d26fSKonstantin Belousov .bop_bdflush = ffs_bdflush, 1222cc7d26fSKonstantin Belousov #endif 1236e77a041SPoul-Henning Kamp }; 1246e77a041SPoul-Henning Kamp 125d952ba1bSJohn Baldwin static const char *ffs_opts[] = { "acls", "async", "noatime", "noclusterr", 126d952ba1bSJohn Baldwin "noclusterw", "noexec", "export", "force", "from", "multilabel", 127d952ba1bSJohn Baldwin "snapshot", "nosuid", "suiddir", "nosymfollow", "sync", 128ee98eb82SCraig Rodrigues "union", NULL }; 12920a92a18SPoul-Henning Kamp 1305e8c582aSPoul-Henning Kamp static int 13120a92a18SPoul-Henning Kamp ffs_mount(struct mount *mp, struct thread *td) 132df8bae1dSRodney W. Grimes { 13320a92a18SPoul-Henning Kamp struct vnode *devvp; 13426f9a767SRodney W. Grimes struct ufsmount *ump = 0; 13505f4ff5dSPoul-Henning Kamp struct fs *fs; 136f2a2857bSKirk McKusick int error, flags; 1375da56ddbSTor Egge u_int mntorflags, mntandnotflags; 138c9b99213SBruce Evans mode_t accessmode; 1395e8c582aSPoul-Henning Kamp struct nameidata ndp; 14020a92a18SPoul-Henning Kamp char *fspec; 141df8bae1dSRodney W. Grimes 14220a92a18SPoul-Henning Kamp if (vfs_filteropt(mp->mnt_optnew, ffs_opts)) 14320a92a18SPoul-Henning Kamp return (EINVAL); 144aa4d7a8aSPoul-Henning Kamp if (uma_inode == NULL) { 145aa4d7a8aSPoul-Henning Kamp uma_inode = uma_zcreate("FFS inode", 146aa4d7a8aSPoul-Henning Kamp sizeof(struct inode), NULL, NULL, NULL, NULL, 147aa4d7a8aSPoul-Henning Kamp UMA_ALIGN_PTR, 0); 148aa4d7a8aSPoul-Henning Kamp uma_ufs1 = uma_zcreate("FFS1 dinode", 149aa4d7a8aSPoul-Henning Kamp sizeof(struct ufs1_dinode), NULL, NULL, NULL, NULL, 150aa4d7a8aSPoul-Henning Kamp UMA_ALIGN_PTR, 0); 151aa4d7a8aSPoul-Henning Kamp uma_ufs2 = uma_zcreate("FFS2 dinode", 152aa4d7a8aSPoul-Henning Kamp sizeof(struct ufs2_dinode), NULL, NULL, NULL, NULL, 153aa4d7a8aSPoul-Henning Kamp UMA_ALIGN_PTR, 0); 154aa4d7a8aSPoul-Henning Kamp } 1558d02a378SPawel Jakub Dawidek 15620a92a18SPoul-Henning Kamp fspec = vfs_getopts(mp->mnt_optnew, "from", &error); 15751ac12abSPoul-Henning Kamp if (error) 158f2a2857bSKirk McKusick return (error); 1592b14f991SJulian Elischer 1605da56ddbSTor Egge mntorflags = 0; 1615da56ddbSTor Egge mntandnotflags = 0; 16226f59b64SCraig Rodrigues if (vfs_getopt(mp->mnt_optnew, "acls", NULL, NULL) == 0) 1635da56ddbSTor Egge mntorflags |= MNT_ACLS; 16426f59b64SCraig Rodrigues 165fb77e0afSCraig Rodrigues if (vfs_getopt(mp->mnt_optnew, "snapshot", NULL, NULL) == 0) { 1665da56ddbSTor Egge mntorflags |= MNT_SNAPSHOT; 167fb77e0afSCraig Rodrigues /* 168fb77e0afSCraig Rodrigues * Once we have set the MNT_SNAPSHOT flag, do not 169fb77e0afSCraig Rodrigues * persist "snapshot" in the options list. 170fb77e0afSCraig Rodrigues */ 171fb77e0afSCraig Rodrigues vfs_deleteopt(mp->mnt_optnew, "snapshot"); 172fb77e0afSCraig Rodrigues vfs_deleteopt(mp->mnt_opt, "snapshot"); 173fb77e0afSCraig Rodrigues } 17426f59b64SCraig Rodrigues 1755da56ddbSTor Egge MNT_ILOCK(mp); 1765da56ddbSTor Egge mp->mnt_flag = (mp->mnt_flag | mntorflags) & ~mntandnotflags; 1775da56ddbSTor Egge MNT_IUNLOCK(mp); 178df8bae1dSRodney W. Grimes /* 179df8bae1dSRodney W. Grimes * If updating, check whether changing from read-only to 180df8bae1dSRodney W. Grimes * read/write; if there is no device name, that's all we do. 181df8bae1dSRodney W. Grimes */ 182df8bae1dSRodney W. Grimes if (mp->mnt_flag & MNT_UPDATE) { 183df8bae1dSRodney W. Grimes ump = VFSTOUFS(mp); 184df8bae1dSRodney W. Grimes fs = ump->um_fs; 18526cf9c3bSPeter Wemm devvp = ump->um_devvp; 18620a92a18SPoul-Henning Kamp if (fs->fs_ronly == 0 && 18720a92a18SPoul-Henning Kamp vfs_flagopt(mp->mnt_optnew, "ro", NULL, 0)) { 188f2a2857bSKirk McKusick if ((error = vn_start_write(NULL, &mp, V_WAIT)) != 0) 189f2a2857bSKirk McKusick return (error); 190cd600596SKirk McKusick /* 191cd600596SKirk McKusick * Flush any dirty data. 192cd600596SKirk McKusick */ 193efd6d980SPoul-Henning Kamp if ((error = ffs_sync(mp, MNT_WAIT, td)) != 0) { 1949ab73fd1SKirk McKusick vn_finished_write(mp); 1959ab73fd1SKirk McKusick return (error); 1969ab73fd1SKirk McKusick } 197cd600596SKirk McKusick /* 198cd600596SKirk McKusick * Check for and optionally get rid of files open 199cd600596SKirk McKusick * for writing. 200cd600596SKirk McKusick */ 201df8bae1dSRodney W. Grimes flags = WRITECLOSE; 202df8bae1dSRodney W. Grimes if (mp->mnt_flag & MNT_FORCE) 203df8bae1dSRodney W. Grimes flags |= FORCECLOSE; 204b1897c19SJulian Elischer if (mp->mnt_flag & MNT_SOFTDEP) { 205b40ce416SJulian Elischer error = softdep_flushfiles(mp, flags, td); 206b1897c19SJulian Elischer } else { 207b40ce416SJulian Elischer error = ffs_flushfiles(mp, flags, td); 208df8bae1dSRodney W. Grimes } 209f2a2857bSKirk McKusick if (error) { 210f2a2857bSKirk McKusick vn_finished_write(mp); 211f2a2857bSKirk McKusick return (error); 212b1897c19SJulian Elischer } 2139ccb939eSKirk McKusick if (fs->fs_pendingblocks != 0 || 2149ccb939eSKirk McKusick fs->fs_pendinginodes != 0) { 215cfbf0a46SMaxime Henrion printf("%s: %s: blocks %jd files %d\n", 2161c85e6a3SKirk McKusick fs->fs_fsmnt, "update error", 2171c85e6a3SKirk McKusick (intmax_t)fs->fs_pendingblocks, 2189ccb939eSKirk McKusick fs->fs_pendinginodes); 2199ccb939eSKirk McKusick fs->fs_pendingblocks = 0; 2209ccb939eSKirk McKusick fs->fs_pendinginodes = 0; 2219ccb939eSKirk McKusick } 2221a6a6610SKirk McKusick if ((fs->fs_flags & (FS_UNCLEAN | FS_NEEDSFSCK)) == 0) 223f2a2857bSKirk McKusick fs->fs_clean = 1; 224791dd2faSTor Egge if ((error = ffs_sbupdate(ump, MNT_WAIT, 0)) != 0) { 225f2a2857bSKirk McKusick fs->fs_ronly = 0; 226f2a2857bSKirk McKusick fs->fs_clean = 0; 227f2a2857bSKirk McKusick vn_finished_write(mp); 228f2a2857bSKirk McKusick return (error); 2292b14f991SJulian Elischer } 230f2a2857bSKirk McKusick vn_finished_write(mp); 23143920011SPoul-Henning Kamp DROP_GIANT(); 23243920011SPoul-Henning Kamp g_topology_lock(); 23343920011SPoul-Henning Kamp g_access(ump->um_cp, 0, -1, 0); 23443920011SPoul-Henning Kamp g_topology_unlock(); 23543920011SPoul-Henning Kamp PICKUP_GIANT(); 23620a92a18SPoul-Henning Kamp fs->fs_ronly = 1; 2375da56ddbSTor Egge MNT_ILOCK(mp); 23820a92a18SPoul-Henning Kamp mp->mnt_flag |= MNT_RDONLY; 2395da56ddbSTor Egge MNT_IUNLOCK(mp); 240f2a2857bSKirk McKusick } 241f2a2857bSKirk McKusick if ((mp->mnt_flag & MNT_RELOAD) && 2425e8c582aSPoul-Henning Kamp (error = ffs_reload(mp, td)) != 0) 243f2a2857bSKirk McKusick return (error); 24420a92a18SPoul-Henning Kamp if (fs->fs_ronly && 24520a92a18SPoul-Henning Kamp !vfs_flagopt(mp->mnt_optnew, "ro", NULL, 0)) { 246c9b99213SBruce Evans /* 247c9b99213SBruce Evans * If upgrade to read-write by non-root, then verify 248c9b99213SBruce Evans * that user has necessary permissions on the device. 249c9b99213SBruce Evans */ 250cb05b60aSAttilio Rao vn_lock(devvp, LK_EXCLUSIVE | LK_RETRY); 251acd3428bSRobert Watson error = VOP_ACCESS(devvp, VREAD | VWRITE, 252acd3428bSRobert Watson td->td_ucred, td); 253acd3428bSRobert Watson if (error) 254acd3428bSRobert Watson error = priv_check(td, PRIV_VFS_MOUNT_PERM); 255acd3428bSRobert Watson if (error) { 25622db15c0SAttilio Rao VOP_UNLOCK(devvp, 0); 257c9b99213SBruce Evans return (error); 258c9b99213SBruce Evans } 25922db15c0SAttilio Rao VOP_UNLOCK(devvp, 0); 2607e58bfacSBruce Evans fs->fs_flags &= ~FS_UNCLEAN; 2610922cce6SBruce Evans if (fs->fs_clean == 0) { 2627e58bfacSBruce Evans fs->fs_flags |= FS_UNCLEAN; 263812b1d41SKirk McKusick if ((mp->mnt_flag & MNT_FORCE) || 2641a6a6610SKirk McKusick ((fs->fs_flags & FS_NEEDSFSCK) == 0 && 2651a6a6610SKirk McKusick (fs->fs_flags & FS_DOSOFTDEP))) { 266f2a2857bSKirk McKusick printf("WARNING: %s was not %s\n", 267f2a2857bSKirk McKusick fs->fs_fsmnt, "properly dismounted"); 2680922cce6SBruce Evans } else { 2690922cce6SBruce Evans printf( 2700922cce6SBruce Evans "WARNING: R/W mount of %s denied. Filesystem is not clean - run fsck\n", 2710922cce6SBruce Evans fs->fs_fsmnt); 272f2a2857bSKirk McKusick return (EPERM); 2730922cce6SBruce Evans } 2740922cce6SBruce Evans } 27540c340aaSPoul-Henning Kamp DROP_GIANT(); 27640c340aaSPoul-Henning Kamp g_topology_lock(); 27740c340aaSPoul-Henning Kamp /* 27840c340aaSPoul-Henning Kamp * If we're the root device, we may not have an E count 27940c340aaSPoul-Henning Kamp * yet, get it now. 28040c340aaSPoul-Henning Kamp */ 28140c340aaSPoul-Henning Kamp if (ump->um_cp->ace == 0) 28240c340aaSPoul-Henning Kamp error = g_access(ump->um_cp, 0, 1, 1); 28340c340aaSPoul-Henning Kamp else 28440c340aaSPoul-Henning Kamp error = g_access(ump->um_cp, 0, 1, 0); 28540c340aaSPoul-Henning Kamp g_topology_unlock(); 28640c340aaSPoul-Henning Kamp PICKUP_GIANT(); 28740c340aaSPoul-Henning Kamp if (error) 28840c340aaSPoul-Henning Kamp return (error); 289f2a2857bSKirk McKusick if ((error = vn_start_write(NULL, &mp, V_WAIT)) != 0) 290f2a2857bSKirk McKusick return (error); 291f2a2857bSKirk McKusick fs->fs_ronly = 0; 2925da56ddbSTor Egge MNT_ILOCK(mp); 29320a92a18SPoul-Henning Kamp mp->mnt_flag &= ~MNT_RDONLY; 2945da56ddbSTor Egge MNT_IUNLOCK(mp); 295f2a2857bSKirk McKusick fs->fs_clean = 0; 296791dd2faSTor Egge if ((error = ffs_sbupdate(ump, MNT_WAIT, 0)) != 0) { 297f2a2857bSKirk McKusick vn_finished_write(mp); 298f2a2857bSKirk McKusick return (error); 299f2a2857bSKirk McKusick } 30026cf9c3bSPeter Wemm /* check to see if we need to start softdep */ 301f2a2857bSKirk McKusick if ((fs->fs_flags & FS_DOSOFTDEP) && 302a854ed98SJohn Baldwin (error = softdep_mount(devvp, mp, fs, td->td_ucred))){ 303f2a2857bSKirk McKusick vn_finished_write(mp); 304f2a2857bSKirk McKusick return (error); 30526cf9c3bSPeter Wemm } 306f2a2857bSKirk McKusick if (fs->fs_snapinum[0] != 0) 307f2a2857bSKirk McKusick ffs_snapshot_mount(mp); 308f2a2857bSKirk McKusick vn_finished_write(mp); 3091469eec8SDavid Greenman } 310c11d2981SJulian Elischer /* 311c11d2981SJulian Elischer * Soft updates is incompatible with "async", 312c11d2981SJulian Elischer * so if we are doing softupdates stop the user 313c11d2981SJulian Elischer * from setting the async flag in an update. 314c11d2981SJulian Elischer * Softdep_mount() clears it in an initial mount 315c11d2981SJulian Elischer * or ro->rw remount. 316c11d2981SJulian Elischer */ 3175da56ddbSTor Egge if (mp->mnt_flag & MNT_SOFTDEP) { 3185da56ddbSTor Egge /* XXX: Reset too late ? */ 3195da56ddbSTor Egge MNT_ILOCK(mp); 320c11d2981SJulian Elischer mp->mnt_flag &= ~MNT_ASYNC; 3215da56ddbSTor Egge MNT_IUNLOCK(mp); 3225da56ddbSTor Egge } 323df8bae1dSRodney W. Grimes /* 32439cfb239SPawel Jakub Dawidek * Keep MNT_ACLS flag if it is stored in superblock. 32539cfb239SPawel Jakub Dawidek */ 3265da56ddbSTor Egge if ((fs->fs_flags & FS_ACLS) != 0) { 3275da56ddbSTor Egge /* XXX: Set too late ? */ 3285da56ddbSTor Egge MNT_ILOCK(mp); 32939cfb239SPawel Jakub Dawidek mp->mnt_flag |= MNT_ACLS; 3305da56ddbSTor Egge MNT_IUNLOCK(mp); 3315da56ddbSTor Egge } 332cea90362SCraig Rodrigues 333f2a2857bSKirk McKusick /* 334f2a2857bSKirk McKusick * If this is a snapshot request, take the snapshot. 335f2a2857bSKirk McKusick */ 336f2a2857bSKirk McKusick if (mp->mnt_flag & MNT_SNAPSHOT) 33720a92a18SPoul-Henning Kamp return (ffs_snapshot(mp, fspec)); 338df8bae1dSRodney W. Grimes } 3392b14f991SJulian Elischer 340df8bae1dSRodney W. Grimes /* 341df8bae1dSRodney W. Grimes * Not an update, or updating the name: look up the name 342e9827c6dSBruce Evans * and verify that it refers to a sensible disk device. 343df8bae1dSRodney W. Grimes */ 344fdedad76SSuleiman Souhlal NDINIT(&ndp, LOOKUP, FOLLOW | LOCKLEAF, UIO_SYSSPACE, fspec, td); 3455e8c582aSPoul-Henning Kamp if ((error = namei(&ndp)) != 0) 346f2a2857bSKirk McKusick return (error); 3475e8c582aSPoul-Henning Kamp NDFREE(&ndp, NDF_ONLY_PNBUF); 3485e8c582aSPoul-Henning Kamp devvp = ndp.ni_vp; 349f2a2857bSKirk McKusick if (!vn_isdisk(devvp, &error)) { 350fdedad76SSuleiman Souhlal vput(devvp); 351f2a2857bSKirk McKusick return (error); 352f2a2857bSKirk McKusick } 353c9b99213SBruce Evans 354c9b99213SBruce Evans /* 355c9b99213SBruce Evans * If mount by non-root, then verify that user has necessary 356c9b99213SBruce Evans * permissions on the device. 357c9b99213SBruce Evans */ 358c9b99213SBruce Evans accessmode = VREAD; 359c9b99213SBruce Evans if ((mp->mnt_flag & MNT_RDONLY) == 0) 360c9b99213SBruce Evans accessmode |= VWRITE; 361acd3428bSRobert Watson error = VOP_ACCESS(devvp, accessmode, td->td_ucred, td); 362acd3428bSRobert Watson if (error) 363acd3428bSRobert Watson error = priv_check(td, PRIV_VFS_MOUNT_PERM); 364acd3428bSRobert Watson if (error) { 365c9b99213SBruce Evans vput(devvp); 366c9b99213SBruce Evans return (error); 367c9b99213SBruce Evans } 368c9b99213SBruce Evans 3692b14f991SJulian Elischer if (mp->mnt_flag & MNT_UPDATE) { 3702b14f991SJulian Elischer /* 371f2a2857bSKirk McKusick * Update only 372f2a2857bSKirk McKusick * 3733e425b96SJulian Elischer * If it's not the same vnode, or at least the same device 3743e425b96SJulian Elischer * then it's not correct. 3752b14f991SJulian Elischer */ 3762b14f991SJulian Elischer 37743920011SPoul-Henning Kamp if (devvp->v_rdev != ump->um_devvp->v_rdev) 378f2a2857bSKirk McKusick error = EINVAL; /* needs translation */ 379fdedad76SSuleiman Souhlal vput(devvp); 380f2a2857bSKirk McKusick if (error) 381f2a2857bSKirk McKusick return (error); 3822b14f991SJulian Elischer } else { 3832b14f991SJulian Elischer /* 384f2a2857bSKirk McKusick * New mount 3852b14f991SJulian Elischer * 386f2a2857bSKirk McKusick * We need the name for the mount point (also used for 387f2a2857bSKirk McKusick * "last mounted on") copied in. If an error occurs, 388f2a2857bSKirk McKusick * the mount point is discarded by the upper level code. 389f3a90da9SAdrian Chadd * Note that vfs_mount() populates f_mntonname for us. 390f2a2857bSKirk McKusick */ 391975512a9SPoul-Henning Kamp if ((error = ffs_mountfs(devvp, mp, td)) != 0) { 392f2a2857bSKirk McKusick vrele(devvp); 393f2a2857bSKirk McKusick return (error); 394f2a2857bSKirk McKusick } 395f2a2857bSKirk McKusick } 39620a92a18SPoul-Henning Kamp vfs_mountedfrom(mp, fspec); 397f2a2857bSKirk McKusick return (0); 3982b14f991SJulian Elischer } 3992b14f991SJulian Elischer 400df8bae1dSRodney W. Grimes /* 40120a92a18SPoul-Henning Kamp * Compatibility with old mount system call. 40220a92a18SPoul-Henning Kamp */ 40320a92a18SPoul-Henning Kamp 40420a92a18SPoul-Henning Kamp static int 40520a92a18SPoul-Henning Kamp ffs_cmount(struct mntarg *ma, void *data, int flags, struct thread *td) 40620a92a18SPoul-Henning Kamp { 40720a92a18SPoul-Henning Kamp struct ufs_args args; 40820a92a18SPoul-Henning Kamp int error; 40920a92a18SPoul-Henning Kamp 41020a92a18SPoul-Henning Kamp if (data == NULL) 41120a92a18SPoul-Henning Kamp return (EINVAL); 41220a92a18SPoul-Henning Kamp error = copyin(data, &args, sizeof args); 41320a92a18SPoul-Henning Kamp if (error) 41420a92a18SPoul-Henning Kamp return (error); 41520a92a18SPoul-Henning Kamp 41620a92a18SPoul-Henning Kamp ma = mount_argsu(ma, "from", args.fspec, MAXPATHLEN); 41720a92a18SPoul-Henning Kamp ma = mount_arg(ma, "export", &args.export, sizeof args.export); 41820a92a18SPoul-Henning Kamp error = kernel_mount(ma, flags); 41920a92a18SPoul-Henning Kamp 42020a92a18SPoul-Henning Kamp return (error); 42120a92a18SPoul-Henning Kamp } 42220a92a18SPoul-Henning Kamp 42320a92a18SPoul-Henning Kamp /* 424df8bae1dSRodney W. Grimes * Reload all incore data for a filesystem (used after running fsck on 425df8bae1dSRodney W. Grimes * the root filesystem and finding things to fix). The filesystem must 426df8bae1dSRodney W. Grimes * be mounted read-only. 427df8bae1dSRodney W. Grimes * 428df8bae1dSRodney W. Grimes * Things to do to update the mount: 429df8bae1dSRodney W. Grimes * 1) invalidate all cached meta-data. 430df8bae1dSRodney W. Grimes * 2) re-read superblock from disk. 431df8bae1dSRodney W. Grimes * 3) re-read summary information from disk. 432df8bae1dSRodney W. Grimes * 4) invalidate all inactive vnodes. 433df8bae1dSRodney W. Grimes * 5) invalidate all cached file data. 434df8bae1dSRodney W. Grimes * 6) re-read inode data for all active vnodes. 435df8bae1dSRodney W. Grimes */ 4365e8c582aSPoul-Henning Kamp static int 4375e8c582aSPoul-Henning Kamp ffs_reload(struct mount *mp, struct thread *td) 438df8bae1dSRodney W. Grimes { 43982be0a5aSTor Egge struct vnode *vp, *mvp, *devvp; 440df8bae1dSRodney W. Grimes struct inode *ip; 441f55ff3f3SIan Dowse void *space; 442df8bae1dSRodney W. Grimes struct buf *bp; 443996c772fSJohn Dyson struct fs *fs, *newfs; 4443ba649d7SJeff Roberson struct ufsmount *ump; 4451c85e6a3SKirk McKusick ufs2_daddr_t sblockloc; 446df8bae1dSRodney W. Grimes int i, blks, size, error; 447996c772fSJohn Dyson int32_t *lp; 448df8bae1dSRodney W. Grimes 4492b14f991SJulian Elischer if ((mp->mnt_flag & MNT_RDONLY) == 0) 450df8bae1dSRodney W. Grimes return (EINVAL); 4513ba649d7SJeff Roberson ump = VFSTOUFS(mp); 452df8bae1dSRodney W. Grimes /* 453df8bae1dSRodney W. Grimes * Step 1: invalidate all cached meta-data. 454df8bae1dSRodney W. Grimes */ 4552b14f991SJulian Elischer devvp = VFSTOUFS(mp)->um_devvp; 456cb05b60aSAttilio Rao vn_lock(devvp, LK_EXCLUSIVE | LK_RETRY); 4577c0745eeSPoul-Henning Kamp if (vinvalbuf(devvp, 0, td, 0, 0) != 0) 458df8bae1dSRodney W. Grimes panic("ffs_reload: dirty1"); 45922db15c0SAttilio Rao VOP_UNLOCK(devvp, 0); 46095e5e988SJohn Dyson 461df8bae1dSRodney W. Grimes /* 462df8bae1dSRodney W. Grimes * Step 2: re-read superblock from disk. 463df8bae1dSRodney W. Grimes */ 4641c85e6a3SKirk McKusick fs = VFSTOUFS(mp)->um_fs; 465ada981b2SKirk McKusick if ((error = bread(devvp, btodb(fs->fs_sblockloc), fs->fs_sbsize, 4661c85e6a3SKirk McKusick NOCRED, &bp)) != 0) 467df8bae1dSRodney W. Grimes return (error); 468996c772fSJohn Dyson newfs = (struct fs *)bp->b_data; 4691c85e6a3SKirk McKusick if ((newfs->fs_magic != FS_UFS1_MAGIC && 4701c85e6a3SKirk McKusick newfs->fs_magic != FS_UFS2_MAGIC) || 4711c85e6a3SKirk McKusick newfs->fs_bsize > MAXBSIZE || 472996c772fSJohn Dyson newfs->fs_bsize < sizeof(struct fs)) { 473df8bae1dSRodney W. Grimes brelse(bp); 474df8bae1dSRodney W. Grimes return (EIO); /* XXX needs translation */ 475df8bae1dSRodney W. Grimes } 476996c772fSJohn Dyson /* 477996c772fSJohn Dyson * Copy pointer fields back into superblock before copying in XXX 478996c772fSJohn Dyson * new superblock. These should really be in the ufsmount. XXX 479996c772fSJohn Dyson * Note that important parameters (eg fs_ncg) are unchanged. 480996c772fSJohn Dyson */ 481f55ff3f3SIan Dowse newfs->fs_csp = fs->fs_csp; 482996c772fSJohn Dyson newfs->fs_maxcluster = fs->fs_maxcluster; 4835d69bac4SIan Dowse newfs->fs_contigdirs = fs->fs_contigdirs; 484143a5346SIan Dowse newfs->fs_active = fs->fs_active; 48531c81e4bSDon Lewis /* The file system is still read-only. */ 48631c81e4bSDon Lewis newfs->fs_ronly = 1; 4871c85e6a3SKirk McKusick sblockloc = fs->fs_sblockloc; 488996c772fSJohn Dyson bcopy(newfs, fs, (u_int)fs->fs_sbsize); 489df8bae1dSRodney W. Grimes brelse(bp); 490996c772fSJohn Dyson mp->mnt_maxsymlinklen = fs->fs_maxsymlinklen; 4911c85e6a3SKirk McKusick ffs_oldfscompat_read(fs, VFSTOUFS(mp), sblockloc); 4923ba649d7SJeff Roberson UFS_LOCK(ump); 4939ccb939eSKirk McKusick if (fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) { 494cfbf0a46SMaxime Henrion printf("%s: reload pending error: blocks %jd files %d\n", 4951c85e6a3SKirk McKusick fs->fs_fsmnt, (intmax_t)fs->fs_pendingblocks, 4961c85e6a3SKirk McKusick fs->fs_pendinginodes); 4979ccb939eSKirk McKusick fs->fs_pendingblocks = 0; 4989ccb939eSKirk McKusick fs->fs_pendinginodes = 0; 4999ccb939eSKirk McKusick } 5003ba649d7SJeff Roberson UFS_UNLOCK(ump); 501996c772fSJohn Dyson 502df8bae1dSRodney W. Grimes /* 503df8bae1dSRodney W. Grimes * Step 3: re-read summary information from disk. 504df8bae1dSRodney W. Grimes */ 505df8bae1dSRodney W. Grimes blks = howmany(fs->fs_cssize, fs->fs_fsize); 506f55ff3f3SIan Dowse space = fs->fs_csp; 507df8bae1dSRodney W. Grimes for (i = 0; i < blks; i += fs->fs_frag) { 508df8bae1dSRodney W. Grimes size = fs->fs_bsize; 509df8bae1dSRodney W. Grimes if (i + fs->fs_frag > blks) 510df8bae1dSRodney W. Grimes size = (blks - i) * fs->fs_fsize; 511c9671602SPoul-Henning Kamp error = bread(devvp, fsbtodb(fs, fs->fs_csaddr + i), size, 512c9671602SPoul-Henning Kamp NOCRED, &bp); 513c9671602SPoul-Henning Kamp if (error) 514df8bae1dSRodney W. Grimes return (error); 515f55ff3f3SIan Dowse bcopy(bp->b_data, space, (u_int)size); 516f55ff3f3SIan Dowse space = (char *)space + size; 517df8bae1dSRodney W. Grimes brelse(bp); 518df8bae1dSRodney W. Grimes } 519996c772fSJohn Dyson /* 520996c772fSJohn Dyson * We no longer know anything about clusters per cylinder group. 521996c772fSJohn Dyson */ 522996c772fSJohn Dyson if (fs->fs_contigsumsize > 0) { 523996c772fSJohn Dyson lp = fs->fs_maxcluster; 524996c772fSJohn Dyson for (i = 0; i < fs->fs_ncg; i++) 525996c772fSJohn Dyson *lp++ = fs->fs_contigsumsize; 526996c772fSJohn Dyson } 527996c772fSJohn Dyson 528df8bae1dSRodney W. Grimes loop: 529ca430f2eSAlexander Kabaev MNT_ILOCK(mp); 53082be0a5aSTor Egge MNT_VNODE_FOREACH(vp, mp, mvp) { 53104a17687SJeff Roberson VI_LOCK(vp); 532fe68abe2SJeff Roberson if (vp->v_iflag & VI_DOOMED) { 5332f05568aSJeff Roberson VI_UNLOCK(vp); 5342f05568aSJeff Roberson continue; 5352f05568aSJeff Roberson } 536ca430f2eSAlexander Kabaev MNT_IUNLOCK(mp); 537df8bae1dSRodney W. Grimes /* 538fe68abe2SJeff Roberson * Step 4: invalidate all cached file data. 539df8bae1dSRodney W. Grimes */ 540b40ce416SJulian Elischer if (vget(vp, LK_EXCLUSIVE | LK_INTERLOCK, td)) { 54182be0a5aSTor Egge MNT_VNODE_FOREACH_ABORT(mp, mvp); 542df8bae1dSRodney W. Grimes goto loop; 543996c772fSJohn Dyson } 5447c0745eeSPoul-Henning Kamp if (vinvalbuf(vp, 0, td, 0, 0)) 545df8bae1dSRodney W. Grimes panic("ffs_reload: dirty2"); 546df8bae1dSRodney W. Grimes /* 547fe68abe2SJeff Roberson * Step 5: re-read inode data for all active vnodes. 548df8bae1dSRodney W. Grimes */ 549df8bae1dSRodney W. Grimes ip = VTOI(vp); 550c9671602SPoul-Henning Kamp error = 551df8bae1dSRodney W. Grimes bread(devvp, fsbtodb(fs, ino_to_fsba(fs, ip->i_number)), 552c9671602SPoul-Henning Kamp (int)fs->fs_bsize, NOCRED, &bp); 553c9671602SPoul-Henning Kamp if (error) { 55422db15c0SAttilio Rao VOP_UNLOCK(vp, 0); 55545d45c6cSAlexander Kabaev vrele(vp); 55682be0a5aSTor Egge MNT_VNODE_FOREACH_ABORT(mp, mvp); 557df8bae1dSRodney W. Grimes return (error); 558df8bae1dSRodney W. Grimes } 559de6ba7c0SPoul-Henning Kamp ffs_load_inode(bp, ip, fs, ip->i_number); 560b1897c19SJulian Elischer ip->i_effnlink = ip->i_nlink; 561df8bae1dSRodney W. Grimes brelse(bp); 56222db15c0SAttilio Rao VOP_UNLOCK(vp, 0); 563cb9ddc80SAlexander Kabaev vrele(vp); 564ca430f2eSAlexander Kabaev MNT_ILOCK(mp); 565df8bae1dSRodney W. Grimes } 566ca430f2eSAlexander Kabaev MNT_IUNLOCK(mp); 567df8bae1dSRodney W. Grimes return (0); 568df8bae1dSRodney W. Grimes } 569df8bae1dSRodney W. Grimes 5701c85e6a3SKirk McKusick /* 5711c85e6a3SKirk McKusick * Possible superblock locations ordered from most to least likely. 5721c85e6a3SKirk McKusick */ 5731c85e6a3SKirk McKusick static int sblock_try[] = SBLOCKSEARCH; 5745819ab3fSKirk McKusick 575df8bae1dSRodney W. Grimes /* 576df8bae1dSRodney W. Grimes * Common code for mount and mountroot 577df8bae1dSRodney W. Grimes */ 578975512a9SPoul-Henning Kamp static int 579975512a9SPoul-Henning Kamp ffs_mountfs(devvp, mp, td) 58005f4ff5dSPoul-Henning Kamp struct vnode *devvp; 581df8bae1dSRodney W. Grimes struct mount *mp; 582b40ce416SJulian Elischer struct thread *td; 583df8bae1dSRodney W. Grimes { 58405f4ff5dSPoul-Henning Kamp struct ufsmount *ump; 585df8bae1dSRodney W. Grimes struct buf *bp; 58605f4ff5dSPoul-Henning Kamp struct fs *fs; 58789c9c53dSPoul-Henning Kamp struct cdev *dev; 588f55ff3f3SIan Dowse void *space; 5891c85e6a3SKirk McKusick ufs2_daddr_t sblockloc; 590f5ef029eSPoul-Henning Kamp int error, i, blks, size, ronly; 591996c772fSJohn Dyson int32_t *lp; 592996c772fSJohn Dyson struct ucred *cred; 59343920011SPoul-Henning Kamp struct g_consumer *cp; 5943bbd6d8aSJeff Roberson struct mount *nmp; 595df8bae1dSRodney W. Grimes 596996c772fSJohn Dyson dev = devvp->v_rdev; 597a854ed98SJohn Baldwin cred = td ? td->td_ucred : NOCRED; 59843920011SPoul-Henning Kamp 59943920011SPoul-Henning Kamp ronly = (mp->mnt_flag & MNT_RDONLY) != 0; 60043920011SPoul-Henning Kamp DROP_GIANT(); 60143920011SPoul-Henning Kamp g_topology_lock(); 60243920011SPoul-Henning Kamp error = g_vfs_open(devvp, &cp, "ffs", ronly ? 0 : 1); 60343920011SPoul-Henning Kamp 60443920011SPoul-Henning Kamp /* 60543920011SPoul-Henning Kamp * If we are a root mount, drop the E flag so fsck can do its magic. 60693e0b506SPoul-Henning Kamp * We will pick it up again when we remount R/W. 60743920011SPoul-Henning Kamp */ 60843920011SPoul-Henning Kamp if (error == 0 && ronly && (mp->mnt_flag & MNT_ROOTFS)) 60943920011SPoul-Henning Kamp error = g_access(cp, 0, 0, -1); 61043920011SPoul-Henning Kamp g_topology_unlock(); 61143920011SPoul-Henning Kamp PICKUP_GIANT(); 61222db15c0SAttilio Rao VOP_UNLOCK(devvp, 0); 613c9671602SPoul-Henning Kamp if (error) 614df8bae1dSRodney W. Grimes return (error); 6150508986cSBruce Evans if (devvp->v_rdev->si_iosize_max != 0) 6161b5464efSPoul-Henning Kamp mp->mnt_iosize_max = devvp->v_rdev->si_iosize_max; 6171b5464efSPoul-Henning Kamp if (mp->mnt_iosize_max > MAXPHYS) 6181b5464efSPoul-Henning Kamp mp->mnt_iosize_max = MAXPHYS; 61995e5e988SJohn Dyson 62043920011SPoul-Henning Kamp devvp->v_bufobj.bo_private = cp; 6216e77a041SPoul-Henning Kamp devvp->v_bufobj.bo_ops = &ffs_ops; 6226e77a041SPoul-Henning Kamp 623df8bae1dSRodney W. Grimes bp = NULL; 624df8bae1dSRodney W. Grimes ump = NULL; 6251c85e6a3SKirk McKusick fs = NULL; 6261c85e6a3SKirk McKusick sblockloc = 0; 6271c85e6a3SKirk McKusick /* 6281c85e6a3SKirk McKusick * Try reading the superblock in each of its possible locations. 6291c85e6a3SKirk McKusick */ 6301c85e6a3SKirk McKusick for (i = 0; sblock_try[i] != -1; i++) { 63171ac2d7cSCraig Rodrigues if ((SBLOCKSIZE % cp->provider->sectorsize) != 0) { 63271ac2d7cSCraig Rodrigues error = EINVAL; 63371ac2d7cSCraig Rodrigues vfs_mount_error(mp, 63471ac2d7cSCraig Rodrigues "Invalid sectorsize %d for superblock size %d", 63571ac2d7cSCraig Rodrigues cp->provider->sectorsize, SBLOCKSIZE); 63671ac2d7cSCraig Rodrigues goto out; 63771ac2d7cSCraig Rodrigues } 63871ac2d7cSCraig Rodrigues if ((error = bread(devvp, btodb(sblock_try[i]), SBLOCKSIZE, 6391c85e6a3SKirk McKusick cred, &bp)) != 0) 640df8bae1dSRodney W. Grimes goto out; 641df8bae1dSRodney W. Grimes fs = (struct fs *)bp->b_data; 642ada981b2SKirk McKusick sblockloc = sblock_try[i]; 6431c85e6a3SKirk McKusick if ((fs->fs_magic == FS_UFS1_MAGIC || 6441c85e6a3SKirk McKusick (fs->fs_magic == FS_UFS2_MAGIC && 645ada981b2SKirk McKusick (fs->fs_sblockloc == sblockloc || 646ada981b2SKirk McKusick (fs->fs_old_flags & FS_FLAGS_UPDATED) == 0))) && 6471c85e6a3SKirk McKusick fs->fs_bsize <= MAXBSIZE && 6481c85e6a3SKirk McKusick fs->fs_bsize >= sizeof(struct fs)) 6491c85e6a3SKirk McKusick break; 6501c85e6a3SKirk McKusick brelse(bp); 6511c85e6a3SKirk McKusick bp = NULL; 6521c85e6a3SKirk McKusick } 6531c85e6a3SKirk McKusick if (sblock_try[i] == -1) { 654df8bae1dSRodney W. Grimes error = EINVAL; /* XXX needs translation */ 655df8bae1dSRodney W. Grimes goto out; 656df8bae1dSRodney W. Grimes } 6573f6f17eeSJulian Elischer fs->fs_fmod = 0; 6581c85e6a3SKirk McKusick fs->fs_flags &= ~FS_INDEXDIRS; /* no support for directory indicies */ 6590922cce6SBruce Evans fs->fs_flags &= ~FS_UNCLEAN; 6600922cce6SBruce Evans if (fs->fs_clean == 0) { 6610922cce6SBruce Evans fs->fs_flags |= FS_UNCLEAN; 662812b1d41SKirk McKusick if (ronly || (mp->mnt_flag & MNT_FORCE) || 6631a6a6610SKirk McKusick ((fs->fs_flags & FS_NEEDSFSCK) == 0 && 6641a6a6610SKirk McKusick (fs->fs_flags & FS_DOSOFTDEP))) { 6650922cce6SBruce Evans printf( 6660922cce6SBruce Evans "WARNING: %s was not properly dismounted\n", 6670922cce6SBruce Evans fs->fs_fsmnt); 6681469eec8SDavid Greenman } else { 6690922cce6SBruce Evans printf( 6700922cce6SBruce Evans "WARNING: R/W mount of %s denied. Filesystem is not clean - run fsck\n", 6710922cce6SBruce Evans fs->fs_fsmnt); 6721469eec8SDavid Greenman error = EPERM; 6731469eec8SDavid Greenman goto out; 6741469eec8SDavid Greenman } 6751c85e6a3SKirk McKusick if ((fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) && 6761c85e6a3SKirk McKusick (mp->mnt_flag & MNT_FORCE)) { 677cfbf0a46SMaxime Henrion printf("%s: lost blocks %jd files %d\n", fs->fs_fsmnt, 6781c85e6a3SKirk McKusick (intmax_t)fs->fs_pendingblocks, 6791c85e6a3SKirk McKusick fs->fs_pendinginodes); 6809ccb939eSKirk McKusick fs->fs_pendingblocks = 0; 6819ccb939eSKirk McKusick fs->fs_pendinginodes = 0; 6829ccb939eSKirk McKusick } 6839ccb939eSKirk McKusick } 6849ccb939eSKirk McKusick if (fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) { 685cfbf0a46SMaxime Henrion printf("%s: mount pending error: blocks %jd files %d\n", 6861c85e6a3SKirk McKusick fs->fs_fsmnt, (intmax_t)fs->fs_pendingblocks, 6871c85e6a3SKirk McKusick fs->fs_pendinginodes); 6889ccb939eSKirk McKusick fs->fs_pendingblocks = 0; 6899ccb939eSKirk McKusick fs->fs_pendinginodes = 0; 6901469eec8SDavid Greenman } 6911a60c7fcSPawel Jakub Dawidek if ((fs->fs_flags & FS_GJOURNAL) != 0) { 6921a60c7fcSPawel Jakub Dawidek #ifdef UFS_GJOURNAL 6931a60c7fcSPawel Jakub Dawidek /* 6941a60c7fcSPawel Jakub Dawidek * Get journal provider name. 6951a60c7fcSPawel Jakub Dawidek */ 6961a60c7fcSPawel Jakub Dawidek size = 1024; 6971a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider = malloc(size, M_UFSMNT, M_WAITOK); 6981a60c7fcSPawel Jakub Dawidek if (g_io_getattr("GJOURNAL::provider", cp, &size, 6991a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider) == 0) { 7001a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider = realloc(mp->mnt_gjprovider, size, 7011a60c7fcSPawel Jakub Dawidek M_UFSMNT, M_WAITOK); 7021a60c7fcSPawel Jakub Dawidek MNT_ILOCK(mp); 7031a60c7fcSPawel Jakub Dawidek mp->mnt_flag |= MNT_GJOURNAL; 7041a60c7fcSPawel Jakub Dawidek MNT_IUNLOCK(mp); 7051a60c7fcSPawel Jakub Dawidek } else { 7061a60c7fcSPawel Jakub Dawidek printf( 7071a60c7fcSPawel Jakub Dawidek "WARNING: %s: GJOURNAL flag on fs but no gjournal provider below\n", 7081a60c7fcSPawel Jakub Dawidek mp->mnt_stat.f_mntonname); 7091a60c7fcSPawel Jakub Dawidek free(mp->mnt_gjprovider, M_UFSMNT); 7101a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider = NULL; 7111a60c7fcSPawel Jakub Dawidek } 7121a60c7fcSPawel Jakub Dawidek #else 7131a60c7fcSPawel Jakub Dawidek printf( 7141a60c7fcSPawel Jakub Dawidek "WARNING: %s: GJOURNAL flag on fs but no UFS_GJOURNAL support\n", 7151a60c7fcSPawel Jakub Dawidek mp->mnt_stat.f_mntonname); 7161a60c7fcSPawel Jakub Dawidek #endif 7171a60c7fcSPawel Jakub Dawidek } else { 7181a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider = NULL; 7191a60c7fcSPawel Jakub Dawidek } 720a163d034SWarner Losh ump = malloc(sizeof *ump, M_UFSMNT, M_WAITOK | M_ZERO); 72143920011SPoul-Henning Kamp ump->um_cp = cp; 72243920011SPoul-Henning Kamp ump->um_bo = &devvp->v_bufobj; 7238dd56505SPoul-Henning Kamp ump->um_fs = malloc((u_long)fs->fs_sbsize, M_UFSMNT, M_WAITOK); 7241c85e6a3SKirk McKusick if (fs->fs_magic == FS_UFS1_MAGIC) { 7251c85e6a3SKirk McKusick ump->um_fstype = UFS1; 7261c85e6a3SKirk McKusick ump->um_balloc = ffs_balloc_ufs1; 7271c85e6a3SKirk McKusick } else { 7281c85e6a3SKirk McKusick ump->um_fstype = UFS2; 7291c85e6a3SKirk McKusick ump->um_balloc = ffs_balloc_ufs2; 7301c85e6a3SKirk McKusick } 731cec0f20cSPoul-Henning Kamp ump->um_blkatoff = ffs_blkatoff; 732cec0f20cSPoul-Henning Kamp ump->um_truncate = ffs_truncate; 733987f5696SPoul-Henning Kamp ump->um_update = ffs_update; 734cec0f20cSPoul-Henning Kamp ump->um_valloc = ffs_valloc; 735cec0f20cSPoul-Henning Kamp ump->um_vfree = ffs_vfree; 736975512a9SPoul-Henning Kamp ump->um_ifree = ffs_ifree; 73790446e36SKonstantin Belousov ump->um_rdonly = ffs_rdonly; 7383ba649d7SJeff Roberson mtx_init(UFS_MTX(ump), "FFS", "FFS Lock", MTX_DEF); 739df8bae1dSRodney W. Grimes bcopy(bp->b_data, ump->um_fs, (u_int)fs->fs_sbsize); 7401c85e6a3SKirk McKusick if (fs->fs_sbsize < SBLOCKSIZE) 741f2a2857bSKirk McKusick bp->b_flags |= B_INVAL | B_NOCACHE; 742df8bae1dSRodney W. Grimes brelse(bp); 743df8bae1dSRodney W. Grimes bp = NULL; 744df8bae1dSRodney W. Grimes fs = ump->um_fs; 7451c85e6a3SKirk McKusick ffs_oldfscompat_read(fs, ump, sblockloc); 746df8bae1dSRodney W. Grimes fs->fs_ronly = ronly; 747996c772fSJohn Dyson size = fs->fs_cssize; 748996c772fSJohn Dyson blks = howmany(size, fs->fs_fsize); 749996c772fSJohn Dyson if (fs->fs_contigsumsize > 0) 750996c772fSJohn Dyson size += fs->fs_ncg * sizeof(int32_t); 751a61ab64aSKirk McKusick size += fs->fs_ncg * sizeof(u_int8_t); 752a163d034SWarner Losh space = malloc((u_long)size, M_UFSMNT, M_WAITOK); 753f55ff3f3SIan Dowse fs->fs_csp = space; 754df8bae1dSRodney W. Grimes for (i = 0; i < blks; i += fs->fs_frag) { 755df8bae1dSRodney W. Grimes size = fs->fs_bsize; 756df8bae1dSRodney W. Grimes if (i + fs->fs_frag > blks) 757df8bae1dSRodney W. Grimes size = (blks - i) * fs->fs_fsize; 7588aef1712SMatthew Dillon if ((error = bread(devvp, fsbtodb(fs, fs->fs_csaddr + i), size, 7598aef1712SMatthew Dillon cred, &bp)) != 0) { 760f55ff3f3SIan Dowse free(fs->fs_csp, M_UFSMNT); 761df8bae1dSRodney W. Grimes goto out; 762df8bae1dSRodney W. Grimes } 763df8bae1dSRodney W. Grimes bcopy(bp->b_data, space, (u_int)size); 764f55ff3f3SIan Dowse space = (char *)space + size; 765df8bae1dSRodney W. Grimes brelse(bp); 766df8bae1dSRodney W. Grimes bp = NULL; 767df8bae1dSRodney W. Grimes } 768996c772fSJohn Dyson if (fs->fs_contigsumsize > 0) { 769f55ff3f3SIan Dowse fs->fs_maxcluster = lp = space; 770996c772fSJohn Dyson for (i = 0; i < fs->fs_ncg; i++) 771996c772fSJohn Dyson *lp++ = fs->fs_contigsumsize; 7724691e9eaSIan Dowse space = lp; 773996c772fSJohn Dyson } 774a61ab64aSKirk McKusick size = fs->fs_ncg * sizeof(u_int8_t); 775a61ab64aSKirk McKusick fs->fs_contigdirs = (u_int8_t *)space; 776a61ab64aSKirk McKusick bzero(fs->fs_contigdirs, size); 777143a5346SIan Dowse fs->fs_active = NULL; 77877465d93SAlfred Perlstein mp->mnt_data = ump; 77968de329eSPoul-Henning Kamp mp->mnt_stat.f_fsid.val[0] = fs->fs_id[0]; 7808f89943eSGuido van Rooij mp->mnt_stat.f_fsid.val[1] = fs->fs_id[1]; 7813bbd6d8aSJeff Roberson nmp = NULL; 78268de329eSPoul-Henning Kamp if (fs->fs_id[0] == 0 || fs->fs_id[1] == 0 || 7833bbd6d8aSJeff Roberson (nmp = vfs_getvfs(&mp->mnt_stat.f_fsid))) { 7843bbd6d8aSJeff Roberson if (nmp) 7853bbd6d8aSJeff Roberson vfs_rel(nmp); 78668de329eSPoul-Henning Kamp vfs_getnewfsid(mp); 7873bbd6d8aSJeff Roberson } 788df8bae1dSRodney W. Grimes mp->mnt_maxsymlinklen = fs->fs_maxsymlinklen; 7895da56ddbSTor Egge MNT_ILOCK(mp); 790cc9d8990SPeter Wemm mp->mnt_flag |= MNT_LOCAL; 7915da56ddbSTor Egge MNT_IUNLOCK(mp); 7925da56ddbSTor Egge if ((fs->fs_flags & FS_MULTILABEL) != 0) { 7937b3f1bbdSTom Rhodes #ifdef MAC 7945da56ddbSTor Egge MNT_ILOCK(mp); 79580830407SRobert Watson mp->mnt_flag |= MNT_MULTILABEL; 7965da56ddbSTor Egge MNT_IUNLOCK(mp); 7977b3f1bbdSTom Rhodes #else 7987b3f1bbdSTom Rhodes printf( 7997b3f1bbdSTom Rhodes "WARNING: %s: multilabel flag on fs but no MAC support\n", 800946478fcSPawel Jakub Dawidek mp->mnt_stat.f_mntonname); 8017b3f1bbdSTom Rhodes #endif 8025da56ddbSTor Egge } 8035da56ddbSTor Egge if ((fs->fs_flags & FS_ACLS) != 0) { 8047b3f1bbdSTom Rhodes #ifdef UFS_ACL 8055da56ddbSTor Egge MNT_ILOCK(mp); 80680830407SRobert Watson mp->mnt_flag |= MNT_ACLS; 8075da56ddbSTor Egge MNT_IUNLOCK(mp); 8087b3f1bbdSTom Rhodes #else 8097b3f1bbdSTom Rhodes printf( 8107b3f1bbdSTom Rhodes "WARNING: %s: ACLs flag on fs but no ACLs support\n", 811946478fcSPawel Jakub Dawidek mp->mnt_stat.f_mntonname); 8127b3f1bbdSTom Rhodes #endif 8135da56ddbSTor Egge } 814df8bae1dSRodney W. Grimes ump->um_mountp = mp; 815df8bae1dSRodney W. Grimes ump->um_dev = dev; 816df8bae1dSRodney W. Grimes ump->um_devvp = devvp; 817df8bae1dSRodney W. Grimes ump->um_nindir = fs->fs_nindir; 818df8bae1dSRodney W. Grimes ump->um_bptrtodb = fs->fs_fsbtodb; 819df8bae1dSRodney W. Grimes ump->um_seqinc = fs->fs_frag; 820df8bae1dSRodney W. Grimes for (i = 0; i < MAXQUOTAS; i++) 821df8bae1dSRodney W. Grimes ump->um_quotas[i] = NULLVP; 822516081f2SRobert Watson #ifdef UFS_EXTATTR 823a64ed089SRobert Watson ufs_extattr_uepm_init(&ump->um_extattr); 824a64ed089SRobert Watson #endif 8252b14f991SJulian Elischer /* 8262b14f991SJulian Elischer * Set FS local "last mounted on" information (NULL pad) 8272b14f991SJulian Elischer */ 82893373c42SSuleiman Souhlal bzero(fs->fs_fsmnt, MAXMNTLEN); 82993373c42SSuleiman Souhlal strlcpy(fs->fs_fsmnt, mp->mnt_stat.f_mntonname, MAXMNTLEN); 8302b14f991SJulian Elischer 8312b14f991SJulian Elischer if( mp->mnt_flag & MNT_ROOTFS) { 8322b14f991SJulian Elischer /* 8332b14f991SJulian Elischer * Root mount; update timestamp in mount structure. 8342b14f991SJulian Elischer * this will be used by the common root mount code 8352b14f991SJulian Elischer * to update the system clock. 8362b14f991SJulian Elischer */ 8372b14f991SJulian Elischer mp->mnt_time = fs->fs_time; 8382b14f991SJulian Elischer } 839996c772fSJohn Dyson 840996c772fSJohn Dyson if (ronly == 0) { 841b1897c19SJulian Elischer if ((fs->fs_flags & FS_DOSOFTDEP) && 842b1897c19SJulian Elischer (error = softdep_mount(devvp, mp, fs, cred)) != 0) { 843f55ff3f3SIan Dowse free(fs->fs_csp, M_UFSMNT); 844b1897c19SJulian Elischer goto out; 845b1897c19SJulian Elischer } 846f2a2857bSKirk McKusick if (fs->fs_snapinum[0] != 0) 847f2a2857bSKirk McKusick ffs_snapshot_mount(mp); 848cf60e8e4SKirk McKusick fs->fs_fmod = 1; 849996c772fSJohn Dyson fs->fs_clean = 0; 850791dd2faSTor Egge (void) ffs_sbupdate(ump, MNT_WAIT, 0); 851996c772fSJohn Dyson } 852d8d3d415SPoul-Henning Kamp /* 853d8d3d415SPoul-Henning Kamp * Initialize filesystem stat information in mount struct. 854d8d3d415SPoul-Henning Kamp */ 8556cf7bc60SRobert Watson MNT_ILOCK(mp); 8566cf7bc60SRobert Watson mp->mnt_kern_flag |= MNTK_MPSAFE; 8576cf7bc60SRobert Watson MNT_IUNLOCK(mp); 858516081f2SRobert Watson #ifdef UFS_EXTATTR 859516081f2SRobert Watson #ifdef UFS_EXTATTR_AUTOSTART 8609de54ba5SRobert Watson /* 8619de54ba5SRobert Watson * 862f5161237SRobert Watson * Auto-starting does the following: 8639de54ba5SRobert Watson * - check for /.attribute in the fs, and extattr_start if so 8649de54ba5SRobert Watson * - for each file in .attribute, enable that file with 8659de54ba5SRobert Watson * an attribute of the same name. 8669de54ba5SRobert Watson * Not clear how to report errors -- probably eat them. 8679de54ba5SRobert Watson * This would all happen while the filesystem was busy/not 8689de54ba5SRobert Watson * available, so would effectively be "atomic". 8699de54ba5SRobert Watson */ 870e7fd8877SKonstantin Belousov mp->mnt_stat.f_iosize = fs->fs_bsize; 871b40ce416SJulian Elischer (void) ufs_extattr_autostart(mp, td); 872516081f2SRobert Watson #endif /* !UFS_EXTATTR_AUTOSTART */ 873516081f2SRobert Watson #endif /* !UFS_EXTATTR */ 874df8bae1dSRodney W. Grimes return (0); 875df8bae1dSRodney W. Grimes out: 876df8bae1dSRodney W. Grimes if (bp) 877df8bae1dSRodney W. Grimes brelse(bp); 87843920011SPoul-Henning Kamp if (cp != NULL) { 87943920011SPoul-Henning Kamp DROP_GIANT(); 88043920011SPoul-Henning Kamp g_topology_lock(); 88184a69752SPoul-Henning Kamp g_vfs_close(cp, td); 88243920011SPoul-Henning Kamp g_topology_unlock(); 88343920011SPoul-Henning Kamp PICKUP_GIANT(); 88443920011SPoul-Henning Kamp } 885df8bae1dSRodney W. Grimes if (ump) { 8863ba649d7SJeff Roberson mtx_destroy(UFS_MTX(ump)); 8871a60c7fcSPawel Jakub Dawidek if (mp->mnt_gjprovider != NULL) { 8881a60c7fcSPawel Jakub Dawidek free(mp->mnt_gjprovider, M_UFSMNT); 8891a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider = NULL; 8901a60c7fcSPawel Jakub Dawidek } 891df8bae1dSRodney W. Grimes free(ump->um_fs, M_UFSMNT); 892df8bae1dSRodney W. Grimes free(ump, M_UFSMNT); 89377465d93SAlfred Perlstein mp->mnt_data = NULL; 894df8bae1dSRodney W. Grimes } 895df8bae1dSRodney W. Grimes return (error); 896df8bae1dSRodney W. Grimes } 897df8bae1dSRodney W. Grimes 8981c85e6a3SKirk McKusick #include <sys/sysctl.h> 899adf41577SPoul-Henning Kamp static int bigcgs = 0; 9001c85e6a3SKirk McKusick SYSCTL_INT(_debug, OID_AUTO, bigcgs, CTLFLAG_RW, &bigcgs, 0, ""); 9011c85e6a3SKirk McKusick 902df8bae1dSRodney W. Grimes /* 9031c85e6a3SKirk McKusick * Sanity checks for loading old filesystem superblocks. 9041c85e6a3SKirk McKusick * See ffs_oldfscompat_write below for unwound actions. 905df8bae1dSRodney W. Grimes * 9061c85e6a3SKirk McKusick * XXX - Parts get retired eventually. 9071c85e6a3SKirk McKusick * Unfortunately new bits get added. 908df8bae1dSRodney W. Grimes */ 9091c85e6a3SKirk McKusick static void 9101c85e6a3SKirk McKusick ffs_oldfscompat_read(fs, ump, sblockloc) 911df8bae1dSRodney W. Grimes struct fs *fs; 9121c85e6a3SKirk McKusick struct ufsmount *ump; 9131c85e6a3SKirk McKusick ufs2_daddr_t sblockloc; 9141c85e6a3SKirk McKusick { 9151c85e6a3SKirk McKusick off_t maxfilesize; 9161c85e6a3SKirk McKusick 9171c85e6a3SKirk McKusick /* 918ada981b2SKirk McKusick * If not yet done, update fs_flags location and value of fs_sblockloc. 919ada981b2SKirk McKusick */ 920ada981b2SKirk McKusick if ((fs->fs_old_flags & FS_FLAGS_UPDATED) == 0) { 921ada981b2SKirk McKusick fs->fs_flags = fs->fs_old_flags; 922ada981b2SKirk McKusick fs->fs_old_flags |= FS_FLAGS_UPDATED; 923ada981b2SKirk McKusick fs->fs_sblockloc = sblockloc; 924ada981b2SKirk McKusick } 925ada981b2SKirk McKusick /* 9261c85e6a3SKirk McKusick * If not yet done, update UFS1 superblock with new wider fields. 9271c85e6a3SKirk McKusick */ 92874f3809aSKirk McKusick if (fs->fs_magic == FS_UFS1_MAGIC && fs->fs_maxbsize != fs->fs_bsize) { 9291c85e6a3SKirk McKusick fs->fs_maxbsize = fs->fs_bsize; 9301c85e6a3SKirk McKusick fs->fs_time = fs->fs_old_time; 9311c85e6a3SKirk McKusick fs->fs_size = fs->fs_old_size; 9321c85e6a3SKirk McKusick fs->fs_dsize = fs->fs_old_dsize; 9331c85e6a3SKirk McKusick fs->fs_csaddr = fs->fs_old_csaddr; 9341c85e6a3SKirk McKusick fs->fs_cstotal.cs_ndir = fs->fs_old_cstotal.cs_ndir; 9351c85e6a3SKirk McKusick fs->fs_cstotal.cs_nbfree = fs->fs_old_cstotal.cs_nbfree; 9361c85e6a3SKirk McKusick fs->fs_cstotal.cs_nifree = fs->fs_old_cstotal.cs_nifree; 9371c85e6a3SKirk McKusick fs->fs_cstotal.cs_nffree = fs->fs_old_cstotal.cs_nffree; 9381c85e6a3SKirk McKusick } 9391c85e6a3SKirk McKusick if (fs->fs_magic == FS_UFS1_MAGIC && 9401c85e6a3SKirk McKusick fs->fs_old_inodefmt < FS_44INODEFMT) { 9418680d698SNate Lawson fs->fs_maxfilesize = ((uint64_t)1 << 31) - 1; 9421c85e6a3SKirk McKusick fs->fs_qbmask = ~fs->fs_bmask; 9431c85e6a3SKirk McKusick fs->fs_qfmask = ~fs->fs_fmask; 9441c85e6a3SKirk McKusick } 9458f42fb8fSIan Dowse if (fs->fs_magic == FS_UFS1_MAGIC) { 9461c85e6a3SKirk McKusick ump->um_savedmaxfilesize = fs->fs_maxfilesize; 9478680d698SNate Lawson maxfilesize = (uint64_t)0x80000000 * fs->fs_bsize - 1; 9481c85e6a3SKirk McKusick if (fs->fs_maxfilesize > maxfilesize) 9491c85e6a3SKirk McKusick fs->fs_maxfilesize = maxfilesize; 9508f42fb8fSIan Dowse } 9511c85e6a3SKirk McKusick /* Compatibility for old filesystems */ 9521c85e6a3SKirk McKusick if (fs->fs_avgfilesize <= 0) 9531c85e6a3SKirk McKusick fs->fs_avgfilesize = AVFILESIZ; 9541c85e6a3SKirk McKusick if (fs->fs_avgfpdir <= 0) 9551c85e6a3SKirk McKusick fs->fs_avgfpdir = AFPDIR; 9561c85e6a3SKirk McKusick if (bigcgs) { 9571c85e6a3SKirk McKusick fs->fs_save_cgsize = fs->fs_cgsize; 9581c85e6a3SKirk McKusick fs->fs_cgsize = fs->fs_bsize; 9591c85e6a3SKirk McKusick } 9601c85e6a3SKirk McKusick } 9611c85e6a3SKirk McKusick 9621c85e6a3SKirk McKusick /* 9631c85e6a3SKirk McKusick * Unwinding superblock updates for old filesystems. 9641c85e6a3SKirk McKusick * See ffs_oldfscompat_read above for details. 9651c85e6a3SKirk McKusick * 9661c85e6a3SKirk McKusick * XXX - Parts get retired eventually. 9671c85e6a3SKirk McKusick * Unfortunately new bits get added. 9681c85e6a3SKirk McKusick */ 9691c85e6a3SKirk McKusick static void 9701c85e6a3SKirk McKusick ffs_oldfscompat_write(fs, ump) 9711c85e6a3SKirk McKusick struct fs *fs; 9721c85e6a3SKirk McKusick struct ufsmount *ump; 973df8bae1dSRodney W. Grimes { 974df8bae1dSRodney W. Grimes 9751c85e6a3SKirk McKusick /* 9761c85e6a3SKirk McKusick * Copy back UFS2 updated fields that UFS1 inspects. 9771c85e6a3SKirk McKusick */ 9781c85e6a3SKirk McKusick if (fs->fs_magic == FS_UFS1_MAGIC) { 9791c85e6a3SKirk McKusick fs->fs_old_time = fs->fs_time; 9801c85e6a3SKirk McKusick fs->fs_old_cstotal.cs_ndir = fs->fs_cstotal.cs_ndir; 9811c85e6a3SKirk McKusick fs->fs_old_cstotal.cs_nbfree = fs->fs_cstotal.cs_nbfree; 9821c85e6a3SKirk McKusick fs->fs_old_cstotal.cs_nifree = fs->fs_cstotal.cs_nifree; 9831c85e6a3SKirk McKusick fs->fs_old_cstotal.cs_nffree = fs->fs_cstotal.cs_nffree; 9841c85e6a3SKirk McKusick fs->fs_maxfilesize = ump->um_savedmaxfilesize; 9858f42fb8fSIan Dowse } 9861c85e6a3SKirk McKusick if (bigcgs) { 9871c85e6a3SKirk McKusick fs->fs_cgsize = fs->fs_save_cgsize; 9881c85e6a3SKirk McKusick fs->fs_save_cgsize = 0; 9891c85e6a3SKirk McKusick } 990df8bae1dSRodney W. Grimes } 991df8bae1dSRodney W. Grimes 992df8bae1dSRodney W. Grimes /* 993df8bae1dSRodney W. Grimes * unmount system call 994df8bae1dSRodney W. Grimes */ 995adf41577SPoul-Henning Kamp static int 996b40ce416SJulian Elischer ffs_unmount(mp, mntflags, td) 997df8bae1dSRodney W. Grimes struct mount *mp; 998df8bae1dSRodney W. Grimes int mntflags; 999b40ce416SJulian Elischer struct thread *td; 1000df8bae1dSRodney W. Grimes { 100105f4ff5dSPoul-Henning Kamp struct ufsmount *ump = VFSTOUFS(mp); 100205f4ff5dSPoul-Henning Kamp struct fs *fs; 1003996c772fSJohn Dyson int error, flags; 1004df8bae1dSRodney W. Grimes 1005df8bae1dSRodney W. Grimes flags = 0; 1006df8bae1dSRodney W. Grimes if (mntflags & MNT_FORCE) { 1007df8bae1dSRodney W. Grimes flags |= FORCECLOSE; 1008df8bae1dSRodney W. Grimes } 1009516081f2SRobert Watson #ifdef UFS_EXTATTR 1010b40ce416SJulian Elischer if ((error = ufs_extattr_stop(mp, td))) { 1011b2b0497aSRobert Watson if (error != EOPNOTSUPP) 1012b2b0497aSRobert Watson printf("ffs_unmount: ufs_extattr_stop returned %d\n", 1013b2b0497aSRobert Watson error); 10147df97b61SRobert Watson } else { 10159de54ba5SRobert Watson ufs_extattr_uepm_destroy(&ump->um_extattr); 10167df97b61SRobert Watson } 1017a64ed089SRobert Watson #endif 1018b1897c19SJulian Elischer if (mp->mnt_flag & MNT_SOFTDEP) { 1019b40ce416SJulian Elischer if ((error = softdep_flushfiles(mp, flags, td)) != 0) 1020df8bae1dSRodney W. Grimes return (error); 1021b1897c19SJulian Elischer } else { 1022b40ce416SJulian Elischer if ((error = ffs_flushfiles(mp, flags, td)) != 0) 1023b1897c19SJulian Elischer return (error); 1024b1897c19SJulian Elischer } 1025df8bae1dSRodney W. Grimes fs = ump->um_fs; 10263ba649d7SJeff Roberson UFS_LOCK(ump); 10279ccb939eSKirk McKusick if (fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) { 1028cfbf0a46SMaxime Henrion printf("%s: unmount pending error: blocks %jd files %d\n", 10291c85e6a3SKirk McKusick fs->fs_fsmnt, (intmax_t)fs->fs_pendingblocks, 10301c85e6a3SKirk McKusick fs->fs_pendinginodes); 10319ccb939eSKirk McKusick fs->fs_pendingblocks = 0; 10329ccb939eSKirk McKusick fs->fs_pendinginodes = 0; 10339ccb939eSKirk McKusick } 10343ba649d7SJeff Roberson UFS_UNLOCK(ump); 1035996c772fSJohn Dyson if (fs->fs_ronly == 0) { 10361a6a6610SKirk McKusick fs->fs_clean = fs->fs_flags & (FS_UNCLEAN|FS_NEEDSFSCK) ? 0 : 1; 1037791dd2faSTor Egge error = ffs_sbupdate(ump, MNT_WAIT, 0); 1038996c772fSJohn Dyson if (error) { 1039996c772fSJohn Dyson fs->fs_clean = 0; 1040996c772fSJohn Dyson return (error); 1041996c772fSJohn Dyson } 1042e0e9c421SDavid Greenman } 104343920011SPoul-Henning Kamp DROP_GIANT(); 104443920011SPoul-Henning Kamp g_topology_lock(); 104584a69752SPoul-Henning Kamp g_vfs_close(ump->um_cp, td); 104643920011SPoul-Henning Kamp g_topology_unlock(); 104743920011SPoul-Henning Kamp PICKUP_GIANT(); 10486476c0d2SJohn Dyson vrele(ump->um_devvp); 10493ba649d7SJeff Roberson mtx_destroy(UFS_MTX(ump)); 10501a60c7fcSPawel Jakub Dawidek if (mp->mnt_gjprovider != NULL) { 10511a60c7fcSPawel Jakub Dawidek free(mp->mnt_gjprovider, M_UFSMNT); 10521a60c7fcSPawel Jakub Dawidek mp->mnt_gjprovider = NULL; 10531a60c7fcSPawel Jakub Dawidek } 1054f55ff3f3SIan Dowse free(fs->fs_csp, M_UFSMNT); 1055df8bae1dSRodney W. Grimes free(fs, M_UFSMNT); 1056df8bae1dSRodney W. Grimes free(ump, M_UFSMNT); 105777465d93SAlfred Perlstein mp->mnt_data = NULL; 10585da56ddbSTor Egge MNT_ILOCK(mp); 1059cc9d8990SPeter Wemm mp->mnt_flag &= ~MNT_LOCAL; 10605da56ddbSTor Egge MNT_IUNLOCK(mp); 1061df8bae1dSRodney W. Grimes return (error); 1062df8bae1dSRodney W. Grimes } 1063df8bae1dSRodney W. Grimes 1064df8bae1dSRodney W. Grimes /* 1065df8bae1dSRodney W. Grimes * Flush out all the files in a filesystem. 1066df8bae1dSRodney W. Grimes */ 106726f9a767SRodney W. Grimes int 1068b40ce416SJulian Elischer ffs_flushfiles(mp, flags, td) 106905f4ff5dSPoul-Henning Kamp struct mount *mp; 1070df8bae1dSRodney W. Grimes int flags; 1071b40ce416SJulian Elischer struct thread *td; 1072df8bae1dSRodney W. Grimes { 107305f4ff5dSPoul-Henning Kamp struct ufsmount *ump; 1074c9671602SPoul-Henning Kamp int error; 1075df8bae1dSRodney W. Grimes 1076df8bae1dSRodney W. Grimes ump = VFSTOUFS(mp); 1077df8bae1dSRodney W. Grimes #ifdef QUOTA 1078df8bae1dSRodney W. Grimes if (mp->mnt_flag & MNT_QUOTA) { 1079c1d9efcbSPoul-Henning Kamp int i; 1080f257b7a5SAlfred Perlstein error = vflush(mp, 0, SKIPSYSTEM|flags, td); 1081c1d9efcbSPoul-Henning Kamp if (error) 1082df8bae1dSRodney W. Grimes return (error); 1083df8bae1dSRodney W. Grimes for (i = 0; i < MAXQUOTAS; i++) { 1084b40ce416SJulian Elischer quotaoff(td, mp, i); 1085df8bae1dSRodney W. Grimes } 1086df8bae1dSRodney W. Grimes /* 1087df8bae1dSRodney W. Grimes * Here we fall through to vflush again to ensure 1088df8bae1dSRodney W. Grimes * that we have gotten rid of all the system vnodes. 1089df8bae1dSRodney W. Grimes */ 1090df8bae1dSRodney W. Grimes } 1091df8bae1dSRodney W. Grimes #endif 1092e6e370a7SJeff Roberson ASSERT_VOP_LOCKED(ump->um_devvp, "ffs_flushfiles"); 1093e6e370a7SJeff Roberson if (ump->um_devvp->v_vflag & VV_COPYONWRITE) { 1094f257b7a5SAlfred Perlstein if ((error = vflush(mp, 0, SKIPSYSTEM | flags, td)) != 0) 1095f2a2857bSKirk McKusick return (error); 1096f2a2857bSKirk McKusick ffs_snapshot_unmount(mp); 109795e7a3c3STor Egge flags |= FORCECLOSE; 1098f2a2857bSKirk McKusick /* 1099f2a2857bSKirk McKusick * Here we fall through to vflush again to ensure 1100f2a2857bSKirk McKusick * that we have gotten rid of all the system vnodes. 1101f2a2857bSKirk McKusick */ 1102f2a2857bSKirk McKusick } 1103b1897c19SJulian Elischer /* 1104b1897c19SJulian Elischer * Flush all the files. 1105b1897c19SJulian Elischer */ 1106f257b7a5SAlfred Perlstein if ((error = vflush(mp, 0, flags, td)) != 0) 1107b1897c19SJulian Elischer return (error); 1108b1897c19SJulian Elischer /* 1109b1897c19SJulian Elischer * Flush filesystem metadata. 1110b1897c19SJulian Elischer */ 1111cb05b60aSAttilio Rao vn_lock(ump->um_devvp, LK_EXCLUSIVE | LK_RETRY); 11128df6bac4SPoul-Henning Kamp error = VOP_FSYNC(ump->um_devvp, MNT_WAIT, td); 111322db15c0SAttilio Rao VOP_UNLOCK(ump->um_devvp, 0); 1114df8bae1dSRodney W. Grimes return (error); 1115df8bae1dSRodney W. Grimes } 1116df8bae1dSRodney W. Grimes 1117df8bae1dSRodney W. Grimes /* 1118df8bae1dSRodney W. Grimes * Get filesystem statistics. 1119df8bae1dSRodney W. Grimes */ 1120adf41577SPoul-Henning Kamp static int 1121b40ce416SJulian Elischer ffs_statfs(mp, sbp, td) 1122df8bae1dSRodney W. Grimes struct mount *mp; 112305f4ff5dSPoul-Henning Kamp struct statfs *sbp; 1124b40ce416SJulian Elischer struct thread *td; 1125df8bae1dSRodney W. Grimes { 112605f4ff5dSPoul-Henning Kamp struct ufsmount *ump; 112705f4ff5dSPoul-Henning Kamp struct fs *fs; 1128df8bae1dSRodney W. Grimes 1129df8bae1dSRodney W. Grimes ump = VFSTOUFS(mp); 1130df8bae1dSRodney W. Grimes fs = ump->um_fs; 11311c85e6a3SKirk McKusick if (fs->fs_magic != FS_UFS1_MAGIC && fs->fs_magic != FS_UFS2_MAGIC) 1132df8bae1dSRodney W. Grimes panic("ffs_statfs"); 1133fde81c7dSKirk McKusick sbp->f_version = STATFS_VERSION; 1134df8bae1dSRodney W. Grimes sbp->f_bsize = fs->fs_fsize; 1135df8bae1dSRodney W. Grimes sbp->f_iosize = fs->fs_bsize; 1136df8bae1dSRodney W. Grimes sbp->f_blocks = fs->fs_dsize; 11373ba649d7SJeff Roberson UFS_LOCK(ump); 1138df8bae1dSRodney W. Grimes sbp->f_bfree = fs->fs_cstotal.cs_nbfree * fs->fs_frag + 11399ccb939eSKirk McKusick fs->fs_cstotal.cs_nffree + dbtofsb(fs, fs->fs_pendingblocks); 11409ccb939eSKirk McKusick sbp->f_bavail = freespace(fs, fs->fs_minfree) + 11419ccb939eSKirk McKusick dbtofsb(fs, fs->fs_pendingblocks); 1142df8bae1dSRodney W. Grimes sbp->f_files = fs->fs_ncg * fs->fs_ipg - ROOTINO; 11439ccb939eSKirk McKusick sbp->f_ffree = fs->fs_cstotal.cs_nifree + fs->fs_pendinginodes; 11443ba649d7SJeff Roberson UFS_UNLOCK(ump); 1145fde81c7dSKirk McKusick sbp->f_namemax = NAME_MAX; 1146df8bae1dSRodney W. Grimes return (0); 1147df8bae1dSRodney W. Grimes } 1148df8bae1dSRodney W. Grimes 1149df8bae1dSRodney W. Grimes /* 1150df8bae1dSRodney W. Grimes * Go through the disk queues to initiate sandbagged IO; 1151df8bae1dSRodney W. Grimes * go through the inodes to write those that have been modified; 1152df8bae1dSRodney W. Grimes * initiate the writing of the super block if it has been modified. 1153df8bae1dSRodney W. Grimes * 1154df8bae1dSRodney W. Grimes * Note: we are always called with the filesystem marked `MPBUSY'. 1155df8bae1dSRodney W. Grimes */ 1156adf41577SPoul-Henning Kamp static int 11578df6bac4SPoul-Henning Kamp ffs_sync(mp, waitfor, td) 1158df8bae1dSRodney W. Grimes struct mount *mp; 1159df8bae1dSRodney W. Grimes int waitfor; 1160b40ce416SJulian Elischer struct thread *td; 1161df8bae1dSRodney W. Grimes { 116282be0a5aSTor Egge struct vnode *mvp, *vp, *devvp; 1163996c772fSJohn Dyson struct inode *ip; 1164996c772fSJohn Dyson struct ufsmount *ump = VFSTOUFS(mp); 1165996c772fSJohn Dyson struct fs *fs; 11669b971133SKirk McKusick int error, count, wait, lockreq, allerror = 0; 1167791dd2faSTor Egge int suspend; 1168791dd2faSTor Egge int suspended; 1169791dd2faSTor Egge int secondary_writes; 1170791dd2faSTor Egge int secondary_accwrites; 1171791dd2faSTor Egge int softdep_deps; 1172791dd2faSTor Egge int softdep_accdeps; 1173156cb265SPoul-Henning Kamp struct bufobj *bo; 1174df8bae1dSRodney W. Grimes 1175df8bae1dSRodney W. Grimes fs = ump->um_fs; 1176996c772fSJohn Dyson if (fs->fs_fmod != 0 && fs->fs_ronly != 0) { /* XXX */ 1177df8bae1dSRodney W. Grimes printf("fs = %s\n", fs->fs_fsmnt); 11785ace3b26SMike Pritchard panic("ffs_sync: rofs mod"); 1179df8bae1dSRodney W. Grimes } 1180df8bae1dSRodney W. Grimes /* 1181df8bae1dSRodney W. Grimes * Write back each (modified) inode. 1182df8bae1dSRodney W. Grimes */ 11839b971133SKirk McKusick wait = 0; 1184791dd2faSTor Egge suspend = 0; 1185791dd2faSTor Egge suspended = 0; 1186245df27cSMatthew Dillon lockreq = LK_EXCLUSIVE | LK_NOWAIT; 1187791dd2faSTor Egge if (waitfor == MNT_SUSPEND) { 1188791dd2faSTor Egge suspend = 1; 1189791dd2faSTor Egge waitfor = MNT_WAIT; 1190791dd2faSTor Egge } 11919b971133SKirk McKusick if (waitfor == MNT_WAIT) { 11929b971133SKirk McKusick wait = 1; 1193245df27cSMatthew Dillon lockreq = LK_EXCLUSIVE; 11949b971133SKirk McKusick } 119541d4783dSJeff Roberson lockreq |= LK_INTERLOCK | LK_SLEEPFAIL; 1196ca430f2eSAlexander Kabaev MNT_ILOCK(mp); 1197df8bae1dSRodney W. Grimes loop: 1198791dd2faSTor Egge /* Grab snapshot of secondary write counts */ 1199791dd2faSTor Egge secondary_writes = mp->mnt_secondary_writes; 1200791dd2faSTor Egge secondary_accwrites = mp->mnt_secondary_accwrites; 1201791dd2faSTor Egge 1202791dd2faSTor Egge /* Grab snapshot of softdep dependency counts */ 1203791dd2faSTor Egge MNT_IUNLOCK(mp); 1204791dd2faSTor Egge softdep_get_depcounts(mp, &softdep_deps, &softdep_accdeps); 1205791dd2faSTor Egge MNT_ILOCK(mp); 1206791dd2faSTor Egge 120782be0a5aSTor Egge MNT_VNODE_FOREACH(vp, mp, mvp) { 1208245df27cSMatthew Dillon /* 1209245df27cSMatthew Dillon * Depend on the mntvnode_slock to keep things stable enough 1210245df27cSMatthew Dillon * for a quick test. Since there might be hundreds of 1211245df27cSMatthew Dillon * thousands of vnodes, we cannot afford even a subroutine 1212245df27cSMatthew Dillon * call unless there's a good chance that we have work to do. 1213245df27cSMatthew Dillon */ 12142f05568aSJeff Roberson VI_LOCK(vp); 1215fe68abe2SJeff Roberson if (vp->v_iflag & VI_DOOMED) { 12162f05568aSJeff Roberson VI_UNLOCK(vp); 12172f05568aSJeff Roberson continue; 12182f05568aSJeff Roberson } 1219df8bae1dSRodney W. Grimes ip = VTOI(vp); 1220cf60e8e4SKirk McKusick if (vp->v_type == VNON || ((ip->i_flag & 1221cf60e8e4SKirk McKusick (IN_ACCESS | IN_CHANGE | IN_MODIFIED | IN_UPDATE)) == 0 && 1222156cb265SPoul-Henning Kamp vp->v_bufobj.bo_dirty.bv_cnt == 0)) { 12232f05568aSJeff Roberson VI_UNLOCK(vp); 1224df8bae1dSRodney W. Grimes continue; 1225996c772fSJohn Dyson } 1226ca430f2eSAlexander Kabaev MNT_IUNLOCK(mp); 1227b40ce416SJulian Elischer if ((error = vget(vp, lockreq, td)) != 0) { 1228ca430f2eSAlexander Kabaev MNT_ILOCK(mp); 122982be0a5aSTor Egge if (error == ENOENT || error == ENOLCK) { 123082be0a5aSTor Egge MNT_VNODE_FOREACH_ABORT_ILOCKED(mp, mvp); 1231df8bae1dSRodney W. Grimes goto loop; 123282be0a5aSTor Egge } 12332f05568aSJeff Roberson continue; 12342f05568aSJeff Roberson } 123540854ff5SPoul-Henning Kamp if ((error = ffs_syncvnode(vp, waitfor)) != 0) 1236df8bae1dSRodney W. Grimes allerror = error; 123741d4783dSJeff Roberson vput(vp); 1238ca430f2eSAlexander Kabaev MNT_ILOCK(mp); 1239245df27cSMatthew Dillon } 1240ca430f2eSAlexander Kabaev MNT_IUNLOCK(mp); 1241df8bae1dSRodney W. Grimes /* 1242df8bae1dSRodney W. Grimes * Force stale filesystem control information to be flushed. 1243df8bae1dSRodney W. Grimes */ 12449b971133SKirk McKusick if (waitfor == MNT_WAIT) { 1245b40ce416SJulian Elischer if ((error = softdep_flushworklist(ump->um_mountp, &count, td))) 12469b971133SKirk McKusick allerror = error; 12479b971133SKirk McKusick /* Flushed work items may create new vnodes to clean */ 12489ab73fd1SKirk McKusick if (allerror == 0 && count) { 1249ca430f2eSAlexander Kabaev MNT_ILOCK(mp); 12509b971133SKirk McKusick goto loop; 12519b971133SKirk McKusick } 12529b971133SKirk McKusick } 1253589c7af9SKirk McKusick #ifdef QUOTA 1254589c7af9SKirk McKusick qsync(mp); 1255589c7af9SKirk McKusick #endif 1256112f7372SKirk McKusick devvp = ump->um_devvp; 1257156cb265SPoul-Henning Kamp bo = &devvp->v_bufobj; 1258698b1a66SJeff Roberson BO_LOCK(bo); 1259112f7372SKirk McKusick if (waitfor != MNT_LAZY && 1260156cb265SPoul-Henning Kamp (bo->bo_numoutput > 0 || bo->bo_dirty.bv_cnt > 0)) { 1261698b1a66SJeff Roberson BO_UNLOCK(bo); 1262698b1a66SJeff Roberson vn_lock(devvp, LK_EXCLUSIVE | LK_RETRY); 12638df6bac4SPoul-Henning Kamp if ((error = VOP_FSYNC(devvp, waitfor, td)) != 0) 1264df8bae1dSRodney W. Grimes allerror = error; 126522db15c0SAttilio Rao VOP_UNLOCK(devvp, 0); 12669ab73fd1SKirk McKusick if (allerror == 0 && waitfor == MNT_WAIT) { 1267ca430f2eSAlexander Kabaev MNT_ILOCK(mp); 1268112f7372SKirk McKusick goto loop; 1269b1897c19SJulian Elischer } 1270791dd2faSTor Egge } else if (suspend != 0) { 1271791dd2faSTor Egge if (softdep_check_suspend(mp, 1272791dd2faSTor Egge devvp, 1273791dd2faSTor Egge softdep_deps, 1274791dd2faSTor Egge softdep_accdeps, 1275791dd2faSTor Egge secondary_writes, 1276791dd2faSTor Egge secondary_accwrites) != 0) 1277791dd2faSTor Egge goto loop; /* More work needed */ 1278791dd2faSTor Egge mtx_assert(MNT_MTX(mp), MA_OWNED); 1279ca2fa807STor Egge mp->mnt_kern_flag |= MNTK_SUSPEND2 | MNTK_SUSPENDED; 1280791dd2faSTor Egge MNT_IUNLOCK(mp); 1281791dd2faSTor Egge suspended = 1; 1282112f7372SKirk McKusick } else 1283698b1a66SJeff Roberson BO_UNLOCK(bo); 1284996c772fSJohn Dyson /* 1285996c772fSJohn Dyson * Write back modified superblock. 1286996c772fSJohn Dyson */ 1287791dd2faSTor Egge if (fs->fs_fmod != 0 && 1288791dd2faSTor Egge (error = ffs_sbupdate(ump, waitfor, suspended)) != 0) 1289996c772fSJohn Dyson allerror = error; 1290df8bae1dSRodney W. Grimes return (allerror); 1291df8bae1dSRodney W. Grimes } 1292df8bae1dSRodney W. Grimes 1293df8bae1dSRodney W. Grimes int 1294a0595d02SKirk McKusick ffs_vget(mp, ino, flags, vpp) 1295df8bae1dSRodney W. Grimes struct mount *mp; 1296df8bae1dSRodney W. Grimes ino_t ino; 1297a0595d02SKirk McKusick int flags; 1298df8bae1dSRodney W. Grimes struct vnode **vpp; 1299df8bae1dSRodney W. Grimes { 13007b7ed832SKonstantin Belousov return (ffs_vgetf(mp, ino, flags, vpp, 0)); 13017b7ed832SKonstantin Belousov } 13027b7ed832SKonstantin Belousov 13037b7ed832SKonstantin Belousov int 13047b7ed832SKonstantin Belousov ffs_vgetf(mp, ino, flags, vpp, ffs_flags) 13057b7ed832SKonstantin Belousov struct mount *mp; 13067b7ed832SKonstantin Belousov ino_t ino; 13077b7ed832SKonstantin Belousov int flags; 13087b7ed832SKonstantin Belousov struct vnode **vpp; 13097b7ed832SKonstantin Belousov int ffs_flags; 13107b7ed832SKonstantin Belousov { 1311996c772fSJohn Dyson struct fs *fs; 1312996c772fSJohn Dyson struct inode *ip; 1313df8bae1dSRodney W. Grimes struct ufsmount *ump; 1314df8bae1dSRodney W. Grimes struct buf *bp; 1315df8bae1dSRodney W. Grimes struct vnode *vp; 131689c9c53dSPoul-Henning Kamp struct cdev *dev; 1317f576a00dSSemen Ustimenko int error; 1318df8bae1dSRodney W. Grimes 131951f5ce0cSPoul-Henning Kamp error = vfs_hash_get(mp, ino, flags, curthread, vpp, NULL, NULL); 1320e82ef95cSPoul-Henning Kamp if (error || *vpp != NULL) 132114bc0685SPoul-Henning Kamp return (error); 1322f576a00dSSemen Ustimenko 1323f576a00dSSemen Ustimenko /* 1324d6919865SJeff Roberson * We must promote to an exclusive lock for vnode creation. This 1325d6919865SJeff Roberson * can happen if lookup is passed LOCKSHARED. 1326d6919865SJeff Roberson */ 1327d6919865SJeff Roberson if ((flags & LK_TYPE_MASK) == LK_SHARED) { 1328d6919865SJeff Roberson flags &= ~LK_TYPE_MASK; 1329d6919865SJeff Roberson flags |= LK_EXCLUSIVE; 1330d6919865SJeff Roberson } 1331d6919865SJeff Roberson 1332d6919865SJeff Roberson /* 133313866b3fSSemen Ustimenko * We do not lock vnode creation as it is believed to be too 1334f576a00dSSemen Ustimenko * expensive for such rare case as simultaneous creation of vnode 1335f576a00dSSemen Ustimenko * for same ino by different processes. We just allow them to race 1336f576a00dSSemen Ustimenko * and check later to decide who wins. Let the race begin! 1337f576a00dSSemen Ustimenko */ 133814bc0685SPoul-Henning Kamp 133914bc0685SPoul-Henning Kamp ump = VFSTOUFS(mp); 134014bc0685SPoul-Henning Kamp dev = ump->um_dev; 134114bc0685SPoul-Henning Kamp fs = ump->um_fs; 1342df8bae1dSRodney W. Grimes 13432094ddb6SDavid Greenman /* 13442f9bae59SDavid Greenman * If this MALLOC() is performed after the getnewvnode() 13452f9bae59SDavid Greenman * it might block, leaving a vnode with a NULL v_data to be 13462f9bae59SDavid Greenman * found by ffs_sync() if a sync happens to fire right then, 13472f9bae59SDavid Greenman * which will cause a panic because ffs_sync() blindly 13482f9bae59SDavid Greenman * dereferences vp->v_data (as well it should). 13492f9bae59SDavid Greenman */ 135014bc0685SPoul-Henning Kamp ip = uma_zalloc(uma_inode, M_WAITOK | M_ZERO); 13512f9bae59SDavid Greenman 1352df8bae1dSRodney W. Grimes /* Allocate a new vnode/inode. */ 135302f2c6a9SPoul-Henning Kamp if (fs->fs_magic == FS_UFS1_MAGIC) 135402f2c6a9SPoul-Henning Kamp error = getnewvnode("ufs", mp, &ffs_vnodeops1, &vp); 135502f2c6a9SPoul-Henning Kamp else 135602f2c6a9SPoul-Henning Kamp error = getnewvnode("ufs", mp, &ffs_vnodeops2, &vp); 1357c9671602SPoul-Henning Kamp if (error) { 1358df8bae1dSRodney W. Grimes *vpp = NULL; 1359aa4d7a8aSPoul-Henning Kamp uma_zfree(uma_inode, ip); 1360df8bae1dSRodney W. Grimes return (error); 1361df8bae1dSRodney W. Grimes } 136267e87166SBoris Popov /* 1363aa7ba427SJeff Roberson * FFS supports recursive and shared locking. 136467e87166SBoris Popov */ 1365628f51d2SAttilio Rao VN_LOCK_AREC(vp); 1366628f51d2SAttilio Rao VN_LOCK_ASHARE(vp); 1367df8bae1dSRodney W. Grimes vp->v_data = ip; 13685d9d81e7SPoul-Henning Kamp vp->v_bufobj.bo_bsize = fs->fs_bsize; 1369df8bae1dSRodney W. Grimes ip->i_vnode = vp; 13701c85e6a3SKirk McKusick ip->i_ump = ump; 1371c94cd5fcSPoul-Henning Kamp ip->i_fs = fs; 1372df8bae1dSRodney W. Grimes ip->i_dev = dev; 1373df8bae1dSRodney W. Grimes ip->i_number = ino; 1374df8bae1dSRodney W. Grimes #ifdef QUOTA 1375c1d9efcbSPoul-Henning Kamp { 1376c1d9efcbSPoul-Henning Kamp int i; 1377df8bae1dSRodney W. Grimes for (i = 0; i < MAXQUOTAS; i++) 1378df8bae1dSRodney W. Grimes ip->i_dquot[i] = NODQUOT; 1379c1d9efcbSPoul-Henning Kamp } 1380df8bae1dSRodney W. Grimes #endif 1381df8bae1dSRodney W. Grimes 13820e9eb108SAttilio Rao lockmgr(vp->v_vnlock, LK_EXCLUSIVE, NULL); 13837b7ed832SKonstantin Belousov if (ffs_flags & FFSV_FORCEINSMQ) 13847b7ed832SKonstantin Belousov vp->v_vflag |= VV_FORCEINSMQ; 138561b9d89fSTor Egge error = insmntque(vp, mp); 138661b9d89fSTor Egge if (error != 0) { 138761b9d89fSTor Egge uma_zfree(uma_inode, ip); 138861b9d89fSTor Egge *vpp = NULL; 138961b9d89fSTor Egge return (error); 139061b9d89fSTor Egge } 13917b7ed832SKonstantin Belousov vp->v_vflag &= ~VV_FORCEINSMQ; 1392a80d8caaSPawel Jakub Dawidek error = vfs_hash_insert(vp, ino, flags, curthread, vpp, NULL, NULL); 139345c26fa2SPoul-Henning Kamp if (error || *vpp != NULL) 1394f576a00dSSemen Ustimenko return (error); 1395f576a00dSSemen Ustimenko 1396df8bae1dSRodney W. Grimes /* Read in the disk contents for the inode, copy into the inode. */ 1397c9671602SPoul-Henning Kamp error = bread(ump->um_devvp, fsbtodb(fs, ino_to_fsba(fs, ino)), 1398c9671602SPoul-Henning Kamp (int)fs->fs_bsize, NOCRED, &bp); 1399c9671602SPoul-Henning Kamp if (error) { 1400df8bae1dSRodney W. Grimes /* 1401df8bae1dSRodney W. Grimes * The inode does not contain anything useful, so it would 1402df8bae1dSRodney W. Grimes * be misleading to leave it on its hash chain. With mode 1403df8bae1dSRodney W. Grimes * still zero, it will be unlinked and returned to the free 1404df8bae1dSRodney W. Grimes * list by vput(). 1405df8bae1dSRodney W. Grimes */ 1406df8bae1dSRodney W. Grimes brelse(bp); 1407bd7e5f99SJohn Dyson vput(vp); 1408df8bae1dSRodney W. Grimes *vpp = NULL; 1409df8bae1dSRodney W. Grimes return (error); 1410df8bae1dSRodney W. Grimes } 1411de6ba7c0SPoul-Henning Kamp if (ip->i_ump->um_fstype == UFS1) 1412a163d034SWarner Losh ip->i_din1 = uma_zalloc(uma_ufs1, M_WAITOK); 1413de6ba7c0SPoul-Henning Kamp else 1414a163d034SWarner Losh ip->i_din2 = uma_zalloc(uma_ufs2, M_WAITOK); 1415de6ba7c0SPoul-Henning Kamp ffs_load_inode(bp, ip, fs, ino); 1416b1897c19SJulian Elischer if (DOINGSOFTDEP(vp)) 1417b1897c19SJulian Elischer softdep_load_inodeblock(ip); 1418b1897c19SJulian Elischer else 1419b1897c19SJulian Elischer ip->i_effnlink = ip->i_nlink; 1420bd7e5f99SJohn Dyson bqrelse(bp); 1421df8bae1dSRodney W. Grimes 1422df8bae1dSRodney W. Grimes /* 1423df8bae1dSRodney W. Grimes * Initialize the vnode from the inode, check for aliases. 1424df8bae1dSRodney W. Grimes * Note that the underlying vnode may have changed. 1425df8bae1dSRodney W. Grimes */ 142602f2c6a9SPoul-Henning Kamp if (ip->i_ump->um_fstype == UFS1) 142702f2c6a9SPoul-Henning Kamp error = ufs_vinit(mp, &ffs_fifoops1, &vp); 142802f2c6a9SPoul-Henning Kamp else 142902f2c6a9SPoul-Henning Kamp error = ufs_vinit(mp, &ffs_fifoops2, &vp); 1430c9671602SPoul-Henning Kamp if (error) { 1431df8bae1dSRodney W. Grimes vput(vp); 1432df8bae1dSRodney W. Grimes *vpp = NULL; 1433df8bae1dSRodney W. Grimes return (error); 1434df8bae1dSRodney W. Grimes } 1435de68347bSPoul-Henning Kamp 1436df8bae1dSRodney W. Grimes /* 14375c24d6eeSPoul-Henning Kamp * Finish inode initialization. 1438df8bae1dSRodney W. Grimes */ 1439de68347bSPoul-Henning Kamp 1440df8bae1dSRodney W. Grimes /* 1441df8bae1dSRodney W. Grimes * Set up a generation number for this inode if it does not 1442df8bae1dSRodney W. Grimes * already have one. This should only happen on old filesystems. 1443df8bae1dSRodney W. Grimes */ 1444df8bae1dSRodney W. Grimes if (ip->i_gen == 0) { 1445aca3e497SKirk McKusick ip->i_gen = arc4random() / 2 + 1; 14461c85e6a3SKirk McKusick if ((vp->v_mount->mnt_flag & MNT_RDONLY) == 0) { 1447df8bae1dSRodney W. Grimes ip->i_flag |= IN_MODIFIED; 1448b403319bSAlexander Kabaev DIP_SET(ip, i_gen, ip->i_gen); 14491c85e6a3SKirk McKusick } 1450df8bae1dSRodney W. Grimes } 1451df8bae1dSRodney W. Grimes /* 1452df8bae1dSRodney W. Grimes * Ensure that uid and gid are correct. This is a temporary 1453df8bae1dSRodney W. Grimes * fix until fsck has been changed to do the update. 1454df8bae1dSRodney W. Grimes */ 14551c85e6a3SKirk McKusick if (fs->fs_magic == FS_UFS1_MAGIC && /* XXX */ 14561c85e6a3SKirk McKusick fs->fs_old_inodefmt < FS_44INODEFMT) { /* XXX */ 14571c85e6a3SKirk McKusick ip->i_uid = ip->i_din1->di_ouid; /* XXX */ 14581c85e6a3SKirk McKusick ip->i_gid = ip->i_din1->di_ogid; /* XXX */ 1459df8bae1dSRodney W. Grimes } /* XXX */ 1460df8bae1dSRodney W. Grimes 1461763bbd2fSRobert Watson #ifdef MAC 1462763bbd2fSRobert Watson if ((mp->mnt_flag & MNT_MULTILABEL) && ip->i_mode) { 1463763bbd2fSRobert Watson /* 1464763bbd2fSRobert Watson * If this vnode is already allocated, and we're running 1465763bbd2fSRobert Watson * multi-label, attempt to perform a label association 1466763bbd2fSRobert Watson * from the extended attributes on the inode. 1467763bbd2fSRobert Watson */ 146830d239bcSRobert Watson error = mac_vnode_associate_extattr(mp, vp); 1469763bbd2fSRobert Watson if (error) { 1470763bbd2fSRobert Watson /* ufs_inactive will release ip->i_devvp ref. */ 1471763bbd2fSRobert Watson vput(vp); 1472763bbd2fSRobert Watson *vpp = NULL; 1473763bbd2fSRobert Watson return (error); 1474763bbd2fSRobert Watson } 1475763bbd2fSRobert Watson } 1476763bbd2fSRobert Watson #endif 1477763bbd2fSRobert Watson 1478df8bae1dSRodney W. Grimes *vpp = vp; 1479df8bae1dSRodney W. Grimes return (0); 1480df8bae1dSRodney W. Grimes } 1481df8bae1dSRodney W. Grimes 1482df8bae1dSRodney W. Grimes /* 1483df8bae1dSRodney W. Grimes * File handle to vnode 1484df8bae1dSRodney W. Grimes * 1485df8bae1dSRodney W. Grimes * Have to be really careful about stale file handles: 1486df8bae1dSRodney W. Grimes * - check that the inode number is valid 1487df8bae1dSRodney W. Grimes * - call ffs_vget() to get the locked inode 1488df8bae1dSRodney W. Grimes * - check for an unallocated inode (i_mode == 0) 1489df8bae1dSRodney W. Grimes * - check that the given client host has export rights and return 1490df8bae1dSRodney W. Grimes * those rights via. exflagsp and credanonp 1491df8bae1dSRodney W. Grimes */ 1492adf41577SPoul-Henning Kamp static int 1493c24fda81SAlfred Perlstein ffs_fhtovp(mp, fhp, vpp) 149405f4ff5dSPoul-Henning Kamp struct mount *mp; 1495df8bae1dSRodney W. Grimes struct fid *fhp; 1496df8bae1dSRodney W. Grimes struct vnode **vpp; 1497df8bae1dSRodney W. Grimes { 149805f4ff5dSPoul-Henning Kamp struct ufid *ufhp; 1499df8bae1dSRodney W. Grimes struct fs *fs; 1500df8bae1dSRodney W. Grimes 1501df8bae1dSRodney W. Grimes ufhp = (struct ufid *)fhp; 1502df8bae1dSRodney W. Grimes fs = VFSTOUFS(mp)->um_fs; 1503df8bae1dSRodney W. Grimes if (ufhp->ufid_ino < ROOTINO || 1504df8bae1dSRodney W. Grimes ufhp->ufid_ino >= fs->fs_ncg * fs->fs_ipg) 1505df8bae1dSRodney W. Grimes return (ESTALE); 1506c24fda81SAlfred Perlstein return (ufs_fhtovp(mp, ufhp, vpp)); 1507df8bae1dSRodney W. Grimes } 1508df8bae1dSRodney W. Grimes 1509df8bae1dSRodney W. Grimes /* 15105346934fSIan Dowse * Initialize the filesystem. 1511996c772fSJohn Dyson */ 1512996c772fSJohn Dyson static int 1513996c772fSJohn Dyson ffs_init(vfsp) 1514996c772fSJohn Dyson struct vfsconf *vfsp; 1515996c772fSJohn Dyson { 1516996c772fSJohn Dyson 1517b1897c19SJulian Elischer softdep_initialize(); 1518996c772fSJohn Dyson return (ufs_init(vfsp)); 1519996c772fSJohn Dyson } 1520996c772fSJohn Dyson 1521996c772fSJohn Dyson /* 15225346934fSIan Dowse * Undo the work of ffs_init(). 15235346934fSIan Dowse */ 15245346934fSIan Dowse static int 15255346934fSIan Dowse ffs_uninit(vfsp) 15265346934fSIan Dowse struct vfsconf *vfsp; 15275346934fSIan Dowse { 15285346934fSIan Dowse int ret; 15295346934fSIan Dowse 15305346934fSIan Dowse ret = ufs_uninit(vfsp); 15315346934fSIan Dowse softdep_uninitialize(); 15325346934fSIan Dowse return (ret); 15335346934fSIan Dowse } 15345346934fSIan Dowse 15355346934fSIan Dowse /* 1536df8bae1dSRodney W. Grimes * Write a superblock and associated information back to disk. 1537df8bae1dSRodney W. Grimes */ 15381a60c7fcSPawel Jakub Dawidek int 1539791dd2faSTor Egge ffs_sbupdate(mp, waitfor, suspended) 1540df8bae1dSRodney W. Grimes struct ufsmount *mp; 1541df8bae1dSRodney W. Grimes int waitfor; 1542791dd2faSTor Egge int suspended; 1543df8bae1dSRodney W. Grimes { 15441c85e6a3SKirk McKusick struct fs *fs = mp->um_fs; 15453ba649d7SJeff Roberson struct buf *sbbp; 154605f4ff5dSPoul-Henning Kamp struct buf *bp; 1547df8bae1dSRodney W. Grimes int blks; 1548f55ff3f3SIan Dowse void *space; 1549996c772fSJohn Dyson int i, size, error, allerror = 0; 1550df8bae1dSRodney W. Grimes 155174f3809aSKirk McKusick if (fs->fs_ronly == 1 && 155274f3809aSKirk McKusick (mp->um_mountp->mnt_flag & (MNT_RDONLY | MNT_UPDATE)) != 155374f3809aSKirk McKusick (MNT_RDONLY | MNT_UPDATE)) 155474f3809aSKirk McKusick panic("ffs_sbupdate: write read-only filesystem"); 1555996c772fSJohn Dyson /* 15563ba649d7SJeff Roberson * We use the superblock's buf to serialize calls to ffs_sbupdate(). 15573ba649d7SJeff Roberson */ 15583ba649d7SJeff Roberson sbbp = getblk(mp->um_devvp, btodb(fs->fs_sblockloc), (int)fs->fs_sbsize, 15593ba649d7SJeff Roberson 0, 0, 0); 15603ba649d7SJeff Roberson /* 1561996c772fSJohn Dyson * First write back the summary information. 1562996c772fSJohn Dyson */ 1563df8bae1dSRodney W. Grimes blks = howmany(fs->fs_cssize, fs->fs_fsize); 1564f55ff3f3SIan Dowse space = fs->fs_csp; 1565df8bae1dSRodney W. Grimes for (i = 0; i < blks; i += fs->fs_frag) { 1566df8bae1dSRodney W. Grimes size = fs->fs_bsize; 1567df8bae1dSRodney W. Grimes if (i + fs->fs_frag > blks) 1568df8bae1dSRodney W. Grimes size = (blks - i) * fs->fs_fsize; 1569df8bae1dSRodney W. Grimes bp = getblk(mp->um_devvp, fsbtodb(fs, fs->fs_csaddr + i), 15707261f5f6SJeff Roberson size, 0, 0, 0); 1571df8bae1dSRodney W. Grimes bcopy(space, bp->b_data, (u_int)size); 1572f55ff3f3SIan Dowse space = (char *)space + size; 1573791dd2faSTor Egge if (suspended) 1574791dd2faSTor Egge bp->b_flags |= B_VALIDSUSPWRT; 1575996c772fSJohn Dyson if (waitfor != MNT_WAIT) 1576df8bae1dSRodney W. Grimes bawrite(bp); 15778aef1712SMatthew Dillon else if ((error = bwrite(bp)) != 0) 1578996c772fSJohn Dyson allerror = error; 1579df8bae1dSRodney W. Grimes } 1580996c772fSJohn Dyson /* 1581996c772fSJohn Dyson * Now write back the superblock itself. If any errors occurred 1582996c772fSJohn Dyson * up to this point, then fail so that the superblock avoids 1583996c772fSJohn Dyson * being written out as clean. 1584996c772fSJohn Dyson */ 15853ba649d7SJeff Roberson if (allerror) { 15863ba649d7SJeff Roberson brelse(sbbp); 1587996c772fSJohn Dyson return (allerror); 15883ba649d7SJeff Roberson } 15893ba649d7SJeff Roberson bp = sbbp; 159031574422SKirk McKusick if (fs->fs_magic == FS_UFS1_MAGIC && fs->fs_sblockloc != SBLOCK_UFS1 && 159131574422SKirk McKusick (fs->fs_flags & FS_FLAGS_UPDATED) == 0) { 1592fa5d33e2SKirk McKusick printf("%s: correcting fs_sblockloc from %jd to %d\n", 1593fa5d33e2SKirk McKusick fs->fs_fsmnt, fs->fs_sblockloc, SBLOCK_UFS1); 1594fa5d33e2SKirk McKusick fs->fs_sblockloc = SBLOCK_UFS1; 1595fa5d33e2SKirk McKusick } 159631574422SKirk McKusick if (fs->fs_magic == FS_UFS2_MAGIC && fs->fs_sblockloc != SBLOCK_UFS2 && 159731574422SKirk McKusick (fs->fs_flags & FS_FLAGS_UPDATED) == 0) { 1598fa5d33e2SKirk McKusick printf("%s: correcting fs_sblockloc from %jd to %d\n", 1599fa5d33e2SKirk McKusick fs->fs_fsmnt, fs->fs_sblockloc, SBLOCK_UFS2); 1600fa5d33e2SKirk McKusick fs->fs_sblockloc = SBLOCK_UFS2; 1601fa5d33e2SKirk McKusick } 1602b1897c19SJulian Elischer fs->fs_fmod = 0; 1603227ee8a1SPoul-Henning Kamp fs->fs_time = time_second; 1604996c772fSJohn Dyson bcopy((caddr_t)fs, bp->b_data, (u_int)fs->fs_sbsize); 16051c85e6a3SKirk McKusick ffs_oldfscompat_write((struct fs *)bp->b_data, mp); 1606791dd2faSTor Egge if (suspended) 1607791dd2faSTor Egge bp->b_flags |= B_VALIDSUSPWRT; 1608996c772fSJohn Dyson if (waitfor != MNT_WAIT) 1609996c772fSJohn Dyson bawrite(bp); 16108aef1712SMatthew Dillon else if ((error = bwrite(bp)) != 0) 1611996c772fSJohn Dyson allerror = error; 1612996c772fSJohn Dyson return (allerror); 1613df8bae1dSRodney W. Grimes } 1614d6fe88e4SPoul-Henning Kamp 1615d6fe88e4SPoul-Henning Kamp static int 1616d6fe88e4SPoul-Henning Kamp ffs_extattrctl(struct mount *mp, int cmd, struct vnode *filename_vp, 1617d6fe88e4SPoul-Henning Kamp int attrnamespace, const char *attrname, struct thread *td) 1618d6fe88e4SPoul-Henning Kamp { 1619d6fe88e4SPoul-Henning Kamp 1620d6fe88e4SPoul-Henning Kamp #ifdef UFS_EXTATTR 1621d6fe88e4SPoul-Henning Kamp return (ufs_extattrctl(mp, cmd, filename_vp, attrnamespace, 1622d6fe88e4SPoul-Henning Kamp attrname, td)); 1623d6fe88e4SPoul-Henning Kamp #else 1624d6fe88e4SPoul-Henning Kamp return (vfs_stdextattrctl(mp, cmd, filename_vp, attrnamespace, 1625d6fe88e4SPoul-Henning Kamp attrname, td)); 1626d6fe88e4SPoul-Henning Kamp #endif 1627d6fe88e4SPoul-Henning Kamp } 1628975512a9SPoul-Henning Kamp 1629975512a9SPoul-Henning Kamp static void 1630975512a9SPoul-Henning Kamp ffs_ifree(struct ufsmount *ump, struct inode *ip) 1631975512a9SPoul-Henning Kamp { 1632975512a9SPoul-Henning Kamp 163336329289STim J. Robbins if (ump->um_fstype == UFS1 && ip->i_din1 != NULL) 1634aa4d7a8aSPoul-Henning Kamp uma_zfree(uma_ufs1, ip->i_din1); 163536329289STim J. Robbins else if (ip->i_din2 != NULL) 16368d721e87STim J. Robbins uma_zfree(uma_ufs2, ip->i_din2); 1637aa4d7a8aSPoul-Henning Kamp uma_zfree(uma_inode, ip); 1638975512a9SPoul-Henning Kamp } 16396e77a041SPoul-Henning Kamp 1640dd19a799SPoul-Henning Kamp static int dobkgrdwrite = 1; 1641dd19a799SPoul-Henning Kamp SYSCTL_INT(_debug, OID_AUTO, dobkgrdwrite, CTLFLAG_RW, &dobkgrdwrite, 0, 1642dd19a799SPoul-Henning Kamp "Do background writes (honoring the BV_BKGRDWRITE flag)?"); 1643dd19a799SPoul-Henning Kamp 1644dd19a799SPoul-Henning Kamp /* 1645dd19a799SPoul-Henning Kamp * Complete a background write started from bwrite. 1646dd19a799SPoul-Henning Kamp */ 1647dd19a799SPoul-Henning Kamp static void 1648dd19a799SPoul-Henning Kamp ffs_backgroundwritedone(struct buf *bp) 1649dd19a799SPoul-Henning Kamp { 1650204ec66dSJeff Roberson struct bufobj *bufobj; 1651dd19a799SPoul-Henning Kamp struct buf *origbp; 1652dd19a799SPoul-Henning Kamp 1653dd19a799SPoul-Henning Kamp /* 1654dd19a799SPoul-Henning Kamp * Find the original buffer that we are writing. 1655dd19a799SPoul-Henning Kamp */ 1656204ec66dSJeff Roberson bufobj = bp->b_bufobj; 1657204ec66dSJeff Roberson BO_LOCK(bufobj); 1658dd19a799SPoul-Henning Kamp if ((origbp = gbincore(bp->b_bufobj, bp->b_lblkno)) == NULL) 1659dd19a799SPoul-Henning Kamp panic("backgroundwritedone: lost buffer"); 1660204ec66dSJeff Roberson /* Grab an extra reference to be dropped by the bufdone() below. */ 1661204ec66dSJeff Roberson bufobj_wrefl(bufobj); 1662204ec66dSJeff Roberson BO_UNLOCK(bufobj); 1663dd19a799SPoul-Henning Kamp /* 1664dd19a799SPoul-Henning Kamp * Process dependencies then return any unfinished ones. 1665dd19a799SPoul-Henning Kamp */ 166604533fc6SXin LI if (!LIST_EMPTY(&bp->b_dep)) 1667dd19a799SPoul-Henning Kamp buf_complete(bp); 1668dd19a799SPoul-Henning Kamp #ifdef SOFTUPDATES 166904533fc6SXin LI if (!LIST_EMPTY(&bp->b_dep)) 1670dd19a799SPoul-Henning Kamp softdep_move_dependencies(bp, origbp); 1671dd19a799SPoul-Henning Kamp #endif 1672dd19a799SPoul-Henning Kamp /* 1673204ec66dSJeff Roberson * This buffer is marked B_NOCACHE so when it is released 1674204ec66dSJeff Roberson * by biodone it will be tossed. 1675dd19a799SPoul-Henning Kamp */ 1676dd19a799SPoul-Henning Kamp bp->b_flags |= B_NOCACHE; 1677ec9c9e73SAlan Cox bp->b_flags &= ~B_CACHE; 1678dd19a799SPoul-Henning Kamp bufdone(bp); 1679204ec66dSJeff Roberson BO_LOCK(bufobj); 1680dd19a799SPoul-Henning Kamp /* 1681dd19a799SPoul-Henning Kamp * Clear the BV_BKGRDINPROG flag in the original buffer 1682dd19a799SPoul-Henning Kamp * and awaken it if it is waiting for the write to complete. 1683dd19a799SPoul-Henning Kamp * If BV_BKGRDINPROG is not set in the original buffer it must 1684dd19a799SPoul-Henning Kamp * have been released and re-instantiated - which is not legal. 1685dd19a799SPoul-Henning Kamp */ 1686dd19a799SPoul-Henning Kamp KASSERT((origbp->b_vflags & BV_BKGRDINPROG), 1687dd19a799SPoul-Henning Kamp ("backgroundwritedone: lost buffer2")); 1688dd19a799SPoul-Henning Kamp origbp->b_vflags &= ~BV_BKGRDINPROG; 1689dd19a799SPoul-Henning Kamp if (origbp->b_vflags & BV_BKGRDWAIT) { 1690dd19a799SPoul-Henning Kamp origbp->b_vflags &= ~BV_BKGRDWAIT; 1691dd19a799SPoul-Henning Kamp wakeup(&origbp->b_xflags); 1692dd19a799SPoul-Henning Kamp } 1693204ec66dSJeff Roberson BO_UNLOCK(bufobj); 1694dd19a799SPoul-Henning Kamp } 1695dd19a799SPoul-Henning Kamp 1696dd19a799SPoul-Henning Kamp 1697dd19a799SPoul-Henning Kamp /* 1698dd19a799SPoul-Henning Kamp * Write, release buffer on completion. (Done by iodone 1699dd19a799SPoul-Henning Kamp * if async). Do not bother writing anything if the buffer 1700dd19a799SPoul-Henning Kamp * is invalid. 1701dd19a799SPoul-Henning Kamp * 1702dd19a799SPoul-Henning Kamp * Note that we set B_CACHE here, indicating that buffer is 1703dd19a799SPoul-Henning Kamp * fully valid and thus cacheable. This is true even of NFS 1704dd19a799SPoul-Henning Kamp * now so we set it generally. This could be set either here 1705dd19a799SPoul-Henning Kamp * or in biodone() since the I/O is synchronous. We put it 1706dd19a799SPoul-Henning Kamp * here. 1707dd19a799SPoul-Henning Kamp */ 1708dd19a799SPoul-Henning Kamp static int 1709dd19a799SPoul-Henning Kamp ffs_bufwrite(struct buf *bp) 1710dd19a799SPoul-Henning Kamp { 1711dd19a799SPoul-Henning Kamp int oldflags, s; 1712dd19a799SPoul-Henning Kamp struct buf *newbp; 1713dd19a799SPoul-Henning Kamp 1714dd19a799SPoul-Henning Kamp CTR3(KTR_BUF, "bufwrite(%p) vp %p flags %X", bp, bp->b_vp, bp->b_flags); 1715dd19a799SPoul-Henning Kamp if (bp->b_flags & B_INVAL) { 1716dd19a799SPoul-Henning Kamp brelse(bp); 1717dd19a799SPoul-Henning Kamp return (0); 1718dd19a799SPoul-Henning Kamp } 1719dd19a799SPoul-Henning Kamp 1720dd19a799SPoul-Henning Kamp oldflags = bp->b_flags; 1721dd19a799SPoul-Henning Kamp 1722d638e093SAttilio Rao if (!BUF_ISLOCKED(bp)) 1723dd19a799SPoul-Henning Kamp panic("bufwrite: buffer is not busy???"); 1724dd19a799SPoul-Henning Kamp s = splbio(); 1725dd19a799SPoul-Henning Kamp /* 1726dd19a799SPoul-Henning Kamp * If a background write is already in progress, delay 1727dd19a799SPoul-Henning Kamp * writing this block if it is asynchronous. Otherwise 1728dd19a799SPoul-Henning Kamp * wait for the background write to complete. 1729dd19a799SPoul-Henning Kamp */ 1730dd19a799SPoul-Henning Kamp BO_LOCK(bp->b_bufobj); 1731dd19a799SPoul-Henning Kamp if (bp->b_vflags & BV_BKGRDINPROG) { 1732dd19a799SPoul-Henning Kamp if (bp->b_flags & B_ASYNC) { 1733dd19a799SPoul-Henning Kamp BO_UNLOCK(bp->b_bufobj); 1734dd19a799SPoul-Henning Kamp splx(s); 1735dd19a799SPoul-Henning Kamp bdwrite(bp); 1736dd19a799SPoul-Henning Kamp return (0); 1737dd19a799SPoul-Henning Kamp } 1738dd19a799SPoul-Henning Kamp bp->b_vflags |= BV_BKGRDWAIT; 1739dd19a799SPoul-Henning Kamp msleep(&bp->b_xflags, BO_MTX(bp->b_bufobj), PRIBIO, "bwrbg", 0); 1740dd19a799SPoul-Henning Kamp if (bp->b_vflags & BV_BKGRDINPROG) 1741dd19a799SPoul-Henning Kamp panic("bufwrite: still writing"); 1742dd19a799SPoul-Henning Kamp } 1743dd19a799SPoul-Henning Kamp BO_UNLOCK(bp->b_bufobj); 1744dd19a799SPoul-Henning Kamp 1745dd19a799SPoul-Henning Kamp /* Mark the buffer clean */ 1746dd19a799SPoul-Henning Kamp bundirty(bp); 1747dd19a799SPoul-Henning Kamp 1748dd19a799SPoul-Henning Kamp /* 1749dd19a799SPoul-Henning Kamp * If this buffer is marked for background writing and we 1750dd19a799SPoul-Henning Kamp * do not have to wait for it, make a copy and write the 1751dd19a799SPoul-Henning Kamp * copy so as to leave this buffer ready for further use. 1752dd19a799SPoul-Henning Kamp * 1753dd19a799SPoul-Henning Kamp * This optimization eats a lot of memory. If we have a page 1754dd19a799SPoul-Henning Kamp * or buffer shortfall we can't do it. 1755dd19a799SPoul-Henning Kamp */ 1756dd19a799SPoul-Henning Kamp if (dobkgrdwrite && (bp->b_xflags & BX_BKGRDWRITE) && 1757dd19a799SPoul-Henning Kamp (bp->b_flags & B_ASYNC) && 1758dd19a799SPoul-Henning Kamp !vm_page_count_severe() && 1759dd19a799SPoul-Henning Kamp !buf_dirty_count_severe()) { 1760dd19a799SPoul-Henning Kamp KASSERT(bp->b_iodone == NULL, 1761dd19a799SPoul-Henning Kamp ("bufwrite: needs chained iodone (%p)", bp->b_iodone)); 1762dd19a799SPoul-Henning Kamp 1763dd19a799SPoul-Henning Kamp /* get a new block */ 1764dd19a799SPoul-Henning Kamp newbp = geteblk(bp->b_bufsize); 1765dd19a799SPoul-Henning Kamp 1766dd19a799SPoul-Henning Kamp /* 1767dd19a799SPoul-Henning Kamp * set it to be identical to the old block. We have to 1768dd19a799SPoul-Henning Kamp * set b_lblkno and BKGRDMARKER before calling bgetvp() 1769dd19a799SPoul-Henning Kamp * to avoid confusing the splay tree and gbincore(). 1770dd19a799SPoul-Henning Kamp */ 1771dd19a799SPoul-Henning Kamp memcpy(newbp->b_data, bp->b_data, bp->b_bufsize); 1772dd19a799SPoul-Henning Kamp newbp->b_lblkno = bp->b_lblkno; 1773dd19a799SPoul-Henning Kamp newbp->b_xflags |= BX_BKGRDMARKER; 1774dd19a799SPoul-Henning Kamp BO_LOCK(bp->b_bufobj); 1775dd19a799SPoul-Henning Kamp bp->b_vflags |= BV_BKGRDINPROG; 1776dd19a799SPoul-Henning Kamp bgetvp(bp->b_vp, newbp); 1777dd19a799SPoul-Henning Kamp BO_UNLOCK(bp->b_bufobj); 1778dd19a799SPoul-Henning Kamp newbp->b_bufobj = &bp->b_vp->v_bufobj; 1779dd19a799SPoul-Henning Kamp newbp->b_blkno = bp->b_blkno; 1780dd19a799SPoul-Henning Kamp newbp->b_offset = bp->b_offset; 1781dd19a799SPoul-Henning Kamp newbp->b_iodone = ffs_backgroundwritedone; 1782dd19a799SPoul-Henning Kamp newbp->b_flags |= B_ASYNC; 1783dd19a799SPoul-Henning Kamp newbp->b_flags &= ~B_INVAL; 1784dd19a799SPoul-Henning Kamp 1785dd19a799SPoul-Henning Kamp #ifdef SOFTUPDATES 1786dd19a799SPoul-Henning Kamp /* move over the dependencies */ 178704533fc6SXin LI if (!LIST_EMPTY(&bp->b_dep)) 1788dd19a799SPoul-Henning Kamp softdep_move_dependencies(bp, newbp); 1789dd19a799SPoul-Henning Kamp #endif 1790dd19a799SPoul-Henning Kamp 1791dd19a799SPoul-Henning Kamp /* 1792dd19a799SPoul-Henning Kamp * Initiate write on the copy, release the original to 1793dd19a799SPoul-Henning Kamp * the B_LOCKED queue so that it cannot go away until 1794dd19a799SPoul-Henning Kamp * the background write completes. If not locked it could go 1795dd19a799SPoul-Henning Kamp * away and then be reconstituted while it was being written. 1796dd19a799SPoul-Henning Kamp * If the reconstituted buffer were written, we could end up 1797dd19a799SPoul-Henning Kamp * with two background copies being written at the same time. 1798dd19a799SPoul-Henning Kamp */ 1799dd19a799SPoul-Henning Kamp bqrelse(bp); 1800dd19a799SPoul-Henning Kamp bp = newbp; 1801dd19a799SPoul-Henning Kamp } 1802dd19a799SPoul-Henning Kamp 1803dd19a799SPoul-Henning Kamp /* Let the normal bufwrite do the rest for us */ 18049248a827STor Egge return (bufwrite(bp)); 1805dd19a799SPoul-Henning Kamp } 1806dd19a799SPoul-Henning Kamp 1807dd19a799SPoul-Henning Kamp 18088dd56505SPoul-Henning Kamp static void 18096e77a041SPoul-Henning Kamp ffs_geom_strategy(struct bufobj *bo, struct buf *bp) 18106e77a041SPoul-Henning Kamp { 1811153910e0SJeff Roberson struct vnode *vp; 1812153910e0SJeff Roberson int error; 18137de3839dSTor Egge struct buf *tbp; 18146e77a041SPoul-Henning Kamp 1815153910e0SJeff Roberson vp = bo->__bo_vnode; 1816153910e0SJeff Roberson if (bp->b_iocmd == BIO_WRITE) { 1817153910e0SJeff Roberson if ((bp->b_flags & B_VALIDSUSPWRT) == 0 && 1818153910e0SJeff Roberson bp->b_vp != NULL && bp->b_vp->v_mount != NULL && 1819153910e0SJeff Roberson (bp->b_vp->v_mount->mnt_kern_flag & MNTK_SUSPENDED) != 0) 1820153910e0SJeff Roberson panic("ffs_geom_strategy: bad I/O"); 1821153910e0SJeff Roberson bp->b_flags &= ~B_VALIDSUSPWRT; 1822153910e0SJeff Roberson if ((vp->v_vflag & VV_COPYONWRITE) && 18237de3839dSTor Egge vp->v_rdev->si_snapdata != NULL) { 18247de3839dSTor Egge if ((bp->b_flags & B_CLUSTER) != 0) { 1825868bb88fSTor Egge runningbufwakeup(bp); 18267de3839dSTor Egge TAILQ_FOREACH(tbp, &bp->b_cluster.cluster_head, 18277de3839dSTor Egge b_cluster.cluster_entry) { 18287de3839dSTor Egge error = ffs_copyonwrite(vp, tbp); 18297de3839dSTor Egge if (error != 0 && 1830153910e0SJeff Roberson error != EOPNOTSUPP) { 1831153910e0SJeff Roberson bp->b_error = error; 1832153910e0SJeff Roberson bp->b_ioflags |= BIO_ERROR; 1833153910e0SJeff Roberson bufdone(bp); 1834153910e0SJeff Roberson return; 1835153910e0SJeff Roberson } 1836153910e0SJeff Roberson } 1837868bb88fSTor Egge bp->b_runningbufspace = bp->b_bufsize; 1838868bb88fSTor Egge atomic_add_int(&runningbufspace, 1839868bb88fSTor Egge bp->b_runningbufspace); 18407de3839dSTor Egge } else { 18417de3839dSTor Egge error = ffs_copyonwrite(vp, bp); 18427de3839dSTor Egge if (error != 0 && error != EOPNOTSUPP) { 18437de3839dSTor Egge bp->b_error = error; 18447de3839dSTor Egge bp->b_ioflags |= BIO_ERROR; 18457de3839dSTor Egge bufdone(bp); 18467de3839dSTor Egge return; 18477de3839dSTor Egge } 18487de3839dSTor Egge } 18497de3839dSTor Egge } 18507de3839dSTor Egge #ifdef SOFTUPDATES 18517de3839dSTor Egge if ((bp->b_flags & B_CLUSTER) != 0) { 18527de3839dSTor Egge TAILQ_FOREACH(tbp, &bp->b_cluster.cluster_head, 18537de3839dSTor Egge b_cluster.cluster_entry) { 185404533fc6SXin LI if (!LIST_EMPTY(&tbp->b_dep)) 18557de3839dSTor Egge buf_start(tbp); 18567de3839dSTor Egge } 18577de3839dSTor Egge } else { 185804533fc6SXin LI if (!LIST_EMPTY(&bp->b_dep)) 18597de3839dSTor Egge buf_start(bp); 18607de3839dSTor Egge } 18617de3839dSTor Egge 18627de3839dSTor Egge #endif 18637de3839dSTor Egge } 186443920011SPoul-Henning Kamp g_vfs_strategy(bo, bp); 18656e77a041SPoul-Henning Kamp } 1866