xref: /freebsd/sys/ufs/ffs/ffs_vfsops.c (revision b60ee81e3d7c574bd464214c16e9cbf22be9937d)
160727d8bSWarner Losh /*-
2df8bae1dSRodney W. Grimes  * Copyright (c) 1989, 1991, 1993, 1994
3df8bae1dSRodney W. Grimes  *	The Regents of the University of California.  All rights reserved.
4df8bae1dSRodney W. Grimes  *
5df8bae1dSRodney W. Grimes  * Redistribution and use in source and binary forms, with or without
6df8bae1dSRodney W. Grimes  * modification, are permitted provided that the following conditions
7df8bae1dSRodney W. Grimes  * are met:
8df8bae1dSRodney W. Grimes  * 1. Redistributions of source code must retain the above copyright
9df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer.
10df8bae1dSRodney W. Grimes  * 2. Redistributions in binary form must reproduce the above copyright
11df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer in the
12df8bae1dSRodney W. Grimes  *    documentation and/or other materials provided with the distribution.
13df8bae1dSRodney W. Grimes  * 4. Neither the name of the University nor the names of its contributors
14df8bae1dSRodney W. Grimes  *    may be used to endorse or promote products derived from this software
15df8bae1dSRodney W. Grimes  *    without specific prior written permission.
16df8bae1dSRodney W. Grimes  *
17df8bae1dSRodney W. Grimes  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
18df8bae1dSRodney W. Grimes  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19df8bae1dSRodney W. Grimes  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20df8bae1dSRodney W. Grimes  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
21df8bae1dSRodney W. Grimes  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22df8bae1dSRodney W. Grimes  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23df8bae1dSRodney W. Grimes  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24df8bae1dSRodney W. Grimes  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25df8bae1dSRodney W. Grimes  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26df8bae1dSRodney W. Grimes  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
27df8bae1dSRodney W. Grimes  * SUCH DAMAGE.
28df8bae1dSRodney W. Grimes  *
29996c772fSJohn Dyson  *	@(#)ffs_vfsops.c	8.31 (Berkeley) 5/20/95
30df8bae1dSRodney W. Grimes  */
31df8bae1dSRodney W. Grimes 
32f4636c59SDavid E. O'Brien #include <sys/cdefs.h>
33f4636c59SDavid E. O'Brien __FBSDID("$FreeBSD$");
34f4636c59SDavid E. O'Brien 
3501733a9bSGarrett Wollman #include "opt_quota.h"
36516081f2SRobert Watson #include "opt_ufs.h"
376e77a041SPoul-Henning Kamp #include "opt_ffs.h"
3852dfc8d7SKonstantin Belousov #include "opt_ddb.h"
3901733a9bSGarrett Wollman 
40df8bae1dSRodney W. Grimes #include <sys/param.h>
41df8bae1dSRodney W. Grimes #include <sys/systm.h>
42df8bae1dSRodney W. Grimes #include <sys/namei.h>
43acd3428bSRobert Watson #include <sys/priv.h>
44df8bae1dSRodney W. Grimes #include <sys/proc.h>
45df8bae1dSRodney W. Grimes #include <sys/kernel.h>
46df8bae1dSRodney W. Grimes #include <sys/vnode.h>
47df8bae1dSRodney W. Grimes #include <sys/mount.h>
489626b608SPoul-Henning Kamp #include <sys/bio.h>
49df8bae1dSRodney W. Grimes #include <sys/buf.h>
5081bca6ddSKATO Takenori #include <sys/conf.h>
513ac4d1efSBruce Evans #include <sys/fcntl.h>
52df8bae1dSRodney W. Grimes #include <sys/malloc.h>
531b367556SJason Evans #include <sys/mutex.h>
54a18b1f1dSJason Evans 
55aed55708SRobert Watson #include <security/mac/mac_framework.h>
56aed55708SRobert Watson 
57a64ed089SRobert Watson #include <ufs/ufs/extattr.h>
581a60c7fcSPawel Jakub Dawidek #include <ufs/ufs/gjournal.h>
59df8bae1dSRodney W. Grimes #include <ufs/ufs/quota.h>
60df8bae1dSRodney W. Grimes #include <ufs/ufs/ufsmount.h>
61df8bae1dSRodney W. Grimes #include <ufs/ufs/inode.h>
62df8bae1dSRodney W. Grimes #include <ufs/ufs/ufs_extern.h>
63df8bae1dSRodney W. Grimes 
64df8bae1dSRodney W. Grimes #include <ufs/ffs/fs.h>
65df8bae1dSRodney W. Grimes #include <ufs/ffs/ffs_extern.h>
66df8bae1dSRodney W. Grimes 
67f6b04d2bSDavid Greenman #include <vm/vm.h>
68aa4d7a8aSPoul-Henning Kamp #include <vm/uma.h>
69f6b04d2bSDavid Greenman #include <vm/vm_page.h>
70f6b04d2bSDavid Greenman 
7143920011SPoul-Henning Kamp #include <geom/geom.h>
7243920011SPoul-Henning Kamp #include <geom/geom_vfs.h>
7343920011SPoul-Henning Kamp 
7452dfc8d7SKonstantin Belousov #include <ddb/ddb.h>
7552dfc8d7SKonstantin Belousov 
76adf41577SPoul-Henning Kamp static uma_zone_t uma_inode, uma_ufs1, uma_ufs2;
7755166637SPoul-Henning Kamp 
785e8c582aSPoul-Henning Kamp static int	ffs_reload(struct mount *, struct thread *);
79975512a9SPoul-Henning Kamp static int	ffs_mountfs(struct vnode *, struct mount *, struct thread *);
801c85e6a3SKirk McKusick static void	ffs_oldfscompat_read(struct fs *, struct ufsmount *,
811c85e6a3SKirk McKusick 		    ufs2_daddr_t);
82975512a9SPoul-Henning Kamp static void	ffs_ifree(struct ufsmount *ump, struct inode *ip);
839bf1a756SPoul-Henning Kamp static vfs_init_t ffs_init;
849bf1a756SPoul-Henning Kamp static vfs_uninit_t ffs_uninit;
85d6fe88e4SPoul-Henning Kamp static vfs_extattrctl_t ffs_extattrctl;
8620a92a18SPoul-Henning Kamp static vfs_cmount_t ffs_cmount;
87adf41577SPoul-Henning Kamp static vfs_unmount_t ffs_unmount;
8820a92a18SPoul-Henning Kamp static vfs_mount_t ffs_mount;
89adf41577SPoul-Henning Kamp static vfs_statfs_t ffs_statfs;
90adf41577SPoul-Henning Kamp static vfs_fhtovp_t ffs_fhtovp;
91adf41577SPoul-Henning Kamp static vfs_sync_t ffs_sync;
92df8bae1dSRodney W. Grimes 
93303b270bSEivind Eklund static struct vfsops ufs_vfsops = {
947652131bSPoul-Henning Kamp 	.vfs_extattrctl =	ffs_extattrctl,
957652131bSPoul-Henning Kamp 	.vfs_fhtovp =		ffs_fhtovp,
967652131bSPoul-Henning Kamp 	.vfs_init =		ffs_init,
9720a92a18SPoul-Henning Kamp 	.vfs_mount =		ffs_mount,
9820a92a18SPoul-Henning Kamp 	.vfs_cmount =		ffs_cmount,
997652131bSPoul-Henning Kamp 	.vfs_quotactl =		ufs_quotactl,
1007652131bSPoul-Henning Kamp 	.vfs_root =		ufs_root,
1017652131bSPoul-Henning Kamp 	.vfs_statfs =		ffs_statfs,
1027652131bSPoul-Henning Kamp 	.vfs_sync =		ffs_sync,
1037652131bSPoul-Henning Kamp 	.vfs_uninit =		ffs_uninit,
1047652131bSPoul-Henning Kamp 	.vfs_unmount =		ffs_unmount,
1057652131bSPoul-Henning Kamp 	.vfs_vget =		ffs_vget,
1062814d5baSKonstantin Belousov 	.vfs_susp_clean =	process_deferred_inactive,
107df8bae1dSRodney W. Grimes };
108df8bae1dSRodney W. Grimes 
1098994ca3cSBruce Evans VFS_SET(ufs_vfsops, ufs, 0);
1105fe6d2beSPawel Jakub Dawidek MODULE_VERSION(ufs, 1);
111c901836cSGarrett Wollman 
1126e77a041SPoul-Henning Kamp static b_strategy_t ffs_geom_strategy;
113dd19a799SPoul-Henning Kamp static b_write_t ffs_bufwrite;
1146e77a041SPoul-Henning Kamp 
1156e77a041SPoul-Henning Kamp static struct buf_ops ffs_ops = {
1166e77a041SPoul-Henning Kamp 	.bop_name =	"FFS",
117dd19a799SPoul-Henning Kamp 	.bop_write =	ffs_bufwrite,
1186e77a041SPoul-Henning Kamp 	.bop_strategy =	ffs_geom_strategy,
1196ef8480aSPoul-Henning Kamp 	.bop_sync =	bufsync,
1202cc7d26fSKonstantin Belousov #ifdef NO_FFS_SNAPSHOT
1212cc7d26fSKonstantin Belousov 	.bop_bdflush =	bufbdflush,
1222cc7d26fSKonstantin Belousov #else
1232cc7d26fSKonstantin Belousov 	.bop_bdflush =	ffs_bdflush,
1242cc7d26fSKonstantin Belousov #endif
1256e77a041SPoul-Henning Kamp };
1266e77a041SPoul-Henning Kamp 
1270b962648SAndriy Gapon /*
1280b962648SAndriy Gapon  * Note that userquota and groupquota options are not currently used
1290b962648SAndriy Gapon  * by UFS/FFS code and generally mount(8) does not pass those options
1300b962648SAndriy Gapon  * from userland, but they can be passed by loader(8) via
1310b962648SAndriy Gapon  * vfs.root.mountfrom.options.
1320b962648SAndriy Gapon  */
133d952ba1bSJohn Baldwin static const char *ffs_opts[] = { "acls", "async", "noatime", "noclusterr",
1340b962648SAndriy Gapon     "noclusterw", "noexec", "export", "force", "from", "groupquota",
135927a12aeSKirk McKusick     "multilabel", "nfsv4acls", "fsckpid", "snapshot", "nosuid", "suiddir",
136927a12aeSKirk McKusick     "nosymfollow", "sync", "union", "userquota", NULL };
13720a92a18SPoul-Henning Kamp 
1385e8c582aSPoul-Henning Kamp static int
139dfd233edSAttilio Rao ffs_mount(struct mount *mp)
140df8bae1dSRodney W. Grimes {
14120a92a18SPoul-Henning Kamp 	struct vnode *devvp;
142dfd233edSAttilio Rao 	struct thread *td;
14326f9a767SRodney W. Grimes 	struct ufsmount *ump = 0;
14405f4ff5dSPoul-Henning Kamp 	struct fs *fs;
145927a12aeSKirk McKusick 	pid_t fsckpid = 0;
146f2a2857bSKirk McKusick 	int error, flags;
14761996181SEdward Tomasz Napierala 	u_int mntorflags;
14815bc6b2bSEdward Tomasz Napierala 	accmode_t accmode;
1495e8c582aSPoul-Henning Kamp 	struct nameidata ndp;
15020a92a18SPoul-Henning Kamp 	char *fspec;
151df8bae1dSRodney W. Grimes 
152dfd233edSAttilio Rao 	td = curthread;
15320a92a18SPoul-Henning Kamp 	if (vfs_filteropt(mp->mnt_optnew, ffs_opts))
15420a92a18SPoul-Henning Kamp 		return (EINVAL);
155aa4d7a8aSPoul-Henning Kamp 	if (uma_inode == NULL) {
156aa4d7a8aSPoul-Henning Kamp 		uma_inode = uma_zcreate("FFS inode",
157aa4d7a8aSPoul-Henning Kamp 		    sizeof(struct inode), NULL, NULL, NULL, NULL,
158aa4d7a8aSPoul-Henning Kamp 		    UMA_ALIGN_PTR, 0);
159aa4d7a8aSPoul-Henning Kamp 		uma_ufs1 = uma_zcreate("FFS1 dinode",
160aa4d7a8aSPoul-Henning Kamp 		    sizeof(struct ufs1_dinode), NULL, NULL, NULL, NULL,
161aa4d7a8aSPoul-Henning Kamp 		    UMA_ALIGN_PTR, 0);
162aa4d7a8aSPoul-Henning Kamp 		uma_ufs2 = uma_zcreate("FFS2 dinode",
163aa4d7a8aSPoul-Henning Kamp 		    sizeof(struct ufs2_dinode), NULL, NULL, NULL, NULL,
164aa4d7a8aSPoul-Henning Kamp 		    UMA_ALIGN_PTR, 0);
165aa4d7a8aSPoul-Henning Kamp 	}
1668d02a378SPawel Jakub Dawidek 
1670b962648SAndriy Gapon 	vfs_deleteopt(mp->mnt_optnew, "groupquota");
1680b962648SAndriy Gapon 	vfs_deleteopt(mp->mnt_optnew, "userquota");
1690b962648SAndriy Gapon 
17020a92a18SPoul-Henning Kamp 	fspec = vfs_getopts(mp->mnt_optnew, "from", &error);
17151ac12abSPoul-Henning Kamp 	if (error)
172f2a2857bSKirk McKusick 		return (error);
1732b14f991SJulian Elischer 
1745da56ddbSTor Egge 	mntorflags = 0;
17526f59b64SCraig Rodrigues 	if (vfs_getopt(mp->mnt_optnew, "acls", NULL, NULL) == 0)
1765da56ddbSTor Egge 		mntorflags |= MNT_ACLS;
17726f59b64SCraig Rodrigues 
178fb77e0afSCraig Rodrigues 	if (vfs_getopt(mp->mnt_optnew, "snapshot", NULL, NULL) == 0) {
1795da56ddbSTor Egge 		mntorflags |= MNT_SNAPSHOT;
180fb77e0afSCraig Rodrigues 		/*
181fb77e0afSCraig Rodrigues 		 * Once we have set the MNT_SNAPSHOT flag, do not
182fb77e0afSCraig Rodrigues 		 * persist "snapshot" in the options list.
183fb77e0afSCraig Rodrigues 		 */
184fb77e0afSCraig Rodrigues 		vfs_deleteopt(mp->mnt_optnew, "snapshot");
185fb77e0afSCraig Rodrigues 		vfs_deleteopt(mp->mnt_opt, "snapshot");
186fb77e0afSCraig Rodrigues 	}
18726f59b64SCraig Rodrigues 
188927a12aeSKirk McKusick 	if (vfs_getopt(mp->mnt_optnew, "fsckpid", NULL, NULL) == 0 &&
189927a12aeSKirk McKusick 	    vfs_scanopt(mp->mnt_optnew, "fsckpid", "%d", &fsckpid) == 1) {
190927a12aeSKirk McKusick 		/*
191927a12aeSKirk McKusick 		 * Once we have set the restricted PID, do not
192927a12aeSKirk McKusick 		 * persist "fsckpid" in the options list.
193927a12aeSKirk McKusick 		 */
194927a12aeSKirk McKusick 		vfs_deleteopt(mp->mnt_optnew, "fsckpid");
195927a12aeSKirk McKusick 		vfs_deleteopt(mp->mnt_opt, "fsckpid");
196927a12aeSKirk McKusick 		if (mp->mnt_flag & MNT_UPDATE) {
197927a12aeSKirk McKusick 			if (VFSTOUFS(mp)->um_fs->fs_ronly == 0 &&
198927a12aeSKirk McKusick 			     vfs_flagopt(mp->mnt_optnew, "ro", NULL, 0) == 0) {
199*b60ee81eSKirk McKusick 				vfs_mount_error(mp,
200*b60ee81eSKirk McKusick 				    "Checker enable: Must be read-only");
201927a12aeSKirk McKusick 				return (EINVAL);
202927a12aeSKirk McKusick 			}
203927a12aeSKirk McKusick 		} else if (vfs_flagopt(mp->mnt_optnew, "ro", NULL, 0) == 0) {
204*b60ee81eSKirk McKusick 			vfs_mount_error(mp,
205*b60ee81eSKirk McKusick 			    "Checker enable: Must be read-only");
206927a12aeSKirk McKusick 			return (EINVAL);
207927a12aeSKirk McKusick 		}
208927a12aeSKirk McKusick 		/* Set to -1 if we are done */
209927a12aeSKirk McKusick 		if (fsckpid == 0)
210927a12aeSKirk McKusick 			fsckpid = -1;
211927a12aeSKirk McKusick 	}
212927a12aeSKirk McKusick 
2139340fc72SEdward Tomasz Napierala 	if (vfs_getopt(mp->mnt_optnew, "nfsv4acls", NULL, NULL) == 0) {
2149340fc72SEdward Tomasz Napierala 		if (mntorflags & MNT_ACLS) {
215*b60ee81eSKirk McKusick 			vfs_mount_error(mp,
216*b60ee81eSKirk McKusick 			    "\"acls\" and \"nfsv4acls\" options "
217*b60ee81eSKirk McKusick 			    "are mutually exclusive");
2189340fc72SEdward Tomasz Napierala 			return (EINVAL);
2199340fc72SEdward Tomasz Napierala 		}
2209340fc72SEdward Tomasz Napierala 		mntorflags |= MNT_NFS4ACLS;
2219340fc72SEdward Tomasz Napierala 	}
2229340fc72SEdward Tomasz Napierala 
2235da56ddbSTor Egge 	MNT_ILOCK(mp);
22461996181SEdward Tomasz Napierala 	mp->mnt_flag |= mntorflags;
2255da56ddbSTor Egge 	MNT_IUNLOCK(mp);
226df8bae1dSRodney W. Grimes 	/*
227df8bae1dSRodney W. Grimes 	 * If updating, check whether changing from read-only to
228df8bae1dSRodney W. Grimes 	 * read/write; if there is no device name, that's all we do.
229df8bae1dSRodney W. Grimes 	 */
230df8bae1dSRodney W. Grimes 	if (mp->mnt_flag & MNT_UPDATE) {
231df8bae1dSRodney W. Grimes 		ump = VFSTOUFS(mp);
232df8bae1dSRodney W. Grimes 		fs = ump->um_fs;
23326cf9c3bSPeter Wemm 		devvp = ump->um_devvp;
234927a12aeSKirk McKusick 		if (fsckpid == -1 && ump->um_fsckpid > 0) {
235927a12aeSKirk McKusick 			if ((error = ffs_flushfiles(mp, WRITECLOSE, td)) != 0 ||
236927a12aeSKirk McKusick 			    (error = ffs_sbupdate(ump, MNT_WAIT, 0)) != 0)
237927a12aeSKirk McKusick 				return (error);
238927a12aeSKirk McKusick 			DROP_GIANT();
239927a12aeSKirk McKusick 			g_topology_lock();
240927a12aeSKirk McKusick 			/*
241927a12aeSKirk McKusick 			 * Return to normal read-only mode.
242927a12aeSKirk McKusick 			 */
243927a12aeSKirk McKusick 			error = g_access(ump->um_cp, 0, -1, 0);
244927a12aeSKirk McKusick 			g_topology_unlock();
245927a12aeSKirk McKusick 			PICKUP_GIANT();
246927a12aeSKirk McKusick 			ump->um_fsckpid = 0;
247927a12aeSKirk McKusick 		}
24820a92a18SPoul-Henning Kamp 		if (fs->fs_ronly == 0 &&
24920a92a18SPoul-Henning Kamp 		    vfs_flagopt(mp->mnt_optnew, "ro", NULL, 0)) {
2506fecb4e4SKonstantin Belousov 			/*
2516fecb4e4SKonstantin Belousov 			 * Flush any dirty data and suspend filesystem.
2526fecb4e4SKonstantin Belousov 			 */
253f2a2857bSKirk McKusick 			if ((error = vn_start_write(NULL, &mp, V_WAIT)) != 0)
254f2a2857bSKirk McKusick 				return (error);
2556fecb4e4SKonstantin Belousov 			for (;;) {
2569ab73fd1SKirk McKusick 				vn_finished_write(mp);
2576fecb4e4SKonstantin Belousov 				if ((error = vfs_write_suspend(mp)) != 0)
2589ab73fd1SKirk McKusick 					return (error);
2596fecb4e4SKonstantin Belousov 				MNT_ILOCK(mp);
2606fecb4e4SKonstantin Belousov 				if (mp->mnt_kern_flag & MNTK_SUSPENDED) {
2616fecb4e4SKonstantin Belousov 					/*
2626fecb4e4SKonstantin Belousov 					 * Allow the secondary writes
2636fecb4e4SKonstantin Belousov 					 * to proceed.
2646fecb4e4SKonstantin Belousov 					 */
2656fecb4e4SKonstantin Belousov 					mp->mnt_kern_flag &= ~(MNTK_SUSPENDED |
2666fecb4e4SKonstantin Belousov 					    MNTK_SUSPEND2);
2676fecb4e4SKonstantin Belousov 					wakeup(&mp->mnt_flag);
2686fecb4e4SKonstantin Belousov 					MNT_IUNLOCK(mp);
2696fecb4e4SKonstantin Belousov 					/*
2706fecb4e4SKonstantin Belousov 					 * Allow the curthread to
2716fecb4e4SKonstantin Belousov 					 * ignore the suspension to
2726fecb4e4SKonstantin Belousov 					 * synchronize on-disk state.
2736fecb4e4SKonstantin Belousov 					 */
274dfd233edSAttilio Rao 					td->td_pflags |= TDP_IGNSUSP;
2756fecb4e4SKonstantin Belousov 					break;
2766fecb4e4SKonstantin Belousov 				}
2776fecb4e4SKonstantin Belousov 				MNT_IUNLOCK(mp);
2786fecb4e4SKonstantin Belousov 				vn_start_write(NULL, &mp, V_WAIT);
2799ab73fd1SKirk McKusick 			}
280cd600596SKirk McKusick 			/*
281cd600596SKirk McKusick 			 * Check for and optionally get rid of files open
282cd600596SKirk McKusick 			 * for writing.
283cd600596SKirk McKusick 			 */
284df8bae1dSRodney W. Grimes 			flags = WRITECLOSE;
285df8bae1dSRodney W. Grimes 			if (mp->mnt_flag & MNT_FORCE)
286df8bae1dSRodney W. Grimes 				flags |= FORCECLOSE;
287fddf7baeSKirk McKusick 			if (MOUNTEDSOFTDEP(mp)) {
288b40ce416SJulian Elischer 				error = softdep_flushfiles(mp, flags, td);
289b1897c19SJulian Elischer 			} else {
290b40ce416SJulian Elischer 				error = ffs_flushfiles(mp, flags, td);
291df8bae1dSRodney W. Grimes 			}
292f2a2857bSKirk McKusick 			if (error) {
2936fecb4e4SKonstantin Belousov 				vfs_write_resume(mp);
294f2a2857bSKirk McKusick 				return (error);
295b1897c19SJulian Elischer 			}
2969ccb939eSKirk McKusick 			if (fs->fs_pendingblocks != 0 ||
2979ccb939eSKirk McKusick 			    fs->fs_pendinginodes != 0) {
298*b60ee81eSKirk McKusick 				printf("WARNING: %s Update error: blocks %jd "
299*b60ee81eSKirk McKusick 				    "files %d\n", fs->fs_fsmnt,
3001c85e6a3SKirk McKusick 				    (intmax_t)fs->fs_pendingblocks,
3019ccb939eSKirk McKusick 				    fs->fs_pendinginodes);
3029ccb939eSKirk McKusick 				fs->fs_pendingblocks = 0;
3039ccb939eSKirk McKusick 				fs->fs_pendinginodes = 0;
3049ccb939eSKirk McKusick 			}
3051a6a6610SKirk McKusick 			if ((fs->fs_flags & (FS_UNCLEAN | FS_NEEDSFSCK)) == 0)
306f2a2857bSKirk McKusick 				fs->fs_clean = 1;
307791dd2faSTor Egge 			if ((error = ffs_sbupdate(ump, MNT_WAIT, 0)) != 0) {
308f2a2857bSKirk McKusick 				fs->fs_ronly = 0;
309f2a2857bSKirk McKusick 				fs->fs_clean = 0;
3106fecb4e4SKonstantin Belousov 				vfs_write_resume(mp);
311f2a2857bSKirk McKusick 				return (error);
3122b14f991SJulian Elischer 			}
313fddf7baeSKirk McKusick 			if (MOUNTEDSOFTDEP(mp))
3149420dc62SKirk McKusick 				softdep_unmount(mp);
31543920011SPoul-Henning Kamp 			DROP_GIANT();
31643920011SPoul-Henning Kamp 			g_topology_lock();
3178795189cSKirk McKusick 			/*
3188795189cSKirk McKusick 			 * Drop our write and exclusive access.
3198795189cSKirk McKusick 			 */
3208795189cSKirk McKusick 			g_access(ump->um_cp, 0, -1, -1);
32143920011SPoul-Henning Kamp 			g_topology_unlock();
32243920011SPoul-Henning Kamp 			PICKUP_GIANT();
32320a92a18SPoul-Henning Kamp 			fs->fs_ronly = 1;
3245da56ddbSTor Egge 			MNT_ILOCK(mp);
32520a92a18SPoul-Henning Kamp 			mp->mnt_flag |= MNT_RDONLY;
3265da56ddbSTor Egge 			MNT_IUNLOCK(mp);
3276fecb4e4SKonstantin Belousov 			/*
3286fecb4e4SKonstantin Belousov 			 * Allow the writers to note that filesystem
3296fecb4e4SKonstantin Belousov 			 * is ro now.
3306fecb4e4SKonstantin Belousov 			 */
3316fecb4e4SKonstantin Belousov 			vfs_write_resume(mp);
332f2a2857bSKirk McKusick 		}
333f2a2857bSKirk McKusick 		if ((mp->mnt_flag & MNT_RELOAD) &&
3345e8c582aSPoul-Henning Kamp 		    (error = ffs_reload(mp, td)) != 0)
335f2a2857bSKirk McKusick 			return (error);
33620a92a18SPoul-Henning Kamp 		if (fs->fs_ronly &&
33720a92a18SPoul-Henning Kamp 		    !vfs_flagopt(mp->mnt_optnew, "ro", NULL, 0)) {
338c9b99213SBruce Evans 			/*
339927a12aeSKirk McKusick 			 * If we are running a checker, do not allow upgrade.
340927a12aeSKirk McKusick 			 */
341927a12aeSKirk McKusick 			if (ump->um_fsckpid > 0) {
342*b60ee81eSKirk McKusick 				vfs_mount_error(mp,
343*b60ee81eSKirk McKusick 				    "Active checker, cannot upgrade to write");
344927a12aeSKirk McKusick 				return (EINVAL);
345927a12aeSKirk McKusick 			}
346927a12aeSKirk McKusick 			/*
347c9b99213SBruce Evans 			 * If upgrade to read-write by non-root, then verify
348c9b99213SBruce Evans 			 * that user has necessary permissions on the device.
349c9b99213SBruce Evans 			 */
350cb05b60aSAttilio Rao 			vn_lock(devvp, LK_EXCLUSIVE | LK_RETRY);
351acd3428bSRobert Watson 			error = VOP_ACCESS(devvp, VREAD | VWRITE,
352acd3428bSRobert Watson 			    td->td_ucred, td);
353acd3428bSRobert Watson 			if (error)
354acd3428bSRobert Watson 				error = priv_check(td, PRIV_VFS_MOUNT_PERM);
355acd3428bSRobert Watson 			if (error) {
35622db15c0SAttilio Rao 				VOP_UNLOCK(devvp, 0);
357c9b99213SBruce Evans 				return (error);
358c9b99213SBruce Evans 			}
35922db15c0SAttilio Rao 			VOP_UNLOCK(devvp, 0);
3607e58bfacSBruce Evans 			fs->fs_flags &= ~FS_UNCLEAN;
3610922cce6SBruce Evans 			if (fs->fs_clean == 0) {
3627e58bfacSBruce Evans 				fs->fs_flags |= FS_UNCLEAN;
363812b1d41SKirk McKusick 				if ((mp->mnt_flag & MNT_FORCE) ||
364113db2ddSJeff Roberson 				    ((fs->fs_flags &
365113db2ddSJeff Roberson 				     (FS_SUJ | FS_NEEDSFSCK)) == 0 &&
3661a6a6610SKirk McKusick 				     (fs->fs_flags & FS_DOSOFTDEP))) {
367*b60ee81eSKirk McKusick 					printf("WARNING: %s was not properly "
368*b60ee81eSKirk McKusick 					   "dismounted\n", fs->fs_fsmnt);
3690922cce6SBruce Evans 				} else {
370*b60ee81eSKirk McKusick 					vfs_mount_error(mp,
371*b60ee81eSKirk McKusick 					   "R/W mount of %s denied. %s.%s",
372*b60ee81eSKirk McKusick 					   fs->fs_fsmnt,
373*b60ee81eSKirk McKusick 					   "Filesystem is not clean - run fsck",
374*b60ee81eSKirk McKusick 					   (fs->fs_flags & FS_SUJ) == 0 ? "" :
375*b60ee81eSKirk McKusick 					   " Forced mount will invalidate"
376*b60ee81eSKirk McKusick 					   " journal contents");
377f2a2857bSKirk McKusick 					return (EPERM);
3780922cce6SBruce Evans 				}
3790922cce6SBruce Evans 			}
38040c340aaSPoul-Henning Kamp 			DROP_GIANT();
38140c340aaSPoul-Henning Kamp 			g_topology_lock();
38240c340aaSPoul-Henning Kamp 			/*
3838795189cSKirk McKusick 			 * Request exclusive write access.
38440c340aaSPoul-Henning Kamp 			 */
38540c340aaSPoul-Henning Kamp 			error = g_access(ump->um_cp, 0, 1, 1);
38640c340aaSPoul-Henning Kamp 			g_topology_unlock();
38740c340aaSPoul-Henning Kamp 			PICKUP_GIANT();
38840c340aaSPoul-Henning Kamp 			if (error)
38940c340aaSPoul-Henning Kamp 				return (error);
390f2a2857bSKirk McKusick 			if ((error = vn_start_write(NULL, &mp, V_WAIT)) != 0)
391f2a2857bSKirk McKusick 				return (error);
392f2a2857bSKirk McKusick 			fs->fs_ronly = 0;
3935da56ddbSTor Egge 			MNT_ILOCK(mp);
39420a92a18SPoul-Henning Kamp 			mp->mnt_flag &= ~MNT_RDONLY;
3955da56ddbSTor Egge 			MNT_IUNLOCK(mp);
396113db2ddSJeff Roberson 			fs->fs_mtime = time_second;
39726cf9c3bSPeter Wemm 			/* check to see if we need to start softdep */
398f2a2857bSKirk McKusick 			if ((fs->fs_flags & FS_DOSOFTDEP) &&
399a854ed98SJohn Baldwin 			    (error = softdep_mount(devvp, mp, fs, td->td_ucred))){
400f2a2857bSKirk McKusick 				vn_finished_write(mp);
401f2a2857bSKirk McKusick 				return (error);
40226cf9c3bSPeter Wemm 			}
403113db2ddSJeff Roberson 			fs->fs_clean = 0;
404113db2ddSJeff Roberson 			if ((error = ffs_sbupdate(ump, MNT_WAIT, 0)) != 0) {
405113db2ddSJeff Roberson 				vn_finished_write(mp);
406113db2ddSJeff Roberson 				return (error);
407113db2ddSJeff Roberson 			}
408f2a2857bSKirk McKusick 			if (fs->fs_snapinum[0] != 0)
409f2a2857bSKirk McKusick 				ffs_snapshot_mount(mp);
410f2a2857bSKirk McKusick 			vn_finished_write(mp);
4111469eec8SDavid Greenman 		}
412c11d2981SJulian Elischer 		/*
413c11d2981SJulian Elischer 		 * Soft updates is incompatible with "async",
414c11d2981SJulian Elischer 		 * so if we are doing softupdates stop the user
415c11d2981SJulian Elischer 		 * from setting the async flag in an update.
416c11d2981SJulian Elischer 		 * Softdep_mount() clears it in an initial mount
417c11d2981SJulian Elischer 		 * or ro->rw remount.
418c11d2981SJulian Elischer 		 */
419fddf7baeSKirk McKusick 		if (MOUNTEDSOFTDEP(mp)) {
4205da56ddbSTor Egge 			/* XXX: Reset too late ? */
4215da56ddbSTor Egge 			MNT_ILOCK(mp);
422c11d2981SJulian Elischer 			mp->mnt_flag &= ~MNT_ASYNC;
4235da56ddbSTor Egge 			MNT_IUNLOCK(mp);
4245da56ddbSTor Egge 		}
425df8bae1dSRodney W. Grimes 		/*
42639cfb239SPawel Jakub Dawidek 		 * Keep MNT_ACLS flag if it is stored in superblock.
42739cfb239SPawel Jakub Dawidek 		 */
4285da56ddbSTor Egge 		if ((fs->fs_flags & FS_ACLS) != 0) {
4295da56ddbSTor Egge 			/* XXX: Set too late ? */
4305da56ddbSTor Egge 			MNT_ILOCK(mp);
43139cfb239SPawel Jakub Dawidek 			mp->mnt_flag |= MNT_ACLS;
4325da56ddbSTor Egge 			MNT_IUNLOCK(mp);
4335da56ddbSTor Egge 		}
434cea90362SCraig Rodrigues 
4359340fc72SEdward Tomasz Napierala 		if ((fs->fs_flags & FS_NFS4ACLS) != 0) {
4369340fc72SEdward Tomasz Napierala 			/* XXX: Set too late ? */
4379340fc72SEdward Tomasz Napierala 			MNT_ILOCK(mp);
4389340fc72SEdward Tomasz Napierala 			mp->mnt_flag |= MNT_NFS4ACLS;
4399340fc72SEdward Tomasz Napierala 			MNT_IUNLOCK(mp);
4409340fc72SEdward Tomasz Napierala 		}
441927a12aeSKirk McKusick 		/*
442927a12aeSKirk McKusick 		 * If this is a request from fsck to clean up the filesystem,
443927a12aeSKirk McKusick 		 * then allow the specified pid to proceed.
444927a12aeSKirk McKusick 		 */
445927a12aeSKirk McKusick 		if (fsckpid > 0) {
446927a12aeSKirk McKusick 			if (ump->um_fsckpid != 0) {
447*b60ee81eSKirk McKusick 				vfs_mount_error(mp,
448*b60ee81eSKirk McKusick 				    "Active checker already running on %s",
449927a12aeSKirk McKusick 				    fs->fs_fsmnt);
450927a12aeSKirk McKusick 				return (EINVAL);
451927a12aeSKirk McKusick 			}
452fddf7baeSKirk McKusick 			KASSERT(MOUNTEDSOFTDEP(mp) == 0,
453927a12aeSKirk McKusick 			    ("soft updates enabled on read-only file system"));
454927a12aeSKirk McKusick 			DROP_GIANT();
455927a12aeSKirk McKusick 			g_topology_lock();
456927a12aeSKirk McKusick 			/*
457927a12aeSKirk McKusick 			 * Request write access.
458927a12aeSKirk McKusick 			 */
459927a12aeSKirk McKusick 			error = g_access(ump->um_cp, 0, 1, 0);
460927a12aeSKirk McKusick 			g_topology_unlock();
461927a12aeSKirk McKusick 			PICKUP_GIANT();
462927a12aeSKirk McKusick 			if (error) {
463*b60ee81eSKirk McKusick 				vfs_mount_error(mp,
464*b60ee81eSKirk McKusick 				    "Checker activation failed on %s",
465927a12aeSKirk McKusick 				    fs->fs_fsmnt);
466927a12aeSKirk McKusick 				return (error);
467927a12aeSKirk McKusick 			}
468927a12aeSKirk McKusick 			ump->um_fsckpid = fsckpid;
469927a12aeSKirk McKusick 			if (fs->fs_snapinum[0] != 0)
470927a12aeSKirk McKusick 				ffs_snapshot_mount(mp);
471927a12aeSKirk McKusick 			fs->fs_mtime = time_second;
472927a12aeSKirk McKusick 			fs->fs_fmod = 1;
473927a12aeSKirk McKusick 			fs->fs_clean = 0;
474927a12aeSKirk McKusick 			(void) ffs_sbupdate(ump, MNT_WAIT, 0);
475927a12aeSKirk McKusick 		}
4769340fc72SEdward Tomasz Napierala 
477f2a2857bSKirk McKusick 		/*
478f2a2857bSKirk McKusick 		 * If this is a snapshot request, take the snapshot.
479f2a2857bSKirk McKusick 		 */
480f2a2857bSKirk McKusick 		if (mp->mnt_flag & MNT_SNAPSHOT)
48120a92a18SPoul-Henning Kamp 			return (ffs_snapshot(mp, fspec));
482df8bae1dSRodney W. Grimes 	}
4832b14f991SJulian Elischer 
484df8bae1dSRodney W. Grimes 	/*
485df8bae1dSRodney W. Grimes 	 * Not an update, or updating the name: look up the name
486e9827c6dSBruce Evans 	 * and verify that it refers to a sensible disk device.
487df8bae1dSRodney W. Grimes 	 */
488fdedad76SSuleiman Souhlal 	NDINIT(&ndp, LOOKUP, FOLLOW | LOCKLEAF, UIO_SYSSPACE, fspec, td);
4895e8c582aSPoul-Henning Kamp 	if ((error = namei(&ndp)) != 0)
490f2a2857bSKirk McKusick 		return (error);
4915e8c582aSPoul-Henning Kamp 	NDFREE(&ndp, NDF_ONLY_PNBUF);
4925e8c582aSPoul-Henning Kamp 	devvp = ndp.ni_vp;
493f2a2857bSKirk McKusick 	if (!vn_isdisk(devvp, &error)) {
494fdedad76SSuleiman Souhlal 		vput(devvp);
495f2a2857bSKirk McKusick 		return (error);
496f2a2857bSKirk McKusick 	}
497c9b99213SBruce Evans 
498c9b99213SBruce Evans 	/*
499c9b99213SBruce Evans 	 * If mount by non-root, then verify that user has necessary
500c9b99213SBruce Evans 	 * permissions on the device.
501c9b99213SBruce Evans 	 */
50215bc6b2bSEdward Tomasz Napierala 	accmode = VREAD;
503c9b99213SBruce Evans 	if ((mp->mnt_flag & MNT_RDONLY) == 0)
50415bc6b2bSEdward Tomasz Napierala 		accmode |= VWRITE;
50515bc6b2bSEdward Tomasz Napierala 	error = VOP_ACCESS(devvp, accmode, td->td_ucred, td);
506acd3428bSRobert Watson 	if (error)
507acd3428bSRobert Watson 		error = priv_check(td, PRIV_VFS_MOUNT_PERM);
508acd3428bSRobert Watson 	if (error) {
509c9b99213SBruce Evans 		vput(devvp);
510c9b99213SBruce Evans 		return (error);
511c9b99213SBruce Evans 	}
512c9b99213SBruce Evans 
5132b14f991SJulian Elischer 	if (mp->mnt_flag & MNT_UPDATE) {
5142b14f991SJulian Elischer 		/*
515f2a2857bSKirk McKusick 		 * Update only
516f2a2857bSKirk McKusick 		 *
5173e425b96SJulian Elischer 		 * If it's not the same vnode, or at least the same device
5183e425b96SJulian Elischer 		 * then it's not correct.
5192b14f991SJulian Elischer 		 */
5202b14f991SJulian Elischer 
52143920011SPoul-Henning Kamp 		if (devvp->v_rdev != ump->um_devvp->v_rdev)
522f2a2857bSKirk McKusick 			error = EINVAL;	/* needs translation */
523fdedad76SSuleiman Souhlal 		vput(devvp);
524f2a2857bSKirk McKusick 		if (error)
525f2a2857bSKirk McKusick 			return (error);
5262b14f991SJulian Elischer 	} else {
5272b14f991SJulian Elischer 		/*
528f2a2857bSKirk McKusick 		 * New mount
5292b14f991SJulian Elischer 		 *
530f2a2857bSKirk McKusick 		 * We need the name for the mount point (also used for
531f2a2857bSKirk McKusick 		 * "last mounted on") copied in. If an error occurs,
532f2a2857bSKirk McKusick 		 * the mount point is discarded by the upper level code.
533f3a90da9SAdrian Chadd 		 * Note that vfs_mount() populates f_mntonname for us.
534f2a2857bSKirk McKusick 		 */
535975512a9SPoul-Henning Kamp 		if ((error = ffs_mountfs(devvp, mp, td)) != 0) {
536f2a2857bSKirk McKusick 			vrele(devvp);
537f2a2857bSKirk McKusick 			return (error);
538f2a2857bSKirk McKusick 		}
539927a12aeSKirk McKusick 		if (fsckpid > 0) {
540fddf7baeSKirk McKusick 			KASSERT(MOUNTEDSOFTDEP(mp) == 0,
541927a12aeSKirk McKusick 			    ("soft updates enabled on read-only file system"));
542927a12aeSKirk McKusick 			ump = VFSTOUFS(mp);
543927a12aeSKirk McKusick 			fs = ump->um_fs;
544927a12aeSKirk McKusick 			DROP_GIANT();
545927a12aeSKirk McKusick 			g_topology_lock();
546927a12aeSKirk McKusick 			/*
547927a12aeSKirk McKusick 			 * Request write access.
548927a12aeSKirk McKusick 			 */
549927a12aeSKirk McKusick 			error = g_access(ump->um_cp, 0, 1, 0);
550927a12aeSKirk McKusick 			g_topology_unlock();
551927a12aeSKirk McKusick 			PICKUP_GIANT();
552927a12aeSKirk McKusick 			if (error) {
553*b60ee81eSKirk McKusick 				printf("WARNING: %s: Checker activation "
554*b60ee81eSKirk McKusick 				    "failed\n", fs->fs_fsmnt);
555927a12aeSKirk McKusick 			} else {
556927a12aeSKirk McKusick 				ump->um_fsckpid = fsckpid;
557927a12aeSKirk McKusick 				if (fs->fs_snapinum[0] != 0)
558927a12aeSKirk McKusick 					ffs_snapshot_mount(mp);
559927a12aeSKirk McKusick 				fs->fs_mtime = time_second;
560927a12aeSKirk McKusick 				fs->fs_clean = 0;
561927a12aeSKirk McKusick 				(void) ffs_sbupdate(ump, MNT_WAIT, 0);
562927a12aeSKirk McKusick 			}
563927a12aeSKirk McKusick 		}
564f2a2857bSKirk McKusick 	}
56520a92a18SPoul-Henning Kamp 	vfs_mountedfrom(mp, fspec);
566f2a2857bSKirk McKusick 	return (0);
5672b14f991SJulian Elischer }
5682b14f991SJulian Elischer 
569df8bae1dSRodney W. Grimes /*
57020a92a18SPoul-Henning Kamp  * Compatibility with old mount system call.
57120a92a18SPoul-Henning Kamp  */
57220a92a18SPoul-Henning Kamp 
57320a92a18SPoul-Henning Kamp static int
574dfd233edSAttilio Rao ffs_cmount(struct mntarg *ma, void *data, int flags)
57520a92a18SPoul-Henning Kamp {
57620a92a18SPoul-Henning Kamp 	struct ufs_args args;
577d0cc54f3SKonstantin Belousov 	struct export_args exp;
57820a92a18SPoul-Henning Kamp 	int error;
57920a92a18SPoul-Henning Kamp 
58020a92a18SPoul-Henning Kamp 	if (data == NULL)
58120a92a18SPoul-Henning Kamp 		return (EINVAL);
58220a92a18SPoul-Henning Kamp 	error = copyin(data, &args, sizeof args);
58320a92a18SPoul-Henning Kamp 	if (error)
58420a92a18SPoul-Henning Kamp 		return (error);
585d0cc54f3SKonstantin Belousov 	vfs_oexport_conv(&args.export, &exp);
58620a92a18SPoul-Henning Kamp 
58720a92a18SPoul-Henning Kamp 	ma = mount_argsu(ma, "from", args.fspec, MAXPATHLEN);
588d0cc54f3SKonstantin Belousov 	ma = mount_arg(ma, "export", &exp, sizeof(exp));
58920a92a18SPoul-Henning Kamp 	error = kernel_mount(ma, flags);
59020a92a18SPoul-Henning Kamp 
59120a92a18SPoul-Henning Kamp 	return (error);
59220a92a18SPoul-Henning Kamp }
59320a92a18SPoul-Henning Kamp 
59420a92a18SPoul-Henning Kamp /*
595df8bae1dSRodney W. Grimes  * Reload all incore data for a filesystem (used after running fsck on
596df8bae1dSRodney W. Grimes  * the root filesystem and finding things to fix). The filesystem must
597df8bae1dSRodney W. Grimes  * be mounted read-only.
598df8bae1dSRodney W. Grimes  *
599df8bae1dSRodney W. Grimes  * Things to do to update the mount:
600df8bae1dSRodney W. Grimes  *	1) invalidate all cached meta-data.
601df8bae1dSRodney W. Grimes  *	2) re-read superblock from disk.
602df8bae1dSRodney W. Grimes  *	3) re-read summary information from disk.
603df8bae1dSRodney W. Grimes  *	4) invalidate all inactive vnodes.
604df8bae1dSRodney W. Grimes  *	5) invalidate all cached file data.
605df8bae1dSRodney W. Grimes  *	6) re-read inode data for all active vnodes.
606df8bae1dSRodney W. Grimes  */
6075e8c582aSPoul-Henning Kamp static int
6085e8c582aSPoul-Henning Kamp ffs_reload(struct mount *mp, struct thread *td)
609df8bae1dSRodney W. Grimes {
61082be0a5aSTor Egge 	struct vnode *vp, *mvp, *devvp;
611df8bae1dSRodney W. Grimes 	struct inode *ip;
612f55ff3f3SIan Dowse 	void *space;
613df8bae1dSRodney W. Grimes 	struct buf *bp;
614996c772fSJohn Dyson 	struct fs *fs, *newfs;
6153ba649d7SJeff Roberson 	struct ufsmount *ump;
6161c85e6a3SKirk McKusick 	ufs2_daddr_t sblockloc;
617df8bae1dSRodney W. Grimes 	int i, blks, size, error;
618996c772fSJohn Dyson 	int32_t *lp;
619df8bae1dSRodney W. Grimes 
6202b14f991SJulian Elischer 	if ((mp->mnt_flag & MNT_RDONLY) == 0)
621df8bae1dSRodney W. Grimes 		return (EINVAL);
6223ba649d7SJeff Roberson 	ump = VFSTOUFS(mp);
623df8bae1dSRodney W. Grimes 	/*
624df8bae1dSRodney W. Grimes 	 * Step 1: invalidate all cached meta-data.
625df8bae1dSRodney W. Grimes 	 */
6262b14f991SJulian Elischer 	devvp = VFSTOUFS(mp)->um_devvp;
627cb05b60aSAttilio Rao 	vn_lock(devvp, LK_EXCLUSIVE | LK_RETRY);
6280d7935fdSAttilio Rao 	if (vinvalbuf(devvp, 0, 0, 0) != 0)
629df8bae1dSRodney W. Grimes 		panic("ffs_reload: dirty1");
63022db15c0SAttilio Rao 	VOP_UNLOCK(devvp, 0);
63195e5e988SJohn Dyson 
632df8bae1dSRodney W. Grimes 	/*
633df8bae1dSRodney W. Grimes 	 * Step 2: re-read superblock from disk.
634df8bae1dSRodney W. Grimes 	 */
6351c85e6a3SKirk McKusick 	fs = VFSTOUFS(mp)->um_fs;
636ada981b2SKirk McKusick 	if ((error = bread(devvp, btodb(fs->fs_sblockloc), fs->fs_sbsize,
6371c85e6a3SKirk McKusick 	    NOCRED, &bp)) != 0)
638df8bae1dSRodney W. Grimes 		return (error);
639996c772fSJohn Dyson 	newfs = (struct fs *)bp->b_data;
6401c85e6a3SKirk McKusick 	if ((newfs->fs_magic != FS_UFS1_MAGIC &&
6411c85e6a3SKirk McKusick 	     newfs->fs_magic != FS_UFS2_MAGIC) ||
6421c85e6a3SKirk McKusick 	    newfs->fs_bsize > MAXBSIZE ||
643996c772fSJohn Dyson 	    newfs->fs_bsize < sizeof(struct fs)) {
644df8bae1dSRodney W. Grimes 			brelse(bp);
645df8bae1dSRodney W. Grimes 			return (EIO);		/* XXX needs translation */
646df8bae1dSRodney W. Grimes 	}
647996c772fSJohn Dyson 	/*
648996c772fSJohn Dyson 	 * Copy pointer fields back into superblock before copying in	XXX
649996c772fSJohn Dyson 	 * new superblock. These should really be in the ufsmount.	XXX
650996c772fSJohn Dyson 	 * Note that important parameters (eg fs_ncg) are unchanged.
651996c772fSJohn Dyson 	 */
652f55ff3f3SIan Dowse 	newfs->fs_csp = fs->fs_csp;
653996c772fSJohn Dyson 	newfs->fs_maxcluster = fs->fs_maxcluster;
6545d69bac4SIan Dowse 	newfs->fs_contigdirs = fs->fs_contigdirs;
655143a5346SIan Dowse 	newfs->fs_active = fs->fs_active;
65631c81e4bSDon Lewis 	/* The file system is still read-only. */
65731c81e4bSDon Lewis 	newfs->fs_ronly = 1;
6581c85e6a3SKirk McKusick 	sblockloc = fs->fs_sblockloc;
659996c772fSJohn Dyson 	bcopy(newfs, fs, (u_int)fs->fs_sbsize);
660df8bae1dSRodney W. Grimes 	brelse(bp);
661996c772fSJohn Dyson 	mp->mnt_maxsymlinklen = fs->fs_maxsymlinklen;
6621c85e6a3SKirk McKusick 	ffs_oldfscompat_read(fs, VFSTOUFS(mp), sblockloc);
6633ba649d7SJeff Roberson 	UFS_LOCK(ump);
6649ccb939eSKirk McKusick 	if (fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) {
665*b60ee81eSKirk McKusick 		printf("WARNING: %s: reload pending error: blocks %jd "
666*b60ee81eSKirk McKusick 		    "files %d\n", fs->fs_fsmnt, (intmax_t)fs->fs_pendingblocks,
6671c85e6a3SKirk McKusick 		    fs->fs_pendinginodes);
6689ccb939eSKirk McKusick 		fs->fs_pendingblocks = 0;
6699ccb939eSKirk McKusick 		fs->fs_pendinginodes = 0;
6709ccb939eSKirk McKusick 	}
6713ba649d7SJeff Roberson 	UFS_UNLOCK(ump);
672996c772fSJohn Dyson 
673df8bae1dSRodney W. Grimes 	/*
674df8bae1dSRodney W. Grimes 	 * Step 3: re-read summary information from disk.
675df8bae1dSRodney W. Grimes 	 */
676df8bae1dSRodney W. Grimes 	blks = howmany(fs->fs_cssize, fs->fs_fsize);
677f55ff3f3SIan Dowse 	space = fs->fs_csp;
678df8bae1dSRodney W. Grimes 	for (i = 0; i < blks; i += fs->fs_frag) {
679df8bae1dSRodney W. Grimes 		size = fs->fs_bsize;
680df8bae1dSRodney W. Grimes 		if (i + fs->fs_frag > blks)
681df8bae1dSRodney W. Grimes 			size = (blks - i) * fs->fs_fsize;
682c9671602SPoul-Henning Kamp 		error = bread(devvp, fsbtodb(fs, fs->fs_csaddr + i), size,
683c9671602SPoul-Henning Kamp 		    NOCRED, &bp);
684c9671602SPoul-Henning Kamp 		if (error)
685df8bae1dSRodney W. Grimes 			return (error);
686f55ff3f3SIan Dowse 		bcopy(bp->b_data, space, (u_int)size);
687f55ff3f3SIan Dowse 		space = (char *)space + size;
688df8bae1dSRodney W. Grimes 		brelse(bp);
689df8bae1dSRodney W. Grimes 	}
690996c772fSJohn Dyson 	/*
691996c772fSJohn Dyson 	 * We no longer know anything about clusters per cylinder group.
692996c772fSJohn Dyson 	 */
693996c772fSJohn Dyson 	if (fs->fs_contigsumsize > 0) {
694996c772fSJohn Dyson 		lp = fs->fs_maxcluster;
695996c772fSJohn Dyson 		for (i = 0; i < fs->fs_ncg; i++)
696996c772fSJohn Dyson 			*lp++ = fs->fs_contigsumsize;
697996c772fSJohn Dyson 	}
698996c772fSJohn Dyson 
699df8bae1dSRodney W. Grimes loop:
700ca430f2eSAlexander Kabaev 	MNT_ILOCK(mp);
70182be0a5aSTor Egge 	MNT_VNODE_FOREACH(vp, mp, mvp) {
70204a17687SJeff Roberson 		VI_LOCK(vp);
703fe68abe2SJeff Roberson 		if (vp->v_iflag & VI_DOOMED) {
7042f05568aSJeff Roberson 			VI_UNLOCK(vp);
7052f05568aSJeff Roberson 			continue;
7062f05568aSJeff Roberson 		}
707ca430f2eSAlexander Kabaev 		MNT_IUNLOCK(mp);
708df8bae1dSRodney W. Grimes 		/*
709fe68abe2SJeff Roberson 		 * Step 4: invalidate all cached file data.
710df8bae1dSRodney W. Grimes 		 */
711b40ce416SJulian Elischer 		if (vget(vp, LK_EXCLUSIVE | LK_INTERLOCK, td)) {
71282be0a5aSTor Egge 			MNT_VNODE_FOREACH_ABORT(mp, mvp);
713df8bae1dSRodney W. Grimes 			goto loop;
714996c772fSJohn Dyson 		}
7150d7935fdSAttilio Rao 		if (vinvalbuf(vp, 0, 0, 0))
716df8bae1dSRodney W. Grimes 			panic("ffs_reload: dirty2");
717df8bae1dSRodney W. Grimes 		/*
718fe68abe2SJeff Roberson 		 * Step 5: re-read inode data for all active vnodes.
719df8bae1dSRodney W. Grimes 		 */
720df8bae1dSRodney W. Grimes 		ip = VTOI(vp);
721c9671602SPoul-Henning Kamp 		error =
722df8bae1dSRodney W. Grimes 		    bread(devvp, fsbtodb(fs, ino_to_fsba(fs, ip->i_number)),
723c9671602SPoul-Henning Kamp 		    (int)fs->fs_bsize, NOCRED, &bp);
724c9671602SPoul-Henning Kamp 		if (error) {
72522db15c0SAttilio Rao 			VOP_UNLOCK(vp, 0);
72645d45c6cSAlexander Kabaev 			vrele(vp);
72782be0a5aSTor Egge 			MNT_VNODE_FOREACH_ABORT(mp, mvp);
728df8bae1dSRodney W. Grimes 			return (error);
729df8bae1dSRodney W. Grimes 		}
730de6ba7c0SPoul-Henning Kamp 		ffs_load_inode(bp, ip, fs, ip->i_number);
731b1897c19SJulian Elischer 		ip->i_effnlink = ip->i_nlink;
732df8bae1dSRodney W. Grimes 		brelse(bp);
73322db15c0SAttilio Rao 		VOP_UNLOCK(vp, 0);
734cb9ddc80SAlexander Kabaev 		vrele(vp);
735ca430f2eSAlexander Kabaev 		MNT_ILOCK(mp);
736df8bae1dSRodney W. Grimes 	}
737ca430f2eSAlexander Kabaev 	MNT_IUNLOCK(mp);
738df8bae1dSRodney W. Grimes 	return (0);
739df8bae1dSRodney W. Grimes }
740df8bae1dSRodney W. Grimes 
7411c85e6a3SKirk McKusick /*
7421c85e6a3SKirk McKusick  * Possible superblock locations ordered from most to least likely.
7431c85e6a3SKirk McKusick  */
7441c85e6a3SKirk McKusick static int sblock_try[] = SBLOCKSEARCH;
7455819ab3fSKirk McKusick 
746df8bae1dSRodney W. Grimes /*
747df8bae1dSRodney W. Grimes  * Common code for mount and mountroot
748df8bae1dSRodney W. Grimes  */
749975512a9SPoul-Henning Kamp static int
750975512a9SPoul-Henning Kamp ffs_mountfs(devvp, mp, td)
75105f4ff5dSPoul-Henning Kamp 	struct vnode *devvp;
752df8bae1dSRodney W. Grimes 	struct mount *mp;
753b40ce416SJulian Elischer 	struct thread *td;
754df8bae1dSRodney W. Grimes {
75505f4ff5dSPoul-Henning Kamp 	struct ufsmount *ump;
756df8bae1dSRodney W. Grimes 	struct buf *bp;
75705f4ff5dSPoul-Henning Kamp 	struct fs *fs;
75889c9c53dSPoul-Henning Kamp 	struct cdev *dev;
759f55ff3f3SIan Dowse 	void *space;
7601c85e6a3SKirk McKusick 	ufs2_daddr_t sblockloc;
761f5ef029eSPoul-Henning Kamp 	int error, i, blks, size, ronly;
762996c772fSJohn Dyson 	int32_t *lp;
763996c772fSJohn Dyson 	struct ucred *cred;
76443920011SPoul-Henning Kamp 	struct g_consumer *cp;
7653bbd6d8aSJeff Roberson 	struct mount *nmp;
766df8bae1dSRodney W. Grimes 
767ee445a69SJohn Baldwin 	bp = NULL;
768ee445a69SJohn Baldwin 	ump = NULL;
769a854ed98SJohn Baldwin 	cred = td ? td->td_ucred : NOCRED;
77043920011SPoul-Henning Kamp 	ronly = (mp->mnt_flag & MNT_RDONLY) != 0;
771ee445a69SJohn Baldwin 
772ee445a69SJohn Baldwin 	dev = devvp->v_rdev;
773ee445a69SJohn Baldwin 	dev_ref(dev);
77443920011SPoul-Henning Kamp 	DROP_GIANT();
77543920011SPoul-Henning Kamp 	g_topology_lock();
77643920011SPoul-Henning Kamp 	error = g_vfs_open(devvp, &cp, "ffs", ronly ? 0 : 1);
77743920011SPoul-Henning Kamp 	g_topology_unlock();
77843920011SPoul-Henning Kamp 	PICKUP_GIANT();
77922db15c0SAttilio Rao 	VOP_UNLOCK(devvp, 0);
780c9671602SPoul-Henning Kamp 	if (error)
781ee445a69SJohn Baldwin 		goto out;
7820508986cSBruce Evans 	if (devvp->v_rdev->si_iosize_max != 0)
7831b5464efSPoul-Henning Kamp 		mp->mnt_iosize_max = devvp->v_rdev->si_iosize_max;
7841b5464efSPoul-Henning Kamp 	if (mp->mnt_iosize_max > MAXPHYS)
7851b5464efSPoul-Henning Kamp 		mp->mnt_iosize_max = MAXPHYS;
78695e5e988SJohn Dyson 
7876e77a041SPoul-Henning Kamp 	devvp->v_bufobj.bo_ops = &ffs_ops;
7886e77a041SPoul-Henning Kamp 
7891c85e6a3SKirk McKusick 	fs = NULL;
7901c85e6a3SKirk McKusick 	sblockloc = 0;
7911c85e6a3SKirk McKusick 	/*
7921c85e6a3SKirk McKusick 	 * Try reading the superblock in each of its possible locations.
7931c85e6a3SKirk McKusick 	 */
7941c85e6a3SKirk McKusick 	for (i = 0; sblock_try[i] != -1; i++) {
79571ac2d7cSCraig Rodrigues 		if ((SBLOCKSIZE % cp->provider->sectorsize) != 0) {
79671ac2d7cSCraig Rodrigues 			error = EINVAL;
79771ac2d7cSCraig Rodrigues 			vfs_mount_error(mp,
79871ac2d7cSCraig Rodrigues 			    "Invalid sectorsize %d for superblock size %d",
79971ac2d7cSCraig Rodrigues 			    cp->provider->sectorsize, SBLOCKSIZE);
80071ac2d7cSCraig Rodrigues 			goto out;
80171ac2d7cSCraig Rodrigues 		}
80271ac2d7cSCraig Rodrigues 		if ((error = bread(devvp, btodb(sblock_try[i]), SBLOCKSIZE,
8031c85e6a3SKirk McKusick 		    cred, &bp)) != 0)
804df8bae1dSRodney W. Grimes 			goto out;
805df8bae1dSRodney W. Grimes 		fs = (struct fs *)bp->b_data;
806ada981b2SKirk McKusick 		sblockloc = sblock_try[i];
8071c85e6a3SKirk McKusick 		if ((fs->fs_magic == FS_UFS1_MAGIC ||
8081c85e6a3SKirk McKusick 		     (fs->fs_magic == FS_UFS2_MAGIC &&
809ada981b2SKirk McKusick 		      (fs->fs_sblockloc == sblockloc ||
810ada981b2SKirk McKusick 		       (fs->fs_old_flags & FS_FLAGS_UPDATED) == 0))) &&
8111c85e6a3SKirk McKusick 		    fs->fs_bsize <= MAXBSIZE &&
8121c85e6a3SKirk McKusick 		    fs->fs_bsize >= sizeof(struct fs))
8131c85e6a3SKirk McKusick 			break;
8141c85e6a3SKirk McKusick 		brelse(bp);
8151c85e6a3SKirk McKusick 		bp = NULL;
8161c85e6a3SKirk McKusick 	}
8171c85e6a3SKirk McKusick 	if (sblock_try[i] == -1) {
818df8bae1dSRodney W. Grimes 		error = EINVAL;		/* XXX needs translation */
819df8bae1dSRodney W. Grimes 		goto out;
820df8bae1dSRodney W. Grimes 	}
8213f6f17eeSJulian Elischer 	fs->fs_fmod = 0;
8221c85e6a3SKirk McKusick 	fs->fs_flags &= ~FS_INDEXDIRS;	/* no support for directory indicies */
8230922cce6SBruce Evans 	fs->fs_flags &= ~FS_UNCLEAN;
8240922cce6SBruce Evans 	if (fs->fs_clean == 0) {
8250922cce6SBruce Evans 		fs->fs_flags |= FS_UNCLEAN;
826812b1d41SKirk McKusick 		if (ronly || (mp->mnt_flag & MNT_FORCE) ||
827113db2ddSJeff Roberson 		    ((fs->fs_flags & (FS_SUJ | FS_NEEDSFSCK)) == 0 &&
8281a6a6610SKirk McKusick 		     (fs->fs_flags & FS_DOSOFTDEP))) {
82959b3a4ebSDavid E. O'Brien 			printf("WARNING: %s was not properly dismounted\n",
8300922cce6SBruce Evans 			    fs->fs_fsmnt);
8311469eec8SDavid Greenman 		} else {
832*b60ee81eSKirk McKusick 			vfs_mount_error(mp, "R/W mount of %s denied. %s%s",
833*b60ee81eSKirk McKusick 			    fs->fs_fsmnt, "Filesystem is not clean - run fsck.",
834*b60ee81eSKirk McKusick 			    (fs->fs_flags & FS_SUJ) == 0 ? "" :
835*b60ee81eSKirk McKusick 			    " Forced mount will invalidate journal contents");
8361469eec8SDavid Greenman 			error = EPERM;
8371469eec8SDavid Greenman 			goto out;
8381469eec8SDavid Greenman 		}
8391c85e6a3SKirk McKusick 		if ((fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) &&
8401c85e6a3SKirk McKusick 		    (mp->mnt_flag & MNT_FORCE)) {
841*b60ee81eSKirk McKusick 			printf("WARNING: %s: lost blocks %jd files %d\n",
842*b60ee81eSKirk McKusick 			    fs->fs_fsmnt, (intmax_t)fs->fs_pendingblocks,
8431c85e6a3SKirk McKusick 			    fs->fs_pendinginodes);
8449ccb939eSKirk McKusick 			fs->fs_pendingblocks = 0;
8459ccb939eSKirk McKusick 			fs->fs_pendinginodes = 0;
8469ccb939eSKirk McKusick 		}
8479ccb939eSKirk McKusick 	}
8489ccb939eSKirk McKusick 	if (fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) {
849*b60ee81eSKirk McKusick 		printf("WARNING: %s: mount pending error: blocks %jd "
850*b60ee81eSKirk McKusick 		    "files %d\n", fs->fs_fsmnt, (intmax_t)fs->fs_pendingblocks,
8511c85e6a3SKirk McKusick 		    fs->fs_pendinginodes);
8529ccb939eSKirk McKusick 		fs->fs_pendingblocks = 0;
8539ccb939eSKirk McKusick 		fs->fs_pendinginodes = 0;
8541469eec8SDavid Greenman 	}
8551a60c7fcSPawel Jakub Dawidek 	if ((fs->fs_flags & FS_GJOURNAL) != 0) {
8561a60c7fcSPawel Jakub Dawidek #ifdef UFS_GJOURNAL
8571a60c7fcSPawel Jakub Dawidek 		/*
8581a60c7fcSPawel Jakub Dawidek 		 * Get journal provider name.
8591a60c7fcSPawel Jakub Dawidek 		 */
8601a60c7fcSPawel Jakub Dawidek 		size = 1024;
8611a60c7fcSPawel Jakub Dawidek 		mp->mnt_gjprovider = malloc(size, M_UFSMNT, M_WAITOK);
8621a60c7fcSPawel Jakub Dawidek 		if (g_io_getattr("GJOURNAL::provider", cp, &size,
8631a60c7fcSPawel Jakub Dawidek 		    mp->mnt_gjprovider) == 0) {
8641a60c7fcSPawel Jakub Dawidek 			mp->mnt_gjprovider = realloc(mp->mnt_gjprovider, size,
8651a60c7fcSPawel Jakub Dawidek 			    M_UFSMNT, M_WAITOK);
8661a60c7fcSPawel Jakub Dawidek 			MNT_ILOCK(mp);
8671a60c7fcSPawel Jakub Dawidek 			mp->mnt_flag |= MNT_GJOURNAL;
8681a60c7fcSPawel Jakub Dawidek 			MNT_IUNLOCK(mp);
8691a60c7fcSPawel Jakub Dawidek 		} else {
870*b60ee81eSKirk McKusick 			printf("WARNING: %s: GJOURNAL flag on fs "
871*b60ee81eSKirk McKusick 			    "but no gjournal provider below\n",
8721a60c7fcSPawel Jakub Dawidek 			    mp->mnt_stat.f_mntonname);
8731a60c7fcSPawel Jakub Dawidek 			free(mp->mnt_gjprovider, M_UFSMNT);
8741a60c7fcSPawel Jakub Dawidek 			mp->mnt_gjprovider = NULL;
8751a60c7fcSPawel Jakub Dawidek 		}
8761a60c7fcSPawel Jakub Dawidek #else
877*b60ee81eSKirk McKusick 		printf("WARNING: %s: GJOURNAL flag on fs but no "
878*b60ee81eSKirk McKusick 		    "UFS_GJOURNAL support\n", mp->mnt_stat.f_mntonname);
8791a60c7fcSPawel Jakub Dawidek #endif
8801a60c7fcSPawel Jakub Dawidek 	} else {
8811a60c7fcSPawel Jakub Dawidek 		mp->mnt_gjprovider = NULL;
8821a60c7fcSPawel Jakub Dawidek 	}
883a163d034SWarner Losh 	ump = malloc(sizeof *ump, M_UFSMNT, M_WAITOK | M_ZERO);
88443920011SPoul-Henning Kamp 	ump->um_cp = cp;
88543920011SPoul-Henning Kamp 	ump->um_bo = &devvp->v_bufobj;
8868dd56505SPoul-Henning Kamp 	ump->um_fs = malloc((u_long)fs->fs_sbsize, M_UFSMNT, M_WAITOK);
8871c85e6a3SKirk McKusick 	if (fs->fs_magic == FS_UFS1_MAGIC) {
8881c85e6a3SKirk McKusick 		ump->um_fstype = UFS1;
8891c85e6a3SKirk McKusick 		ump->um_balloc = ffs_balloc_ufs1;
8901c85e6a3SKirk McKusick 	} else {
8911c85e6a3SKirk McKusick 		ump->um_fstype = UFS2;
8921c85e6a3SKirk McKusick 		ump->um_balloc = ffs_balloc_ufs2;
8931c85e6a3SKirk McKusick 	}
894cec0f20cSPoul-Henning Kamp 	ump->um_blkatoff = ffs_blkatoff;
895cec0f20cSPoul-Henning Kamp 	ump->um_truncate = ffs_truncate;
896987f5696SPoul-Henning Kamp 	ump->um_update = ffs_update;
897cec0f20cSPoul-Henning Kamp 	ump->um_valloc = ffs_valloc;
898cec0f20cSPoul-Henning Kamp 	ump->um_vfree = ffs_vfree;
899975512a9SPoul-Henning Kamp 	ump->um_ifree = ffs_ifree;
90090446e36SKonstantin Belousov 	ump->um_rdonly = ffs_rdonly;
90116b1f68dSKonstantin Belousov 	ump->um_snapgone = ffs_snapgone;
9023ba649d7SJeff Roberson 	mtx_init(UFS_MTX(ump), "FFS", "FFS Lock", MTX_DEF);
903df8bae1dSRodney W. Grimes 	bcopy(bp->b_data, ump->um_fs, (u_int)fs->fs_sbsize);
9041c85e6a3SKirk McKusick 	if (fs->fs_sbsize < SBLOCKSIZE)
905f2a2857bSKirk McKusick 		bp->b_flags |= B_INVAL | B_NOCACHE;
906df8bae1dSRodney W. Grimes 	brelse(bp);
907df8bae1dSRodney W. Grimes 	bp = NULL;
908df8bae1dSRodney W. Grimes 	fs = ump->um_fs;
9091c85e6a3SKirk McKusick 	ffs_oldfscompat_read(fs, ump, sblockloc);
910df8bae1dSRodney W. Grimes 	fs->fs_ronly = ronly;
911996c772fSJohn Dyson 	size = fs->fs_cssize;
912996c772fSJohn Dyson 	blks = howmany(size, fs->fs_fsize);
913996c772fSJohn Dyson 	if (fs->fs_contigsumsize > 0)
914996c772fSJohn Dyson 		size += fs->fs_ncg * sizeof(int32_t);
915a61ab64aSKirk McKusick 	size += fs->fs_ncg * sizeof(u_int8_t);
916a163d034SWarner Losh 	space = malloc((u_long)size, M_UFSMNT, M_WAITOK);
917f55ff3f3SIan Dowse 	fs->fs_csp = space;
918df8bae1dSRodney W. Grimes 	for (i = 0; i < blks; i += fs->fs_frag) {
919df8bae1dSRodney W. Grimes 		size = fs->fs_bsize;
920df8bae1dSRodney W. Grimes 		if (i + fs->fs_frag > blks)
921df8bae1dSRodney W. Grimes 			size = (blks - i) * fs->fs_fsize;
9228aef1712SMatthew Dillon 		if ((error = bread(devvp, fsbtodb(fs, fs->fs_csaddr + i), size,
9238aef1712SMatthew Dillon 		    cred, &bp)) != 0) {
924f55ff3f3SIan Dowse 			free(fs->fs_csp, M_UFSMNT);
925df8bae1dSRodney W. Grimes 			goto out;
926df8bae1dSRodney W. Grimes 		}
927df8bae1dSRodney W. Grimes 		bcopy(bp->b_data, space, (u_int)size);
928f55ff3f3SIan Dowse 		space = (char *)space + size;
929df8bae1dSRodney W. Grimes 		brelse(bp);
930df8bae1dSRodney W. Grimes 		bp = NULL;
931df8bae1dSRodney W. Grimes 	}
932996c772fSJohn Dyson 	if (fs->fs_contigsumsize > 0) {
933f55ff3f3SIan Dowse 		fs->fs_maxcluster = lp = space;
934996c772fSJohn Dyson 		for (i = 0; i < fs->fs_ncg; i++)
935996c772fSJohn Dyson 			*lp++ = fs->fs_contigsumsize;
9364691e9eaSIan Dowse 		space = lp;
937996c772fSJohn Dyson 	}
938a61ab64aSKirk McKusick 	size = fs->fs_ncg * sizeof(u_int8_t);
939a61ab64aSKirk McKusick 	fs->fs_contigdirs = (u_int8_t *)space;
940a61ab64aSKirk McKusick 	bzero(fs->fs_contigdirs, size);
941143a5346SIan Dowse 	fs->fs_active = NULL;
94277465d93SAlfred Perlstein 	mp->mnt_data = ump;
94368de329eSPoul-Henning Kamp 	mp->mnt_stat.f_fsid.val[0] = fs->fs_id[0];
9448f89943eSGuido van Rooij 	mp->mnt_stat.f_fsid.val[1] = fs->fs_id[1];
9453bbd6d8aSJeff Roberson 	nmp = NULL;
94668de329eSPoul-Henning Kamp 	if (fs->fs_id[0] == 0 || fs->fs_id[1] == 0 ||
9473bbd6d8aSJeff Roberson 	    (nmp = vfs_getvfs(&mp->mnt_stat.f_fsid))) {
9483bbd6d8aSJeff Roberson 		if (nmp)
9493bbd6d8aSJeff Roberson 			vfs_rel(nmp);
95068de329eSPoul-Henning Kamp 		vfs_getnewfsid(mp);
9513bbd6d8aSJeff Roberson 	}
952df8bae1dSRodney W. Grimes 	mp->mnt_maxsymlinklen = fs->fs_maxsymlinklen;
9535da56ddbSTor Egge 	MNT_ILOCK(mp);
954cc9d8990SPeter Wemm 	mp->mnt_flag |= MNT_LOCAL;
9555da56ddbSTor Egge 	MNT_IUNLOCK(mp);
9565da56ddbSTor Egge 	if ((fs->fs_flags & FS_MULTILABEL) != 0) {
9577b3f1bbdSTom Rhodes #ifdef MAC
9585da56ddbSTor Egge 		MNT_ILOCK(mp);
95980830407SRobert Watson 		mp->mnt_flag |= MNT_MULTILABEL;
9605da56ddbSTor Egge 		MNT_IUNLOCK(mp);
9617b3f1bbdSTom Rhodes #else
962*b60ee81eSKirk McKusick 		printf("WARNING: %s: multilabel flag on fs but "
963*b60ee81eSKirk McKusick 		    "no MAC support\n", mp->mnt_stat.f_mntonname);
9647b3f1bbdSTom Rhodes #endif
9655da56ddbSTor Egge 	}
9665da56ddbSTor Egge 	if ((fs->fs_flags & FS_ACLS) != 0) {
9677b3f1bbdSTom Rhodes #ifdef UFS_ACL
9685da56ddbSTor Egge 		MNT_ILOCK(mp);
9699340fc72SEdward Tomasz Napierala 
9709340fc72SEdward Tomasz Napierala 		if (mp->mnt_flag & MNT_NFS4ACLS)
971*b60ee81eSKirk McKusick 			printf("WARNING: %s: ACLs flag on fs conflicts with "
972*b60ee81eSKirk McKusick 			    "\"nfsv4acls\" mount option; option ignored\n",
973*b60ee81eSKirk McKusick 			    mp->mnt_stat.f_mntonname);
9749340fc72SEdward Tomasz Napierala 		mp->mnt_flag &= ~MNT_NFS4ACLS;
97580830407SRobert Watson 		mp->mnt_flag |= MNT_ACLS;
9769340fc72SEdward Tomasz Napierala 
9775da56ddbSTor Egge 		MNT_IUNLOCK(mp);
9787b3f1bbdSTom Rhodes #else
97959b3a4ebSDavid E. O'Brien 		printf("WARNING: %s: ACLs flag on fs but no ACLs support\n",
980946478fcSPawel Jakub Dawidek 		    mp->mnt_stat.f_mntonname);
9817b3f1bbdSTom Rhodes #endif
9825da56ddbSTor Egge 	}
9839340fc72SEdward Tomasz Napierala 	if ((fs->fs_flags & FS_NFS4ACLS) != 0) {
9849340fc72SEdward Tomasz Napierala #ifdef UFS_ACL
9859340fc72SEdward Tomasz Napierala 		MNT_ILOCK(mp);
9869340fc72SEdward Tomasz Napierala 
9879340fc72SEdward Tomasz Napierala 		if (mp->mnt_flag & MNT_ACLS)
988*b60ee81eSKirk McKusick 			printf("WARNING: %s: NFSv4 ACLs flag on fs conflicts "
989*b60ee81eSKirk McKusick 			    "with \"acls\" mount option; option ignored\n",
990*b60ee81eSKirk McKusick 			    mp->mnt_stat.f_mntonname);
9919340fc72SEdward Tomasz Napierala 		mp->mnt_flag &= ~MNT_ACLS;
9929340fc72SEdward Tomasz Napierala 		mp->mnt_flag |= MNT_NFS4ACLS;
9939340fc72SEdward Tomasz Napierala 
9949340fc72SEdward Tomasz Napierala 		MNT_IUNLOCK(mp);
9959340fc72SEdward Tomasz Napierala #else
996*b60ee81eSKirk McKusick 		printf("WARNING: %s: NFSv4 ACLs flag on fs but no "
997*b60ee81eSKirk McKusick 		    "ACLs support\n", mp->mnt_stat.f_mntonname);
9989340fc72SEdward Tomasz Napierala #endif
9999340fc72SEdward Tomasz Napierala 	}
10008c2a54deSKonstantin Belousov 	if ((fs->fs_flags & FS_TRIM) != 0) {
10018c2a54deSKonstantin Belousov 		size = sizeof(int);
10028c2a54deSKonstantin Belousov 		if (g_io_getattr("GEOM::candelete", cp, &size,
10038c2a54deSKonstantin Belousov 		    &ump->um_candelete) == 0) {
10048c2a54deSKonstantin Belousov 			if (!ump->um_candelete)
1005*b60ee81eSKirk McKusick 				printf("WARNING: %s: TRIM flag on fs but disk "
1006*b60ee81eSKirk McKusick 				    "does not support TRIM\n",
10078c2a54deSKonstantin Belousov 				    mp->mnt_stat.f_mntonname);
10088c2a54deSKonstantin Belousov 		} else {
1009*b60ee81eSKirk McKusick 			printf("WARNING: %s: TRIM flag on fs but disk does "
1010*b60ee81eSKirk McKusick 			    "not confirm that it supports TRIM\n",
10118c2a54deSKonstantin Belousov 			    mp->mnt_stat.f_mntonname);
10128c2a54deSKonstantin Belousov 			ump->um_candelete = 0;
10138c2a54deSKonstantin Belousov 		}
10148c2a54deSKonstantin Belousov 	}
10159340fc72SEdward Tomasz Napierala 
1016df8bae1dSRodney W. Grimes 	ump->um_mountp = mp;
1017df8bae1dSRodney W. Grimes 	ump->um_dev = dev;
1018df8bae1dSRodney W. Grimes 	ump->um_devvp = devvp;
1019df8bae1dSRodney W. Grimes 	ump->um_nindir = fs->fs_nindir;
1020df8bae1dSRodney W. Grimes 	ump->um_bptrtodb = fs->fs_fsbtodb;
1021df8bae1dSRodney W. Grimes 	ump->um_seqinc = fs->fs_frag;
1022df8bae1dSRodney W. Grimes 	for (i = 0; i < MAXQUOTAS; i++)
1023df8bae1dSRodney W. Grimes 		ump->um_quotas[i] = NULLVP;
1024516081f2SRobert Watson #ifdef UFS_EXTATTR
1025a64ed089SRobert Watson 	ufs_extattr_uepm_init(&ump->um_extattr);
1026a64ed089SRobert Watson #endif
10272b14f991SJulian Elischer 	/*
10282b14f991SJulian Elischer 	 * Set FS local "last mounted on" information (NULL pad)
10292b14f991SJulian Elischer 	 */
103093373c42SSuleiman Souhlal 	bzero(fs->fs_fsmnt, MAXMNTLEN);
103193373c42SSuleiman Souhlal 	strlcpy(fs->fs_fsmnt, mp->mnt_stat.f_mntonname, MAXMNTLEN);
1032113db2ddSJeff Roberson 	mp->mnt_stat.f_iosize = fs->fs_bsize;
10332b14f991SJulian Elischer 
10342b14f991SJulian Elischer 	if (mp->mnt_flag & MNT_ROOTFS) {
10352b14f991SJulian Elischer 		/*
10362b14f991SJulian Elischer 		 * Root mount; update timestamp in mount structure.
10372b14f991SJulian Elischer 		 * this will be used by the common root mount code
10382b14f991SJulian Elischer 		 * to update the system clock.
10392b14f991SJulian Elischer 		 */
10402b14f991SJulian Elischer 		mp->mnt_time = fs->fs_time;
10412b14f991SJulian Elischer 	}
1042996c772fSJohn Dyson 
1043996c772fSJohn Dyson 	if (ronly == 0) {
1044113db2ddSJeff Roberson 		fs->fs_mtime = time_second;
1045b1897c19SJulian Elischer 		if ((fs->fs_flags & FS_DOSOFTDEP) &&
1046b1897c19SJulian Elischer 		    (error = softdep_mount(devvp, mp, fs, cred)) != 0) {
1047f55ff3f3SIan Dowse 			free(fs->fs_csp, M_UFSMNT);
1048fddd463dSKonstantin Belousov 			ffs_flushfiles(mp, FORCECLOSE, td);
1049b1897c19SJulian Elischer 			goto out;
1050b1897c19SJulian Elischer 		}
1051f2a2857bSKirk McKusick 		if (fs->fs_snapinum[0] != 0)
1052f2a2857bSKirk McKusick 			ffs_snapshot_mount(mp);
1053cf60e8e4SKirk McKusick 		fs->fs_fmod = 1;
1054996c772fSJohn Dyson 		fs->fs_clean = 0;
1055791dd2faSTor Egge 		(void) ffs_sbupdate(ump, MNT_WAIT, 0);
1056996c772fSJohn Dyson 	}
1057d8d3d415SPoul-Henning Kamp 	/*
1058d8d3d415SPoul-Henning Kamp 	 * Initialize filesystem stat information in mount struct.
1059d8d3d415SPoul-Henning Kamp 	 */
10606cf7bc60SRobert Watson 	MNT_ILOCK(mp);
106133fc3625SJohn Baldwin 	mp->mnt_kern_flag |= MNTK_MPSAFE | MNTK_LOOKUP_SHARED |
106233fc3625SJohn Baldwin 	    MNTK_EXTENDED_SHARED;
10636cf7bc60SRobert Watson 	MNT_IUNLOCK(mp);
1064516081f2SRobert Watson #ifdef UFS_EXTATTR
1065516081f2SRobert Watson #ifdef UFS_EXTATTR_AUTOSTART
10669de54ba5SRobert Watson 	/*
10679de54ba5SRobert Watson 	 *
1068f5161237SRobert Watson 	 * Auto-starting does the following:
10699de54ba5SRobert Watson 	 *	- check for /.attribute in the fs, and extattr_start if so
10709de54ba5SRobert Watson 	 *	- for each file in .attribute, enable that file with
10719de54ba5SRobert Watson 	 * 	  an attribute of the same name.
10729de54ba5SRobert Watson 	 * Not clear how to report errors -- probably eat them.
10739de54ba5SRobert Watson 	 * This would all happen while the filesystem was busy/not
10749de54ba5SRobert Watson 	 * available, so would effectively be "atomic".
10759de54ba5SRobert Watson 	 */
1076b40ce416SJulian Elischer 	(void) ufs_extattr_autostart(mp, td);
1077516081f2SRobert Watson #endif /* !UFS_EXTATTR_AUTOSTART */
1078516081f2SRobert Watson #endif /* !UFS_EXTATTR */
1079df8bae1dSRodney W. Grimes 	return (0);
1080df8bae1dSRodney W. Grimes out:
1081df8bae1dSRodney W. Grimes 	if (bp)
1082df8bae1dSRodney W. Grimes 		brelse(bp);
108343920011SPoul-Henning Kamp 	if (cp != NULL) {
108443920011SPoul-Henning Kamp 		DROP_GIANT();
108543920011SPoul-Henning Kamp 		g_topology_lock();
10860d7935fdSAttilio Rao 		g_vfs_close(cp);
108743920011SPoul-Henning Kamp 		g_topology_unlock();
108843920011SPoul-Henning Kamp 		PICKUP_GIANT();
108943920011SPoul-Henning Kamp 	}
1090df8bae1dSRodney W. Grimes 	if (ump) {
10913ba649d7SJeff Roberson 		mtx_destroy(UFS_MTX(ump));
10921a60c7fcSPawel Jakub Dawidek 		if (mp->mnt_gjprovider != NULL) {
10931a60c7fcSPawel Jakub Dawidek 			free(mp->mnt_gjprovider, M_UFSMNT);
10941a60c7fcSPawel Jakub Dawidek 			mp->mnt_gjprovider = NULL;
10951a60c7fcSPawel Jakub Dawidek 		}
1096df8bae1dSRodney W. Grimes 		free(ump->um_fs, M_UFSMNT);
1097df8bae1dSRodney W. Grimes 		free(ump, M_UFSMNT);
109877465d93SAlfred Perlstein 		mp->mnt_data = NULL;
1099df8bae1dSRodney W. Grimes 	}
110049c4791cSEdward Tomasz Napierala 	dev_rel(dev);
1101df8bae1dSRodney W. Grimes 	return (error);
1102df8bae1dSRodney W. Grimes }
1103df8bae1dSRodney W. Grimes 
11041c85e6a3SKirk McKusick #include <sys/sysctl.h>
1105adf41577SPoul-Henning Kamp static int bigcgs = 0;
11061c85e6a3SKirk McKusick SYSCTL_INT(_debug, OID_AUTO, bigcgs, CTLFLAG_RW, &bigcgs, 0, "");
11071c85e6a3SKirk McKusick 
1108df8bae1dSRodney W. Grimes /*
11091c85e6a3SKirk McKusick  * Sanity checks for loading old filesystem superblocks.
11101c85e6a3SKirk McKusick  * See ffs_oldfscompat_write below for unwound actions.
1111df8bae1dSRodney W. Grimes  *
11121c85e6a3SKirk McKusick  * XXX - Parts get retired eventually.
11131c85e6a3SKirk McKusick  * Unfortunately new bits get added.
1114df8bae1dSRodney W. Grimes  */
11151c85e6a3SKirk McKusick static void
11161c85e6a3SKirk McKusick ffs_oldfscompat_read(fs, ump, sblockloc)
1117df8bae1dSRodney W. Grimes 	struct fs *fs;
11181c85e6a3SKirk McKusick 	struct ufsmount *ump;
11191c85e6a3SKirk McKusick 	ufs2_daddr_t sblockloc;
11201c85e6a3SKirk McKusick {
11211c85e6a3SKirk McKusick 	off_t maxfilesize;
11221c85e6a3SKirk McKusick 
11231c85e6a3SKirk McKusick 	/*
1124ada981b2SKirk McKusick 	 * If not yet done, update fs_flags location and value of fs_sblockloc.
1125ada981b2SKirk McKusick 	 */
1126ada981b2SKirk McKusick 	if ((fs->fs_old_flags & FS_FLAGS_UPDATED) == 0) {
1127ada981b2SKirk McKusick 		fs->fs_flags = fs->fs_old_flags;
1128ada981b2SKirk McKusick 		fs->fs_old_flags |= FS_FLAGS_UPDATED;
1129ada981b2SKirk McKusick 		fs->fs_sblockloc = sblockloc;
1130ada981b2SKirk McKusick 	}
1131ada981b2SKirk McKusick 	/*
11321c85e6a3SKirk McKusick 	 * If not yet done, update UFS1 superblock with new wider fields.
11331c85e6a3SKirk McKusick 	 */
113474f3809aSKirk McKusick 	if (fs->fs_magic == FS_UFS1_MAGIC && fs->fs_maxbsize != fs->fs_bsize) {
11351c85e6a3SKirk McKusick 		fs->fs_maxbsize = fs->fs_bsize;
11361c85e6a3SKirk McKusick 		fs->fs_time = fs->fs_old_time;
11371c85e6a3SKirk McKusick 		fs->fs_size = fs->fs_old_size;
11381c85e6a3SKirk McKusick 		fs->fs_dsize = fs->fs_old_dsize;
11391c85e6a3SKirk McKusick 		fs->fs_csaddr = fs->fs_old_csaddr;
11401c85e6a3SKirk McKusick 		fs->fs_cstotal.cs_ndir = fs->fs_old_cstotal.cs_ndir;
11411c85e6a3SKirk McKusick 		fs->fs_cstotal.cs_nbfree = fs->fs_old_cstotal.cs_nbfree;
11421c85e6a3SKirk McKusick 		fs->fs_cstotal.cs_nifree = fs->fs_old_cstotal.cs_nifree;
11431c85e6a3SKirk McKusick 		fs->fs_cstotal.cs_nffree = fs->fs_old_cstotal.cs_nffree;
11441c85e6a3SKirk McKusick 	}
11451c85e6a3SKirk McKusick 	if (fs->fs_magic == FS_UFS1_MAGIC &&
11461c85e6a3SKirk McKusick 	    fs->fs_old_inodefmt < FS_44INODEFMT) {
11478680d698SNate Lawson 		fs->fs_maxfilesize = ((uint64_t)1 << 31) - 1;
11481c85e6a3SKirk McKusick 		fs->fs_qbmask = ~fs->fs_bmask;
11491c85e6a3SKirk McKusick 		fs->fs_qfmask = ~fs->fs_fmask;
11501c85e6a3SKirk McKusick 	}
11518f42fb8fSIan Dowse 	if (fs->fs_magic == FS_UFS1_MAGIC) {
11521c85e6a3SKirk McKusick 		ump->um_savedmaxfilesize = fs->fs_maxfilesize;
11538680d698SNate Lawson 		maxfilesize = (uint64_t)0x80000000 * fs->fs_bsize - 1;
11541c85e6a3SKirk McKusick 		if (fs->fs_maxfilesize > maxfilesize)
11551c85e6a3SKirk McKusick 			fs->fs_maxfilesize = maxfilesize;
11568f42fb8fSIan Dowse 	}
11571c85e6a3SKirk McKusick 	/* Compatibility for old filesystems */
11581c85e6a3SKirk McKusick 	if (fs->fs_avgfilesize <= 0)
11591c85e6a3SKirk McKusick 		fs->fs_avgfilesize = AVFILESIZ;
11601c85e6a3SKirk McKusick 	if (fs->fs_avgfpdir <= 0)
11611c85e6a3SKirk McKusick 		fs->fs_avgfpdir = AFPDIR;
11621c85e6a3SKirk McKusick 	if (bigcgs) {
11631c85e6a3SKirk McKusick 		fs->fs_save_cgsize = fs->fs_cgsize;
11641c85e6a3SKirk McKusick 		fs->fs_cgsize = fs->fs_bsize;
11651c85e6a3SKirk McKusick 	}
11661c85e6a3SKirk McKusick }
11671c85e6a3SKirk McKusick 
11681c85e6a3SKirk McKusick /*
11691c85e6a3SKirk McKusick  * Unwinding superblock updates for old filesystems.
11701c85e6a3SKirk McKusick  * See ffs_oldfscompat_read above for details.
11711c85e6a3SKirk McKusick  *
11721c85e6a3SKirk McKusick  * XXX - Parts get retired eventually.
11731c85e6a3SKirk McKusick  * Unfortunately new bits get added.
11741c85e6a3SKirk McKusick  */
1175113db2ddSJeff Roberson void
11761c85e6a3SKirk McKusick ffs_oldfscompat_write(fs, ump)
11771c85e6a3SKirk McKusick 	struct fs *fs;
11781c85e6a3SKirk McKusick 	struct ufsmount *ump;
1179df8bae1dSRodney W. Grimes {
1180df8bae1dSRodney W. Grimes 
11811c85e6a3SKirk McKusick 	/*
11821c85e6a3SKirk McKusick 	 * Copy back UFS2 updated fields that UFS1 inspects.
11831c85e6a3SKirk McKusick 	 */
11841c85e6a3SKirk McKusick 	if (fs->fs_magic == FS_UFS1_MAGIC) {
11851c85e6a3SKirk McKusick 		fs->fs_old_time = fs->fs_time;
11861c85e6a3SKirk McKusick 		fs->fs_old_cstotal.cs_ndir = fs->fs_cstotal.cs_ndir;
11871c85e6a3SKirk McKusick 		fs->fs_old_cstotal.cs_nbfree = fs->fs_cstotal.cs_nbfree;
11881c85e6a3SKirk McKusick 		fs->fs_old_cstotal.cs_nifree = fs->fs_cstotal.cs_nifree;
11891c85e6a3SKirk McKusick 		fs->fs_old_cstotal.cs_nffree = fs->fs_cstotal.cs_nffree;
11901c85e6a3SKirk McKusick 		fs->fs_maxfilesize = ump->um_savedmaxfilesize;
11918f42fb8fSIan Dowse 	}
11921c85e6a3SKirk McKusick 	if (bigcgs) {
11931c85e6a3SKirk McKusick 		fs->fs_cgsize = fs->fs_save_cgsize;
11941c85e6a3SKirk McKusick 		fs->fs_save_cgsize = 0;
11951c85e6a3SKirk McKusick 	}
1196df8bae1dSRodney W. Grimes }
1197df8bae1dSRodney W. Grimes 
1198df8bae1dSRodney W. Grimes /*
1199df8bae1dSRodney W. Grimes  * unmount system call
1200df8bae1dSRodney W. Grimes  */
1201adf41577SPoul-Henning Kamp static int
1202dfd233edSAttilio Rao ffs_unmount(mp, mntflags)
1203df8bae1dSRodney W. Grimes 	struct mount *mp;
1204df8bae1dSRodney W. Grimes 	int mntflags;
1205df8bae1dSRodney W. Grimes {
1206dfd233edSAttilio Rao 	struct thread *td;
120705f4ff5dSPoul-Henning Kamp 	struct ufsmount *ump = VFSTOUFS(mp);
120805f4ff5dSPoul-Henning Kamp 	struct fs *fs;
12096fecb4e4SKonstantin Belousov 	int error, flags, susp;
1210df86ccf6SKonstantin Belousov #ifdef UFS_EXTATTR
1211df86ccf6SKonstantin Belousov 	int e_restart;
1212df86ccf6SKonstantin Belousov #endif
1213df8bae1dSRodney W. Grimes 
1214df8bae1dSRodney W. Grimes 	flags = 0;
1215dfd233edSAttilio Rao 	td = curthread;
12166fecb4e4SKonstantin Belousov 	fs = ump->um_fs;
1217*b60ee81eSKirk McKusick 	susp = 0;
1218df8bae1dSRodney W. Grimes 	if (mntflags & MNT_FORCE) {
1219df8bae1dSRodney W. Grimes 		flags |= FORCECLOSE;
12206fecb4e4SKonstantin Belousov 		susp = fs->fs_ronly != 0;
1221*b60ee81eSKirk McKusick 	}
1222516081f2SRobert Watson #ifdef UFS_EXTATTR
1223b40ce416SJulian Elischer 	if ((error = ufs_extattr_stop(mp, td))) {
1224b2b0497aSRobert Watson 		if (error != EOPNOTSUPP)
1225*b60ee81eSKirk McKusick 			printf("WARNING: unmount %s: ufs_extattr_stop "
1226*b60ee81eSKirk McKusick 			    "returned errno %d\n", mp->mnt_stat.f_mntonname,
1227b2b0497aSRobert Watson 			    error);
1228df86ccf6SKonstantin Belousov 		e_restart = 0;
12297df97b61SRobert Watson 	} else {
12309de54ba5SRobert Watson 		ufs_extattr_uepm_destroy(&ump->um_extattr);
1231df86ccf6SKonstantin Belousov 		e_restart = 1;
12327df97b61SRobert Watson 	}
1233a64ed089SRobert Watson #endif
12346fecb4e4SKonstantin Belousov 	if (susp) {
12356fecb4e4SKonstantin Belousov 		/*
12366fecb4e4SKonstantin Belousov 		 * dounmount already called vn_start_write().
12376fecb4e4SKonstantin Belousov 		 */
12386fecb4e4SKonstantin Belousov 		for (;;) {
12396fecb4e4SKonstantin Belousov 			vn_finished_write(mp);
12406fecb4e4SKonstantin Belousov 			if ((error = vfs_write_suspend(mp)) != 0)
12416fecb4e4SKonstantin Belousov 				return (error);
12426fecb4e4SKonstantin Belousov 			MNT_ILOCK(mp);
12436fecb4e4SKonstantin Belousov 			if (mp->mnt_kern_flag & MNTK_SUSPENDED) {
12446fecb4e4SKonstantin Belousov 				mp->mnt_kern_flag &= ~(MNTK_SUSPENDED |
12456fecb4e4SKonstantin Belousov 				    MNTK_SUSPEND2);
12466fecb4e4SKonstantin Belousov 				wakeup(&mp->mnt_flag);
12476fecb4e4SKonstantin Belousov 				MNT_IUNLOCK(mp);
1248dfd233edSAttilio Rao 				td->td_pflags |= TDP_IGNSUSP;
12496fecb4e4SKonstantin Belousov 				break;
12506fecb4e4SKonstantin Belousov 			}
12516fecb4e4SKonstantin Belousov 			MNT_IUNLOCK(mp);
12526fecb4e4SKonstantin Belousov 			vn_start_write(NULL, &mp, V_WAIT);
12536fecb4e4SKonstantin Belousov 		}
12546fecb4e4SKonstantin Belousov 	}
1255fddf7baeSKirk McKusick 	if (MOUNTEDSOFTDEP(mp))
12563c140b2dSEdward Tomasz Napierala 		error = softdep_flushfiles(mp, flags, td);
12573c140b2dSEdward Tomasz Napierala 	else
12583c140b2dSEdward Tomasz Napierala 		error = ffs_flushfiles(mp, flags, td);
12594f560d75SEdward Tomasz Napierala 	if (error != 0 && error != ENXIO)
12606fecb4e4SKonstantin Belousov 		goto fail;
12613c140b2dSEdward Tomasz Napierala 
12623ba649d7SJeff Roberson 	UFS_LOCK(ump);
12639ccb939eSKirk McKusick 	if (fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) {
1264*b60ee81eSKirk McKusick 		printf("WARNING: unmount %s: pending error: blocks %jd "
1265*b60ee81eSKirk McKusick 		    "files %d\n", fs->fs_fsmnt, (intmax_t)fs->fs_pendingblocks,
12661c85e6a3SKirk McKusick 		    fs->fs_pendinginodes);
12679ccb939eSKirk McKusick 		fs->fs_pendingblocks = 0;
12689ccb939eSKirk McKusick 		fs->fs_pendinginodes = 0;
12699ccb939eSKirk McKusick 	}
12703ba649d7SJeff Roberson 	UFS_UNLOCK(ump);
1271113db2ddSJeff Roberson 	softdep_unmount(mp);
1272927a12aeSKirk McKusick 	if (fs->fs_ronly == 0 || ump->um_fsckpid > 0) {
12731a6a6610SKirk McKusick 		fs->fs_clean = fs->fs_flags & (FS_UNCLEAN|FS_NEEDSFSCK) ? 0 : 1;
1274791dd2faSTor Egge 		error = ffs_sbupdate(ump, MNT_WAIT, 0);
12754f560d75SEdward Tomasz Napierala 		if (error && error != ENXIO) {
1276996c772fSJohn Dyson 			fs->fs_clean = 0;
12776fecb4e4SKonstantin Belousov 			goto fail;
1278996c772fSJohn Dyson 		}
1279e0e9c421SDavid Greenman 	}
12806fecb4e4SKonstantin Belousov 	if (susp) {
12816fecb4e4SKonstantin Belousov 		vfs_write_resume(mp);
12826fecb4e4SKonstantin Belousov 		vn_start_write(NULL, &mp, V_WAIT);
12836fecb4e4SKonstantin Belousov 	}
128443920011SPoul-Henning Kamp 	DROP_GIANT();
128543920011SPoul-Henning Kamp 	g_topology_lock();
1286927a12aeSKirk McKusick 	if (ump->um_fsckpid > 0) {
1287927a12aeSKirk McKusick 		/*
1288927a12aeSKirk McKusick 		 * Return to normal read-only mode.
1289927a12aeSKirk McKusick 		 */
1290927a12aeSKirk McKusick 		error = g_access(ump->um_cp, 0, -1, 0);
1291927a12aeSKirk McKusick 		ump->um_fsckpid = 0;
1292927a12aeSKirk McKusick 	}
12930d7935fdSAttilio Rao 	g_vfs_close(ump->um_cp);
129443920011SPoul-Henning Kamp 	g_topology_unlock();
129543920011SPoul-Henning Kamp 	PICKUP_GIANT();
12966476c0d2SJohn Dyson 	vrele(ump->um_devvp);
129749c4791cSEdward Tomasz Napierala 	dev_rel(ump->um_dev);
12983ba649d7SJeff Roberson 	mtx_destroy(UFS_MTX(ump));
12991a60c7fcSPawel Jakub Dawidek 	if (mp->mnt_gjprovider != NULL) {
13001a60c7fcSPawel Jakub Dawidek 		free(mp->mnt_gjprovider, M_UFSMNT);
13011a60c7fcSPawel Jakub Dawidek 		mp->mnt_gjprovider = NULL;
13021a60c7fcSPawel Jakub Dawidek 	}
1303f55ff3f3SIan Dowse 	free(fs->fs_csp, M_UFSMNT);
1304df8bae1dSRodney W. Grimes 	free(fs, M_UFSMNT);
1305df8bae1dSRodney W. Grimes 	free(ump, M_UFSMNT);
130677465d93SAlfred Perlstein 	mp->mnt_data = NULL;
13075da56ddbSTor Egge 	MNT_ILOCK(mp);
1308cc9d8990SPeter Wemm 	mp->mnt_flag &= ~MNT_LOCAL;
13095da56ddbSTor Egge 	MNT_IUNLOCK(mp);
1310df8bae1dSRodney W. Grimes 	return (error);
13116fecb4e4SKonstantin Belousov 
13126fecb4e4SKonstantin Belousov fail:
13136fecb4e4SKonstantin Belousov 	if (susp) {
13146fecb4e4SKonstantin Belousov 		vfs_write_resume(mp);
13156fecb4e4SKonstantin Belousov 		vn_start_write(NULL, &mp, V_WAIT);
13166fecb4e4SKonstantin Belousov 	}
1317df86ccf6SKonstantin Belousov #ifdef UFS_EXTATTR
1318df86ccf6SKonstantin Belousov 	if (e_restart) {
1319df86ccf6SKonstantin Belousov 		ufs_extattr_uepm_init(&ump->um_extattr);
1320df86ccf6SKonstantin Belousov #ifdef UFS_EXTATTR_AUTOSTART
1321df86ccf6SKonstantin Belousov 		(void) ufs_extattr_autostart(mp, td);
1322df86ccf6SKonstantin Belousov #endif
1323df86ccf6SKonstantin Belousov 	}
1324df86ccf6SKonstantin Belousov #endif
1325df86ccf6SKonstantin Belousov 
13266fecb4e4SKonstantin Belousov 	return (error);
1327df8bae1dSRodney W. Grimes }
1328df8bae1dSRodney W. Grimes 
1329df8bae1dSRodney W. Grimes /*
1330df8bae1dSRodney W. Grimes  * Flush out all the files in a filesystem.
1331df8bae1dSRodney W. Grimes  */
133226f9a767SRodney W. Grimes int
1333b40ce416SJulian Elischer ffs_flushfiles(mp, flags, td)
133405f4ff5dSPoul-Henning Kamp 	struct mount *mp;
1335df8bae1dSRodney W. Grimes 	int flags;
1336b40ce416SJulian Elischer 	struct thread *td;
1337df8bae1dSRodney W. Grimes {
133805f4ff5dSPoul-Henning Kamp 	struct ufsmount *ump;
1339c9671602SPoul-Henning Kamp 	int error;
1340df8bae1dSRodney W. Grimes 
1341df8bae1dSRodney W. Grimes 	ump = VFSTOUFS(mp);
1342df8bae1dSRodney W. Grimes #ifdef QUOTA
1343df8bae1dSRodney W. Grimes 	if (mp->mnt_flag & MNT_QUOTA) {
1344c1d9efcbSPoul-Henning Kamp 		int i;
1345f257b7a5SAlfred Perlstein 		error = vflush(mp, 0, SKIPSYSTEM|flags, td);
1346c1d9efcbSPoul-Henning Kamp 		if (error)
1347df8bae1dSRodney W. Grimes 			return (error);
1348df8bae1dSRodney W. Grimes 		for (i = 0; i < MAXQUOTAS; i++) {
1349b40ce416SJulian Elischer 			quotaoff(td, mp, i);
1350df8bae1dSRodney W. Grimes 		}
1351df8bae1dSRodney W. Grimes 		/*
1352df8bae1dSRodney W. Grimes 		 * Here we fall through to vflush again to ensure
1353df8bae1dSRodney W. Grimes 		 * that we have gotten rid of all the system vnodes.
1354df8bae1dSRodney W. Grimes 		 */
1355df8bae1dSRodney W. Grimes 	}
1356df8bae1dSRodney W. Grimes #endif
1357e6e370a7SJeff Roberson 	ASSERT_VOP_LOCKED(ump->um_devvp, "ffs_flushfiles");
1358e6e370a7SJeff Roberson 	if (ump->um_devvp->v_vflag & VV_COPYONWRITE) {
1359f257b7a5SAlfred Perlstein 		if ((error = vflush(mp, 0, SKIPSYSTEM | flags, td)) != 0)
1360f2a2857bSKirk McKusick 			return (error);
1361f2a2857bSKirk McKusick 		ffs_snapshot_unmount(mp);
136295e7a3c3STor Egge 		flags |= FORCECLOSE;
1363f2a2857bSKirk McKusick 		/*
1364f2a2857bSKirk McKusick 		 * Here we fall through to vflush again to ensure
1365f2a2857bSKirk McKusick 		 * that we have gotten rid of all the system vnodes.
1366f2a2857bSKirk McKusick 		 */
1367f2a2857bSKirk McKusick 	}
1368b1897c19SJulian Elischer         /*
1369b1897c19SJulian Elischer 	 * Flush all the files.
1370b1897c19SJulian Elischer 	 */
1371f257b7a5SAlfred Perlstein 	if ((error = vflush(mp, 0, flags, td)) != 0)
1372b1897c19SJulian Elischer 		return (error);
1373b1897c19SJulian Elischer 	/*
1374b1897c19SJulian Elischer 	 * Flush filesystem metadata.
1375b1897c19SJulian Elischer 	 */
1376cb05b60aSAttilio Rao 	vn_lock(ump->um_devvp, LK_EXCLUSIVE | LK_RETRY);
13778df6bac4SPoul-Henning Kamp 	error = VOP_FSYNC(ump->um_devvp, MNT_WAIT, td);
137822db15c0SAttilio Rao 	VOP_UNLOCK(ump->um_devvp, 0);
1379df8bae1dSRodney W. Grimes 	return (error);
1380df8bae1dSRodney W. Grimes }
1381df8bae1dSRodney W. Grimes 
1382df8bae1dSRodney W. Grimes /*
1383df8bae1dSRodney W. Grimes  * Get filesystem statistics.
1384df8bae1dSRodney W. Grimes  */
1385adf41577SPoul-Henning Kamp static int
1386dfd233edSAttilio Rao ffs_statfs(mp, sbp)
1387df8bae1dSRodney W. Grimes 	struct mount *mp;
138805f4ff5dSPoul-Henning Kamp 	struct statfs *sbp;
1389df8bae1dSRodney W. Grimes {
139005f4ff5dSPoul-Henning Kamp 	struct ufsmount *ump;
139105f4ff5dSPoul-Henning Kamp 	struct fs *fs;
1392df8bae1dSRodney W. Grimes 
1393df8bae1dSRodney W. Grimes 	ump = VFSTOUFS(mp);
1394df8bae1dSRodney W. Grimes 	fs = ump->um_fs;
13951c85e6a3SKirk McKusick 	if (fs->fs_magic != FS_UFS1_MAGIC && fs->fs_magic != FS_UFS2_MAGIC)
1396df8bae1dSRodney W. Grimes 		panic("ffs_statfs");
1397fde81c7dSKirk McKusick 	sbp->f_version = STATFS_VERSION;
1398df8bae1dSRodney W. Grimes 	sbp->f_bsize = fs->fs_fsize;
1399df8bae1dSRodney W. Grimes 	sbp->f_iosize = fs->fs_bsize;
1400df8bae1dSRodney W. Grimes 	sbp->f_blocks = fs->fs_dsize;
14013ba649d7SJeff Roberson 	UFS_LOCK(ump);
1402df8bae1dSRodney W. Grimes 	sbp->f_bfree = fs->fs_cstotal.cs_nbfree * fs->fs_frag +
14039ccb939eSKirk McKusick 	    fs->fs_cstotal.cs_nffree + dbtofsb(fs, fs->fs_pendingblocks);
14049ccb939eSKirk McKusick 	sbp->f_bavail = freespace(fs, fs->fs_minfree) +
14059ccb939eSKirk McKusick 	    dbtofsb(fs, fs->fs_pendingblocks);
1406df8bae1dSRodney W. Grimes 	sbp->f_files =  fs->fs_ncg * fs->fs_ipg - ROOTINO;
14079ccb939eSKirk McKusick 	sbp->f_ffree = fs->fs_cstotal.cs_nifree + fs->fs_pendinginodes;
14083ba649d7SJeff Roberson 	UFS_UNLOCK(ump);
1409fde81c7dSKirk McKusick 	sbp->f_namemax = NAME_MAX;
1410df8bae1dSRodney W. Grimes 	return (0);
1411df8bae1dSRodney W. Grimes }
1412df8bae1dSRodney W. Grimes 
1413df8bae1dSRodney W. Grimes /*
1414df8bae1dSRodney W. Grimes  * Go through the disk queues to initiate sandbagged IO;
1415df8bae1dSRodney W. Grimes  * go through the inodes to write those that have been modified;
1416df8bae1dSRodney W. Grimes  * initiate the writing of the super block if it has been modified.
1417df8bae1dSRodney W. Grimes  *
1418df8bae1dSRodney W. Grimes  * Note: we are always called with the filesystem marked `MPBUSY'.
1419df8bae1dSRodney W. Grimes  */
1420adf41577SPoul-Henning Kamp static int
1421dfd233edSAttilio Rao ffs_sync(mp, waitfor)
1422df8bae1dSRodney W. Grimes 	struct mount *mp;
1423df8bae1dSRodney W. Grimes 	int waitfor;
1424df8bae1dSRodney W. Grimes {
142582be0a5aSTor Egge 	struct vnode *mvp, *vp, *devvp;
1426dfd233edSAttilio Rao 	struct thread *td;
1427996c772fSJohn Dyson 	struct inode *ip;
1428996c772fSJohn Dyson 	struct ufsmount *ump = VFSTOUFS(mp);
1429996c772fSJohn Dyson 	struct fs *fs;
14309b971133SKirk McKusick 	int error, count, wait, lockreq, allerror = 0;
1431791dd2faSTor Egge 	int suspend;
1432791dd2faSTor Egge 	int suspended;
1433791dd2faSTor Egge 	int secondary_writes;
1434791dd2faSTor Egge 	int secondary_accwrites;
1435791dd2faSTor Egge 	int softdep_deps;
1436791dd2faSTor Egge 	int softdep_accdeps;
1437156cb265SPoul-Henning Kamp 	struct bufobj *bo;
1438df8bae1dSRodney W. Grimes 
1439dfd233edSAttilio Rao 	td = curthread;
1440df8bae1dSRodney W. Grimes 	fs = ump->um_fs;
1441*b60ee81eSKirk McKusick 	if (fs->fs_fmod != 0 && fs->fs_ronly != 0 && ump->um_fsckpid == 0)
1442*b60ee81eSKirk McKusick 		panic("%s: ffs_sync: modification on read-only filesystem",
1443*b60ee81eSKirk McKusick 		    fs->fs_fsmnt);
1444df8bae1dSRodney W. Grimes 	/*
1445df8bae1dSRodney W. Grimes 	 * Write back each (modified) inode.
1446df8bae1dSRodney W. Grimes 	 */
14479b971133SKirk McKusick 	wait = 0;
1448791dd2faSTor Egge 	suspend = 0;
1449791dd2faSTor Egge 	suspended = 0;
1450245df27cSMatthew Dillon 	lockreq = LK_EXCLUSIVE | LK_NOWAIT;
1451791dd2faSTor Egge 	if (waitfor == MNT_SUSPEND) {
1452791dd2faSTor Egge 		suspend = 1;
1453791dd2faSTor Egge 		waitfor = MNT_WAIT;
1454791dd2faSTor Egge 	}
14559b971133SKirk McKusick 	if (waitfor == MNT_WAIT) {
14569b971133SKirk McKusick 		wait = 1;
1457245df27cSMatthew Dillon 		lockreq = LK_EXCLUSIVE;
14589b971133SKirk McKusick 	}
145941d4783dSJeff Roberson 	lockreq |= LK_INTERLOCK | LK_SLEEPFAIL;
1460ca430f2eSAlexander Kabaev 	MNT_ILOCK(mp);
1461df8bae1dSRodney W. Grimes loop:
1462791dd2faSTor Egge 	/* Grab snapshot of secondary write counts */
1463791dd2faSTor Egge 	secondary_writes = mp->mnt_secondary_writes;
1464791dd2faSTor Egge 	secondary_accwrites = mp->mnt_secondary_accwrites;
1465791dd2faSTor Egge 
1466791dd2faSTor Egge 	/* Grab snapshot of softdep dependency counts */
1467791dd2faSTor Egge 	MNT_IUNLOCK(mp);
1468791dd2faSTor Egge 	softdep_get_depcounts(mp, &softdep_deps, &softdep_accdeps);
1469791dd2faSTor Egge 	MNT_ILOCK(mp);
1470791dd2faSTor Egge 
147182be0a5aSTor Egge 	MNT_VNODE_FOREACH(vp, mp, mvp) {
1472245df27cSMatthew Dillon 		/*
1473245df27cSMatthew Dillon 		 * Depend on the mntvnode_slock to keep things stable enough
1474245df27cSMatthew Dillon 		 * for a quick test.  Since there might be hundreds of
1475245df27cSMatthew Dillon 		 * thousands of vnodes, we cannot afford even a subroutine
1476245df27cSMatthew Dillon 		 * call unless there's a good chance that we have work to do.
1477245df27cSMatthew Dillon 		 */
14782f05568aSJeff Roberson 		VI_LOCK(vp);
1479fe68abe2SJeff Roberson 		if (vp->v_iflag & VI_DOOMED) {
14802f05568aSJeff Roberson 			VI_UNLOCK(vp);
14812f05568aSJeff Roberson 			continue;
14822f05568aSJeff Roberson 		}
1483df8bae1dSRodney W. Grimes 		ip = VTOI(vp);
1484cf60e8e4SKirk McKusick 		if (vp->v_type == VNON || ((ip->i_flag &
1485cf60e8e4SKirk McKusick 		    (IN_ACCESS | IN_CHANGE | IN_MODIFIED | IN_UPDATE)) == 0 &&
1486156cb265SPoul-Henning Kamp 		    vp->v_bufobj.bo_dirty.bv_cnt == 0)) {
14872f05568aSJeff Roberson 			VI_UNLOCK(vp);
1488df8bae1dSRodney W. Grimes 			continue;
1489996c772fSJohn Dyson 		}
1490ca430f2eSAlexander Kabaev 		MNT_IUNLOCK(mp);
1491b40ce416SJulian Elischer 		if ((error = vget(vp, lockreq, td)) != 0) {
1492ca430f2eSAlexander Kabaev 			MNT_ILOCK(mp);
149382be0a5aSTor Egge 			if (error == ENOENT || error == ENOLCK) {
149482be0a5aSTor Egge 				MNT_VNODE_FOREACH_ABORT_ILOCKED(mp, mvp);
1495df8bae1dSRodney W. Grimes 				goto loop;
149682be0a5aSTor Egge 			}
14972f05568aSJeff Roberson 			continue;
14982f05568aSJeff Roberson 		}
149940854ff5SPoul-Henning Kamp 		if ((error = ffs_syncvnode(vp, waitfor)) != 0)
1500df8bae1dSRodney W. Grimes 			allerror = error;
150141d4783dSJeff Roberson 		vput(vp);
1502ca430f2eSAlexander Kabaev 		MNT_ILOCK(mp);
1503245df27cSMatthew Dillon 	}
1504ca430f2eSAlexander Kabaev 	MNT_IUNLOCK(mp);
1505df8bae1dSRodney W. Grimes 	/*
1506df8bae1dSRodney W. Grimes 	 * Force stale filesystem control information to be flushed.
1507df8bae1dSRodney W. Grimes 	 */
15089b971133SKirk McKusick 	if (waitfor == MNT_WAIT) {
1509b40ce416SJulian Elischer 		if ((error = softdep_flushworklist(ump->um_mountp, &count, td)))
15109b971133SKirk McKusick 			allerror = error;
15119b971133SKirk McKusick 		/* Flushed work items may create new vnodes to clean */
15129ab73fd1SKirk McKusick 		if (allerror == 0 && count) {
1513ca430f2eSAlexander Kabaev 			MNT_ILOCK(mp);
15149b971133SKirk McKusick 			goto loop;
15159b971133SKirk McKusick 		}
15169b971133SKirk McKusick 	}
1517589c7af9SKirk McKusick #ifdef QUOTA
1518589c7af9SKirk McKusick 	qsync(mp);
1519589c7af9SKirk McKusick #endif
1520112f7372SKirk McKusick 	devvp = ump->um_devvp;
1521156cb265SPoul-Henning Kamp 	bo = &devvp->v_bufobj;
1522698b1a66SJeff Roberson 	BO_LOCK(bo);
1523112f7372SKirk McKusick 	if (waitfor != MNT_LAZY &&
1524156cb265SPoul-Henning Kamp 	    (bo->bo_numoutput > 0 || bo->bo_dirty.bv_cnt > 0)) {
1525698b1a66SJeff Roberson 		BO_UNLOCK(bo);
1526698b1a66SJeff Roberson 		vn_lock(devvp, LK_EXCLUSIVE | LK_RETRY);
15278df6bac4SPoul-Henning Kamp 		if ((error = VOP_FSYNC(devvp, waitfor, td)) != 0)
1528df8bae1dSRodney W. Grimes 			allerror = error;
152922db15c0SAttilio Rao 		VOP_UNLOCK(devvp, 0);
15309ab73fd1SKirk McKusick 		if (allerror == 0 && waitfor == MNT_WAIT) {
1531ca430f2eSAlexander Kabaev 			MNT_ILOCK(mp);
1532112f7372SKirk McKusick 			goto loop;
1533b1897c19SJulian Elischer 		}
1534791dd2faSTor Egge 	} else if (suspend != 0) {
1535791dd2faSTor Egge 		if (softdep_check_suspend(mp,
1536791dd2faSTor Egge 					  devvp,
1537791dd2faSTor Egge 					  softdep_deps,
1538791dd2faSTor Egge 					  softdep_accdeps,
1539791dd2faSTor Egge 					  secondary_writes,
1540791dd2faSTor Egge 					  secondary_accwrites) != 0)
1541791dd2faSTor Egge 			goto loop;	/* More work needed */
1542791dd2faSTor Egge 		mtx_assert(MNT_MTX(mp), MA_OWNED);
1543ca2fa807STor Egge 		mp->mnt_kern_flag |= MNTK_SUSPEND2 | MNTK_SUSPENDED;
1544791dd2faSTor Egge 		MNT_IUNLOCK(mp);
1545791dd2faSTor Egge 		suspended = 1;
1546112f7372SKirk McKusick 	} else
1547698b1a66SJeff Roberson 		BO_UNLOCK(bo);
1548996c772fSJohn Dyson 	/*
1549996c772fSJohn Dyson 	 * Write back modified superblock.
1550996c772fSJohn Dyson 	 */
1551791dd2faSTor Egge 	if (fs->fs_fmod != 0 &&
1552791dd2faSTor Egge 	    (error = ffs_sbupdate(ump, waitfor, suspended)) != 0)
1553996c772fSJohn Dyson 		allerror = error;
1554df8bae1dSRodney W. Grimes 	return (allerror);
1555df8bae1dSRodney W. Grimes }
1556df8bae1dSRodney W. Grimes 
1557df8bae1dSRodney W. Grimes int
1558a0595d02SKirk McKusick ffs_vget(mp, ino, flags, vpp)
1559df8bae1dSRodney W. Grimes 	struct mount *mp;
1560df8bae1dSRodney W. Grimes 	ino_t ino;
1561a0595d02SKirk McKusick 	int flags;
1562df8bae1dSRodney W. Grimes 	struct vnode **vpp;
1563df8bae1dSRodney W. Grimes {
15647b7ed832SKonstantin Belousov 	return (ffs_vgetf(mp, ino, flags, vpp, 0));
15657b7ed832SKonstantin Belousov }
15667b7ed832SKonstantin Belousov 
15677b7ed832SKonstantin Belousov int
15687b7ed832SKonstantin Belousov ffs_vgetf(mp, ino, flags, vpp, ffs_flags)
15697b7ed832SKonstantin Belousov 	struct mount *mp;
15707b7ed832SKonstantin Belousov 	ino_t ino;
15717b7ed832SKonstantin Belousov 	int flags;
15727b7ed832SKonstantin Belousov 	struct vnode **vpp;
15737b7ed832SKonstantin Belousov 	int ffs_flags;
15747b7ed832SKonstantin Belousov {
1575996c772fSJohn Dyson 	struct fs *fs;
1576996c772fSJohn Dyson 	struct inode *ip;
1577df8bae1dSRodney W. Grimes 	struct ufsmount *ump;
1578df8bae1dSRodney W. Grimes 	struct buf *bp;
1579df8bae1dSRodney W. Grimes 	struct vnode *vp;
158089c9c53dSPoul-Henning Kamp 	struct cdev *dev;
1581f576a00dSSemen Ustimenko 	int error;
1582df8bae1dSRodney W. Grimes 
158351f5ce0cSPoul-Henning Kamp 	error = vfs_hash_get(mp, ino, flags, curthread, vpp, NULL, NULL);
1584e82ef95cSPoul-Henning Kamp 	if (error || *vpp != NULL)
158514bc0685SPoul-Henning Kamp 		return (error);
1586f576a00dSSemen Ustimenko 
1587f576a00dSSemen Ustimenko 	/*
1588d6919865SJeff Roberson 	 * We must promote to an exclusive lock for vnode creation.  This
1589d6919865SJeff Roberson 	 * can happen if lookup is passed LOCKSHARED.
1590d6919865SJeff Roberson  	 */
1591d6919865SJeff Roberson 	if ((flags & LK_TYPE_MASK) == LK_SHARED) {
1592d6919865SJeff Roberson 		flags &= ~LK_TYPE_MASK;
1593d6919865SJeff Roberson 		flags |= LK_EXCLUSIVE;
1594d6919865SJeff Roberson 	}
1595d6919865SJeff Roberson 
1596d6919865SJeff Roberson 	/*
159713866b3fSSemen Ustimenko 	 * We do not lock vnode creation as it is believed to be too
1598f576a00dSSemen Ustimenko 	 * expensive for such rare case as simultaneous creation of vnode
1599f576a00dSSemen Ustimenko 	 * for same ino by different processes. We just allow them to race
1600f576a00dSSemen Ustimenko 	 * and check later to decide who wins. Let the race begin!
1601f576a00dSSemen Ustimenko 	 */
160214bc0685SPoul-Henning Kamp 
160314bc0685SPoul-Henning Kamp 	ump = VFSTOUFS(mp);
160414bc0685SPoul-Henning Kamp 	dev = ump->um_dev;
160514bc0685SPoul-Henning Kamp 	fs = ump->um_fs;
1606df8bae1dSRodney W. Grimes 
16072094ddb6SDavid Greenman 	/*
16081ede983cSDag-Erling Smørgrav 	 * If this malloc() is performed after the getnewvnode()
16092f9bae59SDavid Greenman 	 * it might block, leaving a vnode with a NULL v_data to be
16102f9bae59SDavid Greenman 	 * found by ffs_sync() if a sync happens to fire right then,
16112f9bae59SDavid Greenman 	 * which will cause a panic because ffs_sync() blindly
16122f9bae59SDavid Greenman 	 * dereferences vp->v_data (as well it should).
16132f9bae59SDavid Greenman 	 */
161414bc0685SPoul-Henning Kamp 	ip = uma_zalloc(uma_inode, M_WAITOK | M_ZERO);
16152f9bae59SDavid Greenman 
1616df8bae1dSRodney W. Grimes 	/* Allocate a new vnode/inode. */
161702f2c6a9SPoul-Henning Kamp 	if (fs->fs_magic == FS_UFS1_MAGIC)
161802f2c6a9SPoul-Henning Kamp 		error = getnewvnode("ufs", mp, &ffs_vnodeops1, &vp);
161902f2c6a9SPoul-Henning Kamp 	else
162002f2c6a9SPoul-Henning Kamp 		error = getnewvnode("ufs", mp, &ffs_vnodeops2, &vp);
1621c9671602SPoul-Henning Kamp 	if (error) {
1622df8bae1dSRodney W. Grimes 		*vpp = NULL;
1623aa4d7a8aSPoul-Henning Kamp 		uma_zfree(uma_inode, ip);
1624df8bae1dSRodney W. Grimes 		return (error);
1625df8bae1dSRodney W. Grimes 	}
162667e87166SBoris Popov 	/*
162733fc3625SJohn Baldwin 	 * FFS supports recursive locking.
162867e87166SBoris Popov 	 */
16293634d5b2SJohn Baldwin 	lockmgr(vp->v_vnlock, LK_EXCLUSIVE, NULL);
1630628f51d2SAttilio Rao 	VN_LOCK_AREC(vp);
1631df8bae1dSRodney W. Grimes 	vp->v_data = ip;
16325d9d81e7SPoul-Henning Kamp 	vp->v_bufobj.bo_bsize = fs->fs_bsize;
1633df8bae1dSRodney W. Grimes 	ip->i_vnode = vp;
16341c85e6a3SKirk McKusick 	ip->i_ump = ump;
1635c94cd5fcSPoul-Henning Kamp 	ip->i_fs = fs;
1636df8bae1dSRodney W. Grimes 	ip->i_dev = dev;
1637df8bae1dSRodney W. Grimes 	ip->i_number = ino;
1638e65f5a4eSKonstantin Belousov 	ip->i_ea_refs = 0;
1639df8bae1dSRodney W. Grimes #ifdef QUOTA
1640c1d9efcbSPoul-Henning Kamp 	{
1641c1d9efcbSPoul-Henning Kamp 		int i;
1642df8bae1dSRodney W. Grimes 		for (i = 0; i < MAXQUOTAS; i++)
1643df8bae1dSRodney W. Grimes 			ip->i_dquot[i] = NODQUOT;
1644c1d9efcbSPoul-Henning Kamp 	}
1645df8bae1dSRodney W. Grimes #endif
1646df8bae1dSRodney W. Grimes 
16477b7ed832SKonstantin Belousov 	if (ffs_flags & FFSV_FORCEINSMQ)
16487b7ed832SKonstantin Belousov 		vp->v_vflag |= VV_FORCEINSMQ;
164961b9d89fSTor Egge 	error = insmntque(vp, mp);
165061b9d89fSTor Egge 	if (error != 0) {
16516cc745d2SKonstantin Belousov 		uma_zfree(uma_inode, ip);
165261b9d89fSTor Egge 		*vpp = NULL;
165361b9d89fSTor Egge 		return (error);
165461b9d89fSTor Egge 	}
16557b7ed832SKonstantin Belousov 	vp->v_vflag &= ~VV_FORCEINSMQ;
1656a80d8caaSPawel Jakub Dawidek 	error = vfs_hash_insert(vp, ino, flags, curthread, vpp, NULL, NULL);
165745c26fa2SPoul-Henning Kamp 	if (error || *vpp != NULL)
1658f576a00dSSemen Ustimenko 		return (error);
1659f576a00dSSemen Ustimenko 
1660df8bae1dSRodney W. Grimes 	/* Read in the disk contents for the inode, copy into the inode. */
1661c9671602SPoul-Henning Kamp 	error = bread(ump->um_devvp, fsbtodb(fs, ino_to_fsba(fs, ino)),
1662c9671602SPoul-Henning Kamp 	    (int)fs->fs_bsize, NOCRED, &bp);
1663c9671602SPoul-Henning Kamp 	if (error) {
1664df8bae1dSRodney W. Grimes 		/*
1665df8bae1dSRodney W. Grimes 		 * The inode does not contain anything useful, so it would
1666df8bae1dSRodney W. Grimes 		 * be misleading to leave it on its hash chain. With mode
1667df8bae1dSRodney W. Grimes 		 * still zero, it will be unlinked and returned to the free
1668df8bae1dSRodney W. Grimes 		 * list by vput().
1669df8bae1dSRodney W. Grimes 		 */
1670df8bae1dSRodney W. Grimes 		brelse(bp);
1671bd7e5f99SJohn Dyson 		vput(vp);
1672df8bae1dSRodney W. Grimes 		*vpp = NULL;
1673df8bae1dSRodney W. Grimes 		return (error);
1674df8bae1dSRodney W. Grimes 	}
1675de6ba7c0SPoul-Henning Kamp 	if (ip->i_ump->um_fstype == UFS1)
1676a163d034SWarner Losh 		ip->i_din1 = uma_zalloc(uma_ufs1, M_WAITOK);
1677de6ba7c0SPoul-Henning Kamp 	else
1678a163d034SWarner Losh 		ip->i_din2 = uma_zalloc(uma_ufs2, M_WAITOK);
1679de6ba7c0SPoul-Henning Kamp 	ffs_load_inode(bp, ip, fs, ino);
1680b1897c19SJulian Elischer 	if (DOINGSOFTDEP(vp))
1681b1897c19SJulian Elischer 		softdep_load_inodeblock(ip);
1682b1897c19SJulian Elischer 	else
1683b1897c19SJulian Elischer 		ip->i_effnlink = ip->i_nlink;
1684bd7e5f99SJohn Dyson 	bqrelse(bp);
1685df8bae1dSRodney W. Grimes 
1686df8bae1dSRodney W. Grimes 	/*
1687df8bae1dSRodney W. Grimes 	 * Initialize the vnode from the inode, check for aliases.
1688df8bae1dSRodney W. Grimes 	 * Note that the underlying vnode may have changed.
1689df8bae1dSRodney W. Grimes 	 */
169002f2c6a9SPoul-Henning Kamp 	if (ip->i_ump->um_fstype == UFS1)
169102f2c6a9SPoul-Henning Kamp 		error = ufs_vinit(mp, &ffs_fifoops1, &vp);
169202f2c6a9SPoul-Henning Kamp 	else
169302f2c6a9SPoul-Henning Kamp 		error = ufs_vinit(mp, &ffs_fifoops2, &vp);
1694c9671602SPoul-Henning Kamp 	if (error) {
1695df8bae1dSRodney W. Grimes 		vput(vp);
1696df8bae1dSRodney W. Grimes 		*vpp = NULL;
1697df8bae1dSRodney W. Grimes 		return (error);
1698df8bae1dSRodney W. Grimes 	}
1699de68347bSPoul-Henning Kamp 
1700df8bae1dSRodney W. Grimes 	/*
17015c24d6eeSPoul-Henning Kamp 	 * Finish inode initialization.
1702df8bae1dSRodney W. Grimes 	 */
170333fc3625SJohn Baldwin 	if (vp->v_type != VFIFO) {
170433fc3625SJohn Baldwin 		/* FFS supports shared locking for all files except fifos. */
170533fc3625SJohn Baldwin 		VN_LOCK_ASHARE(vp);
170633fc3625SJohn Baldwin 	}
1707de68347bSPoul-Henning Kamp 
1708df8bae1dSRodney W. Grimes 	/*
1709df8bae1dSRodney W. Grimes 	 * Set up a generation number for this inode if it does not
1710df8bae1dSRodney W. Grimes 	 * already have one. This should only happen on old filesystems.
1711df8bae1dSRodney W. Grimes 	 */
1712df8bae1dSRodney W. Grimes 	if (ip->i_gen == 0) {
1713aca3e497SKirk McKusick 		ip->i_gen = arc4random() / 2 + 1;
17141c85e6a3SKirk McKusick 		if ((vp->v_mount->mnt_flag & MNT_RDONLY) == 0) {
1715df8bae1dSRodney W. Grimes 			ip->i_flag |= IN_MODIFIED;
1716b403319bSAlexander Kabaev 			DIP_SET(ip, i_gen, ip->i_gen);
17171c85e6a3SKirk McKusick 		}
1718df8bae1dSRodney W. Grimes 	}
1719763bbd2fSRobert Watson #ifdef MAC
1720763bbd2fSRobert Watson 	if ((mp->mnt_flag & MNT_MULTILABEL) && ip->i_mode) {
1721763bbd2fSRobert Watson 		/*
1722763bbd2fSRobert Watson 		 * If this vnode is already allocated, and we're running
1723763bbd2fSRobert Watson 		 * multi-label, attempt to perform a label association
1724763bbd2fSRobert Watson 		 * from the extended attributes on the inode.
1725763bbd2fSRobert Watson 		 */
172630d239bcSRobert Watson 		error = mac_vnode_associate_extattr(mp, vp);
1727763bbd2fSRobert Watson 		if (error) {
1728763bbd2fSRobert Watson 			/* ufs_inactive will release ip->i_devvp ref. */
1729763bbd2fSRobert Watson 			vput(vp);
1730763bbd2fSRobert Watson 			*vpp = NULL;
1731763bbd2fSRobert Watson 			return (error);
1732763bbd2fSRobert Watson 		}
1733763bbd2fSRobert Watson 	}
1734763bbd2fSRobert Watson #endif
1735763bbd2fSRobert Watson 
1736df8bae1dSRodney W. Grimes 	*vpp = vp;
1737df8bae1dSRodney W. Grimes 	return (0);
1738df8bae1dSRodney W. Grimes }
1739df8bae1dSRodney W. Grimes 
1740df8bae1dSRodney W. Grimes /*
1741df8bae1dSRodney W. Grimes  * File handle to vnode
1742df8bae1dSRodney W. Grimes  *
1743df8bae1dSRodney W. Grimes  * Have to be really careful about stale file handles:
1744df8bae1dSRodney W. Grimes  * - check that the inode number is valid
1745df8bae1dSRodney W. Grimes  * - call ffs_vget() to get the locked inode
1746df8bae1dSRodney W. Grimes  * - check for an unallocated inode (i_mode == 0)
1747df8bae1dSRodney W. Grimes  * - check that the given client host has export rights and return
1748df8bae1dSRodney W. Grimes  *   those rights via. exflagsp and credanonp
1749df8bae1dSRodney W. Grimes  */
1750adf41577SPoul-Henning Kamp static int
1751694a586aSRick Macklem ffs_fhtovp(mp, fhp, flags, vpp)
175205f4ff5dSPoul-Henning Kamp 	struct mount *mp;
1753df8bae1dSRodney W. Grimes 	struct fid *fhp;
1754694a586aSRick Macklem 	int flags;
1755df8bae1dSRodney W. Grimes 	struct vnode **vpp;
1756df8bae1dSRodney W. Grimes {
175705f4ff5dSPoul-Henning Kamp 	struct ufid *ufhp;
1758df8bae1dSRodney W. Grimes 	struct fs *fs;
1759df8bae1dSRodney W. Grimes 
1760df8bae1dSRodney W. Grimes 	ufhp = (struct ufid *)fhp;
1761df8bae1dSRodney W. Grimes 	fs = VFSTOUFS(mp)->um_fs;
1762df8bae1dSRodney W. Grimes 	if (ufhp->ufid_ino < ROOTINO ||
1763df8bae1dSRodney W. Grimes 	    ufhp->ufid_ino >= fs->fs_ncg * fs->fs_ipg)
1764df8bae1dSRodney W. Grimes 		return (ESTALE);
1765694a586aSRick Macklem 	return (ufs_fhtovp(mp, ufhp, flags, vpp));
1766df8bae1dSRodney W. Grimes }
1767df8bae1dSRodney W. Grimes 
/*
 * Initialize the filesystem.
 *
 * Runs softdep_initialize() and then ufs_init(); the return value is
 * that of ufs_init().
 */
static int
ffs_init(struct vfsconf *vfsp)
{
	int error;

	softdep_initialize();
	error = ufs_init(vfsp);
	return (error);
}
1779996c772fSJohn Dyson 
/*
 * Undo the work of ffs_init(), in the opposite order: tear down the
 * common UFS state, then soft updates.  The status reported is the one
 * returned by ufs_uninit().
 */
static int
ffs_uninit(struct vfsconf *vfsp)
{
	int error;

	error = ufs_uninit(vfsp);
	softdep_uninitialize();
	return (error);
}
17935346934fSIan Dowse 
17945346934fSIan Dowse /*
1795df8bae1dSRodney W. Grimes  * Write a superblock and associated information back to disk.
1796df8bae1dSRodney W. Grimes  */
17971a60c7fcSPawel Jakub Dawidek int
1798927a12aeSKirk McKusick ffs_sbupdate(ump, waitfor, suspended)
1799927a12aeSKirk McKusick 	struct ufsmount *ump;
1800df8bae1dSRodney W. Grimes 	int waitfor;
1801791dd2faSTor Egge 	int suspended;
1802df8bae1dSRodney W. Grimes {
1803927a12aeSKirk McKusick 	struct fs *fs = ump->um_fs;
18043ba649d7SJeff Roberson 	struct buf *sbbp;
180505f4ff5dSPoul-Henning Kamp 	struct buf *bp;
1806df8bae1dSRodney W. Grimes 	int blks;
1807f55ff3f3SIan Dowse 	void *space;
1808996c772fSJohn Dyson 	int i, size, error, allerror = 0;
1809df8bae1dSRodney W. Grimes 
181074f3809aSKirk McKusick 	if (fs->fs_ronly == 1 &&
1811927a12aeSKirk McKusick 	    (ump->um_mountp->mnt_flag & (MNT_RDONLY | MNT_UPDATE)) !=
1812927a12aeSKirk McKusick 	    (MNT_RDONLY | MNT_UPDATE) && ump->um_fsckpid == 0)
181374f3809aSKirk McKusick 		panic("ffs_sbupdate: write read-only filesystem");
1814996c772fSJohn Dyson 	/*
18153ba649d7SJeff Roberson 	 * We use the superblock's buf to serialize calls to ffs_sbupdate().
18163ba649d7SJeff Roberson 	 */
1817927a12aeSKirk McKusick 	sbbp = getblk(ump->um_devvp, btodb(fs->fs_sblockloc),
1818927a12aeSKirk McKusick 	    (int)fs->fs_sbsize, 0, 0, 0);
18193ba649d7SJeff Roberson 	/*
1820996c772fSJohn Dyson 	 * First write back the summary information.
1821996c772fSJohn Dyson 	 */
1822df8bae1dSRodney W. Grimes 	blks = howmany(fs->fs_cssize, fs->fs_fsize);
1823f55ff3f3SIan Dowse 	space = fs->fs_csp;
1824df8bae1dSRodney W. Grimes 	for (i = 0; i < blks; i += fs->fs_frag) {
1825df8bae1dSRodney W. Grimes 		size = fs->fs_bsize;
1826df8bae1dSRodney W. Grimes 		if (i + fs->fs_frag > blks)
1827df8bae1dSRodney W. Grimes 			size = (blks - i) * fs->fs_fsize;
1828927a12aeSKirk McKusick 		bp = getblk(ump->um_devvp, fsbtodb(fs, fs->fs_csaddr + i),
18297261f5f6SJeff Roberson 		    size, 0, 0, 0);
1830df8bae1dSRodney W. Grimes 		bcopy(space, bp->b_data, (u_int)size);
1831f55ff3f3SIan Dowse 		space = (char *)space + size;
1832791dd2faSTor Egge 		if (suspended)
1833791dd2faSTor Egge 			bp->b_flags |= B_VALIDSUSPWRT;
1834996c772fSJohn Dyson 		if (waitfor != MNT_WAIT)
1835df8bae1dSRodney W. Grimes 			bawrite(bp);
18368aef1712SMatthew Dillon 		else if ((error = bwrite(bp)) != 0)
1837996c772fSJohn Dyson 			allerror = error;
1838df8bae1dSRodney W. Grimes 	}
1839996c772fSJohn Dyson 	/*
1840996c772fSJohn Dyson 	 * Now write back the superblock itself. If any errors occurred
1841996c772fSJohn Dyson 	 * up to this point, then fail so that the superblock avoids
1842996c772fSJohn Dyson 	 * being written out as clean.
1843996c772fSJohn Dyson 	 */
18443ba649d7SJeff Roberson 	if (allerror) {
18453ba649d7SJeff Roberson 		brelse(sbbp);
1846996c772fSJohn Dyson 		return (allerror);
18473ba649d7SJeff Roberson 	}
18483ba649d7SJeff Roberson 	bp = sbbp;
184931574422SKirk McKusick 	if (fs->fs_magic == FS_UFS1_MAGIC && fs->fs_sblockloc != SBLOCK_UFS1 &&
185031574422SKirk McKusick 	    (fs->fs_flags & FS_FLAGS_UPDATED) == 0) {
1851*b60ee81eSKirk McKusick 		printf("WARNING: %s: correcting fs_sblockloc from %jd to %d\n",
1852fa5d33e2SKirk McKusick 		    fs->fs_fsmnt, fs->fs_sblockloc, SBLOCK_UFS1);
1853fa5d33e2SKirk McKusick 		fs->fs_sblockloc = SBLOCK_UFS1;
1854fa5d33e2SKirk McKusick 	}
185531574422SKirk McKusick 	if (fs->fs_magic == FS_UFS2_MAGIC && fs->fs_sblockloc != SBLOCK_UFS2 &&
185631574422SKirk McKusick 	    (fs->fs_flags & FS_FLAGS_UPDATED) == 0) {
1857*b60ee81eSKirk McKusick 		printf("WARNING: %s: correcting fs_sblockloc from %jd to %d\n",
1858fa5d33e2SKirk McKusick 		    fs->fs_fsmnt, fs->fs_sblockloc, SBLOCK_UFS2);
1859fa5d33e2SKirk McKusick 		fs->fs_sblockloc = SBLOCK_UFS2;
1860fa5d33e2SKirk McKusick 	}
1861b1897c19SJulian Elischer 	fs->fs_fmod = 0;
1862227ee8a1SPoul-Henning Kamp 	fs->fs_time = time_second;
1863113db2ddSJeff Roberson 	if (fs->fs_flags & FS_DOSOFTDEP)
1864927a12aeSKirk McKusick 		softdep_setup_sbupdate(ump, (struct fs *)bp->b_data, bp);
1865996c772fSJohn Dyson 	bcopy((caddr_t)fs, bp->b_data, (u_int)fs->fs_sbsize);
1866927a12aeSKirk McKusick 	ffs_oldfscompat_write((struct fs *)bp->b_data, ump);
1867791dd2faSTor Egge 	if (suspended)
1868791dd2faSTor Egge 		bp->b_flags |= B_VALIDSUSPWRT;
1869996c772fSJohn Dyson 	if (waitfor != MNT_WAIT)
1870996c772fSJohn Dyson 		bawrite(bp);
18718aef1712SMatthew Dillon 	else if ((error = bwrite(bp)) != 0)
1872996c772fSJohn Dyson 		allerror = error;
1873996c772fSJohn Dyson 	return (allerror);
1874df8bae1dSRodney W. Grimes }
1875d6fe88e4SPoul-Henning Kamp 
/*
 * Extended attribute control: forward the request to the UFS
 * implementation when the kernel is built with UFS_EXTATTR, and to
 * vfs_stdextattrctl() otherwise.  The callee's status is returned.
 */
static int
ffs_extattrctl(struct mount *mp, int cmd, struct vnode *filename_vp,
	int attrnamespace, const char *attrname)
{
	int error;

#ifdef UFS_EXTATTR
	error = ufs_extattrctl(mp, cmd, filename_vp, attrnamespace,
	    attrname);
#else
	error = vfs_stdextattrctl(mp, cmd, filename_vp, attrnamespace,
	    attrname);
#endif
	return (error);
}
1889975512a9SPoul-Henning Kamp 
1890975512a9SPoul-Henning Kamp static void
1891975512a9SPoul-Henning Kamp ffs_ifree(struct ufsmount *ump, struct inode *ip)
1892975512a9SPoul-Henning Kamp {
1893975512a9SPoul-Henning Kamp 
189436329289STim J. Robbins 	if (ump->um_fstype == UFS1 && ip->i_din1 != NULL)
1895aa4d7a8aSPoul-Henning Kamp 		uma_zfree(uma_ufs1, ip->i_din1);
189636329289STim J. Robbins 	else if (ip->i_din2 != NULL)
18978d721e87STim J. Robbins 		uma_zfree(uma_ufs2, ip->i_din2);
1898aa4d7a8aSPoul-Henning Kamp 	uma_zfree(uma_inode, ip);
1899975512a9SPoul-Henning Kamp }
19006e77a041SPoul-Henning Kamp 
1901dd19a799SPoul-Henning Kamp static int dobkgrdwrite = 1;
1902dd19a799SPoul-Henning Kamp SYSCTL_INT(_debug, OID_AUTO, dobkgrdwrite, CTLFLAG_RW, &dobkgrdwrite, 0,
1903dd19a799SPoul-Henning Kamp     "Do background writes (honoring the BV_BKGRDWRITE flag)?");
1904dd19a799SPoul-Henning Kamp 
1905dd19a799SPoul-Henning Kamp /*
1906dd19a799SPoul-Henning Kamp  * Complete a background write started from bwrite.
1907dd19a799SPoul-Henning Kamp  */
1908dd19a799SPoul-Henning Kamp static void
1909dd19a799SPoul-Henning Kamp ffs_backgroundwritedone(struct buf *bp)
1910dd19a799SPoul-Henning Kamp {
1911204ec66dSJeff Roberson 	struct bufobj *bufobj;
1912dd19a799SPoul-Henning Kamp 	struct buf *origbp;
1913dd19a799SPoul-Henning Kamp 
1914dd19a799SPoul-Henning Kamp 	/*
1915dd19a799SPoul-Henning Kamp 	 * Find the original buffer that we are writing.
1916dd19a799SPoul-Henning Kamp 	 */
1917204ec66dSJeff Roberson 	bufobj = bp->b_bufobj;
1918204ec66dSJeff Roberson 	BO_LOCK(bufobj);
1919dd19a799SPoul-Henning Kamp 	if ((origbp = gbincore(bp->b_bufobj, bp->b_lblkno)) == NULL)
1920dd19a799SPoul-Henning Kamp 		panic("backgroundwritedone: lost buffer");
1921204ec66dSJeff Roberson 	/* Grab an extra reference to be dropped by the bufdone() below. */
1922204ec66dSJeff Roberson 	bufobj_wrefl(bufobj);
1923204ec66dSJeff Roberson 	BO_UNLOCK(bufobj);
1924dd19a799SPoul-Henning Kamp 	/*
1925dd19a799SPoul-Henning Kamp 	 * Process dependencies then return any unfinished ones.
1926dd19a799SPoul-Henning Kamp 	 */
192704533fc6SXin LI 	if (!LIST_EMPTY(&bp->b_dep))
1928dd19a799SPoul-Henning Kamp 		buf_complete(bp);
1929dd19a799SPoul-Henning Kamp #ifdef SOFTUPDATES
193004533fc6SXin LI 	if (!LIST_EMPTY(&bp->b_dep))
1931dd19a799SPoul-Henning Kamp 		softdep_move_dependencies(bp, origbp);
1932dd19a799SPoul-Henning Kamp #endif
1933dd19a799SPoul-Henning Kamp 	/*
1934204ec66dSJeff Roberson 	 * This buffer is marked B_NOCACHE so when it is released
1935204ec66dSJeff Roberson 	 * by biodone it will be tossed.
1936dd19a799SPoul-Henning Kamp 	 */
1937dd19a799SPoul-Henning Kamp 	bp->b_flags |= B_NOCACHE;
1938ec9c9e73SAlan Cox 	bp->b_flags &= ~B_CACHE;
1939dd19a799SPoul-Henning Kamp 	bufdone(bp);
1940204ec66dSJeff Roberson 	BO_LOCK(bufobj);
1941dd19a799SPoul-Henning Kamp 	/*
1942dd19a799SPoul-Henning Kamp 	 * Clear the BV_BKGRDINPROG flag in the original buffer
1943dd19a799SPoul-Henning Kamp 	 * and awaken it if it is waiting for the write to complete.
1944dd19a799SPoul-Henning Kamp 	 * If BV_BKGRDINPROG is not set in the original buffer it must
1945dd19a799SPoul-Henning Kamp 	 * have been released and re-instantiated - which is not legal.
1946dd19a799SPoul-Henning Kamp 	 */
1947dd19a799SPoul-Henning Kamp 	KASSERT((origbp->b_vflags & BV_BKGRDINPROG),
1948dd19a799SPoul-Henning Kamp 	    ("backgroundwritedone: lost buffer2"));
1949dd19a799SPoul-Henning Kamp 	origbp->b_vflags &= ~BV_BKGRDINPROG;
1950dd19a799SPoul-Henning Kamp 	if (origbp->b_vflags & BV_BKGRDWAIT) {
1951dd19a799SPoul-Henning Kamp 		origbp->b_vflags &= ~BV_BKGRDWAIT;
1952dd19a799SPoul-Henning Kamp 		wakeup(&origbp->b_xflags);
1953dd19a799SPoul-Henning Kamp 	}
1954204ec66dSJeff Roberson 	BO_UNLOCK(bufobj);
1955dd19a799SPoul-Henning Kamp }
1956dd19a799SPoul-Henning Kamp 
1957dd19a799SPoul-Henning Kamp 
1958dd19a799SPoul-Henning Kamp /*
1959dd19a799SPoul-Henning Kamp  * Write, release buffer on completion.  (Done by iodone
1960dd19a799SPoul-Henning Kamp  * if async).  Do not bother writing anything if the buffer
1961dd19a799SPoul-Henning Kamp  * is invalid.
1962dd19a799SPoul-Henning Kamp  *
1963dd19a799SPoul-Henning Kamp  * Note that we set B_CACHE here, indicating that buffer is
1964dd19a799SPoul-Henning Kamp  * fully valid and thus cacheable.  This is true even of NFS
1965dd19a799SPoul-Henning Kamp  * now so we set it generally.  This could be set either here
1966dd19a799SPoul-Henning Kamp  * or in biodone() since the I/O is synchronous.  We put it
1967dd19a799SPoul-Henning Kamp  * here.
1968dd19a799SPoul-Henning Kamp  */
1969dd19a799SPoul-Henning Kamp static int
1970dd19a799SPoul-Henning Kamp ffs_bufwrite(struct buf *bp)
1971dd19a799SPoul-Henning Kamp {
1972dd19a799SPoul-Henning Kamp 	int oldflags, s;
1973dd19a799SPoul-Henning Kamp 	struct buf *newbp;
1974dd19a799SPoul-Henning Kamp 
1975dd19a799SPoul-Henning Kamp 	CTR3(KTR_BUF, "bufwrite(%p) vp %p flags %X", bp, bp->b_vp, bp->b_flags);
1976dd19a799SPoul-Henning Kamp 	if (bp->b_flags & B_INVAL) {
1977dd19a799SPoul-Henning Kamp 		brelse(bp);
1978dd19a799SPoul-Henning Kamp 		return (0);
1979dd19a799SPoul-Henning Kamp 	}
1980dd19a799SPoul-Henning Kamp 
1981dd19a799SPoul-Henning Kamp 	oldflags = bp->b_flags;
1982dd19a799SPoul-Henning Kamp 
1983d638e093SAttilio Rao 	if (!BUF_ISLOCKED(bp))
1984dd19a799SPoul-Henning Kamp 		panic("bufwrite: buffer is not busy???");
1985dd19a799SPoul-Henning Kamp 	s = splbio();
1986dd19a799SPoul-Henning Kamp 	/*
1987dd19a799SPoul-Henning Kamp 	 * If a background write is already in progress, delay
1988dd19a799SPoul-Henning Kamp 	 * writing this block if it is asynchronous. Otherwise
1989dd19a799SPoul-Henning Kamp 	 * wait for the background write to complete.
1990dd19a799SPoul-Henning Kamp 	 */
1991dd19a799SPoul-Henning Kamp 	BO_LOCK(bp->b_bufobj);
1992dd19a799SPoul-Henning Kamp 	if (bp->b_vflags & BV_BKGRDINPROG) {
1993dd19a799SPoul-Henning Kamp 		if (bp->b_flags & B_ASYNC) {
1994dd19a799SPoul-Henning Kamp 			BO_UNLOCK(bp->b_bufobj);
1995dd19a799SPoul-Henning Kamp 			splx(s);
1996dd19a799SPoul-Henning Kamp 			bdwrite(bp);
1997dd19a799SPoul-Henning Kamp 			return (0);
1998dd19a799SPoul-Henning Kamp 		}
1999dd19a799SPoul-Henning Kamp 		bp->b_vflags |= BV_BKGRDWAIT;
2000dd19a799SPoul-Henning Kamp 		msleep(&bp->b_xflags, BO_MTX(bp->b_bufobj), PRIBIO, "bwrbg", 0);
2001dd19a799SPoul-Henning Kamp 		if (bp->b_vflags & BV_BKGRDINPROG)
2002dd19a799SPoul-Henning Kamp 			panic("bufwrite: still writing");
2003dd19a799SPoul-Henning Kamp 	}
2004dd19a799SPoul-Henning Kamp 	BO_UNLOCK(bp->b_bufobj);
2005dd19a799SPoul-Henning Kamp 
2006dd19a799SPoul-Henning Kamp 	/*
2007dd19a799SPoul-Henning Kamp 	 * If this buffer is marked for background writing and we
2008dd19a799SPoul-Henning Kamp 	 * do not have to wait for it, make a copy and write the
2009dd19a799SPoul-Henning Kamp 	 * copy so as to leave this buffer ready for further use.
2010dd19a799SPoul-Henning Kamp 	 *
2011dd19a799SPoul-Henning Kamp 	 * This optimization eats a lot of memory.  If we have a page
2012dd19a799SPoul-Henning Kamp 	 * or buffer shortfall we can't do it.
2013dd19a799SPoul-Henning Kamp 	 */
2014dd19a799SPoul-Henning Kamp 	if (dobkgrdwrite && (bp->b_xflags & BX_BKGRDWRITE) &&
2015dd19a799SPoul-Henning Kamp 	    (bp->b_flags & B_ASYNC) &&
2016dd19a799SPoul-Henning Kamp 	    !vm_page_count_severe() &&
2017dd19a799SPoul-Henning Kamp 	    !buf_dirty_count_severe()) {
2018dd19a799SPoul-Henning Kamp 		KASSERT(bp->b_iodone == NULL,
2019dd19a799SPoul-Henning Kamp 		    ("bufwrite: needs chained iodone (%p)", bp->b_iodone));
2020dd19a799SPoul-Henning Kamp 
2021dd19a799SPoul-Henning Kamp 		/* get a new block */
2022c1d8b5e8SKonstantin Belousov 		newbp = geteblk(bp->b_bufsize, GB_NOWAIT_BD);
2023c1d8b5e8SKonstantin Belousov 		if (newbp == NULL)
2024c1d8b5e8SKonstantin Belousov 			goto normal_write;
2025dd19a799SPoul-Henning Kamp 
2026dd19a799SPoul-Henning Kamp 		/*
2027dd19a799SPoul-Henning Kamp 		 * set it to be identical to the old block.  We have to
2028dd19a799SPoul-Henning Kamp 		 * set b_lblkno and BKGRDMARKER before calling bgetvp()
2029dd19a799SPoul-Henning Kamp 		 * to avoid confusing the splay tree and gbincore().
2030dd19a799SPoul-Henning Kamp 		 */
2031dd19a799SPoul-Henning Kamp 		memcpy(newbp->b_data, bp->b_data, bp->b_bufsize);
2032dd19a799SPoul-Henning Kamp 		newbp->b_lblkno = bp->b_lblkno;
2033dd19a799SPoul-Henning Kamp 		newbp->b_xflags |= BX_BKGRDMARKER;
2034dd19a799SPoul-Henning Kamp 		BO_LOCK(bp->b_bufobj);
2035dd19a799SPoul-Henning Kamp 		bp->b_vflags |= BV_BKGRDINPROG;
2036dd19a799SPoul-Henning Kamp 		bgetvp(bp->b_vp, newbp);
2037dd19a799SPoul-Henning Kamp 		BO_UNLOCK(bp->b_bufobj);
2038dd19a799SPoul-Henning Kamp 		newbp->b_bufobj = &bp->b_vp->v_bufobj;
2039dd19a799SPoul-Henning Kamp 		newbp->b_blkno = bp->b_blkno;
2040dd19a799SPoul-Henning Kamp 		newbp->b_offset = bp->b_offset;
2041dd19a799SPoul-Henning Kamp 		newbp->b_iodone = ffs_backgroundwritedone;
2042dd19a799SPoul-Henning Kamp 		newbp->b_flags |= B_ASYNC;
2043dd19a799SPoul-Henning Kamp 		newbp->b_flags &= ~B_INVAL;
2044dd19a799SPoul-Henning Kamp 
2045dd19a799SPoul-Henning Kamp #ifdef SOFTUPDATES
2046113db2ddSJeff Roberson 		/*
2047113db2ddSJeff Roberson 		 * Move over the dependencies.  If there are rollbacks,
2048113db2ddSJeff Roberson 		 * leave the parent buffer dirtied as it will need to
2049113db2ddSJeff Roberson 		 * be written again.
2050113db2ddSJeff Roberson 		 */
2051113db2ddSJeff Roberson 		if (LIST_EMPTY(&bp->b_dep) ||
2052113db2ddSJeff Roberson 		    softdep_move_dependencies(bp, newbp) == 0)
2053113db2ddSJeff Roberson 			bundirty(bp);
2054113db2ddSJeff Roberson #else
2055113db2ddSJeff Roberson 		bundirty(bp);
2056dd19a799SPoul-Henning Kamp #endif
2057dd19a799SPoul-Henning Kamp 
2058dd19a799SPoul-Henning Kamp 		/*
2059dd19a799SPoul-Henning Kamp 		 * Initiate write on the copy, release the original to
2060dd19a799SPoul-Henning Kamp 		 * the B_LOCKED queue so that it cannot go away until
2061dd19a799SPoul-Henning Kamp 		 * the background write completes. If not locked it could go
2062dd19a799SPoul-Henning Kamp 		 * away and then be reconstituted while it was being written.
2063dd19a799SPoul-Henning Kamp 		 * If the reconstituted buffer were written, we could end up
2064dd19a799SPoul-Henning Kamp 		 * with two background copies being written at the same time.
2065dd19a799SPoul-Henning Kamp 		 */
2066dd19a799SPoul-Henning Kamp 		bqrelse(bp);
2067dd19a799SPoul-Henning Kamp 		bp = newbp;
2068113db2ddSJeff Roberson 	} else
2069113db2ddSJeff Roberson 		/* Mark the buffer clean */
2070113db2ddSJeff Roberson 		bundirty(bp);
2071113db2ddSJeff Roberson 
2072dd19a799SPoul-Henning Kamp 
2073dd19a799SPoul-Henning Kamp 	/* Let the normal bufwrite do the rest for us */
2074c1d8b5e8SKonstantin Belousov normal_write:
20759248a827STor Egge 	return (bufwrite(bp));
2076dd19a799SPoul-Henning Kamp }
2077dd19a799SPoul-Henning Kamp 
2078dd19a799SPoul-Henning Kamp 
20798dd56505SPoul-Henning Kamp static void
20806e77a041SPoul-Henning Kamp ffs_geom_strategy(struct bufobj *bo, struct buf *bp)
20816e77a041SPoul-Henning Kamp {
2082153910e0SJeff Roberson 	struct vnode *vp;
2083153910e0SJeff Roberson 	int error;
20847de3839dSTor Egge 	struct buf *tbp;
2085113db2ddSJeff Roberson 	int nocopy;
20866e77a041SPoul-Henning Kamp 
2087153910e0SJeff Roberson 	vp = bo->__bo_vnode;
2088153910e0SJeff Roberson 	if (bp->b_iocmd == BIO_WRITE) {
2089153910e0SJeff Roberson 		if ((bp->b_flags & B_VALIDSUSPWRT) == 0 &&
2090153910e0SJeff Roberson 		    bp->b_vp != NULL && bp->b_vp->v_mount != NULL &&
2091153910e0SJeff Roberson 		    (bp->b_vp->v_mount->mnt_kern_flag & MNTK_SUSPENDED) != 0)
2092153910e0SJeff Roberson 			panic("ffs_geom_strategy: bad I/O");
2093113db2ddSJeff Roberson 		nocopy = bp->b_flags & B_NOCOPY;
2094113db2ddSJeff Roberson 		bp->b_flags &= ~(B_VALIDSUSPWRT | B_NOCOPY);
2095113db2ddSJeff Roberson 		if ((vp->v_vflag & VV_COPYONWRITE) && nocopy == 0 &&
20967de3839dSTor Egge 		    vp->v_rdev->si_snapdata != NULL) {
20977de3839dSTor Egge 			if ((bp->b_flags & B_CLUSTER) != 0) {
2098868bb88fSTor Egge 				runningbufwakeup(bp);
20997de3839dSTor Egge 				TAILQ_FOREACH(tbp, &bp->b_cluster.cluster_head,
21007de3839dSTor Egge 					      b_cluster.cluster_entry) {
21017de3839dSTor Egge 					error = ffs_copyonwrite(vp, tbp);
21027de3839dSTor Egge 					if (error != 0 &&
2103153910e0SJeff Roberson 					    error != EOPNOTSUPP) {
2104153910e0SJeff Roberson 						bp->b_error = error;
2105153910e0SJeff Roberson 						bp->b_ioflags |= BIO_ERROR;
2106153910e0SJeff Roberson 						bufdone(bp);
2107153910e0SJeff Roberson 						return;
2108153910e0SJeff Roberson 					}
2109153910e0SJeff Roberson 				}
2110868bb88fSTor Egge 				bp->b_runningbufspace = bp->b_bufsize;
21115bd65606SJohn Baldwin 				atomic_add_long(&runningbufspace,
2112868bb88fSTor Egge 					       bp->b_runningbufspace);
21137de3839dSTor Egge 			} else {
21147de3839dSTor Egge 				error = ffs_copyonwrite(vp, bp);
21157de3839dSTor Egge 				if (error != 0 && error != EOPNOTSUPP) {
21167de3839dSTor Egge 					bp->b_error = error;
21177de3839dSTor Egge 					bp->b_ioflags |= BIO_ERROR;
21187de3839dSTor Egge 					bufdone(bp);
21197de3839dSTor Egge 					return;
21207de3839dSTor Egge 				}
21217de3839dSTor Egge 			}
21227de3839dSTor Egge 		}
21237de3839dSTor Egge #ifdef SOFTUPDATES
21247de3839dSTor Egge 		if ((bp->b_flags & B_CLUSTER) != 0) {
21257de3839dSTor Egge 			TAILQ_FOREACH(tbp, &bp->b_cluster.cluster_head,
21267de3839dSTor Egge 				      b_cluster.cluster_entry) {
212704533fc6SXin LI 				if (!LIST_EMPTY(&tbp->b_dep))
21287de3839dSTor Egge 					buf_start(tbp);
21297de3839dSTor Egge 			}
21307de3839dSTor Egge 		} else {
213104533fc6SXin LI 			if (!LIST_EMPTY(&bp->b_dep))
21327de3839dSTor Egge 				buf_start(bp);
21337de3839dSTor Egge 		}
21347de3839dSTor Egge 
21357de3839dSTor Egge #endif
21367de3839dSTor Egge 	}
213743920011SPoul-Henning Kamp 	g_vfs_strategy(bo, bp);
21386e77a041SPoul-Henning Kamp }
213952dfc8d7SKonstantin Belousov 
214052dfc8d7SKonstantin Belousov #ifdef	DDB
214152dfc8d7SKonstantin Belousov 
214252dfc8d7SKonstantin Belousov static void
214352dfc8d7SKonstantin Belousov db_print_ffs(struct ufsmount *ump)
214452dfc8d7SKonstantin Belousov {
2145280e091aSJeff Roberson 	db_printf("mp %p %s devvp %p fs %p su_wl %d su_deps %d su_req %d\n",
214652dfc8d7SKonstantin Belousov 	    ump->um_mountp, ump->um_mountp->mnt_stat.f_mntonname,
214752dfc8d7SKonstantin Belousov 	    ump->um_devvp, ump->um_fs, ump->softdep_on_worklist,
2148280e091aSJeff Roberson 	    ump->softdep_deps, ump->softdep_req);
214952dfc8d7SKonstantin Belousov }
215052dfc8d7SKonstantin Belousov 
215152dfc8d7SKonstantin Belousov DB_SHOW_COMMAND(ffs, db_show_ffs)
215252dfc8d7SKonstantin Belousov {
215352dfc8d7SKonstantin Belousov 	struct mount *mp;
215452dfc8d7SKonstantin Belousov 	struct ufsmount *ump;
215552dfc8d7SKonstantin Belousov 
215652dfc8d7SKonstantin Belousov 	if (have_addr) {
215752dfc8d7SKonstantin Belousov 		ump = VFSTOUFS((struct mount *)addr);
215852dfc8d7SKonstantin Belousov 		db_print_ffs(ump);
215952dfc8d7SKonstantin Belousov 		return;
216052dfc8d7SKonstantin Belousov 	}
216152dfc8d7SKonstantin Belousov 
216252dfc8d7SKonstantin Belousov 	TAILQ_FOREACH(mp, &mountlist, mnt_list) {
216352dfc8d7SKonstantin Belousov 		if (!strcmp(mp->mnt_stat.f_fstypename, ufs_vfsconf.vfc_name))
216452dfc8d7SKonstantin Belousov 			db_print_ffs(VFSTOUFS(mp));
216552dfc8d7SKonstantin Belousov 	}
216652dfc8d7SKonstantin Belousov }
216752dfc8d7SKonstantin Belousov 
216852dfc8d7SKonstantin Belousov #endif	/* DDB */
2169