xref: /freebsd/sys/ufs/ffs/ffs_vfsops.c (revision 2af934cc15bd8e7daa2daeb806321d0daddf3b7a)
160727d8bSWarner Losh /*-
251369649SPedro F. Giffuni  * SPDX-License-Identifier: BSD-3-Clause
351369649SPedro F. Giffuni  *
4df8bae1dSRodney W. Grimes  * Copyright (c) 1989, 1991, 1993, 1994
5df8bae1dSRodney W. Grimes  *	The Regents of the University of California.  All rights reserved.
6df8bae1dSRodney W. Grimes  *
7df8bae1dSRodney W. Grimes  * Redistribution and use in source and binary forms, with or without
8df8bae1dSRodney W. Grimes  * modification, are permitted provided that the following conditions
9df8bae1dSRodney W. Grimes  * are met:
10df8bae1dSRodney W. Grimes  * 1. Redistributions of source code must retain the above copyright
11df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer.
12df8bae1dSRodney W. Grimes  * 2. Redistributions in binary form must reproduce the above copyright
13df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer in the
14df8bae1dSRodney W. Grimes  *    documentation and/or other materials provided with the distribution.
15fbbd9655SWarner Losh  * 3. Neither the name of the University nor the names of its contributors
16df8bae1dSRodney W. Grimes  *    may be used to endorse or promote products derived from this software
17df8bae1dSRodney W. Grimes  *    without specific prior written permission.
18df8bae1dSRodney W. Grimes  *
19df8bae1dSRodney W. Grimes  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
20df8bae1dSRodney W. Grimes  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
21df8bae1dSRodney W. Grimes  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
22df8bae1dSRodney W. Grimes  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
23df8bae1dSRodney W. Grimes  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
24df8bae1dSRodney W. Grimes  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
25df8bae1dSRodney W. Grimes  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
26df8bae1dSRodney W. Grimes  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
27df8bae1dSRodney W. Grimes  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28df8bae1dSRodney W. Grimes  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29df8bae1dSRodney W. Grimes  * SUCH DAMAGE.
30df8bae1dSRodney W. Grimes  *
31996c772fSJohn Dyson  *	@(#)ffs_vfsops.c	8.31 (Berkeley) 5/20/95
32df8bae1dSRodney W. Grimes  */
33df8bae1dSRodney W. Grimes 
34f4636c59SDavid E. O'Brien #include <sys/cdefs.h>
35f4636c59SDavid E. O'Brien __FBSDID("$FreeBSD$");
36f4636c59SDavid E. O'Brien 
3701733a9bSGarrett Wollman #include "opt_quota.h"
38516081f2SRobert Watson #include "opt_ufs.h"
396e77a041SPoul-Henning Kamp #include "opt_ffs.h"
4052dfc8d7SKonstantin Belousov #include "opt_ddb.h"
4101733a9bSGarrett Wollman 
42df8bae1dSRodney W. Grimes #include <sys/param.h>
43f89d2072SXin LI #include <sys/gsb_crc32.h>
44df8bae1dSRodney W. Grimes #include <sys/systm.h>
45df8bae1dSRodney W. Grimes #include <sys/namei.h>
46acd3428bSRobert Watson #include <sys/priv.h>
47df8bae1dSRodney W. Grimes #include <sys/proc.h>
48c79dff0fSKonstantin Belousov #include <sys/taskqueue.h>
49df8bae1dSRodney W. Grimes #include <sys/kernel.h>
50daec9284SConrad Meyer #include <sys/ktr.h>
51df8bae1dSRodney W. Grimes #include <sys/vnode.h>
52df8bae1dSRodney W. Grimes #include <sys/mount.h>
539626b608SPoul-Henning Kamp #include <sys/bio.h>
54df8bae1dSRodney W. Grimes #include <sys/buf.h>
5581bca6ddSKATO Takenori #include <sys/conf.h>
563ac4d1efSBruce Evans #include <sys/fcntl.h>
571848286aSEdward Tomasz Napierala #include <sys/ioccom.h>
58df8bae1dSRodney W. Grimes #include <sys/malloc.h>
591b367556SJason Evans #include <sys/mutex.h>
6022a72260SJeff Roberson #include <sys/rwlock.h>
61d79ff54bSChuck Silvers #include <sys/sysctl.h>
629ed01c32SGleb Smirnoff #include <sys/vmmeter.h>
63a18b1f1dSJason Evans 
64aed55708SRobert Watson #include <security/mac/mac_framework.h>
65aed55708SRobert Watson 
66a96da1c3SConrad Meyer #include <ufs/ufs/dir.h>
67a64ed089SRobert Watson #include <ufs/ufs/extattr.h>
681a60c7fcSPawel Jakub Dawidek #include <ufs/ufs/gjournal.h>
69df8bae1dSRodney W. Grimes #include <ufs/ufs/quota.h>
70df8bae1dSRodney W. Grimes #include <ufs/ufs/ufsmount.h>
71df8bae1dSRodney W. Grimes #include <ufs/ufs/inode.h>
72df8bae1dSRodney W. Grimes #include <ufs/ufs/ufs_extern.h>
73df8bae1dSRodney W. Grimes 
74df8bae1dSRodney W. Grimes #include <ufs/ffs/fs.h>
75df8bae1dSRodney W. Grimes #include <ufs/ffs/ffs_extern.h>
76df8bae1dSRodney W. Grimes 
77f6b04d2bSDavid Greenman #include <vm/vm.h>
78aa4d7a8aSPoul-Henning Kamp #include <vm/uma.h>
79f6b04d2bSDavid Greenman #include <vm/vm_page.h>
80f6b04d2bSDavid Greenman 
8143920011SPoul-Henning Kamp #include <geom/geom.h>
8243920011SPoul-Henning Kamp #include <geom/geom_vfs.h>
8343920011SPoul-Henning Kamp 
8452dfc8d7SKonstantin Belousov #include <ddb/ddb.h>
8552dfc8d7SKonstantin Belousov 
86adf41577SPoul-Henning Kamp static uma_zone_t uma_inode, uma_ufs1, uma_ufs2;
879d5a594fSMateusz Guzik VFS_SMR_DECLARE;
8855166637SPoul-Henning Kamp 
89975512a9SPoul-Henning Kamp static int	ffs_mountfs(struct vnode *, struct mount *, struct thread *);
901c85e6a3SKirk McKusick static void	ffs_oldfscompat_read(struct fs *, struct ufsmount *,
911c85e6a3SKirk McKusick 		    ufs2_daddr_t);
92975512a9SPoul-Henning Kamp static void	ffs_ifree(struct ufsmount *ump, struct inode *ip);
93a988a5c6SKonstantin Belousov static int	ffs_sync_lazy(struct mount *mp);
94dffce215SKirk McKusick static int	ffs_use_bread(void *devfd, off_t loc, void **bufp, int size);
95dffce215SKirk McKusick static int	ffs_use_bwrite(void *devfd, off_t loc, void *buf, int size);
96a988a5c6SKonstantin Belousov 
979bf1a756SPoul-Henning Kamp static vfs_init_t ffs_init;
989bf1a756SPoul-Henning Kamp static vfs_uninit_t ffs_uninit;
99d6fe88e4SPoul-Henning Kamp static vfs_extattrctl_t ffs_extattrctl;
10020a92a18SPoul-Henning Kamp static vfs_cmount_t ffs_cmount;
101adf41577SPoul-Henning Kamp static vfs_unmount_t ffs_unmount;
10220a92a18SPoul-Henning Kamp static vfs_mount_t ffs_mount;
103adf41577SPoul-Henning Kamp static vfs_statfs_t ffs_statfs;
104adf41577SPoul-Henning Kamp static vfs_fhtovp_t ffs_fhtovp;
105adf41577SPoul-Henning Kamp static vfs_sync_t ffs_sync;
106df8bae1dSRodney W. Grimes 
107303b270bSEivind Eklund static struct vfsops ufs_vfsops = {
1087652131bSPoul-Henning Kamp 	.vfs_extattrctl =	ffs_extattrctl,
1097652131bSPoul-Henning Kamp 	.vfs_fhtovp =		ffs_fhtovp,
1107652131bSPoul-Henning Kamp 	.vfs_init =		ffs_init,
11120a92a18SPoul-Henning Kamp 	.vfs_mount =		ffs_mount,
11220a92a18SPoul-Henning Kamp 	.vfs_cmount =		ffs_cmount,
1137652131bSPoul-Henning Kamp 	.vfs_quotactl =		ufs_quotactl,
114e35cd9e3SMateusz Guzik 	.vfs_root =		vfs_cache_root,
115e35cd9e3SMateusz Guzik 	.vfs_cachedroot =	ufs_root,
1167652131bSPoul-Henning Kamp 	.vfs_statfs =		ffs_statfs,
1177652131bSPoul-Henning Kamp 	.vfs_sync =		ffs_sync,
1187652131bSPoul-Henning Kamp 	.vfs_uninit =		ffs_uninit,
1197652131bSPoul-Henning Kamp 	.vfs_unmount =		ffs_unmount,
1207652131bSPoul-Henning Kamp 	.vfs_vget =		ffs_vget,
1212814d5baSKonstantin Belousov 	.vfs_susp_clean =	process_deferred_inactive,
122df8bae1dSRodney W. Grimes };
123df8bae1dSRodney W. Grimes 
1248994ca3cSBruce Evans VFS_SET(ufs_vfsops, ufs, 0);
1255fe6d2beSPawel Jakub Dawidek MODULE_VERSION(ufs, 1);
126c901836cSGarrett Wollman 
1276e77a041SPoul-Henning Kamp static b_strategy_t ffs_geom_strategy;
128dd19a799SPoul-Henning Kamp static b_write_t ffs_bufwrite;
1296e77a041SPoul-Henning Kamp 
1306e77a041SPoul-Henning Kamp static struct buf_ops ffs_ops = {
1316e77a041SPoul-Henning Kamp 	.bop_name =	"FFS",
132dd19a799SPoul-Henning Kamp 	.bop_write =	ffs_bufwrite,
1336e77a041SPoul-Henning Kamp 	.bop_strategy =	ffs_geom_strategy,
1346ef8480aSPoul-Henning Kamp 	.bop_sync =	bufsync,
1352cc7d26fSKonstantin Belousov #ifdef NO_FFS_SNAPSHOT
1362cc7d26fSKonstantin Belousov 	.bop_bdflush =	bufbdflush,
1372cc7d26fSKonstantin Belousov #else
1382cc7d26fSKonstantin Belousov 	.bop_bdflush =	ffs_bdflush,
1392cc7d26fSKonstantin Belousov #endif
1406e77a041SPoul-Henning Kamp };
1416e77a041SPoul-Henning Kamp 
1420b962648SAndriy Gapon /*
1430b962648SAndriy Gapon  * Note that userquota and groupquota options are not currently used
1440b962648SAndriy Gapon  * by UFS/FFS code and generally mount(8) does not pass those options
1450b962648SAndriy Gapon  * from userland, but they can be passed by loader(8) via
1460b962648SAndriy Gapon  * vfs.root.mountfrom.options.
1470b962648SAndriy Gapon  */
148d952ba1bSJohn Baldwin static const char *ffs_opts[] = { "acls", "async", "noatime", "noclusterr",
1490b962648SAndriy Gapon     "noclusterw", "noexec", "export", "force", "from", "groupquota",
150927a12aeSKirk McKusick     "multilabel", "nfsv4acls", "fsckpid", "snapshot", "nosuid", "suiddir",
151daba4da8SKirk McKusick     "nosymfollow", "sync", "union", "userquota", "untrusted", NULL };
15220a92a18SPoul-Henning Kamp 
153d79ff54bSChuck Silvers static int ffs_enxio_enable = 1;
154d79ff54bSChuck Silvers SYSCTL_DECL(_vfs_ffs);
155d79ff54bSChuck Silvers SYSCTL_INT(_vfs_ffs, OID_AUTO, enxio_enable, CTLFLAG_RWTUN,
156d79ff54bSChuck Silvers     &ffs_enxio_enable, 0,
157d79ff54bSChuck Silvers     "enable mapping of other disk I/O errors to ENXIO");
158d79ff54bSChuck Silvers 
159d9a8abf6SChuck Silvers /*
160d9a8abf6SChuck Silvers  * Return buffer with the contents of block "offset" from the beginning of
161d9a8abf6SChuck Silvers  * directory "ip".  If "res" is non-zero, fill it in with a pointer to the
162d9a8abf6SChuck Silvers  * remaining space in the directory.
163d9a8abf6SChuck Silvers  */
164d9a8abf6SChuck Silvers static int
165d9a8abf6SChuck Silvers ffs_blkatoff(struct vnode *vp, off_t offset, char **res, struct buf **bpp)
166d9a8abf6SChuck Silvers {
167d9a8abf6SChuck Silvers 	struct inode *ip;
168d9a8abf6SChuck Silvers 	struct fs *fs;
169d9a8abf6SChuck Silvers 	struct buf *bp;
170d9a8abf6SChuck Silvers 	ufs_lbn_t lbn;
171d9a8abf6SChuck Silvers 	int bsize, error;
172d9a8abf6SChuck Silvers 
173d9a8abf6SChuck Silvers 	ip = VTOI(vp);
174d9a8abf6SChuck Silvers 	fs = ITOFS(ip);
175d9a8abf6SChuck Silvers 	lbn = lblkno(fs, offset);
176d9a8abf6SChuck Silvers 	bsize = blksize(fs, ip, lbn);
177d9a8abf6SChuck Silvers 
178d9a8abf6SChuck Silvers 	*bpp = NULL;
179d9a8abf6SChuck Silvers 	error = bread(vp, lbn, bsize, NOCRED, &bp);
180d9a8abf6SChuck Silvers 	if (error) {
181d9a8abf6SChuck Silvers 		return (error);
182d9a8abf6SChuck Silvers 	}
183d9a8abf6SChuck Silvers 	if (res)
184d9a8abf6SChuck Silvers 		*res = (char *)bp->b_data + blkoff(fs, offset);
185d9a8abf6SChuck Silvers 	*bpp = bp;
186d9a8abf6SChuck Silvers 	return (0);
187d9a8abf6SChuck Silvers }
188d9a8abf6SChuck Silvers 
189d9a8abf6SChuck Silvers /*
190d9a8abf6SChuck Silvers  * Load up the contents of an inode and copy the appropriate pieces
191d9a8abf6SChuck Silvers  * to the incore copy.
192d9a8abf6SChuck Silvers  */
193d9a8abf6SChuck Silvers static int
194d9a8abf6SChuck Silvers ffs_load_inode(struct buf *bp, struct inode *ip, struct fs *fs, ino_t ino)
195d9a8abf6SChuck Silvers {
196d9a8abf6SChuck Silvers 	struct ufs1_dinode *dip1;
197d9a8abf6SChuck Silvers 	struct ufs2_dinode *dip2;
198d9a8abf6SChuck Silvers 	int error;
199d9a8abf6SChuck Silvers 
200d9a8abf6SChuck Silvers 	if (I_IS_UFS1(ip)) {
201d9a8abf6SChuck Silvers 		dip1 = ip->i_din1;
202d9a8abf6SChuck Silvers 		*dip1 =
203d9a8abf6SChuck Silvers 		    *((struct ufs1_dinode *)bp->b_data + ino_to_fsbo(fs, ino));
204d9a8abf6SChuck Silvers 		ip->i_mode = dip1->di_mode;
205d9a8abf6SChuck Silvers 		ip->i_nlink = dip1->di_nlink;
206d9a8abf6SChuck Silvers 		ip->i_effnlink = dip1->di_nlink;
207d9a8abf6SChuck Silvers 		ip->i_size = dip1->di_size;
208d9a8abf6SChuck Silvers 		ip->i_flags = dip1->di_flags;
209d9a8abf6SChuck Silvers 		ip->i_gen = dip1->di_gen;
210d9a8abf6SChuck Silvers 		ip->i_uid = dip1->di_uid;
211d9a8abf6SChuck Silvers 		ip->i_gid = dip1->di_gid;
212d9a8abf6SChuck Silvers 		return (0);
213d9a8abf6SChuck Silvers 	}
214d9a8abf6SChuck Silvers 	dip2 = ((struct ufs2_dinode *)bp->b_data + ino_to_fsbo(fs, ino));
215d9a8abf6SChuck Silvers 	if ((error = ffs_verify_dinode_ckhash(fs, dip2)) != 0 &&
216d9a8abf6SChuck Silvers 	    !ffs_fsfail_cleanup(ITOUMP(ip), error)) {
217d9a8abf6SChuck Silvers 		printf("%s: inode %jd: check-hash failed\n", fs->fs_fsmnt,
218d9a8abf6SChuck Silvers 		    (intmax_t)ino);
219d9a8abf6SChuck Silvers 		return (error);
220d9a8abf6SChuck Silvers 	}
221d9a8abf6SChuck Silvers 	*ip->i_din2 = *dip2;
222d9a8abf6SChuck Silvers 	dip2 = ip->i_din2;
223d9a8abf6SChuck Silvers 	ip->i_mode = dip2->di_mode;
224d9a8abf6SChuck Silvers 	ip->i_nlink = dip2->di_nlink;
225d9a8abf6SChuck Silvers 	ip->i_effnlink = dip2->di_nlink;
226d9a8abf6SChuck Silvers 	ip->i_size = dip2->di_size;
227d9a8abf6SChuck Silvers 	ip->i_flags = dip2->di_flags;
228d9a8abf6SChuck Silvers 	ip->i_gen = dip2->di_gen;
229d9a8abf6SChuck Silvers 	ip->i_uid = dip2->di_uid;
230d9a8abf6SChuck Silvers 	ip->i_gid = dip2->di_gid;
231d9a8abf6SChuck Silvers 	return (0);
232d9a8abf6SChuck Silvers }
233d9a8abf6SChuck Silvers 
234d9a8abf6SChuck Silvers /*
235d9a8abf6SChuck Silvers  * Verify that a filesystem block number is a valid data block.
236d9a8abf6SChuck Silvers  * This routine is only called on untrusted filesystems.
237d9a8abf6SChuck Silvers  */
238d9a8abf6SChuck Silvers static int
239d9a8abf6SChuck Silvers ffs_check_blkno(struct mount *mp, ino_t inum, ufs2_daddr_t daddr, int blksize)
240d9a8abf6SChuck Silvers {
241d9a8abf6SChuck Silvers 	struct fs *fs;
242d9a8abf6SChuck Silvers 	struct ufsmount *ump;
243d9a8abf6SChuck Silvers 	ufs2_daddr_t end_daddr;
244d9a8abf6SChuck Silvers 	int cg, havemtx;
245d9a8abf6SChuck Silvers 
246d9a8abf6SChuck Silvers 	KASSERT((mp->mnt_flag & MNT_UNTRUSTED) != 0,
247d9a8abf6SChuck Silvers 	    ("ffs_check_blkno called on a trusted file system"));
248d9a8abf6SChuck Silvers 	ump = VFSTOUFS(mp);
249d9a8abf6SChuck Silvers 	fs = ump->um_fs;
250d9a8abf6SChuck Silvers 	cg = dtog(fs, daddr);
251d9a8abf6SChuck Silvers 	end_daddr = daddr + numfrags(fs, blksize);
252d9a8abf6SChuck Silvers 	/*
253d9a8abf6SChuck Silvers 	 * Verify that the block number is a valid data block. Also check
254d9a8abf6SChuck Silvers 	 * that it does not point to an inode block or a superblock. Accept
255d9a8abf6SChuck Silvers 	 * blocks that are unalloacted (0) or part of snapshot metadata
256d9a8abf6SChuck Silvers 	 * (BLK_NOCOPY or BLK_SNAP).
257d9a8abf6SChuck Silvers 	 *
258d9a8abf6SChuck Silvers 	 * Thus, the block must be in a valid range for the filesystem and
259d9a8abf6SChuck Silvers 	 * either in the space before a backup superblock (except the first
260d9a8abf6SChuck Silvers 	 * cylinder group where that space is used by the bootstrap code) or
261d9a8abf6SChuck Silvers 	 * after the inode blocks and before the end of the cylinder group.
262d9a8abf6SChuck Silvers 	 */
263d9a8abf6SChuck Silvers 	if ((uint64_t)daddr <= BLK_SNAP ||
264d9a8abf6SChuck Silvers 	    ((uint64_t)end_daddr <= fs->fs_size &&
265d9a8abf6SChuck Silvers 	    ((cg > 0 && end_daddr <= cgsblock(fs, cg)) ||
266d9a8abf6SChuck Silvers 	    (daddr >= cgdmin(fs, cg) &&
267d9a8abf6SChuck Silvers 	    end_daddr <= cgbase(fs, cg) + fs->fs_fpg))))
268d9a8abf6SChuck Silvers 		return (0);
269d9a8abf6SChuck Silvers 	if ((havemtx = mtx_owned(UFS_MTX(ump))) == 0)
270d9a8abf6SChuck Silvers 		UFS_LOCK(ump);
271d9a8abf6SChuck Silvers 	if (ppsratecheck(&ump->um_last_integritymsg,
272d9a8abf6SChuck Silvers 	    &ump->um_secs_integritymsg, 1)) {
273d9a8abf6SChuck Silvers 		UFS_UNLOCK(ump);
274d9a8abf6SChuck Silvers 		uprintf("\n%s: inode %jd, out-of-range indirect block "
275d9a8abf6SChuck Silvers 		    "number %jd\n", mp->mnt_stat.f_mntonname, inum, daddr);
276d9a8abf6SChuck Silvers 		if (havemtx)
277d9a8abf6SChuck Silvers 			UFS_LOCK(ump);
278d9a8abf6SChuck Silvers 	} else if (!havemtx)
279d9a8abf6SChuck Silvers 		UFS_UNLOCK(ump);
280d9a8abf6SChuck Silvers 	return (EINTEGRITY);
281d9a8abf6SChuck Silvers }
282d9a8abf6SChuck Silvers 
283d9a8abf6SChuck Silvers /*
284d9a8abf6SChuck Silvers  * Initiate a forcible unmount.
285d9a8abf6SChuck Silvers  * Used to unmount filesystems whose underlying media has gone away.
286d9a8abf6SChuck Silvers  */
287d9a8abf6SChuck Silvers static void
288d9a8abf6SChuck Silvers ffs_fsfail_unmount(void *v, int pending)
289d9a8abf6SChuck Silvers {
290d9a8abf6SChuck Silvers 	struct fsfail_task *etp;
291d9a8abf6SChuck Silvers 	struct mount *mp;
292d9a8abf6SChuck Silvers 
293d9a8abf6SChuck Silvers 	etp = v;
294d9a8abf6SChuck Silvers 
295d9a8abf6SChuck Silvers 	/*
296d9a8abf6SChuck Silvers 	 * Find our mount and get a ref on it, then try to unmount.
297d9a8abf6SChuck Silvers 	 */
298d9a8abf6SChuck Silvers 	mp = vfs_getvfs(&etp->fsid);
299d9a8abf6SChuck Silvers 	if (mp != NULL)
300d9a8abf6SChuck Silvers 		dounmount(mp, MNT_FORCE, curthread);
301d9a8abf6SChuck Silvers 	free(etp, M_UFSMNT);
302d9a8abf6SChuck Silvers }
303d9a8abf6SChuck Silvers 
/*
 * On the first ENXIO error, start a task that forcibly unmounts the
 * filesystem.  This variant takes and releases the UFS mutex around
 * ffs_fsfail_cleanup_locked().
 *
 * Returns true if a cleanup is in progress.
 */
int
ffs_fsfail_cleanup(struct ufsmount *ump, int error)
{
	int cleaning;

	UFS_LOCK(ump);
	cleaning = ffs_fsfail_cleanup_locked(ump, error);
	UFS_UNLOCK(ump);

	return (cleaning);
}
319d9a8abf6SChuck Silvers 
320d9a8abf6SChuck Silvers int
321d9a8abf6SChuck Silvers ffs_fsfail_cleanup_locked(struct ufsmount *ump, int error)
322d9a8abf6SChuck Silvers {
323d9a8abf6SChuck Silvers 	struct fsfail_task *etp;
324d9a8abf6SChuck Silvers 	struct task *tp;
325d9a8abf6SChuck Silvers 
326d9a8abf6SChuck Silvers 	mtx_assert(UFS_MTX(ump), MA_OWNED);
327d9a8abf6SChuck Silvers 	if (error == ENXIO && (ump->um_flags & UM_FSFAIL_CLEANUP) == 0) {
328d9a8abf6SChuck Silvers 		ump->um_flags |= UM_FSFAIL_CLEANUP;
329d9a8abf6SChuck Silvers 		/*
330d9a8abf6SChuck Silvers 		 * Queue an async forced unmount.
331d9a8abf6SChuck Silvers 		 */
332d9a8abf6SChuck Silvers 		etp = ump->um_fsfail_task;
333d9a8abf6SChuck Silvers 		ump->um_fsfail_task = NULL;
334d9a8abf6SChuck Silvers 		if (etp != NULL) {
335d9a8abf6SChuck Silvers 			tp = &etp->task;
336d9a8abf6SChuck Silvers 			TASK_INIT(tp, 0, ffs_fsfail_unmount, etp);
337d9a8abf6SChuck Silvers 			taskqueue_enqueue(taskqueue_thread, tp);
338d9a8abf6SChuck Silvers 			printf("UFS: forcibly unmounting %s from %s\n",
339d9a8abf6SChuck Silvers 			    ump->um_mountp->mnt_stat.f_mntfromname,
340d9a8abf6SChuck Silvers 			    ump->um_mountp->mnt_stat.f_mntonname);
341d9a8abf6SChuck Silvers 		}
342d9a8abf6SChuck Silvers 	}
343d9a8abf6SChuck Silvers 	return ((ump->um_flags & UM_FSFAIL_CLEANUP) != 0);
344d9a8abf6SChuck Silvers }
345d9a8abf6SChuck Silvers 
346d9a8abf6SChuck Silvers /*
347d9a8abf6SChuck Silvers  * Wrapper used during ENXIO cleanup to allocate empty buffers when
348d9a8abf6SChuck Silvers  * the kernel is unable to read the real one. They are needed so that
349d9a8abf6SChuck Silvers  * the soft updates code can use them to unwind its dependencies.
350d9a8abf6SChuck Silvers  */
351d9a8abf6SChuck Silvers int
352d9a8abf6SChuck Silvers ffs_breadz(struct ufsmount *ump, struct vnode *vp, daddr_t lblkno,
353d9a8abf6SChuck Silvers     daddr_t dblkno, int size, daddr_t *rablkno, int *rabsize, int cnt,
354d9a8abf6SChuck Silvers     struct ucred *cred, int flags, void (*ckhashfunc)(struct buf *),
355d9a8abf6SChuck Silvers     struct buf **bpp)
356d9a8abf6SChuck Silvers {
357d9a8abf6SChuck Silvers 	int error;
358d9a8abf6SChuck Silvers 
359d9a8abf6SChuck Silvers 	flags |= GB_CVTENXIO;
360d9a8abf6SChuck Silvers 	error = breadn_flags(vp, lblkno, dblkno, size, rablkno, rabsize, cnt,
361d9a8abf6SChuck Silvers 	    cred, flags, ckhashfunc, bpp);
362d9a8abf6SChuck Silvers 	if (error != 0 && ffs_fsfail_cleanup(ump, error)) {
363d9a8abf6SChuck Silvers 		error = getblkx(vp, lblkno, dblkno, size, 0, 0, flags, bpp);
364d9a8abf6SChuck Silvers 		KASSERT(error == 0, ("getblkx failed"));
365d9a8abf6SChuck Silvers 		vfs_bio_bzero_buf(*bpp, 0, size);
366d9a8abf6SChuck Silvers 	}
367d9a8abf6SChuck Silvers 	return (error);
368d9a8abf6SChuck Silvers }
369d9a8abf6SChuck Silvers 
3705e8c582aSPoul-Henning Kamp static int
371dfd233edSAttilio Rao ffs_mount(struct mount *mp)
372df8bae1dSRodney W. Grimes {
373f15ccf88SChuck Silvers 	struct vnode *devvp, *odevvp;
374dfd233edSAttilio Rao 	struct thread *td;
375f7a3729cSKevin Lo 	struct ufsmount *ump = NULL;
37605f4ff5dSPoul-Henning Kamp 	struct fs *fs;
377927a12aeSKirk McKusick 	pid_t fsckpid = 0;
378714b7df5SKonstantin Belousov 	int error, error1, flags;
3795ffc99e2SKonstantin Belousov 	uint64_t mntorflags, saved_mnt_flag;
38015bc6b2bSEdward Tomasz Napierala 	accmode_t accmode;
3815e8c582aSPoul-Henning Kamp 	struct nameidata ndp;
38220a92a18SPoul-Henning Kamp 	char *fspec;
3837c7a6681SKonstantin Belousov 	bool mounted_softdep;
384df8bae1dSRodney W. Grimes 
385dfd233edSAttilio Rao 	td = curthread;
38620a92a18SPoul-Henning Kamp 	if (vfs_filteropt(mp->mnt_optnew, ffs_opts))
38720a92a18SPoul-Henning Kamp 		return (EINVAL);
388aa4d7a8aSPoul-Henning Kamp 	if (uma_inode == NULL) {
389aa4d7a8aSPoul-Henning Kamp 		uma_inode = uma_zcreate("FFS inode",
390aa4d7a8aSPoul-Henning Kamp 		    sizeof(struct inode), NULL, NULL, NULL, NULL,
391aa4d7a8aSPoul-Henning Kamp 		    UMA_ALIGN_PTR, 0);
392aa4d7a8aSPoul-Henning Kamp 		uma_ufs1 = uma_zcreate("FFS1 dinode",
393aa4d7a8aSPoul-Henning Kamp 		    sizeof(struct ufs1_dinode), NULL, NULL, NULL, NULL,
394aa4d7a8aSPoul-Henning Kamp 		    UMA_ALIGN_PTR, 0);
395aa4d7a8aSPoul-Henning Kamp 		uma_ufs2 = uma_zcreate("FFS2 dinode",
396aa4d7a8aSPoul-Henning Kamp 		    sizeof(struct ufs2_dinode), NULL, NULL, NULL, NULL,
397aa4d7a8aSPoul-Henning Kamp 		    UMA_ALIGN_PTR, 0);
3989d5a594fSMateusz Guzik 		VFS_SMR_ZONE_SET(uma_inode);
399aa4d7a8aSPoul-Henning Kamp 	}
4008d02a378SPawel Jakub Dawidek 
4010b962648SAndriy Gapon 	vfs_deleteopt(mp->mnt_optnew, "groupquota");
4020b962648SAndriy Gapon 	vfs_deleteopt(mp->mnt_optnew, "userquota");
4030b962648SAndriy Gapon 
40420a92a18SPoul-Henning Kamp 	fspec = vfs_getopts(mp->mnt_optnew, "from", &error);
40551ac12abSPoul-Henning Kamp 	if (error)
406f2a2857bSKirk McKusick 		return (error);
4072b14f991SJulian Elischer 
4085da56ddbSTor Egge 	mntorflags = 0;
409daba4da8SKirk McKusick 	if (vfs_getopt(mp->mnt_optnew, "untrusted", NULL, NULL) == 0)
410daba4da8SKirk McKusick 		mntorflags |= MNT_UNTRUSTED;
411daba4da8SKirk McKusick 
41226f59b64SCraig Rodrigues 	if (vfs_getopt(mp->mnt_optnew, "acls", NULL, NULL) == 0)
4135da56ddbSTor Egge 		mntorflags |= MNT_ACLS;
41426f59b64SCraig Rodrigues 
415fb77e0afSCraig Rodrigues 	if (vfs_getopt(mp->mnt_optnew, "snapshot", NULL, NULL) == 0) {
4165da56ddbSTor Egge 		mntorflags |= MNT_SNAPSHOT;
417fb77e0afSCraig Rodrigues 		/*
418fb77e0afSCraig Rodrigues 		 * Once we have set the MNT_SNAPSHOT flag, do not
419fb77e0afSCraig Rodrigues 		 * persist "snapshot" in the options list.
420fb77e0afSCraig Rodrigues 		 */
421fb77e0afSCraig Rodrigues 		vfs_deleteopt(mp->mnt_optnew, "snapshot");
422fb77e0afSCraig Rodrigues 		vfs_deleteopt(mp->mnt_opt, "snapshot");
423fb77e0afSCraig Rodrigues 	}
42426f59b64SCraig Rodrigues 
425927a12aeSKirk McKusick 	if (vfs_getopt(mp->mnt_optnew, "fsckpid", NULL, NULL) == 0 &&
426927a12aeSKirk McKusick 	    vfs_scanopt(mp->mnt_optnew, "fsckpid", "%d", &fsckpid) == 1) {
427927a12aeSKirk McKusick 		/*
428927a12aeSKirk McKusick 		 * Once we have set the restricted PID, do not
429927a12aeSKirk McKusick 		 * persist "fsckpid" in the options list.
430927a12aeSKirk McKusick 		 */
431927a12aeSKirk McKusick 		vfs_deleteopt(mp->mnt_optnew, "fsckpid");
432927a12aeSKirk McKusick 		vfs_deleteopt(mp->mnt_opt, "fsckpid");
433927a12aeSKirk McKusick 		if (mp->mnt_flag & MNT_UPDATE) {
434927a12aeSKirk McKusick 			if (VFSTOUFS(mp)->um_fs->fs_ronly == 0 &&
435927a12aeSKirk McKusick 			     vfs_flagopt(mp->mnt_optnew, "ro", NULL, 0) == 0) {
436b60ee81eSKirk McKusick 				vfs_mount_error(mp,
437b60ee81eSKirk McKusick 				    "Checker enable: Must be read-only");
438927a12aeSKirk McKusick 				return (EINVAL);
439927a12aeSKirk McKusick 			}
440927a12aeSKirk McKusick 		} else if (vfs_flagopt(mp->mnt_optnew, "ro", NULL, 0) == 0) {
441b60ee81eSKirk McKusick 			vfs_mount_error(mp,
442b60ee81eSKirk McKusick 			    "Checker enable: Must be read-only");
443927a12aeSKirk McKusick 			return (EINVAL);
444927a12aeSKirk McKusick 		}
445927a12aeSKirk McKusick 		/* Set to -1 if we are done */
446927a12aeSKirk McKusick 		if (fsckpid == 0)
447927a12aeSKirk McKusick 			fsckpid = -1;
448927a12aeSKirk McKusick 	}
449927a12aeSKirk McKusick 
4509340fc72SEdward Tomasz Napierala 	if (vfs_getopt(mp->mnt_optnew, "nfsv4acls", NULL, NULL) == 0) {
4519340fc72SEdward Tomasz Napierala 		if (mntorflags & MNT_ACLS) {
452b60ee81eSKirk McKusick 			vfs_mount_error(mp,
453b60ee81eSKirk McKusick 			    "\"acls\" and \"nfsv4acls\" options "
454b60ee81eSKirk McKusick 			    "are mutually exclusive");
4559340fc72SEdward Tomasz Napierala 			return (EINVAL);
4569340fc72SEdward Tomasz Napierala 		}
4579340fc72SEdward Tomasz Napierala 		mntorflags |= MNT_NFS4ACLS;
4589340fc72SEdward Tomasz Napierala 	}
4599340fc72SEdward Tomasz Napierala 
4605da56ddbSTor Egge 	MNT_ILOCK(mp);
4619d5a594fSMateusz Guzik 	mp->mnt_kern_flag &= ~MNTK_FPLOOKUP;
46261996181SEdward Tomasz Napierala 	mp->mnt_flag |= mntorflags;
4635da56ddbSTor Egge 	MNT_IUNLOCK(mp);
464df8bae1dSRodney W. Grimes 	/*
465df8bae1dSRodney W. Grimes 	 * If updating, check whether changing from read-only to
466df8bae1dSRodney W. Grimes 	 * read/write; if there is no device name, that's all we do.
467df8bae1dSRodney W. Grimes 	 */
468df8bae1dSRodney W. Grimes 	if (mp->mnt_flag & MNT_UPDATE) {
469df8bae1dSRodney W. Grimes 		ump = VFSTOUFS(mp);
470df8bae1dSRodney W. Grimes 		fs = ump->um_fs;
471f15ccf88SChuck Silvers 		odevvp = ump->um_odevvp;
47226cf9c3bSPeter Wemm 		devvp = ump->um_devvp;
473927a12aeSKirk McKusick 		if (fsckpid == -1 && ump->um_fsckpid > 0) {
474927a12aeSKirk McKusick 			if ((error = ffs_flushfiles(mp, WRITECLOSE, td)) != 0 ||
475927a12aeSKirk McKusick 			    (error = ffs_sbupdate(ump, MNT_WAIT, 0)) != 0)
476927a12aeSKirk McKusick 				return (error);
477927a12aeSKirk McKusick 			g_topology_lock();
478927a12aeSKirk McKusick 			/*
479927a12aeSKirk McKusick 			 * Return to normal read-only mode.
480927a12aeSKirk McKusick 			 */
481927a12aeSKirk McKusick 			error = g_access(ump->um_cp, 0, -1, 0);
482927a12aeSKirk McKusick 			g_topology_unlock();
483927a12aeSKirk McKusick 			ump->um_fsckpid = 0;
484927a12aeSKirk McKusick 		}
48520a92a18SPoul-Henning Kamp 		if (fs->fs_ronly == 0 &&
48620a92a18SPoul-Henning Kamp 		    vfs_flagopt(mp->mnt_optnew, "ro", NULL, 0)) {
4876fecb4e4SKonstantin Belousov 			/*
4886fecb4e4SKonstantin Belousov 			 * Flush any dirty data and suspend filesystem.
4896fecb4e4SKonstantin Belousov 			 */
490f2a2857bSKirk McKusick 			if ((error = vn_start_write(NULL, &mp, V_WAIT)) != 0)
491f2a2857bSKirk McKusick 				return (error);
492895b3782SKonstantin Belousov 			error = vfs_write_suspend_umnt(mp);
493895b3782SKonstantin Belousov 			if (error != 0)
4949ab73fd1SKirk McKusick 				return (error);
4957c7a6681SKonstantin Belousov 
4967c7a6681SKonstantin Belousov 			fs->fs_ronly = 1;
4977c7a6681SKonstantin Belousov 			if (MOUNTEDSOFTDEP(mp)) {
4987c7a6681SKonstantin Belousov 				MNT_ILOCK(mp);
4997c7a6681SKonstantin Belousov 				mp->mnt_flag &= ~MNT_SOFTDEP;
5007c7a6681SKonstantin Belousov 				MNT_IUNLOCK(mp);
5017c7a6681SKonstantin Belousov 				mounted_softdep = true;
5027c7a6681SKonstantin Belousov 			} else
5037c7a6681SKonstantin Belousov 				mounted_softdep = false;
5047c7a6681SKonstantin Belousov 
505cd600596SKirk McKusick 			/*
506cd600596SKirk McKusick 			 * Check for and optionally get rid of files open
507cd600596SKirk McKusick 			 * for writing.
508cd600596SKirk McKusick 			 */
509df8bae1dSRodney W. Grimes 			flags = WRITECLOSE;
510df8bae1dSRodney W. Grimes 			if (mp->mnt_flag & MNT_FORCE)
511df8bae1dSRodney W. Grimes 				flags |= FORCECLOSE;
5127c7a6681SKonstantin Belousov 			if (mounted_softdep) {
513b40ce416SJulian Elischer 				error = softdep_flushfiles(mp, flags, td);
514b1897c19SJulian Elischer 			} else {
515b40ce416SJulian Elischer 				error = ffs_flushfiles(mp, flags, td);
516df8bae1dSRodney W. Grimes 			}
517f2a2857bSKirk McKusick 			if (error) {
5187c7a6681SKonstantin Belousov 				fs->fs_ronly = 0;
5197c7a6681SKonstantin Belousov 				if (mounted_softdep) {
5207c7a6681SKonstantin Belousov 					MNT_ILOCK(mp);
5217c7a6681SKonstantin Belousov 					mp->mnt_flag |= MNT_SOFTDEP;
5227c7a6681SKonstantin Belousov 					MNT_IUNLOCK(mp);
5237c7a6681SKonstantin Belousov 				}
524ddd6b3fcSKonstantin Belousov 				vfs_write_resume(mp, 0);
525f2a2857bSKirk McKusick 				return (error);
526b1897c19SJulian Elischer 			}
5277c7a6681SKonstantin Belousov 
5289ccb939eSKirk McKusick 			if (fs->fs_pendingblocks != 0 ||
5299ccb939eSKirk McKusick 			    fs->fs_pendinginodes != 0) {
530b60ee81eSKirk McKusick 				printf("WARNING: %s Update error: blocks %jd "
531b60ee81eSKirk McKusick 				    "files %d\n", fs->fs_fsmnt,
5321c85e6a3SKirk McKusick 				    (intmax_t)fs->fs_pendingblocks,
5339ccb939eSKirk McKusick 				    fs->fs_pendinginodes);
5349ccb939eSKirk McKusick 				fs->fs_pendingblocks = 0;
5359ccb939eSKirk McKusick 				fs->fs_pendinginodes = 0;
5369ccb939eSKirk McKusick 			}
5371a6a6610SKirk McKusick 			if ((fs->fs_flags & (FS_UNCLEAN | FS_NEEDSFSCK)) == 0)
538f2a2857bSKirk McKusick 				fs->fs_clean = 1;
539791dd2faSTor Egge 			if ((error = ffs_sbupdate(ump, MNT_WAIT, 0)) != 0) {
540f2a2857bSKirk McKusick 				fs->fs_ronly = 0;
541f2a2857bSKirk McKusick 				fs->fs_clean = 0;
5427c7a6681SKonstantin Belousov 				if (mounted_softdep) {
5437c7a6681SKonstantin Belousov 					MNT_ILOCK(mp);
5447c7a6681SKonstantin Belousov 					mp->mnt_flag |= MNT_SOFTDEP;
5457c7a6681SKonstantin Belousov 					MNT_IUNLOCK(mp);
5467c7a6681SKonstantin Belousov 				}
547ddd6b3fcSKonstantin Belousov 				vfs_write_resume(mp, 0);
548f2a2857bSKirk McKusick 				return (error);
5492b14f991SJulian Elischer 			}
5507c7a6681SKonstantin Belousov 			if (mounted_softdep)
5519420dc62SKirk McKusick 				softdep_unmount(mp);
55243920011SPoul-Henning Kamp 			g_topology_lock();
5538795189cSKirk McKusick 			/*
5548795189cSKirk McKusick 			 * Drop our write and exclusive access.
5558795189cSKirk McKusick 			 */
5568795189cSKirk McKusick 			g_access(ump->um_cp, 0, -1, -1);
55743920011SPoul-Henning Kamp 			g_topology_unlock();
5585da56ddbSTor Egge 			MNT_ILOCK(mp);
55920a92a18SPoul-Henning Kamp 			mp->mnt_flag |= MNT_RDONLY;
5605da56ddbSTor Egge 			MNT_IUNLOCK(mp);
5616fecb4e4SKonstantin Belousov 			/*
5626fecb4e4SKonstantin Belousov 			 * Allow the writers to note that filesystem
5636fecb4e4SKonstantin Belousov 			 * is ro now.
5646fecb4e4SKonstantin Belousov 			 */
565ddd6b3fcSKonstantin Belousov 			vfs_write_resume(mp, 0);
566f2a2857bSKirk McKusick 		}
567f2a2857bSKirk McKusick 		if ((mp->mnt_flag & MNT_RELOAD) &&
5681848286aSEdward Tomasz Napierala 		    (error = ffs_reload(mp, td, 0)) != 0)
569f2a2857bSKirk McKusick 			return (error);
57020a92a18SPoul-Henning Kamp 		if (fs->fs_ronly &&
57120a92a18SPoul-Henning Kamp 		    !vfs_flagopt(mp->mnt_optnew, "ro", NULL, 0)) {
572c9b99213SBruce Evans 			/*
573927a12aeSKirk McKusick 			 * If we are running a checker, do not allow upgrade.
574927a12aeSKirk McKusick 			 */
575927a12aeSKirk McKusick 			if (ump->um_fsckpid > 0) {
576b60ee81eSKirk McKusick 				vfs_mount_error(mp,
577b60ee81eSKirk McKusick 				    "Active checker, cannot upgrade to write");
578927a12aeSKirk McKusick 				return (EINVAL);
579927a12aeSKirk McKusick 			}
580927a12aeSKirk McKusick 			/*
581c9b99213SBruce Evans 			 * If upgrade to read-write by non-root, then verify
582c9b99213SBruce Evans 			 * that user has necessary permissions on the device.
583c9b99213SBruce Evans 			 */
584f15ccf88SChuck Silvers 			vn_lock(odevvp, LK_EXCLUSIVE | LK_RETRY);
585f15ccf88SChuck Silvers 			error = VOP_ACCESS(odevvp, VREAD | VWRITE,
586acd3428bSRobert Watson 			    td->td_ucred, td);
587acd3428bSRobert Watson 			if (error)
588acd3428bSRobert Watson 				error = priv_check(td, PRIV_VFS_MOUNT_PERM);
589f15ccf88SChuck Silvers 			VOP_UNLOCK(odevvp);
590acd3428bSRobert Watson 			if (error) {
591c9b99213SBruce Evans 				return (error);
592c9b99213SBruce Evans 			}
5937e58bfacSBruce Evans 			fs->fs_flags &= ~FS_UNCLEAN;
5940922cce6SBruce Evans 			if (fs->fs_clean == 0) {
5957e58bfacSBruce Evans 				fs->fs_flags |= FS_UNCLEAN;
596812b1d41SKirk McKusick 				if ((mp->mnt_flag & MNT_FORCE) ||
597113db2ddSJeff Roberson 				    ((fs->fs_flags &
598113db2ddSJeff Roberson 				     (FS_SUJ | FS_NEEDSFSCK)) == 0 &&
5991a6a6610SKirk McKusick 				     (fs->fs_flags & FS_DOSOFTDEP))) {
600b60ee81eSKirk McKusick 					printf("WARNING: %s was not properly "
601b60ee81eSKirk McKusick 					   "dismounted\n", fs->fs_fsmnt);
6020922cce6SBruce Evans 				} else {
603b60ee81eSKirk McKusick 					vfs_mount_error(mp,
604b60ee81eSKirk McKusick 					   "R/W mount of %s denied. %s.%s",
605b60ee81eSKirk McKusick 					   fs->fs_fsmnt,
606b60ee81eSKirk McKusick 					   "Filesystem is not clean - run fsck",
607b60ee81eSKirk McKusick 					   (fs->fs_flags & FS_SUJ) == 0 ? "" :
608b60ee81eSKirk McKusick 					   " Forced mount will invalidate"
609b60ee81eSKirk McKusick 					   " journal contents");
610f2a2857bSKirk McKusick 					return (EPERM);
6110922cce6SBruce Evans 				}
6120922cce6SBruce Evans 			}
61340c340aaSPoul-Henning Kamp 			g_topology_lock();
61440c340aaSPoul-Henning Kamp 			/*
6158795189cSKirk McKusick 			 * Request exclusive write access.
61640c340aaSPoul-Henning Kamp 			 */
61740c340aaSPoul-Henning Kamp 			error = g_access(ump->um_cp, 0, 1, 1);
61840c340aaSPoul-Henning Kamp 			g_topology_unlock();
61940c340aaSPoul-Henning Kamp 			if (error)
62040c340aaSPoul-Henning Kamp 				return (error);
621f2a2857bSKirk McKusick 			if ((error = vn_start_write(NULL, &mp, V_WAIT)) != 0)
622f2a2857bSKirk McKusick 				return (error);
6235ffc99e2SKonstantin Belousov 			error = vfs_write_suspend_umnt(mp);
6245ffc99e2SKonstantin Belousov 			if (error != 0)
6255ffc99e2SKonstantin Belousov 				return (error);
626f2a2857bSKirk McKusick 			fs->fs_ronly = 0;
6275da56ddbSTor Egge 			MNT_ILOCK(mp);
6285ffc99e2SKonstantin Belousov 			saved_mnt_flag = MNT_RDONLY;
6295ffc99e2SKonstantin Belousov 			if (MOUNTEDSOFTDEP(mp) && (mp->mnt_flag &
6305ffc99e2SKonstantin Belousov 			    MNT_ASYNC) != 0)
6315ffc99e2SKonstantin Belousov 				saved_mnt_flag |= MNT_ASYNC;
6325ffc99e2SKonstantin Belousov 			mp->mnt_flag &= ~saved_mnt_flag;
6335da56ddbSTor Egge 			MNT_IUNLOCK(mp);
634113db2ddSJeff Roberson 			fs->fs_mtime = time_second;
63526cf9c3bSPeter Wemm 			/* check to see if we need to start softdep */
636f2a2857bSKirk McKusick 			if ((fs->fs_flags & FS_DOSOFTDEP) &&
637a854ed98SJohn Baldwin 			    (error = softdep_mount(devvp, mp, fs, td->td_ucred))){
6385ffc99e2SKonstantin Belousov 				fs->fs_ronly = 1;
6395ffc99e2SKonstantin Belousov 				MNT_ILOCK(mp);
6405ffc99e2SKonstantin Belousov 				mp->mnt_flag |= saved_mnt_flag;
6415ffc99e2SKonstantin Belousov 				MNT_IUNLOCK(mp);
6425ffc99e2SKonstantin Belousov 				vfs_write_resume(mp, 0);
643f2a2857bSKirk McKusick 				return (error);
64426cf9c3bSPeter Wemm 			}
645113db2ddSJeff Roberson 			fs->fs_clean = 0;
646113db2ddSJeff Roberson 			if ((error = ffs_sbupdate(ump, MNT_WAIT, 0)) != 0) {
6475ffc99e2SKonstantin Belousov 				fs->fs_ronly = 1;
648f776c54cSKonstantin Belousov 				if ((fs->fs_flags & FS_DOSOFTDEP) != 0)
649f776c54cSKonstantin Belousov 					softdep_unmount(mp);
6505ffc99e2SKonstantin Belousov 				MNT_ILOCK(mp);
6515ffc99e2SKonstantin Belousov 				mp->mnt_flag |= saved_mnt_flag;
6525ffc99e2SKonstantin Belousov 				MNT_IUNLOCK(mp);
6535ffc99e2SKonstantin Belousov 				vfs_write_resume(mp, 0);
654113db2ddSJeff Roberson 				return (error);
655113db2ddSJeff Roberson 			}
656f2a2857bSKirk McKusick 			if (fs->fs_snapinum[0] != 0)
657f2a2857bSKirk McKusick 				ffs_snapshot_mount(mp);
6585ffc99e2SKonstantin Belousov 			vfs_write_resume(mp, 0);
6591469eec8SDavid Greenman 		}
660c11d2981SJulian Elischer 		/*
661c11d2981SJulian Elischer 		 * Soft updates is incompatible with "async",
662c11d2981SJulian Elischer 		 * so if we are doing softupdates stop the user
663c11d2981SJulian Elischer 		 * from setting the async flag in an update.
664c11d2981SJulian Elischer 		 * Softdep_mount() clears it in an initial mount
665c11d2981SJulian Elischer 		 * or ro->rw remount.
666c11d2981SJulian Elischer 		 */
667fddf7baeSKirk McKusick 		if (MOUNTEDSOFTDEP(mp)) {
6685da56ddbSTor Egge 			/* XXX: Reset too late ? */
6695da56ddbSTor Egge 			MNT_ILOCK(mp);
670c11d2981SJulian Elischer 			mp->mnt_flag &= ~MNT_ASYNC;
6715da56ddbSTor Egge 			MNT_IUNLOCK(mp);
6725da56ddbSTor Egge 		}
673df8bae1dSRodney W. Grimes 		/*
67439cfb239SPawel Jakub Dawidek 		 * Keep MNT_ACLS flag if it is stored in superblock.
67539cfb239SPawel Jakub Dawidek 		 */
6765da56ddbSTor Egge 		if ((fs->fs_flags & FS_ACLS) != 0) {
6775da56ddbSTor Egge 			/* XXX: Set too late ? */
6785da56ddbSTor Egge 			MNT_ILOCK(mp);
67939cfb239SPawel Jakub Dawidek 			mp->mnt_flag |= MNT_ACLS;
6805da56ddbSTor Egge 			MNT_IUNLOCK(mp);
6815da56ddbSTor Egge 		}
682cea90362SCraig Rodrigues 
6839340fc72SEdward Tomasz Napierala 		if ((fs->fs_flags & FS_NFS4ACLS) != 0) {
6849340fc72SEdward Tomasz Napierala 			/* XXX: Set too late ? */
6859340fc72SEdward Tomasz Napierala 			MNT_ILOCK(mp);
6869340fc72SEdward Tomasz Napierala 			mp->mnt_flag |= MNT_NFS4ACLS;
6879340fc72SEdward Tomasz Napierala 			MNT_IUNLOCK(mp);
6889340fc72SEdward Tomasz Napierala 		}
689927a12aeSKirk McKusick 		/*
690927a12aeSKirk McKusick 		 * If this is a request from fsck to clean up the filesystem,
691927a12aeSKirk McKusick 		 * then allow the specified pid to proceed.
692927a12aeSKirk McKusick 		 */
693927a12aeSKirk McKusick 		if (fsckpid > 0) {
694927a12aeSKirk McKusick 			if (ump->um_fsckpid != 0) {
695b60ee81eSKirk McKusick 				vfs_mount_error(mp,
696b60ee81eSKirk McKusick 				    "Active checker already running on %s",
697927a12aeSKirk McKusick 				    fs->fs_fsmnt);
698927a12aeSKirk McKusick 				return (EINVAL);
699927a12aeSKirk McKusick 			}
700fddf7baeSKirk McKusick 			KASSERT(MOUNTEDSOFTDEP(mp) == 0,
701927a12aeSKirk McKusick 			    ("soft updates enabled on read-only file system"));
702927a12aeSKirk McKusick 			g_topology_lock();
703927a12aeSKirk McKusick 			/*
704927a12aeSKirk McKusick 			 * Request write access.
705927a12aeSKirk McKusick 			 */
706927a12aeSKirk McKusick 			error = g_access(ump->um_cp, 0, 1, 0);
707927a12aeSKirk McKusick 			g_topology_unlock();
708927a12aeSKirk McKusick 			if (error) {
709b60ee81eSKirk McKusick 				vfs_mount_error(mp,
710b60ee81eSKirk McKusick 				    "Checker activation failed on %s",
711927a12aeSKirk McKusick 				    fs->fs_fsmnt);
712927a12aeSKirk McKusick 				return (error);
713927a12aeSKirk McKusick 			}
714927a12aeSKirk McKusick 			ump->um_fsckpid = fsckpid;
715927a12aeSKirk McKusick 			if (fs->fs_snapinum[0] != 0)
716927a12aeSKirk McKusick 				ffs_snapshot_mount(mp);
717927a12aeSKirk McKusick 			fs->fs_mtime = time_second;
718927a12aeSKirk McKusick 			fs->fs_fmod = 1;
719927a12aeSKirk McKusick 			fs->fs_clean = 0;
720927a12aeSKirk McKusick 			(void) ffs_sbupdate(ump, MNT_WAIT, 0);
721927a12aeSKirk McKusick 		}
7229340fc72SEdward Tomasz Napierala 
723f2a2857bSKirk McKusick 		/*
724f2a2857bSKirk McKusick 		 * If this is a snapshot request, take the snapshot.
725f2a2857bSKirk McKusick 		 */
726f2a2857bSKirk McKusick 		if (mp->mnt_flag & MNT_SNAPSHOT)
72720a92a18SPoul-Henning Kamp 			return (ffs_snapshot(mp, fspec));
728714b7df5SKonstantin Belousov 
729714b7df5SKonstantin Belousov 		/*
730714b7df5SKonstantin Belousov 		 * Must not call namei() while owning busy ref.
731714b7df5SKonstantin Belousov 		 */
732714b7df5SKonstantin Belousov 		vfs_unbusy(mp);
733df8bae1dSRodney W. Grimes 	}
7342b14f991SJulian Elischer 
735df8bae1dSRodney W. Grimes 	/*
736df8bae1dSRodney W. Grimes 	 * Not an update, or updating the name: look up the name
737e9827c6dSBruce Evans 	 * and verify that it refers to a sensible disk device.
738df8bae1dSRodney W. Grimes 	 */
739fdedad76SSuleiman Souhlal 	NDINIT(&ndp, LOOKUP, FOLLOW | LOCKLEAF, UIO_SYSSPACE, fspec, td);
740714b7df5SKonstantin Belousov 	error = namei(&ndp);
741714b7df5SKonstantin Belousov 	if ((mp->mnt_flag & MNT_UPDATE) != 0) {
742714b7df5SKonstantin Belousov 		/*
743714b7df5SKonstantin Belousov 		 * Unmount does not start if MNT_UPDATE is set.  Mount
744714b7df5SKonstantin Belousov 		 * update busies mp before setting MNT_UPDATE.  We
745714b7df5SKonstantin Belousov 		 * must be able to retain our busy ref successfully,
746714b7df5SKonstantin Belousov 		 * without sleep.
747714b7df5SKonstantin Belousov 		 */
748714b7df5SKonstantin Belousov 		error1 = vfs_busy(mp, MBF_NOWAIT);
749714b7df5SKonstantin Belousov 		MPASS(error1 == 0);
750714b7df5SKonstantin Belousov 	}
751714b7df5SKonstantin Belousov 	if (error != 0)
752f2a2857bSKirk McKusick 		return (error);
7535e8c582aSPoul-Henning Kamp 	NDFREE(&ndp, NDF_ONLY_PNBUF);
7545e8c582aSPoul-Henning Kamp 	devvp = ndp.ni_vp;
7557ad2a82dSMateusz Guzik 	if (!vn_isdisk_error(devvp, &error)) {
756fdedad76SSuleiman Souhlal 		vput(devvp);
757f2a2857bSKirk McKusick 		return (error);
758f2a2857bSKirk McKusick 	}
759c9b99213SBruce Evans 
760c9b99213SBruce Evans 	/*
761c9b99213SBruce Evans 	 * If mount by non-root, then verify that user has necessary
762c9b99213SBruce Evans 	 * permissions on the device.
763c9b99213SBruce Evans 	 */
76415bc6b2bSEdward Tomasz Napierala 	accmode = VREAD;
765c9b99213SBruce Evans 	if ((mp->mnt_flag & MNT_RDONLY) == 0)
76615bc6b2bSEdward Tomasz Napierala 		accmode |= VWRITE;
76715bc6b2bSEdward Tomasz Napierala 	error = VOP_ACCESS(devvp, accmode, td->td_ucred, td);
768acd3428bSRobert Watson 	if (error)
769acd3428bSRobert Watson 		error = priv_check(td, PRIV_VFS_MOUNT_PERM);
770acd3428bSRobert Watson 	if (error) {
771c9b99213SBruce Evans 		vput(devvp);
772c9b99213SBruce Evans 		return (error);
773c9b99213SBruce Evans 	}
774c9b99213SBruce Evans 
7752b14f991SJulian Elischer 	if (mp->mnt_flag & MNT_UPDATE) {
7762b14f991SJulian Elischer 		/*
777f2a2857bSKirk McKusick 		 * Update only
778f2a2857bSKirk McKusick 		 *
7793e425b96SJulian Elischer 		 * If it's not the same vnode, or at least the same device
7803e425b96SJulian Elischer 		 * then it's not correct.
7812b14f991SJulian Elischer 		 */
7822b14f991SJulian Elischer 
78343920011SPoul-Henning Kamp 		if (devvp->v_rdev != ump->um_devvp->v_rdev)
784f2a2857bSKirk McKusick 			error = EINVAL;	/* needs translation */
785fdedad76SSuleiman Souhlal 		vput(devvp);
786f2a2857bSKirk McKusick 		if (error)
787f2a2857bSKirk McKusick 			return (error);
7882b14f991SJulian Elischer 	} else {
7892b14f991SJulian Elischer 		/*
790f2a2857bSKirk McKusick 		 * New mount
7912b14f991SJulian Elischer 		 *
792f2a2857bSKirk McKusick 		 * We need the name for the mount point (also used for
793f2a2857bSKirk McKusick 		 * "last mounted on") copied in. If an error occurs,
794f2a2857bSKirk McKusick 		 * the mount point is discarded by the upper level code.
79598cbffd7SKonstantin Belousov 		 * Note that vfs_mount_alloc() populates f_mntonname for us.
796f2a2857bSKirk McKusick 		 */
797975512a9SPoul-Henning Kamp 		if ((error = ffs_mountfs(devvp, mp, td)) != 0) {
798f2a2857bSKirk McKusick 			vrele(devvp);
799f2a2857bSKirk McKusick 			return (error);
800f2a2857bSKirk McKusick 		}
801927a12aeSKirk McKusick 		if (fsckpid > 0) {
802fddf7baeSKirk McKusick 			KASSERT(MOUNTEDSOFTDEP(mp) == 0,
803927a12aeSKirk McKusick 			    ("soft updates enabled on read-only file system"));
804927a12aeSKirk McKusick 			ump = VFSTOUFS(mp);
805927a12aeSKirk McKusick 			fs = ump->um_fs;
806927a12aeSKirk McKusick 			g_topology_lock();
807927a12aeSKirk McKusick 			/*
808927a12aeSKirk McKusick 			 * Request write access.
809927a12aeSKirk McKusick 			 */
810927a12aeSKirk McKusick 			error = g_access(ump->um_cp, 0, 1, 0);
811927a12aeSKirk McKusick 			g_topology_unlock();
812927a12aeSKirk McKusick 			if (error) {
813b60ee81eSKirk McKusick 				printf("WARNING: %s: Checker activation "
814b60ee81eSKirk McKusick 				    "failed\n", fs->fs_fsmnt);
815927a12aeSKirk McKusick 			} else {
816927a12aeSKirk McKusick 				ump->um_fsckpid = fsckpid;
817927a12aeSKirk McKusick 				if (fs->fs_snapinum[0] != 0)
818927a12aeSKirk McKusick 					ffs_snapshot_mount(mp);
819927a12aeSKirk McKusick 				fs->fs_mtime = time_second;
820927a12aeSKirk McKusick 				fs->fs_clean = 0;
821927a12aeSKirk McKusick 				(void) ffs_sbupdate(ump, MNT_WAIT, 0);
822927a12aeSKirk McKusick 			}
823927a12aeSKirk McKusick 		}
824f2a2857bSKirk McKusick 	}
8259d5a594fSMateusz Guzik 
8269d5a594fSMateusz Guzik 	MNT_ILOCK(mp);
8279d5a594fSMateusz Guzik 	/*
8289d5a594fSMateusz Guzik 	 * This is racy versus lookup, see ufs_fplookup_vexec for details.
8299d5a594fSMateusz Guzik 	 */
8309d5a594fSMateusz Guzik 	if ((mp->mnt_kern_flag & MNTK_FPLOOKUP) != 0)
8319d5a594fSMateusz Guzik 		panic("MNTK_FPLOOKUP set on mount %p when it should not be", mp);
83203337743SMateusz Guzik 	if ((mp->mnt_flag & (MNT_ACLS | MNT_NFS4ACLS | MNT_UNION)) == 0)
8339d5a594fSMateusz Guzik 		mp->mnt_kern_flag |= MNTK_FPLOOKUP;
8349d5a594fSMateusz Guzik 	MNT_IUNLOCK(mp);
8359d5a594fSMateusz Guzik 
83620a92a18SPoul-Henning Kamp 	vfs_mountedfrom(mp, fspec);
837f2a2857bSKirk McKusick 	return (0);
8382b14f991SJulian Elischer }
8392b14f991SJulian Elischer 
840df8bae1dSRodney W. Grimes /*
84120a92a18SPoul-Henning Kamp  * Compatibility with old mount system call.
 *
 * Copies a legacy struct ufs_args in from 'data' with copyin(),
 * repackages two of its fields as named mount arguments appended to
 * 'ma' ("from" <- args.fspec, "export" <- args.export), and hands the
 * resulting argument list to kernel_mount() together with 'flags'.
 *
 * Returns EINVAL when 'data' is NULL, the copyin() error when the copy
 * fails, and otherwise whatever kernel_mount() returns.
 *
 * NOTE(review): 'data' is presumably a user-space address, since it is
 * fetched with copyin() and fspec is added with mount_argsu() - confirm
 * against the caller.
84220a92a18SPoul-Henning Kamp  */
84320a92a18SPoul-Henning Kamp 
84420a92a18SPoul-Henning Kamp static int
845cc672d35SKirk McKusick ffs_cmount(struct mntarg *ma, void *data, uint64_t flags)
84620a92a18SPoul-Henning Kamp {
84720a92a18SPoul-Henning Kamp 	struct ufs_args args;
84820a92a18SPoul-Henning Kamp 	int error;
84920a92a18SPoul-Henning Kamp 
	/* Nothing to translate without an argument structure. */
85020a92a18SPoul-Henning Kamp 	if (data == NULL)
85120a92a18SPoul-Henning Kamp 		return (EINVAL);
85220a92a18SPoul-Henning Kamp 	error = copyin(data, &args, sizeof args);
85320a92a18SPoul-Henning Kamp 	if (error)
85420a92a18SPoul-Henning Kamp 		return (error);
85520a92a18SPoul-Henning Kamp 
	/*
	 * Each helper returns the (possibly updated) argument list, which
	 * is threaded through 'ma' and finally passed to kernel_mount().
	 * The fspec string is bounded by MAXPATHLEN.
	 */
85620a92a18SPoul-Henning Kamp 	ma = mount_argsu(ma, "from", args.fspec, MAXPATHLEN);
8571f7104d7SRick Macklem 	ma = mount_arg(ma, "export", &args.export, sizeof(args.export));
85820a92a18SPoul-Henning Kamp 	error = kernel_mount(ma, flags);
85920a92a18SPoul-Henning Kamp 
86020a92a18SPoul-Henning Kamp 	return (error);
86120a92a18SPoul-Henning Kamp }
86220a92a18SPoul-Henning Kamp 
86320a92a18SPoul-Henning Kamp /*
864df8bae1dSRodney W. Grimes  * Reload all incore data for a filesystem (used after running fsck on
8651848286aSEdward Tomasz Napierala  * the root filesystem and finding things to fix). Unless FFSR_FORCE is
8661848286aSEdward Tomasz Napierala  * set in 'flags', the filesystem must be mounted read-only.
867df8bae1dSRodney W. Grimes  *
868df8bae1dSRodney W. Grimes  * Things to do to update the mount:
869df8bae1dSRodney W. Grimes  *	1) invalidate all cached meta-data.
870df8bae1dSRodney W. Grimes  *	2) re-read superblock from disk.
871df8bae1dSRodney W. Grimes  *	3) re-read summary information from disk.
872df8bae1dSRodney W. Grimes  *	4) invalidate all inactive vnodes.
873df426577SKonstantin Belousov  *	5) clear MNTK_SUSPEND2 and MNTK_SUSPENDED flags, allowing secondary
874df426577SKonstantin Belousov  *	   writers, if requested.
875df426577SKonstantin Belousov  *	6) invalidate all cached file data.
876df426577SKonstantin Belousov  *	7) re-read inode data for all active vnodes.
 *
 * NOTE(review): no code in the body below visibly corresponds to item 4;
 * confirm whether that item is stale.
 *
 * Arguments:
 *	mp	mount whose in-core state is reloaded.
 *	td	not referenced anywhere in this function.
 *	flags	tested for FFSR_FORCE (skip the read-only requirement) and
 *		FFSR_UNSUSPEND (perform item 5).
 *
 * Returns 0 on success; EINVAL if the mount is not read-only and
 * FFSR_FORCE is not set; EIO if the superblock read from disk fails the
 * magic number or block size checks; otherwise the error returned by
 * bread() or ffs_load_inode().  Panics if vinvalbuf() reports failure.
877df8bae1dSRodney W. Grimes  */
8781848286aSEdward Tomasz Napierala int
879df426577SKonstantin Belousov ffs_reload(struct mount *mp, struct thread *td, int flags)
880df8bae1dSRodney W. Grimes {
88182be0a5aSTor Egge 	struct vnode *vp, *mvp, *devvp;
882df8bae1dSRodney W. Grimes 	struct inode *ip;
883f55ff3f3SIan Dowse 	void *space;
884df8bae1dSRodney W. Grimes 	struct buf *bp;
885996c772fSJohn Dyson 	struct fs *fs, *newfs;
8863ba649d7SJeff Roberson 	struct ufsmount *ump;
8871c85e6a3SKirk McKusick 	ufs2_daddr_t sblockloc;
888ad544726SKirk McKusick 	int i, blks, error;
889ad544726SKirk McKusick 	u_long size;
890996c772fSJohn Dyson 	int32_t *lp;
891df8bae1dSRodney W. Grimes 
8923ba649d7SJeff Roberson 	ump = VFSTOUFS(mp);
8931848286aSEdward Tomasz Napierala 
	/*
	 * Refuse to reload a mount that is not read-only unless the caller
	 * passed FFSR_FORCE.  mnt_flag is sampled between MNT_ILOCK and
	 * MNT_IUNLOCK.
	 */
8941848286aSEdward Tomasz Napierala 	MNT_ILOCK(mp);
895df426577SKonstantin Belousov 	if ((mp->mnt_flag & MNT_RDONLY) == 0 && (flags & FFSR_FORCE) == 0) {
8961848286aSEdward Tomasz Napierala 		MNT_IUNLOCK(mp);
8971848286aSEdward Tomasz Napierala 		return (EINVAL);
8981848286aSEdward Tomasz Napierala 	}
8991848286aSEdward Tomasz Napierala 	MNT_IUNLOCK(mp);
9001848286aSEdward Tomasz Napierala 
901df8bae1dSRodney W. Grimes 	/*
902df8bae1dSRodney W. Grimes 	 * Step 1: invalidate all cached meta-data.
	 *
	 * The device vnode is locked exclusively around vinvalbuf(); a
	 * nonzero return from vinvalbuf() is treated as fatal.
903df8bae1dSRodney W. Grimes 	 */
9042b14f991SJulian Elischer 	devvp = VFSTOUFS(mp)->um_devvp;
905cb05b60aSAttilio Rao 	vn_lock(devvp, LK_EXCLUSIVE | LK_RETRY);
9060d7935fdSAttilio Rao 	if (vinvalbuf(devvp, 0, 0, 0) != 0)
907df8bae1dSRodney W. Grimes 		panic("ffs_reload: dirty1");
908b249ce48SMateusz Guzik 	VOP_UNLOCK(devvp);
90995e5e988SJohn Dyson 
910df8bae1dSRodney W. Grimes 	/*
911df8bae1dSRodney W. Grimes 	 * Step 2: re-read superblock from disk.
	 *
	 * The location and size used for the read come from the current
	 * in-core superblock (fs_sblockloc, fs_sbsize).
912df8bae1dSRodney W. Grimes 	 */
9131c85e6a3SKirk McKusick 	fs = VFSTOUFS(mp)->um_fs;
914ada981b2SKirk McKusick 	if ((error = bread(devvp, btodb(fs->fs_sblockloc), fs->fs_sbsize,
9151c85e6a3SKirk McKusick 	    NOCRED, &bp)) != 0)
916df8bae1dSRodney W. Grimes 		return (error);
917996c772fSJohn Dyson 	newfs = (struct fs *)bp->b_data;
	/*
	 * Sanity-check what was read: it must carry a UFS1 or UFS2 magic
	 * number and a block size no larger than MAXBSIZE and no smaller
	 * than struct fs itself.
	 */
9181c85e6a3SKirk McKusick 	if ((newfs->fs_magic != FS_UFS1_MAGIC &&
9191c85e6a3SKirk McKusick 	     newfs->fs_magic != FS_UFS2_MAGIC) ||
9201c85e6a3SKirk McKusick 	    newfs->fs_bsize > MAXBSIZE ||
921996c772fSJohn Dyson 	    newfs->fs_bsize < sizeof(struct fs)) {
922df8bae1dSRodney W. Grimes 			brelse(bp);
923df8bae1dSRodney W. Grimes 			return (EIO);		/* XXX needs translation */
924df8bae1dSRodney W. Grimes 	}
925996c772fSJohn Dyson 	/*
92634816cb9SKirk McKusick 	 * Preserve the summary information, read-only status, and
92734816cb9SKirk McKusick 	 * superblock location by copying these fields into our new
92834816cb9SKirk McKusick 	 * superblock before using it to update the existing superblock.
	 *
	 * The superblock location is kept in a local rather than in newfs
	 * and is handed to ffs_oldfscompat_read() below.  The length passed
	 * to bcopy() is the in-core fs_sbsize as it was before the copy.
929996c772fSJohn Dyson 	 */
93034816cb9SKirk McKusick 	newfs->fs_si = fs->fs_si;
9311848286aSEdward Tomasz Napierala 	newfs->fs_ronly = fs->fs_ronly;
9321c85e6a3SKirk McKusick 	sblockloc = fs->fs_sblockloc;
933996c772fSJohn Dyson 	bcopy(newfs, fs, (u_int)fs->fs_sbsize);
934df8bae1dSRodney W. Grimes 	brelse(bp);
935996c772fSJohn Dyson 	mp->mnt_maxsymlinklen = fs->fs_maxsymlinklen;
9361c85e6a3SKirk McKusick 	ffs_oldfscompat_read(fs, VFSTOUFS(mp), sblockloc);
	/*
	 * Nonzero pending block/inode counts in the reloaded superblock
	 * are reported and then zeroed, under UFS_LOCK.
	 */
9373ba649d7SJeff Roberson 	UFS_LOCK(ump);
9389ccb939eSKirk McKusick 	if (fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) {
939b60ee81eSKirk McKusick 		printf("WARNING: %s: reload pending error: blocks %jd "
940b60ee81eSKirk McKusick 		    "files %d\n", fs->fs_fsmnt, (intmax_t)fs->fs_pendingblocks,
9411c85e6a3SKirk McKusick 		    fs->fs_pendinginodes);
9429ccb939eSKirk McKusick 		fs->fs_pendingblocks = 0;
9439ccb939eSKirk McKusick 		fs->fs_pendinginodes = 0;
9449ccb939eSKirk McKusick 	}
9453ba649d7SJeff Roberson 	UFS_UNLOCK(ump);
946996c772fSJohn Dyson 
947df8bae1dSRodney W. Grimes 	/*
948df8bae1dSRodney W. Grimes 	 * Step 3: re-read summary information from disk.
	 *
	 * One buffer is allocated to hold fs_cssize bytes of summary data,
	 * followed by one int32_t per cylinder group (only when
	 * fs_contigsumsize > 0) and one u_int8_t per cylinder group.  The
	 * previous fs_csp buffer is freed before the new one is allocated.
949df8bae1dSRodney W. Grimes 	 */
9502b028c25SEdward Tomasz Napierala 	size = fs->fs_cssize;
9512b028c25SEdward Tomasz Napierala 	blks = howmany(size, fs->fs_fsize);
9522b028c25SEdward Tomasz Napierala 	if (fs->fs_contigsumsize > 0)
9532b028c25SEdward Tomasz Napierala 		size += fs->fs_ncg * sizeof(int32_t);
9542b028c25SEdward Tomasz Napierala 	size += fs->fs_ncg * sizeof(u_int8_t);
9552b028c25SEdward Tomasz Napierala 	free(fs->fs_csp, M_UFSMNT);
956ad544726SKirk McKusick 	space = malloc(size, M_UFSMNT, M_WAITOK);
9572b028c25SEdward Tomasz Napierala 	fs->fs_csp = space;
	/*
	 * Read the summary area fs_frag fragments (fs_bsize bytes) at a
	 * time; the final read is shortened to the fragments that remain.
	 * 'space' advances through the new buffer as each piece is copied.
	 */
958df8bae1dSRodney W. Grimes 	for (i = 0; i < blks; i += fs->fs_frag) {
959df8bae1dSRodney W. Grimes 		size = fs->fs_bsize;
960df8bae1dSRodney W. Grimes 		if (i + fs->fs_frag > blks)
961df8bae1dSRodney W. Grimes 			size = (blks - i) * fs->fs_fsize;
962c9671602SPoul-Henning Kamp 		error = bread(devvp, fsbtodb(fs, fs->fs_csaddr + i), size,
963c9671602SPoul-Henning Kamp 		    NOCRED, &bp);
		/*
		 * NOTE(review): on this early return fs_maxcluster and
		 * fs_contigdirs have not yet been re-pointed into the new
		 * buffer (that happens after the loop); if they referenced
		 * the buffer freed above they are stale - confirm.
		 */
964c9671602SPoul-Henning Kamp 		if (error)
965df8bae1dSRodney W. Grimes 			return (error);
966f55ff3f3SIan Dowse 		bcopy(bp->b_data, space, (u_int)size);
967f55ff3f3SIan Dowse 		space = (char *)space + size;
968df8bae1dSRodney W. Grimes 		brelse(bp);
969df8bae1dSRodney W. Grimes 	}
970996c772fSJohn Dyson 	/*
971996c772fSJohn Dyson 	 * We no longer know anything about clusters per cylinder group.
	 * Every fs_maxcluster entry is therefore reset to
	 * fs_contigsumsize.  The array lives directly after the summary
	 * data in the buffer allocated above.
972996c772fSJohn Dyson 	 */
973996c772fSJohn Dyson 	if (fs->fs_contigsumsize > 0) {
97472b8ff1cSEdward Tomasz Napierala 		fs->fs_maxcluster = lp = space;
975996c772fSJohn Dyson 		for (i = 0; i < fs->fs_ncg; i++)
976996c772fSJohn Dyson 			*lp++ = fs->fs_contigsumsize;
97772b8ff1cSEdward Tomasz Napierala 		space = lp;
978996c772fSJohn Dyson 	}
	/*
	 * The remaining fs_ncg bytes of the buffer become fs_contigdirs
	 * and are zeroed.
	 */
97972b8ff1cSEdward Tomasz Napierala 	size = fs->fs_ncg * sizeof(u_int8_t);
98072b8ff1cSEdward Tomasz Napierala 	fs->fs_contigdirs = (u_int8_t *)space;
98172b8ff1cSEdward Tomasz Napierala 	bzero(fs->fs_contigdirs, size);
	/*
	 * Step 5: if requested via FFSR_UNSUSPEND, clear the suspension
	 * flags under the mount interlock and wake up anything sleeping
	 * on &mp->mnt_flag.
	 */
982df426577SKonstantin Belousov 	if ((flags & FFSR_UNSUSPEND) != 0) {
983df426577SKonstantin Belousov 		MNT_ILOCK(mp);
984df426577SKonstantin Belousov 		mp->mnt_kern_flag &= ~(MNTK_SUSPENDED | MNTK_SUSPEND2);
985df426577SKonstantin Belousov 		wakeup(&mp->mnt_flag);
986df426577SKonstantin Belousov 		MNT_IUNLOCK(mp);
987df426577SKonstantin Belousov 	}
988996c772fSJohn Dyson 
	/*
	 * Walk every vnode on the mount.  If vget() fails the iteration is
	 * aborted and the whole scan restarts from this label.
	 */
989df8bae1dSRodney W. Grimes loop:
99071469bb3SKirk McKusick 	MNT_VNODE_FOREACH_ALL(vp, mp, mvp) {
991df8bae1dSRodney W. Grimes 		/*
9921848286aSEdward Tomasz Napierala 		 * Skip syncer vnode.
		 * NOTE(review): the iterator apparently hands back each
		 * vnode with its interlock held (hence VI_UNLOCK here and
		 * LK_INTERLOCK in the vget() below) - confirm.
9931848286aSEdward Tomasz Napierala 		 */
9941848286aSEdward Tomasz Napierala 		if (vp->v_type == VNON) {
9951848286aSEdward Tomasz Napierala 			VI_UNLOCK(vp);
9961848286aSEdward Tomasz Napierala 			continue;
9971848286aSEdward Tomasz Napierala 		}
9981848286aSEdward Tomasz Napierala 		/*
999fe68abe2SJeff Roberson 		 * Step 6: invalidate all cached file data.
1000df8bae1dSRodney W. Grimes 		 */
1001a92a971bSMateusz Guzik 		if (vget(vp, LK_EXCLUSIVE | LK_INTERLOCK)) {
100271469bb3SKirk McKusick 			MNT_VNODE_FOREACH_ALL_ABORT(mp, mvp);
1003df8bae1dSRodney W. Grimes 			goto loop;
1004996c772fSJohn Dyson 		}
10050d7935fdSAttilio Rao 		if (vinvalbuf(vp, 0, 0, 0))
1006df8bae1dSRodney W. Grimes 			panic("ffs_reload: dirty2");
1007df8bae1dSRodney W. Grimes 		/*
1008fe68abe2SJeff Roberson 		 * Step 7: re-read inode data for all active vnodes.
		 *
		 * The filesystem block containing the inode is read and
		 * passed to ffs_load_inode().  On either failure the vnode
		 * is released with vput() and the iteration is aborted
		 * before returning the error.
1009df8bae1dSRodney W. Grimes 		 */
1010df8bae1dSRodney W. Grimes 		ip = VTOI(vp);
1011c9671602SPoul-Henning Kamp 		error =
1012df8bae1dSRodney W. Grimes 		    bread(devvp, fsbtodb(fs, ino_to_fsba(fs, ip->i_number)),
1013c9671602SPoul-Henning Kamp 		    (int)fs->fs_bsize, NOCRED, &bp);
1014c9671602SPoul-Henning Kamp 		if (error) {
10159fc5d538SKirk McKusick 			vput(vp);
101671469bb3SKirk McKusick 			MNT_VNODE_FOREACH_ALL_ABORT(mp, mvp);
1017df8bae1dSRodney W. Grimes 			return (error);
1018df8bae1dSRodney W. Grimes 		}
10199fc5d538SKirk McKusick 		if ((error = ffs_load_inode(bp, ip, fs, ip->i_number)) != 0) {
10209fc5d538SKirk McKusick 			brelse(bp);
10219fc5d538SKirk McKusick 			vput(vp);
10229fc5d538SKirk McKusick 			MNT_VNODE_FOREACH_ALL_ABORT(mp, mvp);
10239fc5d538SKirk McKusick 			return (error);
10249fc5d538SKirk McKusick 		}
		/* Reset the effective link count to the reloaded i_nlink. */
1025b1897c19SJulian Elischer 		ip->i_effnlink = ip->i_nlink;
1026df8bae1dSRodney W. Grimes 		brelse(bp);
10279fc5d538SKirk McKusick 		vput(vp);
1028df8bae1dSRodney W. Grimes 	}
1029df8bae1dSRodney W. Grimes 	return (0);
1030df8bae1dSRodney W. Grimes }
1031df8bae1dSRodney W. Grimes 
10321c85e6a3SKirk McKusick /*
1033df8bae1dSRodney W. Grimes  * Common code for mount and mountroot
1034df8bae1dSRodney W. Grimes  */
1035975512a9SPoul-Henning Kamp static int
1036f15ccf88SChuck Silvers ffs_mountfs(odevvp, mp, td)
1037f15ccf88SChuck Silvers 	struct vnode *odevvp;
1038df8bae1dSRodney W. Grimes 	struct mount *mp;
1039b40ce416SJulian Elischer 	struct thread *td;
1040df8bae1dSRodney W. Grimes {
104105f4ff5dSPoul-Henning Kamp 	struct ufsmount *ump;
104205f4ff5dSPoul-Henning Kamp 	struct fs *fs;
104389c9c53dSPoul-Henning Kamp 	struct cdev *dev;
1044dffce215SKirk McKusick 	int error, i, len, ronly;
1045996c772fSJohn Dyson 	struct ucred *cred;
104643920011SPoul-Henning Kamp 	struct g_consumer *cp;
10473bbd6d8aSJeff Roberson 	struct mount *nmp;
1048f15ccf88SChuck Silvers 	struct vnode *devvp;
1049d79ff54bSChuck Silvers 	struct fsfail_task *etp;
105013532153SScott Long 	int candelete, canspeedup;
1051fb14e73cSKirk McKusick 	off_t loc;
1052df8bae1dSRodney W. Grimes 
1053dffce215SKirk McKusick 	fs = NULL;
1054ee445a69SJohn Baldwin 	ump = NULL;
1055a854ed98SJohn Baldwin 	cred = td ? td->td_ucred : NOCRED;
105643920011SPoul-Henning Kamp 	ronly = (mp->mnt_flag & MNT_RDONLY) != 0;
1057ee445a69SJohn Baldwin 
1058f15ccf88SChuck Silvers 	devvp = mntfs_allocvp(mp, odevvp);
1059f15ccf88SChuck Silvers 	VOP_UNLOCK(odevvp);
1060c70b3cd2SKonstantin Belousov 	KASSERT(devvp->v_type == VCHR, ("reclaimed devvp"));
1061ee445a69SJohn Baldwin 	dev = devvp->v_rdev;
106279a5c790SKirk McKusick 	KASSERT(dev->si_snapdata == NULL, ("non-NULL snapshot data"));
1063c70b3cd2SKonstantin Belousov 	if (atomic_cmpset_acq_ptr((uintptr_t *)&dev->si_mountpt, 0,
1064c70b3cd2SKonstantin Belousov 	    (uintptr_t)mp) == 0) {
1065f15ccf88SChuck Silvers 		mntfs_freevp(devvp);
1066c70b3cd2SKonstantin Belousov 		return (EBUSY);
1067c70b3cd2SKonstantin Belousov 	}
106843920011SPoul-Henning Kamp 	g_topology_lock();
106943920011SPoul-Henning Kamp 	error = g_vfs_open(devvp, &cp, "ffs", ronly ? 0 : 1);
107043920011SPoul-Henning Kamp 	g_topology_unlock();
1071c70b3cd2SKonstantin Belousov 	if (error != 0) {
1072c70b3cd2SKonstantin Belousov 		atomic_store_rel_ptr((uintptr_t *)&dev->si_mountpt, 0);
1073f15ccf88SChuck Silvers 		mntfs_freevp(devvp);
1074c70b3cd2SKonstantin Belousov 		return (error);
1075c70b3cd2SKonstantin Belousov 	}
1076c70b3cd2SKonstantin Belousov 	dev_ref(dev);
1077c70b3cd2SKonstantin Belousov 	devvp->v_bufobj.bo_ops = &ffs_ops;
1078f15ccf88SChuck Silvers 	BO_LOCK(&odevvp->v_bufobj);
1079f15ccf88SChuck Silvers 	odevvp->v_bufobj.bo_flag |= BO_NOBUFS;
1080f15ccf88SChuck Silvers 	BO_UNLOCK(&odevvp->v_bufobj);
1081c70b3cd2SKonstantin Belousov 	if (dev->si_iosize_max != 0)
1082c70b3cd2SKonstantin Belousov 		mp->mnt_iosize_max = dev->si_iosize_max;
1083cd853791SKonstantin Belousov 	if (mp->mnt_iosize_max > maxphys)
1084cd853791SKonstantin Belousov 		mp->mnt_iosize_max = maxphys;
108571ac2d7cSCraig Rodrigues 	if ((SBLOCKSIZE % cp->provider->sectorsize) != 0) {
108671ac2d7cSCraig Rodrigues 		error = EINVAL;
108771ac2d7cSCraig Rodrigues 		vfs_mount_error(mp,
108871ac2d7cSCraig Rodrigues 		    "Invalid sectorsize %d for superblock size %d",
108971ac2d7cSCraig Rodrigues 		    cp->provider->sectorsize, SBLOCKSIZE);
109071ac2d7cSCraig Rodrigues 		goto out;
109171ac2d7cSCraig Rodrigues 	}
1092dffce215SKirk McKusick 	/* fetch the superblock and summary information */
1093fb14e73cSKirk McKusick 	loc = STDSB;
1094fb14e73cSKirk McKusick 	if ((mp->mnt_flag & MNT_ROOTFS) != 0)
1095fb14e73cSKirk McKusick 		loc = STDSB_NOHASHFAIL;
1096fb14e73cSKirk McKusick 	if ((error = ffs_sbget(devvp, &fs, loc, M_UFSMNT, ffs_use_bread)) != 0)
1097df8bae1dSRodney W. Grimes 		goto out;
10980922cce6SBruce Evans 	fs->fs_flags &= ~FS_UNCLEAN;
10990922cce6SBruce Evans 	if (fs->fs_clean == 0) {
11000922cce6SBruce Evans 		fs->fs_flags |= FS_UNCLEAN;
1101812b1d41SKirk McKusick 		if (ronly || (mp->mnt_flag & MNT_FORCE) ||
1102113db2ddSJeff Roberson 		    ((fs->fs_flags & (FS_SUJ | FS_NEEDSFSCK)) == 0 &&
11031a6a6610SKirk McKusick 		     (fs->fs_flags & FS_DOSOFTDEP))) {
110459b3a4ebSDavid E. O'Brien 			printf("WARNING: %s was not properly dismounted\n",
11050922cce6SBruce Evans 			    fs->fs_fsmnt);
11061469eec8SDavid Greenman 		} else {
1107b60ee81eSKirk McKusick 			vfs_mount_error(mp, "R/W mount of %s denied. %s%s",
1108b60ee81eSKirk McKusick 			    fs->fs_fsmnt, "Filesystem is not clean - run fsck.",
1109b60ee81eSKirk McKusick 			    (fs->fs_flags & FS_SUJ) == 0 ? "" :
1110b60ee81eSKirk McKusick 			    " Forced mount will invalidate journal contents");
11111469eec8SDavid Greenman 			error = EPERM;
11121469eec8SDavid Greenman 			goto out;
11131469eec8SDavid Greenman 		}
11141c85e6a3SKirk McKusick 		if ((fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) &&
11151c85e6a3SKirk McKusick 		    (mp->mnt_flag & MNT_FORCE)) {
1116b60ee81eSKirk McKusick 			printf("WARNING: %s: lost blocks %jd files %d\n",
1117b60ee81eSKirk McKusick 			    fs->fs_fsmnt, (intmax_t)fs->fs_pendingblocks,
11181c85e6a3SKirk McKusick 			    fs->fs_pendinginodes);
11199ccb939eSKirk McKusick 			fs->fs_pendingblocks = 0;
11209ccb939eSKirk McKusick 			fs->fs_pendinginodes = 0;
11219ccb939eSKirk McKusick 		}
11229ccb939eSKirk McKusick 	}
11239ccb939eSKirk McKusick 	if (fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) {
1124b60ee81eSKirk McKusick 		printf("WARNING: %s: mount pending error: blocks %jd "
1125b60ee81eSKirk McKusick 		    "files %d\n", fs->fs_fsmnt, (intmax_t)fs->fs_pendingblocks,
11261c85e6a3SKirk McKusick 		    fs->fs_pendinginodes);
11279ccb939eSKirk McKusick 		fs->fs_pendingblocks = 0;
11289ccb939eSKirk McKusick 		fs->fs_pendinginodes = 0;
11291469eec8SDavid Greenman 	}
11301a60c7fcSPawel Jakub Dawidek 	if ((fs->fs_flags & FS_GJOURNAL) != 0) {
11311a60c7fcSPawel Jakub Dawidek #ifdef UFS_GJOURNAL
11321a60c7fcSPawel Jakub Dawidek 		/*
11331a60c7fcSPawel Jakub Dawidek 		 * Get journal provider name.
11341a60c7fcSPawel Jakub Dawidek 		 */
1135ad544726SKirk McKusick 		len = 1024;
1136ad544726SKirk McKusick 		mp->mnt_gjprovider = malloc((u_long)len, M_UFSMNT, M_WAITOK);
1137ad544726SKirk McKusick 		if (g_io_getattr("GJOURNAL::provider", cp, &len,
11381a60c7fcSPawel Jakub Dawidek 		    mp->mnt_gjprovider) == 0) {
1139ad544726SKirk McKusick 			mp->mnt_gjprovider = realloc(mp->mnt_gjprovider, len,
11401a60c7fcSPawel Jakub Dawidek 			    M_UFSMNT, M_WAITOK);
11411a60c7fcSPawel Jakub Dawidek 			MNT_ILOCK(mp);
11421a60c7fcSPawel Jakub Dawidek 			mp->mnt_flag |= MNT_GJOURNAL;
11431a60c7fcSPawel Jakub Dawidek 			MNT_IUNLOCK(mp);
11441a60c7fcSPawel Jakub Dawidek 		} else {
1145b60ee81eSKirk McKusick 			printf("WARNING: %s: GJOURNAL flag on fs "
1146b60ee81eSKirk McKusick 			    "but no gjournal provider below\n",
11471a60c7fcSPawel Jakub Dawidek 			    mp->mnt_stat.f_mntonname);
11481a60c7fcSPawel Jakub Dawidek 			free(mp->mnt_gjprovider, M_UFSMNT);
11491a60c7fcSPawel Jakub Dawidek 			mp->mnt_gjprovider = NULL;
11501a60c7fcSPawel Jakub Dawidek 		}
11511a60c7fcSPawel Jakub Dawidek #else
1152b60ee81eSKirk McKusick 		printf("WARNING: %s: GJOURNAL flag on fs but no "
1153b60ee81eSKirk McKusick 		    "UFS_GJOURNAL support\n", mp->mnt_stat.f_mntonname);
11541a60c7fcSPawel Jakub Dawidek #endif
11551a60c7fcSPawel Jakub Dawidek 	} else {
11561a60c7fcSPawel Jakub Dawidek 		mp->mnt_gjprovider = NULL;
11571a60c7fcSPawel Jakub Dawidek 	}
1158a163d034SWarner Losh 	ump = malloc(sizeof *ump, M_UFSMNT, M_WAITOK | M_ZERO);
115943920011SPoul-Henning Kamp 	ump->um_cp = cp;
116043920011SPoul-Henning Kamp 	ump->um_bo = &devvp->v_bufobj;
1161dffce215SKirk McKusick 	ump->um_fs = fs;
11621c85e6a3SKirk McKusick 	if (fs->fs_magic == FS_UFS1_MAGIC) {
11631c85e6a3SKirk McKusick 		ump->um_fstype = UFS1;
11641c85e6a3SKirk McKusick 		ump->um_balloc = ffs_balloc_ufs1;
11651c85e6a3SKirk McKusick 	} else {
11661c85e6a3SKirk McKusick 		ump->um_fstype = UFS2;
11671c85e6a3SKirk McKusick 		ump->um_balloc = ffs_balloc_ufs2;
11681c85e6a3SKirk McKusick 	}
1169cec0f20cSPoul-Henning Kamp 	ump->um_blkatoff = ffs_blkatoff;
1170cec0f20cSPoul-Henning Kamp 	ump->um_truncate = ffs_truncate;
1171987f5696SPoul-Henning Kamp 	ump->um_update = ffs_update;
1172cec0f20cSPoul-Henning Kamp 	ump->um_valloc = ffs_valloc;
1173cec0f20cSPoul-Henning Kamp 	ump->um_vfree = ffs_vfree;
1174975512a9SPoul-Henning Kamp 	ump->um_ifree = ffs_ifree;
117590446e36SKonstantin Belousov 	ump->um_rdonly = ffs_rdonly;
117616b1f68dSKonstantin Belousov 	ump->um_snapgone = ffs_snapgone;
1177fdf34aa3SKirk McKusick 	if ((mp->mnt_flag & MNT_UNTRUSTED) != 0)
1178fdf34aa3SKirk McKusick 		ump->um_check_blkno = ffs_check_blkno;
1179fdf34aa3SKirk McKusick 	else
1180fdf34aa3SKirk McKusick 		ump->um_check_blkno = NULL;
11813ba649d7SJeff Roberson 	mtx_init(UFS_MTX(ump), "FFS", "FFS Lock", MTX_DEF);
1182dffce215SKirk McKusick 	ffs_oldfscompat_read(fs, ump, fs->fs_sblockloc);
1183df8bae1dSRodney W. Grimes 	fs->fs_ronly = ronly;
1184143a5346SIan Dowse 	fs->fs_active = NULL;
118577465d93SAlfred Perlstein 	mp->mnt_data = ump;
118668de329eSPoul-Henning Kamp 	mp->mnt_stat.f_fsid.val[0] = fs->fs_id[0];
11878f89943eSGuido van Rooij 	mp->mnt_stat.f_fsid.val[1] = fs->fs_id[1];
11883bbd6d8aSJeff Roberson 	nmp = NULL;
118968de329eSPoul-Henning Kamp 	if (fs->fs_id[0] == 0 || fs->fs_id[1] == 0 ||
11903bbd6d8aSJeff Roberson 	    (nmp = vfs_getvfs(&mp->mnt_stat.f_fsid))) {
11913bbd6d8aSJeff Roberson 		if (nmp)
11923bbd6d8aSJeff Roberson 			vfs_rel(nmp);
119368de329eSPoul-Henning Kamp 		vfs_getnewfsid(mp);
11943bbd6d8aSJeff Roberson 	}
1195df8bae1dSRodney W. Grimes 	mp->mnt_maxsymlinklen = fs->fs_maxsymlinklen;
11965da56ddbSTor Egge 	MNT_ILOCK(mp);
1197cc9d8990SPeter Wemm 	mp->mnt_flag |= MNT_LOCAL;
11985da56ddbSTor Egge 	MNT_IUNLOCK(mp);
11995da56ddbSTor Egge 	if ((fs->fs_flags & FS_MULTILABEL) != 0) {
12007b3f1bbdSTom Rhodes #ifdef MAC
12015da56ddbSTor Egge 		MNT_ILOCK(mp);
120280830407SRobert Watson 		mp->mnt_flag |= MNT_MULTILABEL;
12035da56ddbSTor Egge 		MNT_IUNLOCK(mp);
12047b3f1bbdSTom Rhodes #else
1205b60ee81eSKirk McKusick 		printf("WARNING: %s: multilabel flag on fs but "
1206b60ee81eSKirk McKusick 		    "no MAC support\n", mp->mnt_stat.f_mntonname);
12077b3f1bbdSTom Rhodes #endif
12085da56ddbSTor Egge 	}
12095da56ddbSTor Egge 	if ((fs->fs_flags & FS_ACLS) != 0) {
12107b3f1bbdSTom Rhodes #ifdef UFS_ACL
12115da56ddbSTor Egge 		MNT_ILOCK(mp);
12129340fc72SEdward Tomasz Napierala 
12139340fc72SEdward Tomasz Napierala 		if (mp->mnt_flag & MNT_NFS4ACLS)
1214b60ee81eSKirk McKusick 			printf("WARNING: %s: ACLs flag on fs conflicts with "
1215b60ee81eSKirk McKusick 			    "\"nfsv4acls\" mount option; option ignored\n",
1216b60ee81eSKirk McKusick 			    mp->mnt_stat.f_mntonname);
12179340fc72SEdward Tomasz Napierala 		mp->mnt_flag &= ~MNT_NFS4ACLS;
121880830407SRobert Watson 		mp->mnt_flag |= MNT_ACLS;
12199340fc72SEdward Tomasz Napierala 
12205da56ddbSTor Egge 		MNT_IUNLOCK(mp);
12217b3f1bbdSTom Rhodes #else
122259b3a4ebSDavid E. O'Brien 		printf("WARNING: %s: ACLs flag on fs but no ACLs support\n",
1223946478fcSPawel Jakub Dawidek 		    mp->mnt_stat.f_mntonname);
12247b3f1bbdSTom Rhodes #endif
12255da56ddbSTor Egge 	}
12269340fc72SEdward Tomasz Napierala 	if ((fs->fs_flags & FS_NFS4ACLS) != 0) {
12279340fc72SEdward Tomasz Napierala #ifdef UFS_ACL
12289340fc72SEdward Tomasz Napierala 		MNT_ILOCK(mp);
12299340fc72SEdward Tomasz Napierala 
12309340fc72SEdward Tomasz Napierala 		if (mp->mnt_flag & MNT_ACLS)
1231b60ee81eSKirk McKusick 			printf("WARNING: %s: NFSv4 ACLs flag on fs conflicts "
1232b60ee81eSKirk McKusick 			    "with \"acls\" mount option; option ignored\n",
1233b60ee81eSKirk McKusick 			    mp->mnt_stat.f_mntonname);
12349340fc72SEdward Tomasz Napierala 		mp->mnt_flag &= ~MNT_ACLS;
12359340fc72SEdward Tomasz Napierala 		mp->mnt_flag |= MNT_NFS4ACLS;
12369340fc72SEdward Tomasz Napierala 
12379340fc72SEdward Tomasz Napierala 		MNT_IUNLOCK(mp);
12389340fc72SEdward Tomasz Napierala #else
1239b60ee81eSKirk McKusick 		printf("WARNING: %s: NFSv4 ACLs flag on fs but no "
1240b60ee81eSKirk McKusick 		    "ACLs support\n", mp->mnt_stat.f_mntonname);
12419340fc72SEdward Tomasz Napierala #endif
12429340fc72SEdward Tomasz Napierala 	}
12438c2a54deSKonstantin Belousov 	if ((fs->fs_flags & FS_TRIM) != 0) {
1244ad544726SKirk McKusick 		len = sizeof(int);
1245ad544726SKirk McKusick 		if (g_io_getattr("GEOM::candelete", cp, &len,
1246ab0bcb60SKirk McKusick 		    &candelete) == 0) {
1247ab0bcb60SKirk McKusick 			if (candelete)
1248ab0bcb60SKirk McKusick 				ump->um_flags |= UM_CANDELETE;
1249ab0bcb60SKirk McKusick 			else
1250b60ee81eSKirk McKusick 				printf("WARNING: %s: TRIM flag on fs but disk "
1251b60ee81eSKirk McKusick 				    "does not support TRIM\n",
12528c2a54deSKonstantin Belousov 				    mp->mnt_stat.f_mntonname);
12538c2a54deSKonstantin Belousov 		} else {
1254b60ee81eSKirk McKusick 			printf("WARNING: %s: TRIM flag on fs but disk does "
1255b60ee81eSKirk McKusick 			    "not confirm that it supports TRIM\n",
12568c2a54deSKonstantin Belousov 			    mp->mnt_stat.f_mntonname);
12578c2a54deSKonstantin Belousov 		}
1258ab0bcb60SKirk McKusick 		if (((ump->um_flags) & UM_CANDELETE) != 0) {
1259c79dff0fSKonstantin Belousov 			ump->um_trim_tq = taskqueue_create("trim", M_WAITOK,
1260c79dff0fSKonstantin Belousov 			    taskqueue_thread_enqueue, &ump->um_trim_tq);
1261c79dff0fSKonstantin Belousov 			taskqueue_start_threads(&ump->um_trim_tq, 1, PVFS,
1262c79dff0fSKonstantin Belousov 			    "%s trim", mp->mnt_stat.f_mntonname);
12637e038bc2SKirk McKusick 			ump->um_trimhash = hashinit(MAXTRIMIO, M_TRIM,
12647e038bc2SKirk McKusick 			    &ump->um_trimlisthashsize);
1265c79dff0fSKonstantin Belousov 		}
12668c2a54deSKonstantin Belousov 	}
12679340fc72SEdward Tomasz Napierala 
126813532153SScott Long 	len = sizeof(int);
126913532153SScott Long 	if (g_io_getattr("GEOM::canspeedup", cp, &len, &canspeedup) == 0) {
127013532153SScott Long 		if (canspeedup)
127113532153SScott Long 			ump->um_flags |= UM_CANSPEEDUP;
127213532153SScott Long 	}
127313532153SScott Long 
1274df8bae1dSRodney W. Grimes 	ump->um_mountp = mp;
1275df8bae1dSRodney W. Grimes 	ump->um_dev = dev;
1276df8bae1dSRodney W. Grimes 	ump->um_devvp = devvp;
1277f15ccf88SChuck Silvers 	ump->um_odevvp = odevvp;
1278df8bae1dSRodney W. Grimes 	ump->um_nindir = fs->fs_nindir;
1279df8bae1dSRodney W. Grimes 	ump->um_bptrtodb = fs->fs_fsbtodb;
1280df8bae1dSRodney W. Grimes 	ump->um_seqinc = fs->fs_frag;
1281df8bae1dSRodney W. Grimes 	for (i = 0; i < MAXQUOTAS; i++)
1282df8bae1dSRodney W. Grimes 		ump->um_quotas[i] = NULLVP;
1283516081f2SRobert Watson #ifdef UFS_EXTATTR
1284a64ed089SRobert Watson 	ufs_extattr_uepm_init(&ump->um_extattr);
1285a64ed089SRobert Watson #endif
12862b14f991SJulian Elischer 	/*
12872b14f991SJulian Elischer 	 * Set FS local "last mounted on" information (NULL pad)
12882b14f991SJulian Elischer 	 */
128993373c42SSuleiman Souhlal 	bzero(fs->fs_fsmnt, MAXMNTLEN);
129093373c42SSuleiman Souhlal 	strlcpy(fs->fs_fsmnt, mp->mnt_stat.f_mntonname, MAXMNTLEN);
1291113db2ddSJeff Roberson 	mp->mnt_stat.f_iosize = fs->fs_bsize;
12922b14f991SJulian Elischer 
12932b14f991SJulian Elischer 	if (mp->mnt_flag & MNT_ROOTFS) {
12942b14f991SJulian Elischer 		/*
12952b14f991SJulian Elischer 		 * Root mount; update timestamp in mount structure.
12962b14f991SJulian Elischer 		 * this will be used by the common root mount code
12972b14f991SJulian Elischer 		 * to update the system clock.
12982b14f991SJulian Elischer 		 */
12992b14f991SJulian Elischer 		mp->mnt_time = fs->fs_time;
13002b14f991SJulian Elischer 	}
1301996c772fSJohn Dyson 
1302996c772fSJohn Dyson 	if (ronly == 0) {
1303113db2ddSJeff Roberson 		fs->fs_mtime = time_second;
1304b1897c19SJulian Elischer 		if ((fs->fs_flags & FS_DOSOFTDEP) &&
1305b1897c19SJulian Elischer 		    (error = softdep_mount(devvp, mp, fs, cred)) != 0) {
1306fddd463dSKonstantin Belousov 			ffs_flushfiles(mp, FORCECLOSE, td);
1307b1897c19SJulian Elischer 			goto out;
1308b1897c19SJulian Elischer 		}
1309f2a2857bSKirk McKusick 		if (fs->fs_snapinum[0] != 0)
1310f2a2857bSKirk McKusick 			ffs_snapshot_mount(mp);
1311cf60e8e4SKirk McKusick 		fs->fs_fmod = 1;
1312996c772fSJohn Dyson 		fs->fs_clean = 0;
1313791dd2faSTor Egge 		(void) ffs_sbupdate(ump, MNT_WAIT, 0);
1314996c772fSJohn Dyson 	}
1315d8d3d415SPoul-Henning Kamp 	/*
131698cbffd7SKonstantin Belousov 	 * Initialize filesystem state information in mount struct.
1317d8d3d415SPoul-Henning Kamp 	 */
13186cf7bc60SRobert Watson 	MNT_ILOCK(mp);
1319bc2258daSAttilio Rao 	mp->mnt_kern_flag |= MNTK_LOOKUP_SHARED | MNTK_EXTENDED_SHARED |
13205f34e93cSMark Johnston 	    MNTK_NO_IOPF | MNTK_UNMAPPED_BUFS | MNTK_USES_BCACHE;
13216cf7bc60SRobert Watson 	MNT_IUNLOCK(mp);
1322516081f2SRobert Watson #ifdef UFS_EXTATTR
1323516081f2SRobert Watson #ifdef UFS_EXTATTR_AUTOSTART
13249de54ba5SRobert Watson 	/*
13259de54ba5SRobert Watson 	 *
1326f5161237SRobert Watson 	 * Auto-starting does the following:
13279de54ba5SRobert Watson 	 *	- check for /.attribute in the fs, and extattr_start if so
13289de54ba5SRobert Watson 	 *	- for each file in .attribute, enable that file with
13299de54ba5SRobert Watson 	 * 	  an attribute of the same name.
13309de54ba5SRobert Watson 	 * Not clear how to report errors -- probably eat them.
13319de54ba5SRobert Watson 	 * This would all happen while the filesystem was busy/not
13329de54ba5SRobert Watson 	 * available, so would effectively be "atomic".
13339de54ba5SRobert Watson 	 */
1334b40ce416SJulian Elischer 	(void) ufs_extattr_autostart(mp, td);
1335516081f2SRobert Watson #endif /* !UFS_EXTATTR_AUTOSTART */
1336516081f2SRobert Watson #endif /* !UFS_EXTATTR */
1337d79ff54bSChuck Silvers 	etp = malloc(sizeof *ump->um_fsfail_task, M_UFSMNT, M_WAITOK | M_ZERO);
1338d79ff54bSChuck Silvers 	etp->fsid = mp->mnt_stat.f_fsid;
1339d79ff54bSChuck Silvers 	ump->um_fsfail_task = etp;
1340df8bae1dSRodney W. Grimes 	return (0);
1341df8bae1dSRodney W. Grimes out:
1342dffce215SKirk McKusick 	if (fs != NULL) {
1343dffce215SKirk McKusick 		free(fs->fs_csp, M_UFSMNT);
134434816cb9SKirk McKusick 		free(fs->fs_si, M_UFSMNT);
1345dffce215SKirk McKusick 		free(fs, M_UFSMNT);
1346dffce215SKirk McKusick 	}
134743920011SPoul-Henning Kamp 	if (cp != NULL) {
134843920011SPoul-Henning Kamp 		g_topology_lock();
13490d7935fdSAttilio Rao 		g_vfs_close(cp);
135043920011SPoul-Henning Kamp 		g_topology_unlock();
135143920011SPoul-Henning Kamp 	}
1352df8bae1dSRodney W. Grimes 	if (ump) {
13533ba649d7SJeff Roberson 		mtx_destroy(UFS_MTX(ump));
13541a60c7fcSPawel Jakub Dawidek 		if (mp->mnt_gjprovider != NULL) {
13551a60c7fcSPawel Jakub Dawidek 			free(mp->mnt_gjprovider, M_UFSMNT);
13561a60c7fcSPawel Jakub Dawidek 			mp->mnt_gjprovider = NULL;
13571a60c7fcSPawel Jakub Dawidek 		}
1358*2af934ccSKonstantin Belousov 		MPASS(ump->um_softdep == NULL);
1359df8bae1dSRodney W. Grimes 		free(ump, M_UFSMNT);
136077465d93SAlfred Perlstein 		mp->mnt_data = NULL;
1361df8bae1dSRodney W. Grimes 	}
1362f15ccf88SChuck Silvers 	BO_LOCK(&odevvp->v_bufobj);
1363f15ccf88SChuck Silvers 	odevvp->v_bufobj.bo_flag &= ~BO_NOBUFS;
1364f15ccf88SChuck Silvers 	BO_UNLOCK(&odevvp->v_bufobj);
1365c70b3cd2SKonstantin Belousov 	atomic_store_rel_ptr((uintptr_t *)&dev->si_mountpt, 0);
1366f15ccf88SChuck Silvers 	mntfs_freevp(devvp);
136749c4791cSEdward Tomasz Napierala 	dev_rel(dev);
1368df8bae1dSRodney W. Grimes 	return (error);
1369df8bae1dSRodney W. Grimes }
1370df8bae1dSRodney W. Grimes 
1371dffce215SKirk McKusick /*
1372dffce215SKirk McKusick  * A read function for use by filesystem-layer routines.
1373dffce215SKirk McKusick  */
1374dffce215SKirk McKusick static int
1375dffce215SKirk McKusick ffs_use_bread(void *devfd, off_t loc, void **bufp, int size)
1376dffce215SKirk McKusick {
1377dffce215SKirk McKusick 	struct buf *bp;
1378dffce215SKirk McKusick 	int error;
1379dffce215SKirk McKusick 
1380efbf3964SKirk McKusick 	KASSERT(*bufp == NULL, ("ffs_use_bread: non-NULL *bufp %p\n", *bufp));
1381dffce215SKirk McKusick 	*bufp = malloc(size, M_UFSMNT, M_WAITOK);
1382dffce215SKirk McKusick 	if ((error = bread((struct vnode *)devfd, btodb(loc), size, NOCRED,
1383efbf3964SKirk McKusick 	    &bp)) != 0)
1384dffce215SKirk McKusick 		return (error);
1385dffce215SKirk McKusick 	bcopy(bp->b_data, *bufp, size);
1386dffce215SKirk McKusick 	bp->b_flags |= B_INVAL | B_NOCACHE;
1387dffce215SKirk McKusick 	brelse(bp);
1388dffce215SKirk McKusick 	return (0);
1389dffce215SKirk McKusick }
1390dffce215SKirk McKusick 
1391adf41577SPoul-Henning Kamp static int bigcgs = 0;
13921c85e6a3SKirk McKusick SYSCTL_INT(_debug, OID_AUTO, bigcgs, CTLFLAG_RW, &bigcgs, 0, "");
13931c85e6a3SKirk McKusick 
1394df8bae1dSRodney W. Grimes /*
13951c85e6a3SKirk McKusick  * Sanity checks for loading old filesystem superblocks.
13961c85e6a3SKirk McKusick  * See ffs_oldfscompat_write below for unwound actions.
1397df8bae1dSRodney W. Grimes  *
13981c85e6a3SKirk McKusick  * XXX - Parts get retired eventually.
13991c85e6a3SKirk McKusick  * Unfortunately new bits get added.
1400df8bae1dSRodney W. Grimes  */
14011c85e6a3SKirk McKusick static void
14021c85e6a3SKirk McKusick ffs_oldfscompat_read(fs, ump, sblockloc)
1403df8bae1dSRodney W. Grimes 	struct fs *fs;
14041c85e6a3SKirk McKusick 	struct ufsmount *ump;
14051c85e6a3SKirk McKusick 	ufs2_daddr_t sblockloc;
14061c85e6a3SKirk McKusick {
14071c85e6a3SKirk McKusick 	off_t maxfilesize;
14081c85e6a3SKirk McKusick 
14091c85e6a3SKirk McKusick 	/*
1410ada981b2SKirk McKusick 	 * If not yet done, update fs_flags location and value of fs_sblockloc.
1411ada981b2SKirk McKusick 	 */
1412ada981b2SKirk McKusick 	if ((fs->fs_old_flags & FS_FLAGS_UPDATED) == 0) {
1413ada981b2SKirk McKusick 		fs->fs_flags = fs->fs_old_flags;
1414ada981b2SKirk McKusick 		fs->fs_old_flags |= FS_FLAGS_UPDATED;
1415ada981b2SKirk McKusick 		fs->fs_sblockloc = sblockloc;
1416ada981b2SKirk McKusick 	}
1417ada981b2SKirk McKusick 	/*
14181c85e6a3SKirk McKusick 	 * If not yet done, update UFS1 superblock with new wider fields.
14191c85e6a3SKirk McKusick 	 */
142074f3809aSKirk McKusick 	if (fs->fs_magic == FS_UFS1_MAGIC && fs->fs_maxbsize != fs->fs_bsize) {
14211c85e6a3SKirk McKusick 		fs->fs_maxbsize = fs->fs_bsize;
14221c85e6a3SKirk McKusick 		fs->fs_time = fs->fs_old_time;
14231c85e6a3SKirk McKusick 		fs->fs_size = fs->fs_old_size;
14241c85e6a3SKirk McKusick 		fs->fs_dsize = fs->fs_old_dsize;
14251c85e6a3SKirk McKusick 		fs->fs_csaddr = fs->fs_old_csaddr;
14261c85e6a3SKirk McKusick 		fs->fs_cstotal.cs_ndir = fs->fs_old_cstotal.cs_ndir;
14271c85e6a3SKirk McKusick 		fs->fs_cstotal.cs_nbfree = fs->fs_old_cstotal.cs_nbfree;
14281c85e6a3SKirk McKusick 		fs->fs_cstotal.cs_nifree = fs->fs_old_cstotal.cs_nifree;
14291c85e6a3SKirk McKusick 		fs->fs_cstotal.cs_nffree = fs->fs_old_cstotal.cs_nffree;
14301c85e6a3SKirk McKusick 	}
14311c85e6a3SKirk McKusick 	if (fs->fs_magic == FS_UFS1_MAGIC &&
14321c85e6a3SKirk McKusick 	    fs->fs_old_inodefmt < FS_44INODEFMT) {
14338680d698SNate Lawson 		fs->fs_maxfilesize = ((uint64_t)1 << 31) - 1;
14341c85e6a3SKirk McKusick 		fs->fs_qbmask = ~fs->fs_bmask;
14351c85e6a3SKirk McKusick 		fs->fs_qfmask = ~fs->fs_fmask;
14361c85e6a3SKirk McKusick 	}
14378f42fb8fSIan Dowse 	if (fs->fs_magic == FS_UFS1_MAGIC) {
14381c85e6a3SKirk McKusick 		ump->um_savedmaxfilesize = fs->fs_maxfilesize;
14398680d698SNate Lawson 		maxfilesize = (uint64_t)0x80000000 * fs->fs_bsize - 1;
14401c85e6a3SKirk McKusick 		if (fs->fs_maxfilesize > maxfilesize)
14411c85e6a3SKirk McKusick 			fs->fs_maxfilesize = maxfilesize;
14428f42fb8fSIan Dowse 	}
14431c85e6a3SKirk McKusick 	/* Compatibility for old filesystems */
14441c85e6a3SKirk McKusick 	if (fs->fs_avgfilesize <= 0)
14451c85e6a3SKirk McKusick 		fs->fs_avgfilesize = AVFILESIZ;
14461c85e6a3SKirk McKusick 	if (fs->fs_avgfpdir <= 0)
14471c85e6a3SKirk McKusick 		fs->fs_avgfpdir = AFPDIR;
14481c85e6a3SKirk McKusick 	if (bigcgs) {
14491c85e6a3SKirk McKusick 		fs->fs_save_cgsize = fs->fs_cgsize;
14501c85e6a3SKirk McKusick 		fs->fs_cgsize = fs->fs_bsize;
14511c85e6a3SKirk McKusick 	}
14521c85e6a3SKirk McKusick }
14531c85e6a3SKirk McKusick 
14541c85e6a3SKirk McKusick /*
14551c85e6a3SKirk McKusick  * Unwinding superblock updates for old filesystems.
14561c85e6a3SKirk McKusick  * See ffs_oldfscompat_read above for details.
14571c85e6a3SKirk McKusick  *
14581c85e6a3SKirk McKusick  * XXX - Parts get retired eventually.
14591c85e6a3SKirk McKusick  * Unfortunately new bits get added.
14601c85e6a3SKirk McKusick  */
1461113db2ddSJeff Roberson void
14621c85e6a3SKirk McKusick ffs_oldfscompat_write(fs, ump)
14631c85e6a3SKirk McKusick 	struct fs *fs;
14641c85e6a3SKirk McKusick 	struct ufsmount *ump;
1465df8bae1dSRodney W. Grimes {
1466df8bae1dSRodney W. Grimes 
14671c85e6a3SKirk McKusick 	/*
14681c85e6a3SKirk McKusick 	 * Copy back UFS2 updated fields that UFS1 inspects.
14691c85e6a3SKirk McKusick 	 */
14701c85e6a3SKirk McKusick 	if (fs->fs_magic == FS_UFS1_MAGIC) {
14711c85e6a3SKirk McKusick 		fs->fs_old_time = fs->fs_time;
14721c85e6a3SKirk McKusick 		fs->fs_old_cstotal.cs_ndir = fs->fs_cstotal.cs_ndir;
14731c85e6a3SKirk McKusick 		fs->fs_old_cstotal.cs_nbfree = fs->fs_cstotal.cs_nbfree;
14741c85e6a3SKirk McKusick 		fs->fs_old_cstotal.cs_nifree = fs->fs_cstotal.cs_nifree;
14751c85e6a3SKirk McKusick 		fs->fs_old_cstotal.cs_nffree = fs->fs_cstotal.cs_nffree;
14761c85e6a3SKirk McKusick 		fs->fs_maxfilesize = ump->um_savedmaxfilesize;
14778f42fb8fSIan Dowse 	}
14781c85e6a3SKirk McKusick 	if (bigcgs) {
14791c85e6a3SKirk McKusick 		fs->fs_cgsize = fs->fs_save_cgsize;
14801c85e6a3SKirk McKusick 		fs->fs_save_cgsize = 0;
14811c85e6a3SKirk McKusick 	}
1482df8bae1dSRodney W. Grimes }
1483df8bae1dSRodney W. Grimes 
1484df8bae1dSRodney W. Grimes /*
1485df8bae1dSRodney W. Grimes  * unmount system call
1486df8bae1dSRodney W. Grimes  */
1487adf41577SPoul-Henning Kamp static int
1488dfd233edSAttilio Rao ffs_unmount(mp, mntflags)
1489df8bae1dSRodney W. Grimes 	struct mount *mp;
1490df8bae1dSRodney W. Grimes 	int mntflags;
1491df8bae1dSRodney W. Grimes {
1492dfd233edSAttilio Rao 	struct thread *td;
149305f4ff5dSPoul-Henning Kamp 	struct ufsmount *ump = VFSTOUFS(mp);
149405f4ff5dSPoul-Henning Kamp 	struct fs *fs;
14956fecb4e4SKonstantin Belousov 	int error, flags, susp;
1496df86ccf6SKonstantin Belousov #ifdef UFS_EXTATTR
1497df86ccf6SKonstantin Belousov 	int e_restart;
1498df86ccf6SKonstantin Belousov #endif
1499df8bae1dSRodney W. Grimes 
1500df8bae1dSRodney W. Grimes 	flags = 0;
1501dfd233edSAttilio Rao 	td = curthread;
15026fecb4e4SKonstantin Belousov 	fs = ump->um_fs;
150371f26429SKonstantin Belousov 	if (mntflags & MNT_FORCE)
1504df8bae1dSRodney W. Grimes 		flags |= FORCECLOSE;
15054ce90426SKonstantin Belousov 	susp = fs->fs_ronly == 0;
1506516081f2SRobert Watson #ifdef UFS_EXTATTR
1507b40ce416SJulian Elischer 	if ((error = ufs_extattr_stop(mp, td))) {
1508b2b0497aSRobert Watson 		if (error != EOPNOTSUPP)
1509b60ee81eSKirk McKusick 			printf("WARNING: unmount %s: ufs_extattr_stop "
1510b60ee81eSKirk McKusick 			    "returned errno %d\n", mp->mnt_stat.f_mntonname,
1511b2b0497aSRobert Watson 			    error);
1512df86ccf6SKonstantin Belousov 		e_restart = 0;
15137df97b61SRobert Watson 	} else {
15149de54ba5SRobert Watson 		ufs_extattr_uepm_destroy(&ump->um_extattr);
1515df86ccf6SKonstantin Belousov 		e_restart = 1;
15167df97b61SRobert Watson 	}
1517a64ed089SRobert Watson #endif
15186fecb4e4SKonstantin Belousov 	if (susp) {
1519895b3782SKonstantin Belousov 		error = vfs_write_suspend_umnt(mp);
1520895b3782SKonstantin Belousov 		if (error != 0)
1521895b3782SKonstantin Belousov 			goto fail1;
15226fecb4e4SKonstantin Belousov 	}
1523fddf7baeSKirk McKusick 	if (MOUNTEDSOFTDEP(mp))
15243c140b2dSEdward Tomasz Napierala 		error = softdep_flushfiles(mp, flags, td);
15253c140b2dSEdward Tomasz Napierala 	else
15263c140b2dSEdward Tomasz Napierala 		error = ffs_flushfiles(mp, flags, td);
1527d79ff54bSChuck Silvers 	if (error != 0 && !ffs_fsfail_cleanup(ump, error))
15286fecb4e4SKonstantin Belousov 		goto fail;
15293c140b2dSEdward Tomasz Napierala 
15303ba649d7SJeff Roberson 	UFS_LOCK(ump);
15319ccb939eSKirk McKusick 	if (fs->fs_pendingblocks != 0 || fs->fs_pendinginodes != 0) {
1532b60ee81eSKirk McKusick 		printf("WARNING: unmount %s: pending error: blocks %jd "
1533b60ee81eSKirk McKusick 		    "files %d\n", fs->fs_fsmnt, (intmax_t)fs->fs_pendingblocks,
15341c85e6a3SKirk McKusick 		    fs->fs_pendinginodes);
15359ccb939eSKirk McKusick 		fs->fs_pendingblocks = 0;
15369ccb939eSKirk McKusick 		fs->fs_pendinginodes = 0;
15379ccb939eSKirk McKusick 	}
15383ba649d7SJeff Roberson 	UFS_UNLOCK(ump);
1539519e3c3bSKirk McKusick 	if (MOUNTEDSOFTDEP(mp))
1540113db2ddSJeff Roberson 		softdep_unmount(mp);
1541*2af934ccSKonstantin Belousov 	MPASS(ump->um_softdep == NULL);
1542927a12aeSKirk McKusick 	if (fs->fs_ronly == 0 || ump->um_fsckpid > 0) {
15431a6a6610SKirk McKusick 		fs->fs_clean = fs->fs_flags & (FS_UNCLEAN|FS_NEEDSFSCK) ? 0 : 1;
1544791dd2faSTor Egge 		error = ffs_sbupdate(ump, MNT_WAIT, 0);
1545d79ff54bSChuck Silvers 		if (ffs_fsfail_cleanup(ump, error))
1546d79ff54bSChuck Silvers 			error = 0;
1547d79ff54bSChuck Silvers 		if (error != 0 && !ffs_fsfail_cleanup(ump, error)) {
1548996c772fSJohn Dyson 			fs->fs_clean = 0;
15496fecb4e4SKonstantin Belousov 			goto fail;
1550996c772fSJohn Dyson 		}
1551e0e9c421SDavid Greenman 	}
1552ddd6b3fcSKonstantin Belousov 	if (susp)
1553ddd6b3fcSKonstantin Belousov 		vfs_write_resume(mp, VR_START_WRITE);
1554c79dff0fSKonstantin Belousov 	if (ump->um_trim_tq != NULL) {
1555c79dff0fSKonstantin Belousov 		while (ump->um_trim_inflight != 0)
1556c79dff0fSKonstantin Belousov 			pause("ufsutr", hz);
1557c79dff0fSKonstantin Belousov 		taskqueue_drain_all(ump->um_trim_tq);
1558c79dff0fSKonstantin Belousov 		taskqueue_free(ump->um_trim_tq);
15597e038bc2SKirk McKusick 		free (ump->um_trimhash, M_TRIM);
1560c79dff0fSKonstantin Belousov 	}
156143920011SPoul-Henning Kamp 	g_topology_lock();
1562927a12aeSKirk McKusick 	if (ump->um_fsckpid > 0) {
1563927a12aeSKirk McKusick 		/*
1564927a12aeSKirk McKusick 		 * Return to normal read-only mode.
1565927a12aeSKirk McKusick 		 */
1566927a12aeSKirk McKusick 		error = g_access(ump->um_cp, 0, -1, 0);
1567927a12aeSKirk McKusick 		ump->um_fsckpid = 0;
1568927a12aeSKirk McKusick 	}
15690d7935fdSAttilio Rao 	g_vfs_close(ump->um_cp);
157043920011SPoul-Henning Kamp 	g_topology_unlock();
1571f15ccf88SChuck Silvers 	BO_LOCK(&ump->um_odevvp->v_bufobj);
1572f15ccf88SChuck Silvers 	ump->um_odevvp->v_bufobj.bo_flag &= ~BO_NOBUFS;
1573f15ccf88SChuck Silvers 	BO_UNLOCK(&ump->um_odevvp->v_bufobj);
1574c70b3cd2SKonstantin Belousov 	atomic_store_rel_ptr((uintptr_t *)&ump->um_dev->si_mountpt, 0);
1575f15ccf88SChuck Silvers 	mntfs_freevp(ump->um_devvp);
1576f15ccf88SChuck Silvers 	vrele(ump->um_odevvp);
157749c4791cSEdward Tomasz Napierala 	dev_rel(ump->um_dev);
15783ba649d7SJeff Roberson 	mtx_destroy(UFS_MTX(ump));
15791a60c7fcSPawel Jakub Dawidek 	if (mp->mnt_gjprovider != NULL) {
15801a60c7fcSPawel Jakub Dawidek 		free(mp->mnt_gjprovider, M_UFSMNT);
15811a60c7fcSPawel Jakub Dawidek 		mp->mnt_gjprovider = NULL;
15821a60c7fcSPawel Jakub Dawidek 	}
1583f55ff3f3SIan Dowse 	free(fs->fs_csp, M_UFSMNT);
158434816cb9SKirk McKusick 	free(fs->fs_si, M_UFSMNT);
1585df8bae1dSRodney W. Grimes 	free(fs, M_UFSMNT);
1586d79ff54bSChuck Silvers 	if (ump->um_fsfail_task != NULL)
1587d79ff54bSChuck Silvers 		free(ump->um_fsfail_task, M_UFSMNT);
1588df8bae1dSRodney W. Grimes 	free(ump, M_UFSMNT);
158977465d93SAlfred Perlstein 	mp->mnt_data = NULL;
15905da56ddbSTor Egge 	MNT_ILOCK(mp);
1591cc9d8990SPeter Wemm 	mp->mnt_flag &= ~MNT_LOCAL;
15925da56ddbSTor Egge 	MNT_IUNLOCK(mp);
15934cbc378cSKonstantin Belousov 	if (td->td_su == mp) {
15944cbc378cSKonstantin Belousov 		td->td_su = NULL;
15954cbc378cSKonstantin Belousov 		vfs_rel(mp);
15964cbc378cSKonstantin Belousov 	}
1597df8bae1dSRodney W. Grimes 	return (error);
15986fecb4e4SKonstantin Belousov 
15996fecb4e4SKonstantin Belousov fail:
1600ddd6b3fcSKonstantin Belousov 	if (susp)
1601ddd6b3fcSKonstantin Belousov 		vfs_write_resume(mp, VR_START_WRITE);
1602895b3782SKonstantin Belousov fail1:
1603df86ccf6SKonstantin Belousov #ifdef UFS_EXTATTR
1604df86ccf6SKonstantin Belousov 	if (e_restart) {
1605df86ccf6SKonstantin Belousov 		ufs_extattr_uepm_init(&ump->um_extattr);
1606df86ccf6SKonstantin Belousov #ifdef UFS_EXTATTR_AUTOSTART
1607df86ccf6SKonstantin Belousov 		(void) ufs_extattr_autostart(mp, td);
1608df86ccf6SKonstantin Belousov #endif
1609df86ccf6SKonstantin Belousov 	}
1610df86ccf6SKonstantin Belousov #endif
1611df86ccf6SKonstantin Belousov 
16126fecb4e4SKonstantin Belousov 	return (error);
1613df8bae1dSRodney W. Grimes }
1614df8bae1dSRodney W. Grimes 
1615df8bae1dSRodney W. Grimes /*
1616df8bae1dSRodney W. Grimes  * Flush out all the files in a filesystem.
1617df8bae1dSRodney W. Grimes  */
161826f9a767SRodney W. Grimes int
1619b40ce416SJulian Elischer ffs_flushfiles(mp, flags, td)
162005f4ff5dSPoul-Henning Kamp 	struct mount *mp;
1621df8bae1dSRodney W. Grimes 	int flags;
1622b40ce416SJulian Elischer 	struct thread *td;
1623df8bae1dSRodney W. Grimes {
162405f4ff5dSPoul-Henning Kamp 	struct ufsmount *ump;
1625ba05dec5SKonstantin Belousov 	int qerror, error;
1626df8bae1dSRodney W. Grimes 
1627df8bae1dSRodney W. Grimes 	ump = VFSTOUFS(mp);
1628ba05dec5SKonstantin Belousov 	qerror = 0;
1629df8bae1dSRodney W. Grimes #ifdef QUOTA
1630df8bae1dSRodney W. Grimes 	if (mp->mnt_flag & MNT_QUOTA) {
1631c1d9efcbSPoul-Henning Kamp 		int i;
1632f257b7a5SAlfred Perlstein 		error = vflush(mp, 0, SKIPSYSTEM|flags, td);
1633c1d9efcbSPoul-Henning Kamp 		if (error)
1634df8bae1dSRodney W. Grimes 			return (error);
1635df8bae1dSRodney W. Grimes 		for (i = 0; i < MAXQUOTAS; i++) {
1636ba05dec5SKonstantin Belousov 			error = quotaoff(td, mp, i);
1637ba05dec5SKonstantin Belousov 			if (error != 0) {
1638ba05dec5SKonstantin Belousov 				if ((flags & EARLYFLUSH) == 0)
1639ba05dec5SKonstantin Belousov 					return (error);
1640ba05dec5SKonstantin Belousov 				else
1641ba05dec5SKonstantin Belousov 					qerror = error;
1642df8bae1dSRodney W. Grimes 			}
1643ba05dec5SKonstantin Belousov 		}
1644ba05dec5SKonstantin Belousov 
1645df8bae1dSRodney W. Grimes 		/*
1646ba05dec5SKonstantin Belousov 		 * Here we fall through to vflush again to ensure that
1647ba05dec5SKonstantin Belousov 		 * we have gotten rid of all the system vnodes, unless
1648ba05dec5SKonstantin Belousov 		 * quotas must not be closed.
1649df8bae1dSRodney W. Grimes 		 */
1650df8bae1dSRodney W. Grimes 	}
1651df8bae1dSRodney W. Grimes #endif
1652e6e370a7SJeff Roberson 	ASSERT_VOP_LOCKED(ump->um_devvp, "ffs_flushfiles");
1653e6e370a7SJeff Roberson 	if (ump->um_devvp->v_vflag & VV_COPYONWRITE) {
1654f257b7a5SAlfred Perlstein 		if ((error = vflush(mp, 0, SKIPSYSTEM | flags, td)) != 0)
1655f2a2857bSKirk McKusick 			return (error);
1656f2a2857bSKirk McKusick 		ffs_snapshot_unmount(mp);
165795e7a3c3STor Egge 		flags |= FORCECLOSE;
1658f2a2857bSKirk McKusick 		/*
1659f2a2857bSKirk McKusick 		 * Here we fall through to vflush again to ensure
1660f2a2857bSKirk McKusick 		 * that we have gotten rid of all the system vnodes.
1661f2a2857bSKirk McKusick 		 */
1662f2a2857bSKirk McKusick 	}
1663ba05dec5SKonstantin Belousov 
1664b1897c19SJulian Elischer 	/*
1665ba05dec5SKonstantin Belousov 	 * Do not close system files if quotas were not closed, to be
1666ba05dec5SKonstantin Belousov 	 * able to sync the remaining dquots.  The freeblks softupdate
1667ba05dec5SKonstantin Belousov 	 * workitems might hold a reference on a dquot, preventing
1668ba05dec5SKonstantin Belousov 	 * quotaoff() from completing.  Next round of
1669ba05dec5SKonstantin Belousov 	 * softdep_flushworklist() iteration should process the
1670ba05dec5SKonstantin Belousov 	 * blockers, allowing the next run of quotaoff() to finally
1671ba05dec5SKonstantin Belousov 	 * flush held dquots.
1672ba05dec5SKonstantin Belousov 	 *
1673ba05dec5SKonstantin Belousov 	 * Otherwise, flush all the files.
1674b1897c19SJulian Elischer 	 */
1675ba05dec5SKonstantin Belousov 	if (qerror == 0 && (error = vflush(mp, 0, flags, td)) != 0)
1676b1897c19SJulian Elischer 		return (error);
1677ba05dec5SKonstantin Belousov 
1678b1897c19SJulian Elischer 	/*
1679b1897c19SJulian Elischer 	 * Flush filesystem metadata.
1680b1897c19SJulian Elischer 	 */
1681cb05b60aSAttilio Rao 	vn_lock(ump->um_devvp, LK_EXCLUSIVE | LK_RETRY);
16828df6bac4SPoul-Henning Kamp 	error = VOP_FSYNC(ump->um_devvp, MNT_WAIT, td);
1683b249ce48SMateusz Guzik 	VOP_UNLOCK(ump->um_devvp);
1684df8bae1dSRodney W. Grimes 	return (error);
1685df8bae1dSRodney W. Grimes }
1686df8bae1dSRodney W. Grimes 
1687df8bae1dSRodney W. Grimes /*
1688df8bae1dSRodney W. Grimes  * Get filesystem statistics.
1689df8bae1dSRodney W. Grimes  */
1690adf41577SPoul-Henning Kamp static int
1691dfd233edSAttilio Rao ffs_statfs(mp, sbp)
1692df8bae1dSRodney W. Grimes 	struct mount *mp;
169305f4ff5dSPoul-Henning Kamp 	struct statfs *sbp;
1694df8bae1dSRodney W. Grimes {
169505f4ff5dSPoul-Henning Kamp 	struct ufsmount *ump;
169605f4ff5dSPoul-Henning Kamp 	struct fs *fs;
1697df8bae1dSRodney W. Grimes 
1698df8bae1dSRodney W. Grimes 	ump = VFSTOUFS(mp);
1699df8bae1dSRodney W. Grimes 	fs = ump->um_fs;
17001c85e6a3SKirk McKusick 	if (fs->fs_magic != FS_UFS1_MAGIC && fs->fs_magic != FS_UFS2_MAGIC)
1701df8bae1dSRodney W. Grimes 		panic("ffs_statfs");
1702fde81c7dSKirk McKusick 	sbp->f_version = STATFS_VERSION;
1703df8bae1dSRodney W. Grimes 	sbp->f_bsize = fs->fs_fsize;
1704df8bae1dSRodney W. Grimes 	sbp->f_iosize = fs->fs_bsize;
1705df8bae1dSRodney W. Grimes 	sbp->f_blocks = fs->fs_dsize;
17063ba649d7SJeff Roberson 	UFS_LOCK(ump);
1707df8bae1dSRodney W. Grimes 	sbp->f_bfree = fs->fs_cstotal.cs_nbfree * fs->fs_frag +
17089ccb939eSKirk McKusick 	    fs->fs_cstotal.cs_nffree + dbtofsb(fs, fs->fs_pendingblocks);
17099ccb939eSKirk McKusick 	sbp->f_bavail = freespace(fs, fs->fs_minfree) +
17109ccb939eSKirk McKusick 	    dbtofsb(fs, fs->fs_pendingblocks);
17111dc349abSEd Maste 	sbp->f_files =  fs->fs_ncg * fs->fs_ipg - UFS_ROOTINO;
17129ccb939eSKirk McKusick 	sbp->f_ffree = fs->fs_cstotal.cs_nifree + fs->fs_pendinginodes;
17133ba649d7SJeff Roberson 	UFS_UNLOCK(ump);
1714a96da1c3SConrad Meyer 	sbp->f_namemax = UFS_MAXNAMLEN;
1715df8bae1dSRodney W. Grimes 	return (0);
1716df8bae1dSRodney W. Grimes }
1717df8bae1dSRodney W. Grimes 
17181eabd967SKonstantin Belousov static bool
17191eabd967SKonstantin Belousov sync_doupdate(struct inode *ip)
17201eabd967SKonstantin Belousov {
17211eabd967SKonstantin Belousov 
17221eabd967SKonstantin Belousov 	return ((ip->i_flag & (IN_ACCESS | IN_CHANGE | IN_MODIFIED |
17231eabd967SKonstantin Belousov 	    IN_UPDATE)) != 0);
17241eabd967SKonstantin Belousov }
17251eabd967SKonstantin Belousov 
172680663cadSMateusz Guzik static int
172780663cadSMateusz Guzik ffs_sync_lazy_filter(struct vnode *vp, void *arg __unused)
172880663cadSMateusz Guzik {
172980663cadSMateusz Guzik 	struct inode *ip;
173080663cadSMateusz Guzik 
173180663cadSMateusz Guzik 	/*
173280663cadSMateusz Guzik 	 * Flags are safe to access because ->v_data invalidation
173380663cadSMateusz Guzik 	 * is held off by listmtx.
173480663cadSMateusz Guzik 	 */
173580663cadSMateusz Guzik 	if (vp->v_type == VNON)
173680663cadSMateusz Guzik 		return (false);
173780663cadSMateusz Guzik 	ip = VTOI(vp);
173880663cadSMateusz Guzik 	if (!sync_doupdate(ip) && (vp->v_iflag & VI_OWEINACT) == 0)
173980663cadSMateusz Guzik 		return (false);
174080663cadSMateusz Guzik 	return (true);
174180663cadSMateusz Guzik }
174280663cadSMateusz Guzik 
1743df8bae1dSRodney W. Grimes /*
1744a988a5c6SKonstantin Belousov  * For a lazy sync, we only care about access times, quotas and the
1745a988a5c6SKonstantin Belousov  * superblock.  Other filesystem changes are already converted to
1746a988a5c6SKonstantin Belousov  * cylinder group blocks or inode blocks updates and are written to
1747a988a5c6SKonstantin Belousov  * disk by syncer.
1748a988a5c6SKonstantin Belousov  */
1749a988a5c6SKonstantin Belousov static int
1750a988a5c6SKonstantin Belousov ffs_sync_lazy(mp)
1751a988a5c6SKonstantin Belousov      struct mount *mp;
1752a988a5c6SKonstantin Belousov {
1753a988a5c6SKonstantin Belousov 	struct vnode *mvp, *vp;
1754a988a5c6SKonstantin Belousov 	struct inode *ip;
1755a988a5c6SKonstantin Belousov 	struct thread *td;
1756a988a5c6SKonstantin Belousov 	int allerror, error;
1757a988a5c6SKonstantin Belousov 
1758a988a5c6SKonstantin Belousov 	allerror = 0;
1759a988a5c6SKonstantin Belousov 	td = curthread;
17600297c138SKirk McKusick 	if ((mp->mnt_flag & MNT_NOATIME) != 0) {
17610297c138SKirk McKusick #ifdef QUOTA
17620297c138SKirk McKusick 		qsync(mp);
17630297c138SKirk McKusick #endif
17640297c138SKirk McKusick 		goto sbupdate;
17650297c138SKirk McKusick 	}
176680663cadSMateusz Guzik 	MNT_VNODE_FOREACH_LAZY(vp, mp, mvp, ffs_sync_lazy_filter, NULL) {
176771469bb3SKirk McKusick 		if (vp->v_type == VNON) {
1768a988a5c6SKonstantin Belousov 			VI_UNLOCK(vp);
1769a988a5c6SKonstantin Belousov 			continue;
1770a988a5c6SKonstantin Belousov 		}
1771a988a5c6SKonstantin Belousov 		ip = VTOI(vp);
1772a988a5c6SKonstantin Belousov 
1773a988a5c6SKonstantin Belousov 		/*
1774a988a5c6SKonstantin Belousov 		 * The IN_ACCESS flag is converted to IN_MODIFIED by
1775a988a5c6SKonstantin Belousov 		 * ufs_close() and ufs_getattr() by the calls to
1776ea573a50SKonstantin Belousov 		 * ufs_itimes_locked(), without subsequent UFS_UPDATE().
1777ea573a50SKonstantin Belousov 		 * Test also all the other timestamp flags too, to pick up
1778ea573a50SKonstantin Belousov 		 * any other cases that could be missed.
1779a988a5c6SKonstantin Belousov 		 */
17801eabd967SKonstantin Belousov 		if (!sync_doupdate(ip) && (vp->v_iflag & VI_OWEINACT) == 0) {
1781a988a5c6SKonstantin Belousov 			VI_UNLOCK(vp);
1782a988a5c6SKonstantin Belousov 			continue;
1783a988a5c6SKonstantin Belousov 		}
1784a92a971bSMateusz Guzik 		if ((error = vget(vp, LK_EXCLUSIVE | LK_NOWAIT | LK_INTERLOCK)) != 0)
1785a988a5c6SKonstantin Belousov 			continue;
17860297c138SKirk McKusick #ifdef QUOTA
17870297c138SKirk McKusick 		qsyncvp(vp);
17880297c138SKirk McKusick #endif
17891eabd967SKonstantin Belousov 		if (sync_doupdate(ip))
1790a988a5c6SKonstantin Belousov 			error = ffs_update(vp, 0);
1791a988a5c6SKonstantin Belousov 		if (error != 0)
1792a988a5c6SKonstantin Belousov 			allerror = error;
1793a988a5c6SKonstantin Belousov 		vput(vp);
1794a988a5c6SKonstantin Belousov 	}
17950297c138SKirk McKusick sbupdate:
1796a988a5c6SKonstantin Belousov 	if (VFSTOUFS(mp)->um_fs->fs_fmod != 0 &&
1797a988a5c6SKonstantin Belousov 	    (error = ffs_sbupdate(VFSTOUFS(mp), MNT_LAZY, 0)) != 0)
1798a988a5c6SKonstantin Belousov 		allerror = error;
1799a988a5c6SKonstantin Belousov 	return (allerror);
1800a988a5c6SKonstantin Belousov }
1801a988a5c6SKonstantin Belousov 
1802a988a5c6SKonstantin Belousov /*
1803df8bae1dSRodney W. Grimes  * Go through the disk queues to initiate sandbagged IO;
1804df8bae1dSRodney W. Grimes  * go through the inodes to write those that have been modified;
1805df8bae1dSRodney W. Grimes  * initiate the writing of the super block if it has been modified.
1806df8bae1dSRodney W. Grimes  *
1807a988a5c6SKonstantin Belousov  * Note: we are always called with the filesystem marked busy using
1808a988a5c6SKonstantin Belousov  * vfs_busy().
1809df8bae1dSRodney W. Grimes  */
1810adf41577SPoul-Henning Kamp static int
1811dfd233edSAttilio Rao ffs_sync(mp, waitfor)
1812df8bae1dSRodney W. Grimes 	struct mount *mp;
1813df8bae1dSRodney W. Grimes 	int waitfor;
1814df8bae1dSRodney W. Grimes {
181582be0a5aSTor Egge 	struct vnode *mvp, *vp, *devvp;
1816dfd233edSAttilio Rao 	struct thread *td;
1817996c772fSJohn Dyson 	struct inode *ip;
1818996c772fSJohn Dyson 	struct ufsmount *ump = VFSTOUFS(mp);
1819996c772fSJohn Dyson 	struct fs *fs;
182069baeadcSKonstantin Belousov 	int error, count, lockreq, allerror = 0;
1821791dd2faSTor Egge 	int suspend;
1822791dd2faSTor Egge 	int suspended;
1823791dd2faSTor Egge 	int secondary_writes;
1824791dd2faSTor Egge 	int secondary_accwrites;
1825791dd2faSTor Egge 	int softdep_deps;
1826791dd2faSTor Egge 	int softdep_accdeps;
1827156cb265SPoul-Henning Kamp 	struct bufobj *bo;
1828df8bae1dSRodney W. Grimes 
182919c87af0SKirk McKusick 	suspend = 0;
183019c87af0SKirk McKusick 	suspended = 0;
1831dfd233edSAttilio Rao 	td = curthread;
1832df8bae1dSRodney W. Grimes 	fs = ump->um_fs;
1833b60ee81eSKirk McKusick 	if (fs->fs_fmod != 0 && fs->fs_ronly != 0 && ump->um_fsckpid == 0)
1834b60ee81eSKirk McKusick 		panic("%s: ffs_sync: modification on read-only filesystem",
1835b60ee81eSKirk McKusick 		    fs->fs_fsmnt);
18364af9f77eSKonstantin Belousov 	if (waitfor == MNT_LAZY) {
18374af9f77eSKonstantin Belousov 		if (!rebooting)
1838a988a5c6SKonstantin Belousov 			return (ffs_sync_lazy(mp));
18394af9f77eSKonstantin Belousov 		waitfor = MNT_NOWAIT;
18404af9f77eSKonstantin Belousov 	}
1841a988a5c6SKonstantin Belousov 
184219c87af0SKirk McKusick 	/*
1843df8bae1dSRodney W. Grimes 	 * Write back each (modified) inode.
1844df8bae1dSRodney W. Grimes 	 */
1845245df27cSMatthew Dillon 	lockreq = LK_EXCLUSIVE | LK_NOWAIT;
1846791dd2faSTor Egge 	if (waitfor == MNT_SUSPEND) {
1847791dd2faSTor Egge 		suspend = 1;
1848791dd2faSTor Egge 		waitfor = MNT_WAIT;
1849791dd2faSTor Egge 	}
185069baeadcSKonstantin Belousov 	if (waitfor == MNT_WAIT)
1851245df27cSMatthew Dillon 		lockreq = LK_EXCLUSIVE;
185241d4783dSJeff Roberson 	lockreq |= LK_INTERLOCK | LK_SLEEPFAIL;
1853df8bae1dSRodney W. Grimes loop:
1854791dd2faSTor Egge 	/* Grab snapshot of secondary write counts */
185571469bb3SKirk McKusick 	MNT_ILOCK(mp);
1856791dd2faSTor Egge 	secondary_writes = mp->mnt_secondary_writes;
1857791dd2faSTor Egge 	secondary_accwrites = mp->mnt_secondary_accwrites;
185871469bb3SKirk McKusick 	MNT_IUNLOCK(mp);
1859791dd2faSTor Egge 
1860791dd2faSTor Egge 	/* Grab snapshot of softdep dependency counts */
1861791dd2faSTor Egge 	softdep_get_depcounts(mp, &softdep_deps, &softdep_accdeps);
1862791dd2faSTor Egge 
186371469bb3SKirk McKusick 	MNT_VNODE_FOREACH_ALL(vp, mp, mvp) {
1864245df27cSMatthew Dillon 		/*
1865e0c17408SKonstantin Belousov 		 * Depend on the vnode interlock to keep things stable enough
1866245df27cSMatthew Dillon 		 * for a quick test.  Since there might be hundreds of
1867245df27cSMatthew Dillon 		 * thousands of vnodes, we cannot afford even a subroutine
1868245df27cSMatthew Dillon 		 * call unless there's a good chance that we have work to do.
1869245df27cSMatthew Dillon 		 */
187071469bb3SKirk McKusick 		if (vp->v_type == VNON) {
18712f05568aSJeff Roberson 			VI_UNLOCK(vp);
18722f05568aSJeff Roberson 			continue;
18732f05568aSJeff Roberson 		}
1874df8bae1dSRodney W. Grimes 		ip = VTOI(vp);
187571469bb3SKirk McKusick 		if ((ip->i_flag &
1876cf60e8e4SKirk McKusick 		    (IN_ACCESS | IN_CHANGE | IN_MODIFIED | IN_UPDATE)) == 0 &&
187771469bb3SKirk McKusick 		    vp->v_bufobj.bo_dirty.bv_cnt == 0) {
18782f05568aSJeff Roberson 			VI_UNLOCK(vp);
1879df8bae1dSRodney W. Grimes 			continue;
1880996c772fSJohn Dyson 		}
1881a92a971bSMateusz Guzik 		if ((error = vget(vp, lockreq)) != 0) {
188282be0a5aSTor Egge 			if (error == ENOENT || error == ENOLCK) {
188371469bb3SKirk McKusick 				MNT_VNODE_FOREACH_ALL_ABORT(mp, mvp);
1884df8bae1dSRodney W. Grimes 				goto loop;
188582be0a5aSTor Egge 			}
18862f05568aSJeff Roberson 			continue;
18872f05568aSJeff Roberson 		}
18880297c138SKirk McKusick #ifdef QUOTA
18890297c138SKirk McKusick 		qsyncvp(vp);
18900297c138SKirk McKusick #endif
18918a1509e4SKonstantin Belousov 		for (;;) {
18928a1509e4SKonstantin Belousov 			error = ffs_syncvnode(vp, waitfor, 0);
18938a1509e4SKonstantin Belousov 			if (error == ERELOOKUP)
18948a1509e4SKonstantin Belousov 				continue;
18958a1509e4SKonstantin Belousov 			if (error != 0)
1896df8bae1dSRodney W. Grimes 				allerror = error;
18978a1509e4SKonstantin Belousov 			break;
18988a1509e4SKonstantin Belousov 		}
189941d4783dSJeff Roberson 		vput(vp);
1900245df27cSMatthew Dillon 	}
1901df8bae1dSRodney W. Grimes 	/*
1902df8bae1dSRodney W. Grimes 	 * Force stale filesystem control information to be flushed.
1903df8bae1dSRodney W. Grimes 	 */
19044af9f77eSKonstantin Belousov 	if (waitfor == MNT_WAIT || rebooting) {
1905b40ce416SJulian Elischer 		if ((error = softdep_flushworklist(ump->um_mountp, &count, td)))
19069b971133SKirk McKusick 			allerror = error;
1907d79ff54bSChuck Silvers 		if (ffs_fsfail_cleanup(ump, allerror))
1908d79ff54bSChuck Silvers 			allerror = 0;
19099b971133SKirk McKusick 		/* Flushed work items may create new vnodes to clean */
191071469bb3SKirk McKusick 		if (allerror == 0 && count)
19119b971133SKirk McKusick 			goto loop;
19129b971133SKirk McKusick 	}
191319c87af0SKirk McKusick 
1914112f7372SKirk McKusick 	devvp = ump->um_devvp;
1915156cb265SPoul-Henning Kamp 	bo = &devvp->v_bufobj;
1916698b1a66SJeff Roberson 	BO_LOCK(bo);
191719c87af0SKirk McKusick 	if (bo->bo_numoutput > 0 || bo->bo_dirty.bv_cnt > 0) {
1918698b1a66SJeff Roberson 		BO_UNLOCK(bo);
1919698b1a66SJeff Roberson 		vn_lock(devvp, LK_EXCLUSIVE | LK_RETRY);
19204af9f77eSKonstantin Belousov 		error = VOP_FSYNC(devvp, waitfor, td);
1921b249ce48SMateusz Guzik 		VOP_UNLOCK(devvp);
19224af9f77eSKonstantin Belousov 		if (MOUNTEDSOFTDEP(mp) && (error == 0 || error == EAGAIN))
19234af9f77eSKonstantin Belousov 			error = ffs_sbupdate(ump, waitfor, 0);
19244af9f77eSKonstantin Belousov 		if (error != 0)
19254af9f77eSKonstantin Belousov 			allerror = error;
1926d79ff54bSChuck Silvers 		if (ffs_fsfail_cleanup(ump, allerror))
1927d79ff54bSChuck Silvers 			allerror = 0;
192871469bb3SKirk McKusick 		if (allerror == 0 && waitfor == MNT_WAIT)
1929112f7372SKirk McKusick 			goto loop;
1930791dd2faSTor Egge 	} else if (suspend != 0) {
1931791dd2faSTor Egge 		if (softdep_check_suspend(mp,
1932791dd2faSTor Egge 					  devvp,
1933791dd2faSTor Egge 					  softdep_deps,
1934791dd2faSTor Egge 					  softdep_accdeps,
1935791dd2faSTor Egge 					  secondary_writes,
193671469bb3SKirk McKusick 					  secondary_accwrites) != 0) {
193771469bb3SKirk McKusick 			MNT_IUNLOCK(mp);
1938791dd2faSTor Egge 			goto loop;	/* More work needed */
193971469bb3SKirk McKusick 		}
1940791dd2faSTor Egge 		mtx_assert(MNT_MTX(mp), MA_OWNED);
1941ca2fa807STor Egge 		mp->mnt_kern_flag |= MNTK_SUSPEND2 | MNTK_SUSPENDED;
1942791dd2faSTor Egge 		MNT_IUNLOCK(mp);
1943791dd2faSTor Egge 		suspended = 1;
1944112f7372SKirk McKusick 	} else
1945698b1a66SJeff Roberson 		BO_UNLOCK(bo);
1946996c772fSJohn Dyson 	/*
1947996c772fSJohn Dyson 	 * Write back modified superblock.
1948996c772fSJohn Dyson 	 */
1949791dd2faSTor Egge 	if (fs->fs_fmod != 0 &&
1950791dd2faSTor Egge 	    (error = ffs_sbupdate(ump, waitfor, suspended)) != 0)
1951996c772fSJohn Dyson 		allerror = error;
1952d79ff54bSChuck Silvers 	if (ffs_fsfail_cleanup(ump, allerror))
1953d79ff54bSChuck Silvers 		allerror = 0;
1954df8bae1dSRodney W. Grimes 	return (allerror);
1955df8bae1dSRodney W. Grimes }
1956df8bae1dSRodney W. Grimes 
1957df8bae1dSRodney W. Grimes int
1958a0595d02SKirk McKusick ffs_vget(mp, ino, flags, vpp)
1959df8bae1dSRodney W. Grimes 	struct mount *mp;
1960df8bae1dSRodney W. Grimes 	ino_t ino;
1961a0595d02SKirk McKusick 	int flags;
1962df8bae1dSRodney W. Grimes 	struct vnode **vpp;
1963df8bae1dSRodney W. Grimes {
19647b7ed832SKonstantin Belousov 	return (ffs_vgetf(mp, ino, flags, vpp, 0));
19657b7ed832SKonstantin Belousov }
19667b7ed832SKonstantin Belousov 
19677b7ed832SKonstantin Belousov int
19687b7ed832SKonstantin Belousov ffs_vgetf(mp, ino, flags, vpp, ffs_flags)
19697b7ed832SKonstantin Belousov 	struct mount *mp;
19707b7ed832SKonstantin Belousov 	ino_t ino;
19717b7ed832SKonstantin Belousov 	int flags;
19727b7ed832SKonstantin Belousov 	struct vnode **vpp;
19737b7ed832SKonstantin Belousov 	int ffs_flags;
19747b7ed832SKonstantin Belousov {
1975996c772fSJohn Dyson 	struct fs *fs;
1976996c772fSJohn Dyson 	struct inode *ip;
1977df8bae1dSRodney W. Grimes 	struct ufsmount *ump;
1978df8bae1dSRodney W. Grimes 	struct buf *bp;
1979df8bae1dSRodney W. Grimes 	struct vnode *vp;
1980d79ff54bSChuck Silvers 	daddr_t dbn;
1981f576a00dSSemen Ustimenko 	int error;
1982df8bae1dSRodney W. Grimes 
1983f16c26b1SKonstantin Belousov 	MPASS((ffs_flags & (FFSV_REPLACE | FFSV_REPLACE_DOOMED)) == 0 ||
1984f16c26b1SKonstantin Belousov 	    (flags & LK_EXCLUSIVE) != 0);
198516040222SKonstantin Belousov 
198651f5ce0cSPoul-Henning Kamp 	error = vfs_hash_get(mp, ino, flags, curthread, vpp, NULL, NULL);
198716040222SKonstantin Belousov 	if (error != 0)
198814bc0685SPoul-Henning Kamp 		return (error);
198916040222SKonstantin Belousov 	if (*vpp != NULL) {
1990f16c26b1SKonstantin Belousov 		if ((ffs_flags & FFSV_REPLACE) == 0 ||
1991f16c26b1SKonstantin Belousov 		    ((ffs_flags & FFSV_REPLACE_DOOMED) == 0 ||
1992f16c26b1SKonstantin Belousov 		    !VN_IS_DOOMED(*vpp)))
199316040222SKonstantin Belousov 			return (0);
199416040222SKonstantin Belousov 		vgone(*vpp);
199516040222SKonstantin Belousov 		vput(*vpp);
199616040222SKonstantin Belousov 	}
1997f576a00dSSemen Ustimenko 
1998f576a00dSSemen Ustimenko 	/*
1999d6919865SJeff Roberson 	 * We must promote to an exclusive lock for vnode creation.  This
2000d6919865SJeff Roberson 	 * can happen if lookup is passed LOCKSHARED.
2001d6919865SJeff Roberson 	 */
2002d6919865SJeff Roberson 	if ((flags & LK_TYPE_MASK) == LK_SHARED) {
2003d6919865SJeff Roberson 		flags &= ~LK_TYPE_MASK;
2004d6919865SJeff Roberson 		flags |= LK_EXCLUSIVE;
2005d6919865SJeff Roberson 	}
2006d6919865SJeff Roberson 
2007d6919865SJeff Roberson 	/*
200813866b3fSSemen Ustimenko 	 * We do not lock vnode creation as it is believed to be too
2009f576a00dSSemen Ustimenko 	 * expensive for such rare case as simultaneous creation of vnode
2010f576a00dSSemen Ustimenko 	 * for same ino by different processes. We just allow them to race
2011f576a00dSSemen Ustimenko 	 * and check later to decide who wins. Let the race begin!
2012f576a00dSSemen Ustimenko 	 */
201314bc0685SPoul-Henning Kamp 
201414bc0685SPoul-Henning Kamp 	ump = VFSTOUFS(mp);
201514bc0685SPoul-Henning Kamp 	fs = ump->um_fs;
20169d5a594fSMateusz Guzik 	ip = uma_zalloc_smr(uma_inode, M_WAITOK | M_ZERO);
20172f9bae59SDavid Greenman 
2018df8bae1dSRodney W. Grimes 	/* Allocate a new vnode/inode. */
201943a993bbSKirk McKusick 	error = getnewvnode("ufs", mp, fs->fs_magic == FS_UFS1_MAGIC ?
202043a993bbSKirk McKusick 	    &ffs_vnodeops1 : &ffs_vnodeops2, &vp);
2021c9671602SPoul-Henning Kamp 	if (error) {
2022df8bae1dSRodney W. Grimes 		*vpp = NULL;
20239d5a594fSMateusz Guzik 		uma_zfree_smr(uma_inode, ip);
2024df8bae1dSRodney W. Grimes 		return (error);
2025df8bae1dSRodney W. Grimes 	}
202667e87166SBoris Popov 	/*
202733fc3625SJohn Baldwin 	 * FFS supports recursive locking.
202867e87166SBoris Popov 	 */
20293634d5b2SJohn Baldwin 	lockmgr(vp->v_vnlock, LK_EXCLUSIVE, NULL);
2030628f51d2SAttilio Rao 	VN_LOCK_AREC(vp);
2031df8bae1dSRodney W. Grimes 	vp->v_data = ip;
20325d9d81e7SPoul-Henning Kamp 	vp->v_bufobj.bo_bsize = fs->fs_bsize;
2033df8bae1dSRodney W. Grimes 	ip->i_vnode = vp;
20341c85e6a3SKirk McKusick 	ip->i_ump = ump;
2035df8bae1dSRodney W. Grimes 	ip->i_number = ino;
2036e65f5a4eSKonstantin Belousov 	ip->i_ea_refs = 0;
203774a87c38SKirk McKusick 	ip->i_nextclustercg = -1;
2038e1db6897SKonstantin Belousov 	ip->i_flag = fs->fs_magic == FS_UFS1_MAGIC ? 0 : IN_UFS2;
203972d28f97SKirk McKusick 	ip->i_mode = 0; /* ensure error cases below throw away vnode */
20402bfd8992SKonstantin Belousov 	cluster_init_vn(&ip->i_clusterw);
204161846fc4SKonstantin Belousov #ifdef DIAGNOSTIC
204261846fc4SKonstantin Belousov 	ufs_init_trackers(ip);
204361846fc4SKonstantin Belousov #endif
2044df8bae1dSRodney W. Grimes #ifdef QUOTA
2045c1d9efcbSPoul-Henning Kamp 	{
2046c1d9efcbSPoul-Henning Kamp 		int i;
2047df8bae1dSRodney W. Grimes 		for (i = 0; i < MAXQUOTAS; i++)
2048df8bae1dSRodney W. Grimes 			ip->i_dquot[i] = NODQUOT;
2049c1d9efcbSPoul-Henning Kamp 	}
2050df8bae1dSRodney W. Grimes #endif
2051df8bae1dSRodney W. Grimes 
20527b7ed832SKonstantin Belousov 	if (ffs_flags & FFSV_FORCEINSMQ)
20537b7ed832SKonstantin Belousov 		vp->v_vflag |= VV_FORCEINSMQ;
205461b9d89fSTor Egge 	error = insmntque(vp, mp);
205561b9d89fSTor Egge 	if (error != 0) {
20569d5a594fSMateusz Guzik 		uma_zfree_smr(uma_inode, ip);
205761b9d89fSTor Egge 		*vpp = NULL;
205861b9d89fSTor Egge 		return (error);
205961b9d89fSTor Egge 	}
20607b7ed832SKonstantin Belousov 	vp->v_vflag &= ~VV_FORCEINSMQ;
2061a80d8caaSPawel Jakub Dawidek 	error = vfs_hash_insert(vp, ino, flags, curthread, vpp, NULL, NULL);
206216040222SKonstantin Belousov 	if (error != 0)
2063f576a00dSSemen Ustimenko 		return (error);
206416040222SKonstantin Belousov 	if (*vpp != NULL) {
206516040222SKonstantin Belousov 		/*
206616040222SKonstantin Belousov 		 * Calls from ffs_valloc() (i.e. FFSV_REPLACE set)
206716040222SKonstantin Belousov 		 * operate on empty inode, which must not be found by
206816040222SKonstantin Belousov 		 * other threads until fully filled.  Vnode for empty
206916040222SKonstantin Belousov 		 * inode must be not re-inserted on the hash by other
207016040222SKonstantin Belousov 		 * thread, after removal by us at the beginning.
207116040222SKonstantin Belousov 		 */
207216040222SKonstantin Belousov 		MPASS((ffs_flags & FFSV_REPLACE) == 0);
207316040222SKonstantin Belousov 		return (0);
207416040222SKonstantin Belousov 	}
2075f576a00dSSemen Ustimenko 
2076df8bae1dSRodney W. Grimes 	/* Read in the disk contents for the inode, copy into the inode. */
2077d79ff54bSChuck Silvers 	dbn = fsbtodb(fs, ino_to_fsba(fs, ino));
2078d79ff54bSChuck Silvers 	error = ffs_breadz(ump, ump->um_devvp, dbn, dbn, (int)fs->fs_bsize,
2079d79ff54bSChuck Silvers 	    NULL, NULL, 0, NOCRED, 0, NULL, &bp);
2080d79ff54bSChuck Silvers 	if (error != 0) {
2081df8bae1dSRodney W. Grimes 		/*
2082df8bae1dSRodney W. Grimes 		 * The inode does not contain anything useful, so it would
2083df8bae1dSRodney W. Grimes 		 * be misleading to leave it on its hash chain. With mode
2084df8bae1dSRodney W. Grimes 		 * still zero, it will be unlinked and returned to the free
2085df8bae1dSRodney W. Grimes 		 * list by vput().
2086df8bae1dSRodney W. Grimes 		 */
20876c44a3e0SMateusz Guzik 		vgone(vp);
2088bd7e5f99SJohn Dyson 		vput(vp);
2089df8bae1dSRodney W. Grimes 		*vpp = NULL;
2090df8bae1dSRodney W. Grimes 		return (error);
2091df8bae1dSRodney W. Grimes 	}
2092e1db6897SKonstantin Belousov 	if (I_IS_UFS1(ip))
2093a163d034SWarner Losh 		ip->i_din1 = uma_zalloc(uma_ufs1, M_WAITOK);
2094de6ba7c0SPoul-Henning Kamp 	else
2095a163d034SWarner Losh 		ip->i_din2 = uma_zalloc(uma_ufs2, M_WAITOK);
20969fc5d538SKirk McKusick 	if ((error = ffs_load_inode(bp, ip, fs, ino)) != 0) {
20979fc5d538SKirk McKusick 		bqrelse(bp);
20986c44a3e0SMateusz Guzik 		vgone(vp);
20999fc5d538SKirk McKusick 		vput(vp);
21009fc5d538SKirk McKusick 		*vpp = NULL;
21019fc5d538SKirk McKusick 		return (error);
21029fc5d538SKirk McKusick 	}
2103fd97fa64SKonstantin Belousov 	if (DOINGSOFTDEP(vp) && (!fs->fs_ronly ||
2104fd97fa64SKonstantin Belousov 	    (ffs_flags & FFSV_FORCEINODEDEP) != 0))
2105b1897c19SJulian Elischer 		softdep_load_inodeblock(ip);
2106b1897c19SJulian Elischer 	else
2107b1897c19SJulian Elischer 		ip->i_effnlink = ip->i_nlink;
2108bd7e5f99SJohn Dyson 	bqrelse(bp);
2109df8bae1dSRodney W. Grimes 
2110df8bae1dSRodney W. Grimes 	/*
2111df8bae1dSRodney W. Grimes 	 * Initialize the vnode from the inode, check for aliases.
2112df8bae1dSRodney W. Grimes 	 * Note that the underlying vnode may have changed.
2113df8bae1dSRodney W. Grimes 	 */
2114e1db6897SKonstantin Belousov 	error = ufs_vinit(mp, I_IS_UFS1(ip) ? &ffs_fifoops1 : &ffs_fifoops2,
2115e1db6897SKonstantin Belousov 	    &vp);
2116c9671602SPoul-Henning Kamp 	if (error) {
21176c44a3e0SMateusz Guzik 		vgone(vp);
2118df8bae1dSRodney W. Grimes 		vput(vp);
2119df8bae1dSRodney W. Grimes 		*vpp = NULL;
2120df8bae1dSRodney W. Grimes 		return (error);
2121df8bae1dSRodney W. Grimes 	}
2122de68347bSPoul-Henning Kamp 
2123df8bae1dSRodney W. Grimes 	/*
21245c24d6eeSPoul-Henning Kamp 	 * Finish inode initialization.
2125df8bae1dSRodney W. Grimes 	 */
212633fc3625SJohn Baldwin 	if (vp->v_type != VFIFO) {
212733fc3625SJohn Baldwin 		/* FFS supports shared locking for all files except fifos. */
212833fc3625SJohn Baldwin 		VN_LOCK_ASHARE(vp);
212933fc3625SJohn Baldwin 	}
2130de68347bSPoul-Henning Kamp 
2131df8bae1dSRodney W. Grimes 	/*
2132df8bae1dSRodney W. Grimes 	 * Set up a generation number for this inode if it does not
2133df8bae1dSRodney W. Grimes 	 * already have one. This should only happen on old filesystems.
2134df8bae1dSRodney W. Grimes 	 */
2135df8bae1dSRodney W. Grimes 	if (ip->i_gen == 0) {
213657d2ac2fSKevin Lo 		while (ip->i_gen == 0)
213757d2ac2fSKevin Lo 			ip->i_gen = arc4random();
21381c85e6a3SKirk McKusick 		if ((vp->v_mount->mnt_flag & MNT_RDONLY) == 0) {
2139ac4ec141SMateusz Guzik 			UFS_INODE_SET_FLAG(ip, IN_MODIFIED);
2140b403319bSAlexander Kabaev 			DIP_SET(ip, i_gen, ip->i_gen);
21411c85e6a3SKirk McKusick 		}
2142df8bae1dSRodney W. Grimes 	}
2143763bbd2fSRobert Watson #ifdef MAC
2144763bbd2fSRobert Watson 	if ((mp->mnt_flag & MNT_MULTILABEL) && ip->i_mode) {
2145763bbd2fSRobert Watson 		/*
2146763bbd2fSRobert Watson 		 * If this vnode is already allocated, and we're running
2147763bbd2fSRobert Watson 		 * multi-label, attempt to perform a label association
2148763bbd2fSRobert Watson 		 * from the extended attributes on the inode.
2149763bbd2fSRobert Watson 		 */
215030d239bcSRobert Watson 		error = mac_vnode_associate_extattr(mp, vp);
2151763bbd2fSRobert Watson 		if (error) {
2152763bbd2fSRobert Watson 			/* ufs_inactive will release ip->i_devvp ref. */
21536c44a3e0SMateusz Guzik 			vgone(vp);
2154763bbd2fSRobert Watson 			vput(vp);
2155763bbd2fSRobert Watson 			*vpp = NULL;
2156763bbd2fSRobert Watson 			return (error);
2157763bbd2fSRobert Watson 		}
2158763bbd2fSRobert Watson 	}
2159763bbd2fSRobert Watson #endif
2160763bbd2fSRobert Watson 
2161df8bae1dSRodney W. Grimes 	*vpp = vp;
2162df8bae1dSRodney W. Grimes 	return (0);
2163df8bae1dSRodney W. Grimes }
2164df8bae1dSRodney W. Grimes 
2165df8bae1dSRodney W. Grimes /*
2166df8bae1dSRodney W. Grimes  * File handle to vnode
2167df8bae1dSRodney W. Grimes  *
2168df8bae1dSRodney W. Grimes  * Have to be really careful about stale file handles:
2169df8bae1dSRodney W. Grimes  * - check that the inode number is valid
2170abe53f7eSKirk McKusick  * - for UFS2 check that the inode number is initialized
2171df8bae1dSRodney W. Grimes  * - call ffs_vget() to get the locked inode
2172df8bae1dSRodney W. Grimes  * - check for an unallocated inode (i_mode == 0)
2173df8bae1dSRodney W. Grimes  * - check that the given client host has export rights and return
2174df8bae1dSRodney W. Grimes  *   those rights via. exflagsp and credanonp
2175df8bae1dSRodney W. Grimes  */
2176adf41577SPoul-Henning Kamp static int
2177694a586aSRick Macklem ffs_fhtovp(mp, fhp, flags, vpp)
217805f4ff5dSPoul-Henning Kamp 	struct mount *mp;
2179df8bae1dSRodney W. Grimes 	struct fid *fhp;
2180694a586aSRick Macklem 	int flags;
2181df8bae1dSRodney W. Grimes 	struct vnode **vpp;
2182df8bae1dSRodney W. Grimes {
218305f4ff5dSPoul-Henning Kamp 	struct ufid *ufhp;
21845952c86cSKonstantin Belousov 
21855952c86cSKonstantin Belousov 	ufhp = (struct ufid *)fhp;
21865952c86cSKonstantin Belousov 	return (ffs_inotovp(mp, ufhp->ufid_ino, ufhp->ufid_gen, flags,
21875952c86cSKonstantin Belousov 	    vpp, 0));
21885952c86cSKonstantin Belousov }
21895952c86cSKonstantin Belousov 
21905952c86cSKonstantin Belousov int
21915952c86cSKonstantin Belousov ffs_inotovp(mp, ino, gen, lflags, vpp, ffs_flags)
21925952c86cSKonstantin Belousov 	struct mount *mp;
21935952c86cSKonstantin Belousov 	ino_t ino;
21945952c86cSKonstantin Belousov 	u_int64_t gen;
21955952c86cSKonstantin Belousov 	int lflags;
21965952c86cSKonstantin Belousov 	struct vnode **vpp;
21975952c86cSKonstantin Belousov 	int ffs_flags;
21985952c86cSKonstantin Belousov {
2199abe53f7eSKirk McKusick 	struct ufsmount *ump;
22005952c86cSKonstantin Belousov 	struct vnode *nvp;
220189fd61d9SKonstantin Belousov 	struct inode *ip;
2202df8bae1dSRodney W. Grimes 	struct fs *fs;
2203abe53f7eSKirk McKusick 	struct cg *cgp;
2204abe53f7eSKirk McKusick 	struct buf *bp;
2205abe53f7eSKirk McKusick 	u_int cg;
2206abe53f7eSKirk McKusick 	int error;
2207df8bae1dSRodney W. Grimes 
2208abe53f7eSKirk McKusick 	ump = VFSTOUFS(mp);
2209abe53f7eSKirk McKusick 	fs = ump->um_fs;
221089fd61d9SKonstantin Belousov 	*vpp = NULL;
221189fd61d9SKonstantin Belousov 
22121dc349abSEd Maste 	if (ino < UFS_ROOTINO || ino >= fs->fs_ncg * fs->fs_ipg)
2213df8bae1dSRodney W. Grimes 		return (ESTALE);
22145952c86cSKonstantin Belousov 
2215abe53f7eSKirk McKusick 	/*
2216abe53f7eSKirk McKusick 	 * Need to check if inode is initialized because UFS2 does lazy
2217abe53f7eSKirk McKusick 	 * initialization and nfs_fhtovp can offer arbitrary inode numbers.
2218abe53f7eSKirk McKusick 	 */
22195952c86cSKonstantin Belousov 	if (fs->fs_magic == FS_UFS2_MAGIC) {
2220abe53f7eSKirk McKusick 		cg = ino_to_cg(fs, ino);
22215952c86cSKonstantin Belousov 		error = ffs_getcg(fs, ump->um_devvp, cg, 0, &bp, &cgp);
22225952c86cSKonstantin Belousov 		if (error != 0)
2223abe53f7eSKirk McKusick 			return (error);
22249c4f551eSKirk McKusick 		if (ino >= cg * fs->fs_ipg + cgp->cg_initediblk) {
2225abe53f7eSKirk McKusick 			brelse(bp);
2226abe53f7eSKirk McKusick 			return (ESTALE);
2227abe53f7eSKirk McKusick 		}
2228abe53f7eSKirk McKusick 		brelse(bp);
22295952c86cSKonstantin Belousov 	}
22305952c86cSKonstantin Belousov 
22315952c86cSKonstantin Belousov 	error = ffs_vgetf(mp, ino, lflags, &nvp, ffs_flags);
223289fd61d9SKonstantin Belousov 	if (error != 0)
22335952c86cSKonstantin Belousov 		return (error);
223489fd61d9SKonstantin Belousov 
223589fd61d9SKonstantin Belousov 	ip = VTOI(nvp);
223689fd61d9SKonstantin Belousov 	if (ip->i_mode == 0 || ip->i_gen != gen || ip->i_effnlink <= 0) {
223789fd61d9SKonstantin Belousov 		if (ip->i_mode == 0)
223889fd61d9SKonstantin Belousov 			vgone(nvp);
223989fd61d9SKonstantin Belousov 		vput(nvp);
224089fd61d9SKonstantin Belousov 		return (ESTALE);
224189fd61d9SKonstantin Belousov 	}
224289fd61d9SKonstantin Belousov 
224389fd61d9SKonstantin Belousov 	vnode_create_vobject(nvp, DIP(ip, i_size), curthread);
224489fd61d9SKonstantin Belousov 	*vpp = nvp;
224589fd61d9SKonstantin Belousov 	return (0);
2246df8bae1dSRodney W. Grimes }
2247df8bae1dSRodney W. Grimes 
/*
 * Initialize the filesystem: set up the suspension and soft updates
 * support, then return the result of ufs_init().
 */
static int
ffs_init(struct vfsconf *vfsp)
{

	ffs_susp_initialize();
	softdep_initialize();
	return (ufs_init(vfsp));
}
2260996c772fSJohn Dyson 
2261996c772fSJohn Dyson /*
22625346934fSIan Dowse  * Undo the work of ffs_init().
22635346934fSIan Dowse  */
22645346934fSIan Dowse static int
22655346934fSIan Dowse ffs_uninit(vfsp)
22665346934fSIan Dowse 	struct vfsconf *vfsp;
22675346934fSIan Dowse {
22685346934fSIan Dowse 	int ret;
22695346934fSIan Dowse 
22705346934fSIan Dowse 	ret = ufs_uninit(vfsp);
22715346934fSIan Dowse 	softdep_uninitialize();
22721848286aSEdward Tomasz Napierala 	ffs_susp_uninitialize();
2273d79ff54bSChuck Silvers 	taskqueue_drain_all(taskqueue_thread);
22745346934fSIan Dowse 	return (ret);
22755346934fSIan Dowse }
22765346934fSIan Dowse 
/*
 * Context handed from ffs_sbupdate() to its write helper
 * ffs_use_bwrite().
 */
struct devfd {
	struct ufsmount	*ump;		/* mount being updated */
	struct buf	*sbbp;		/* buffer obtained for the superblock */
	int		 waitfor;	/* MNT_WAIT: bwrite(), else bawrite() */
	int		 suspended;	/* non-zero: tag bufs B_VALIDSUSPWRT */
	int		 error;		/* error recorded by the helper */
};
2288dffce215SKirk McKusick 
2289dffce215SKirk McKusick /*
2290df8bae1dSRodney W. Grimes  * Write a superblock and associated information back to disk.
2291df8bae1dSRodney W. Grimes  */
22921a60c7fcSPawel Jakub Dawidek int
2293927a12aeSKirk McKusick ffs_sbupdate(ump, waitfor, suspended)
2294927a12aeSKirk McKusick 	struct ufsmount *ump;
2295df8bae1dSRodney W. Grimes 	int waitfor;
2296791dd2faSTor Egge 	int suspended;
2297df8bae1dSRodney W. Grimes {
2298dffce215SKirk McKusick 	struct fs *fs;
22993ba649d7SJeff Roberson 	struct buf *sbbp;
2300dffce215SKirk McKusick 	struct devfd devfd;
2301df8bae1dSRodney W. Grimes 
2302dffce215SKirk McKusick 	fs = ump->um_fs;
230374f3809aSKirk McKusick 	if (fs->fs_ronly == 1 &&
2304927a12aeSKirk McKusick 	    (ump->um_mountp->mnt_flag & (MNT_RDONLY | MNT_UPDATE)) !=
2305927a12aeSKirk McKusick 	    (MNT_RDONLY | MNT_UPDATE) && ump->um_fsckpid == 0)
230674f3809aSKirk McKusick 		panic("ffs_sbupdate: write read-only filesystem");
2307996c772fSJohn Dyson 	/*
23083ba649d7SJeff Roberson 	 * We use the superblock's buf to serialize calls to ffs_sbupdate().
23093ba649d7SJeff Roberson 	 */
2310927a12aeSKirk McKusick 	sbbp = getblk(ump->um_devvp, btodb(fs->fs_sblockloc),
2311927a12aeSKirk McKusick 	    (int)fs->fs_sbsize, 0, 0, 0);
23123ba649d7SJeff Roberson 	/*
2313dffce215SKirk McKusick 	 * Initialize info needed for write function.
2314996c772fSJohn Dyson 	 */
2315dffce215SKirk McKusick 	devfd.ump = ump;
2316dffce215SKirk McKusick 	devfd.sbbp = sbbp;
2317dffce215SKirk McKusick 	devfd.waitfor = waitfor;
2318dffce215SKirk McKusick 	devfd.suspended = suspended;
2319dffce215SKirk McKusick 	devfd.error = 0;
2320dffce215SKirk McKusick 	return (ffs_sbput(&devfd, fs, fs->fs_sblockloc, ffs_use_bwrite));
2321dffce215SKirk McKusick }
2322dffce215SKirk McKusick 
2323dffce215SKirk McKusick /*
2324dffce215SKirk McKusick  * Write function for use by filesystem-layer routines.
2325dffce215SKirk McKusick  */
2326dffce215SKirk McKusick static int
2327dffce215SKirk McKusick ffs_use_bwrite(void *devfd, off_t loc, void *buf, int size)
2328dffce215SKirk McKusick {
2329dffce215SKirk McKusick 	struct devfd *devfdp;
2330dffce215SKirk McKusick 	struct ufsmount *ump;
2331dffce215SKirk McKusick 	struct buf *bp;
2332dffce215SKirk McKusick 	struct fs *fs;
2333dffce215SKirk McKusick 	int error;
2334dffce215SKirk McKusick 
2335dffce215SKirk McKusick 	devfdp = devfd;
2336dffce215SKirk McKusick 	ump = devfdp->ump;
2337dffce215SKirk McKusick 	fs = ump->um_fs;
2338dffce215SKirk McKusick 	/*
2339dffce215SKirk McKusick 	 * Writing the superblock summary information.
2340dffce215SKirk McKusick 	 */
2341dffce215SKirk McKusick 	if (loc != fs->fs_sblockloc) {
2342dffce215SKirk McKusick 		bp = getblk(ump->um_devvp, btodb(loc), size, 0, 0, 0);
2343dffce215SKirk McKusick 		bcopy(buf, bp->b_data, (u_int)size);
2344dffce215SKirk McKusick 		if (devfdp->suspended)
2345791dd2faSTor Egge 			bp->b_flags |= B_VALIDSUSPWRT;
2346dffce215SKirk McKusick 		if (devfdp->waitfor != MNT_WAIT)
2347df8bae1dSRodney W. Grimes 			bawrite(bp);
23488aef1712SMatthew Dillon 		else if ((error = bwrite(bp)) != 0)
2349dffce215SKirk McKusick 			devfdp->error = error;
2350dffce215SKirk McKusick 		return (0);
2351df8bae1dSRodney W. Grimes 	}
2352996c772fSJohn Dyson 	/*
2353dffce215SKirk McKusick 	 * Writing the superblock itself. We need to do special checks for it.
2354996c772fSJohn Dyson 	 */
2355dffce215SKirk McKusick 	bp = devfdp->sbbp;
2356d79ff54bSChuck Silvers 	if (ffs_fsfail_cleanup(ump, devfdp->error))
2357d79ff54bSChuck Silvers 		devfdp->error = 0;
2358dffce215SKirk McKusick 	if (devfdp->error != 0) {
2359dffce215SKirk McKusick 		brelse(bp);
2360dffce215SKirk McKusick 		return (devfdp->error);
23613ba649d7SJeff Roberson 	}
236231574422SKirk McKusick 	if (fs->fs_magic == FS_UFS1_MAGIC && fs->fs_sblockloc != SBLOCK_UFS1 &&
2363e9838c11SJohn-Mark Gurney 	    (fs->fs_old_flags & FS_FLAGS_UPDATED) == 0) {
2364b60ee81eSKirk McKusick 		printf("WARNING: %s: correcting fs_sblockloc from %jd to %d\n",
2365fa5d33e2SKirk McKusick 		    fs->fs_fsmnt, fs->fs_sblockloc, SBLOCK_UFS1);
2366fa5d33e2SKirk McKusick 		fs->fs_sblockloc = SBLOCK_UFS1;
2367fa5d33e2SKirk McKusick 	}
236831574422SKirk McKusick 	if (fs->fs_magic == FS_UFS2_MAGIC && fs->fs_sblockloc != SBLOCK_UFS2 &&
2369e9838c11SJohn-Mark Gurney 	    (fs->fs_old_flags & FS_FLAGS_UPDATED) == 0) {
2370b60ee81eSKirk McKusick 		printf("WARNING: %s: correcting fs_sblockloc from %jd to %d\n",
2371fa5d33e2SKirk McKusick 		    fs->fs_fsmnt, fs->fs_sblockloc, SBLOCK_UFS2);
2372fa5d33e2SKirk McKusick 		fs->fs_sblockloc = SBLOCK_UFS2;
2373fa5d33e2SKirk McKusick 	}
2374519e3c3bSKirk McKusick 	if (MOUNTEDSOFTDEP(ump->um_mountp))
2375927a12aeSKirk McKusick 		softdep_setup_sbupdate(ump, (struct fs *)bp->b_data, bp);
2376996c772fSJohn Dyson 	bcopy((caddr_t)fs, bp->b_data, (u_int)fs->fs_sbsize);
23779454b4fdSKirk McKusick 	fs = (struct fs *)bp->b_data;
23789454b4fdSKirk McKusick 	ffs_oldfscompat_write(fs, ump);
237993440bbeSKirk McKusick 	fs->fs_si = NULL;
238034816cb9SKirk McKusick 	/* Recalculate the superblock hash */
23819454b4fdSKirk McKusick 	fs->fs_ckhash = ffs_calc_sbhash(fs);
2382dffce215SKirk McKusick 	if (devfdp->suspended)
2383791dd2faSTor Egge 		bp->b_flags |= B_VALIDSUSPWRT;
2384dffce215SKirk McKusick 	if (devfdp->waitfor != MNT_WAIT)
2385996c772fSJohn Dyson 		bawrite(bp);
23868aef1712SMatthew Dillon 	else if ((error = bwrite(bp)) != 0)
2387dffce215SKirk McKusick 		devfdp->error = error;
2388dffce215SKirk McKusick 	return (devfdp->error);
2389df8bae1dSRodney W. Grimes }
2390d6fe88e4SPoul-Henning Kamp 
/*
 * Extended attribute control entry point.
 *
 * The request is passed through unchanged to ufs_extattrctl() when the
 * kernel is built with UFS_EXTATTR, and to vfs_stdextattrctl() otherwise.
 * The value returned by that routine is returned to the caller.
 */
static int
ffs_extattrctl(struct mount *mp, int cmd, struct vnode *filename_vp,
	int attrnamespace, const char *attrname)
{
	int result;

#ifdef UFS_EXTATTR
	result = ufs_extattrctl(mp, cmd, filename_vp, attrnamespace,
	    attrname);
#else
	result = vfs_stdextattrctl(mp, cmd, filename_vp, attrnamespace,
	    attrname);
#endif
	return (result);
}
2404975512a9SPoul-Henning Kamp 
2405975512a9SPoul-Henning Kamp static void
2406975512a9SPoul-Henning Kamp ffs_ifree(struct ufsmount *ump, struct inode *ip)
2407975512a9SPoul-Henning Kamp {
2408975512a9SPoul-Henning Kamp 
240936329289STim J. Robbins 	if (ump->um_fstype == UFS1 && ip->i_din1 != NULL)
2410aa4d7a8aSPoul-Henning Kamp 		uma_zfree(uma_ufs1, ip->i_din1);
241136329289STim J. Robbins 	else if (ip->i_din2 != NULL)
24128d721e87STim J. Robbins 		uma_zfree(uma_ufs2, ip->i_din2);
24139d5a594fSMateusz Guzik 	uma_zfree_smr(uma_inode, ip);
2414975512a9SPoul-Henning Kamp }
24156e77a041SPoul-Henning Kamp 
2416dd19a799SPoul-Henning Kamp static int dobkgrdwrite = 1;
2417dd19a799SPoul-Henning Kamp SYSCTL_INT(_debug, OID_AUTO, dobkgrdwrite, CTLFLAG_RW, &dobkgrdwrite, 0,
2418dd19a799SPoul-Henning Kamp     "Do background writes (honoring the BV_BKGRDWRITE flag)?");
2419dd19a799SPoul-Henning Kamp 
/*
 * Complete a background write started from bwrite.
 *
 * This is the b_iodone handler that ffs_bufwrite() installs on the copy
 * of a buffer that it writes in the background.  bp is that copy.  The
 * buffer it was copied from is looked up in the same bufobj by logical
 * block number and is called origbp below.
 *
 * The handler records a write failure on origbp (BV_BKGRDERR), hands
 * remaining dependencies back to origbp, disposes of the copy, and
 * finally clears BV_BKGRDINPROG on origbp, waking any thread that is
 * waiting in ffs_bufwrite() for the background write to finish.
 */
static void
ffs_backgroundwritedone(struct buf *bp)
{
	struct bufobj *bufobj;
	struct buf *origbp;

#ifdef SOFTUPDATES
	/*
	 * Hand a failed write that still has dependencies attached to
	 * soft updates.  NOTE(review): BIO_ERROR is re-tested after this
	 * call rather than cached, presumably because the handler may
	 * change it; confirm in ffs_softdep.c.
	 */
	if (!LIST_EMPTY(&bp->b_dep) && (bp->b_ioflags & BIO_ERROR) != 0)
		softdep_handle_error(bp);
#endif

	/*
	 * Find the original buffer that we are writing.
	 * The bufobj pointer is saved in a local because it is needed
	 * again after pbrelvp() has been called on bp below.
	 */
	bufobj = bp->b_bufobj;
	BO_LOCK(bufobj);
	if ((origbp = gbincore(bp->b_bufobj, bp->b_lblkno)) == NULL)
		panic("backgroundwritedone: lost buffer");

	/*
	 * We should mark the cylinder group buffer origbp as
	 * dirty, to not lose the failed write.
	 */
	if ((bp->b_ioflags & BIO_ERROR) != 0)
		origbp->b_vflags |= BV_BKGRDERR;
	BO_UNLOCK(bufobj);
	/*
	 * Process dependencies then return any unfinished ones.
	 * Dependencies are only completed when the write succeeded.
	 */
	if (!LIST_EMPTY(&bp->b_dep) && (bp->b_ioflags & BIO_ERROR) == 0)
		buf_complete(bp);
#ifdef SOFTUPDATES
	if (!LIST_EMPTY(&bp->b_dep))
		softdep_move_dependencies(bp, origbp);
#endif
	/*
	 * This buffer is marked B_NOCACHE so when it is released
	 * by biodone it will be tossed.  Clear B_IOSTARTED in case of error.
	 */
	bp->b_flags |= B_NOCACHE;
	bp->b_flags &= ~(B_CACHE | B_IOSTARTED);
	pbrelvp(bp);

	/*
	 * Prevent brelse() from trying to keep and re-dirtying bp on
	 * errors. It causes b_bufobj dereference in
	 * bdirty()/reassignbuf(), and b_bufobj was cleared in
	 * pbrelvp() above.
	 */
	if ((bp->b_ioflags & BIO_ERROR) != 0)
		bp->b_flags |= B_INVAL;
	bufdone(bp);
	BO_LOCK(bufobj);
	/*
	 * Clear the BV_BKGRDINPROG flag in the original buffer
	 * and awaken it if it is waiting for the write to complete.
	 * If BV_BKGRDINPROG is not set in the original buffer it must
	 * have been released and re-instantiated - which is not legal.
	 */
	KASSERT((origbp->b_vflags & BV_BKGRDINPROG),
	    ("backgroundwritedone: lost buffer2"));
	origbp->b_vflags &= ~BV_BKGRDINPROG;
	if (origbp->b_vflags & BV_BKGRDWAIT) {
		origbp->b_vflags &= ~BV_BKGRDWAIT;
		/* Same wait channel that ffs_bufwrite() sleeps on. */
		wakeup(&origbp->b_xflags);
	}
	BO_UNLOCK(bufobj);
}
2491dd19a799SPoul-Henning Kamp 
/*
 * Write, release buffer on completion.  (Done by iodone
 * if async).  Do not bother writing anything if the buffer
 * is invalid.
 *
 * Note that we set B_CACHE here, indicating that buffer is
 * fully valid and thus cacheable.  This is true even of NFS
 * now so we set it generally.  This could be set either here
 * or in biodone() since the I/O is synchronous.  We put it
 * here.
 *
 * bp must be locked by the caller; the function panics otherwise.
 *
 * When background writes are enabled and bp is an asynchronous
 * BX_BKGRDWRITE buffer, the contents are copied to a fresh buffer and
 * the copy is written instead, with ffs_backgroundwritedone() as its
 * completion handler.  Otherwise bp itself is written.
 *
 * Returns 0 when the buffer was invalid and simply released, or when an
 * asynchronous write was turned into a delayed write because a
 * background write of the same buffer is still in progress.  Otherwise
 * returns the result of bufwrite().
 */
static int
ffs_bufwrite(struct buf *bp)
{
	struct buf *newbp;
	struct cg *cgp;

	CTR3(KTR_BUF, "bufwrite(%p) vp %p flags %X", bp, bp->b_vp, bp->b_flags);
	if (bp->b_flags & B_INVAL) {
		brelse(bp);
		return (0);
	}

	if (!BUF_ISLOCKED(bp))
		panic("bufwrite: buffer is not busy???");
	/*
	 * If a background write is already in progress, delay
	 * writing this block if it is asynchronous. Otherwise
	 * wait for the background write to complete.
	 */
	BO_LOCK(bp->b_bufobj);
	if (bp->b_vflags & BV_BKGRDINPROG) {
		if (bp->b_flags & B_ASYNC) {
			BO_UNLOCK(bp->b_bufobj);
			bdwrite(bp);
			return (0);
		}
		/*
		 * Sleep on &bp->b_xflags; ffs_backgroundwritedone()
		 * clears BV_BKGRDINPROG and issues the matching wakeup.
		 */
		bp->b_vflags |= BV_BKGRDWAIT;
		msleep(&bp->b_xflags, BO_LOCKPTR(bp->b_bufobj), PRIBIO,
		    "bwrbg", 0);
		if (bp->b_vflags & BV_BKGRDINPROG)
			panic("bufwrite: still writing");
	}
	/* Forget the error left behind by an earlier background write. */
	bp->b_vflags &= ~BV_BKGRDERR;
	BO_UNLOCK(bp->b_bufobj);

	/*
	 * If this buffer is marked for background writing and we
	 * do not have to wait for it, make a copy and write the
	 * copy so as to leave this buffer ready for further use.
	 *
	 * This optimization eats a lot of memory.  If we have a page
	 * or buffer shortfall we can't do it.
	 */
	if (dobkgrdwrite && (bp->b_xflags & BX_BKGRDWRITE) &&
	    (bp->b_flags & B_ASYNC) &&
	    !vm_page_count_severe() &&
	    !buf_dirty_count_severe()) {
		KASSERT(bp->b_iodone == NULL,
		    ("bufwrite: needs chained iodone (%p)", bp->b_iodone));

		/*
		 * get a new block
		 * If none is available, write bp itself; note that
		 * bundirty() is not called here on that path.
		 */
		newbp = geteblk(bp->b_bufsize, GB_NOWAIT_BD);
		if (newbp == NULL)
			goto normal_write;

		KASSERT(buf_mapped(bp), ("Unmapped cg"));
		memcpy(newbp->b_data, bp->b_data, bp->b_bufsize);
		BO_LOCK(bp->b_bufobj);
		bp->b_vflags |= BV_BKGRDINPROG;
		BO_UNLOCK(bp->b_bufobj);
		/*
		 * Give the copy the identity of the original: the same
		 * filesystem-private type flags, block numbers and
		 * offset, plus the marker that tags it as a background
		 * copy.
		 */
		newbp->b_xflags |=
		    (bp->b_xflags & BX_FSPRIV) | BX_BKGRDMARKER;
		newbp->b_lblkno = bp->b_lblkno;
		newbp->b_blkno = bp->b_blkno;
		newbp->b_offset = bp->b_offset;
		newbp->b_iodone = ffs_backgroundwritedone;
		newbp->b_flags |= B_ASYNC;
		newbp->b_flags &= ~B_INVAL;
		pbgetvp(bp->b_vp, newbp);

#ifdef SOFTUPDATES
		/*
		 * Move over the dependencies.  If there are rollbacks,
		 * leave the parent buffer dirtied as it will need to
		 * be written again.
		 */
		if (LIST_EMPTY(&bp->b_dep) ||
		    softdep_move_dependencies(bp, newbp) == 0)
			bundirty(bp);
#else
		bundirty(bp);
#endif

		/*
		 * Initiate write on the copy, release the original.  The
		 * BKGRDINPROG flag prevents it from going away until
		 * the background write completes. We have to recalculate
		 * its check hash in case the buffer gets freed and then
		 * reconstituted from the buffer cache during a later read.
		 */
		if ((bp->b_xflags & BX_CYLGRP) != 0) {
			cgp = (struct cg *)bp->b_data;
			/* The hash is computed with its own field zeroed. */
			cgp->cg_ckhash = 0;
			cgp->cg_ckhash =
			    calculate_crc32c(~0L, bp->b_data, bp->b_bcount);
		}
		bqrelse(bp);
		/* From here on bp is the copy that gets written. */
		bp = newbp;
	} else
		/* Mark the buffer clean */
		bundirty(bp);

	/* Let the normal bufwrite do the rest for us */
normal_write:
	/*
	 * If we are writing a cylinder group, update its time.
	 */
	if ((bp->b_xflags & BX_CYLGRP) != 0) {
		cgp = (struct cg *)bp->b_data;
		cgp->cg_old_time = cgp->cg_time = time_second;
	}
	return (bufwrite(bp));
}
2616dd19a799SPoul-Henning Kamp 
/*
 * Bufobj strategy routine for the device vnode underneath an FFS mount.
 *
 * For a write request it, in order:
 *  - panics if the buffer belongs to a vnode on a suspended mount and
 *    is not flagged B_VALIDSUSPWRT;
 *  - calls ffs_copyonwrite() when the device vnode has VV_COPYONWRITE
 *    set and si_snapdata attached, unless the buffer carries B_NOCOPY;
 *  - with SOFTUPDATES, calls buf_start() on every buffer that has a
 *    non-empty dependency list;
 *  - recomputes the check hash of a cylinder group buffer.
 * Any request other than a read is tagged BX_CVTENXIO when
 * ffs_enxio_enable is set.  Finally the request is handed to
 * g_vfs_strategy().
 *
 * If ffs_copyonwrite() fails with anything other than EOPNOTSUPP the
 * buffer is completed with that error and nothing is issued.
 */
static void
ffs_geom_strategy(struct bufobj *bo, struct buf *bp)
{
	struct vnode *vp;
	struct buf *tbp;
	int error, nocopy;

	/*
	 * This is the bufobj strategy for the private VCHR vnodes
	 * used by FFS to access the underlying storage device.
	 * We override the default bufobj strategy and thus bypass
	 * VOP_STRATEGY() for these vnodes.
	 */
	vp = bo2vnode(bo);
	KASSERT(bp->b_vp == NULL || bp->b_vp->v_type != VCHR ||
	    bp->b_vp->v_rdev == NULL ||
	    bp->b_vp->v_rdev->si_mountpt == NULL ||
	    VFSTOUFS(bp->b_vp->v_rdev->si_mountpt) == NULL ||
	    vp == VFSTOUFS(bp->b_vp->v_rdev->si_mountpt)->um_devvp,
	    ("ffs_geom_strategy() with wrong vp"));
	if (bp->b_iocmd == BIO_WRITE) {
		if ((bp->b_flags & B_VALIDSUSPWRT) == 0 &&
		    bp->b_vp != NULL && bp->b_vp->v_mount != NULL &&
		    (bp->b_vp->v_mount->mnt_kern_flag & MNTK_SUSPENDED) != 0)
			panic("ffs_geom_strategy: bad I/O");
		/*
		 * Remember B_NOCOPY, then strip both one-shot flags from
		 * the buffer before it is issued.
		 */
		nocopy = bp->b_flags & B_NOCOPY;
		bp->b_flags &= ~(B_VALIDSUSPWRT | B_NOCOPY);
		if ((vp->v_vflag & VV_COPYONWRITE) && nocopy == 0 &&
		    vp->v_rdev->si_snapdata != NULL) {
			if ((bp->b_flags & B_CLUSTER) != 0) {
				/*
				 * Drop this buffer's running-buffer
				 * accounting while the members of the
				 * cluster are processed; it is re-added
				 * after the loop.  The error exit leaves
				 * it dropped.
				 */
				runningbufwakeup(bp);
				TAILQ_FOREACH(tbp, &bp->b_cluster.cluster_head,
					      b_cluster.cluster_entry) {
					error = ffs_copyonwrite(vp, tbp);
					if (error != 0 &&
					    error != EOPNOTSUPP) {
						bp->b_error = error;
						bp->b_ioflags |= BIO_ERROR;
						bp->b_flags &= ~B_BARRIER;
						bufdone(bp);
						return;
					}
				}
				bp->b_runningbufspace = bp->b_bufsize;
				atomic_add_long(&runningbufspace,
					       bp->b_runningbufspace);
			} else {
				error = ffs_copyonwrite(vp, bp);
				if (error != 0 && error != EOPNOTSUPP) {
					bp->b_error = error;
					bp->b_ioflags |= BIO_ERROR;
					bp->b_flags &= ~B_BARRIER;
					bufdone(bp);
					return;
				}
			}
		}
#ifdef SOFTUPDATES
		/*
		 * Start dependency processing for each buffer that has
		 * dependencies; for a cluster that is every member buffer.
		 */
		if ((bp->b_flags & B_CLUSTER) != 0) {
			TAILQ_FOREACH(tbp, &bp->b_cluster.cluster_head,
				      b_cluster.cluster_entry) {
				if (!LIST_EMPTY(&tbp->b_dep))
					buf_start(tbp);
			}
		} else {
			if (!LIST_EMPTY(&bp->b_dep))
				buf_start(bp);
		}

#endif
		/*
		 * Check for metadata that needs check-hashes and update them.
		 * Exactly one BX_FSPRIV type bit is expected; several
		 * bits set at once fall through to the default case.
		 */
		switch (bp->b_xflags & BX_FSPRIV) {
		case BX_CYLGRP:
			/* The hash is computed with its own field zeroed. */
			((struct cg *)bp->b_data)->cg_ckhash = 0;
			((struct cg *)bp->b_data)->cg_ckhash =
			    calculate_crc32c(~0L, bp->b_data, bp->b_bcount);
			break;

		case BX_SUPERBLOCK:
		case BX_INODE:
		case BX_INDIR:
		case BX_DIR:
			printf("Check-hash write is unimplemented!!!\n");
			break;

		case 0:
			break;

		default:
			printf("multiple buffer types 0x%b\n",
			    (u_int)(bp->b_xflags & BX_FSPRIV),
			    PRINT_UFS_BUF_XFLAGS);
			break;
		}
	}
	if (bp->b_iocmd != BIO_READ && ffs_enxio_enable)
		bp->b_xflags |= BX_CVTENXIO;
	g_vfs_strategy(bo, bp);
}
271852dfc8d7SKonstantin Belousov 
27191848286aSEdward Tomasz Napierala int
27201848286aSEdward Tomasz Napierala ffs_own_mount(const struct mount *mp)
27211848286aSEdward Tomasz Napierala {
27221848286aSEdward Tomasz Napierala 
27231848286aSEdward Tomasz Napierala 	if (mp->mnt_op == &ufs_vfsops)
27241848286aSEdward Tomasz Napierala 		return (1);
27251848286aSEdward Tomasz Napierala 	return (0);
27261848286aSEdward Tomasz Napierala }
27271848286aSEdward Tomasz Napierala 
272852dfc8d7SKonstantin Belousov #ifdef	DDB
2729cf058082SBrooks Davis #ifdef SOFTUPDATES
273052dfc8d7SKonstantin Belousov 
2731519e3c3bSKirk McKusick /* defined in ffs_softdep.c */
2732519e3c3bSKirk McKusick extern void db_print_ffs(struct ufsmount *ump);
273352dfc8d7SKonstantin Belousov 
273452dfc8d7SKonstantin Belousov DB_SHOW_COMMAND(ffs, db_show_ffs)
273552dfc8d7SKonstantin Belousov {
273652dfc8d7SKonstantin Belousov 	struct mount *mp;
273752dfc8d7SKonstantin Belousov 	struct ufsmount *ump;
273852dfc8d7SKonstantin Belousov 
273952dfc8d7SKonstantin Belousov 	if (have_addr) {
274052dfc8d7SKonstantin Belousov 		ump = VFSTOUFS((struct mount *)addr);
274152dfc8d7SKonstantin Belousov 		db_print_ffs(ump);
274252dfc8d7SKonstantin Belousov 		return;
274352dfc8d7SKonstantin Belousov 	}
274452dfc8d7SKonstantin Belousov 
274552dfc8d7SKonstantin Belousov 	TAILQ_FOREACH(mp, &mountlist, mnt_list) {
274652dfc8d7SKonstantin Belousov 		if (!strcmp(mp->mnt_stat.f_fstypename, ufs_vfsconf.vfc_name))
274752dfc8d7SKonstantin Belousov 			db_print_ffs(VFSTOUFS(mp));
274852dfc8d7SKonstantin Belousov 	}
274952dfc8d7SKonstantin Belousov }
275052dfc8d7SKonstantin Belousov 
2751cf058082SBrooks Davis #endif	/* SOFTUPDATES */
275252dfc8d7SKonstantin Belousov #endif	/* DDB */
2753