xref: /freebsd/sys/geom/geom_vfs.c (revision e521fb0558bac9d41774c255c348ef655ab87218)
14d13ab3dSPoul-Henning Kamp /*-
24d13ab3dSPoul-Henning Kamp  * Copyright (c) 2004 Poul-Henning Kamp
34d13ab3dSPoul-Henning Kamp  * All rights reserved.
44d13ab3dSPoul-Henning Kamp  *
54d13ab3dSPoul-Henning Kamp  * Redistribution and use in source and binary forms, with or without
64d13ab3dSPoul-Henning Kamp  * modification, are permitted provided that the following conditions
74d13ab3dSPoul-Henning Kamp  * are met:
84d13ab3dSPoul-Henning Kamp  * 1. Redistributions of source code must retain the above copyright
94d13ab3dSPoul-Henning Kamp  *    notice, this list of conditions and the following disclaimer.
104d13ab3dSPoul-Henning Kamp  * 2. Redistributions in binary form must reproduce the above copyright
114d13ab3dSPoul-Henning Kamp  *    notice, this list of conditions and the following disclaimer in the
124d13ab3dSPoul-Henning Kamp  *    documentation and/or other materials provided with the distribution.
134d13ab3dSPoul-Henning Kamp  *
144d13ab3dSPoul-Henning Kamp  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
154d13ab3dSPoul-Henning Kamp  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
164d13ab3dSPoul-Henning Kamp  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
174d13ab3dSPoul-Henning Kamp  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
184d13ab3dSPoul-Henning Kamp  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
194d13ab3dSPoul-Henning Kamp  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
204d13ab3dSPoul-Henning Kamp  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
214d13ab3dSPoul-Henning Kamp  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
224d13ab3dSPoul-Henning Kamp  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
234d13ab3dSPoul-Henning Kamp  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
244d13ab3dSPoul-Henning Kamp  * SUCH DAMAGE.
254d13ab3dSPoul-Henning Kamp  */
264d13ab3dSPoul-Henning Kamp 
274d13ab3dSPoul-Henning Kamp #include <sys/cdefs.h>
284d13ab3dSPoul-Henning Kamp __FBSDID("$FreeBSD$");
294d13ab3dSPoul-Henning Kamp 
304d13ab3dSPoul-Henning Kamp #include <sys/param.h>
314d13ab3dSPoul-Henning Kamp #include <sys/systm.h>
324d13ab3dSPoul-Henning Kamp #include <sys/bio.h>
334d13ab3dSPoul-Henning Kamp #include <sys/kernel.h>
34ea5791d7SAlexander Motin #include <sys/lock.h>
354d13ab3dSPoul-Henning Kamp #include <sys/malloc.h>
36ea5791d7SAlexander Motin #include <sys/mutex.h>
374d13ab3dSPoul-Henning Kamp #include <sys/vnode.h>
381907e620SJeff Roberson #include <sys/mount.h>	/* XXX Temporary for VFS_LOCK_GIANT */
394d13ab3dSPoul-Henning Kamp 
404d13ab3dSPoul-Henning Kamp #include <geom/geom.h>
414d13ab3dSPoul-Henning Kamp #include <geom/geom_vfs.h>
424d13ab3dSPoul-Henning Kamp 
434d13ab3dSPoul-Henning Kamp /*
444d13ab3dSPoul-Henning Kamp  * subroutines for use by filesystems.
454d13ab3dSPoul-Henning Kamp  *
464d13ab3dSPoul-Henning Kamp  * XXX: should maybe live somewhere else ?
474d13ab3dSPoul-Henning Kamp  */
484d13ab3dSPoul-Henning Kamp #include <sys/buf.h>
494d13ab3dSPoul-Henning Kamp 
50ea5791d7SAlexander Motin struct g_vfs_softc {
51ea5791d7SAlexander Motin 	struct mtx	 sc_mtx;
52ea5791d7SAlexander Motin 	struct bufobj	*sc_bo;
53ea5791d7SAlexander Motin 	int		 sc_active;
54ea5791d7SAlexander Motin 	int		 sc_orphaned;
55ea5791d7SAlexander Motin };
56ea5791d7SAlexander Motin 
574d13ab3dSPoul-Henning Kamp static struct buf_ops __g_vfs_bufops = {
584d13ab3dSPoul-Henning Kamp 	.bop_name =	"GEOM_VFS",
594d13ab3dSPoul-Henning Kamp 	.bop_write =	bufwrite,
604d13ab3dSPoul-Henning Kamp 	.bop_strategy =	g_vfs_strategy,
616ef8480aSPoul-Henning Kamp 	.bop_sync =	bufsync,
622cc7d26fSKonstantin Belousov 	.bop_bdflush =	bufbdflush
634d13ab3dSPoul-Henning Kamp };
644d13ab3dSPoul-Henning Kamp 
654d13ab3dSPoul-Henning Kamp struct buf_ops *g_vfs_bufops = &__g_vfs_bufops;
664d13ab3dSPoul-Henning Kamp 
6707e95ed6SPoul-Henning Kamp static g_orphan_t g_vfs_orphan;
6807e95ed6SPoul-Henning Kamp 
694d13ab3dSPoul-Henning Kamp static struct g_class g_vfs_class = {
704d13ab3dSPoul-Henning Kamp 	.name =		"VFS",
714d13ab3dSPoul-Henning Kamp 	.version =	G_VERSION,
724d13ab3dSPoul-Henning Kamp 	.orphan =	g_vfs_orphan,
734d13ab3dSPoul-Henning Kamp };
744d13ab3dSPoul-Henning Kamp 
754d13ab3dSPoul-Henning Kamp DECLARE_GEOM_CLASS(g_vfs_class, g_vfs);
764d13ab3dSPoul-Henning Kamp 
774d13ab3dSPoul-Henning Kamp static void
78ea5791d7SAlexander Motin g_vfs_destroy(void *arg, int flags __unused)
79ea5791d7SAlexander Motin {
80ea5791d7SAlexander Motin 	struct g_consumer *cp;
81ea5791d7SAlexander Motin 
82ea5791d7SAlexander Motin 	g_topology_assert();
83ea5791d7SAlexander Motin 	cp = arg;
84ea5791d7SAlexander Motin 	if (cp->acr > 0 || cp->acw > 0 || cp->ace > 0)
85ea5791d7SAlexander Motin 		g_access(cp, -cp->acr, -cp->acw, -cp->ace);
86ea5791d7SAlexander Motin 	g_detach(cp);
87ea5791d7SAlexander Motin 	if (cp->geom->softc == NULL)
88ea5791d7SAlexander Motin 		g_wither_geom(cp->geom, ENXIO);
89ea5791d7SAlexander Motin }
90ea5791d7SAlexander Motin 
91ea5791d7SAlexander Motin static void
924d13ab3dSPoul-Henning Kamp g_vfs_done(struct bio *bip)
934d13ab3dSPoul-Henning Kamp {
94ea5791d7SAlexander Motin 	struct g_consumer *cp;
95ea5791d7SAlexander Motin 	struct g_vfs_softc *sc;
964d13ab3dSPoul-Henning Kamp 	struct buf *bp;
97ea5791d7SAlexander Motin 	int vfslocked, destroy;
981faacf5dSKirk McKusick 	struct mount *mp;
991faacf5dSKirk McKusick 	struct vnode *vp;
10085121b09SKirk McKusick 	struct cdev *cdevp;
1011faacf5dSKirk McKusick 
1021faacf5dSKirk McKusick 	/*
1031faacf5dSKirk McKusick 	 * Collect statistics on synchronous and asynchronous read
1041faacf5dSKirk McKusick 	 * and write counts for disks that have associated filesystems.
1051faacf5dSKirk McKusick 	 * Since this run by the g_up thread it is single threaded and
1061faacf5dSKirk McKusick 	 * we do not need to use atomic increments on the counters.
1071faacf5dSKirk McKusick 	 */
1081faacf5dSKirk McKusick 	bp = bip->bio_caller2;
1091faacf5dSKirk McKusick 	vp = bp->b_vp;
11085121b09SKirk McKusick 	if (vp == NULL) {
1111faacf5dSKirk McKusick 		mp = NULL;
11285121b09SKirk McKusick 	} else {
11385121b09SKirk McKusick 		/*
11485121b09SKirk McKusick 		 * If not a disk vnode, use its associated mount point
11585121b09SKirk McKusick 		 * otherwise use the mountpoint associated with the disk.
11685121b09SKirk McKusick 		 */
11785121b09SKirk McKusick 		VI_LOCK(vp);
11885121b09SKirk McKusick 		if (vp->v_type != VCHR ||
11985121b09SKirk McKusick 		    (cdevp = vp->v_rdev) == NULL ||
12085121b09SKirk McKusick 		    cdevp->si_devsw == NULL ||
12185121b09SKirk McKusick 		    (cdevp->si_devsw->d_flags & D_DISK) == 0)
1221faacf5dSKirk McKusick 			mp = vp->v_mount;
12385121b09SKirk McKusick 		else
12485121b09SKirk McKusick 			mp = cdevp->si_mountpt;
12585121b09SKirk McKusick 		VI_UNLOCK(vp);
12685121b09SKirk McKusick 	}
1271faacf5dSKirk McKusick 	if (mp != NULL) {
1281faacf5dSKirk McKusick 		if (bp->b_iocmd == BIO_WRITE) {
1291faacf5dSKirk McKusick 			if (LK_HOLDER(bp->b_lock.lk_lock) == LK_KERNPROC)
1301faacf5dSKirk McKusick 				mp->mnt_stat.f_asyncwrites++;
1311faacf5dSKirk McKusick 			else
1321faacf5dSKirk McKusick 				mp->mnt_stat.f_syncwrites++;
1331faacf5dSKirk McKusick 		} else {
1341faacf5dSKirk McKusick 			if (LK_HOLDER(bp->b_lock.lk_lock) == LK_KERNPROC)
1351faacf5dSKirk McKusick 				mp->mnt_stat.f_asyncreads++;
1361faacf5dSKirk McKusick 			else
1371faacf5dSKirk McKusick 				mp->mnt_stat.f_syncreads++;
1381faacf5dSKirk McKusick 		}
1391faacf5dSKirk McKusick 	}
1404d13ab3dSPoul-Henning Kamp 
141ea5791d7SAlexander Motin 	cp = bip->bio_from;
142ea5791d7SAlexander Motin 	sc = cp->geom->softc;
1434d13ab3dSPoul-Henning Kamp 	if (bip->bio_error) {
144f9eeb895SPoul-Henning Kamp 		printf("g_vfs_done():");
1454d13ab3dSPoul-Henning Kamp 		g_print_bio(bip);
1464d13ab3dSPoul-Henning Kamp 		printf("error = %d\n", bip->bio_error);
1474d13ab3dSPoul-Henning Kamp 	}
1484d13ab3dSPoul-Henning Kamp 	bp->b_error = bip->bio_error;
1494d13ab3dSPoul-Henning Kamp 	bp->b_ioflags = bip->bio_flags;
1504d13ab3dSPoul-Henning Kamp 	if (bip->bio_error)
1514d13ab3dSPoul-Henning Kamp 		bp->b_ioflags |= BIO_ERROR;
1524d13ab3dSPoul-Henning Kamp 	bp->b_resid = bp->b_bcount - bip->bio_completed;
1534d13ab3dSPoul-Henning Kamp 	g_destroy_bio(bip);
154ea5791d7SAlexander Motin 
155ea5791d7SAlexander Motin 	mtx_lock(&sc->sc_mtx);
156ea5791d7SAlexander Motin 	destroy = ((--sc->sc_active) == 0 && sc->sc_orphaned);
157ea5791d7SAlexander Motin 	mtx_unlock(&sc->sc_mtx);
158ea5791d7SAlexander Motin 	if (destroy)
159ea5791d7SAlexander Motin 		g_post_event(g_vfs_destroy, cp, M_WAITOK, NULL);
160ea5791d7SAlexander Motin 
1611907e620SJeff Roberson 	vfslocked = VFS_LOCK_GIANT(((struct mount *)NULL));
1624d13ab3dSPoul-Henning Kamp 	bufdone(bp);
1631907e620SJeff Roberson 	VFS_UNLOCK_GIANT(vfslocked);
1644d13ab3dSPoul-Henning Kamp }
1654d13ab3dSPoul-Henning Kamp 
1664d13ab3dSPoul-Henning Kamp void
1674d13ab3dSPoul-Henning Kamp g_vfs_strategy(struct bufobj *bo, struct buf *bp)
1684d13ab3dSPoul-Henning Kamp {
169ea5791d7SAlexander Motin 	struct g_vfs_softc *sc;
1704d13ab3dSPoul-Henning Kamp 	struct g_consumer *cp;
1714d13ab3dSPoul-Henning Kamp 	struct bio *bip;
172ce8be7b8SEdward Tomasz Napierala 	int vfslocked;
1734d13ab3dSPoul-Henning Kamp 
1744d13ab3dSPoul-Henning Kamp 	cp = bo->bo_private;
175ea5791d7SAlexander Motin 	sc = cp->geom->softc;
1764d13ab3dSPoul-Henning Kamp 
177ce8be7b8SEdward Tomasz Napierala 	/*
1786bccea7cSRebecca Cran 	 * If the provider has orphaned us, just return EXIO.
179ce8be7b8SEdward Tomasz Napierala 	 */
180ea5791d7SAlexander Motin 	mtx_lock(&sc->sc_mtx);
181ea5791d7SAlexander Motin 	if (sc->sc_orphaned) {
182ea5791d7SAlexander Motin 		mtx_unlock(&sc->sc_mtx);
183ce8be7b8SEdward Tomasz Napierala 		bp->b_error = ENXIO;
184ce8be7b8SEdward Tomasz Napierala 		bp->b_ioflags |= BIO_ERROR;
185ce8be7b8SEdward Tomasz Napierala 		vfslocked = VFS_LOCK_GIANT(((struct mount *)NULL));
186ce8be7b8SEdward Tomasz Napierala 		bufdone(bp);
187ce8be7b8SEdward Tomasz Napierala 		VFS_UNLOCK_GIANT(vfslocked);
188ce8be7b8SEdward Tomasz Napierala 		return;
189ce8be7b8SEdward Tomasz Napierala 	}
190ea5791d7SAlexander Motin 	sc->sc_active++;
191ea5791d7SAlexander Motin 	mtx_unlock(&sc->sc_mtx);
192ce8be7b8SEdward Tomasz Napierala 
1934d13ab3dSPoul-Henning Kamp 	bip = g_alloc_bio();
1944d13ab3dSPoul-Henning Kamp 	bip->bio_cmd = bp->b_iocmd;
1954d13ab3dSPoul-Henning Kamp 	bip->bio_offset = bp->b_iooffset;
1964d13ab3dSPoul-Henning Kamp 	bip->bio_data = bp->b_data;
1974d13ab3dSPoul-Henning Kamp 	bip->bio_done = g_vfs_done;
1984d13ab3dSPoul-Henning Kamp 	bip->bio_caller2 = bp;
1994d13ab3dSPoul-Henning Kamp 	bip->bio_length = bp->b_bcount;
2004d13ab3dSPoul-Henning Kamp 	g_io_request(bip, cp);
2014d13ab3dSPoul-Henning Kamp }
2024d13ab3dSPoul-Henning Kamp 
20307e95ed6SPoul-Henning Kamp static void
2044d13ab3dSPoul-Henning Kamp g_vfs_orphan(struct g_consumer *cp)
2054d13ab3dSPoul-Henning Kamp {
206ce8be7b8SEdward Tomasz Napierala 	struct g_geom *gp;
207ea5791d7SAlexander Motin 	struct g_vfs_softc *sc;
208ea5791d7SAlexander Motin 	int destroy;
209ce8be7b8SEdward Tomasz Napierala 
210ce8be7b8SEdward Tomasz Napierala 	g_topology_assert();
211ce8be7b8SEdward Tomasz Napierala 
212ce8be7b8SEdward Tomasz Napierala 	gp = cp->geom;
213ce8be7b8SEdward Tomasz Napierala 	g_trace(G_T_TOPOLOGY, "g_vfs_orphan(%p(%s))", cp, gp->name);
214a2fa37feSAlexander Motin 	sc = gp->softc;
215a2fa37feSAlexander Motin 	if (sc == NULL)
216a2fa37feSAlexander Motin 		return;
217ea5791d7SAlexander Motin 	mtx_lock(&sc->sc_mtx);
218ea5791d7SAlexander Motin 	sc->sc_orphaned = 1;
219*e521fb05SAlexander Motin 	destroy = (sc->sc_active == 0);
220ea5791d7SAlexander Motin 	mtx_unlock(&sc->sc_mtx);
221ea5791d7SAlexander Motin 	if (destroy)
222ea5791d7SAlexander Motin 		g_vfs_destroy(cp, 0);
2234d13ab3dSPoul-Henning Kamp 
2244d13ab3dSPoul-Henning Kamp 	/*
22538153e80SEdward Tomasz Napierala 	 * Do not destroy the geom.  Filesystem will do that during unmount.
2264d13ab3dSPoul-Henning Kamp 	 */
2274d13ab3dSPoul-Henning Kamp }
2284d13ab3dSPoul-Henning Kamp 
2294d13ab3dSPoul-Henning Kamp int
2304d13ab3dSPoul-Henning Kamp g_vfs_open(struct vnode *vp, struct g_consumer **cpp, const char *fsname, int wr)
2314d13ab3dSPoul-Henning Kamp {
2324d13ab3dSPoul-Henning Kamp 	struct g_geom *gp;
2334d13ab3dSPoul-Henning Kamp 	struct g_provider *pp;
2344d13ab3dSPoul-Henning Kamp 	struct g_consumer *cp;
235ea5791d7SAlexander Motin 	struct g_vfs_softc *sc;
2364d13ab3dSPoul-Henning Kamp 	struct bufobj *bo;
237420239c7SJeff Roberson 	int vfslocked;
2384d13ab3dSPoul-Henning Kamp 	int error;
2394d13ab3dSPoul-Henning Kamp 
2404d13ab3dSPoul-Henning Kamp 	g_topology_assert();
2414d13ab3dSPoul-Henning Kamp 
2424d13ab3dSPoul-Henning Kamp 	*cpp = NULL;
2438f128ff5SAndriy Gapon 	bo = &vp->v_bufobj;
2448f128ff5SAndriy Gapon 	if (bo->bo_private != vp)
2458f128ff5SAndriy Gapon 		return (EBUSY);
2468f128ff5SAndriy Gapon 
2474d13ab3dSPoul-Henning Kamp 	pp = g_dev_getprovider(vp->v_rdev);
2484d13ab3dSPoul-Henning Kamp 	if (pp == NULL)
2494d13ab3dSPoul-Henning Kamp 		return (ENOENT);
2504d13ab3dSPoul-Henning Kamp 	gp = g_new_geomf(&g_vfs_class, "%s.%s", fsname, pp->name);
251ea5791d7SAlexander Motin 	sc = g_malloc(sizeof(*sc), M_WAITOK | M_ZERO);
252ea5791d7SAlexander Motin 	mtx_init(&sc->sc_mtx, "g_vfs", NULL, MTX_DEF);
253ea5791d7SAlexander Motin 	sc->sc_bo = bo;
254ea5791d7SAlexander Motin 	gp->softc = sc;
2554d13ab3dSPoul-Henning Kamp 	cp = g_new_consumer(gp);
2564d13ab3dSPoul-Henning Kamp 	g_attach(cp, pp);
2578795189cSKirk McKusick 	error = g_access(cp, 1, wr, wr);
2584d13ab3dSPoul-Henning Kamp 	if (error) {
2594d13ab3dSPoul-Henning Kamp 		g_wither_geom(gp, ENXIO);
2604d13ab3dSPoul-Henning Kamp 		return (error);
2614d13ab3dSPoul-Henning Kamp 	}
262420239c7SJeff Roberson 	vfslocked = VFS_LOCK_GIANT(vp->v_mount);
263bc0fc6fcSPoul-Henning Kamp 	vnode_create_vobject(vp, pp->mediasize, curthread);
264420239c7SJeff Roberson 	VFS_UNLOCK_GIANT(vfslocked);
2654d13ab3dSPoul-Henning Kamp 	*cpp = cp;
2668f128ff5SAndriy Gapon 	cp->private = vp;
2674d13ab3dSPoul-Henning Kamp 	bo->bo_ops = g_vfs_bufops;
2684d13ab3dSPoul-Henning Kamp 	bo->bo_private = cp;
2691b4bc5f8SAndriy Gapon 	bo->bo_bsize = pp->sectorsize;
2704d13ab3dSPoul-Henning Kamp 
2714d13ab3dSPoul-Henning Kamp 	return (error);
2724d13ab3dSPoul-Henning Kamp }
27384a69752SPoul-Henning Kamp 
27484a69752SPoul-Henning Kamp void
2750d7935fdSAttilio Rao g_vfs_close(struct g_consumer *cp)
27684a69752SPoul-Henning Kamp {
27784a69752SPoul-Henning Kamp 	struct g_geom *gp;
278ea5791d7SAlexander Motin 	struct g_vfs_softc *sc;
27984a69752SPoul-Henning Kamp 
28084a69752SPoul-Henning Kamp 	g_topology_assert();
28184a69752SPoul-Henning Kamp 
28284a69752SPoul-Henning Kamp 	gp = cp->geom;
283ea5791d7SAlexander Motin 	sc = gp->softc;
284ea5791d7SAlexander Motin 	bufobj_invalbuf(sc->sc_bo, V_SAVE, 0, 0);
285ea5791d7SAlexander Motin 	sc->sc_bo->bo_private = cp->private;
286ea5791d7SAlexander Motin 	gp->softc = NULL;
287ea5791d7SAlexander Motin 	mtx_destroy(&sc->sc_mtx);
288ea5791d7SAlexander Motin 	if (!sc->sc_orphaned || cp->provider == NULL)
28984a69752SPoul-Henning Kamp 		g_wither_geom_close(gp, ENXIO);
290ea5791d7SAlexander Motin 	g_free(sc);
29184a69752SPoul-Henning Kamp }
292