14d13ab3dSPoul-Henning Kamp /*- 23728855aSPedro F. Giffuni * SPDX-License-Identifier: BSD-2-Clause-FreeBSD 33728855aSPedro F. Giffuni * 44d13ab3dSPoul-Henning Kamp * Copyright (c) 2004 Poul-Henning Kamp 54d13ab3dSPoul-Henning Kamp * All rights reserved. 64d13ab3dSPoul-Henning Kamp * 74d13ab3dSPoul-Henning Kamp * Redistribution and use in source and binary forms, with or without 84d13ab3dSPoul-Henning Kamp * modification, are permitted provided that the following conditions 94d13ab3dSPoul-Henning Kamp * are met: 104d13ab3dSPoul-Henning Kamp * 1. Redistributions of source code must retain the above copyright 114d13ab3dSPoul-Henning Kamp * notice, this list of conditions and the following disclaimer. 124d13ab3dSPoul-Henning Kamp * 2. Redistributions in binary form must reproduce the above copyright 134d13ab3dSPoul-Henning Kamp * notice, this list of conditions and the following disclaimer in the 144d13ab3dSPoul-Henning Kamp * documentation and/or other materials provided with the distribution. 154d13ab3dSPoul-Henning Kamp * 164d13ab3dSPoul-Henning Kamp * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 174d13ab3dSPoul-Henning Kamp * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 184d13ab3dSPoul-Henning Kamp * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 194d13ab3dSPoul-Henning Kamp * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 204d13ab3dSPoul-Henning Kamp * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 214d13ab3dSPoul-Henning Kamp * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 224d13ab3dSPoul-Henning Kamp * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 234d13ab3dSPoul-Henning Kamp * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 244d13ab3dSPoul-Henning Kamp * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 254d13ab3dSPoul-Henning Kamp * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 264d13ab3dSPoul-Henning Kamp * SUCH DAMAGE. 274d13ab3dSPoul-Henning Kamp */ 284d13ab3dSPoul-Henning Kamp 294d13ab3dSPoul-Henning Kamp #include <sys/cdefs.h> 304d13ab3dSPoul-Henning Kamp __FBSDID("$FreeBSD$"); 314d13ab3dSPoul-Henning Kamp 324d13ab3dSPoul-Henning Kamp #include <sys/param.h> 334d13ab3dSPoul-Henning Kamp #include <sys/systm.h> 344d13ab3dSPoul-Henning Kamp #include <sys/bio.h> 354d13ab3dSPoul-Henning Kamp #include <sys/kernel.h> 36ea5791d7SAlexander Motin #include <sys/lock.h> 374d13ab3dSPoul-Henning Kamp #include <sys/malloc.h> 38ea5791d7SAlexander Motin #include <sys/mutex.h> 39ac03832eSConrad Meyer #include <sys/sbuf.h> 404d13ab3dSPoul-Henning Kamp #include <sys/vnode.h> 415050aa86SKonstantin Belousov #include <sys/mount.h> 424d13ab3dSPoul-Henning Kamp 434d13ab3dSPoul-Henning Kamp #include <geom/geom.h> 444d13ab3dSPoul-Henning Kamp #include <geom/geom_vfs.h> 454d13ab3dSPoul-Henning Kamp 464d13ab3dSPoul-Henning Kamp /* 474d13ab3dSPoul-Henning Kamp * subroutines for use by filesystems. 484d13ab3dSPoul-Henning Kamp * 494d13ab3dSPoul-Henning Kamp * XXX: should maybe live somewhere else ? 504d13ab3dSPoul-Henning Kamp */ 514d13ab3dSPoul-Henning Kamp #include <sys/buf.h> 524d13ab3dSPoul-Henning Kamp 53ea5791d7SAlexander Motin struct g_vfs_softc { 54ea5791d7SAlexander Motin struct mtx sc_mtx; 55ea5791d7SAlexander Motin struct bufobj *sc_bo; 56419d406eSJohn Baldwin struct g_event *sc_event; 57ea5791d7SAlexander Motin int sc_active; 58f58385f3SWarner Losh bool sc_orphaned; 59d79ff54bSChuck Silvers int sc_enxio_active; 60*347a8e93SWarner Losh int sc_enxio_reported; 61ea5791d7SAlexander Motin }; 62ea5791d7SAlexander Motin 634d13ab3dSPoul-Henning Kamp static struct buf_ops __g_vfs_bufops = { 644d13ab3dSPoul-Henning Kamp .bop_name = "GEOM_VFS", 654d13ab3dSPoul-Henning Kamp .bop_write = bufwrite, 664d13ab3dSPoul-Henning Kamp .bop_strategy = g_vfs_strategy, 676ef8480aSPoul-Henning Kamp .bop_sync = bufsync, 682cc7d26fSKonstantin Belousov .bop_bdflush = bufbdflush 694d13ab3dSPoul-Henning Kamp }; 704d13ab3dSPoul-Henning Kamp 714d13ab3dSPoul-Henning Kamp struct buf_ops *g_vfs_bufops = &__g_vfs_bufops; 724d13ab3dSPoul-Henning Kamp 7307e95ed6SPoul-Henning Kamp static g_orphan_t g_vfs_orphan; 7407e95ed6SPoul-Henning Kamp 754d13ab3dSPoul-Henning Kamp static struct g_class g_vfs_class = { 764d13ab3dSPoul-Henning Kamp .name = "VFS", 774d13ab3dSPoul-Henning Kamp .version = G_VERSION, 784d13ab3dSPoul-Henning Kamp .orphan = g_vfs_orphan, 794d13ab3dSPoul-Henning Kamp }; 804d13ab3dSPoul-Henning Kamp 814d13ab3dSPoul-Henning Kamp DECLARE_GEOM_CLASS(g_vfs_class, g_vfs); 824d13ab3dSPoul-Henning Kamp 834d13ab3dSPoul-Henning Kamp static void 84ea5791d7SAlexander Motin g_vfs_destroy(void *arg, int flags __unused) 85ea5791d7SAlexander Motin { 86ea5791d7SAlexander Motin struct g_consumer *cp; 87ea5791d7SAlexander Motin 88ea5791d7SAlexander Motin g_topology_assert(); 89ea5791d7SAlexander Motin cp = arg; 90ea5791d7SAlexander Motin if (cp->acr > 0 || cp->acw > 0 || cp->ace > 0) 91ea5791d7SAlexander Motin g_access(cp, -cp->acr, -cp->acw, -cp->ace); 92ea5791d7SAlexander Motin g_detach(cp); 93ea5791d7SAlexander Motin if (cp->geom->softc == NULL) 94ea5791d7SAlexander Motin g_wither_geom(cp->geom, ENXIO); 95ea5791d7SAlexander Motin } 96ea5791d7SAlexander Motin 97ea5791d7SAlexander Motin static void 984d13ab3dSPoul-Henning Kamp g_vfs_done(struct bio *bip) 994d13ab3dSPoul-Henning Kamp { 100ea5791d7SAlexander Motin struct g_consumer *cp; 101419d406eSJohn Baldwin struct g_event *event; 102ea5791d7SAlexander Motin struct g_vfs_softc *sc; 1034d13ab3dSPoul-Henning Kamp struct buf *bp; 1045050aa86SKonstantin Belousov int destroy; 1051faacf5dSKirk McKusick struct mount *mp; 1061faacf5dSKirk McKusick struct vnode *vp; 10785121b09SKirk McKusick struct cdev *cdevp; 1081faacf5dSKirk McKusick 1091faacf5dSKirk McKusick /* 1101faacf5dSKirk McKusick * Collect statistics on synchronous and asynchronous read 1111faacf5dSKirk McKusick * and write counts for disks that have associated filesystems. 1121faacf5dSKirk McKusick */ 1131faacf5dSKirk McKusick bp = bip->bio_caller2; 1141faacf5dSKirk McKusick vp = bp->b_vp; 11540ea77a0SAlexander Motin if (vp != NULL) { 11685121b09SKirk McKusick /* 11785121b09SKirk McKusick * If not a disk vnode, use its associated mount point 11885121b09SKirk McKusick * otherwise use the mountpoint associated with the disk. 11985121b09SKirk McKusick */ 12085121b09SKirk McKusick VI_LOCK(vp); 12185121b09SKirk McKusick if (vp->v_type != VCHR || 12285121b09SKirk McKusick (cdevp = vp->v_rdev) == NULL || 12385121b09SKirk McKusick cdevp->si_devsw == NULL || 12485121b09SKirk McKusick (cdevp->si_devsw->d_flags & D_DISK) == 0) 1251faacf5dSKirk McKusick mp = vp->v_mount; 12685121b09SKirk McKusick else 12785121b09SKirk McKusick mp = cdevp->si_mountpt; 1281faacf5dSKirk McKusick if (mp != NULL) { 12940ea77a0SAlexander Motin if (bp->b_iocmd == BIO_READ) { 1301faacf5dSKirk McKusick if (LK_HOLDER(bp->b_lock.lk_lock) == LK_KERNPROC) 1311faacf5dSKirk McKusick mp->mnt_stat.f_asyncreads++; 1321faacf5dSKirk McKusick else 1331faacf5dSKirk McKusick mp->mnt_stat.f_syncreads++; 13440ea77a0SAlexander Motin } else if (bp->b_iocmd == BIO_WRITE) { 13540ea77a0SAlexander Motin if (LK_HOLDER(bp->b_lock.lk_lock) == LK_KERNPROC) 13640ea77a0SAlexander Motin mp->mnt_stat.f_asyncwrites++; 13740ea77a0SAlexander Motin else 13840ea77a0SAlexander Motin mp->mnt_stat.f_syncwrites++; 1391faacf5dSKirk McKusick } 1401faacf5dSKirk McKusick } 14140ea77a0SAlexander Motin VI_UNLOCK(vp); 14240ea77a0SAlexander Motin } 1434d13ab3dSPoul-Henning Kamp 144ea5791d7SAlexander Motin cp = bip->bio_from; 145ea5791d7SAlexander Motin sc = cp->geom->softc; 146d79ff54bSChuck Silvers if (bip->bio_error != 0 && bip->bio_error != EOPNOTSUPP) { 147e8827f40SWarner Losh if ((bp->b_xflags & BX_CVTENXIO) != 0) { 148e8827f40SWarner Losh if (atomic_cmpset_int(&sc->sc_enxio_active, 0, 1)) 149e8827f40SWarner Losh printf("g_vfs_done(): %s converting all errors to ENXIO\n", 150e8827f40SWarner Losh bip->bio_to->name); 151e8827f40SWarner Losh } 152d79ff54bSChuck Silvers if (sc->sc_enxio_active) 153d79ff54bSChuck Silvers bip->bio_error = ENXIO; 154*347a8e93SWarner Losh if (bip->bio_error != ENXIO || 155*347a8e93SWarner Losh atomic_cmpset_int(&sc->sc_enxio_reported, 0, 1)) { 156*347a8e93SWarner Losh g_print_bio("g_vfs_done():", bip, "error = %d%s", 157*347a8e93SWarner Losh bip->bio_error, 158*347a8e93SWarner Losh bip->bio_error != ENXIO ? "" : 159*347a8e93SWarner Losh " supressing further ENXIO"); 160*347a8e93SWarner Losh } 161d79ff54bSChuck Silvers } 1624d13ab3dSPoul-Henning Kamp bp->b_error = bip->bio_error; 1634d13ab3dSPoul-Henning Kamp bp->b_ioflags = bip->bio_flags; 1644d13ab3dSPoul-Henning Kamp if (bip->bio_error) 1654d13ab3dSPoul-Henning Kamp bp->b_ioflags |= BIO_ERROR; 1664d13ab3dSPoul-Henning Kamp bp->b_resid = bp->b_bcount - bip->bio_completed; 1674d13ab3dSPoul-Henning Kamp g_destroy_bio(bip); 168ea5791d7SAlexander Motin 169ea5791d7SAlexander Motin mtx_lock(&sc->sc_mtx); 170ea5791d7SAlexander Motin destroy = ((--sc->sc_active) == 0 && sc->sc_orphaned); 171419d406eSJohn Baldwin if (destroy) { 172419d406eSJohn Baldwin event = sc->sc_event; 173419d406eSJohn Baldwin sc->sc_event = NULL; 174419d406eSJohn Baldwin } else 175419d406eSJohn Baldwin event = NULL; 176ea5791d7SAlexander Motin mtx_unlock(&sc->sc_mtx); 177ea5791d7SAlexander Motin if (destroy) 178419d406eSJohn Baldwin g_post_event_ep(g_vfs_destroy, cp, event, NULL); 179ea5791d7SAlexander Motin 1804d13ab3dSPoul-Henning Kamp bufdone(bp); 1814d13ab3dSPoul-Henning Kamp } 1824d13ab3dSPoul-Henning Kamp 1834d13ab3dSPoul-Henning Kamp void 1844d13ab3dSPoul-Henning Kamp g_vfs_strategy(struct bufobj *bo, struct buf *bp) 1854d13ab3dSPoul-Henning Kamp { 186ea5791d7SAlexander Motin struct g_vfs_softc *sc; 1874d13ab3dSPoul-Henning Kamp struct g_consumer *cp; 1884d13ab3dSPoul-Henning Kamp struct bio *bip; 1894d13ab3dSPoul-Henning Kamp 1904d13ab3dSPoul-Henning Kamp cp = bo->bo_private; 191ea5791d7SAlexander Motin sc = cp->geom->softc; 1924d13ab3dSPoul-Henning Kamp 193ce8be7b8SEdward Tomasz Napierala /* 1946635c8edSEdward Tomasz Napierala * If the provider has orphaned us, just return ENXIO. 195ce8be7b8SEdward Tomasz Napierala */ 196ea5791d7SAlexander Motin mtx_lock(&sc->sc_mtx); 197d79ff54bSChuck Silvers if (sc->sc_orphaned || sc->sc_enxio_active) { 198ea5791d7SAlexander Motin mtx_unlock(&sc->sc_mtx); 199ce8be7b8SEdward Tomasz Napierala bp->b_error = ENXIO; 200ce8be7b8SEdward Tomasz Napierala bp->b_ioflags |= BIO_ERROR; 201ce8be7b8SEdward Tomasz Napierala bufdone(bp); 202ce8be7b8SEdward Tomasz Napierala return; 203ce8be7b8SEdward Tomasz Napierala } 204ea5791d7SAlexander Motin sc->sc_active++; 205ea5791d7SAlexander Motin mtx_unlock(&sc->sc_mtx); 206ce8be7b8SEdward Tomasz Napierala 2074d13ab3dSPoul-Henning Kamp bip = g_alloc_bio(); 2084d13ab3dSPoul-Henning Kamp bip->bio_cmd = bp->b_iocmd; 2094d13ab3dSPoul-Henning Kamp bip->bio_offset = bp->b_iooffset; 2104d13ab3dSPoul-Henning Kamp bip->bio_length = bp->b_bcount; 211ee75e7deSKonstantin Belousov bdata2bio(bp, bip); 212ee75e7deSKonstantin Belousov if ((bp->b_flags & B_BARRIER) != 0) { 2132bc1a1feSKirk McKusick bip->bio_flags |= BIO_ORDERED; 2142bc1a1feSKirk McKusick bp->b_flags &= ~B_BARRIER; 2152bc1a1feSKirk McKusick } 2163cf5dd84SWarner Losh if (bp->b_iocmd == BIO_SPEEDUP) 2173cf5dd84SWarner Losh bip->bio_flags |= bp->b_ioflags; 218ee75e7deSKonstantin Belousov bip->bio_done = g_vfs_done; 219ee75e7deSKonstantin Belousov bip->bio_caller2 = bp; 2208532d381SConrad Meyer #if defined(BUF_TRACKING) || defined(FULL_BUF_TRACKING) 2218532d381SConrad Meyer buf_track(bp, __func__); 2228532d381SConrad Meyer bip->bio_track_bp = bp; 2238532d381SConrad Meyer #endif 2244d13ab3dSPoul-Henning Kamp g_io_request(bip, cp); 2254d13ab3dSPoul-Henning Kamp } 2264d13ab3dSPoul-Henning Kamp 22707e95ed6SPoul-Henning Kamp static void 2284d13ab3dSPoul-Henning Kamp g_vfs_orphan(struct g_consumer *cp) 2294d13ab3dSPoul-Henning Kamp { 230ce8be7b8SEdward Tomasz Napierala struct g_geom *gp; 231419d406eSJohn Baldwin struct g_event *event; 232ea5791d7SAlexander Motin struct g_vfs_softc *sc; 233ea5791d7SAlexander Motin int destroy; 234ce8be7b8SEdward Tomasz Napierala 235ce8be7b8SEdward Tomasz Napierala g_topology_assert(); 236ce8be7b8SEdward Tomasz Napierala 237ce8be7b8SEdward Tomasz Napierala gp = cp->geom; 238ce8be7b8SEdward Tomasz Napierala g_trace(G_T_TOPOLOGY, "g_vfs_orphan(%p(%s))", cp, gp->name); 239a2fa37feSAlexander Motin sc = gp->softc; 240a2fa37feSAlexander Motin if (sc == NULL) 241a2fa37feSAlexander Motin return; 242419d406eSJohn Baldwin event = g_alloc_event(M_WAITOK); 243ea5791d7SAlexander Motin mtx_lock(&sc->sc_mtx); 244419d406eSJohn Baldwin KASSERT(sc->sc_event == NULL, ("g_vfs %p already has an event", sc)); 245f58385f3SWarner Losh sc->sc_orphaned = true; 246e521fb05SAlexander Motin destroy = (sc->sc_active == 0); 247419d406eSJohn Baldwin if (!destroy) { 248419d406eSJohn Baldwin sc->sc_event = event; 249419d406eSJohn Baldwin event = NULL; 250419d406eSJohn Baldwin } 251ea5791d7SAlexander Motin mtx_unlock(&sc->sc_mtx); 252419d406eSJohn Baldwin if (destroy) { 253419d406eSJohn Baldwin g_free(event); 254ea5791d7SAlexander Motin g_vfs_destroy(cp, 0); 255419d406eSJohn Baldwin } 2564d13ab3dSPoul-Henning Kamp 2574d13ab3dSPoul-Henning Kamp /* 25838153e80SEdward Tomasz Napierala * Do not destroy the geom. Filesystem will do that during unmount. 2594d13ab3dSPoul-Henning Kamp */ 2604d13ab3dSPoul-Henning Kamp } 2614d13ab3dSPoul-Henning Kamp 2624d13ab3dSPoul-Henning Kamp int 2634d13ab3dSPoul-Henning Kamp g_vfs_open(struct vnode *vp, struct g_consumer **cpp, const char *fsname, int wr) 2644d13ab3dSPoul-Henning Kamp { 2654d13ab3dSPoul-Henning Kamp struct g_geom *gp; 2664d13ab3dSPoul-Henning Kamp struct g_provider *pp; 2674d13ab3dSPoul-Henning Kamp struct g_consumer *cp; 268ea5791d7SAlexander Motin struct g_vfs_softc *sc; 2694d13ab3dSPoul-Henning Kamp struct bufobj *bo; 2704d13ab3dSPoul-Henning Kamp int error; 2714d13ab3dSPoul-Henning Kamp 2724d13ab3dSPoul-Henning Kamp g_topology_assert(); 2734d13ab3dSPoul-Henning Kamp 2744d13ab3dSPoul-Henning Kamp *cpp = NULL; 2758f128ff5SAndriy Gapon bo = &vp->v_bufobj; 2768f128ff5SAndriy Gapon if (bo->bo_private != vp) 2778f128ff5SAndriy Gapon return (EBUSY); 2788f128ff5SAndriy Gapon 2794d13ab3dSPoul-Henning Kamp pp = g_dev_getprovider(vp->v_rdev); 2804d13ab3dSPoul-Henning Kamp if (pp == NULL) 2814d13ab3dSPoul-Henning Kamp return (ENOENT); 2824d13ab3dSPoul-Henning Kamp gp = g_new_geomf(&g_vfs_class, "%s.%s", fsname, pp->name); 283ea5791d7SAlexander Motin sc = g_malloc(sizeof(*sc), M_WAITOK | M_ZERO); 284ea5791d7SAlexander Motin mtx_init(&sc->sc_mtx, "g_vfs", NULL, MTX_DEF); 285ea5791d7SAlexander Motin sc->sc_bo = bo; 286ea5791d7SAlexander Motin gp->softc = sc; 2874d13ab3dSPoul-Henning Kamp cp = g_new_consumer(gp); 288d22ff249SEdward Tomasz Napierala error = g_attach(cp, pp); 289d22ff249SEdward Tomasz Napierala if (error) { 290d22ff249SEdward Tomasz Napierala g_wither_geom(gp, ENXIO); 291d22ff249SEdward Tomasz Napierala return (error); 292d22ff249SEdward Tomasz Napierala } 2938795189cSKirk McKusick error = g_access(cp, 1, wr, wr); 2944d13ab3dSPoul-Henning Kamp if (error) { 2954d13ab3dSPoul-Henning Kamp g_wither_geom(gp, ENXIO); 2964d13ab3dSPoul-Henning Kamp return (error); 2974d13ab3dSPoul-Henning Kamp } 298bc0fc6fcSPoul-Henning Kamp vnode_create_vobject(vp, pp->mediasize, curthread); 2994d13ab3dSPoul-Henning Kamp *cpp = cp; 3008f128ff5SAndriy Gapon cp->private = vp; 30140ea77a0SAlexander Motin cp->flags |= G_CF_DIRECT_SEND | G_CF_DIRECT_RECEIVE; 3024d13ab3dSPoul-Henning Kamp bo->bo_ops = g_vfs_bufops; 3034d13ab3dSPoul-Henning Kamp bo->bo_private = cp; 3041b4bc5f8SAndriy Gapon bo->bo_bsize = pp->sectorsize; 3054d13ab3dSPoul-Henning Kamp 3064d13ab3dSPoul-Henning Kamp return (error); 3074d13ab3dSPoul-Henning Kamp } 30884a69752SPoul-Henning Kamp 30984a69752SPoul-Henning Kamp void 3100d7935fdSAttilio Rao g_vfs_close(struct g_consumer *cp) 31184a69752SPoul-Henning Kamp { 31284a69752SPoul-Henning Kamp struct g_geom *gp; 313ea5791d7SAlexander Motin struct g_vfs_softc *sc; 31484a69752SPoul-Henning Kamp 31584a69752SPoul-Henning Kamp g_topology_assert(); 31684a69752SPoul-Henning Kamp 31784a69752SPoul-Henning Kamp gp = cp->geom; 318ea5791d7SAlexander Motin sc = gp->softc; 319ea5791d7SAlexander Motin bufobj_invalbuf(sc->sc_bo, V_SAVE, 0, 0); 320ea5791d7SAlexander Motin sc->sc_bo->bo_private = cp->private; 321ea5791d7SAlexander Motin gp->softc = NULL; 322ea5791d7SAlexander Motin mtx_destroy(&sc->sc_mtx); 323ea5791d7SAlexander Motin if (!sc->sc_orphaned || cp->provider == NULL) 32484a69752SPoul-Henning Kamp g_wither_geom_close(gp, ENXIO); 325419d406eSJohn Baldwin KASSERT(sc->sc_event == NULL, ("g_vfs %p event is non-NULL", sc)); 326ea5791d7SAlexander Motin g_free(sc); 32784a69752SPoul-Henning Kamp } 328