14d13ab3dSPoul-Henning Kamp /*- 24d846d26SWarner Losh * SPDX-License-Identifier: BSD-2-Clause 33728855aSPedro F. Giffuni * 44d13ab3dSPoul-Henning Kamp * Copyright (c) 2004 Poul-Henning Kamp 54d13ab3dSPoul-Henning Kamp * All rights reserved. 64d13ab3dSPoul-Henning Kamp * 74d13ab3dSPoul-Henning Kamp * Redistribution and use in source and binary forms, with or without 84d13ab3dSPoul-Henning Kamp * modification, are permitted provided that the following conditions 94d13ab3dSPoul-Henning Kamp * are met: 104d13ab3dSPoul-Henning Kamp * 1. Redistributions of source code must retain the above copyright 114d13ab3dSPoul-Henning Kamp * notice, this list of conditions and the following disclaimer. 124d13ab3dSPoul-Henning Kamp * 2. Redistributions in binary form must reproduce the above copyright 134d13ab3dSPoul-Henning Kamp * notice, this list of conditions and the following disclaimer in the 144d13ab3dSPoul-Henning Kamp * documentation and/or other materials provided with the distribution. 154d13ab3dSPoul-Henning Kamp * 164d13ab3dSPoul-Henning Kamp * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 174d13ab3dSPoul-Henning Kamp * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 184d13ab3dSPoul-Henning Kamp * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 194d13ab3dSPoul-Henning Kamp * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 204d13ab3dSPoul-Henning Kamp * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 214d13ab3dSPoul-Henning Kamp * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 224d13ab3dSPoul-Henning Kamp * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 234d13ab3dSPoul-Henning Kamp * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 244d13ab3dSPoul-Henning Kamp * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 254d13ab3dSPoul-Henning Kamp * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 264d13ab3dSPoul-Henning Kamp * SUCH DAMAGE. 274d13ab3dSPoul-Henning Kamp */ 284d13ab3dSPoul-Henning Kamp 294d13ab3dSPoul-Henning Kamp #include <sys/param.h> 304d13ab3dSPoul-Henning Kamp #include <sys/systm.h> 314d13ab3dSPoul-Henning Kamp #include <sys/bio.h> 324d13ab3dSPoul-Henning Kamp #include <sys/kernel.h> 33ea5791d7SAlexander Motin #include <sys/lock.h> 344d13ab3dSPoul-Henning Kamp #include <sys/malloc.h> 35ea5791d7SAlexander Motin #include <sys/mutex.h> 36ac03832eSConrad Meyer #include <sys/sbuf.h> 374d13ab3dSPoul-Henning Kamp #include <sys/vnode.h> 385050aa86SKonstantin Belousov #include <sys/mount.h> 394d13ab3dSPoul-Henning Kamp 404d13ab3dSPoul-Henning Kamp #include <geom/geom.h> 414d13ab3dSPoul-Henning Kamp #include <geom/geom_vfs.h> 424d13ab3dSPoul-Henning Kamp 434d13ab3dSPoul-Henning Kamp /* 444d13ab3dSPoul-Henning Kamp * subroutines for use by filesystems. 454d13ab3dSPoul-Henning Kamp * 464d13ab3dSPoul-Henning Kamp * XXX: should maybe live somewhere else ? 474d13ab3dSPoul-Henning Kamp */ 484d13ab3dSPoul-Henning Kamp #include <sys/buf.h> 494d13ab3dSPoul-Henning Kamp 50ea5791d7SAlexander Motin struct g_vfs_softc { 51ea5791d7SAlexander Motin struct mtx sc_mtx; 52ea5791d7SAlexander Motin struct bufobj *sc_bo; 53419d406eSJohn Baldwin struct g_event *sc_event; 54ea5791d7SAlexander Motin int sc_active; 55f58385f3SWarner Losh bool sc_orphaned; 56d79ff54bSChuck Silvers int sc_enxio_active; 57347a8e93SWarner Losh int sc_enxio_reported; 58ea5791d7SAlexander Motin }; 59ea5791d7SAlexander Motin 604d13ab3dSPoul-Henning Kamp static struct buf_ops __g_vfs_bufops = { 614d13ab3dSPoul-Henning Kamp .bop_name = "GEOM_VFS", 624d13ab3dSPoul-Henning Kamp .bop_write = bufwrite, 634d13ab3dSPoul-Henning Kamp .bop_strategy = g_vfs_strategy, 646ef8480aSPoul-Henning Kamp .bop_sync = bufsync, 652cc7d26fSKonstantin Belousov .bop_bdflush = bufbdflush 664d13ab3dSPoul-Henning Kamp }; 674d13ab3dSPoul-Henning Kamp 684d13ab3dSPoul-Henning Kamp struct buf_ops *g_vfs_bufops = &__g_vfs_bufops; 694d13ab3dSPoul-Henning Kamp 7007e95ed6SPoul-Henning Kamp static g_orphan_t g_vfs_orphan; 7107e95ed6SPoul-Henning Kamp 724d13ab3dSPoul-Henning Kamp static struct g_class g_vfs_class = { 734d13ab3dSPoul-Henning Kamp .name = "VFS", 744d13ab3dSPoul-Henning Kamp .version = G_VERSION, 754d13ab3dSPoul-Henning Kamp .orphan = g_vfs_orphan, 764d13ab3dSPoul-Henning Kamp }; 774d13ab3dSPoul-Henning Kamp 784d13ab3dSPoul-Henning Kamp DECLARE_GEOM_CLASS(g_vfs_class, g_vfs); 794d13ab3dSPoul-Henning Kamp 804d13ab3dSPoul-Henning Kamp static void 81ea5791d7SAlexander Motin g_vfs_destroy(void *arg, int flags __unused) 82ea5791d7SAlexander Motin { 83ea5791d7SAlexander Motin struct g_consumer *cp; 84ea5791d7SAlexander Motin 85ea5791d7SAlexander Motin g_topology_assert(); 86ea5791d7SAlexander Motin cp = arg; 87ea5791d7SAlexander Motin if (cp->acr > 0 || cp->acw > 0 || cp->ace > 0) 88ea5791d7SAlexander Motin g_access(cp, -cp->acr, -cp->acw, -cp->ace); 89ea5791d7SAlexander Motin g_detach(cp); 90ea5791d7SAlexander Motin if (cp->geom->softc == NULL) 91ea5791d7SAlexander Motin g_wither_geom(cp->geom, ENXIO); 92ea5791d7SAlexander Motin } 93ea5791d7SAlexander Motin 94ea5791d7SAlexander Motin static void 954d13ab3dSPoul-Henning Kamp g_vfs_done(struct bio *bip) 964d13ab3dSPoul-Henning Kamp { 97ea5791d7SAlexander Motin struct g_consumer *cp; 98419d406eSJohn Baldwin struct g_event *event; 99ea5791d7SAlexander Motin struct g_vfs_softc *sc; 1004d13ab3dSPoul-Henning Kamp struct buf *bp; 1015050aa86SKonstantin Belousov int destroy; 1021faacf5dSKirk McKusick struct mount *mp; 1031faacf5dSKirk McKusick struct vnode *vp; 10485121b09SKirk McKusick struct cdev *cdevp; 1051faacf5dSKirk McKusick 1061faacf5dSKirk McKusick /* 1071faacf5dSKirk McKusick * Collect statistics on synchronous and asynchronous read 1081faacf5dSKirk McKusick * and write counts for disks that have associated filesystems. 1091faacf5dSKirk McKusick */ 1101faacf5dSKirk McKusick bp = bip->bio_caller2; 1111faacf5dSKirk McKusick vp = bp->b_vp; 11240ea77a0SAlexander Motin if (vp != NULL) { 11385121b09SKirk McKusick /* 11485121b09SKirk McKusick * If not a disk vnode, use its associated mount point 11585121b09SKirk McKusick * otherwise use the mountpoint associated with the disk. 11685121b09SKirk McKusick */ 11785121b09SKirk McKusick VI_LOCK(vp); 11885121b09SKirk McKusick if (vp->v_type != VCHR || 11985121b09SKirk McKusick (cdevp = vp->v_rdev) == NULL || 12085121b09SKirk McKusick cdevp->si_devsw == NULL || 12185121b09SKirk McKusick (cdevp->si_devsw->d_flags & D_DISK) == 0) 1221faacf5dSKirk McKusick mp = vp->v_mount; 12385121b09SKirk McKusick else 12485121b09SKirk McKusick mp = cdevp->si_mountpt; 1251faacf5dSKirk McKusick if (mp != NULL) { 12640ea77a0SAlexander Motin if (bp->b_iocmd == BIO_READ) { 127bd56aad3SRyan Libby if (BUF_DISOWNED(bp)) 1281faacf5dSKirk McKusick mp->mnt_stat.f_asyncreads++; 1291faacf5dSKirk McKusick else 1301faacf5dSKirk McKusick mp->mnt_stat.f_syncreads++; 13140ea77a0SAlexander Motin } else if (bp->b_iocmd == BIO_WRITE) { 132bd56aad3SRyan Libby if (BUF_DISOWNED(bp)) 13340ea77a0SAlexander Motin mp->mnt_stat.f_asyncwrites++; 13440ea77a0SAlexander Motin else 13540ea77a0SAlexander Motin mp->mnt_stat.f_syncwrites++; 1361faacf5dSKirk McKusick } 1371faacf5dSKirk McKusick } 13840ea77a0SAlexander Motin VI_UNLOCK(vp); 13940ea77a0SAlexander Motin } 1404d13ab3dSPoul-Henning Kamp 141ea5791d7SAlexander Motin cp = bip->bio_from; 142ea5791d7SAlexander Motin sc = cp->geom->softc; 143d79ff54bSChuck Silvers if (bip->bio_error != 0 && bip->bio_error != EOPNOTSUPP) { 144e8827f40SWarner Losh if ((bp->b_xflags & BX_CVTENXIO) != 0) { 145e8827f40SWarner Losh if (atomic_cmpset_int(&sc->sc_enxio_active, 0, 1)) 146e8827f40SWarner Losh printf("g_vfs_done(): %s converting all errors to ENXIO\n", 147e8827f40SWarner Losh bip->bio_to->name); 148e8827f40SWarner Losh } 149d79ff54bSChuck Silvers if (sc->sc_enxio_active) 150d79ff54bSChuck Silvers bip->bio_error = ENXIO; 151347a8e93SWarner Losh if (bip->bio_error != ENXIO || 152347a8e93SWarner Losh atomic_cmpset_int(&sc->sc_enxio_reported, 0, 1)) { 153347a8e93SWarner Losh g_print_bio("g_vfs_done():", bip, "error = %d%s", 154347a8e93SWarner Losh bip->bio_error, 155347a8e93SWarner Losh bip->bio_error != ENXIO ? "" : 156347a8e93SWarner Losh " supressing further ENXIO"); 157347a8e93SWarner Losh } 158d79ff54bSChuck Silvers } 1594d13ab3dSPoul-Henning Kamp bp->b_error = bip->bio_error; 1604d13ab3dSPoul-Henning Kamp bp->b_ioflags = bip->bio_flags; 1614d13ab3dSPoul-Henning Kamp if (bip->bio_error) 1624d13ab3dSPoul-Henning Kamp bp->b_ioflags |= BIO_ERROR; 1634d13ab3dSPoul-Henning Kamp bp->b_resid = bp->b_bcount - bip->bio_completed; 1644d13ab3dSPoul-Henning Kamp g_destroy_bio(bip); 165ea5791d7SAlexander Motin 166ea5791d7SAlexander Motin mtx_lock(&sc->sc_mtx); 167ea5791d7SAlexander Motin destroy = ((--sc->sc_active) == 0 && sc->sc_orphaned); 168419d406eSJohn Baldwin if (destroy) { 169419d406eSJohn Baldwin event = sc->sc_event; 170419d406eSJohn Baldwin sc->sc_event = NULL; 171419d406eSJohn Baldwin } else 172419d406eSJohn Baldwin event = NULL; 173ea5791d7SAlexander Motin mtx_unlock(&sc->sc_mtx); 174ea5791d7SAlexander Motin if (destroy) 175419d406eSJohn Baldwin g_post_event_ep(g_vfs_destroy, cp, event, NULL); 176ea5791d7SAlexander Motin 1774d13ab3dSPoul-Henning Kamp bufdone(bp); 1784d13ab3dSPoul-Henning Kamp } 1794d13ab3dSPoul-Henning Kamp 1804d13ab3dSPoul-Henning Kamp void 1814d13ab3dSPoul-Henning Kamp g_vfs_strategy(struct bufobj *bo, struct buf *bp) 1824d13ab3dSPoul-Henning Kamp { 183ea5791d7SAlexander Motin struct g_vfs_softc *sc; 1844d13ab3dSPoul-Henning Kamp struct g_consumer *cp; 1854d13ab3dSPoul-Henning Kamp struct bio *bip; 1864d13ab3dSPoul-Henning Kamp 1874d13ab3dSPoul-Henning Kamp cp = bo->bo_private; 188ea5791d7SAlexander Motin sc = cp->geom->softc; 1894d13ab3dSPoul-Henning Kamp 190ce8be7b8SEdward Tomasz Napierala /* 1916635c8edSEdward Tomasz Napierala * If the provider has orphaned us, just return ENXIO. 192ce8be7b8SEdward Tomasz Napierala */ 193ea5791d7SAlexander Motin mtx_lock(&sc->sc_mtx); 194d79ff54bSChuck Silvers if (sc->sc_orphaned || sc->sc_enxio_active) { 195ea5791d7SAlexander Motin mtx_unlock(&sc->sc_mtx); 196ce8be7b8SEdward Tomasz Napierala bp->b_error = ENXIO; 197ce8be7b8SEdward Tomasz Napierala bp->b_ioflags |= BIO_ERROR; 198ce8be7b8SEdward Tomasz Napierala bufdone(bp); 199ce8be7b8SEdward Tomasz Napierala return; 200ce8be7b8SEdward Tomasz Napierala } 201ea5791d7SAlexander Motin sc->sc_active++; 202ea5791d7SAlexander Motin mtx_unlock(&sc->sc_mtx); 203ce8be7b8SEdward Tomasz Napierala 2044d13ab3dSPoul-Henning Kamp bip = g_alloc_bio(); 2054d13ab3dSPoul-Henning Kamp bip->bio_cmd = bp->b_iocmd; 2064d13ab3dSPoul-Henning Kamp bip->bio_offset = bp->b_iooffset; 2074d13ab3dSPoul-Henning Kamp bip->bio_length = bp->b_bcount; 208ee75e7deSKonstantin Belousov bdata2bio(bp, bip); 209ee75e7deSKonstantin Belousov if ((bp->b_flags & B_BARRIER) != 0) { 2102bc1a1feSKirk McKusick bip->bio_flags |= BIO_ORDERED; 2112bc1a1feSKirk McKusick bp->b_flags &= ~B_BARRIER; 2122bc1a1feSKirk McKusick } 2133cf5dd84SWarner Losh if (bp->b_iocmd == BIO_SPEEDUP) 2143cf5dd84SWarner Losh bip->bio_flags |= bp->b_ioflags; 215ee75e7deSKonstantin Belousov bip->bio_done = g_vfs_done; 216ee75e7deSKonstantin Belousov bip->bio_caller2 = bp; 2178532d381SConrad Meyer #if defined(BUF_TRACKING) || defined(FULL_BUF_TRACKING) 2188532d381SConrad Meyer buf_track(bp, __func__); 2198532d381SConrad Meyer bip->bio_track_bp = bp; 2208532d381SConrad Meyer #endif 2214d13ab3dSPoul-Henning Kamp g_io_request(bip, cp); 2224d13ab3dSPoul-Henning Kamp } 2234d13ab3dSPoul-Henning Kamp 22407e95ed6SPoul-Henning Kamp static void 2254d13ab3dSPoul-Henning Kamp g_vfs_orphan(struct g_consumer *cp) 2264d13ab3dSPoul-Henning Kamp { 227ce8be7b8SEdward Tomasz Napierala struct g_geom *gp; 228419d406eSJohn Baldwin struct g_event *event; 229ea5791d7SAlexander Motin struct g_vfs_softc *sc; 230ea5791d7SAlexander Motin int destroy; 231ce8be7b8SEdward Tomasz Napierala 232ce8be7b8SEdward Tomasz Napierala g_topology_assert(); 233ce8be7b8SEdward Tomasz Napierala 234ce8be7b8SEdward Tomasz Napierala gp = cp->geom; 235ce8be7b8SEdward Tomasz Napierala g_trace(G_T_TOPOLOGY, "g_vfs_orphan(%p(%s))", cp, gp->name); 236a2fa37feSAlexander Motin sc = gp->softc; 237a2fa37feSAlexander Motin if (sc == NULL) 238a2fa37feSAlexander Motin return; 239419d406eSJohn Baldwin event = g_alloc_event(M_WAITOK); 240ea5791d7SAlexander Motin mtx_lock(&sc->sc_mtx); 241419d406eSJohn Baldwin KASSERT(sc->sc_event == NULL, ("g_vfs %p already has an event", sc)); 242f58385f3SWarner Losh sc->sc_orphaned = true; 243e521fb05SAlexander Motin destroy = (sc->sc_active == 0); 244419d406eSJohn Baldwin if (!destroy) { 245419d406eSJohn Baldwin sc->sc_event = event; 246419d406eSJohn Baldwin event = NULL; 247419d406eSJohn Baldwin } 248ea5791d7SAlexander Motin mtx_unlock(&sc->sc_mtx); 249419d406eSJohn Baldwin if (destroy) { 250419d406eSJohn Baldwin g_free(event); 251ea5791d7SAlexander Motin g_vfs_destroy(cp, 0); 252419d406eSJohn Baldwin } 2534d13ab3dSPoul-Henning Kamp 2544d13ab3dSPoul-Henning Kamp /* 25538153e80SEdward Tomasz Napierala * Do not destroy the geom. Filesystem will do that during unmount. 2564d13ab3dSPoul-Henning Kamp */ 2574d13ab3dSPoul-Henning Kamp } 2584d13ab3dSPoul-Henning Kamp 2594d13ab3dSPoul-Henning Kamp int 2604d13ab3dSPoul-Henning Kamp g_vfs_open(struct vnode *vp, struct g_consumer **cpp, const char *fsname, int wr) 2614d13ab3dSPoul-Henning Kamp { 2624d13ab3dSPoul-Henning Kamp struct g_geom *gp; 2634d13ab3dSPoul-Henning Kamp struct g_provider *pp; 2644d13ab3dSPoul-Henning Kamp struct g_consumer *cp; 265ea5791d7SAlexander Motin struct g_vfs_softc *sc; 2664d13ab3dSPoul-Henning Kamp struct bufobj *bo; 2674d13ab3dSPoul-Henning Kamp int error; 2684d13ab3dSPoul-Henning Kamp 2694d13ab3dSPoul-Henning Kamp g_topology_assert(); 2704d13ab3dSPoul-Henning Kamp 2714d13ab3dSPoul-Henning Kamp *cpp = NULL; 2728f128ff5SAndriy Gapon bo = &vp->v_bufobj; 2738f128ff5SAndriy Gapon if (bo->bo_private != vp) 2748f128ff5SAndriy Gapon return (EBUSY); 2758f128ff5SAndriy Gapon 2764d13ab3dSPoul-Henning Kamp pp = g_dev_getprovider(vp->v_rdev); 2774d13ab3dSPoul-Henning Kamp if (pp == NULL) 2784d13ab3dSPoul-Henning Kamp return (ENOENT); 2794d13ab3dSPoul-Henning Kamp gp = g_new_geomf(&g_vfs_class, "%s.%s", fsname, pp->name); 280ea5791d7SAlexander Motin sc = g_malloc(sizeof(*sc), M_WAITOK | M_ZERO); 281ea5791d7SAlexander Motin mtx_init(&sc->sc_mtx, "g_vfs", NULL, MTX_DEF); 282ea5791d7SAlexander Motin sc->sc_bo = bo; 283ea5791d7SAlexander Motin gp->softc = sc; 2844d13ab3dSPoul-Henning Kamp cp = g_new_consumer(gp); 285d22ff249SEdward Tomasz Napierala error = g_attach(cp, pp); 286d22ff249SEdward Tomasz Napierala if (error) { 287d22ff249SEdward Tomasz Napierala g_wither_geom(gp, ENXIO); 288d22ff249SEdward Tomasz Napierala return (error); 289d22ff249SEdward Tomasz Napierala } 2908795189cSKirk McKusick error = g_access(cp, 1, wr, wr); 2914d13ab3dSPoul-Henning Kamp if (error) { 2924d13ab3dSPoul-Henning Kamp g_wither_geom(gp, ENXIO); 2934d13ab3dSPoul-Henning Kamp return (error); 2944d13ab3dSPoul-Henning Kamp } 295*56a8aca8SPawel Jakub Dawidek /* 296*56a8aca8SPawel Jakub Dawidek * Mediasize might not be set until first access (see g_disk_access()), 297*56a8aca8SPawel Jakub Dawidek * That's why we check it here and not earlier. 298*56a8aca8SPawel Jakub Dawidek */ 299*56a8aca8SPawel Jakub Dawidek if (pp->mediasize == 0) { 300*56a8aca8SPawel Jakub Dawidek (void)g_access(cp, -1, -wr, -wr); 301*56a8aca8SPawel Jakub Dawidek g_wither_geom(gp, ENXIO); 302*56a8aca8SPawel Jakub Dawidek return (ENXIO); 303*56a8aca8SPawel Jakub Dawidek } 304*56a8aca8SPawel Jakub Dawidek vnode_create_disk_vobject(vp, pp->mediasize, curthread); 3054d13ab3dSPoul-Henning Kamp *cpp = cp; 3068f128ff5SAndriy Gapon cp->private = vp; 30740ea77a0SAlexander Motin cp->flags |= G_CF_DIRECT_SEND | G_CF_DIRECT_RECEIVE; 3084d13ab3dSPoul-Henning Kamp bo->bo_ops = g_vfs_bufops; 3094d13ab3dSPoul-Henning Kamp bo->bo_private = cp; 3101b4bc5f8SAndriy Gapon bo->bo_bsize = pp->sectorsize; 3114d13ab3dSPoul-Henning Kamp 3124d13ab3dSPoul-Henning Kamp return (error); 3134d13ab3dSPoul-Henning Kamp } 31484a69752SPoul-Henning Kamp 31584a69752SPoul-Henning Kamp void 3160d7935fdSAttilio Rao g_vfs_close(struct g_consumer *cp) 31784a69752SPoul-Henning Kamp { 31884a69752SPoul-Henning Kamp struct g_geom *gp; 319ea5791d7SAlexander Motin struct g_vfs_softc *sc; 32084a69752SPoul-Henning Kamp 32184a69752SPoul-Henning Kamp g_topology_assert(); 32284a69752SPoul-Henning Kamp 32384a69752SPoul-Henning Kamp gp = cp->geom; 324ea5791d7SAlexander Motin sc = gp->softc; 325ea5791d7SAlexander Motin bufobj_invalbuf(sc->sc_bo, V_SAVE, 0, 0); 326ea5791d7SAlexander Motin sc->sc_bo->bo_private = cp->private; 327ea5791d7SAlexander Motin gp->softc = NULL; 328ea5791d7SAlexander Motin mtx_destroy(&sc->sc_mtx); 329ea5791d7SAlexander Motin if (!sc->sc_orphaned || cp->provider == NULL) 33084a69752SPoul-Henning Kamp g_wither_geom_close(gp, ENXIO); 331419d406eSJohn Baldwin KASSERT(sc->sc_event == NULL, ("g_vfs %p event is non-NULL", sc)); 332ea5791d7SAlexander Motin g_free(sc); 33384a69752SPoul-Henning Kamp } 334