/*-
 * Copyright (c) 2002 Poul-Henning Kamp
 * Copyright (c) 2002 Networks Associates Technology, Inc.
 * All rights reserved.
 *
 * This software was developed for the FreeBSD Project by Poul-Henning Kamp
 * and NAI Labs, the Security Research Division of Network Associates, Inc.
 * under DARPA/SPAWAR contract N66001-01-C-8035 ("CBOSS"), as part of the
 * DARPA CHATS research program.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. The names of the authors may not be used to endorse or promote
 *    products derived from this software without specific prior written
 *    permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */

#include <sys/cdefs.h>
O'Brien __FBSDID("$FreeBSD$"); 38dd84a43cSPoul-Henning Kamp 39dd84a43cSPoul-Henning Kamp #include <sys/param.h> 40dd84a43cSPoul-Henning Kamp #include <sys/systm.h> 41dd84a43cSPoul-Henning Kamp #include <sys/kernel.h> 42dd84a43cSPoul-Henning Kamp #include <sys/malloc.h> 43dd84a43cSPoul-Henning Kamp #include <sys/bio.h> 4449dbb61dSRobert Watson #include <sys/ktr.h> 45dd84a43cSPoul-Henning Kamp 46dd84a43cSPoul-Henning Kamp #include <sys/errno.h> 47dd84a43cSPoul-Henning Kamp #include <geom/geom.h> 48b1876192SPoul-Henning Kamp #include <geom/geom_int.h> 49e24cbd90SPoul-Henning Kamp #include <sys/devicestat.h> 50dd84a43cSPoul-Henning Kamp 515ffb2c8bSPoul-Henning Kamp #include <vm/uma.h> 525ffb2c8bSPoul-Henning Kamp 53dd84a43cSPoul-Henning Kamp static struct g_bioq g_bio_run_down; 54dd84a43cSPoul-Henning Kamp static struct g_bioq g_bio_run_up; 555fcf4e43SPoul-Henning Kamp static struct g_bioq g_bio_run_task; 56dd84a43cSPoul-Henning Kamp 573432e4fdSPoul-Henning Kamp static u_int pace; 585ffb2c8bSPoul-Henning Kamp static uma_zone_t biozone; 593432e4fdSPoul-Henning Kamp 60dd84a43cSPoul-Henning Kamp #include <machine/atomic.h> 61dd84a43cSPoul-Henning Kamp 62dd84a43cSPoul-Henning Kamp static void 63dd84a43cSPoul-Henning Kamp g_bioq_lock(struct g_bioq *bq) 64dd84a43cSPoul-Henning Kamp { 65dd84a43cSPoul-Henning Kamp 66dd84a43cSPoul-Henning Kamp mtx_lock(&bq->bio_queue_lock); 67dd84a43cSPoul-Henning Kamp } 68dd84a43cSPoul-Henning Kamp 69dd84a43cSPoul-Henning Kamp static void 70dd84a43cSPoul-Henning Kamp g_bioq_unlock(struct g_bioq *bq) 71dd84a43cSPoul-Henning Kamp { 72dd84a43cSPoul-Henning Kamp 73dd84a43cSPoul-Henning Kamp mtx_unlock(&bq->bio_queue_lock); 74dd84a43cSPoul-Henning Kamp } 75dd84a43cSPoul-Henning Kamp 76dd84a43cSPoul-Henning Kamp #if 0 77dd84a43cSPoul-Henning Kamp static void 78dd84a43cSPoul-Henning Kamp g_bioq_destroy(struct g_bioq *bq) 79dd84a43cSPoul-Henning Kamp { 80dd84a43cSPoul-Henning Kamp 81dd84a43cSPoul-Henning Kamp mtx_destroy(&bq->bio_queue_lock); 
82dd84a43cSPoul-Henning Kamp } 83dd84a43cSPoul-Henning Kamp #endif 84dd84a43cSPoul-Henning Kamp 85dd84a43cSPoul-Henning Kamp static void 86dd84a43cSPoul-Henning Kamp g_bioq_init(struct g_bioq *bq) 87dd84a43cSPoul-Henning Kamp { 88dd84a43cSPoul-Henning Kamp 89dd84a43cSPoul-Henning Kamp TAILQ_INIT(&bq->bio_queue); 906008862bSJohn Baldwin mtx_init(&bq->bio_queue_lock, "bio queue", NULL, MTX_DEF); 91dd84a43cSPoul-Henning Kamp } 92dd84a43cSPoul-Henning Kamp 93dd84a43cSPoul-Henning Kamp static struct bio * 94dd84a43cSPoul-Henning Kamp g_bioq_first(struct g_bioq *bq) 95dd84a43cSPoul-Henning Kamp { 96dd84a43cSPoul-Henning Kamp struct bio *bp; 97dd84a43cSPoul-Henning Kamp 98dd84a43cSPoul-Henning Kamp bp = TAILQ_FIRST(&bq->bio_queue); 99dd84a43cSPoul-Henning Kamp if (bp != NULL) { 100dcbd0fe5SPoul-Henning Kamp KASSERT((bp->bio_flags & BIO_ONQUEUE), 101dcbd0fe5SPoul-Henning Kamp ("Bio not on queue bp=%p target %p", bp, bq)); 102dcbd0fe5SPoul-Henning Kamp bp->bio_flags &= ~BIO_ONQUEUE; 103dd84a43cSPoul-Henning Kamp TAILQ_REMOVE(&bq->bio_queue, bp, bio_queue); 104dd84a43cSPoul-Henning Kamp bq->bio_queue_length--; 105dd84a43cSPoul-Henning Kamp } 106dd84a43cSPoul-Henning Kamp return (bp); 107dd84a43cSPoul-Henning Kamp } 108dd84a43cSPoul-Henning Kamp 109dd84a43cSPoul-Henning Kamp struct bio * 110dd84a43cSPoul-Henning Kamp g_new_bio(void) 111dd84a43cSPoul-Henning Kamp { 112dd84a43cSPoul-Henning Kamp struct bio *bp; 113dd84a43cSPoul-Henning Kamp 1145ffb2c8bSPoul-Henning Kamp bp = uma_zalloc(biozone, M_NOWAIT | M_ZERO); 115dd84a43cSPoul-Henning Kamp return (bp); 116dd84a43cSPoul-Henning Kamp } 117dd84a43cSPoul-Henning Kamp 118a2033c96SPoul-Henning Kamp struct bio * 119a2033c96SPoul-Henning Kamp g_alloc_bio(void) 120a2033c96SPoul-Henning Kamp { 121a2033c96SPoul-Henning Kamp struct bio *bp; 122a2033c96SPoul-Henning Kamp 123a2033c96SPoul-Henning Kamp bp = uma_zalloc(biozone, M_WAITOK | M_ZERO); 124a2033c96SPoul-Henning Kamp return (bp); 125a2033c96SPoul-Henning Kamp } 
126a2033c96SPoul-Henning Kamp 127dd84a43cSPoul-Henning Kamp void 128dd84a43cSPoul-Henning Kamp g_destroy_bio(struct bio *bp) 129dd84a43cSPoul-Henning Kamp { 130dd84a43cSPoul-Henning Kamp 1315ffb2c8bSPoul-Henning Kamp uma_zfree(biozone, bp); 132dd84a43cSPoul-Henning Kamp } 133dd84a43cSPoul-Henning Kamp 134dd84a43cSPoul-Henning Kamp struct bio * 135dd84a43cSPoul-Henning Kamp g_clone_bio(struct bio *bp) 136dd84a43cSPoul-Henning Kamp { 137dd84a43cSPoul-Henning Kamp struct bio *bp2; 138dd84a43cSPoul-Henning Kamp 1395ffb2c8bSPoul-Henning Kamp bp2 = uma_zalloc(biozone, M_NOWAIT | M_ZERO); 140a1bd3ee2SPoul-Henning Kamp if (bp2 != NULL) { 141936cc461SPoul-Henning Kamp bp2->bio_parent = bp; 142dd84a43cSPoul-Henning Kamp bp2->bio_cmd = bp->bio_cmd; 143dd84a43cSPoul-Henning Kamp bp2->bio_length = bp->bio_length; 144dd84a43cSPoul-Henning Kamp bp2->bio_offset = bp->bio_offset; 145dd84a43cSPoul-Henning Kamp bp2->bio_data = bp->bio_data; 146dd84a43cSPoul-Henning Kamp bp2->bio_attribute = bp->bio_attribute; 147801bb689SPoul-Henning Kamp bp->bio_children++; 148a1bd3ee2SPoul-Henning Kamp } 149dd84a43cSPoul-Henning Kamp return(bp2); 150dd84a43cSPoul-Henning Kamp } 151dd84a43cSPoul-Henning Kamp 152dd84a43cSPoul-Henning Kamp void 153dd84a43cSPoul-Henning Kamp g_io_init() 154dd84a43cSPoul-Henning Kamp { 155dd84a43cSPoul-Henning Kamp 156dd84a43cSPoul-Henning Kamp g_bioq_init(&g_bio_run_down); 157dd84a43cSPoul-Henning Kamp g_bioq_init(&g_bio_run_up); 1585fcf4e43SPoul-Henning Kamp g_bioq_init(&g_bio_run_task); 1595ffb2c8bSPoul-Henning Kamp biozone = uma_zcreate("g_bio", sizeof (struct bio), 1605ffb2c8bSPoul-Henning Kamp NULL, NULL, 1615ffb2c8bSPoul-Henning Kamp NULL, NULL, 1625ffb2c8bSPoul-Henning Kamp 0, 0); 163dd84a43cSPoul-Henning Kamp } 164dd84a43cSPoul-Henning Kamp 165dd84a43cSPoul-Henning Kamp int 1660d3f37a8SPoul-Henning Kamp g_io_getattr(const char *attr, struct g_consumer *cp, int *len, void *ptr) 167dd84a43cSPoul-Henning Kamp { 168dd84a43cSPoul-Henning Kamp struct bio *bp; 
169dd84a43cSPoul-Henning Kamp int error; 170dd84a43cSPoul-Henning Kamp 171dd84a43cSPoul-Henning Kamp g_trace(G_T_BIO, "bio_getattr(%s)", attr); 172a2033c96SPoul-Henning Kamp bp = g_alloc_bio(); 173dd84a43cSPoul-Henning Kamp bp->bio_cmd = BIO_GETATTR; 174dd84a43cSPoul-Henning Kamp bp->bio_done = NULL; 175dd84a43cSPoul-Henning Kamp bp->bio_attribute = attr; 176dd84a43cSPoul-Henning Kamp bp->bio_length = *len; 177dd84a43cSPoul-Henning Kamp bp->bio_data = ptr; 178dd84a43cSPoul-Henning Kamp g_io_request(bp, cp); 17953706245SPoul-Henning Kamp error = biowait(bp, "ggetattr"); 180dd84a43cSPoul-Henning Kamp *len = bp->bio_completed; 181dd84a43cSPoul-Henning Kamp g_destroy_bio(bp); 182dd84a43cSPoul-Henning Kamp return (error); 183dd84a43cSPoul-Henning Kamp } 184dd84a43cSPoul-Henning Kamp 185e39d70d4SPoul-Henning Kamp static int 186e39d70d4SPoul-Henning Kamp g_io_check(struct bio *bp) 187e39d70d4SPoul-Henning Kamp { 188e39d70d4SPoul-Henning Kamp struct g_consumer *cp; 189e39d70d4SPoul-Henning Kamp struct g_provider *pp; 190e39d70d4SPoul-Henning Kamp 191e39d70d4SPoul-Henning Kamp cp = bp->bio_from; 192e39d70d4SPoul-Henning Kamp pp = bp->bio_to; 193e39d70d4SPoul-Henning Kamp 194e39d70d4SPoul-Henning Kamp /* Fail if access counters dont allow the operation */ 195e39d70d4SPoul-Henning Kamp switch(bp->bio_cmd) { 196e39d70d4SPoul-Henning Kamp case BIO_READ: 197e39d70d4SPoul-Henning Kamp case BIO_GETATTR: 198e39d70d4SPoul-Henning Kamp if (cp->acr == 0) 199e39d70d4SPoul-Henning Kamp return (EPERM); 200e39d70d4SPoul-Henning Kamp break; 201e39d70d4SPoul-Henning Kamp case BIO_WRITE: 202e39d70d4SPoul-Henning Kamp case BIO_DELETE: 203e39d70d4SPoul-Henning Kamp if (cp->acw == 0) 204e39d70d4SPoul-Henning Kamp return (EPERM); 205e39d70d4SPoul-Henning Kamp break; 206e39d70d4SPoul-Henning Kamp default: 207e39d70d4SPoul-Henning Kamp return (EPERM); 208e39d70d4SPoul-Henning Kamp } 209e39d70d4SPoul-Henning Kamp /* if provider is marked for error, don't disturb. 
*/ 210e39d70d4SPoul-Henning Kamp if (pp->error) 211e39d70d4SPoul-Henning Kamp return (pp->error); 212e39d70d4SPoul-Henning Kamp 213e39d70d4SPoul-Henning Kamp switch(bp->bio_cmd) { 214e39d70d4SPoul-Henning Kamp case BIO_READ: 215e39d70d4SPoul-Henning Kamp case BIO_WRITE: 216e39d70d4SPoul-Henning Kamp case BIO_DELETE: 21743bff1a7SPoul-Henning Kamp /* Zero sectorsize is a probably lack of media */ 21843bff1a7SPoul-Henning Kamp if (pp->sectorsize == 0) 21943bff1a7SPoul-Henning Kamp return (ENXIO); 220e39d70d4SPoul-Henning Kamp /* Reject I/O not on sector boundary */ 221e39d70d4SPoul-Henning Kamp if (bp->bio_offset % pp->sectorsize) 222e39d70d4SPoul-Henning Kamp return (EINVAL); 223e39d70d4SPoul-Henning Kamp /* Reject I/O not integral sector long */ 224e39d70d4SPoul-Henning Kamp if (bp->bio_length % pp->sectorsize) 225e39d70d4SPoul-Henning Kamp return (EINVAL); 226d1b8bf47SPoul-Henning Kamp /* Reject requests before or past the end of media. */ 227d1b8bf47SPoul-Henning Kamp if (bp->bio_offset < 0) 228d1b8bf47SPoul-Henning Kamp return (EIO); 229e39d70d4SPoul-Henning Kamp if (bp->bio_offset > pp->mediasize) 230e39d70d4SPoul-Henning Kamp return (EIO); 231e39d70d4SPoul-Henning Kamp break; 232e39d70d4SPoul-Henning Kamp default: 233e39d70d4SPoul-Henning Kamp break; 234e39d70d4SPoul-Henning Kamp } 235e39d70d4SPoul-Henning Kamp return (0); 236e39d70d4SPoul-Henning Kamp } 237e39d70d4SPoul-Henning Kamp 238dd84a43cSPoul-Henning Kamp void 239dd84a43cSPoul-Henning Kamp g_io_request(struct bio *bp, struct g_consumer *cp) 240dd84a43cSPoul-Henning Kamp { 241801bb689SPoul-Henning Kamp struct g_provider *pp; 242dd84a43cSPoul-Henning Kamp 243d0e17c1bSPoul-Henning Kamp KASSERT(cp != NULL, ("NULL cp in g_io_request")); 244d0e17c1bSPoul-Henning Kamp KASSERT(bp != NULL, ("NULL bp in g_io_request")); 245d0e17c1bSPoul-Henning Kamp KASSERT(bp->bio_data != NULL, ("NULL bp->data in g_io_request")); 246e060b6bdSPoul-Henning Kamp pp = cp->provider; 247801bb689SPoul-Henning Kamp KASSERT(pp != NULL, 
("consumer not attached in g_io_request")); 248801bb689SPoul-Henning Kamp 249dcbd0fe5SPoul-Henning Kamp if (bp->bio_cmd & (BIO_READ|BIO_WRITE|BIO_DELETE)) { 250dcbd0fe5SPoul-Henning Kamp KASSERT(bp->bio_offset % cp->provider->sectorsize == 0, 251dcbd0fe5SPoul-Henning Kamp ("wrong offset %jd for sectorsize %u", 252dcbd0fe5SPoul-Henning Kamp bp->bio_offset, cp->provider->sectorsize)); 253dcbd0fe5SPoul-Henning Kamp KASSERT(bp->bio_length % cp->provider->sectorsize == 0, 254dcbd0fe5SPoul-Henning Kamp ("wrong length %jd for sectorsize %u", 255dcbd0fe5SPoul-Henning Kamp bp->bio_length, cp->provider->sectorsize)); 256dcbd0fe5SPoul-Henning Kamp } 257dcbd0fe5SPoul-Henning Kamp 258f7717523SStephan Uphoff g_trace(G_T_BIO, "bio_request(%p) from %p(%s) to %p(%s) cmd %d", 259f7717523SStephan Uphoff bp, cp, cp->geom->name, pp, pp->name, bp->bio_cmd); 260f7717523SStephan Uphoff 261dd84a43cSPoul-Henning Kamp bp->bio_from = cp; 262801bb689SPoul-Henning Kamp bp->bio_to = pp; 2632fccec19SPoul-Henning Kamp bp->bio_error = 0; 2642fccec19SPoul-Henning Kamp bp->bio_completed = 0; 265dd84a43cSPoul-Henning Kamp 26619fa21aaSPoul-Henning Kamp KASSERT(!(bp->bio_flags & BIO_ONQUEUE), 26719fa21aaSPoul-Henning Kamp ("Bio already on queue bp=%p", bp)); 26819fa21aaSPoul-Henning Kamp bp->bio_flags |= BIO_ONQUEUE; 26919fa21aaSPoul-Henning Kamp 27019fa21aaSPoul-Henning Kamp binuptime(&bp->bio_t0); 2718827c821SPoul-Henning Kamp 2728827c821SPoul-Henning Kamp /* 2738827c821SPoul-Henning Kamp * The statistics collection is lockless, as such, but we 2748827c821SPoul-Henning Kamp * can not update one instance of the statistics from more 2758827c821SPoul-Henning Kamp * than one thread at a time, so grab the lock first. 
2768827c821SPoul-Henning Kamp */ 27719fa21aaSPoul-Henning Kamp g_bioq_lock(&g_bio_run_down); 278cf457284SPoul-Henning Kamp if (g_collectstats & 1) 27919fa21aaSPoul-Henning Kamp devstat_start_transaction(pp->stat, &bp->bio_t0); 280cf457284SPoul-Henning Kamp if (g_collectstats & 2) 28119fa21aaSPoul-Henning Kamp devstat_start_transaction(cp->stat, &bp->bio_t0); 28219fa21aaSPoul-Henning Kamp 28319fa21aaSPoul-Henning Kamp pp->nstart++; 284cf457284SPoul-Henning Kamp cp->nstart++; 28519fa21aaSPoul-Henning Kamp TAILQ_INSERT_TAIL(&g_bio_run_down.bio_queue, bp, bio_queue); 28619fa21aaSPoul-Henning Kamp g_bio_run_down.bio_queue_length++; 28719fa21aaSPoul-Henning Kamp g_bioq_unlock(&g_bio_run_down); 288e39d70d4SPoul-Henning Kamp 2892fccec19SPoul-Henning Kamp /* Pass it on down. */ 290dd84a43cSPoul-Henning Kamp wakeup(&g_wait_down); 291dd84a43cSPoul-Henning Kamp } 292dd84a43cSPoul-Henning Kamp 293dd84a43cSPoul-Henning Kamp void 29472840432SPoul-Henning Kamp g_io_deliver(struct bio *bp, int error) 295dd84a43cSPoul-Henning Kamp { 296801bb689SPoul-Henning Kamp struct g_consumer *cp; 297801bb689SPoul-Henning Kamp struct g_provider *pp; 298dd84a43cSPoul-Henning Kamp 299e060b6bdSPoul-Henning Kamp KASSERT(bp != NULL, ("NULL bp in g_io_deliver")); 300801bb689SPoul-Henning Kamp pp = bp->bio_to; 301f7eeab17SPoul-Henning Kamp KASSERT(pp != NULL, ("NULL bio_to in g_io_deliver")); 302f7eeab17SPoul-Henning Kamp cp = bp->bio_from; 303f7eeab17SPoul-Henning Kamp if (cp == NULL) { 304f7eeab17SPoul-Henning Kamp bp->bio_error = error; 305f7eeab17SPoul-Henning Kamp bp->bio_done(bp); 306f7eeab17SPoul-Henning Kamp return; 307f7eeab17SPoul-Henning Kamp } 308801bb689SPoul-Henning Kamp KASSERT(cp != NULL, ("NULL bio_from in g_io_deliver")); 309801bb689SPoul-Henning Kamp KASSERT(cp->geom != NULL, ("NULL bio_from->geom in g_io_deliver")); 31046aeebecSPawel Jakub Dawidek KASSERT(bp->bio_completed >= 0, ("bio_completed can't be less than 0")); 31146aeebecSPawel Jakub Dawidek KASSERT(bp->bio_completed <= 
bp->bio_length, 31246aeebecSPawel Jakub Dawidek ("bio_completed can't be greater than bio_length")); 3135ab413bfSPoul-Henning Kamp 314dd84a43cSPoul-Henning Kamp g_trace(G_T_BIO, 3150355b86eSPoul-Henning Kamp "g_io_deliver(%p) from %p(%s) to %p(%s) cmd %d error %d off %jd len %jd", 316801bb689SPoul-Henning Kamp bp, cp, cp->geom->name, pp, pp->name, bp->bio_cmd, error, 3170355b86eSPoul-Henning Kamp (intmax_t)bp->bio_offset, (intmax_t)bp->bio_length); 318801bb689SPoul-Henning Kamp 31919fa21aaSPoul-Henning Kamp KASSERT(!(bp->bio_flags & BIO_ONQUEUE), 32019fa21aaSPoul-Henning Kamp ("Bio already on queue bp=%p", bp)); 32119fa21aaSPoul-Henning Kamp 322dcbd0fe5SPoul-Henning Kamp /* 323dcbd0fe5SPoul-Henning Kamp * XXX: next two doesn't belong here 324dcbd0fe5SPoul-Henning Kamp */ 325e24cbd90SPoul-Henning Kamp bp->bio_bcount = bp->bio_length; 326e24cbd90SPoul-Henning Kamp bp->bio_resid = bp->bio_bcount - bp->bio_completed; 32719fa21aaSPoul-Henning Kamp 3288827c821SPoul-Henning Kamp /* 3298827c821SPoul-Henning Kamp * The statistics collection is lockless, as such, but we 3308827c821SPoul-Henning Kamp * can not update one instance of the statistics from more 3318827c821SPoul-Henning Kamp * than one thread at a time, so grab the lock first. 
3328827c821SPoul-Henning Kamp */ 33319fa21aaSPoul-Henning Kamp g_bioq_lock(&g_bio_run_up); 334cf457284SPoul-Henning Kamp if (g_collectstats & 1) 335e24cbd90SPoul-Henning Kamp devstat_end_transaction_bio(pp->stat, bp); 336cf457284SPoul-Henning Kamp if (g_collectstats & 2) 337cf457284SPoul-Henning Kamp devstat_end_transaction_bio(cp->stat, bp); 3388827c821SPoul-Henning Kamp 339c6ae9b5fSPoul-Henning Kamp cp->nend++; 340c6ae9b5fSPoul-Henning Kamp pp->nend++; 34119fa21aaSPoul-Henning Kamp if (error != ENOMEM) { 34219fa21aaSPoul-Henning Kamp bp->bio_error = error; 34319fa21aaSPoul-Henning Kamp TAILQ_INSERT_TAIL(&g_bio_run_up.bio_queue, bp, bio_queue); 344276f72c5SPoul-Henning Kamp bp->bio_flags |= BIO_ONQUEUE; 34519fa21aaSPoul-Henning Kamp g_bio_run_up.bio_queue_length++; 34619fa21aaSPoul-Henning Kamp g_bioq_unlock(&g_bio_run_up); 34719fa21aaSPoul-Henning Kamp wakeup(&g_wait_up); 34819fa21aaSPoul-Henning Kamp return; 34919fa21aaSPoul-Henning Kamp } 35019fa21aaSPoul-Henning Kamp g_bioq_unlock(&g_bio_run_up); 351dd84a43cSPoul-Henning Kamp 3522cc9686eSPoul-Henning Kamp if (bootverbose) 353801bb689SPoul-Henning Kamp printf("ENOMEM %p on %p(%s)\n", bp, pp, pp->name); 3541b949c05SPawel Jakub Dawidek bp->bio_children = 0; 3551b949c05SPawel Jakub Dawidek bp->bio_inbed = 0; 356801bb689SPoul-Henning Kamp g_io_request(bp, cp); 3573432e4fdSPoul-Henning Kamp pace++; 3583432e4fdSPoul-Henning Kamp return; 3593432e4fdSPoul-Henning Kamp } 360dd84a43cSPoul-Henning Kamp 361dd84a43cSPoul-Henning Kamp void 362dd84a43cSPoul-Henning Kamp g_io_schedule_down(struct thread *tp __unused) 363dd84a43cSPoul-Henning Kamp { 364dd84a43cSPoul-Henning Kamp struct bio *bp; 365e39d70d4SPoul-Henning Kamp off_t excess; 366e39d70d4SPoul-Henning Kamp int error; 3675706472cSRobert Watson #ifdef WITNESS 368f0e185d7SPoul-Henning Kamp struct mtx mymutex; 369f0e185d7SPoul-Henning Kamp 370f0e185d7SPoul-Henning Kamp bzero(&mymutex, sizeof mymutex); 3712cf0d8a6SDon Lewis mtx_init(&mymutex, "g_xdown", NULL, MTX_DEF); 
3725706472cSRobert Watson #endif 373dd84a43cSPoul-Henning Kamp 374dd84a43cSPoul-Henning Kamp for(;;) { 375f0e185d7SPoul-Henning Kamp g_bioq_lock(&g_bio_run_down); 376dd84a43cSPoul-Henning Kamp bp = g_bioq_first(&g_bio_run_down); 377f0e185d7SPoul-Henning Kamp if (bp == NULL) { 37849dbb61dSRobert Watson CTR0(KTR_GEOM, "g_down going to sleep"); 379f0e185d7SPoul-Henning Kamp msleep(&g_wait_down, &g_bio_run_down.bio_queue_lock, 38044be139bSPoul-Henning Kamp PRIBIO | PDROP, "-", hz/10); 381f0e185d7SPoul-Henning Kamp continue; 382f0e185d7SPoul-Henning Kamp } 38349dbb61dSRobert Watson CTR0(KTR_GEOM, "g_down has work to do"); 384f0e185d7SPoul-Henning Kamp g_bioq_unlock(&g_bio_run_down); 385376ceb79SPoul-Henning Kamp if (pace > 0) { 38649dbb61dSRobert Watson CTR1(KTR_GEOM, "g_down pacing self (pace %d)", pace); 387376ceb79SPoul-Henning Kamp msleep(&error, NULL, PRIBIO, "g_down", hz/10); 388376ceb79SPoul-Henning Kamp pace--; 389376ceb79SPoul-Henning Kamp } 390e39d70d4SPoul-Henning Kamp error = g_io_check(bp); 391e39d70d4SPoul-Henning Kamp if (error) { 39249dbb61dSRobert Watson CTR3(KTR_GEOM, "g_down g_io_check on bp %p provider " 39349dbb61dSRobert Watson "%s returned %d", bp, bp->bio_to->name, error); 394e39d70d4SPoul-Henning Kamp g_io_deliver(bp, error); 395e39d70d4SPoul-Henning Kamp continue; 396e39d70d4SPoul-Henning Kamp } 39749dbb61dSRobert Watson CTR2(KTR_GEOM, "g_down processing bp %p provider %s", bp, 39849dbb61dSRobert Watson bp->bio_to->name); 399392d56b4SPoul-Henning Kamp switch (bp->bio_cmd) { 400392d56b4SPoul-Henning Kamp case BIO_READ: 401392d56b4SPoul-Henning Kamp case BIO_WRITE: 402392d56b4SPoul-Henning Kamp case BIO_DELETE: 403e39d70d4SPoul-Henning Kamp /* Truncate requests to the end of providers media. */ 40449dbb61dSRobert Watson /* 40549dbb61dSRobert Watson * XXX: What if we truncate because of offset being 40649dbb61dSRobert Watson * bad, not length? 
40749dbb61dSRobert Watson */ 408e39d70d4SPoul-Henning Kamp excess = bp->bio_offset + bp->bio_length; 409e39d70d4SPoul-Henning Kamp if (excess > bp->bio_to->mediasize) { 410e39d70d4SPoul-Henning Kamp excess -= bp->bio_to->mediasize; 411e39d70d4SPoul-Henning Kamp bp->bio_length -= excess; 41249dbb61dSRobert Watson if (excess > 0) 41349dbb61dSRobert Watson CTR3(KTR_GEOM, "g_down truncated bio " 41449dbb61dSRobert Watson "%p provider %s by %d", bp, 41549dbb61dSRobert Watson bp->bio_to->name, excess); 416e39d70d4SPoul-Henning Kamp } 417e39d70d4SPoul-Henning Kamp /* Deliver zero length transfers right here. */ 418e39d70d4SPoul-Henning Kamp if (bp->bio_length == 0) { 419e39d70d4SPoul-Henning Kamp g_io_deliver(bp, 0); 42049dbb61dSRobert Watson CTR2(KTR_GEOM, "g_down terminated 0-length " 42149dbb61dSRobert Watson "bp %p provider %s", bp, bp->bio_to->name); 422e39d70d4SPoul-Henning Kamp continue; 423e39d70d4SPoul-Henning Kamp } 424392d56b4SPoul-Henning Kamp break; 425392d56b4SPoul-Henning Kamp default: 426392d56b4SPoul-Henning Kamp break; 427392d56b4SPoul-Henning Kamp } 4285706472cSRobert Watson #ifdef WITNESS 429f0e185d7SPoul-Henning Kamp mtx_lock(&mymutex); 4305706472cSRobert Watson #endif 43149dbb61dSRobert Watson CTR4(KTR_GEOM, "g_down starting bp %p provider %s off %ld " 43249dbb61dSRobert Watson "len %ld", bp, bp->bio_to->name, bp->bio_offset, 43349dbb61dSRobert Watson bp->bio_length); 434dd84a43cSPoul-Henning Kamp bp->bio_to->geom->start(bp); 4355706472cSRobert Watson #ifdef WITNESS 436f0e185d7SPoul-Henning Kamp mtx_unlock(&mymutex); 4375706472cSRobert Watson #endif 438dd84a43cSPoul-Henning Kamp } 439dd84a43cSPoul-Henning Kamp } 440dd84a43cSPoul-Henning Kamp 441dd84a43cSPoul-Henning Kamp void 4425fcf4e43SPoul-Henning Kamp bio_taskqueue(struct bio *bp, bio_task_t *func, void *arg) 4435fcf4e43SPoul-Henning Kamp { 4445fcf4e43SPoul-Henning Kamp bp->bio_task = func; 4455fcf4e43SPoul-Henning Kamp bp->bio_task_arg = arg; 4465fcf4e43SPoul-Henning Kamp /* 
4475fcf4e43SPoul-Henning Kamp * The taskqueue is actually just a second queue off the "up" 4485fcf4e43SPoul-Henning Kamp * queue, so we use the same lock. 4495fcf4e43SPoul-Henning Kamp */ 4505fcf4e43SPoul-Henning Kamp g_bioq_lock(&g_bio_run_up); 451dcbd0fe5SPoul-Henning Kamp KASSERT(!(bp->bio_flags & BIO_ONQUEUE), 452dcbd0fe5SPoul-Henning Kamp ("Bio already on queue bp=%p target taskq", bp)); 453dcbd0fe5SPoul-Henning Kamp bp->bio_flags |= BIO_ONQUEUE; 4545fcf4e43SPoul-Henning Kamp TAILQ_INSERT_TAIL(&g_bio_run_task.bio_queue, bp, bio_queue); 4555fcf4e43SPoul-Henning Kamp g_bio_run_task.bio_queue_length++; 4565fcf4e43SPoul-Henning Kamp wakeup(&g_wait_up); 4575fcf4e43SPoul-Henning Kamp g_bioq_unlock(&g_bio_run_up); 4585fcf4e43SPoul-Henning Kamp } 4595fcf4e43SPoul-Henning Kamp 4605fcf4e43SPoul-Henning Kamp 4615fcf4e43SPoul-Henning Kamp void 462dd84a43cSPoul-Henning Kamp g_io_schedule_up(struct thread *tp __unused) 463dd84a43cSPoul-Henning Kamp { 464dd84a43cSPoul-Henning Kamp struct bio *bp; 4655706472cSRobert Watson #ifdef WITNESS 466f0e185d7SPoul-Henning Kamp struct mtx mymutex; 467dd84a43cSPoul-Henning Kamp 468f0e185d7SPoul-Henning Kamp bzero(&mymutex, sizeof mymutex); 4692cf0d8a6SDon Lewis mtx_init(&mymutex, "g_xup", NULL, MTX_DEF); 4705706472cSRobert Watson #endif 471dd84a43cSPoul-Henning Kamp for(;;) { 472f0e185d7SPoul-Henning Kamp g_bioq_lock(&g_bio_run_up); 4735fcf4e43SPoul-Henning Kamp bp = g_bioq_first(&g_bio_run_task); 4745fcf4e43SPoul-Henning Kamp if (bp != NULL) { 4755fcf4e43SPoul-Henning Kamp g_bioq_unlock(&g_bio_run_up); 4765706472cSRobert Watson #ifdef WITNESS 4775fcf4e43SPoul-Henning Kamp mtx_lock(&mymutex); 4785706472cSRobert Watson #endif 47949dbb61dSRobert Watson CTR1(KTR_GEOM, "g_up processing task bp %p", bp); 4805fcf4e43SPoul-Henning Kamp bp->bio_task(bp->bio_task_arg); 4815706472cSRobert Watson #ifdef WITNESS 4825fcf4e43SPoul-Henning Kamp mtx_unlock(&mymutex); 4835706472cSRobert Watson #endif 4845fcf4e43SPoul-Henning Kamp continue; 
4855fcf4e43SPoul-Henning Kamp } 486dd84a43cSPoul-Henning Kamp bp = g_bioq_first(&g_bio_run_up); 487f0e185d7SPoul-Henning Kamp if (bp != NULL) { 488f0e185d7SPoul-Henning Kamp g_bioq_unlock(&g_bio_run_up); 4895706472cSRobert Watson #ifdef WITNESS 490f0e185d7SPoul-Henning Kamp mtx_lock(&mymutex); 4915706472cSRobert Watson #endif 49249dbb61dSRobert Watson CTR4(KTR_GEOM, "g_up biodone bp %p provider %s off " 49349dbb61dSRobert Watson "%ld len %ld", bp, bp->bio_to->name, 49449dbb61dSRobert Watson bp->bio_offset, bp->bio_length); 49553706245SPoul-Henning Kamp biodone(bp); 4965706472cSRobert Watson #ifdef WITNESS 497f0e185d7SPoul-Henning Kamp mtx_unlock(&mymutex); 4985706472cSRobert Watson #endif 499f0e185d7SPoul-Henning Kamp continue; 500f0e185d7SPoul-Henning Kamp } 50149dbb61dSRobert Watson CTR0(KTR_GEOM, "g_up going to sleep"); 502f0e185d7SPoul-Henning Kamp msleep(&g_wait_up, &g_bio_run_up.bio_queue_lock, 50344be139bSPoul-Henning Kamp PRIBIO | PDROP, "-", hz/10); 504dd84a43cSPoul-Henning Kamp } 505dd84a43cSPoul-Henning Kamp } 506dd84a43cSPoul-Henning Kamp 507dd84a43cSPoul-Henning Kamp void * 508dd84a43cSPoul-Henning Kamp g_read_data(struct g_consumer *cp, off_t offset, off_t length, int *error) 509dd84a43cSPoul-Henning Kamp { 510dd84a43cSPoul-Henning Kamp struct bio *bp; 511dd84a43cSPoul-Henning Kamp void *ptr; 512dd84a43cSPoul-Henning Kamp int errorc; 513dd84a43cSPoul-Henning Kamp 5148dd5480dSPawel Jakub Dawidek KASSERT(length > 0 && length >= cp->provider->sectorsize && 5158dd5480dSPawel Jakub Dawidek length <= MAXPHYS, ("g_read_data(): invalid length %jd", 5168dd5480dSPawel Jakub Dawidek (intmax_t)length)); 5173eb6ffdfSPoul-Henning Kamp 518a2033c96SPoul-Henning Kamp bp = g_alloc_bio(); 519dd84a43cSPoul-Henning Kamp bp->bio_cmd = BIO_READ; 520dd84a43cSPoul-Henning Kamp bp->bio_done = NULL; 521dd84a43cSPoul-Henning Kamp bp->bio_offset = offset; 522dd84a43cSPoul-Henning Kamp bp->bio_length = length; 523a163d034SWarner Losh ptr = g_malloc(length, M_WAITOK); 
524dd84a43cSPoul-Henning Kamp bp->bio_data = ptr; 525dd84a43cSPoul-Henning Kamp g_io_request(bp, cp); 52653706245SPoul-Henning Kamp errorc = biowait(bp, "gread"); 527dd84a43cSPoul-Henning Kamp if (error != NULL) 528dd84a43cSPoul-Henning Kamp *error = errorc; 529dd84a43cSPoul-Henning Kamp g_destroy_bio(bp); 530dd84a43cSPoul-Henning Kamp if (errorc) { 531dd84a43cSPoul-Henning Kamp g_free(ptr); 532dd84a43cSPoul-Henning Kamp ptr = NULL; 533dd84a43cSPoul-Henning Kamp } 534dd84a43cSPoul-Henning Kamp return (ptr); 535dd84a43cSPoul-Henning Kamp } 53690b1cd56SPoul-Henning Kamp 53790b1cd56SPoul-Henning Kamp int 53890b1cd56SPoul-Henning Kamp g_write_data(struct g_consumer *cp, off_t offset, void *ptr, off_t length) 53990b1cd56SPoul-Henning Kamp { 54090b1cd56SPoul-Henning Kamp struct bio *bp; 54190b1cd56SPoul-Henning Kamp int error; 54290b1cd56SPoul-Henning Kamp 5438dd5480dSPawel Jakub Dawidek KASSERT(length > 0 && length >= cp->provider->sectorsize && 5448dd5480dSPawel Jakub Dawidek length <= MAXPHYS, ("g_write_data(): invalid length %jd", 5458dd5480dSPawel Jakub Dawidek (intmax_t)length)); 5463eb6ffdfSPoul-Henning Kamp 547a2033c96SPoul-Henning Kamp bp = g_alloc_bio(); 54890b1cd56SPoul-Henning Kamp bp->bio_cmd = BIO_WRITE; 54990b1cd56SPoul-Henning Kamp bp->bio_done = NULL; 55090b1cd56SPoul-Henning Kamp bp->bio_offset = offset; 55190b1cd56SPoul-Henning Kamp bp->bio_length = length; 55290b1cd56SPoul-Henning Kamp bp->bio_data = ptr; 55390b1cd56SPoul-Henning Kamp g_io_request(bp, cp); 55490b1cd56SPoul-Henning Kamp error = biowait(bp, "gwrite"); 55590b1cd56SPoul-Henning Kamp g_destroy_bio(bp); 55690b1cd56SPoul-Henning Kamp return (error); 55790b1cd56SPoul-Henning Kamp } 55872e33095SPawel Jakub Dawidek 55972e33095SPawel Jakub Dawidek void 56072e33095SPawel Jakub Dawidek g_print_bio(struct bio *bp) 56172e33095SPawel Jakub Dawidek { 56272e33095SPawel Jakub Dawidek const char *pname, *cmd = NULL; 56372e33095SPawel Jakub Dawidek 56472e33095SPawel Jakub Dawidek if (bp->bio_to != NULL) 
56572e33095SPawel Jakub Dawidek pname = bp->bio_to->name; 56672e33095SPawel Jakub Dawidek else 56772e33095SPawel Jakub Dawidek pname = "[unknown]"; 56872e33095SPawel Jakub Dawidek 56972e33095SPawel Jakub Dawidek switch (bp->bio_cmd) { 57072e33095SPawel Jakub Dawidek case BIO_GETATTR: 57172e33095SPawel Jakub Dawidek cmd = "GETATTR"; 57272e33095SPawel Jakub Dawidek printf("%s[%s(attr=%s)]", pname, cmd, bp->bio_attribute); 57372e33095SPawel Jakub Dawidek return; 57472e33095SPawel Jakub Dawidek case BIO_READ: 57572e33095SPawel Jakub Dawidek cmd = "READ"; 57672e33095SPawel Jakub Dawidek case BIO_WRITE: 57772e33095SPawel Jakub Dawidek if (cmd == NULL) 57872e33095SPawel Jakub Dawidek cmd = "WRITE"; 57972e33095SPawel Jakub Dawidek case BIO_DELETE: 58072e33095SPawel Jakub Dawidek if (cmd == NULL) 58172e33095SPawel Jakub Dawidek cmd = "DELETE"; 58272e33095SPawel Jakub Dawidek printf("%s[%s(offset=%jd, length=%jd)]", pname, cmd, 58372e33095SPawel Jakub Dawidek (intmax_t)bp->bio_offset, (intmax_t)bp->bio_length); 58472e33095SPawel Jakub Dawidek return; 58572e33095SPawel Jakub Dawidek default: 58672e33095SPawel Jakub Dawidek cmd = "UNKNOWN"; 58772e33095SPawel Jakub Dawidek printf("%s[%s()]", pname, cmd); 58872e33095SPawel Jakub Dawidek return; 58972e33095SPawel Jakub Dawidek } 59072e33095SPawel Jakub Dawidek /* NOTREACHED */ 59172e33095SPawel Jakub Dawidek } 592