1dd84a43cSPoul-Henning Kamp /*- 23728855aSPedro F. Giffuni * SPDX-License-Identifier: BSD-3-Clause 33728855aSPedro F. Giffuni * 4dd84a43cSPoul-Henning Kamp * Copyright (c) 2002 Poul-Henning Kamp 5dd84a43cSPoul-Henning Kamp * Copyright (c) 2002 Networks Associates Technology, Inc. 6ee75e7deSKonstantin Belousov * Copyright (c) 2013 The FreeBSD Foundation 7dd84a43cSPoul-Henning Kamp * All rights reserved. 8dd84a43cSPoul-Henning Kamp * 9dd84a43cSPoul-Henning Kamp * This software was developed for the FreeBSD Project by Poul-Henning Kamp 10dd84a43cSPoul-Henning Kamp * and NAI Labs, the Security Research Division of Network Associates, Inc. 11dd84a43cSPoul-Henning Kamp * under DARPA/SPAWAR contract N66001-01-C-8035 ("CBOSS"), as part of the 12dd84a43cSPoul-Henning Kamp * DARPA CHATS research program. 13dd84a43cSPoul-Henning Kamp * 14ee75e7deSKonstantin Belousov * Portions of this software were developed by Konstantin Belousov 15ee75e7deSKonstantin Belousov * under sponsorship from the FreeBSD Foundation. 16ee75e7deSKonstantin Belousov * 17dd84a43cSPoul-Henning Kamp * Redistribution and use in source and binary forms, with or without 18dd84a43cSPoul-Henning Kamp * modification, are permitted provided that the following conditions 19dd84a43cSPoul-Henning Kamp * are met: 20dd84a43cSPoul-Henning Kamp * 1. Redistributions of source code must retain the above copyright 21dd84a43cSPoul-Henning Kamp * notice, this list of conditions and the following disclaimer. 22dd84a43cSPoul-Henning Kamp * 2. Redistributions in binary form must reproduce the above copyright 23dd84a43cSPoul-Henning Kamp * notice, this list of conditions and the following disclaimer in the 24dd84a43cSPoul-Henning Kamp * documentation and/or other materials provided with the distribution. 25dd84a43cSPoul-Henning Kamp * 3. The names of the authors may not be used to endorse or promote 26dd84a43cSPoul-Henning Kamp * products derived from this software without specific prior written 27dd84a43cSPoul-Henning Kamp * permission. 28dd84a43cSPoul-Henning Kamp * 29dd84a43cSPoul-Henning Kamp * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 30dd84a43cSPoul-Henning Kamp * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 31dd84a43cSPoul-Henning Kamp * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 32dd84a43cSPoul-Henning Kamp * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 33dd84a43cSPoul-Henning Kamp * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 34dd84a43cSPoul-Henning Kamp * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 35dd84a43cSPoul-Henning Kamp * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 36dd84a43cSPoul-Henning Kamp * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 37dd84a43cSPoul-Henning Kamp * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 38dd84a43cSPoul-Henning Kamp * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 39dd84a43cSPoul-Henning Kamp * SUCH DAMAGE. 40dd84a43cSPoul-Henning Kamp */ 41dd84a43cSPoul-Henning Kamp 4250b1faefSDavid E. O'Brien #include <sys/cdefs.h> 4350b1faefSDavid E. O'Brien __FBSDID("$FreeBSD$"); 44dd84a43cSPoul-Henning Kamp 45dd84a43cSPoul-Henning Kamp #include <sys/param.h> 46dd84a43cSPoul-Henning Kamp #include <sys/systm.h> 47dd84a43cSPoul-Henning Kamp #include <sys/kernel.h> 48dd84a43cSPoul-Henning Kamp #include <sys/malloc.h> 49dd84a43cSPoul-Henning Kamp #include <sys/bio.h> 5049dbb61dSRobert Watson #include <sys/ktr.h> 5151460da8SJohn Baldwin #include <sys/proc.h> 52ac03832eSConrad Meyer #include <sys/sbuf.h> 533b378147SPawel Jakub Dawidek #include <sys/stack.h> 54ee75e7deSKonstantin Belousov #include <sys/sysctl.h> 555f518366SJeff Roberson #include <sys/vmem.h> 56ac03832eSConrad Meyer #include <machine/stdarg.h> 57dd84a43cSPoul-Henning Kamp 58dd84a43cSPoul-Henning Kamp #include <sys/errno.h> 59dd84a43cSPoul-Henning Kamp #include <geom/geom.h> 60b1876192SPoul-Henning Kamp #include <geom/geom_int.h> 61e24cbd90SPoul-Henning Kamp #include <sys/devicestat.h> 62dd84a43cSPoul-Henning Kamp 635ffb2c8bSPoul-Henning Kamp #include <vm/uma.h> 64ee75e7deSKonstantin Belousov #include <vm/vm.h> 65ee75e7deSKonstantin Belousov #include <vm/vm_param.h> 66ee75e7deSKonstantin Belousov #include <vm/vm_kern.h> 67ee75e7deSKonstantin Belousov #include <vm/vm_page.h> 68ee75e7deSKonstantin Belousov #include <vm/vm_object.h> 69ee75e7deSKonstantin Belousov #include <vm/vm_extern.h> 70ee75e7deSKonstantin Belousov #include <vm/vm_map.h> 715ffb2c8bSPoul-Henning Kamp 7240ea77a0SAlexander Motin static int g_io_transient_map_bio(struct bio *bp); 7340ea77a0SAlexander Motin 74dd84a43cSPoul-Henning Kamp static struct g_bioq g_bio_run_down; 75dd84a43cSPoul-Henning Kamp static struct g_bioq g_bio_run_up; 76dd84a43cSPoul-Henning Kamp 773f2e5b85SWarner Losh /* 783f2e5b85SWarner Losh * Pace is a hint that we've had some trouble recently allocating 793f2e5b85SWarner Losh * bios, so we should back off trying to send I/O down the stack 803f2e5b85SWarner Losh * a bit to let the problem resolve. When pacing, we also turn 813f2e5b85SWarner Losh * off direct dispatch to also reduce memory pressure from I/Os 823f2e5b85SWarner Losh * there, at the expxense of some added latency while the memory 833f2e5b85SWarner Losh * pressures exist. See g_io_schedule_down() for more details 843f2e5b85SWarner Losh * and limitations. 853f2e5b85SWarner Losh */ 8661322a0aSAlexander Motin static volatile u_int __read_mostly pace; 873f2e5b85SWarner Losh 8861322a0aSAlexander Motin static uma_zone_t __read_mostly biozone; 893432e4fdSPoul-Henning Kamp 906231f75bSLuigi Rizzo /* 916231f75bSLuigi Rizzo * The head of the list of classifiers used in g_io_request. 926231f75bSLuigi Rizzo * Use g_register_classifier() and g_unregister_classifier() 936231f75bSLuigi Rizzo * to add/remove entries to the list. 946231f75bSLuigi Rizzo * Classifiers are invoked in registration order. 956231f75bSLuigi Rizzo */ 9661322a0aSAlexander Motin static TAILQ_HEAD(, g_classifier_hook) g_classifier_tailq __read_mostly = 9761322a0aSAlexander Motin TAILQ_HEAD_INITIALIZER(g_classifier_tailq); 986231f75bSLuigi Rizzo 99dd84a43cSPoul-Henning Kamp #include <machine/atomic.h> 100dd84a43cSPoul-Henning Kamp 101dd84a43cSPoul-Henning Kamp static void 102dd84a43cSPoul-Henning Kamp g_bioq_lock(struct g_bioq *bq) 103dd84a43cSPoul-Henning Kamp { 104dd84a43cSPoul-Henning Kamp 105dd84a43cSPoul-Henning Kamp mtx_lock(&bq->bio_queue_lock); 106dd84a43cSPoul-Henning Kamp } 107dd84a43cSPoul-Henning Kamp 108dd84a43cSPoul-Henning Kamp static void 109dd84a43cSPoul-Henning Kamp g_bioq_unlock(struct g_bioq *bq) 110dd84a43cSPoul-Henning Kamp { 111dd84a43cSPoul-Henning Kamp 112dd84a43cSPoul-Henning Kamp mtx_unlock(&bq->bio_queue_lock); 113dd84a43cSPoul-Henning Kamp } 114dd84a43cSPoul-Henning Kamp 115dd84a43cSPoul-Henning Kamp #if 0 116dd84a43cSPoul-Henning Kamp static void 117dd84a43cSPoul-Henning Kamp g_bioq_destroy(struct g_bioq *bq) 118dd84a43cSPoul-Henning Kamp { 119dd84a43cSPoul-Henning Kamp 120dd84a43cSPoul-Henning Kamp mtx_destroy(&bq->bio_queue_lock); 121dd84a43cSPoul-Henning Kamp } 122dd84a43cSPoul-Henning Kamp #endif 123dd84a43cSPoul-Henning Kamp 124dd84a43cSPoul-Henning Kamp static void 125dd84a43cSPoul-Henning Kamp g_bioq_init(struct g_bioq *bq) 126dd84a43cSPoul-Henning Kamp { 127dd84a43cSPoul-Henning Kamp 128dd84a43cSPoul-Henning Kamp TAILQ_INIT(&bq->bio_queue); 1296008862bSJohn Baldwin mtx_init(&bq->bio_queue_lock, "bio queue", NULL, MTX_DEF); 130dd84a43cSPoul-Henning Kamp } 131dd84a43cSPoul-Henning Kamp 132dd84a43cSPoul-Henning Kamp static struct bio * 133dd84a43cSPoul-Henning Kamp g_bioq_first(struct g_bioq *bq) 134dd84a43cSPoul-Henning Kamp { 135dd84a43cSPoul-Henning Kamp struct bio *bp; 136dd84a43cSPoul-Henning Kamp 137dd84a43cSPoul-Henning Kamp bp = TAILQ_FIRST(&bq->bio_queue); 138dd84a43cSPoul-Henning Kamp if (bp != NULL) { 139dcbd0fe5SPoul-Henning Kamp KASSERT((bp->bio_flags & BIO_ONQUEUE), 140dcbd0fe5SPoul-Henning Kamp ("Bio not on queue bp=%p target %p", bp, bq)); 141dcbd0fe5SPoul-Henning Kamp bp->bio_flags &= ~BIO_ONQUEUE; 142dd84a43cSPoul-Henning Kamp TAILQ_REMOVE(&bq->bio_queue, bp, bio_queue); 143dd84a43cSPoul-Henning Kamp bq->bio_queue_length--; 144dd84a43cSPoul-Henning Kamp } 145dd84a43cSPoul-Henning Kamp return (bp); 146dd84a43cSPoul-Henning Kamp } 147dd84a43cSPoul-Henning Kamp 148dd84a43cSPoul-Henning Kamp struct bio * 149dd84a43cSPoul-Henning Kamp g_new_bio(void) 150dd84a43cSPoul-Henning Kamp { 151dd84a43cSPoul-Henning Kamp struct bio *bp; 152dd84a43cSPoul-Henning Kamp 1535ffb2c8bSPoul-Henning Kamp bp = uma_zalloc(biozone, M_NOWAIT | M_ZERO); 1543b378147SPawel Jakub Dawidek #ifdef KTR 155b656c1b8SPawel Jakub Dawidek if ((KTR_COMPILE & KTR_GEOM) && (ktr_mask & KTR_GEOM)) { 1563b378147SPawel Jakub Dawidek struct stack st; 1573b378147SPawel Jakub Dawidek 1583b378147SPawel Jakub Dawidek CTR1(KTR_GEOM, "g_new_bio(): %p", bp); 1593b378147SPawel Jakub Dawidek stack_save(&st); 16054533f66SConrad Meyer CTRSTACK(KTR_GEOM, &st, 3); 1613b378147SPawel Jakub Dawidek } 1623b378147SPawel Jakub Dawidek #endif 163dd84a43cSPoul-Henning Kamp return (bp); 164dd84a43cSPoul-Henning Kamp } 165dd84a43cSPoul-Henning Kamp 166a2033c96SPoul-Henning Kamp struct bio * 167a2033c96SPoul-Henning Kamp g_alloc_bio(void) 168a2033c96SPoul-Henning Kamp { 169a2033c96SPoul-Henning Kamp struct bio *bp; 170a2033c96SPoul-Henning Kamp 171a2033c96SPoul-Henning Kamp bp = uma_zalloc(biozone, M_WAITOK | M_ZERO); 1723b378147SPawel Jakub Dawidek #ifdef KTR 173b656c1b8SPawel Jakub Dawidek if ((KTR_COMPILE & KTR_GEOM) && (ktr_mask & KTR_GEOM)) { 1743b378147SPawel Jakub Dawidek struct stack st; 1753b378147SPawel Jakub Dawidek 1763b378147SPawel Jakub Dawidek CTR1(KTR_GEOM, "g_alloc_bio(): %p", bp); 1773b378147SPawel Jakub Dawidek stack_save(&st); 17854533f66SConrad Meyer CTRSTACK(KTR_GEOM, &st, 3); 1793b378147SPawel Jakub Dawidek } 1803b378147SPawel Jakub Dawidek #endif 181a2033c96SPoul-Henning Kamp return (bp); 182a2033c96SPoul-Henning Kamp } 183a2033c96SPoul-Henning Kamp 184dd84a43cSPoul-Henning Kamp void 185dd84a43cSPoul-Henning Kamp g_destroy_bio(struct bio *bp) 186dd84a43cSPoul-Henning Kamp { 1873b378147SPawel Jakub Dawidek #ifdef KTR 188b656c1b8SPawel Jakub Dawidek if ((KTR_COMPILE & KTR_GEOM) && (ktr_mask & KTR_GEOM)) { 1893b378147SPawel Jakub Dawidek struct stack st; 190dd84a43cSPoul-Henning Kamp 1913b378147SPawel Jakub Dawidek CTR1(KTR_GEOM, "g_destroy_bio(): %p", bp); 1923b378147SPawel Jakub Dawidek stack_save(&st); 19354533f66SConrad Meyer CTRSTACK(KTR_GEOM, &st, 3); 1943b378147SPawel Jakub Dawidek } 1953b378147SPawel Jakub Dawidek #endif 1965ffb2c8bSPoul-Henning Kamp uma_zfree(biozone, bp); 197dd84a43cSPoul-Henning Kamp } 198dd84a43cSPoul-Henning Kamp 199dd84a43cSPoul-Henning Kamp struct bio * 200dd84a43cSPoul-Henning Kamp g_clone_bio(struct bio *bp) 201dd84a43cSPoul-Henning Kamp { 202dd84a43cSPoul-Henning Kamp struct bio *bp2; 203dd84a43cSPoul-Henning Kamp 2045ffb2c8bSPoul-Henning Kamp bp2 = uma_zalloc(biozone, M_NOWAIT | M_ZERO); 205a1bd3ee2SPoul-Henning Kamp if (bp2 != NULL) { 206936cc461SPoul-Henning Kamp bp2->bio_parent = bp; 207dd84a43cSPoul-Henning Kamp bp2->bio_cmd = bp->bio_cmd; 20882a6ae10SJim Harris /* 20982a6ae10SJim Harris * BIO_ORDERED flag may be used by disk drivers to enforce 21082a6ae10SJim Harris * ordering restrictions, so this flag needs to be cloned. 211a9934668SKenneth D. Merry * BIO_UNMAPPED and BIO_VLIST should be inherited, to properly 212a9934668SKenneth D. Merry * indicate which way the buffer is passed. 21382a6ae10SJim Harris * Other bio flags are not suitable for cloning. 21482a6ae10SJim Harris */ 215a9934668SKenneth D. Merry bp2->bio_flags = bp->bio_flags & 216a9934668SKenneth D. Merry (BIO_ORDERED | BIO_UNMAPPED | BIO_VLIST); 217dd84a43cSPoul-Henning Kamp bp2->bio_length = bp->bio_length; 218dd84a43cSPoul-Henning Kamp bp2->bio_offset = bp->bio_offset; 219dd84a43cSPoul-Henning Kamp bp2->bio_data = bp->bio_data; 220ee75e7deSKonstantin Belousov bp2->bio_ma = bp->bio_ma; 221ee75e7deSKonstantin Belousov bp2->bio_ma_n = bp->bio_ma_n; 222ee75e7deSKonstantin Belousov bp2->bio_ma_offset = bp->bio_ma_offset; 223dd84a43cSPoul-Henning Kamp bp2->bio_attribute = bp->bio_attribute; 2249a6844d5SKenneth D. Merry if (bp->bio_cmd == BIO_ZONE) 2259a6844d5SKenneth D. Merry bcopy(&bp->bio_zone, &bp2->bio_zone, 2269a6844d5SKenneth D. Merry sizeof(bp->bio_zone)); 2276231f75bSLuigi Rizzo /* Inherit classification info from the parent */ 2286231f75bSLuigi Rizzo bp2->bio_classifier1 = bp->bio_classifier1; 2296231f75bSLuigi Rizzo bp2->bio_classifier2 = bp->bio_classifier2; 2308532d381SConrad Meyer #if defined(BUF_TRACKING) || defined(FULL_BUF_TRACKING) 2318532d381SConrad Meyer bp2->bio_track_bp = bp->bio_track_bp; 2328532d381SConrad Meyer #endif 233801bb689SPoul-Henning Kamp bp->bio_children++; 234a1bd3ee2SPoul-Henning Kamp } 2353b378147SPawel Jakub Dawidek #ifdef KTR 236b656c1b8SPawel Jakub Dawidek if ((KTR_COMPILE & KTR_GEOM) && (ktr_mask & KTR_GEOM)) { 2373b378147SPawel Jakub Dawidek struct stack st; 2383b378147SPawel Jakub Dawidek 239ad572235SRuslan Ermilov CTR2(KTR_GEOM, "g_clone_bio(%p): %p", bp, bp2); 2403b378147SPawel Jakub Dawidek stack_save(&st); 24154533f66SConrad Meyer CTRSTACK(KTR_GEOM, &st, 3); 2423b378147SPawel Jakub Dawidek } 2433b378147SPawel Jakub Dawidek #endif 244dd84a43cSPoul-Henning Kamp return(bp2); 245dd84a43cSPoul-Henning Kamp } 246dd84a43cSPoul-Henning Kamp 2474bec0ff1SPawel Jakub Dawidek struct bio * 2484bec0ff1SPawel Jakub Dawidek g_duplicate_bio(struct bio *bp) 2494bec0ff1SPawel Jakub Dawidek { 2504bec0ff1SPawel Jakub Dawidek struct bio *bp2; 2514bec0ff1SPawel Jakub Dawidek 2524bec0ff1SPawel Jakub Dawidek bp2 = uma_zalloc(biozone, M_WAITOK | M_ZERO); 253a9934668SKenneth D. Merry bp2->bio_flags = bp->bio_flags & (BIO_UNMAPPED | BIO_VLIST); 2544bec0ff1SPawel Jakub Dawidek bp2->bio_parent = bp; 2554bec0ff1SPawel Jakub Dawidek bp2->bio_cmd = bp->bio_cmd; 2564bec0ff1SPawel Jakub Dawidek bp2->bio_length = bp->bio_length; 2574bec0ff1SPawel Jakub Dawidek bp2->bio_offset = bp->bio_offset; 2584bec0ff1SPawel Jakub Dawidek bp2->bio_data = bp->bio_data; 259ee75e7deSKonstantin Belousov bp2->bio_ma = bp->bio_ma; 260ee75e7deSKonstantin Belousov bp2->bio_ma_n = bp->bio_ma_n; 261ee75e7deSKonstantin Belousov bp2->bio_ma_offset = bp->bio_ma_offset; 2624bec0ff1SPawel Jakub Dawidek bp2->bio_attribute = bp->bio_attribute; 2634bec0ff1SPawel Jakub Dawidek bp->bio_children++; 2644bec0ff1SPawel Jakub Dawidek #ifdef KTR 265b656c1b8SPawel Jakub Dawidek if ((KTR_COMPILE & KTR_GEOM) && (ktr_mask & KTR_GEOM)) { 2664bec0ff1SPawel Jakub Dawidek struct stack st; 2674bec0ff1SPawel Jakub Dawidek 2684bec0ff1SPawel Jakub Dawidek CTR2(KTR_GEOM, "g_duplicate_bio(%p): %p", bp, bp2); 2694bec0ff1SPawel Jakub Dawidek stack_save(&st); 27054533f66SConrad Meyer CTRSTACK(KTR_GEOM, &st, 3); 2714bec0ff1SPawel Jakub Dawidek } 2724bec0ff1SPawel Jakub Dawidek #endif 2734bec0ff1SPawel Jakub Dawidek return(bp2); 2744bec0ff1SPawel Jakub Dawidek } 2754bec0ff1SPawel Jakub Dawidek 276dd84a43cSPoul-Henning Kamp void 277c55f5707SWarner Losh g_reset_bio(struct bio *bp) 278c55f5707SWarner Losh { 279c55f5707SWarner Losh 280bd4c1dd6SWarner Losh bzero(bp, sizeof(*bp)); 281c55f5707SWarner Losh } 282c55f5707SWarner Losh 283c55f5707SWarner Losh void 284dd84a43cSPoul-Henning Kamp g_io_init() 285dd84a43cSPoul-Henning Kamp { 286dd84a43cSPoul-Henning Kamp 287dd84a43cSPoul-Henning Kamp g_bioq_init(&g_bio_run_down); 288dd84a43cSPoul-Henning Kamp g_bioq_init(&g_bio_run_up); 2895ffb2c8bSPoul-Henning Kamp biozone = uma_zcreate("g_bio", sizeof (struct bio), 2905ffb2c8bSPoul-Henning Kamp NULL, NULL, 2915ffb2c8bSPoul-Henning Kamp NULL, NULL, 2925ffb2c8bSPoul-Henning Kamp 0, 0); 293dd84a43cSPoul-Henning Kamp } 294dd84a43cSPoul-Henning Kamp 295dd84a43cSPoul-Henning Kamp int 2960d3f37a8SPoul-Henning Kamp g_io_getattr(const char *attr, struct g_consumer *cp, int *len, void *ptr) 297dd84a43cSPoul-Henning Kamp { 298dd84a43cSPoul-Henning Kamp struct bio *bp; 299dd84a43cSPoul-Henning Kamp int error; 300dd84a43cSPoul-Henning Kamp 301dd84a43cSPoul-Henning Kamp g_trace(G_T_BIO, "bio_getattr(%s)", attr); 302a2033c96SPoul-Henning Kamp bp = g_alloc_bio(); 303dd84a43cSPoul-Henning Kamp bp->bio_cmd = BIO_GETATTR; 304dd84a43cSPoul-Henning Kamp bp->bio_done = NULL; 305dd84a43cSPoul-Henning Kamp bp->bio_attribute = attr; 306dd84a43cSPoul-Henning Kamp bp->bio_length = *len; 307dd84a43cSPoul-Henning Kamp bp->bio_data = ptr; 308dd84a43cSPoul-Henning Kamp g_io_request(bp, cp); 30953706245SPoul-Henning Kamp error = biowait(bp, "ggetattr"); 310dd84a43cSPoul-Henning Kamp *len = bp->bio_completed; 311dd84a43cSPoul-Henning Kamp g_destroy_bio(bp); 312dd84a43cSPoul-Henning Kamp return (error); 313dd84a43cSPoul-Henning Kamp } 314dd84a43cSPoul-Henning Kamp 315c3618c65SPawel Jakub Dawidek int 3169a6844d5SKenneth D. Merry g_io_zonecmd(struct disk_zone_args *zone_args, struct g_consumer *cp) 3179a6844d5SKenneth D. Merry { 3189a6844d5SKenneth D. Merry struct bio *bp; 3199a6844d5SKenneth D. Merry int error; 3209a6844d5SKenneth D. Merry 3219a6844d5SKenneth D. Merry g_trace(G_T_BIO, "bio_zone(%d)", zone_args->zone_cmd); 3229a6844d5SKenneth D. Merry bp = g_alloc_bio(); 3239a6844d5SKenneth D. Merry bp->bio_cmd = BIO_ZONE; 3249a6844d5SKenneth D. Merry bp->bio_done = NULL; 3259a6844d5SKenneth D. Merry /* 3269a6844d5SKenneth D. Merry * XXX KDM need to handle report zone data. 3279a6844d5SKenneth D. Merry */ 3289a6844d5SKenneth D. Merry bcopy(zone_args, &bp->bio_zone, sizeof(*zone_args)); 3299a6844d5SKenneth D. Merry if (zone_args->zone_cmd == DISK_ZONE_REPORT_ZONES) 3309a6844d5SKenneth D. Merry bp->bio_length = 3319a6844d5SKenneth D. Merry zone_args->zone_params.report.entries_allocated * 3329a6844d5SKenneth D. Merry sizeof(struct disk_zone_rep_entry); 3339a6844d5SKenneth D. Merry else 3349a6844d5SKenneth D. Merry bp->bio_length = 0; 3359a6844d5SKenneth D. Merry 3369a6844d5SKenneth D. Merry g_io_request(bp, cp); 3379a6844d5SKenneth D. Merry error = biowait(bp, "gzone"); 3389a6844d5SKenneth D. Merry bcopy(&bp->bio_zone, zone_args, sizeof(*zone_args)); 3399a6844d5SKenneth D. Merry g_destroy_bio(bp); 3409a6844d5SKenneth D. Merry return (error); 3419a6844d5SKenneth D. Merry } 3429a6844d5SKenneth D. Merry 343*b182c792SWarner Losh /* 344*b182c792SWarner Losh * Send a BIO_SPEEDUP down the stack. This is used to tell the lower layers that 345*b182c792SWarner Losh * the upper layers have detected a resource shortage. The lower layers are 346*b182c792SWarner Losh * advised to stop delaying I/O that they might be holding for performance 347*b182c792SWarner Losh * reasons and to schedule it (non-trims) or complete it successfully (trims) as 348*b182c792SWarner Losh * quickly as it can. bio_length is the amount of the shortage. This call 349*b182c792SWarner Losh * should be non-blocking. bio_resid is used to communicate back if the lower 350*b182c792SWarner Losh * layers couldn't find bio_length worth of I/O to schedule or discard. A length 351*b182c792SWarner Losh * of 0 means to do as much as you can (schedule the h/w queues full, discard 352*b182c792SWarner Losh * all trims). flags are a hint from the upper layers to the lower layers what 353*b182c792SWarner Losh * operation should be done. 354*b182c792SWarner Losh */ 355*b182c792SWarner Losh int 356*b182c792SWarner Losh g_io_speedup(size_t shortage, u_int flags, size_t *resid, struct g_consumer *cp) 357*b182c792SWarner Losh { 358*b182c792SWarner Losh struct bio *bp; 359*b182c792SWarner Losh int error; 360*b182c792SWarner Losh 361*b182c792SWarner Losh KASSERT((flags & (BIO_SPEEDUP_TRIM | BIO_SPEEDUP_WRITE)) != 0, 362*b182c792SWarner Losh ("Invalid flags passed to g_io_speedup: %#x", flags)); 363*b182c792SWarner Losh g_trace(G_T_BIO, "bio_speedup(%s, %zu, %#x)", cp->provider->name, 364*b182c792SWarner Losh shortage, flags); 365*b182c792SWarner Losh bp = g_new_bio(); 366*b182c792SWarner Losh if (bp == NULL) 367*b182c792SWarner Losh return (ENOMEM); 368*b182c792SWarner Losh bp->bio_cmd = BIO_SPEEDUP; 369*b182c792SWarner Losh bp->bio_length = shortage; 370*b182c792SWarner Losh bp->bio_done = NULL; 371*b182c792SWarner Losh bp->bio_flags |= flags; 372*b182c792SWarner Losh g_io_request(bp, cp); 373*b182c792SWarner Losh error = biowait(bp, "gflush"); 374*b182c792SWarner Losh *resid = bp->bio_resid; 375*b182c792SWarner Losh g_destroy_bio(bp); 376*b182c792SWarner Losh return (error); 377*b182c792SWarner Losh } 378*b182c792SWarner Losh 3799a6844d5SKenneth D. Merry int 380c3618c65SPawel Jakub Dawidek g_io_flush(struct g_consumer *cp) 381c3618c65SPawel Jakub Dawidek { 382c3618c65SPawel Jakub Dawidek struct bio *bp; 383c3618c65SPawel Jakub Dawidek int error; 384c3618c65SPawel Jakub Dawidek 385c3618c65SPawel Jakub Dawidek g_trace(G_T_BIO, "bio_flush(%s)", cp->provider->name); 386c3618c65SPawel Jakub Dawidek bp = g_alloc_bio(); 387c3618c65SPawel Jakub Dawidek bp->bio_cmd = BIO_FLUSH; 388f03f7a0cSJustin T. Gibbs bp->bio_flags |= BIO_ORDERED; 389c3618c65SPawel Jakub Dawidek bp->bio_done = NULL; 390c3618c65SPawel Jakub Dawidek bp->bio_attribute = NULL; 391c3618c65SPawel Jakub Dawidek bp->bio_offset = cp->provider->mediasize; 392c3618c65SPawel Jakub Dawidek bp->bio_length = 0; 393c3618c65SPawel Jakub Dawidek bp->bio_data = NULL; 394c3618c65SPawel Jakub Dawidek g_io_request(bp, cp); 395c3618c65SPawel Jakub Dawidek error = biowait(bp, "gflush"); 396c3618c65SPawel Jakub Dawidek g_destroy_bio(bp); 397c3618c65SPawel Jakub Dawidek return (error); 398c3618c65SPawel Jakub Dawidek } 399c3618c65SPawel Jakub Dawidek 400e39d70d4SPoul-Henning Kamp static int 401e39d70d4SPoul-Henning Kamp g_io_check(struct bio *bp) 402e39d70d4SPoul-Henning Kamp { 403e39d70d4SPoul-Henning Kamp struct g_consumer *cp; 404e39d70d4SPoul-Henning Kamp struct g_provider *pp; 40540ea77a0SAlexander Motin off_t excess; 40640ea77a0SAlexander Motin int error; 407e39d70d4SPoul-Henning Kamp 4088532d381SConrad Meyer biotrack(bp, __func__); 4098532d381SConrad Meyer 410e39d70d4SPoul-Henning Kamp cp = bp->bio_from; 411e39d70d4SPoul-Henning Kamp pp = bp->bio_to; 412e39d70d4SPoul-Henning Kamp 413e39d70d4SPoul-Henning Kamp /* Fail if access counters dont allow the operation */ 414e39d70d4SPoul-Henning Kamp switch(bp->bio_cmd) { 415e39d70d4SPoul-Henning Kamp case BIO_READ: 416e39d70d4SPoul-Henning Kamp case BIO_GETATTR: 417e39d70d4SPoul-Henning Kamp if (cp->acr == 0) 418e39d70d4SPoul-Henning Kamp return (EPERM); 419e39d70d4SPoul-Henning Kamp break; 420e39d70d4SPoul-Henning Kamp case BIO_WRITE: 421e39d70d4SPoul-Henning Kamp case BIO_DELETE: 422c3618c65SPawel Jakub Dawidek case BIO_FLUSH: 423e39d70d4SPoul-Henning Kamp if (cp->acw == 0) 424e39d70d4SPoul-Henning Kamp return (EPERM); 425e39d70d4SPoul-Henning Kamp break; 4269a6844d5SKenneth D. Merry case BIO_ZONE: 4279a6844d5SKenneth D. Merry if ((bp->bio_zone.zone_cmd == DISK_ZONE_REPORT_ZONES) || 4289a6844d5SKenneth D. Merry (bp->bio_zone.zone_cmd == DISK_ZONE_GET_PARAMS)) { 4299a6844d5SKenneth D. Merry if (cp->acr == 0) 4309a6844d5SKenneth D. Merry return (EPERM); 4319a6844d5SKenneth D. Merry } else if (cp->acw == 0) 4329a6844d5SKenneth D. Merry return (EPERM); 4339a6844d5SKenneth D. Merry break; 434e39d70d4SPoul-Henning Kamp default: 435e39d70d4SPoul-Henning Kamp return (EPERM); 436e39d70d4SPoul-Henning Kamp } 437e39d70d4SPoul-Henning Kamp /* if provider is marked for error, don't disturb. */ 438e39d70d4SPoul-Henning Kamp if (pp->error) 439e39d70d4SPoul-Henning Kamp return (pp->error); 4403631c638SAlexander Motin if (cp->flags & G_CF_ORPHAN) 4413631c638SAlexander Motin return (ENXIO); 442e39d70d4SPoul-Henning Kamp 443e39d70d4SPoul-Henning Kamp switch(bp->bio_cmd) { 444e39d70d4SPoul-Henning Kamp case BIO_READ: 445e39d70d4SPoul-Henning Kamp case BIO_WRITE: 446e39d70d4SPoul-Henning Kamp case BIO_DELETE: 4472a842317SAndriy Gapon /* Zero sectorsize or mediasize is probably a lack of media. */ 4482a842317SAndriy Gapon if (pp->sectorsize == 0 || pp->mediasize == 0) 44943bff1a7SPoul-Henning Kamp return (ENXIO); 450e39d70d4SPoul-Henning Kamp /* Reject I/O not on sector boundary */ 451e39d70d4SPoul-Henning Kamp if (bp->bio_offset % pp->sectorsize) 452e39d70d4SPoul-Henning Kamp return (EINVAL); 453e39d70d4SPoul-Henning Kamp /* Reject I/O not integral sector long */ 454e39d70d4SPoul-Henning Kamp if (bp->bio_length % pp->sectorsize) 455e39d70d4SPoul-Henning Kamp return (EINVAL); 456d1b8bf47SPoul-Henning Kamp /* Reject requests before or past the end of media. */ 457d1b8bf47SPoul-Henning Kamp if (bp->bio_offset < 0) 458d1b8bf47SPoul-Henning Kamp return (EIO); 459e39d70d4SPoul-Henning Kamp if (bp->bio_offset > pp->mediasize) 460e39d70d4SPoul-Henning Kamp return (EIO); 46140ea77a0SAlexander Motin 46240ea77a0SAlexander Motin /* Truncate requests to the end of providers media. */ 46340ea77a0SAlexander Motin excess = bp->bio_offset + bp->bio_length; 46440ea77a0SAlexander Motin if (excess > bp->bio_to->mediasize) { 46540ea77a0SAlexander Motin KASSERT((bp->bio_flags & BIO_UNMAPPED) == 0 || 46640ea77a0SAlexander Motin round_page(bp->bio_ma_offset + 46740ea77a0SAlexander Motin bp->bio_length) / PAGE_SIZE == bp->bio_ma_n, 46840ea77a0SAlexander Motin ("excess bio %p too short", bp)); 46940ea77a0SAlexander Motin excess -= bp->bio_to->mediasize; 47040ea77a0SAlexander Motin bp->bio_length -= excess; 47140ea77a0SAlexander Motin if ((bp->bio_flags & BIO_UNMAPPED) != 0) { 47240ea77a0SAlexander Motin bp->bio_ma_n = round_page(bp->bio_ma_offset + 47340ea77a0SAlexander Motin bp->bio_length) / PAGE_SIZE; 47440ea77a0SAlexander Motin } 47540ea77a0SAlexander Motin if (excess > 0) 47640ea77a0SAlexander Motin CTR3(KTR_GEOM, "g_down truncated bio " 47740ea77a0SAlexander Motin "%p provider %s by %d", bp, 47840ea77a0SAlexander Motin bp->bio_to->name, excess); 47940ea77a0SAlexander Motin } 48040ea77a0SAlexander Motin 48140ea77a0SAlexander Motin /* Deliver zero length transfers right here. */ 48240ea77a0SAlexander Motin if (bp->bio_length == 0) { 48340ea77a0SAlexander Motin CTR2(KTR_GEOM, "g_down terminated 0-length " 48440ea77a0SAlexander Motin "bp %p provider %s", bp, bp->bio_to->name); 48540ea77a0SAlexander Motin return (0); 48640ea77a0SAlexander Motin } 48740ea77a0SAlexander Motin 48840ea77a0SAlexander Motin if ((bp->bio_flags & BIO_UNMAPPED) != 0 && 48940ea77a0SAlexander Motin (bp->bio_to->flags & G_PF_ACCEPT_UNMAPPED) == 0 && 49040ea77a0SAlexander Motin (bp->bio_cmd == BIO_READ || bp->bio_cmd == BIO_WRITE)) { 49140ea77a0SAlexander Motin if ((error = g_io_transient_map_bio(bp)) >= 0) 49240ea77a0SAlexander Motin return (error); 49340ea77a0SAlexander Motin } 494e39d70d4SPoul-Henning Kamp break; 495e39d70d4SPoul-Henning Kamp default: 496e39d70d4SPoul-Henning Kamp break; 497e39d70d4SPoul-Henning Kamp } 49840ea77a0SAlexander Motin return (EJUSTRETURN); 499e39d70d4SPoul-Henning Kamp } 500e39d70d4SPoul-Henning Kamp 5016231f75bSLuigi Rizzo /* 5026231f75bSLuigi Rizzo * bio classification support. 5036231f75bSLuigi Rizzo * 5046231f75bSLuigi Rizzo * g_register_classifier() and g_unregister_classifier() 5056231f75bSLuigi Rizzo * are used to add/remove a classifier from the list. 5066231f75bSLuigi Rizzo * The list is protected using the g_bio_run_down lock, 5076231f75bSLuigi Rizzo * because the classifiers are called in this path. 5086231f75bSLuigi Rizzo * 5096231f75bSLuigi Rizzo * g_io_request() passes bio's that are not already classified 5106231f75bSLuigi Rizzo * (i.e. those with bio_classifier1 == NULL) to g_run_classifiers(). 5116231f75bSLuigi Rizzo * Classifiers can store their result in the two fields 5126231f75bSLuigi Rizzo * bio_classifier1 and bio_classifier2. 5136231f75bSLuigi Rizzo * A classifier that updates one of the fields should 5146231f75bSLuigi Rizzo * return a non-zero value. 5156231f75bSLuigi Rizzo * If no classifier updates the field, g_run_classifiers() sets 5166231f75bSLuigi Rizzo * bio_classifier1 = BIO_NOTCLASSIFIED to avoid further calls. 5176231f75bSLuigi Rizzo */ 5186231f75bSLuigi Rizzo 5196231f75bSLuigi Rizzo int 5206231f75bSLuigi Rizzo g_register_classifier(struct g_classifier_hook *hook) 5216231f75bSLuigi Rizzo { 5226231f75bSLuigi Rizzo 5236231f75bSLuigi Rizzo g_bioq_lock(&g_bio_run_down); 5246231f75bSLuigi Rizzo TAILQ_INSERT_TAIL(&g_classifier_tailq, hook, link); 5256231f75bSLuigi Rizzo g_bioq_unlock(&g_bio_run_down); 5266231f75bSLuigi Rizzo 5276231f75bSLuigi Rizzo return (0); 5286231f75bSLuigi Rizzo } 5296231f75bSLuigi Rizzo 5306231f75bSLuigi Rizzo void 5316231f75bSLuigi Rizzo g_unregister_classifier(struct g_classifier_hook *hook) 5326231f75bSLuigi Rizzo { 5336231f75bSLuigi Rizzo struct g_classifier_hook *entry; 5346231f75bSLuigi Rizzo 5356231f75bSLuigi Rizzo g_bioq_lock(&g_bio_run_down); 5366231f75bSLuigi Rizzo TAILQ_FOREACH(entry, &g_classifier_tailq, link) { 5376231f75bSLuigi Rizzo if (entry == hook) { 5386231f75bSLuigi Rizzo TAILQ_REMOVE(&g_classifier_tailq, hook, link); 5396231f75bSLuigi Rizzo break; 5406231f75bSLuigi Rizzo } 5416231f75bSLuigi Rizzo } 5426231f75bSLuigi Rizzo g_bioq_unlock(&g_bio_run_down); 5436231f75bSLuigi Rizzo } 5446231f75bSLuigi Rizzo 5456231f75bSLuigi Rizzo static void 5466231f75bSLuigi Rizzo g_run_classifiers(struct bio *bp) 5476231f75bSLuigi Rizzo { 5486231f75bSLuigi Rizzo struct g_classifier_hook *hook; 5496231f75bSLuigi Rizzo int classified = 0; 5506231f75bSLuigi Rizzo 5518532d381SConrad Meyer biotrack(bp, __func__); 5528532d381SConrad Meyer 5536231f75bSLuigi Rizzo TAILQ_FOREACH(hook, &g_classifier_tailq, link) 5546231f75bSLuigi Rizzo classified |= hook->func(hook->arg, bp); 5556231f75bSLuigi Rizzo 5566231f75bSLuigi Rizzo if (!classified) 5576231f75bSLuigi Rizzo bp->bio_classifier1 = BIO_NOTCLASSIFIED; 5586231f75bSLuigi Rizzo } 5596231f75bSLuigi Rizzo 560dd84a43cSPoul-Henning Kamp void 561dd84a43cSPoul-Henning Kamp g_io_request(struct bio *bp, struct g_consumer *cp) 562dd84a43cSPoul-Henning Kamp { 563801bb689SPoul-Henning Kamp struct g_provider *pp; 56440ea77a0SAlexander Motin struct mtx *mtxp; 56540ea77a0SAlexander Motin int direct, error, first; 5668076d204SWarner Losh uint8_t cmd; 567dd84a43cSPoul-Henning Kamp 5688532d381SConrad Meyer biotrack(bp, __func__); 5698532d381SConrad Meyer 570d0e17c1bSPoul-Henning Kamp KASSERT(cp != NULL, ("NULL cp in g_io_request")); 571d0e17c1bSPoul-Henning Kamp KASSERT(bp != NULL, ("NULL bp in g_io_request")); 572e060b6bdSPoul-Henning Kamp pp = cp->provider; 573801bb689SPoul-Henning Kamp KASSERT(pp != NULL, ("consumer not attached in g_io_request")); 57492ee312dSPawel Jakub Dawidek #ifdef DIAGNOSTIC 57592ee312dSPawel Jakub Dawidek KASSERT(bp->bio_driver1 == NULL, 57692ee312dSPawel Jakub Dawidek ("bio_driver1 used by the consumer (geom %s)", cp->geom->name)); 57792ee312dSPawel Jakub Dawidek KASSERT(bp->bio_driver2 == NULL, 57892ee312dSPawel Jakub Dawidek ("bio_driver2 used by the consumer (geom %s)", cp->geom->name)); 57992ee312dSPawel Jakub Dawidek KASSERT(bp->bio_pflags == 0, 58092ee312dSPawel Jakub Dawidek ("bio_pflags used by the consumer (geom %s)", cp->geom->name)); 58192ee312dSPawel Jakub Dawidek /* 58292ee312dSPawel Jakub Dawidek * Remember consumer's private fields, so we can detect if they were 58392ee312dSPawel Jakub Dawidek * modified by the provider. 58492ee312dSPawel Jakub Dawidek */ 58592ee312dSPawel Jakub Dawidek bp->_bio_caller1 = bp->bio_caller1; 58692ee312dSPawel Jakub Dawidek bp->_bio_caller2 = bp->bio_caller2; 58792ee312dSPawel Jakub Dawidek bp->_bio_cflags = bp->bio_cflags; 58892ee312dSPawel Jakub Dawidek #endif 589801bb689SPoul-Henning Kamp 5908076d204SWarner Losh cmd = bp->bio_cmd; 5918076d204SWarner Losh if (cmd == BIO_READ || cmd == BIO_WRITE || cmd == BIO_GETATTR) { 592c3618c65SPawel Jakub Dawidek KASSERT(bp->bio_data != NULL, 5939a8fa125SWarner Losh ("NULL bp->data in g_io_request(cmd=%hu)", bp->bio_cmd)); 5941ded77b2SPawel Jakub Dawidek } 5958076d204SWarner Losh if (cmd == BIO_DELETE || cmd == BIO_FLUSH) { 5961ded77b2SPawel Jakub Dawidek KASSERT(bp->bio_data == NULL, 5979a8fa125SWarner Losh ("non-NULL bp->data in g_io_request(cmd=%hu)", 5981ded77b2SPawel Jakub Dawidek bp->bio_cmd)); 599c3618c65SPawel Jakub Dawidek } 6008076d204SWarner Losh if (cmd == BIO_READ || cmd == BIO_WRITE || cmd == BIO_DELETE) { 601dcbd0fe5SPoul-Henning Kamp KASSERT(bp->bio_offset % cp->provider->sectorsize == 0, 602dcbd0fe5SPoul-Henning Kamp ("wrong offset %jd for sectorsize %u", 603dcbd0fe5SPoul-Henning Kamp bp->bio_offset, cp->provider->sectorsize)); 604dcbd0fe5SPoul-Henning Kamp KASSERT(bp->bio_length % cp->provider->sectorsize == 0, 605dcbd0fe5SPoul-Henning Kamp ("wrong length %jd for sectorsize %u", 606dcbd0fe5SPoul-Henning Kamp bp->bio_length, cp->provider->sectorsize)); 607dcbd0fe5SPoul-Henning Kamp } 608dcbd0fe5SPoul-Henning Kamp 609f7717523SStephan Uphoff g_trace(G_T_BIO, "bio_request(%p) from %p(%s) to %p(%s) cmd %d", 610f7717523SStephan Uphoff bp, cp, cp->geom->name, pp, pp->name, bp->bio_cmd); 611f7717523SStephan Uphoff 612dd84a43cSPoul-Henning Kamp bp->bio_from = cp; 613801bb689SPoul-Henning Kamp bp->bio_to = pp; 6142fccec19SPoul-Henning Kamp bp->bio_error = 0; 6152fccec19SPoul-Henning Kamp bp->bio_completed = 0; 616dd84a43cSPoul-Henning Kamp 61719fa21aaSPoul-Henning Kamp KASSERT(!(bp->bio_flags & BIO_ONQUEUE), 61819fa21aaSPoul-Henning Kamp ("Bio already on queue bp=%p", bp)); 61940ea77a0SAlexander Motin if ((g_collectstats & G_STATS_CONSUMERS) != 0 || 62040ea77a0SAlexander Motin ((g_collectstats & G_STATS_PROVIDERS) != 0 && pp->stat != NULL)) 62119fa21aaSPoul-Henning Kamp binuptime(&bp->bio_t0); 622a5be8eb5SAlexander Motin else 623a5be8eb5SAlexander Motin getbinuptime(&bp->bio_t0); 6248827c821SPoul-Henning Kamp 62540ea77a0SAlexander Motin #ifdef GET_STACK_USAGE 626347e9d54SKonstantin Belousov direct = (cp->flags & G_CF_DIRECT_SEND) != 0 && 627347e9d54SKonstantin Belousov (pp->flags & G_PF_DIRECT_RECEIVE) != 0 && 62840ea77a0SAlexander Motin !g_is_geom_thread(curthread) && 6299b349650SKonstantin Belousov ((pp->flags & G_PF_ACCEPT_UNMAPPED) != 0 || 6303f2e5b85SWarner Losh (bp->bio_flags & BIO_UNMAPPED) == 0 || THREAD_CAN_SLEEP()) && 6313f2e5b85SWarner Losh pace == 0; 63240ea77a0SAlexander Motin if (direct) { 63340ea77a0SAlexander Motin /* Block direct execution if less then half of stack left. */ 63440ea77a0SAlexander Motin size_t st, su; 63540ea77a0SAlexander Motin GET_STACK_USAGE(st, su); 63640ea77a0SAlexander Motin if (su * 2 > st) 63740ea77a0SAlexander Motin direct = 0; 63840ea77a0SAlexander Motin } 63940ea77a0SAlexander Motin #else 64040ea77a0SAlexander Motin direct = 0; 64140ea77a0SAlexander Motin #endif 64240ea77a0SAlexander Motin 64340ea77a0SAlexander Motin if (!TAILQ_EMPTY(&g_classifier_tailq) && !bp->bio_classifier1) { 64440ea77a0SAlexander Motin g_bioq_lock(&g_bio_run_down); 64540ea77a0SAlexander Motin g_run_classifiers(bp); 64640ea77a0SAlexander Motin g_bioq_unlock(&g_bio_run_down); 64740ea77a0SAlexander Motin } 64840ea77a0SAlexander Motin 6498827c821SPoul-Henning Kamp /* 6508827c821SPoul-Henning Kamp * The statistics collection is lockless, as such, but we 6518827c821SPoul-Henning Kamp * can not update one instance of the statistics from more 6528827c821SPoul-Henning Kamp * than one thread at a time, so grab the lock first. 6538827c821SPoul-Henning Kamp */ 65440ea77a0SAlexander Motin mtxp = mtx_pool_find(mtxpool_sleep, pp); 65540ea77a0SAlexander Motin mtx_lock(mtxp); 65640ea77a0SAlexander Motin if (g_collectstats & G_STATS_PROVIDERS) 65719fa21aaSPoul-Henning Kamp devstat_start_transaction(pp->stat, &bp->bio_t0); 65840ea77a0SAlexander Motin if (g_collectstats & G_STATS_CONSUMERS) 65919fa21aaSPoul-Henning Kamp devstat_start_transaction(cp->stat, &bp->bio_t0); 66019fa21aaSPoul-Henning Kamp pp->nstart++; 661cf457284SPoul-Henning Kamp cp->nstart++; 66240ea77a0SAlexander Motin mtx_unlock(mtxp); 66340ea77a0SAlexander Motin 66440ea77a0SAlexander Motin if (direct) { 66540ea77a0SAlexander Motin error = g_io_check(bp); 66640ea77a0SAlexander Motin if (error >= 0) { 66740ea77a0SAlexander Motin CTR3(KTR_GEOM, "g_io_request g_io_check on bp %p " 66840ea77a0SAlexander Motin "provider %s returned %d", bp, bp->bio_to->name, 66940ea77a0SAlexander Motin error); 67040ea77a0SAlexander Motin g_io_deliver(bp, error); 67140ea77a0SAlexander Motin return; 67240ea77a0SAlexander Motin } 67340ea77a0SAlexander Motin bp->bio_to->geom->start(bp); 67440ea77a0SAlexander Motin } else { 67540ea77a0SAlexander Motin g_bioq_lock(&g_bio_run_down); 6760d883b11SAlexander Motin first = TAILQ_EMPTY(&g_bio_run_down.bio_queue); 67719fa21aaSPoul-Henning Kamp TAILQ_INSERT_TAIL(&g_bio_run_down.bio_queue, bp, bio_queue); 67840ea77a0SAlexander Motin bp->bio_flags |= BIO_ONQUEUE; 67919fa21aaSPoul-Henning Kamp g_bio_run_down.bio_queue_length++; 68019fa21aaSPoul-Henning Kamp g_bioq_unlock(&g_bio_run_down); 6812fccec19SPoul-Henning Kamp /* Pass it on down. */ 6820d883b11SAlexander Motin if (first) 683dd84a43cSPoul-Henning Kamp wakeup(&g_wait_down); 684dd84a43cSPoul-Henning Kamp } 68540ea77a0SAlexander Motin } 686dd84a43cSPoul-Henning Kamp 687dd84a43cSPoul-Henning Kamp void 68872840432SPoul-Henning Kamp g_io_deliver(struct bio *bp, int error) 689dd84a43cSPoul-Henning Kamp { 690e431d66cSAlexander Motin struct bintime now; 691801bb689SPoul-Henning Kamp struct g_consumer *cp; 692801bb689SPoul-Henning Kamp struct g_provider *pp; 69340ea77a0SAlexander Motin struct mtx *mtxp; 69440ea77a0SAlexander Motin int direct, first; 695dd84a43cSPoul-Henning Kamp 6968532d381SConrad Meyer biotrack(bp, __func__); 6978532d381SConrad Meyer 698e060b6bdSPoul-Henning Kamp KASSERT(bp != NULL, ("NULL bp in g_io_deliver")); 699801bb689SPoul-Henning Kamp pp = bp->bio_to; 700f7eeab17SPoul-Henning Kamp KASSERT(pp != NULL, ("NULL bio_to in g_io_deliver")); 701f7eeab17SPoul-Henning Kamp cp = bp->bio_from; 702f7eeab17SPoul-Henning Kamp if (cp == NULL) { 703f7eeab17SPoul-Henning Kamp bp->bio_error = error; 704f7eeab17SPoul-Henning Kamp bp->bio_done(bp); 705f7eeab17SPoul-Henning Kamp return; 706f7eeab17SPoul-Henning Kamp } 707801bb689SPoul-Henning Kamp KASSERT(cp != NULL, ("NULL bio_from in g_io_deliver")); 708801bb689SPoul-Henning Kamp KASSERT(cp->geom != NULL, ("NULL bio_from->geom in g_io_deliver")); 709fb231f36SEdward Tomasz Napierala #ifdef DIAGNOSTIC 710fb231f36SEdward Tomasz Napierala /* 711fb231f36SEdward Tomasz Napierala * Some classes - GJournal in particular - can modify bio's 712fb231f36SEdward Tomasz Napierala * private fields while the bio is in transit; G_GEOM_VOLATILE_BIO 713fb231f36SEdward Tomasz Napierala * flag means it's an expected behaviour for that particular geom. 714fb231f36SEdward Tomasz Napierala */ 715fb231f36SEdward Tomasz Napierala if ((cp->geom->flags & G_GEOM_VOLATILE_BIO) == 0) { 716fb231f36SEdward Tomasz Napierala KASSERT(bp->bio_caller1 == bp->_bio_caller1, 717fb231f36SEdward Tomasz Napierala ("bio_caller1 used by the provider %s", pp->name)); 718fb231f36SEdward Tomasz Napierala KASSERT(bp->bio_caller2 == bp->_bio_caller2, 719fb231f36SEdward Tomasz Napierala ("bio_caller2 used by the provider %s", pp->name)); 720fb231f36SEdward Tomasz Napierala KASSERT(bp->bio_cflags == bp->_bio_cflags, 721fb231f36SEdward Tomasz Napierala ("bio_cflags used by the provider %s", pp->name)); 722fb231f36SEdward Tomasz Napierala } 723fb231f36SEdward Tomasz Napierala #endif 72446aeebecSPawel Jakub Dawidek KASSERT(bp->bio_completed >= 0, ("bio_completed can't be less than 0")); 72546aeebecSPawel Jakub Dawidek KASSERT(bp->bio_completed <= bp->bio_length, 72646aeebecSPawel Jakub Dawidek ("bio_completed can't be greater than bio_length")); 7275ab413bfSPoul-Henning Kamp 728dd84a43cSPoul-Henning Kamp g_trace(G_T_BIO, 7290355b86eSPoul-Henning Kamp "g_io_deliver(%p) from %p(%s) to %p(%s) cmd %d error %d off %jd len %jd", 730801bb689SPoul-Henning Kamp bp, cp, cp->geom->name, pp, pp->name, bp->bio_cmd, error, 7310355b86eSPoul-Henning Kamp (intmax_t)bp->bio_offset, (intmax_t)bp->bio_length); 732801bb689SPoul-Henning Kamp 73319fa21aaSPoul-Henning Kamp KASSERT(!(bp->bio_flags & BIO_ONQUEUE), 73419fa21aaSPoul-Henning Kamp ("Bio already on queue bp=%p", bp)); 73519fa21aaSPoul-Henning Kamp 736dcbd0fe5SPoul-Henning Kamp /* 737dcbd0fe5SPoul-Henning Kamp * XXX: next two doesn't belong here 738dcbd0fe5SPoul-Henning Kamp */ 739e24cbd90SPoul-Henning Kamp bp->bio_bcount = bp->bio_length; 740e24cbd90SPoul-Henning Kamp bp->bio_resid = bp->bio_bcount - bp->bio_completed; 74119fa21aaSPoul-Henning Kamp 74240ea77a0SAlexander Motin #ifdef GET_STACK_USAGE 74340ea77a0SAlexander Motin direct = (pp->flags & G_PF_DIRECT_SEND) && 74440ea77a0SAlexander Motin (cp->flags & G_CF_DIRECT_RECEIVE) && 74540ea77a0SAlexander Motin !g_is_geom_thread(curthread); 74640ea77a0SAlexander Motin if (direct) { 74740ea77a0SAlexander Motin /* Block direct execution if less then half of stack left. */ 74840ea77a0SAlexander Motin size_t st, su; 74940ea77a0SAlexander Motin GET_STACK_USAGE(st, su); 75040ea77a0SAlexander Motin if (su * 2 > st) 75140ea77a0SAlexander Motin direct = 0; 75240ea77a0SAlexander Motin } 75340ea77a0SAlexander Motin #else 75440ea77a0SAlexander Motin direct = 0; 75540ea77a0SAlexander Motin #endif 75640ea77a0SAlexander Motin 7578827c821SPoul-Henning Kamp /* 7588827c821SPoul-Henning Kamp * The statistics collection is lockless, as such, but we 7598827c821SPoul-Henning Kamp * can not update one instance of the statistics from more 7608827c821SPoul-Henning Kamp * than one thread at a time, so grab the lock first. 7618827c821SPoul-Henning Kamp */ 76240ea77a0SAlexander Motin if ((g_collectstats & G_STATS_CONSUMERS) != 0 || 76340ea77a0SAlexander Motin ((g_collectstats & G_STATS_PROVIDERS) != 0 && pp->stat != NULL)) 764e431d66cSAlexander Motin binuptime(&now); 76540ea77a0SAlexander Motin mtxp = mtx_pool_find(mtxpool_sleep, cp); 76640ea77a0SAlexander Motin mtx_lock(mtxp); 76740ea77a0SAlexander Motin if (g_collectstats & G_STATS_PROVIDERS) 768e431d66cSAlexander Motin devstat_end_transaction_bio_bt(pp->stat, bp, &now); 76940ea77a0SAlexander Motin if (g_collectstats & G_STATS_CONSUMERS) 770e431d66cSAlexander Motin devstat_end_transaction_bio_bt(cp->stat, bp, &now); 771c6ae9b5fSPoul-Henning Kamp cp->nend++; 772c6ae9b5fSPoul-Henning Kamp pp->nend++; 77340ea77a0SAlexander Motin mtx_unlock(mtxp); 77440ea77a0SAlexander Motin 77519fa21aaSPoul-Henning Kamp if (error != ENOMEM) { 77619fa21aaSPoul-Henning Kamp bp->bio_error = error; 77740ea77a0SAlexander Motin if (direct) { 77840ea77a0SAlexander Motin biodone(bp); 77940ea77a0SAlexander Motin } else { 78040ea77a0SAlexander Motin g_bioq_lock(&g_bio_run_up); 7810d883b11SAlexander Motin first = TAILQ_EMPTY(&g_bio_run_up.bio_queue); 78219fa21aaSPoul-Henning Kamp TAILQ_INSERT_TAIL(&g_bio_run_up.bio_queue, bp, bio_queue); 783276f72c5SPoul-Henning Kamp bp->bio_flags |= BIO_ONQUEUE; 78419fa21aaSPoul-Henning Kamp g_bio_run_up.bio_queue_length++; 78519fa21aaSPoul-Henning Kamp g_bioq_unlock(&g_bio_run_up); 7860d883b11SAlexander Motin if (first) 78719fa21aaSPoul-Henning Kamp wakeup(&g_wait_up); 78840ea77a0SAlexander Motin } 78919fa21aaSPoul-Henning Kamp return; 79019fa21aaSPoul-Henning Kamp } 791dd84a43cSPoul-Henning Kamp 7922cc9686eSPoul-Henning Kamp if (bootverbose) 793801bb689SPoul-Henning Kamp printf("ENOMEM %p on %p(%s)\n", bp, pp, pp->name); 7941b949c05SPawel Jakub Dawidek bp->bio_children = 0; 7951b949c05SPawel Jakub Dawidek bp->bio_inbed = 0; 79660114438SPawel Jakub Dawidek bp->bio_driver1 = NULL; 79760114438SPawel Jakub Dawidek bp->bio_driver2 = NULL; 79860114438SPawel Jakub Dawidek bp->bio_pflags = 0; 799801bb689SPoul-Henning Kamp g_io_request(bp, cp); 8003f2e5b85SWarner Losh pace = 1; 8013432e4fdSPoul-Henning Kamp return; 8023432e4fdSPoul-Henning Kamp } 803dd84a43cSPoul-Henning Kamp 804ee75e7deSKonstantin Belousov SYSCTL_DECL(_kern_geom); 805ee75e7deSKonstantin Belousov 806ee75e7deSKonstantin Belousov static long transient_maps; 807ee75e7deSKonstantin Belousov SYSCTL_LONG(_kern_geom, OID_AUTO, transient_maps, CTLFLAG_RD, 808ee75e7deSKonstantin Belousov &transient_maps, 0, 809ee75e7deSKonstantin Belousov "Total count of the transient mapping requests"); 810ee75e7deSKonstantin Belousov u_int transient_map_retries = 10; 811ee75e7deSKonstantin Belousov SYSCTL_UINT(_kern_geom, OID_AUTO, transient_map_retries, CTLFLAG_RW, 812ee75e7deSKonstantin Belousov &transient_map_retries, 0, 813ee75e7deSKonstantin Belousov "Max count of retries used before giving up on creating transient map"); 814ee75e7deSKonstantin Belousov int transient_map_hard_failures; 815ee75e7deSKonstantin Belousov SYSCTL_INT(_kern_geom, OID_AUTO, transient_map_hard_failures, CTLFLAG_RD, 816ee75e7deSKonstantin Belousov &transient_map_hard_failures, 0, 817ee75e7deSKonstantin Belousov "Failures to establish the transient mapping due to retry attempts " 818ee75e7deSKonstantin Belousov "exhausted"); 819ee75e7deSKonstantin Belousov int transient_map_soft_failures; 820ee75e7deSKonstantin Belousov SYSCTL_INT(_kern_geom, OID_AUTO, transient_map_soft_failures, CTLFLAG_RD, 821ee75e7deSKonstantin Belousov &transient_map_soft_failures, 0, 822ee75e7deSKonstantin Belousov "Count of retried failures to establish the transient mapping"); 823ee75e7deSKonstantin Belousov int inflight_transient_maps; 824ee75e7deSKonstantin Belousov SYSCTL_INT(_kern_geom, OID_AUTO, inflight_transient_maps, CTLFLAG_RD, 825ee75e7deSKonstantin Belousov &inflight_transient_maps, 0, 826ee75e7deSKonstantin Belousov "Current count of the active transient maps"); 827ee75e7deSKonstantin Belousov 828ee75e7deSKonstantin Belousov static int 829ee75e7deSKonstantin Belousov g_io_transient_map_bio(struct bio *bp) 830ee75e7deSKonstantin Belousov { 831ee75e7deSKonstantin Belousov vm_offset_t addr; 832ee75e7deSKonstantin Belousov long size; 833ee75e7deSKonstantin Belousov u_int retried; 834ee75e7deSKonstantin Belousov 8356c83fce3SKonstantin Belousov KASSERT(unmapped_buf_allowed, ("unmapped disabled")); 8366c83fce3SKonstantin Belousov 837ee75e7deSKonstantin Belousov size = round_page(bp->bio_ma_offset + bp->bio_length); 838ee75e7deSKonstantin Belousov KASSERT(size / PAGE_SIZE == bp->bio_ma_n, ("Bio too short %p", bp)); 839ee75e7deSKonstantin Belousov addr = 0; 840ee75e7deSKonstantin Belousov retried = 0; 841ee75e7deSKonstantin Belousov atomic_add_long(&transient_maps, 1); 842ee75e7deSKonstantin Belousov retry: 8435f518366SJeff Roberson if (vmem_alloc(transient_arena, size, M_BESTFIT | M_NOWAIT, &addr)) { 844ee75e7deSKonstantin Belousov if (transient_map_retries != 0 && 845ee75e7deSKonstantin Belousov retried >= transient_map_retries) { 846ee75e7deSKonstantin Belousov CTR2(KTR_GEOM, "g_down cannot map bp %p provider %s", 847ee75e7deSKonstantin Belousov bp, bp->bio_to->name); 848ee75e7deSKonstantin Belousov atomic_add_int(&transient_map_hard_failures, 1); 84940ea77a0SAlexander Motin return (EDEADLK/* XXXKIB */); 850ee75e7deSKonstantin Belousov } else { 851ee75e7deSKonstantin Belousov /* 852ee75e7deSKonstantin Belousov * Naive attempt to quisce the I/O to get more 853ee75e7deSKonstantin Belousov * in-flight requests completed and defragment 8545f518366SJeff Roberson * the transient_arena. 855ee75e7deSKonstantin Belousov */ 856ee75e7deSKonstantin Belousov CTR3(KTR_GEOM, "g_down retrymap bp %p provider %s r %d", 857ee75e7deSKonstantin Belousov bp, bp->bio_to->name, retried); 858ee75e7deSKonstantin Belousov pause("g_d_tra", hz / 10); 859ee75e7deSKonstantin Belousov retried++; 860ee75e7deSKonstantin Belousov atomic_add_int(&transient_map_soft_failures, 1); 861ee75e7deSKonstantin Belousov goto retry; 862ee75e7deSKonstantin Belousov } 863ee75e7deSKonstantin Belousov } 864ee75e7deSKonstantin Belousov atomic_add_int(&inflight_transient_maps, 1); 865ee75e7deSKonstantin Belousov pmap_qenter((vm_offset_t)addr, bp->bio_ma, OFF_TO_IDX(size)); 866ee75e7deSKonstantin Belousov bp->bio_data = (caddr_t)addr + bp->bio_ma_offset; 867ee75e7deSKonstantin Belousov bp->bio_flags |= BIO_TRANSIENT_MAPPING; 868ee75e7deSKonstantin Belousov bp->bio_flags &= ~BIO_UNMAPPED; 86940ea77a0SAlexander Motin return (EJUSTRETURN); 870ee75e7deSKonstantin Belousov } 871ee75e7deSKonstantin Belousov 872dd84a43cSPoul-Henning Kamp void 873dd84a43cSPoul-Henning Kamp g_io_schedule_down(struct thread *tp __unused) 874dd84a43cSPoul-Henning Kamp { 875dd84a43cSPoul-Henning Kamp struct bio *bp; 876e39d70d4SPoul-Henning Kamp int error; 877dd84a43cSPoul-Henning Kamp 878dd84a43cSPoul-Henning Kamp for(;;) { 879f0e185d7SPoul-Henning Kamp g_bioq_lock(&g_bio_run_down); 880dd84a43cSPoul-Henning Kamp bp = g_bioq_first(&g_bio_run_down); 881f0e185d7SPoul-Henning Kamp if (bp == NULL) { 88249dbb61dSRobert Watson CTR0(KTR_GEOM, "g_down going to sleep"); 883f0e185d7SPoul-Henning Kamp msleep(&g_wait_down, &g_bio_run_down.bio_queue_lock, 8847fc019afSAlexander Motin PRIBIO | PDROP, "-", 0); 885f0e185d7SPoul-Henning Kamp continue; 886f0e185d7SPoul-Henning Kamp } 88749dbb61dSRobert Watson CTR0(KTR_GEOM, "g_down has work to do"); 888f0e185d7SPoul-Henning Kamp g_bioq_unlock(&g_bio_run_down); 8898532d381SConrad Meyer biotrack(bp, __func__); 8903f2e5b85SWarner Losh if (pace != 0) { 8913f2e5b85SWarner Losh /* 8923f2e5b85SWarner Losh * There has been at least one memory allocation 8933f2e5b85SWarner Losh * failure since the last I/O completed. Pause 1ms to 8943f2e5b85SWarner Losh * give the system a chance to free up memory. We only 8953f2e5b85SWarner Losh * do this once because a large number of allocations 8963f2e5b85SWarner Losh * can fail in the direct dispatch case and there's no 8973f2e5b85SWarner Losh * relationship between the number of these failures and 8983f2e5b85SWarner Losh * the length of the outage. If there's still an outage, 8993f2e5b85SWarner Losh * we'll pause again and again until it's 9003f2e5b85SWarner Losh * resolved. Older versions paused longer and once per 9013f2e5b85SWarner Losh * allocation failure. This was OK for a single threaded 9023f2e5b85SWarner Losh * g_down, but with direct dispatch would lead to max of 9033f2e5b85SWarner Losh * 10 IOPs for minutes at a time when transient memory 9043f2e5b85SWarner Losh * issues prevented allocation for a batch of requests 9053f2e5b85SWarner Losh * from the upper layers. 9063f2e5b85SWarner Losh * 9073f2e5b85SWarner Losh * XXX This pacing is really lame. It needs to be solved 9083f2e5b85SWarner Losh * by other methods. This is OK only because the worst 9093f2e5b85SWarner Losh * case scenario is so rare. In the worst case scenario 9103f2e5b85SWarner Losh * all memory is tied up waiting for I/O to complete 9113f2e5b85SWarner Losh * which can never happen since we can't allocate bios 9123f2e5b85SWarner Losh * for that I/O. 9133f2e5b85SWarner Losh */ 9143f2e5b85SWarner Losh CTR0(KTR_GEOM, "g_down pacing self"); 9153f2e5b85SWarner Losh pause("g_down", min(hz/1000, 1)); 9163f2e5b85SWarner Losh pace = 0; 917376ceb79SPoul-Henning Kamp } 91840ea77a0SAlexander Motin CTR2(KTR_GEOM, "g_down processing bp %p provider %s", bp, 91940ea77a0SAlexander Motin bp->bio_to->name); 920e39d70d4SPoul-Henning Kamp error = g_io_check(bp); 92140ea77a0SAlexander Motin if (error >= 0) { 92249dbb61dSRobert Watson CTR3(KTR_GEOM, "g_down g_io_check on bp %p provider " 92349dbb61dSRobert Watson "%s returned %d", bp, bp->bio_to->name, error); 924e39d70d4SPoul-Henning Kamp g_io_deliver(bp, error); 925e39d70d4SPoul-Henning Kamp continue; 926e39d70d4SPoul-Henning Kamp } 92751460da8SJohn Baldwin THREAD_NO_SLEEPING(); 92849dbb61dSRobert Watson CTR4(KTR_GEOM, "g_down starting bp %p provider %s off %ld " 92949dbb61dSRobert Watson "len %ld", bp, bp->bio_to->name, bp->bio_offset, 93049dbb61dSRobert Watson bp->bio_length); 931dd84a43cSPoul-Henning Kamp bp->bio_to->geom->start(bp); 93251460da8SJohn Baldwin THREAD_SLEEPING_OK(); 933dd84a43cSPoul-Henning Kamp } 934dd84a43cSPoul-Henning Kamp } 935dd84a43cSPoul-Henning Kamp 936dd84a43cSPoul-Henning Kamp void 937dd84a43cSPoul-Henning Kamp g_io_schedule_up(struct thread *tp __unused) 938dd84a43cSPoul-Henning Kamp { 939dd84a43cSPoul-Henning Kamp struct bio *bp; 9400c4440c3SEdward Tomasz Napierala 941dd84a43cSPoul-Henning Kamp for(;;) { 942f0e185d7SPoul-Henning Kamp g_bioq_lock(&g_bio_run_up); 9430c4440c3SEdward Tomasz Napierala bp = g_bioq_first(&g_bio_run_up); 9440c4440c3SEdward Tomasz Napierala if (bp == NULL) { 9450c4440c3SEdward Tomasz Napierala CTR0(KTR_GEOM, "g_up going to sleep"); 9460c4440c3SEdward Tomasz Napierala msleep(&g_wait_up, &g_bio_run_up.bio_queue_lock, 9470c4440c3SEdward Tomasz Napierala PRIBIO | PDROP, "-", 0); 9485fcf4e43SPoul-Henning Kamp continue; 9495fcf4e43SPoul-Henning Kamp } 950f0e185d7SPoul-Henning Kamp g_bioq_unlock(&g_bio_run_up); 95151460da8SJohn Baldwin THREAD_NO_SLEEPING(); 95249dbb61dSRobert Watson CTR4(KTR_GEOM, "g_up biodone bp %p provider %s off " 953c4901b67SSean Bruno "%jd len %ld", bp, bp->bio_to->name, 95449dbb61dSRobert Watson bp->bio_offset, bp->bio_length); 95553706245SPoul-Henning Kamp biodone(bp); 95651460da8SJohn Baldwin THREAD_SLEEPING_OK(); 957dd84a43cSPoul-Henning Kamp } 958dd84a43cSPoul-Henning Kamp } 959dd84a43cSPoul-Henning Kamp 960dd84a43cSPoul-Henning Kamp void * 961dd84a43cSPoul-Henning Kamp g_read_data(struct g_consumer *cp, off_t offset, off_t length, int *error) 962dd84a43cSPoul-Henning Kamp { 963dd84a43cSPoul-Henning Kamp struct bio *bp; 964dd84a43cSPoul-Henning Kamp void *ptr; 965dd84a43cSPoul-Henning Kamp int errorc; 966dd84a43cSPoul-Henning Kamp 9678dd5480dSPawel Jakub Dawidek KASSERT(length > 0 && length >= cp->provider->sectorsize && 9688dd5480dSPawel Jakub Dawidek length <= MAXPHYS, ("g_read_data(): invalid length %jd", 9698dd5480dSPawel Jakub Dawidek (intmax_t)length)); 9703eb6ffdfSPoul-Henning Kamp 971a2033c96SPoul-Henning Kamp bp = g_alloc_bio(); 972dd84a43cSPoul-Henning Kamp bp->bio_cmd = BIO_READ; 973dd84a43cSPoul-Henning Kamp bp->bio_done = NULL; 974dd84a43cSPoul-Henning Kamp bp->bio_offset = offset; 975dd84a43cSPoul-Henning Kamp bp->bio_length = length; 976a163d034SWarner Losh ptr = g_malloc(length, M_WAITOK); 977dd84a43cSPoul-Henning Kamp bp->bio_data = ptr; 978dd84a43cSPoul-Henning Kamp g_io_request(bp, cp); 97953706245SPoul-Henning Kamp errorc = biowait(bp, "gread"); 980dd84a43cSPoul-Henning Kamp if (error != NULL) 981dd84a43cSPoul-Henning Kamp *error = errorc; 982dd84a43cSPoul-Henning Kamp g_destroy_bio(bp); 983dd84a43cSPoul-Henning Kamp if (errorc) { 984dd84a43cSPoul-Henning Kamp g_free(ptr); 985dd84a43cSPoul-Henning Kamp ptr = NULL; 986dd84a43cSPoul-Henning Kamp } 987dd84a43cSPoul-Henning Kamp return (ptr); 988dd84a43cSPoul-Henning Kamp } 98990b1cd56SPoul-Henning Kamp 990dffce215SKirk McKusick /* 991dffce215SKirk McKusick * A read function for use by ffs_sbget when used by GEOM-layer routines. 992dffce215SKirk McKusick */ 993dffce215SKirk McKusick int 994dffce215SKirk McKusick g_use_g_read_data(void *devfd, off_t loc, void **bufp, int size) 995dffce215SKirk McKusick { 996dffce215SKirk McKusick struct g_consumer *cp; 997dffce215SKirk McKusick 998efbf3964SKirk McKusick KASSERT(*bufp == NULL, 999efbf3964SKirk McKusick ("g_use_g_read_data: non-NULL *bufp %p\n", *bufp)); 1000efbf3964SKirk McKusick 1001dffce215SKirk McKusick cp = (struct g_consumer *)devfd; 1002dffce215SKirk McKusick /* 1003dffce215SKirk McKusick * Take care not to issue an invalid I/O request. The offset of 1004dffce215SKirk McKusick * the superblock candidate must be multiples of the provider's 1005dffce215SKirk McKusick * sector size, otherwise an FFS can't exist on the provider 1006dffce215SKirk McKusick * anyway. 1007dffce215SKirk McKusick */ 1008dffce215SKirk McKusick if (loc % cp->provider->sectorsize != 0) 1009dffce215SKirk McKusick return (ENOENT); 1010dffce215SKirk McKusick *bufp = g_read_data(cp, loc, size, NULL); 1011dffce215SKirk McKusick if (*bufp == NULL) 1012dffce215SKirk McKusick return (ENOENT); 1013dffce215SKirk McKusick return (0); 1014dffce215SKirk McKusick } 1015dffce215SKirk McKusick 101690b1cd56SPoul-Henning Kamp int 101790b1cd56SPoul-Henning Kamp g_write_data(struct g_consumer *cp, off_t offset, void *ptr, off_t length) 101890b1cd56SPoul-Henning Kamp { 101990b1cd56SPoul-Henning Kamp struct bio *bp; 102090b1cd56SPoul-Henning Kamp int error; 102190b1cd56SPoul-Henning Kamp 10228dd5480dSPawel Jakub Dawidek KASSERT(length > 0 && length >= cp->provider->sectorsize && 10238dd5480dSPawel Jakub Dawidek length <= MAXPHYS, ("g_write_data(): invalid length %jd", 10248dd5480dSPawel Jakub Dawidek (intmax_t)length)); 10253eb6ffdfSPoul-Henning Kamp 1026a2033c96SPoul-Henning Kamp bp = g_alloc_bio(); 102790b1cd56SPoul-Henning Kamp bp->bio_cmd = BIO_WRITE; 102890b1cd56SPoul-Henning Kamp bp->bio_done = NULL; 102990b1cd56SPoul-Henning Kamp bp->bio_offset = offset; 103090b1cd56SPoul-Henning Kamp bp->bio_length = length; 103190b1cd56SPoul-Henning Kamp bp->bio_data = ptr; 103290b1cd56SPoul-Henning Kamp g_io_request(bp, cp); 103390b1cd56SPoul-Henning Kamp error = biowait(bp, "gwrite"); 103490b1cd56SPoul-Henning Kamp g_destroy_bio(bp); 103590b1cd56SPoul-Henning Kamp return (error); 103690b1cd56SPoul-Henning Kamp } 103772e33095SPawel Jakub Dawidek 1038dffce215SKirk McKusick /* 1039dffce215SKirk McKusick * A write function for use by ffs_sbput when used by GEOM-layer routines. 1040dffce215SKirk McKusick */ 1041dffce215SKirk McKusick int 1042dffce215SKirk McKusick g_use_g_write_data(void *devfd, off_t loc, void *buf, int size) 1043dffce215SKirk McKusick { 1044dffce215SKirk McKusick 1045dffce215SKirk McKusick return (g_write_data((struct g_consumer *)devfd, loc, buf, size)); 1046dffce215SKirk McKusick } 1047dffce215SKirk McKusick 10482b17fb95SPawel Jakub Dawidek int 10492b17fb95SPawel Jakub Dawidek g_delete_data(struct g_consumer *cp, off_t offset, off_t length) 10502b17fb95SPawel Jakub Dawidek { 10512b17fb95SPawel Jakub Dawidek struct bio *bp; 10522b17fb95SPawel Jakub Dawidek int error; 10532b17fb95SPawel Jakub Dawidek 1054eed6cda9SPoul-Henning Kamp KASSERT(length > 0 && length >= cp->provider->sectorsize, 1055eed6cda9SPoul-Henning Kamp ("g_delete_data(): invalid length %jd", (intmax_t)length)); 10562b17fb95SPawel Jakub Dawidek 10572b17fb95SPawel Jakub Dawidek bp = g_alloc_bio(); 10582b17fb95SPawel Jakub Dawidek bp->bio_cmd = BIO_DELETE; 10592b17fb95SPawel Jakub Dawidek bp->bio_done = NULL; 10602b17fb95SPawel Jakub Dawidek bp->bio_offset = offset; 10612b17fb95SPawel Jakub Dawidek bp->bio_length = length; 10622b17fb95SPawel Jakub Dawidek bp->bio_data = NULL; 10632b17fb95SPawel Jakub Dawidek g_io_request(bp, cp); 10642b17fb95SPawel Jakub Dawidek error = biowait(bp, "gdelete"); 10652b17fb95SPawel Jakub Dawidek g_destroy_bio(bp); 10662b17fb95SPawel Jakub Dawidek return (error); 10672b17fb95SPawel Jakub Dawidek } 10682b17fb95SPawel Jakub Dawidek 106972e33095SPawel Jakub Dawidek void 1070ac03832eSConrad Meyer g_print_bio(const char *prefix, const struct bio *bp, const char *fmtsuffix, 1071ac03832eSConrad Meyer ...) 1072ac03832eSConrad Meyer { 1073ac03832eSConrad Meyer #ifndef PRINTF_BUFR_SIZE 1074ac03832eSConrad Meyer #define PRINTF_BUFR_SIZE 64 1075ac03832eSConrad Meyer #endif 1076ac03832eSConrad Meyer char bufr[PRINTF_BUFR_SIZE]; 1077ac03832eSConrad Meyer struct sbuf sb, *sbp __unused; 1078ac03832eSConrad Meyer va_list ap; 1079ac03832eSConrad Meyer 1080ac03832eSConrad Meyer sbp = sbuf_new(&sb, bufr, sizeof(bufr), SBUF_FIXEDLEN); 1081ac03832eSConrad Meyer KASSERT(sbp != NULL, ("sbuf_new misused?")); 1082ac03832eSConrad Meyer 1083ac03832eSConrad Meyer sbuf_set_drain(&sb, sbuf_printf_drain, NULL); 1084ac03832eSConrad Meyer 1085ac03832eSConrad Meyer sbuf_cat(&sb, prefix); 1086ac03832eSConrad Meyer g_format_bio(&sb, bp); 1087ac03832eSConrad Meyer 1088ac03832eSConrad Meyer va_start(ap, fmtsuffix); 1089ac03832eSConrad Meyer sbuf_vprintf(&sb, fmtsuffix, ap); 1090ac03832eSConrad Meyer va_end(ap); 1091ac03832eSConrad Meyer 1092ac03832eSConrad Meyer sbuf_nl_terminate(&sb); 1093ac03832eSConrad Meyer 1094ac03832eSConrad Meyer sbuf_finish(&sb); 1095ac03832eSConrad Meyer sbuf_delete(&sb); 1096ac03832eSConrad Meyer } 1097ac03832eSConrad Meyer 1098ac03832eSConrad Meyer void 1099ac03832eSConrad Meyer g_format_bio(struct sbuf *sb, const struct bio *bp) 110072e33095SPawel Jakub Dawidek { 110172e33095SPawel Jakub Dawidek const char *pname, *cmd = NULL; 110272e33095SPawel Jakub Dawidek 110372e33095SPawel Jakub Dawidek if (bp->bio_to != NULL) 110472e33095SPawel Jakub Dawidek pname = bp->bio_to->name; 110572e33095SPawel Jakub Dawidek else 110672e33095SPawel Jakub Dawidek pname = "[unknown]"; 110772e33095SPawel Jakub Dawidek 110872e33095SPawel Jakub Dawidek switch (bp->bio_cmd) { 110972e33095SPawel Jakub Dawidek case BIO_GETATTR: 111072e33095SPawel Jakub Dawidek cmd = "GETATTR"; 1111ac03832eSConrad Meyer sbuf_printf(sb, "%s[%s(attr=%s)]", pname, cmd, 1112ac03832eSConrad Meyer bp->bio_attribute); 111372e33095SPawel Jakub Dawidek return; 1114c3618c65SPawel Jakub Dawidek case BIO_FLUSH: 1115c3618c65SPawel Jakub Dawidek cmd = "FLUSH"; 1116ac03832eSConrad Meyer sbuf_printf(sb, "%s[%s]", pname, cmd); 1117c3618c65SPawel Jakub Dawidek return; 11189a6844d5SKenneth D. Merry case BIO_ZONE: { 11199a6844d5SKenneth D. Merry char *subcmd = NULL; 11209a6844d5SKenneth D. Merry cmd = "ZONE"; 11219a6844d5SKenneth D. Merry switch (bp->bio_zone.zone_cmd) { 11229a6844d5SKenneth D. Merry case DISK_ZONE_OPEN: 11239a6844d5SKenneth D. Merry subcmd = "OPEN"; 11249a6844d5SKenneth D. Merry break; 11259a6844d5SKenneth D. Merry case DISK_ZONE_CLOSE: 11269a6844d5SKenneth D. Merry subcmd = "CLOSE"; 11279a6844d5SKenneth D. Merry break; 11289a6844d5SKenneth D. Merry case DISK_ZONE_FINISH: 11299a6844d5SKenneth D. Merry subcmd = "FINISH"; 11309a6844d5SKenneth D. Merry break; 11319a6844d5SKenneth D. Merry case DISK_ZONE_RWP: 11329a6844d5SKenneth D. Merry subcmd = "RWP"; 11339a6844d5SKenneth D. Merry break; 11349a6844d5SKenneth D. Merry case DISK_ZONE_REPORT_ZONES: 11359a6844d5SKenneth D. Merry subcmd = "REPORT ZONES"; 11369a6844d5SKenneth D. Merry break; 11379a6844d5SKenneth D. Merry case DISK_ZONE_GET_PARAMS: 11389a6844d5SKenneth D. Merry subcmd = "GET PARAMS"; 11399a6844d5SKenneth D. Merry break; 11409a6844d5SKenneth D. Merry default: 11419a6844d5SKenneth D. Merry subcmd = "UNKNOWN"; 11429a6844d5SKenneth D. Merry break; 11439a6844d5SKenneth D. Merry } 1144ac03832eSConrad Meyer sbuf_printf(sb, "%s[%s,%s]", pname, cmd, subcmd); 11459a6844d5SKenneth D. Merry return; 11469a6844d5SKenneth D. Merry } 114772e33095SPawel Jakub Dawidek case BIO_READ: 114872e33095SPawel Jakub Dawidek cmd = "READ"; 11497ce513a5SEdward Tomasz Napierala break; 115072e33095SPawel Jakub Dawidek case BIO_WRITE: 115172e33095SPawel Jakub Dawidek cmd = "WRITE"; 11527ce513a5SEdward Tomasz Napierala break; 115372e33095SPawel Jakub Dawidek case BIO_DELETE: 115472e33095SPawel Jakub Dawidek cmd = "DELETE"; 11557ce513a5SEdward Tomasz Napierala break; 115672e33095SPawel Jakub Dawidek default: 115772e33095SPawel Jakub Dawidek cmd = "UNKNOWN"; 1158ac03832eSConrad Meyer sbuf_printf(sb, "%s[%s()]", pname, cmd); 115972e33095SPawel Jakub Dawidek return; 116072e33095SPawel Jakub Dawidek } 1161ac03832eSConrad Meyer sbuf_printf(sb, "%s[%s(offset=%jd, length=%jd)]", pname, cmd, 11627ce513a5SEdward Tomasz Napierala (intmax_t)bp->bio_offset, (intmax_t)bp->bio_length); 116372e33095SPawel Jakub Dawidek } 1164