xref: /freebsd/sys/geom/geom_io.c (revision 8827c821de75121d09ec2a8001a94067dce7d49b)
1dd84a43cSPoul-Henning Kamp /*-
2dd84a43cSPoul-Henning Kamp  * Copyright (c) 2002 Poul-Henning Kamp
3dd84a43cSPoul-Henning Kamp  * Copyright (c) 2002 Networks Associates Technology, Inc.
4dd84a43cSPoul-Henning Kamp  * All rights reserved.
5dd84a43cSPoul-Henning Kamp  *
6dd84a43cSPoul-Henning Kamp  * This software was developed for the FreeBSD Project by Poul-Henning Kamp
7dd84a43cSPoul-Henning Kamp  * and NAI Labs, the Security Research Division of Network Associates, Inc.
8dd84a43cSPoul-Henning Kamp  * under DARPA/SPAWAR contract N66001-01-C-8035 ("CBOSS"), as part of the
9dd84a43cSPoul-Henning Kamp  * DARPA CHATS research program.
10dd84a43cSPoul-Henning Kamp  *
11dd84a43cSPoul-Henning Kamp  * Redistribution and use in source and binary forms, with or without
12dd84a43cSPoul-Henning Kamp  * modification, are permitted provided that the following conditions
13dd84a43cSPoul-Henning Kamp  * are met:
14dd84a43cSPoul-Henning Kamp  * 1. Redistributions of source code must retain the above copyright
15dd84a43cSPoul-Henning Kamp  *    notice, this list of conditions and the following disclaimer.
16dd84a43cSPoul-Henning Kamp  * 2. Redistributions in binary form must reproduce the above copyright
17dd84a43cSPoul-Henning Kamp  *    notice, this list of conditions and the following disclaimer in the
18dd84a43cSPoul-Henning Kamp  *    documentation and/or other materials provided with the distribution.
19dd84a43cSPoul-Henning Kamp  * 3. The names of the authors may not be used to endorse or promote
20dd84a43cSPoul-Henning Kamp  *    products derived from this software without specific prior written
21dd84a43cSPoul-Henning Kamp  *    permission.
22dd84a43cSPoul-Henning Kamp  *
23dd84a43cSPoul-Henning Kamp  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
24dd84a43cSPoul-Henning Kamp  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
25dd84a43cSPoul-Henning Kamp  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
26dd84a43cSPoul-Henning Kamp  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
27dd84a43cSPoul-Henning Kamp  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
28dd84a43cSPoul-Henning Kamp  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
29dd84a43cSPoul-Henning Kamp  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
30dd84a43cSPoul-Henning Kamp  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
31dd84a43cSPoul-Henning Kamp  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
32dd84a43cSPoul-Henning Kamp  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
33dd84a43cSPoul-Henning Kamp  * SUCH DAMAGE.
34dd84a43cSPoul-Henning Kamp  */
35dd84a43cSPoul-Henning Kamp 
3650b1faefSDavid E. O'Brien #include <sys/cdefs.h>
3750b1faefSDavid E. O'Brien __FBSDID("$FreeBSD$");
38dd84a43cSPoul-Henning Kamp 
39dd84a43cSPoul-Henning Kamp #include <sys/param.h>
40dd84a43cSPoul-Henning Kamp #include <sys/systm.h>
41dd84a43cSPoul-Henning Kamp #include <sys/kernel.h>
42dd84a43cSPoul-Henning Kamp #include <sys/malloc.h>
43dd84a43cSPoul-Henning Kamp #include <sys/bio.h>
4449dbb61dSRobert Watson #include <sys/ktr.h>
45dd84a43cSPoul-Henning Kamp 
46dd84a43cSPoul-Henning Kamp #include <sys/errno.h>
47dd84a43cSPoul-Henning Kamp #include <geom/geom.h>
48b1876192SPoul-Henning Kamp #include <geom/geom_int.h>
49e24cbd90SPoul-Henning Kamp #include <sys/devicestat.h>
50dd84a43cSPoul-Henning Kamp 
515ffb2c8bSPoul-Henning Kamp #include <vm/uma.h>
525ffb2c8bSPoul-Henning Kamp 
53dd84a43cSPoul-Henning Kamp static struct g_bioq g_bio_run_down;
54dd84a43cSPoul-Henning Kamp static struct g_bioq g_bio_run_up;
555fcf4e43SPoul-Henning Kamp static struct g_bioq g_bio_run_task;
56dd84a43cSPoul-Henning Kamp 
573432e4fdSPoul-Henning Kamp static u_int pace;
585ffb2c8bSPoul-Henning Kamp static uma_zone_t	biozone;
593432e4fdSPoul-Henning Kamp 
60dd84a43cSPoul-Henning Kamp #include <machine/atomic.h>
61dd84a43cSPoul-Henning Kamp 
62dd84a43cSPoul-Henning Kamp static void
63dd84a43cSPoul-Henning Kamp g_bioq_lock(struct g_bioq *bq)
64dd84a43cSPoul-Henning Kamp {
65dd84a43cSPoul-Henning Kamp 
66dd84a43cSPoul-Henning Kamp 	mtx_lock(&bq->bio_queue_lock);
67dd84a43cSPoul-Henning Kamp }
68dd84a43cSPoul-Henning Kamp 
69dd84a43cSPoul-Henning Kamp static void
70dd84a43cSPoul-Henning Kamp g_bioq_unlock(struct g_bioq *bq)
71dd84a43cSPoul-Henning Kamp {
72dd84a43cSPoul-Henning Kamp 
73dd84a43cSPoul-Henning Kamp 	mtx_unlock(&bq->bio_queue_lock);
74dd84a43cSPoul-Henning Kamp }
75dd84a43cSPoul-Henning Kamp 
#if 0
/*
 * Tear down the mutex of the bio queue 'bq'.
 *
 * Compiled out: nothing in this file destroys a queue.
 */
static void
g_bioq_destroy(struct g_bioq *bq)
{
	struct mtx *qlock = &bq->bio_queue_lock;

	mtx_destroy(qlock);
}
#endif
84dd84a43cSPoul-Henning Kamp 
85dd84a43cSPoul-Henning Kamp static void
86dd84a43cSPoul-Henning Kamp g_bioq_init(struct g_bioq *bq)
87dd84a43cSPoul-Henning Kamp {
88dd84a43cSPoul-Henning Kamp 
89dd84a43cSPoul-Henning Kamp 	TAILQ_INIT(&bq->bio_queue);
906008862bSJohn Baldwin 	mtx_init(&bq->bio_queue_lock, "bio queue", NULL, MTX_DEF);
91dd84a43cSPoul-Henning Kamp }
92dd84a43cSPoul-Henning Kamp 
93dd84a43cSPoul-Henning Kamp static struct bio *
94dd84a43cSPoul-Henning Kamp g_bioq_first(struct g_bioq *bq)
95dd84a43cSPoul-Henning Kamp {
96dd84a43cSPoul-Henning Kamp 	struct bio *bp;
97dd84a43cSPoul-Henning Kamp 
98dd84a43cSPoul-Henning Kamp 	bp = TAILQ_FIRST(&bq->bio_queue);
99dd84a43cSPoul-Henning Kamp 	if (bp != NULL) {
100dcbd0fe5SPoul-Henning Kamp 		KASSERT((bp->bio_flags & BIO_ONQUEUE),
101dcbd0fe5SPoul-Henning Kamp 		    ("Bio not on queue bp=%p target %p", bp, bq));
102dcbd0fe5SPoul-Henning Kamp 		bp->bio_flags &= ~BIO_ONQUEUE;
103dd84a43cSPoul-Henning Kamp 		TAILQ_REMOVE(&bq->bio_queue, bp, bio_queue);
104dd84a43cSPoul-Henning Kamp 		bq->bio_queue_length--;
105dd84a43cSPoul-Henning Kamp 	}
106dd84a43cSPoul-Henning Kamp 	return (bp);
107dd84a43cSPoul-Henning Kamp }
108dd84a43cSPoul-Henning Kamp 
109dd84a43cSPoul-Henning Kamp struct bio *
110dd84a43cSPoul-Henning Kamp g_new_bio(void)
111dd84a43cSPoul-Henning Kamp {
112dd84a43cSPoul-Henning Kamp 	struct bio *bp;
113dd84a43cSPoul-Henning Kamp 
1145ffb2c8bSPoul-Henning Kamp 	bp = uma_zalloc(biozone, M_NOWAIT | M_ZERO);
115dd84a43cSPoul-Henning Kamp 	return (bp);
116dd84a43cSPoul-Henning Kamp }
117dd84a43cSPoul-Henning Kamp 
118a2033c96SPoul-Henning Kamp struct bio *
119a2033c96SPoul-Henning Kamp g_alloc_bio(void)
120a2033c96SPoul-Henning Kamp {
121a2033c96SPoul-Henning Kamp 	struct bio *bp;
122a2033c96SPoul-Henning Kamp 
123a2033c96SPoul-Henning Kamp 	bp = uma_zalloc(biozone, M_WAITOK | M_ZERO);
124a2033c96SPoul-Henning Kamp 	return (bp);
125a2033c96SPoul-Henning Kamp }
126a2033c96SPoul-Henning Kamp 
127dd84a43cSPoul-Henning Kamp void
128dd84a43cSPoul-Henning Kamp g_destroy_bio(struct bio *bp)
129dd84a43cSPoul-Henning Kamp {
130dd84a43cSPoul-Henning Kamp 
1315ffb2c8bSPoul-Henning Kamp 	uma_zfree(biozone, bp);
132dd84a43cSPoul-Henning Kamp }
133dd84a43cSPoul-Henning Kamp 
134dd84a43cSPoul-Henning Kamp struct bio *
135dd84a43cSPoul-Henning Kamp g_clone_bio(struct bio *bp)
136dd84a43cSPoul-Henning Kamp {
137dd84a43cSPoul-Henning Kamp 	struct bio *bp2;
138dd84a43cSPoul-Henning Kamp 
1395ffb2c8bSPoul-Henning Kamp 	bp2 = uma_zalloc(biozone, M_NOWAIT | M_ZERO);
140a1bd3ee2SPoul-Henning Kamp 	if (bp2 != NULL) {
141936cc461SPoul-Henning Kamp 		bp2->bio_parent = bp;
142dd84a43cSPoul-Henning Kamp 		bp2->bio_cmd = bp->bio_cmd;
143dd84a43cSPoul-Henning Kamp 		bp2->bio_length = bp->bio_length;
144dd84a43cSPoul-Henning Kamp 		bp2->bio_offset = bp->bio_offset;
145dd84a43cSPoul-Henning Kamp 		bp2->bio_data = bp->bio_data;
146dd84a43cSPoul-Henning Kamp 		bp2->bio_attribute = bp->bio_attribute;
147801bb689SPoul-Henning Kamp 		bp->bio_children++;
148a1bd3ee2SPoul-Henning Kamp 	}
149dd84a43cSPoul-Henning Kamp 	return(bp2);
150dd84a43cSPoul-Henning Kamp }
151dd84a43cSPoul-Henning Kamp 
152dd84a43cSPoul-Henning Kamp void
153dd84a43cSPoul-Henning Kamp g_io_init()
154dd84a43cSPoul-Henning Kamp {
155dd84a43cSPoul-Henning Kamp 
156dd84a43cSPoul-Henning Kamp 	g_bioq_init(&g_bio_run_down);
157dd84a43cSPoul-Henning Kamp 	g_bioq_init(&g_bio_run_up);
1585fcf4e43SPoul-Henning Kamp 	g_bioq_init(&g_bio_run_task);
1595ffb2c8bSPoul-Henning Kamp 	biozone = uma_zcreate("g_bio", sizeof (struct bio),
1605ffb2c8bSPoul-Henning Kamp 	    NULL, NULL,
1615ffb2c8bSPoul-Henning Kamp 	    NULL, NULL,
1625ffb2c8bSPoul-Henning Kamp 	    0, 0);
163dd84a43cSPoul-Henning Kamp }
164dd84a43cSPoul-Henning Kamp 
165dd84a43cSPoul-Henning Kamp int
1660d3f37a8SPoul-Henning Kamp g_io_getattr(const char *attr, struct g_consumer *cp, int *len, void *ptr)
167dd84a43cSPoul-Henning Kamp {
168dd84a43cSPoul-Henning Kamp 	struct bio *bp;
169dd84a43cSPoul-Henning Kamp 	int error;
170dd84a43cSPoul-Henning Kamp 
171dd84a43cSPoul-Henning Kamp 	g_trace(G_T_BIO, "bio_getattr(%s)", attr);
172a2033c96SPoul-Henning Kamp 	bp = g_alloc_bio();
173dd84a43cSPoul-Henning Kamp 	bp->bio_cmd = BIO_GETATTR;
174dd84a43cSPoul-Henning Kamp 	bp->bio_done = NULL;
175dd84a43cSPoul-Henning Kamp 	bp->bio_attribute = attr;
176dd84a43cSPoul-Henning Kamp 	bp->bio_length = *len;
177dd84a43cSPoul-Henning Kamp 	bp->bio_data = ptr;
178dd84a43cSPoul-Henning Kamp 	g_io_request(bp, cp);
17953706245SPoul-Henning Kamp 	error = biowait(bp, "ggetattr");
180dd84a43cSPoul-Henning Kamp 	*len = bp->bio_completed;
181dd84a43cSPoul-Henning Kamp 	g_destroy_bio(bp);
182dd84a43cSPoul-Henning Kamp 	return (error);
183dd84a43cSPoul-Henning Kamp }
184dd84a43cSPoul-Henning Kamp 
185e39d70d4SPoul-Henning Kamp static int
186e39d70d4SPoul-Henning Kamp g_io_check(struct bio *bp)
187e39d70d4SPoul-Henning Kamp {
188e39d70d4SPoul-Henning Kamp 	struct g_consumer *cp;
189e39d70d4SPoul-Henning Kamp 	struct g_provider *pp;
190e39d70d4SPoul-Henning Kamp 
191e39d70d4SPoul-Henning Kamp 	cp = bp->bio_from;
192e39d70d4SPoul-Henning Kamp 	pp = bp->bio_to;
193e39d70d4SPoul-Henning Kamp 
194e39d70d4SPoul-Henning Kamp 	/* Fail if access counters dont allow the operation */
195e39d70d4SPoul-Henning Kamp 	switch(bp->bio_cmd) {
196e39d70d4SPoul-Henning Kamp 	case BIO_READ:
197e39d70d4SPoul-Henning Kamp 	case BIO_GETATTR:
198e39d70d4SPoul-Henning Kamp 		if (cp->acr == 0)
199e39d70d4SPoul-Henning Kamp 			return (EPERM);
200e39d70d4SPoul-Henning Kamp 		break;
201e39d70d4SPoul-Henning Kamp 	case BIO_WRITE:
202e39d70d4SPoul-Henning Kamp 	case BIO_DELETE:
203e39d70d4SPoul-Henning Kamp 		if (cp->acw == 0)
204e39d70d4SPoul-Henning Kamp 			return (EPERM);
205e39d70d4SPoul-Henning Kamp 		break;
206e39d70d4SPoul-Henning Kamp 	default:
207e39d70d4SPoul-Henning Kamp 		return (EPERM);
208e39d70d4SPoul-Henning Kamp 	}
209e39d70d4SPoul-Henning Kamp 	/* if provider is marked for error, don't disturb. */
210e39d70d4SPoul-Henning Kamp 	if (pp->error)
211e39d70d4SPoul-Henning Kamp 		return (pp->error);
212e39d70d4SPoul-Henning Kamp 
213e39d70d4SPoul-Henning Kamp 	switch(bp->bio_cmd) {
214e39d70d4SPoul-Henning Kamp 	case BIO_READ:
215e39d70d4SPoul-Henning Kamp 	case BIO_WRITE:
216e39d70d4SPoul-Henning Kamp 	case BIO_DELETE:
21743bff1a7SPoul-Henning Kamp 		/* Zero sectorsize is a probably lack of media */
21843bff1a7SPoul-Henning Kamp 		if (pp->sectorsize == 0)
21943bff1a7SPoul-Henning Kamp 			return (ENXIO);
220e39d70d4SPoul-Henning Kamp 		/* Reject I/O not on sector boundary */
221e39d70d4SPoul-Henning Kamp 		if (bp->bio_offset % pp->sectorsize)
222e39d70d4SPoul-Henning Kamp 			return (EINVAL);
223e39d70d4SPoul-Henning Kamp 		/* Reject I/O not integral sector long */
224e39d70d4SPoul-Henning Kamp 		if (bp->bio_length % pp->sectorsize)
225e39d70d4SPoul-Henning Kamp 			return (EINVAL);
226d1b8bf47SPoul-Henning Kamp 		/* Reject requests before or past the end of media. */
227d1b8bf47SPoul-Henning Kamp 		if (bp->bio_offset < 0)
228d1b8bf47SPoul-Henning Kamp 			return (EIO);
229e39d70d4SPoul-Henning Kamp 		if (bp->bio_offset > pp->mediasize)
230e39d70d4SPoul-Henning Kamp 			return (EIO);
231e39d70d4SPoul-Henning Kamp 		break;
232e39d70d4SPoul-Henning Kamp 	default:
233e39d70d4SPoul-Henning Kamp 		break;
234e39d70d4SPoul-Henning Kamp 	}
235e39d70d4SPoul-Henning Kamp 	return (0);
236e39d70d4SPoul-Henning Kamp }
237e39d70d4SPoul-Henning Kamp 
238dd84a43cSPoul-Henning Kamp void
239dd84a43cSPoul-Henning Kamp g_io_request(struct bio *bp, struct g_consumer *cp)
240dd84a43cSPoul-Henning Kamp {
241801bb689SPoul-Henning Kamp 	struct g_provider *pp;
242dd84a43cSPoul-Henning Kamp 
243d0e17c1bSPoul-Henning Kamp 	KASSERT(cp != NULL, ("NULL cp in g_io_request"));
244d0e17c1bSPoul-Henning Kamp 	KASSERT(bp != NULL, ("NULL bp in g_io_request"));
245d0e17c1bSPoul-Henning Kamp 	KASSERT(bp->bio_data != NULL, ("NULL bp->data in g_io_request"));
246e060b6bdSPoul-Henning Kamp 	pp = cp->provider;
247801bb689SPoul-Henning Kamp 	KASSERT(pp != NULL, ("consumer not attached in g_io_request"));
248801bb689SPoul-Henning Kamp 
249dcbd0fe5SPoul-Henning Kamp 	if (bp->bio_cmd & (BIO_READ|BIO_WRITE|BIO_DELETE)) {
250dcbd0fe5SPoul-Henning Kamp 		KASSERT(bp->bio_offset % cp->provider->sectorsize == 0,
251dcbd0fe5SPoul-Henning Kamp 		    ("wrong offset %jd for sectorsize %u",
252dcbd0fe5SPoul-Henning Kamp 		    bp->bio_offset, cp->provider->sectorsize));
253dcbd0fe5SPoul-Henning Kamp 		KASSERT(bp->bio_length % cp->provider->sectorsize == 0,
254dcbd0fe5SPoul-Henning Kamp 		    ("wrong length %jd for sectorsize %u",
255dcbd0fe5SPoul-Henning Kamp 		    bp->bio_length, cp->provider->sectorsize));
256dcbd0fe5SPoul-Henning Kamp 	}
257dcbd0fe5SPoul-Henning Kamp 
258f7717523SStephan Uphoff 	g_trace(G_T_BIO, "bio_request(%p) from %p(%s) to %p(%s) cmd %d",
259f7717523SStephan Uphoff 	    bp, cp, cp->geom->name, pp, pp->name, bp->bio_cmd);
260f7717523SStephan Uphoff 
261dd84a43cSPoul-Henning Kamp 	bp->bio_from = cp;
262801bb689SPoul-Henning Kamp 	bp->bio_to = pp;
2632fccec19SPoul-Henning Kamp 	bp->bio_error = 0;
2642fccec19SPoul-Henning Kamp 	bp->bio_completed = 0;
265dd84a43cSPoul-Henning Kamp 
26619fa21aaSPoul-Henning Kamp 	KASSERT(!(bp->bio_flags & BIO_ONQUEUE),
26719fa21aaSPoul-Henning Kamp 	    ("Bio already on queue bp=%p", bp));
26819fa21aaSPoul-Henning Kamp 	bp->bio_flags |= BIO_ONQUEUE;
26919fa21aaSPoul-Henning Kamp 
27019fa21aaSPoul-Henning Kamp 	binuptime(&bp->bio_t0);
2718827c821SPoul-Henning Kamp 
2728827c821SPoul-Henning Kamp 	/*
2738827c821SPoul-Henning Kamp 	 * The statistics collection is lockless, as such, but we
2748827c821SPoul-Henning Kamp 	 * can not update one instance of the statistics from more
2758827c821SPoul-Henning Kamp 	 * than one thread at a time, so grab the lock first.
2768827c821SPoul-Henning Kamp 	 */
27719fa21aaSPoul-Henning Kamp 	g_bioq_lock(&g_bio_run_down);
278cf457284SPoul-Henning Kamp 	if (g_collectstats & 1)
27919fa21aaSPoul-Henning Kamp 		devstat_start_transaction(pp->stat, &bp->bio_t0);
280cf457284SPoul-Henning Kamp 	if (g_collectstats & 2)
28119fa21aaSPoul-Henning Kamp 		devstat_start_transaction(cp->stat, &bp->bio_t0);
28219fa21aaSPoul-Henning Kamp 
28319fa21aaSPoul-Henning Kamp 	pp->nstart++;
284cf457284SPoul-Henning Kamp 	cp->nstart++;
28519fa21aaSPoul-Henning Kamp 	TAILQ_INSERT_TAIL(&g_bio_run_down.bio_queue, bp, bio_queue);
28619fa21aaSPoul-Henning Kamp 	g_bio_run_down.bio_queue_length++;
28719fa21aaSPoul-Henning Kamp 	g_bioq_unlock(&g_bio_run_down);
288e39d70d4SPoul-Henning Kamp 
2892fccec19SPoul-Henning Kamp 	/* Pass it on down. */
290dd84a43cSPoul-Henning Kamp 	wakeup(&g_wait_down);
291dd84a43cSPoul-Henning Kamp }
292dd84a43cSPoul-Henning Kamp 
293dd84a43cSPoul-Henning Kamp void
29472840432SPoul-Henning Kamp g_io_deliver(struct bio *bp, int error)
295dd84a43cSPoul-Henning Kamp {
296801bb689SPoul-Henning Kamp 	struct g_consumer *cp;
297801bb689SPoul-Henning Kamp 	struct g_provider *pp;
298dd84a43cSPoul-Henning Kamp 
299e060b6bdSPoul-Henning Kamp 	KASSERT(bp != NULL, ("NULL bp in g_io_deliver"));
300801bb689SPoul-Henning Kamp 	pp = bp->bio_to;
301f7eeab17SPoul-Henning Kamp 	KASSERT(pp != NULL, ("NULL bio_to in g_io_deliver"));
302f7eeab17SPoul-Henning Kamp 	cp = bp->bio_from;
303f7eeab17SPoul-Henning Kamp 	if (cp == NULL) {
304f7eeab17SPoul-Henning Kamp 		bp->bio_error = error;
305f7eeab17SPoul-Henning Kamp 		bp->bio_done(bp);
306f7eeab17SPoul-Henning Kamp 		return;
307f7eeab17SPoul-Henning Kamp 	}
308801bb689SPoul-Henning Kamp 	KASSERT(cp != NULL, ("NULL bio_from in g_io_deliver"));
309801bb689SPoul-Henning Kamp 	KASSERT(cp->geom != NULL, ("NULL bio_from->geom in g_io_deliver"));
31046aeebecSPawel Jakub Dawidek 	KASSERT(bp->bio_completed >= 0, ("bio_completed can't be less than 0"));
31146aeebecSPawel Jakub Dawidek 	KASSERT(bp->bio_completed <= bp->bio_length,
31246aeebecSPawel Jakub Dawidek 	    ("bio_completed can't be greater than bio_length"));
3135ab413bfSPoul-Henning Kamp 
314dd84a43cSPoul-Henning Kamp 	g_trace(G_T_BIO,
3150355b86eSPoul-Henning Kamp "g_io_deliver(%p) from %p(%s) to %p(%s) cmd %d error %d off %jd len %jd",
316801bb689SPoul-Henning Kamp 	    bp, cp, cp->geom->name, pp, pp->name, bp->bio_cmd, error,
3170355b86eSPoul-Henning Kamp 	    (intmax_t)bp->bio_offset, (intmax_t)bp->bio_length);
318801bb689SPoul-Henning Kamp 
31919fa21aaSPoul-Henning Kamp 	KASSERT(!(bp->bio_flags & BIO_ONQUEUE),
32019fa21aaSPoul-Henning Kamp 	    ("Bio already on queue bp=%p", bp));
32119fa21aaSPoul-Henning Kamp 
322dcbd0fe5SPoul-Henning Kamp 	/*
323dcbd0fe5SPoul-Henning Kamp 	 * XXX: next two doesn't belong here
324dcbd0fe5SPoul-Henning Kamp 	 */
325e24cbd90SPoul-Henning Kamp 	bp->bio_bcount = bp->bio_length;
326e24cbd90SPoul-Henning Kamp 	bp->bio_resid = bp->bio_bcount - bp->bio_completed;
32719fa21aaSPoul-Henning Kamp 
3288827c821SPoul-Henning Kamp 	/*
3298827c821SPoul-Henning Kamp 	 * The statistics collection is lockless, as such, but we
3308827c821SPoul-Henning Kamp 	 * can not update one instance of the statistics from more
3318827c821SPoul-Henning Kamp 	 * than one thread at a time, so grab the lock first.
3328827c821SPoul-Henning Kamp 	 */
33319fa21aaSPoul-Henning Kamp 	g_bioq_lock(&g_bio_run_up);
334cf457284SPoul-Henning Kamp 	if (g_collectstats & 1)
335e24cbd90SPoul-Henning Kamp 		devstat_end_transaction_bio(pp->stat, bp);
336cf457284SPoul-Henning Kamp 	if (g_collectstats & 2)
337cf457284SPoul-Henning Kamp 		devstat_end_transaction_bio(cp->stat, bp);
3388827c821SPoul-Henning Kamp 
339c6ae9b5fSPoul-Henning Kamp 	cp->nend++;
340c6ae9b5fSPoul-Henning Kamp 	pp->nend++;
34119fa21aaSPoul-Henning Kamp 	if (error != ENOMEM) {
34219fa21aaSPoul-Henning Kamp 		bp->bio_error = error;
34319fa21aaSPoul-Henning Kamp 		TAILQ_INSERT_TAIL(&g_bio_run_up.bio_queue, bp, bio_queue);
344276f72c5SPoul-Henning Kamp 		bp->bio_flags |= BIO_ONQUEUE;
34519fa21aaSPoul-Henning Kamp 		g_bio_run_up.bio_queue_length++;
34619fa21aaSPoul-Henning Kamp 		g_bioq_unlock(&g_bio_run_up);
34719fa21aaSPoul-Henning Kamp 		wakeup(&g_wait_up);
34819fa21aaSPoul-Henning Kamp 		return;
34919fa21aaSPoul-Henning Kamp 	}
35019fa21aaSPoul-Henning Kamp 	g_bioq_unlock(&g_bio_run_up);
351dd84a43cSPoul-Henning Kamp 
3522cc9686eSPoul-Henning Kamp 	if (bootverbose)
353801bb689SPoul-Henning Kamp 		printf("ENOMEM %p on %p(%s)\n", bp, pp, pp->name);
3541b949c05SPawel Jakub Dawidek 	bp->bio_children = 0;
3551b949c05SPawel Jakub Dawidek 	bp->bio_inbed = 0;
356801bb689SPoul-Henning Kamp 	g_io_request(bp, cp);
3573432e4fdSPoul-Henning Kamp 	pace++;
3583432e4fdSPoul-Henning Kamp 	return;
3593432e4fdSPoul-Henning Kamp }
360dd84a43cSPoul-Henning Kamp 
361dd84a43cSPoul-Henning Kamp void
362dd84a43cSPoul-Henning Kamp g_io_schedule_down(struct thread *tp __unused)
363dd84a43cSPoul-Henning Kamp {
364dd84a43cSPoul-Henning Kamp 	struct bio *bp;
365e39d70d4SPoul-Henning Kamp 	off_t excess;
366e39d70d4SPoul-Henning Kamp 	int error;
3675706472cSRobert Watson #ifdef WITNESS
368f0e185d7SPoul-Henning Kamp 	struct mtx mymutex;
369f0e185d7SPoul-Henning Kamp 
370f0e185d7SPoul-Henning Kamp 	bzero(&mymutex, sizeof mymutex);
3712cf0d8a6SDon Lewis 	mtx_init(&mymutex, "g_xdown", NULL, MTX_DEF);
3725706472cSRobert Watson #endif
373dd84a43cSPoul-Henning Kamp 
374dd84a43cSPoul-Henning Kamp 	for(;;) {
375f0e185d7SPoul-Henning Kamp 		g_bioq_lock(&g_bio_run_down);
376dd84a43cSPoul-Henning Kamp 		bp = g_bioq_first(&g_bio_run_down);
377f0e185d7SPoul-Henning Kamp 		if (bp == NULL) {
37849dbb61dSRobert Watson 			CTR0(KTR_GEOM, "g_down going to sleep");
379f0e185d7SPoul-Henning Kamp 			msleep(&g_wait_down, &g_bio_run_down.bio_queue_lock,
38044be139bSPoul-Henning Kamp 			    PRIBIO | PDROP, "-", hz/10);
381f0e185d7SPoul-Henning Kamp 			continue;
382f0e185d7SPoul-Henning Kamp 		}
38349dbb61dSRobert Watson 		CTR0(KTR_GEOM, "g_down has work to do");
384f0e185d7SPoul-Henning Kamp 		g_bioq_unlock(&g_bio_run_down);
385376ceb79SPoul-Henning Kamp 		if (pace > 0) {
38649dbb61dSRobert Watson 			CTR1(KTR_GEOM, "g_down pacing self (pace %d)", pace);
387376ceb79SPoul-Henning Kamp 			msleep(&error, NULL, PRIBIO, "g_down", hz/10);
388376ceb79SPoul-Henning Kamp 			pace--;
389376ceb79SPoul-Henning Kamp 		}
390e39d70d4SPoul-Henning Kamp 		error = g_io_check(bp);
391e39d70d4SPoul-Henning Kamp 		if (error) {
39249dbb61dSRobert Watson 			CTR3(KTR_GEOM, "g_down g_io_check on bp %p provider "
39349dbb61dSRobert Watson 			    "%s returned %d", bp, bp->bio_to->name, error);
394e39d70d4SPoul-Henning Kamp 			g_io_deliver(bp, error);
395e39d70d4SPoul-Henning Kamp 			continue;
396e39d70d4SPoul-Henning Kamp 		}
39749dbb61dSRobert Watson 		CTR2(KTR_GEOM, "g_down processing bp %p provider %s", bp,
39849dbb61dSRobert Watson 		    bp->bio_to->name);
399392d56b4SPoul-Henning Kamp 		switch (bp->bio_cmd) {
400392d56b4SPoul-Henning Kamp 		case BIO_READ:
401392d56b4SPoul-Henning Kamp 		case BIO_WRITE:
402392d56b4SPoul-Henning Kamp 		case BIO_DELETE:
403e39d70d4SPoul-Henning Kamp 			/* Truncate requests to the end of providers media. */
40449dbb61dSRobert Watson 			/*
40549dbb61dSRobert Watson 			 * XXX: What if we truncate because of offset being
40649dbb61dSRobert Watson 			 * bad, not length?
40749dbb61dSRobert Watson 			 */
408e39d70d4SPoul-Henning Kamp 			excess = bp->bio_offset + bp->bio_length;
409e39d70d4SPoul-Henning Kamp 			if (excess > bp->bio_to->mediasize) {
410e39d70d4SPoul-Henning Kamp 				excess -= bp->bio_to->mediasize;
411e39d70d4SPoul-Henning Kamp 				bp->bio_length -= excess;
41249dbb61dSRobert Watson 				if (excess > 0)
41349dbb61dSRobert Watson 					CTR3(KTR_GEOM, "g_down truncated bio "
41449dbb61dSRobert Watson 					    "%p provider %s by %d", bp,
41549dbb61dSRobert Watson 					    bp->bio_to->name, excess);
416e39d70d4SPoul-Henning Kamp 			}
417e39d70d4SPoul-Henning Kamp 			/* Deliver zero length transfers right here. */
418e39d70d4SPoul-Henning Kamp 			if (bp->bio_length == 0) {
419e39d70d4SPoul-Henning Kamp 				g_io_deliver(bp, 0);
42049dbb61dSRobert Watson 				CTR2(KTR_GEOM, "g_down terminated 0-length "
42149dbb61dSRobert Watson 				    "bp %p provider %s", bp, bp->bio_to->name);
422e39d70d4SPoul-Henning Kamp 				continue;
423e39d70d4SPoul-Henning Kamp 			}
424392d56b4SPoul-Henning Kamp 			break;
425392d56b4SPoul-Henning Kamp 		default:
426392d56b4SPoul-Henning Kamp 			break;
427392d56b4SPoul-Henning Kamp 		}
4285706472cSRobert Watson #ifdef WITNESS
429f0e185d7SPoul-Henning Kamp 		mtx_lock(&mymutex);
4305706472cSRobert Watson #endif
43149dbb61dSRobert Watson 		CTR4(KTR_GEOM, "g_down starting bp %p provider %s off %ld "
43249dbb61dSRobert Watson 		    "len %ld", bp, bp->bio_to->name, bp->bio_offset,
43349dbb61dSRobert Watson 		    bp->bio_length);
434dd84a43cSPoul-Henning Kamp 		bp->bio_to->geom->start(bp);
4355706472cSRobert Watson #ifdef WITNESS
436f0e185d7SPoul-Henning Kamp 		mtx_unlock(&mymutex);
4375706472cSRobert Watson #endif
438dd84a43cSPoul-Henning Kamp 	}
439dd84a43cSPoul-Henning Kamp }
440dd84a43cSPoul-Henning Kamp 
441dd84a43cSPoul-Henning Kamp void
4425fcf4e43SPoul-Henning Kamp bio_taskqueue(struct bio *bp, bio_task_t *func, void *arg)
4435fcf4e43SPoul-Henning Kamp {
4445fcf4e43SPoul-Henning Kamp 	bp->bio_task = func;
4455fcf4e43SPoul-Henning Kamp 	bp->bio_task_arg = arg;
4465fcf4e43SPoul-Henning Kamp 	/*
4475fcf4e43SPoul-Henning Kamp 	 * The taskqueue is actually just a second queue off the "up"
4485fcf4e43SPoul-Henning Kamp 	 * queue, so we use the same lock.
4495fcf4e43SPoul-Henning Kamp 	 */
4505fcf4e43SPoul-Henning Kamp 	g_bioq_lock(&g_bio_run_up);
451dcbd0fe5SPoul-Henning Kamp 	KASSERT(!(bp->bio_flags & BIO_ONQUEUE),
452dcbd0fe5SPoul-Henning Kamp 	    ("Bio already on queue bp=%p target taskq", bp));
453dcbd0fe5SPoul-Henning Kamp 	bp->bio_flags |= BIO_ONQUEUE;
4545fcf4e43SPoul-Henning Kamp 	TAILQ_INSERT_TAIL(&g_bio_run_task.bio_queue, bp, bio_queue);
4555fcf4e43SPoul-Henning Kamp 	g_bio_run_task.bio_queue_length++;
4565fcf4e43SPoul-Henning Kamp 	wakeup(&g_wait_up);
4575fcf4e43SPoul-Henning Kamp 	g_bioq_unlock(&g_bio_run_up);
4585fcf4e43SPoul-Henning Kamp }
4595fcf4e43SPoul-Henning Kamp 
4605fcf4e43SPoul-Henning Kamp 
4615fcf4e43SPoul-Henning Kamp void
462dd84a43cSPoul-Henning Kamp g_io_schedule_up(struct thread *tp __unused)
463dd84a43cSPoul-Henning Kamp {
464dd84a43cSPoul-Henning Kamp 	struct bio *bp;
4655706472cSRobert Watson #ifdef WITNESS
466f0e185d7SPoul-Henning Kamp 	struct mtx mymutex;
467dd84a43cSPoul-Henning Kamp 
468f0e185d7SPoul-Henning Kamp 	bzero(&mymutex, sizeof mymutex);
4692cf0d8a6SDon Lewis 	mtx_init(&mymutex, "g_xup", NULL, MTX_DEF);
4705706472cSRobert Watson #endif
471dd84a43cSPoul-Henning Kamp 	for(;;) {
472f0e185d7SPoul-Henning Kamp 		g_bioq_lock(&g_bio_run_up);
4735fcf4e43SPoul-Henning Kamp 		bp = g_bioq_first(&g_bio_run_task);
4745fcf4e43SPoul-Henning Kamp 		if (bp != NULL) {
4755fcf4e43SPoul-Henning Kamp 			g_bioq_unlock(&g_bio_run_up);
4765706472cSRobert Watson #ifdef WITNESS
4775fcf4e43SPoul-Henning Kamp 			mtx_lock(&mymutex);
4785706472cSRobert Watson #endif
47949dbb61dSRobert Watson 			CTR1(KTR_GEOM, "g_up processing task bp %p", bp);
4805fcf4e43SPoul-Henning Kamp 			bp->bio_task(bp->bio_task_arg);
4815706472cSRobert Watson #ifdef WITNESS
4825fcf4e43SPoul-Henning Kamp 			mtx_unlock(&mymutex);
4835706472cSRobert Watson #endif
4845fcf4e43SPoul-Henning Kamp 			continue;
4855fcf4e43SPoul-Henning Kamp 		}
486dd84a43cSPoul-Henning Kamp 		bp = g_bioq_first(&g_bio_run_up);
487f0e185d7SPoul-Henning Kamp 		if (bp != NULL) {
488f0e185d7SPoul-Henning Kamp 			g_bioq_unlock(&g_bio_run_up);
4895706472cSRobert Watson #ifdef WITNESS
490f0e185d7SPoul-Henning Kamp 			mtx_lock(&mymutex);
4915706472cSRobert Watson #endif
49249dbb61dSRobert Watson 			CTR4(KTR_GEOM, "g_up biodone bp %p provider %s off "
49349dbb61dSRobert Watson 			    "%ld len %ld", bp, bp->bio_to->name,
49449dbb61dSRobert Watson 			    bp->bio_offset, bp->bio_length);
49553706245SPoul-Henning Kamp 			biodone(bp);
4965706472cSRobert Watson #ifdef WITNESS
497f0e185d7SPoul-Henning Kamp 			mtx_unlock(&mymutex);
4985706472cSRobert Watson #endif
499f0e185d7SPoul-Henning Kamp 			continue;
500f0e185d7SPoul-Henning Kamp 		}
50149dbb61dSRobert Watson 		CTR0(KTR_GEOM, "g_up going to sleep");
502f0e185d7SPoul-Henning Kamp 		msleep(&g_wait_up, &g_bio_run_up.bio_queue_lock,
50344be139bSPoul-Henning Kamp 		    PRIBIO | PDROP, "-", hz/10);
504dd84a43cSPoul-Henning Kamp 	}
505dd84a43cSPoul-Henning Kamp }
506dd84a43cSPoul-Henning Kamp 
507dd84a43cSPoul-Henning Kamp void *
508dd84a43cSPoul-Henning Kamp g_read_data(struct g_consumer *cp, off_t offset, off_t length, int *error)
509dd84a43cSPoul-Henning Kamp {
510dd84a43cSPoul-Henning Kamp 	struct bio *bp;
511dd84a43cSPoul-Henning Kamp 	void *ptr;
512dd84a43cSPoul-Henning Kamp 	int errorc;
513dd84a43cSPoul-Henning Kamp 
5148dd5480dSPawel Jakub Dawidek 	KASSERT(length > 0 && length >= cp->provider->sectorsize &&
5158dd5480dSPawel Jakub Dawidek 	    length <= MAXPHYS, ("g_read_data(): invalid length %jd",
5168dd5480dSPawel Jakub Dawidek 	    (intmax_t)length));
5173eb6ffdfSPoul-Henning Kamp 
518a2033c96SPoul-Henning Kamp 	bp = g_alloc_bio();
519dd84a43cSPoul-Henning Kamp 	bp->bio_cmd = BIO_READ;
520dd84a43cSPoul-Henning Kamp 	bp->bio_done = NULL;
521dd84a43cSPoul-Henning Kamp 	bp->bio_offset = offset;
522dd84a43cSPoul-Henning Kamp 	bp->bio_length = length;
523a163d034SWarner Losh 	ptr = g_malloc(length, M_WAITOK);
524dd84a43cSPoul-Henning Kamp 	bp->bio_data = ptr;
525dd84a43cSPoul-Henning Kamp 	g_io_request(bp, cp);
52653706245SPoul-Henning Kamp 	errorc = biowait(bp, "gread");
527dd84a43cSPoul-Henning Kamp 	if (error != NULL)
528dd84a43cSPoul-Henning Kamp 		*error = errorc;
529dd84a43cSPoul-Henning Kamp 	g_destroy_bio(bp);
530dd84a43cSPoul-Henning Kamp 	if (errorc) {
531dd84a43cSPoul-Henning Kamp 		g_free(ptr);
532dd84a43cSPoul-Henning Kamp 		ptr = NULL;
533dd84a43cSPoul-Henning Kamp 	}
534dd84a43cSPoul-Henning Kamp 	return (ptr);
535dd84a43cSPoul-Henning Kamp }
53690b1cd56SPoul-Henning Kamp 
53790b1cd56SPoul-Henning Kamp int
53890b1cd56SPoul-Henning Kamp g_write_data(struct g_consumer *cp, off_t offset, void *ptr, off_t length)
53990b1cd56SPoul-Henning Kamp {
54090b1cd56SPoul-Henning Kamp 	struct bio *bp;
54190b1cd56SPoul-Henning Kamp 	int error;
54290b1cd56SPoul-Henning Kamp 
5438dd5480dSPawel Jakub Dawidek 	KASSERT(length > 0 && length >= cp->provider->sectorsize &&
5448dd5480dSPawel Jakub Dawidek 	    length <= MAXPHYS, ("g_write_data(): invalid length %jd",
5458dd5480dSPawel Jakub Dawidek 	    (intmax_t)length));
5463eb6ffdfSPoul-Henning Kamp 
547a2033c96SPoul-Henning Kamp 	bp = g_alloc_bio();
54890b1cd56SPoul-Henning Kamp 	bp->bio_cmd = BIO_WRITE;
54990b1cd56SPoul-Henning Kamp 	bp->bio_done = NULL;
55090b1cd56SPoul-Henning Kamp 	bp->bio_offset = offset;
55190b1cd56SPoul-Henning Kamp 	bp->bio_length = length;
55290b1cd56SPoul-Henning Kamp 	bp->bio_data = ptr;
55390b1cd56SPoul-Henning Kamp 	g_io_request(bp, cp);
55490b1cd56SPoul-Henning Kamp 	error = biowait(bp, "gwrite");
55590b1cd56SPoul-Henning Kamp 	g_destroy_bio(bp);
55690b1cd56SPoul-Henning Kamp 	return (error);
55790b1cd56SPoul-Henning Kamp }
55872e33095SPawel Jakub Dawidek 
55972e33095SPawel Jakub Dawidek void
56072e33095SPawel Jakub Dawidek g_print_bio(struct bio *bp)
56172e33095SPawel Jakub Dawidek {
56272e33095SPawel Jakub Dawidek 	const char *pname, *cmd = NULL;
56372e33095SPawel Jakub Dawidek 
56472e33095SPawel Jakub Dawidek 	if (bp->bio_to != NULL)
56572e33095SPawel Jakub Dawidek 		pname = bp->bio_to->name;
56672e33095SPawel Jakub Dawidek 	else
56772e33095SPawel Jakub Dawidek 		pname = "[unknown]";
56872e33095SPawel Jakub Dawidek 
56972e33095SPawel Jakub Dawidek 	switch (bp->bio_cmd) {
57072e33095SPawel Jakub Dawidek 	case BIO_GETATTR:
57172e33095SPawel Jakub Dawidek 		cmd = "GETATTR";
57272e33095SPawel Jakub Dawidek 		printf("%s[%s(attr=%s)]", pname, cmd, bp->bio_attribute);
57372e33095SPawel Jakub Dawidek 		return;
57472e33095SPawel Jakub Dawidek 	case BIO_READ:
57572e33095SPawel Jakub Dawidek 		cmd = "READ";
57672e33095SPawel Jakub Dawidek 	case BIO_WRITE:
57772e33095SPawel Jakub Dawidek 		if (cmd == NULL)
57872e33095SPawel Jakub Dawidek 			cmd = "WRITE";
57972e33095SPawel Jakub Dawidek 	case BIO_DELETE:
58072e33095SPawel Jakub Dawidek 		if (cmd == NULL)
58172e33095SPawel Jakub Dawidek 			cmd = "DELETE";
58272e33095SPawel Jakub Dawidek 		printf("%s[%s(offset=%jd, length=%jd)]", pname, cmd,
58372e33095SPawel Jakub Dawidek 		    (intmax_t)bp->bio_offset, (intmax_t)bp->bio_length);
58472e33095SPawel Jakub Dawidek 		return;
58572e33095SPawel Jakub Dawidek 	default:
58672e33095SPawel Jakub Dawidek 		cmd = "UNKNOWN";
58772e33095SPawel Jakub Dawidek 		printf("%s[%s()]", pname, cmd);
58872e33095SPawel Jakub Dawidek 		return;
58972e33095SPawel Jakub Dawidek 	}
59072e33095SPawel Jakub Dawidek 	/* NOTREACHED */
59172e33095SPawel Jakub Dawidek }
592