1fa521b03SWarner Losh /*- 22afb21f3SPedro F. Giffuni * SPDX-License-Identifier: (BSD-2-Clause-NetBSD AND BSD-3-Clause) 33728855aSPedro F. Giffuni * 43b1746dfSPoul-Henning Kamp * Copyright (c) 2003 Poul-Henning Kamp. 52afb21f3SPedro F. Giffuni * Copyright (c) 1996, 1997 The NetBSD Foundation, Inc. 62afb21f3SPedro F. Giffuni * All rights reserved. 72afb21f3SPedro F. Giffuni * 82afb21f3SPedro F. Giffuni * This code is derived from software contributed to The NetBSD Foundation 92afb21f3SPedro F. Giffuni * by Jason R. Thorpe. 102afb21f3SPedro F. Giffuni * 112afb21f3SPedro F. Giffuni * Redistribution and use in source and binary forms, with or without 122afb21f3SPedro F. Giffuni * modification, are permitted provided that the following conditions 132afb21f3SPedro F. Giffuni * are met: 142afb21f3SPedro F. Giffuni * 1. Redistributions of source code must retain the above copyright 152afb21f3SPedro F. Giffuni * notice, this list of conditions and the following disclaimer. 162afb21f3SPedro F. Giffuni * 2. Redistributions in binary form must reproduce the above copyright 172afb21f3SPedro F. Giffuni * notice, this list of conditions and the following disclaimer in the 182afb21f3SPedro F. Giffuni * documentation and/or other materials provided with the distribution. 192afb21f3SPedro F. Giffuni * 202afb21f3SPedro F. Giffuni * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS 212afb21f3SPedro F. Giffuni * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED 222afb21f3SPedro F. Giffuni * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR 232afb21f3SPedro F. Giffuni * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS 242afb21f3SPedro F. Giffuni * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR 252afb21f3SPedro F. Giffuni * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF 262afb21f3SPedro F. Giffuni * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS 272afb21f3SPedro F. Giffuni * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN 282afb21f3SPedro F. Giffuni * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) 292afb21f3SPedro F. Giffuni * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE 302afb21f3SPedro F. Giffuni * POSSIBILITY OF SUCH DAMAGE. 312afb21f3SPedro F. Giffuni * 322afb21f3SPedro F. Giffuni * $NetBSD: ccd.c,v 1.22 1995/12/08 19:13:26 thorpej Exp $ 332afb21f3SPedro F. Giffuni */ 342afb21f3SPedro F. Giffuni 352afb21f3SPedro F. Giffuni /*- 362afb21f3SPedro F. Giffuni * Copyright (c) 1988 University of Utah. 37a56bb8a5SSatoshi Asami * Copyright (c) 1990, 1993 38a56bb8a5SSatoshi Asami * The Regents of the University of California. All rights reserved. 39a56bb8a5SSatoshi Asami * 40a56bb8a5SSatoshi Asami * This code is derived from software contributed to Berkeley by 41a56bb8a5SSatoshi Asami * the Systems Programming Group of the University of Utah Computer 42a56bb8a5SSatoshi Asami * Science Department. 43a56bb8a5SSatoshi Asami * 44a56bb8a5SSatoshi Asami * Redistribution and use in source and binary forms, with or without 45a56bb8a5SSatoshi Asami * modification, are permitted provided that the following conditions 46a56bb8a5SSatoshi Asami * are met: 47a56bb8a5SSatoshi Asami * 1. Redistributions of source code must retain the above copyright 48a56bb8a5SSatoshi Asami * notice, this list of conditions and the following disclaimer. 49a56bb8a5SSatoshi Asami * 2. Redistributions in binary form must reproduce the above copyright 50a56bb8a5SSatoshi Asami * notice, this list of conditions and the following disclaimer in the 51a56bb8a5SSatoshi Asami * documentation and/or other materials provided with the distribution. 522afb21f3SPedro F. Giffuni * 3. Neither the name of the University nor the names of its contributors 532afb21f3SPedro F. Giffuni * may be used to endorse or promote products derived from this software 542afb21f3SPedro F. Giffuni * without specific prior written permission. 55a56bb8a5SSatoshi Asami * 562afb21f3SPedro F. Giffuni * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 572afb21f3SPedro F. Giffuni * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 582afb21f3SPedro F. Giffuni * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 592afb21f3SPedro F. Giffuni * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 602afb21f3SPedro F. Giffuni * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 612afb21f3SPedro F. Giffuni * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 622afb21f3SPedro F. Giffuni * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 632afb21f3SPedro F. Giffuni * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 642afb21f3SPedro F. Giffuni * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 65a56bb8a5SSatoshi Asami * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 66a56bb8a5SSatoshi Asami * SUCH DAMAGE. 67a56bb8a5SSatoshi Asami * 682afb21f3SPedro F. Giffuni * from: Utah $Hdr: cd.c 1.6 90/11/28$ 692afb21f3SPedro F. Giffuni * 702afb21f3SPedro F. Giffuni * @(#)cd.c 8.2 (Berkeley) 11/16/93 712afb21f3SPedro F. Giffuni */ 722afb21f3SPedro F. Giffuni 732afb21f3SPedro F. Giffuni /* 74a56bb8a5SSatoshi Asami * Dynamic configuration and disklabel support by: 75a56bb8a5SSatoshi Asami * Jason R. Thorpe <thorpej@nas.nasa.gov> 76a56bb8a5SSatoshi Asami * Numerical Aerodynamic Simulation Facility 77a56bb8a5SSatoshi Asami * Mail Stop 258-6 78a56bb8a5SSatoshi Asami * NASA Ames Research Center 79a56bb8a5SSatoshi Asami * Moffett Field, CA 94035 80a56bb8a5SSatoshi Asami */ 81a56bb8a5SSatoshi Asami 8250b1faefSDavid E. O'Brien #include <sys/cdefs.h> 8350b1faefSDavid E. O'Brien __FBSDID("$FreeBSD$"); 8450b1faefSDavid E. O'Brien 85a56bb8a5SSatoshi Asami #include <sys/param.h> 86a56bb8a5SSatoshi Asami #include <sys/systm.h> 87e2a13e8cSSatoshi Asami #include <sys/kernel.h> 88b7b98418SPeter Wemm #include <sys/module.h> 899626b608SPoul-Henning Kamp #include <sys/bio.h> 90a56bb8a5SSatoshi Asami #include <sys/malloc.h> 915d807a0eSAndrey V. Elsukov #include <sys/sbuf.h> 92189337d8SPoul-Henning Kamp #include <geom/geom.h> 93a56bb8a5SSatoshi Asami 940f557e0aSPoul-Henning Kamp /* 953a3fcd72SPoul-Henning Kamp * Number of blocks to untouched in front of a component partition. 963a3fcd72SPoul-Henning Kamp * This is to avoid violating its disklabel area when it starts at the 973a3fcd72SPoul-Henning Kamp * beginning of the slice. 980f557e0aSPoul-Henning Kamp */ 993a3fcd72SPoul-Henning Kamp #if !defined(CCD_OFFSET) 1003a3fcd72SPoul-Henning Kamp #define CCD_OFFSET 16 1013a3fcd72SPoul-Henning Kamp #endif 1023a3fcd72SPoul-Henning Kamp 1033a3fcd72SPoul-Henning Kamp /* sc_flags */ 1043a3fcd72SPoul-Henning Kamp #define CCDF_UNIFORM 0x02 /* use LCCD of sizes for uniform interleave */ 1053a3fcd72SPoul-Henning Kamp #define CCDF_MIRROR 0x04 /* use mirroring */ 1063f4f4a14SMartin Cracauer #define CCDF_NO_OFFSET 0x08 /* do not leave space in front */ 1073f4f4a14SMartin Cracauer #define CCDF_LINUX 0x10 /* use Linux compatibility mode */ 1083a3fcd72SPoul-Henning Kamp 1093a3fcd72SPoul-Henning Kamp /* Mask of user-settable ccd flags. */ 1103a3fcd72SPoul-Henning Kamp #define CCDF_USERMASK (CCDF_UNIFORM|CCDF_MIRROR) 1110f557e0aSPoul-Henning Kamp 1120f557e0aSPoul-Henning Kamp /* 1130f557e0aSPoul-Henning Kamp * Interleave description table. 1140f557e0aSPoul-Henning Kamp * Computed at boot time to speed irregular-interleave lookups. 1150f557e0aSPoul-Henning Kamp * The idea is that we interleave in "groups". First we interleave 1160f557e0aSPoul-Henning Kamp * evenly over all component disks up to the size of the smallest 1170f557e0aSPoul-Henning Kamp * component (the first group), then we interleave evenly over all 1180f557e0aSPoul-Henning Kamp * remaining disks up to the size of the next-smallest (second group), 1190f557e0aSPoul-Henning Kamp * and so on. 1200f557e0aSPoul-Henning Kamp * 1210f557e0aSPoul-Henning Kamp * Each table entry describes the interleave characteristics of one 1220f557e0aSPoul-Henning Kamp * of these groups. For example if a concatenated disk consisted of 1230f557e0aSPoul-Henning Kamp * three components of 5, 3, and 7 DEV_BSIZE blocks interleaved at 1240f557e0aSPoul-Henning Kamp * DEV_BSIZE (1), the table would have three entries: 1250f557e0aSPoul-Henning Kamp * 1260f557e0aSPoul-Henning Kamp * ndisk startblk startoff dev 1270f557e0aSPoul-Henning Kamp * 3 0 0 0, 1, 2 1280f557e0aSPoul-Henning Kamp * 2 9 3 0, 2 1290f557e0aSPoul-Henning Kamp * 1 13 5 2 1300f557e0aSPoul-Henning Kamp * 0 - - - 1310f557e0aSPoul-Henning Kamp * 1320f557e0aSPoul-Henning Kamp * which says that the first nine blocks (0-8) are interleaved over 1330f557e0aSPoul-Henning Kamp * 3 disks (0, 1, 2) starting at block offset 0 on any component disk, 1340f557e0aSPoul-Henning Kamp * the next 4 blocks (9-12) are interleaved over 2 disks (0, 2) starting 1350f557e0aSPoul-Henning Kamp * at component block 3, and the remaining blocks (13-14) are on disk 1360f557e0aSPoul-Henning Kamp * 2 starting at offset 5. 1370f557e0aSPoul-Henning Kamp */ 1380f557e0aSPoul-Henning Kamp struct ccdiinfo { 1390f557e0aSPoul-Henning Kamp int ii_ndisk; /* # of disks range is interleaved over */ 1400f557e0aSPoul-Henning Kamp daddr_t ii_startblk; /* starting scaled block # for range */ 1410f557e0aSPoul-Henning Kamp daddr_t ii_startoff; /* starting component offset (block #) */ 1420f557e0aSPoul-Henning Kamp int *ii_index; /* ordered list of components in range */ 1430f557e0aSPoul-Henning Kamp }; 1440f557e0aSPoul-Henning Kamp 1450f557e0aSPoul-Henning Kamp /* 1463a3fcd72SPoul-Henning Kamp * Component info table. 1473a3fcd72SPoul-Henning Kamp * Describes a single component of a concatenated disk. 1480f557e0aSPoul-Henning Kamp */ 1493a3fcd72SPoul-Henning Kamp struct ccdcinfo { 150e65b2137SPaul Saab daddr_t ci_size; /* size */ 1513a3fcd72SPoul-Henning Kamp struct g_provider *ci_provider; /* provider */ 1523a3fcd72SPoul-Henning Kamp struct g_consumer *ci_consumer; /* consumer */ 1530f557e0aSPoul-Henning Kamp }; 1540f557e0aSPoul-Henning Kamp 1550f557e0aSPoul-Henning Kamp /* 1560f557e0aSPoul-Henning Kamp * A concatenated disk is described by this structure. 1570f557e0aSPoul-Henning Kamp */ 1583a3fcd72SPoul-Henning Kamp 1590f557e0aSPoul-Henning Kamp struct ccd_s { 1600f557e0aSPoul-Henning Kamp LIST_ENTRY(ccd_s) list; 1610f557e0aSPoul-Henning Kamp 1620f557e0aSPoul-Henning Kamp int sc_unit; /* logical unit number */ 1630f557e0aSPoul-Henning Kamp int sc_flags; /* flags */ 164e65b2137SPaul Saab daddr_t sc_size; /* size of ccd */ 1650f557e0aSPoul-Henning Kamp int sc_ileave; /* interleave */ 1663a3fcd72SPoul-Henning Kamp u_int sc_ndisks; /* number of components */ 1670f557e0aSPoul-Henning Kamp struct ccdcinfo *sc_cinfo; /* component info */ 1680f557e0aSPoul-Henning Kamp struct ccdiinfo *sc_itable; /* interleave table */ 1693a3fcd72SPoul-Henning Kamp u_int32_t sc_secsize; /* # bytes per sector */ 1700f557e0aSPoul-Henning Kamp int sc_pick; /* side of mirror picked */ 1710f557e0aSPoul-Henning Kamp daddr_t sc_blk[2]; /* mirror localization */ 1723f4f4a14SMartin Cracauer u_int32_t sc_offset; /* actual offset used */ 1730f557e0aSPoul-Henning Kamp }; 1740f557e0aSPoul-Henning Kamp 1753a3fcd72SPoul-Henning Kamp static g_start_t g_ccd_start; 17601706d20SPoul-Henning Kamp static void ccdiodone(struct bio *bp); 1773a3fcd72SPoul-Henning Kamp static void ccdinterleave(struct ccd_s *); 1783a3fcd72SPoul-Henning Kamp static int ccdinit(struct gctl_req *req, struct ccd_s *); 1793a3fcd72SPoul-Henning Kamp static int ccdbuffer(struct bio **ret, struct ccd_s *, 18001706d20SPoul-Henning Kamp struct bio *, daddr_t, caddr_t, long); 181a56bb8a5SSatoshi Asami 182e2738b4fSPoul-Henning Kamp static void 1833a3fcd72SPoul-Henning Kamp g_ccd_orphan(struct g_consumer *cp) 184a56bb8a5SSatoshi Asami { 185c44c213fSPoul-Henning Kamp /* 186c44c213fSPoul-Henning Kamp * XXX: We don't do anything here. It is not obvious 187c44c213fSPoul-Henning Kamp * XXX: what DTRT would be, so we do what the previous 188c44c213fSPoul-Henning Kamp * XXX: code did: ignore it and let the user cope. 189c44c213fSPoul-Henning Kamp */ 190b7b98418SPeter Wemm } 191d8594dfbSSatoshi Asami 192b7b98418SPeter Wemm static int 1933a3fcd72SPoul-Henning Kamp g_ccd_access(struct g_provider *pp, int dr, int dw, int de) 194b7b98418SPeter Wemm { 1953a3fcd72SPoul-Henning Kamp struct g_geom *gp; 1963a3fcd72SPoul-Henning Kamp struct g_consumer *cp1, *cp2; 1973a3fcd72SPoul-Henning Kamp int error; 198b7b98418SPeter Wemm 1993a3fcd72SPoul-Henning Kamp de += dr; 2003a3fcd72SPoul-Henning Kamp de += dw; 2013a3fcd72SPoul-Henning Kamp 2023a3fcd72SPoul-Henning Kamp gp = pp->geom; 2033a3fcd72SPoul-Henning Kamp error = ENXIO; 2043a3fcd72SPoul-Henning Kamp LIST_FOREACH(cp1, &gp->consumer, consumer) { 205d2bae332SPoul-Henning Kamp error = g_access(cp1, dr, dw, de); 2063a3fcd72SPoul-Henning Kamp if (error) { 2073a3fcd72SPoul-Henning Kamp LIST_FOREACH(cp2, &gp->consumer, consumer) { 2083a3fcd72SPoul-Henning Kamp if (cp1 == cp2) 209b7b98418SPeter Wemm break; 210d2bae332SPoul-Henning Kamp g_access(cp2, -dr, -dw, -de); 2113a3fcd72SPoul-Henning Kamp } 212b7b98418SPeter Wemm break; 2133a3fcd72SPoul-Henning Kamp } 214e2a13e8cSSatoshi Asami } 215b7b98418SPeter Wemm return (error); 216e2a13e8cSSatoshi Asami } 217b7b98418SPeter Wemm 2183a3fcd72SPoul-Henning Kamp /* 2193a3fcd72SPoul-Henning Kamp * Free the softc and its substructures. 2203a3fcd72SPoul-Henning Kamp */ 2213a3fcd72SPoul-Henning Kamp static void 2223a3fcd72SPoul-Henning Kamp g_ccd_freesc(struct ccd_s *sc) 2233a3fcd72SPoul-Henning Kamp { 2243a3fcd72SPoul-Henning Kamp struct ccdiinfo *ii; 2253a3fcd72SPoul-Henning Kamp 2263a3fcd72SPoul-Henning Kamp g_free(sc->sc_cinfo); 2273a3fcd72SPoul-Henning Kamp if (sc->sc_itable != NULL) { 2283a3fcd72SPoul-Henning Kamp for (ii = sc->sc_itable; ii->ii_ndisk > 0; ii++) 2293a3fcd72SPoul-Henning Kamp if (ii->ii_index != NULL) 2303a3fcd72SPoul-Henning Kamp g_free(ii->ii_index); 2313a3fcd72SPoul-Henning Kamp g_free(sc->sc_itable); 2323a3fcd72SPoul-Henning Kamp } 2333a3fcd72SPoul-Henning Kamp g_free(sc); 2343a3fcd72SPoul-Henning Kamp } 2353a3fcd72SPoul-Henning Kamp 236a56bb8a5SSatoshi Asami 237a56bb8a5SSatoshi Asami static int 2383a3fcd72SPoul-Henning Kamp ccdinit(struct gctl_req *req, struct ccd_s *cs) 239a56bb8a5SSatoshi Asami { 2403a3fcd72SPoul-Henning Kamp struct ccdcinfo *ci; 241e65b2137SPaul Saab daddr_t size; 2421464240eSMatthew Dillon int ix; 243e65b2137SPaul Saab daddr_t minsize; 244a56bb8a5SSatoshi Asami int maxsecsize; 245ffee6e99SPoul-Henning Kamp off_t mediasize; 246ffee6e99SPoul-Henning Kamp u_int sectorsize; 247a56bb8a5SSatoshi Asami 248a56bb8a5SSatoshi Asami cs->sc_size = 0; 249a56bb8a5SSatoshi Asami 250a56bb8a5SSatoshi Asami maxsecsize = 0; 251a56bb8a5SSatoshi Asami minsize = 0; 2523f4f4a14SMartin Cracauer 2533f4f4a14SMartin Cracauer if (cs->sc_flags & CCDF_LINUX) { 2543f4f4a14SMartin Cracauer cs->sc_offset = 0; 2553f4f4a14SMartin Cracauer cs->sc_ileave *= 2; 2563f4f4a14SMartin Cracauer if (cs->sc_flags & CCDF_MIRROR && cs->sc_ndisks != 2) 2573f4f4a14SMartin Cracauer gctl_error(req, "Mirror mode for Linux raids is " 2583f4f4a14SMartin Cracauer "only supported with 2 devices"); 2593f4f4a14SMartin Cracauer } else { 2603f4f4a14SMartin Cracauer if (cs->sc_flags & CCDF_NO_OFFSET) 2613f4f4a14SMartin Cracauer cs->sc_offset = 0; 2623f4f4a14SMartin Cracauer else 2633f4f4a14SMartin Cracauer cs->sc_offset = CCD_OFFSET; 2643f4f4a14SMartin Cracauer 2653f4f4a14SMartin Cracauer } 2663a3fcd72SPoul-Henning Kamp for (ix = 0; ix < cs->sc_ndisks; ix++) { 267a56bb8a5SSatoshi Asami ci = &cs->sc_cinfo[ix]; 268a56bb8a5SSatoshi Asami 2693a3fcd72SPoul-Henning Kamp mediasize = ci->ci_provider->mediasize; 2703a3fcd72SPoul-Henning Kamp sectorsize = ci->ci_provider->sectorsize; 271ffee6e99SPoul-Henning Kamp if (sectorsize > maxsecsize) 272ffee6e99SPoul-Henning Kamp maxsecsize = sectorsize; 2733f4f4a14SMartin Cracauer size = mediasize / DEV_BSIZE - cs->sc_offset; 274a56bb8a5SSatoshi Asami 2753a3fcd72SPoul-Henning Kamp /* Truncate to interleave boundary */ 276a56bb8a5SSatoshi Asami 277a56bb8a5SSatoshi Asami if (cs->sc_ileave > 1) 278a56bb8a5SSatoshi Asami size -= size % cs->sc_ileave; 279a56bb8a5SSatoshi Asami 280a56bb8a5SSatoshi Asami if (size == 0) { 2813a3fcd72SPoul-Henning Kamp gctl_error(req, "Component %s has effective size zero", 2823a3fcd72SPoul-Henning Kamp ci->ci_provider->name); 2833a3fcd72SPoul-Henning Kamp return(ENODEV); 284a56bb8a5SSatoshi Asami } 285a56bb8a5SSatoshi Asami 286a56bb8a5SSatoshi Asami if (minsize == 0 || size < minsize) 287a56bb8a5SSatoshi Asami minsize = size; 288a56bb8a5SSatoshi Asami ci->ci_size = size; 289a56bb8a5SSatoshi Asami cs->sc_size += size; 290a56bb8a5SSatoshi Asami } 291a56bb8a5SSatoshi Asami 292a56bb8a5SSatoshi Asami /* 293a56bb8a5SSatoshi Asami * Don't allow the interleave to be smaller than 294a56bb8a5SSatoshi Asami * the biggest component sector. 295a56bb8a5SSatoshi Asami */ 296a56bb8a5SSatoshi Asami if ((cs->sc_ileave > 0) && 297a56bb8a5SSatoshi Asami (cs->sc_ileave < (maxsecsize / DEV_BSIZE))) { 2983a3fcd72SPoul-Henning Kamp gctl_error(req, "Interleave to small for sector size"); 2993a3fcd72SPoul-Henning Kamp return(EINVAL); 300a56bb8a5SSatoshi Asami } 301a56bb8a5SSatoshi Asami 302a56bb8a5SSatoshi Asami /* 303a56bb8a5SSatoshi Asami * If uniform interleave is desired set all sizes to that of 304e8d57122SPedro F. Giffuni * the smallest component. This will guarantee that a single 3051464240eSMatthew Dillon * interleave table is generated. 3061464240eSMatthew Dillon * 3071464240eSMatthew Dillon * Lost space must be taken into account when calculating the 3081464240eSMatthew Dillon * overall size. Half the space is lost when CCDF_MIRROR is 309ddbf51afSPoul-Henning Kamp * specified. 310a56bb8a5SSatoshi Asami */ 31101706d20SPoul-Henning Kamp if (cs->sc_flags & CCDF_UNIFORM) { 3123a3fcd72SPoul-Henning Kamp for (ix = 0; ix < cs->sc_ndisks; ix++) { 3133a3fcd72SPoul-Henning Kamp ci = &cs->sc_cinfo[ix]; 314a56bb8a5SSatoshi Asami ci->ci_size = minsize; 3151464240eSMatthew Dillon } 3163a3fcd72SPoul-Henning Kamp cs->sc_size = cs->sc_ndisks * minsize; 3173a3fcd72SPoul-Henning Kamp } 3183a3fcd72SPoul-Henning Kamp 31901706d20SPoul-Henning Kamp if (cs->sc_flags & CCDF_MIRROR) { 32034f35216SSatoshi Asami /* 32134f35216SSatoshi Asami * Check to see if an even number of components 3221464240eSMatthew Dillon * have been specified. The interleave must also 3231464240eSMatthew Dillon * be non-zero in order for us to be able to 324e8d57122SPedro F. Giffuni * guarantee the topology. 32534f35216SSatoshi Asami */ 3263a3fcd72SPoul-Henning Kamp if (cs->sc_ndisks % 2) { 3273a3fcd72SPoul-Henning Kamp gctl_error(req, 3283a3fcd72SPoul-Henning Kamp "Mirroring requires an even number of disks"); 3293a3fcd72SPoul-Henning Kamp return(EINVAL); 33034f35216SSatoshi Asami } 3311464240eSMatthew Dillon if (cs->sc_ileave == 0) { 3323a3fcd72SPoul-Henning Kamp gctl_error(req, 3333a3fcd72SPoul-Henning Kamp "An interleave must be specified when mirroring"); 3343a3fcd72SPoul-Henning Kamp return(EINVAL); 33509b59204SSatoshi Asami } 3363a3fcd72SPoul-Henning Kamp cs->sc_size = (cs->sc_ndisks/2) * minsize; 3371464240eSMatthew Dillon } 338a56bb8a5SSatoshi Asami 339a56bb8a5SSatoshi Asami /* 340a56bb8a5SSatoshi Asami * Construct the interleave table. 341a56bb8a5SSatoshi Asami */ 3423a3fcd72SPoul-Henning Kamp ccdinterleave(cs); 343a56bb8a5SSatoshi Asami 344a56bb8a5SSatoshi Asami /* 345a56bb8a5SSatoshi Asami * Create pseudo-geometry based on 1MB cylinders. It's 346a56bb8a5SSatoshi Asami * pretty close. 347a56bb8a5SSatoshi Asami */ 3483a3fcd72SPoul-Henning Kamp cs->sc_secsize = maxsecsize; 349a56bb8a5SSatoshi Asami 350a56bb8a5SSatoshi Asami return (0); 351a56bb8a5SSatoshi Asami } 352a56bb8a5SSatoshi Asami 353a56bb8a5SSatoshi Asami static void 3543a3fcd72SPoul-Henning Kamp ccdinterleave(struct ccd_s *cs) 355a56bb8a5SSatoshi Asami { 3561464240eSMatthew Dillon struct ccdcinfo *ci, *smallci; 3571464240eSMatthew Dillon struct ccdiinfo *ii; 3581464240eSMatthew Dillon daddr_t bn, lbn; 3591464240eSMatthew Dillon int ix; 360e65b2137SPaul Saab daddr_t size; 361a56bb8a5SSatoshi Asami 3621464240eSMatthew Dillon 363a56bb8a5SSatoshi Asami /* 3641464240eSMatthew Dillon * Allocate an interleave table. The worst case occurs when each 3651464240eSMatthew Dillon * of N disks is of a different size, resulting in N interleave 3661464240eSMatthew Dillon * tables. 3671464240eSMatthew Dillon * 368a56bb8a5SSatoshi Asami * Chances are this is too big, but we don't care. 369a56bb8a5SSatoshi Asami */ 3703a3fcd72SPoul-Henning Kamp size = (cs->sc_ndisks + 1) * sizeof(struct ccdiinfo); 3713a3fcd72SPoul-Henning Kamp cs->sc_itable = g_malloc(size, M_WAITOK | M_ZERO); 372a56bb8a5SSatoshi Asami 373a56bb8a5SSatoshi Asami /* 374a56bb8a5SSatoshi Asami * Trivial case: no interleave (actually interleave of disk size). 375a56bb8a5SSatoshi Asami * Each table entry represents a single component in its entirety. 3761464240eSMatthew Dillon * 377ddbf51afSPoul-Henning Kamp * An interleave of 0 may not be used with a mirror setup. 378a56bb8a5SSatoshi Asami */ 379a56bb8a5SSatoshi Asami if (cs->sc_ileave == 0) { 380a56bb8a5SSatoshi Asami bn = 0; 381a56bb8a5SSatoshi Asami ii = cs->sc_itable; 382a56bb8a5SSatoshi Asami 3833a3fcd72SPoul-Henning Kamp for (ix = 0; ix < cs->sc_ndisks; ix++) { 384a56bb8a5SSatoshi Asami /* Allocate space for ii_index. */ 3853a3fcd72SPoul-Henning Kamp ii->ii_index = g_malloc(sizeof(int), M_WAITOK); 386a56bb8a5SSatoshi Asami ii->ii_ndisk = 1; 387a56bb8a5SSatoshi Asami ii->ii_startblk = bn; 388a56bb8a5SSatoshi Asami ii->ii_startoff = 0; 389a56bb8a5SSatoshi Asami ii->ii_index[0] = ix; 390a56bb8a5SSatoshi Asami bn += cs->sc_cinfo[ix].ci_size; 391a56bb8a5SSatoshi Asami ii++; 392a56bb8a5SSatoshi Asami } 393a56bb8a5SSatoshi Asami ii->ii_ndisk = 0; 394a56bb8a5SSatoshi Asami return; 395a56bb8a5SSatoshi Asami } 396a56bb8a5SSatoshi Asami 397a56bb8a5SSatoshi Asami /* 398a56bb8a5SSatoshi Asami * The following isn't fast or pretty; it doesn't have to be. 399a56bb8a5SSatoshi Asami */ 400a56bb8a5SSatoshi Asami size = 0; 401a56bb8a5SSatoshi Asami bn = lbn = 0; 402a56bb8a5SSatoshi Asami for (ii = cs->sc_itable; ; ii++) { 4031464240eSMatthew Dillon /* 4041464240eSMatthew Dillon * Allocate space for ii_index. We might allocate more then 4051464240eSMatthew Dillon * we use. 4061464240eSMatthew Dillon */ 4073a3fcd72SPoul-Henning Kamp ii->ii_index = g_malloc((sizeof(int) * cs->sc_ndisks), 4083a3fcd72SPoul-Henning Kamp M_WAITOK); 409a56bb8a5SSatoshi Asami 410a56bb8a5SSatoshi Asami /* 411a56bb8a5SSatoshi Asami * Locate the smallest of the remaining components 412a56bb8a5SSatoshi Asami */ 413a56bb8a5SSatoshi Asami smallci = NULL; 4143a3fcd72SPoul-Henning Kamp for (ci = cs->sc_cinfo; ci < &cs->sc_cinfo[cs->sc_ndisks]; 4151464240eSMatthew Dillon ci++) { 416a56bb8a5SSatoshi Asami if (ci->ci_size > size && 417a56bb8a5SSatoshi Asami (smallci == NULL || 4181464240eSMatthew Dillon ci->ci_size < smallci->ci_size)) { 419a56bb8a5SSatoshi Asami smallci = ci; 4201464240eSMatthew Dillon } 4211464240eSMatthew Dillon } 422a56bb8a5SSatoshi Asami 423a56bb8a5SSatoshi Asami /* 424a56bb8a5SSatoshi Asami * Nobody left, all done 425a56bb8a5SSatoshi Asami */ 426a56bb8a5SSatoshi Asami if (smallci == NULL) { 427a56bb8a5SSatoshi Asami ii->ii_ndisk = 0; 4283a3fcd72SPoul-Henning Kamp g_free(ii->ii_index); 4293a3fcd72SPoul-Henning Kamp ii->ii_index = NULL; 430a56bb8a5SSatoshi Asami break; 431a56bb8a5SSatoshi Asami } 432a56bb8a5SSatoshi Asami 433a56bb8a5SSatoshi Asami /* 4341464240eSMatthew Dillon * Record starting logical block using an sc_ileave blocksize. 435a56bb8a5SSatoshi Asami */ 436a56bb8a5SSatoshi Asami ii->ii_startblk = bn / cs->sc_ileave; 4371464240eSMatthew Dillon 4381464240eSMatthew Dillon /* 4393a3fcd72SPoul-Henning Kamp * Record starting component block using an sc_ileave 4401464240eSMatthew Dillon * blocksize. This value is relative to the beginning of 4411464240eSMatthew Dillon * a component disk. 4421464240eSMatthew Dillon */ 443a56bb8a5SSatoshi Asami ii->ii_startoff = lbn; 444a56bb8a5SSatoshi Asami 445a56bb8a5SSatoshi Asami /* 446a56bb8a5SSatoshi Asami * Determine how many disks take part in this interleave 447a56bb8a5SSatoshi Asami * and record their indices. 448a56bb8a5SSatoshi Asami */ 449a56bb8a5SSatoshi Asami ix = 0; 450a56bb8a5SSatoshi Asami for (ci = cs->sc_cinfo; 4513a3fcd72SPoul-Henning Kamp ci < &cs->sc_cinfo[cs->sc_ndisks]; ci++) { 4521464240eSMatthew Dillon if (ci->ci_size >= smallci->ci_size) { 453a56bb8a5SSatoshi Asami ii->ii_index[ix++] = ci - cs->sc_cinfo; 4541464240eSMatthew Dillon } 4551464240eSMatthew Dillon } 456a56bb8a5SSatoshi Asami ii->ii_ndisk = ix; 457a56bb8a5SSatoshi Asami bn += ix * (smallci->ci_size - size); 458a56bb8a5SSatoshi Asami lbn = smallci->ci_size / cs->sc_ileave; 459a56bb8a5SSatoshi Asami size = smallci->ci_size; 460a56bb8a5SSatoshi Asami } 461a56bb8a5SSatoshi Asami } 462a56bb8a5SSatoshi Asami 463e2738b4fSPoul-Henning Kamp static void 4643a3fcd72SPoul-Henning Kamp g_ccd_start(struct bio *bp) 465a56bb8a5SSatoshi Asami { 4661464240eSMatthew Dillon long bcount, rcount; 4673a3fcd72SPoul-Henning Kamp struct bio *cbp[2]; 468a56bb8a5SSatoshi Asami caddr_t addr; 469a56bb8a5SSatoshi Asami daddr_t bn; 4700f76d6d8SPoul-Henning Kamp int err; 4713a3fcd72SPoul-Henning Kamp struct ccd_s *cs; 4723a3fcd72SPoul-Henning Kamp 4733a3fcd72SPoul-Henning Kamp cs = bp->bio_to->geom->softc; 474a56bb8a5SSatoshi Asami 475a56bb8a5SSatoshi Asami /* 476e30b2edaSPoul-Henning Kamp * Block all GETATTR requests, we wouldn't know which of our 477e30b2edaSPoul-Henning Kamp * subdevices we should ship it off to. 478e30b2edaSPoul-Henning Kamp * XXX: this may not be the right policy. 479e30b2edaSPoul-Henning Kamp */ 480e30b2edaSPoul-Henning Kamp if(bp->bio_cmd == BIO_GETATTR) { 481e30b2edaSPoul-Henning Kamp g_io_deliver(bp, EINVAL); 482e30b2edaSPoul-Henning Kamp return; 483e30b2edaSPoul-Henning Kamp } 484e30b2edaSPoul-Henning Kamp 485e30b2edaSPoul-Henning Kamp /* 486a56bb8a5SSatoshi Asami * Translate the partition-relative block number to an absolute. 487a56bb8a5SSatoshi Asami */ 4883a3fcd72SPoul-Henning Kamp bn = bp->bio_offset / cs->sc_secsize; 489a56bb8a5SSatoshi Asami 490a56bb8a5SSatoshi Asami /* 491a56bb8a5SSatoshi Asami * Allocate component buffers and fire off the requests 492a56bb8a5SSatoshi Asami */ 4939d7f7369SPoul-Henning Kamp addr = bp->bio_data; 4943a3fcd72SPoul-Henning Kamp for (bcount = bp->bio_length; bcount > 0; bcount -= rcount) { 4950f76d6d8SPoul-Henning Kamp err = ccdbuffer(cbp, cs, bp, bn, addr, bcount); 4960f76d6d8SPoul-Henning Kamp if (err) { 497ec421aecSPoul-Henning Kamp bp->bio_completed += bcount; 498c12ec49eSPoul-Henning Kamp if (bp->bio_error == 0) 49977154759SPoul-Henning Kamp bp->bio_error = err; 500ec421aecSPoul-Henning Kamp if (bp->bio_completed == bp->bio_length) 501ec421aecSPoul-Henning Kamp g_io_deliver(bp, bp->bio_error); 5020f76d6d8SPoul-Henning Kamp return; 5030f76d6d8SPoul-Henning Kamp } 5043a3fcd72SPoul-Henning Kamp rcount = cbp[0]->bio_length; 5051464240eSMatthew Dillon 5063a3fcd72SPoul-Henning Kamp if (cs->sc_flags & CCDF_MIRROR) { 5071464240eSMatthew Dillon /* 5081464240eSMatthew Dillon * Mirroring. Writes go to both disks, reads are 5091464240eSMatthew Dillon * taken from whichever disk seems most appropriate. 5101464240eSMatthew Dillon * 5111464240eSMatthew Dillon * We attempt to localize reads to the disk whos arm 5121464240eSMatthew Dillon * is nearest the read request. We ignore seeks due 5131464240eSMatthew Dillon * to writes when making this determination and we 5141464240eSMatthew Dillon * also try to avoid hogging. 5151464240eSMatthew Dillon */ 5163a3fcd72SPoul-Henning Kamp if (cbp[0]->bio_cmd != BIO_READ) { 5173a3fcd72SPoul-Henning Kamp g_io_request(cbp[0], cbp[0]->bio_from); 5183a3fcd72SPoul-Henning Kamp g_io_request(cbp[1], cbp[1]->bio_from); 5191464240eSMatthew Dillon } else { 5201464240eSMatthew Dillon int pick = cs->sc_pick; 5211464240eSMatthew Dillon daddr_t range = cs->sc_size / 16; 5221464240eSMatthew Dillon 5231464240eSMatthew Dillon if (bn < cs->sc_blk[pick] - range || 5241464240eSMatthew Dillon bn > cs->sc_blk[pick] + range 5251464240eSMatthew Dillon ) { 5261464240eSMatthew Dillon cs->sc_pick = pick = 1 - pick; 5271464240eSMatthew Dillon } 5281464240eSMatthew Dillon cs->sc_blk[pick] = bn + btodb(rcount); 5293a3fcd72SPoul-Henning Kamp g_io_request(cbp[pick], cbp[pick]->bio_from); 5301464240eSMatthew Dillon } 5311464240eSMatthew Dillon } else { 5321464240eSMatthew Dillon /* 5331464240eSMatthew Dillon * Not mirroring 5341464240eSMatthew Dillon */ 5353a3fcd72SPoul-Henning Kamp g_io_request(cbp[0], cbp[0]->bio_from); 5363bc746beSSatoshi Asami } 537a56bb8a5SSatoshi Asami bn += btodb(rcount); 538a56bb8a5SSatoshi Asami addr += rcount; 539a56bb8a5SSatoshi Asami } 540a56bb8a5SSatoshi Asami } 541a56bb8a5SSatoshi Asami 542a56bb8a5SSatoshi Asami /* 543a56bb8a5SSatoshi Asami * Build a component buffer header. 544a56bb8a5SSatoshi Asami */ 5450f76d6d8SPoul-Henning Kamp static int 5463a3fcd72SPoul-Henning Kamp ccdbuffer(struct bio **cb, struct ccd_s *cs, struct bio *bp, daddr_t bn, caddr_t addr, long bcount) 547a56bb8a5SSatoshi Asami { 548ec421aecSPoul-Henning Kamp struct ccdcinfo *ci, *ci2 = NULL; 5493a3fcd72SPoul-Henning Kamp struct bio *cbp; 5501464240eSMatthew Dillon daddr_t cbn, cboff; 5511464240eSMatthew Dillon off_t cbc; 552a56bb8a5SSatoshi Asami 553a56bb8a5SSatoshi Asami /* 554a56bb8a5SSatoshi Asami * Determine which component bn falls in. 555a56bb8a5SSatoshi Asami */ 556a56bb8a5SSatoshi Asami cbn = bn; 557a56bb8a5SSatoshi Asami cboff = 0; 558a56bb8a5SSatoshi Asami 559a56bb8a5SSatoshi Asami if (cs->sc_ileave == 0) { 5601464240eSMatthew Dillon /* 5611464240eSMatthew Dillon * Serially concatenated and neither a mirror nor a parity 5621464240eSMatthew Dillon * config. This is a special case. 5631464240eSMatthew Dillon */ 5641464240eSMatthew Dillon daddr_t sblk; 565a56bb8a5SSatoshi Asami 566a56bb8a5SSatoshi Asami sblk = 0; 567a56bb8a5SSatoshi Asami for (ci = cs->sc_cinfo; cbn >= sblk + ci->ci_size; ci++) 568a56bb8a5SSatoshi Asami sblk += ci->ci_size; 569a56bb8a5SSatoshi Asami cbn -= sblk; 5701464240eSMatthew Dillon } else { 5711464240eSMatthew Dillon struct ccdiinfo *ii; 572a56bb8a5SSatoshi Asami int ccdisk, off; 573a56bb8a5SSatoshi Asami 5741464240eSMatthew Dillon /* 5751464240eSMatthew Dillon * Calculate cbn, the logical superblock (sc_ileave chunks), 5761464240eSMatthew Dillon * and cboff, a normal block offset (DEV_BSIZE chunks) relative 5771464240eSMatthew Dillon * to cbn. 5781464240eSMatthew Dillon */ 5791464240eSMatthew Dillon cboff = cbn % cs->sc_ileave; /* DEV_BSIZE gran */ 5801464240eSMatthew Dillon cbn = cbn / cs->sc_ileave; /* DEV_BSIZE * ileave gran */ 5811464240eSMatthew Dillon 5821464240eSMatthew Dillon /* 5831464240eSMatthew Dillon * Figure out which interleave table to use. 5841464240eSMatthew Dillon */ 5851464240eSMatthew Dillon for (ii = cs->sc_itable; ii->ii_ndisk; ii++) { 586a56bb8a5SSatoshi Asami if (ii->ii_startblk > cbn) 587a56bb8a5SSatoshi Asami break; 5881464240eSMatthew Dillon } 589a56bb8a5SSatoshi Asami ii--; 5901464240eSMatthew Dillon 5911464240eSMatthew Dillon /* 5921464240eSMatthew Dillon * off is the logical superblock relative to the beginning 5931464240eSMatthew Dillon * of this interleave block. 5941464240eSMatthew Dillon */ 595a56bb8a5SSatoshi Asami off = cbn - ii->ii_startblk; 5961464240eSMatthew Dillon 5971464240eSMatthew Dillon /* 5981464240eSMatthew Dillon * We must calculate which disk component to use (ccdisk), 5991464240eSMatthew Dillon * and recalculate cbn to be the superblock relative to 6001464240eSMatthew Dillon * the beginning of the component. This is typically done by 6011464240eSMatthew Dillon * adding 'off' and ii->ii_startoff together. However, 'off' 6021464240eSMatthew Dillon * must typically be divided by the number of components in 6031464240eSMatthew Dillon * this interleave array to be properly convert it from a 6041464240eSMatthew Dillon * CCD-relative logical superblock number to a 6051464240eSMatthew Dillon * component-relative superblock number. 6061464240eSMatthew Dillon */ 607a56bb8a5SSatoshi Asami if (ii->ii_ndisk == 1) { 6081464240eSMatthew Dillon /* 6091464240eSMatthew Dillon * When we have just one disk, it can't be a mirror 6101464240eSMatthew Dillon * or a parity config. 6111464240eSMatthew Dillon */ 612a56bb8a5SSatoshi Asami ccdisk = ii->ii_index[0]; 613a56bb8a5SSatoshi Asami cbn = ii->ii_startoff + off; 614a56bb8a5SSatoshi Asami } else { 6153a3fcd72SPoul-Henning Kamp if (cs->sc_flags & CCDF_MIRROR) { 6161464240eSMatthew Dillon /* 6171464240eSMatthew Dillon * We have forced a uniform mapping, resulting 6181464240eSMatthew Dillon * in a single interleave array. We double 6191464240eSMatthew Dillon * up on the first half of the available 6201464240eSMatthew Dillon * components and our mirror is in the second 6211464240eSMatthew Dillon * half. This only works with a single 6221464240eSMatthew Dillon * interleave array because doubling up 6231464240eSMatthew Dillon * doubles the number of sectors, so there 6241464240eSMatthew Dillon * cannot be another interleave array because 6251464240eSMatthew Dillon * the next interleave array's calculations 6261464240eSMatthew Dillon * would be off. 6271464240eSMatthew Dillon */ 6281464240eSMatthew Dillon int ndisk2 = ii->ii_ndisk / 2; 6291464240eSMatthew Dillon ccdisk = ii->ii_index[off % ndisk2]; 6301464240eSMatthew Dillon cbn = ii->ii_startoff + off / ndisk2; 6311464240eSMatthew Dillon ci2 = &cs->sc_cinfo[ccdisk + ndisk2]; 6321464240eSMatthew Dillon } else { 633a56bb8a5SSatoshi Asami ccdisk = ii->ii_index[off % ii->ii_ndisk]; 634a56bb8a5SSatoshi Asami cbn = ii->ii_startoff + off / ii->ii_ndisk; 635a56bb8a5SSatoshi Asami } 6367ecb65faSSatoshi Asami } 6371464240eSMatthew Dillon 638a56bb8a5SSatoshi Asami ci = &cs->sc_cinfo[ccdisk]; 6391464240eSMatthew Dillon 6401464240eSMatthew Dillon /* 6411464240eSMatthew Dillon * Convert cbn from a superblock to a normal block so it 6421464240eSMatthew Dillon * can be used to calculate (along with cboff) the normal 6431464240eSMatthew Dillon * block index into this particular disk. 6441464240eSMatthew Dillon */ 6451464240eSMatthew Dillon cbn *= cs->sc_ileave; 646a56bb8a5SSatoshi Asami } 647a56bb8a5SSatoshi Asami 648a56bb8a5SSatoshi Asami /* 649a56bb8a5SSatoshi Asami * Fill in the component buf structure. 650a56bb8a5SSatoshi Asami */ 6513a3fcd72SPoul-Henning Kamp cbp = g_clone_bio(bp); 652ec421aecSPoul-Henning Kamp if (cbp == NULL) 653ec421aecSPoul-Henning Kamp return (ENOMEM); 6543a3fcd72SPoul-Henning Kamp cbp->bio_done = g_std_done; 6553f4f4a14SMartin Cracauer cbp->bio_offset = dbtob(cbn + cboff + cs->sc_offset); 6563a3fcd72SPoul-Henning Kamp cbp->bio_data = addr; 657a56bb8a5SSatoshi Asami if (cs->sc_ileave == 0) 65840969e38SDavid Greenman cbc = dbtob((off_t)(ci->ci_size - cbn)); 659a56bb8a5SSatoshi Asami else 66040969e38SDavid Greenman cbc = dbtob((off_t)(cs->sc_ileave - cboff)); 6613a3fcd72SPoul-Henning Kamp cbp->bio_length = (cbc < bcount) ? cbc : bcount; 662c0b89506SJohn Dyson 6633a3fcd72SPoul-Henning Kamp cbp->bio_from = ci->ci_consumer; 6643bc746beSSatoshi Asami cb[0] = cbp; 6651464240eSMatthew Dillon 6663a3fcd72SPoul-Henning Kamp if (cs->sc_flags & CCDF_MIRROR) { 6673a3fcd72SPoul-Henning Kamp cbp = g_clone_bio(bp); 668ec421aecSPoul-Henning Kamp if (cbp == NULL) 669ec421aecSPoul-Henning Kamp return (ENOMEM); 6703a3fcd72SPoul-Henning Kamp cbp->bio_done = cb[0]->bio_done = ccdiodone; 6713a3fcd72SPoul-Henning Kamp cbp->bio_offset = cb[0]->bio_offset; 6723a3fcd72SPoul-Henning Kamp cbp->bio_data = cb[0]->bio_data; 6733a3fcd72SPoul-Henning Kamp cbp->bio_length = cb[0]->bio_length; 6743a3fcd72SPoul-Henning Kamp cbp->bio_from = ci2->ci_consumer; 6753a3fcd72SPoul-Henning Kamp cbp->bio_caller1 = cb[0]; 6763a3fcd72SPoul-Henning Kamp cb[0]->bio_caller1 = cbp; 6773bc746beSSatoshi Asami cb[1] = cbp; 6783bc746beSSatoshi Asami } 6790f76d6d8SPoul-Henning Kamp return (0); 680a56bb8a5SSatoshi Asami } 681a56bb8a5SSatoshi Asami 682a56bb8a5SSatoshi Asami /* 683c44c213fSPoul-Henning Kamp * Called only for mirrored operations. 684a56bb8a5SSatoshi Asami */ 685e2738b4fSPoul-Henning Kamp static void 6863a3fcd72SPoul-Henning Kamp ccdiodone(struct bio *cbp) 687a56bb8a5SSatoshi Asami { 6883a3fcd72SPoul-Henning Kamp struct bio *mbp, *pbp; 689a56bb8a5SSatoshi Asami 6903a3fcd72SPoul-Henning Kamp mbp = cbp->bio_caller1; 6913a3fcd72SPoul-Henning Kamp pbp = cbp->bio_parent; 692a56bb8a5SSatoshi Asami 6933a3fcd72SPoul-Henning Kamp if (pbp->bio_cmd == BIO_READ) { 6943a3fcd72SPoul-Henning Kamp if (cbp->bio_error == 0) { 695c44c213fSPoul-Henning Kamp /* We will not be needing the partner bio */ 696c44c213fSPoul-Henning Kamp if (mbp != NULL) { 6973a3fcd72SPoul-Henning Kamp pbp->bio_inbed++; 6983a3fcd72SPoul-Henning Kamp g_destroy_bio(mbp); 699c44c213fSPoul-Henning Kamp } 700c44c213fSPoul-Henning Kamp g_std_done(cbp); 701e7322872SSatoshi Asami return; 702e7322872SSatoshi Asami } 7033a3fcd72SPoul-Henning Kamp if (mbp != NULL) { 704c44c213fSPoul-Henning Kamp /* Try partner the bio instead */ 7053a3fcd72SPoul-Henning Kamp mbp->bio_caller1 = NULL; 7063a3fcd72SPoul-Henning Kamp pbp->bio_inbed++; 7073a3fcd72SPoul-Henning Kamp g_destroy_bio(cbp); 7083a3fcd72SPoul-Henning Kamp g_io_request(mbp, mbp->bio_from); 709c44c213fSPoul-Henning Kamp /* 710c44c213fSPoul-Henning Kamp * XXX: If this comes back OK, we should actually 711c44c213fSPoul-Henning Kamp * try to write the good data on the failed mirror 712c44c213fSPoul-Henning Kamp */ 7131464240eSMatthew Dillon return; 7141464240eSMatthew Dillon } 7153a3fcd72SPoul-Henning Kamp g_std_done(cbp); 716114ebb2fSPoul-Henning Kamp return; 7171464240eSMatthew Dillon } 7183a3fcd72SPoul-Henning Kamp if (mbp != NULL) { 7193a3fcd72SPoul-Henning Kamp mbp->bio_caller1 = NULL; 7203a3fcd72SPoul-Henning Kamp pbp->bio_inbed++; 721c44c213fSPoul-Henning Kamp if (cbp->bio_error != 0 && pbp->bio_error == 0) 7223a3fcd72SPoul-Henning Kamp pbp->bio_error = cbp->bio_error; 723114ebb2fSPoul-Henning Kamp g_destroy_bio(cbp); 7243a3fcd72SPoul-Henning Kamp return; 7251464240eSMatthew Dillon } 7263a3fcd72SPoul-Henning Kamp g_std_done(cbp); 7271464240eSMatthew Dillon } 728e7322872SSatoshi Asami 729a56bb8a5SSatoshi Asami static void 7303a3fcd72SPoul-Henning Kamp g_ccd_create(struct gctl_req *req, struct g_class *mp) 731a56bb8a5SSatoshi Asami { 7323a3fcd72SPoul-Henning Kamp int *unit, *ileave, *nprovider; 7333a3fcd72SPoul-Henning Kamp struct g_geom *gp; 7343a3fcd72SPoul-Henning Kamp struct g_consumer *cp; 7353a3fcd72SPoul-Henning Kamp struct g_provider *pp; 7363a3fcd72SPoul-Henning Kamp struct ccd_s *sc; 737189337d8SPoul-Henning Kamp struct sbuf *sb; 7383a3fcd72SPoul-Henning Kamp char buf[20]; 7393a3fcd72SPoul-Henning Kamp int i, error; 7403a3fcd72SPoul-Henning Kamp 7413a3fcd72SPoul-Henning Kamp g_topology_assert(); 7423a3fcd72SPoul-Henning Kamp unit = gctl_get_paraml(req, "unit", sizeof (*unit)); 743251048a1SUlf Lilleengen if (unit == NULL) { 744251048a1SUlf Lilleengen gctl_error(req, "unit parameter not given"); 745251048a1SUlf Lilleengen return; 746251048a1SUlf Lilleengen } 7473a3fcd72SPoul-Henning Kamp ileave = gctl_get_paraml(req, "ileave", sizeof (*ileave)); 748251048a1SUlf Lilleengen if (ileave == NULL) { 749251048a1SUlf Lilleengen gctl_error(req, "ileave parameter not given"); 750251048a1SUlf Lilleengen return; 751251048a1SUlf Lilleengen } 7523a3fcd72SPoul-Henning Kamp nprovider = gctl_get_paraml(req, "nprovider", sizeof (*nprovider)); 753251048a1SUlf Lilleengen if (nprovider == NULL) { 754251048a1SUlf Lilleengen gctl_error(req, "nprovider parameter not given"); 755251048a1SUlf Lilleengen return; 756251048a1SUlf Lilleengen } 7573a3fcd72SPoul-Henning Kamp 7583a3fcd72SPoul-Henning Kamp /* Check for duplicate unit */ 7593a3fcd72SPoul-Henning Kamp LIST_FOREACH(gp, &mp->geom, geom) { 7603a3fcd72SPoul-Henning Kamp sc = gp->softc; 76192b5e86eSPoul-Henning Kamp if (sc != NULL && sc->sc_unit == *unit) { 7623a3fcd72SPoul-Henning Kamp gctl_error(req, "Unit %d already configured", *unit); 7633a3fcd72SPoul-Henning Kamp return; 7643a3fcd72SPoul-Henning Kamp } 7653a3fcd72SPoul-Henning Kamp } 7663a3fcd72SPoul-Henning Kamp 7673a3fcd72SPoul-Henning Kamp if (*nprovider <= 0) { 7683a3fcd72SPoul-Henning Kamp gctl_error(req, "Bogus nprovider argument (= %d)", *nprovider); 7693a3fcd72SPoul-Henning Kamp return; 7703a3fcd72SPoul-Henning Kamp } 7713a3fcd72SPoul-Henning Kamp 7723a3fcd72SPoul-Henning Kamp /* Check all providers are valid */ 7733a3fcd72SPoul-Henning Kamp for (i = 0; i < *nprovider; i++) { 7743a3fcd72SPoul-Henning Kamp sprintf(buf, "provider%d", i); 7753a3fcd72SPoul-Henning Kamp pp = gctl_get_provider(req, buf); 7763a3fcd72SPoul-Henning Kamp if (pp == NULL) 7773a3fcd72SPoul-Henning Kamp return; 7783a3fcd72SPoul-Henning Kamp } 7793a3fcd72SPoul-Henning Kamp 7803a3fcd72SPoul-Henning Kamp gp = g_new_geomf(mp, "ccd%d", *unit); 7813a3fcd72SPoul-Henning Kamp sc = g_malloc(sizeof *sc, M_WAITOK | M_ZERO); 7823a3fcd72SPoul-Henning Kamp gp->softc = sc; 7833a3fcd72SPoul-Henning Kamp sc->sc_ndisks = *nprovider; 7843a3fcd72SPoul-Henning Kamp 7853a3fcd72SPoul-Henning Kamp /* Allocate space for the component info. */ 7863a3fcd72SPoul-Henning Kamp sc->sc_cinfo = g_malloc(sc->sc_ndisks * sizeof(struct ccdcinfo), 7873a3fcd72SPoul-Henning Kamp M_WAITOK | M_ZERO); 7883a3fcd72SPoul-Henning Kamp 7893a3fcd72SPoul-Henning Kamp /* Create consumers and attach to all providers */ 7903a3fcd72SPoul-Henning Kamp for (i = 0; i < *nprovider; i++) { 7913a3fcd72SPoul-Henning Kamp sprintf(buf, "provider%d", i); 7923a3fcd72SPoul-Henning Kamp pp = gctl_get_provider(req, buf); 7933a3fcd72SPoul-Henning Kamp cp = g_new_consumer(gp); 7943a3fcd72SPoul-Henning Kamp error = g_attach(cp, pp); 7953a3fcd72SPoul-Henning Kamp KASSERT(error == 0, ("attach to %s failed", pp->name)); 7963a3fcd72SPoul-Henning Kamp sc->sc_cinfo[i].ci_consumer = cp; 7973a3fcd72SPoul-Henning Kamp sc->sc_cinfo[i].ci_provider = pp; 7983a3fcd72SPoul-Henning Kamp } 7993a3fcd72SPoul-Henning Kamp 8003a3fcd72SPoul-Henning Kamp sc->sc_unit = *unit; 8013a3fcd72SPoul-Henning Kamp sc->sc_ileave = *ileave; 8023a3fcd72SPoul-Henning Kamp 8033f4f4a14SMartin Cracauer if (gctl_get_param(req, "no_offset", NULL)) 8043f4f4a14SMartin Cracauer sc->sc_flags |= CCDF_NO_OFFSET; 8053f4f4a14SMartin Cracauer if (gctl_get_param(req, "linux", NULL)) 8063f4f4a14SMartin Cracauer sc->sc_flags |= CCDF_LINUX; 8073f4f4a14SMartin Cracauer 8083a3fcd72SPoul-Henning Kamp if (gctl_get_param(req, "uniform", NULL)) 8093a3fcd72SPoul-Henning Kamp sc->sc_flags |= CCDF_UNIFORM; 8103a3fcd72SPoul-Henning Kamp if (gctl_get_param(req, "mirror", NULL)) 8113a3fcd72SPoul-Henning Kamp sc->sc_flags |= CCDF_MIRROR; 8123a3fcd72SPoul-Henning Kamp 8133a3fcd72SPoul-Henning Kamp if (sc->sc_ileave == 0 && (sc->sc_flags & CCDF_MIRROR)) { 8143a3fcd72SPoul-Henning Kamp printf("%s: disabling mirror, interleave is 0\n", gp->name); 8153a3fcd72SPoul-Henning Kamp sc->sc_flags &= ~(CCDF_MIRROR); 8163a3fcd72SPoul-Henning Kamp } 8173a3fcd72SPoul-Henning Kamp 8183a3fcd72SPoul-Henning Kamp if ((sc->sc_flags & CCDF_MIRROR) && !(sc->sc_flags & CCDF_UNIFORM)) { 8193a3fcd72SPoul-Henning Kamp printf("%s: mirror/parity forces uniform flag\n", gp->name); 8203a3fcd72SPoul-Henning Kamp sc->sc_flags |= CCDF_UNIFORM; 8213a3fcd72SPoul-Henning Kamp } 8223a3fcd72SPoul-Henning Kamp 8233a3fcd72SPoul-Henning Kamp error = ccdinit(req, sc); 8243a3fcd72SPoul-Henning Kamp if (error != 0) { 8253a3fcd72SPoul-Henning Kamp g_ccd_freesc(sc); 8263a3fcd72SPoul-Henning Kamp gp->softc = NULL; 8273a3fcd72SPoul-Henning Kamp g_wither_geom(gp, ENXIO); 8283a3fcd72SPoul-Henning Kamp return; 8293a3fcd72SPoul-Henning Kamp } 8303a3fcd72SPoul-Henning Kamp 8313a3fcd72SPoul-Henning Kamp pp = g_new_providerf(gp, "%s", gp->name); 8323a3fcd72SPoul-Henning Kamp pp->mediasize = sc->sc_size * (off_t)sc->sc_secsize; 8333a3fcd72SPoul-Henning Kamp pp->sectorsize = sc->sc_secsize; 8343a3fcd72SPoul-Henning Kamp g_error_provider(pp, 0); 835189337d8SPoul-Henning Kamp 8362616144eSDag-Erling Smørgrav sb = sbuf_new_auto(); 8373a3fcd72SPoul-Henning Kamp sbuf_printf(sb, "ccd%d: %d components ", sc->sc_unit, *nprovider); 8383a3fcd72SPoul-Henning Kamp for (i = 0; i < *nprovider; i++) { 8393a3fcd72SPoul-Henning Kamp sbuf_printf(sb, "%s%s", 8403a3fcd72SPoul-Henning Kamp i == 0 ? "(" : ", ", 8413a3fcd72SPoul-Henning Kamp sc->sc_cinfo[i].ci_provider->name); 8423a3fcd72SPoul-Henning Kamp } 8433a3fcd72SPoul-Henning Kamp sbuf_printf(sb, "), %jd blocks ", (off_t)pp->mediasize / DEV_BSIZE); 8443a3fcd72SPoul-Henning Kamp if (sc->sc_ileave != 0) 8453a3fcd72SPoul-Henning Kamp sbuf_printf(sb, "interleaved at %d blocks\n", 8463a3fcd72SPoul-Henning Kamp sc->sc_ileave); 8473a3fcd72SPoul-Henning Kamp else 8483a3fcd72SPoul-Henning Kamp sbuf_printf(sb, "concatenated\n"); 8493a3fcd72SPoul-Henning Kamp sbuf_finish(sb); 85041063f93SMarcel Moolenaar gctl_set_param_err(req, "output", sbuf_data(sb), sbuf_len(sb) + 1); 8513a3fcd72SPoul-Henning Kamp sbuf_delete(sb); 8523a3fcd72SPoul-Henning Kamp } 8533a3fcd72SPoul-Henning Kamp 854f6367971SPoul-Henning Kamp static int 855f6367971SPoul-Henning Kamp g_ccd_destroy_geom(struct gctl_req *req, struct g_class *mp, struct g_geom *gp) 8563a3fcd72SPoul-Henning Kamp { 8573a3fcd72SPoul-Henning Kamp struct g_provider *pp; 8583a3fcd72SPoul-Henning Kamp struct ccd_s *sc; 8593a3fcd72SPoul-Henning Kamp 8603a3fcd72SPoul-Henning Kamp g_topology_assert(); 8613a3fcd72SPoul-Henning Kamp sc = gp->softc; 8623a3fcd72SPoul-Henning Kamp pp = LIST_FIRST(&gp->provider); 863f6367971SPoul-Henning Kamp if (sc == NULL || pp == NULL) 864f6367971SPoul-Henning Kamp return (EBUSY); 8653a3fcd72SPoul-Henning Kamp if (pp->acr != 0 || pp->acw != 0 || pp->ace != 0) { 8663a3fcd72SPoul-Henning Kamp gctl_error(req, "%s is open(r%dw%de%d)", gp->name, 8673a3fcd72SPoul-Henning Kamp pp->acr, pp->acw, pp->ace); 868f6367971SPoul-Henning Kamp return (EBUSY); 8693a3fcd72SPoul-Henning Kamp } 8703a3fcd72SPoul-Henning Kamp g_ccd_freesc(sc); 8713a3fcd72SPoul-Henning Kamp gp->softc = NULL; 8723a3fcd72SPoul-Henning Kamp g_wither_geom(gp, ENXIO); 873f6367971SPoul-Henning Kamp return (0); 8743a3fcd72SPoul-Henning Kamp } 8753a3fcd72SPoul-Henning Kamp 8763a3fcd72SPoul-Henning Kamp static void 8773a3fcd72SPoul-Henning Kamp g_ccd_list(struct gctl_req *req, struct g_class *mp) 8783a3fcd72SPoul-Henning Kamp { 8793a3fcd72SPoul-Henning Kamp struct sbuf *sb; 8803a3fcd72SPoul-Henning Kamp struct ccd_s *cs; 8813a3fcd72SPoul-Henning Kamp struct g_geom *gp; 8823a3fcd72SPoul-Henning Kamp int i, unit, *up; 8833a3fcd72SPoul-Henning Kamp 884251048a1SUlf Lilleengen up = gctl_get_paraml(req, "unit", sizeof (*up)); 885251048a1SUlf Lilleengen if (up == NULL) { 886251048a1SUlf Lilleengen gctl_error(req, "unit parameter not given"); 887251048a1SUlf Lilleengen return; 888251048a1SUlf Lilleengen } 8893a3fcd72SPoul-Henning Kamp unit = *up; 8902616144eSDag-Erling Smørgrav sb = sbuf_new_auto(); 8913a3fcd72SPoul-Henning Kamp LIST_FOREACH(gp, &mp->geom, geom) { 8923a3fcd72SPoul-Henning Kamp cs = gp->softc; 89392b5e86eSPoul-Henning Kamp if (cs == NULL || (unit >= 0 && unit != cs->sc_unit)) 8940f557e0aSPoul-Henning Kamp continue; 895189337d8SPoul-Henning Kamp sbuf_printf(sb, "ccd%d\t\t%d\t%d\t", 8963a3fcd72SPoul-Henning Kamp cs->sc_unit, cs->sc_ileave, cs->sc_flags & CCDF_USERMASK); 897189337d8SPoul-Henning Kamp 8983a3fcd72SPoul-Henning Kamp for (i = 0; i < cs->sc_ndisks; ++i) { 8993a3fcd72SPoul-Henning Kamp sbuf_printf(sb, "%s/dev/%s", i == 0 ? "" : " ", 9003a3fcd72SPoul-Henning Kamp cs->sc_cinfo[i].ci_provider->name); 901189337d8SPoul-Henning Kamp } 902189337d8SPoul-Henning Kamp sbuf_printf(sb, "\n"); 903189337d8SPoul-Henning Kamp } 904189337d8SPoul-Henning Kamp sbuf_finish(sb); 90541063f93SMarcel Moolenaar gctl_set_param_err(req, "output", sbuf_data(sb), sbuf_len(sb) + 1); 9063a3fcd72SPoul-Henning Kamp sbuf_delete(sb); 907189337d8SPoul-Henning Kamp } 908189337d8SPoul-Henning Kamp 909189337d8SPoul-Henning Kamp static void 910189337d8SPoul-Henning Kamp g_ccd_config(struct gctl_req *req, struct g_class *mp, char const *verb) 911189337d8SPoul-Henning Kamp { 912f6367971SPoul-Henning Kamp struct g_geom *gp; 913189337d8SPoul-Henning Kamp 914189337d8SPoul-Henning Kamp g_topology_assert(); 915189337d8SPoul-Henning Kamp if (!strcmp(verb, "create geom")) { 9163a3fcd72SPoul-Henning Kamp g_ccd_create(req, mp); 917189337d8SPoul-Henning Kamp } else if (!strcmp(verb, "destroy geom")) { 918f6367971SPoul-Henning Kamp gp = gctl_get_geom(req, mp, "geom"); 919f6367971SPoul-Henning Kamp if (gp != NULL) 920f6367971SPoul-Henning Kamp g_ccd_destroy_geom(req, mp, gp); 921189337d8SPoul-Henning Kamp } else if (!strcmp(verb, "list")) { 9223a3fcd72SPoul-Henning Kamp g_ccd_list(req, mp); 923189337d8SPoul-Henning Kamp } else { 924189337d8SPoul-Henning Kamp gctl_error(req, "unknown verb"); 925189337d8SPoul-Henning Kamp } 926189337d8SPoul-Henning Kamp } 927189337d8SPoul-Henning Kamp 928189337d8SPoul-Henning Kamp static struct g_class g_ccd_class = { 929189337d8SPoul-Henning Kamp .name = "CCD", 9305721c9c7SPoul-Henning Kamp .version = G_VERSION, 931189337d8SPoul-Henning Kamp .ctlreq = g_ccd_config, 932f6367971SPoul-Henning Kamp .destroy_geom = g_ccd_destroy_geom, 933650ee351SPoul-Henning Kamp .start = g_ccd_start, 934650ee351SPoul-Henning Kamp .orphan = g_ccd_orphan, 935650ee351SPoul-Henning Kamp .access = g_ccd_access, 936189337d8SPoul-Henning Kamp }; 937189337d8SPoul-Henning Kamp 938189337d8SPoul-Henning Kamp DECLARE_GEOM_CLASS(g_ccd_class, g_ccd); 939*74d6c131SKyle Evans MODULE_VERSION(geom_ccd, 0); 940