1da9e4f55SPoul-Henning Kamp /* 2da9e4f55SPoul-Henning Kamp * ---------------------------------------------------------------------------- 3da9e4f55SPoul-Henning Kamp * "THE BEER-WARE LICENSE" (Revision 42): 4da9e4f55SPoul-Henning Kamp * <phk@FreeBSD.ORG> wrote this file. As long as you retain this notice you 5da9e4f55SPoul-Henning Kamp * can do whatever you want with this stuff. If we meet some day, and you think 6da9e4f55SPoul-Henning Kamp * this stuff is worth it, you can buy me a beer in return. Poul-Henning Kamp 7da9e4f55SPoul-Henning Kamp * ---------------------------------------------------------------------------- 8da9e4f55SPoul-Henning Kamp * 9da9e4f55SPoul-Henning Kamp * $FreeBSD$ 10da9e4f55SPoul-Henning Kamp * 11da9e4f55SPoul-Henning Kamp */ 12da9e4f55SPoul-Henning Kamp 13417fb7f6SPoul-Henning Kamp #include "opt_geom.h" 14417fb7f6SPoul-Henning Kamp 15da9e4f55SPoul-Henning Kamp #include <sys/param.h> 16da9e4f55SPoul-Henning Kamp #include <sys/systm.h> 17f90c382cSPoul-Henning Kamp #include <sys/stdint.h> 189626b608SPoul-Henning Kamp #include <sys/bio.h> 19da9e4f55SPoul-Henning Kamp #include <sys/conf.h> 20da9e4f55SPoul-Henning Kamp #include <sys/disk.h> 217812d86fSPoul-Henning Kamp #include <sys/disklabel.h> 22f90c382cSPoul-Henning Kamp 23f90c382cSPoul-Henning Kamp /*- 24f90c382cSPoul-Henning Kamp * Disk error is the preface to plaintive error messages 25f90c382cSPoul-Henning Kamp * about failing disk transfers. It prints messages of the form 26f90c382cSPoul-Henning Kamp * "hp0g: BLABLABLA cmd=read fsbn 12345 of 12344-12347" 27f90c382cSPoul-Henning Kamp * blkdone should be -1 if the position of the error is unknown. 28f90c382cSPoul-Henning Kamp * The message is printed with printf. 29f90c382cSPoul-Henning Kamp */ 30f90c382cSPoul-Henning Kamp void 31f90c382cSPoul-Henning Kamp disk_err(struct bio *bp, const char *what, int blkdone, int nl) 32f90c382cSPoul-Henning Kamp { 33f90c382cSPoul-Henning Kamp daddr_t sn; 34f90c382cSPoul-Henning Kamp 35a9463ba8SPoul-Henning Kamp if (bp->bio_dev != NULL) 36f90c382cSPoul-Henning Kamp printf("%s: %s ", devtoname(bp->bio_dev), what); 37a9463ba8SPoul-Henning Kamp else if (bp->bio_disk != NULL) 38a9463ba8SPoul-Henning Kamp printf("%s%d: %s ", 39a9463ba8SPoul-Henning Kamp bp->bio_disk->d_name, bp->bio_disk->d_unit, what); 40a9463ba8SPoul-Henning Kamp else 41a9463ba8SPoul-Henning Kamp printf("disk??: %s ", what); 42f90c382cSPoul-Henning Kamp switch(bp->bio_cmd) { 43f90c382cSPoul-Henning Kamp case BIO_READ: printf("cmd=read "); break; 44f90c382cSPoul-Henning Kamp case BIO_WRITE: printf("cmd=write "); break; 45f90c382cSPoul-Henning Kamp case BIO_DELETE: printf("cmd=delete "); break; 46f90c382cSPoul-Henning Kamp case BIO_GETATTR: printf("cmd=getattr "); break; 47f90c382cSPoul-Henning Kamp case BIO_SETATTR: printf("cmd=setattr "); break; 48f90c382cSPoul-Henning Kamp default: printf("cmd=%x ", bp->bio_cmd); break; 49f90c382cSPoul-Henning Kamp } 50f90c382cSPoul-Henning Kamp sn = bp->bio_blkno; 51f90c382cSPoul-Henning Kamp if (bp->bio_bcount <= DEV_BSIZE) { 52f90c382cSPoul-Henning Kamp printf("fsbn %jd%s", (intmax_t)sn, nl ? "\n" : ""); 53f90c382cSPoul-Henning Kamp return; 54f90c382cSPoul-Henning Kamp } 55f90c382cSPoul-Henning Kamp if (blkdone >= 0) { 56f90c382cSPoul-Henning Kamp sn += blkdone; 57f90c382cSPoul-Henning Kamp printf("fsbn %jd of ", (intmax_t)sn); 58f90c382cSPoul-Henning Kamp } 59f90c382cSPoul-Henning Kamp printf("%jd-%jd", (intmax_t)bp->bio_blkno, 60f90c382cSPoul-Henning Kamp (intmax_t)(bp->bio_blkno + (bp->bio_bcount - 1) / DEV_BSIZE)); 61f90c382cSPoul-Henning Kamp if (nl) 62f90c382cSPoul-Henning Kamp printf("\n"); 63f90c382cSPoul-Henning Kamp } 642382fb0aSPoul-Henning Kamp 652382fb0aSPoul-Henning Kamp /* 662382fb0aSPoul-Henning Kamp * Seek sort for disks. 672382fb0aSPoul-Henning Kamp * 682382fb0aSPoul-Henning Kamp * The buf_queue keep two queues, sorted in ascending block order. The first 692382fb0aSPoul-Henning Kamp * queue holds those requests which are positioned after the current block 702382fb0aSPoul-Henning Kamp * (in the first request); the second, which starts at queue->switch_point, 712382fb0aSPoul-Henning Kamp * holds requests which came in after their block number was passed. Thus 722382fb0aSPoul-Henning Kamp * we implement a one way scan, retracting after reaching the end of the drive 732382fb0aSPoul-Henning Kamp * to the first request on the second queue, at which time it becomes the 742382fb0aSPoul-Henning Kamp * first queue. 752382fb0aSPoul-Henning Kamp * 762382fb0aSPoul-Henning Kamp * A one-way scan is natural because of the way UNIX read-ahead blocks are 772382fb0aSPoul-Henning Kamp * allocated. 782382fb0aSPoul-Henning Kamp */ 792382fb0aSPoul-Henning Kamp 802382fb0aSPoul-Henning Kamp void 812382fb0aSPoul-Henning Kamp bioq_disksort(bioq, bp) 822382fb0aSPoul-Henning Kamp struct bio_queue_head *bioq; 832382fb0aSPoul-Henning Kamp struct bio *bp; 842382fb0aSPoul-Henning Kamp { 852382fb0aSPoul-Henning Kamp struct bio *bq; 862382fb0aSPoul-Henning Kamp struct bio *bn; 872382fb0aSPoul-Henning Kamp struct bio *be; 882382fb0aSPoul-Henning Kamp 892382fb0aSPoul-Henning Kamp if (!atomic_cmpset_int(&bioq->busy, 0, 1)) 902382fb0aSPoul-Henning Kamp panic("Recursing in bioq_disksort()"); 912382fb0aSPoul-Henning Kamp be = TAILQ_LAST(&bioq->queue, bio_queue); 922382fb0aSPoul-Henning Kamp /* 932382fb0aSPoul-Henning Kamp * If the queue is empty or we are an 942382fb0aSPoul-Henning Kamp * ordered transaction, then it's easy. 952382fb0aSPoul-Henning Kamp */ 962382fb0aSPoul-Henning Kamp if ((bq = bioq_first(bioq)) == NULL) { 972382fb0aSPoul-Henning Kamp bioq_insert_tail(bioq, bp); 982382fb0aSPoul-Henning Kamp bioq->busy = 0; 992382fb0aSPoul-Henning Kamp return; 1002382fb0aSPoul-Henning Kamp } else if (bioq->insert_point != NULL) { 1012382fb0aSPoul-Henning Kamp 1022382fb0aSPoul-Henning Kamp /* 1032382fb0aSPoul-Henning Kamp * A certain portion of the list is 1042382fb0aSPoul-Henning Kamp * "locked" to preserve ordering, so 1052382fb0aSPoul-Henning Kamp * we can only insert after the insert 1062382fb0aSPoul-Henning Kamp * point. 1072382fb0aSPoul-Henning Kamp */ 1082382fb0aSPoul-Henning Kamp bq = bioq->insert_point; 1092382fb0aSPoul-Henning Kamp } else { 1102382fb0aSPoul-Henning Kamp 1112382fb0aSPoul-Henning Kamp /* 1122382fb0aSPoul-Henning Kamp * If we lie before the last removed (currently active) 1132382fb0aSPoul-Henning Kamp * request, and are not inserting ourselves into the 1142382fb0aSPoul-Henning Kamp * "locked" portion of the list, then we must add ourselves 1152382fb0aSPoul-Henning Kamp * to the second request list. 1162382fb0aSPoul-Henning Kamp */ 1172382fb0aSPoul-Henning Kamp if (bp->bio_pblkno < bioq->last_pblkno) { 1182382fb0aSPoul-Henning Kamp 1192382fb0aSPoul-Henning Kamp bq = bioq->switch_point; 1202382fb0aSPoul-Henning Kamp /* 1212382fb0aSPoul-Henning Kamp * If we are starting a new secondary list, 1222382fb0aSPoul-Henning Kamp * then it's easy. 1232382fb0aSPoul-Henning Kamp */ 1242382fb0aSPoul-Henning Kamp if (bq == NULL) { 1252382fb0aSPoul-Henning Kamp bioq->switch_point = bp; 1262382fb0aSPoul-Henning Kamp bioq_insert_tail(bioq, bp); 1272382fb0aSPoul-Henning Kamp bioq->busy = 0; 1282382fb0aSPoul-Henning Kamp return; 1292382fb0aSPoul-Henning Kamp } 1302382fb0aSPoul-Henning Kamp /* 1312382fb0aSPoul-Henning Kamp * If we lie ahead of the current switch point, 1322382fb0aSPoul-Henning Kamp * insert us before the switch point and move 1332382fb0aSPoul-Henning Kamp * the switch point. 1342382fb0aSPoul-Henning Kamp */ 1352382fb0aSPoul-Henning Kamp if (bp->bio_pblkno < bq->bio_pblkno) { 1362382fb0aSPoul-Henning Kamp bioq->switch_point = bp; 1372382fb0aSPoul-Henning Kamp TAILQ_INSERT_BEFORE(bq, bp, bio_queue); 1382382fb0aSPoul-Henning Kamp bioq->busy = 0; 1392382fb0aSPoul-Henning Kamp return; 1402382fb0aSPoul-Henning Kamp } 1412382fb0aSPoul-Henning Kamp } else { 1422382fb0aSPoul-Henning Kamp if (bioq->switch_point != NULL) 1432382fb0aSPoul-Henning Kamp be = TAILQ_PREV(bioq->switch_point, 1442382fb0aSPoul-Henning Kamp bio_queue, bio_queue); 1452382fb0aSPoul-Henning Kamp /* 1462382fb0aSPoul-Henning Kamp * If we lie between last_pblkno and bq, 1472382fb0aSPoul-Henning Kamp * insert before bq. 1482382fb0aSPoul-Henning Kamp */ 1492382fb0aSPoul-Henning Kamp if (bp->bio_pblkno < bq->bio_pblkno) { 1502382fb0aSPoul-Henning Kamp TAILQ_INSERT_BEFORE(bq, bp, bio_queue); 1512382fb0aSPoul-Henning Kamp bioq->busy = 0; 1522382fb0aSPoul-Henning Kamp return; 1532382fb0aSPoul-Henning Kamp } 1542382fb0aSPoul-Henning Kamp } 1552382fb0aSPoul-Henning Kamp } 1562382fb0aSPoul-Henning Kamp 1572382fb0aSPoul-Henning Kamp /* 1582382fb0aSPoul-Henning Kamp * Request is at/after our current position in the list. 1592382fb0aSPoul-Henning Kamp * Optimize for sequential I/O by seeing if we go at the tail. 1602382fb0aSPoul-Henning Kamp */ 1612382fb0aSPoul-Henning Kamp if (bp->bio_pblkno > be->bio_pblkno) { 1622382fb0aSPoul-Henning Kamp TAILQ_INSERT_AFTER(&bioq->queue, be, bp, bio_queue); 1632382fb0aSPoul-Henning Kamp bioq->busy = 0; 1642382fb0aSPoul-Henning Kamp return; 1652382fb0aSPoul-Henning Kamp } 1662382fb0aSPoul-Henning Kamp 1672382fb0aSPoul-Henning Kamp /* Otherwise, insertion sort */ 1682382fb0aSPoul-Henning Kamp while ((bn = TAILQ_NEXT(bq, bio_queue)) != NULL) { 1692382fb0aSPoul-Henning Kamp 1702382fb0aSPoul-Henning Kamp /* 1712382fb0aSPoul-Henning Kamp * We want to go after the current request if it is the end 1722382fb0aSPoul-Henning Kamp * of the first request list, or if the next request is a 1732382fb0aSPoul-Henning Kamp * larger cylinder than our request. 1742382fb0aSPoul-Henning Kamp */ 1752382fb0aSPoul-Henning Kamp if (bn == bioq->switch_point 1762382fb0aSPoul-Henning Kamp || bp->bio_pblkno < bn->bio_pblkno) 1772382fb0aSPoul-Henning Kamp break; 1782382fb0aSPoul-Henning Kamp bq = bn; 1792382fb0aSPoul-Henning Kamp } 1802382fb0aSPoul-Henning Kamp TAILQ_INSERT_AFTER(&bioq->queue, bq, bp, bio_queue); 1812382fb0aSPoul-Henning Kamp bioq->busy = 0; 1822382fb0aSPoul-Henning Kamp } 1832382fb0aSPoul-Henning Kamp 1842382fb0aSPoul-Henning Kamp 185