1 /*- 2 * Copyright (c) 1998 Robert Nordier 3 * All rights reserved. 4 * 5 * Redistribution and use in source and binary forms are freely 6 * permitted provided that the above copyright notice and this 7 * paragraph and the following disclaimer are duplicated in all 8 * such forms. 9 * 10 * This software is provided "AS IS" and without any express or 11 * implied warranties, including, without limitation, the implied 12 * warranties of merchantability and fitness for a particular 13 * purpose. 14 */ 15 16 #include <sys/cdefs.h> 17 __FBSDID("$FreeBSD$"); 18 19 #include "stand.h" 20 21 #include <sys/param.h> 22 #include <sys/errno.h> 23 #include <sys/diskmbr.h> 24 #ifdef GPT 25 #include <sys/gpt.h> 26 #endif 27 #include <sys/reboot.h> 28 #include <sys/queue.h> 29 30 #include <machine/bootinfo.h> 31 #include <machine/elf.h> 32 #include <machine/pc/bios.h> 33 34 #include <stdarg.h> 35 #include <stddef.h> 36 37 #include <a.out.h> 38 39 #include <btxv86.h> 40 41 #include "lib.h" 42 #include "rbx.h" 43 #include "drv.h" 44 #include "edd.h" 45 #include "cons.h" 46 #include "bootargs.h" 47 #include "paths.h" 48 49 #include "libzfs.h" 50 51 #define ARGS 0x900 52 #define NOPT 14 53 #define NDEV 3 54 55 #define BIOS_NUMDRIVES 0x475 56 #define DRV_HARD 0x80 57 #define DRV_MASK 0x7f 58 59 #define TYPE_AD 0 60 #define TYPE_DA 1 61 #define TYPE_MAXHARD TYPE_DA 62 #define TYPE_FD 2 63 64 #define DEV_GELIBOOT_BSIZE 4096 65 66 extern uint32_t _end; 67 68 #ifdef GPT 69 static const uuid_t freebsd_zfs_uuid = GPT_ENT_TYPE_FREEBSD_ZFS; 70 #endif 71 static const char optstr[NOPT] = "DhaCcdgmnpqrsv"; /* Also 'P', 'S' */ 72 static const unsigned char flags[NOPT] = { 73 RBX_DUAL, 74 RBX_SERIAL, 75 RBX_ASKNAME, 76 RBX_CDROM, 77 RBX_CONFIG, 78 RBX_KDB, 79 RBX_GDB, 80 RBX_MUTE, 81 RBX_NOINTR, 82 RBX_PAUSE, 83 RBX_QUIET, 84 RBX_DFLTROOT, 85 RBX_SINGLE, 86 RBX_VERBOSE 87 }; 88 uint32_t opts; 89 90 static const unsigned char dev_maj[NDEV] = {30, 4, 2}; 91 92 static char cmd[512]; 93 static char cmddup[512]; 94 static char kname[1024]; 95 static char rootname[256]; 96 static int comspeed = SIOSPD; 97 static struct bootinfo bootinfo; 98 static uint32_t bootdev; 99 static struct zfs_boot_args zfsargs; 100 101 vm_offset_t high_heap_base; 102 uint32_t bios_basemem, bios_extmem, high_heap_size; 103 104 static struct bios_smap smap; 105 106 /* 107 * The minimum amount of memory to reserve in bios_extmem for the heap. 108 */ 109 #define HEAP_MIN (64 * 1024 * 1024) 110 111 static char *heap_next; 112 static char *heap_end; 113 114 /* Buffers that must not span a 64k boundary. */ 115 #define READ_BUF_SIZE 8192 116 struct dmadat { 117 char rdbuf[READ_BUF_SIZE]; /* for reading large things */ 118 char secbuf[READ_BUF_SIZE]; /* for MBR/disklabel */ 119 }; 120 static struct dmadat *dmadat; 121 122 void exit(int); 123 void reboot(void); 124 static void load(void); 125 static int parse_cmd(void); 126 static void bios_getmem(void); 127 int main(void); 128 129 #ifdef LOADER_GELI_SUPPORT 130 #include "geliboot.h" 131 static char gelipw[GELI_PW_MAXLEN]; 132 #endif 133 134 struct zfsdsk { 135 struct dsk dsk; 136 #ifdef LOADER_GELI_SUPPORT 137 struct geli_dev *gdev; 138 #endif 139 }; 140 141 #include "zfsimpl.c" 142 143 /* 144 * Read from a dnode (which must be from a ZPL filesystem). 145 */ 146 static int 147 zfs_read(spa_t *spa, const dnode_phys_t *dnode, off_t *offp, void *start, size_t size) 148 { 149 const znode_phys_t *zp = (const znode_phys_t *) dnode->dn_bonus; 150 size_t n; 151 int rc; 152 153 n = size; 154 if (*offp + n > zp->zp_size) 155 n = zp->zp_size - *offp; 156 157 rc = dnode_read(spa, dnode, *offp, start, n); 158 if (rc) 159 return (-1); 160 *offp += n; 161 162 return (n); 163 } 164 165 /* 166 * Current ZFS pool 167 */ 168 static spa_t *spa; 169 static spa_t *primary_spa; 170 static vdev_t *primary_vdev; 171 172 /* 173 * A wrapper for dskread that doesn't have to worry about whether the 174 * buffer pointer crosses a 64k boundary. 175 */ 176 static int 177 vdev_read(void *xvdev, void *priv, off_t off, void *buf, size_t bytes) 178 { 179 char *p; 180 daddr_t lba, alignlba; 181 off_t diff; 182 unsigned int nb, alignnb; 183 struct zfsdsk *zdsk = (struct zfsdsk *) priv; 184 185 if ((off & (DEV_BSIZE - 1)) || (bytes & (DEV_BSIZE - 1))) 186 return -1; 187 188 p = buf; 189 lba = off / DEV_BSIZE; 190 lba += zdsk->dsk.start; 191 /* 192 * Align reads to 4k else 4k sector GELIs will not decrypt. 193 * Round LBA down to nearest multiple of DEV_GELIBOOT_BSIZE bytes. 194 */ 195 alignlba = rounddown2(off, DEV_GELIBOOT_BSIZE) / DEV_BSIZE; 196 /* 197 * The read must be aligned to DEV_GELIBOOT_BSIZE bytes relative to the 198 * start of the GELI partition, not the start of the actual disk. 199 */ 200 alignlba += zdsk->dsk.start; 201 diff = (lba - alignlba) * DEV_BSIZE; 202 203 while (bytes > 0) { 204 nb = bytes / DEV_BSIZE; 205 /* 206 * Ensure that the read size plus the leading offset does not 207 * exceed the size of the read buffer. 208 */ 209 if (nb > (READ_BUF_SIZE - diff) / DEV_BSIZE) 210 nb = (READ_BUF_SIZE - diff) / DEV_BSIZE; 211 /* 212 * Round the number of blocks to read up to the nearest multiple 213 * of DEV_GELIBOOT_BSIZE. 214 */ 215 alignnb = roundup2(nb * DEV_BSIZE + diff, DEV_GELIBOOT_BSIZE) 216 / DEV_BSIZE; 217 218 if (zdsk->dsk.size > 0 && alignlba + alignnb > 219 zdsk->dsk.size + zdsk->dsk.start) { 220 printf("Shortening read at %lld from %d to %lld\n", 221 alignlba, alignnb, 222 (zdsk->dsk.size + zdsk->dsk.start) - alignlba); 223 alignnb = (zdsk->dsk.size + zdsk->dsk.start) - alignlba; 224 } 225 226 if (drvread(&zdsk->dsk, dmadat->rdbuf, alignlba, alignnb)) 227 return -1; 228 #ifdef LOADER_GELI_SUPPORT 229 /* decrypt */ 230 if (zdsk->gdev != NULL) { 231 if (geli_read(zdsk->gdev, ((alignlba - zdsk->dsk.start) * 232 DEV_BSIZE), dmadat->rdbuf, alignnb * DEV_BSIZE)) 233 return (-1); 234 } 235 #endif 236 memcpy(p, dmadat->rdbuf + diff, nb * DEV_BSIZE); 237 p += nb * DEV_BSIZE; 238 lba += nb; 239 alignlba += alignnb; 240 bytes -= nb * DEV_BSIZE; 241 /* Don't need the leading offset after the first block. */ 242 diff = 0; 243 } 244 245 return 0; 246 } 247 /* Match the signature exactly due to signature madness */ 248 static int 249 vdev_read2(vdev_t *vdev, void *priv, off_t off, void *buf, size_t bytes) 250 { 251 return vdev_read(vdev, priv, off, buf, bytes); 252 } 253 254 255 static int 256 vdev_write(vdev_t *vdev, void *priv, off_t off, void *buf, size_t bytes) 257 { 258 char *p; 259 daddr_t lba; 260 unsigned int nb; 261 struct zfsdsk *zdsk = (struct zfsdsk *) priv; 262 263 if ((off & (DEV_BSIZE - 1)) || (bytes & (DEV_BSIZE - 1))) 264 return -1; 265 266 p = buf; 267 lba = off / DEV_BSIZE; 268 lba += zdsk->dsk.start; 269 while (bytes > 0) { 270 nb = bytes / DEV_BSIZE; 271 if (nb > READ_BUF_SIZE / DEV_BSIZE) 272 nb = READ_BUF_SIZE / DEV_BSIZE; 273 memcpy(dmadat->rdbuf, p, nb * DEV_BSIZE); 274 if (drvwrite(&zdsk->dsk, dmadat->rdbuf, lba, nb)) 275 return -1; 276 p += nb * DEV_BSIZE; 277 lba += nb; 278 bytes -= nb * DEV_BSIZE; 279 } 280 281 return 0; 282 } 283 284 static int 285 xfsread(const dnode_phys_t *dnode, off_t *offp, void *buf, size_t nbyte) 286 { 287 if ((size_t)zfs_read(spa, dnode, offp, buf, nbyte) != nbyte) { 288 printf("Invalid format\n"); 289 return -1; 290 } 291 return 0; 292 } 293 294 /* 295 * Read Pad2 (formerly "Boot Block Header") area of the first 296 * vdev label of the given vdev. 297 */ 298 static int 299 vdev_read_pad2(vdev_t *vdev, char *buf, size_t size) 300 { 301 blkptr_t bp; 302 char *tmp = zap_scratch; 303 off_t off = offsetof(vdev_label_t, vl_pad2); 304 305 if (size > VDEV_PAD_SIZE) 306 size = VDEV_PAD_SIZE; 307 308 BP_ZERO(&bp); 309 BP_SET_LSIZE(&bp, VDEV_PAD_SIZE); 310 BP_SET_PSIZE(&bp, VDEV_PAD_SIZE); 311 BP_SET_CHECKSUM(&bp, ZIO_CHECKSUM_LABEL); 312 BP_SET_COMPRESS(&bp, ZIO_COMPRESS_OFF); 313 DVA_SET_OFFSET(BP_IDENTITY(&bp), off); 314 if (vdev_read_phys(vdev, &bp, tmp, off, 0)) 315 return (EIO); 316 memcpy(buf, tmp, size); 317 return (0); 318 } 319 320 static int 321 vdev_clear_pad2(vdev_t *vdev) 322 { 323 char *zeroes = zap_scratch; 324 uint64_t *end; 325 off_t off = offsetof(vdev_label_t, vl_pad2); 326 327 memset(zeroes, 0, VDEV_PAD_SIZE); 328 end = (uint64_t *)(zeroes + VDEV_PAD_SIZE); 329 /* ZIO_CHECKSUM_LABEL magic and pre-calcualted checksum for all zeros */ 330 end[-5] = 0x0210da7ab10c7a11; 331 end[-4] = 0x97f48f807f6e2a3f; 332 end[-3] = 0xaf909f1658aacefc; 333 end[-2] = 0xcbd1ea57ff6db48b; 334 end[-1] = 0x6ec692db0d465fab; 335 if (vdev_write(vdev, vdev->v_read_priv, off, zeroes, VDEV_PAD_SIZE)) 336 return (EIO); 337 return (0); 338 } 339 340 static void 341 bios_getmem(void) 342 { 343 uint64_t size; 344 345 /* Parse system memory map */ 346 v86.ebx = 0; 347 do { 348 v86.ctl = V86_FLAGS; 349 v86.addr = 0x15; /* int 0x15 function 0xe820*/ 350 v86.eax = 0xe820; 351 v86.ecx = sizeof(struct bios_smap); 352 v86.edx = SMAP_SIG; 353 v86.es = VTOPSEG(&smap); 354 v86.edi = VTOPOFF(&smap); 355 v86int(); 356 if (V86_CY(v86.efl) || (v86.eax != SMAP_SIG)) 357 break; 358 /* look for a low-memory segment that's large enough */ 359 if ((smap.type == SMAP_TYPE_MEMORY) && (smap.base == 0) && 360 (smap.length >= (512 * 1024))) 361 bios_basemem = smap.length; 362 /* look for the first segment in 'extended' memory */ 363 if ((smap.type == SMAP_TYPE_MEMORY) && (smap.base == 0x100000)) { 364 bios_extmem = smap.length; 365 } 366 367 /* 368 * Look for the largest segment in 'extended' memory beyond 369 * 1MB but below 4GB. 370 */ 371 if ((smap.type == SMAP_TYPE_MEMORY) && (smap.base > 0x100000) && 372 (smap.base < 0x100000000ull)) { 373 size = smap.length; 374 375 /* 376 * If this segment crosses the 4GB boundary, truncate it. 377 */ 378 if (smap.base + size > 0x100000000ull) 379 size = 0x100000000ull - smap.base; 380 381 if (size > high_heap_size) { 382 high_heap_size = size; 383 high_heap_base = smap.base; 384 } 385 } 386 } while (v86.ebx != 0); 387 388 /* Fall back to the old compatibility function for base memory */ 389 if (bios_basemem == 0) { 390 v86.ctl = 0; 391 v86.addr = 0x12; /* int 0x12 */ 392 v86int(); 393 394 bios_basemem = (v86.eax & 0xffff) * 1024; 395 } 396 397 /* Fall back through several compatibility functions for extended memory */ 398 if (bios_extmem == 0) { 399 v86.ctl = V86_FLAGS; 400 v86.addr = 0x15; /* int 0x15 function 0xe801*/ 401 v86.eax = 0xe801; 402 v86int(); 403 if (!V86_CY(v86.efl)) { 404 bios_extmem = ((v86.ecx & 0xffff) + ((v86.edx & 0xffff) * 64)) * 1024; 405 } 406 } 407 if (bios_extmem == 0) { 408 v86.ctl = 0; 409 v86.addr = 0x15; /* int 0x15 function 0x88*/ 410 v86.eax = 0x8800; 411 v86int(); 412 bios_extmem = (v86.eax & 0xffff) * 1024; 413 } 414 415 /* 416 * If we have extended memory and did not find a suitable heap 417 * region in the SMAP, use the last 3MB of 'extended' memory as a 418 * high heap candidate. 419 */ 420 if (bios_extmem >= HEAP_MIN && high_heap_size < HEAP_MIN) { 421 high_heap_size = HEAP_MIN; 422 high_heap_base = bios_extmem + 0x100000 - HEAP_MIN; 423 } 424 } 425 426 /* 427 * Try to detect a device supported by the legacy int13 BIOS 428 */ 429 static int 430 int13probe(int drive) 431 { 432 v86.ctl = V86_FLAGS; 433 v86.addr = 0x13; 434 v86.eax = 0x800; 435 v86.edx = drive; 436 v86int(); 437 438 if (!V86_CY(v86.efl) && /* carry clear */ 439 ((v86.edx & 0xff) != (drive & DRV_MASK))) { /* unit # OK */ 440 if ((v86.ecx & 0x3f) == 0) { /* absurd sector size */ 441 return(0); /* skip device */ 442 } 443 return (1); 444 } 445 return(0); 446 } 447 448 /* 449 * We call this when we find a ZFS vdev - ZFS consumes the dsk 450 * structure so we must make a new one. 451 */ 452 static struct zfsdsk * 453 copy_dsk(struct zfsdsk *zdsk) 454 { 455 struct zfsdsk *newdsk; 456 457 newdsk = malloc(sizeof(struct zfsdsk)); 458 *newdsk = *zdsk; 459 return (newdsk); 460 } 461 462 /* 463 * Get disk size from eax=0x800 and 0x4800. We need to probe both 464 * because 0x4800 may not be available and we would like to get more 465 * or less correct disk size - if it is possible at all. 466 * Note we do not really want to touch drv.c because that code is shared 467 * with boot2 and we can not afford to grow that code. 468 */ 469 static uint64_t 470 drvsize_ext(struct zfsdsk *zdsk) 471 { 472 struct dsk *dskp; 473 uint64_t size, tmp; 474 int cyl, hds, sec; 475 476 dskp = &zdsk->dsk; 477 478 v86.ctl = V86_FLAGS; 479 v86.addr = 0x13; 480 v86.eax = 0x800; 481 v86.edx = dskp->drive; 482 v86int(); 483 484 /* Don't error out if we get bad sector number, try EDD as well */ 485 if (V86_CY(v86.efl) || /* carry set */ 486 (v86.edx & 0xff) <= (unsigned)(dskp->drive & 0x7f)) /* unit # bad */ 487 return (0); 488 cyl = ((v86.ecx & 0xc0) << 2) + ((v86.ecx & 0xff00) >> 8) + 1; 489 /* Convert max head # -> # of heads */ 490 hds = ((v86.edx & 0xff00) >> 8) + 1; 491 sec = v86.ecx & 0x3f; 492 493 size = (uint64_t)cyl * hds * sec; 494 495 /* Determine if we can use EDD with this device. */ 496 v86.ctl = V86_FLAGS; 497 v86.addr = 0x13; 498 v86.eax = 0x4100; 499 v86.edx = dskp->drive; 500 v86.ebx = 0x55aa; 501 v86int(); 502 if (V86_CY(v86.efl) || /* carry set */ 503 (v86.ebx & 0xffff) != 0xaa55 || /* signature */ 504 (v86.ecx & EDD_INTERFACE_FIXED_DISK) == 0) 505 return (size); 506 507 tmp = drvsize(dskp); 508 if (tmp > size) 509 size = tmp; 510 511 return (size); 512 } 513 514 /* 515 * The "layered" ioctl to read disk/partition size. Unfortunately 516 * the zfsboot case is hardest, because we do not have full software 517 * stack available, so we need to do some manual work here. 518 */ 519 uint64_t 520 ldi_get_size(void *priv) 521 { 522 struct zfsdsk *zdsk = priv; 523 uint64_t size = zdsk->dsk.size; 524 525 if (zdsk->dsk.start == 0) 526 size = drvsize_ext(zdsk); 527 528 return (size * DEV_BSIZE); 529 } 530 531 static void 532 probe_drive(struct zfsdsk *zdsk) 533 { 534 #ifdef GPT 535 struct gpt_hdr hdr; 536 struct gpt_ent *ent; 537 unsigned part, entries_per_sec; 538 daddr_t slba; 539 #endif 540 #if defined(GPT) || defined(LOADER_GELI_SUPPORT) 541 daddr_t elba; 542 #endif 543 544 struct dos_partition *dp; 545 char *sec; 546 unsigned i; 547 548 #ifdef LOADER_GELI_SUPPORT 549 /* 550 * Taste the disk, if it is GELI encrypted, decrypt it then dig out the 551 * partition table and probe each slice/partition in turn for a vdev or 552 * GELI encrypted vdev. 553 */ 554 elba = drvsize_ext(zdsk); 555 if (elba > 0) { 556 elba--; 557 } 558 zdsk->gdev = geli_taste(vdev_read, zdsk, elba, "disk%u:0:"); 559 if ((zdsk->gdev != NULL) && (geli_havekey(zdsk->gdev) == 0)) 560 geli_passphrase(zdsk->gdev, gelipw); 561 #endif /* LOADER_GELI_SUPPORT */ 562 563 sec = dmadat->secbuf; 564 zdsk->dsk.start = 0; 565 566 #ifdef GPT 567 /* 568 * First check for GPT. 569 */ 570 if (drvread(&zdsk->dsk, sec, 1, 1)) { 571 return; 572 } 573 memcpy(&hdr, sec, sizeof(hdr)); 574 if (memcmp(hdr.hdr_sig, GPT_HDR_SIG, sizeof(hdr.hdr_sig)) != 0 || 575 hdr.hdr_lba_self != 1 || hdr.hdr_revision < 0x00010000 || 576 hdr.hdr_entsz < sizeof(*ent) || DEV_BSIZE % hdr.hdr_entsz != 0) { 577 goto trymbr; 578 } 579 580 /* 581 * Probe all GPT partitions for the presence of ZFS pools. We 582 * return the spa_t for the first we find (if requested). This 583 * will have the effect of booting from the first pool on the 584 * disk. 585 * 586 * If no vdev is found, GELI decrypting the device and try again 587 */ 588 entries_per_sec = DEV_BSIZE / hdr.hdr_entsz; 589 slba = hdr.hdr_lba_table; 590 elba = slba + hdr.hdr_entries / entries_per_sec; 591 while (slba < elba) { 592 zdsk->dsk.start = 0; 593 if (drvread(&zdsk->dsk, sec, slba, 1)) 594 return; 595 for (part = 0; part < entries_per_sec; part++) { 596 ent = (struct gpt_ent *)(sec + part * hdr.hdr_entsz); 597 if (memcmp(&ent->ent_type, &freebsd_zfs_uuid, 598 sizeof(uuid_t)) == 0) { 599 zdsk->dsk.start = ent->ent_lba_start; 600 zdsk->dsk.size = ent->ent_lba_end - ent->ent_lba_start + 1; 601 zdsk->dsk.slice = part + 1; 602 zdsk->dsk.part = 255; 603 if (vdev_probe(vdev_read2, zdsk, NULL) == 0) { 604 /* 605 * This slice had a vdev. We need a new dsk 606 * structure now since the vdev now owns this one. 607 */ 608 zdsk = copy_dsk(zdsk); 609 } 610 #ifdef LOADER_GELI_SUPPORT 611 else if ((zdsk->gdev = geli_taste(vdev_read, zdsk, 612 ent->ent_lba_end - ent->ent_lba_start, "disk%up%u:", 613 zdsk->dsk.unit, zdsk->dsk.slice)) != NULL) { 614 if (geli_havekey(zdsk->gdev) == 0 || 615 geli_passphrase(zdsk->gdev, gelipw) == 0) { 616 /* 617 * This slice has GELI, check it for ZFS. 618 */ 619 if (vdev_probe(vdev_read2, zdsk, NULL) == 0) { 620 /* 621 * This slice had a vdev. We need a new dsk 622 * structure now since the vdev now owns this one. 623 */ 624 zdsk = copy_dsk(zdsk); 625 } 626 break; 627 } 628 } 629 #endif /* LOADER_GELI_SUPPORT */ 630 } 631 } 632 slba++; 633 } 634 return; 635 trymbr: 636 #endif /* GPT */ 637 638 if (drvread(&zdsk->dsk, sec, DOSBBSECTOR, 1)) 639 return; 640 dp = (void *)(sec + DOSPARTOFF); 641 642 for (i = 0; i < NDOSPART; i++) { 643 if (!dp[i].dp_typ) 644 continue; 645 zdsk->dsk.start = dp[i].dp_start; 646 zdsk->dsk.size = dp[i].dp_size; 647 zdsk->dsk.slice = i + 1; 648 if (vdev_probe(vdev_read2, zdsk, NULL) == 0) { 649 zdsk = copy_dsk(zdsk); 650 } 651 #ifdef LOADER_GELI_SUPPORT 652 else if ((zdsk->gdev = geli_taste(vdev_read, zdsk, dp[i].dp_size - 653 dp[i].dp_start, "disk%us%u:")) != NULL) { 654 if (geli_havekey(zdsk->gdev) == 0 || 655 geli_passphrase(zdsk->gdev, gelipw) == 0) { 656 /* 657 * This slice has GELI, check it for ZFS. 658 */ 659 if (vdev_probe(vdev_read2, zdsk, NULL) == 0) { 660 /* 661 * This slice had a vdev. We need a new dsk 662 * structure now since the vdev now owns this one. 663 */ 664 zdsk = copy_dsk(zdsk); 665 } 666 break; 667 } 668 } 669 #endif /* LOADER_GELI_SUPPORT */ 670 } 671 } 672 673 int 674 main(void) 675 { 676 dnode_phys_t dn; 677 off_t off; 678 struct zfsdsk *zdsk; 679 int autoboot, i; 680 int nextboot; 681 int rc; 682 683 dmadat = (void *)(roundup2(__base + (int32_t)&_end, 0x10000) - __base); 684 685 bios_getmem(); 686 687 if (high_heap_size > 0) { 688 heap_end = PTOV(high_heap_base + high_heap_size); 689 heap_next = PTOV(high_heap_base); 690 } else { 691 heap_next = (char *)dmadat + sizeof(*dmadat); 692 heap_end = (char *)PTOV(bios_basemem); 693 } 694 setheap(heap_next, heap_end); 695 696 zdsk = calloc(1, sizeof(struct zfsdsk)); 697 zdsk->dsk.drive = *(uint8_t *)PTOV(ARGS); 698 zdsk->dsk.type = zdsk->dsk.drive & DRV_HARD ? TYPE_AD : TYPE_FD; 699 zdsk->dsk.unit = zdsk->dsk.drive & DRV_MASK; 700 zdsk->dsk.slice = *(uint8_t *)PTOV(ARGS + 1) + 1; 701 zdsk->dsk.part = 0; 702 zdsk->dsk.start = 0; 703 zdsk->dsk.size = drvsize_ext(zdsk); 704 705 bootinfo.bi_version = BOOTINFO_VERSION; 706 bootinfo.bi_size = sizeof(bootinfo); 707 bootinfo.bi_basemem = bios_basemem / 1024; 708 bootinfo.bi_extmem = bios_extmem / 1024; 709 bootinfo.bi_memsizes_valid++; 710 bootinfo.bi_bios_dev = zdsk->dsk.drive; 711 712 bootdev = MAKEBOOTDEV(dev_maj[zdsk->dsk.type], 713 zdsk->dsk.slice, zdsk->dsk.unit, zdsk->dsk.part); 714 715 /* Process configuration file */ 716 717 autoboot = 1; 718 719 zfs_init(); 720 721 /* 722 * Probe the boot drive first - we will try to boot from whatever 723 * pool we find on that drive. 724 */ 725 probe_drive(zdsk); 726 727 /* 728 * Probe the rest of the drives that the bios knows about. This 729 * will find any other available pools and it may fill in missing 730 * vdevs for the boot pool. 731 */ 732 #ifndef VIRTUALBOX 733 for (i = 0; i < *(unsigned char *)PTOV(BIOS_NUMDRIVES); i++) 734 #else 735 for (i = 0; i < MAXBDDEV; i++) 736 #endif 737 { 738 if ((i | DRV_HARD) == *(uint8_t *)PTOV(ARGS)) 739 continue; 740 741 if (!int13probe(i | DRV_HARD)) 742 break; 743 744 zdsk = calloc(1, sizeof(struct zfsdsk)); 745 zdsk->dsk.drive = i | DRV_HARD; 746 zdsk->dsk.type = zdsk->dsk.drive & TYPE_AD; 747 zdsk->dsk.unit = i; 748 zdsk->dsk.slice = 0; 749 zdsk->dsk.part = 0; 750 zdsk->dsk.start = 0; 751 zdsk->dsk.size = drvsize_ext(zdsk); 752 probe_drive(zdsk); 753 } 754 755 /* 756 * The first discovered pool, if any, is the pool. 757 */ 758 spa = spa_get_primary(); 759 if (!spa) { 760 printf("%s: No ZFS pools located, can't boot\n", BOOTPROG); 761 for (;;) 762 ; 763 } 764 765 primary_spa = spa; 766 primary_vdev = spa_get_primary_vdev(spa); 767 768 nextboot = 0; 769 rc = vdev_read_pad2(primary_vdev, cmd, sizeof(cmd)); 770 if (vdev_clear_pad2(primary_vdev)) 771 printf("failed to clear pad2 area of primary vdev\n"); 772 if (rc == 0) { 773 if (*cmd) { 774 /* 775 * We could find an old-style ZFS Boot Block header here. 776 * Simply ignore it. 777 */ 778 if (*(uint64_t *)cmd != 0x2f5b007b10c) { 779 /* 780 * Note that parse() is destructive to cmd[] and we also want 781 * to honor RBX_QUIET option that could be present in cmd[]. 782 */ 783 nextboot = 1; 784 memcpy(cmddup, cmd, sizeof(cmd)); 785 if (parse_cmd()) { 786 printf("failed to parse pad2 area of primary vdev\n"); 787 reboot(); 788 } 789 if (!OPT_CHECK(RBX_QUIET)) 790 printf("zfs nextboot: %s\n", cmddup); 791 } 792 /* Do not process this command twice */ 793 *cmd = 0; 794 } 795 } else 796 printf("failed to read pad2 area of primary vdev\n"); 797 798 /* Mount ZFS only if it's not already mounted via nextboot parsing. */ 799 if (zfsmount.spa == NULL && 800 (zfs_spa_init(spa) != 0 || zfs_mount(spa, 0, &zfsmount) != 0)) { 801 printf("%s: failed to mount default pool %s\n", 802 BOOTPROG, spa->spa_name); 803 autoboot = 0; 804 } else if (zfs_lookup(&zfsmount, PATH_CONFIG, &dn) == 0 || 805 zfs_lookup(&zfsmount, PATH_DOTCONFIG, &dn) == 0) { 806 off = 0; 807 zfs_read(spa, &dn, &off, cmd, sizeof(cmd)); 808 } 809 810 if (*cmd) { 811 /* 812 * Note that parse_cmd() is destructive to cmd[] and we also want 813 * to honor RBX_QUIET option that could be present in cmd[]. 814 */ 815 memcpy(cmddup, cmd, sizeof(cmd)); 816 if (parse_cmd()) 817 autoboot = 0; 818 if (!OPT_CHECK(RBX_QUIET)) 819 printf("%s: %s\n", PATH_CONFIG, cmddup); 820 /* Do not process this command twice */ 821 *cmd = 0; 822 } 823 824 /* Do not risk waiting at the prompt forever. */ 825 if (nextboot && !autoboot) 826 reboot(); 827 828 /* 829 * Try to exec /boot/loader. If interrupted by a keypress, 830 * or in case of failure, try to load a kernel directly instead. 831 */ 832 833 if (autoboot && !*kname) { 834 memcpy(kname, PATH_LOADER, sizeof(PATH_LOADER)); 835 if (!keyhit(3)) { 836 load(); 837 memcpy(kname, PATH_KERNEL, sizeof(PATH_KERNEL)); 838 } 839 } 840 841 /* Present the user with the boot2 prompt. */ 842 843 for (;;) { 844 if (!autoboot || !OPT_CHECK(RBX_QUIET)) { 845 printf("\nFreeBSD/x86 boot\n"); 846 if (zfs_rlookup(spa, zfsmount.rootobj, rootname) != 0) 847 printf("Default: %s/<0x%llx>:%s\n" 848 "boot: ", 849 spa->spa_name, zfsmount.rootobj, kname); 850 else if (rootname[0] != '\0') 851 printf("Default: %s/%s:%s\n" 852 "boot: ", 853 spa->spa_name, rootname, kname); 854 else 855 printf("Default: %s:%s\n" 856 "boot: ", 857 spa->spa_name, kname); 858 } 859 if (ioctrl & IO_SERIAL) 860 sio_flush(); 861 if (!autoboot || keyhit(5)) 862 getstr(cmd, sizeof(cmd)); 863 else if (!autoboot || !OPT_CHECK(RBX_QUIET)) 864 putchar('\n'); 865 autoboot = 0; 866 if (parse_cmd()) 867 putchar('\a'); 868 else 869 load(); 870 } 871 } 872 873 /* XXX - Needed for btxld to link the boot2 binary; do not remove. */ 874 void 875 exit(int x) 876 { 877 __exit(x); 878 } 879 880 void 881 reboot(void) 882 { 883 __exit(0); 884 } 885 886 static void 887 load(void) 888 { 889 union { 890 struct exec ex; 891 Elf32_Ehdr eh; 892 } hdr; 893 static Elf32_Phdr ep[2]; 894 static Elf32_Shdr es[2]; 895 caddr_t p; 896 dnode_phys_t dn; 897 off_t off; 898 uint32_t addr, x; 899 int fmt, i, j; 900 901 if (zfs_lookup(&zfsmount, kname, &dn)) { 902 printf("\nCan't find %s\n", kname); 903 return; 904 } 905 off = 0; 906 if (xfsread(&dn, &off, &hdr, sizeof(hdr))) 907 return; 908 if (N_GETMAGIC(hdr.ex) == ZMAGIC) 909 fmt = 0; 910 else if (IS_ELF(hdr.eh)) 911 fmt = 1; 912 else { 913 printf("Invalid %s\n", "format"); 914 return; 915 } 916 if (fmt == 0) { 917 addr = hdr.ex.a_entry & 0xffffff; 918 p = PTOV(addr); 919 off = PAGE_SIZE; 920 if (xfsread(&dn, &off, p, hdr.ex.a_text)) 921 return; 922 p += roundup2(hdr.ex.a_text, PAGE_SIZE); 923 if (xfsread(&dn, &off, p, hdr.ex.a_data)) 924 return; 925 p += hdr.ex.a_data + roundup2(hdr.ex.a_bss, PAGE_SIZE); 926 bootinfo.bi_symtab = VTOP(p); 927 memcpy(p, &hdr.ex.a_syms, sizeof(hdr.ex.a_syms)); 928 p += sizeof(hdr.ex.a_syms); 929 if (hdr.ex.a_syms) { 930 if (xfsread(&dn, &off, p, hdr.ex.a_syms)) 931 return; 932 p += hdr.ex.a_syms; 933 if (xfsread(&dn, &off, p, sizeof(int))) 934 return; 935 x = *(uint32_t *)p; 936 p += sizeof(int); 937 x -= sizeof(int); 938 if (xfsread(&dn, &off, p, x)) 939 return; 940 p += x; 941 } 942 } else { 943 off = hdr.eh.e_phoff; 944 for (j = i = 0; i < hdr.eh.e_phnum && j < 2; i++) { 945 if (xfsread(&dn, &off, ep + j, sizeof(ep[0]))) 946 return; 947 if (ep[j].p_type == PT_LOAD) 948 j++; 949 } 950 for (i = 0; i < 2; i++) { 951 p = PTOV(ep[i].p_paddr & 0xffffff); 952 off = ep[i].p_offset; 953 if (xfsread(&dn, &off, p, ep[i].p_filesz)) 954 return; 955 } 956 p += roundup2(ep[1].p_memsz, PAGE_SIZE); 957 bootinfo.bi_symtab = VTOP(p); 958 if (hdr.eh.e_shnum == hdr.eh.e_shstrndx + 3) { 959 off = hdr.eh.e_shoff + sizeof(es[0]) * 960 (hdr.eh.e_shstrndx + 1); 961 if (xfsread(&dn, &off, &es, sizeof(es))) 962 return; 963 for (i = 0; i < 2; i++) { 964 memcpy(p, &es[i].sh_size, sizeof(es[i].sh_size)); 965 p += sizeof(es[i].sh_size); 966 off = es[i].sh_offset; 967 if (xfsread(&dn, &off, p, es[i].sh_size)) 968 return; 969 p += es[i].sh_size; 970 } 971 } 972 addr = hdr.eh.e_entry & 0xffffff; 973 } 974 bootinfo.bi_esymtab = VTOP(p); 975 bootinfo.bi_kernelname = VTOP(kname); 976 zfsargs.size = sizeof(zfsargs); 977 zfsargs.pool = zfsmount.spa->spa_guid; 978 zfsargs.root = zfsmount.rootobj; 979 zfsargs.primary_pool = primary_spa->spa_guid; 980 #ifdef LOADER_GELI_SUPPORT 981 explicit_bzero(gelipw, sizeof(gelipw)); 982 export_geli_boot_data(&zfsargs.gelidata); 983 #endif 984 if (primary_vdev != NULL) 985 zfsargs.primary_vdev = primary_vdev->v_guid; 986 else 987 printf("failed to detect primary vdev\n"); 988 /* 989 * Note that the zfsargs struct is passed by value, not by pointer. Code in 990 * btxldr.S copies the values from the entry stack to a fixed location 991 * within loader(8) at startup due to the presence of KARGS_FLAGS_EXTARG. 992 */ 993 __exec((caddr_t)addr, RB_BOOTINFO | (opts & RBX_MASK), 994 bootdev, 995 KARGS_FLAGS_ZFS | KARGS_FLAGS_EXTARG, 996 (uint32_t) spa->spa_guid, 997 (uint32_t) (spa->spa_guid >> 32), 998 VTOP(&bootinfo), 999 zfsargs); 1000 } 1001 1002 static int 1003 zfs_mount_ds(char *dsname) 1004 { 1005 uint64_t newroot; 1006 spa_t *newspa; 1007 char *q; 1008 1009 q = strchr(dsname, '/'); 1010 if (q) 1011 *q++ = '\0'; 1012 newspa = spa_find_by_name(dsname); 1013 if (newspa == NULL) { 1014 printf("\nCan't find ZFS pool %s\n", dsname); 1015 return -1; 1016 } 1017 1018 if (zfs_spa_init(newspa)) 1019 return -1; 1020 1021 newroot = 0; 1022 if (q) { 1023 if (zfs_lookup_dataset(newspa, q, &newroot)) { 1024 printf("\nCan't find dataset %s in ZFS pool %s\n", 1025 q, newspa->spa_name); 1026 return -1; 1027 } 1028 } 1029 if (zfs_mount(newspa, newroot, &zfsmount)) { 1030 printf("\nCan't mount ZFS dataset\n"); 1031 return -1; 1032 } 1033 spa = newspa; 1034 return (0); 1035 } 1036 1037 static int 1038 parse_cmd(void) 1039 { 1040 char *arg = cmd; 1041 char *ep, *p, *q; 1042 const char *cp; 1043 int c, i, j; 1044 1045 while ((c = *arg++)) { 1046 if (c == ' ' || c == '\t' || c == '\n') 1047 continue; 1048 for (p = arg; *p && *p != '\n' && *p != ' ' && *p != '\t'; p++); 1049 ep = p; 1050 if (*p) 1051 *p++ = 0; 1052 if (c == '-') { 1053 while ((c = *arg++)) { 1054 if (c == 'P') { 1055 if (*(uint8_t *)PTOV(0x496) & 0x10) { 1056 cp = "yes"; 1057 } else { 1058 opts |= OPT_SET(RBX_DUAL) | OPT_SET(RBX_SERIAL); 1059 cp = "no"; 1060 } 1061 printf("Keyboard: %s\n", cp); 1062 continue; 1063 } else if (c == 'S') { 1064 j = 0; 1065 while ((unsigned int)(i = *arg++ - '0') <= 9) 1066 j = j * 10 + i; 1067 if (j > 0 && i == -'0') { 1068 comspeed = j; 1069 break; 1070 } 1071 /* Fall through to error below ('S' not in optstr[]). */ 1072 } 1073 for (i = 0; c != optstr[i]; i++) 1074 if (i == NOPT - 1) 1075 return -1; 1076 opts ^= OPT_SET(flags[i]); 1077 } 1078 ioctrl = OPT_CHECK(RBX_DUAL) ? (IO_SERIAL|IO_KEYBOARD) : 1079 OPT_CHECK(RBX_SERIAL) ? IO_SERIAL : IO_KEYBOARD; 1080 if (ioctrl & IO_SERIAL) { 1081 if (sio_init(115200 / comspeed) != 0) 1082 ioctrl &= ~IO_SERIAL; 1083 } 1084 } if (c == '?') { 1085 dnode_phys_t dn; 1086 1087 if (zfs_lookup(&zfsmount, arg, &dn) == 0) { 1088 zap_list(spa, &dn); 1089 } 1090 return -1; 1091 } else { 1092 arg--; 1093 1094 /* 1095 * Report pool status if the comment is 'status'. Lets 1096 * hope no-one wants to load /status as a kernel. 1097 */ 1098 if (!strcmp(arg, "status")) { 1099 spa_all_status(); 1100 return -1; 1101 } 1102 1103 /* 1104 * If there is "zfs:" prefix simply ignore it. 1105 */ 1106 if (strncmp(arg, "zfs:", 4) == 0) 1107 arg += 4; 1108 1109 /* 1110 * If there is a colon, switch pools. 1111 */ 1112 q = strchr(arg, ':'); 1113 if (q) { 1114 *q++ = '\0'; 1115 if (zfs_mount_ds(arg) != 0) 1116 return -1; 1117 arg = q; 1118 } 1119 if ((i = ep - arg)) { 1120 if ((size_t)i >= sizeof(kname)) 1121 return -1; 1122 memcpy(kname, arg, i + 1); 1123 } 1124 } 1125 arg = p; 1126 } 1127 return 0; 1128 } 1129